| Yann Collet | 394bdd7 | 2017-08-29 09:24:11 -0700 | [diff] [blame^] | 1 | /* |
| 2 | * Copyright (c) 2016-present, Yann Collet, Facebook, Inc. |
| Yann Collet | 4ded9e5 | 2016-08-30 10:04:33 -0700 | [diff] [blame] | 3 | * All rights reserved. |
| 4 | * |
| Yann Collet | 394bdd7 | 2017-08-29 09:24:11 -0700 | [diff] [blame^] | 5 | * This source code is licensed under both the BSD-style license (found in the |
| 6 | * LICENSE file in the root directory of this source tree) and the GPLv2 (found |
| 7 | * in the COPYING file in the root directory of this source tree). |
| Yann Collet | 4ded9e5 | 2016-08-30 10:04:33 -0700 | [diff] [blame] | 8 | */ |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 9 | |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 10 | |
| 11 | #include <stdlib.h> // malloc, exit |
| 12 | #include <stdio.h> // printf |
| 13 | #include <string.h> // strerror |
| 14 | #include <errno.h> // errno |
| 15 | #include <sys/stat.h> // stat |
| 16 | #include <zstd.h> // presumes zstd library is installed |
| 17 | |
| 18 | |
/* fsize_orDie() :
 * Returns the size of `filename`, as reported by stat().
 * When stat() fails, the reason is printed with perror()
 * and the process terminates with exit code 1. */
static off_t fsize_orDie(const char *filename)
{
    struct stat fileInfo;
    if (stat(filename, &fileInfo) != 0) {
        /* error */
        perror(filename);
        exit(1);
    }
    return fileInfo.st_size;
}
| 27 | |
/* fopen_orDie() :
 * Opens `filename` with fopen(), using the mode string `instruction`.
 * Returns the opened stream.
 * When fopen() fails, the reason is printed with perror()
 * and the process terminates with exit code 2. */
static FILE* fopen_orDie(const char *filename, const char *instruction)
{
    FILE* const handle = fopen(filename, instruction);
    if (handle == NULL) {
        /* error */
        perror(filename);
        exit(2);
    }
    return handle;
}
| 36 | |
/* malloc_orDie() :
 * Allocates `size` bytes and returns the resulting buffer, never NULL.
 * The caller releases the buffer with free().
 * When allocation fails, the reason is printed with perror()
 * and the process terminates with exit code 3. */
static void* malloc_orDie(size_t size)
{
    /* malloc(0) is allowed to return NULL without this being a failure :
     * always request at least 1 byte, so that a zero-size request
     * (for example an empty input file) is not reported as an error. */
    void* const buff = malloc(size ? size : 1);
    if (buff) return buff;
    /* error */
    perror("malloc");
    exit(3);
}
| 45 | |
/* loadFile_orDie() :
 * Loads the whole content of `fileName` into a newly allocated buffer.
 * The number of bytes loaded is written into `*size`.
 * The returned buffer is owned by the caller, which must free() it.
 * Any failure is reported on stderr and terminates the process :
 * exit code 8 when the file size cannot be represented as a size_t,
 * exit code 4 when the content cannot be read entirely
 * (other exit codes come from the helpers being called). */
static void* loadFile_orDie(const char* fileName, size_t* size)
{
    off_t const fileSize = fsize_orDie(fileName);
    size_t const buffSize = (size_t)fileSize;
    /* off_t is signed and may be wider than size_t :
     * refuse any size that does not survive the conversion,
     * instead of silently loading a truncated file. */
    if (fileSize < 0 || (off_t)buffSize != fileSize) {
        fprintf(stderr, "%s : file too large to be loaded in memory \n", fileName);
        exit(8);
    }
    FILE* const inFile = fopen_orDie(fileName, "rb");
    void* const buffer = malloc_orDie(buffSize);
    size_t const readSize = fread(buffer, 1, buffSize, inFile);
    if (readSize != buffSize) {
        /* errno is only meaningful when the stream reports an error;
         * a short read without error means fewer bytes were available
         * than stat() announced. */
        const char* const reason = ferror(inFile) ? strerror(errno) : "unexpected end of file";
        fprintf(stderr, "fread: %s : %s \n", fileName, reason);
        exit(4);
    }
    fclose(inFile);
    *size = buffSize;
    return buffer;
}
| 60 | |
/* saveFile_orDie() :
 * Writes the `buffSize` bytes starting at `buff` into `fileName`,
 * which is opened in "wb" mode.
 * An incomplete write is reported on stderr and terminates the process
 * with exit code 5; a failing fclose() terminates it with exit code 6. */
static void saveFile_orDie(const char* fileName, const void* buff, size_t buffSize)
{
    FILE* const out = fopen_orDie(fileName, "wb");
    size_t const written = fwrite(buff, 1, buffSize, out);

    if (written != buffSize) {
        fprintf(stderr, "fwrite: %s : %s \n", fileName, strerror(errno));
        exit(5);
    }

    /* fclose() flushes pending data : its result is checked too */
    if (fclose(out) != 0) {
        perror(fileName);
        exit(6);
    }
}
| 74 | |
| 75 | /* createDict() : |
| 76 | `dictFileName` is supposed to have been created using `zstd --train` */ |
| Yann Collet | a266464 | 2016-09-09 19:33:56 +0200 | [diff] [blame] | 77 | static ZSTD_CDict* createCDict_orDie(const char* dictFileName, int cLevel) |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 78 | { |
| 79 | size_t dictSize; |
| 80 | printf("loading dictionary %s \n", dictFileName); |
| Yann Collet | 373d4f9 | 2016-08-01 17:36:11 +0200 | [diff] [blame] | 81 | void* const dictBuffer = loadFile_orDie(dictFileName, &dictSize); |
| Yann Collet | a266464 | 2016-09-09 19:33:56 +0200 | [diff] [blame] | 82 | ZSTD_CDict* const cdict = ZSTD_createCDict(dictBuffer, dictSize, cLevel); |
| Yann Collet | 373d4f9 | 2016-08-01 17:36:11 +0200 | [diff] [blame] | 83 | if (!cdict) { |
| 84 | fprintf(stderr, "ZSTD_createCDict error \n"); |
| 85 | exit(7); |
| 86 | } |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 87 | free(dictBuffer); |
| Yann Collet | 373d4f9 | 2016-08-01 17:36:11 +0200 | [diff] [blame] | 88 | return cdict; |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 89 | } |
| 90 | |
| 91 | |
| 92 | static void compress(const char* fname, const char* oname, const ZSTD_CDict* cdict) |
| 93 | { |
| 94 | size_t fSize; |
| Yann Collet | 373d4f9 | 2016-08-01 17:36:11 +0200 | [diff] [blame] | 95 | void* const fBuff = loadFile_orDie(fname, &fSize); |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 96 | size_t const cBuffSize = ZSTD_compressBound(fSize); |
| Yann Collet | 373d4f9 | 2016-08-01 17:36:11 +0200 | [diff] [blame] | 97 | void* const cBuff = malloc_orDie(cBuffSize); |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 98 | |
| 99 | ZSTD_CCtx* const cctx = ZSTD_createCCtx(); |
| Yann Collet | a266464 | 2016-09-09 19:33:56 +0200 | [diff] [blame] | 100 | if (cctx==NULL) { fprintf(stderr, "ZSTD_createCCtx() error \n"); exit(10); } |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 101 | size_t const cSize = ZSTD_compress_usingCDict(cctx, cBuff, cBuffSize, fBuff, fSize, cdict); |
| 102 | if (ZSTD_isError(cSize)) { |
| 103 | fprintf(stderr, "error compressing %s : %s \n", fname, ZSTD_getErrorName(cSize)); |
| 104 | exit(7); |
| 105 | } |
| 106 | |
| Yann Collet | 373d4f9 | 2016-08-01 17:36:11 +0200 | [diff] [blame] | 107 | saveFile_orDie(oname, cBuff, cSize); |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 108 | |
| 109 | /* success */ |
| 110 | printf("%25s : %6u -> %7u - %s \n", fname, (unsigned)fSize, (unsigned)cSize, oname); |
| 111 | |
| Yann Collet | a266464 | 2016-09-09 19:33:56 +0200 | [diff] [blame] | 112 | ZSTD_freeCCtx(cctx); /* never fails */ |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 113 | free(fBuff); |
| 114 | free(cBuff); |
| 115 | } |
| 116 | |
| 117 | |
/* createOutFilename_orDie() :
 * Returns a newly allocated string made of `filename` followed by ".zst".
 * The caller owns the returned string and must free() it. */
static char* createOutFilename_orDie(const char* filename)
{
    static const char suffix[] = ".zst";   /* sizeof(suffix) counts the final '\0' */
    size_t const nameLen = strlen(filename);
    char* const result = malloc_orDie(nameLen + sizeof(suffix));

    memcpy(result, filename, nameLen);
    memcpy(result + nameLen, suffix, sizeof(suffix));   /* also copies the terminator */
    return result;
}
| 128 | |
| 129 | int main(int argc, const char** argv) |
| 130 | { |
| 131 | const char* const exeName = argv[0]; |
| Yann Collet | a266464 | 2016-09-09 19:33:56 +0200 | [diff] [blame] | 132 | int const cLevel = 3; |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 133 | |
| 134 | if (argc<3) { |
| 135 | fprintf(stderr, "wrong arguments\n"); |
| 136 | fprintf(stderr, "usage:\n"); |
| 137 | fprintf(stderr, "%s [FILES] dictionary\n", exeName); |
| 138 | return 1; |
| 139 | } |
| 140 | |
| 141 | /* load dictionary only once */ |
| 142 | const char* const dictName = argv[argc-1]; |
| Yann Collet | a266464 | 2016-09-09 19:33:56 +0200 | [diff] [blame] | 143 | ZSTD_CDict* const dictPtr = createCDict_orDie(dictName, cLevel); |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 144 | |
| 145 | int u; |
| 146 | for (u=1; u<argc-1; u++) { |
| 147 | const char* inFilename = argv[u]; |
| Yann Collet | 373d4f9 | 2016-08-01 17:36:11 +0200 | [diff] [blame] | 148 | char* const outFilename = createOutFilename_orDie(inFilename); |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 149 | compress(inFilename, outFilename, dictPtr); |
| 150 | free(outFilename); |
| 151 | } |
| 152 | |
| Yann Collet | 0b2d682 | 2016-08-01 17:39:06 +0200 | [diff] [blame] | 153 | ZSTD_freeCDict(dictPtr); |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 154 | printf("All %u files compressed. \n", argc-2); |
| Yann Collet | 0763905 | 2016-08-03 01:57:57 +0200 | [diff] [blame] | 155 | return 0; |
| Yann Collet | cadd7cd | 2016-07-15 18:52:37 +0200 | [diff] [blame] | 156 | } |