zstd/examples/dictionary_compression.c

98 lines
3.2 KiB
C
Raw Normal View History

/*
 * Copyright (c) 2016-2020 Yann Collet, Facebook, Inc.
 * All rights reserved.
 *
 * This source code is licensed under both the BSD-style license (found in the
 * LICENSE file in the root directory of this source tree) and the GPLv2 (found
 * in the COPYING file in the root directory of this source tree).
 * You may select, at your option, one of the above-listed licenses.
 */
2016-07-15 16:52:37 +00:00
#include <stdio.h> // printf
#include <stdlib.h> // free
#include <string.h> // memset, strcat
2016-07-15 16:52:37 +00:00
#include <zstd.h> // presumes zstd library is installed
#include "common.h" // Helper functions, CHECK(), and CHECK_ZSTD()
2016-07-15 16:52:37 +00:00
/* createDict() :
`dictFileName` is supposed to have been created using `zstd --train` */
2016-09-09 17:33:56 +00:00
static ZSTD_CDict* createCDict_orDie(const char* dictFileName, int cLevel)
2016-07-15 16:52:37 +00:00
{
size_t dictSize;
printf("loading dictionary %s \n", dictFileName);
void* const dictBuffer = mallocAndLoadFile_orDie(dictFileName, &dictSize);
2016-09-09 17:33:56 +00:00
ZSTD_CDict* const cdict = ZSTD_createCDict(dictBuffer, dictSize, cLevel);
CHECK(cdict != NULL, "ZSTD_createCDict() failed!");
2016-07-15 16:52:37 +00:00
free(dictBuffer);
2016-08-01 15:36:11 +00:00
return cdict;
2016-07-15 16:52:37 +00:00
}
static void compress(const char* fname, const char* oname, const ZSTD_CDict* cdict)
{
size_t fSize;
void* const fBuff = mallocAndLoadFile_orDie(fname, &fSize);
2016-07-15 16:52:37 +00:00
size_t const cBuffSize = ZSTD_compressBound(fSize);
2016-08-01 15:36:11 +00:00
void* const cBuff = malloc_orDie(cBuffSize);
2016-07-15 16:52:37 +00:00
/* Compress using the dictionary.
* This function writes the dictionary id, and content size into the header.
* But, it doesn't use a checksum. You can control these options using the
* advanced API: ZSTD_CCtx_setParameter(), ZSTD_CCtx_refCDict(),
* and ZSTD_compress2().
*/
2016-07-15 16:52:37 +00:00
ZSTD_CCtx* const cctx = ZSTD_createCCtx();
CHECK(cctx != NULL, "ZSTD_createCCtx() failed!");
2016-07-15 16:52:37 +00:00
size_t const cSize = ZSTD_compress_usingCDict(cctx, cBuff, cBuffSize, fBuff, fSize, cdict);
CHECK_ZSTD(cSize);
2016-07-15 16:52:37 +00:00
2016-08-01 15:36:11 +00:00
saveFile_orDie(oname, cBuff, cSize);
2016-07-15 16:52:37 +00:00
/* success */
printf("%25s : %6u -> %7u - %s \n", fname, (unsigned)fSize, (unsigned)cSize, oname);
2016-09-09 17:33:56 +00:00
ZSTD_freeCCtx(cctx); /* never fails */
2016-07-15 16:52:37 +00:00
free(fBuff);
free(cBuff);
}
2016-08-01 15:36:11 +00:00
/* createOutFilename_orDie() :
 * Builds the output name for `filename` by appending the ".zst" suffix.
 * The result lives in a buffer obtained from malloc_orDie(); the caller
 * owns it and releases it with free().
 * NOTE(review): malloc_orDie() presumably never returns NULL - confirm in common.h. */
static char* createOutFilename_orDie(const char* filename)
{
    static const char suffix[] = ".zst";   /* sizeof(suffix) == 5, '\0' included */
    size_t const nameLen = strlen(filename);
    size_t const totalLen = nameLen + sizeof(suffix);
    char* const outName = malloc_orDie(totalLen);

    memcpy(outName, filename, nameLen);
    /* copying sizeof(suffix) bytes also writes the terminating '\0' */
    memcpy(outName + nameLen, suffix, sizeof(suffix));
    return outName;
}
int main(int argc, const char** argv)
{
const char* const exeName = argv[0];
2016-09-09 17:33:56 +00:00
int const cLevel = 3;
2016-07-15 16:52:37 +00:00
if (argc<3) {
fprintf(stderr, "wrong arguments\n");
fprintf(stderr, "usage:\n");
fprintf(stderr, "%s [FILES] dictionary\n", exeName);
return 1;
}
/* load dictionary only once */
const char* const dictName = argv[argc-1];
2016-09-09 17:33:56 +00:00
ZSTD_CDict* const dictPtr = createCDict_orDie(dictName, cLevel);
2016-07-15 16:52:37 +00:00
int u;
for (u=1; u<argc-1; u++) {
const char* inFilename = argv[u];
2016-08-01 15:36:11 +00:00
char* const outFilename = createOutFilename_orDie(inFilename);
2016-07-15 16:52:37 +00:00
compress(inFilename, outFilename, dictPtr);
free(outFilename);
}
2016-08-01 15:39:06 +00:00
ZSTD_freeCDict(dictPtr);
2016-07-15 16:52:37 +00:00
printf("All %u files compressed. \n", argc-2);
return 0;
2016-07-15 16:52:37 +00:00
}