831 lines
29 KiB
C
831 lines
29 KiB
C
/*
|
|
LZ4io.c - LZ4 File/Stream Interface
|
|
Copyright (C) Yann Collet 2011-2015
|
|
|
|
GPL v2 License
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License along
|
|
with this program; if not, write to the Free Software Foundation, Inc.,
|
|
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
|
|
You can contact the author at :
|
|
- LZ4 source repository : https://github.com/Cyan4973/lz4
|
|
- LZ4 public forum : https://groups.google.com/forum/#!forum/lz4c
|
|
*/
|
|
/*
|
|
Note : this is stand-alone program.
|
|
It is not part of LZ4 compression library, it is a user code of the LZ4 library.
|
|
- The license of LZ4 library is BSD.
|
|
- The license of xxHash library is BSD.
|
|
- The license of this source file is GPLv2.
|
|
*/
|
|
|
|
/**************************************
|
|
* Compiler Options
|
|
**************************************/
|
|
#ifdef _MSC_VER /* Visual Studio */
|
|
# define _CRT_SECURE_NO_WARNINGS
|
|
# define _CRT_SECURE_NO_DEPRECATE /* VS2005 */
|
|
# pragma warning(disable : 4127) /* disable: C4127: conditional expression is constant */
|
|
#endif
|
|
|
|
#define _LARGE_FILES /* Large file support on 32-bits AIX */
|
|
#define _FILE_OFFSET_BITS 64 /* Large file support on 32-bits unix */
|
|
|
|
|
|
/*****************************
|
|
* Includes
|
|
*****************************/
|
|
#include <stdio.h> /* fprintf, fopen, fread, stdin, stdout */
|
|
#include <stdlib.h> /* malloc, free */
|
|
#include <string.h> /* strcmp, strlen */
|
|
#include <time.h> /* clock */
|
|
#include <sys/types.h> /* stat64 */
|
|
#include <sys/stat.h> /* stat64 */
|
|
#include "lz4io.h"
|
|
#include "lz4.h" /* still required for legacy format */
|
|
#include "lz4hc.h" /* still required for legacy format */
|
|
#include "lz4frame.h"
|
|
|
|
|
|
/******************************
|
|
* OS-specific Includes
|
|
******************************/
|
|
#if defined(MSDOS) || defined(OS2) || defined(WIN32) || defined(_WIN32) || defined(__CYGWIN__)
|
|
# include <fcntl.h> /* _O_BINARY */
|
|
# include <io.h> /* _setmode, _fileno, _get_osfhandle */
|
|
# define SET_BINARY_MODE(file) _setmode(_fileno(file), _O_BINARY)
|
|
# include <Windows.h> /* DeviceIoControl, HANDLE, FSCTL_SET_SPARSE */
|
|
# define SET_SPARSE_FILE_MODE(file) { DWORD dw; DeviceIoControl((HANDLE) _get_osfhandle(_fileno(file)), FSCTL_SET_SPARSE, 0, 0, 0, 0, &dw, 0); }
|
|
# if defined(_MSC_VER) && (_MSC_VER >= 1400) /* Avoid MSVC fseek()'s 2GiB barrier */
|
|
# define fseek _fseeki64
|
|
# endif
|
|
#else
|
|
# define SET_BINARY_MODE(file)
|
|
# define SET_SPARSE_FILE_MODE(file)
|
|
#endif
|
|
|
|
|
|
/*****************************
|
|
* Constants
|
|
*****************************/
|
|
#define KB *(1 <<10)
|
|
#define MB *(1 <<20)
|
|
#define GB *(1U<<30)
|
|
|
|
#define _1BIT 0x01
|
|
#define _2BITS 0x03
|
|
#define _3BITS 0x07
|
|
#define _4BITS 0x0F
|
|
#define _8BITS 0xFF
|
|
|
|
#define MAGICNUMBER_SIZE 4
|
|
#define LZ4IO_MAGICNUMBER 0x184D2204
|
|
#define LZ4IO_SKIPPABLE0 0x184D2A50
|
|
#define LZ4IO_SKIPPABLEMASK 0xFFFFFFF0
|
|
#define LEGACY_MAGICNUMBER 0x184C2102
|
|
|
|
#define CACHELINE 64
|
|
#define LEGACY_BLOCKSIZE (8 MB)
|
|
#define MIN_STREAM_BUFSIZE (192 KB)
|
|
#define LZ4IO_BLOCKSIZEID_DEFAULT 7
|
|
|
|
#define sizeT sizeof(size_t)
|
|
#define maskT (sizeT - 1)
|
|
|
|
|
|
/**************************************
|
|
* Macros
|
|
**************************************/
|
|
#define DISPLAY(...) fprintf(stderr, __VA_ARGS__)
|
|
#define DISPLAYLEVEL(l, ...) if (g_displayLevel>=l) { DISPLAY(__VA_ARGS__); }
|
|
static int g_displayLevel = 0; /* 0 : no display ; 1: errors ; 2 : + result + interaction + warnings ; 3 : + progression; 4 : + information */
|
|
|
|
#define DISPLAYUPDATE(l, ...) if (g_displayLevel>=l) { \
|
|
if ((LZ4IO_GetMilliSpan(g_time) > refreshRate) || (g_displayLevel>=4)) \
|
|
{ g_time = clock(); DISPLAY(__VA_ARGS__); \
|
|
if (g_displayLevel>=4) fflush(stdout); } }
|
|
static const unsigned refreshRate = 150;
|
|
static clock_t g_time = 0;
|
|
|
|
|
|
/**************************************
|
|
* Local Parameters
|
|
**************************************/
|
|
static int g_overwrite = 1;
|
|
static int g_blockSizeId = LZ4IO_BLOCKSIZEID_DEFAULT;
|
|
static int g_blockChecksum = 0;
|
|
static int g_streamChecksum = 1;
|
|
static int g_blockIndependence = 1;
|
|
static int g_sparseFileSupport = 0;
|
|
static int g_contentSizeFlag = 0;
|
|
|
|
static const int minBlockSizeID = 4;
|
|
static const int maxBlockSizeID = 7;
|
|
|
|
|
|
/**************************************
|
|
* Exceptions
|
|
***************************************/
|
|
#define DEBUG 0
|
|
#define DEBUGOUTPUT(...) if (DEBUG) DISPLAY(__VA_ARGS__);
|
|
#define EXM_THROW(error, ...) \
|
|
{ \
|
|
DEBUGOUTPUT("Error defined at %s, line %i : \n", __FILE__, __LINE__); \
|
|
DISPLAYLEVEL(1, "Error %i : ", error); \
|
|
DISPLAYLEVEL(1, __VA_ARGS__); \
|
|
DISPLAYLEVEL(1, "\n"); \
|
|
exit(error); \
|
|
}
|
|
|
|
|
|
/**************************************
|
|
* Version modifiers
|
|
**************************************/
|
|
#define EXTENDED_ARGUMENTS
|
|
#define EXTENDED_HELP
|
|
#define EXTENDED_FORMAT
|
|
#define DEFAULT_DECOMPRESSOR decodeLZ4S
|
|
|
|
|
|
/* ************************************************** */
|
|
/* ****************** Parameters ******************** */
|
|
/* ************************************************** */
|
|
|
|
/* Default setting : overwrite = 1; return : overwrite mode (0/1) */
|
|
int LZ4IO_setOverwrite(int yes)
|
|
{
|
|
g_overwrite = (yes!=0);
|
|
return g_overwrite;
|
|
}
|
|
|
|
/* blockSizeID : valid values : 4-5-6-7 */
|
|
int LZ4IO_setBlockSizeID(int bsid)
|
|
{
|
|
static const int blockSizeTable[] = { 64 KB, 256 KB, 1 MB, 4 MB };
|
|
if ((bsid < minBlockSizeID) || (bsid > maxBlockSizeID)) return -1;
|
|
g_blockSizeId = bsid;
|
|
return blockSizeTable[g_blockSizeId-minBlockSizeID];
|
|
}
|
|
|
|
int LZ4IO_setBlockMode(LZ4IO_blockMode_t blockMode)
|
|
{
|
|
g_blockIndependence = (blockMode == LZ4IO_blockIndependent);
|
|
return g_blockIndependence;
|
|
}
|
|
|
|
/* Default setting : no checksum */
|
|
int LZ4IO_setBlockChecksumMode(int xxhash)
|
|
{
|
|
g_blockChecksum = (xxhash != 0);
|
|
return g_blockChecksum;
|
|
}
|
|
|
|
/* Default setting : checksum enabled */
|
|
int LZ4IO_setStreamChecksumMode(int xxhash)
|
|
{
|
|
g_streamChecksum = (xxhash != 0);
|
|
return g_streamChecksum;
|
|
}
|
|
|
|
/* Default setting : 0 (no notification) */
|
|
int LZ4IO_setNotificationLevel(int level)
|
|
{
|
|
g_displayLevel = level;
|
|
return g_displayLevel;
|
|
}
|
|
|
|
/* Default setting : 0 (disabled) */
|
|
int LZ4IO_setSparseFile(int enable)
|
|
{
|
|
g_sparseFileSupport = (enable!=0);
|
|
return g_sparseFileSupport;
|
|
}
|
|
|
|
/* Default setting : 0 (disabled) */
|
|
int LZ4IO_setContentSize(int enable)
|
|
{
|
|
g_contentSizeFlag = (enable!=0);
|
|
return g_contentSizeFlag;
|
|
}
|
|
|
|
static unsigned LZ4IO_GetMilliSpan(clock_t nPrevious)
|
|
{
|
|
clock_t nCurrent = clock();
|
|
unsigned nSpan = (unsigned)(((nCurrent - nPrevious) * 1000) / CLOCKS_PER_SEC);
|
|
return nSpan;
|
|
}
|
|
|
|
static unsigned long long LZ4IO_GetFileSize(const char* infilename)
|
|
{
|
|
int r;
|
|
#if defined(_MSC_VER)
|
|
struct _stat64 statbuf;
|
|
r = _stat64(infilename, &statbuf);
|
|
#else
|
|
struct stat statbuf;
|
|
r = stat(infilename, &statbuf);
|
|
#endif
|
|
if (r || !S_ISREG(statbuf.st_mode)) return 0; /* No good... */
|
|
return (unsigned long long)statbuf.st_size;
|
|
}
|
|
|
|
|
|
/* ************************************************************************ **
|
|
** ********************** LZ4 File / Pipe compression ********************* **
|
|
** ************************************************************************ */
|
|
|
|
static int LZ4IO_GetBlockSize_FromBlockId (int id) { return (1 << (8 + (2 * id))); }
|
|
static int LZ4IO_isSkippableMagicNumber(unsigned int magic) { return (magic & LZ4IO_SKIPPABLEMASK) == LZ4IO_SKIPPABLE0; }
|
|
|
|
|
|
static int get_fileHandle(const char* input_filename, const char* output_filename, FILE** pfinput, FILE** pfoutput)
|
|
{
|
|
|
|
if (!strcmp (input_filename, stdinmark))
|
|
{
|
|
DISPLAYLEVEL(4,"Using stdin for input\n");
|
|
*pfinput = stdin;
|
|
SET_BINARY_MODE(stdin);
|
|
}
|
|
else
|
|
{
|
|
*pfinput = fopen(input_filename, "rb");
|
|
}
|
|
|
|
if (!strcmp (output_filename, stdoutmark))
|
|
{
|
|
DISPLAYLEVEL(4,"Using stdout for output\n");
|
|
*pfoutput = stdout;
|
|
SET_BINARY_MODE(stdout);
|
|
}
|
|
else
|
|
{
|
|
/* Check if destination file already exists */
|
|
*pfoutput=0;
|
|
if (output_filename != nulmark) *pfoutput = fopen( output_filename, "rb" );
|
|
if (*pfoutput!=0)
|
|
{
|
|
fclose(*pfoutput);
|
|
if (!g_overwrite)
|
|
{
|
|
char ch;
|
|
DISPLAYLEVEL(2, "Warning : %s already exists\n", output_filename);
|
|
DISPLAYLEVEL(2, "Overwrite ? (Y/N) : ");
|
|
if (g_displayLevel <= 1) EXM_THROW(11, "Operation aborted : %s already exists", output_filename); /* No interaction possible */
|
|
ch = (char)getchar();
|
|
if ((ch!='Y') && (ch!='y')) EXM_THROW(11, "Operation aborted : %s already exists", output_filename);
|
|
}
|
|
}
|
|
*pfoutput = fopen( output_filename, "wb" );
|
|
}
|
|
|
|
if ( *pfinput==0 ) EXM_THROW(12, "Pb opening %s", input_filename);
|
|
if ( *pfoutput==0) EXM_THROW(13, "Pb opening %s", output_filename);
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
|
|
/***************************************
|
|
* Legacy Compression
|
|
***************************************/
|
|
|
|
/* unoptimized version; solves endianess & alignment issues */
|
|
static void LZ4IO_writeLE32 (void* p, unsigned value32)
|
|
{
|
|
unsigned char* dstPtr = (unsigned char*)p;
|
|
dstPtr[0] = (unsigned char)value32;
|
|
dstPtr[1] = (unsigned char)(value32 >> 8);
|
|
dstPtr[2] = (unsigned char)(value32 >> 16);
|
|
dstPtr[3] = (unsigned char)(value32 >> 24);
|
|
}
|
|
|
|
/* LZ4IO_compressFilename_Legacy :
|
|
* This function is intentionally "hidden" (not published in .h)
|
|
* It generates compressed streams using the old 'legacy' format */
|
|
int LZ4IO_compressFilename_Legacy(const char* input_filename, const char* output_filename, int compressionlevel)
|
|
{
|
|
int (*compressionFunction)(const char*, char*, int);
|
|
unsigned long long filesize = 0;
|
|
unsigned long long compressedfilesize = MAGICNUMBER_SIZE;
|
|
char* in_buff;
|
|
char* out_buff;
|
|
FILE* finput;
|
|
FILE* foutput;
|
|
clock_t start, end;
|
|
size_t sizeCheck;
|
|
|
|
|
|
/* Init */
|
|
start = clock();
|
|
if (compressionlevel < 3) compressionFunction = LZ4_compress; else compressionFunction = LZ4_compressHC;
|
|
|
|
get_fileHandle(input_filename, output_filename, &finput, &foutput);
|
|
if ((g_displayLevel==2) && (compressionlevel==1)) g_displayLevel=3;
|
|
|
|
/* Allocate Memory */
|
|
in_buff = (char*)malloc(LEGACY_BLOCKSIZE);
|
|
out_buff = (char*)malloc(LZ4_compressBound(LEGACY_BLOCKSIZE));
|
|
if (!in_buff || !out_buff) EXM_THROW(21, "Allocation error : not enough memory");
|
|
|
|
/* Write Archive Header */
|
|
LZ4IO_writeLE32(out_buff, LEGACY_MAGICNUMBER);
|
|
sizeCheck = fwrite(out_buff, 1, MAGICNUMBER_SIZE, foutput);
|
|
if (sizeCheck!=MAGICNUMBER_SIZE) EXM_THROW(22, "Write error : cannot write header");
|
|
|
|
/* Main Loop */
|
|
while (1)
|
|
{
|
|
unsigned int outSize;
|
|
/* Read Block */
|
|
int inSize = (int) fread(in_buff, (size_t)1, (size_t)LEGACY_BLOCKSIZE, finput);
|
|
if( inSize<=0 ) break;
|
|
filesize += inSize;
|
|
|
|
/* Compress Block */
|
|
outSize = compressionFunction(in_buff, out_buff+4, inSize);
|
|
compressedfilesize += outSize+4;
|
|
DISPLAYUPDATE(3, "\rRead : %i MB ==> %.2f%% ", (int)(filesize>>20), (double)compressedfilesize/filesize*100);
|
|
|
|
/* Write Block */
|
|
LZ4IO_writeLE32(out_buff, outSize);
|
|
sizeCheck = fwrite(out_buff, 1, outSize+4, foutput);
|
|
if (sizeCheck!=(size_t)(outSize+4)) EXM_THROW(23, "Write error : cannot write compressed block");
|
|
}
|
|
|
|
/* Status */
|
|
end = clock();
|
|
DISPLAYLEVEL(2, "\r%79s\r", "");
|
|
DISPLAYLEVEL(2,"Compressed %llu bytes into %llu bytes ==> %.2f%%\n",
|
|
(unsigned long long) filesize, (unsigned long long) compressedfilesize, (double)compressedfilesize/filesize*100);
|
|
{
|
|
double seconds = (double)(end - start)/CLOCKS_PER_SEC;
|
|
DISPLAYLEVEL(4,"Done in %.2f s ==> %.2f MB/s\n", seconds, (double)filesize / seconds / 1024 / 1024);
|
|
}
|
|
|
|
/* Close & Free */
|
|
free(in_buff);
|
|
free(out_buff);
|
|
fclose(finput);
|
|
fclose(foutput);
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
/*********************************************
|
|
* Compression using Frame format
|
|
*********************************************/
|
|
|
|
int LZ4IO_compressFilename(const char* input_filename, const char* output_filename, int compressionLevel)
|
|
{
|
|
unsigned long long filesize = 0;
|
|
unsigned long long compressedfilesize = 0;
|
|
char* in_buff;
|
|
char* out_buff;
|
|
FILE* finput;
|
|
FILE* foutput;
|
|
clock_t start, end;
|
|
int blockSize;
|
|
size_t sizeCheck, headerSize, readSize, outBuffSize;
|
|
LZ4F_compressionContext_t ctx;
|
|
LZ4F_errorCode_t errorCode;
|
|
LZ4F_preferences_t prefs;
|
|
|
|
|
|
/* Init */
|
|
start = clock();
|
|
memset(&prefs, 0, sizeof(prefs));
|
|
if ((g_displayLevel==2) && (compressionLevel>=3)) g_displayLevel=3;
|
|
errorCode = LZ4F_createCompressionContext(&ctx, LZ4F_VERSION);
|
|
if (LZ4F_isError(errorCode)) EXM_THROW(30, "Allocation error : can't create LZ4F context : %s", LZ4F_getErrorName(errorCode));
|
|
get_fileHandle(input_filename, output_filename, &finput, &foutput);
|
|
blockSize = LZ4IO_GetBlockSize_FromBlockId (g_blockSizeId);
|
|
|
|
/* Set compression parameters */
|
|
prefs.autoFlush = 1;
|
|
prefs.compressionLevel = compressionLevel;
|
|
prefs.frameInfo.blockMode = (blockMode_t)g_blockIndependence;
|
|
prefs.frameInfo.blockSizeID = (blockSizeID_t)g_blockSizeId;
|
|
prefs.frameInfo.contentChecksumFlag = (contentChecksum_t)g_streamChecksum;
|
|
if (g_contentSizeFlag)
|
|
{
|
|
unsigned long long fileSize = LZ4IO_GetFileSize(input_filename);
|
|
prefs.frameInfo.frameOSize = fileSize; /* == 0 if input == stdin */
|
|
}
|
|
|
|
/* Allocate Memory */
|
|
in_buff = (char*)malloc(blockSize);
|
|
outBuffSize = LZ4F_compressBound(blockSize, &prefs);
|
|
out_buff = (char*)malloc(outBuffSize);
|
|
if (!in_buff || !out_buff) EXM_THROW(31, "Allocation error : not enough memory");
|
|
|
|
/* Write Archive Header */
|
|
headerSize = LZ4F_compressBegin(ctx, out_buff, outBuffSize, &prefs);
|
|
if (LZ4F_isError(headerSize)) EXM_THROW(32, "File header generation failed : %s", LZ4F_getErrorName(headerSize));
|
|
sizeCheck = fwrite(out_buff, 1, headerSize, foutput);
|
|
if (sizeCheck!=headerSize) EXM_THROW(33, "Write error : cannot write header");
|
|
compressedfilesize += headerSize;
|
|
|
|
/* read first block */
|
|
readSize = fread(in_buff, (size_t)1, (size_t)blockSize, finput);
|
|
filesize += readSize;
|
|
|
|
/* Main Loop */
|
|
while (readSize>0)
|
|
{
|
|
size_t outSize;
|
|
|
|
/* Compress Block */
|
|
outSize = LZ4F_compressUpdate(ctx, out_buff, outBuffSize, in_buff, readSize, NULL);
|
|
if (LZ4F_isError(outSize)) EXM_THROW(34, "Compression failed : %s", LZ4F_getErrorName(outSize));
|
|
compressedfilesize += outSize;
|
|
DISPLAYUPDATE(3, "\rRead : %i MB ==> %.2f%% ", (int)(filesize>>20), (double)compressedfilesize/filesize*100);
|
|
|
|
/* Write Block */
|
|
sizeCheck = fwrite(out_buff, 1, outSize, foutput);
|
|
if (sizeCheck!=outSize) EXM_THROW(35, "Write error : cannot write compressed block");
|
|
|
|
/* Read next block */
|
|
readSize = fread(in_buff, (size_t)1, (size_t)blockSize, finput);
|
|
filesize += readSize;
|
|
}
|
|
|
|
/* End of Stream mark */
|
|
headerSize = LZ4F_compressEnd(ctx, out_buff, outBuffSize, NULL);
|
|
if (LZ4F_isError(headerSize)) EXM_THROW(36, "End of file generation failed : %s", LZ4F_getErrorName(headerSize));
|
|
|
|
sizeCheck = fwrite(out_buff, 1, headerSize, foutput);
|
|
if (sizeCheck!=headerSize) EXM_THROW(37, "Write error : cannot write end of stream");
|
|
compressedfilesize += headerSize;
|
|
|
|
/* Close & Free */
|
|
free(in_buff);
|
|
free(out_buff);
|
|
fclose(finput);
|
|
fclose(foutput);
|
|
errorCode = LZ4F_freeCompressionContext(ctx);
|
|
if (LZ4F_isError(errorCode)) EXM_THROW(38, "Error : can't free LZ4F context resource : %s", LZ4F_getErrorName(errorCode));
|
|
|
|
/* Final Status */
|
|
end = clock();
|
|
DISPLAYLEVEL(2, "\r%79s\r", "");
|
|
DISPLAYLEVEL(2, "Compressed %llu bytes into %llu bytes ==> %.2f%%\n",
|
|
(unsigned long long) filesize, (unsigned long long) compressedfilesize, (double)compressedfilesize/filesize*100);
|
|
{
|
|
double seconds = (double)(end - start)/CLOCKS_PER_SEC;
|
|
DISPLAYLEVEL(4, "Done in %.2f s ==> %.2f MB/s\n", seconds, (double)filesize / seconds / 1024 / 1024);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
#define FNSPACE 30
|
|
int LZ4IO_compressMultipleFilenames(const char** inFileNamesTable, int ifntSize, const char* suffix, int compressionlevel)
|
|
{
|
|
int i;
|
|
char* outFileName = (char*)malloc(FNSPACE);
|
|
size_t ofnSize = FNSPACE;
|
|
const size_t suffixSize = strlen(suffix);
|
|
|
|
for (i=0; i<ifntSize; i++)
|
|
{
|
|
size_t ifnSize = strlen(inFileNamesTable[i]);
|
|
if (ofnSize <= ifnSize+suffixSize+1) { free(outFileName); ofnSize = ifnSize + 20; outFileName = (char*)malloc(ofnSize); }
|
|
strcpy(outFileName, inFileNamesTable[i]);
|
|
strcat(outFileName, suffix);
|
|
LZ4IO_compressFilename(inFileNamesTable[i], outFileName, compressionlevel);
|
|
}
|
|
free(outFileName);
|
|
return 0;
|
|
}
|
|
|
|
|
|
/* ********************************************************************* */
|
|
/* ********************** LZ4 file-stream Decompression **************** */
|
|
/* ********************************************************************* */
|
|
|
|
static unsigned LZ4IO_readLE32 (const void* s)
|
|
{
|
|
const unsigned char* srcPtr = (const unsigned char*)s;
|
|
unsigned value32 = srcPtr[0];
|
|
value32 += (srcPtr[1]<<8);
|
|
value32 += (srcPtr[2]<<16);
|
|
value32 += (srcPtr[3]<<24);
|
|
return value32;
|
|
}
|
|
|
|
static unsigned long long decodeLegacyStream(FILE* finput, FILE* foutput)
|
|
{
|
|
unsigned long long filesize = 0;
|
|
char* in_buff;
|
|
char* out_buff;
|
|
|
|
/* Allocate Memory */
|
|
in_buff = (char*)malloc(LZ4_compressBound(LEGACY_BLOCKSIZE));
|
|
out_buff = (char*)malloc(LEGACY_BLOCKSIZE);
|
|
if (!in_buff || !out_buff) EXM_THROW(51, "Allocation error : not enough memory");
|
|
|
|
/* Main Loop */
|
|
while (1)
|
|
{
|
|
int decodeSize;
|
|
size_t sizeCheck;
|
|
unsigned int blockSize;
|
|
|
|
/* Block Size */
|
|
sizeCheck = fread(in_buff, 1, 4, finput);
|
|
if (sizeCheck==0) break; /* Nothing to read : file read is completed */
|
|
blockSize = LZ4IO_readLE32(in_buff); /* Convert to Little Endian */
|
|
if (blockSize > LZ4_COMPRESSBOUND(LEGACY_BLOCKSIZE))
|
|
{ /* Cannot read next block : maybe new stream ? */
|
|
fseek(finput, -4, SEEK_CUR);
|
|
break;
|
|
}
|
|
|
|
/* Read Block */
|
|
sizeCheck = fread(in_buff, 1, blockSize, finput);
|
|
if (sizeCheck!=blockSize) EXM_THROW(52, "Read error : cannot access compressed block !");
|
|
|
|
/* Decode Block */
|
|
decodeSize = LZ4_decompress_safe(in_buff, out_buff, blockSize, LEGACY_BLOCKSIZE);
|
|
if (decodeSize < 0) EXM_THROW(53, "Decoding Failed ! Corrupted input detected !");
|
|
filesize += decodeSize;
|
|
|
|
/* Write Block */
|
|
sizeCheck = fwrite(out_buff, 1, decodeSize, foutput);
|
|
if (sizeCheck != (size_t)decodeSize) EXM_THROW(54, "Write error : cannot write decoded block into output\n");
|
|
}
|
|
|
|
/* Free */
|
|
free(in_buff);
|
|
free(out_buff);
|
|
|
|
return filesize;
|
|
}
|
|
|
|
|
|
static unsigned long long decodeLZ4S(FILE* finput, FILE* foutput)
|
|
{
|
|
unsigned long long filesize = 0;
|
|
void* inBuff;
|
|
void* outBuff;
|
|
# define HEADERMAX 20
|
|
char headerBuff[HEADERMAX];
|
|
size_t sizeCheck;
|
|
const size_t inBuffSize = 256 KB;
|
|
const size_t outBuffSize = 256 KB;
|
|
LZ4F_decompressionContext_t ctx;
|
|
LZ4F_errorCode_t errorCode;
|
|
unsigned storedSkips = 0;
|
|
|
|
/* init */
|
|
errorCode = LZ4F_createDecompressionContext(&ctx, LZ4F_VERSION);
|
|
if (LZ4F_isError(errorCode)) EXM_THROW(60, "Can't create context : %s", LZ4F_getErrorName(errorCode));
|
|
LZ4IO_writeLE32(headerBuff, LZ4IO_MAGICNUMBER); /* regenerated here, as it was already read from finput */
|
|
|
|
/* Allocate Memory */
|
|
inBuff = malloc(256 KB);
|
|
outBuff = malloc(256 KB);
|
|
if (!inBuff || !outBuff) EXM_THROW(61, "Allocation error : not enough memory");
|
|
|
|
/* Init feed with magic number (already consumed from FILE) */
|
|
{
|
|
size_t inSize = 4;
|
|
size_t outSize=0;
|
|
LZ4IO_writeLE32(inBuff, LZ4IO_MAGICNUMBER);
|
|
errorCode = LZ4F_decompress(ctx, outBuff, &outSize, inBuff, &inSize, NULL);
|
|
if (LZ4F_isError(errorCode)) EXM_THROW(62, "Header error : %s", LZ4F_getErrorName(errorCode));
|
|
}
|
|
|
|
|
|
/* Main Loop */
|
|
for (;;)
|
|
{
|
|
size_t readSize;
|
|
size_t pos = 0;
|
|
|
|
/* Read input */
|
|
readSize = fread(inBuff, 1, inBuffSize, finput);
|
|
if (!readSize) break; /* empty file or stream */
|
|
|
|
while (pos < readSize)
|
|
{
|
|
/* Decode Input (at least partially) */
|
|
size_t remaining = readSize - pos;
|
|
size_t decodedBytes = outBuffSize;
|
|
errorCode = LZ4F_decompress(ctx, outBuff, &decodedBytes, (char*)inBuff+pos, &remaining, NULL);
|
|
if (LZ4F_isError(errorCode)) EXM_THROW(66, "Decompression error : %s", LZ4F_getErrorName(errorCode));
|
|
pos += remaining;
|
|
|
|
if (decodedBytes)
|
|
{
|
|
/* Write Block */
|
|
filesize += decodedBytes;
|
|
if (g_sparseFileSupport)
|
|
{
|
|
size_t* const oBuffStartT = (size_t*)outBuff; /* since outBuff is malloc'ed, it's aligned on size_t */
|
|
size_t* oBuffPosT = oBuffStartT;
|
|
size_t oBuffSizeT = decodedBytes / sizeT;
|
|
size_t* const oBuffEndT = oBuffStartT + oBuffSizeT;
|
|
static const size_t bs0T = (32 KB) / sizeT;
|
|
while (oBuffPosT < oBuffEndT)
|
|
{
|
|
size_t seg0SizeT = bs0T;
|
|
size_t nb0T;
|
|
int seekResult;
|
|
if (seg0SizeT > oBuffSizeT) seg0SizeT = oBuffSizeT;
|
|
oBuffSizeT -= seg0SizeT;
|
|
for (nb0T=0; (nb0T < seg0SizeT) && (oBuffPosT[nb0T] == 0); nb0T++) ;
|
|
storedSkips += (unsigned)(nb0T * sizeT);
|
|
if (storedSkips > 1 GB) /* avoid int overflow */
|
|
{
|
|
seekResult = fseek(foutput, 1 GB, SEEK_CUR);
|
|
if (seekResult != 0) EXM_THROW(68, "1 GB skip error (sparse file)");
|
|
storedSkips -= 1 GB;
|
|
}
|
|
if (nb0T != seg0SizeT) /* not all 0s */
|
|
{
|
|
seekResult = fseek(foutput, storedSkips, SEEK_CUR);
|
|
if (seekResult) EXM_THROW(68, "Skip error (sparse file)");
|
|
storedSkips = 0;
|
|
seg0SizeT -= nb0T;
|
|
oBuffPosT += nb0T;
|
|
sizeCheck = fwrite(oBuffPosT, sizeT, seg0SizeT, foutput);
|
|
if (sizeCheck != seg0SizeT) EXM_THROW(68, "Write error : cannot write decoded block");
|
|
}
|
|
oBuffPosT += seg0SizeT;
|
|
}
|
|
if (decodedBytes & maskT) /* size not multiple of sizeT (necessarily end of block) */
|
|
{
|
|
const char* const restStart = (char*)oBuffEndT;
|
|
const char* restPtr = restStart;
|
|
size_t restSize = decodedBytes & maskT;
|
|
const char* const restEnd = restStart + restSize;
|
|
for (; (restPtr < restEnd) && (*restPtr == 0); restPtr++) ;
|
|
storedSkips += (unsigned) (restPtr - restStart);
|
|
if (restPtr != restEnd)
|
|
{
|
|
int seekResult = fseek(foutput, storedSkips, SEEK_CUR);
|
|
if (seekResult) EXM_THROW(68, "Skip error (end of block)");
|
|
storedSkips = 0;
|
|
sizeCheck = fwrite(restPtr, 1, restEnd - restPtr, foutput);
|
|
if (sizeCheck != (size_t)(restEnd - restPtr)) EXM_THROW(68, "Write error : cannot write decoded end of block");
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
sizeCheck = fwrite(outBuff, 1, decodedBytes, foutput);
|
|
if (sizeCheck != decodedBytes) EXM_THROW(68, "Write error : cannot write decoded block");
|
|
}
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
if ((g_sparseFileSupport) && (storedSkips>0))
|
|
{
|
|
int seekResult;
|
|
storedSkips --;
|
|
seekResult = fseek(foutput, storedSkips, SEEK_CUR);
|
|
if (seekResult != 0) EXM_THROW(69, "Final skip error (sparse file)\n");
|
|
memset(outBuff, 0, 1);
|
|
sizeCheck = fwrite(outBuff, 1, 1, foutput);
|
|
if (sizeCheck != 1) EXM_THROW(69, "Write error : cannot write last zero\n");
|
|
}
|
|
|
|
/* Free */
|
|
free(inBuff);
|
|
free(outBuff);
|
|
errorCode = LZ4F_freeDecompressionContext(ctx);
|
|
if (LZ4F_isError(errorCode)) EXM_THROW(69, "Error : can't free LZ4F context resource : %s", LZ4F_getErrorName(errorCode));
|
|
|
|
return filesize;
|
|
}
|
|
|
|
|
|
static unsigned long long LZ4IO_passThrough(FILE* finput, FILE* foutput, unsigned char U32store[MAGICNUMBER_SIZE])
|
|
{
|
|
void* buffer = malloc(64 KB);
|
|
size_t read = 1, sizeCheck;
|
|
unsigned long long total = MAGICNUMBER_SIZE;
|
|
|
|
sizeCheck = fwrite(U32store, 1, MAGICNUMBER_SIZE, foutput);
|
|
if (sizeCheck != MAGICNUMBER_SIZE) EXM_THROW(50, "Pass-through error at start");
|
|
|
|
while (read)
|
|
{
|
|
read = fread(buffer, 1, 64 KB, finput);
|
|
total += read;
|
|
sizeCheck = fwrite(buffer, 1, read, foutput);
|
|
if (sizeCheck != read) EXM_THROW(50, "Pass-through error");
|
|
}
|
|
|
|
free(buffer);
|
|
return total;
|
|
}
|
|
|
|
|
|
#define ENDOFSTREAM ((unsigned long long)-1)
|
|
static unsigned long long selectDecoder( FILE* finput, FILE* foutput)
|
|
{
|
|
unsigned char U32store[MAGICNUMBER_SIZE];
|
|
unsigned magicNumber, size;
|
|
int errorNb;
|
|
size_t nbReadBytes;
|
|
static unsigned nbCalls = 0;
|
|
|
|
/* init */
|
|
nbCalls++;
|
|
|
|
/* Check Archive Header */
|
|
nbReadBytes = fread(U32store, 1, MAGICNUMBER_SIZE, finput);
|
|
if (nbReadBytes==0) return ENDOFSTREAM; /* EOF */
|
|
if (nbReadBytes != MAGICNUMBER_SIZE) EXM_THROW(40, "Unrecognized header : Magic Number unreadable");
|
|
magicNumber = LZ4IO_readLE32(U32store); /* Little Endian format */
|
|
if (LZ4IO_isSkippableMagicNumber(magicNumber)) magicNumber = LZ4IO_SKIPPABLE0; /* fold skippable magic numbers */
|
|
|
|
switch(magicNumber)
|
|
{
|
|
case LZ4IO_MAGICNUMBER:
|
|
return DEFAULT_DECOMPRESSOR(finput, foutput);
|
|
case LEGACY_MAGICNUMBER:
|
|
DISPLAYLEVEL(4, "Detected : Legacy format \n");
|
|
return decodeLegacyStream(finput, foutput);
|
|
case LZ4IO_SKIPPABLE0:
|
|
DISPLAYLEVEL(4, "Skipping detected skippable area \n");
|
|
nbReadBytes = fread(U32store, 1, 4, finput);
|
|
if (nbReadBytes != 4) EXM_THROW(42, "Stream error : skippable size unreadable");
|
|
size = LZ4IO_readLE32(U32store); /* Little Endian format */
|
|
errorNb = fseek(finput, size, SEEK_CUR);
|
|
if (errorNb != 0) EXM_THROW(43, "Stream error : cannot skip skippable area");
|
|
return selectDecoder(finput, foutput);
|
|
EXTENDED_FORMAT;
|
|
default:
|
|
if (nbCalls == 1) /* just started */
|
|
{
|
|
if (g_overwrite)
|
|
return LZ4IO_passThrough(finput, foutput, U32store);
|
|
EXM_THROW(44,"Unrecognized header : file cannot be decoded"); /* Wrong magic number at the beginning of 1st stream */
|
|
}
|
|
DISPLAYLEVEL(2, "Stream followed by unrecognized data\n");
|
|
return ENDOFSTREAM;
|
|
}
|
|
}
|
|
|
|
|
|
int LZ4IO_decompressFilename(const char* input_filename, const char* output_filename)
|
|
{
|
|
unsigned long long filesize = 0, decodedSize=0;
|
|
FILE* finput;
|
|
FILE* foutput;
|
|
clock_t start, end;
|
|
|
|
|
|
/* Init */
|
|
start = clock();
|
|
get_fileHandle(input_filename, output_filename, &finput, &foutput);
|
|
|
|
/* sparse file */
|
|
if (g_sparseFileSupport && foutput) { SET_SPARSE_FILE_MODE(foutput); }
|
|
|
|
/* Loop over multiple streams */
|
|
do
|
|
{
|
|
decodedSize = selectDecoder(finput, foutput);
|
|
if (decodedSize != ENDOFSTREAM)
|
|
filesize += decodedSize;
|
|
} while (decodedSize != ENDOFSTREAM);
|
|
|
|
/* Final Status */
|
|
end = clock();
|
|
DISPLAYLEVEL(2, "\r%79s\r", "");
|
|
DISPLAYLEVEL(2, "Successfully decoded %llu bytes \n", filesize);
|
|
{
|
|
double seconds = (double)(end - start)/CLOCKS_PER_SEC;
|
|
DISPLAYLEVEL(4, "Done in %.2f s ==> %.2f MB/s\n", seconds, (double)filesize / seconds / 1024 / 1024);
|
|
}
|
|
|
|
/* Close */
|
|
fclose(finput);
|
|
fclose(foutput);
|
|
|
|
/* Error status = OK */
|
|
return 0;
|
|
}
|
|
|