e185b252f0
Cleaner C99 detection, thanks to Elad Modified Basic Types, as recommended by Wayne Scott Simplified compression function Corrected : warning on missing #undef in lz4hc, thanks Arseny Kapoulkine Modified length loops as suggested by Wouter Vermaelen Modified pragma pack directive for older versions of GCC, as reported by Peter Costello Updated xxHash to r29 Indent lz4hc.c with spaces git-svn-id: https://lz4.googlecode.com/svn/trunk@95 650e7d94-2a16-8b24-b05c-7c0b3f6821cd
856 lines
30 KiB
C
856 lines
30 KiB
C
/*
|
|
LZ4c - LZ4 Compression CLI program
|
|
Copyright (C) Yann Collet 2011-2013
|
|
GPL v2 License
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License along
|
|
with this program; if not, write to the Free Software Foundation, Inc.,
|
|
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
|
|
You can contact the author at :
|
|
- LZ4 homepage : http://fastcompression.blogspot.com/p/lz4.html
|
|
- LZ4 source repository : http://code.google.com/p/lz4/
|
|
*/
|
|
/*
|
|
Note : this is stand-alone program.
|
|
It is not part of LZ4 compression library, it is a user program of LZ4 library.
|
|
The license of LZ4 library is BSD.
|
|
The license of xxHash library is BSD.
|
|
The license of this compression CLI program is GPLv2.
|
|
*/
|
|
|
|
//**************************************
|
|
// Compiler Options
|
|
//**************************************
|
|
// Disable some Visual warning messages
|
|
#ifdef _MSC_VER // Visual Studio
|
|
# define _CRT_SECURE_NO_WARNINGS
|
|
# define _CRT_SECURE_NO_DEPRECATE // VS2005
|
|
# pragma warning(disable : 4127) // disable: C4127: conditional expression is constant
|
|
#endif
|
|
|
|
|
|
//****************************
|
|
// Includes
|
|
//****************************
|
|
#include <stdio.h> // fprintf, fopen, fread, _fileno(?)
|
|
#include <stdlib.h> // malloc
|
|
#include <string.h> // strcmp
|
|
#include <time.h> // clock
|
|
#ifdef _WIN32
|
|
#include <io.h> // _setmode
|
|
#include <fcntl.h> // _O_BINARY
|
|
#endif
|
|
#include "lz4.h"
|
|
#include "lz4hc.h"
|
|
#include "bench.h"
|
|
#include "xxhash.h"
|
|
|
|
|
|
//**************************************
|
|
// Compiler-specific functions
|
|
//**************************************
|
|
#define GCC_VERSION (__GNUC__ * 100 + __GNUC_MINOR__)
|
|
|
|
#if defined(_MSC_VER) // Visual Studio
|
|
# define swap32 _byteswap_ulong
|
|
#elif GCC_VERSION >= 403
|
|
# define swap32 __builtin_bswap32
|
|
#else
|
|
static inline unsigned int swap32(unsigned int x) {
|
|
return ((x << 24) & 0xff000000 ) |
|
|
((x << 8) & 0x00ff0000 ) |
|
|
((x >> 8) & 0x0000ff00 ) |
|
|
((x >> 24) & 0x000000ff );
|
|
}
|
|
#endif
|
|
|
|
|
|
//****************************
|
|
// Constants
|
|
//****************************
|
|
#define COMPRESSOR_NAME "LZ4 Compression CLI"
|
|
#define COMPRESSOR_VERSION ""
|
|
#define COMPILED __DATE__
|
|
#define AUTHOR "Yann Collet"
|
|
#define EXTENSION ".lz4"
|
|
#define WELCOME_MESSAGE "*** %s %s, by %s (%s) ***\n", COMPRESSOR_NAME, COMPRESSOR_VERSION, AUTHOR, COMPILED
|
|
|
|
#define CACHELINE 64
|
|
#define MAGICNUMBER_SIZE 4
|
|
#define LZ4S_MAGICNUMBER 0x184D2204
|
|
#define LZ4S_BLOCKSIZEID_DEFAULT 7
|
|
#define LZ4S_CHECKSUM_SEED 0
|
|
|
|
#define LZ4S_SKIPPABLE0 0x184D2A50
|
|
#define LZ4S_SKIPPABLEMASK 0xFFFFFFF0
|
|
|
|
#define LEGACY_MAGICNUMBER 0x184C2102
|
|
#define LEGACY_BLOCKSIZE (8<<20) // 8 MB
|
|
|
|
#define _1BIT 1
|
|
#define _2BITS 0x03
|
|
#define _3BITS 0x07
|
|
#define _4BITS 0x0F
|
|
#define _8BITS 0xFF
|
|
|
|
//**************************************
|
|
// Architecture Macros
|
|
//**************************************
|
|
static const int one = 1;
|
|
#define CPU_LITTLE_ENDIAN (*(char*)(&one))
|
|
#define CPU_BIG_ENDIAN (!CPU_LITTLE_ENDIAN)
|
|
#define LITTLE_ENDIAN_32(i) (CPU_LITTLE_ENDIAN?(i):swap32(i))
|
|
|
|
|
|
//**************************************
|
|
// Macros
|
|
//**************************************
|
|
#define DISPLAY(...) fprintf(stderr, __VA_ARGS__)
|
|
|
|
|
|
//**************************************
|
|
// Special input/output
|
|
//**************************************
|
|
#define NULL_INPUT "null"
|
|
char stdinmark[] = "stdin";
|
|
char stdoutmark[] = "stdout";
|
|
#ifdef _WIN32
|
|
char nulmark[] = "nul";
|
|
#else
|
|
char nulmark[] = "/dev/null";
|
|
#endif
|
|
|
|
|
|
//**************************************
|
|
// Local Parameters
|
|
//**************************************
|
|
static int overwrite = 0;
|
|
static int blockSizeId = LZ4S_BLOCKSIZEID_DEFAULT;
|
|
static int blockChecksum = 0;
|
|
static int streamChecksum = 1;
|
|
|
|
//**************************************
|
|
// Exceptions
|
|
//**************************************
|
|
#define DEBUG 0
|
|
#define DEBUGOUTPUT(...) if (DEBUG) DISPLAY(__VA_ARGS__);
|
|
#define EXM_THROW(error, ...) \
|
|
{ \
|
|
DEBUGOUTPUT("Error defined at %s, line %i : \n", __FILE__, __LINE__); \
|
|
DISPLAY("Error %i : ", error); \
|
|
DISPLAY(__VA_ARGS__); \
|
|
DISPLAY("\n"); \
|
|
exit(error); \
|
|
}
|
|
|
|
|
|
|
|
//****************************
|
|
// Functions
|
|
//****************************
|
|
int usage(char* exename)
|
|
{
|
|
DISPLAY( "Usage :\n");
|
|
DISPLAY( " %s [arg] input [output]\n", exename);
|
|
DISPLAY( "Arguments :\n");
|
|
DISPLAY( " -c0/-c : Fast compression (default) \n");
|
|
DISPLAY( " -c1/-hc: High compression \n");
|
|
DISPLAY( " -d : decompression \n");
|
|
DISPLAY( " -y : overwrite without prompting \n");
|
|
DISPLAY( " -H : Help (this text + advanced options)\n");
|
|
return 0;
|
|
}
|
|
|
|
int usage_advanced()
|
|
{
|
|
DISPLAY( "\nAdvanced options :\n");
|
|
DISPLAY( " -t : test compressed file \n");
|
|
DISPLAY( " -B# : Block size [4-7](default : 7)\n");
|
|
DISPLAY( " -x : enable block checksum (default:disabled)\n");
|
|
DISPLAY( " -nx : disable stream checksum (default:enabled)\n");
|
|
DISPLAY( " -b# : benchmark files, using # [0-1] compression level\n");
|
|
DISPLAY( " -i# : iteration loops [1-9](default : 3), benchmark mode only\n");
|
|
DISPLAY( "input : can be 'stdin' (pipe) or a filename\n");
|
|
DISPLAY( "output : can be 'stdout'(pipe) or a filename or 'null'\n");
|
|
DISPLAY( " example : lz4c -hc stdin compressedfile.lz4");
|
|
return 0;
|
|
}
|
|
|
|
|
|
int badusage(char* exename)
|
|
{
|
|
DISPLAY("Wrong parameters\n");
|
|
usage(exename);
|
|
return 0;
|
|
}
|
|
|
|
|
|
static int LZ4S_GetBlocksize_FromBlockId (int id) { return (1 << (8 + (2 * id))); }
|
|
static unsigned int LZ4S_GetCheckBits_FromXXH (unsigned int xxh) { return (xxh >> 8) & _8BITS; }
|
|
|
|
|
|
int get_fileHandle(char* input_filename, char* output_filename, FILE** pfinput, FILE** pfoutput)
|
|
{
|
|
|
|
if (!strcmp (input_filename, stdinmark))
|
|
{
|
|
DISPLAY( "Using stdin for input\n");
|
|
*pfinput = stdin;
|
|
#ifdef _WIN32 // Need to set stdin/stdout to binary mode specifically for windows
|
|
_setmode( _fileno( stdin ), _O_BINARY );
|
|
#endif
|
|
}
|
|
else
|
|
{
|
|
*pfinput = fopen(input_filename, "rb");
|
|
}
|
|
|
|
if (!strcmp (output_filename, stdoutmark))
|
|
{
|
|
DISPLAY( "Using stdout for output\n");
|
|
*pfoutput = stdout;
|
|
#ifdef _WIN32 // Need to set stdin/stdout to binary mode specifically for windows
|
|
_setmode( _fileno( stdout ), _O_BINARY );
|
|
#endif
|
|
}
|
|
else
|
|
{
|
|
// Check if destination file already exists
|
|
*pfoutput=0;
|
|
if (output_filename != nulmark) *pfoutput = fopen( output_filename, "rb" );
|
|
if (*pfoutput!=0)
|
|
{
|
|
char ch;
|
|
fclose(*pfoutput);
|
|
DISPLAY( "Warning : %s already exists\n", output_filename);
|
|
if (!overwrite)
|
|
{
|
|
DISPLAY( "Overwrite ? (Y/N) : ");
|
|
ch = (char)getchar();
|
|
if (ch!='Y') EXM_THROW(11, "Operation aborted : %s already exists", output_filename);
|
|
}
|
|
}
|
|
*pfoutput = fopen( output_filename, "wb" );
|
|
}
|
|
|
|
if ( *pfinput==0 ) EXM_THROW(12, "Pb opening %s", input_filename);
|
|
if ( *pfoutput==0) EXM_THROW(13, "Pb opening %s", output_filename);
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
|
|
int legacy_compress_file(char* input_filename, char* output_filename, int compressionlevel)
|
|
{
|
|
int (*compressionFunction)(const char*, char*, int);
|
|
unsigned long long filesize = 0;
|
|
unsigned long long compressedfilesize = MAGICNUMBER_SIZE;
|
|
char* in_buff;
|
|
char* out_buff;
|
|
FILE* finput;
|
|
FILE* foutput;
|
|
int displayLevel = (compressionlevel>0);
|
|
clock_t start, end;
|
|
size_t sizeCheck;
|
|
|
|
|
|
// Init
|
|
switch (compressionlevel)
|
|
{
|
|
case 0 : compressionFunction = LZ4_compress; break;
|
|
case 1 : compressionFunction = LZ4_compressHC; break;
|
|
default : compressionFunction = LZ4_compress;
|
|
}
|
|
start = clock();
|
|
get_fileHandle(input_filename, output_filename, &finput, &foutput);
|
|
|
|
// Allocate Memory
|
|
in_buff = (char*)malloc(LEGACY_BLOCKSIZE);
|
|
out_buff = (char*)malloc(LZ4_compressBound(LEGACY_BLOCKSIZE));
|
|
if (!in_buff || !out_buff) EXM_THROW(21, "Allocation error : not enough memory");
|
|
|
|
// Write Archive Header
|
|
*(unsigned int*)out_buff = LITTLE_ENDIAN_32(LEGACY_MAGICNUMBER);
|
|
sizeCheck = fwrite(out_buff, 1, MAGICNUMBER_SIZE, foutput);
|
|
if (sizeCheck!=MAGICNUMBER_SIZE) EXM_THROW(22, "Write error : cannot write header");
|
|
|
|
// Main Loop
|
|
while (1)
|
|
{
|
|
unsigned int outSize;
|
|
// Read Block
|
|
int inSize = (int) fread(in_buff, (size_t)1, (size_t)LEGACY_BLOCKSIZE, finput);
|
|
if( inSize<=0 ) break;
|
|
filesize += inSize;
|
|
if (displayLevel) DISPLAY("Read : %i MB \r", (int)(filesize>>20));
|
|
|
|
// Compress Block
|
|
outSize = compressionFunction(in_buff, out_buff+4, inSize);
|
|
compressedfilesize += outSize+4;
|
|
if (displayLevel) DISPLAY("Read : %i MB ==> %.2f%%\r", (int)(filesize>>20), (double)compressedfilesize/filesize*100);
|
|
|
|
// Write Block
|
|
* (unsigned int*) out_buff = LITTLE_ENDIAN_32(outSize);
|
|
sizeCheck = fwrite(out_buff, 1, outSize+4, foutput);
|
|
if (sizeCheck!=(size_t)(outSize+4)) EXM_THROW(23, "Write error : cannot write compressed block");
|
|
}
|
|
|
|
// Status
|
|
end = clock();
|
|
DISPLAY( "Compressed %llu bytes into %llu bytes ==> %.2f%%\n",
|
|
(unsigned long long) filesize, (unsigned long long) compressedfilesize, (double)compressedfilesize/filesize*100);
|
|
{
|
|
double seconds = (double)(end - start)/CLOCKS_PER_SEC;
|
|
DISPLAY( "Done in %.2f s ==> %.2f MB/s\n", seconds, (double)filesize / seconds / 1024 / 1024);
|
|
}
|
|
|
|
// Close & Free
|
|
free(in_buff);
|
|
free(out_buff);
|
|
fclose(finput);
|
|
fclose(foutput);
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
int compress_file(char* input_filename, char* output_filename, int compressionlevel)
|
|
{
|
|
int (*compressionFunction)(const char*, char*, int, int);
|
|
unsigned long long filesize = 0;
|
|
unsigned long long compressedfilesize = 0;
|
|
unsigned int checkbits;
|
|
char* in_buff;
|
|
char* out_buff;
|
|
FILE* finput;
|
|
FILE* foutput;
|
|
int errorcode;
|
|
int displayLevel = (compressionlevel>0);
|
|
clock_t start, end;
|
|
int blockSize;
|
|
size_t sizeCheck, header_size;
|
|
void* streamChecksumState=NULL;
|
|
|
|
|
|
// Init
|
|
start = clock();
|
|
switch (compressionlevel)
|
|
{
|
|
case 0 : compressionFunction = LZ4_compress_limitedOutput; break;
|
|
case 1 : compressionFunction = LZ4_compressHC_limitedOutput; break;
|
|
default : compressionFunction = LZ4_compress_limitedOutput;
|
|
}
|
|
errorcode = get_fileHandle(input_filename, output_filename, &finput, &foutput);
|
|
if (errorcode) return errorcode;
|
|
blockSize = LZ4S_GetBlocksize_FromBlockId (blockSizeId);
|
|
|
|
// Allocate Memory
|
|
in_buff = (char*)malloc(blockSize);
|
|
out_buff = (char*)malloc(blockSize+CACHELINE);
|
|
if (!in_buff || !out_buff) EXM_THROW(31, "Allocation error : not enough memory");
|
|
if (streamChecksum) streamChecksumState = XXH32_init(LZ4S_CHECKSUM_SEED);
|
|
|
|
// Write Archive Header
|
|
*(unsigned int*)out_buff = LITTLE_ENDIAN_32(LZ4S_MAGICNUMBER); // Magic Number, in Little Endian convention
|
|
*(out_buff+4) = 0x60; // Version("01"), Block independence
|
|
*(out_buff+4) |= blockChecksum << 4;
|
|
*(out_buff+4) |= streamChecksum << 2;
|
|
*(out_buff+5) = (char)(blockSizeId<<4); // Block Size
|
|
checkbits = XXH32((out_buff+4), 2, LZ4S_CHECKSUM_SEED);
|
|
checkbits = LZ4S_GetCheckBits_FromXXH(checkbits);
|
|
*(out_buff+6) = (unsigned char) checkbits;
|
|
header_size = 7;
|
|
sizeCheck = fwrite(out_buff, 1, header_size, foutput);
|
|
if (sizeCheck!=header_size) EXM_THROW(32, "Write error : cannot write header");
|
|
compressedfilesize += header_size;
|
|
|
|
// Main Loop
|
|
while (1)
|
|
{
|
|
unsigned int outSize;
|
|
// Read Block
|
|
unsigned int inSize = (unsigned int) fread(in_buff, (size_t)1, (size_t)blockSize, finput);
|
|
if( inSize<=0 ) break;
|
|
filesize += inSize;
|
|
if (displayLevel) DISPLAY("Read : %i MB \r", (int)(filesize>>20));
|
|
if (streamChecksum) XXH32_update(streamChecksumState, in_buff, inSize);
|
|
|
|
// Compress Block
|
|
outSize = compressionFunction(in_buff, out_buff+4, inSize, inSize-1);
|
|
if (outSize > 0) compressedfilesize += outSize+4; else compressedfilesize += inSize+4;
|
|
if (blockChecksum) compressedfilesize+=4;
|
|
if (displayLevel) DISPLAY("Read : %i MB ==> %.2f%%\r", (int)(filesize>>20), (double)compressedfilesize/filesize*100);
|
|
|
|
// Write Block
|
|
if (outSize > 0)
|
|
{
|
|
unsigned int checksum;
|
|
int sizeToWrite;
|
|
* (unsigned int*) out_buff = LITTLE_ENDIAN_32(outSize);
|
|
if (blockChecksum)
|
|
{
|
|
checksum = XXH32(out_buff+4, outSize, LZ4S_CHECKSUM_SEED);
|
|
* (unsigned int*) (out_buff+4+outSize) = LITTLE_ENDIAN_32(checksum);
|
|
}
|
|
sizeToWrite = 4 + outSize + (4*blockChecksum);
|
|
sizeCheck = fwrite(out_buff, 1, sizeToWrite, foutput);
|
|
if (sizeCheck!=(size_t)(sizeToWrite)) EXM_THROW(33, "Write error : cannot write compressed block");
|
|
|
|
}
|
|
else // Copy Original
|
|
{
|
|
unsigned int checksum;
|
|
* (unsigned int*) out_buff = LITTLE_ENDIAN_32(inSize|0x80000000); // Add Uncompressed flag
|
|
sizeCheck = fwrite(out_buff, 1, 4, foutput);
|
|
if (sizeCheck!=(size_t)(4)) EXM_THROW(34, "Write error : cannot write block header");
|
|
sizeCheck = fwrite(in_buff, 1, inSize, foutput);
|
|
if (sizeCheck!=(size_t)(inSize)) EXM_THROW(35, "Write error : cannot write block");
|
|
if (blockChecksum)
|
|
{
|
|
checksum = XXH32(in_buff, inSize, LZ4S_CHECKSUM_SEED);
|
|
* (unsigned int*) out_buff = LITTLE_ENDIAN_32(checksum);
|
|
sizeCheck = fwrite(out_buff, 1, 4, foutput);
|
|
if (sizeCheck!=(size_t)(4)) EXM_THROW(36, "Write error : cannot write block checksum");
|
|
}
|
|
}
|
|
}
|
|
|
|
// End of Stream mark
|
|
* (unsigned int*) out_buff = 0;
|
|
sizeCheck = fwrite(out_buff, 1, 4, foutput);
|
|
if (sizeCheck!=(size_t)(4)) EXM_THROW(37, "Write error : cannot write end of stream");
|
|
compressedfilesize += 4;
|
|
if (streamChecksum)
|
|
{
|
|
unsigned int checksum = XXH32_digest(streamChecksumState);
|
|
* (unsigned int*) out_buff = LITTLE_ENDIAN_32(checksum);
|
|
sizeCheck = fwrite(out_buff, 1, 4, foutput);
|
|
if (sizeCheck!=(size_t)(4)) EXM_THROW(37, "Write error : cannot write stream checksum");
|
|
compressedfilesize += 4;
|
|
}
|
|
|
|
// Status
|
|
end = clock();
|
|
DISPLAY( "Compressed %llu bytes into %llu bytes ==> %.2f%%\n",
|
|
(unsigned long long) filesize, (unsigned long long) compressedfilesize, (double)compressedfilesize/filesize*100);
|
|
{
|
|
double seconds = (double)(end - start)/CLOCKS_PER_SEC;
|
|
DISPLAY( "Done in %.2f s ==> %.2f MB/s\n", seconds, (double)filesize / seconds / 1024 / 1024);
|
|
}
|
|
|
|
// Close & Free
|
|
free(in_buff);
|
|
free(out_buff);
|
|
fclose(finput);
|
|
fclose(foutput);
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
unsigned long long decodeLegacyStream(FILE* finput, FILE* foutput)
|
|
{
|
|
unsigned long long filesize = 0;
|
|
char* in_buff;
|
|
char* out_buff;
|
|
size_t uselessRet;
|
|
int sinkint;
|
|
unsigned int blockSize;
|
|
size_t sizeCheck;
|
|
|
|
|
|
// Allocate Memory
|
|
in_buff = (char*)malloc(LZ4_compressBound(LEGACY_BLOCKSIZE));
|
|
out_buff = (char*)malloc(LEGACY_BLOCKSIZE);
|
|
if (!in_buff || !out_buff) EXM_THROW(51, "Allocation error : not enough memory");
|
|
|
|
// Main Loop
|
|
while (1)
|
|
{
|
|
// Block Size
|
|
uselessRet = fread(&blockSize, 1, 4, finput);
|
|
if( uselessRet==0 ) break; // Nothing to read : file read is completed
|
|
blockSize = LITTLE_ENDIAN_32(blockSize); // Convert to Little Endian
|
|
if (blockSize > LZ4_COMPRESSBOUND(LEGACY_BLOCKSIZE))
|
|
{ // Cannot read next block : maybe new stream ?
|
|
fseek(finput, -4, SEEK_CUR);
|
|
break;
|
|
}
|
|
|
|
// Read Block
|
|
uselessRet = fread(in_buff, 1, blockSize, finput);
|
|
|
|
// Decode Block
|
|
sinkint = LZ4_decompress_safe(in_buff, out_buff, blockSize, LEGACY_BLOCKSIZE);
|
|
if (sinkint < 0) EXM_THROW(52, "Decoding Failed ! Corrupted input detected !");
|
|
filesize += sinkint;
|
|
|
|
// Write Block
|
|
sizeCheck = fwrite(out_buff, 1, sinkint, foutput);
|
|
if (sizeCheck != (size_t)sinkint) EXM_THROW(53, "Write error : cannot write decoded block\n");
|
|
}
|
|
|
|
// Free
|
|
free(in_buff);
|
|
free(out_buff);
|
|
|
|
return filesize;
|
|
}
|
|
|
|
|
|
unsigned long long decodeLZ4S(FILE* finput, FILE* foutput)
|
|
{
|
|
unsigned long long filesize = 0;
|
|
char* in_buff;
|
|
char* out_buff;
|
|
unsigned char descriptor[3];
|
|
size_t nbReadBytes;
|
|
int decodedBytes;
|
|
unsigned int maxBlockSize;
|
|
size_t sizeCheck;
|
|
int blockChecksumFlag, streamChecksumFlag;
|
|
void* streamChecksumState=NULL;
|
|
|
|
// Decode stream descriptor
|
|
nbReadBytes = fread(descriptor, 1, 3, finput);
|
|
if (nbReadBytes != 3) EXM_THROW(61, "Unreadable header");
|
|
{
|
|
int version = (descriptor[0] >> 6) & _2BITS;
|
|
int independance = (descriptor[0] >> 5) & _1BIT;
|
|
int streamSize = (descriptor[0] >> 3) & _1BIT;
|
|
int reserved1 = (descriptor[0] >> 1) & _1BIT;
|
|
int dictionary = (descriptor[0] >> 0) & _1BIT;
|
|
|
|
int reserved2 = (descriptor[1] >> 7) & _1BIT;
|
|
int blockSizeId = (descriptor[1] >> 4) & _3BITS;
|
|
int reserved3 = (descriptor[1] >> 0) & _4BITS;
|
|
int checkBits = (descriptor[2] >> 0) & _8BITS;
|
|
int checkBits_xxh32;
|
|
|
|
blockChecksumFlag = (descriptor[0] >> 4) & _1BIT;
|
|
streamChecksumFlag= (descriptor[0] >> 2) & _1BIT;
|
|
|
|
if (version != 1) EXM_THROW(62, "Wrong version number");
|
|
if (independance != 1) EXM_THROW(63, "Does not support block inter-dependence");
|
|
if (streamSize == 1) EXM_THROW(64, "Does not support stream size");
|
|
if (reserved1 != 0) EXM_THROW(65, "Wrong value for reserved bits");
|
|
if (dictionary == 1) EXM_THROW(66, "Does not support dictionary");
|
|
if (reserved2 != 0) EXM_THROW(67, "Wrong value for reserved bits");
|
|
if (blockSizeId < 4) EXM_THROW(68, "Unsupported block size");
|
|
if (reserved3 != 0) EXM_THROW(67, "Wrong value for reserved bits");
|
|
maxBlockSize = LZ4S_GetBlocksize_FromBlockId(blockSizeId);
|
|
// Checkbits verification
|
|
descriptor[1] &= 0xF0;
|
|
checkBits_xxh32 = XXH32(descriptor, 2, LZ4S_CHECKSUM_SEED);
|
|
checkBits_xxh32 = LZ4S_GetCheckBits_FromXXH(checkBits_xxh32);
|
|
if (checkBits != checkBits_xxh32) EXM_THROW(69, "Stream descriptor error detected");
|
|
}
|
|
|
|
// Allocate Memory
|
|
in_buff = (char*)malloc(maxBlockSize);
|
|
out_buff = (char*)malloc(maxBlockSize);
|
|
if (!in_buff || !out_buff) EXM_THROW(70, "Allocation error : not enough memory");
|
|
if (streamChecksumFlag) streamChecksumState = XXH32_init(LZ4S_CHECKSUM_SEED);
|
|
|
|
// Main Loop
|
|
while (1)
|
|
{
|
|
unsigned int blockSize, uncompressedFlag;
|
|
|
|
// Block Size
|
|
nbReadBytes = fread(&blockSize, 1, 4, finput);
|
|
if( nbReadBytes != 4 ) EXM_THROW(71, "Read error : cannot read next block size");
|
|
if (blockSize == 0) break; // End of Stream Mark : stream is completed
|
|
blockSize = LITTLE_ENDIAN_32(blockSize); // Convert to little endian
|
|
uncompressedFlag = blockSize >> 31;
|
|
blockSize &= 0x7FFFFFFF;
|
|
if (blockSize > maxBlockSize) EXM_THROW(72, "Error : invalid block size");
|
|
|
|
// Read Block
|
|
nbReadBytes = fread(in_buff, 1, blockSize, finput);
|
|
if( nbReadBytes != blockSize ) EXM_THROW(73, "Read error : cannot read data block" );
|
|
|
|
// Check Block
|
|
if (blockChecksumFlag)
|
|
{
|
|
unsigned int checksum = XXH32(in_buff, blockSize, LZ4S_CHECKSUM_SEED);
|
|
unsigned int readChecksum;
|
|
sizeCheck = fread(&readChecksum, 1, 4, finput);
|
|
if( sizeCheck != 4 ) EXM_THROW(74, "Read error : cannot read next block size");
|
|
readChecksum = LITTLE_ENDIAN_32(readChecksum); // Convert to little endian
|
|
if (checksum != readChecksum) EXM_THROW(75, "Error : invalid block checksum detected");
|
|
}
|
|
|
|
if (uncompressedFlag)
|
|
{
|
|
// Write uncompressed Block
|
|
sizeCheck = fwrite(in_buff, 1, blockSize, foutput);
|
|
if (sizeCheck != (size_t)blockSize) EXM_THROW(76, "Write error : cannot write data block");
|
|
filesize += blockSize;
|
|
if (streamChecksumFlag) XXH32_update(streamChecksumState, in_buff, blockSize);
|
|
}
|
|
else
|
|
{
|
|
// Decode Block
|
|
decodedBytes = LZ4_decompress_safe(in_buff, out_buff, blockSize, maxBlockSize);
|
|
if (decodedBytes < 0) EXM_THROW(77, "Decoding Failed ! Corrupted input detected !");
|
|
filesize += decodedBytes;
|
|
if (streamChecksumFlag) XXH32_update(streamChecksumState, out_buff, decodedBytes);
|
|
|
|
// Write Block
|
|
sizeCheck = fwrite(out_buff, 1, decodedBytes, foutput);
|
|
if (sizeCheck != (size_t)decodedBytes) EXM_THROW(78, "Write error : cannot write decoded block\n");
|
|
}
|
|
}
|
|
|
|
// Stream Checksum
|
|
if (streamChecksumFlag)
|
|
{
|
|
unsigned int checksum = XXH32_digest(streamChecksumState);
|
|
unsigned int readChecksum;
|
|
sizeCheck = fread(&readChecksum, 1, 4, finput);
|
|
if (sizeCheck != 4) EXM_THROW(74, "Read error : cannot read stream checksum");
|
|
readChecksum = LITTLE_ENDIAN_32(readChecksum); // Convert to little endian
|
|
if (checksum != readChecksum) EXM_THROW(75, "Error : invalid stream checksum detected");
|
|
}
|
|
|
|
// Free
|
|
free(in_buff);
|
|
free(out_buff);
|
|
|
|
return filesize;
|
|
}
|
|
|
|
|
|
unsigned long long selectDecoder( FILE* finput, FILE* foutput)
|
|
{
|
|
unsigned int magicNumber, size;
|
|
int errorNb;
|
|
size_t nbReadBytes;
|
|
|
|
// Check Archive Header
|
|
nbReadBytes = fread(&magicNumber, 1, MAGICNUMBER_SIZE, finput);
|
|
if (nbReadBytes==0) return 0; // EOF
|
|
if (nbReadBytes != MAGICNUMBER_SIZE) EXM_THROW(41, "Unrecognized header : Magic Number unreadable");
|
|
magicNumber = LITTLE_ENDIAN_32(magicNumber); // Convert to Little Endian format
|
|
if ((magicNumber & LZ4S_SKIPPABLEMASK) == LZ4S_SKIPPABLE0) magicNumber = LZ4S_SKIPPABLE0; // fold skippable magic numbers
|
|
|
|
switch(magicNumber)
|
|
{
|
|
case LZ4S_MAGICNUMBER:
|
|
return decodeLZ4S(finput, foutput);
|
|
case LEGACY_MAGICNUMBER:
|
|
DISPLAY("Detected : Legacy format \n");
|
|
return decodeLegacyStream(finput, foutput);
|
|
case LZ4S_SKIPPABLE0:
|
|
nbReadBytes = fread(&size, 1, 4, finput);
|
|
if (nbReadBytes != 4) EXM_THROW(42, "Stream error : skippable size unreadable");
|
|
size = LITTLE_ENDIAN_32(size); // Convert to Little Endian format
|
|
errorNb = fseek(finput, size, SEEK_CUR);
|
|
if (errorNb != 0) EXM_THROW(43, "Stream error : cannot skip skippable area");
|
|
return selectDecoder(finput, foutput);
|
|
default:
|
|
if (ftell(finput) == MAGICNUMBER_SIZE) EXM_THROW(44,"Unrecognized header : file cannot be decoded"); // Wrong magic number at the beginning of 1st stream
|
|
DISPLAY("Stream followed by unrecognized data\n");
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
|
|
int decodeFile(char* input_filename, char* output_filename)
|
|
{
|
|
unsigned long long filesize = 0, decodedSize=0;
|
|
FILE* finput;
|
|
FILE* foutput;
|
|
clock_t start, end;
|
|
|
|
|
|
// Init
|
|
start = clock();
|
|
get_fileHandle(input_filename, output_filename, &finput, &foutput);
|
|
|
|
// Loop over multiple streams
|
|
do
|
|
{
|
|
decodedSize = selectDecoder(finput, foutput);
|
|
filesize += decodedSize;
|
|
} while (decodedSize);
|
|
|
|
// Final Status
|
|
end = clock();
|
|
DISPLAY( "Successfully decoded %llu bytes \n", filesize);
|
|
{
|
|
double seconds = (double)(end - start)/CLOCKS_PER_SEC;
|
|
DISPLAY( "Done in %.2f s ==> %.2f MB/s\n", seconds, (double)filesize / seconds / 1024 / 1024);
|
|
}
|
|
|
|
// Close
|
|
fclose(finput);
|
|
fclose(foutput);
|
|
|
|
// Error status = OK
|
|
return 0;
|
|
}
|
|
|
|
|
|
int main(int argc, char** argv)
|
|
{
|
|
int i,
|
|
cLevel=0,
|
|
decode=0,
|
|
bench=0,
|
|
filenamesStart=2,
|
|
legacy_format=0;
|
|
char* exename=argv[0];
|
|
char* input_filename=0;
|
|
char* output_filename=0;
|
|
char nullinput[] = NULL_INPUT;
|
|
char extension[] = EXTENSION;
|
|
|
|
// Welcome message
|
|
DISPLAY( WELCOME_MESSAGE);
|
|
|
|
if (argc<2) { badusage(exename); return 1; }
|
|
|
|
for(i=1; i<argc; i++)
|
|
{
|
|
char* argument = argv[i];
|
|
|
|
if(!argument) continue; // Protection if argument empty
|
|
|
|
// Decode command (note : aggregated commands are allowed)
|
|
if (argument[0]=='-')
|
|
{
|
|
while (argument[1]!=0)
|
|
{
|
|
argument ++;
|
|
|
|
switch(argument[0])
|
|
{
|
|
// Display help on usage
|
|
case 'H': usage(exename); usage_advanced(); return 0;
|
|
|
|
// Compression (default)
|
|
case 'c': if ((argument[1] >='0') && (argument[1] <='1')) { cLevel=argument[1] - '0'; argument++; } break;
|
|
case 'h': if (argument[1]=='c') { cLevel=1; argument++; } break;
|
|
|
|
// Checksum management
|
|
case 'x': blockChecksum=1; break;
|
|
case 'n': if (argument[1]=='x') { streamChecksum=0; argument++; break; } else { badusage(exename); return 1; }
|
|
|
|
// Use Legacy format (hidden option)
|
|
case 'l': legacy_format=1; break;
|
|
|
|
// Decoding
|
|
case 'd': decode=1; break;
|
|
|
|
// Bench
|
|
case 'b': bench=1;
|
|
if ((argument[1] >='0') && (argument[1] <='1')) { cLevel=argument[1] - '0'; argument++; }
|
|
break;
|
|
|
|
// Modify Block Size
|
|
case 'B':
|
|
if ((argument[1] >='4') && (argument[1] <='7'))
|
|
{
|
|
int B = argument[1] - '0';
|
|
int S = 1 << (8 + 2*B);
|
|
BMK_SetBlocksize(S);
|
|
blockSizeId = B;
|
|
argument++;
|
|
}
|
|
break;
|
|
|
|
// Modify Nb Iterations (benchmark only)
|
|
case 'i':
|
|
if ((argument[1] >='1') && (argument[1] <='9'))
|
|
{
|
|
int iters = argument[1] - '0';
|
|
BMK_SetNbIterations(iters);
|
|
argument++;
|
|
}
|
|
break;
|
|
|
|
// Pause at the end (benchmark only) (hidden option)
|
|
case 'p': BMK_SetPause(); break;
|
|
|
|
// Test
|
|
case 't': decode=1; output_filename=nulmark; break;
|
|
|
|
// Overwrite
|
|
case 'y': overwrite=1; break;
|
|
|
|
// Unrecognised command
|
|
default : badusage(exename); return 1;
|
|
}
|
|
}
|
|
continue;
|
|
}
|
|
|
|
// first provided filename is input
|
|
if (!input_filename) { input_filename=argument; filenamesStart=i; continue; }
|
|
|
|
// second provided filename is output
|
|
if (!output_filename)
|
|
{
|
|
output_filename=argument;
|
|
if (!strcmp (output_filename, nullinput)) output_filename = nulmark;
|
|
continue;
|
|
}
|
|
}
|
|
|
|
// No input filename ==> Error
|
|
if(!input_filename) { badusage(exename); return 1; }
|
|
|
|
if (bench) return BMK_benchFile(argv+filenamesStart, argc-filenamesStart, cLevel);
|
|
|
|
// No output filename ==> build one automatically (for compression only)
|
|
if (!output_filename)
|
|
{
|
|
if (!decode) // compression
|
|
{
|
|
int i=0, l=0;
|
|
while (input_filename[l]!=0) l++;
|
|
output_filename = (char*)calloc(1,l+5);
|
|
for (i=0;i<l;i++) output_filename[i] = input_filename[i];
|
|
for (i=l;i<l+4;i++) output_filename[i] = extension[i-l];
|
|
}
|
|
else
|
|
{
|
|
int inl=0,outl;
|
|
while (input_filename[inl]!=0) inl++;
|
|
output_filename = (char*)calloc(1,inl+1);
|
|
for (outl=0;outl<inl;outl++) output_filename[outl] = input_filename[outl];
|
|
if (inl>4)
|
|
while ((outl >= inl-4) && (input_filename[outl] == extension[outl-inl+4])) output_filename[outl--]=0;
|
|
if (outl != inl-5) output_filename = NULL;
|
|
}
|
|
if (!output_filename) { badusage(exename); return 1; }
|
|
}
|
|
|
|
if (decode) return decodeFile(input_filename, output_filename);
|
|
|
|
// compression is default action
|
|
if (legacy_format)
|
|
{
|
|
DISPLAY("! Generating compressed LZ4 using Legacy format (deprecated !) ! \n");
|
|
return legacy_compress_file(input_filename, output_filename, cLevel);
|
|
}
|
|
else
|
|
{
|
|
return compress_file(input_filename, output_filename, cLevel);
|
|
}
|
|
}
|