Add a Benchmarking Tool For Compression with Context Re-Use
This commit is contained in:
parent
6c23f03b93
commit
8c006b19bb
@ -62,7 +62,7 @@ NB_LOOPS ?= -i1
|
||||
|
||||
default: all
|
||||
|
||||
all: fullbench fuzzer frametest datagen
|
||||
all: fullbench fuzzer frametest datagen framebench
|
||||
|
||||
all32: CFLAGS+=-m32
|
||||
all32: all
|
||||
@ -98,6 +98,9 @@ fuzzer : lz4.o lz4hc.o xxhash.o fuzzer.c
|
||||
frametest: lz4frame.o lz4.o lz4hc.o xxhash.o frametest.c
|
||||
$(CC) $(FLAGS) $^ -o $@$(EXT)
|
||||
|
||||
framebench: lz4frame.o lz4.o lz4hc.o xxhash.o framebench.c
|
||||
$(CC) $(FLAGS) $^ -o $@$(EXT)
|
||||
|
||||
datagen : $(PRGDIR)/datagen.c datagencli.c
|
||||
$(CC) $(FLAGS) -I$(PRGDIR) $^ -o $@$(EXT)
|
||||
|
||||
@ -109,7 +112,8 @@ clean:
|
||||
fullbench$(EXT) fullbench32$(EXT) \
|
||||
fuzzer$(EXT) fuzzer32$(EXT) \
|
||||
frametest$(EXT) frametest32$(EXT) \
|
||||
fasttest$(EXT) datagen$(EXT) checkTag$(EXT)
|
||||
framebench$(EXT) \
|
||||
fasttest$(EXT) datagen$(EXT)
|
||||
@rm -fR $(TESTDIR)
|
||||
@echo Cleaning completed
|
||||
|
||||
|
293
tests/framebench.c
Normal file
293
tests/framebench.c
Normal file
@ -0,0 +1,293 @@
|
||||
#include <assert.h>
|
||||
#include <stdint.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
#include <sys/types.h>
|
||||
#include <sys/stat.h>
|
||||
#include <time.h>
|
||||
#include <unistd.h>
|
||||
|
||||
#include "lz4.h"
|
||||
#include "lz4frame.h"
|
||||
#include "lz4frame_static.h"
|
||||
|
||||
#define LZ4F_CHECK(x) { typeof(x) _x = (x); if (LZ4F_isError(_x)) { fprintf(stderr, "Error!: %s\n", LZ4F_getErrorName(_x)); return 0; } }
|
||||
|
||||
typedef struct {
|
||||
size_t iter;
|
||||
LZ4_stream_t *ctx;
|
||||
LZ4F_cctx *cctx;
|
||||
char *obuf;
|
||||
size_t osize;
|
||||
const char* ibuf;
|
||||
size_t isize;
|
||||
size_t num_ibuf;
|
||||
const LZ4F_CDict* cdict;
|
||||
LZ4F_preferences_t* prefs;
|
||||
const LZ4F_compressOptions_t* options;
|
||||
} bench_params_t;
|
||||
|
||||
size_t compress_frame(bench_params_t *p) {
|
||||
size_t iter = p->iter;
|
||||
char *obuf = p->obuf;
|
||||
size_t osize = p->osize;
|
||||
const char* ibuf = p->ibuf;
|
||||
size_t isize = p->isize;
|
||||
size_t num_ibuf = p->num_ibuf;
|
||||
const LZ4F_CDict* cdict = p->cdict;
|
||||
LZ4F_preferences_t* prefs = p->prefs;
|
||||
|
||||
size_t oused;
|
||||
|
||||
prefs->frameInfo.contentSize = isize;
|
||||
|
||||
oused = LZ4F_compressFrame_usingCDict(
|
||||
obuf,
|
||||
osize,
|
||||
ibuf + ((iter * 2654435761U) % num_ibuf) * isize,
|
||||
isize,
|
||||
cdict,
|
||||
prefs);
|
||||
LZ4F_CHECK(oused);
|
||||
|
||||
return oused;
|
||||
}
|
||||
|
||||
size_t compress_begin(bench_params_t *p) {
|
||||
size_t iter = p->iter;
|
||||
LZ4F_cctx *cctx = p->cctx;
|
||||
char *obuf = p->obuf;
|
||||
size_t osize = p->osize;
|
||||
const char* ibuf = p->ibuf;
|
||||
size_t isize = p->isize;
|
||||
size_t num_ibuf = p->num_ibuf;
|
||||
const LZ4F_CDict* cdict = p->cdict;
|
||||
LZ4F_preferences_t* prefs = p->prefs;
|
||||
const LZ4F_compressOptions_t* options = p->options;
|
||||
|
||||
char *oend = obuf + osize;
|
||||
size_t oused;
|
||||
|
||||
prefs->frameInfo.contentSize = isize;
|
||||
|
||||
oused = LZ4F_compressBegin_usingCDict(cctx, obuf, oend - obuf, cdict, prefs);
|
||||
LZ4F_CHECK(oused);
|
||||
obuf += oused;
|
||||
oused = LZ4F_compressUpdate(
|
||||
cctx,
|
||||
obuf,
|
||||
oend - obuf,
|
||||
ibuf + ((iter * 2654435761U) % num_ibuf) * isize,
|
||||
isize,
|
||||
options);
|
||||
LZ4F_CHECK(oused);
|
||||
obuf += oused;
|
||||
oused = LZ4F_compressEnd(cctx, obuf, oend - obuf, options);
|
||||
LZ4F_CHECK(oused);
|
||||
|
||||
return obuf - p->obuf;
|
||||
}
|
||||
|
||||
size_t compress_default(bench_params_t *p) {
|
||||
size_t iter = p->iter;
|
||||
char *obuf = p->obuf;
|
||||
size_t osize = p->osize;
|
||||
const char* ibuf = p->ibuf;
|
||||
size_t isize = p->isize;
|
||||
size_t num_ibuf = p->num_ibuf;
|
||||
|
||||
char *oend = obuf + osize;
|
||||
size_t oused;
|
||||
|
||||
oused = LZ4_compress_default(ibuf + ((iter * 2654435761U) % num_ibuf) * isize, obuf, isize, oend - obuf);
|
||||
obuf += oused;
|
||||
|
||||
return obuf - p->obuf;
|
||||
}
|
||||
|
||||
size_t compress_extState(bench_params_t *p) {
|
||||
size_t iter = p->iter;
|
||||
LZ4_stream_t *ctx = p->ctx;
|
||||
char *obuf = p->obuf;
|
||||
size_t osize = p->osize;
|
||||
const char* ibuf = p->ibuf;
|
||||
size_t isize = p->isize;
|
||||
size_t num_ibuf = p->num_ibuf;
|
||||
|
||||
char *oend = obuf + osize;
|
||||
size_t oused;
|
||||
|
||||
oused = LZ4_compress_fast_extState(ctx, ibuf + ((iter * 2654435761U) % num_ibuf) * isize, obuf, isize, oend - obuf, 0);
|
||||
obuf += oused;
|
||||
|
||||
return obuf - p->obuf;
|
||||
}
|
||||
|
||||
uint64_t bench(
|
||||
size_t (*fun)(bench_params_t *),
|
||||
uint64_t repetitions,
|
||||
bench_params_t *params,
|
||||
size_t *osizePtr
|
||||
) {
|
||||
struct timespec start, end;
|
||||
size_t i, osize = 0;
|
||||
|
||||
if (clock_gettime(CLOCK_MONOTONIC_RAW, &start)) return 0;
|
||||
|
||||
for (i = 0; i < repetitions; i++) {
|
||||
size_t o;
|
||||
params->iter = i;
|
||||
o = fun(params);
|
||||
if (!o) return 0;
|
||||
osize += o;
|
||||
}
|
||||
|
||||
if (clock_gettime(CLOCK_MONOTONIC_RAW, &end)) return 0;
|
||||
|
||||
*osizePtr = osize / repetitions;
|
||||
return (1000 * 1000 * 1000 * end.tv_sec + end.tv_nsec) - (1000 * 1000 * 1000 * start.tv_sec + start.tv_nsec);
|
||||
}
|
||||
|
||||
int main(int argc, char *argv[]) {
|
||||
|
||||
|
||||
struct stat st;
|
||||
size_t bytes_read;
|
||||
|
||||
const char *dict_fn;
|
||||
size_t dict_size;
|
||||
char *dict_buf;
|
||||
FILE *dict_file;
|
||||
|
||||
const char *in_fn;
|
||||
size_t in_size;
|
||||
size_t num_in_buf;
|
||||
size_t cur_in_buf;
|
||||
char *in_buf;
|
||||
FILE *in_file;
|
||||
|
||||
size_t out_size;
|
||||
char *out_buf;
|
||||
|
||||
LZ4_stream_t *ctx;
|
||||
LZ4F_cctx *cctx;
|
||||
LZ4F_CDict *cdict;
|
||||
LZ4F_preferences_t prefs;
|
||||
LZ4F_compressOptions_t options;
|
||||
|
||||
size_t out_used;
|
||||
|
||||
uint64_t time_taken;
|
||||
uint64_t repetitions;
|
||||
|
||||
bench_params_t params;
|
||||
|
||||
if (argc != 3) return 1;
|
||||
dict_fn = argv[1];
|
||||
in_fn = argv[2];
|
||||
|
||||
if (stat(dict_fn, &st)) return 1;
|
||||
dict_size = st.st_size;
|
||||
dict_buf = (char *)malloc(dict_size);
|
||||
if (!dict_buf) return 1;
|
||||
dict_file = fopen(dict_fn, "r");
|
||||
bytes_read = fread(dict_buf, 1, dict_size, dict_file);
|
||||
if (bytes_read != dict_size) return 1;
|
||||
|
||||
if (stat(in_fn, &st)) return 1;
|
||||
in_size = st.st_size;
|
||||
num_in_buf = 256 * 1024 * 1024 / in_size;
|
||||
if (num_in_buf == 0) {
|
||||
num_in_buf = 1;
|
||||
}
|
||||
|
||||
in_buf = (char *)malloc(in_size * num_in_buf);
|
||||
if (!in_buf) return 1;
|
||||
in_file = fopen(in_fn, "r");
|
||||
bytes_read = fread(in_buf, 1, in_size, in_file);
|
||||
if (bytes_read != in_size) return 1;
|
||||
|
||||
for(cur_in_buf = 1; cur_in_buf < num_in_buf; cur_in_buf++) {
|
||||
memcpy(in_buf + cur_in_buf * in_size, in_buf, in_size);
|
||||
}
|
||||
|
||||
if (in_size <= 1024) {
|
||||
repetitions = 100000;
|
||||
} else
|
||||
if (in_size <= 16384) {
|
||||
repetitions = 10000;
|
||||
} else
|
||||
if (in_size <= 131072) {
|
||||
repetitions = 1000;
|
||||
} else
|
||||
if (in_size <= 1048576) {
|
||||
repetitions = 100;
|
||||
} else {
|
||||
repetitions = 50;
|
||||
}
|
||||
|
||||
memset(&prefs, 0, sizeof(prefs));
|
||||
prefs.autoFlush = 1;
|
||||
if (in_size < 64 * 1024)
|
||||
prefs.frameInfo.blockMode = LZ4F_blockIndependent;
|
||||
prefs.frameInfo.contentSize = in_size;
|
||||
|
||||
memset(&options, 0, sizeof(options));
|
||||
options.stableSrc = 1;
|
||||
|
||||
out_size = LZ4F_compressFrameBound(in_size, &prefs);
|
||||
out_buf = (char *)malloc(out_size);
|
||||
if (!out_buf) return 1;
|
||||
|
||||
if (LZ4F_isError(LZ4F_createCompressionContext(&cctx, LZ4F_VERSION))) return 1;
|
||||
if (cctx == NULL) return 1;
|
||||
|
||||
ctx = LZ4_createStream();
|
||||
if (ctx == NULL) return 1;
|
||||
|
||||
cdict = LZ4F_createCDict(dict_buf, dict_size);
|
||||
if (!cdict) return 1;
|
||||
|
||||
fprintf(stderr, "dict size: %zd\n", dict_size);
|
||||
fprintf(stderr, "input size: %zd\n", in_size);
|
||||
|
||||
params.ctx = ctx;
|
||||
params.cctx = cctx;
|
||||
params.obuf = out_buf;
|
||||
params.osize = out_size;
|
||||
params.ibuf = in_buf;
|
||||
params.isize = in_size;
|
||||
params.num_ibuf = num_in_buf;
|
||||
params.cdict = NULL;
|
||||
params.prefs = &prefs;
|
||||
params.options = &options;
|
||||
|
||||
time_taken = bench(compress_default, repetitions, ¶ms, &out_used);
|
||||
|
||||
fprintf(stderr, "LZ4_compress_default : %8ld B -> %8ld B, %9ld ns/iter, %6.1lf MB/s\n", in_size, out_used, time_taken / repetitions, ((double) 1000 * in_size * repetitions) / time_taken);
|
||||
|
||||
time_taken = bench(compress_extState, repetitions, ¶ms, &out_used);
|
||||
|
||||
fprintf(stderr, "LZ4_compress_fast_extState : %8ld B -> %8ld B, %9ld ns/iter, %6.1lf MB/s\n", in_size, out_used, time_taken / repetitions, ((double) 1000 * in_size * repetitions) / time_taken);
|
||||
|
||||
time_taken = bench(compress_frame, repetitions, ¶ms, &out_used);
|
||||
|
||||
fprintf(stderr, "LZ4F_compressFrame : %8ld B -> %8ld B, %9ld ns/iter, %6.1lf MB/s\n", in_size, out_used, time_taken / repetitions, ((double) 1000 * in_size * repetitions) / time_taken);
|
||||
|
||||
time_taken = bench(compress_begin, repetitions, ¶ms, &out_used);
|
||||
|
||||
fprintf(stderr, "LZ4F_compressBegin : %8ld B -> %8ld B, %9ld ns/iter, %6.1lf MB/s\n", in_size, out_used, time_taken / repetitions, ((double) 1000 * in_size * repetitions) / time_taken);
|
||||
|
||||
params.cdict = cdict;
|
||||
|
||||
time_taken = bench(compress_frame, repetitions, ¶ms, &out_used);
|
||||
|
||||
fprintf(stderr, "LZ4F_compressFrame_usingCDict: %8ld B -> %8ld B, %9ld ns/iter, %6.1lf MB/s\n", in_size, out_used, time_taken / repetitions, ((double) 1000 * in_size * repetitions) / time_taken);
|
||||
|
||||
time_taken = bench(compress_begin, repetitions, ¶ms, &out_used);
|
||||
|
||||
fprintf(stderr, "LZ4F_compressBegin_usingCDict: %8ld B -> %8ld B, %9ld ns/iter, %6.1lf MB/s\n", in_size, out_used, time_taken / repetitions, ((double) 1000 * in_size * repetitions) / time_taken);
|
||||
|
||||
return 0;
|
||||
}
|
Loading…
Reference in New Issue
Block a user