#!/bin/sh set -e die() { println "$@" 1>&2 exit 1 } roundTripTest() { if [ -n "$3" ]; then cLevel="$3" proba="$2" else cLevel="$2" proba="" fi if [ -n "$4" ]; then dLevel="$4" else dLevel="$cLevel" fi rm -f tmp1 tmp2 println "roundTripTest: ./datagen $1 $proba | $ZSTD -v$cLevel | $ZSTD -d$dLevel" ./datagen $1 $proba | $MD5SUM > tmp1 ./datagen $1 $proba | $ZSTD --ultra -v$cLevel | $ZSTD -d$dLevel | $MD5SUM > tmp2 $DIFF -q tmp1 tmp2 } fileRoundTripTest() { if [ -n "$3" ]; then local_c="$3" local_p="$2" else local_c="$2" local_p="" fi if [ -n "$4" ]; then local_d="$4" else local_d="$local_c" fi rm -f tmp.zstd tmp.md5.1 tmp.md5.2 println "fileRoundTripTest: ./datagen $1 $local_p > tmp && $ZSTD -v$local_c -c tmp | $ZSTD -d$local_d" ./datagen $1 $local_p > tmp < tmp $MD5SUM > tmp.md5.1 $ZSTD --ultra -v$local_c -c tmp | $ZSTD -d$local_d | $MD5SUM > tmp.md5.2 $DIFF -q tmp.md5.1 tmp.md5.2 } truncateLastByte() { dd bs=1 count=$(($(wc -c < "$1") - 1)) if="$1" } println() { printf '%b\n' "${*}" } SCRIPT_DIR=$(cd "$(dirname "$0")" && pwd) PRGDIR="$SCRIPT_DIR/../programs" TESTDIR="$SCRIPT_DIR/../tests" UNAME=$(uname) isTerminal=false if [ -t 0 ] && [ -t 1 ] then isTerminal=true fi isWindows=false INTOVOID="/dev/null" case "$UNAME" in GNU) DEVDEVICE="/dev/random" ;; *) DEVDEVICE="/dev/zero" ;; esac case "$OS" in Windows*) isWindows=true INTOVOID="NUL" DEVDEVICE="NUL" ;; esac case "$UNAME" in Darwin) MD5SUM="md5 -r" ;; FreeBSD) MD5SUM="gmd5sum" ;; OpenBSD) MD5SUM="md5" ;; *) MD5SUM="md5sum" ;; esac DIFF="diff" case "$UNAME" in SunOS) DIFF="gdiff" ;; esac println "\nStarting playTests.sh isWindows=$isWindows ZSTD='$ZSTD'" [ -n "$ZSTD" ] || die "ZSTD variable must be defined!" if echo hello | $ZSTD -v -T2 2>&1 > $INTOVOID | grep -q 'multi-threading is disabled' then hasMT="" else hasMT="true" fi println "\n===> simple tests " ./datagen > tmp println "test : basic compression " $ZSTD -f tmp # trivial compression case, creates tmp.zst println "test : basic decompression" $ZSTD -df tmp.zst # trivial decompression case (overwrites tmp) println "test : too large compression level => auto-fix" $ZSTD -99 -f tmp # too large compression level, automatic sized down $ZSTD -5000000000 -f tmp && die "too large numeric value : must fail" println "test : --fast aka negative compression levels" $ZSTD --fast -f tmp # == -1 $ZSTD --fast=3 -f tmp # == -3 $ZSTD --fast=200000 -f tmp # too low compression level, automatic fixed $ZSTD --fast=5000000000 -f tmp && die "too large numeric value : must fail" $ZSTD -c --fast=0 tmp > $INTOVOID && die "--fast must not accept value 0" println "test : too large numeric argument" $ZSTD --fast=9999999999 -f tmp && die "should have refused numeric value" println "test : set compression level with environment variable ZSTD_CLEVEL" ZSTD_CLEVEL=12 $ZSTD -f tmp # positive compression level ZSTD_CLEVEL=-12 $ZSTD -f tmp # negative compression level ZSTD_CLEVEL=+12 $ZSTD -f tmp # valid: verbose '+' sign ZSTD_CLEVEL='' $ZSTD -f tmp # empty env var, warn and revert to default setting ZSTD_CLEVEL=- $ZSTD -f tmp # malformed env var, warn and revert to default setting ZSTD_CLEVEL=a $ZSTD -f tmp # malformed env var, warn and revert to default setting ZSTD_CLEVEL=+a $ZSTD -f tmp # malformed env var, warn and revert to default setting ZSTD_CLEVEL=3a7 $ZSTD -f tmp # malformed env var, warn and revert to default setting ZSTD_CLEVEL=50000000000 $ZSTD -f tmp # numeric value too large, warn and revert to default setting println "test : override ZSTD_CLEVEL with command line option" ZSTD_CLEVEL=12 $ZSTD --fast=3 -f tmp # overridden by command line option println "test : compress to stdout" $ZSTD tmp -c > tmpCompressed $ZSTD tmp --stdout > tmpCompressed # long command format println "test : compress to named file" rm tmpCompressed $ZSTD tmp -o tmpCompressed test -f tmpCompressed # file must be created println "test : -o must be followed by filename (must fail)" $ZSTD tmp -of tmpCompressed && die "-o must be followed by filename " println "test : force write, correct order" $ZSTD tmp -fo tmpCompressed println "test : forgotten argument" cp tmp tmp2 $ZSTD tmp2 -fo && die "-o must be followed by filename " println "test : implied stdout when input is stdin" println bob | $ZSTD | $ZSTD -d if [ "$isTerminal" = true ]; then println "test : compressed data to terminal" println bob | $ZSTD && die "should have refused : compressed data to terminal" println "test : compressed data from terminal (a hang here is a test fail, zstd is wrongly waiting on data from terminal)" $ZSTD -d > $INTOVOID && die "should have refused : compressed data from terminal" fi println "test : null-length file roundtrip" println -n '' | $ZSTD - --stdout | $ZSTD -d --stdout println "test : ensure small file doesn't add 3-bytes null block" ./datagen -g1 > tmp1 $ZSTD tmp1 -c | wc -c | grep "14" $ZSTD < tmp1 | wc -c | grep "14" println "test : decompress file with wrong suffix (must fail)" $ZSTD -d tmpCompressed && die "wrong suffix error not detected!" $ZSTD -df tmp && die "should have refused : wrong extension" println "test : decompress into stdout" $ZSTD -d tmpCompressed -c > tmpResult # decompression using stdout $ZSTD --decompress tmpCompressed -c > tmpResult $ZSTD --decompress tmpCompressed --stdout > tmpResult println "test : decompress from stdin into stdout" $ZSTD -dc < tmp.zst > $INTOVOID # combine decompression, stdin & stdout $ZSTD -dc - < tmp.zst > $INTOVOID $ZSTD -d < tmp.zst > $INTOVOID # implicit stdout when stdin is used $ZSTD -d - < tmp.zst > $INTOVOID println "test : impose memory limitation (must fail)" $ZSTD -d -f tmp.zst -M2K -c > $INTOVOID && die "decompression needs more memory than allowed" $ZSTD -d -f tmp.zst --memlimit=2K -c > $INTOVOID && die "decompression needs more memory than allowed" # long command $ZSTD -d -f tmp.zst --memory=2K -c > $INTOVOID && die "decompression needs more memory than allowed" # long command $ZSTD -d -f tmp.zst --memlimit-decompress=2K -c > $INTOVOID && die "decompression needs more memory than allowed" # long command println "test : overwrite protection" $ZSTD -q tmp && die "overwrite check failed!" println "test : force overwrite" $ZSTD -q -f tmp $ZSTD -q --force tmp println "test : overwrite readonly file" rm -f tmpro tmpro.zst println foo > tmpro.zst println foo > tmpro chmod 400 tmpro.zst $ZSTD -q tmpro && die "should have refused to overwrite read-only file" $ZSTD -q -f tmpro println "test: --no-progress flag" $ZSTD tmpro -c --no-progress | $ZSTD -d -f -o "$INTOVOID" --no-progress $ZSTD tmpro -cv --no-progress | $ZSTD -dv -f -o "$INTOVOID" --no-progress rm -f tmpro tmpro.zst println "test: overwrite input file (must fail)" $ZSTD tmp -fo tmp && die "zstd compression overwrote the input file" $ZSTD tmp.zst -dfo tmp.zst && die "zstd decompression overwrote the input file" println "test: detect that input file does not exist" $ZSTD nothere && die "zstd hasn't detected that input file does not exist" println "test: --[no-]compress-literals" $ZSTD tmp -c --no-compress-literals -1 | $ZSTD -t $ZSTD tmp -c --no-compress-literals --fast=1 | $ZSTD -t $ZSTD tmp -c --no-compress-literals -19 | $ZSTD -t $ZSTD tmp -c --compress-literals -1 | $ZSTD -t $ZSTD tmp -c --compress-literals --fast=1 | $ZSTD -t $ZSTD tmp -c --compress-literals -19 | $ZSTD -t $ZSTD -b --fast=1 -i1e1 tmp --compress-literals $ZSTD -b --fast=1 -i1e1 tmp --no-compress-literals println "test : file removal" $ZSTD -f --rm tmp test ! -f tmp # tmp should no longer be present $ZSTD -f -d --rm tmp.zst test ! -f tmp.zst # tmp.zst should no longer be present println "test : should quietly not remove non-regular file" println hello > tmp $ZSTD tmp -f -o "$DEVDEVICE" 2>tmplog > "$INTOVOID" grep -v "Refusing to remove non-regular file" tmplog rm -f tmplog $ZSTD tmp -f -o "$INTOVOID" 2>&1 | grep -v "Refusing to remove non-regular file" println "test : --rm on stdin" println a | $ZSTD --rm > $INTOVOID # --rm should remain silent rm tmp $ZSTD -f tmp && die "tmp not present : should have failed" test ! -f tmp.zst # tmp.zst should not be created println "test : -d -f do not delete destination when source is not present" touch tmp # create destination file $ZSTD -d -f tmp.zst && die "attempt to decompress a non existing file" test -f tmp # destination file should still be present println "test : -f do not delete destination when source is not present" rm tmp # erase source file touch tmp.zst # create destination file $ZSTD -f tmp && die "attempt to compress a non existing file" test -f tmp.zst # destination file should still be present rm tmp* println "test : compress multiple files" println hello > tmp1 println world > tmp2 $ZSTD tmp1 tmp2 -o "$INTOVOID" -f $ZSTD tmp1 tmp2 -c | $ZSTD -t $ZSTD tmp1 tmp2 -o tmp.zst test ! -f tmp1.zst test ! -f tmp2.zst $ZSTD tmp1 tmp2 $ZSTD -t tmp1.zst tmp2.zst $ZSTD -dc tmp1.zst tmp2.zst $ZSTD tmp1.zst tmp2.zst -o "$INTOVOID" -f $ZSTD -d tmp1.zst tmp2.zst -o tmp touch tmpexists $ZSTD tmp1 tmp2 -f -o tmpexists $ZSTD tmp1 tmp2 -o tmpexists && die "should have refused to overwrite" # Bug: PR #972 if [ "$?" -eq 139 ]; then die "should not have segfaulted" fi rm tmp* println "\n===> Advanced compression parameters " println "Hello world!" | $ZSTD --zstd=windowLog=21, - -o tmp.zst && die "wrong parameters not detected!" println "Hello world!" | $ZSTD --zstd=windowLo=21 - -o tmp.zst && die "wrong parameters not detected!" println "Hello world!" | $ZSTD --zstd=windowLog=21,slog - -o tmp.zst && die "wrong parameters not detected!" println "Hello world!" | $ZSTD --zstd=strategy=10 - -o tmp.zst && die "parameter out of bound not detected!" # > btultra2 : does not exist test ! -f tmp.zst # tmp.zst should not be created roundTripTest -g512K roundTripTest -g512K " --zstd=mml=3,tlen=48,strat=6" roundTripTest -g512K " --zstd=strat=6,wlog=23,clog=23,hlog=22,slog=6" roundTripTest -g512K " --zstd=windowLog=23,chainLog=23,hashLog=22,searchLog=6,minMatch=3,targetLength=48,strategy=6" roundTripTest -g512K " --single-thread --long --zstd=ldmHashLog=20,ldmMinMatch=64,ldmBucketSizeLog=1,ldmHashRateLog=7" roundTripTest -g512K " --single-thread --long --zstd=lhlog=20,lmml=64,lblog=1,lhrlog=7" roundTripTest -g64K "19 --zstd=strat=9" # btultra2 println "\n===> Pass-Through mode " println "Hello world 1!" | $ZSTD -df println "Hello world 2!" | $ZSTD -dcf println "Hello world 3!" > tmp1 $ZSTD -dcf tmp1 println "\n===> frame concatenation " println "hello " > hello.tmp println "world!" > world.tmp cat hello.tmp world.tmp > helloworld.tmp $ZSTD -c hello.tmp > hello.zstd $ZSTD -c world.tmp > world.zstd cat hello.zstd world.zstd > helloworld.zstd $ZSTD -dc helloworld.zstd > result.tmp cat result.tmp $DIFF helloworld.tmp result.tmp println "frame concatenation without checksum" $ZSTD -c hello.tmp > hello.zstd --no-check $ZSTD -c world.tmp > world.zstd --no-check cat hello.zstd world.zstd > helloworld.zstd $ZSTD -dc helloworld.zstd > result.tmp $DIFF helloworld.tmp result.tmp println "testing zstdcat symlink" ln -sf $ZSTD zstdcat ./zstdcat helloworld.zstd > result.tmp $DIFF helloworld.tmp result.tmp ln -s helloworld.zstd helloworld.link.zstd ./zstdcat helloworld.link.zstd > result.tmp $DIFF helloworld.tmp result.tmp rm zstdcat rm result.tmp println "testing zcat symlink" ln -sf $ZSTD zcat ./zcat helloworld.zstd > result.tmp $DIFF helloworld.tmp result.tmp ./zcat helloworld.link.zstd > result.tmp $DIFF helloworld.tmp result.tmp rm zcat rm ./*.tmp ./*.zstd println "frame concatenation tests completed" if [ "$isWindows" = false ] && [ "$UNAME" != 'SunOS' ] && [ "$UNAME" != "OpenBSD" ] ; then println "\n**** flush write error test **** " println "println foo | $ZSTD > /dev/full" println foo | $ZSTD > /dev/full && die "write error not detected!" println "println foo | $ZSTD | $ZSTD -d > /dev/full" println foo | $ZSTD | $ZSTD -d > /dev/full && die "write error not detected!" fi if [ "$isWindows" = false ] && [ "$UNAME" != 'SunOS' ] ; then println "\n===> symbolic link test " rm -f hello.tmp world.tmp world2.tmp hello.tmp.zst world.tmp.zst println "hello world" > hello.tmp ln -s hello.tmp world.tmp ln -s hello.tmp world2.tmp $ZSTD world.tmp hello.tmp || true test -f hello.tmp.zst # regular file should have been compressed! test ! -f world.tmp.zst # symbolic link should not have been compressed! $ZSTD world.tmp || true test ! -f world.tmp.zst # symbolic link should not have been compressed! $ZSTD world.tmp world2.tmp || true test ! -f world.tmp.zst # symbolic link should not have been compressed! test ! -f world2.tmp.zst # symbolic link should not have been compressed! $ZSTD world.tmp hello.tmp -f test -f world.tmp.zst # symbolic link should have been compressed with --force rm -f hello.tmp world.tmp world2.tmp hello.tmp.zst world.tmp.zst fi println "\n===> test sparse file support " ./datagen -g5M -P100 > tmpSparse $ZSTD tmpSparse -c | $ZSTD -dv -o tmpSparseRegen $DIFF -s tmpSparse tmpSparseRegen $ZSTD tmpSparse -c | $ZSTD -dv --sparse -c > tmpOutSparse $DIFF -s tmpSparse tmpOutSparse $ZSTD tmpSparse -c | $ZSTD -dv --no-sparse -c > tmpOutNoSparse $DIFF -s tmpSparse tmpOutNoSparse ls -ls tmpSparse* # look at file size and block size on disk ./datagen -s1 -g1200007 -P100 | $ZSTD | $ZSTD -dv --sparse -c > tmpSparseOdd # Odd size file (to not finish on an exact nb of blocks) ./datagen -s1 -g1200007 -P100 | $DIFF -s - tmpSparseOdd ls -ls tmpSparseOdd # look at file size and block size on disk println "\n Sparse Compatibility with Console :" println "Hello World 1 !" | $ZSTD | $ZSTD -d -c println "Hello World 2 !" | $ZSTD | $ZSTD -d | cat println "\n Sparse Compatibility with Append :" ./datagen -P100 -g1M > tmpSparse1M cat tmpSparse1M tmpSparse1M > tmpSparse2M $ZSTD -v -f tmpSparse1M -o tmpSparseCompressed $ZSTD -d -v -f tmpSparseCompressed -o tmpSparseRegenerated $ZSTD -d -v -f tmpSparseCompressed -c >> tmpSparseRegenerated ls -ls tmpSparse* # look at file size and block size on disk $DIFF tmpSparse2M tmpSparseRegenerated rm tmpSparse* println "\n===> multiple files tests " ./datagen -s1 > tmp1 2> $INTOVOID ./datagen -s2 -g100K > tmp2 2> $INTOVOID ./datagen -s3 -g1M > tmp3 2> $INTOVOID println "compress tmp* : " $ZSTD -f tmp* ls -ls tmp* rm tmp1 tmp2 tmp3 println "decompress tmp* : " $ZSTD -df ./*.zst ls -ls tmp* println "compress tmp* into stdout > tmpall : " $ZSTD -c tmp1 tmp2 tmp3 > tmpall ls -ls tmp* # check size of tmpall (should be tmp1.zst + tmp2.zst + tmp3.zst) println "decompress tmpall* into stdout > tmpdec : " cp tmpall tmpall2 $ZSTD -dc tmpall* > tmpdec ls -ls tmp* # check size of tmpdec (should be 2*(tmp1 + tmp2 + tmp3)) println "compress multiple files including a missing one (notHere) : " $ZSTD -f tmp1 notHere tmp2 && die "missing file not detected!" println "\n===> stream-size mode" ./datagen -g11000 > tmp println "test : basic file compression vs sized streaming compression" file_size=$($ZSTD -14 -f tmp -o tmp.zst && wc -c < tmp.zst) stream_size=$(cat tmp | $ZSTD -14 --stream-size=11000 | wc -c) if [ "$stream_size" -gt "$file_size" ]; then die "hinted compression larger than expected" fi println "test : sized streaming compression and decompression" cat tmp | $ZSTD -14 -f tmp -o --stream-size=11000 tmp.zst $ZSTD -df tmp.zst -o tmp_decompress cmp tmp tmp_decompress || die "difference between original and decompressed file" println "test : incorrect stream size" cat tmp | $ZSTD -14 -f -o tmp.zst --stream-size=11001 && die "should fail with incorrect stream size" println "\n===> size-hint mode" ./datagen -g11000 > tmp ./datagen -g11000 > tmp2 ./datagen > tmpDict println "test : basic file compression vs hinted streaming compression" file_size=$($ZSTD -14 -f tmp -o tmp.zst && wc -c < tmp.zst) stream_size=$(cat tmp | $ZSTD -14 --size-hint=11000 | wc -c) if [ "$stream_size" -ge "$file_size" ]; then die "hinted compression larger than expected" fi println "test : hinted streaming compression and decompression" cat tmp | $ZSTD -14 -f -o tmp.zst --size-hint=11000 $ZSTD -df tmp.zst -o tmp_decompress cmp tmp tmp_decompress || die "difference between original and decompressed file" println "test : hinted streaming compression with dictionary" cat tmp | $ZSTD -14 -f -D tmpDict --size-hint=11000 | $ZSTD -t -D tmpDict println "test : multiple file compression with hints and dictionary" $ZSTD -14 -f -D tmpDict --size-hint=11000 tmp tmp2 $ZSTD -14 -f -o tmp1_.zst -D tmpDict --size-hint=11000 tmp $ZSTD -14 -f -o tmp2_.zst -D tmpDict --size-hint=11000 tmp2 cmp tmp.zst tmp1_.zst || die "first file's output differs" cmp tmp2.zst tmp2_.zst || die "second file's output differs" println "test : incorrect hinted stream sizes" cat tmp | $ZSTD -14 -f --size-hint=11050 | $ZSTD -t # slightly too high cat tmp | $ZSTD -14 -f --size-hint=10950 | $ZSTD -t # slightly too low cat tmp | $ZSTD -14 -f --size-hint=22000 | $ZSTD -t # considerably too high cat tmp | $ZSTD -14 -f --size-hint=5500 | $ZSTD -t # considerably too low println "\n===> dictionary tests " println "- test with raw dict (content only) " ./datagen > tmpDict ./datagen -g1M | $MD5SUM > tmp1 ./datagen -g1M | $ZSTD -D tmpDict | $ZSTD -D tmpDict -dvq | $MD5SUM > tmp2 $DIFF -q tmp1 tmp2 println "- Create first dictionary " TESTFILE="$PRGDIR"/zstdcli.c $ZSTD --train "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict cp "$TESTFILE" tmp println "- Test dictionary compression with tmpDict as an input file and dictionary" $ZSTD -f tmpDict -D tmpDict && die "compression error not detected!" println "- Dictionary compression roundtrip" $ZSTD -f tmp -D tmpDict $ZSTD -d tmp.zst -D tmpDict -fo result $DIFF "$TESTFILE" result println "- Dictionary compression with btlazy2 strategy" $ZSTD -f tmp -D tmpDict --zstd=strategy=6 $ZSTD -d tmp.zst -D tmpDict -fo result $DIFF "$TESTFILE" result if [ -n "$hasMT" ] then println "- Test dictionary compression with multithreading " ./datagen -g5M | $ZSTD -T2 -D tmpDict | $ZSTD -t -D tmpDict # fails with v1.3.2 fi println "- Create second (different) dictionary " $ZSTD --train "$TESTDIR"/*.c "$PRGDIR"/*.c "$PRGDIR"/*.h -o tmpDictC $ZSTD -d tmp.zst -D tmpDictC -fo result && die "wrong dictionary not detected!" println "- Create dictionary with short dictID" $ZSTD --train "$TESTDIR"/*.c "$PRGDIR"/*.c --dictID=1 -o tmpDict1 cmp tmpDict tmpDict1 && die "dictionaries should have different ID !" println "- Create dictionary with wrong dictID parameter order (must fail)" $ZSTD --train "$TESTDIR"/*.c "$PRGDIR"/*.c --dictID -o 1 tmpDict1 && die "wrong order : --dictID must be followed by argument " println "- Create dictionary with size limit" $ZSTD --train "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict2 --maxdict=4K -v println "- Create dictionary with small size limit" $ZSTD --train "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict3 --maxdict=1K -v println "- Create dictionary with wrong parameter order (must fail)" $ZSTD --train "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict3 --maxdict -v 4K && die "wrong order : --maxdict must be followed by argument " println "- Compress without dictID" $ZSTD -f tmp -D tmpDict1 --no-dictID $ZSTD -d tmp.zst -D tmpDict -fo result $DIFF "$TESTFILE" result println "- Compress with wrong argument order (must fail)" $ZSTD tmp -Df tmpDict1 -c > $INTOVOID && die "-D must be followed by dictionary name " println "- Compress multiple files with dictionary" rm -rf dirTestDict mkdir dirTestDict cp "$TESTDIR"/*.c dirTestDict cp "$PRGDIR"/*.c dirTestDict cp "$PRGDIR"/*.h dirTestDict $MD5SUM dirTestDict/* > tmph1 $ZSTD -f --rm dirTestDict/* -D tmpDictC $ZSTD -d --rm dirTestDict/*.zst -D tmpDictC # note : use internal checksum by default case "$UNAME" in Darwin) println "md5sum -c not supported on OS-X : test skipped" ;; # not compatible with OS-X's md5 *) $MD5SUM -c tmph1 ;; esac rm -rf dirTestDict println "- dictionary builder on bogus input" println "Hello World" > tmp $ZSTD --train-legacy -q tmp && die "Dictionary training should fail : not enough input source" ./datagen -P0 -g10M > tmp $ZSTD --train-legacy -q tmp && die "Dictionary training should fail : source is pure noise" println "- Test -o before --train" rm -f tmpDict dictionary $ZSTD -o tmpDict --train "$TESTDIR"/*.c "$PRGDIR"/*.c test -f tmpDict $ZSTD --train "$TESTDIR"/*.c "$PRGDIR"/*.c test -f dictionary rm tmp* dictionary println "\n===> fastCover dictionary builder : advanced options " TESTFILE="$PRGDIR"/zstdcli.c ./datagen > tmpDict println "- Create first dictionary" $ZSTD --train-fastcover=k=46,d=8,f=15,split=80 "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict cp "$TESTFILE" tmp $ZSTD -f tmp -D tmpDict $ZSTD -d tmp.zst -D tmpDict -fo result $DIFF "$TESTFILE" result println "- Create second (different) dictionary" $ZSTD --train-fastcover=k=56,d=8 "$TESTDIR"/*.c "$PRGDIR"/*.c "$PRGDIR"/*.h -o tmpDictC $ZSTD -d tmp.zst -D tmpDictC -fo result && die "wrong dictionary not detected!" $ZSTD --train-fastcover=k=56,d=8 && die "Create dictionary without input file" println "- Create dictionary with short dictID" $ZSTD --train-fastcover=k=46,d=8,f=15,split=80 "$TESTDIR"/*.c "$PRGDIR"/*.c --dictID=1 -o tmpDict1 cmp tmpDict tmpDict1 && die "dictionaries should have different ID !" println "- Create dictionaries with shrink-dict flag enabled" $ZSTD --train-fastcover=steps=256,shrink "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpShrinkDict $ZSTD --train-fastcover=steps=256,shrink=1 "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpShrinkDict1 $ZSTD --train-fastcover=steps=256,shrink=5 "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpShrinkDict2 println "- Create dictionary with size limit" $ZSTD --train-fastcover=steps=8 "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict2 --maxdict=4K println "- Compare size of dictionary from 90% training samples with 80% training samples" $ZSTD --train-fastcover=split=90 -r "$TESTDIR"/*.c "$PRGDIR"/*.c $ZSTD --train-fastcover=split=80 -r "$TESTDIR"/*.c "$PRGDIR"/*.c println "- Create dictionary using all samples for both training and testing" $ZSTD --train-fastcover=split=100 -r "$TESTDIR"/*.c "$PRGDIR"/*.c println "- Create dictionary using f=16" $ZSTD --train-fastcover=f=16 -r "$TESTDIR"/*.c "$PRGDIR"/*.c $ZSTD --train-fastcover=accel=15 -r "$TESTDIR"/*.c "$PRGDIR"/*.c && die "Created dictionary using accel=15" println "- Create dictionary using accel=2" $ZSTD --train-fastcover=accel=2 -r "$TESTDIR"/*.c "$PRGDIR"/*.c println "- Create dictionary using accel=10" $ZSTD --train-fastcover=accel=10 -r "$TESTDIR"/*.c "$PRGDIR"/*.c println "- Create dictionary with multithreading" $ZSTD --train-fastcover -T4 -r "$TESTDIR"/*.c "$PRGDIR"/*.c println "- Test -o before --train-fastcover" rm -f tmpDict dictionary $ZSTD -o tmpDict --train-fastcover "$TESTDIR"/*.c "$PRGDIR"/*.c test -f tmpDict $ZSTD --train-fastcover "$TESTDIR"/*.c "$PRGDIR"/*.c test -f dictionary rm tmp* dictionary println "\n===> legacy dictionary builder " TESTFILE="$PRGDIR"/zstdcli.c ./datagen > tmpDict println "- Create first dictionary" $ZSTD --train-legacy=selectivity=8 "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict cp "$TESTFILE" tmp $ZSTD -f tmp -D tmpDict $ZSTD -d tmp.zst -D tmpDict -fo result $DIFF "$TESTFILE" result $ZSTD --train-legacy=s=8 && die "Create dictionary without input files (should error)" println "- Create second (different) dictionary" $ZSTD --train-legacy=s=5 "$TESTDIR"/*.c "$PRGDIR"/*.c "$PRGDIR"/*.h -o tmpDictC $ZSTD -d tmp.zst -D tmpDictC -fo result && die "wrong dictionary not detected!" println "- Create dictionary with short dictID" $ZSTD --train-legacy -s5 "$TESTDIR"/*.c "$PRGDIR"/*.c --dictID=1 -o tmpDict1 cmp tmpDict tmpDict1 && die "dictionaries should have different ID !" println "- Create dictionary with size limit" $ZSTD --train-legacy -s9 "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict2 --maxdict=4K println "- Test -o before --train-legacy" rm -f tmpDict dictionary $ZSTD -o tmpDict --train-legacy "$TESTDIR"/*.c "$PRGDIR"/*.c test -f tmpDict $ZSTD --train-legacy "$TESTDIR"/*.c "$PRGDIR"/*.c test -f dictionary rm tmp* dictionary println "\n===> integrity tests " println "test one file (tmp1.zst) " ./datagen > tmp1 $ZSTD tmp1 $ZSTD -t tmp1.zst $ZSTD --test tmp1.zst println "test multiple files (*.zst) " $ZSTD -t ./*.zst println "test bad files (*) " $ZSTD -t ./* && die "bad files not detected !" $ZSTD -t tmp1 && die "bad file not detected !" cp tmp1 tmp2.zst $ZSTD -t tmp2.zst && die "bad file not detected !" ./datagen -g0 > tmp3 $ZSTD -t tmp3 && die "bad file not detected !" # detects 0-sized files as bad println "test --rm and --test combined " $ZSTD -t --rm tmp1.zst test -f tmp1.zst # check file is still present split -b16384 tmp1.zst tmpSplit. $ZSTD -t tmpSplit.* && die "bad file not detected !" ./datagen | $ZSTD -c | $ZSTD -t println "\n===> golden files tests " $ZSTD -t -r "$TESTDIR/files" $ZSTD -c -r "$TESTDIR/files" | $ZSTD -t println "\n===> benchmark mode tests " println "bench one file" ./datagen > tmp1 $ZSTD -bi0 tmp1 println "bench multiple levels" $ZSTD -i0b0e3 tmp1 println "bench negative level" $ZSTD -bi0 --fast tmp1 println "with recursive and quiet modes" $ZSTD -rqi1b1e2 tmp1 println "benchmark decompression only" $ZSTD -f tmp1 $ZSTD -b -d -i1 tmp1.zst println "\n===> zstd compatibility tests " ./datagen > tmp rm -f tmp.zst $ZSTD --format=zstd -f tmp test -f tmp.zst println "\n===> gzip compatibility tests " GZIPMODE=1 $ZSTD --format=gzip -V || GZIPMODE=0 if [ $GZIPMODE -eq 1 ]; then println "gzip support detected" GZIPEXE=1 gzip -V || GZIPEXE=0 if [ $GZIPEXE -eq 1 ]; then ./datagen > tmp $ZSTD --format=gzip -f tmp gzip -t -v tmp.gz gzip -f tmp $ZSTD -d -f -v tmp.gz rm tmp* else println "gzip binary not detected" fi else println "gzip mode not supported" fi println "\n===> gzip frame tests " if [ $GZIPMODE -eq 1 ]; then ./datagen > tmp $ZSTD -f --format=gzip tmp $ZSTD -f tmp cat tmp.gz tmp.zst tmp.gz tmp.zst | $ZSTD -d -f -o tmp truncateLastByte tmp.gz | $ZSTD -t > $INTOVOID && die "incomplete frame not detected !" rm tmp* else println "gzip mode not supported" fi if [ $GZIPMODE -eq 1 ]; then ./datagen > tmp rm -f tmp.zst $ZSTD --format=gzip --format=zstd -f tmp test -f tmp.zst fi println "\n===> xz compatibility tests " LZMAMODE=1 $ZSTD --format=xz -V || LZMAMODE=0 if [ $LZMAMODE -eq 1 ]; then println "xz support detected" XZEXE=1 xz -Q -V && lzma -Q -V || XZEXE=0 if [ $XZEXE -eq 1 ]; then println "Testing zstd xz and lzma support" ./datagen > tmp $ZSTD --format=lzma -f tmp $ZSTD --format=xz -f tmp xz -Q -t -v tmp.xz xz -Q -t -v tmp.lzma xz -Q -f -k tmp lzma -Q -f -k --lzma1 tmp $ZSTD -d -f -v tmp.xz $ZSTD -d -f -v tmp.lzma rm tmp* println "Creating symlinks" ln -s $ZSTD ./xz ln -s $ZSTD ./unxz ln -s $ZSTD ./lzma ln -s $ZSTD ./unlzma println "Testing xz and lzma symlinks" ./datagen > tmp ./xz tmp xz -Q -d tmp.xz ./lzma tmp lzma -Q -d tmp.lzma println "Testing unxz and unlzma symlinks" xz -Q tmp ./xz -d tmp.xz lzma -Q tmp ./lzma -d tmp.lzma rm xz unxz lzma unlzma rm tmp* else println "xz binary not detected" fi else println "xz mode not supported" fi println "\n===> xz frame tests " if [ $LZMAMODE -eq 1 ]; then ./datagen > tmp $ZSTD -f --format=xz tmp $ZSTD -f --format=lzma tmp $ZSTD -f tmp cat tmp.xz tmp.lzma tmp.zst tmp.lzma tmp.xz tmp.zst | $ZSTD -d -f -o tmp truncateLastByte tmp.xz | $ZSTD -t > $INTOVOID && die "incomplete frame not detected !" truncateLastByte tmp.lzma | $ZSTD -t > $INTOVOID && die "incomplete frame not detected !" rm tmp* else println "xz mode not supported" fi println "\n===> lz4 compatibility tests " LZ4MODE=1 $ZSTD --format=lz4 -V || LZ4MODE=0 if [ $LZ4MODE -eq 1 ]; then println "lz4 support detected" LZ4EXE=1 lz4 -V || LZ4EXE=0 if [ $LZ4EXE -eq 1 ]; then ./datagen > tmp $ZSTD --format=lz4 -f tmp lz4 -t -v tmp.lz4 lz4 -f tmp $ZSTD -d -f -v tmp.lz4 rm tmp* else println "lz4 binary not detected" fi else println "lz4 mode not supported" fi println "\n===> lz4 frame tests " if [ $LZ4MODE -eq 1 ]; then ./datagen > tmp $ZSTD -f --format=lz4 tmp $ZSTD -f tmp cat tmp.lz4 tmp.zst tmp.lz4 tmp.zst | $ZSTD -d -f -o tmp truncateLastByte tmp.lz4 | $ZSTD -t > $INTOVOID && die "incomplete frame not detected !" rm tmp* else println "lz4 mode not supported" fi println "\n===> suffix list test" ! $ZSTD -d tmp.abc 2> tmplg if [ $GZIPMODE -ne 1 ]; then grep ".gz" tmplg > $INTOVOID && die "Unsupported suffix listed" fi if [ $LZMAMODE -ne 1 ]; then grep ".lzma" tmplg > $INTOVOID && die "Unsupported suffix listed" grep ".xz" tmplg > $INTOVOID && die "Unsupported suffix listed" fi if [ $LZ4MODE -ne 1 ]; then grep ".lz4" tmplg > $INTOVOID && die "Unsupported suffix listed" fi println "\n===> zstd round-trip tests " roundTripTest roundTripTest -g15K # TableID==3 roundTripTest -g127K # TableID==2 roundTripTest -g255K # TableID==1 roundTripTest -g522K # TableID==0 roundTripTest -g519K 6 # greedy, hash chain roundTripTest -g517K 16 # btlazy2 roundTripTest -g516K 19 # btopt fileRoundTripTest -g500K println "\n===> zstd long distance matching round-trip tests " roundTripTest -g0 "2 --single-thread --long" roundTripTest -g1000K "1 --single-thread --long" roundTripTest -g517K "6 --single-thread --long" roundTripTest -g516K "16 --single-thread --long" roundTripTest -g518K "19 --single-thread --long" fileRoundTripTest -g5M "3 --single-thread --long" roundTripTest -g96K "5 --single-thread" if [ -n "$hasMT" ] then println "\n===> zstdmt round-trip tests " roundTripTest -g4M "1 -T0" roundTripTest -g8M "3 -T2" roundTripTest -g8000K "2 --threads=2" fileRoundTripTest -g4M "19 -T2 -B1M" println "\n===> zstdmt long distance matching round-trip tests " roundTripTest -g8M "3 --long=24 -T2" println "\n===> ovLog tests " ./datagen -g2MB > tmp refSize=$($ZSTD tmp -6 -c --zstd=wlog=18 | wc -c) ov9Size=$($ZSTD tmp -6 -c --zstd=wlog=18,ovlog=9 | wc -c) ov1Size=$($ZSTD tmp -6 -c --zstd=wlog=18,ovlog=1 | wc -c) if [ "$refSize" -eq "$ov9Size" ]; then echo ov9Size should be different from refSize exit 1 fi if [ "$refSize" -eq "$ov1Size" ]; then echo ov1Size should be different from refSize exit 1 fi if [ "$ov9Size" -ge "$ov1Size" ]; then echo ov9Size="$ov9Size" should be smaller than ov1Size="$ov1Size" exit 1 fi else println "\n===> no multithreading, skipping zstdmt tests " fi rm tmp* println "\n===> zstd --list/-l single frame tests " ./datagen > tmp1 ./datagen > tmp2 ./datagen > tmp3 $ZSTD tmp* $ZSTD -l ./*.zst $ZSTD -lv ./*.zst | grep "Decompressed Size:" # check that decompressed size is present in header $ZSTD --list ./*.zst $ZSTD --list -v ./*.zst println "\n===> zstd --list/-l multiple frame tests " cat tmp1.zst tmp2.zst > tmp12.zst cat tmp12.zst tmp3.zst > tmp123.zst $ZSTD -l ./*.zst $ZSTD -lv ./*.zst println "\n===> zstd --list/-l error detection tests " $ZSTD -l tmp1 tmp1.zst && die "-l must fail on non-zstd file" $ZSTD --list tmp* && die "-l must fail on non-zstd file" $ZSTD -lv tmp1* && die "-l must fail on non-zstd file" $ZSTD --list -v tmp2 tmp12.zst && die "-l must fail on non-zstd file" println "test : detect truncated compressed file " TEST_DATA_FILE=truncatable-input.txt FULL_COMPRESSED_FILE=${TEST_DATA_FILE}.zst TRUNCATED_COMPRESSED_FILE=truncated-input.txt.zst ./datagen -g50000 > $TEST_DATA_FILE $ZSTD -f $TEST_DATA_FILE -o $FULL_COMPRESSED_FILE dd bs=1 count=100 if=$FULL_COMPRESSED_FILE of=$TRUNCATED_COMPRESSED_FILE $ZSTD --list $TRUNCATED_COMPRESSED_FILE && die "-l must fail on truncated file" rm $TEST_DATA_FILE rm $FULL_COMPRESSED_FILE rm $TRUNCATED_COMPRESSED_FILE println "\n===> zstd --list/-l errors when presented with stdin / no files" $ZSTD -l && die "-l must fail on empty list of files" $ZSTD -l - && die "-l does not work on stdin" $ZSTD -l < tmp1.zst && die "-l does not work on stdin" $ZSTD -l - < tmp1.zst && die "-l does not work on stdin" $ZSTD -l - tmp1.zst && die "-l does not work on stdin" $ZSTD -l - tmp1.zst < tmp1.zst && die "-l does not work on stdin" $ZSTD -l tmp1.zst < tmp2.zst # this will check tmp1.zst, but not tmp2.zst, which is not an error : zstd simply doesn't read stdin in this case. It must not error just because stdin is not a tty println "\n===> zstd --list/-l test with null files " ./datagen -g0 > tmp5 $ZSTD tmp5 $ZSTD -l tmp5.zst $ZSTD -l tmp5* && die "-l must fail on non-zstd file" $ZSTD -lv tmp5.zst | grep "Decompressed Size: 0.00 KB (0 B)" # check that 0 size is present in header $ZSTD -lv tmp5* && die "-l must fail on non-zstd file" println "\n===> zstd --list/-l test with no content size field " ./datagen -g513K | $ZSTD > tmp6.zst $ZSTD -l tmp6.zst $ZSTD -lv tmp6.zst | grep "Decompressed Size:" && die "Field :Decompressed Size: should not be available in this compressed file" println "\n===> zstd --list/-l test with no checksum " $ZSTD -f --no-check tmp1 $ZSTD -l tmp1.zst $ZSTD -lv tmp1.zst rm tmp* println "\n===> zstd long distance matching tests " roundTripTest -g0 " --single-thread --long" roundTripTest -g9M "2 --single-thread --long" # Test parameter parsing roundTripTest -g1M -P50 "1 --single-thread --long=29" " --memory=512MB" roundTripTest -g1M -P50 "1 --single-thread --long=29 --zstd=wlog=28" " --memory=256MB" roundTripTest -g1M -P50 "1 --single-thread --long=29" " --long=28 --memory=512MB" roundTripTest -g1M -P50 "1 --single-thread --long=29" " --zstd=wlog=28 --memory=512MB" if [ -n "$hasMT" ] then println "\n===> adaptive mode " roundTripTest -g270000000 " --adapt" roundTripTest -g27000000 " --adapt=min=1,max=4" println "===> test: --adapt must fail on incoherent bounds " ./datagen > tmp $ZSTD -f -vv --adapt=min=10,max=9 tmp && die "--adapt must fail on incoherent bounds" println "\n===> rsyncable mode " roundTripTest -g10M " --rsyncable" roundTripTest -g10M " --rsyncable -B100K" println "===> test: --rsyncable must fail with --single-thread" $ZSTD -f -vv --rsyncable --single-thread tmp && die "--rsyncable must fail with --single-thread" fi if [ "$1" != "--test-large-data" ]; then println "Skipping large data tests" exit 0 fi ############################################################################# println "\n===> large files tests " roundTripTest -g270000000 1 roundTripTest -g250000000 2 roundTripTest -g230000000 3 roundTripTest -g140000000 -P60 4 roundTripTest -g130000000 -P62 5 roundTripTest -g120000000 -P65 6 roundTripTest -g70000000 -P70 7 roundTripTest -g60000000 -P71 8 roundTripTest -g50000000 -P73 9 roundTripTest -g35000000 -P75 10 roundTripTest -g30000000 -P76 11 roundTripTest -g25000000 -P78 12 roundTripTest -g18000013 -P80 13 roundTripTest -g18000014 -P80 14 roundTripTest -g18000015 -P81 15 roundTripTest -g18000016 -P84 16 roundTripTest -g18000017 -P88 17 roundTripTest -g18000018 -P94 18 roundTripTest -g18000019 -P96 19 roundTripTest -g5000000000 -P99 1 roundTripTest -g1700000000 -P0 "1 --zstd=strategy=6" # ensure btlazy2 can survive an overflow rescale fileRoundTripTest -g4193M -P99 1 println "\n===> zstd long, long distance matching round-trip tests " roundTripTest -g270000000 "1 --single-thread --long" roundTripTest -g130000000 -P60 "5 --single-thread --long" roundTripTest -g35000000 -P70 "8 --single-thread --long" roundTripTest -g18000001 -P80 "18 --single-thread --long" # Test large window logs roundTripTest -g700M -P50 "1 --single-thread --long=29" roundTripTest -g600M -P50 "1 --single-thread --long --zstd=wlog=29,clog=28" if [ -n "$hasMT" ] then println "\n===> zstdmt long round-trip tests " roundTripTest -g80000000 -P99 "19 -T2" " " roundTripTest -g5000000000 -P99 "1 -T2" " " roundTripTest -g500000000 -P97 "1 -T999" " " fileRoundTripTest -g4103M -P98 " -T0" " " roundTripTest -g400000000 -P97 "1 --long=24 -T2" " " # Exposes the bug in https://github.com/facebook/zstd/pull/1678 # This test fails on 4 different travis builds at the time of writing # because it needs to allocate 8 GB of memory. # roundTripTest -g10G -P99 "1 -T1 --long=31 --zstd=clog=27 --fast=1000" else println "\n**** no multithreading, skipping zstdmt tests **** " fi println "\n===> cover dictionary builder : advanced options " TESTFILE="$PRGDIR"/zstdcli.c ./datagen > tmpDict println "- Create first dictionary" $ZSTD --train-cover=k=46,d=8,split=80 "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict cp "$TESTFILE" tmp $ZSTD -f tmp -D tmpDict $ZSTD -d tmp.zst -D tmpDict -fo result $DIFF "$TESTFILE" result $ZSTD --train-cover=k=56,d=8 && die "Create dictionary without input file (should error)" println "- Create second (different) dictionary" $ZSTD --train-cover=k=56,d=8 "$TESTDIR"/*.c "$PRGDIR"/*.c "$PRGDIR"/*.h -o tmpDictC $ZSTD -d tmp.zst -D tmpDictC -fo result && die "wrong dictionary not detected!" println "- Create dictionary using shrink-dict flag" $ZSTD --train-cover=steps=256,shrink "$TESTDIR"/*.c "$PRGDIR"/*.c --dictID=1 -o tmpShrinkDict $ZSTD --train-cover=steps=256,shrink=1 "$TESTDIR"/*.c "$PRGDIR"/*.c --dictID=1 -o tmpShrinkDict1 $ZSTD --train-cover=steps=256,shrink=5 "$TESTDIR"/*.c "$PRGDIR"/*.c --dictID=1 -o tmpShrinkDict2 println "- Create dictionary with short dictID" $ZSTD --train-cover=k=46,d=8,split=80 "$TESTDIR"/*.c "$PRGDIR"/*.c --dictID=1 -o tmpDict1 cmp tmpDict tmpDict1 && die "dictionaries should have different ID !" println "- Create dictionary with size limit" $ZSTD --train-cover=steps=8 "$TESTDIR"/*.c "$PRGDIR"/*.c -o tmpDict2 --maxdict=4K println "- Compare size of dictionary from 90% training samples with 80% training samples" $ZSTD --train-cover=split=90 -r "$TESTDIR"/*.c "$PRGDIR"/*.c $ZSTD --train-cover=split=80 -r "$TESTDIR"/*.c "$PRGDIR"/*.c println "- Create dictionary using all samples for both training and testing" $ZSTD --train-cover=split=100 -r "$TESTDIR"/*.c "$PRGDIR"/*.c println "- Test -o before --train-cover" rm -f tmpDict dictionary $ZSTD -o tmpDict --train-cover "$TESTDIR"/*.c "$PRGDIR"/*.c test -f tmpDict $ZSTD --train-cover "$TESTDIR"/*.c "$PRGDIR"/*.c test -f dictionary rm -f tmp* dictionary rm -f tmp*