Added interface for Advanced Compression API #25

Open
wants to merge 2 commits into master
197 changes: 197 additions & 0 deletions cparams.go
@@ -0,0 +1,197 @@
package gozstd

type CParameter int

// The right way to make these enums is by importing the zstd.h header and assigning
// their values from the cgo interface. However, I cannot for the life of me figure
// out how to actually get cgo to do this.

const (
/* compression parameters
* Note: When compressing with a ZSTD_CDict these parameters are superseded
* by the parameters used to construct the ZSTD_CDict.
* See ZSTD_CCtx_refCDict() for more info (superseded-by-cdict). */
/* Set compression parameters according to pre-defined cLevel table.
* Note that exact compression parameters are dynamically determined,
* depending on both compression level and srcSize (when known).
* Default level is ZSTD_CLEVEL_DEFAULT==3.
* Special: value 0 means default, which is controlled by ZSTD_CLEVEL_DEFAULT.
* Note 1 : it's possible to pass a negative compression level.
* Note 2 : setting a level resets all other compression parameters to default */
ZSTD_c_compressionLevel = 100

/* Advanced compression parameters :
* It's possible to pin down compression parameters to some specific values.
* In which case, these values are no longer dynamically selected by the compressor */

/* Maximum allowed back-reference distance, expressed as power of 2.
* This will set a memory budget for streaming decompression,
* with larger values requiring more memory
* and typically compressing more.
* Must be clamped between ZSTD_WINDOWLOG_MIN and ZSTD_WINDOWLOG_MAX.
* Special: value 0 means "use default windowLog".
* Note: Using a windowLog greater than ZSTD_WINDOWLOG_LIMIT_DEFAULT
* requires explicitly allowing such size at streaming decompression stage. */
ZSTD_c_windowLog = 101

/* Size of the initial probe table, as a power of 2.
* Resulting memory usage is (1 << (hashLog+2)).
* Must be clamped between ZSTD_HASHLOG_MIN and ZSTD_HASHLOG_MAX.
* Larger tables improve compression ratio of strategies <= dFast,
* and improve speed of strategies > dFast.
* Special: value 0 means "use default hashLog". */
ZSTD_c_hashLog = 102

/* Size of the multi-probe search table, as a power of 2.
* Resulting memory usage is (1 << (chainLog+2)).
* Must be clamped between ZSTD_CHAINLOG_MIN and ZSTD_CHAINLOG_MAX.
* Larger tables result in better and slower compression.
* This parameter is useless for "fast" strategy.
* It's still useful when using "dfast" strategy,
* in which case it defines a secondary probe table.
* Special: value 0 means "use default chainLog". */
ZSTD_c_chainLog = 103

/* Number of search attempts, as a power of 2.
* More attempts result in better and slower compression.
* This parameter is useless for "fast" and "dFast" strategies.
* Special: value 0 means "use default searchLog". */
ZSTD_c_searchLog = 104

/* Minimum size of searched matches.
* Note that Zstandard can still find matches of smaller size,
* it just tweaks its search algorithm to look for this size and larger.
* Larger values increase compression and decompression speed, but decrease ratio.
* Must be clamped between ZSTD_MINMATCH_MIN and ZSTD_MINMATCH_MAX.
* Note that currently, for all strategies < btopt, effective minimum is 4,
* for all strategies > fast, effective maximum is 6.
* Special: value 0 means "use default minMatchLength". */
ZSTD_c_minMatch = 105

/* Impact of this field depends on strategy.
* For strategies btopt, btultra & btultra2:
* Length of Match considered "good enough" to stop search.
* Larger values make compression stronger, and slower.
* For strategy fast:
* Distance between match sampling.
* Larger values make compression faster, and weaker.
* Special: value 0 means "use default targetLength". */
ZSTD_c_targetLength = 106

/* See ZSTD_strategy enum definition.
* The higher the value of selected strategy, the more complex it is,
* resulting in stronger and slower compression.
* Special: value 0 means "use default strategy". */
ZSTD_c_strategy = 107

/* LDM mode parameters */

/* Enable long distance matching.
* This parameter is designed to improve compression ratio
* for large inputs, by finding large matches at long distance.
* It increases memory usage and window size.
* Note: enabling this parameter increases default ZSTD_c_windowLog to 128 MB
* except when expressly set to a different value. */
ZSTD_c_enableLongDistanceMatching = 160

/* Size of the table for long distance matching, as a power of 2.
* Larger values increase memory usage and compression ratio,
* but decrease compression speed.
* Must be clamped between ZSTD_HASHLOG_MIN and ZSTD_HASHLOG_MAX
* default: windowlog - 7.
* Special: value 0 means "automatically determine hashlog". */
ZSTD_c_ldmHashLog = 161

/* Minimum match size for long distance matcher.
* Larger/too small values usually decrease compression ratio.
* Must be clamped between ZSTD_LDM_MINMATCH_MIN and ZSTD_LDM_MINMATCH_MAX.
* Special: value 0 means "use default value" (default: 64). */
ZSTD_c_ldmMinMatch = 162

/* Log size of each bucket in the LDM hash table for collision resolution.
* Larger values improve collision resolution but decrease compression speed.
* The maximum value is ZSTD_LDM_BUCKETSIZELOG_MAX.
* Special: value 0 means "use default value" (default: 3). */
ZSTD_c_ldmBucketSizeLog = 163

/* Frequency of inserting/looking up entries into the LDM hash table.
* Must be clamped between 0 and (ZSTD_WINDOWLOG_MAX - ZSTD_HASHLOG_MIN).
* Default is MAX(0, (windowLog - ldmHashLog)), optimizing hash table usage.
* Larger values improve compression speed.
* Deviating far from default value will likely result in a compression ratio decrease.
* Special: value 0 means "automatically determine hashRateLog". */
ZSTD_c_ldmHashRateLog = 164

/* frame parameters */

/* Content size will be written into frame header _whenever known_ (default:1)
* Content size must be known at the beginning of compression.
* This is automatically the case when using ZSTD_compress2(),
* For streaming scenarios, content size must be provided with ZSTD_CCtx_setPledgedSrcSize() */
ZSTD_c_contentSizeFlag = 200

/* A 32-bits checksum of content is written at end of frame (default:0) */
ZSTD_c_checksumFlag = 201

/* When applicable, dictionary's ID is written into frame header (default:1) */
ZSTD_c_dictIDFlag = 202

/* multi-threading parameters */
/* These parameters are only useful if multi-threading is enabled (compiled with build macro ZSTD_MULTITHREAD).
* They return an error otherwise. */

/* Select how many threads will be spawned to compress in parallel.
* When nbWorkers >= 1, triggers asynchronous mode when used with ZSTD_compressStream*() :
* ZSTD_compressStream*() consumes input and flush output if possible, but immediately gives back control to caller,
* while compression work is performed in parallel, within worker threads.
* (note : a strong exception to this rule is when first invocation of ZSTD_compressStream2() sets ZSTD_e_end :
* in which case, ZSTD_compressStream2() delegates to ZSTD_compress2(), which is always a blocking call).
* More workers improve speed, but also increase memory usage.
* Default value is `0`, aka "single-threaded mode" : no worker is spawned, compression is performed inside Caller's thread, all invocations are blocking */
ZSTD_c_nbWorkers = 400

/* Size of a compression job. This value is enforced only when nbWorkers >= 1.
* Each compression job is completed in parallel, so this value can indirectly impact the nb of active threads.
* 0 means default, which is dynamically determined based on compression parameters.
* Job size must be a minimum of overlap size, or 1 MB, whichever is largest.
* The minimum size is automatically and transparently enforced. */
ZSTD_c_jobSize = 401

/* Control the overlap size, as a fraction of window size.
* The overlap size is an amount of data reloaded from previous job at the beginning of a new job.
* It helps preserve compression ratio, while each job is compressed in parallel.
* This value is enforced only when nbWorkers >= 1.
* Larger values increase compression ratio, but decrease speed.
* Possible values range from 0 to 9 :
* - 0 means "default" : value will be determined by the library, depending on strategy
* - 1 means "no overlap"
* - 9 means "full overlap", using a full window size.
* Each intermediate rank increases/decreases load size by a factor 2 :
* 9: full window; 8: w/2; 7: w/4; 6: w/8; 5:w/16; 4: w/32; 3:w/64; 2:w/128; 1:no overlap; 0:default
* default value varies between 6 and 9, depending on strategy */
ZSTD_c_overlapLog = 402
)

type ZSTD_ResetDirective int

const (
ZSTD_reset_session_only = 1
ZSTD_reset_parameters = 2
ZSTD_reset_session_and_parameters = 3
)

type ZSTD_CompressionStrategy int

const (
ZSTD_fast = 1
ZSTD_dfast = 2
ZSTD_greedy = 3
ZSTD_lazy = 4
ZSTD_lazy2 = 5
ZSTD_btlazy2 = 6
ZSTD_btopt = 7
ZSTD_btultra = 8
ZSTD_btultra2 = 9
/* note : new strategies _might_ be added in the future.
Only the order (from fast to strong) is guaranteed */
)
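The header comment in cparams.go notes that these values would ideally be derived from zstd.h through cgo instead of being hard-coded. Below is a minimal sketch of one way that could look; it assumes zstd development headers for v1.4.0 or later (where the ZSTD_c_* enum exists) are visible to cgo, and the zstdC* names are purely illustrative, not part of this PR.

```go
package gozstd

/*
#include <zstd.h>
*/
import "C"

// Sketch only: pull the parameter identifiers straight from the C header so
// the Go-side values cannot drift from the linked libzstd. Assumes the
// ZSTD_c_* enum (zstd >= 1.4.0) is available on the include path.
var (
	zstdCCompressionLevel = CParameter(C.ZSTD_c_compressionLevel)
	zstdCWindowLog        = CParameter(C.ZSTD_c_windowLog)
	zstdCNbWorkers        = CParameter(C.ZSTD_c_nbWorkers)
)
```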
119 changes: 119 additions & 0 deletions gozstd.go
@@ -17,6 +17,10 @@ static size_t ZSTD_compressCCtx_wrapper(ZSTD_CCtx* ctx, uintptr_t dst, size_t ds
return ZSTD_compressCCtx(ctx, (void*)dst, dstCapacity, (const void*)src, srcSize, compressionLevel);
}

static size_t ZSTD_compress2_wrapper(ZSTD_CCtx* ctx, uintptr_t dst, size_t dstCapacity, uintptr_t src, size_t srcSize) {
return ZSTD_compress2(ctx, (void*)dst, dstCapacity, (const void*)src, srcSize);
}

static size_t ZSTD_compress_usingCDict_wrapper(ZSTD_CCtx* ctx, uintptr_t dst, size_t dstCapacity, uintptr_t src, size_t srcSize, const ZSTD_CDict* cdict) {
return ZSTD_compress_usingCDict(ctx, (void*)dst, dstCapacity, (const void*)src, srcSize, cdict);
}
@@ -36,6 +40,7 @@ static unsigned long long ZSTD_getFrameContentSize_wrapper(uintptr_t src, size_t
import "C"

import (
"errors"
"fmt"
"io"
"runtime"
@@ -114,6 +119,66 @@ type cctxWrapper struct {
cctx *C.ZSTD_CCtx
}

type CCtx cctxWrapper

// NewCCtx creates a new compression context
func NewCCtx() *CCtx {
ctx := (*CCtx)(cctxPool.Get().(*cctxWrapper))
ctx.SetParameter(ZSTD_c_compressionLevel, 0)
return ctx
}

// Reset resets the compression context according to the given ZSTD_ResetDirective.
func (cctx *CCtx) Reset(reset ZSTD_ResetDirective) error {
result := C.ZSTD_CCtx_reset(cctx.cctx,
C.ZSTD_ResetDirective(reset))
isErr := C.ZSTD_isError(C.size_t(result))
if isErr != 0 {
return errors.New("Error reseting context: " + errStr(result))
}
return nil
}

// SetParameter sets compression parameters for the given context
func (cctx *CCtx) SetParameter(param CParameter, value int) error {
result := C.ZSTD_CCtx_setParameter(cctx.cctx,
C.ZSTD_cParameter(param), C.int(value))
isErr := C.ZSTD_isError(C.size_t(result))
if isErr != 0 {
return errors.New("Error setting parameter: " + errStr(result))
}
return nil
}

/*
* Total input data size to be compressed as a single frame.
* Value will be written in frame header, unless explicitly forbidden using ZSTD_c_contentSizeFlag.
* This value will also be controlled at end of frame, and trigger an error if not respected.
* @result : 0, or an error code (which can be tested with ZSTD_isError()).
* Note 1 : pledgedSrcSize==0 actually means zero, aka an empty frame.
* In order to mean "unknown content size", pass constant ZSTD_CONTENTSIZE_UNKNOWN.
* ZSTD_CONTENTSIZE_UNKNOWN is default value for any new frame.
* Note 2 : pledgedSrcSize is only valid once, for the next frame.
* It's discarded at the end of the frame, and replaced by ZSTD_CONTENTSIZE_UNKNOWN.
* Note 3 : Whenever all input data is provided and consumed in a single round,
* for example with ZSTD_compress2(),
* or invoking immediately ZSTD_compressStream2(,,,ZSTD_e_end),
* this value is automatically overridden by srcSize instead.
*/
func (cctx *CCtx) SetPledgedSrcSize(pledgedSrcSize uint64) error {
result := C.ZSTD_CCtx_setPledgedSrcSize(cctx.cctx,
C.ulonglong(pledgedSrcSize))
isErr := C.ZSTD_isError(C.size_t(result))
if isErr != 0 {
return errors.New("Error setting pledged size: " + errStr(result))
}
return nil
}

// Compress appends compressed src to dst, applying the parameters previously set on cctx, and returns the result.
func (cctx *CCtx) Compress(dst, src []byte) ([]byte, error) {
ctxWrap := cctxWrapper{cctx.cctx}
return compress2(&ctxWrap, dst, src)
}

func compress(cctx, cctxDict *cctxWrapper, dst, src []byte, cd *CDict, compressionLevel int) []byte {
if len(src) == 0 {
return dst
@@ -147,6 +212,45 @@ func compress(cctx, cctxDict *cctxWrapper, dst, src []byte, cd *CDict, compressi
return dst[:dstLen+compressedSize]
}

func compress2(cctx *cctxWrapper, dst, src []byte) ([]byte, error) {
if len(src) == 0 {
return dst, nil
}

dstLen := len(dst)
if cap(dst) > dstLen {
// Fast path - try compressing without dst resize.
result := compress2Internal(cctx, dst[dstLen:cap(dst)], src, false)
compressedSize := int(result)
if compressedSize >= 0 {
// All OK.
return dst[:dstLen+compressedSize], nil
}

if C.ZSTD_getErrorCode(result) != C.ZSTD_error_dstSize_tooSmall {
// Unexpected error.
return dst, errors.New("Unexpected error during compression" + errStr(result))
}
}

// Slow path - resize dst to fit compressed data.
compressBound := int(C.ZSTD_compressBound(C.size_t(len(src)))) + 1
if n := dstLen + compressBound - cap(dst); n > 0 {
// This should be optimized since go 1.11 - see https://golang.org/doc/go1.11#performance-compiler.
dst = append(dst[:cap(dst)], make([]byte, n)...)
}

result := compress2Internal(cctx, dst[dstLen:dstLen+compressBound], src, false)
compressedSize := int(result)
if compressedSize >= 0 {
return dst[:dstLen+compressedSize], nil
}
if C.ZSTD_getErrorCode(result) != 0 {
return dst, fmt.Errorf("Unexpected error in ZSTD_compress2_wrapper: %s", errStr(result))
}
return dst[:dstLen+compressedSize], nil
}

func compressInternal(cctx, cctxDict *cctxWrapper, dst, src []byte, cd *CDict, compressionLevel int, mustSucceed bool) C.size_t {
if cd != nil {
result := C.ZSTD_compress_usingCDict_wrapper(cctxDict.cctx,
@@ -178,6 +282,21 @@ func compressInternal(cctx, cctxDict *cctxWrapper, dst, src []byte, cd *CDict, c
return result
}

func compress2Internal(cctx *cctxWrapper, dst, src []byte, mustSucceed bool) C.size_t {
result := C.ZSTD_compress2_wrapper(cctx.cctx,
C.uintptr_t(uintptr(unsafe.Pointer(&dst[0]))),
C.size_t(cap(dst)),
C.uintptr_t(uintptr(unsafe.Pointer(&src[0]))),
C.size_t(len(src)))
// Prevent dst and src from being garbage-collected during the CGO call above.
runtime.KeepAlive(dst)
runtime.KeepAlive(src)
if mustSucceed {
ensureNoError("ZSTD_compressCCtx_wrapper", result)
}
return result
}

// Decompress appends decompressed src to dst and returns the result.
func Decompress(dst, src []byte) ([]byte, error) {
return DecompressDict(dst, src, nil)
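Taking the diff as a whole, the calling pattern the new API appears to enable is: obtain a CCtx, set parameters from cparams.go, optionally pledge the input size, compress, and reset the context before reusing it. The sketch below assumes the usual github.com/valyala/gozstd import path and uses purely illustrative parameter values; ZSTD_c_nbWorkers only takes effect when the bundled libzstd is built with ZSTD_MULTITHREAD.

```go
package main

import (
	"fmt"
	"log"

	"github.com/valyala/gozstd"
)

func main() {
	cctx := gozstd.NewCCtx()

	// Illustrative parameter choices; any CParameter from cparams.go can be used.
	if err := cctx.SetParameter(gozstd.ZSTD_c_compressionLevel, 19); err != nil {
		log.Fatalf("cannot set compression level: %s", err)
	}
	if err := cctx.SetParameter(gozstd.ZSTD_c_windowLog, 24); err != nil {
		log.Fatalf("cannot set window log: %s", err)
	}
	if err := cctx.SetParameter(gozstd.ZSTD_c_strategy, gozstd.ZSTD_btultra2); err != nil {
		log.Fatalf("cannot pin strategy: %s", err)
	}
	if err := cctx.SetParameter(gozstd.ZSTD_c_checksumFlag, 1); err != nil {
		log.Fatalf("cannot enable checksums: %s", err)
	}
	// Multi-threaded compression only works when libzstd is built with
	// ZSTD_MULTITHREAD; otherwise setting this parameter returns an error.
	if err := cctx.SetParameter(gozstd.ZSTD_c_nbWorkers, 2); err != nil {
		log.Printf("multi-threading unavailable: %s", err)
	}

	src := []byte("data to compress with the advanced API")

	// Optional: record the exact input size in the frame header.
	if err := cctx.SetPledgedSrcSize(uint64(len(src))); err != nil {
		log.Fatalf("cannot set pledged size: %s", err)
	}

	dst, err := cctx.Compress(nil, src)
	if err != nil {
		log.Fatalf("compression failed: %s", err)
	}
	fmt.Printf("compressed %d bytes into %d bytes\n", len(src), len(dst))

	// Parameters stick to the context; reset before reusing it with
	// different settings.
	if err := cctx.Reset(gozstd.ZSTD_reset_session_and_parameters); err != nil {
		log.Fatalf("cannot reset context: %s", err)
	}
}
```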