@@ -0,0 +1,360 b'' | |||
|
1 | /** | |
|
2 | * Copyright (c) 2018-present, Gregory Szorc | |
|
3 | * All rights reserved. | |
|
4 | * | |
|
5 | * This software may be modified and distributed under the terms | |
|
6 | * of the BSD license. See the LICENSE file for details. | |
|
7 | */ | |
|
8 | ||
|
9 | #include "python-zstandard.h" | |
|
10 | ||
|
11 | extern PyObject* ZstdError; | |
|
12 | ||
|
13 | PyDoc_STRVAR(ZstdCompressionChunkerIterator__doc__, | |
|
14 | "Iterator of output chunks from ZstdCompressionChunker.\n" | |
|
15 | ); | |
|
16 | ||
|
17 | static void ZstdCompressionChunkerIterator_dealloc(ZstdCompressionChunkerIterator* self) { | |
|
18 | Py_XDECREF(self->chunker); | |
|
19 | ||
|
20 | PyObject_Del(self); | |
|
21 | } | |
|
22 | ||
|
23 | static PyObject* ZstdCompressionChunkerIterator_iter(PyObject* self) { | |
|
24 | Py_INCREF(self); | |
|
25 | return self; | |
|
26 | } | |
|
27 | ||
|
28 | static PyObject* ZstdCompressionChunkerIterator_iternext(ZstdCompressionChunkerIterator* self) { | |
|
29 | size_t zresult; | |
|
30 | PyObject* chunk; | |
|
31 | ZstdCompressionChunker* chunker = self->chunker; | |
|
32 | ZSTD_EndDirective zFlushMode; | |
|
33 | ||
|
34 | if (self->mode != compressionchunker_mode_normal && chunker->input.pos != chunker->input.size) { | |
|
35 | PyErr_SetString(ZstdError, "input should have been fully consumed before calling flush() or finish()"); | |
|
36 | return NULL; | |
|
37 | } | |
|
38 | ||
|
39 | if (chunker->finished) { | |
|
40 | return NULL; | |
|
41 | } | |
|
42 | ||
|
43 | /* If we have data left in the input, consume it. */ | |
|
44 | while (chunker->input.pos < chunker->input.size) { | |
|
45 | Py_BEGIN_ALLOW_THREADS | |
|
46 | zresult = ZSTD_compress_generic(chunker->compressor->cctx, &chunker->output, | |
|
47 | &chunker->input, ZSTD_e_continue); | |
|
48 | Py_END_ALLOW_THREADS | |
|
49 | ||
|
50 | /* Input is fully consumed. */ | |
|
51 | if (chunker->input.pos == chunker->input.size) { | |
|
52 | chunker->input.src = NULL; | |
|
53 | chunker->input.pos = 0; | |
|
54 | chunker->input.size = 0; | |
|
55 | PyBuffer_Release(&chunker->inBuffer); | |
|
56 | } | |
|
57 | ||
|
58 | if (ZSTD_isError(zresult)) { | |
|
59 | PyErr_Format(ZstdError, "zstd compress error: %s", ZSTD_getErrorName(zresult)); | |
|
60 | return NULL; | |
|
61 | } | |
|
62 | ||
|
63 | /* If it produced a full output chunk, emit it. */ | |
|
64 | if (chunker->output.pos == chunker->output.size) { | |
|
65 | chunk = PyBytes_FromStringAndSize(chunker->output.dst, chunker->output.pos); | |
|
66 | if (!chunk) { | |
|
67 | return NULL; | |
|
68 | } | |
|
69 | ||
|
70 | chunker->output.pos = 0; | |
|
71 | ||
|
72 | return chunk; | |
|
73 | } | |
|
74 | ||
|
75 | /* Else continue to compress available input data. */ | |
|
76 | } | |
|
77 | ||
|
78 | /* We also need this here for the special case of an empty input buffer. */ | |
|
79 | if (chunker->input.pos == chunker->input.size) { | |
|
80 | chunker->input.src = NULL; | |
|
81 | chunker->input.pos = 0; | |
|
82 | chunker->input.size = 0; | |
|
83 | PyBuffer_Release(&chunker->inBuffer); | |
|
84 | } | |
|
85 | ||
|
86 | /* No more input data. A partial chunk may be in chunker->output. | |
|
87 | * If we're in normal compression mode, we're done. Otherwise if we're in | |
|
88 | * flush or finish mode, we need to emit what data remains. | |
|
89 | */ | |
|
90 | if (self->mode == compressionchunker_mode_normal) { | |
|
91 | /* We don't need to set StopIteration. */ | |
|
92 | return NULL; | |
|
93 | } | |
|
94 | ||
|
95 | if (self->mode == compressionchunker_mode_flush) { | |
|
96 | zFlushMode = ZSTD_e_flush; | |
|
97 | } | |
|
98 | else if (self->mode == compressionchunker_mode_finish) { | |
|
99 | zFlushMode = ZSTD_e_end; | |
|
100 | } | |
|
101 | else { | |
|
102 | PyErr_SetString(ZstdError, "unhandled compression mode; this should never happen"); | |
|
103 | return NULL; | |
|
104 | } | |
|
105 | ||
|
106 | Py_BEGIN_ALLOW_THREADS | |
|
107 | zresult = ZSTD_compress_generic(chunker->compressor->cctx, &chunker->output, | |
|
108 | &chunker->input, zFlushMode); | |
|
109 | Py_END_ALLOW_THREADS | |
|
110 | ||
|
111 | if (ZSTD_isError(zresult)) { | |
|
112 | PyErr_Format(ZstdError, "zstd compress error: %s", | |
|
113 | ZSTD_getErrorName(zresult)); | |
|
114 | return NULL; | |
|
115 | } | |
|
116 | ||
|
117 | if (!zresult && chunker->output.pos == 0) { | |
|
118 | return NULL; | |
|
119 | } | |
|
120 | ||
|
121 | chunk = PyBytes_FromStringAndSize(chunker->output.dst, chunker->output.pos); | |
|
122 | if (!chunk) { | |
|
123 | return NULL; | |
|
124 | } | |
|
125 | ||
|
126 | chunker->output.pos = 0; | |
|
127 | ||
|
128 | if (!zresult && self->mode == compressionchunker_mode_finish) { | |
|
129 | chunker->finished = 1; | |
|
130 | } | |
|
131 | ||
|
132 | return chunk; | |
|
133 | } | |
|
134 | ||
|
135 | PyTypeObject ZstdCompressionChunkerIteratorType = { | |
|
136 | PyVarObject_HEAD_INIT(NULL, 0) | |
|
137 | "zstd.ZstdCompressionChunkerIterator", /* tp_name */ | |
|
138 | sizeof(ZstdCompressionChunkerIterator), /* tp_basicsize */ | |
|
139 | 0, /* tp_itemsize */ | |
|
140 | (destructor)ZstdCompressionChunkerIterator_dealloc, /* tp_dealloc */ | |
|
141 | 0, /* tp_print */ | |
|
142 | 0, /* tp_getattr */ | |
|
143 | 0, /* tp_setattr */ | |
|
144 | 0, /* tp_compare */ | |
|
145 | 0, /* tp_repr */ | |
|
146 | 0, /* tp_as_number */ | |
|
147 | 0, /* tp_as_sequence */ | |
|
148 | 0, /* tp_as_mapping */ | |
|
149 | 0, /* tp_hash */ | |
|
150 | 0, /* tp_call */ | |
|
151 | 0, /* tp_str */ | |
|
152 | 0, /* tp_getattro */ | |
|
153 | 0, /* tp_setattro */ | |
|
154 | 0, /* tp_as_buffer */ | |
|
155 | Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE, /* tp_flags */ | |
|
156 | ZstdCompressionChunkerIterator__doc__, /* tp_doc */ | |
|
157 | 0, /* tp_traverse */ | |
|
158 | 0, /* tp_clear */ | |
|
159 | 0, /* tp_richcompare */ | |
|
160 | 0, /* tp_weaklistoffset */ | |
|
161 | ZstdCompressionChunkerIterator_iter, /* tp_iter */ | |
|
162 | (iternextfunc)ZstdCompressionChunkerIterator_iternext, /* tp_iternext */ | |
|
163 | 0, /* tp_methods */ | |
|
164 | 0, /* tp_members */ | |
|
165 | 0, /* tp_getset */ | |
|
166 | 0, /* tp_base */ | |
|
167 | 0, /* tp_dict */ | |
|
168 | 0, /* tp_descr_get */ | |
|
169 | 0, /* tp_descr_set */ | |
|
170 | 0, /* tp_dictoffset */ | |
|
171 | 0, /* tp_init */ | |
|
172 | 0, /* tp_alloc */ | |
|
173 | PyType_GenericNew, /* tp_new */ | |
|
174 | }; | |
|
175 | ||
|
176 | PyDoc_STRVAR(ZstdCompressionChunker__doc__, | |
|
177 | "Compress chunks iteratively into exact chunk sizes.\n" | |
|
178 | ); | |
|
179 | ||
|
180 | static void ZstdCompressionChunker_dealloc(ZstdCompressionChunker* self) { | |
|
181 | PyBuffer_Release(&self->inBuffer); | |
|
182 | self->input.src = NULL; | |
|
183 | ||
|
184 | PyMem_Free(self->output.dst); | |
|
185 | self->output.dst = NULL; | |
|
186 | ||
|
187 | Py_XDECREF(self->compressor); | |
|
188 | ||
|
189 | PyObject_Del(self); | |
|
190 | } | |
|
191 | ||
|
192 | static ZstdCompressionChunkerIterator* ZstdCompressionChunker_compress(ZstdCompressionChunker* self, PyObject* args, PyObject* kwargs) { | |
|
193 | static char* kwlist[] = { | |
|
194 | "data", | |
|
195 | NULL | |
|
196 | }; | |
|
197 | ||
|
198 | ZstdCompressionChunkerIterator* result; | |
|
199 | ||
|
200 | if (self->finished) { | |
|
201 | PyErr_SetString(ZstdError, "cannot call compress() after compression finished"); | |
|
202 | return NULL; | |
|
203 | } | |
|
204 | ||
|
205 | if (self->inBuffer.obj) { | |
|
206 | PyErr_SetString(ZstdError, | |
|
207 | "cannot perform operation before consuming output from previous operation"); | |
|
208 | return NULL; | |
|
209 | } | |
|
210 | ||
|
211 | #if PY_MAJOR_VERSION >= 3 | |
|
212 | if (!PyArg_ParseTupleAndKeywords(args, kwargs, "y*:compress", | |
|
213 | #else | |
|
214 | if (!PyArg_ParseTupleAndKeywords(args, kwargs, "s*:compress", | |
|
215 | #endif | |
|
216 | kwlist, &self->inBuffer)) { | |
|
217 | return NULL; | |
|
218 | } | |
|
219 | ||
|
220 | if (!PyBuffer_IsContiguous(&self->inBuffer, 'C') || self->inBuffer.ndim > 1) { | |
|
221 | PyErr_SetString(PyExc_ValueError, | |
|
222 | "data buffer should be contiguous and have at most one dimension"); | |
|
223 | PyBuffer_Release(&self->inBuffer); | |
|
224 | return NULL; | |
|
225 | } | |
|
226 | ||
|
227 | result = (ZstdCompressionChunkerIterator*)PyObject_CallObject((PyObject*)&ZstdCompressionChunkerIteratorType, NULL); | |
|
228 | if (!result) { | |
|
229 | PyBuffer_Release(&self->inBuffer); | |
|
230 | return NULL; | |
|
231 | } | |
|
232 | ||
|
233 | self->input.src = self->inBuffer.buf; | |
|
234 | self->input.size = self->inBuffer.len; | |
|
235 | self->input.pos = 0; | |
|
236 | ||
|
237 | result->chunker = self; | |
|
238 | Py_INCREF(result->chunker); | |
|
239 | ||
|
240 | result->mode = compressionchunker_mode_normal; | |
|
241 | ||
|
242 | return result; | |
|
243 | } | |
|
244 | ||
|
245 | static ZstdCompressionChunkerIterator* ZstdCompressionChunker_finish(ZstdCompressionChunker* self) { | |
|
246 | ZstdCompressionChunkerIterator* result; | |
|
247 | ||
|
248 | if (self->finished) { | |
|
249 | PyErr_SetString(ZstdError, "cannot call finish() after compression finished"); | |
|
250 | return NULL; | |
|
251 | } | |
|
252 | ||
|
253 | if (self->inBuffer.obj) { | |
|
254 | PyErr_SetString(ZstdError, | |
|
255 | "cannot call finish() before consuming output from previous operation"); | |
|
256 | return NULL; | |
|
257 | } | |
|
258 | ||
|
259 | result = (ZstdCompressionChunkerIterator*)PyObject_CallObject((PyObject*)&ZstdCompressionChunkerIteratorType, NULL); | |
|
260 | if (!result) { | |
|
261 | return NULL; | |
|
262 | } | |
|
263 | ||
|
264 | result->chunker = self; | |
|
265 | Py_INCREF(result->chunker); | |
|
266 | ||
|
267 | result->mode = compressionchunker_mode_finish; | |
|
268 | ||
|
269 | return result; | |
|
270 | } | |
|
271 | ||
|
272 | static ZstdCompressionChunkerIterator* ZstdCompressionChunker_flush(ZstdCompressionChunker* self, PyObject* args, PyObject* kwargs) { | |
|
273 | ZstdCompressionChunkerIterator* result; | |
|
274 | ||
|
275 | if (self->finished) { | |
|
276 | PyErr_SetString(ZstdError, "cannot call flush() after compression finished"); | |
|
277 | return NULL; | |
|
278 | } | |
|
279 | ||
|
280 | if (self->inBuffer.obj) { | |
|
281 | PyErr_SetString(ZstdError, | |
|
282 | "cannot call flush() before consuming output from previous operation"); | |
|
283 | return NULL; | |
|
284 | } | |
|
285 | ||
|
286 | result = (ZstdCompressionChunkerIterator*)PyObject_CallObject((PyObject*)&ZstdCompressionChunkerIteratorType, NULL); | |
|
287 | if (!result) { | |
|
288 | return NULL; | |
|
289 | } | |
|
290 | ||
|
291 | result->chunker = self; | |
|
292 | Py_INCREF(result->chunker); | |
|
293 | ||
|
294 | result->mode = compressionchunker_mode_flush; | |
|
295 | ||
|
296 | return result; | |
|
297 | } | |
|
298 | ||
|
299 | static PyMethodDef ZstdCompressionChunker_methods[] = { | |
|
300 | { "compress", (PyCFunction)ZstdCompressionChunker_compress, METH_VARARGS | METH_KEYWORDS, | |
|
301 | PyDoc_STR("compress data") }, | |
|
302 | { "finish", (PyCFunction)ZstdCompressionChunker_finish, METH_NOARGS, | |
|
303 | PyDoc_STR("finish compression operation") }, | |
|
304 | { "flush", (PyCFunction)ZstdCompressionChunker_flush, METH_VARARGS | METH_KEYWORDS, | |
|
305 | PyDoc_STR("flush compression operation") }, | |
|
306 | { NULL, NULL } | |
|
307 | }; | |
|
308 | ||
|
309 | PyTypeObject ZstdCompressionChunkerType = { | |
|
310 | PyVarObject_HEAD_INIT(NULL, 0) | |
|
311 | "zstd.ZstdCompressionChunkerType", /* tp_name */ | |
|
312 | sizeof(ZstdCompressionChunker), /* tp_basicsize */ | |
|
313 | 0, /* tp_itemsize */ | |
|
314 | (destructor)ZstdCompressionChunker_dealloc, /* tp_dealloc */ | |
|
315 | 0, /* tp_print */ | |
|
316 | 0, /* tp_getattr */ | |
|
317 | 0, /* tp_setattr */ | |
|
318 | 0, /* tp_compare */ | |
|
319 | 0, /* tp_repr */ | |
|
320 | 0, /* tp_as_number */ | |
|
321 | 0, /* tp_as_sequence */ | |
|
322 | 0, /* tp_as_mapping */ | |
|
323 | 0, /* tp_hash */ | |
|
324 | 0, /* tp_call */ | |
|
325 | 0, /* tp_str */ | |
|
326 | 0, /* tp_getattro */ | |
|
327 | 0, /* tp_setattro */ | |
|
328 | 0, /* tp_as_buffer */ | |
|
329 | Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE, /* tp_flags */ | |
|
330 | ZstdCompressionChunker__doc__, /* tp_doc */ | |
|
331 | 0, /* tp_traverse */ | |
|
332 | 0, /* tp_clear */ | |
|
333 | 0, /* tp_richcompare */ | |
|
334 | 0, /* tp_weaklistoffset */ | |
|
335 | 0, /* tp_iter */ | |
|
336 | 0, /* tp_iternext */ | |
|
337 | ZstdCompressionChunker_methods, /* tp_methods */ | |
|
338 | 0, /* tp_members */ | |
|
339 | 0, /* tp_getset */ | |
|
340 | 0, /* tp_base */ | |
|
341 | 0, /* tp_dict */ | |
|
342 | 0, /* tp_descr_get */ | |
|
343 | 0, /* tp_descr_set */ | |
|
344 | 0, /* tp_dictoffset */ | |
|
345 | 0, /* tp_init */ | |
|
346 | 0, /* tp_alloc */ | |
|
347 | PyType_GenericNew, /* tp_new */ | |
|
348 | }; | |
|
349 | ||
|
350 | void compressionchunker_module_init(PyObject* module) { | |
|
351 | Py_TYPE(&ZstdCompressionChunkerIteratorType) = &PyType_Type; | |
|
352 | if (PyType_Ready(&ZstdCompressionChunkerIteratorType) < 0) { | |
|
353 | return; | |
|
354 | } | |
|
355 | ||
|
356 | Py_TYPE(&ZstdCompressionChunkerType) = &PyType_Type; | |
|
357 | if (PyType_Ready(&ZstdCompressionChunkerType) < 0) { | |
|
358 | return; | |
|
359 | } | |
|
360 | } |
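The iterator above only yields a chunk once the fixed-size output buffer fills during ZSTD_e_continue, so compress() emits exclusively full-size chunks; a trailing partial chunk appears only via flush() or finish(). A minimal Python sketch of that user-visible behavior (assuming a zstandard build that includes this extension):

    import zstandard as zstd

    cctx = zstd.ZstdCompressor()
    chunker = cctx.chunker(chunk_size=16384)

    chunks = list(chunker.compress(b'\x00' * 1000000))
    chunks.extend(chunker.finish())

    # Chunks are all exactly chunk_size bytes except possibly the final
    # one emitted by finish(), which may be shorter.
    assert all(len(c) == 16384 for c in chunks[:-1])
    assert 0 < len(chunks[-1]) <= 16384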
@@ -0,0 +1,44 b'' | |||
|
1 | /* ****************************************************************** | |
|
2 | debug | |
|
3 | Part of FSE library | |
|
4 | Copyright (C) 2013-present, Yann Collet. | |
|
5 | ||
|
6 | BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) | |
|
7 | ||
|
8 | Redistribution and use in source and binary forms, with or without | |
|
9 | modification, are permitted provided that the following conditions are | |
|
10 | met: | |
|
11 | ||
|
12 | * Redistributions of source code must retain the above copyright | |
|
13 | notice, this list of conditions and the following disclaimer. | |
|
14 | * Redistributions in binary form must reproduce the above | |
|
15 | copyright notice, this list of conditions and the following disclaimer | |
|
16 | in the documentation and/or other materials provided with the | |
|
17 | distribution. | |
|
18 | ||
|
19 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | |
|
20 | "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | |
|
21 | LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | |
|
22 | A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT | |
|
23 | OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, | |
|
24 | SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT | |
|
25 | LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | |
|
26 | DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | |
|
27 | THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | |
|
28 | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | |
|
29 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |
|
30 | ||
|
31 | You can contact the author at : | |
|
32 | - Source repository : https://github.com/Cyan4973/FiniteStateEntropy | |
|
33 | ****************************************************************** */ | |
|
34 | ||
|
35 | ||
|
36 | /* | |
|
37 | * This module only hosts one global variable | |
|
38 | * which can be used to dynamically influence the verbosity of traces, | |
|
39 | * such as DEBUGLOG and RAWLOG | |
|
40 | */ | |
|
41 | ||
|
42 | #include "debug.h" | |
|
43 | ||
|
44 | int g_debuglevel = DEBUGLEVEL; |
@@ -0,0 +1,123 b'' | |||
|
1 | /* ****************************************************************** | |
|
2 | debug | |
|
3 | Part of FSE library | |
|
4 | Copyright (C) 2013-present, Yann Collet. | |
|
5 | ||
|
6 | BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) | |
|
7 | ||
|
8 | Redistribution and use in source and binary forms, with or without | |
|
9 | modification, are permitted provided that the following conditions are | |
|
10 | met: | |
|
11 | ||
|
12 | * Redistributions of source code must retain the above copyright | |
|
13 | notice, this list of conditions and the following disclaimer. | |
|
14 | * Redistributions in binary form must reproduce the above | |
|
15 | copyright notice, this list of conditions and the following disclaimer | |
|
16 | in the documentation and/or other materials provided with the | |
|
17 | distribution. | |
|
18 | ||
|
19 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | |
|
20 | "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | |
|
21 | LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | |
|
22 | A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT | |
|
23 | OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, | |
|
24 | SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT | |
|
25 | LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | |
|
26 | DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | |
|
27 | THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | |
|
28 | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | |
|
29 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |
|
30 | ||
|
31 | You can contact the author at : | |
|
32 | - Source repository : https://github.com/Cyan4973/FiniteStateEntropy | |
|
33 | ****************************************************************** */ | |
|
34 | ||
|
35 | ||
|
36 | /* | |
|
37 | * The purpose of this header is to enable debug functions. | |
|
38 | * They regroup assert(), DEBUGLOG() and RAWLOG() for run-time, | |
|
39 | * and DEBUG_STATIC_ASSERT() for compile-time. | |
|
40 | * | |
|
41 | * By default, DEBUGLEVEL==0, which means run-time debug is disabled. | |
|
42 | * | |
|
43 | * Level 1 enables assert() only. | |
|
44 | * Starting level 2, traces can be generated and pushed to stderr. | |
|
45 | * The higher the level, the more verbose the traces. | |
|
46 | * | |
|
47 | * It's possible to dynamically adjust level using variable g_debug_level, | |
|
48 | * which is only declared if DEBUGLEVEL>=2, | |
|
49 | * and is a global variable, not multi-thread protected (use with care) | |
|
50 | */ | |
|
51 | ||
|
52 | #ifndef DEBUG_H_12987983217 | |
|
53 | #define DEBUG_H_12987983217 | |
|
54 | ||
|
55 | #if defined (__cplusplus) | |
|
56 | extern "C" { | |
|
57 | #endif | |
|
58 | ||
|
59 | ||
|
60 | /* static assert is triggered at compile time, leaving no runtime artefact, | |
|
61 | * but can only work with compile-time constants. | |
|
62 | * This variant can only be used inside a function. */ | |
|
63 | #define DEBUG_STATIC_ASSERT(c) (void)sizeof(char[(c) ? 1 : -1]) | |
|
64 | ||
|
65 | ||
|
66 | /* DEBUGLEVEL is expected to be defined externally, | |
|
67 | * typically through compiler command line. | |
|
68 | * Value must be a number. */ | |
|
69 | #ifndef DEBUGLEVEL | |
|
70 | # define DEBUGLEVEL 0 | |
|
71 | #endif | |
|
72 | ||
|
73 | /* recommended values for DEBUGLEVEL : | |
|
74 | * 0 : no debug, all run-time functions disabled | |
|
75 | * 1 : no display, enables assert() only | |
|
76 | * 2 : reserved, for currently active debug path | |
|
77 | * 3 : events once per object lifetime (CCtx, CDict, etc.) | |
|
78 | * 4 : events once per frame | |
|
79 | * 5 : events once per block | |
|
80 | * 6 : events once per sequence (verbose) | |
|
81 | * 7+: events at every position (*very* verbose) | |
|
82 | * | |
|
83 | * It's generally inconvenient to output traces > 5. | |
|
84 | * In which case, it's possible to selectively enable higher verbosity levels | |
|
85 | * by modifying g_debug_level. | |
|
86 | */ | |
|
87 | ||
|
88 | #if (DEBUGLEVEL>=1) | |
|
89 | # include <assert.h> | |
|
90 | #else | |
|
91 | # ifndef assert /* assert may be already defined, due to prior #include <assert.h> */ | |
|
92 | # define assert(condition) ((void)0) /* disable assert (default) */ | |
|
93 | # endif | |
|
94 | #endif | |
|
95 | ||
|
96 | #if (DEBUGLEVEL>=2) | |
|
97 | # include <stdio.h> | |
|
98 | extern int g_debuglevel; /* here, this variable is only declared, | |
|
99 | it actually lives in debug.c, | |
|
100 | and is shared by the whole process. | |
|
101 | It's typically used to enable very verbose levels | |
|
102 | on selective conditions (such as position in src) */ | |
|
103 | ||
|
104 | # define RAWLOG(l, ...) { \ | |
|
105 | if (l<=g_debuglevel) { \ | |
|
106 | fprintf(stderr, __VA_ARGS__); \ | |
|
107 | } } | |
|
108 | # define DEBUGLOG(l, ...) { \ | |
|
109 | if (l<=g_debuglevel) { \ | |
|
110 | fprintf(stderr, __FILE__ ": " __VA_ARGS__); \ | |
|
111 | fprintf(stderr, " \n"); \ | |
|
112 | } } | |
|
113 | #else | |
|
114 | # define RAWLOG(l, ...) {} /* disabled */ | |
|
115 | # define DEBUGLOG(l, ...) {} /* disabled */ | |
|
116 | #endif | |
|
117 | ||
|
118 | ||
|
119 | #if defined (__cplusplus) | |
|
120 | } | |
|
121 | #endif | |
|
122 | ||
|
123 | #endif /* DEBUG_H_12987983217 */ |
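RAWLOG and DEBUGLOG gate each message on the process-global g_debuglevel. A rough Python analogue of that gating, for illustration only (the names mirror the C globals but are otherwise hypothetical):

    import sys

    g_debuglevel = 2  # stands in for the global defined in debug.c

    def debuglog(level, fmt, *args):
        # Like DEBUGLOG: print only when the message level is at or below
        # the current global verbosity, prefixed with the source file name.
        if level <= g_debuglevel:
            print('%s: %s' % (__file__, fmt % args), file=sys.stderr)

    debuglog(2, 'active debug path event')          # printed when level >= 2
    debuglog(5, 'per-block event: %d bytes', 4096)  # suppressed at level 2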
@@ -0,0 +1,195 b'' | |||
|
1 | /* ****************************************************************** | |
|
2 | hist : Histogram functions | |
|
3 | part of Finite State Entropy project | |
|
4 | Copyright (C) 2013-present, Yann Collet. | |
|
5 | ||
|
6 | BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) | |
|
7 | ||
|
8 | Redistribution and use in source and binary forms, with or without | |
|
9 | modification, are permitted provided that the following conditions are | |
|
10 | met: | |
|
11 | ||
|
12 | * Redistributions of source code must retain the above copyright | |
|
13 | notice, this list of conditions and the following disclaimer. | |
|
14 | * Redistributions in binary form must reproduce the above | |
|
15 | copyright notice, this list of conditions and the following disclaimer | |
|
16 | in the documentation and/or other materials provided with the | |
|
17 | distribution. | |
|
18 | ||
|
19 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | |
|
20 | "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | |
|
21 | LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | |
|
22 | A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT | |
|
23 | OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, | |
|
24 | SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT | |
|
25 | LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | |
|
26 | DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | |
|
27 | THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | |
|
28 | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | |
|
29 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |
|
30 | ||
|
31 | You can contact the author at : | |
|
32 | - FSE source repository : https://github.com/Cyan4973/FiniteStateEntropy | |
|
33 | - Public forum : https://groups.google.com/forum/#!forum/lz4c | |
|
34 | ****************************************************************** */ | |
|
35 | ||
|
36 | /* --- dependencies --- */ | |
|
37 | #include "mem.h" /* U32, BYTE, etc. */ | |
|
38 | #include "debug.h" /* assert, DEBUGLOG */ | |
|
39 | #include "error_private.h" /* ERROR */ | |
|
40 | #include "hist.h" | |
|
41 | ||
|
42 | ||
|
43 | /* --- Error management --- */ | |
|
44 | unsigned HIST_isError(size_t code) { return ERR_isError(code); } | |
|
45 | ||
|
46 | /*-************************************************************** | |
|
47 | * Histogram functions | |
|
48 | ****************************************************************/ | |
|
49 | unsigned HIST_count_simple(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
50 | const void* src, size_t srcSize) | |
|
51 | { | |
|
52 | const BYTE* ip = (const BYTE*)src; | |
|
53 | const BYTE* const end = ip + srcSize; | |
|
54 | unsigned maxSymbolValue = *maxSymbolValuePtr; | |
|
55 | unsigned largestCount=0; | |
|
56 | ||
|
57 | memset(count, 0, (maxSymbolValue+1) * sizeof(*count)); | |
|
58 | if (srcSize==0) { *maxSymbolValuePtr = 0; return 0; } | |
|
59 | ||
|
60 | while (ip<end) { | |
|
61 | assert(*ip <= maxSymbolValue); | |
|
62 | count[*ip++]++; | |
|
63 | } | |
|
64 | ||
|
65 | while (!count[maxSymbolValue]) maxSymbolValue--; | |
|
66 | *maxSymbolValuePtr = maxSymbolValue; | |
|
67 | ||
|
68 | { U32 s; | |
|
69 | for (s=0; s<=maxSymbolValue; s++) | |
|
70 | if (count[s] > largestCount) largestCount = count[s]; | |
|
71 | } | |
|
72 | ||
|
73 | return largestCount; | |
|
74 | } | |
|
75 | ||
|
76 | ||
|
77 | /* HIST_count_parallel_wksp() : | |
|
78 | * store histogram into 4 intermediate tables, recombined at the end. | |
|
79 | * this design makes better use of OoO cpus, | |
|
80 | * and is noticeably faster when some values are heavily repeated. | |
|
81 | * But it needs some additional workspace for intermediate tables. | |
|
82 | * `workSpace` size must be a table of size >= HIST_WKSP_SIZE_U32. | |
|
83 | * @return : largest histogram frequency, | |
|
84 | * or an error code (notably when histogram would be larger than *maxSymbolValuePtr). */ | |
|
85 | static size_t HIST_count_parallel_wksp( | |
|
86 | unsigned* count, unsigned* maxSymbolValuePtr, | |
|
87 | const void* source, size_t sourceSize, | |
|
88 | unsigned checkMax, | |
|
89 | unsigned* const workSpace) | |
|
90 | { | |
|
91 | const BYTE* ip = (const BYTE*)source; | |
|
92 | const BYTE* const iend = ip+sourceSize; | |
|
93 | unsigned maxSymbolValue = *maxSymbolValuePtr; | |
|
94 | unsigned max=0; | |
|
95 | U32* const Counting1 = workSpace; | |
|
96 | U32* const Counting2 = Counting1 + 256; | |
|
97 | U32* const Counting3 = Counting2 + 256; | |
|
98 | U32* const Counting4 = Counting3 + 256; | |
|
99 | ||
|
100 | memset(workSpace, 0, 4*256*sizeof(unsigned)); | |
|
101 | ||
|
102 | /* safety checks */ | |
|
103 | if (!sourceSize) { | |
|
104 | memset(count, 0, (maxSymbolValue + 1) * sizeof(*count)); | |
|
105 | *maxSymbolValuePtr = 0; | |
|
106 | return 0; | |
|
107 | } | |
|
108 | if (!maxSymbolValue) maxSymbolValue = 255; /* 0 == default */ | |
|
109 | ||
|
110 | /* by stripes of 16 bytes */ | |
|
111 | { U32 cached = MEM_read32(ip); ip += 4; | |
|
112 | while (ip < iend-15) { | |
|
113 | U32 c = cached; cached = MEM_read32(ip); ip += 4; | |
|
114 | Counting1[(BYTE) c ]++; | |
|
115 | Counting2[(BYTE)(c>>8) ]++; | |
|
116 | Counting3[(BYTE)(c>>16)]++; | |
|
117 | Counting4[ c>>24 ]++; | |
|
118 | c = cached; cached = MEM_read32(ip); ip += 4; | |
|
119 | Counting1[(BYTE) c ]++; | |
|
120 | Counting2[(BYTE)(c>>8) ]++; | |
|
121 | Counting3[(BYTE)(c>>16)]++; | |
|
122 | Counting4[ c>>24 ]++; | |
|
123 | c = cached; cached = MEM_read32(ip); ip += 4; | |
|
124 | Counting1[(BYTE) c ]++; | |
|
125 | Counting2[(BYTE)(c>>8) ]++; | |
|
126 | Counting3[(BYTE)(c>>16)]++; | |
|
127 | Counting4[ c>>24 ]++; | |
|
128 | c = cached; cached = MEM_read32(ip); ip += 4; | |
|
129 | Counting1[(BYTE) c ]++; | |
|
130 | Counting2[(BYTE)(c>>8) ]++; | |
|
131 | Counting3[(BYTE)(c>>16)]++; | |
|
132 | Counting4[ c>>24 ]++; | |
|
133 | } | |
|
134 | ip-=4; | |
|
135 | } | |
|
136 | ||
|
137 | /* finish last symbols */ | |
|
138 | while (ip<iend) Counting1[*ip++]++; | |
|
139 | ||
|
140 | if (checkMax) { /* verify stats will fit into destination table */ | |
|
141 | U32 s; for (s=255; s>maxSymbolValue; s--) { | |
|
142 | Counting1[s] += Counting2[s] + Counting3[s] + Counting4[s]; | |
|
143 | if (Counting1[s]) return ERROR(maxSymbolValue_tooSmall); | |
|
144 | } } | |
|
145 | ||
|
146 | { U32 s; | |
|
147 | if (maxSymbolValue > 255) maxSymbolValue = 255; | |
|
148 | for (s=0; s<=maxSymbolValue; s++) { | |
|
149 | count[s] = Counting1[s] + Counting2[s] + Counting3[s] + Counting4[s]; | |
|
150 | if (count[s] > max) max = count[s]; | |
|
151 | } } | |
|
152 | ||
|
153 | while (!count[maxSymbolValue]) maxSymbolValue--; | |
|
154 | *maxSymbolValuePtr = maxSymbolValue; | |
|
155 | return (size_t)max; | |
|
156 | } | |
|
157 | ||
|
158 | /* HIST_countFast_wksp() : | |
|
159 | * Same as HIST_countFast(), but using an externally provided scratch buffer. | |
|
160 | * `workSpace` size must be table of >= HIST_WKSP_SIZE_U32 unsigned */ | |
|
161 | size_t HIST_countFast_wksp(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
162 | const void* source, size_t sourceSize, | |
|
163 | unsigned* workSpace) | |
|
164 | { | |
|
165 | if (sourceSize < 1500) /* heuristic threshold */ | |
|
166 | return HIST_count_simple(count, maxSymbolValuePtr, source, sourceSize); | |
|
167 | return HIST_count_parallel_wksp(count, maxSymbolValuePtr, source, sourceSize, 0, workSpace); | |
|
168 | } | |
|
169 | ||
|
170 | /* fast variant (unsafe : won't check if src contains values beyond count[] limit) */ | |
|
171 | size_t HIST_countFast(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
172 | const void* source, size_t sourceSize) | |
|
173 | { | |
|
174 | unsigned tmpCounters[HIST_WKSP_SIZE_U32]; | |
|
175 | return HIST_countFast_wksp(count, maxSymbolValuePtr, source, sourceSize, tmpCounters); | |
|
176 | } | |
|
177 | ||
|
178 | /* HIST_count_wksp() : | |
|
179 | * Same as HIST_count(), but using an externally provided scratch buffer. | |
|
180 | * `workSpace` size must be table of >= HIST_WKSP_SIZE_U32 unsigned */ | |
|
181 | size_t HIST_count_wksp(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
182 | const void* source, size_t sourceSize, unsigned* workSpace) | |
|
183 | { | |
|
184 | if (*maxSymbolValuePtr < 255) | |
|
185 | return HIST_count_parallel_wksp(count, maxSymbolValuePtr, source, sourceSize, 1, workSpace); | |
|
186 | *maxSymbolValuePtr = 255; | |
|
187 | return HIST_countFast_wksp(count, maxSymbolValuePtr, source, sourceSize, workSpace); | |
|
188 | } | |
|
189 | ||
|
190 | size_t HIST_count(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
191 | const void* src, size_t srcSize) | |
|
192 | { | |
|
193 | unsigned tmpCounters[HIST_WKSP_SIZE_U32]; | |
|
194 | return HIST_count_wksp(count, maxSymbolValuePtr, src, srcSize, tmpCounters); | |
|
195 | } |
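For reference, HIST_count_simple's contract (fill count[], shrink *maxSymbolValuePtr to the largest symbol actually present, return the highest frequency) can be modeled in a few lines of Python; this is an illustrative sketch, not part of the library:

    def hist_count_simple(src, max_symbol_value=255):
        # count[s] holds the number of occurrences of byte value s.
        count = [0] * (max_symbol_value + 1)
        for b in src:
            assert b <= max_symbol_value
            count[b] += 1
        # Trim to the largest symbol actually seen, as the C code does.
        while max_symbol_value and not count[max_symbol_value]:
            max_symbol_value -= 1
        return count[:max_symbol_value + 1], max(count)

    counts, largest = hist_count_simple(b'abracadabra')
    assert largest == 5  # 'a' occurs five times

HIST_count_parallel_wksp computes the same result but splits the tally across four tables so consecutive increments rarely touch the same counter, which is why it needs the extra workspace.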
@@ -0,0 +1,92 b'' | |||
|
1 | /* ****************************************************************** | |
|
2 | hist : Histogram functions | |
|
3 | part of Finite State Entropy project | |
|
4 | Copyright (C) 2013-present, Yann Collet. | |
|
5 | ||
|
6 | BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) | |
|
7 | ||
|
8 | Redistribution and use in source and binary forms, with or without | |
|
9 | modification, are permitted provided that the following conditions are | |
|
10 | met: | |
|
11 | ||
|
12 | * Redistributions of source code must retain the above copyright | |
|
13 | notice, this list of conditions and the following disclaimer. | |
|
14 | * Redistributions in binary form must reproduce the above | |
|
15 | copyright notice, this list of conditions and the following disclaimer | |
|
16 | in the documentation and/or other materials provided with the | |
|
17 | distribution. | |
|
18 | ||
|
19 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS | |
|
20 | "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT | |
|
21 | LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR | |
|
22 | A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT | |
|
23 | OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, | |
|
24 | SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT | |
|
25 | LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, | |
|
26 | DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY | |
|
27 | THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | |
|
28 | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | |
|
29 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |
|
30 | ||
|
31 | You can contact the author at : | |
|
32 | - FSE source repository : https://github.com/Cyan4973/FiniteStateEntropy | |
|
33 | - Public forum : https://groups.google.com/forum/#!forum/lz4c | |
|
34 | ****************************************************************** */ | |
|
35 | ||
|
36 | /* --- dependencies --- */ | |
|
37 | #include <stddef.h> /* size_t */ | |
|
38 | ||
|
39 | ||
|
40 | /* --- simple histogram functions --- */ | |
|
41 | ||
|
42 | /*! HIST_count(): | |
|
43 | * Provides the precise count of each byte within a table 'count'. | |
|
44 | * 'count' is a table of unsigned int, of minimum size (*maxSymbolValuePtr+1). | |
|
45 | * Updates *maxSymbolValuePtr with actual largest symbol value detected. | |
|
46 | * @return : count of the most frequent symbol (which isn't identified). | |
|
47 | * or an error code, which can be tested using HIST_isError(). | |
|
48 | * note : if return == srcSize, there is only one symbol. | |
|
49 | */ | |
|
50 | size_t HIST_count(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
51 | const void* src, size_t srcSize); | |
|
52 | ||
|
53 | unsigned HIST_isError(size_t code); /**< tells if a return value is an error code */ | |
|
54 | ||
|
55 | ||
|
56 | /* --- advanced histogram functions --- */ | |
|
57 | ||
|
58 | #define HIST_WKSP_SIZE_U32 1024 | |
|
59 | /** HIST_count_wksp() : | |
|
60 | * Same as HIST_count(), but using an externally provided scratch buffer. | |
|
61 | * Benefit is this function will use very little stack space. | |
|
62 | * `workSpace` must be a table of unsigned of size >= HIST_WKSP_SIZE_U32 | |
|
63 | */ | |
|
64 | size_t HIST_count_wksp(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
65 | const void* src, size_t srcSize, | |
|
66 | unsigned* workSpace); | |
|
67 | ||
|
68 | /** HIST_countFast() : | |
|
69 | * same as HIST_count(), but blindly trusts that all byte values within src are <= *maxSymbolValuePtr. | |
|
70 | * This function is unsafe, and will segfault if any value within `src` is `> *maxSymbolValuePtr` | |
|
71 | */ | |
|
72 | size_t HIST_countFast(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
73 | const void* src, size_t srcSize); | |
|
74 | ||
|
75 | /** HIST_countFast_wksp() : | |
|
76 | * Same as HIST_countFast(), but using an externally provided scratch buffer. | |
|
77 | * `workSpace` must be a table of unsigned of size >= HIST_WKSP_SIZE_U32 | |
|
78 | */ | |
|
79 | size_t HIST_countFast_wksp(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
80 | const void* src, size_t srcSize, | |
|
81 | unsigned* workSpace); | |
|
82 | ||
|
83 | /*! HIST_count_simple() : | |
|
84 | * Same as HIST_countFast(), this function is unsafe, | |
|
85 | * and will segfault if any value within `src` is `> *maxSymbolValuePtr`. | |
|
86 | * It is also a bit slower for large inputs. | |
|
87 | * However, it does not need any additional memory (not even on stack). | |
|
88 | * @return : count of the most frequent symbol. | |
|
89 | * Note this function doesn't produce any error (i.e. it must succeed). | |
|
90 | */ | |
|
91 | unsigned HIST_count_simple(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
92 | const void* src, size_t srcSize); |
|
1 | NO CONTENT: new file 100644 | |
|
1 | NO CONTENT: new file 100644 | |
@@ -6,6 +6,7 b' mercurial/cext/osutil.c' | |||
|
6 | 6 | mercurial/cext/revlog.c |
|
7 | 7 | # Vendored code that we should never format: |
|
8 | 8 | contrib/python-zstandard/c-ext/bufferutil.c |
|
9 | contrib/python-zstandard/c-ext/compressionchunker.c | |
|
9 | 10 | contrib/python-zstandard/c-ext/compressiondict.c |
|
10 | 11 | contrib/python-zstandard/c-ext/compressionparams.c |
|
11 | 12 | contrib/python-zstandard/c-ext/compressionreader.c |
@@ -25,6 +26,8 b' contrib/python-zstandard/zstd.c' | |||
|
25 | 26 | contrib/python-zstandard/zstd/common/bitstream.h |
|
26 | 27 | contrib/python-zstandard/zstd/common/compiler.h |
|
27 | 28 | contrib/python-zstandard/zstd/common/cpu.h |
|
29 | contrib/python-zstandard/zstd/common/debug.c | |
|
30 | contrib/python-zstandard/zstd/common/debug.h | |
|
28 | 31 | contrib/python-zstandard/zstd/common/entropy_common.c |
|
29 | 32 | contrib/python-zstandard/zstd/common/error_private.c |
|
30 | 33 | contrib/python-zstandard/zstd/common/error_private.h |
@@ -42,6 +45,8 b' contrib/python-zstandard/zstd/common/zst' | |||
|
42 | 45 | contrib/python-zstandard/zstd/common/zstd_errors.h |
|
43 | 46 | contrib/python-zstandard/zstd/common/zstd_internal.h |
|
44 | 47 | contrib/python-zstandard/zstd/compress/fse_compress.c |
|
48 | contrib/python-zstandard/zstd/compress/hist.c | |
|
49 | contrib/python-zstandard/zstd/compress/hist.h | |
|
45 | 50 | contrib/python-zstandard/zstd/compress/huf_compress.c |
|
46 | 51 | contrib/python-zstandard/zstd/compress/zstd_compress.c |
|
47 | 52 | contrib/python-zstandard/zstd/compress/zstd_compress_internal.h |
@@ -64,8 +69,10 b' contrib/python-zstandard/zstd/deprecated' | |||
|
64 | 69 | contrib/python-zstandard/zstd/deprecated/zbuff_decompress.c |
|
65 | 70 | contrib/python-zstandard/zstd/deprecated/zbuff.h |
|
66 | 71 | contrib/python-zstandard/zstd/dictBuilder/cover.c |
|
72 | contrib/python-zstandard/zstd/dictBuilder/cover.h | |
|
67 | 73 | contrib/python-zstandard/zstd/dictBuilder/divsufsort.c |
|
68 | 74 | contrib/python-zstandard/zstd/dictBuilder/divsufsort.h |
|
75 | contrib/python-zstandard/zstd/dictBuilder/fastcover.c | |
|
69 | 76 | contrib/python-zstandard/zstd/dictBuilder/zdict.c |
|
70 | 77 | contrib/python-zstandard/zstd/dictBuilder/zdict.h |
|
71 | 78 | contrib/python-zstandard/zstd/zstd.h |
@@ -1,7 +1,10 b'' | |||
|
1 | 1 | graft c-ext |
|
2 | graft debian | |
|
2 | 3 | graft zstd |
|
3 | 4 | graft tests |
|
4 | 5 | include make_cffi.py |
|
5 | 6 | include setup_zstd.py |
|
6 | 7 | include zstd.c |
|
8 | include zstd_cffi.py | |
|
7 | 9 | include LICENSE |
|
10 | include NEWS.rst |
@@ -30,6 +30,19 b' Actions Blocking Release' | |||
|
30 | 30 | * Remove low-level compression parameters from ``ZstdCompressor.__init__`` and |
|
31 | 31 | require use of ``CompressionParameters``. |
|
32 | 32 | * Expose ``ZSTD_getFrameProgression()`` from more compressor types. |
|
33 | * Support modifying compression parameters mid operation when supported by | |
|
34 | zstd API. | |
|
35 | * Expose ``ZSTD_CLEVEL_DEFAULT`` constant. | |
|
36 | * Support ``ZSTD_p_forceAttachDict`` compression parameter. | |
|
37 | * Use ``ZSTD_CCtx_getParameter()``/``ZSTD_CCtxParam_getParameter()`` for retrieving | |
|
38 | compression parameters. | |
|
39 | * Consider exposing ``ZSTDMT_toFlushNow()``. | |
|
40 | * Expose ``ZDICT_trainFromBuffer_fastCover()``, | |
|
41 | ``ZDICT_optimizeTrainFromBuffer_fastCover``. | |
|
42 | * Expose and enforce ``ZSTD_minCLevel()`` for minimum compression level. | |
|
43 | * Consider a ``chunker()`` API for decompression. | |
|
44 | * Consider stats for ``chunker()`` API, including finding the last consumed | |
|
45 | offset of input data. | |
|
33 | 46 | |
|
34 | 47 | Other Actions Not Blocking Release |
|
35 | 48 | --------------------------------------- |
@@ -38,6 +51,111 b' Other Actions Not Blocking Release' | |||
|
38 | 51 | * API for ensuring max memory ceiling isn't exceeded. |
|
39 | 52 | * Move off nose for testing. |
|
40 | 53 | |
|
54 | 0.10.1 (released 2018-10-08) | |
|
55 | ============================ | |
|
56 | ||
|
57 | Backwards Compatibility Notes | |
|
58 | ----------------------------- | |
|
59 | ||
|
60 | * ``ZstdCompressor.stream_reader().closed`` is now a property instead of a | |
|
61 | method (#58). | |
|
62 | * ``ZstdDecompressor.stream_reader().closed`` is now a property instead of a | |
|
63 | method (#58). | |
|
64 | ||
|
65 | Changes | |
|
66 | ------- | |
|
67 | ||
|
68 | * Stop attempting to package Python 3.6 for Miniconda. The latest version of | |
|
69 | Miniconda is using Python 3.7. The Python 3.6 Miniconda packages were a lie | |
|
70 | since they were built against Python 3.7. | |
|
71 | * ``ZstdCompressor.stream_reader()``'s and ``ZstdDecompressor.stream_reader()``'s | |
|
72 | ``closed`` attribute is now a read-only property instead of a method. This now | |
|
73 | properly matches the ``IOBase`` API and allows instances to be used in more | |
|
74 | places that accept ``IOBase`` instances. | |
|
75 | ||
|
76 | 0.10.0 (released 2018-10-08) | |
|
77 | ============================ | |
|
78 | ||
|
79 | Backwards Compatibility Notes | |
|
80 | ----------------------------- | |
|
81 | ||
|
82 | * ``ZstdDecompressor.stream_reader().read()`` now consistently requires an | |
|
83 | argument in both the C and CFFI backends. Before, the CFFI implementation | |
|
84 | would assume a default value of ``-1``, which was later rejected. | |
|
85 | * The ``compress_literals`` argument and attribute has been removed from | |
|
86 | ``zstd.ZstdCompressionParameters`` because it was removed by the zstd 1.3.5 | |
|
87 | API. | |
|
88 | * ``ZSTD_CCtx_setParametersUsingCCtxParams()`` is no longer called on every | |
|
89 | operation performed against ``ZstdCompressor`` instances. The reason for this | |
|
90 | change is that the zstd 1.3.5 API no longer allows this without calling | |
|
91 | ``ZSTD_CCtx_resetParameters()`` first. But if we called | |
|
92 | ``ZSTD_CCtx_resetParameters()`` on every operation, we'd have to redo | |
|
93 | potentially expensive setup when using dictionaries. We now call | |
|
94 | ``ZSTD_CCtx_reset()`` on every operation and don't attempt to change | |
|
95 | compression parameters. | |
|
96 | * Objects returned by ``ZstdCompressor.stream_reader()`` no longer need to be | |
|
97 | used as a context manager. The context manager interface still exists and its | |
|
98 | behavior is unchanged. | |
|
99 | * Objects returned by ``ZstdDecompressor.stream_reader()`` no longer need to be | |
|
100 | used as a context manager. The context manager interface still exists and its | |
|
101 | behavior is unchanged. | |
|
102 | ||
|
103 | Bug Fixes | |
|
104 | --------- | |
|
105 | ||
|
106 | * ``ZstdDecompressor.decompressobj().decompress()`` should now return all data | |
|
107 | from internal buffers in more scenarios. Before, it was possible for data to | |
|
108 | remain in internal buffers. This data would be emitted on a subsequent call | |
|
109 | to ``decompress()``. The overall output stream would still be valid. But if | |
|
110 | callers were expecting input data to exactly map to output data (say the | |
|
111 | producer had used ``flush(COMPRESSOBJ_FLUSH_BLOCK)`` and was attempting to | |
|
112 | map input chunks to output chunks), then the previous behavior would be | |
|
113 | wrong. The new behavior is such that output from | |
|
114 | ``flush(COMPRESSOBJ_FLUSH_BLOCK)`` fed into ``decompressobj().decompress()`` | |
|
115 | should produce all of the data that was fed into the compressor. | |
|
116 | * ``ZstdDecompressor.stream_reader().read()`` should no longer segfault after | |
|
117 | a previous context manager resulted in error (#56). | |
|
118 | * ``ZstdCompressor.compressobj().flush(COMPRESSOBJ_FLUSH_BLOCK)`` now returns | |
|
119 | all data necessary to flush a block. Before, it was possible for the | |
|
120 | ``flush()`` to not emit all data necessary to fully represent a block. This | |
|
121 | would mean decompressors wouldn't be able to decompress all data that had been | |
|
122 | fed into the compressor and ``flush()``ed. (#55). | |
|
123 | ||
|
124 | New Features | |
|
125 | ------------ | |
|
126 | ||
|
127 | * New module constants ``BLOCKSIZELOG_MAX``, ``BLOCKSIZE_MAX``, | |
|
128 | ``TARGETLENGTH_MAX`` that expose constants from libzstd. | |
|
129 | * New ``ZstdCompressor.chunker()`` API for manually feeding data into a | |
|
130 | compressor and emitting chunks of a fixed size. Like ``compressobj()``, the | |
|
131 | API doesn't impose restrictions on the input or output types for the | |
|
132 | data streams. Unlike ``compressobj()``, it ensures output chunks are of a | |
|
133 | fixed size. This makes this API useful when the compressed output is being | |
|
134 | fed into an I/O layer, where uniform write sizes are useful. | |
|
135 | * ``ZstdCompressor.stream_reader()`` no longer needs to be used as a context | |
|
136 | manager (#34). | |
|
137 | * ``ZstdDecompressor.stream_reader()`` no longer needs to be used as a context | |
|
138 | manager (#34). | |
|
139 | * Bundled zstandard library upgraded from 1.3.4 to 1.3.6. | |
|
140 | ||
|
141 | Changes | |
|
142 | ------- | |
|
143 | ||
|
144 | * Added ``zstd_cffi.py`` and ``NEWS.rst`` to ``MANIFEST.in``. | |
|
145 | * ``zstandard.__version__`` is now defined (#50). | |
|
146 | * Upgrade pip, setuptools, wheel, and cibuildwheel packages to latest versions. | |
|
147 | * Upgrade various packages used in CI to latest versions. Notably tox (in | |
|
148 | order to support Python 3.7). | |
|
149 | * Use relative paths in setup.py to appease Python 3.7 (#51). | |
|
150 | * Added CI for Python 3.7. | |
|
151 | ||
|
152 | 0.9.1 (released 2018-06-04) | |
|
153 | =========================== | |
|
154 | ||
|
155 | * Debian packaging support. | |
|
156 | * Fix typo in setup.py (#44). | |
|
157 | * Support building with mingw compiler (#46). | |
|
158 | ||
|
41 | 159 | 0.9.0 (released 2018-04-08) |
|
42 | 160 | =========================== |
|
43 | 161 | |
@@ -90,7 +208,7 b' Bug Fixes' | |||
|
90 | 208 | New Features |
|
91 | 209 | ------------ |
|
92 | 210 | |
|
93 | * Bundl
|
211 | * Bundled zstandard library upgraded from 1.1.3 to 1.3.4. This delivers various | |
|
94 | 212 | bug fixes and performance improvements. It also gives us access to newer |
|
95 | 213 | features. |
|
96 | 214 | * Support for negative compression levels. |
@@ -196,6 +196,17 b' Stream Reader API' | |||
|
196 | 196 | |
|
197 | 197 | with open(path, 'rb') as fh: |
|
198 | 198 | cctx = zstd.ZstdCompressor() |
|
199 | reader = cctx.stream_reader(fh) | |
|
200 | while True: | |
|
201 | chunk = reader.read(16384) | |
|
202 | if not chunk: | |
|
203 | break | |
|
204 | ||
|
205 | # Do something with compressed chunk. | |
|
206 | ||
|
207 | Instances can also be used as context managers:: | |
|
208 | ||
|
209 | with open(path, 'rb') as fh: | |
|
199 | 210 | with cctx.stream_reader(fh) as reader: |
|
200 | 211 | while True: |
|
201 | 212 | chunk = reader.read(16384) |
@@ -204,9 +215,9 b' Stream Reader API' | |||
|
204 | 215 | |
|
205 | 216 | # Do something with compressed chunk. |
|
206 | 217 | |
|
207 | The stream can only be read within a context manager. When the context | |
|
208 | manager exits, the stream is closed and the underlying resource is | |
|
209 | released and future operations against the compression stream stream will fail. | |
|
218 | When the context manager exits or ``close()`` is called, the stream is closed, | |
|
219 | underlying resources are released, and future operations against the compression | |
|
220 | stream will fail. | |
|
210 | 221 | |
|
211 | 222 | The ``source`` argument to ``stream_reader()`` can be any object with a |
|
212 | 223 | ``read(size)`` method or any object implementing the *buffer protocol*. |
@@ -419,6 +430,64 b' the compressor::' | |||
|
419 | 430 | data = cobj.compress(b'foobar') |
|
420 | 431 | data = cobj.flush() |
|
421 | 432 | |
|
433 | Chunker API | |
|
434 | ^^^^^^^^^^^ | |
|
435 | ||
|
436 | ``chunker(size=None, chunk_size=COMPRESSION_RECOMMENDED_OUTPUT_SIZE)`` returns | |
|
437 | an object that can be used to iteratively feed chunks of data into a compressor | |
|
438 | and produce output chunks of a uniform size. | |
|
439 | ||
|
440 | The object returned by ``chunker()`` exposes the following methods: | |
|
441 | ||
|
442 | ``compress(data)`` | |
|
443 | Feeds new input data into the compressor. | |
|
444 | ||
|
445 | ``flush()`` | |
|
446 | Flushes all data currently in the compressor. | |
|
447 | ||
|
448 | ``finish()`` | |
|
449 | Signals the end of input data. No new data can be compressed after this | |
|
450 | method is called. | |
|
451 | ||
|
452 | ``compress()``, ``flush()``, and ``finish()`` all return an iterator of | |
|
453 | ``bytes`` instances holding compressed data. The iterator may be empty. Callers | |
|
454 | MUST iterate through all elements of the returned iterator before performing | |
|
455 | another operation on the object. | |
|
456 | ||
|
457 | All chunks emitted by ``compress()`` will have a length of ``chunk_size``. | |
|
458 | ||
|
459 | ``flush()`` and ``finish()`` may return a final chunk smaller than | |
|
460 | ``chunk_size``. | |
|
461 | ||
|
462 | Here is how the API should be used:: | |
|
463 | ||
|
464 | cctx = zstd.ZstdCompressor() | |
|
465 | chunker = cctx.chunker(chunk_size=32768) | |
|
466 | ||
|
467 | with open(path, 'rb') as fh: | |
|
468 | while True: | |
|
469 | in_chunk = fh.read(32768) | |
|
470 | if not in_chunk: | |
|
471 | break | |
|
472 | ||
|
473 | for out_chunk in chunker.compress(in_chunk): | |
|
474 | # Do something with output chunk of size 32768. | |
|
475 | ||
|
476 | for out_chunk in chunker.finish(): | |
|
477 | # Do something with output chunks that finalize the zstd frame. | |
|
478 | ||
|
479 | The ``chunker()`` API is often a better alternative to ``compressobj()``. | |
|
480 | ||
|
481 | ``compressobj()`` will emit output data as it is available. This results in a | |
|
482 | *stream* of output chunks of varying sizes. The consistency of the output chunk | |
|
483 | size with ``chunker()`` is more appropriate for many usages, such as sending | |
|
484 | compressed data to a socket. | |
|
485 | ||
|
486 | ``compressobj()`` may also perform extra memory reallocations in order to | |
|
487 | dynamically adjust the sizes of the output chunks. Since ``chunker()`` output | |
|
488 | chunks are all the same size (except for flushed or final chunks), there is | |
|
489 | less memory allocation overhead. | |
|
490 | ||
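A flush() example is worth showing alongside the compress()/finish() walkthrough above: it pushes buffered data out without ending the frame. A hedged sketch building on the example above (send() is a hypothetical consumer)::

    chunker = cctx.chunker(chunk_size=32768)

    for out_chunk in chunker.compress(b'data available so far'):
        send(out_chunk)

    # Force out whatever is buffered without finalizing the zstd frame.
    for out_chunk in chunker.flush():
        send(out_chunk)  # a flushed chunk may be smaller than chunk_size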
|
422 | 491 | Batch Compression API |
|
423 | 492 | ^^^^^^^^^^^^^^^^^^^^^ |
|
424 | 493 | |
@@ -542,17 +611,24 b' Stream Reader API' | |||
|
542 | 611 | |
|
543 | 612 | with open(path, 'rb') as fh: |
|
544 | 613 | dctx = zstd.ZstdDecompressor() |
|
545 |
|
546 |
|
547 |
|
548 |
|
549 |
|
614 | reader = dctx.stream_reader(fh) | |
|
615 | while True: | |
|
616 | chunk = reader.read(16384) | |
|
617 | if not chunk: | |
|
618 | break | |
|
619 | ||
|
620 | # Do something with decompressed chunk. | |
|
550 | 621 | |
|
551 | # Do something with decompressed chunk. | |
|
622 | The stream can also be used as a context manager:: | |
|
552 | 623 | |
|
553 | The stream can only be read within a context manager. When the context | |
|
554 | manager exits, the stream is closed and the underlying resource is | |
|
555 | released and future operations against the stream will fail. | |
|
624 | with open(path, 'rb') as fh: | |
|
625 | dctx = zstd.ZstdDecompressor() | |
|
626 | with dctx.stream_reader(fh) as reader: | |
|
627 | ... | |
|
628 | ||
|
629 | When used as a context manager, the stream is closed and the underlying | |
|
630 | resources are released when the context manager exits. Future operations against | |
|
631 | the stream will fail. | |
|
556 | 632 | |
|
557 | 633 | The ``source`` argument to ``stream_reader()`` can be any object with a |
|
558 | 634 | ``read(size)`` method or any object implementing the *buffer protocol*. |
@@ -1077,7 +1153,6 b' follows:' | |||
|
1077 | 1153 | * write_dict_id |
|
1078 | 1154 | * job_size |
|
1079 | 1155 | * overlap_size_log |
|
1080 | * compress_literals | |
|
1081 | 1156 | * force_max_window |
|
1082 | 1157 | * enable_ldm |
|
1083 | 1158 | * ldm_hash_log |
@@ -39,7 +39,6 b' int set_parameters(ZSTD_CCtx_params* par' | |||
|
39 | 39 | TRY_SET_PARAMETER(params, ZSTD_p_nbWorkers, obj->threads); |
|
40 | 40 | TRY_SET_PARAMETER(params, ZSTD_p_jobSize, obj->jobSize); |
|
41 | 41 | TRY_SET_PARAMETER(params, ZSTD_p_overlapSizeLog, obj->overlapSizeLog); |
|
42 | TRY_SET_PARAMETER(params, ZSTD_p_compressLiterals, obj->compressLiterals); | |
|
43 | 42 | TRY_SET_PARAMETER(params, ZSTD_p_forceMaxWindow, obj->forceMaxWindow); |
|
44 | 43 | TRY_SET_PARAMETER(params, ZSTD_p_enableLongDistanceMatching, obj->enableLongDistanceMatching); |
|
45 | 44 | TRY_SET_PARAMETER(params, ZSTD_p_ldmHashLog, obj->ldmHashLog); |
@@ -88,7 +87,6 b' static int ZstdCompressionParameters_ini' | |||
|
88 | 87 | "ldm_bucket_size_log", |
|
89 | 88 | "ldm_hash_every_log", |
|
90 | 89 | "threads", |
|
91 | "compress_literals", | |
|
92 | 90 | NULL |
|
93 | 91 | }; |
|
94 | 92 | |
@@ -114,18 +112,13 b' static int ZstdCompressionParameters_ini' | |||
|
114 | 112 | unsigned ldmHashEveryLog = 0; |
|
115 | 113 | int threads = 0; |
|
116 | 114 | |
|
117 | /* Setting value 0 has the effect of disabling. So we use -1 as a default | |
|
118 | * to detect whether to set. Then we automatically derive the expected value | |
|
119 | * based on the level, just like zstandard does itself. */ | |
|
120 | int compressLiterals = -1; | |
|
121 | ||
|
122 | 115 | if (!PyArg_ParseTupleAndKeywords(args, kwargs, |
|
123 | "|IiIIIIIIIIIIIIIIIIIIi
|
116 | "|IiIIIIIIIIIIIIIIIIIIi:CompressionParameters", | |
|
124 | 117 | kwlist, &format, &compressionLevel, &windowLog, &hashLog, &chainLog, |
|
125 | 118 | &searchLog, &minMatch, &targetLength, &compressionStrategy, |
|
126 | 119 | &contentSizeFlag, &checksumFlag, &dictIDFlag, &jobSize, &overlapSizeLog, |
|
127 | 120 | &forceMaxWindow, &enableLDM, &ldmHashLog, &ldmMinMatch, &ldmBucketSizeLog, |
|
128 | &ldmHashEveryLog, &threads
|
121 | &ldmHashEveryLog, &threads)) { | |
|
129 | 122 | return -1; |
|
130 | 123 | } |
|
131 | 124 | |
@@ -133,10 +126,6 b' static int ZstdCompressionParameters_ini' | |||
|
133 | 126 | threads = cpu_count(); |
|
134 | 127 | } |
|
135 | 128 | |
|
136 | if (compressLiterals < 0) { | |
|
137 | compressLiterals = compressionLevel >= 0; | |
|
138 | } | |
|
139 | ||
|
140 | 129 | self->format = format; |
|
141 | 130 | self->compressionLevel = compressionLevel; |
|
142 | 131 | self->windowLog = windowLog; |
@@ -152,7 +141,6 b' static int ZstdCompressionParameters_ini' | |||
|
152 | 141 | self->threads = threads; |
|
153 | 142 | self->jobSize = jobSize; |
|
154 | 143 | self->overlapSizeLog = overlapSizeLog; |
|
155 | self->compressLiterals = compressLiterals; | |
|
156 | 144 | self->forceMaxWindow = forceMaxWindow; |
|
157 | 145 | self->enableLongDistanceMatching = enableLDM; |
|
158 | 146 | self->ldmHashLog = ldmHashLog; |
@@ -299,16 +287,6 b' ZstdCompressionParametersObject* Compres' | |||
|
299 | 287 | Py_DECREF(val); |
|
300 | 288 | } |
|
301 | 289 | |
|
302 | val = PyDict_GetItemString(kwargs, "compress_literals"); | |
|
303 | if (!val) { | |
|
304 | val = PyLong_FromLong(level >= 0 ? 1 : 0); | |
|
305 | if (!val) { | |
|
306 | goto cleanup; | |
|
307 | } | |
|
308 | PyDict_SetItemString(kwargs, "compress_literals", val); | |
|
309 | Py_DECREF(val); | |
|
310 | } | |
|
311 | ||
|
312 | 290 | result = PyObject_New(ZstdCompressionParametersObject, &ZstdCompressionParametersType); |
|
313 | 291 | if (!result) { |
|
314 | 292 | goto cleanup; |
@@ -420,9 +398,6 b' static PyMemberDef ZstdCompressionParame' | |||
|
420 | 398 | { "overlap_size_log", T_UINT, |
|
421 | 399 | offsetof(ZstdCompressionParametersObject, overlapSizeLog), READONLY, |
|
422 | 400 | "Size of previous input reloaded at the beginning of each job" }, |
|
423 | { "compress_literals", T_UINT, | |
|
424 | offsetof(ZstdCompressionParametersObject, compressLiterals), READONLY, | |
|
425 | "whether Huffman compression of literals is in use" }, | |
|
426 | 401 | { "force_max_window", T_UINT, |
|
427 | 402 | offsetof(ZstdCompressionParametersObject, forceMaxWindow), READONLY, |
|
428 | 403 | "force back references to remain smaller than window size" }, |
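With compress_literals gone from both the keyword list and the member table, parameters are simply constructed without it. An illustrative sketch against the Python API documented in this series (keyword names taken from the README's parameter list):

    import zstandard as zstd

    params = zstd.ZstdCompressionParameters(threads=2, enable_ldm=1)
    cctx = zstd.ZstdCompressor(compression_params=params)

    # compress_literals is no longer a recognized keyword:
    try:
        zstd.ZstdCompressionParameters(compress_literals=1)
    except TypeError:
        pass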
@@ -43,20 +43,11 b' static void reader_dealloc(ZstdCompressi' | |||
|
43 | 43 | } |
|
44 | 44 | |
|
45 | 45 | static ZstdCompressionReader* reader_enter(ZstdCompressionReader* self) { |
|
46 | size_t zresult; | |
|
47 | ||
|
48 | 46 | if (self->entered) { |
|
49 | 47 | PyErr_SetString(PyExc_ValueError, "cannot __enter__ multiple times"); |
|
50 | 48 | return NULL; |
|
51 | 49 | } |
|
52 | 50 | |
|
53 | zresult = ZSTD_CCtx_setPledgedSrcSize(self->compressor->cctx, self->sourceSize); | |
|
54 | if (ZSTD_isError(zresult)) { | |
|
55 | PyErr_Format(ZstdError, "error setting source size: %s", | |
|
56 | ZSTD_getErrorName(zresult)); | |
|
57 | return NULL; | |
|
58 | } | |
|
59 | ||
|
60 | 51 | self->entered = 1; |
|
61 | 52 | |
|
62 | 53 | Py_INCREF(self); |
@@ -132,15 +123,6 b' static PyObject* reader_close(ZstdCompre' | |||
|
132 | 123 | Py_RETURN_NONE; |
|
133 | 124 | } |
|
134 | 125 | |
|
135 | static PyObject* reader_closed(ZstdCompressionReader* self) { | |
|
136 | if (self->closed) { | |
|
137 | Py_RETURN_TRUE; | |
|
138 | } | |
|
139 | else { | |
|
140 | Py_RETURN_FALSE; | |
|
141 | } | |
|
142 | } | |
|
143 | ||
|
144 | 126 | static PyObject* reader_tell(ZstdCompressionReader* self) { |
|
145 | 127 | /* TODO should this raise OSError since stream isn't seekable? */ |
|
146 | 128 | return PyLong_FromUnsignedLongLong(self->bytesCompressed); |
@@ -159,11 +141,6 b' static PyObject* reader_read(ZstdCompres' | |||
|
159 | 141 | size_t zresult; |
|
160 | 142 | size_t oldPos; |
|
161 | 143 | |
|
162 | if (!self->entered) { | |
|
163 | PyErr_SetString(ZstdError, "read() must be called from an active context manager"); | |
|
164 | return NULL; | |
|
165 | } | |
|
166 | ||
|
167 | 144 | if (self->closed) { |
|
168 | 145 | PyErr_SetString(PyExc_ValueError, "stream is closed"); |
|
169 | 146 | return NULL; |
@@ -333,8 +310,6 b' static PyMethodDef reader_methods[] = {' | |||
|
333 | 310 | PyDoc_STR("Exit a compression context") }, |
|
334 | 311 | { "close", (PyCFunction)reader_close, METH_NOARGS, |
|
335 | 312 | PyDoc_STR("Close the stream so it cannot perform any more operations") }, |
|
336 | { "closed", (PyCFunction)reader_closed, METH_NOARGS, | |
|
337 | PyDoc_STR("Whether stream is closed") }, | |
|
338 | 313 | { "flush", (PyCFunction)reader_flush, METH_NOARGS, PyDoc_STR("no-ops") }, |
|
339 | 314 | { "isatty", (PyCFunction)reader_isatty, METH_NOARGS, PyDoc_STR("Returns False") }, |
|
340 | 315 | { "readable", (PyCFunction)reader_readable, METH_NOARGS, |
@@ -354,6 +329,12 b' static PyMethodDef reader_methods[] = {' | |||
|
354 | 329 | { NULL, NULL } |
|
355 | 330 | }; |
|
356 | 331 | |
|
332 | static PyMemberDef reader_members[] = { | |
|
333 | { "closed", T_BOOL, offsetof(ZstdCompressionReader, closed), | |
|
334 | READONLY, "whether stream is closed" }, | |
|
335 | { NULL } | |
|
336 | }; | |
|
337 | ||
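
For reference, this hunk turns `closed` from a method into a read-only T_BOOL member, so Python callers now read it as an attribute, in line with io.RawIOBase. A minimal sketch of the resulting usage, assuming the bundled zstd module:

    import zstd

    cctx = zstd.ZstdCompressor()
    reader = cctx.stream_reader(b'foo')
    assert reader.closed is False  # attribute access now, not reader.closed()
    reader.close()
    assert reader.closed is True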
|
357 | 338 | PyTypeObject ZstdCompressionReaderType = { |
|
358 | 339 | PyVarObject_HEAD_INIT(NULL, 0) |
|
359 | 340 | "zstd.ZstdCompressionReader", /* tp_name */ |
@@ -383,7 +364,7 b' PyTypeObject ZstdCompressionReaderType =' | |||
|
383 | 364 | reader_iter, /* tp_iter */ |
|
384 | 365 | reader_iternext, /* tp_iternext */ |
|
385 | 366 | reader_methods, /* tp_methods */ |
|
386 | 0, /* tp_members */ |

367 | reader_members, /* tp_members */ | |
|
387 | 368 | 0, /* tp_getset */ |
|
388 | 369 | 0, /* tp_base */ |
|
389 | 370 | 0, /* tp_dict */ |
@@ -222,10 +222,6 b' static PyObject* ZstdCompressionWriter_f' | |||
|
222 | 222 | return NULL; |
|
223 | 223 | } |
|
224 | 224 | |
|
225 | if (!output.pos) { | |
|
226 | break; | |
|
227 | } | |
|
228 | ||
|
229 | 225 | /* Copy data from output buffer to writer. */ |
|
230 | 226 | if (output.pos) { |
|
231 | 227 | #if PY_MAJOR_VERSION >= 3 |
@@ -238,7 +234,12 b' static PyObject* ZstdCompressionWriter_f' | |||
|
238 | 234 | totalWrite += output.pos; |
|
239 | 235 | self->bytesCompressed += output.pos; |
|
240 | 236 | } |
|
237 | ||
|
241 | 238 | output.pos = 0; |
|
239 | ||
|
240 | if (!zresult) { | |
|
241 | break; | |
|
242 | } | |
|
242 | 243 | } |
|
243 | 244 | |
|
244 | 245 | PyMem_Free(output.dst); |
@@ -115,6 +115,7 b' static PyObject* ZstdCompressionObj_flus' | |||
|
115 | 115 | PyObject* result = NULL; |
|
116 | 116 | Py_ssize_t resultSize = 0; |
|
117 | 117 | ZSTD_inBuffer input; |
|
118 | ZSTD_EndDirective zFlushMode; | |
|
118 | 119 | |
|
119 | 120 | if (!PyArg_ParseTupleAndKeywords(args, kwargs, "|i:flush", kwlist, &flushMode)) { |
|
120 | 121 | return NULL; |
@@ -130,52 +131,34 b' static PyObject* ZstdCompressionObj_flus' | |||
|
130 | 131 | return NULL; |
|
131 | 132 | } |
|
132 | 133 | |
|
134 | switch (flushMode) { | |
|
135 | case compressorobj_flush_block: | |
|
136 | zFlushMode = ZSTD_e_flush; | |
|
137 | break; | |
|
138 | ||
|
139 | case compressorobj_flush_finish: | |
|
140 | zFlushMode = ZSTD_e_end; | |
|
141 | self->finished = 1; | |
|
142 | break; | |
|
143 | ||
|
144 | default: | |
|
145 | PyErr_SetString(ZstdError, "unhandled flush mode"); | |
|
146 | return NULL; | |
|
147 | } | |
|
148 | ||
|
133 | 149 | assert(self->output.pos == 0); |
|
134 | 150 | |
|
135 | 151 | input.src = NULL; |
|
136 | 152 | input.size = 0; |
|
137 | 153 | input.pos = 0; |
|
138 | 154 | |
|
139 | if (flushMode == compressorobj_flush_block) { | |
|
140 | /* The output buffer is of size ZSTD_CStreamOutSize(), which is | |
|
141 | guaranteed to hold a full block. */ | |
|
155 | while (1) { | |
|
142 | 156 | Py_BEGIN_ALLOW_THREADS |
|
143 | zresult = ZSTD_compress_generic(self->compressor->cctx, &self->output, |

144 | &input, ZSTD_e_flush); |

157 | zresult = ZSTD_compress_generic(self->compressor->cctx, &self->output, | |
|
158 | &input, zFlushMode); | |
|
145 | 159 | Py_END_ALLOW_THREADS |
|
146 | 160 | |
|
147 | 161 | if (ZSTD_isError(zresult)) { |
|
148 | PyErr_Format(ZstdError, "zstd compress error: %s", ZSTD_getErrorName(zresult)); | |
|
149 | return NULL; | |
|
150 | } | |
|
151 | ||
|
152 | /* Output buffer is guaranteed to hold full block. */ | |
|
153 | assert(zresult == 0); | |
|
154 | ||
|
155 | if (self->output.pos) { | |
|
156 | result = PyBytes_FromStringAndSize(self->output.dst, self->output.pos); | |
|
157 | if (!result) { | |
|
158 | return NULL; | |
|
159 | } | |
|
160 | } | |
|
161 | ||
|
162 | self->output.pos = 0; | |
|
163 | ||
|
164 | if (result) { | |
|
165 | return result; | |
|
166 | } | |
|
167 | else { | |
|
168 | return PyBytes_FromString(""); | |
|
169 | } | |
|
170 | } | |
|
171 | ||
|
172 | assert(flushMode == compressorobj_flush_finish); | |
|
173 | self->finished = 1; | |
|
174 | ||
|
175 | while (1) { | |
|
176 | zresult = ZSTD_compress_generic(self->compressor->cctx, &self->output, | |
|
177 | &input, ZSTD_e_end); | |
|
178 | if (ZSTD_isError(zresult)) { | |
|
179 | 162 | PyErr_Format(ZstdError, "error ending compression stream: %s", |
|
180 | 163 | ZSTD_getErrorName(zresult)); |
|
181 | 164 | return NULL; |
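
The rewritten flush() above folds the block and finish paths into one ZSTD_compress_generic() loop selected by zFlushMode. A hedged Python-level sketch of the two flush modes, mirroring the compressobj tests updated later in this change:

    import zstd

    cctx = zstd.ZstdCompressor()
    cobj = cctx.compressobj()
    cobj.compress(b'foo' * 1024)                      # may return b''; input is buffered
    block = cobj.flush(zstd.COMPRESSOBJ_FLUSH_BLOCK)  # emit buffered data; frame stays open
    tail = cobj.flush()                               # default COMPRESSOBJ_FLUSH_FINISH ends the frame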
@@ -11,15 +11,13 b'' | |||
|
11 | 11 | |
|
12 | 12 | extern PyObject* ZstdError; |
|
13 | 13 | |
|
14 | int ensure_cctx(ZstdCompressor* compressor) { |

14 | int setup_cctx(ZstdCompressor* compressor) { | |
|
15 | 15 | size_t zresult; |
|
16 | 16 | |
|
17 | 17 | assert(compressor); |
|
18 | 18 | assert(compressor->cctx); |
|
19 | 19 | assert(compressor->params); |
|
20 | 20 | |
|
21 | ZSTD_CCtx_reset(compressor->cctx); | |
|
22 | ||
|
23 | 21 | zresult = ZSTD_CCtx_setParametersUsingCCtxParams(compressor->cctx, compressor->params); |
|
24 | 22 | if (ZSTD_isError(zresult)) { |
|
25 | 23 | PyErr_Format(ZstdError, "could not set compression parameters: %s", |
@@ -237,9 +235,9 b' static int ZstdCompressor_init(ZstdCompr' | |||
|
237 | 235 | Py_INCREF(dict); |
|
238 | 236 | } |
|
239 | 237 | |
|
240 | if (ensure_cctx(self)) { |

241 | return -1; |

242 | } |
|
238 | if (setup_cctx(self)) { | |
|
239 | return -1; | |
|
240 | } | |
|
243 | 241 | |
|
244 | 242 | return 0; |
|
245 | 243 | } |
@@ -346,9 +344,7 b' static PyObject* ZstdCompressor_copy_str' | |||
|
346 | 344 | return NULL; |
|
347 | 345 | } |
|
348 | 346 | |
|
349 | if (ensure_cctx(self)) { | |
|
350 | return NULL; | |
|
351 | } | |
|
347 | ZSTD_CCtx_reset(self->cctx); | |
|
352 | 348 | |
|
353 | 349 | zresult = ZSTD_CCtx_setPledgedSrcSize(self->cctx, sourceSize); |
|
354 | 350 | if (ZSTD_isError(zresult)) { |
@@ -489,6 +485,7 b' static ZstdCompressionReader* ZstdCompre' | |||
|
489 | 485 | unsigned long long sourceSize = ZSTD_CONTENTSIZE_UNKNOWN; |
|
490 | 486 | size_t readSize = ZSTD_CStreamInSize(); |
|
491 | 487 | ZstdCompressionReader* result = NULL; |
|
488 | size_t zresult; | |
|
492 | 489 | |
|
493 | 490 | if (!PyArg_ParseTupleAndKeywords(args, kwargs, "O|Kk:stream_reader", kwlist, |
|
494 | 491 | &source, &sourceSize, &readSize)) { |
@@ -520,13 +517,17 b' static ZstdCompressionReader* ZstdCompre' | |||
|
520 | 517 | goto except; |
|
521 | 518 | } |
|
522 | 519 | |
|
523 | if (ensure_cctx(self)) { | |
|
520 | ZSTD_CCtx_reset(self->cctx); | |
|
521 | ||
|
522 | zresult = ZSTD_CCtx_setPledgedSrcSize(self->cctx, sourceSize); | |
|
523 | if (ZSTD_isError(zresult)) { | |
|
524 | PyErr_Format(ZstdError, "error setting source size: %s", |
|
525 | ZSTD_getErrorName(zresult)); | |
|
524 | 526 | goto except; |
|
525 | 527 | } |
|
526 | 528 | |
|
527 | 529 | result->compressor = self; |
|
528 | 530 | Py_INCREF(self); |
|
529 | result->sourceSize = sourceSize; | |
|
530 | 531 | |
|
531 | 532 | return result; |
|
532 | 533 | |
@@ -576,9 +577,7 b' static PyObject* ZstdCompressor_compress' | |||
|
576 | 577 | goto finally; |
|
577 | 578 | } |
|
578 | 579 | |
|
579 | if (ensure_cctx(self)) { | |
|
580 | goto finally; | |
|
581 | } | |
|
580 | ZSTD_CCtx_reset(self->cctx); | |
|
582 | 581 | |
|
583 | 582 | destSize = ZSTD_compressBound(source.len); |
|
584 | 583 | output = PyBytes_FromStringAndSize(NULL, destSize); |
@@ -652,9 +651,7 b' static ZstdCompressionObj* ZstdCompresso' | |||
|
652 | 651 | return NULL; |
|
653 | 652 | } |
|
654 | 653 | |
|
655 | if (ensure_cctx(self)) { | |
|
656 | return NULL; | |
|
657 | } | |
|
654 | ZSTD_CCtx_reset(self->cctx); | |
|
658 | 655 | |
|
659 | 656 | zresult = ZSTD_CCtx_setPledgedSrcSize(self->cctx, inSize); |
|
660 | 657 | if (ZSTD_isError(zresult)) { |
@@ -743,9 +740,7 b' static ZstdCompressorIterator* ZstdCompr' | |||
|
743 | 740 | goto except; |
|
744 | 741 | } |
|
745 | 742 | |
|
746 | if (ensure_cctx(self)) { | |
|
747 | return NULL; | |
|
748 | } | |
|
743 | ZSTD_CCtx_reset(self->cctx); | |
|
749 | 744 | |
|
750 | 745 | zresult = ZSTD_CCtx_setPledgedSrcSize(self->cctx, sourceSize); |
|
751 | 746 | if (ZSTD_isError(zresult)) { |
@@ -817,9 +812,7 b' static ZstdCompressionWriter* ZstdCompre' | |||
|
817 | 812 | return NULL; |
|
818 | 813 | } |
|
819 | 814 | |
|
820 | if (ensure_cctx(self)) { | |
|
821 | return NULL; | |
|
822 | } | |
|
815 | ZSTD_CCtx_reset(self->cctx); | |
|
823 | 816 | |
|
824 | 817 | result = (ZstdCompressionWriter*)PyObject_CallObject((PyObject*)&ZstdCompressionWriterType, NULL); |
|
825 | 818 | if (!result) { |
@@ -839,6 +832,58 b' static ZstdCompressionWriter* ZstdCompre' | |||
|
839 | 832 | return result; |
|
840 | 833 | } |
|
841 | 834 | |
|
835 | PyDoc_STRVAR(ZstdCompressor_chunker__doc__, | |
|
836 | "Create an object for iterative compressing to same-sized chunks.\n" | |
|
837 | ); | |
|
838 | ||
|
839 | static ZstdCompressionChunker* ZstdCompressor_chunker(ZstdCompressor* self, PyObject* args, PyObject* kwargs) { | |
|
840 | static char* kwlist[] = { | |
|
841 | "size", | |
|
842 | "chunk_size", | |
|
843 | NULL | |
|
844 | }; | |
|
845 | ||
|
846 | unsigned long long sourceSize = ZSTD_CONTENTSIZE_UNKNOWN; | |
|
847 | size_t chunkSize = ZSTD_CStreamOutSize(); | |
|
848 | ZstdCompressionChunker* chunker; | |
|
849 | size_t zresult; | |
|
850 | ||
|
851 | if (!PyArg_ParseTupleAndKeywords(args, kwargs, "|Kk:chunker", kwlist, | |
|
852 | &sourceSize, &chunkSize)) { | |
|
853 | return NULL; | |
|
854 | } | |
|
855 | ||
|
856 | ZSTD_CCtx_reset(self->cctx); | |
|
857 | ||
|
858 | zresult = ZSTD_CCtx_setPledgedSrcSize(self->cctx, sourceSize); | |
|
859 | if (ZSTD_isError(zresult)) { | |
|
860 | PyErr_Format(ZstdError, "error setting source size: %s", | |
|
861 | ZSTD_getErrorName(zresult)); | |
|
862 | return NULL; | |
|
863 | } | |
|
864 | ||
|
865 | chunker = (ZstdCompressionChunker*)PyObject_CallObject((PyObject*)&ZstdCompressionChunkerType, NULL); | |
|
866 | if (!chunker) { | |
|
867 | return NULL; | |
|
868 | } | |
|
869 | ||
|
870 | chunker->output.dst = PyMem_Malloc(chunkSize); | |
|
871 | if (!chunker->output.dst) { | |
|
872 | PyErr_NoMemory(); | |
|
873 | Py_DECREF(chunker); | |
|
874 | return NULL; | |
|
875 | } | |
|
876 | chunker->output.size = chunkSize; | |
|
877 | chunker->output.pos = 0; | |
|
878 | ||
|
879 | chunker->compressor = self; | |
|
880 | Py_INCREF(chunker->compressor); | |
|
881 | ||
|
882 | chunker->chunkSize = chunkSize; | |
|
883 | ||
|
884 | return chunker; | |
|
885 | } | |
|
886 | ||
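
The chunker() method added above returns an object whose compress(), flush(), and finish() each yield an iterator of chunk_size-byte chunks; only the final chunk may be shorter. A minimal usage sketch, consistent with the tests added further down:

    import zstd

    cctx = zstd.ZstdCompressor()
    chunker = cctx.chunker(chunk_size=32768)

    chunks = []
    for data in (b'foo' * 8192, b'bar' * 8192):
        chunks.extend(chunker.compress(data))  # yields only complete 32768-byte chunks
    chunks.extend(chunker.finish())            # drain the remainder and end the frame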
|
842 | 887 | typedef struct { |
|
843 | 888 | void* sourceData; |
|
844 | 889 | size_t sourceSize; |
@@ -1524,6 +1569,8 b' finally:' | |||
|
1524 | 1569 | } |
|
1525 | 1570 | |
|
1526 | 1571 | static PyMethodDef ZstdCompressor_methods[] = { |
|
1572 | { "chunker", (PyCFunction)ZstdCompressor_chunker, | |
|
1573 | METH_VARARGS | METH_KEYWORDS, ZstdCompressor_chunker__doc__ }, | |
|
1527 | 1574 | { "compress", (PyCFunction)ZstdCompressor_compress, |
|
1528 | 1575 | METH_VARARGS | METH_KEYWORDS, ZstdCompressor_compress__doc__ }, |
|
1529 | 1576 | { "compressobj", (PyCFunction)ZstdCompressor_compressobj, |
@@ -27,7 +27,6 b' void constants_module_init(PyObject* mod' | |||
|
27 | 27 | #else |
|
28 | 28 | version = PyString_FromString(PYTHON_ZSTANDARD_VERSION); |
|
29 | 29 | #endif |
|
30 | Py_INCREF(version); | |
|
31 | 30 | PyModule_AddObject(mod, "__version__", version); |
|
32 | 31 | |
|
33 | 32 | ZstdError = PyErr_NewException("zstd.ZstdError", NULL, NULL); |
@@ -41,7 +40,6 b' void constants_module_init(PyObject* mod' | |||
|
41 | 40 | PyTuple_SetItem(zstdVersion, 0, PyLong_FromLong(ZSTD_VERSION_MAJOR)); |
|
42 | 41 | PyTuple_SetItem(zstdVersion, 1, PyLong_FromLong(ZSTD_VERSION_MINOR)); |
|
43 | 42 | PyTuple_SetItem(zstdVersion, 2, PyLong_FromLong(ZSTD_VERSION_RELEASE)); |
|
44 | Py_INCREF(zstdVersion); | |
|
45 | 43 | PyModule_AddObject(mod, "ZSTD_VERSION", zstdVersion); |
|
46 | 44 | |
|
47 | 45 | frameHeader = PyBytes_FromStringAndSize(frame_header, sizeof(frame_header)); |
@@ -68,6 +66,8 b' void constants_module_init(PyObject* mod' | |||
|
68 | 66 | (long)ZSTD_DStreamOutSize()); |
|
69 | 67 | |
|
70 | 68 | PyModule_AddIntConstant(mod, "MAGIC_NUMBER", ZSTD_MAGICNUMBER); |
|
69 | PyModule_AddIntConstant(mod, "BLOCKSIZELOG_MAX", ZSTD_BLOCKSIZELOG_MAX); | |
|
70 | PyModule_AddIntConstant(mod, "BLOCKSIZE_MAX", ZSTD_BLOCKSIZE_MAX); | |
|
71 | 71 | PyModule_AddIntConstant(mod, "WINDOWLOG_MIN", ZSTD_WINDOWLOG_MIN); |
|
72 | 72 | PyModule_AddIntConstant(mod, "WINDOWLOG_MAX", ZSTD_WINDOWLOG_MAX); |
|
73 | 73 | PyModule_AddIntConstant(mod, "CHAINLOG_MIN", ZSTD_CHAINLOG_MIN); |
@@ -80,6 +80,7 b' void constants_module_init(PyObject* mod' | |||
|
80 | 80 | PyModule_AddIntConstant(mod, "SEARCHLENGTH_MIN", ZSTD_SEARCHLENGTH_MIN); |
|
81 | 81 | PyModule_AddIntConstant(mod, "SEARCHLENGTH_MAX", ZSTD_SEARCHLENGTH_MAX); |
|
82 | 82 | PyModule_AddIntConstant(mod, "TARGETLENGTH_MIN", ZSTD_TARGETLENGTH_MIN); |
|
83 | PyModule_AddIntConstant(mod, "TARGETLENGTH_MAX", ZSTD_TARGETLENGTH_MAX); | |
|
83 | 84 | PyModule_AddIntConstant(mod, "LDM_MINMATCH_MIN", ZSTD_LDM_MINMATCH_MIN); |
|
84 | 85 | PyModule_AddIntConstant(mod, "LDM_MINMATCH_MAX", ZSTD_LDM_MINMATCH_MAX); |
|
85 | 86 | PyModule_AddIntConstant(mod, "LDM_BUCKETSIZELOG_MAX", ZSTD_LDM_BUCKETSIZELOG_MAX); |
@@ -47,10 +47,6 b' static ZstdDecompressionReader* reader_e' | |||
|
47 | 47 | return NULL; |
|
48 | 48 | } |
|
49 | 49 | |
|
50 | if (ensure_dctx(self->decompressor, 1)) { | |
|
51 | return NULL; | |
|
52 | } | |
|
53 | ||
|
54 | 50 | self->entered = 1; |
|
55 | 51 | |
|
56 | 52 | Py_INCREF(self); |
@@ -98,15 +94,6 b' static PyObject* reader_close(ZstdDecomp' | |||
|
98 | 94 | Py_RETURN_NONE; |
|
99 | 95 | } |
|
100 | 96 | |
|
101 | static PyObject* reader_closed(ZstdDecompressionReader* self) { | |
|
102 | if (self->closed) { | |
|
103 | Py_RETURN_TRUE; | |
|
104 | } | |
|
105 | else { | |
|
106 | Py_RETURN_FALSE; | |
|
107 | } | |
|
108 | } | |
|
109 | ||
|
110 | 97 | static PyObject* reader_flush(PyObject* self) { |
|
111 | 98 | Py_RETURN_NONE; |
|
112 | 99 | } |
@@ -128,11 +115,6 b' static PyObject* reader_read(ZstdDecompr' | |||
|
128 | 115 | ZSTD_outBuffer output; |
|
129 | 116 | size_t zresult; |
|
130 | 117 | |
|
131 | if (!self->entered) { | |
|
132 | PyErr_SetString(ZstdError, "read() must be called from an active context manager"); | |
|
133 | return NULL; | |
|
134 | } | |
|
135 | ||
|
136 | 118 | if (self->closed) { |
|
137 | 119 | PyErr_SetString(PyExc_ValueError, "stream is closed"); |
|
138 | 120 | return NULL; |
@@ -281,11 +263,6 b' static PyObject* reader_seek(ZstdDecompr' | |||
|
281 | 263 | unsigned long long readAmount = 0; |
|
282 | 264 | size_t defaultOutSize = ZSTD_DStreamOutSize(); |
|
283 | 265 | |
|
284 | if (!self->entered) { | |
|
285 | PyErr_SetString(ZstdError, "seek() must be called from an active context manager"); | |
|
286 | return NULL; | |
|
287 | } | |
|
288 | ||
|
289 | 266 | if (self->closed) { |
|
290 | 267 | PyErr_SetString(PyExc_ValueError, "stream is closed"); |
|
291 | 268 | return NULL; |
@@ -384,8 +361,6 b' static PyMethodDef reader_methods[] = {' | |||
|
384 | 361 | PyDoc_STR("Exit a compression context") }, |
|
385 | 362 | { "close", (PyCFunction)reader_close, METH_NOARGS, |
|
386 | 363 | PyDoc_STR("Close the stream so it cannot perform any more operations") }, |
|
387 | { "closed", (PyCFunction)reader_closed, METH_NOARGS, | |
|
388 | PyDoc_STR("Whether stream is closed") }, | |
|
389 | 364 | { "flush", (PyCFunction)reader_flush, METH_NOARGS, PyDoc_STR("no-ops") }, |
|
390 | 365 | { "isatty", (PyCFunction)reader_isatty, METH_NOARGS, PyDoc_STR("Returns False") }, |
|
391 | 366 | { "readable", (PyCFunction)reader_readable, METH_NOARGS, |
@@ -407,6 +382,12 b' static PyMethodDef reader_methods[] = {' | |||
|
407 | 382 | { NULL, NULL } |
|
408 | 383 | }; |
|
409 | 384 | |
|
385 | static PyMemberDef reader_members[] = { | |
|
386 | { "closed", T_BOOL, offsetof(ZstdDecompressionReader, closed), | |
|
387 | READONLY, "whether stream is closed" }, | |
|
388 | { NULL } | |
|
389 | }; | |
|
390 | ||
|
410 | 391 | PyTypeObject ZstdDecompressionReaderType = { |
|
411 | 392 | PyVarObject_HEAD_INIT(NULL, 0) |
|
412 | 393 | "zstd.ZstdDecompressionReader", /* tp_name */ |
@@ -436,7 +417,7 b' PyTypeObject ZstdDecompressionReaderType' | |||
|
436 | 417 | reader_iter, /* tp_iter */ |
|
437 | 418 | reader_iternext, /* tp_iternext */ |
|
438 | 419 | reader_methods, /* tp_methods */ |
|
439 | 0, /* tp_members */ |

420 | reader_members, /* tp_members */ | |
|
440 | 421 | 0, /* tp_getset */ |
|
441 | 422 | 0, /* tp_base */ |
|
442 | 423 | 0, /* tp_dict */ |
@@ -33,6 +33,8 b' static PyObject* DecompressionObj_decomp' | |||
|
33 | 33 | PyObject* result = NULL; |
|
34 | 34 | Py_ssize_t resultSize = 0; |
|
35 | 35 | |
|
36 | output.dst = NULL; | |
|
37 | ||
|
36 | 38 | if (self->finished) { |
|
37 | 39 | PyErr_SetString(ZstdError, "cannot use a decompressobj multiple times"); |
|
38 | 40 | return NULL; |
@@ -53,6 +55,12 b' static PyObject* DecompressionObj_decomp' | |||
|
53 | 55 | goto finally; |
|
54 | 56 | } |
|
55 | 57 | |
|
58 | /* Special case of empty input. Output will always be empty. */ | |
|
59 | if (source.len == 0) { | |
|
60 | result = PyBytes_FromString(""); | |
|
61 | goto finally; | |
|
62 | } | |
|
63 | ||
|
56 | 64 | input.src = source.buf; |
|
57 | 65 | input.size = source.len; |
|
58 | 66 | input.pos = 0; |
@@ -65,8 +73,7 b' static PyObject* DecompressionObj_decomp' | |||
|
65 | 73 | output.size = self->outSize; |
|
66 | 74 | output.pos = 0; |
|
67 | 75 | |
|
68 | /* Read input until exhausted. */ | |
|
69 | while (input.pos < input.size) { | |
|
76 | while (1) { | |
|
70 | 77 | Py_BEGIN_ALLOW_THREADS |
|
71 | 78 | zresult = ZSTD_decompress_generic(self->decompressor->dctx, &output, &input); |
|
72 | 79 | Py_END_ALLOW_THREADS |
@@ -98,9 +105,13 b' static PyObject* DecompressionObj_decomp' | |||
|
98 | 105 | goto except; |
|
99 | 106 | } |
|
100 | 107 | } |
|
108 | } | |
|
101 | 109 | |
|
102 | output.pos = 0; | |
|
110 | if (zresult == 0 || (input.pos == input.size && output.pos == 0)) { | |
|
111 | break; | |
|
103 | 112 | } |
|
113 | ||
|
114 | output.pos = 0; | |
|
104 | 115 | } |
|
105 | 116 | |
|
106 | 117 | if (!result) { |
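
With the empty-input special case above, decompress(b'') now returns b'' before the decompression loop runs. An illustrative sketch; `frame` stands in for some hypothetical compressed input:

    import zstd

    dctx = zstd.ZstdDecompressor()
    dobj = dctx.decompressobj()
    assert dobj.decompress(b'') == b''  # fast path: no ZSTD_decompress_generic call
    out = dobj.decompress(frame)        # normal path loops until input is consumed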
@@ -575,6 +575,10 b' static ZstdDecompressionReader* Decompre' | |||
|
575 | 575 | return NULL; |
|
576 | 576 | } |
|
577 | 577 | |
|
578 | if (ensure_dctx(self, 1)) { | |
|
579 | return NULL; | |
|
580 | } | |
|
581 | ||
|
578 | 582 | result = (ZstdDecompressionReader*)PyObject_CallObject((PyObject*)&ZstdDecompressionReaderType, NULL); |
|
579 | 583 | if (NULL == result) { |
|
580 | 584 | return NULL; |
@@ -15,7 +15,8 b'' | |||
|
15 | 15 | #include <zstd.h> |
|
16 | 16 | #include <zdict.h> |
|
17 | 17 | |
|
18 | #define PYTHON_ZSTANDARD_VERSION "0.9.0" | |
|
18 | /* Remember to change the string in zstandard/__init__ as well */ |
|
19 | #define PYTHON_ZSTANDARD_VERSION "0.10.1" | |
|
19 | 20 | |
|
20 | 21 | typedef enum { |
|
21 | 22 | compressorobj_flush_finish, |
@@ -45,7 +46,6 b' typedef struct {' | |||
|
45 | 46 | unsigned threads; |
|
46 | 47 | unsigned jobSize; |
|
47 | 48 | unsigned overlapSizeLog; |
|
48 | unsigned compressLiterals; | |
|
49 | 49 | unsigned forceMaxWindow; |
|
50 | 50 | unsigned enableLongDistanceMatching; |
|
51 | 51 | unsigned ldmHashLog; |
@@ -162,7 +162,6 b' typedef struct {' | |||
|
162 | 162 | ZstdCompressor* compressor; |
|
163 | 163 | PyObject* reader; |
|
164 | 164 | Py_buffer buffer; |
|
165 | unsigned long long sourceSize; | |
|
166 | 165 | size_t readSize; |
|
167 | 166 | |
|
168 | 167 | int entered; |
@@ -181,6 +180,34 b' extern PyTypeObject ZstdCompressionReade' | |||
|
181 | 180 | typedef struct { |
|
182 | 181 | PyObject_HEAD |
|
183 | 182 | |
|
183 | ZstdCompressor* compressor; | |
|
184 | ZSTD_inBuffer input; | |
|
185 | ZSTD_outBuffer output; | |
|
186 | Py_buffer inBuffer; | |
|
187 | int finished; | |
|
188 | size_t chunkSize; | |
|
189 | } ZstdCompressionChunker; | |
|
190 | ||
|
191 | extern PyTypeObject ZstdCompressionChunkerType; | |
|
192 | ||
|
193 | typedef enum { | |
|
194 | compressionchunker_mode_normal, | |
|
195 | compressionchunker_mode_flush, | |
|
196 | compressionchunker_mode_finish, | |
|
197 | } CompressionChunkerMode; | |
|
198 | ||
|
199 | typedef struct { | |
|
200 | PyObject_HEAD | |
|
201 | ||
|
202 | ZstdCompressionChunker* chunker; | |
|
203 | CompressionChunkerMode mode; | |
|
204 | } ZstdCompressionChunkerIterator; | |
|
205 | ||
|
206 | extern PyTypeObject ZstdCompressionChunkerIteratorType; | |
|
207 | ||
|
208 | typedef struct { | |
|
209 | PyObject_HEAD | |
|
210 | ||
|
184 | 211 | ZSTD_DCtx* dctx; |
|
185 | 212 | ZstdCompressionDict* dict; |
|
186 | 213 | size_t maxWindowSize; |
@@ -17,6 +17,7 b' import tempfile' | |||
|
17 | 17 | HERE = os.path.abspath(os.path.dirname(__file__)) |
|
18 | 18 | |
|
19 | 19 | SOURCES = ['zstd/%s' % p for p in ( |
|
20 | 'common/debug.c', | |
|
20 | 21 | 'common/entropy_common.c', |
|
21 | 22 | 'common/error_private.c', |
|
22 | 23 | 'common/fse_decompress.c', |
@@ -25,6 +26,7 b" SOURCES = ['zstd/%s' % p for p in (" | |||
|
25 | 26 | 'common/xxhash.c', |
|
26 | 27 | 'common/zstd_common.c', |
|
27 | 28 | 'compress/fse_compress.c', |
|
29 | 'compress/hist.c', | |
|
28 | 30 | 'compress/huf_compress.c', |
|
29 | 31 | 'compress/zstd_compress.c', |
|
30 | 32 | 'compress/zstd_double_fast.c', |
@@ -36,6 +38,7 b" SOURCES = ['zstd/%s' % p for p in (" | |||
|
36 | 38 | 'decompress/huf_decompress.c', |
|
37 | 39 | 'decompress/zstd_decompress.c', |
|
38 | 40 | 'dictBuilder/cover.c', |
|
41 | 'dictBuilder/fastcover.c', | |
|
39 | 42 | 'dictBuilder/divsufsort.c', |
|
40 | 43 | 'dictBuilder/zdict.c', |
|
41 | 44 | )] |
@@ -6,12 +6,12 b'' | |||
|
6 | 6 | |
|
7 | 7 | import distutils.ccompiler |
|
8 | 8 | import os |
|
9 | import sys | |
|
10 | 9 | |
|
11 | 10 | from distutils.extension import Extension |
|
12 | 11 | |
|
13 | 12 | |
|
14 | 13 | zstd_sources = ['zstd/%s' % p for p in ( |
|
14 | 'common/debug.c', | |
|
15 | 15 | 'common/entropy_common.c', |
|
16 | 16 | 'common/error_private.c', |
|
17 | 17 | 'common/fse_decompress.c', |
@@ -20,6 +20,7 b" zstd_sources = ['zstd/%s' % p for p in (" | |||
|
20 | 20 | 'common/xxhash.c', |
|
21 | 21 | 'common/zstd_common.c', |
|
22 | 22 | 'compress/fse_compress.c', |
|
23 | 'compress/hist.c', | |
|
23 | 24 | 'compress/huf_compress.c', |
|
24 | 25 | 'compress/zstd_compress.c', |
|
25 | 26 | 'compress/zstd_double_fast.c', |
@@ -32,6 +33,7 b" zstd_sources = ['zstd/%s' % p for p in (" | |||
|
32 | 33 | 'decompress/zstd_decompress.c', |
|
33 | 34 | 'dictBuilder/cover.c', |
|
34 | 35 | 'dictBuilder/divsufsort.c', |
|
36 | 'dictBuilder/fastcover.c', | |
|
35 | 37 | 'dictBuilder/zdict.c', |
|
36 | 38 | )] |
|
37 | 39 | |
@@ -75,6 +77,7 b' ext_sources = [' | |||
|
75 | 77 | 'c-ext/compressobj.c', |
|
76 | 78 | 'c-ext/compressor.c', |
|
77 | 79 | 'c-ext/compressoriterator.c', |
|
80 | 'c-ext/compressionchunker.c', | |
|
78 | 81 | 'c-ext/compressionparams.c', |
|
79 | 82 | 'c-ext/compressionreader.c', |
|
80 | 83 | 'c-ext/compressionwriter.c', |
@@ -93,25 +96,45 b' zstd_depends = [' | |||
|
93 | 96 | |
|
94 | 97 | |
|
95 | 98 | def get_c_extension(support_legacy=False, system_zstd=False, name='zstd', |
|
96 | warnings_as_errors=False): | |
|
97 | """Obtain a distutils.extension.Extension for the C extension.""" |

|
99 | warnings_as_errors=False, root=None): | |
|
100 | """Obtain a distutils.extension.Extension for the C extension. | |
|
101 | ||
|
102 | ``support_legacy`` controls whether to compile in legacy zstd format support. | |
|
103 | ||
|
104 | ``system_zstd`` controls whether to compile against the system zstd library. | |
|
105 | For this to work, the system zstd library and headers must match what | |
|
106 | python-zstandard is coded against exactly. | |
|
107 | ||
|
108 | ``name`` is the module name of the C extension to produce. | |
|
109 | ||
|
110 | ``warnings_as_errors`` controls whether compiler warnings are turned into | |
|
111 | compiler errors. | |
|
99 | 112 |
|
|
100 | sources = set([os.path.join(root, p) for p in ext_sources]) | |
|
113 | ``root`` defines a root path that source should be computed as relative | |
|
114 | to. This should be the directory with the main ``setup.py`` that is | |
|
115 | being invoked. If not defined, paths will be relative to this file. | |
|
116 | """ | |
|
117 | actual_root = os.path.abspath(os.path.dirname(__file__)) | |
|
118 | root = root or actual_root | |
|
119 | ||
|
120 | sources = set([os.path.join(actual_root, p) for p in ext_sources]) | |
|
101 | 121 | if not system_zstd: |
|
102 | sources.update([os.path.join(root, p) for p in zstd_sources]) | |
|
122 | sources.update([os.path.join(actual_root, p) for p in zstd_sources]) | |
|
103 | 123 | if support_legacy: |
|
104 | sources.update([os.path.join(root, p) for p in zstd_sources_legacy]) |

124 | sources.update([os.path.join(actual_root, p) | |
|
125 | for p in zstd_sources_legacy]) | |
|
105 | 126 | sources = list(sources) |
|
106 | 127 | |
|
107 | include_dirs = set([os.path.join(root, d) for d in ext_includes]) | |
|
128 | include_dirs = set([os.path.join(actual_root, d) for d in ext_includes]) | |
|
108 | 129 | if not system_zstd: |
|
109 | include_dirs.update([os.path.join(root, d) for d in zstd_includes]) |

130 | include_dirs.update([os.path.join(actual_root, d) | |
|
131 | for d in zstd_includes]) | |
|
110 | 132 | if support_legacy: |
|
111 | include_dirs.update([os.path.join(root, d) for d in zstd_includes_legacy]) |

133 | include_dirs.update([os.path.join(actual_root, d) | |
|
134 | for d in zstd_includes_legacy]) | |
|
112 | 135 | include_dirs = list(include_dirs) |
|
113 | 136 | |
|
114 | depends = [os.path.join(root, p) for p in zstd_depends] | |
|
137 | depends = [os.path.join(actual_root, p) for p in zstd_depends] | |
|
115 | 138 | |
|
116 | 139 | compiler = distutils.ccompiler.new_compiler() |
|
117 | 140 | |
@@ -152,6 +175,11 b' def get_c_extension(support_legacy=False' | |||
|
152 | 175 | |
|
153 | 176 | libraries = ['zstd'] if system_zstd else [] |
|
154 | 177 | |
|
178 | # Python 3.7 doesn't like absolute paths. So normalize to relative. | |
|
179 | sources = [os.path.relpath(p, root) for p in sources] | |
|
180 | include_dirs = [os.path.relpath(p, root) for p in include_dirs] | |
|
181 | depends = [os.path.relpath(p, root) for p in depends] | |
|
182 | ||
|
155 | 183 | # TODO compile with optimizations. |
|
156 | 184 | return Extension(name, sources, |
|
157 | 185 | include_dirs=include_dirs, |
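
The new root keyword, combined with the relative-path normalization above, lets a parent project's setup.py build the extension with paths computed relative to its own directory (sidestepping Python 3.7's dislike of absolute source paths). A hedged sketch of a caller, assuming this file is importable as setup_zstd and the vendored layout shown in the comment:

    # hypothetical setup.py in a project that vendors python-zstandard
    import os
    from setup_zstd import get_c_extension

    here = os.path.abspath(os.path.dirname(__file__))
    ext = get_c_extension(name='zstd', root=here)
    # sources/include_dirs in `ext` are emitted relative to `here`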
@@ -153,7 +153,7 b' class TestCompressor_compress(unittest.T' | |||
|
153 | 153 | no_params = zstd.get_frame_parameters(no_dict_id) |
|
154 | 154 | with_params = zstd.get_frame_parameters(with_dict_id) |
|
155 | 155 | self.assertEqual(no_params.dict_id, 0) |
|
156 | self.assertEqual(with_params.dict_id, 1

156 | self.assertEqual(with_params.dict_id, 1880053135) | |
|
157 | 157 | |
|
158 | 158 | def test_compress_dict_multiple(self): |
|
159 | 159 | samples = [] |
@@ -216,7 +216,7 b' class TestCompressor_compress(unittest.T' | |||
|
216 | 216 | self.assertEqual(params.dict_id, d.dict_id()) |
|
217 | 217 | |
|
218 | 218 | self.assertEqual(result, |
|
219 |
b'\x28\xb5\x2f\xfd\x23\x |
|
|
219 | b'\x28\xb5\x2f\xfd\x23\x8f\x55\x0f\x70\x03\x19\x00\x00' | |
|
220 | 220 | b'\x66\x6f\x6f') |
|
221 | 221 | |
|
222 | 222 | def test_multithreaded_compression_params(self): |
@@ -336,7 +336,9 b' class TestCompressor_compressobj(unittes' | |||
|
336 | 336 | b'\x28\xb5\x2f\xfd\x00\x48\x18\x00\x00foo') |
|
337 | 337 | self.assertEqual(cobj.compress(b'bar'), b'') |
|
338 | 338 | # 3 byte header plus content. |
|
339 |
self.assertEqual(cobj.flush(), |
|
|
339 | self.assertEqual(cobj.flush(zstd.COMPRESSOBJ_FLUSH_BLOCK), | |
|
340 | b'\x18\x00\x00bar') | |
|
341 | self.assertEqual(cobj.flush(), b'\x01\x00\x00') | |
|
340 | 342 | |
|
341 | 343 | def test_flush_empty_block(self): |
|
342 | 344 | cctx = zstd.ZstdCompressor(write_checksum=True) |
@@ -576,15 +578,23 b' class TestCompressor_stream_reader(unitt' | |||
|
576 | 578 | def test_context_manager(self): |
|
577 | 579 | cctx = zstd.ZstdCompressor() |
|
578 | 580 | |
|
579 | reader = cctx.stream_reader(b'foo' * 60) | |
|
580 | with self.assertRaisesRegexp(zstd.ZstdError, 'read\(\) must be called from an active'): | |
|
581 | reader.read(10) | |
|
582 | ||
|
583 | 581 | with cctx.stream_reader(b'foo') as reader: |
|
584 | 582 | with self.assertRaisesRegexp(ValueError, 'cannot __enter__ multiple times'): |
|
585 | 583 | with reader as reader2: |
|
586 | 584 | pass |
|
587 | 585 | |
|
586 | def test_no_context_manager(self): | |
|
587 | cctx = zstd.ZstdCompressor() | |
|
588 | ||
|
589 | reader = cctx.stream_reader(b'foo') | |
|
590 | reader.read(4) | |
|
591 | self.assertFalse(reader.closed) | |
|
592 | ||
|
593 | reader.close() | |
|
594 | self.assertTrue(reader.closed) | |
|
595 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): | |
|
596 | reader.read(1) | |
|
597 | ||
|
588 | 598 | def test_not_implemented(self): |
|
589 | 599 | cctx = zstd.ZstdCompressor() |
|
590 | 600 | |
@@ -619,13 +629,18 b' class TestCompressor_stream_reader(unitt' | |||
|
619 | 629 | self.assertFalse(reader.writable()) |
|
620 | 630 | self.assertFalse(reader.seekable()) |
|
621 | 631 | self.assertFalse(reader.isatty()) |
|
632 | self.assertFalse(reader.closed) | |
|
622 | 633 | self.assertIsNone(reader.flush()) |
|
634 | self.assertFalse(reader.closed) | |
|
635 | ||
|
636 | self.assertTrue(reader.closed) | |
|
623 | 637 | |
|
624 | 638 | def test_read_closed(self): |
|
625 | 639 | cctx = zstd.ZstdCompressor() |
|
626 | 640 | |
|
627 | 641 | with cctx.stream_reader(b'foo' * 60) as reader: |
|
628 | 642 | reader.close() |
|
643 | self.assertTrue(reader.closed) | |
|
629 | 644 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): |
|
630 | 645 | reader.read(10) |
|
631 | 646 | |
@@ -715,7 +730,7 b' class TestCompressor_stream_reader(unitt' | |||
|
715 | 730 | while reader.read(8192): |
|
716 | 731 | pass |
|
717 | 732 | |
|
718 | with self.assertRaisesRegexp(zstd.ZstdError, 'read\(\) must be called from an active'): |

733 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): | |
|
719 | 734 | reader.read(10) |
|
720 | 735 | |
|
721 | 736 | def test_bad_size(self): |
@@ -792,7 +807,7 b' class TestCompressor_stream_writer(unitt' | |||
|
792 | 807 | d = zstd.train_dictionary(8192, samples) |
|
793 | 808 | |
|
794 | 809 | h = hashlib.sha1(d.as_bytes()).hexdigest() |
|
795 | self.assertEqual(h, '3040faa0ddc37d50e71a4dd28052cb8db5d9d027') | |
|
810 | self.assertEqual(h, '2b3b6428da5bf2c9cc9d4bb58ba0bc5990dd0e79') | |
|
796 | 811 | |
|
797 | 812 | buffer = io.BytesIO() |
|
798 | 813 | cctx = zstd.ZstdCompressor(level=9, dict_data=d) |
@@ -808,9 +823,16 b' class TestCompressor_stream_writer(unitt' | |||
|
808 | 823 | self.assertEqual(params.window_size, 2097152) |
|
809 | 824 | self.assertEqual(params.dict_id, d.dict_id()) |
|
810 | 825 | self.assertFalse(params.has_checksum) |
|
811 | self.assertEqual(compressed, | |
|
812 | b'\x28\xb5\x2f\xfd\x03\x58\x06\x59\xb5\x52\x5d\x00' | |
|
813 | b'\x00\x00\x02\xfc\x3d\x3f\xd9\xb0\x51\x03\x45\x89') | |
|
826 | ||
|
827 | h = hashlib.sha1(compressed).hexdigest() | |
|
828 | self.assertEqual(h, '23f88344263678478f5f82298e0a5d1833125786') | |
|
829 | ||
|
830 | source = b'foo' + b'bar' + (b'foo' * 16384) | |
|
831 | ||
|
832 | dctx = zstd.ZstdDecompressor(dict_data=d) | |
|
833 | ||
|
834 | self.assertEqual(dctx.decompress(compressed, max_output_size=len(source)), | |
|
835 | source) | |
|
814 | 836 | |
|
815 | 837 | def test_compression_params(self): |
|
816 | 838 | params = zstd.ZstdCompressionParameters( |
@@ -1157,6 +1179,181 b' class TestCompressor_read_to_iter(unitte' | |||
|
1157 | 1179 | b''.join(cctx.read_to_iter(source)) |
|
1158 | 1180 | |
|
1159 | 1181 | |
|
1182 | @make_cffi | |
|
1183 | class TestCompressor_chunker(unittest.TestCase): | |
|
1184 | def test_empty(self): | |
|
1185 | cctx = zstd.ZstdCompressor(write_content_size=False) | |
|
1186 | chunker = cctx.chunker() | |
|
1187 | ||
|
1188 | it = chunker.compress(b'') | |
|
1189 | ||
|
1190 | with self.assertRaises(StopIteration): | |
|
1191 | next(it) | |
|
1192 | ||
|
1193 | it = chunker.finish() | |
|
1194 | ||
|
1195 | self.assertEqual(next(it), b'\x28\xb5\x2f\xfd\x00\x50\x01\x00\x00') | |
|
1196 | ||
|
1197 | with self.assertRaises(StopIteration): | |
|
1198 | next(it) | |
|
1199 | ||
|
1200 | def test_simple_input(self): | |
|
1201 | cctx = zstd.ZstdCompressor() | |
|
1202 | chunker = cctx.chunker() | |
|
1203 | ||
|
1204 | it = chunker.compress(b'foobar') | |
|
1205 | ||
|
1206 | with self.assertRaises(StopIteration): | |
|
1207 | next(it) | |
|
1208 | ||
|
1209 | it = chunker.compress(b'baz' * 30) | |
|
1210 | ||
|
1211 | with self.assertRaises(StopIteration): | |
|
1212 | next(it) | |
|
1213 | ||
|
1214 | it = chunker.finish() | |
|
1215 | ||
|
1216 | self.assertEqual(next(it), | |
|
1217 | b'\x28\xb5\x2f\xfd\x00\x50\x7d\x00\x00\x48\x66\x6f' | |
|
1218 | b'\x6f\x62\x61\x72\x62\x61\x7a\x01\x00\xe4\xe4\x8e') | |
|
1219 | ||
|
1220 | with self.assertRaises(StopIteration): | |
|
1221 | next(it) | |
|
1222 | ||
|
1223 | def test_input_size(self): | |
|
1224 | cctx = zstd.ZstdCompressor() | |
|
1225 | chunker = cctx.chunker(size=1024) | |
|
1226 | ||
|
1227 | it = chunker.compress(b'x' * 1000) | |
|
1228 | ||
|
1229 | with self.assertRaises(StopIteration): | |
|
1230 | next(it) | |
|
1231 | ||
|
1232 | it = chunker.compress(b'y' * 24) | |
|
1233 | ||
|
1234 | with self.assertRaises(StopIteration): | |
|
1235 | next(it) | |
|
1236 | ||
|
1237 | chunks = list(chunker.finish()) | |
|
1238 | ||
|
1239 | self.assertEqual(chunks, [ | |
|
1240 | b'\x28\xb5\x2f\xfd\x60\x00\x03\x65\x00\x00\x18\x78\x78\x79\x02\x00' | |
|
1241 | b'\xa0\x16\xe3\x2b\x80\x05' | |
|
1242 | ]) | |
|
1243 | ||
|
1244 | dctx = zstd.ZstdDecompressor() | |
|
1245 | ||
|
1246 | self.assertEqual(dctx.decompress(b''.join(chunks)), | |
|
1247 | (b'x' * 1000) + (b'y' * 24)) | |
|
1248 | ||
|
1249 | def test_small_chunk_size(self): | |
|
1250 | cctx = zstd.ZstdCompressor() | |
|
1251 | chunker = cctx.chunker(chunk_size=1) | |
|
1252 | ||
|
1253 | chunks = list(chunker.compress(b'foo' * 1024)) | |
|
1254 | self.assertEqual(chunks, []) | |
|
1255 | ||
|
1256 | chunks = list(chunker.finish()) | |
|
1257 | self.assertTrue(all(len(chunk) == 1 for chunk in chunks)) | |
|
1258 | ||
|
1259 | self.assertEqual( | |
|
1260 | b''.join(chunks), | |
|
1261 | b'\x28\xb5\x2f\xfd\x00\x50\x55\x00\x00\x18\x66\x6f\x6f\x01\x00' | |
|
1262 | b'\xfa\xd3\x77\x43') | |
|
1263 | ||
|
1264 | dctx = zstd.ZstdDecompressor() | |
|
1265 | self.assertEqual(dctx.decompress(b''.join(chunks), | |
|
1266 | max_output_size=10000), | |
|
1267 | b'foo' * 1024) | |
|
1268 | ||
|
1269 | def test_input_types(self): | |
|
1270 | cctx = zstd.ZstdCompressor() | |
|
1271 | ||
|
1272 | mutable_array = bytearray(3) | |
|
1273 | mutable_array[:] = b'foo' | |
|
1274 | ||
|
1275 | sources = [ | |
|
1276 | memoryview(b'foo'), | |
|
1277 | bytearray(b'foo'), | |
|
1278 | mutable_array, | |
|
1279 | ] | |
|
1280 | ||
|
1281 | for source in sources: | |
|
1282 | chunker = cctx.chunker() | |
|
1283 | ||
|
1284 | self.assertEqual(list(chunker.compress(source)), []) | |
|
1285 | self.assertEqual(list(chunker.finish()), [ | |
|
1286 | b'\x28\xb5\x2f\xfd\x00\x50\x19\x00\x00\x66\x6f\x6f' | |
|
1287 | ]) | |
|
1288 | ||
|
1289 | def test_flush(self): | |
|
1290 | cctx = zstd.ZstdCompressor() | |
|
1291 | chunker = cctx.chunker() | |
|
1292 | ||
|
1293 | self.assertEqual(list(chunker.compress(b'foo' * 1024)), []) | |
|
1294 | self.assertEqual(list(chunker.compress(b'bar' * 1024)), []) | |
|
1295 | ||
|
1296 | chunks1 = list(chunker.flush()) | |
|
1297 | ||
|
1298 | self.assertEqual(chunks1, [ | |
|
1299 | b'\x28\xb5\x2f\xfd\x00\x50\x8c\x00\x00\x30\x66\x6f\x6f\x62\x61\x72' | |
|
1300 | b'\x02\x00\xfa\x03\xfe\xd0\x9f\xbe\x1b\x02' | |
|
1301 | ]) | |
|
1302 | ||
|
1303 | self.assertEqual(list(chunker.flush()), []) | |
|
1304 | self.assertEqual(list(chunker.flush()), []) | |
|
1305 | ||
|
1306 | self.assertEqual(list(chunker.compress(b'baz' * 1024)), []) | |
|
1307 | ||
|
1308 | chunks2 = list(chunker.flush()) | |
|
1309 | self.assertEqual(len(chunks2), 1) | |
|
1310 | ||
|
1311 | chunks3 = list(chunker.finish()) | |
|
1312 | self.assertEqual(len(chunks3), 1) |
|
1313 | ||
|
1314 | dctx = zstd.ZstdDecompressor() | |
|
1315 | ||
|
1316 | self.assertEqual(dctx.decompress(b''.join(chunks1 + chunks2 + chunks3), | |
|
1317 | max_output_size=10000), | |
|
1318 | (b'foo' * 1024) + (b'bar' * 1024) + (b'baz' * 1024)) | |
|
1319 | ||
|
1320 | def test_compress_after_finish(self): | |
|
1321 | cctx = zstd.ZstdCompressor() | |
|
1322 | chunker = cctx.chunker() | |
|
1323 | ||
|
1324 | list(chunker.compress(b'foo')) | |
|
1325 | list(chunker.finish()) | |
|
1326 | ||
|
1327 | with self.assertRaisesRegexp( | |
|
1328 | zstd.ZstdError, | |
|
1329 | 'cannot call compress\(\) after compression finished'): | |
|
1330 | list(chunker.compress(b'foo')) | |
|
1331 | ||
|
1332 | def test_flush_after_finish(self): | |
|
1333 | cctx = zstd.ZstdCompressor() | |
|
1334 | chunker = cctx.chunker() | |
|
1335 | ||
|
1336 | list(chunker.compress(b'foo')) | |
|
1337 | list(chunker.finish()) | |
|
1338 | ||
|
1339 | with self.assertRaisesRegexp( | |
|
1340 | zstd.ZstdError, | |
|
1341 | 'cannot call flush\(\) after compression finished'): | |
|
1342 | list(chunker.flush()) | |
|
1343 | ||
|
1344 | def test_finish_after_finish(self): | |
|
1345 | cctx = zstd.ZstdCompressor() | |
|
1346 | chunker = cctx.chunker() | |
|
1347 | ||
|
1348 | list(chunker.compress(b'foo')) | |
|
1349 | list(chunker.finish()) | |
|
1350 | ||
|
1351 | with self.assertRaisesRegexp( | |
|
1352 | zstd.ZstdError, | |
|
1353 | 'cannot call finish\(\) after compression finished'): | |
|
1354 | list(chunker.finish()) | |
|
1355 | ||
|
1356 | ||
|
1160 | 1357 | class TestCompressor_multi_compress_to_buffer(unittest.TestCase): |
|
1161 | 1358 | def test_invalid_inputs(self): |
|
1162 | 1359 | cctx = zstd.ZstdCompressor() |
@@ -135,6 +135,51 b' class TestCompressor_compressobj_fuzzing' | |||
|
135 | 135 | |
|
136 | 136 | self.assertEqual(b''.join(chunks), ref_frame) |
|
137 | 137 | |
|
138 | @hypothesis.settings( | |
|
139 | suppress_health_check=[hypothesis.HealthCheck.large_base_example]) | |
|
140 | @hypothesis.given(original=strategies.sampled_from(random_input_data()), | |
|
141 | level=strategies.integers(min_value=1, max_value=5), | |
|
142 | chunk_sizes=strategies.data(), | |
|
143 | flushes=strategies.data()) | |
|
144 | def test_flush_block(self, original, level, chunk_sizes, flushes): | |
|
145 | cctx = zstd.ZstdCompressor(level=level) | |
|
146 | cobj = cctx.compressobj() | |
|
147 | ||
|
148 | dctx = zstd.ZstdDecompressor() | |
|
149 | dobj = dctx.decompressobj() | |
|
150 | ||
|
151 | compressed_chunks = [] | |
|
152 | decompressed_chunks = [] | |
|
153 | i = 0 | |
|
154 | while True: | |
|
155 | input_size = chunk_sizes.draw(strategies.integers(1, 4096)) | |
|
156 | source = original[i:i + input_size] | |
|
157 | if not source: | |
|
158 | break | |
|
159 | ||
|
160 | i += input_size | |
|
161 | ||
|
162 | chunk = cobj.compress(source) | |
|
163 | compressed_chunks.append(chunk) | |
|
164 | decompressed_chunks.append(dobj.decompress(chunk)) | |
|
165 | ||
|
166 | if not flushes.draw(strategies.booleans()): | |
|
167 | continue | |
|
168 | ||
|
169 | chunk = cobj.flush(zstd.COMPRESSOBJ_FLUSH_BLOCK) | |
|
170 | compressed_chunks.append(chunk) | |
|
171 | decompressed_chunks.append(dobj.decompress(chunk)) | |
|
172 | ||
|
173 | self.assertEqual(b''.join(decompressed_chunks), original[0:i]) | |
|
174 | ||
|
175 | chunk = cobj.flush(zstd.COMPRESSOBJ_FLUSH_FINISH) | |
|
176 | compressed_chunks.append(chunk) | |
|
177 | decompressed_chunks.append(dobj.decompress(chunk)) | |
|
178 | ||
|
179 | self.assertEqual(dctx.decompress(b''.join(compressed_chunks), | |
|
180 | max_output_size=len(original)), | |
|
181 | original) | |
|
182 | self.assertEqual(b''.join(decompressed_chunks), original) | |
|
138 | 183 | |
|
139 | 184 | @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set') |
|
140 | 185 | @make_cffi |
@@ -186,3 +231,90 b' class TestCompressor_multi_compress_to_b' | |||
|
186 | 231 | |
|
187 | 232 | for i, frame in enumerate(result): |
|
188 | 233 | self.assertEqual(dctx.decompress(frame), original[i]) |
|
234 | ||
|
235 | ||
|
236 | @unittest.skipUnless('ZSTD_SLOW_TESTS' in os.environ, 'ZSTD_SLOW_TESTS not set') | |
|
237 | @make_cffi | |
|
238 | class TestCompressor_chunker_fuzzing(unittest.TestCase): | |
|
239 | @hypothesis.settings( | |
|
240 | suppress_health_check=[hypothesis.HealthCheck.large_base_example]) | |
|
241 | @hypothesis.given(original=strategies.sampled_from(random_input_data()), | |
|
242 | level=strategies.integers(min_value=1, max_value=5), | |
|
243 | chunk_size=strategies.integers( | |
|
244 | min_value=1, | |
|
245 | max_value=32 * 1048576), | |
|
246 | input_sizes=strategies.data()) | |
|
247 | def test_random_input_sizes(self, original, level, chunk_size, input_sizes): | |
|
248 | cctx = zstd.ZstdCompressor(level=level) | |
|
249 | chunker = cctx.chunker(chunk_size=chunk_size) | |
|
250 | ||
|
251 | chunks = [] | |
|
252 | i = 0 | |
|
253 | while True: | |
|
254 | input_size = input_sizes.draw(strategies.integers(1, 4096)) | |
|
255 | source = original[i:i + input_size] | |
|
256 | if not source: | |
|
257 | break | |
|
258 | ||
|
259 | chunks.extend(chunker.compress(source)) | |
|
260 | i += input_size | |
|
261 | ||
|
262 | chunks.extend(chunker.finish()) | |
|
263 | ||
|
264 | dctx = zstd.ZstdDecompressor() | |
|
265 | ||
|
266 | self.assertEqual(dctx.decompress(b''.join(chunks), | |
|
267 | max_output_size=len(original)), | |
|
268 | original) | |
|
269 | ||
|
270 | self.assertTrue(all(len(chunk) == chunk_size for chunk in chunks[:-1])) | |
|
271 | ||
|
272 | @hypothesis.settings( | |
|
273 | suppress_health_check=[hypothesis.HealthCheck.large_base_example]) | |
|
274 | @hypothesis.given(original=strategies.sampled_from(random_input_data()), | |
|
275 | level=strategies.integers(min_value=1, max_value=5), | |
|
276 | chunk_size=strategies.integers( | |
|
277 | min_value=1, | |
|
278 | max_value=32 * 1048576), | |
|
279 | input_sizes=strategies.data(), | |
|
280 | flushes=strategies.data()) | |
|
281 | def test_flush_block(self, original, level, chunk_size, input_sizes, | |
|
282 | flushes): | |
|
283 | cctx = zstd.ZstdCompressor(level=level) | |
|
284 | chunker = cctx.chunker(chunk_size=chunk_size) | |
|
285 | ||
|
286 | dctx = zstd.ZstdDecompressor() | |
|
287 | dobj = dctx.decompressobj() | |
|
288 | ||
|
289 | compressed_chunks = [] | |
|
290 | decompressed_chunks = [] | |
|
291 | i = 0 | |
|
292 | while True: | |
|
293 | input_size = input_sizes.draw(strategies.integers(1, 4096)) | |
|
294 | source = original[i:i + input_size] | |
|
295 | if not source: | |
|
296 | break | |
|
297 | ||
|
298 | i += input_size | |
|
299 | ||
|
300 | chunks = list(chunker.compress(source)) | |
|
301 | compressed_chunks.extend(chunks) | |
|
302 | decompressed_chunks.append(dobj.decompress(b''.join(chunks))) | |
|
303 | ||
|
304 | if not flushes.draw(strategies.booleans()): | |
|
305 | continue | |
|
306 | ||
|
307 | chunks = list(chunker.flush()) | |
|
308 | compressed_chunks.extend(chunks) | |
|
309 | decompressed_chunks.append(dobj.decompress(b''.join(chunks))) | |
|
310 | ||
|
311 | self.assertEqual(b''.join(decompressed_chunks), original[0:i]) | |
|
312 | ||
|
313 | chunks = list(chunker.finish()) | |
|
314 | compressed_chunks.extend(chunks) | |
|
315 | decompressed_chunks.append(dobj.decompress(b''.join(chunks))) | |
|
316 | ||
|
317 | self.assertEqual(dctx.decompress(b''.join(compressed_chunks), | |
|
318 | max_output_size=len(original)), | |
|
319 | original) | |
|
320 | self.assertEqual(b''.join(decompressed_chunks), original) |
\ No newline at end of file
@@ -24,6 +24,7 b' class TestCompressionParameters(unittest' | |||
|
24 | 24 | hash_log=zstd.HASHLOG_MAX, |
|
25 | 25 | search_log=zstd.SEARCHLOG_MAX, |
|
26 | 26 | min_match=zstd.SEARCHLENGTH_MAX - 1, |
|
27 | target_length=zstd.TARGETLENGTH_MAX, | |
|
27 | 28 | compression_strategy=zstd.STRATEGY_BTULTRA) |
|
28 | 29 | |
|
29 | 30 | def test_from_level(self): |
@@ -34,7 +35,6 b' class TestCompressionParameters(unittest' | |||
|
34 | 35 | |
|
35 | 36 | p = zstd.ZstdCompressionParameters.from_level(-4) |
|
36 | 37 | self.assertEqual(p.window_log, 19) |
|
37 | self.assertEqual(p.compress_literals, 0) | |
|
38 | 38 | |
|
39 | 39 | def test_members(self): |
|
40 | 40 | p = zstd.ZstdCompressionParameters(window_log=10, |
@@ -64,19 +64,11 b' class TestCompressionParameters(unittest' | |||
|
64 | 64 | self.assertEqual(p.job_size, 1048576) |
|
65 | 65 | self.assertEqual(p.overlap_size_log, 6) |
|
66 | 66 | |
|
67 | p = zstd.ZstdCompressionParameters(compression_level=2) | |
|
68 | self.assertEqual(p.compress_literals, 1) | |
|
69 | ||
|
70 | p = zstd.ZstdCompressionParameters(compress_literals=False) | |
|
71 | self.assertEqual(p.compress_literals, 0) | |
|
72 | ||
|
73 | 67 | p = zstd.ZstdCompressionParameters(compression_level=-1) |
|
74 | 68 | self.assertEqual(p.compression_level, -1) |
|
75 | self.assertEqual(p.compress_literals, 0) | |
|
76 | 69 | |
|
77 | p = zstd.ZstdCompressionParameters(compression_level=-2, compress_literals=True) |

70 | p = zstd.ZstdCompressionParameters(compression_level=-2) | |
|
78 | 71 | self.assertEqual(p.compression_level, -2) |
|
79 | self.assertEqual(p.compress_literals, 1) | |
|
80 | 72 | |
|
81 | 73 | p = zstd.ZstdCompressionParameters(force_max_window=True) |
|
82 | 74 | self.assertEqual(p.force_max_window, 1) |
@@ -27,7 +27,7 b' s_searchlog = strategies.integers(min_va' | |||
|
27 | 27 | s_searchlength = strategies.integers(min_value=zstd.SEARCHLENGTH_MIN, |
|
28 | 28 | max_value=zstd.SEARCHLENGTH_MAX) |
|
29 | 29 | s_targetlength = strategies.integers(min_value=zstd.TARGETLENGTH_MIN, |
|
30 | max_value=

30 | max_value=zstd.TARGETLENGTH_MAX) | |
|
31 | 31 | s_strategy = strategies.sampled_from((zstd.STRATEGY_FAST, |
|
32 | 32 | zstd.STRATEGY_DFAST, |
|
33 | 33 | zstd.STRATEGY_GREEDY, |
@@ -293,10 +293,6 b' class TestDecompressor_stream_reader(uni' | |||
|
293 | 293 | def test_context_manager(self): |
|
294 | 294 | dctx = zstd.ZstdDecompressor() |
|
295 | 295 | |
|
296 | reader = dctx.stream_reader(b'foo') | |
|
297 | with self.assertRaisesRegexp(zstd.ZstdError, 'read\(\) must be called from an active'): | |
|
298 | reader.read(1) | |
|
299 | ||
|
300 | 296 | with dctx.stream_reader(b'foo') as reader: |
|
301 | 297 | with self.assertRaisesRegexp(ValueError, 'cannot __enter__ multiple times'): |
|
302 | 298 | with reader as reader2: |
@@ -331,17 +327,23 b' class TestDecompressor_stream_reader(uni' | |||
|
331 | 327 | dctx = zstd.ZstdDecompressor() |
|
332 | 328 | |
|
333 | 329 | with dctx.stream_reader(b'foo') as reader: |
|
330 | self.assertFalse(reader.closed) | |
|
334 | 331 | self.assertTrue(reader.readable()) |
|
335 | 332 | self.assertFalse(reader.writable()) |
|
336 | 333 | self.assertTrue(reader.seekable()) |
|
337 | 334 | self.assertFalse(reader.isatty()) |
|
335 | self.assertFalse(reader.closed) | |
|
338 | 336 | self.assertIsNone(reader.flush()) |
|
337 | self.assertFalse(reader.closed) | |
|
338 | ||
|
339 | self.assertTrue(reader.closed) | |
|
339 | 340 | |
|
340 | 341 | def test_read_closed(self): |
|
341 | 342 | dctx = zstd.ZstdDecompressor() |
|
342 | 343 | |
|
343 | 344 | with dctx.stream_reader(b'foo') as reader: |
|
344 | 345 | reader.close() |
|
346 | self.assertTrue(reader.closed) | |
|
345 | 347 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): |
|
346 | 348 | reader.read(1) |
|
347 | 349 | |
@@ -372,10 +374,10 b' class TestDecompressor_stream_reader(uni' | |||
|
372 | 374 | self.assertEqual(reader.tell(), len(source)) |
|
373 | 375 | |
|
374 | 376 | # Read after EOF should return empty bytes. |
|
375 | self.assertEqual(reader.read(), b'') | |
|
377 | self.assertEqual(reader.read(1), b'') | |
|
376 | 378 | self.assertEqual(reader.tell(), len(result)) |
|
377 | 379 | |
|
378 | self.assertTrue(reader.closed) |

380 | self.assertTrue(reader.closed) | |
|
379 | 381 | |
|
380 | 382 | def test_read_buffer_small_chunks(self): |
|
381 | 383 | cctx = zstd.ZstdCompressor() |
@@ -408,8 +410,11 b' class TestDecompressor_stream_reader(uni' | |||
|
408 | 410 | chunk = reader.read(8192) |
|
409 | 411 | self.assertEqual(chunk, source) |
|
410 | 412 | self.assertEqual(reader.tell(), len(source)) |
|
411 | self.assertEqual(reader.read(), b'') | |
|
413 | self.assertEqual(reader.read(1), b'') | |
|
412 | 414 | self.assertEqual(reader.tell(), len(source)) |
|
415 | self.assertFalse(reader.closed) | |
|
416 | ||
|
417 | self.assertTrue(reader.closed) | |
|
413 | 418 | |
|
414 | 419 | def test_read_stream_small_chunks(self): |
|
415 | 420 | cctx = zstd.ZstdCompressor() |
@@ -440,7 +445,9 b' class TestDecompressor_stream_reader(uni' | |||
|
440 | 445 | while reader.read(16): |
|
441 | 446 | pass |
|
442 | 447 | |
|
443 | with self.assertRaisesRegexp(zstd.ZstdError, 'read\(\) must be called from an active'): | |
|
448 | self.assertTrue(reader.closed) | |
|
449 | ||
|
450 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): | |
|
444 | 451 | reader.read(10) |
|
445 | 452 | |
|
446 | 453 | def test_illegal_seeks(self): |
@@ -474,8 +481,7 b' class TestDecompressor_stream_reader(uni' | |||
|
474 | 481 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): |
|
475 | 482 | reader.seek(4, os.SEEK_SET) |
|
476 | 483 | |
|
477 | with self.assertRaisesRegexp( | |
|
478 | zstd.ZstdError, 'seek\(\) must be called from an active context'): | |
|
484 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): | |
|
479 | 485 | reader.seek(0) |
|
480 | 486 | |
|
481 | 487 | def test_seek(self): |
@@ -492,6 +498,39 b' class TestDecompressor_stream_reader(uni' | |||
|
492 | 498 | reader.seek(4, os.SEEK_CUR) |
|
493 | 499 | self.assertEqual(reader.read(2), b'ar') |
|
494 | 500 | |
|
501 | def test_no_context_manager(self): | |
|
502 | source = b'foobar' * 60 | |
|
503 | cctx = zstd.ZstdCompressor() | |
|
504 | frame = cctx.compress(source) | |
|
505 | ||
|
506 | dctx = zstd.ZstdDecompressor() | |
|
507 | reader = dctx.stream_reader(frame) | |
|
508 | ||
|
509 | self.assertEqual(reader.read(6), b'foobar') | |
|
510 | self.assertEqual(reader.read(18), b'foobar' * 3) | |
|
511 | self.assertFalse(reader.closed) | |
|
512 | ||
|
513 | # Calling close prevents subsequent use. | |
|
514 | reader.close() | |
|
515 | self.assertTrue(reader.closed) | |
|
516 | ||
|
517 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): | |
|
518 | reader.read(6) | |
|
519 | ||
|
520 | def test_read_after_error(self): | |
|
521 | source = io.BytesIO(b'') | |
|
522 | dctx = zstd.ZstdDecompressor() | |
|
523 | ||
|
524 | reader = dctx.stream_reader(source) | |
|
525 | ||
|
526 | with reader: | |
|
527 | with self.assertRaises(TypeError): | |
|
528 | reader.read() | |
|
529 | ||
|
530 | with reader: | |
|
531 | with self.assertRaisesRegexp(ValueError, 'stream is closed'): | |
|
532 | reader.read(100) | |
|
533 | ||
|
495 | 534 | |
|
496 | 535 | @make_cffi |
|
497 | 536 | class TestDecompressor_decompressobj(unittest.TestCase): |
@@ -12,7 +12,9 b' from . common import (' | |||
|
12 | 12 | @make_cffi |
|
13 | 13 | class TestModuleAttributes(unittest.TestCase): |
|
14 | 14 | def test_version(self): |
|
15 | self.assertEqual(zstd.ZSTD_VERSION, (1, 3, 4)) |

15 | self.assertEqual(zstd.ZSTD_VERSION, (1, 3, 6)) | |
|
16 | ||
|
17 | self.assertEqual(zstd.__version__, '0.10.1') | |
|
16 | 18 | |
|
17 | 19 | def test_constants(self): |
|
18 | 20 | self.assertEqual(zstd.MAX_COMPRESSION_LEVEL, 22) |
@@ -27,6 +29,8 b' class TestModuleAttributes(unittest.Test' | |||
|
27 | 29 | 'DECOMPRESSION_RECOMMENDED_INPUT_SIZE', |
|
28 | 30 | 'DECOMPRESSION_RECOMMENDED_OUTPUT_SIZE', |
|
29 | 31 | 'MAGIC_NUMBER', |
|
32 | 'BLOCKSIZELOG_MAX', | |
|
33 | 'BLOCKSIZE_MAX', | |
|
30 | 34 | 'WINDOWLOG_MIN', |
|
31 | 35 | 'WINDOWLOG_MAX', |
|
32 | 36 | 'CHAINLOG_MIN', |
@@ -39,6 +43,7 b' class TestModuleAttributes(unittest.Test' | |||
|
39 | 43 | 'SEARCHLENGTH_MIN', |
|
40 | 44 | 'SEARCHLENGTH_MAX', |
|
41 | 45 | 'TARGETLENGTH_MIN', |
|
46 | 'TARGETLENGTH_MAX', | |
|
42 | 47 | 'LDM_MINMATCH_MIN', |
|
43 | 48 | 'LDM_MINMATCH_MAX', |
|
44 | 49 | 'LDM_BUCKETSIZELOG_MAX', |
@@ -57,7 +57,8 b' class TestTrainDictionary(unittest.TestC' | |||
|
57 | 57 | d = zstd.train_dictionary(8192, generate_samples(), threads=-1, steps=1, |
|
58 | 58 | d=16) |
|
59 | 59 | |
|
60 | self.assertEqual(d.k, 50) | |
|
60 | # This varies by platform. | |
|
61 | self.assertIn(d.k, (50, 2000)) | |
|
61 | 62 | self.assertEqual(d.d, 16) |
|
62 | 63 | |
|
63 | 64 | @make_cffi |
@@ -60,3 +60,6 b" elif _module_policy == 'cffi':" | |||
|
60 | 60 | else: |
|
61 | 61 | raise ImportError('unknown module import policy: %s; use default, cffi_fallback, ' |
|
62 | 62 | 'cext, or cffi' % _module_policy) |
|
63 | ||
|
64 | # Keep this in sync with python-zstandard.h. | |
|
65 | __version__ = '0.10.1' |
@@ -182,6 +182,7 b' void compressobj_module_init(PyObject* m' | |||
|
182 | 182 | void compressor_module_init(PyObject* mod); |
|
183 | 183 | void compressionparams_module_init(PyObject* mod); |
|
184 | 184 | void constants_module_init(PyObject* mod); |
|
185 | void compressionchunker_module_init(PyObject* mod); | |
|
185 | 186 | void compressiondict_module_init(PyObject* mod); |
|
186 | 187 | void compressionreader_module_init(PyObject* mod); |
|
187 | 188 | void compressionwriter_module_init(PyObject* mod); |
@@ -209,7 +210,7 b' void zstd_module_init(PyObject* m) {' | |||
|
209 | 210 | We detect this mismatch here and refuse to load the module if this |
|
210 | 211 | scenario is detected. |
|
211 | 212 | */ |
|
212 |
if (ZSTD_VERSION_NUMBER != 1030 |
|
|
213 | if (ZSTD_VERSION_NUMBER != 10306 || ZSTD_versionNumber() != 10306) { | |
|
213 | 214 | PyErr_SetString(PyExc_ImportError, "zstd C API mismatch; Python bindings not compiled against expected zstd version"); |
|
214 | 215 | return; |
|
215 | 216 | } |
@@ -219,6 +220,7 b' void zstd_module_init(PyObject* m) {' | |||
|
219 | 220 | compressiondict_module_init(m); |
|
220 | 221 | compressobj_module_init(m); |
|
221 | 222 | compressor_module_init(m); |
|
223 | compressionchunker_module_init(m); | |
|
222 | 224 | compressionreader_module_init(m); |
|
223 | 225 | compressionwriter_module_init(m); |
|
224 | 226 | compressoriterator_module_init(m); |
@@ -1,8 +1,7 b'' | |||
|
1 | 1 | /* ****************************************************************** |
|
2 | 2 | bitstream |
|
3 | 3 | Part of FSE library |
|
4 | header file (to include) | |
|
5 | Copyright (C) 2013-2017, Yann Collet. | |
|
4 | Copyright (C) 2013-present, Yann Collet. | |
|
6 | 5 | |
|
7 | 6 | BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) |
|
8 | 7 | |
@@ -49,21 +48,10 b' extern "C" {' | |||
|
49 | 48 | * Dependencies |
|
50 | 49 | ******************************************/ |
|
51 | 50 | #include "mem.h" /* unaligned access routines */ |
|
51 | #include "debug.h" /* assert(), DEBUGLOG(), RAWLOG() */ | |
|
52 | 52 | #include "error_private.h" /* error codes and messages */ |
|
53 | 53 | |
|
54 | 54 | |
|
55 | /*-************************************* | |
|
56 | * Debug | |
|
57 | ***************************************/ | |
|
58 | #if defined(BIT_DEBUG) && (BIT_DEBUG>=1) | |
|
59 | # include <assert.h> | |
|
60 | #else | |
|
61 | # ifndef assert | |
|
62 | # define assert(condition) ((void)0) | |
|
63 | # endif | |
|
64 | #endif | |
|
65 | ||
|
66 | ||
|
67 | 55 | /*========================================= |
|
68 | 56 | * Target specific |
|
69 | 57 | =========================================*/ |
@@ -83,8 +71,7 b' extern "C" {' | |||
|
83 | 71 | * A critical property of these streams is that they encode and decode in **reverse** direction. |
|
84 | 72 | * So the first bit sequence you add will be the last to be read, like a LIFO stack. |
|
85 | 73 | */ |
|
86 | typedef struct | |
|
87 | { | |
|
74 | typedef struct { | |
|
88 | 75 | size_t bitContainer; |
|
89 | 76 | unsigned bitPos; |
|
90 | 77 | char* startPtr; |
@@ -118,8 +105,7 b' MEM_STATIC size_t BIT_closeCStream(BIT_C' | |||
|
118 | 105 | /*-******************************************** |
|
119 | 106 | * bitStream decoding API (read backward) |
|
120 | 107 | **********************************************/ |
|
121 | typedef struct | |
|
122 | { | |
|
108 | typedef struct { | |
|
123 | 109 | size_t bitContainer; |
|
124 | 110 | unsigned bitsConsumed; |
|
125 | 111 | const char* ptr; |
@@ -236,7 +222,8 b' MEM_STATIC void BIT_addBits(BIT_CStream_' | |||
|
236 | 222 | } |
|
237 | 223 | |
|
238 | 224 | /*! BIT_addBitsFast() : |
|
239 | * works only if `value` is _clean_, meaning all high bits above nbBits are 0 */ |
|
225 | * works only if `value` is _clean_, | |
|
226 | * meaning all high bits above nbBits are 0 */ | |
|
240 | 227 | MEM_STATIC void BIT_addBitsFast(BIT_CStream_t* bitC, |
|
241 | 228 | size_t value, unsigned nbBits) |
|
242 | 229 | { |
@@ -77,9 +77,9 b'' | |||
|
77 | 77 | * Enabled for clang & gcc >=4.8 on x86 when BMI2 isn't enabled by default. |
|
78 | 78 | */ |
|
79 | 79 | #ifndef DYNAMIC_BMI2 |
|
80 | #if (defined(__clang__) && __has_attribute(__target__)) \ | |
|
80 | #if ((defined(__clang__) && __has_attribute(__target__)) \ | |
|
81 | 81 | || (defined(__GNUC__) \ |
|
82 | && (__GNUC__ >= 5 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 8))) \ | |
|
82 | && (__GNUC__ >= 5 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 8)))) \ | |
|
83 | 83 | && (defined(__x86_64__) || defined(_M_X86)) \ |
|
84 | 84 | && !defined(__BMI2__) |
|
85 | 85 | # define DYNAMIC_BMI2 1 |
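
The extra parentheses matter because `&&` binds tighter than `||` in preprocessor expressions, exactly as in C; without them the x86 and !__BMI2__ guards attached only to the GCC alternative, so clang builds could define DYNAMIC_BMI2 on any architecture. A tiny self-contained illustration of the precedence:

    #include <stdio.h>

    int main(void)
    {
        int const is_clang = 1, is_gcc = 0, is_x86 = 0;
        /* A || B && C groups as A || (B && C): the is_x86 test is skipped for clang */
        int const buggy = is_clang || (is_gcc && is_x86);
        /* (A || B) && C: the is_x86 test always applies */
        int const fixed = (is_clang || is_gcc) && is_x86;
        printf("buggy=%d fixed=%d\n", buggy, fixed);   /* prints buggy=1 fixed=0 */
        return 0;
    }
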
@@ -88,15 +88,37 b'' | |||
|
88 | 88 | #endif |
|
89 | 89 | #endif |
|
90 | 90 | |
|
91 | /* prefetch */ |
|
92 | #if defined(_MSC_VER) && (defined(_M_X64) || defined(_M_I86)) /* _mm_prefetch() is not defined outside of x86/x64 */ | |
|
93 | # include <mmintrin.h> /* https://msdn.microsoft.com/fr-fr/library/84szxsww(v=vs.90).aspx */ | |
|
94 | # define PREFETCH(ptr) _mm_prefetch((const char*)ptr, _MM_HINT_T0) | |
|
95 | #elif defined(__GNUC__) | |
|
96 | # define PREFETCH(ptr) __builtin_prefetch(ptr, 0, 0) | |
|
91 | /* prefetch | |
|
92 | * can be disabled, by declaring NO_PREFETCH macro | |
|
93 | * All prefetch invocations use a single default locality 2, | |
|
94 | * generating instruction prefetcht1, | |
|
95 | * which, according to Intel, means "load data into L2 cache". | |
|
96 | * This is a good enough "middle ground" for the time being, | |
|
97 | * though in theory, it would be better to specialize locality depending on data being prefetched. | |
|
98 | * Tests could not determine any sensible difference based on locality value. */ | |
|
99 | #if defined(NO_PREFETCH) | |
|
100 | # define PREFETCH(ptr) (void)(ptr) /* disabled */ | |
|
97 | 101 | #else |
|
98 | # define PREFETCH(ptr) /* disabled */ | |
|
99 | #endif | |
|
102 | # if defined(_MSC_VER) && (defined(_M_X64) || defined(_M_I86)) /* _mm_prefetch() is not defined outside of x86/x64 */ | |
|
103 | # include <mmintrin.h> /* https://msdn.microsoft.com/fr-fr/library/84szxsww(v=vs.90).aspx */ | |
|
104 | # define PREFETCH(ptr) _mm_prefetch((const char*)(ptr), _MM_HINT_T1) | |
|
105 | # elif defined(__GNUC__) && ( (__GNUC__ >= 4) || ( (__GNUC__ == 3) && (__GNUC_MINOR__ >= 1) ) ) | |
|
106 | # define PREFETCH(ptr) __builtin_prefetch((ptr), 0 /* rw==read */, 2 /* locality */) | |
|
107 | # else | |
|
108 | # define PREFETCH(ptr) (void)(ptr) /* disabled */ | |
|
109 | # endif | |
|
110 | #endif /* NO_PREFETCH */ | |
|
111 | ||
|
112 | #define CACHELINE_SIZE 64 | |
|
113 | ||
|
114 | #define PREFETCH_AREA(p, s) { \ | |
|
115 | const char* const _ptr = (const char*)(p); \ | |
|
116 | size_t const _size = (size_t)(s); \ | |
|
117 | size_t _pos; \ | |
|
118 | for (_pos=0; _pos<_size; _pos+=CACHELINE_SIZE) { \ | |
|
119 | PREFETCH(_ptr + _pos); \ | |
|
120 | } \ | |
|
121 | } | |
|
100 | 122 | |
|
101 | 123 | /* disable warnings */ |
|
102 | 124 | #ifdef _MSC_VER /* Visual Studio */ |
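
The new PREFETCH_AREA macro simply walks a buffer one cache line at a time and issues one prefetch per line. A minimal sketch of the same pattern as a function rather than a macro, assuming a GCC/clang toolchain (other compilers degrade to a no-op):

    #include <stddef.h>

    #define CACHELINE_SIZE 64
    #if defined(__GNUC__)
    #  define PREFETCH(ptr) __builtin_prefetch((ptr), 0 /* read */, 2 /* L2 locality */)
    #else
    #  define PREFETCH(ptr) (void)(ptr)   /* disabled */
    #endif

    /* Touch a buffer one cache line at a time so the data is resident
     * in L2 before the hot loop that follows actually reads it. */
    static void prefetch_area(const void* p, size_t size)
    {
        const char* const base = (const char*)p;
        size_t pos;
        for (pos = 0; pos < size; pos += CACHELINE_SIZE)
            PREFETCH(base + pos);
    }
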
@@ -36,7 +36,7 b' MEM_STATIC ZSTD_cpuid_t ZSTD_cpuid(void)' | |||
|
36 | 36 | U32 f1d = 0; |
|
37 | 37 | U32 f7b = 0; |
|
38 | 38 | U32 f7c = 0; |
|
39 | #ifdef _MSC_VER | |
|
39 | #if defined(_MSC_VER) && (defined(_M_X64) || defined(_M_IX86)) | |
|
40 | 40 | int reg[4]; |
|
41 | 41 | __cpuid((int*)reg, 0); |
|
42 | 42 | { |
@@ -72,8 +72,7 b' MEM_STATIC ZSTD_cpuid_t ZSTD_cpuid(void)' | |||
|
72 | 72 | "cpuid\n\t" |
|
73 | 73 | "popl %%ebx\n\t" |
|
74 | 74 | : "=a"(f1a), "=c"(f1c), "=d"(f1d) |
|
75 | : "a"(1) | |
|
76 | :); | |
|
75 | : "a"(1)); | |
|
77 | 76 | } |
|
78 | 77 | if (n >= 7) { |
|
79 | 78 | __asm__( |
@@ -72,7 +72,21 b' size_t FSE_readNCount (short* normalized' | |||
|
72 | 72 | unsigned charnum = 0; |
|
73 | 73 | int previous0 = 0; |
|
74 | 74 | |
|
75 | if (hbSize < 4) return ERROR(srcSize_wrong); | |
|
75 | if (hbSize < 4) { | |
|
76 | /* This function only works when hbSize >= 4 */ | |
|
77 | char buffer[4]; | |
|
78 | memset(buffer, 0, sizeof(buffer)); | |
|
79 | memcpy(buffer, headerBuffer, hbSize); | |
|
80 | { size_t const countSize = FSE_readNCount(normalizedCounter, maxSVPtr, tableLogPtr, | |
|
81 | buffer, sizeof(buffer)); | |
|
82 | if (FSE_isError(countSize)) return countSize; | |
|
83 | if (countSize > hbSize) return ERROR(corruption_detected); | |
|
84 | return countSize; | |
|
85 | } } | |
|
86 | assert(hbSize >= 4); | |
|
87 | ||
|
88 | /* init */ | |
|
89 | memset(normalizedCounter, 0, (*maxSVPtr+1) * sizeof(normalizedCounter[0])); /* all symbols not present in NCount have a frequency of 0 */ | |
|
76 | 90 | bitStream = MEM_readLE32(ip); |
|
77 | 91 | nbBits = (bitStream & 0xF) + FSE_MIN_TABLELOG; /* extract tableLog */ |
|
78 | 92 | if (nbBits > FSE_TABLELOG_ABSOLUTE_MAX) return ERROR(tableLog_tooLarge); |
@@ -105,6 +119,7 b' size_t FSE_readNCount (short* normalized' | |||
|
105 | 119 | if (n0 > *maxSVPtr) return ERROR(maxSymbolValue_tooSmall); |
|
106 | 120 | while (charnum < n0) normalizedCounter[charnum++] = 0; |
|
107 | 121 | if ((ip <= iend-7) || (ip + (bitCount>>3) <= iend-4)) { |
|
122 | assert((bitCount >> 3) <= 3); /* For first condition to work */ | |
|
108 | 123 | ip += bitCount>>3; |
|
109 | 124 | bitCount &= 7; |
|
110 | 125 | bitStream = MEM_readLE32(ip) >> bitCount; |
@@ -72,6 +72,7 b' extern "C" {' | |||
|
72 | 72 | #define FSE_VERSION_NUMBER (FSE_VERSION_MAJOR *100*100 + FSE_VERSION_MINOR *100 + FSE_VERSION_RELEASE) |
|
73 | 73 | FSE_PUBLIC_API unsigned FSE_versionNumber(void); /**< library version number; to be used when checking dll version */ |
|
74 | 74 | |
|
75 | ||
|
75 | 76 | /*-**************************************** |
|
76 | 77 | * FSE simple functions |
|
77 | 78 | ******************************************/ |
@@ -129,7 +130,7 b' FSE_PUBLIC_API size_t FSE_compress2 (voi' | |||
|
129 | 130 | ******************************************/ |
|
130 | 131 | /*! |
|
131 | 132 | FSE_compress() does the following: |
|
132 | 1. count symbol occurrence from source[] into table count[] | |
|
133 | 1. count symbol occurrence from source[] into table count[] (see hist.h) | |
|
133 | 134 | 2. normalize counters so that sum(count[]) == Power_of_2 (2^tableLog) |
|
134 | 135 | 3. save normalized counters to memory buffer using writeNCount() |
|
135 | 136 | 4. build encoding table 'CTable' from normalized counters |
@@ -147,15 +148,6 b' or to save and provide normalized distri' | |||
|
147 | 148 | |
|
148 | 149 | /* *** COMPRESSION *** */ |
|
149 | 150 | |
|
150 | /*! FSE_count(): | |
|
151 | Provides the precise count of each byte within a table 'count'. | |
|
152 | 'count' is a table of unsigned int, of minimum size (*maxSymbolValuePtr+1). | |
|
153 | *maxSymbolValuePtr will be updated if detected smaller than initial value. | |
|
154 | @return : the count of the most frequent symbol (which is not identified). | |
|
155 | if return == srcSize, there is only one symbol. | |
|
156 | Can also return an error code, which can be tested with FSE_isError(). */ | |
|
157 | FSE_PUBLIC_API size_t FSE_count(unsigned* count, unsigned* maxSymbolValuePtr, const void* src, size_t srcSize); | |
|
158 | ||
|
159 | 151 | /*! FSE_optimalTableLog(): |
|
160 | 152 | dynamically downsize 'tableLog' when conditions are met. |
|
161 | 153 | It saves CPU time, by using smaller tables, while preserving or even improving compression ratio. |
@@ -167,7 +159,8 b' FSE_PUBLIC_API unsigned FSE_optimalTable' | |||
|
167 | 159 | 'normalizedCounter' is a table of short, of minimum size (maxSymbolValue+1). |
|
168 | 160 | @return : tableLog, |
|
169 | 161 | or an errorCode, which can be tested using FSE_isError() */ |
|
170 | FSE_PUBLIC_API size_t FSE_normalizeCount(short* normalizedCounter, unsigned tableLog, const unsigned* count, size_t srcSize, unsigned maxSymbolValue); |
|
162 | FSE_PUBLIC_API size_t FSE_normalizeCount(short* normalizedCounter, unsigned tableLog, | |
|
163 | const unsigned* count, size_t srcSize, unsigned maxSymbolValue); | |
|
171 | 164 | |
|
172 | 165 | /*! FSE_NCountWriteBound(): |
|
173 | 166 | Provides the maximum possible size of an FSE normalized table, given 'maxSymbolValue' and 'tableLog'. |
@@ -178,8 +171,9 b' FSE_PUBLIC_API size_t FSE_NCountWriteBou' | |||
|
178 | 171 | Compactly save 'normalizedCounter' into 'buffer'. |
|
179 | 172 | @return : size of the compressed table, |
|
180 | 173 | or an errorCode, which can be tested using FSE_isError(). */ |
|
181 | FSE_PUBLIC_API size_t FSE_writeNCount (void* buffer, size_t bufferSize, const short* normalizedCounter, unsigned maxSymbolValue, unsigned tableLog); |
|
182 | ||
|
174 | FSE_PUBLIC_API size_t FSE_writeNCount (void* buffer, size_t bufferSize, | |
|
175 | const short* normalizedCounter, | |
|
176 | unsigned maxSymbolValue, unsigned tableLog); | |
|
183 | 177 | |
|
184 | 178 | /*! Constructor and Destructor of FSE_CTable. |
|
185 | 179 | Note that FSE_CTable size depends on 'tableLog' and 'maxSymbolValue' */ |
@@ -250,7 +244,9 b' If there is an error, the function will ' | |||
|
250 | 244 | @return : size read from 'rBuffer', |
|
251 | 245 | or an errorCode, which can be tested using FSE_isError(). |
|
252 | 246 | maxSymbolValuePtr[0] and tableLogPtr[0] will also be updated with their respective values */ |
|
253 | FSE_PUBLIC_API size_t FSE_readNCount (short* normalizedCounter, unsigned* maxSymbolValuePtr, unsigned* tableLogPtr, const void* rBuffer, size_t rBuffSize); | |
|
247 | FSE_PUBLIC_API size_t FSE_readNCount (short* normalizedCounter, | |
|
248 | unsigned* maxSymbolValuePtr, unsigned* tableLogPtr, | |
|
249 | const void* rBuffer, size_t rBuffSize); | |
|
254 | 250 | |
|
255 | 251 | /*! Constructor and Destructor of FSE_DTable. |
|
256 | 252 | Note that its size depends on 'tableLog' */ |
@@ -325,33 +321,8 b' If there is an error, the function will ' | |||
|
325 | 321 | |
|
326 | 322 | |
|
327 | 323 | /* ***************************************** |
|
328 | * FSE advanced API | |
|
329 | *******************************************/ |
|
330 | /* FSE_count_wksp() : | |
|
331 | * Same as FSE_count(), but using an externally provided scratch buffer. | |
|
332 | * `workSpace` size must be table of >= `1024` unsigned | |
|
333 | */ | |
|
334 | size_t FSE_count_wksp(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
335 | const void* source, size_t sourceSize, unsigned* workSpace); | |
|
336 | ||
|
337 | /** FSE_countFast() : | |
|
338 | * same as FSE_count(), but blindly trusts that all byte values within src are <= *maxSymbolValuePtr | |
|
339 | */ | |
|
340 | size_t FSE_countFast(unsigned* count, unsigned* maxSymbolValuePtr, const void* src, size_t srcSize); | |
|
341 | ||
|
342 | /* FSE_countFast_wksp() : | |
|
343 | * Same as FSE_countFast(), but using an externally provided scratch buffer. | |
|
344 | * `workSpace` must be a table of minimum `1024` unsigned | |
|
345 | */ | |
|
346 | size_t FSE_countFast_wksp(unsigned* count, unsigned* maxSymbolValuePtr, const void* src, size_t srcSize, unsigned* workSpace); | |
|
347 | ||
|
348 | /*! FSE_count_simple() : | |
|
349 | * Same as FSE_countFast(), but does not use any additional memory (not even on stack). | |
|
350 | * This function is unsafe, and will segfault if any value within `src` is `> *maxSymbolValuePtr` (presuming it's also the size of `count`). | |
|
351 | */ | |
|
352 | size_t FSE_count_simple(unsigned* count, unsigned* maxSymbolValuePtr, const void* src, size_t srcSize); | |
|
353 | ||
|
354 | ||
|
324 | * FSE advanced API | |
|
325 | ***************************************** */ | |
|
355 | 326 | |
|
356 | 327 | unsigned FSE_optimalTableLog_internal(unsigned maxTableLog, size_t srcSize, unsigned maxSymbolValue, unsigned minus); |
|
357 | 328 | /**< same as FSE_optimalTableLog(), which used `minus==2` */ |
@@ -576,6 +547,39 b' MEM_STATIC void FSE_flushCState(BIT_CStr' | |||
|
576 | 547 | } |
|
577 | 548 | |
|
578 | 549 | |
|
550 | /* FSE_getMaxNbBits() : | |
|
551 | * Approximate maximum cost of a symbol, in bits. | |
|
552 | * Fractional get rounded up (i.e : a symbol with a normalized frequency of 3 gives the same result as a frequency of 2) | |
|
553 | * note 1 : assume symbolValue is valid (<= maxSymbolValue) | |
|
554 | * note 2 : if freq[symbolValue]==0, @return a fake cost of tableLog+1 bits */ | |
|
555 | MEM_STATIC U32 FSE_getMaxNbBits(const void* symbolTTPtr, U32 symbolValue) | |
|
556 | { | |
|
557 | const FSE_symbolCompressionTransform* symbolTT = (const FSE_symbolCompressionTransform*) symbolTTPtr; | |
|
558 | return (symbolTT[symbolValue].deltaNbBits + ((1<<16)-1)) >> 16; | |
|
559 | } | |
|
560 | ||
|
561 | /* FSE_bitCost() : | |
|
562 | * Approximate symbol cost, as fractional value, using fixed-point format (accuracyLog fractional bits) | |
|
563 | * note 1 : assume symbolValue is valid (<= maxSymbolValue) | |
|
564 | * note 2 : if freq[symbolValue]==0, @return a fake cost of tableLog+1 bits */ | |
|
565 | MEM_STATIC U32 FSE_bitCost(const void* symbolTTPtr, U32 tableLog, U32 symbolValue, U32 accuracyLog) | |
|
566 | { | |
|
567 | const FSE_symbolCompressionTransform* symbolTT = (const FSE_symbolCompressionTransform*) symbolTTPtr; | |
|
568 | U32 const minNbBits = symbolTT[symbolValue].deltaNbBits >> 16; | |
|
569 | U32 const threshold = (minNbBits+1) << 16; | |
|
570 | assert(tableLog < 16); | |
|
571 | assert(accuracyLog < 31-tableLog); /* ensure enough room for renormalization double shift */ | |
|
572 | { U32 const tableSize = 1 << tableLog; | |
|
573 | U32 const deltaFromThreshold = threshold - (symbolTT[symbolValue].deltaNbBits + tableSize); | |
|
574 | U32 const normalizedDeltaFromThreshold = (deltaFromThreshold << accuracyLog) >> tableLog; /* linear interpolation (very approximate) */ | |
|
575 | U32 const bitMultiplier = 1 << accuracyLog; | |
|
576 | assert(symbolTT[symbolValue].deltaNbBits + tableSize <= threshold); | |
|
577 | assert(normalizedDeltaFromThreshold <= bitMultiplier); | |
|
578 | return (minNbBits+1)*bitMultiplier - normalizedDeltaFromThreshold; | |
|
579 | } | |
|
580 | } | |
|
581 | ||
|
582 | ||
|
579 | 583 | /* ====== Decompression ====== */ |
|
580 | 584 | |
|
581 | 585 | typedef struct { |
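
Both new helpers read a cost stored in 16.16 fixed point out of deltaNbBits; FSE_getMaxNbBits() rounds up to whole bits by adding (1<<16)-1 before shifting, which is why a normalized frequency of 3 (about tableLog - 1.58 bits) rounds to the same whole-bit cost as a frequency of 2 (exactly tableLog - 1). A small sketch of just that fixed-point ceiling, independent of the FSE tables:

    #include <stdio.h>

    #define FIXED_ONE (1u << 16)   /* 16.16 fixed point, as in deltaNbBits */

    /* Round a 16.16 fixed-point bit cost up to whole bits, mirroring
     * (deltaNbBits + ((1<<16)-1)) >> 16 in FSE_getMaxNbBits() above. */
    static unsigned ceil_bits(unsigned fixedCost)
    {
        return (fixedCost + (FIXED_ONE - 1)) >> 16;
    }

    int main(void)
    {
        unsigned const cost_freq3 = 4 * FIXED_ONE + 27525;  /* ~4.42 bits, freq 3 @ tableLog 6 */
        unsigned const cost_freq2 = 5 * FIXED_ONE;          /* exactly 5 bits, freq 2 @ tableLog 6 */
        printf("%u %u\n", ceil_bits(cost_freq3), ceil_bits(cost_freq2));  /* prints 5 5 */
        return 0;
    }
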
@@ -49,7 +49,7 b'' | |||
|
49 | 49 | * Error Management |
|
50 | 50 | ****************************************************************/ |
|
51 | 51 | #define FSE_isError ERR_isError |
|
52 | #define FSE_STATIC_ASSERT(c) { enum { FSE_static_assert = 1/(int)(!!(c)) }; } /* use only *after* variable declarations */ |
|
52 | #define FSE_STATIC_ASSERT(c) DEBUG_STATIC_ASSERT(c) /* use only *after* variable declarations */ | |
|
53 | 53 | |
|
54 | 54 | /* check and forward error code */ |
|
55 | 55 | #define CHECK_F(f) { size_t const e = f; if (FSE_isError(e)) return e; } |
@@ -1,7 +1,7 b'' | |||
|
1 | 1 | /* ****************************************************************** |
|
2 | Huffman coder, part of New Generation Entropy library | |
|
3 | header file | |
|
4 | Copyright (C) 2013-2016, Yann Collet. |
|
2 | huff0 huffman codec, | |
|
3 | part of Finite State Entropy library | |
|
4 | Copyright (C) 2013-present, Yann Collet. | |
|
5 | 5 | |
|
6 | 6 | BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) |
|
7 | 7 | |
@@ -163,25 +163,25 b' HUF_PUBLIC_API size_t HUF_compress4X_wks' | |||
|
163 | 163 | /* static allocation of HUF's DTable */ |
|
164 | 164 | typedef U32 HUF_DTable; |
|
165 | 165 | #define HUF_DTABLE_SIZE(maxTableLog) (1 + (1<<(maxTableLog))) |
|
166 | #define HUF_CREATE_STATIC_DTABLEX2(DTable, maxTableLog) \ |
|
166 | #define HUF_CREATE_STATIC_DTABLEX1(DTable, maxTableLog) \ | |
|
167 | 167 | HUF_DTable DTable[HUF_DTABLE_SIZE((maxTableLog)-1)] = { ((U32)((maxTableLog)-1) * 0x01000001) } |
|
168 | #define HUF_CREATE_STATIC_DTABLEX4(DTable, maxTableLog) \ |
|
168 | #define HUF_CREATE_STATIC_DTABLEX2(DTable, maxTableLog) \ | |
|
169 | 169 | HUF_DTable DTable[HUF_DTABLE_SIZE(maxTableLog)] = { ((U32)(maxTableLog) * 0x01000001) } |
|
170 | 170 | |
|
171 | 171 | |
|
172 | 172 | /* **************************************** |
|
173 | 173 | * Advanced decompression functions |
|
174 | 174 | ******************************************/ |
|
175 | size_t HUF_decompress4X2 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< single-symbol decoder */ |
|
176 | size_t HUF_decompress4X4 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< double-symbols decoder */ |
|
175 | size_t HUF_decompress4X1 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< single-symbol decoder */ | |
|
176 | size_t HUF_decompress4X2 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< double-symbols decoder */ | |
|
177 | 177 | |
|
178 | 178 | size_t HUF_decompress4X_DCtx (HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< decodes RLE and uncompressed */ |
|
179 | 179 | size_t HUF_decompress4X_hufOnly(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< considers RLE and uncompressed as errors */ |
|
180 | 180 | size_t HUF_decompress4X_hufOnly_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< considers RLE and uncompressed as errors */ |
|
181 | size_t HUF_decompress4X2_DCtx(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< single-symbol decoder */ |

182 | size_t HUF_decompress4X2_DCtx_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< single-symbol decoder */ |

183 | size_t HUF_decompress4X4_DCtx(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< double-symbols decoder */ |

184 | size_t HUF_decompress4X4_DCtx_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< double-symbols decoder */ |
|
181 | size_t HUF_decompress4X1_DCtx(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< single-symbol decoder */ | |
|
182 | size_t HUF_decompress4X1_DCtx_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< single-symbol decoder */ | |
|
183 | size_t HUF_decompress4X2_DCtx(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< double-symbols decoder */ | |
|
184 | size_t HUF_decompress4X2_DCtx_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< double-symbols decoder */ | |
|
185 | 185 | |
|
186 | 186 | |
|
187 | 187 | /* **************************************** |
@@ -208,7 +208,7 b' size_t HUF_compress4X_usingCTable(void* ' | |||
|
208 | 208 | typedef enum { |
|
209 | 209 | HUF_repeat_none, /**< Cannot use the previous table */ |
|
210 | 210 | HUF_repeat_check, /**< Can use the previous table but it must be checked. Note : The previous table must have been constructed by HUF_compress{1, 4}X_repeat */ |
|
211 | HUF_repeat_valid /**< Can use the previous table and it is asumed to be valid */ | |
|
211 | HUF_repeat_valid /**< Can use the previous table and it is assumed to be valid */ | |
|
212 | 212 | } HUF_repeat; |
|
213 | 213 | /** HUF_compress4X_repeat() : |
|
214 | 214 | * Same as HUF_compress4X_wksp(), but considers using hufTable if *repeat != HUF_repeat_none. |
@@ -227,7 +227,9 b' size_t HUF_compress4X_repeat(void* dst, ' | |||
|
227 | 227 | */ |
|
228 | 228 | #define HUF_CTABLE_WORKSPACE_SIZE_U32 (2*HUF_SYMBOLVALUE_MAX +1 +1) |
|
229 | 229 | #define HUF_CTABLE_WORKSPACE_SIZE (HUF_CTABLE_WORKSPACE_SIZE_U32 * sizeof(unsigned)) |
|
230 | size_t HUF_buildCTable_wksp (HUF_CElt* tree, const U32* count, U32 maxSymbolValue, U32 maxNbBits, void* workSpace, size_t wkspSize); | |
|
230 | size_t HUF_buildCTable_wksp (HUF_CElt* tree, | |
|
231 | const U32* count, U32 maxSymbolValue, U32 maxNbBits, | |
|
232 | void* workSpace, size_t wkspSize); | |
|
231 | 233 | |
|
232 | 234 | /*! HUF_readStats() : |
|
233 | 235 | * Read compact Huffman tree, saved by HUF_writeCTable(). |
@@ -242,10 +244,15 b' size_t HUF_readStats(BYTE* huffWeight, s' | |||
|
242 | 244 | * Loading a CTable saved with HUF_writeCTable() */ |
|
243 | 245 | size_t HUF_readCTable (HUF_CElt* CTable, unsigned* maxSymbolValuePtr, const void* src, size_t srcSize); |
|
244 | 246 | |
|
247 | /** HUF_getNbBits() : | |
|
248 | * Read nbBits from CTable symbolTable, for symbol `symbolValue` presumed <= HUF_SYMBOLVALUE_MAX | |
|
249 | * Note 1 : is not inlined, as HUF_CElt definition is private | |
|
250 | * Note 2 : const void* used, so that it can provide a statically allocated table as argument (which uses type U32) */ | |
|
251 | U32 HUF_getNbBits(const void* symbolTable, U32 symbolValue); | |
|
245 | 252 | |
|
246 | 253 | /* |
|
247 | 254 | * HUF_decompress() does the following: |
|
248 | * 1. select the decompression algorithm (X2, X4) based on pre-computed heuristics |
|
255 | * 1. select the decompression algorithm (X1, X2) based on pre-computed heuristics | |
|
249 | 256 | * 2. build Huffman table from save, using HUF_readDTableX?() |
|
250 | 257 | * 3. decode 1 or 4 segments in parallel using HUF_decompress?X?_usingDTable() |
|
251 | 258 | */ |
@@ -253,13 +260,13 b' size_t HUF_readCTable (HUF_CElt* CTable,' | |||
|
253 | 260 | /** HUF_selectDecoder() : |
|
254 | 261 | * Tells which decoder is likely to decode faster, |
|
255 | 262 | * based on a set of pre-computed metrics. |
|
256 | * @return : 0==HUF_decompress4X2, 1==HUF_decompress4X4 . |
|
263 | * @return : 0==HUF_decompress4X1, 1==HUF_decompress4X2 . | |
|
257 | 264 | * Assumption : 0 < dstSize <= 128 KB */ |
|
258 | 265 | U32 HUF_selectDecoder (size_t dstSize, size_t cSrcSize); |
|
259 | 266 | |
|
260 | 267 | /** |
|
261 | 268 | * The minimum workspace size for the `workSpace` used in |
|
262 | * HUF_readDTableX2_wksp() and HUF_readDTableX4_wksp(). |
|
269 | * HUF_readDTableX1_wksp() and HUF_readDTableX2_wksp(). | |
|
263 | 270 | * |
|
264 | 271 | * The space used depends on HUF_TABLELOG_MAX, ranging from ~1500 bytes when |
|
265 | 272 | * HUF_TABLE_LOG_MAX=12 to ~1850 bytes when HUF_TABLE_LOG_MAX=15. |
@@ -270,14 +277,14 b' U32 HUF_selectDecoder (size_t dstSize, s' | |||
|
270 | 277 | #define HUF_DECOMPRESS_WORKSPACE_SIZE (2 << 10) |
|
271 | 278 | #define HUF_DECOMPRESS_WORKSPACE_SIZE_U32 (HUF_DECOMPRESS_WORKSPACE_SIZE / sizeof(U32)) |
|
272 | 279 | |
|
280 | size_t HUF_readDTableX1 (HUF_DTable* DTable, const void* src, size_t srcSize); | |
|
281 | size_t HUF_readDTableX1_wksp (HUF_DTable* DTable, const void* src, size_t srcSize, void* workSpace, size_t wkspSize); | |
|
273 | 282 | size_t HUF_readDTableX2 (HUF_DTable* DTable, const void* src, size_t srcSize); |
|
274 | 283 | size_t HUF_readDTableX2_wksp (HUF_DTable* DTable, const void* src, size_t srcSize, void* workSpace, size_t wkspSize); |
|
275 | size_t HUF_readDTableX4 (HUF_DTable* DTable, const void* src, size_t srcSize); | |
|
276 | size_t HUF_readDTableX4_wksp (HUF_DTable* DTable, const void* src, size_t srcSize, void* workSpace, size_t wkspSize); | |
|
277 | 284 | |
|
278 | 285 | size_t HUF_decompress4X_usingDTable(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable); |
|
286 | size_t HUF_decompress4X1_usingDTable(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable); | |
|
279 | 287 | size_t HUF_decompress4X2_usingDTable(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable); |
|
280 | size_t HUF_decompress4X4_usingDTable(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable); | |
|
281 | 288 | |
|
282 | 289 | |
|
283 | 290 | /* ====================== */ |
@@ -298,25 +305,25 b' size_t HUF_compress1X_repeat(void* dst, ' | |||
|
298 | 305 | void* workSpace, size_t wkspSize, /**< `workSpace` must be aligned on 4-bytes boundaries, `wkspSize` must be >= HUF_WORKSPACE_SIZE */ |
|
299 | 306 | HUF_CElt* hufTable, HUF_repeat* repeat, int preferRepeat, int bmi2); |
|
300 | 307 | |
|
301 | size_t HUF_decompress1X2 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /* single-symbol decoder */ |

302 | size_t HUF_decompress1X4 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /* double-symbol decoder */ |
|
308 | size_t HUF_decompress1X1 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /* single-symbol decoder */ | |
|
309 | size_t HUF_decompress1X2 (void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /* double-symbol decoder */ | |
|
303 | 310 | |
|
304 | 311 | size_t HUF_decompress1X_DCtx (HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); |
|
305 | 312 | size_t HUF_decompress1X_DCtx_wksp (HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); |
|
306 | size_t HUF_decompress1X2_DCtx(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< single-symbol decoder */ |

307 | size_t HUF_decompress1X2_DCtx_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< single-symbol decoder */ |

308 | size_t HUF_decompress1X4_DCtx(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< double-symbols decoder */ |

309 | size_t HUF_decompress1X4_DCtx_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< double-symbols decoder */ |
|
313 | size_t HUF_decompress1X1_DCtx(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< single-symbol decoder */ | |
|
314 | size_t HUF_decompress1X1_DCtx_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< single-symbol decoder */ | |
|
315 | size_t HUF_decompress1X2_DCtx(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize); /**< double-symbols decoder */ | |
|
316 | size_t HUF_decompress1X2_DCtx_wksp(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize); /**< double-symbols decoder */ | |
|
310 | 317 | |
|
311 | 318 | size_t HUF_decompress1X_usingDTable(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable); /**< automatic selection of sing or double symbol decoder, based on DTable */ |
|
319 | size_t HUF_decompress1X1_usingDTable(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable); | |
|
312 | 320 | size_t HUF_decompress1X2_usingDTable(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable); |
|
313 | size_t HUF_decompress1X4_usingDTable(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable); | |
|
314 | 321 | |
|
315 | 322 | /* BMI2 variants. |
|
316 | 323 | * If the CPU has BMI2 support, pass bmi2=1, otherwise pass bmi2=0. |
|
317 | 324 | */ |
|
318 | 325 | size_t HUF_decompress1X_usingDTable_bmi2(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable, int bmi2); |
|
319 | size_t HUF_decompress1X2_DCtx_wksp_bmi2(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize, int bmi2); |
|
326 | size_t HUF_decompress1X1_DCtx_wksp_bmi2(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize, int bmi2); | |
|
320 | 327 | size_t HUF_decompress4X_usingDTable_bmi2(void* dst, size_t maxDstSize, const void* cSrc, size_t cSrcSize, const HUF_DTable* DTable, int bmi2); |
|
321 | 328 | size_t HUF_decompress4X_hufOnly_wksp_bmi2(HUF_DTable* dctx, void* dst, size_t dstSize, const void* cSrc, size_t cSrcSize, void* workSpace, size_t wkspSize, int bmi2); |
|
322 | 329 |
@@ -57,11 +57,23 b' MEM_STATIC void MEM_check(void) { MEM_ST' | |||
|
57 | 57 | typedef uint64_t U64; |
|
58 | 58 | typedef int64_t S64; |
|
59 | 59 | #else |
|
60 | # include <limits.h> | |
|
61 | #if CHAR_BIT != 8 | |
|
62 | # error "this implementation requires char to be exactly 8-bit type" | |
|
63 | #endif | |
|
60 | 64 | typedef unsigned char BYTE; |
|
65 | #if USHRT_MAX != 65535 | |
|
66 | # error "this implementation requires short to be exactly 16-bit type" | |
|
67 | #endif | |
|
61 | 68 | typedef unsigned short U16; |
|
62 | 69 | typedef signed short S16; |
|
70 | #if UINT_MAX != 4294967295 | |
|
71 | # error "this implementation requires int to be exactly 32-bit type" | |
|
72 | #endif | |
|
63 | 73 | typedef unsigned int U32; |
|
64 | 74 | typedef signed int S32; |
|
75 | /* note : there are no limits defined for long long type in C90. | |
|
76 | * limits exist in C99, however, in such case, <stdint.h> is preferred */ | |
|
65 | 77 | typedef unsigned long long U64; |
|
66 | 78 | typedef signed long long S64; |
|
67 | 79 | #endif |
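
On the C90 fallback path there is no <stdint.h>, so the exact-width typedefs are only guesses about the platform; the new <limits.h> probes turn a wrong guess into a compile-time error instead of silent data corruption. The pattern in isolation:

    #include <limits.h>

    /* Verify a fallback typedef at compile time: if unsigned int is not
     * 32-bit on this platform, the build stops here instead of
     * miscompiling every structure that assumes 4-byte fields. */
    #if UINT_MAX != 4294967295
    #  error "unsigned int is not a 32-bit type on this platform"
    #endif
    typedef unsigned int U32;
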
@@ -10,9 +10,10 b'' | |||
|
10 | 10 | |
|
11 | 11 | |
|
12 | 12 | /* ====== Dependencies ======= */ |
|
13 | #include <stddef.h> /* size_t */ | |
|
13 | #include <stddef.h> /* size_t */ | |
|
14 | #include "debug.h" /* assert */ | |
|
15 | #include "zstd_internal.h" /* ZSTD_malloc, ZSTD_free */ | |
|
14 | 16 | #include "pool.h" |
|
15 | #include "zstd_internal.h" /* ZSTD_malloc, ZSTD_free */ | |
|
16 | 17 | |
|
17 | 18 | /* ====== Compiler specifics ====== */ |
|
18 | 19 | #if defined(_MSC_VER) |
@@ -33,8 +34,9 b' typedef struct POOL_job_s {' | |||
|
33 | 34 | struct POOL_ctx_s { |
|
34 | 35 | ZSTD_customMem customMem; |
|
35 | 36 | /* Keep track of the threads */ |
|
36 | ZSTD_pthread_t *threads; |

37 | size_t numThreads; |
|
37 | ZSTD_pthread_t* threads; | |
|
38 | size_t threadCapacity; | |
|
39 | size_t threadLimit; | |
|
38 | 40 | |
|
39 | 41 | /* The queue is a circular buffer */ |
|
40 | 42 | POOL_job *queue; |
@@ -58,10 +60,10 b' struct POOL_ctx_s {' | |||
|
58 | 60 | }; |
|
59 | 61 | |
|
60 | 62 | /* POOL_thread() : |
|
61 | Work thread for the thread pool. |

62 | Waits for jobs and executes them. |

63 | @returns : NULL on failure else non-null. |
|
64 | */ | |
|
63 | * Work thread for the thread pool. | |
|
64 | * Waits for jobs and executes them. | |
|
65 | * @returns : NULL on failure else non-null. | |
|
66 | */ | |
|
65 | 67 | static void* POOL_thread(void* opaque) { |
|
66 | 68 | POOL_ctx* const ctx = (POOL_ctx*)opaque; |
|
67 | 69 | if (!ctx) { return NULL; } |
@@ -69,14 +71,17 b' static void* POOL_thread(void* opaque) {' | |||
|
69 | 71 | /* Lock the mutex and wait for a non-empty queue or until shutdown */ |
|
70 | 72 | ZSTD_pthread_mutex_lock(&ctx->queueMutex); |
|
71 | 73 | |
|
72 | while (ctx->queueEmpty && !ctx->shutdown) { |
|
74 | while ( ctx->queueEmpty | |
|
75 | || (ctx->numThreadsBusy >= ctx->threadLimit) ) { | |
|
76 | if (ctx->shutdown) { | |
|
77 | /* even if !queueEmpty, (possible if numThreadsBusy >= threadLimit), | |
|
78 | * a few threads will be shutdown while !queueEmpty, | |
|
79 | * but enough threads will remain active to finish the queue */ | |
|
80 | ZSTD_pthread_mutex_unlock(&ctx->queueMutex); | |
|
81 | return opaque; | |
|
82 | } | |
|
73 | 83 | ZSTD_pthread_cond_wait(&ctx->queuePopCond, &ctx->queueMutex); |
|
74 | 84 | } |
|
75 | /* empty => shutting down: so stop */ | |
|
76 | if (ctx->queueEmpty) { | |
|
77 | ZSTD_pthread_mutex_unlock(&ctx->queueMutex); | |
|
78 | return opaque; | |
|
79 | } | |
|
80 | 85 | /* Pop a job off the queue */ |
|
81 | 86 | { POOL_job const job = ctx->queue[ctx->queueHead]; |
|
82 | 87 | ctx->queueHead = (ctx->queueHead + 1) % ctx->queueSize; |
@@ -89,30 +94,32 b' static void* POOL_thread(void* opaque) {' | |||
|
89 | 94 | job.function(job.opaque); |
|
90 | 95 | |
|
91 | 96 | /* If the intended queue size was 0, signal after finishing job */ |
|
97 | ZSTD_pthread_mutex_lock(&ctx->queueMutex); | |
|
98 | ctx->numThreadsBusy--; | |
|
92 | 99 | if (ctx->queueSize == 1) { |
|
93 | ZSTD_pthread_mutex_lock(&ctx->queueMutex); | |
|
94 | ctx->numThreadsBusy--; | |
|
95 | ZSTD_pthread_mutex_unlock(&ctx->queueMutex); | |
|
96 | 100 | ZSTD_pthread_cond_signal(&ctx->queuePushCond); |
|
97 | } } |
|
101 | } | |
|
102 | ZSTD_pthread_mutex_unlock(&ctx->queueMutex); | |
|
103 | } | |
|
98 | 104 | } /* for (;;) */ |
|
99 | /* Unreachable */ | |
|
105 | assert(0); /* Unreachable */ | |
|
100 | 106 | } |
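
This rework moves the numThreadsBusy decrement and the queuePushCond signal into one critical section, the standard shape for condition variables: mutate the shared predicate and signal while still holding the mutex, so a waiter re-checking its predicate cannot observe a stale state. The bare pattern, sketched with plain pthreads for brevity (worker_state is an illustrative type, not zstd's):

    #include <pthread.h>

    typedef struct {
        pthread_mutex_t mutex;
        pthread_cond_t  cond;
        int             busy;
    } worker_state;

    static void finish_job(worker_state* ws)
    {
        pthread_mutex_lock(&ws->mutex);
        ws->busy--;                       /* update the shared predicate... */
        pthread_cond_signal(&ws->cond);   /* ...and signal in the same critical section */
        pthread_mutex_unlock(&ws->mutex);
    }
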
|
101 | 107 | |
|
102 | 108 | POOL_ctx* POOL_create(size_t numThreads, size_t queueSize) { |
|
103 | 109 | return POOL_create_advanced(numThreads, queueSize, ZSTD_defaultCMem); |
|
104 | 110 | } |
|
105 | 111 | |
|
106 | POOL_ctx* POOL_create_advanced(size_t numThreads, size_t queueSize, ZSTD_customMem customMem) { |
|
112 | POOL_ctx* POOL_create_advanced(size_t numThreads, size_t queueSize, | |
|
113 | ZSTD_customMem customMem) { | |
|
107 | 114 | POOL_ctx* ctx; |
|
108 | /* Check the parameters */ |
|
115 | /* Check parameters */ | |
|
109 | 116 | if (!numThreads) { return NULL; } |
|
110 | 117 | /* Allocate the context and zero initialize */ |
|
111 | 118 | ctx = (POOL_ctx*)ZSTD_calloc(sizeof(POOL_ctx), customMem); |
|
112 | 119 | if (!ctx) { return NULL; } |
|
113 | 120 | /* Initialize the job queue. |
|
114 | * It needs one extra space since one space is wasted to differentiate empty |
|
115 | * and full queues. | |
|
121 | * It needs one extra space since one space is wasted to differentiate | |
|
122 | * empty and full queues. | |
|
116 | 123 | */ |
|
117 | 124 | ctx->queueSize = queueSize + 1; |
|
118 | 125 | ctx->queue = (POOL_job*)ZSTD_malloc(ctx->queueSize * sizeof(POOL_job), customMem); |
@@ -126,7 +133,7 b' POOL_ctx* POOL_create_advanced(size_t nu' | |||
|
126 | 133 | ctx->shutdown = 0; |
|
127 | 134 | /* Allocate space for the thread handles */ |
|
128 | 135 | ctx->threads = (ZSTD_pthread_t*)ZSTD_malloc(numThreads * sizeof(ZSTD_pthread_t), customMem); |
|
129 | ctx->numThreads = 0; |
|
136 | ctx->threadCapacity = 0; | |
|
130 | 137 | ctx->customMem = customMem; |
|
131 | 138 | /* Check for errors */ |
|
132 | 139 | if (!ctx->threads || !ctx->queue) { POOL_free(ctx); return NULL; } |
@@ -134,11 +141,12 b' POOL_ctx* POOL_create_advanced(size_t nu' | |||
|
134 | 141 | { size_t i; |
|
135 | 142 | for (i = 0; i < numThreads; ++i) { |
|
136 | 143 | if (ZSTD_pthread_create(&ctx->threads[i], NULL, &POOL_thread, ctx)) { |
|
137 | ctx->numThreads = i; |
|
144 | ctx->threadCapacity = i; | |
|
138 | 145 | POOL_free(ctx); |
|
139 | 146 | return NULL; |
|
140 | 147 | } } |
|
141 | ctx->numThreads = numThreads; |
|
148 | ctx->threadCapacity = numThreads; | |
|
149 | ctx->threadLimit = numThreads; | |
|
142 | 150 | } |
|
143 | 151 | return ctx; |
|
144 | 152 | } |
@@ -156,8 +164,8 b' static void POOL_join(POOL_ctx* ctx) {' | |||
|
156 | 164 | ZSTD_pthread_cond_broadcast(&ctx->queuePopCond); |
|
157 | 165 | /* Join all of the threads */ |
|
158 | 166 | { size_t i; |
|
159 | for (i = 0; i < ctx->numThreads; ++i) { |
|
160 | ZSTD_pthread_join(ctx->threads[i], NULL); | |
|
167 | for (i = 0; i < ctx->threadCapacity; ++i) { | |
|
168 | ZSTD_pthread_join(ctx->threads[i], NULL); /* note : could fail */ | |
|
161 | 169 | } } |
|
162 | 170 | } |
|
163 | 171 | |
@@ -172,24 +180,68 b' void POOL_free(POOL_ctx *ctx) {' | |||
|
172 | 180 | ZSTD_free(ctx, ctx->customMem); |
|
173 | 181 | } |
|
174 | 182 | |
|
183 | ||
|
184 | ||
|
175 | 185 | size_t POOL_sizeof(POOL_ctx *ctx) { |
|
176 | 186 | if (ctx==NULL) return 0; /* supports sizeof NULL */ |
|
177 | 187 | return sizeof(*ctx) |
|
178 | 188 | + ctx->queueSize * sizeof(POOL_job) |
|
179 | + ctx->numThreads * sizeof(ZSTD_pthread_t); |
|
189 | + ctx->threadCapacity * sizeof(ZSTD_pthread_t); | |
|
190 | } | |
|
191 | ||
|
192 | ||
|
193 | /* @return : 0 on success, 1 on error */ | |
|
194 | static int POOL_resize_internal(POOL_ctx* ctx, size_t numThreads) | |
|
195 | { | |
|
196 | if (numThreads <= ctx->threadCapacity) { | |
|
197 | if (!numThreads) return 1; | |
|
198 | ctx->threadLimit = numThreads; | |
|
199 | return 0; | |
|
200 | } | |
|
201 | /* numThreads > threadCapacity */ | |
|
202 | { ZSTD_pthread_t* const threadPool = (ZSTD_pthread_t*)ZSTD_malloc(numThreads * sizeof(ZSTD_pthread_t), ctx->customMem); | |
|
203 | if (!threadPool) return 1; | |
|
204 | /* replace existing thread pool */ | |
|
205 | memcpy(threadPool, ctx->threads, ctx->threadCapacity * sizeof(*threadPool)); | |
|
206 | ZSTD_free(ctx->threads, ctx->customMem); | |
|
207 | ctx->threads = threadPool; | |
|
208 | /* Initialize additional threads */ | |
|
209 | { size_t threadId; | |
|
210 | for (threadId = ctx->threadCapacity; threadId < numThreads; ++threadId) { | |
|
211 | if (ZSTD_pthread_create(&threadPool[threadId], NULL, &POOL_thread, ctx)) { | |
|
212 | ctx->threadCapacity = threadId; | |
|
213 | return 1; | |
|
214 | } } | |
|
215 | } } | |
|
216 | /* successfully expanded */ | |
|
217 | ctx->threadCapacity = numThreads; | |
|
218 | ctx->threadLimit = numThreads; | |
|
219 | return 0; | |
|
220 | } | |
|
221 | ||
|
222 | /* @return : 0 on success, 1 on error */ | |
|
223 | int POOL_resize(POOL_ctx* ctx, size_t numThreads) | |
|
224 | { | |
|
225 | int result; | |
|
226 | if (ctx==NULL) return 1; | |
|
227 | ZSTD_pthread_mutex_lock(&ctx->queueMutex); | |
|
228 | result = POOL_resize_internal(ctx, numThreads); | |
|
229 | ZSTD_pthread_cond_broadcast(&ctx->queuePopCond); | |
|
230 | ZSTD_pthread_mutex_unlock(&ctx->queueMutex); | |
|
231 | return result; | |
|
180 | 232 | } |
|
181 | 233 | |
|
182 | 234 | /** |
|
183 | 235 | * Returns 1 if the queue is full and 0 otherwise. |
|
184 | 236 | * |
|
185 | * If the queueSize is 1 (the pool was created with an intended queueSize of 0), |
|
186 | * then a queue is empty if there is a thread free and no job is waiting. | |
|
237 | * When queueSize is 1 (pool was created with an intended queueSize of 0), | |
|
238 | * then a queue is empty if there is a thread free _and_ no job is waiting. | |
|
187 | 239 | */ |
|
188 | 240 | static int isQueueFull(POOL_ctx const* ctx) { |
|
189 | 241 | if (ctx->queueSize > 1) { |
|
190 | 242 | return ctx->queueHead == ((ctx->queueTail + 1) % ctx->queueSize); |
|
191 | 243 | } else { |
|
192 | return ctx->numThreadsBusy == ctx->numThreads || |
|
244 | return (ctx->numThreadsBusy == ctx->threadLimit) || | |
|
193 | 245 | !ctx->queueEmpty; |
|
194 | 246 | } |
|
195 | 247 | } |
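
The new POOL_resize() grows by copying the handle array and spawning only the missing threads, and shrinks by merely lowering threadLimit; excess workers park in the queuePopCond wait, which is why isQueueFull() now compares against threadLimit rather than the allocated count. A hedged usage sketch built only from the APIs in this patch:

    #include <stddef.h>
    #include "pool.h"

    /* Grow a pool for a bursty phase, then shrink it back.
     * Error handling kept minimal for clarity. */
    static int burst_then_settle(void)
    {
        POOL_ctx* const pool = POOL_create(2 /* threads */, 8 /* queue size */);
        if (pool == NULL) return 1;
        if (POOL_resize(pool, 8)) { POOL_free(pool); return 1; }  /* grow: spawns 6 more threads */
        /* ... submit heavy jobs with POOL_add() here ... */
        (void)POOL_resize(pool, 2);  /* shrink: only lowers threadLimit */
        POOL_free(pool);
        return 0;
    }
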
@@ -263,6 +315,11 b' void POOL_free(POOL_ctx* ctx) {' | |||
|
263 | 315 | (void)ctx; |
|
264 | 316 | } |
|
265 | 317 | |
|
318 | int POOL_resize(POOL_ctx* ctx, size_t numThreads) { | |
|
319 | (void)ctx; (void)numThreads; | |
|
320 | return 0; | |
|
321 | } | |
|
322 | ||
|
266 | 323 | void POOL_add(POOL_ctx* ctx, POOL_function function, void* opaque) { |
|
267 | 324 | (void)ctx; |
|
268 | 325 | function(opaque); |
@@ -30,40 +30,50 b' typedef struct POOL_ctx_s POOL_ctx;' | |||
|
30 | 30 | */ |
|
31 | 31 | POOL_ctx* POOL_create(size_t numThreads, size_t queueSize); |
|
32 | 32 | |
|
33 | POOL_ctx* POOL_create_advanced(size_t numThreads, size_t queueSize, ZSTD_customMem customMem); |
|
33 | POOL_ctx* POOL_create_advanced(size_t numThreads, size_t queueSize, | |
|
34 | ZSTD_customMem customMem); | |
|
34 | 35 | |
|
35 | 36 | /*! POOL_free() : |
|
36 | Free a thread pool returned by POOL_create(). |
|
37 | */ | |
|
37 | * Free a thread pool returned by POOL_create(). | |
|
38 | */ | |
|
38 | 39 | void POOL_free(POOL_ctx* ctx); |
|
39 | 40 | |
|
41 | /*! POOL_resize() : | |
|
42 | * Expands or shrinks pool's number of threads. | |
|
43 | * This is more efficient than releasing + creating a new context, | |
|
44 | * since it tries to preserve and re-use existing threads. | |
|
45 | * `numThreads` must be at least 1. | |
|
46 | * @return : 0 when resize was successful, | |
|
47 | * !0 (typically 1) if there is an error. | |
|
48 | * note : only numThreads can be resized, queueSize remains unchanged. | |
|
49 | */ | |
|
50 | int POOL_resize(POOL_ctx* ctx, size_t numThreads); | |
|
51 | ||
|
40 | 52 | /*! POOL_sizeof() : |
|
41 | return memory usage of pool returned by POOL_create(). | |
|
42 | */ | |
|
53 | * @return threadpool memory usage | |
|
54 | * note : compatible with NULL (returns 0 in this case) | |
|
55 | */ | |
|
43 | 56 | size_t POOL_sizeof(POOL_ctx* ctx); |
|
44 | 57 | |
|
45 | 58 | /*! POOL_function : |
|
46 | The function type that can be added to a thread pool. |
|
47 | */ | |
|
59 | * The function type that can be added to a thread pool. | |
|
60 | */ | |
|
48 | 61 | typedef void (*POOL_function)(void*); |
|
49 | /*! POOL_add_function : | |
|
50 | The function type for a generic thread pool add function. | |
|
51 | */ | |
|
52 | typedef void (*POOL_add_function)(void*, POOL_function, void*); | |
|
53 | 62 | |
|
54 | 63 | /*! POOL_add() : |
|
55 | Add the job `function(opaque)` to the thread pool. |

56 | Possibly blocks until there is room in the queue. |

57 | Note : The function may be executed asynchronously, so `opaque` must live until the function has been completed. |
|
58 | */ | |
|
64 | * Add the job `function(opaque)` to the thread pool. `ctx` must be valid. | |
|
65 | * Possibly blocks until there is room in the queue. | |
|
66 | * Note : The function may be executed asynchronously, | |
|
67 | * therefore, `opaque` must live until function has been completed. | |
|
68 | */ | |
|
59 | 69 | void POOL_add(POOL_ctx* ctx, POOL_function function, void* opaque); |
|
60 | 70 | |
|
61 | 71 | |
|
62 | 72 | /*! POOL_tryAdd() : |
|
63 | Add the job `function(opaque)` to the thread pool if a worker is available. |
|
64 | return immediately otherwise. | |
|
65 | @return : 1 if successful, 0 if not. |
|
66 | */ | |
|
73 | * Add the job `function(opaque)` to thread pool _if_ a worker is available. | |
|
74 | * Returns immediately even if not (does not block). | |
|
75 | * @return : 1 if successful, 0 if not. | |
|
76 | */ | |
|
67 | 77 | int POOL_tryAdd(POOL_ctx* ctx, POOL_function function, void* opaque); |
|
68 | 78 | |
|
69 | 79 |
@@ -98,6 +98,7 b'' | |||
|
98 | 98 | /* Modify the local functions below should you wish to use some other memory routines */ |
|
99 | 99 | /* for malloc(), free() */ |
|
100 | 100 | #include <stdlib.h> |
|
101 | #include <stddef.h> /* size_t */ | |
|
101 | 102 | static void* XXH_malloc(size_t s) { return malloc(s); } |
|
102 | 103 | static void XXH_free (void* p) { free(p); } |
|
103 | 104 | /* for memcpy() */ |
@@ -46,11 +46,6 b' ZSTD_ErrorCode ZSTD_getErrorCode(size_t ' | |||
|
46 | 46 | * provides error code string from enum */ |
|
47 | 47 | const char* ZSTD_getErrorString(ZSTD_ErrorCode code) { return ERR_getErrorString(code); } |
|
48 | 48 | |
|
49 | /*! g_debuglog_enable : | |
|
50 | * turn on/off debug traces (global switch) */ | |
|
51 | #if defined(ZSTD_DEBUG) && (ZSTD_DEBUG >= 2) | |
|
52 | int g_debuglog_enable = 1; | |
|
53 | #endif | |
|
54 | 49 | |
|
55 | 50 | |
|
56 | 51 | /*=************************************************************** |
@@ -21,6 +21,7 b'' | |||
|
21 | 21 | ***************************************/ |
|
22 | 22 | #include "compiler.h" |
|
23 | 23 | #include "mem.h" |
|
24 | #include "debug.h" /* assert, DEBUGLOG, RAWLOG, g_debuglevel */ | |
|
24 | 25 | #include "error_private.h" |
|
25 | 26 | #define ZSTD_STATIC_LINKING_ONLY |
|
26 | 27 | #include "zstd.h" |
@@ -38,43 +39,8 b'' | |||
|
38 | 39 | extern "C" { |
|
39 | 40 | #endif |
|
40 | 41 | |
|
41 | ||
|
42 | /*-************************************* | |
|
43 | * Debug | |
|
44 | ***************************************/ | |
|
45 | #if defined(ZSTD_DEBUG) && (ZSTD_DEBUG>=1) | |
|
46 | # include <assert.h> | |
|
47 | #else | |
|
48 | # ifndef assert | |
|
49 | # define assert(condition) ((void)0) | |
|
50 | # endif | |
|
51 | #endif | |
|
52 | ||
|
53 | #define ZSTD_STATIC_ASSERT(c) { enum { ZSTD_static_assert = 1/(int)(!!(c)) }; } | |
|
54 | ||
|
55 | #if defined(ZSTD_DEBUG) && (ZSTD_DEBUG>=2) | |
|
56 | # include <stdio.h> | |
|
57 | extern int g_debuglog_enable; | |
|
58 | /* recommended values for ZSTD_DEBUG display levels : | |
|
59 | * 1 : no display, enables assert() only | |
|
60 | * 2 : reserved for currently active debug path | |
|
61 | * 3 : events once per object lifetime (CCtx, CDict, etc.) | |
|
62 | * 4 : events once per frame | |
|
63 | * 5 : events once per block | |
|
64 | * 6 : events once per sequence (*very* verbose) */ | |
|
65 | # define RAWLOG(l, ...) { \ | |
|
66 | if ((g_debuglog_enable) & (l<=ZSTD_DEBUG)) { \ | |
|
67 | fprintf(stderr, __VA_ARGS__); \ | |
|
68 | } } | |
|
69 | # define DEBUGLOG(l, ...) { \ | |
|
70 | if ((g_debuglog_enable) & (l<=ZSTD_DEBUG)) { \ | |
|
71 | fprintf(stderr, __FILE__ ": " __VA_ARGS__); \ | |
|
72 | fprintf(stderr, " \n"); \ | |
|
73 | } } | |
|
74 | #else | |
|
75 | # define RAWLOG(l, ...) {} /* disabled */ | |
|
76 | # define DEBUGLOG(l, ...) {} /* disabled */ | |
|
77 | #endif | |
|
42 | /* ---- static assert (debug) --- */ | |
|
43 | #define ZSTD_STATIC_ASSERT(c) DEBUG_STATIC_ASSERT(c) | |
|
78 | 44 | |
|
79 | 45 | |
|
80 | 46 | /*-************************************* |
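
The per-header debug scaffolding (the assert fallback, ZSTD_STATIC_ASSERT, RAWLOG/DEBUGLOG and their level conventions: 3 = once per object, 4 = per frame, 5 = per block, 6 = per sequence) is consolidated into the new debug.h rather than deleted. A sketch of how such a leveled trace macro is typically built, assuming the removed block's semantics carry over (DEBUG_LEVEL is an assumed knob, not necessarily the exact one in debug.h):

    #ifndef DEBUG_LEVEL
    #  define DEBUG_LEVEL 0          /* compile-time maximum verbosity */
    #endif

    #if DEBUG_LEVEL >= 2
    #  include <stdio.h>
    static int g_debuglevel = DEBUG_LEVEL;   /* run-time switch, can be lowered */
    #  define DEBUGLOG(l, ...)                              \
           do { if ((l) <= g_debuglevel) {                  \
               fprintf(stderr, __FILE__ ": " __VA_ARGS__);  \
               fprintf(stderr, " \n");                      \
           } } while (0)
    #else
    #  define DEBUGLOG(l, ...) do {} while (0)   /* compiled out entirely */
    #endif
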
@@ -113,8 +79,7 b' static const U32 repStartValue[ZSTD_REP_' | |||
|
113 | 79 | static const size_t ZSTD_fcs_fieldSize[4] = { 0, 2, 4, 8 }; |
|
114 | 80 | static const size_t ZSTD_did_fieldSize[4] = { 0, 1, 2, 4 }; |
|
115 | 81 | |
|
116 | #define ZSTD_FRAMEIDSIZE 4 | |
|
117 | static const size_t ZSTD_frameIdSize = ZSTD_FRAMEIDSIZE; /* magic number size */ | |
|
82 | #define ZSTD_FRAMEIDSIZE 4 /* magic number size */ | |
|
118 | 83 | |
|
119 | 84 | #define ZSTD_BLOCKHEADERSIZE 3 /* C standard doesn't allow `static const` variable to be init using another `static const` variable */ |
|
120 | 85 | static const size_t ZSTD_blockHeaderSize = ZSTD_BLOCKHEADERSIZE; |
@@ -227,6 +192,8 b' typedef struct {' | |||
|
227 | 192 | BYTE* llCode; |
|
228 | 193 | BYTE* mlCode; |
|
229 | 194 | BYTE* ofCode; |
|
195 | size_t maxNbSeq; | |
|
196 | size_t maxNbLit; | |
|
230 | 197 | U32 longLengthID; /* 0 == no longLength; 1 == Lit.longLength; 2 == Match.longLength; */ |
|
231 | 198 | U32 longLengthPos; |
|
232 | 199 | } seqStore_t; |
@@ -1,6 +1,6 b'' | |||
|
1 | 1 | /* ****************************************************************** |
|
2 | 2 | FSE : Finite State Entropy encoder |
|
3 | Copyright (C) 2013-2015, Yann Collet. |
|
3 | Copyright (C) 2013-present, Yann Collet. | |
|
4 | 4 | |
|
5 | 5 | BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php) |
|
6 | 6 | |
@@ -37,9 +37,11 b'' | |||
|
37 | 37 | ****************************************************************/ |
|
38 | 38 | #include <stdlib.h> /* malloc, free, qsort */ |
|
39 | 39 | #include <string.h> /* memcpy, memset */ |
|
40 | #include <stdio.h> /* printf (debug) */ | |
|
40 | #include "compiler.h" | |
|
41 | #include "mem.h" /* U32, U16, etc. */ | |
|
42 | #include "debug.h" /* assert, DEBUGLOG */ | |
|
43 | #include "hist.h" /* HIST_count_wksp */ | |
|
41 | 44 | #include "bitstream.h" |
|
42 | #include "compiler.h" | |
|
43 | 45 | #define FSE_STATIC_LINKING_ONLY |
|
44 | 46 | #include "fse.h" |
|
45 | 47 | #include "error_private.h" |
@@ -49,7 +51,6 b'' | |||
|
49 | 51 | * Error Management |
|
50 | 52 | ****************************************************************/ |
|
51 | 53 | #define FSE_isError ERR_isError |
|
52 | #define FSE_STATIC_ASSERT(c) { enum { FSE_static_assert = 1/(int)(!!(c)) }; } /* use only *after* variable declarations */ | |
|
53 | 54 | |
|
54 | 55 | |
|
55 | 56 | /* ************************************************************** |
@@ -82,7 +83,9 b'' | |||
|
82 | 83 | * wkspSize should be sized to handle worst case situation, which is `1<<max_tableLog * sizeof(FSE_FUNCTION_TYPE)` |
|
83 | 84 | * workSpace must also be properly aligned with FSE_FUNCTION_TYPE requirements |
|
84 | 85 | */ |
|
85 | size_t FSE_buildCTable_wksp(FSE_CTable* ct, const short* normalizedCounter, unsigned maxSymbolValue, unsigned tableLog, void* workSpace, size_t wkspSize) | |
|
86 | size_t FSE_buildCTable_wksp(FSE_CTable* ct, | |
|
87 | const short* normalizedCounter, unsigned maxSymbolValue, unsigned tableLog, | |
|
88 | void* workSpace, size_t wkspSize) | |
|
86 | 89 | { |
|
87 | 90 | U32 const tableSize = 1 << tableLog; |
|
88 | 91 | U32 const tableMask = tableSize - 1; |
@@ -100,9 +103,14 b' size_t FSE_buildCTable_wksp(FSE_CTable* ' | |||
|
100 | 103 | if (((size_t)1 << tableLog) * sizeof(FSE_FUNCTION_TYPE) > wkspSize) return ERROR(tableLog_tooLarge); |
|
101 | 104 | tableU16[-2] = (U16) tableLog; |
|
102 | 105 | tableU16[-1] = (U16) maxSymbolValue; |
|
106 | assert(tableLog < 16); /* required for threshold strategy to work */ | |
|
103 | 107 | |
|
104 | 108 | /* For explanations on how to distribute symbol values over the table : |
|
105 | * http://fastcompression.blogspot.fr/2014/02/fse-distributing-symbol-values.html */ |
|
109 | * http://fastcompression.blogspot.fr/2014/02/fse-distributing-symbol-values.html */ | |
|
110 | ||
|
111 | #ifdef __clang_analyzer__ | |
|
112 | memset(tableSymbol, 0, sizeof(*tableSymbol) * tableSize); /* useless initialization, just to keep scan-build happy */ | |
|
113 | #endif | |
|
106 | 114 | |
|
107 | 115 | /* symbol start positions */ |
|
108 | 116 | { U32 u; |
@@ -122,13 +130,15 b' size_t FSE_buildCTable_wksp(FSE_CTable* ' | |||
|
122 | 130 | U32 symbol; |
|
123 | 131 | for (symbol=0; symbol<=maxSymbolValue; symbol++) { |
|
124 | 132 | int nbOccurences; |
|
125 | for (nbOccurences=0; nbOccurences<normalizedCounter[symbol]; nbOccurences++) { | |
|
133 | int const freq = normalizedCounter[symbol]; | |
|
134 | for (nbOccurences=0; nbOccurences<freq; nbOccurences++) { | |
|
126 | 135 | tableSymbol[position] = (FSE_FUNCTION_TYPE)symbol; |
|
127 | 136 | position = (position + step) & tableMask; |
|
128 | while (position > highThreshold) position = (position + step) & tableMask; /* Low proba area */ | |
|
137 | while (position > highThreshold) | |
|
138 | position = (position + step) & tableMask; /* Low proba area */ | |
|
129 | 139 | } } |
|
130 | 140 | |
|
131 | if (position!=0) return ERROR(GENERIC); /* Must have gone through all positions */ |
|
141 | assert(position==0); /* Must have initialized all positions */ | |
|
132 | 142 | } |
|
133 | 143 | |
|
134 | 144 | /* Build table */ |
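
The spreading loop above relies on the FSE step, (tableSize>>1) + (tableSize>>3) + 3, being coprime to the power-of-two table size: stepping tableSize times then visits every slot exactly once and necessarily lands back on position 0, which is exactly what the strengthened assert(position==0) checks. A self-contained demonstration of that invariant:

    #include <assert.h>
    #include <stdio.h>

    #define TABLELOG  6
    #define TABLESIZE (1 << TABLELOG)
    #define TABLESTEP ((TABLESIZE >> 1) + (TABLESIZE >> 3) + 3)  /* 43, coprime to 64 */

    int main(void)
    {
        unsigned char visited[TABLESIZE] = {0};
        unsigned position = 0;
        int i;
        for (i = 0; i < TABLESIZE; i++) {
            visited[position]++;
            position = (position + TABLESTEP) & (TABLESIZE - 1);
        }
        assert(position == 0);                        /* same invariant as the diff */
        for (i = 0; i < TABLESIZE; i++) assert(visited[i] == 1);
        printf("all %d slots visited exactly once\n", TABLESIZE);
        return 0;
    }
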
@@ -143,7 +153,10 b' size_t FSE_buildCTable_wksp(FSE_CTable* ' | |||
|
143 | 153 | for (s=0; s<=maxSymbolValue; s++) { |
|
144 | 154 | switch (normalizedCounter[s]) |
|
145 | 155 | { |
|
146 | case 0: break; |
|
156 | case 0: | |
|
157 | /* filling nonetheless, for compatibility with FSE_getMaxNbBits() */ | |
|
158 | symbolTT[s].deltaNbBits = ((tableLog+1) << 16) - (1<<tableLog); | |
|
159 | break; | |
|
147 | 160 | |
|
148 | 161 | case -1: |
|
149 | 162 | case 1: |
@@ -160,6 +173,18 b' size_t FSE_buildCTable_wksp(FSE_CTable* ' | |||
|
160 | 173 | total += normalizedCounter[s]; |
|
161 | 174 | } } } } |
|
162 | 175 | |
|
176 | #if 0 /* debug : symbol costs */ | |
|
177 | DEBUGLOG(5, "\n --- table statistics : "); | |
|
178 | { U32 symbol; | |
|
179 | for (symbol=0; symbol<=maxSymbolValue; symbol++) { | |
|
180 | DEBUGLOG(5, "%3u: w=%3i, maxBits=%u, fracBits=%.2f", | |
|
181 | symbol, normalizedCounter[symbol], | |
|
182 | FSE_getMaxNbBits(symbolTT, symbol), | |
|
183 | (double)FSE_bitCost(symbolTT, tableLog, symbol, 8) / 256); | |
|
184 | } | |
|
185 | } | |
|
186 | #endif | |
|
187 | ||
|
163 | 188 | return 0; |
|
164 | 189 | } |
|
165 | 190 | |
@@ -174,8 +199,9 b' size_t FSE_buildCTable(FSE_CTable* ct, c' | |||
|
174 | 199 | |
|
175 | 200 | #ifndef FSE_COMMONDEFS_ONLY |
|
176 | 201 | |
|
202 | ||
|
177 | 203 | /*-************************************************************** |
|
178 | * FSE NCount encoding-decoding |
|
204 | * FSE NCount encoding | |
|
179 | 205 | ****************************************************************/ |
|
180 | 206 | size_t FSE_NCountWriteBound(unsigned maxSymbolValue, unsigned tableLog) |
|
181 | 207 | { |
@@ -183,9 +209,10 b' size_t FSE_NCountWriteBound(unsigned max' | |||
|
183 | 209 | return maxSymbolValue ? maxHeaderSize : FSE_NCOUNTBOUND; /* maxSymbolValue==0 ? use default */ |
|
184 | 210 | } |
|
185 | 211 | |
|
186 | static size_t FSE_writeNCount_generic (void* header, size_t headerBufferSize, | |
|
187 | const short* normalizedCounter, unsigned maxSymbolValue, unsigned tableLog, | |
|
188 | unsigned writeIsSafe) | |
|
212 | static size_t | |
|
213 | FSE_writeNCount_generic (void* header, size_t headerBufferSize, | |
|
214 | const short* normalizedCounter, unsigned maxSymbolValue, unsigned tableLog, | |
|
215 | unsigned writeIsSafe) | |
|
189 | 216 | { |
|
190 | 217 | BYTE* const ostart = (BYTE*) header; |
|
191 | 218 | BYTE* out = ostart; |
@@ -194,13 +221,12 b' static size_t FSE_writeNCount_generic (v' | |||
|
194 | 221 | const int tableSize = 1 << tableLog; |
|
195 | 222 | int remaining; |
|
196 | 223 | int threshold; |
|
197 | U32 bitStream; | |
|
198 | int bitCount; | |
|
199 | unsigned charnum = 0; |
|
200 | int previous0 = 0; | |
|
224 | U32 bitStream = 0; | |
|
225 | int bitCount = 0; | |
|
226 | unsigned symbol = 0; | |
|
227 | unsigned const alphabetSize = maxSymbolValue + 1; | |
|
228 | int previousIs0 = 0; | |
|
201 | 229 | |
|
202 | bitStream = 0; | |
|
203 | bitCount = 0; | |
|
204 | 230 | /* Table Size */ |
|
205 | 231 | bitStream += (tableLog-FSE_MIN_TABLELOG) << bitCount; |
|
206 | 232 | bitCount += 4; |
@@ -210,48 +236,53 b' static size_t FSE_writeNCount_generic (v' | |||
|
210 | 236 | threshold = tableSize; |
|
211 | 237 | nbBits = tableLog+1; |
|
212 | 238 | |
|
213 | while (remaining>1) { /* stops at 1 */ | |
|
214 | if (previous0) { | |
|
215 | unsigned start = charnum; |
|
216 | while (!normalizedCounter[charnum]) charnum++; |
|
217 | while (charnum >= start+24) { | |
|
239 | while ((symbol < alphabetSize) && (remaining>1)) { /* stops at 1 */ | |
|
240 | if (previousIs0) { | |
|
241 | unsigned start = symbol; | |
|
242 | while ((symbol < alphabetSize) && !normalizedCounter[symbol]) symbol++; | |
|
243 | if (symbol == alphabetSize) break; /* incorrect distribution */ | |
|
244 | while (symbol >= start+24) { | |
|
218 | 245 | start+=24; |
|
219 | 246 | bitStream += 0xFFFFU << bitCount; |
|
220 | if ((!writeIsSafe) && (out > oend-2)) return ERROR(dstSize_tooSmall); /* Buffer overflow */ |
|
247 | if ((!writeIsSafe) && (out > oend-2)) | |
|
248 | return ERROR(dstSize_tooSmall); /* Buffer overflow */ | |
|
221 | 249 | out[0] = (BYTE) bitStream; |
|
222 | 250 | out[1] = (BYTE)(bitStream>>8); |
|
223 | 251 | out+=2; |
|
224 | 252 | bitStream>>=16; |
|
225 | 253 | } |
|
226 | while (charnum >= start+3) { |
|
254 | while (symbol >= start+3) { | |
|
227 | 255 | start+=3; |
|
228 | 256 | bitStream += 3 << bitCount; |
|
229 | 257 | bitCount += 2; |
|
230 | 258 | } |
|
231 | bitStream += (charnum-start) << bitCount; |
|
259 | bitStream += (symbol-start) << bitCount; | |
|
232 | 260 | bitCount += 2; |
|
233 | 261 | if (bitCount>16) { |
|
234 | if ((!writeIsSafe) && (out > oend - 2)) return ERROR(dstSize_tooSmall); /* Buffer overflow */ |
|
262 | if ((!writeIsSafe) && (out > oend - 2)) | |
|
263 | return ERROR(dstSize_tooSmall); /* Buffer overflow */ | |
|
235 | 264 | out[0] = (BYTE)bitStream; |
|
236 | 265 | out[1] = (BYTE)(bitStream>>8); |
|
237 | 266 | out += 2; |
|
238 | 267 | bitStream >>= 16; |
|
239 | 268 | bitCount -= 16; |
|
240 | 269 | } } |
|
241 | { int count = normalizedCounter[charnum++]; |
|
242 | int const max = (2*threshold-1)-remaining; | |
|
270 | { int count = normalizedCounter[symbol++]; | |
|
271 | int const max = (2*threshold-1) - remaining; | |
|
243 | 272 | remaining -= count < 0 ? -count : count; |
|
244 | 273 | count++; /* +1 for extra accuracy */ |
|
245 | if (count>=threshold) count += max; /* [0..max[ [max..threshold[ (...) [threshold+max 2*threshold[ */ | |
|
274 | if (count>=threshold) | |
|
275 | count += max; /* [0..max[ [max..threshold[ (...) [threshold+max 2*threshold[ */ | |
|
246 | 276 | bitStream += count << bitCount; |
|
247 | 277 | bitCount += nbBits; |
|
248 | 278 | bitCount -= (count<max); |
|
249 | previous0 = (count==1); | |
|
279 | previousIs0 = (count==1); | |
|
250 | 280 | if (remaining<1) return ERROR(GENERIC); |
|
251 | 281 | while (remaining<threshold) { nbBits--; threshold>>=1; } |
|
252 | 282 | } |
|
253 | 283 | if (bitCount>16) { |
|
254 | if ((!writeIsSafe) && (out > oend - 2)) return ERROR(dstSize_tooSmall); /* Buffer overflow */ |
|
284 | if ((!writeIsSafe) && (out > oend - 2)) | |
|
285 | return ERROR(dstSize_tooSmall); /* Buffer overflow */ | |
|
255 | 286 | out[0] = (BYTE)bitStream; |
|
256 | 287 | out[1] = (BYTE)(bitStream>>8); |
|
257 | 288 | out += 2; |
@@ -259,19 +290,23 b' static size_t FSE_writeNCount_generic (v' | |||
|
259 | 290 | bitCount -= 16; |
|
260 | 291 | } } |
|
261 | 292 | |
|
293 | if (remaining != 1) | |
|
294 | return ERROR(GENERIC); /* incorrect normalized distribution */ | |
|
295 | assert(symbol <= alphabetSize); | |
|
296 | ||
|
262 | 297 | /* flush remaining bitStream */ |
|
263 | if ((!writeIsSafe) && (out > oend - 2)) return ERROR(dstSize_tooSmall); /* Buffer overflow */ |
|
298 | if ((!writeIsSafe) && (out > oend - 2)) | |
|
299 | return ERROR(dstSize_tooSmall); /* Buffer overflow */ | |
|
264 | 300 | out[0] = (BYTE)bitStream; |
|
265 | 301 | out[1] = (BYTE)(bitStream>>8); |
|
266 | 302 | out+= (bitCount+7) /8; |
|
267 | 303 | |
|
268 | if (charnum > maxSymbolValue + 1) return ERROR(GENERIC); | |
|
269 | ||
|
270 | 304 | return (out-ostart); |
|
271 | 305 | } |
|
272 | 306 | |
|
273 | 307 | |
|
274 | size_t FSE_writeNCount (void* buffer, size_t bufferSize, const short* normalizedCounter, unsigned maxSymbolValue, unsigned tableLog) | |
|
308 | size_t FSE_writeNCount (void* buffer, size_t bufferSize, | |
|
309 | const short* normalizedCounter, unsigned maxSymbolValue, unsigned tableLog) | |
|
275 | 310 | { |
|
276 | 311 | if (tableLog > FSE_MAX_TABLELOG) return ERROR(tableLog_tooLarge); /* Unsupported */ |
|
277 | 312 | if (tableLog < FSE_MIN_TABLELOG) return ERROR(GENERIC); /* Unsupported */ |
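
Throughout FSE_writeNCount_generic(), fields are packed little-endian into a 32-bit accumulator and spilled two bytes at a time whenever more than 16 bits are pending; since no single field is wider than 16 bits, the accumulator can never overflow. The bare accumulate-and-flush pattern in isolation (bit_writer is an illustrative type, not zstd API):

    #include <stdint.h>

    typedef struct {
        uint32_t bitStream;   /* pending bits, low bits first */
        int      bitCount;    /* number of pending bits, always <= 32 */
        uint8_t* out;         /* caller guarantees enough output space */
    } bit_writer;

    /* Append a field of nbBits bits (value must fit in nbBits), spilling
     * the low 16 bits little-endian once more than 16 are pending. */
    static void bw_add(bit_writer* bw, uint32_t value, int nbBits)
    {
        bw->bitStream += value << bw->bitCount;
        bw->bitCount  += nbBits;
        if (bw->bitCount > 16) {
            bw->out[0] = (uint8_t) bw->bitStream;
            bw->out[1] = (uint8_t)(bw->bitStream >> 8);
            bw->out += 2;
            bw->bitStream >>= 16;
            bw->bitCount   -= 16;
        }
    }
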
@@ -279,179 +314,13 b' size_t FSE_writeNCount (void* buffer, si' | |||
|
279 | 314 | if (bufferSize < FSE_NCountWriteBound(maxSymbolValue, tableLog)) |
|
280 | 315 | return FSE_writeNCount_generic(buffer, bufferSize, normalizedCounter, maxSymbolValue, tableLog, 0); |
|
281 | 316 | |
|
282 | return FSE_writeNCount_generic(buffer, bufferSize, normalizedCounter, maxSymbolValue, tableLog, 1); | |
|
283 | } | |
|
284 | ||
|
285 | ||
|
286 | ||
|
287 | /*-************************************************************** | |
|
288 | * Counting histogram | |
|
289 | ****************************************************************/ | |
|
290 | /*! FSE_count_simple | |
|
291 | This function counts byte values within `src`, and store the histogram into table `count`. | |
|
292 | It doesn't use any additional memory. | |
|
293 | But this function is unsafe : it doesn't check that all values within `src` can fit into `count`. | |
|
294 | For this reason, prefer using a table `count` with 256 elements. | |
|
295 | @return : count of most numerous element. | |
|
296 | */ | |
|
297 | size_t FSE_count_simple(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
298 | const void* src, size_t srcSize) | |
|
299 | { | |
|
300 | const BYTE* ip = (const BYTE*)src; | |
|
301 | const BYTE* const end = ip + srcSize; | |
|
302 | unsigned maxSymbolValue = *maxSymbolValuePtr; | |
|
303 | unsigned max=0; | |
|
304 | ||
|
305 | memset(count, 0, (maxSymbolValue+1)*sizeof(*count)); | |
|
306 | if (srcSize==0) { *maxSymbolValuePtr = 0; return 0; } | |
|
307 | ||
|
308 | while (ip<end) { | |
|
309 | assert(*ip <= maxSymbolValue); | |
|
310 | count[*ip++]++; | |
|
311 | } | |
|
312 | ||
|
313 | while (!count[maxSymbolValue]) maxSymbolValue--; | |
|
314 | *maxSymbolValuePtr = maxSymbolValue; | |
|
315 | ||
|
316 | { U32 s; for (s=0; s<=maxSymbolValue; s++) if (count[s] > max) max = count[s]; } | |
|
317 | ||
|
318 | return (size_t)max; | |
|
317 | return FSE_writeNCount_generic(buffer, bufferSize, normalizedCounter, maxSymbolValue, tableLog, 1 /* write in buffer is safe */); | |
|
319 | 318 | } |
|
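The block removed above is FSE_count_simple, a plain one-table byte histogram. A minimal standalone sketch of the same strategy (hypothetical helper for illustration, not the vendored code):

    /* single pass, one counter per byte value; returns the highest
     * frequency, which is what FSE_count_simple reports */
    static size_t histogram_max(unsigned count[256],
                                const unsigned char* src, size_t srcSize)
    {
        size_t i;
        unsigned max = 0;
        for (i = 0; i < 256; i++) count[i] = 0;
        for (i = 0; i < srcSize; i++) count[src[i]]++;
        for (i = 0; i < 256; i++) if (count[i] > max) max = count[i];
        return (size_t)max;
    }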
320 | 319 | |
|
321 | 320 | |
|
322 | /* FSE_count_parallel_wksp() : | |
|
323 | * Same as FSE_count_parallel(), but using an externally provided scratch buffer. | |
|
324 | * `workSpace` size must be a minimum of `1024 * sizeof(unsigned)`. | |
|
325 | * @return : largest histogram frequency, or an error code (notably when histogram would be larger than *maxSymbolValuePtr). */ | |
|
326 | static size_t FSE_count_parallel_wksp( | |
|
327 | unsigned* count, unsigned* maxSymbolValuePtr, | |
|
328 | const void* source, size_t sourceSize, | |
|
329 | unsigned checkMax, unsigned* const workSpace) | |
|
330 | { | |
|
331 | const BYTE* ip = (const BYTE*)source; | |
|
332 | const BYTE* const iend = ip+sourceSize; | |
|
333 | unsigned maxSymbolValue = *maxSymbolValuePtr; | |
|
334 | unsigned max=0; | |
|
335 | U32* const Counting1 = workSpace; | |
|
336 | U32* const Counting2 = Counting1 + 256; | |
|
337 | U32* const Counting3 = Counting2 + 256; | |
|
338 | U32* const Counting4 = Counting3 + 256; | |
|
339 | ||
|
340 | memset(workSpace, 0, 4*256*sizeof(unsigned)); | |
|
341 | ||
|
342 | /* safety checks */ | |
|
343 | if (!sourceSize) { | |
|
344 | memset(count, 0, maxSymbolValue + 1); | |
|
345 | *maxSymbolValuePtr = 0; | |
|
346 | return 0; | |
|
347 | } | |
|
348 | if (!maxSymbolValue) maxSymbolValue = 255; /* 0 == default */ | |
|
349 | ||
|
350 | /* by stripes of 16 bytes */ | |
|
351 | { U32 cached = MEM_read32(ip); ip += 4; | |
|
352 | while (ip < iend-15) { | |
|
353 | U32 c = cached; cached = MEM_read32(ip); ip += 4; | |
|
354 | Counting1[(BYTE) c ]++; | |
|
355 | Counting2[(BYTE)(c>>8) ]++; | |
|
356 | Counting3[(BYTE)(c>>16)]++; | |
|
357 | Counting4[ c>>24 ]++; | |
|
358 | c = cached; cached = MEM_read32(ip); ip += 4; | |
|
359 | Counting1[(BYTE) c ]++; | |
|
360 | Counting2[(BYTE)(c>>8) ]++; | |
|
361 | Counting3[(BYTE)(c>>16)]++; | |
|
362 | Counting4[ c>>24 ]++; | |
|
363 | c = cached; cached = MEM_read32(ip); ip += 4; | |
|
364 | Counting1[(BYTE) c ]++; | |
|
365 | Counting2[(BYTE)(c>>8) ]++; | |
|
366 | Counting3[(BYTE)(c>>16)]++; | |
|
367 | Counting4[ c>>24 ]++; | |
|
368 | c = cached; cached = MEM_read32(ip); ip += 4; | |
|
369 | Counting1[(BYTE) c ]++; | |
|
370 | Counting2[(BYTE)(c>>8) ]++; | |
|
371 | Counting3[(BYTE)(c>>16)]++; | |
|
372 | Counting4[ c>>24 ]++; | |
|
373 | } | |
|
374 | ip-=4; | |
|
375 | } | |
|
376 | ||
|
377 | /* finish last symbols */ | |
|
378 | while (ip<iend) Counting1[*ip++]++; | |
|
379 | ||
|
380 | if (checkMax) { /* verify stats will fit into destination table */ | |
|
381 | U32 s; for (s=255; s>maxSymbolValue; s--) { | |
|
382 | Counting1[s] += Counting2[s] + Counting3[s] + Counting4[s]; | |
|
383 | if (Counting1[s]) return ERROR(maxSymbolValue_tooSmall); | |
|
384 | } } | |
|
385 | ||
|
386 | { U32 s; | |
|
387 | if (maxSymbolValue > 255) maxSymbolValue = 255; | |
|
388 | for (s=0; s<=maxSymbolValue; s++) { | |
|
389 | count[s] = Counting1[s] + Counting2[s] + Counting3[s] + Counting4[s]; | |
|
390 | if (count[s] > max) max = count[s]; | |
|
391 | } } | |
|
392 | ||
|
393 | while (!count[maxSymbolValue]) maxSymbolValue--; | |
|
394 | *maxSymbolValuePtr = maxSymbolValue; | |
|
395 | return (size_t)max; | |
|
396 | } | |
|
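The 4-way split in the FSE_count_parallel_wksp block above exists to break the store-to-load dependency that a single counter table would create. A minimal sketch of that lane trick (hypothetical helper, not the vendored code):

    /* each lane owns a private table, so back-to-back increments never
     * hit the same counter; the caller sums the four tables per symbol */
    static void count4(unsigned c1[256], unsigned c2[256],
                       unsigned c3[256], unsigned c4[256],
                       const unsigned char* ip, size_t n)
    {
        size_t i;
        for (i = 0; i + 4 <= n; i += 4) {
            c1[ip[i]]++;
            c2[ip[i+1]]++;
            c3[ip[i+2]]++;
            c4[ip[i+3]]++;
        }
        for (; i < n; i++) c1[ip[i]]++;   /* tail bytes */
    }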
397 | ||
|
398 | /* FSE_countFast_wksp() : | |
|
399 | * Same as FSE_countFast(), but using an externally provided scratch buffer. | |
|
400 | * `workSpace` size must be table of >= `1024` unsigned */ | |
|
401 | size_t FSE_countFast_wksp(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
402 | const void* source, size_t sourceSize, | |
|
403 | unsigned* workSpace) | |
|
404 | { | |
|
405 | if (sourceSize < 1500) /* heuristic threshold */ | |
|
406 | return FSE_count_simple(count, maxSymbolValuePtr, source, sourceSize); | |
|
407 | return FSE_count_parallel_wksp(count, maxSymbolValuePtr, source, sourceSize, 0, workSpace); | |
|
408 | } | |
|
409 | ||
|
410 | /* fast variant (unsafe : won't check if src contains values beyond count[] limit) */ | |
|
411 | size_t FSE_countFast(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
412 | const void* source, size_t sourceSize) | |
|
413 | { | |
|
414 | unsigned tmpCounters[1024]; | |
|
415 | return FSE_countFast_wksp(count, maxSymbolValuePtr, source, sourceSize, tmpCounters); | |
|
416 | } | |
|
417 | ||
|
418 | /* FSE_count_wksp() : | |
|
419 | * Same as FSE_count(), but using an externally provided scratch buffer. | |
|
420 | * `workSpace` size must be table of >= `1024` unsigned */ | |
|
421 | size_t FSE_count_wksp(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
422 | const void* source, size_t sourceSize, unsigned* workSpace) | |
|
423 | { | |
|
424 | if (*maxSymbolValuePtr < 255) | |
|
425 | return FSE_count_parallel_wksp(count, maxSymbolValuePtr, source, sourceSize, 1, workSpace); | |
|
426 | *maxSymbolValuePtr = 255; | |
|
427 | return FSE_countFast_wksp(count, maxSymbolValuePtr, source, sourceSize, workSpace); | |
|
428 | } | |
|
429 | ||
|
430 | size_t FSE_count(unsigned* count, unsigned* maxSymbolValuePtr, | |
|
431 | const void* src, size_t srcSize) | |
|
432 | { | |
|
433 | unsigned tmpCounters[1024]; | |
|
434 | return FSE_count_wksp(count, maxSymbolValuePtr, src, srcSize, tmpCounters); | |
|
435 | } | |
|
436 | ||
|
437 | ||
|
438 | ||
|
439 | 321 | /*-************************************************************** |
|
440 | 322 | * FSE Compression Code |
|
441 | 323 | ****************************************************************/ |
|
442 | /*! FSE_sizeof_CTable() : | |
|
443 | FSE_CTable is a variable size structure which contains : | |
|
444 | `U16 tableLog;` | |
|
445 | `U16 maxSymbolValue;` | |
|
446 | `U16 nextStateNumber[1 << tableLog];` // This size is variable | |
|
447 | `FSE_symbolCompressionTransform symbolTT[maxSymbolValue+1];` // This size is variable | |
|
448 | Allocation is manual (C standard does not support variable-size structures). | |
|
449 | */ | |
|
450 | size_t FSE_sizeof_CTable (unsigned maxSymbolValue, unsigned tableLog) | |
|
451 | { | |
|
452 | if (tableLog > FSE_MAX_TABLELOG) return ERROR(tableLog_tooLarge); | |
|
453 | return FSE_CTABLE_SIZE_U32 (tableLog, maxSymbolValue) * sizeof(U32); | |
|
454 | } | |
|
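The FSE_sizeof_CTable comment above pins down the layout, so the size is a direct sum. A rough worked version of that arithmetic (illustrative only; the vendored code uses the FSE_CTABLE_SIZE_U32 macro, and the 8-byte transform size is an assumption here):

    #include <stddef.h>

    size_t ctable_bytes_sketch(unsigned maxSymbolValue, unsigned tableLog)
    {
        size_t const header  = 2 * sizeof(unsigned short);                        /* U16 tableLog + U16 maxSymbolValue */
        size_t const states  = ((size_t)1 << tableLog) * sizeof(unsigned short);  /* nextStateNumber[] */
        size_t const symbols = ((size_t)maxSymbolValue + 1) * 8;                  /* symbolTT[], assumed 8 bytes each */
        return header + states + symbols;
    }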
455 | 324 | |
|
456 | 325 | FSE_CTable* FSE_createCTable (unsigned maxSymbolValue, unsigned tableLog) |
|
457 | 326 | { |
@@ -466,7 +335,7 b' void FSE_freeCTable (FSE_CTable* ct) { f' | |||
|
466 | 335 | /* provides the minimum logSize to safely represent a distribution */ |
|
467 | 336 | static unsigned FSE_minTableLog(size_t srcSize, unsigned maxSymbolValue) |
|
468 | 337 | { |
|
469 | U32 minBitsSrc = BIT_highbit32((U32)(srcSize - 1)) + 1; |
|
|
338 | U32 minBitsSrc = BIT_highbit32((U32)(srcSize)) + 1; | |
|
470 | 339 | U32 minBitsSymbols = BIT_highbit32(maxSymbolValue) + 2; |
|
471 | 340 | U32 minBits = minBitsSrc < minBitsSymbols ? minBitsSrc : minBitsSymbols; |
|
472 | 341 | assert(srcSize > 1); /* Not supported, RLE should be used instead */ |
@@ -529,6 +398,9 b' static size_t FSE_normalizeM2(short* nor' | |||
|
529 | 398 | } |
|
530 | 399 | ToDistribute = (1 << tableLog) - distributed; |
|
531 | 400 | |
|
401 | if (ToDistribute == 0) | |
|
402 | return 0; | |
|
403 | ||
|
532 | 404 | if ((total / ToDistribute) > lowOne) { |
|
533 | 405 | /* risk of rounding to zero */ |
|
534 | 406 | lowOne = (U32)((total * 3) / (ToDistribute * 2)); |
@@ -629,11 +501,11 b' size_t FSE_normalizeCount (short* normal' | |||
|
629 | 501 | U32 s; |
|
630 | 502 | U32 nTotal = 0; |
|
631 | 503 | for (s=0; s<=maxSymbolValue; s++) |
|
632 | printf("%3i: %4i \n", s, normalizedCounter[s]); |
|
|
|
504 | RAWLOG(2, "%3i: %4i \n", s, normalizedCounter[s]); | |
|
633 | 505 | for (s=0; s<=maxSymbolValue; s++) |
|
634 | 506 | nTotal += abs(normalizedCounter[s]); |
|
635 | 507 | if (nTotal != (1U<<tableLog)) |
|
636 | printf("Warning !!! Total == %u != %u !!!", nTotal, 1U<<tableLog); |
|
|
|
508 | RAWLOG(2, "Warning !!! Total == %u != %u !!!", nTotal, 1U<<tableLog); | |
|
637 | 509 | getchar(); |
|
638 | 510 | } |
|
639 | 511 | #endif |
@@ -800,7 +672,7 b' size_t FSE_compress_wksp (void* dst, siz' | |||
|
800 | 672 | if (!tableLog) tableLog = FSE_DEFAULT_TABLELOG; |
|
801 | 673 | |
|
802 | 674 | /* Scan input and build symbol stats */ |
|
803 | { CHECK_V_F(maxCount, FSE_count_wksp(count, &maxSymbolValue, src, srcSize, (unsigned*)scratchBuffer) ); |
|
|
675 | { CHECK_V_F(maxCount, HIST_count_wksp(count, &maxSymbolValue, src, srcSize, (unsigned*)scratchBuffer) ); | |
|
804 | 676 | if (maxCount == srcSize) return 1; /* only a single symbol in src : rle */ |
|
805 | 677 | if (maxCount == 1) return 0; /* each symbol present maximum once => not compressible */ |
|
806 | 678 | if (maxCount < (srcSize >> 7)) return 0; /* Heuristic : not compressible enough */ |
@@ -835,7 +707,7 b' typedef struct {' | |||
|
835 | 707 | size_t FSE_compress2 (void* dst, size_t dstCapacity, const void* src, size_t srcSize, unsigned maxSymbolValue, unsigned tableLog) |
|
836 | 708 | { |
|
837 | 709 | fseWkspMax_t scratchBuffer; |
|
838 | FSE_STATIC_ASSERT(sizeof(scratchBuffer) >= FSE_WKSP_SIZE_U32(FSE_MAX_TABLELOG, FSE_MAX_SYMBOL_VALUE)); /* compilation failures here means scratchBuffer is not large enough */ |
|
|
|
710 | DEBUG_STATIC_ASSERT(sizeof(scratchBuffer) >= FSE_WKSP_SIZE_U32(FSE_MAX_TABLELOG, FSE_MAX_SYMBOL_VALUE)); /* compilation failures here means scratchBuffer is not large enough */ | |
|
839 | 711 | if (tableLog > FSE_MAX_TABLELOG) return ERROR(tableLog_tooLarge); |
|
840 | 712 | return FSE_compress_wksp(dst, dstCapacity, src, srcSize, maxSymbolValue, tableLog, &scratchBuffer, sizeof(scratchBuffer)); |
|
841 | 713 | } |
@@ -45,8 +45,9 b'' | |||
|
45 | 45 | ****************************************************************/ |
|
46 | 46 | #include <string.h> /* memcpy, memset */ |
|
47 | 47 | #include <stdio.h> /* printf (debug) */ |
|
48 | #include "compiler.h" | |
|
48 | 49 | #include "bitstream.h" |
|
49 | #include "compiler.h" |
|
|
50 | #include "hist.h" | |
|
50 | 51 | #define FSE_STATIC_LINKING_ONLY /* FSE_optimalTableLog_internal */ |
|
51 | 52 | #include "fse.h" /* header compression */ |
|
52 | 53 | #define HUF_STATIC_LINKING_ONLY |
@@ -58,7 +59,7 b'' | |||
|
58 | 59 | * Error Management |
|
59 | 60 | ****************************************************************/ |
|
60 | 61 | #define HUF_isError ERR_isError |
|
61 | #define HUF_STATIC_ASSERT(c) { enum { HUF_static_assert = 1/(int)(!!(c)) }; }   /* use only *after* variable declarations */ |
|
|
62 | #define HUF_STATIC_ASSERT(c) DEBUG_STATIC_ASSERT(c) /* use only *after* variable declarations */ | |
|
62 | 63 | #define CHECK_V_F(e, f) size_t const e = f; if (ERR_isError(e)) return e |
|
63 | 64 | #define CHECK_F(f) { CHECK_V_F(_var_err__, f); } |
|
64 | 65 | |
@@ -81,7 +82,7 b' unsigned HUF_optimalTableLog(unsigned ma' | |||
|
81 | 82 | * Note : all elements within weightTable are supposed to be <= HUF_TABLELOG_MAX. |
|
82 | 83 | */ |
|
83 | 84 | #define MAX_FSE_TABLELOG_FOR_HUFF_HEADER 6 |
|
84 | size_t HUF_compressWeights (void* dst, size_t dstSize, const void* weightTable, size_t wtSize) | |
|
85 | static size_t HUF_compressWeights (void* dst, size_t dstSize, const void* weightTable, size_t wtSize) | |
|
85 | 86 | { |
|
86 | 87 | BYTE* const ostart = (BYTE*) dst; |
|
87 | 88 | BYTE* op = ostart; |
@@ -100,9 +101,9 b' size_t HUF_compressWeights (void* dst, s' | |||
|
100 | 101 | if (wtSize <= 1) return 0; /* Not compressible */ |
|
101 | 102 | |
|
102 | 103 | /* Scan input and build symbol stats */ |
|
103 | { CHECK_V_F(maxCount, FSE_count_simple(count, &maxSymbolValue, weightTable, wtSize) ); |
|
|
104 | { unsigned const maxCount = HIST_count_simple(count, &maxSymbolValue, weightTable, wtSize); /* never fails */ | |
|
104 | 105 | if (maxCount == wtSize) return 1; /* only a single symbol in src : rle */ |
|
105 | if (maxCount == 1) return 0; /* each symbol present maximum once => not compressible */ |
|
|
106 | if (maxCount == 1) return 0; /* each symbol present maximum once => not compressible */ | |
|
106 | 107 | } |
|
107 | 108 | |
|
108 | 109 | tableLog = FSE_optimalTableLog(tableLog, wtSize, maxSymbolValue); |
@@ -216,6 +217,13 b' size_t HUF_readCTable (HUF_CElt* CTable,' | |||
|
216 | 217 | return readSize; |
|
217 | 218 | } |
|
218 | 219 | |
|
220 | U32 HUF_getNbBits(const void* symbolTable, U32 symbolValue) | |
|
221 | { | |
|
222 | const HUF_CElt* table = (const HUF_CElt*)symbolTable; | |
|
223 | assert(symbolValue <= HUF_SYMBOLVALUE_MAX); | |
|
224 | return table[symbolValue].nbBits; | |
|
225 | } | |
|
226 | ||
|
219 | 227 | |
|
220 | 228 | typedef struct nodeElt_s { |
|
221 | 229 | U32 count; |
@@ -660,9 +668,9 b' static size_t HUF_compress_internal (' | |||
|
660 | 668 | } |
|
661 | 669 | |
|
662 | 670 | /* Scan input and build symbol stats */ |
|
663 | { CHECK_V_F(largest, FSE_count_wksp (table->count, &maxSymbolValue, (const BYTE*)src, srcSize, table->count) ); |
|
|
671 | { CHECK_V_F(largest, HIST_count_wksp (table->count, &maxSymbolValue, (const BYTE*)src, srcSize, table->count) ); | |
|
664 | 672 | if (largest == srcSize) { *ostart = ((const BYTE*)src)[0]; return 1; } /* single symbol, rle */ |
|
665 | if (largest <= (srcSize >> 7)+1) return 0;   /* heuristic : probably not compressible enough */ |
|
|
673 | if (largest <= (srcSize >> 7)+4) return 0; /* heuristic : probably not compressible enough */ | |
|
666 | 674 | } |
|
667 | 675 | |
|
668 | 676 | /* Check validity of previous table */ |
@@ -8,21 +8,13 b'' | |||
|
8 | 8 | * You may select, at your option, one of the above-listed licenses. |
|
9 | 9 | */ |
|
10 | 10 | |
|
11 | ||
|
12 | /*-************************************* | |
|
13 | * Tuning parameters | |
|
14 | ***************************************/ | |
|
15 | #ifndef ZSTD_CLEVEL_DEFAULT | |
|
16 | # define ZSTD_CLEVEL_DEFAULT 3 | |
|
17 | #endif | |
|
18 | ||
|
19 | ||
|
20 | 11 | /*-************************************* |
|
21 | 12 | * Dependencies |
|
22 | 13 | ***************************************/ |
|
23 | 14 | #include <string.h> /* memset */ |
|
24 | 15 | #include "cpu.h" |
|
25 | 16 | #include "mem.h" |
|
17 | #include "hist.h" /* HIST_countFast_wksp */ | |
|
26 | 18 | #define FSE_STATIC_LINKING_ONLY /* FSE_encodeSymbol */ |
|
27 | 19 | #include "fse.h" |
|
28 | 20 | #define HUF_STATIC_LINKING_ONLY |
@@ -54,7 +46,6 b' struct ZSTD_CDict_s {' | |||
|
54 | 46 | size_t workspaceSize; |
|
55 | 47 | ZSTD_matchState_t matchState; |
|
56 | 48 | ZSTD_compressedBlockState_t cBlockState; |
|
57 | ZSTD_compressionParameters cParams; | |
|
58 | 49 | ZSTD_customMem customMem; |
|
59 | 50 | U32 dictID; |
|
60 | 51 | }; /* typedef'd to ZSTD_CDict within "zstd.h" */ |
@@ -64,17 +55,26 b' ZSTD_CCtx* ZSTD_createCCtx(void)' | |||
|
64 | 55 | return ZSTD_createCCtx_advanced(ZSTD_defaultCMem); |
|
65 | 56 | } |
|
66 | 57 | |
|
58 | static void ZSTD_initCCtx(ZSTD_CCtx* cctx, ZSTD_customMem memManager) | |
|
59 | { | |
|
60 | assert(cctx != NULL); | |
|
61 | memset(cctx, 0, sizeof(*cctx)); | |
|
62 | cctx->customMem = memManager; | |
|
63 | cctx->bmi2 = ZSTD_cpuid_bmi2(ZSTD_cpuid()); | |
|
64 | { size_t const err = ZSTD_CCtx_resetParameters(cctx); | |
|
65 | assert(!ZSTD_isError(err)); | |
|
66 | (void)err; | |
|
67 | } | |
|
68 | } | |
|
69 | ||
|
67 | 70 | ZSTD_CCtx* ZSTD_createCCtx_advanced(ZSTD_customMem customMem) |
|
68 | 71 | { |
|
69 | 72 | ZSTD_STATIC_ASSERT(zcss_init==0); |
|
70 | 73 | ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN==(0ULL - 1)); |
|
71 | 74 | if (!customMem.customAlloc ^ !customMem.customFree) return NULL; |
|
72 | { ZSTD_CCtx* const cctx = (ZSTD_CCtx*)ZSTD_calloc(sizeof(ZSTD_CCtx), customMem); |
|
|
75 | { ZSTD_CCtx* const cctx = (ZSTD_CCtx*)ZSTD_malloc(sizeof(ZSTD_CCtx), customMem); | |
|
73 | 76 | if (!cctx) return NULL; |
|
74 | cctx->customMem = customMem; |
|
|
75 | cctx->requestedParams.compressionLevel = ZSTD_CLEVEL_DEFAULT; | |
|
76 | cctx->requestedParams.fParams.contentSizeFlag = 1; | |
|
77 | cctx->bmi2 = ZSTD_cpuid_bmi2(ZSTD_cpuid()); | |
|
77 | ZSTD_initCCtx(cctx, customMem); | |
|
78 | 78 | return cctx; |
|
79 | 79 | } |
|
80 | 80 | } |
@@ -102,17 +102,24 b' ZSTD_CCtx* ZSTD_initStaticCCtx(void *wor' | |||
|
102 | 102 | return cctx; |
|
103 | 103 | } |
|
104 | 104 | |
|
105 | size_t ZSTD_freeCCtx(ZSTD_CCtx* cctx) |
|
|
105 | static void ZSTD_freeCCtxContent(ZSTD_CCtx* cctx) | |
|
106 | 106 | { |
|
107 | if (cctx==NULL) return 0; /* support free on NULL */ | |
|
108 | if (cctx->staticSize) return ERROR(memory_allocation); /* not compatible with static CCtx */ | |
|
107 | assert(cctx != NULL); | |
|
108 | assert(cctx->staticSize == 0); | |
|
109 | 109 | ZSTD_free(cctx->workSpace, cctx->customMem); cctx->workSpace = NULL; |
|
110 | 110 | ZSTD_freeCDict(cctx->cdictLocal); cctx->cdictLocal = NULL; |
|
111 | 111 | #ifdef ZSTD_MULTITHREAD |
|
112 | 112 | ZSTDMT_freeCCtx(cctx->mtctx); cctx->mtctx = NULL; |
|
113 | 113 | #endif |
|
114 | } | |
|
115 | ||
|
116 | size_t ZSTD_freeCCtx(ZSTD_CCtx* cctx) | |
|
117 | { | |
|
118 | if (cctx==NULL) return 0; /* support free on NULL */ | |
|
119 | if (cctx->staticSize) return ERROR(memory_allocation); /* not compatible with static CCtx */ | |
|
120 | ZSTD_freeCCtxContent(cctx); | |
|
114 | 121 | ZSTD_free(cctx, cctx->customMem); |
|
115 | return 0; /* reserved as a potential error code in the future */ | |
|
122 | return 0; | |
|
116 | 123 | } |
|
117 | 124 | |
|
118 | 125 | |
@@ -143,21 +150,6 b' size_t ZSTD_sizeof_CStream(const ZSTD_CS' | |||
|
143 | 150 | /* private API call, for dictBuilder only */ |
|
144 | 151 | const seqStore_t* ZSTD_getSeqStore(const ZSTD_CCtx* ctx) { return &(ctx->seqStore); } |
|
145 | 152 | |
|
146 | ZSTD_compressionParameters ZSTD_getCParamsFromCCtxParams( | |
|
147 | const ZSTD_CCtx_params* CCtxParams, U64 srcSizeHint, size_t dictSize) | |
|
148 | { | |
|
149 | ZSTD_compressionParameters cParams = ZSTD_getCParams(CCtxParams->compressionLevel, srcSizeHint, dictSize); | |
|
150 | if (CCtxParams->ldmParams.enableLdm) cParams.windowLog = ZSTD_LDM_DEFAULT_WINDOW_LOG; | |
|
151 | if (CCtxParams->cParams.windowLog) cParams.windowLog = CCtxParams->cParams.windowLog; | |
|
152 | if (CCtxParams->cParams.hashLog) cParams.hashLog = CCtxParams->cParams.hashLog; | |
|
153 | if (CCtxParams->cParams.chainLog) cParams.chainLog = CCtxParams->cParams.chainLog; | |
|
154 | if (CCtxParams->cParams.searchLog) cParams.searchLog = CCtxParams->cParams.searchLog; | |
|
155 | if (CCtxParams->cParams.searchLength) cParams.searchLength = CCtxParams->cParams.searchLength; | |
|
156 | if (CCtxParams->cParams.targetLength) cParams.targetLength = CCtxParams->cParams.targetLength; | |
|
157 | if (CCtxParams->cParams.strategy) cParams.strategy = CCtxParams->cParams.strategy; | |
|
158 | return cParams; | |
|
159 | } | |
|
160 | ||
|
161 | 153 | static ZSTD_CCtx_params ZSTD_makeCCtxParamsFromCParams( |
|
162 | 154 | ZSTD_compressionParameters cParams) |
|
163 | 155 | { |
@@ -251,7 +243,6 b' static int ZSTD_isUpdateAuthorized(ZSTD_' | |||
|
251 | 243 | case ZSTD_p_minMatch: |
|
252 | 244 | case ZSTD_p_targetLength: |
|
253 | 245 | case ZSTD_p_compressionStrategy: |
|
254 | case ZSTD_p_compressLiterals: | |
|
255 | 246 | return 1; |
|
256 | 247 | |
|
257 | 248 | case ZSTD_p_format: |
@@ -268,6 +259,7 b' static int ZSTD_isUpdateAuthorized(ZSTD_' | |||
|
268 | 259 | case ZSTD_p_ldmMinMatch: |
|
269 | 260 | case ZSTD_p_ldmBucketSizeLog: |
|
270 | 261 | case ZSTD_p_ldmHashEveryLog: |
|
262 | case ZSTD_p_forceAttachDict: | |
|
271 | 263 | default: |
|
272 | 264 | return 0; |
|
273 | 265 | } |
@@ -302,7 +294,6 b' size_t ZSTD_CCtx_setParameter(ZSTD_CCtx*' | |||
|
302 | 294 | if (cctx->cdict) return ERROR(stage_wrong); |
|
303 | 295 | return ZSTD_CCtxParam_setParameter(&cctx->requestedParams, param, value); |
|
304 | 296 | |
|
305 | case ZSTD_p_compressLiterals: | |
|
306 | 297 | case ZSTD_p_contentSizeFlag: |
|
307 | 298 | case ZSTD_p_checksumFlag: |
|
308 | 299 | case ZSTD_p_dictIDFlag: |
@@ -313,6 +304,9 b' size_t ZSTD_CCtx_setParameter(ZSTD_CCtx*' | |||
|
313 | 304 | * default : 0 when using a CDict, 1 when using a Prefix */ |
|
314 | 305 | return ZSTD_CCtxParam_setParameter(&cctx->requestedParams, param, value); |
|
315 | 306 | |
|
307 | case ZSTD_p_forceAttachDict: | |
|
308 | return ZSTD_CCtxParam_setParameter(&cctx->requestedParams, param, value); | |
|
309 | ||
|
316 | 310 | case ZSTD_p_nbWorkers: |
|
317 | 311 | if ((value>0) && cctx->staticSize) { |
|
318 | 312 | return ERROR(parameter_unsupported); /* MT not compatible with static alloc */ |
@@ -351,7 +345,6 b' size_t ZSTD_CCtxParam_setParameter(' | |||
|
351 | 345 | int cLevel = (int)value; /* cast expected to restore negative sign */ |
|
352 | 346 | if (cLevel > ZSTD_maxCLevel()) cLevel = ZSTD_maxCLevel(); |
|
353 | 347 | if (cLevel) { /* 0 : does not change current level */ |
|
354 | CCtxParams->disableLiteralCompression = (cLevel<0); /* negative levels disable huffman */ | |
|
355 | 348 | CCtxParams->compressionLevel = cLevel; |
|
356 | 349 | } |
|
357 | 350 | if (CCtxParams->compressionLevel >= 0) return CCtxParams->compressionLevel; |
@@ -399,10 +392,6 b' size_t ZSTD_CCtxParam_setParameter(' | |||
|
399 | 392 | CCtxParams->cParams.strategy = (ZSTD_strategy)value; |
|
400 | 393 | return (size_t)CCtxParams->cParams.strategy; |
|
401 | 394 | |
|
402 | case ZSTD_p_compressLiterals: | |
|
403 | CCtxParams->disableLiteralCompression = !value; | |
|
404 | return !CCtxParams->disableLiteralCompression; | |
|
405 | ||
|
406 | 395 | case ZSTD_p_contentSizeFlag : |
|
407 | 396 | /* Content size written in frame header _when known_ (default:1) */ |
|
408 | 397 | DEBUGLOG(4, "set content size flag = %u", (value>0)); |
@@ -423,6 +412,12 b' size_t ZSTD_CCtxParam_setParameter(' | |||
|
423 | 412 | CCtxParams->forceWindow = (value > 0); |
|
424 | 413 | return CCtxParams->forceWindow; |
|
425 | 414 | |
|
415 | case ZSTD_p_forceAttachDict : | |
|
416 | CCtxParams->attachDictPref = value ? | |
|
417 | (value > 0 ? ZSTD_dictForceAttach : ZSTD_dictForceCopy) : | |
|
418 | ZSTD_dictDefaultAttach; | |
|
419 | return CCtxParams->attachDictPref; | |
|
420 | ||
|
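The ZSTD_p_forceAttachDict case added above folds a signed knob into a tri-state preference. The same mapping as a standalone sketch (hypothetical names, not the library's):

    typedef enum { PREF_DEFAULT, PREF_ATTACH, PREF_COPY } dict_pref_e;

    /* 0 keeps the library heuristic; >0 forces attaching the cdict's
     * tables; <0 forces copying them into the working context */
    static dict_pref_e pref_from_value(int value)
    {
        if (value == 0) return PREF_DEFAULT;
        return (value > 0) ? PREF_ATTACH : PREF_COPY;
    }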
426 | 421 | case ZSTD_p_nbWorkers : |
|
427 | 422 | #ifndef ZSTD_MULTITHREAD |
|
428 | 423 | if (value>0) return ERROR(parameter_unsupported); |
@@ -477,6 +472,98 b' size_t ZSTD_CCtxParam_setParameter(' | |||
|
477 | 472 | } |
|
478 | 473 | } |
|
479 | 474 | |
|
475 | size_t ZSTD_CCtx_getParameter(ZSTD_CCtx* cctx, ZSTD_cParameter param, unsigned* value) | |
|
476 | { | |
|
477 | return ZSTD_CCtxParam_getParameter(&cctx->requestedParams, param, value); | |
|
478 | } | |
|
479 | ||
|
480 | size_t ZSTD_CCtxParam_getParameter( | |
|
481 | ZSTD_CCtx_params* CCtxParams, ZSTD_cParameter param, unsigned* value) | |
|
482 | { | |
|
483 | switch(param) | |
|
484 | { | |
|
485 | case ZSTD_p_format : | |
|
486 | *value = CCtxParams->format; | |
|
487 | break; | |
|
488 | case ZSTD_p_compressionLevel : | |
|
489 | *value = CCtxParams->compressionLevel; | |
|
490 | break; | |
|
491 | case ZSTD_p_windowLog : | |
|
492 | *value = CCtxParams->cParams.windowLog; | |
|
493 | break; | |
|
494 | case ZSTD_p_hashLog : | |
|
495 | *value = CCtxParams->cParams.hashLog; | |
|
496 | break; | |
|
497 | case ZSTD_p_chainLog : | |
|
498 | *value = CCtxParams->cParams.chainLog; | |
|
499 | break; | |
|
500 | case ZSTD_p_searchLog : | |
|
501 | *value = CCtxParams->cParams.searchLog; | |
|
502 | break; | |
|
503 | case ZSTD_p_minMatch : | |
|
504 | *value = CCtxParams->cParams.searchLength; | |
|
505 | break; | |
|
506 | case ZSTD_p_targetLength : | |
|
507 | *value = CCtxParams->cParams.targetLength; | |
|
508 | break; | |
|
509 | case ZSTD_p_compressionStrategy : | |
|
510 | *value = (unsigned)CCtxParams->cParams.strategy; | |
|
511 | break; | |
|
512 | case ZSTD_p_contentSizeFlag : | |
|
513 | *value = CCtxParams->fParams.contentSizeFlag; | |
|
514 | break; | |
|
515 | case ZSTD_p_checksumFlag : | |
|
516 | *value = CCtxParams->fParams.checksumFlag; | |
|
517 | break; | |
|
518 | case ZSTD_p_dictIDFlag : | |
|
519 | *value = !CCtxParams->fParams.noDictIDFlag; | |
|
520 | break; | |
|
521 | case ZSTD_p_forceMaxWindow : | |
|
522 | *value = CCtxParams->forceWindow; | |
|
523 | break; | |
|
524 | case ZSTD_p_forceAttachDict : | |
|
525 | *value = CCtxParams->attachDictPref; | |
|
526 | break; | |
|
527 | case ZSTD_p_nbWorkers : | |
|
528 | #ifndef ZSTD_MULTITHREAD | |
|
529 | assert(CCtxParams->nbWorkers == 0); | |
|
530 | #endif | |
|
531 | *value = CCtxParams->nbWorkers; | |
|
532 | break; | |
|
533 | case ZSTD_p_jobSize : | |
|
534 | #ifndef ZSTD_MULTITHREAD | |
|
535 | return ERROR(parameter_unsupported); | |
|
536 | #else | |
|
537 | *value = CCtxParams->jobSize; | |
|
538 | break; | |
|
539 | #endif | |
|
540 | case ZSTD_p_overlapSizeLog : | |
|
541 | #ifndef ZSTD_MULTITHREAD | |
|
542 | return ERROR(parameter_unsupported); | |
|
543 | #else | |
|
544 | *value = CCtxParams->overlapSizeLog; | |
|
545 | break; | |
|
546 | #endif | |
|
547 | case ZSTD_p_enableLongDistanceMatching : | |
|
548 | *value = CCtxParams->ldmParams.enableLdm; | |
|
549 | break; | |
|
550 | case ZSTD_p_ldmHashLog : | |
|
551 | *value = CCtxParams->ldmParams.hashLog; | |
|
552 | break; | |
|
553 | case ZSTD_p_ldmMinMatch : | |
|
554 | *value = CCtxParams->ldmParams.minMatchLength; | |
|
555 | break; | |
|
556 | case ZSTD_p_ldmBucketSizeLog : | |
|
557 | *value = CCtxParams->ldmParams.bucketSizeLog; | |
|
558 | break; | |
|
559 | case ZSTD_p_ldmHashEveryLog : | |
|
560 | *value = CCtxParams->ldmParams.hashEveryLog; | |
|
561 | break; | |
|
562 | default: return ERROR(parameter_unsupported); | |
|
563 | } | |
|
564 | return 0; | |
|
565 | } | |
|
566 | ||
|
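A plausible round-trip through the getter added above, assuming the advanced API is visible (it was still gated behind ZSTD_STATIC_LINKING_ONLY at this point); error checks elided for brevity:

    #define ZSTD_STATIC_LINKING_ONLY
    #include <zstd.h>

    static unsigned read_back_level(void)
    {
        unsigned level = 0;
        ZSTD_CCtx* const cctx = ZSTD_createCCtx();
        ZSTD_CCtx_setParameter(cctx, ZSTD_p_compressionLevel, 5);
        ZSTD_CCtx_getParameter(cctx, ZSTD_p_compressionLevel, &level);   /* level is now 5 */
        ZSTD_freeCCtx(cctx);
        return level;
    }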
480 | 567 | /** ZSTD_CCtx_setParametersUsingCCtxParams() : |
|
481 | 568 | * just applies `params` into `cctx` |
|
482 | 569 | * no action is performed, parameters are merely stored. |
@@ -487,6 +574,7 b' size_t ZSTD_CCtxParam_setParameter(' | |||
|
487 | 574 | size_t ZSTD_CCtx_setParametersUsingCCtxParams( |
|
488 | 575 | ZSTD_CCtx* cctx, const ZSTD_CCtx_params* params) |
|
489 | 576 | { |
|
577 | DEBUGLOG(4, "ZSTD_CCtx_setParametersUsingCCtxParams"); | |
|
490 | 578 | if (cctx->streamStage != zcss_init) return ERROR(stage_wrong); |
|
491 | 579 | if (cctx->cdict) return ERROR(stage_wrong); |
|
492 | 580 | |
@@ -565,18 +653,19 b' size_t ZSTD_CCtx_refPrefix_advanced(' | |||
|
565 | 653 | return 0; |
|
566 | 654 | } |
|
567 | 655 | |
|
568 | static void ZSTD_startNewCompression(ZSTD_CCtx* cctx) | |
|
656 | /*! ZSTD_CCtx_reset() : | |
|
657 | * Also dumps dictionary */ | |
|
658 | void ZSTD_CCtx_reset(ZSTD_CCtx* cctx) | |
|
569 | 659 | { |
|
570 | 660 | cctx->streamStage = zcss_init; |
|
571 | 661 | cctx->pledgedSrcSizePlusOne = 0; |
|
572 | 662 | } |
|
573 | 663 | |
|
574 | /*! ZSTD_CCtx_reset() : | |
|
575 | * Also dumps dictionary */ | |
|
576 | void ZSTD_CCtx_reset(ZSTD_CCtx* cctx) | |
|
664 | size_t ZSTD_CCtx_resetParameters(ZSTD_CCtx* cctx) | |
|
577 | 665 | { |
|
578 | ZSTD_startNewCompression(cctx); | |
|
666 | if (cctx->streamStage != zcss_init) return ERROR(stage_wrong); | |
|
579 | 667 | cctx->cdict = NULL; |
|
668 | return ZSTD_CCtxParams_reset(&cctx->requestedParams); | |
|
580 | 669 | } |
|
581 | 670 | |
|
582 | 671 | /** ZSTD_checkCParams() : |
@@ -589,8 +678,9 b' size_t ZSTD_checkCParams(ZSTD_compressio' | |||
|
589 | 678 | CLAMPCHECK(cParams.hashLog, ZSTD_HASHLOG_MIN, ZSTD_HASHLOG_MAX); |
|
590 | 679 | CLAMPCHECK(cParams.searchLog, ZSTD_SEARCHLOG_MIN, ZSTD_SEARCHLOG_MAX); |
|
591 | 680 | CLAMPCHECK(cParams.searchLength, ZSTD_SEARCHLENGTH_MIN, ZSTD_SEARCHLENGTH_MAX); |
|
592 | if ((U32)(cParams.targetLength) < ZSTD_TARGETLENGTH_MIN) | |
|
593 | return ERROR(parameter_unsupported); | |
|
681 | ZSTD_STATIC_ASSERT(ZSTD_TARGETLENGTH_MIN == 0); | |
|
682 | if (cParams.targetLength > ZSTD_TARGETLENGTH_MAX) | |
|
683 | return ERROR(parameter_outOfBound); | |
|
594 | 684 | if ((U32)(cParams.strategy) > (U32)ZSTD_btultra) |
|
595 | 685 | return ERROR(parameter_unsupported); |
|
596 | 686 | return 0; |
@@ -599,7 +689,8 b' size_t ZSTD_checkCParams(ZSTD_compressio' | |||
|
599 | 689 | /** ZSTD_clampCParams() : |
|
600 | 690 | * make CParam values within valid range. |
|
601 | 691 | * @return : valid CParams */ |
|
602 | static ZSTD_compressionParameters ZSTD_clampCParams(ZSTD_compressionParameters cParams) | |
|
692 | static ZSTD_compressionParameters | |
|
693 | ZSTD_clampCParams(ZSTD_compressionParameters cParams) | |
|
603 | 694 | { |
|
604 | 695 | # define CLAMP(val,min,max) { \ |
|
605 | 696 | if (val<min) val=min; \ |
@@ -610,8 +701,10 b' static ZSTD_compressionParameters ZSTD_c' | |||
|
610 | 701 | CLAMP(cParams.hashLog, ZSTD_HASHLOG_MIN, ZSTD_HASHLOG_MAX); |
|
611 | 702 | CLAMP(cParams.searchLog, ZSTD_SEARCHLOG_MIN, ZSTD_SEARCHLOG_MAX); |
|
612 | 703 | CLAMP(cParams.searchLength, ZSTD_SEARCHLENGTH_MIN, ZSTD_SEARCHLENGTH_MAX); |
|
613 | if ((U32)(cParams.targetLength) < ZSTD_TARGETLENGTH_MIN) cParams.targetLength = ZSTD_TARGETLENGTH_MIN; | |
|
614 | if ((U32)(cParams.strategy) > (U32)ZSTD_btultra) cParams.strategy = ZSTD_btultra; | |
|
704 | ZSTD_STATIC_ASSERT(ZSTD_TARGETLENGTH_MIN == 0); | |
|
705 | if (cParams.targetLength > ZSTD_TARGETLENGTH_MAX) | |
|
706 | cParams.targetLength = ZSTD_TARGETLENGTH_MAX; | |
|
707 | CLAMP(cParams.strategy, ZSTD_fast, ZSTD_btultra); | |
|
615 | 708 | return cParams; |
|
616 | 709 | } |
|
617 | 710 | |
@@ -627,8 +720,11 b' static U32 ZSTD_cycleLog(U32 hashLog, ZS' | |||
|
627 | 720 | optimize `cPar` for a given input (`srcSize` and `dictSize`). |
|
628 | 721 | mostly downsizing to reduce memory consumption and initialization latency. |
|
629 | 722 | Both `srcSize` and `dictSize` are optional (use 0 if unknown). |
|
630 | Note : cPar is considered validated at this stage. Use ZSTD_checkCParams() to ensure there is no error, before using it. */ |
|
|
631 | ZSTD_compressionParameters ZSTD_adjustCParams_internal(ZSTD_compressionParameters cPar, unsigned long long srcSize, size_t dictSize) | |
|
723 | Note : cPar is assumed validated. Use ZSTD_checkCParams() to ensure this condition. */ | |
|
724 | static ZSTD_compressionParameters | |
|
725 | ZSTD_adjustCParams_internal(ZSTD_compressionParameters cPar, | |
|
726 | unsigned long long srcSize, | |
|
727 | size_t dictSize) | |
|
632 | 728 | { |
|
633 | 729 | static const U64 minSrcSize = 513; /* (1<<9) + 1 */ |
|
634 | 730 | static const U64 maxWindowResize = 1ULL << (ZSTD_WINDOWLOG_MAX-1); |
@@ -648,7 +744,7 b' ZSTD_compressionParameters ZSTD_adjustCP' | |||
|
648 | 744 | ZSTD_highbit32(tSize-1) + 1; |
|
649 | 745 | if (cPar.windowLog > srcLog) cPar.windowLog = srcLog; |
|
650 | 746 | } |
|
651 | if (cPar.hashLog > cPar.windowLog) cPar.hashLog = cPar.windowLog; | |
|
747 | if (cPar.hashLog > cPar.windowLog+1) cPar.hashLog = cPar.windowLog+1; | |
|
652 | 748 | { U32 const cycleLog = ZSTD_cycleLog(cPar.chainLog, cPar.strategy); |
|
653 | 749 | if (cycleLog > cPar.windowLog) |
|
654 | 750 | cPar.chainLog -= (cycleLog - cPar.windowLog); |
@@ -660,13 +756,34 b' ZSTD_compressionParameters ZSTD_adjustCP' | |||
|
660 | 756 | return cPar; |
|
661 | 757 | } |
|
662 | 758 | |
|
663 | ZSTD_compressionParameters ZSTD_adjustCParams(ZSTD_compressionParameters cPar, unsigned long long srcSize, size_t dictSize) | |
|
759 | ZSTD_compressionParameters | |
|
760 | ZSTD_adjustCParams(ZSTD_compressionParameters cPar, | |
|
761 | unsigned long long srcSize, | |
|
762 | size_t dictSize) | |
|
664 | 763 | { |
|
665 | 764 | cPar = ZSTD_clampCParams(cPar); |
|
666 | 765 | return ZSTD_adjustCParams_internal(cPar, srcSize, dictSize); |
|
667 | 766 | } |
|
668 | 767 | |
|
669 | static size_t ZSTD_sizeof_matchState(ZSTD_compressionParameters const* cParams, const U32 forCCtx) | |
|
768 | ZSTD_compressionParameters ZSTD_getCParamsFromCCtxParams( | |
|
769 | const ZSTD_CCtx_params* CCtxParams, U64 srcSizeHint, size_t dictSize) | |
|
770 | { | |
|
771 | ZSTD_compressionParameters cParams = ZSTD_getCParams(CCtxParams->compressionLevel, srcSizeHint, dictSize); | |
|
772 | if (CCtxParams->ldmParams.enableLdm) cParams.windowLog = ZSTD_LDM_DEFAULT_WINDOW_LOG; | |
|
773 | if (CCtxParams->cParams.windowLog) cParams.windowLog = CCtxParams->cParams.windowLog; | |
|
774 | if (CCtxParams->cParams.hashLog) cParams.hashLog = CCtxParams->cParams.hashLog; | |
|
775 | if (CCtxParams->cParams.chainLog) cParams.chainLog = CCtxParams->cParams.chainLog; | |
|
776 | if (CCtxParams->cParams.searchLog) cParams.searchLog = CCtxParams->cParams.searchLog; | |
|
777 | if (CCtxParams->cParams.searchLength) cParams.searchLength = CCtxParams->cParams.searchLength; | |
|
778 | if (CCtxParams->cParams.targetLength) cParams.targetLength = CCtxParams->cParams.targetLength; | |
|
779 | if (CCtxParams->cParams.strategy) cParams.strategy = CCtxParams->cParams.strategy; | |
|
780 | assert(!ZSTD_checkCParams(cParams)); | |
|
781 | return ZSTD_adjustCParams_internal(cParams, srcSizeHint, dictSize); | |
|
782 | } | |
|
783 | ||
|
784 | static size_t | |
|
785 | ZSTD_sizeof_matchState(const ZSTD_compressionParameters* const cParams, | |
|
786 | const U32 forCCtx) | |
|
670 | 787 | { |
|
671 | 788 | size_t const chainSize = (cParams->strategy == ZSTD_fast) ? 0 : ((size_t)1 << cParams->chainLog); |
|
672 | 789 | size_t const hSize = ((size_t)1) << cParams->hashLog; |
@@ -693,7 +810,7 b' size_t ZSTD_estimateCCtxSize_usingCCtxPa' | |||
|
693 | 810 | size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, (size_t)1 << cParams.windowLog); |
|
694 | 811 | U32 const divider = (cParams.searchLength==3) ? 3 : 4; |
|
695 | 812 | size_t const maxNbSeq = blockSize / divider; |
|
696 | size_t const tokenSpace = blockSize + 11*maxNbSeq; | |
|
813 | size_t const tokenSpace = WILDCOPY_OVERLENGTH + blockSize + 11*maxNbSeq; | |
|
697 | 814 | size_t const entropySpace = HUF_WORKSPACE_SIZE; |
|
698 | 815 | size_t const blockStateSpace = 2 * sizeof(ZSTD_compressedBlockState_t); |
|
699 | 816 | size_t const matchStateSize = ZSTD_sizeof_matchState(&cParams, /* forCCtx */ 1); |
@@ -752,12 +869,14 b' size_t ZSTD_estimateCStreamSize_usingCPa' | |||
|
752 | 869 | return ZSTD_estimateCStreamSize_usingCCtxParams(¶ms); |
|
753 | 870 | } |
|
754 | 871 | |
|
755 | static size_t ZSTD_estimateCStreamSize_internal(int compressionLevel) { |
|
|
872 | static size_t ZSTD_estimateCStreamSize_internal(int compressionLevel) | |
|
873 | { | |
|
756 | 874 | ZSTD_compressionParameters const cParams = ZSTD_getCParams(compressionLevel, 0, 0); |
|
757 | 875 | return ZSTD_estimateCStreamSize_usingCParams(cParams); |
|
758 | 876 | } |
|
759 | 877 | |
|
760 | size_t ZSTD_estimateCStreamSize(int compressionLevel) { |
|
|
878 | size_t ZSTD_estimateCStreamSize(int compressionLevel) | |
|
879 | { | |
|
761 | 880 | int level; |
|
762 | 881 | size_t memBudget = 0; |
|
763 | 882 | for (level=1; level<=compressionLevel; level++) { |
@@ -786,9 +905,27 b' ZSTD_frameProgression ZSTD_getFrameProgr' | |||
|
786 | 905 | fp.ingested = cctx->consumedSrcSize + buffered; |
|
787 | 906 | fp.consumed = cctx->consumedSrcSize; |
|
788 | 907 | fp.produced = cctx->producedCSize; |
|
908 | fp.flushed = cctx->producedCSize; /* simplified; some data might still be left within streaming output buffer */ | |
|
909 | fp.currentJobID = 0; | |
|
910 | fp.nbActiveWorkers = 0; | |
|
789 | 911 | return fp; |
|
790 | 912 | } } |
|
791 | 913 | |
|
914 | /*! ZSTD_toFlushNow() | |
|
915 | * Only useful for multithreading scenarios currently (nbWorkers >= 1). | |
|
916 | */ | |
|
917 | size_t ZSTD_toFlushNow(ZSTD_CCtx* cctx) | |
|
918 | { | |
|
919 | #ifdef ZSTD_MULTITHREAD | |
|
920 | if (cctx->appliedParams.nbWorkers > 0) { | |
|
921 | return ZSTDMT_toFlushNow(cctx->mtctx); | |
|
922 | } | |
|
923 | #endif | |
|
924 | (void)cctx; | |
|
925 | return 0; /* over-simplification; could also check if context is currently running in streaming mode, and in which case, report how many bytes are left to be flushed within output buffer */ | |
|
926 | } | |
|
927 | ||
|
928 | ||
|
792 | 929 | |
|
793 | 930 | static U32 ZSTD_equivalentCParams(ZSTD_compressionParameters cParams1, |
|
794 | 931 | ZSTD_compressionParameters cParams2) |
@@ -799,6 +936,20 b' static U32 ZSTD_equivalentCParams(ZSTD_c' | |||
|
799 | 936 | & ((cParams1.searchLength==3) == (cParams2.searchLength==3)); /* hashlog3 space */ |
|
800 | 937 | } |
|
801 | 938 | |
|
939 | static void ZSTD_assertEqualCParams(ZSTD_compressionParameters cParams1, | |
|
940 | ZSTD_compressionParameters cParams2) | |
|
941 | { | |
|
942 | (void)cParams1; | |
|
943 | (void)cParams2; | |
|
944 | assert(cParams1.windowLog == cParams2.windowLog); | |
|
945 | assert(cParams1.chainLog == cParams2.chainLog); | |
|
946 | assert(cParams1.hashLog == cParams2.hashLog); | |
|
947 | assert(cParams1.searchLog == cParams2.searchLog); | |
|
948 | assert(cParams1.searchLength == cParams2.searchLength); | |
|
949 | assert(cParams1.targetLength == cParams2.targetLength); | |
|
950 | assert(cParams1.strategy == cParams2.strategy); | |
|
951 | } | |
|
952 | ||
|
802 | 953 | /** The parameters are equivalent if ldm is not enabled in both sets or |
|
803 | 954 | * all the parameters are equivalent. */ |
|
804 | 955 | static U32 ZSTD_equivalentLdmParams(ldmParams_t ldmParams1, |
@@ -817,33 +968,51 b' typedef enum { ZSTDb_not_buffered, ZSTDb' | |||
|
817 | 968 | /* ZSTD_sufficientBuff() : |
|
818 | 969 | * check internal buffers exist for streaming if buffPol == ZSTDb_buffered . |
|
819 | 970 | * Note : they are assumed to be correctly sized if ZSTD_equivalentCParams()==1 */ |
|
820 | static U32 ZSTD_sufficientBuff(size_t bufferSize1, size_t blockSize1, |
|
|
971 | static U32 ZSTD_sufficientBuff(size_t bufferSize1, size_t maxNbSeq1, | |
|
972 | size_t maxNbLit1, | |
|
821 | 973 | ZSTD_buffered_policy_e buffPol2, |
|
822 | 974 | ZSTD_compressionParameters cParams2, |
|
823 | 975 | U64 pledgedSrcSize) |
|
824 | 976 | { |
|
825 | 977 | size_t const windowSize2 = MAX(1, (size_t)MIN(((U64)1 << cParams2.windowLog), pledgedSrcSize)); |
|
826 | 978 | size_t const blockSize2 = MIN(ZSTD_BLOCKSIZE_MAX, windowSize2); |
|
979 | size_t const maxNbSeq2 = blockSize2 / ((cParams2.searchLength == 3) ? 3 : 4); | |
|
980 | size_t const maxNbLit2 = blockSize2; | |
|
827 | 981 | size_t const neededBufferSize2 = (buffPol2==ZSTDb_buffered) ? windowSize2 + blockSize2 : 0; |
|
828 | DEBUGLOG(4, "ZSTD_sufficientBuff: is windowSize2=%u <= wlog1=%u", |
|
|
829 | (U32)windowSize2, cParams2.windowLog); |
|
|
830 | DEBUGLOG(4, "ZSTD_sufficientBuff: is blockSize2=%u <= blockSize1=%u", |
|
|
831 | (U32)blockSize2, (U32)blockSize1); |
|
|
832 | return (blockSize2 <= blockSize1) /* seqStore space depends on blockSize */ | |
|
982 | DEBUGLOG(4, "ZSTD_sufficientBuff: is neededBufferSize2=%u <= bufferSize1=%u", | |
|
983 | (U32)neededBufferSize2, (U32)bufferSize1); | |
|
984 | DEBUGLOG(4, "ZSTD_sufficientBuff: is maxNbSeq2=%u <= maxNbSeq1=%u", | |
|
985 | (U32)maxNbSeq2, (U32)maxNbSeq1); | |
|
986 | DEBUGLOG(4, "ZSTD_sufficientBuff: is maxNbLit2=%u <= maxNbLit1=%u", | |
|
987 | (U32)maxNbLit2, (U32)maxNbLit1); | |
|
988 | return (maxNbLit2 <= maxNbLit1) | |
|
989 | & (maxNbSeq2 <= maxNbSeq1) | |
|
833 | 990 | & (neededBufferSize2 <= bufferSize1); |
|
834 | 991 | } |
|
835 | 992 | |
|
836 | 993 | /** Equivalence for resetCCtx purposes */ |
|
837 | 994 | static U32 ZSTD_equivalentParams(ZSTD_CCtx_params params1, |
|
838 | 995 | ZSTD_CCtx_params params2, |
|
839 | size_t buffSize1, size_t blockSize1, |
|
|
996 | size_t buffSize1, | |
|
997 | size_t maxNbSeq1, size_t maxNbLit1, | |
|
840 | 998 | ZSTD_buffered_policy_e buffPol2, |
|
841 | 999 | U64 pledgedSrcSize) |
|
842 | 1000 | { |
|
843 | 1001 | DEBUGLOG(4, "ZSTD_equivalentParams: pledgedSrcSize=%u", (U32)pledgedSrcSize); |
|
844 | return ZSTD_equivalentCParams(params1.cParams, params2.cParams) && |
|
|
|
845 | ZSTD_equivalentLdmParams(params1.ldmParams, params2.ldmParams) && | |
|
846 | ZSTD_sufficientBuff(buffSize1, blockSize1, buffPol2, params2.cParams, pledgedSrcSize); | |
|
1002 | if (!ZSTD_equivalentCParams(params1.cParams, params2.cParams)) { | |
|
1003 | DEBUGLOG(4, "ZSTD_equivalentCParams() == 0"); | |
|
1004 | return 0; | |
|
1005 | } | |
|
1006 | if (!ZSTD_equivalentLdmParams(params1.ldmParams, params2.ldmParams)) { | |
|
1007 | DEBUGLOG(4, "ZSTD_equivalentLdmParams() == 0"); | |
|
1008 | return 0; | |
|
1009 | } | |
|
1010 | if (!ZSTD_sufficientBuff(buffSize1, maxNbSeq1, maxNbLit1, buffPol2, | |
|
1011 | params2.cParams, pledgedSrcSize)) { | |
|
1012 | DEBUGLOG(4, "ZSTD_sufficientBuff() == 0"); | |
|
1013 | return 0; | |
|
1014 | } | |
|
1015 | return 1; | |
|
847 | 1016 | } |
|
848 | 1017 | |
|
849 | 1018 | static void ZSTD_reset_compressedBlockState(ZSTD_compressedBlockState_t* bs) |
@@ -851,10 +1020,10 b' static void ZSTD_reset_compressedBlockSt' | |||
|
851 | 1020 | int i; |
|
852 | 1021 | for (i = 0; i < ZSTD_REP_NUM; ++i) |
|
853 | 1022 | bs->rep[i] = repStartValue[i]; |
|
854 | bs->entropy.hufCTable_repeatMode = HUF_repeat_none; |
|
|
855 | bs->entropy.offcode_repeatMode = FSE_repeat_none; | |
|
856 | bs->entropy.matchlength_repeatMode = FSE_repeat_none; | |
|
857 | bs->entropy.litlength_repeatMode = FSE_repeat_none; | |
|
1023 | bs->entropy.huf.repeatMode = HUF_repeat_none; | |
|
1024 | bs->entropy.fse.offcode_repeatMode = FSE_repeat_none; | |
|
1025 | bs->entropy.fse.matchlength_repeatMode = FSE_repeat_none; | |
|
1026 | bs->entropy.fse.litlength_repeatMode = FSE_repeat_none; | |
|
858 | 1027 | } |
|
859 | 1028 | |
|
860 | 1029 | /*! ZSTD_invalidateMatchState() |
@@ -866,8 +1035,10 b' static void ZSTD_invalidateMatchState(ZS' | |||
|
866 | 1035 | ZSTD_window_clear(&ms->window); |
|
867 | 1036 | |
|
868 | 1037 | ms->nextToUpdate = ms->window.dictLimit + 1; |
|
1038 | ms->nextToUpdate3 = ms->window.dictLimit + 1; | |
|
869 | 1039 | ms->loadedDictEnd = 0; |
|
870 | 1040 | ms->opt.litLengthSum = 0; /* force reset of btopt stats */ |
|
1041 | ms->dictMatchState = NULL; | |
|
871 | 1042 | } |
|
872 | 1043 | |
|
873 | 1044 | /*! ZSTD_continueCCtx() : |
@@ -880,6 +1051,7 b' static size_t ZSTD_continueCCtx(ZSTD_CCt' | |||
|
880 | 1051 | |
|
881 | 1052 | cctx->blockSize = blockSize; /* previous block size could be different even for same windowLog, due to pledgedSrcSize */ |
|
882 | 1053 | cctx->appliedParams = params; |
|
1054 | cctx->blockState.matchState.cParams = params.cParams; | |
|
883 | 1055 | cctx->pledgedSrcSizePlusOne = pledgedSrcSize+1; |
|
884 | 1056 | cctx->consumedSrcSize = 0; |
|
885 | 1057 | cctx->producedCSize = 0; |
@@ -900,7 +1072,11 b' static size_t ZSTD_continueCCtx(ZSTD_CCt' | |||
|
900 | 1072 | |
|
901 | 1073 | typedef enum { ZSTDcrp_continue, ZSTDcrp_noMemset } ZSTD_compResetPolicy_e; |
|
902 | 1074 | |
|
903 | static void* ZSTD_reset_matchState(ZSTD_matchState_t* ms, void* ptr, ZSTD_compressionParameters const* cParams, ZSTD_compResetPolicy_e const crp, U32 const forCCtx) | |
|
1075 | static void* | |
|
1076 | ZSTD_reset_matchState(ZSTD_matchState_t* ms, | |
|
1077 | void* ptr, | |
|
1078 | const ZSTD_compressionParameters* cParams, | |
|
1079 | ZSTD_compResetPolicy_e const crp, U32 const forCCtx) | |
|
904 | 1080 | { |
|
905 | 1081 | size_t const chainSize = (cParams->strategy == ZSTD_fast) ? 0 : ((size_t)1 << cParams->chainLog); |
|
906 | 1082 | size_t const hSize = ((size_t)1) << cParams->hashLog; |
@@ -912,6 +1088,9 b' static void* ZSTD_reset_matchState(ZSTD_' | |||
|
912 | 1088 | |
|
913 | 1089 | ms->hashLog3 = hashLog3; |
|
914 | 1090 | memset(&ms->window, 0, sizeof(ms->window)); |
|
1091 | ms->window.dictLimit = 1; /* start from 1, so that 1st position is valid */ | |
|
1092 | ms->window.lowLimit = 1; /* it ensures first and later CCtx usages compress the same */ | |
|
1093 | ms->window.nextSrc = ms->window.base + 1; /* see issue #1241 */ | |
|
915 | 1094 | ZSTD_invalidateMatchState(ms); |
|
916 | 1095 | |
|
917 | 1096 | /* opt parser space */ |
@@ -937,14 +1116,24 b' static void* ZSTD_reset_matchState(ZSTD_' | |||
|
937 | 1116 | ms->hashTable3 = ms->chainTable + chainSize; |
|
938 | 1117 | ptr = ms->hashTable3 + h3Size; |
|
939 | 1118 | |
|
1119 | ms->cParams = *cParams; | |
|
1120 | ||
|
940 | 1121 | assert(((size_t)ptr & 3) == 0); |
|
941 | 1122 | return ptr; |
|
942 | 1123 | } |
|
943 | 1124 | |
|
1125 | #define ZSTD_WORKSPACETOOLARGE_FACTOR 3 /* define "workspace is too large" as this number of times larger than needed */ | |
|
1126 | #define ZSTD_WORKSPACETOOLARGE_MAXDURATION 128 /* when workspace is continuously too large | |
|
1127 | * during at least this number of times, | |
|
1128 | * context's memory usage is considered wasteful, | |
|
1129 | * because it's sized to handle a worst case scenario which rarely happens. | |
|
1130 | * In which case, resize it down to free some memory */ | |
|
1131 | ||
|
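The two constants above drive a shrink heuristic: a workspace only counts as wasteful after staying several times larger than needed for many consecutive resets, at which point it is reallocated downward. That logic in isolation (hypothetical helper, not the vendored code):

    /* any tight fit resets the oversized streak to zero */
    static int workspace_wasteful(size_t haveSize, size_t neededSpace,
                                  int* oversizedDuration)
    {
        int const tooLarge = haveSize > ZSTD_WORKSPACETOOLARGE_FACTOR * neededSpace;
        *oversizedDuration = tooLarge ? *oversizedDuration + 1 : 0;
        return tooLarge && (*oversizedDuration > ZSTD_WORKSPACETOOLARGE_MAXDURATION);
    }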
944 | 1132 | /*! ZSTD_resetCCtx_internal() : |
|
945 | 1133 | note : `params` are assumed fully validated at this stage */ |
|
946 | 1134 | static size_t ZSTD_resetCCtx_internal(ZSTD_CCtx* zc, |
|
947 | ZSTD_CCtx_params params, U64 pledgedSrcSize, |
|
|
1135 | ZSTD_CCtx_params params, | |
|
1136 | U64 pledgedSrcSize, | |
|
948 | 1137 | ZSTD_compResetPolicy_e const crp, |
|
949 | 1138 | ZSTD_buffered_policy_e const zbuff) |
|
950 | 1139 | { |
@@ -954,34 +1143,35 b' static size_t ZSTD_resetCCtx_internal(ZS' | |||
|
954 | 1143 | |
|
955 | 1144 | if (crp == ZSTDcrp_continue) { |
|
956 | 1145 | if (ZSTD_equivalentParams(zc->appliedParams, params, |
|
957 | zc->inBuffSize, zc->blockSize, |
|
|
958 | zbuff, pledgedSrcSize)) { | |
|
959 | DEBUGLOG(4, "ZSTD_equivalentParams()==1 -> continue mode (wLog1=%u, blockSize1=%u)", | |
|
960 | zc->appliedParams.cParams.windowLog, (U32)zc->blockSize); | |
|
961 | return ZSTD_continueCCtx(zc, params, pledgedSrcSize); | |
|
1146 | zc->inBuffSize, | |
|
1147 | zc->seqStore.maxNbSeq, zc->seqStore.maxNbLit, | |
|
1148 | zbuff, pledgedSrcSize)) { | |
|
1149 | DEBUGLOG(4, "ZSTD_equivalentParams()==1 -> continue mode (wLog1=%u, blockSize1=%zu)", | |
|
1150 | zc->appliedParams.cParams.windowLog, zc->blockSize); | |
|
1151 | zc->workSpaceOversizedDuration += (zc->workSpaceOversizedDuration > 0); /* if it was too large, it still is */ | |
|
1152 | if (zc->workSpaceOversizedDuration <= ZSTD_WORKSPACETOOLARGE_MAXDURATION) | |
|
1153 | return ZSTD_continueCCtx(zc, params, pledgedSrcSize); | |
|
962 | 1154 | } } |
|
963 | 1155 | DEBUGLOG(4, "ZSTD_equivalentParams()==0 -> reset CCtx"); |
|
964 | 1156 | |
|
965 | 1157 | if (params.ldmParams.enableLdm) { |
|
966 | 1158 | /* Adjust long distance matching parameters */ |
|
967 | params.ldmParams.windowLog = params.cParams.windowLog; | |
|
968 | 1159 | ZSTD_ldm_adjustParameters(¶ms.ldmParams, ¶ms.cParams); |
|
969 | 1160 | assert(params.ldmParams.hashLog >= params.ldmParams.bucketSizeLog); |
|
970 | 1161 | assert(params.ldmParams.hashEveryLog < 32); |
|
971 | zc->ldmState.hashPower = | |
|
972 | ZSTD_ldm_getHashPower(params.ldmParams.minMatchLength); | |
|
1162 | zc->ldmState.hashPower = ZSTD_ldm_getHashPower(params.ldmParams.minMatchLength); | |
|
973 | 1163 | } |
|
974 | 1164 | |
|
975 | 1165 | { size_t const windowSize = MAX(1, (size_t)MIN(((U64)1 << params.cParams.windowLog), pledgedSrcSize)); |
|
976 | 1166 | size_t const blockSize = MIN(ZSTD_BLOCKSIZE_MAX, windowSize); |
|
977 | 1167 | U32 const divider = (params.cParams.searchLength==3) ? 3 : 4; |
|
978 | 1168 | size_t const maxNbSeq = blockSize / divider; |
|
979 | size_t const tokenSpace = blockSize + 11*maxNbSeq; | |
|
1169 | size_t const tokenSpace = WILDCOPY_OVERLENGTH + blockSize + 11*maxNbSeq; | |
|
980 | 1170 | size_t const buffOutSize = (zbuff==ZSTDb_buffered) ? ZSTD_compressBound(blockSize)+1 : 0; |
|
981 | 1171 | size_t const buffInSize = (zbuff==ZSTDb_buffered) ? windowSize + blockSize : 0; |
|
982 | 1172 | size_t const matchStateSize = ZSTD_sizeof_matchState(¶ms.cParams, /* forCCtx */ 1); |
|
983 | 1173 | size_t const maxNbLdmSeq = ZSTD_ldm_getMaxNbSeq(params.ldmParams, blockSize); |
|
984 | void* ptr; | |
|
1174 | void* ptr; /* used to partition workSpace */ | |
|
985 | 1175 | |
|
986 | 1176 | /* Check if workSpace is large enough, alloc a new one if needed */ |
|
987 | 1177 | { size_t const entropySpace = HUF_WORKSPACE_SIZE; |
@@ -993,14 +1183,20 b' static size_t ZSTD_resetCCtx_internal(ZS' | |||
|
993 | 1183 | size_t const neededSpace = entropySpace + blockStateSpace + ldmSpace + |
|
994 | 1184 | ldmSeqSpace + matchStateSize + tokenSpace + |
|
995 | 1185 | bufferSpace; |
|
996 | DEBUGLOG(4, "Need %uKB workspace, including %uKB for match state, and %uKB for buffers", | |
|
997 | (U32)(neededSpace>>10), (U32)(matchStateSize>>10), (U32)(bufferSpace>>10)); | |
|
998 | DEBUGLOG(4, "windowSize: %u - blockSize: %u", (U32)windowSize, (U32)blockSize); | |
|
999 | ||
|
1000 | if (zc->workSpaceSize < neededSpace) { /* too small : resize */ | |
|
1001 | DEBUGLOG(4, "Need to update workSpaceSize from %uK to %uK", | |
|
1002 | (unsigned)(zc->workSpaceSize>>10), | |
|
1003 | (unsigned)(neededSpace>>10)); |
|
|
|
1186 | ||
|
1187 | int const workSpaceTooSmall = zc->workSpaceSize < neededSpace; | |
|
1188 | int const workSpaceTooLarge = zc->workSpaceSize > ZSTD_WORKSPACETOOLARGE_FACTOR * neededSpace; | |
|
1189 | int const workSpaceWasteful = workSpaceTooLarge && (zc->workSpaceOversizedDuration > ZSTD_WORKSPACETOOLARGE_MAXDURATION); | |
|
1190 | zc->workSpaceOversizedDuration = workSpaceTooLarge ? zc->workSpaceOversizedDuration+1 : 0; | |
|
1191 | ||
|
1192 | DEBUGLOG(4, "Need %zuKB workspace, including %zuKB for match state, and %zuKB for buffers", | |
|
1193 | neededSpace>>10, matchStateSize>>10, bufferSpace>>10); | |
|
1194 | DEBUGLOG(4, "windowSize: %zu - blockSize: %zu", windowSize, blockSize); | |
|
1195 | ||
|
1196 | if (workSpaceTooSmall || workSpaceWasteful) { | |
|
1197 | DEBUGLOG(4, "Need to resize workSpaceSize from %zuKB to %zuKB", | |
|
1198 | zc->workSpaceSize >> 10, | |
|
1199 | neededSpace >> 10); | |
|
1004 | 1200 | /* static cctx : no resize, error out */ |
|
1005 | 1201 | if (zc->staticSize) return ERROR(memory_allocation); |
|
1006 | 1202 | |
@@ -1009,9 +1205,11 b' static size_t ZSTD_resetCCtx_internal(ZS' | |||
|
1009 | 1205 | zc->workSpace = ZSTD_malloc(neededSpace, zc->customMem); |
|
1010 | 1206 | if (zc->workSpace == NULL) return ERROR(memory_allocation); |
|
1011 | 1207 | zc->workSpaceSize = neededSpace; |
|
1012 | } |
|
|
|
1013 | ||
|
1014 | /* Statically sized space. entropyWorkspace never moves (but prev/next block swap places) */ | |
|
1208 | zc->workSpaceOversizedDuration = 0; | |
|
1209 | ||
|
1210 | /* Statically sized space. | |
|
1211 | * entropyWorkspace never moves, | |
|
1212 | * though prev/next block swap places */ | |
|
1015 | 1213 | assert(((size_t)zc->workSpace & 3) == 0); /* ensure correct alignment */ |
|
1016 | 1214 | assert(zc->workSpaceSize >= 2 * sizeof(ZSTD_compressedBlockState_t)); |
|
1017 | 1215 | zc->blockState.prevCBlock = (ZSTD_compressedBlockState_t*)zc->workSpace; |
@@ -1022,6 +1220,7 b' static size_t ZSTD_resetCCtx_internal(ZS' | |||
|
1022 | 1220 | |
|
1023 | 1221 | /* init params */ |
|
1024 | 1222 | zc->appliedParams = params; |
|
1223 | zc->blockState.matchState.cParams = params.cParams; | |
|
1025 | 1224 | zc->pledgedSrcSizePlusOne = pledgedSrcSize+1; |
|
1026 | 1225 | zc->consumedSrcSize = 0; |
|
1027 | 1226 | zc->producedCSize = 0; |
@@ -1058,13 +1257,18 b' static size_t ZSTD_resetCCtx_internal(ZS' | |||
|
1058 | 1257 | ptr = ZSTD_reset_matchState(&zc->blockState.matchState, ptr, ¶ms.cParams, crp, /* forCCtx */ 1); |
|
1059 | 1258 | |
|
1060 | 1259 | /* sequences storage */ |
|
1260 | zc->seqStore.maxNbSeq = maxNbSeq; | |
|
1061 | 1261 | zc->seqStore.sequencesStart = (seqDef*)ptr; |
|
1062 | 1262 | ptr = zc->seqStore.sequencesStart + maxNbSeq; |
|
1063 | 1263 | zc->seqStore.llCode = (BYTE*) ptr; |
|
1064 | 1264 | zc->seqStore.mlCode = zc->seqStore.llCode + maxNbSeq; |
|
1065 | 1265 | zc->seqStore.ofCode = zc->seqStore.mlCode + maxNbSeq; |
|
1066 | 1266 | zc->seqStore.litStart = zc->seqStore.ofCode + maxNbSeq; |
|
1067 | ptr = zc->seqStore.litStart + blockSize; | |
|
1267 | /* ZSTD_wildcopy() is used to copy into the literals buffer, | |
|
1268 | * so we have to oversize the buffer by WILDCOPY_OVERLENGTH bytes. | |
|
1269 | */ | |
|
1270 | zc->seqStore.maxNbLit = blockSize; | |
|
1271 | ptr = zc->seqStore.litStart + blockSize + WILDCOPY_OVERLENGTH; | |
|
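The WILDCOPY_OVERLENGTH slack added above exists because wildcopy-style loops round copies up to fixed-size chunks and may write past the requested length. A minimal model of such a copy (illustrative, not the vendored ZSTD_wildcopy; assumes length > 0):

    #include <string.h>

    /* copies in 8-byte chunks, so it can overshoot dst+length by up to
     * 7 bytes; the destination buffer must reserve that slack */
    static void wildcopy8(void* dst, const void* src, size_t length)
    {
        unsigned char* d = (unsigned char*)dst;
        const unsigned char* s = (const unsigned char*)src;
        unsigned char* const end = d + length;
        do { memcpy(d, s, 8); d += 8; s += 8; } while (d < end);
    }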
1068 | 1272 | |
|
1069 | 1273 | /* ldm bucketOffsets table */ |
|
1070 | 1274 | if (params.ldmParams.enableLdm) { |
@@ -1098,28 +1302,110 b' void ZSTD_invalidateRepCodes(ZSTD_CCtx* ' | |||
|
1098 | 1302 | assert(!ZSTD_window_hasExtDict(cctx->blockState.matchState.window)); |
|
1099 | 1303 | } |
|
1100 | 1304 | |
|
1101 | static size_t ZSTD_resetCCtx_usingCDict(ZSTD_CCtx* cctx, | |
|
1305 | /* These are the approximate sizes for each strategy past which copying the | |
|
1306 | * dictionary tables into the working context is faster than using them | |
|
1307 | * in-place. | |
|
1308 | */ | |
|
1309 | static const size_t attachDictSizeCutoffs[(unsigned)ZSTD_btultra+1] = { | |
|
1310 | 8 KB, /* unused */ | |
|
1311 | 8 KB, /* ZSTD_fast */ | |
|
1312 | 16 KB, /* ZSTD_dfast */ | |
|
1313 | 32 KB, /* ZSTD_greedy */ | |
|
1314 | 32 KB, /* ZSTD_lazy */ | |
|
1315 | 32 KB, /* ZSTD_lazy2 */ | |
|
1316 | 32 KB, /* ZSTD_btlazy2 */ | |
|
1317 | 32 KB, /* ZSTD_btopt */ | |
|
1318 | 8 KB /* ZSTD_btultra */ | |
|
1319 | }; | |
|
1320 | ||
|
1321 | static int ZSTD_shouldAttachDict(const ZSTD_CDict* cdict, | |
|
1322 | ZSTD_CCtx_params params, | |
|
1323 | U64 pledgedSrcSize) | |
|
1324 | { | |
|
1325 | size_t cutoff = attachDictSizeCutoffs[cdict->matchState.cParams.strategy]; | |
|
1326 | return ( pledgedSrcSize <= cutoff | |
|
1327 | || pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN | |
|
1328 | || params.attachDictPref == ZSTD_dictForceAttach ) | |
|
1329 | && params.attachDictPref != ZSTD_dictForceCopy | |
|
1330 | && !params.forceWindow; /* dictMatchState isn't correctly | |
|
1331 | * handled in _enforceMaxDist */ | |
|
1332 | } | |
|
1333 | ||
|
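ZSTD_shouldAttachDict above trades cheap setup (attach: reference the cdict's tables in place) against faster matching on large inputs (copy the tables once). The decision restated as a sketch (hypothetical helper; unknown content sizes favor attaching because the input may turn out small):

    static int should_attach_sketch(unsigned long long pledgedSrcSize,
                                    size_t cutoff, int forceAttach, int forceCopy)
    {
        if (forceCopy) return 0;
        if (forceAttach) return 1;
        return (pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN)
            || (pledgedSrcSize <= cutoff);
    }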
1334 | static size_t ZSTD_resetCCtx_byAttachingCDict( | |
|
1335 | ZSTD_CCtx* cctx, | |
|
1336 | const ZSTD_CDict* cdict, | |
|
1337 | ZSTD_CCtx_params params, | |
|
1338 | U64 pledgedSrcSize, | |
|
1339 | ZSTD_buffered_policy_e zbuff) | |
|
1340 | { | |
|
1341 | { | |
|
1342 | const ZSTD_compressionParameters *cdict_cParams = &cdict->matchState.cParams; | |
|
1343 | unsigned const windowLog = params.cParams.windowLog; | |
|
1344 | assert(windowLog != 0); | |
|
1345 | /* Resize working context table params for input only, since the dict | |
|
1346 | * has its own tables. */ | |
|
1347 | params.cParams = ZSTD_adjustCParams_internal(*cdict_cParams, pledgedSrcSize, 0); | |
|
1348 | params.cParams.windowLog = windowLog; | |
|
1349 | ZSTD_resetCCtx_internal(cctx, params, pledgedSrcSize, | |
|
1350 | ZSTDcrp_continue, zbuff); | |
|
1351 | assert(cctx->appliedParams.cParams.strategy == cdict_cParams->strategy); | |
|
1352 | } | |
|
1353 | ||
|
1354 | { | |
|
1355 | const U32 cdictEnd = (U32)( cdict->matchState.window.nextSrc | |
|
1356 | - cdict->matchState.window.base); | |
|
1357 | const U32 cdictLen = cdictEnd - cdict->matchState.window.dictLimit; | |
|
1358 | if (cdictLen == 0) { | |
|
1359 | /* don't even attach dictionaries with no contents */ | |
|
1360 | DEBUGLOG(4, "skipping attaching empty dictionary"); | |
|
1361 | } else { | |
|
1362 | DEBUGLOG(4, "attaching dictionary into context"); | |
|
1363 | cctx->blockState.matchState.dictMatchState = &cdict->matchState; | |
|
1364 | ||
|
1365 | /* prep working match state so dict matches never have negative indices | |
|
1366 | * when they are translated to the working context's index space. */ | |
|
1367 | if (cctx->blockState.matchState.window.dictLimit < cdictEnd) { | |
|
1368 | cctx->blockState.matchState.window.nextSrc = | |
|
1369 | cctx->blockState.matchState.window.base + cdictEnd; | |
|
1370 | ZSTD_window_clear(&cctx->blockState.matchState.window); | |
|
1371 | } | |
|
1372 | cctx->blockState.matchState.loadedDictEnd = cctx->blockState.matchState.window.dictLimit; | |
|
1373 | } | |
|
1374 | } | |
|
1375 | ||
|
1376 | cctx->dictID = cdict->dictID; | |
|
1377 | ||
|
1378 | /* copy block state */ | |
|
1379 | memcpy(cctx->blockState.prevCBlock, &cdict->cBlockState, sizeof(cdict->cBlockState)); | |
|
1380 | ||
|
1381 | return 0; | |
|
1382 | } | |
|
1383 | ||
|
1384 | static size_t ZSTD_resetCCtx_byCopyingCDict(ZSTD_CCtx* cctx, | |
|
1102 | 1385 | const ZSTD_CDict* cdict, |
|
1103 | unsigned windowLog, |
|
|
|
1104 | ZSTD_frameParameters fParams, | |
|
1386 | ZSTD_CCtx_params params, | |
|
1105 | 1387 | U64 pledgedSrcSize, |
|
1106 | 1388 | ZSTD_buffered_policy_e zbuff) |
|
1107 | 1389 | { |
|
1108 | { ZSTD_CCtx_params params = cctx->requestedParams; | |
|
1390 | const ZSTD_compressionParameters *cdict_cParams = &cdict->matchState.cParams; | |
|
1391 | ||
|
1392 | DEBUGLOG(4, "copying dictionary into context"); | |
|
1393 | ||
|
1394 | { unsigned const windowLog = params.cParams.windowLog; | |
|
1395 | assert(windowLog != 0); | |
|
1109 | 1396 | /* Copy only compression parameters related to tables. */ |
|
1110 | params.cParams = cdict->cParams; | |
1111 | if (windowLog) params.cParams.windowLog = windowLog; | |
1112 | params.fParams = fParams; | |
|
1397 | params.cParams = *cdict_cParams; | |
|
1398 | params.cParams.windowLog = windowLog; | |
|
1113 | 1399 | ZSTD_resetCCtx_internal(cctx, params, pledgedSrcSize, |
|
1114 | 1400 | ZSTDcrp_noMemset, zbuff); |
|
1115 | assert(cctx->appliedParams.cParams.strategy == cdict->cParams.strategy); | |
1116 | assert(cctx->appliedParams.cParams.hashLog == cdict->cParams.hashLog); | |
1117 | assert(cctx->appliedParams.cParams.chainLog == cdict->cParams.chainLog); | |
1401 | assert(cctx->appliedParams.cParams.strategy == cdict_cParams->strategy); | |
|
1402 | assert(cctx->appliedParams.cParams.hashLog == cdict_cParams->hashLog); | |
|
1403 | assert(cctx->appliedParams.cParams.chainLog == cdict_cParams->chainLog); | |
|
1118 | 1404 | } |
|
1119 | 1405 | |
|
1120 | 1406 | /* copy tables */ |
|
1121 | { size_t const chainSize = (cdict->cParams.strategy == ZSTD_fast) ? 0 : ((size_t)1 << cdict->cParams.chainLog); | |
1122 | size_t const hSize = (size_t)1 << cdict->cParams.hashLog; | |
1407 | { size_t const chainSize = (cdict_cParams->strategy == ZSTD_fast) ? 0 : ((size_t)1 << cdict_cParams->chainLog); | |
|
1408 | size_t const hSize = (size_t)1 << cdict_cParams->hashLog; | |
|
1123 | 1409 | size_t const tableSpace = (chainSize + hSize) * sizeof(U32); |
|
1124 | 1410 | assert((U32*)cctx->blockState.matchState.chainTable == (U32*)cctx->blockState.matchState.hashTable + hSize); /* chainTable must follow hashTable */ |
|
1125 | 1411 | assert((U32*)cctx->blockState.matchState.hashTable3 == (U32*)cctx->blockState.matchState.chainTable + chainSize); |
@@ -1127,6 +1413,7 b' static size_t ZSTD_resetCCtx_usingCDict(' | |||
|
1127 | 1413 | assert((U32*)cdict->matchState.hashTable3 == (U32*)cdict->matchState.chainTable + chainSize); |
|
1128 | 1414 | memcpy(cctx->blockState.matchState.hashTable, cdict->matchState.hashTable, tableSpace); /* presumes all tables follow each other */ |
|
1129 | 1415 | } |
|
1416 | ||
|
1130 | 1417 | /* Zero the hashTable3, since the cdict never fills it */ |
|
1131 | 1418 | { size_t const h3Size = (size_t)1 << cctx->blockState.matchState.hashLog3; |
|
1132 | 1419 | assert(cdict->matchState.hashLog3 == 0); |
@@ -1134,14 +1421,14 b' static size_t ZSTD_resetCCtx_usingCDict(' | |||
|
1134 | 1421 | } |
|
1135 | 1422 | |
|
1136 | 1423 | /* copy dictionary offsets */ |
|
1137 | { | |
|
1138 | ZSTD_matchState_t const* srcMatchState = &cdict->matchState; | |
|
1424 | { ZSTD_matchState_t const* srcMatchState = &cdict->matchState; | |
|
1139 | 1425 | ZSTD_matchState_t* dstMatchState = &cctx->blockState.matchState; |
|
1140 | 1426 | dstMatchState->window = srcMatchState->window; |
|
1141 | 1427 | dstMatchState->nextToUpdate = srcMatchState->nextToUpdate; |
|
1142 | 1428 | dstMatchState->nextToUpdate3= srcMatchState->nextToUpdate3; |
|
1143 | 1429 | dstMatchState->loadedDictEnd= srcMatchState->loadedDictEnd; |
|
1144 | 1430 | } |
|
1431 | ||
|
1145 | 1432 | cctx->dictID = cdict->dictID; |
|
1146 | 1433 | |
|
1147 | 1434 | /* copy block state */ |
@@ -1150,6 +1437,27 b' static size_t ZSTD_resetCCtx_usingCDict(' | |||
|
1150 | 1437 | return 0; |
|
1151 | 1438 | } |
|
1152 | 1439 | |
|
1440 | /* We have a choice between copying the dictionary context into the working | |
|
1441 | * context, or referencing the dictionary context from the working context | |
|
1442 | * in-place. We decide here which strategy to use. */ | |
|
1443 | static size_t ZSTD_resetCCtx_usingCDict(ZSTD_CCtx* cctx, | |
|
1444 | const ZSTD_CDict* cdict, | |
|
1445 | ZSTD_CCtx_params params, | |
|
1446 | U64 pledgedSrcSize, | |
|
1447 | ZSTD_buffered_policy_e zbuff) | |
|
1448 | { | |
|
1449 | ||
|
1450 | DEBUGLOG(4, "ZSTD_resetCCtx_usingCDict (pledgedSrcSize=%u)", (U32)pledgedSrcSize); | |
|
1451 | ||
|
1452 | if (ZSTD_shouldAttachDict(cdict, params, pledgedSrcSize)) { | |
|
1453 | return ZSTD_resetCCtx_byAttachingCDict( | |
|
1454 | cctx, cdict, params, pledgedSrcSize, zbuff); | |
|
1455 | } else { | |
|
1456 | return ZSTD_resetCCtx_byCopyingCDict( | |
|
1457 | cctx, cdict, params, pledgedSrcSize, zbuff); | |
|
1458 | } | |
|
1459 | } | |
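
Editor's note: the attach-versus-copy choice above keys off the dictionary's strategy and the pledged source size: attaching (referencing the CDict in place) only pays off when the input is small or of unknown size, otherwise copying the tables once amortizes better. A minimal standalone sketch of the same cutoff policy; the names (`should_attach`, `cutoffs`) are illustrative and not part of the zstd API:

    #include <stdint.h>
    #include <stddef.h>

    enum strategy { FAST = 1, DFAST, GREEDY, LAZY, LAZY2, BTLAZY2, BTOPT, BTULTRA };

    /* Same shape as attachDictSizeCutoffs above. */
    static const size_t cutoffs[BTULTRA + 1] = {
        8 * 1024,  /* unused (index 0) */
        8 * 1024,  /* FAST */
        16 * 1024, /* DFAST */
        32 * 1024, /* GREEDY */
        32 * 1024, /* LAZY */
        32 * 1024, /* LAZY2 */
        32 * 1024, /* BTLAZY2 */
        32 * 1024, /* BTOPT */
        8 * 1024   /* BTULTRA */
    };

    #define CONTENTSIZE_UNKNOWN ((uint64_t)-1)

    /* Attach for small or unknown-size inputs; forceAttach/forceCopy/
     * forceWindow overrides are omitted from this sketch. */
    static int should_attach(enum strategy strat, uint64_t pledgedSrcSize)
    {
        return pledgedSrcSize <= cutoffs[strat]
            || pledgedSrcSize == CONTENTSIZE_UNKNOWN;
    }

    int main(void)
    {
        return !( should_attach(FAST, 8 * 1024)        /* small input: attach */
              && !should_attach(BTOPT, 64 * 1024) );   /* large input: copy */
    }

With these numbers an 8 KB input under ZSTD_fast attaches, while a 64 KB input copies the dictionary tables once and amortizes the cost over the larger input.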
|
1460 | ||
|
1153 | 1461 | /*! ZSTD_copyCCtx_internal() : |
|
1154 | 1462 | * Duplicate an existing context `srcCCtx` into another one `dstCCtx`. |
|
1155 | 1463 | * Only works during stage ZSTDcs_init (i.e. after creation, but before first call to ZSTD_compressContinue()). |
@@ -1192,7 +1500,7 b' static size_t ZSTD_copyCCtx_internal(ZST' | |||
|
1192 | 1500 | |
|
1193 | 1501 | /* copy dictionary offsets */ |
|
1194 | 1502 | { |
|
1195 | ZSTD_matchState_t const* srcMatchState = &srcCCtx->blockState.matchState; | |
1503 | const ZSTD_matchState_t* srcMatchState = &srcCCtx->blockState.matchState; | |
|
1196 | 1504 | ZSTD_matchState_t* dstMatchState = &dstCCtx->blockState.matchState; |
|
1197 | 1505 | dstMatchState->window = srcMatchState->window; |
|
1198 | 1506 | dstMatchState->nextToUpdate = srcMatchState->nextToUpdate; |
@@ -1294,15 +1602,15 b' static void ZSTD_reduceIndex (ZSTD_CCtx*' | |||
|
1294 | 1602 | |
|
1295 | 1603 | /* See doc/zstd_compression_format.md for detailed format description */ |
|
1296 | 1604 | |
|
1297 | size_t ZSTD_noCompressBlock (void* dst, size_t dstCapacity, const void* src, size_t srcSize) | |
|
1605 | static size_t ZSTD_noCompressBlock (void* dst, size_t dstCapacity, const void* src, size_t srcSize, U32 lastBlock) | |
|
1298 | 1606 | { |
|
1607 | U32 const cBlockHeader24 = lastBlock + (((U32)bt_raw)<<1) + (U32)(srcSize << 3); | |
|
1299 | 1608 | if (srcSize + ZSTD_blockHeaderSize > dstCapacity) return ERROR(dstSize_tooSmall); |
|
1609 | MEM_writeLE24(dst, cBlockHeader24); | |
|
1300 | 1610 | memcpy((BYTE*)dst + ZSTD_blockHeaderSize, src, srcSize); |
|
1301 | MEM_writeLE24(dst, (U32)(srcSize << 2) + (U32)bt_raw); | |
|
1302 | return ZSTD_blockHeaderSize+srcSize; | |
|
1611 | return ZSTD_blockHeaderSize + srcSize; | |
|
1303 | 1612 | } |
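
The new 3-byte block header packs three fields: bit 0 is the last-block flag, bits 1-2 the block type (bt_raw here), and bits 3..23 the block size. A small self-contained check of that packing arithmetic (names are illustrative, not zstd's):

    #include <stdint.h>
    #include <assert.h>

    /* Block header layout, low bits first: [ last:1 | type:2 | size:21 ]. */
    static uint32_t pack_block_header(uint32_t lastBlock, uint32_t blockType,
                                      uint32_t blockSize)
    {
        return lastBlock + (blockType << 1) + (blockSize << 3);
    }

    int main(void)
    {
        uint32_t const h = pack_block_header(1, 0 /* bt_raw */, 1000);
        assert((h & 1) == 1);          /* last-block flag */
        assert(((h >> 1) & 3) == 0);   /* block type: raw */
        assert((h >> 3) == 1000);      /* block size */
        return 0;
    }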
|
1304 | 1613 | |
|
1305 | ||
|
1306 | 1614 | static size_t ZSTD_noCompressLiterals (void* dst, size_t dstCapacity, const void* src, size_t srcSize) |
|
1307 | 1615 | { |
|
1308 | 1616 | BYTE* const ostart = (BYTE* const)dst; |
@@ -1356,16 +1664,24 b' static size_t ZSTD_compressRleLiteralsBl' | |||
|
1356 | 1664 | } |
|
1357 | 1665 | |
|
1358 | 1666 | |
|
1359 | static size_t ZSTD_minGain(size_t srcSize) { return (srcSize >> 6) + 2; } | |
|
1360 | ||
|
1361 | static size_t ZSTD_compressLiterals (ZSTD_entropyCTables_t const* prevEntropy, | |
|
1362 | ZSTD_entropyCTables_t* nextEntropy, | |
|
1667 | /* ZSTD_minGain() : | |
|
1668 | * minimum compression required | |
|
1669 | * to generate a compressed block or a compressed literals section. | |
|
1670 | * note : use same formula for both situations */ | |
|
1671 | static size_t ZSTD_minGain(size_t srcSize, ZSTD_strategy strat) | |
|
1672 | { | |
|
1673 | U32 const minlog = (strat==ZSTD_btultra) ? 7 : 6; | |
|
1674 | return (srcSize >> minlog) + 2; | |
|
1675 | } | |
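
ZSTD_minGain() sets the minimum number of bytes a block (or literals section) must save before it is emitted as compressed. A worked check of the formula (srcSize >> minlog) + 2, using the constants shown above (sketch only):

    #include <assert.h>
    #include <stddef.h>

    static size_t min_gain(size_t srcSize, int isBtUltra)
    {
        unsigned const minlog = isBtUltra ? 7 : 6;
        return (srcSize >> minlog) + 2;
    }

    int main(void)
    {
        assert(min_gain(4096, 0) == 66);  /* 4096/64 + 2 */
        assert(min_gain(4096, 1) == 34);  /* 4096/128 + 2: btultra accepts smaller gains */
        return 0;
    }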
|
1676 | ||
|
1677 | static size_t ZSTD_compressLiterals (ZSTD_hufCTables_t const* prevHuf, | |
|
1678 | ZSTD_hufCTables_t* nextHuf, | |
|
1363 | 1679 | ZSTD_strategy strategy, int disableLiteralCompression, |
|
1364 | 1680 | void* dst, size_t dstCapacity, |
|
1365 | 1681 | const void* src, size_t srcSize, |
|
1366 | 1682 | U32* workspace, const int bmi2) |
|
1367 | 1683 | { |
|
1368 | size_t const minGain = ZSTD_minGain(srcSize); | |
|
1684 | size_t const minGain = ZSTD_minGain(srcSize, strategy); | |
|
1369 | 1685 | size_t const lhSize = 3 + (srcSize >= 1 KB) + (srcSize >= 16 KB); |
|
1370 | 1686 | BYTE* const ostart = (BYTE*)dst; |
|
1371 | 1687 | U32 singleStream = srcSize < 256; |
@@ -1376,27 +1692,25 b' static size_t ZSTD_compressLiterals (ZST' | |||
|
1376 | 1692 | disableLiteralCompression); |
|
1377 | 1693 | |
|
1378 | 1694 | /* Prepare nextEntropy assuming reuse of the existing table */
|
1379 | nextEntropy->hufCTable_repeatMode = prevEntropy->hufCTable_repeatMode; | |
|
1380 | memcpy(nextEntropy->hufCTable, prevEntropy->hufCTable, | |
|
1381 | sizeof(prevEntropy->hufCTable)); | |
|
1695 | memcpy(nextHuf, prevHuf, sizeof(*prevHuf)); | |
|
1382 | 1696 | |
|
1383 | 1697 | if (disableLiteralCompression) |
|
1384 | 1698 | return ZSTD_noCompressLiterals(dst, dstCapacity, src, srcSize); |
|
1385 | 1699 | |
|
1386 | 1700 | /* small ? don't even attempt compression (speed opt) */ |
|
1387 | 1701 | # define COMPRESS_LITERALS_SIZE_MIN 63 |
|
1388 | { size_t const minLitSize = (prevEntropy->hufCTable_repeatMode == HUF_repeat_valid) ? 6 : COMPRESS_LITERALS_SIZE_MIN; | |
1702 | { size_t const minLitSize = (prevHuf->repeatMode == HUF_repeat_valid) ? 6 : COMPRESS_LITERALS_SIZE_MIN; | |
|
1389 | 1703 | if (srcSize <= minLitSize) return ZSTD_noCompressLiterals(dst, dstCapacity, src, srcSize); |
|
1390 | 1704 | } |
|
1391 | 1705 | |
|
1392 | 1706 | if (dstCapacity < lhSize+1) return ERROR(dstSize_tooSmall); /* not enough space for compression */ |
|
1393 | { HUF_repeat repeat = prevEntropy->hufCTable_repeatMode; | |
1707 | { HUF_repeat repeat = prevHuf->repeatMode; | |
|
1394 | 1708 | int const preferRepeat = strategy < ZSTD_lazy ? srcSize <= 1024 : 0; |
|
1395 | 1709 | if (repeat == HUF_repeat_valid && lhSize == 3) singleStream = 1; |
|
1396 | 1710 | cLitSize = singleStream ? HUF_compress1X_repeat(ostart+lhSize, dstCapacity-lhSize, src, srcSize, 255, 11, |
|
1397 | workspace, HUF_WORKSPACE_SIZE, (HUF_CElt*)nextEntropy->hufCTable, &repeat, preferRepeat, bmi2) | |
1711 | workspace, HUF_WORKSPACE_SIZE, (HUF_CElt*)nextHuf->CTable, &repeat, preferRepeat, bmi2) | |
|
1398 | 1712 | : HUF_compress4X_repeat(ostart+lhSize, dstCapacity-lhSize, src, srcSize, 255, 11, |
|
1399 | workspace, HUF_WORKSPACE_SIZE, (HUF_CElt*)nextEntropy->hufCTable, &repeat, preferRepeat, bmi2); | |
1713 | workspace, HUF_WORKSPACE_SIZE, (HUF_CElt*)nextHuf->CTable, &repeat, preferRepeat, bmi2); | |
|
1400 | 1714 | if (repeat != HUF_repeat_none) { |
|
1401 | 1715 | /* reused the existing table */ |
|
1402 | 1716 | hType = set_repeat; |
@@ -1404,17 +1718,17 b' static size_t ZSTD_compressLiterals (ZST' | |||
|
1404 | 1718 | } |
|
1405 | 1719 | |
|
1406 | 1720 | if ((cLitSize==0) | (cLitSize >= srcSize - minGain) | ERR_isError(cLitSize)) { |
|
1407 | memcpy(nextEntropy->hufCTable, prevEntropy->hufCTable, sizeof(prevEntropy->hufCTable)); | |
1721 | memcpy(nextHuf, prevHuf, sizeof(*prevHuf)); | |
|
1408 | 1722 | return ZSTD_noCompressLiterals(dst, dstCapacity, src, srcSize); |
|
1409 | 1723 | } |
|
1410 | 1724 | if (cLitSize==1) { |
|
1411 | memcpy(nextEntropy->hufCTable, prevEntropy->hufCTable, sizeof(prevEntropy->hufCTable)); | |
1725 | memcpy(nextHuf, prevHuf, sizeof(*prevHuf)); | |
|
1412 | 1726 | return ZSTD_compressRleLiteralsBlock(dst, dstCapacity, src, srcSize); |
|
1413 | 1727 | } |
|
1414 | 1728 | |
|
1415 | 1729 | if (hType == set_compressed) { |
|
1416 | 1730 | /* using a newly constructed table */ |
|
1417 | nextEntropy->hufCTable_repeatMode = HUF_repeat_check; | |
1731 | nextHuf->repeatMode = HUF_repeat_check; | |
|
1418 | 1732 | } |
|
1419 | 1733 | |
|
1420 | 1734 | /* Build header */ |
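
For reference, the literals header built below is 3, 4, or 5 bytes: lhSize = 3 + (srcSize >= 1 KB) + (srcSize >= 16 KB), and inputs under 256 bytes default to a single Huffman stream. A quick sketch of the size decision in isolation (illustrative names):

    #include <assert.h>
    #include <stddef.h>

    static size_t literals_header_size(size_t srcSize)
    {
        return 3 + (srcSize >= 1024) + (srcSize >= 16 * 1024);
    }

    int main(void)
    {
        assert(literals_header_size(200)   == 3);  /* also single-stream by default */
        assert(literals_header_size(2000)  == 4);
        assert(literals_header_size(20000) == 5);
        return 0;
    }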
@@ -1451,6 +1765,7 b' void ZSTD_seqToCodes(const seqStore_t* s' | |||
|
1451 | 1765 | BYTE* const mlCodeTable = seqStorePtr->mlCode; |
|
1452 | 1766 | U32 const nbSeq = (U32)(seqStorePtr->sequences - seqStorePtr->sequencesStart); |
|
1453 | 1767 | U32 u; |
|
1768 | assert(nbSeq <= seqStorePtr->maxNbSeq); | |
|
1454 | 1769 | for (u=0; u<nbSeq; u++) { |
|
1455 | 1770 | U32 const llv = sequences[u].litLength; |
|
1456 | 1771 | U32 const mlv = sequences[u].matchLength; |
@@ -1464,61 +1779,234 b' void ZSTD_seqToCodes(const seqStore_t* s' | |||
|
1464 | 1779 | mlCodeTable[seqStorePtr->longLengthPos] = MaxML; |
|
1465 | 1780 | } |
|
1466 | 1781 | |
|
1782 | ||
|
1783 | /** | |
|
1784 | * -log2(x / 256) lookup table for x in [0, 256). | |
|
1785 | * If x == 0: Return 0 | |
|
1786 | * Else: Return floor(-log2(x / 256) * 256) | |
|
1787 | */ | |
|
1788 | static unsigned const kInverseProbabiltyLog256[256] = { | |
|
1789 | 0, 2048, 1792, 1642, 1536, 1453, 1386, 1329, 1280, 1236, 1197, 1162, | |
|
1790 | 1130, 1100, 1073, 1047, 1024, 1001, 980, 960, 941, 923, 906, 889, | |
|
1791 | 874, 859, 844, 830, 817, 804, 791, 779, 768, 756, 745, 734, | |
|
1792 | 724, 714, 704, 694, 685, 676, 667, 658, 650, 642, 633, 626, | |
|
1793 | 618, 610, 603, 595, 588, 581, 574, 567, 561, 554, 548, 542, | |
|
1794 | 535, 529, 523, 517, 512, 506, 500, 495, 489, 484, 478, 473, | |
|
1795 | 468, 463, 458, 453, 448, 443, 438, 434, 429, 424, 420, 415, | |
|
1796 | 411, 407, 402, 398, 394, 390, 386, 382, 377, 373, 370, 366, | |
|
1797 | 362, 358, 354, 350, 347, 343, 339, 336, 332, 329, 325, 322, | |
|
1798 | 318, 315, 311, 308, 305, 302, 298, 295, 292, 289, 286, 282, | |
|
1799 | 279, 276, 273, 270, 267, 264, 261, 258, 256, 253, 250, 247, | |
|
1800 | 244, 241, 239, 236, 233, 230, 228, 225, 222, 220, 217, 215, | |
|
1801 | 212, 209, 207, 204, 202, 199, 197, 194, 192, 190, 187, 185, | |
|
1802 | 182, 180, 178, 175, 173, 171, 168, 166, 164, 162, 159, 157, | |
|
1803 | 155, 153, 151, 149, 146, 144, 142, 140, 138, 136, 134, 132, | |
|
1804 | 130, 128, 126, 123, 121, 119, 117, 115, 114, 112, 110, 108, | |
|
1805 | 106, 104, 102, 100, 98, 96, 94, 93, 91, 89, 87, 85, | |
|
1806 | 83, 82, 80, 78, 76, 74, 73, 71, 69, 67, 66, 64, | |
|
1807 | 62, 61, 59, 57, 55, 54, 52, 50, 49, 47, 46, 44, | |
|
1808 | 42, 41, 39, 37, 36, 34, 33, 31, 30, 28, 26, 25, | |
|
1809 | 23, 22, 20, 19, 17, 16, 14, 13, 11, 10, 8, 7, | |
|
1810 | 5, 4, 2, 1, | |
|
1811 | }; | |
|
1812 | ||
|
1813 | ||
|
1814 | /** | |
|
1815 | * Returns the cost in bits of encoding the distribution described by count | |
|
1816 | * using the entropy bound. | |
|
1817 | */ | |
|
1818 | static size_t ZSTD_entropyCost(unsigned const* count, unsigned const max, size_t const total) | |
|
1819 | { | |
|
1820 | unsigned cost = 0; | |
|
1821 | unsigned s; | |
|
1822 | for (s = 0; s <= max; ++s) { | |
|
1823 | unsigned norm = (unsigned)((256 * count[s]) / total); | |
|
1824 | if (count[s] != 0 && norm == 0) | |
|
1825 | norm = 1; | |
|
1826 | assert(count[s] < total); | |
|
1827 | cost += count[s] * kInverseProbabiltyLog256[norm]; | |
|
1828 | } | |
|
1829 | return cost >> 8; | |
|
1830 | } | |
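
Each kInverseProbabiltyLog256 entry is floor(-log2(x / 256) * 256), i.e. a negative log-probability in 1/256th-of-a-bit units, so ZSTD_entropyCost() accumulates count[s] * -log2(p(s)) in fixed point and shifts right by 8 to get whole bits. A sketch deriving one entry and the cost of a skewed distribution in plain floating point (for checking only; the real code stays in integer arithmetic):

    #include <assert.h>
    #include <math.h>
    #include <stdio.h>

    int main(void)
    {
        /* Derive one table entry: x = 128 => -log2(128/256) = 1 bit => 256. */
        unsigned const x = 128;
        unsigned const entry = (unsigned)floor(-log2((double)x / 256.0) * 256.0);
        assert(entry == 256);

        /* Entropy cost of a 3:1 distribution over two symbols, in bits. */
        unsigned const count[2] = { 192, 64 };   /* total = 256 */
        double bits = 0.0;
        for (int s = 0; s < 2; ++s)
            bits += count[s] * -log2(count[s] / 256.0);
        printf("~%.0f bits\n", bits);  /* ~208 bits for these 256 symbols */
        return 0;
    }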
|
1831 | ||
|
1832 | ||
|
1833 | /** | |
|
1834 | * Returns the cost in bits of encoding the distribution in count using the | |
|
1835 | * table described by norm. The max symbol supported by norm is assumed >= max. | |
|
1836 | * norm must be valid for every symbol with non-zero probability in count. | |
|
1837 | */ | |
|
1838 | static size_t ZSTD_crossEntropyCost(short const* norm, unsigned accuracyLog, | |
|
1839 | unsigned const* count, unsigned const max) | |
|
1840 | { | |
|
1841 | unsigned const shift = 8 - accuracyLog; | |
|
1842 | size_t cost = 0; | |
|
1843 | unsigned s; | |
|
1844 | assert(accuracyLog <= 8); | |
|
1845 | for (s = 0; s <= max; ++s) { | |
|
1846 | unsigned const normAcc = norm[s] != -1 ? norm[s] : 1; | |
|
1847 | unsigned const norm256 = normAcc << shift; | |
|
1848 | assert(norm256 > 0); | |
|
1849 | assert(norm256 < 256); | |
|
1850 | cost += count[s] * kInverseProbabiltyLog256[norm256]; | |
|
1851 | } | |
|
1852 | return cost >> 8; | |
|
1853 | } | |
|
1854 | ||
|
1855 | ||
|
1856 | static unsigned ZSTD_getFSEMaxSymbolValue(FSE_CTable const* ctable) { | |
|
1857 | void const* ptr = ctable; | |
|
1858 | U16 const* u16ptr = (U16 const*)ptr; | |
|
1859 | U32 const maxSymbolValue = MEM_read16(u16ptr + 1); | |
|
1860 | return maxSymbolValue; | |
|
1861 | } | |
|
1862 | ||
|
1863 | ||
|
1864 | /** | |
|
1865 | * Returns the cost in bits of encoding the distribution in count using ctable. | |
|
1866 | * Returns an error if ctable cannot represent all the symbols in count. | |
|
1867 | */ | |
|
1868 | static size_t ZSTD_fseBitCost( | |
|
1869 | FSE_CTable const* ctable, | |
|
1870 | unsigned const* count, | |
|
1871 | unsigned const max) | |
|
1872 | { | |
|
1873 | unsigned const kAccuracyLog = 8; | |
|
1874 | size_t cost = 0; | |
|
1875 | unsigned s; | |
|
1876 | FSE_CState_t cstate; | |
|
1877 | FSE_initCState(&cstate, ctable); | |
|
1878 | if (ZSTD_getFSEMaxSymbolValue(ctable) < max) { | |
|
1879 | DEBUGLOG(5, "Repeat FSE_CTable has maxSymbolValue %u < %u", | |
|
1880 | ZSTD_getFSEMaxSymbolValue(ctable), max); | |
|
1881 | return ERROR(GENERIC); | |
|
1882 | } | |
|
1883 | for (s = 0; s <= max; ++s) { | |
|
1884 | unsigned const tableLog = cstate.stateLog; | |
|
1885 | unsigned const badCost = (tableLog + 1) << kAccuracyLog; | |
|
1886 | unsigned const bitCost = FSE_bitCost(cstate.symbolTT, tableLog, s, kAccuracyLog); | |
|
1887 | if (count[s] == 0) | |
|
1888 | continue; | |
|
1889 | if (bitCost >= badCost) { | |
|
1890 | DEBUGLOG(5, "Repeat FSE_CTable has Prob[%u] == 0", s); | |
|
1891 | return ERROR(GENERIC); | |
|
1892 | } | |
|
1893 | cost += count[s] * bitCost; | |
|
1894 | } | |
|
1895 | return cost >> kAccuracyLog; | |
|
1896 | } | |
|
1897 | ||
|
1898 | /** | |
|
1899 | * Returns the cost in bytes of encoding the normalized count header. | |
|
1900 | * Returns an error if any of the helper functions return an error. | |
|
1901 | */ | |
|
1902 | static size_t ZSTD_NCountCost(unsigned const* count, unsigned const max, | |
|
1903 | size_t const nbSeq, unsigned const FSELog) | |
|
1904 | { | |
|
1905 | BYTE wksp[FSE_NCOUNTBOUND]; | |
|
1906 | S16 norm[MaxSeq + 1]; | |
|
1907 | const U32 tableLog = FSE_optimalTableLog(FSELog, nbSeq, max); | |
|
1908 | CHECK_F(FSE_normalizeCount(norm, tableLog, count, nbSeq, max)); | |
|
1909 | return FSE_writeNCount(wksp, sizeof(wksp), norm, max, tableLog); | |
|
1910 | } | |
|
1911 | ||
|
1912 | ||
|
1467 | 1913 | typedef enum { |
|
1468 | 1914 | ZSTD_defaultDisallowed = 0, |
|
1469 | 1915 | ZSTD_defaultAllowed = 1 |
|
1470 | 1916 | } ZSTD_defaultPolicy_e; |
|
1471 | 1917 | |
|
1472 | MEM_STATIC | |
|
1473 | symbolEncodingType_e ZSTD_selectEncodingType( | |
1474 | FSE_repeat* repeatMode, size_t const mostFrequent, size_t nbSeq, | |
1475 | U32 defaultNormLog, ZSTD_defaultPolicy_e const isDefaultAllowed) | |
|
1918 | MEM_STATIC symbolEncodingType_e | |
|
1919 | ZSTD_selectEncodingType( | |
|
1920 | FSE_repeat* repeatMode, unsigned const* count, unsigned const max, | |
|
1921 | size_t const mostFrequent, size_t nbSeq, unsigned const FSELog, | |
|
1922 | FSE_CTable const* prevCTable, | |
|
1923 | short const* defaultNorm, U32 defaultNormLog, | |
|
1924 | ZSTD_defaultPolicy_e const isDefaultAllowed, | |
|
1925 | ZSTD_strategy const strategy) | |
|
1476 | 1926 | { |
|
1477 | #define MIN_SEQ_FOR_DYNAMIC_FSE 64 | |
|
1478 | #define MAX_SEQ_FOR_STATIC_FSE 1000 | |
|
1479 | 1927 | ZSTD_STATIC_ASSERT(ZSTD_defaultDisallowed == 0 && ZSTD_defaultAllowed != 0); |
|
1480 | if ((mostFrequent == nbSeq) && (!isDefaultAllowed || nbSeq > 2)) { | |
1928 | if (mostFrequent == nbSeq) { | |
|
1929 | *repeatMode = FSE_repeat_none; | |
|
1930 | if (isDefaultAllowed && nbSeq <= 2) { | |
|
1931 | /* Prefer set_basic over set_rle when there are 2 or less symbols, | |
|
1932 | * since RLE uses 1 byte, but set_basic uses 5-6 bits per symbol. | |
|
1933 | * If basic encoding isn't possible, always choose RLE. | |
|
1934 | */ | |
|
1935 | DEBUGLOG(5, "Selected set_basic"); | |
|
1936 | return set_basic; | |
|
1937 | } | |
|
1481 | 1938 | DEBUGLOG(5, "Selected set_rle"); |
|
1482 | /* Prefer set_basic over set_rle when there are 2 or less symbols, | |
|
1483 | * since RLE uses 1 byte, but set_basic uses 5-6 bits per symbol. | |
|
1484 | * If basic encoding isn't possible, always choose RLE. | |
|
1485 | */ | |
|
1486 | *repeatMode = FSE_repeat_check; | |
|
1487 | 1939 | return set_rle; |
|
1488 | 1940 | } |
|
1489 | if ( isDefaultAllowed | |
|
1490 | && (*repeatMode == FSE_repeat_valid) && (nbSeq < MAX_SEQ_FOR_STATIC_FSE)) { | |
|
1491 | DEBUGLOG(5, "Selected set_repeat"); | |
|
1492 | return set_repeat; | |
|
1493 | } | |
|
1494 | if ( isDefaultAllowed | |
|
1495 | && ((nbSeq < MIN_SEQ_FOR_DYNAMIC_FSE) || (mostFrequent < (nbSeq >> (defaultNormLog-1)))) ) { | |
|
1496 | DEBUGLOG(5, "Selected set_basic"); | |
|
1497 | /* The format allows default tables to be repeated, but it isn't useful. | |
|
1498 | * When using simple heuristics to select encoding type, we don't want | |
|
1499 | * to confuse these tables with dictionaries. When running more careful | |
|
1500 | * analysis, we don't need to waste time checking both repeating tables | |
|
1501 | * and default tables. | |
|
1502 | */ | |
|
1503 | *repeatMode = FSE_repeat_none; | |
|
1504 | return set_basic; | |
|
1941 | if (strategy < ZSTD_lazy) { | |
|
1942 | if (isDefaultAllowed) { | |
|
1943 | size_t const staticFse_nbSeq_max = 1000; | |
|
1944 | size_t const mult = 10 - strategy; | |
|
1945 | size_t const baseLog = 3; | |
|
1946 | size_t const dynamicFse_nbSeq_min = (((size_t)1 << defaultNormLog) * mult) >> baseLog; /* 28-36 for offset, 56-72 for lengths */ | |
|
1947 | assert(defaultNormLog >= 5 && defaultNormLog <= 6); /* xx_DEFAULTNORMLOG */ | |
|
1948 | assert(mult <= 9 && mult >= 7); | |
|
1949 | if ( (*repeatMode == FSE_repeat_valid) | |
|
1950 | && (nbSeq < staticFse_nbSeq_max) ) { | |
|
1951 | DEBUGLOG(5, "Selected set_repeat"); | |
|
1952 | return set_repeat; | |
|
1953 | } | |
|
1954 | if ( (nbSeq < dynamicFse_nbSeq_min) | |
|
1955 | || (mostFrequent < (nbSeq >> (defaultNormLog-1))) ) { | |
|
1956 | DEBUGLOG(5, "Selected set_basic"); | |
|
1957 | /* The format allows default tables to be repeated, but it isn't useful. | |
|
1958 | * When using simple heuristics to select encoding type, we don't want | |
|
1959 | * to confuse these tables with dictionaries. When running more careful | |
|
1960 | * analysis, we don't need to waste time checking both repeating tables | |
|
1961 | * and default tables. | |
|
1962 | */ | |
|
1963 | *repeatMode = FSE_repeat_none; | |
|
1964 | return set_basic; | |
|
1965 | } | |
|
1966 | } | |
|
1967 | } else { | |
|
1968 | size_t const basicCost = isDefaultAllowed ? ZSTD_crossEntropyCost(defaultNorm, defaultNormLog, count, max) : ERROR(GENERIC); | |
|
1969 | size_t const repeatCost = *repeatMode != FSE_repeat_none ? ZSTD_fseBitCost(prevCTable, count, max) : ERROR(GENERIC); | |
|
1970 | size_t const NCountCost = ZSTD_NCountCost(count, max, nbSeq, FSELog); | |
|
1971 | size_t const compressedCost = (NCountCost << 3) + ZSTD_entropyCost(count, max, nbSeq); | |
|
1972 | ||
|
1973 | if (isDefaultAllowed) { | |
|
1974 | assert(!ZSTD_isError(basicCost)); | |
|
1975 | assert(!(*repeatMode == FSE_repeat_valid && ZSTD_isError(repeatCost))); | |
|
1976 | } | |
|
1977 | assert(!ZSTD_isError(NCountCost)); | |
|
1978 | assert(compressedCost < ERROR(maxCode)); | |
|
1979 | DEBUGLOG(5, "Estimated bit costs: basic=%u\trepeat=%u\tcompressed=%u", | |
|
1980 | (U32)basicCost, (U32)repeatCost, (U32)compressedCost); | |
|
1981 | if (basicCost <= repeatCost && basicCost <= compressedCost) { | |
|
1982 | DEBUGLOG(5, "Selected set_basic"); | |
|
1983 | assert(isDefaultAllowed); | |
|
1984 | *repeatMode = FSE_repeat_none; | |
|
1985 | return set_basic; | |
|
1986 | } | |
|
1987 | if (repeatCost <= compressedCost) { | |
|
1988 | DEBUGLOG(5, "Selected set_repeat"); | |
|
1989 | assert(!ZSTD_isError(repeatCost)); | |
|
1990 | return set_repeat; | |
|
1991 | } | |
|
1992 | assert(compressedCost < basicCost && compressedCost < repeatCost); | |
|
1505 | 1993 | } |
|
1506 | 1994 | DEBUGLOG(5, "Selected set_compressed"); |
|
1507 | 1995 | *repeatMode = FSE_repeat_check; |
|
1508 | 1996 | return set_compressed; |
|
1509 | 1997 | } |
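
For strategies >= ZSTD_lazy the function above now compares estimated bit costs instead of using fixed thresholds. A simplified standalone version of that comparison, using floating-point entropy in place of the fixed-point helpers (illustrative only; the set_repeat branch is omitted):

    #include <math.h>
    #include <stddef.h>
    #include <stdio.h>

    typedef enum { SET_BASIC, SET_COMPRESSED } enc_type;

    /* Shannon cost in bits of coding `count` with its own statistics. */
    static double entropy_bits(const unsigned* count, unsigned max, size_t total)
    {
        double bits = 0.0;
        for (unsigned s = 0; s <= max; ++s)
            if (count[s]) bits += count[s] * -log2((double)count[s] / (double)total);
        return bits;
    }

    /* Cross-entropy cost of coding `count` with a fixed default distribution. */
    static double cross_entropy_bits(const double* defaultProb, const unsigned* count, unsigned max)
    {
        double bits = 0.0;
        for (unsigned s = 0; s <= max; ++s)
            if (count[s]) bits += count[s] * -log2(defaultProb[s]);
        return bits;
    }

    /* Building a custom table costs `headerBits` up front (the NCount header),
     * so it only wins when the entropy saving covers that overhead. */
    static enc_type select_encoding(const double* defaultProb, const unsigned* count,
                                    unsigned max, size_t total, double headerBits)
    {
        double const basicCost = cross_entropy_bits(defaultProb, count, max);
        double const compressedCost = headerBits + entropy_bits(count, max, total);
        return (basicCost <= compressedCost) ? SET_BASIC : SET_COMPRESSED;
    }

    int main(void)
    {
        double const def[2] = { 0.5, 0.5 };        /* uniform default table */
        unsigned const skewed[2] = { 240, 16 };    /* heavily skewed stats */
        printf("%s\n", select_encoding(def, skewed, 1, 256, 40.0) == SET_COMPRESSED
                       ? "set_compressed" : "set_basic");
        return 0;
    }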
|
1510 | 1998 | |
|
1511 | MEM_STATIC | |
|
1512 | size_t ZSTD_buildCTable(void* dst, size_t dstCapacity, | |
1513 | FSE_CTable* nextCTable, U32 FSELog, symbolEncodingType_e type, | |
|
1514 | U32* count, U32 max, | |
|
1515 | BYTE const* codeTable, size_t nbSeq, | |
1516 | S16 const* defaultNorm, U32 defaultNormLog, U32 defaultMax, | |
1517 | FSE_CTable const* prevCTable, size_t prevCTableSize, | |
1518 | void* workspace, size_t workspaceSize) | |
|
1999 | MEM_STATIC size_t | |
|
2000 | ZSTD_buildCTable(void* dst, size_t dstCapacity, | |
|
2001 | FSE_CTable* nextCTable, U32 FSELog, symbolEncodingType_e type, | |
|
2002 | U32* count, U32 max, | |
|
2003 | const BYTE* codeTable, size_t nbSeq, | |
|
2004 | const S16* defaultNorm, U32 defaultNormLog, U32 defaultMax, | |
|
2005 | const FSE_CTable* prevCTable, size_t prevCTableSize, | |
|
2006 | void* workspace, size_t workspaceSize) | |
|
1519 | 2007 | { |
|
1520 | 2008 | BYTE* op = (BYTE*)dst; |
|
1521 | BYTE* const oend = op + dstCapacity; | |
2009 | const BYTE* const oend = op + dstCapacity; | |
|
1522 | 2010 | |
|
1523 | 2011 | switch (type) { |
|
1524 | 2012 | case set_rle: |
@@ -1674,7 +2162,7 b' ZSTD_encodeSequences_bmi2(' | |||
|
1674 | 2162 | |
|
1675 | 2163 | #endif |
|
1676 | 2164 | |
|
1677 | size_t ZSTD_encodeSequences( | |
|
2165 | static size_t ZSTD_encodeSequences( | |
|
1678 | 2166 | void* dst, size_t dstCapacity, |
|
1679 | 2167 | FSE_CTable const* CTable_MatchLength, BYTE const* mlCodeTable, |
|
1680 | 2168 | FSE_CTable const* CTable_OffsetBits, BYTE const* ofCodeTable, |
@@ -1706,10 +2194,11 b' MEM_STATIC size_t ZSTD_compressSequences' | |||
|
1706 | 2194 | const int bmi2) |
|
1707 | 2195 | { |
|
1708 | 2196 | const int longOffsets = cctxParams->cParams.windowLog > STREAM_ACCUMULATOR_MIN; |
|
2197 | ZSTD_strategy const strategy = cctxParams->cParams.strategy; | |
|
1709 | 2198 | U32 count[MaxSeq+1]; |
|
1710 | FSE_CTable* CTable_LitLength = nextEntropy->litlengthCTable; | |
|
1711 | FSE_CTable* CTable_OffsetBits = nextEntropy->offcodeCTable; | |
|
1712 | FSE_CTable* CTable_MatchLength = nextEntropy->matchlengthCTable; | |
|
2199 | FSE_CTable* CTable_LitLength = nextEntropy->fse.litlengthCTable; | |
|
2200 | FSE_CTable* CTable_OffsetBits = nextEntropy->fse.offcodeCTable; | |
|
2201 | FSE_CTable* CTable_MatchLength = nextEntropy->fse.matchlengthCTable; | |
|
1713 | 2202 | U32 LLtype, Offtype, MLtype; /* compressed, raw or rle */ |
|
1714 | 2203 | const seqDef* const sequences = seqStorePtr->sequencesStart; |
|
1715 | 2204 | const BYTE* const ofCodeTable = seqStorePtr->ofCode; |
@@ -1720,15 +2209,17 b' MEM_STATIC size_t ZSTD_compressSequences' | |||
|
1720 | 2209 | BYTE* op = ostart; |
|
1721 | 2210 | size_t const nbSeq = seqStorePtr->sequences - seqStorePtr->sequencesStart; |
|
1722 | 2211 | BYTE* seqHead; |
|
2212 | BYTE* lastNCount = NULL; | |
|
1723 | 2213 | |
|
1724 | 2214 | ZSTD_STATIC_ASSERT(HUF_WORKSPACE_SIZE >= (1<<MAX(MLFSELog,LLFSELog))); |
|
1725 | 2215 | |
|
1726 | 2216 | /* Compress literals */ |
|
1727 | 2217 | { const BYTE* const literals = seqStorePtr->litStart; |
|
1728 | 2218 | size_t const litSize = seqStorePtr->lit - literals; |
|
2219 | int const disableLiteralCompression = (cctxParams->cParams.strategy == ZSTD_fast) && (cctxParams->cParams.targetLength > 0); | |
|
1729 | 2220 | size_t const cSize = ZSTD_compressLiterals( |
|
1730 | prevEntropy, nextEntropy, | |
|
1731 | cctxParams->cParams.strategy, cctxParams->disableLiteralCompression, | |
2221 | &prevEntropy->huf, &nextEntropy->huf, | |
|
2222 | cctxParams->cParams.strategy, disableLiteralCompression, | |
|
1732 | 2223 | op, dstCapacity, |
|
1733 | 2224 | literals, litSize, |
|
1734 | 2225 | workspace, bmi2); |
@@ -1747,13 +2238,9 b' MEM_STATIC size_t ZSTD_compressSequences' | |||
|
1747 | 2238 | else |
|
1748 | 2239 | op[0]=0xFF, MEM_writeLE16(op+1, (U16)(nbSeq - LONGNBSEQ)), op+=3; |
|
1749 | 2240 | if (nbSeq==0) { |
|
1750 | memcpy(nextEntropy->litlengthCTable, prevEntropy->litlengthCTable, sizeof(prevEntropy->litlengthCTable)); | |
|
1751 | nextEntropy->litlength_repeatMode = prevEntropy->litlength_repeatMode; | |
|
1752 | memcpy(nextEntropy->offcodeCTable, prevEntropy->offcodeCTable, sizeof(prevEntropy->offcodeCTable)); | |
|
1753 | nextEntropy->offcode_repeatMode = prevEntropy->offcode_repeatMode; | |
|
1754 | memcpy(nextEntropy->matchlengthCTable, prevEntropy->matchlengthCTable, sizeof(prevEntropy->matchlengthCTable)); | |
|
1755 | nextEntropy->matchlength_repeatMode = prevEntropy->matchlength_repeatMode; | |
|
1756 | return op - ostart; | |
|
2241 | /* Copy the old tables over as if we repeated them */ | |
|
2242 | memcpy(&nextEntropy->fse, &prevEntropy->fse, sizeof(prevEntropy->fse)); | |
|
2243 | return op - ostart; | |
|
1757 | 2244 | } |
|
1758 | 2245 | |
|
1759 | 2246 | /* seqHead : flags for FSE encoding type */ |
@@ -1763,43 +2250,53 b' MEM_STATIC size_t ZSTD_compressSequences' | |||
|
1763 | 2250 | ZSTD_seqToCodes(seqStorePtr); |
|
1764 | 2251 | /* build CTable for Literal Lengths */ |
|
1765 | 2252 | { U32 max = MaxLL; |
|
1766 | size_t const mostFrequent = FSE_countFast_wksp(count, &max, llCodeTable, nbSeq, workspace); /* can't fail */ | |
2253 | size_t const mostFrequent = HIST_countFast_wksp(count, &max, llCodeTable, nbSeq, workspace); /* can't fail */ | |
|
1767 | 2254 | DEBUGLOG(5, "Building LL table"); |
|
1768 | nextEntropy->litlength_repeatMode = prevEntropy->litlength_repeatMode; | |
|
1769 | LLtype = ZSTD_selectEncodingType(&nextEntropy->litlength_repeatMode, mostFrequent, nbSeq, LL_defaultNormLog, ZSTD_defaultAllowed); | |
|
2255 | nextEntropy->fse.litlength_repeatMode = prevEntropy->fse.litlength_repeatMode; | |
|
2256 | LLtype = ZSTD_selectEncodingType(&nextEntropy->fse.litlength_repeatMode, count, max, mostFrequent, nbSeq, LLFSELog, prevEntropy->fse.litlengthCTable, LL_defaultNorm, LL_defaultNormLog, ZSTD_defaultAllowed, strategy); | |
|
2257 | assert(set_basic < set_compressed && set_rle < set_compressed); | |
|
2258 | assert(!(LLtype < set_compressed && nextEntropy->fse.litlength_repeatMode != FSE_repeat_none)); /* We don't copy tables */ | |
|
1770 | 2259 | { size_t const countSize = ZSTD_buildCTable(op, oend - op, CTable_LitLength, LLFSELog, (symbolEncodingType_e)LLtype, |
|
1771 | count, max, llCodeTable, nbSeq, LL_defaultNorm, LL_defaultNormLog, MaxLL, | |
|
1772 | prevEntropy->litlengthCTable, sizeof(prevEntropy->litlengthCTable), | |
|
1773 | workspace, HUF_WORKSPACE_SIZE); | |
|
2260 | count, max, llCodeTable, nbSeq, LL_defaultNorm, LL_defaultNormLog, MaxLL, | |
|
2261 | prevEntropy->fse.litlengthCTable, sizeof(prevEntropy->fse.litlengthCTable), | |
|
2262 | workspace, HUF_WORKSPACE_SIZE); | |
|
1774 | 2263 | if (ZSTD_isError(countSize)) return countSize; |
|
2264 | if (LLtype == set_compressed) | |
|
2265 | lastNCount = op; | |
|
1775 | 2266 | op += countSize; |
|
1776 | 2267 | } } |
|
1777 | 2268 | /* build CTable for Offsets */ |
|
1778 | 2269 | { U32 max = MaxOff; |
|
1779 | size_t const mostFrequent = FSE_countFast_wksp(count, &max, ofCodeTable, nbSeq, workspace); /* can't fail */ | |
2270 | size_t const mostFrequent = HIST_countFast_wksp(count, &max, ofCodeTable, nbSeq, workspace); /* can't fail */ | |
|
1780 | 2271 | /* We can only use the basic table if max <= DefaultMaxOff, otherwise the offsets are too large */ |
|
1781 | 2272 | ZSTD_defaultPolicy_e const defaultPolicy = (max <= DefaultMaxOff) ? ZSTD_defaultAllowed : ZSTD_defaultDisallowed; |
|
1782 | 2273 | DEBUGLOG(5, "Building OF table"); |
|
1783 | nextEntropy->offcode_repeatMode = prevEntropy->offcode_repeatMode; | |
|
1784 | Offtype = ZSTD_selectEncodingType(&nextEntropy->offcode_repeatMode, mostFrequent, nbSeq, OF_defaultNormLog, defaultPolicy); | |
|
2274 | nextEntropy->fse.offcode_repeatMode = prevEntropy->fse.offcode_repeatMode; | |
|
2275 | Offtype = ZSTD_selectEncodingType(&nextEntropy->fse.offcode_repeatMode, count, max, mostFrequent, nbSeq, OffFSELog, prevEntropy->fse.offcodeCTable, OF_defaultNorm, OF_defaultNormLog, defaultPolicy, strategy); | |
|
2276 | assert(!(Offtype < set_compressed && nextEntropy->fse.offcode_repeatMode != FSE_repeat_none)); /* We don't copy tables */ | |
|
1785 | 2277 | { size_t const countSize = ZSTD_buildCTable(op, oend - op, CTable_OffsetBits, OffFSELog, (symbolEncodingType_e)Offtype, |
|
1786 | count, max, ofCodeTable, nbSeq, OF_defaultNorm, OF_defaultNormLog, DefaultMaxOff, | |
|
1787 | prevEntropy->offcodeCTable, sizeof(prevEntropy->offcodeCTable), | |
|
1788 | workspace, HUF_WORKSPACE_SIZE); | |
|
2278 | count, max, ofCodeTable, nbSeq, OF_defaultNorm, OF_defaultNormLog, DefaultMaxOff, | |
|
2279 | prevEntropy->fse.offcodeCTable, sizeof(prevEntropy->fse.offcodeCTable), | |
|
2280 | workspace, HUF_WORKSPACE_SIZE); | |
|
1789 | 2281 | if (ZSTD_isError(countSize)) return countSize; |
|
2282 | if (Offtype == set_compressed) | |
|
2283 | lastNCount = op; | |
|
1790 | 2284 | op += countSize; |
|
1791 | 2285 | } } |
|
1792 | 2286 | /* build CTable for MatchLengths */ |
|
1793 | 2287 | { U32 max = MaxML; |
|
1794 | size_t const mostFrequent = FSE_countFast_wksp(count, &max, mlCodeTable, nbSeq, workspace); /* can't fail */ | |
2288 | size_t const mostFrequent = HIST_countFast_wksp(count, &max, mlCodeTable, nbSeq, workspace); /* can't fail */ | |
|
1795 | 2289 | DEBUGLOG(5, "Building ML table"); |
|
1796 | nextEntropy->matchlength_repeatMode = prevEntropy->matchlength_repeatMode; | |
|
1797 | MLtype = ZSTD_selectEncodingType(&nextEntropy->matchlength_repeatMode, mostFrequent, nbSeq, ML_defaultNormLog, ZSTD_defaultAllowed); | |
|
2290 | nextEntropy->fse.matchlength_repeatMode = prevEntropy->fse.matchlength_repeatMode; | |
|
2291 | MLtype = ZSTD_selectEncodingType(&nextEntropy->fse.matchlength_repeatMode, count, max, mostFrequent, nbSeq, MLFSELog, prevEntropy->fse.matchlengthCTable, ML_defaultNorm, ML_defaultNormLog, ZSTD_defaultAllowed, strategy); | |
|
2292 | assert(!(MLtype < set_compressed && nextEntropy->fse.matchlength_repeatMode != FSE_repeat_none)); /* We don't copy tables */ | |
|
1798 | 2293 | { size_t const countSize = ZSTD_buildCTable(op, oend - op, CTable_MatchLength, MLFSELog, (symbolEncodingType_e)MLtype, |
|
1799 | count, max, mlCodeTable, nbSeq, ML_defaultNorm, ML_defaultNormLog, MaxML, | |
|
1800 | prevEntropy->matchlengthCTable, sizeof(prevEntropy->matchlengthCTable), | |
|
1801 | workspace, HUF_WORKSPACE_SIZE); | |
|
2294 | count, max, mlCodeTable, nbSeq, ML_defaultNorm, ML_defaultNormLog, MaxML, | |
|
2295 | prevEntropy->fse.matchlengthCTable, sizeof(prevEntropy->fse.matchlengthCTable), | |
|
2296 | workspace, HUF_WORKSPACE_SIZE); | |
|
1802 | 2297 | if (ZSTD_isError(countSize)) return countSize; |
|
2298 | if (MLtype == set_compressed) | |
|
2299 | lastNCount = op; | |
|
1803 | 2300 | op += countSize; |
|
1804 | 2301 | } } |
|
1805 | 2302 | |
@@ -1814,21 +2311,37 b' MEM_STATIC size_t ZSTD_compressSequences' | |||
|
1814 | 2311 | longOffsets, bmi2); |
|
1815 | 2312 | if (ZSTD_isError(bitstreamSize)) return bitstreamSize; |
|
1816 | 2313 | op += bitstreamSize; |
|
2314 | /* zstd versions <= 1.3.4 mistakenly report corruption when | |
|
2315 | * FSE_readNCount() receives a buffer < 4 bytes. | |
|
2316 | * Fixed by https://github.com/facebook/zstd/pull/1146. | |
|
2317 | * This can happen when the last set_compressed table present is 2 | |
|
2318 | * bytes and the bitstream is only one byte. | |
|
2319 | * In this exceedingly rare case, we will simply emit an uncompressed | |
|
2320 | * block, since it isn't worth optimizing. | |
|
2321 | */ | |
|
2322 | if (lastNCount && (op - lastNCount) < 4) { | |
|
2323 | /* NCountSize >= 2 && bitstreamSize > 0 ==> lastCountSize == 3 */ | |
|
2324 | assert(op - lastNCount == 3); | |
|
2325 | DEBUGLOG(5, "Avoiding bug in zstd decoder in versions <= 1.3.4 by " | |
|
2326 | "emitting an uncompressed block."); | |
|
2327 | return 0; | |
|
2328 | } | |
|
1817 | 2329 | } |
|
1818 | 2330 | |
|
1819 | 2331 | return op - ostart; |
|
1820 | 2332 | } |
|
1821 | 2333 | |
|
1822 | 2334 | MEM_STATIC size_t ZSTD_compressSequences(seqStore_t* seqStorePtr, |
|
1823 | ZSTD_entropyCTables_t const* prevEntropy, | |
2335 | const ZSTD_entropyCTables_t* prevEntropy, | |
|
1824 | 2336 | ZSTD_entropyCTables_t* nextEntropy, |
|
1825 | ZSTD_CCtx_params const* cctxParams, | |
2337 | const ZSTD_CCtx_params* cctxParams, | |
|
1826 | 2338 | void* dst, size_t dstCapacity, |
|
1827 | 2339 | size_t srcSize, U32* workspace, int bmi2) |
|
1828 | 2340 | { |
|
1829 | 2341 | size_t const cSize = ZSTD_compressSequences_internal( |
|
1830 | 2342 | seqStorePtr, prevEntropy, nextEntropy, cctxParams, dst, dstCapacity, |
|
1831 | 2343 | workspace, bmi2); |
|
2344 | if (cSize == 0) return 0; | |
|
1832 | 2345 | /* When srcSize <= dstCapacity, there is enough space to write a raw uncompressed block. |
|
1833 | 2346 | * Since we ran out of space, the block must not be compressible, so fall back to a raw uncompressed block.
|
1834 | 2347 | */ |
@@ -1837,40 +2350,55 b' MEM_STATIC size_t ZSTD_compressSequences' | |||
|
1837 | 2350 | if (ZSTD_isError(cSize)) return cSize; |
|
1838 | 2351 | |
|
1839 | 2352 | /* Check compressibility */ |
|
1840 | { size_t const maxCSize = srcSize - ZSTD_minGain(srcSize); | |
2353 | { size_t const maxCSize = srcSize - ZSTD_minGain(srcSize, cctxParams->cParams.strategy); | |
|
1841 | 2354 | if (cSize >= maxCSize) return 0; /* block not compressed */ |
|
1842 | 2355 | } |
|
1843 | 2356 | |
|
1844 | /* We check that dictionaries have offset codes available for the first | |
|
1845 | * block. After the first block, the offcode table might not have large | |
|
1846 | * enough codes to represent the offsets in the data. | |
|
1847 | */ | |
|
1848 | if (nextEntropy->offcode_repeatMode == FSE_repeat_valid) | |
|
1849 | nextEntropy->offcode_repeatMode = FSE_repeat_check; | |
|
1850 | ||
|
1851 | 2357 | return cSize; |
|
1852 | 2358 | } |
|
1853 | 2359 | |
|
1854 | 2360 | /* ZSTD_selectBlockCompressor() : |
|
1855 | 2361 | * Not static, but internal use only (used by long distance matcher) |
|
1856 | 2362 | * assumption : strat is a valid strategy */ |
|
1857 | ZSTD_blockCompressor ZSTD_selectBlockCompressor(ZSTD_strategy strat, int extDict) | |
2363 | ZSTD_blockCompressor ZSTD_selectBlockCompressor(ZSTD_strategy strat, ZSTD_dictMode_e dictMode) | |
|
1858 | 2364 | { |
|
1859 | static const ZSTD_blockCompressor blockCompressor[2][(unsigned)ZSTD_btultra+1] = { | |
2365 | static const ZSTD_blockCompressor blockCompressor[3][(unsigned)ZSTD_btultra+1] = { | |
|
1860 | 2366 | { ZSTD_compressBlock_fast /* default for 0 */, |
|
1861 | ZSTD_compressBlock_fast, ZSTD_compressBlock_doubleFast, ZSTD_compressBlock_greedy, | |
|
1862 | ZSTD_compressBlock_lazy, ZSTD_compressBlock_lazy2, ZSTD_compressBlock_btlazy2, | |
|
1863 | ZSTD_compressBlock_btopt, ZSTD_compressBlock_btultra }, | |
2367 | ZSTD_compressBlock_fast, | |
|
2368 | ZSTD_compressBlock_doubleFast, | |
|
2369 | ZSTD_compressBlock_greedy, | |
|
2370 | ZSTD_compressBlock_lazy, | |
|
2371 | ZSTD_compressBlock_lazy2, | |
|
2372 | ZSTD_compressBlock_btlazy2, | |
|
2373 | ZSTD_compressBlock_btopt, | |
|
2374 | ZSTD_compressBlock_btultra }, | |
|
1864 | 2375 | { ZSTD_compressBlock_fast_extDict /* default for 0 */, |
|
1865 | ZSTD_compressBlock_fast_extDict, ZSTD_compressBlock_doubleFast_extDict, ZSTD_compressBlock_greedy_extDict, | |
|
1866 | ZSTD_compressBlock_lazy_extDict,ZSTD_compressBlock_lazy2_extDict, ZSTD_compressBlock_btlazy2_extDict, | |
|
1867 | ZSTD_compressBlock_btopt_extDict, ZSTD_compressBlock_btultra_extDict } | |
2376 | ZSTD_compressBlock_fast_extDict, | |
|
2377 | ZSTD_compressBlock_doubleFast_extDict, | |
|
2378 | ZSTD_compressBlock_greedy_extDict, | |
|
2379 | ZSTD_compressBlock_lazy_extDict, | |
|
2380 | ZSTD_compressBlock_lazy2_extDict, | |
|
2381 | ZSTD_compressBlock_btlazy2_extDict, | |
|
2382 | ZSTD_compressBlock_btopt_extDict, | |
|
2383 | ZSTD_compressBlock_btultra_extDict }, | |
|
2384 | { ZSTD_compressBlock_fast_dictMatchState /* default for 0 */, | |
|
2385 | ZSTD_compressBlock_fast_dictMatchState, | |
|
2386 | ZSTD_compressBlock_doubleFast_dictMatchState, | |
|
2387 | ZSTD_compressBlock_greedy_dictMatchState, | |
|
2388 | ZSTD_compressBlock_lazy_dictMatchState, | |
|
2389 | ZSTD_compressBlock_lazy2_dictMatchState, | |
|
2390 | ZSTD_compressBlock_btlazy2_dictMatchState, | |
|
2391 | ZSTD_compressBlock_btopt_dictMatchState, | |
|
2392 | ZSTD_compressBlock_btultra_dictMatchState } | |
|
1868 | 2393 | }; |
|
2394 | ZSTD_blockCompressor selectedCompressor; | |
|
1869 | 2395 | ZSTD_STATIC_ASSERT((unsigned)ZSTD_fast == 1); |
|
1870 | 2396 | |
|
1871 | 2397 | assert((U32)strat >= (U32)ZSTD_fast); |
|
1872 | 2398 | assert((U32)strat <= (U32)ZSTD_btultra); |
|
1873 | return blockCompressor[extDict!=0][(U32)strat]; | |
2399 | selectedCompressor = blockCompressor[(int)dictMode][(U32)strat]; | |
|
2400 | assert(selectedCompressor != NULL); | |
|
2401 | return selectedCompressor; | |
|
1874 | 2402 | } |
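
The selector is a plain two-dimensional function-pointer table indexed by dictionary mode and strategy, so supporting the new dictMatchState mode costs one extra array row rather than a branch at every call site. The shape in miniature (hypothetical function names, single-strategy rows):

    #include <stdio.h>

    typedef void (*block_fn)(void);

    static void fast_noDict(void)  { puts("fast/noDict"); }
    static void fast_extDict(void) { puts("fast/extDict"); }
    static void fast_dms(void)     { puts("fast/dictMatchState"); }

    enum { NO_DICT, EXT_DICT, DICT_MATCH_STATE, DICT_MODES };
    enum { FAST, STRATEGIES };

    static const block_fn table[DICT_MODES][STRATEGIES] = {
        { fast_noDict },
        { fast_extDict },
        { fast_dms },
    };

    int main(void)
    {
        table[DICT_MATCH_STATE][FAST]();  /* -> "fast/dictMatchState" */
        return 0;
    }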
|
1875 | 2403 | |
|
1876 | 2404 | static void ZSTD_storeLastLiterals(seqStore_t* seqStorePtr, |
@@ -1880,7 +2408,7 b' static void ZSTD_storeLastLiterals(seqSt' | |||
|
1880 | 2408 | seqStorePtr->lit += lastLLSize; |
|
1881 | 2409 | } |
|
1882 | 2410 | |
|
1883 | static void ZSTD_resetSeqStore(seqStore_t* ssPtr) | |
2411 | void ZSTD_resetSeqStore(seqStore_t* ssPtr) | |
|
1884 | 2412 | { |
|
1885 | 2413 | ssPtr->lit = ssPtr->litStart; |
|
1886 | 2414 | ssPtr->sequences = ssPtr->sequencesStart; |
@@ -1892,24 +2420,38 b' static size_t ZSTD_compressBlock_interna' | |||
|
1892 | 2420 | const void* src, size_t srcSize) |
|
1893 | 2421 | { |
|
1894 | 2422 | ZSTD_matchState_t* const ms = &zc->blockState.matchState; |
|
1895 | DEBUGLOG(5, "ZSTD_compressBlock_internal (dstCapacity=%u, dictLimit=%u, nextToUpdate=%u)", | |
|
1896 | (U32)dstCapacity, ms->window.dictLimit, ms->nextToUpdate); | |
|
2423 | size_t cSize; | |
|
2424 | DEBUGLOG(5, "ZSTD_compressBlock_internal (dstCapacity=%zu, dictLimit=%u, nextToUpdate=%u)", | |
|
2425 | dstCapacity, ms->window.dictLimit, ms->nextToUpdate); | |
|
2426 | assert(srcSize <= ZSTD_BLOCKSIZE_MAX); | |
|
2427 | ||
|
2428 | /* Assert that we have correctly flushed the ctx params into the ms's copy */ | |
|
2429 | ZSTD_assertEqualCParams(zc->appliedParams.cParams, ms->cParams); | |
|
2430 | ||
|
1897 | 2431 | if (srcSize < MIN_CBLOCK_SIZE+ZSTD_blockHeaderSize+1) { |
|
1898 | 2432 | ZSTD_ldm_skipSequences(&zc->externSeqStore, srcSize, zc->appliedParams.cParams.searchLength); |
|
1899 | return 0; /* don't even attempt compression below a certain srcSize */ | |
|
2433 | cSize = 0; | |
|
2434 | goto out; /* don't even attempt compression below a certain srcSize */ | |
|
1900 | 2435 | } |
|
1901 | 2436 | ZSTD_resetSeqStore(&(zc->seqStore)); |
|
2437 | ms->opt.symbolCosts = &zc->blockState.prevCBlock->entropy; /* required for optimal parser to read stats from dictionary */ | |
|
2438 | ||
|
2439 | /* a gap between an attached dict and the current window is not safe, | |
|
2440 | * they must remain adjacent, and when that stops being the case, the dict | |
|
2441 | * must be unset */ | |
|
2442 | assert(ms->dictMatchState == NULL || ms->loadedDictEnd == ms->window.dictLimit); | |
|
1902 | 2443 | |
|
1903 | 2444 | /* limited update after a very long match */ |
|
1904 | 2445 | { const BYTE* const base = ms->window.base; |
|
1905 | 2446 | const BYTE* const istart = (const BYTE*)src; |
|
1906 | 2447 | const U32 current = (U32)(istart-base); |
|
2448 | if (sizeof(ptrdiff_t)==8) assert(istart - base < (ptrdiff_t)(U32)(-1)); /* ensure no overflow */ | |
|
1907 | 2449 | if (current > ms->nextToUpdate + 384) |
|
1908 | 2450 | ms->nextToUpdate = current - MIN(192, (U32)(current - ms->nextToUpdate - 384)); |
|
1909 | 2451 | } |
|
1910 | 2452 | |
|
1911 | 2453 | /* select and store sequences */ |
|
1912 | { U32 const extDict = ZSTD_window_hasExtDict(ms->window); | |
|
2454 | { ZSTD_dictMode_e const dictMode = ZSTD_matchState_dictMode(ms); | |
|
1913 | 2455 | size_t lastLLSize; |
|
1914 | 2456 | { int i; |
|
1915 | 2457 | for (i = 0; i < ZSTD_REP_NUM; ++i) |
@@ -1922,8 +2464,7 b' static size_t ZSTD_compressBlock_interna' | |||
|
1922 | 2464 | ZSTD_ldm_blockCompress(&zc->externSeqStore, |
|
1923 | 2465 | ms, &zc->seqStore, |
|
1924 | 2466 | zc->blockState.nextCBlock->rep, |
|
1925 | &zc->appliedParams.cParams, | |
1926 | src, srcSize, extDict); | |
|
2467 | src, srcSize); | |
|
1927 | 2468 | assert(zc->externSeqStore.pos <= zc->externSeqStore.size); |
|
1928 | 2469 | } else if (zc->appliedParams.ldmParams.enableLdm) { |
|
1929 | 2470 | rawSeqStore_t ldmSeqStore = {NULL, 0, 0, 0}; |
@@ -1939,31 +2480,38 b' static size_t ZSTD_compressBlock_interna' | |||
|
1939 | 2480 | ZSTD_ldm_blockCompress(&ldmSeqStore, |
|
1940 | 2481 | ms, &zc->seqStore, |
|
1941 | 2482 | zc->blockState.nextCBlock->rep, |
|
1942 | &zc->appliedParams.cParams, | |
1943 | src, srcSize, extDict); | |
|
2483 | src, srcSize); | |
|
1944 | 2484 | assert(ldmSeqStore.pos == ldmSeqStore.size); |
|
1945 | 2485 | } else { /* not long range mode */ |
|
1946 | ZSTD_blockCompressor const blockCompressor = ZSTD_selectBlockCompressor(zc->appliedParams.cParams.strategy, extDict); | |
1947 | lastLLSize = blockCompressor(ms, &zc->seqStore, zc->blockState.nextCBlock->rep, &zc->appliedParams.cParams, src, srcSize); | |
2486 | ZSTD_blockCompressor const blockCompressor = ZSTD_selectBlockCompressor(zc->appliedParams.cParams.strategy, dictMode); | |
|
2487 | lastLLSize = blockCompressor(ms, &zc->seqStore, zc->blockState.nextCBlock->rep, src, srcSize); | |
|
1948 | 2488 | } |
|
1949 | 2489 | { const BYTE* const lastLiterals = (const BYTE*)src + srcSize - lastLLSize; |
|
1950 | 2490 | ZSTD_storeLastLiterals(&zc->seqStore, lastLiterals, lastLLSize); |
|
1951 | 2491 | } } |
|
1952 | 2492 | |
|
1953 | 2493 | /* encode sequences and literals */ |
|
1954 | { size_t const cSize = ZSTD_compressSequences(&zc->seqStore, | |
1955 | &zc->blockState.prevCBlock->entropy, &zc->blockState.nextCBlock->entropy, | |
1956 | &zc->appliedParams, | |
1957 | dst, dstCapacity, | |
1958 | srcSize, zc->entropyWorkspace, zc->bmi2); | |
1959 | if (ZSTD_isError(cSize) || cSize == 0) return cSize; | |
|
1960 | /* confirm repcodes and entropy tables */ | |
|
1961 | { ZSTD_compressedBlockState_t* const tmp = zc->blockState.prevCBlock; | |
|
1962 | zc->blockState.prevCBlock = zc->blockState.nextCBlock; | |
|
1963 | zc->blockState.nextCBlock = tmp; | |
|
1964 | } | |
|
1965 | return cSize; | |
|
2494 | cSize = ZSTD_compressSequences(&zc->seqStore, | |
|
2495 | &zc->blockState.prevCBlock->entropy, &zc->blockState.nextCBlock->entropy, | |
|
2496 | &zc->appliedParams, | |
|
2497 | dst, dstCapacity, | |
|
2498 | srcSize, zc->entropyWorkspace, zc->bmi2); | |
|
2499 | ||
|
2500 | out: | |
|
2501 | if (!ZSTD_isError(cSize) && cSize != 0) { | |
|
2502 | /* confirm repcodes and entropy tables when emitting a compressed block */ | |
|
2503 | ZSTD_compressedBlockState_t* const tmp = zc->blockState.prevCBlock; | |
|
2504 | zc->blockState.prevCBlock = zc->blockState.nextCBlock; | |
|
2505 | zc->blockState.nextCBlock = tmp; | |
|
1966 | 2506 | } |
|
2507 | /* We check that dictionaries have offset codes available for the first | |
|
2508 | * block. After the first block, the offcode table might not have large | |
|
2509 | * enough codes to represent the offsets in the data. | |
|
2510 | */ | |
|
2511 | if (zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode == FSE_repeat_valid) | |
|
2512 | zc->blockState.prevCBlock->entropy.fse.offcode_repeatMode = FSE_repeat_check; | |
|
2513 | ||
|
2514 | return cSize; | |
|
1967 | 2515 | } |
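
prevCBlock and nextCBlock form a double buffer: each block is encoded against the previous block's entropy tables and repcodes while candidates for the next block accumulate, and only a successfully emitted compressed block swaps the two pointers. The pattern in isolation (a sketch with assumed names, not zstd's types):

    typedef struct { int rep[3]; /* entropy tables, etc. */ } block_state;

    typedef struct {
        block_state  a, b;
        block_state* prev;  /* state the current block reads from */
        block_state* next;  /* state the current block writes into */
    } block_state_pair;

    /* Commit the just-written state only when the block was actually
     * emitted compressed; raw blocks leave `prev` untouched. */
    static void confirm_block(block_state_pair* s, int emittedCompressed)
    {
        if (emittedCompressed) {
            block_state* const tmp = s->prev;
            s->prev = s->next;
            s->next = tmp;
        }
    }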
|
1968 | 2516 | |
|
1969 | 2517 | |
@@ -2005,13 +2553,13 b' static size_t ZSTD_compress_frameChunk (' | |||
|
2005 | 2553 | ZSTD_STATIC_ASSERT(ZSTD_CHAINLOG_MAX <= 30); |
|
2006 | 2554 | ZSTD_STATIC_ASSERT(ZSTD_WINDOWLOG_MAX_32 <= 30); |
|
2007 | 2555 | ZSTD_STATIC_ASSERT(ZSTD_WINDOWLOG_MAX <= 31); |
|
2008 | ||
|
2009 | 2556 | ZSTD_reduceIndex(cctx, correction); |
|
2010 | 2557 | if (ms->nextToUpdate < correction) ms->nextToUpdate = 0; |
|
2011 | 2558 | else ms->nextToUpdate -= correction; |
|
2012 | 2559 | ms->loadedDictEnd = 0; |
|
2560 | ms->dictMatchState = NULL; | |
|
2013 | 2561 | } |
|
2014 | ZSTD_window_enforceMaxDist(&ms->window, ip + blockSize, maxDist, &ms->loadedDictEnd); | |
|
2562 | ZSTD_window_enforceMaxDist(&ms->window, ip + blockSize, maxDist, &ms->loadedDictEnd, &ms->dictMatchState); | |
|
2015 | 2563 | if (ms->nextToUpdate < ms->window.lowLimit) ms->nextToUpdate = ms->window.lowLimit; |
|
2016 | 2564 | |
|
2017 | 2565 | { size_t cSize = ZSTD_compressBlock_internal(cctx, |
@@ -2020,11 +2568,8 b' static size_t ZSTD_compress_frameChunk (' | |||
|
2020 | 2568 | if (ZSTD_isError(cSize)) return cSize; |
|
2021 | 2569 | |
|
2022 | 2570 | if (cSize == 0) { /* block is not compressible */ |
|
2023 | U32 const cBlockHeader24 = lastBlock + (((U32)bt_raw)<<1) + (U32)(blockSize << 3); | |
|
2024 | if (blockSize + ZSTD_blockHeaderSize > dstCapacity) return ERROR(dstSize_tooSmall); | |
|
2025 | MEM_writeLE32(op, cBlockHeader24); /* 4th byte will be overwritten */ | |
|
2026 | memcpy(op + ZSTD_blockHeaderSize, ip, blockSize); | |
|
2027 | cSize = ZSTD_blockHeaderSize + blockSize; | |
|
2571 | cSize = ZSTD_noCompressBlock(op, dstCapacity, ip, blockSize, lastBlock); | |
|
2572 | if (ZSTD_isError(cSize)) return cSize; | |
|
2028 | 2573 | } else { |
|
2029 | 2574 | U32 const cBlockHeader24 = lastBlock + (((U32)bt_compressed)<<1) + (U32)(cSize << 3); |
|
2030 | 2575 | MEM_writeLE24(op, cBlockHeader24); |
@@ -2060,6 +2605,7 b' static size_t ZSTD_writeFrameHeader(void' | |||
|
2060 | 2605 | BYTE const frameHeaderDecriptionByte = (BYTE)(dictIDSizeCode + (checksumFlag<<2) + (singleSegment<<5) + (fcsCode<<6) ); |
|
2061 | 2606 | size_t pos=0; |
|
2062 | 2607 | |
|
2608 | assert(!(params.fParams.contentSizeFlag && pledgedSrcSize == ZSTD_CONTENTSIZE_UNKNOWN)); | |
|
2063 | 2609 | if (dstCapacity < ZSTD_frameHeaderSize_max) return ERROR(dstSize_tooSmall); |
|
2064 | 2610 | DEBUGLOG(4, "ZSTD_writeFrameHeader : dictIDFlag : %u ; dictID : %u ; dictIDSizeCode : %u", |
|
2065 | 2611 | !params.fParams.noDictIDFlag, dictID, dictIDSizeCode); |
@@ -2122,7 +2668,7 b' static size_t ZSTD_compressContinue_inte' | |||
|
2122 | 2668 | const void* src, size_t srcSize, |
|
2123 | 2669 | U32 frame, U32 lastFrameChunk) |
|
2124 | 2670 | { |
|
2125 | ZSTD_matchState_t* ms = &cctx->blockState.matchState; | |
|
2671 | ZSTD_matchState_t* const ms = &cctx->blockState.matchState; | |
|
2126 | 2672 | size_t fhSize = 0; |
|
2127 | 2673 | |
|
2128 | 2674 | DEBUGLOG(5, "ZSTD_compressContinue_internal, stage: %u, srcSize: %u", |
@@ -2143,8 +2689,25 b' static size_t ZSTD_compressContinue_inte' | |||
|
2143 | 2689 | if (!ZSTD_window_update(&ms->window, src, srcSize)) { |
|
2144 | 2690 | ms->nextToUpdate = ms->window.dictLimit; |
|
2145 | 2691 | } |
|
2146 | if (cctx->appliedParams.ldmParams.enableLdm) | |
|
2692 | if (cctx->appliedParams.ldmParams.enableLdm) { | |
|
2147 | 2693 | ZSTD_window_update(&cctx->ldmState.window, src, srcSize); |
|
2694 | } | |
|
2695 | ||
|
2696 | if (!frame) { | |
|
2697 | /* overflow check and correction for block mode */ | |
|
2698 | if (ZSTD_window_needOverflowCorrection(ms->window, (const char*)src + srcSize)) { | |
|
2699 | U32 const cycleLog = ZSTD_cycleLog(cctx->appliedParams.cParams.chainLog, cctx->appliedParams.cParams.strategy); | |
|
2700 | U32 const correction = ZSTD_window_correctOverflow(&ms->window, cycleLog, 1 << cctx->appliedParams.cParams.windowLog, src); | |
|
2701 | ZSTD_STATIC_ASSERT(ZSTD_CHAINLOG_MAX <= 30); | |
|
2702 | ZSTD_STATIC_ASSERT(ZSTD_WINDOWLOG_MAX_32 <= 30); | |
|
2703 | ZSTD_STATIC_ASSERT(ZSTD_WINDOWLOG_MAX <= 31); | |
|
2704 | ZSTD_reduceIndex(cctx, correction); | |
|
2705 | if (ms->nextToUpdate < correction) ms->nextToUpdate = 0; | |
|
2706 | else ms->nextToUpdate -= correction; | |
|
2707 | ms->loadedDictEnd = 0; | |
|
2708 | ms->dictMatchState = NULL; | |
|
2709 | } | |
|
2710 | } | |
|
2148 | 2711 | |
|
2149 | 2712 | DEBUGLOG(5, "ZSTD_compressContinue_internal (blockSize=%u)", (U32)cctx->blockSize); |
|
2150 | 2713 | { size_t const cSize = frame ? |
@@ -2153,7 +2716,9 b' static size_t ZSTD_compressContinue_inte' | |||
|
2153 | 2716 | if (ZSTD_isError(cSize)) return cSize; |
|
2154 | 2717 | cctx->consumedSrcSize += srcSize; |
|
2155 | 2718 | cctx->producedCSize += (cSize + fhSize); |
|
2156 | if (cctx->pledgedSrcSizePlusOne != 0) { /* control src size */ | |
2719 | assert(!(cctx->appliedParams.fParams.contentSizeFlag && cctx->pledgedSrcSizePlusOne == 0)); | |
|
2720 | if (cctx->pledgedSrcSizePlusOne != 0) { /* control src size */ | |
|
2721 | ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN == (unsigned long long)-1); | |
|
2157 | 2722 | if (cctx->consumedSrcSize+1 > cctx->pledgedSrcSizePlusOne) { |
|
2158 | 2723 | DEBUGLOG(4, "error : pledgedSrcSize = %u, while realSrcSize >= %u", |
|
2159 | 2724 | (U32)cctx->pledgedSrcSizePlusOne-1, (U32)cctx->consumedSrcSize); |
@@ -2184,44 +2749,50 b' size_t ZSTD_compressBlock(ZSTD_CCtx* cct' | |||
|
2184 | 2749 | { |
|
2185 | 2750 | size_t const blockSizeMax = ZSTD_getBlockSize(cctx); |
|
2186 | 2751 | if (srcSize > blockSizeMax) return ERROR(srcSize_wrong); |
|
2752 | ||
|
2187 | 2753 | return ZSTD_compressContinue_internal(cctx, dst, dstCapacity, src, srcSize, 0 /* frame mode */, 0 /* last chunk */); |
|
2188 | 2754 | } |
|
2189 | 2755 | |
|
2190 | 2756 | /*! ZSTD_loadDictionaryContent() : |
|
2191 | 2757 | * @return : 0, or an error code |
|
2192 | 2758 | */ |
|
2193 | static size_t ZSTD_loadDictionaryContent(ZSTD_matchState_t* ms, ZSTD_CCtx_params const* params, const void* src, size_t srcSize) | |
2759 | static size_t ZSTD_loadDictionaryContent(ZSTD_matchState_t* ms, | |
|
2760 | ZSTD_CCtx_params const* params, | |
|
2761 | const void* src, size_t srcSize, | |
|
2762 | ZSTD_dictTableLoadMethod_e dtlm) | |
|
2194 | 2763 | { |
|
2195 | 2764 | const BYTE* const ip = (const BYTE*) src; |
|
2196 | 2765 | const BYTE* const iend = ip + srcSize; |
|
2197 | ZSTD_compressionParameters const* cParams = ¶ms->cParams; | |
|
2198 | 2766 | |
|
2199 | 2767 | ZSTD_window_update(&ms->window, src, srcSize); |
|
2200 | 2768 | ms->loadedDictEnd = params->forceWindow ? 0 : (U32)(iend - ms->window.base); |
|
2201 | 2769 | |
|
2770 | /* Assert that the ms params match the params we're being given */ | |
|
2771 | ZSTD_assertEqualCParams(params->cParams, ms->cParams); | |
|
2772 | ||
|
2202 | 2773 | if (srcSize <= HASH_READ_SIZE) return 0; |
|
2203 | 2774 | |
|
2204 | 2775 | switch(params->cParams.strategy) |
|
2205 | 2776 | { |
|
2206 | 2777 | case ZSTD_fast: |
|
2207 | ZSTD_fillHashTable(ms, cParams, iend); | |
2778 | ZSTD_fillHashTable(ms, iend, dtlm); | |
|
2208 | 2779 | break; |
|
2209 | 2780 | case ZSTD_dfast: |
|
2210 | ZSTD_fillDoubleHashTable(ms, cParams, iend); | |
2781 | ZSTD_fillDoubleHashTable(ms, iend, dtlm); | |
|
2211 | 2782 | break; |
|
2212 | 2783 | |
|
2213 | 2784 | case ZSTD_greedy: |
|
2214 | 2785 | case ZSTD_lazy: |
|
2215 | 2786 | case ZSTD_lazy2: |
|
2216 | 2787 | if (srcSize >= HASH_READ_SIZE) |
|
2217 | ZSTD_insertAndFindFirstIndex(ms, cParams, iend-HASH_READ_SIZE); | |
2788 | ZSTD_insertAndFindFirstIndex(ms, iend-HASH_READ_SIZE); | |
|
2218 | 2789 | break; |
|
2219 | 2790 | |
|
2220 | 2791 | case ZSTD_btlazy2: /* we want the dictionary table fully sorted */ |
|
2221 | 2792 | case ZSTD_btopt: |
|
2222 | 2793 | case ZSTD_btultra: |
|
2223 | 2794 | if (srcSize >= HASH_READ_SIZE) |
|
2224 | ZSTD_updateTree(ms, cParams, iend-HASH_READ_SIZE, iend); | |
2795 | ZSTD_updateTree(ms, iend-HASH_READ_SIZE, iend); | |
|
2225 | 2796 | break; |
|
2226 | 2797 | |
|
2227 | 2798 | default: |
@@ -2256,7 +2827,12 b' static size_t ZSTD_checkDictNCount(short' | |||
|
2256 | 2827 | * assumptions : magic number supposed already checked |
|
2257 | 2828 | * dictSize supposed > 8 |
|
2258 | 2829 | */ |
|
2259 | static size_t ZSTD_loadZstdDictionary(ZSTD_compressedBlockState_t* bs, ZSTD_matchState_t* ms, ZSTD_CCtx_params const* params, const void* dict, size_t dictSize, void* workspace) | |
|
2830 | static size_t ZSTD_loadZstdDictionary(ZSTD_compressedBlockState_t* bs, | |
|
2831 | ZSTD_matchState_t* ms, | |
|
2832 | ZSTD_CCtx_params const* params, | |
|
2833 | const void* dict, size_t dictSize, | |
|
2834 | ZSTD_dictTableLoadMethod_e dtlm, | |
|
2835 | void* workspace) | |
|
2260 | 2836 | { |
|
2261 | 2837 | const BYTE* dictPtr = (const BYTE*)dict; |
|
2262 | 2838 | const BYTE* const dictEnd = dictPtr + dictSize; |
@@ -2265,13 +2841,15 b' static size_t ZSTD_loadZstdDictionary(ZS' | |||
|
2265 | 2841 | size_t dictID; |
|
2266 | 2842 | |
|
2267 | 2843 | ZSTD_STATIC_ASSERT(HUF_WORKSPACE_SIZE >= (1<<MAX(MLFSELog,LLFSELog))); |
|
2844 | assert(dictSize > 8); | |
|
2845 | assert(MEM_readLE32(dictPtr) == ZSTD_MAGIC_DICTIONARY); | |
|
2268 | 2846 | |
|
2269 | 2847 | dictPtr += 4; /* skip magic number */ |
|
2270 | 2848 | dictID = params->fParams.noDictIDFlag ? 0 : MEM_readLE32(dictPtr); |
|
2271 | 2849 | dictPtr += 4; |
|
2272 | 2850 | |
|
2273 | 2851 | { unsigned maxSymbolValue = 255; |
|
2274 | size_t const hufHeaderSize = HUF_readCTable((HUF_CElt*)bs->entropy.hufCTable, &maxSymbolValue, dictPtr, dictEnd-dictPtr); | |
|
2852 | size_t const hufHeaderSize = HUF_readCTable((HUF_CElt*)bs->entropy.huf.CTable, &maxSymbolValue, dictPtr, dictEnd-dictPtr); | |
|
2275 | 2853 | if (HUF_isError(hufHeaderSize)) return ERROR(dictionary_corrupted); |
|
2276 | 2854 | if (maxSymbolValue < 255) return ERROR(dictionary_corrupted); |
|
2277 | 2855 | dictPtr += hufHeaderSize; |
@@ -2282,7 +2860,8 b' static size_t ZSTD_loadZstdDictionary(ZS' | |||
|
2282 | 2860 | if (FSE_isError(offcodeHeaderSize)) return ERROR(dictionary_corrupted); |
|
2283 | 2861 | if (offcodeLog > OffFSELog) return ERROR(dictionary_corrupted); |
|
2284 | 2862 | /* Defer checking offcodeMaxValue because we need to know the size of the dictionary content */ |
|
2285 | CHECK_E( FSE_buildCTable_wksp(bs->entropy.offcodeCTable, offcodeNCount, offcodeMaxValue, offcodeLog, workspace, HUF_WORKSPACE_SIZE), | |
|
2863 | /* fill all offset symbols to avoid garbage at end of table */ | |
|
2864 | CHECK_E( FSE_buildCTable_wksp(bs->entropy.fse.offcodeCTable, offcodeNCount, MaxOff, offcodeLog, workspace, HUF_WORKSPACE_SIZE), | |
|
2286 | 2865 | dictionary_corrupted); |
|
2287 | 2866 | dictPtr += offcodeHeaderSize; |
|
2288 | 2867 | } |
@@ -2294,7 +2873,7 b' static size_t ZSTD_loadZstdDictionary(ZS' | |||
|
2294 | 2873 | if (matchlengthLog > MLFSELog) return ERROR(dictionary_corrupted); |
|
2295 | 2874 | /* Every match length code must have non-zero probability */ |
|
2296 | 2875 | CHECK_F( ZSTD_checkDictNCount(matchlengthNCount, matchlengthMaxValue, MaxML)); |
|
2297 | CHECK_E( FSE_buildCTable_wksp(bs->entropy.matchlengthCTable, matchlengthNCount, matchlengthMaxValue, matchlengthLog, workspace, HUF_WORKSPACE_SIZE), | |
|
2876 | CHECK_E( FSE_buildCTable_wksp(bs->entropy.fse.matchlengthCTable, matchlengthNCount, matchlengthMaxValue, matchlengthLog, workspace, HUF_WORKSPACE_SIZE), | |
|
2298 | 2877 | dictionary_corrupted); |
|
2299 | 2878 | dictPtr += matchlengthHeaderSize; |
|
2300 | 2879 | } |
@@ -2306,7 +2885,7 b' static size_t ZSTD_loadZstdDictionary(ZS' | |||
|
2306 | 2885 | if (litlengthLog > LLFSELog) return ERROR(dictionary_corrupted); |
|
2307 | 2886 | /* Every literal length code must have non-zero probability */ |
|
2308 | 2887 | CHECK_F( ZSTD_checkDictNCount(litlengthNCount, litlengthMaxValue, MaxLL)); |
|
2309 | CHECK_E( FSE_buildCTable_wksp(bs->entropy.litlengthCTable, litlengthNCount, litlengthMaxValue, litlengthLog, workspace, HUF_WORKSPACE_SIZE), | |
|
2888 | CHECK_E( FSE_buildCTable_wksp(bs->entropy.fse.litlengthCTable, litlengthNCount, litlengthMaxValue, litlengthLog, workspace, HUF_WORKSPACE_SIZE), | |
|
2310 | 2889 | dictionary_corrupted); |
|
2311 | 2890 | dictPtr += litlengthHeaderSize; |
|
2312 | 2891 | } |
@@ -2332,22 +2911,25 b' static size_t ZSTD_loadZstdDictionary(ZS' | |||
|
2332 | 2911 | if (bs->rep[u] > dictContentSize) return ERROR(dictionary_corrupted); |
|
2333 | 2912 | } } |
|
2334 | 2913 | |
|
2335 | bs->entropy.hufCTable_repeatMode = HUF_repeat_valid; | |

2336 | bs->entropy.offcode_repeatMode = FSE_repeat_valid; | |
|
2337 | bs->entropy.matchlength_repeatMode = FSE_repeat_valid; | |
|
2338 | bs->entropy.litlength_repeatMode = FSE_repeat_valid; | |
|
2339 | CHECK_F(ZSTD_loadDictionaryContent(ms, params, dictPtr, dictContentSize)); | |
|
2914 | bs->entropy.huf.repeatMode = HUF_repeat_valid; | |
|
2915 | bs->entropy.fse.offcode_repeatMode = FSE_repeat_valid; | |
|
2916 | bs->entropy.fse.matchlength_repeatMode = FSE_repeat_valid; | |
|
2917 | bs->entropy.fse.litlength_repeatMode = FSE_repeat_valid; | |
|
2918 | CHECK_F(ZSTD_loadDictionaryContent(ms, params, dictPtr, dictContentSize, dtlm)); | |
|
2340 | 2919 | return dictID; |
|
2341 | 2920 | } |
|
2342 | 2921 | } |
|
2343 | 2922 | |
|
2344 | 2923 | /** ZSTD_compress_insertDictionary() : |
|
2345 | 2924 | * @return : dictID, or an error code */ |
|
2346 | static size_t ZSTD_compress_insertDictionary(ZSTD_compressedBlockState_t* bs, ZSTD_matchState_t* ms, | |
|
2347 | ZSTD_CCtx_params const* params, | |
|
2348 | const void* dict, size_t dictSize, | |

2349 | ZSTD_dictContentType_e dictContentType, | |
|
2350 | void* workspace) | |
|
2925 | static size_t | |
|
2926 | ZSTD_compress_insertDictionary(ZSTD_compressedBlockState_t* bs, | |
|
2927 | ZSTD_matchState_t* ms, | |
|
2928 | const ZSTD_CCtx_params* params, | |
|
2929 | const void* dict, size_t dictSize, | |
|
2930 | ZSTD_dictContentType_e dictContentType, | |
|
2931 | ZSTD_dictTableLoadMethod_e dtlm, | |
|
2932 | void* workspace) | |
|
2351 | 2933 | { |
|
2352 | 2934 | DEBUGLOG(4, "ZSTD_compress_insertDictionary (dictSize=%u)", (U32)dictSize); |
|
2353 | 2935 | if ((dict==NULL) || (dictSize<=8)) return 0; |
@@ -2356,12 +2938,12 b' static size_t ZSTD_compress_insertDictio' | |||
|
2356 | 2938 | |
|
2357 | 2939 | /* dict restricted modes */ |
|
2358 | 2940 | if (dictContentType == ZSTD_dct_rawContent) |
|
2359 | return ZSTD_loadDictionaryContent(ms, params, dict, dictSize); | |
|
2941 | return ZSTD_loadDictionaryContent(ms, params, dict, dictSize, dtlm); | |
|
2360 | 2942 | |
|
2361 | 2943 | if (MEM_readLE32(dict) != ZSTD_MAGIC_DICTIONARY) { |
|
2362 | 2944 | if (dictContentType == ZSTD_dct_auto) { |
|
2363 | 2945 | DEBUGLOG(4, "raw content dictionary detected"); |
|
2364 | return ZSTD_loadDictionaryContent(ms, params, dict, dictSize); | |
|
2946 | return ZSTD_loadDictionaryContent(ms, params, dict, dictSize, dtlm); | |
|
2365 | 2947 | } |
|
2366 | 2948 | if (dictContentType == ZSTD_dct_fullDict) |
|
2367 | 2949 | return ERROR(dictionary_wrong); |
@@ -2369,17 +2951,18 b' static size_t ZSTD_compress_insertDictio' | |||
|
2369 | 2951 | } |
|
2370 | 2952 | |
|
2371 | 2953 | /* dict as full zstd dictionary */ |
|
2372 | return ZSTD_loadZstdDictionary(bs, ms, params, dict, dictSize, workspace); | |
|
2954 | return ZSTD_loadZstdDictionary(bs, ms, params, dict, dictSize, dtlm, workspace); | |
|
2373 | 2955 | } |
|
2374 | 2956 | |
|
2375 | 2957 | /*! ZSTD_compressBegin_internal() : |
|
2376 | 2958 | * @return : 0, or an error code */ |
|
2377 | size_t ZSTD_compressBegin_internal(ZSTD_CCtx* cctx, | |
|
2378 | const void* dict, size_t dictSize, | |
|
2379 | ZSTD_dictContentType_e dictContentType, | |
|
2380 | const ZSTD_CDict* cdict, | |

2381 | ZSTD_CCtx_params params, U64 pledgedSrcSize, | |

2382 | ZSTD_buffered_policy_e zbuff) | |
|
2959 | static size_t ZSTD_compressBegin_internal(ZSTD_CCtx* cctx, | |
|
2960 | const void* dict, size_t dictSize, | |
|
2961 | ZSTD_dictContentType_e dictContentType, | |
|
2962 | ZSTD_dictTableLoadMethod_e dtlm, | |
|
2963 | const ZSTD_CDict* cdict, | |
|
2964 | ZSTD_CCtx_params params, U64 pledgedSrcSize, | |
|
2965 | ZSTD_buffered_policy_e zbuff) | |
|
2383 | 2966 | { |
|
2384 | 2967 | DEBUGLOG(4, "ZSTD_compressBegin_internal: wlog=%u", params.cParams.windowLog); |
|
2385 | 2968 | /* params are supposed to be fully validated at this point */ |
@@ -2387,9 +2970,7 b' size_t ZSTD_compressBegin_internal(ZSTD_' | |||
|
2387 | 2970 | assert(!((dict) && (cdict))); /* either dict or cdict, not both */ |
|
2388 | 2971 | |
|
2389 | 2972 | if (cdict && cdict->dictContentSize>0) { |
|
2390 | cctx->requestedParams = params; | |
|
2391 | return ZSTD_resetCCtx_usingCDict(cctx, cdict, params.cParams.windowLog, | |
|
2392 | params.fParams, pledgedSrcSize, zbuff); | |
|
2973 | return ZSTD_resetCCtx_usingCDict(cctx, cdict, params, pledgedSrcSize, zbuff); | |
|
2393 | 2974 | } |
|
2394 | 2975 | |
|
2395 | 2976 | CHECK_F( ZSTD_resetCCtx_internal(cctx, params, pledgedSrcSize, |
@@ -2397,7 +2978,7 b' size_t ZSTD_compressBegin_internal(ZSTD_' | |||
|
2397 | 2978 | { |
|
2398 | 2979 | size_t const dictID = ZSTD_compress_insertDictionary( |
|
2399 | 2980 | cctx->blockState.prevCBlock, &cctx->blockState.matchState, |
|
2400 | ¶ms, dict, dictSize, dictContentType, cctx->entropyWorkspace); | |
|
2981 | ¶ms, dict, dictSize, dictContentType, dtlm, cctx->entropyWorkspace); | |
|
2401 | 2982 | if (ZSTD_isError(dictID)) return dictID; |
|
2402 | 2983 | assert(dictID <= (size_t)(U32)-1); |
|
2403 | 2984 | cctx->dictID = (U32)dictID; |
@@ -2408,6 +2989,7 b' size_t ZSTD_compressBegin_internal(ZSTD_' | |||
|
2408 | 2989 | size_t ZSTD_compressBegin_advanced_internal(ZSTD_CCtx* cctx, |
|
2409 | 2990 | const void* dict, size_t dictSize, |
|
2410 | 2991 | ZSTD_dictContentType_e dictContentType, |
|
2992 | ZSTD_dictTableLoadMethod_e dtlm, | |
|
2411 | 2993 | const ZSTD_CDict* cdict, |
|
2412 | 2994 | ZSTD_CCtx_params params, |
|
2413 | 2995 | unsigned long long pledgedSrcSize) |
@@ -2416,7 +2998,7 b' size_t ZSTD_compressBegin_advanced_inter' | |||
|
2416 | 2998 | /* compression parameters verification and optimization */ |
|
2417 | 2999 | CHECK_F( ZSTD_checkCParams(params.cParams) ); |
|
2418 | 3000 | return ZSTD_compressBegin_internal(cctx, |
|
2419 | dict, dictSize, dictContentType, | |
|
3001 | dict, dictSize, dictContentType, dtlm, | |
|
2420 | 3002 | cdict, |
|
2421 | 3003 | params, pledgedSrcSize, |
|
2422 | 3004 | ZSTDb_not_buffered); |
@@ -2431,7 +3013,7 b' size_t ZSTD_compressBegin_advanced(ZSTD_' | |||
|
2431 | 3013 | ZSTD_CCtx_params const cctxParams = |
|
2432 | 3014 | ZSTD_assignParamsToCCtxParams(cctx->requestedParams, params); |
|
2433 | 3015 | return ZSTD_compressBegin_advanced_internal(cctx, |
|
2434 | dict, dictSize, ZSTD_dct_auto, | |
|
3016 | dict, dictSize, ZSTD_dct_auto, ZSTD_dtlm_fast, | |
|
2435 | 3017 | NULL /*cdict*/, |
|
2436 | 3018 | cctxParams, pledgedSrcSize); |
|
2437 | 3019 | } |
@@ -2442,7 +3024,7 b' size_t ZSTD_compressBegin_usingDict(ZSTD' | |||
|
2442 | 3024 | ZSTD_CCtx_params const cctxParams = |
|
2443 | 3025 | ZSTD_assignParamsToCCtxParams(cctx->requestedParams, params); |
|
2444 | 3026 | DEBUGLOG(4, "ZSTD_compressBegin_usingDict (dictSize=%u)", (U32)dictSize); |
|
2445 | return ZSTD_compressBegin_internal(cctx, dict, dictSize, ZSTD_dct_auto, NULL, | |
|
3027 | return ZSTD_compressBegin_internal(cctx, dict, dictSize, ZSTD_dct_auto, ZSTD_dtlm_fast, NULL, | |
|
2446 | 3028 | cctxParams, ZSTD_CONTENTSIZE_UNKNOWN, ZSTDb_not_buffered); |
|
2447 | 3029 | } |
|
2448 | 3030 | |
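Every dictionary-loading path in the hunks above now threads a ZSTD_dictTableLoadMethod_e argument (dtlm; the enum is added to zstd_compress_internal.h further down). The call-site convention visible in this diff: one-shot and streaming entry points pass ZSTD_dtlm_fast, while CDict creation below passes ZSTD_dtlm_full, because a dictionary that will be reused is worth indexing densely. A minimal sketch of that convention (hypothetical helper, not part of the patch):

    /* illustrative only: mirrors the call-site pattern in this diff */
    static ZSTD_dictTableLoadMethod_e chooseDtlm(int buildingReusableCDict)
    {
        /* full indexing costs more at load time but amortizes over many
         * compressions; one-shot loads keep the cheap path */
        return buildingReusableCDict ? ZSTD_dtlm_full : ZSTD_dtlm_fast;
    }
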
@@ -2505,7 +3087,9 b' size_t ZSTD_compressEnd (ZSTD_CCtx* cctx' | |||
|
2505 | 3087 | if (ZSTD_isError(cSize)) return cSize; |
|
2506 | 3088 | endResult = ZSTD_writeEpilogue(cctx, (char*)dst + cSize, dstCapacity-cSize); |
|
2507 | 3089 | if (ZSTD_isError(endResult)) return endResult; |
|
2508 | if (cctx->appliedParams.fParams.contentSizeFlag) { /* control src size */ | |

3090 | assert(!(cctx->appliedParams.fParams.contentSizeFlag && cctx->pledgedSrcSizePlusOne == 0)); | |
|
3091 | if (cctx->pledgedSrcSizePlusOne != 0) { /* control src size */ | |
|
3092 | ZSTD_STATIC_ASSERT(ZSTD_CONTENTSIZE_UNKNOWN == (unsigned long long)-1); | |
|
2509 | 3093 | DEBUGLOG(4, "end of frame : controlling src size"); |
|
2510 | 3094 | if (cctx->pledgedSrcSizePlusOne != cctx->consumedSrcSize+1) { |
|
2511 | 3095 | DEBUGLOG(4, "error : pledgedSrcSize = %u, while realSrcSize = %u", |
@@ -2517,22 +3101,22 b' size_t ZSTD_compressEnd (ZSTD_CCtx* cctx' | |||
|
2517 | 3101 | |
|
2518 | 3102 | |
|
2519 | 3103 | static size_t ZSTD_compress_internal (ZSTD_CCtx* cctx, |
|
2520 | void* dst, size_t dstCapacity, | |
|
2521 | const void* src, size_t srcSize, | |
|
2522 | const void* dict,size_t dictSize, | |
|
2523 | ZSTD_parameters params) | |
|
3104 | void* dst, size_t dstCapacity, | |
|
3105 | const void* src, size_t srcSize, | |
|
3106 | const void* dict,size_t dictSize, | |
|
3107 | ZSTD_parameters params) | |
|
2524 | 3108 | { |
|
2525 | 3109 | ZSTD_CCtx_params const cctxParams = |
|
2526 | 3110 | ZSTD_assignParamsToCCtxParams(cctx->requestedParams, params); |
|
2527 | 3111 | DEBUGLOG(4, "ZSTD_compress_internal"); |
|
2528 | 3112 | return ZSTD_compress_advanced_internal(cctx, |
|
2529 | dst, dstCapacity, | |
|
2530 | src, srcSize, | |
|
2531 | dict, dictSize, | |
|
2532 | cctxParams); | |
|
3113 | dst, dstCapacity, | |
|
3114 | src, srcSize, | |
|
3115 | dict, dictSize, | |
|
3116 | cctxParams); | |
|
2533 | 3117 | } |
|
2534 | 3118 | |
|
2535 | size_t ZSTD_compress_advanced (ZSTD_CCtx* ctx, | |
|
3119 | size_t ZSTD_compress_advanced (ZSTD_CCtx* cctx, | |
|
2536 | 3120 | void* dst, size_t dstCapacity, |
|
2537 | 3121 | const void* src, size_t srcSize, |
|
2538 | 3122 | const void* dict,size_t dictSize, |
@@ -2540,7 +3124,11 b' size_t ZSTD_compress_advanced (ZSTD_CCtx' | |||
|
2540 | 3124 | { |
|
2541 | 3125 | DEBUGLOG(4, "ZSTD_compress_advanced"); |
|
2542 | 3126 | CHECK_F(ZSTD_checkCParams(params.cParams)); |
|
2543 | return ZSTD_compress_internal(ctx, dst, dstCapacity, src, srcSize, dict, dictSize, params); | |
|
3127 | return ZSTD_compress_internal(cctx, | |
|
3128 | dst, dstCapacity, | |
|
3129 | src, srcSize, | |
|
3130 | dict, dictSize, | |
|
3131 | params); | |
|
2544 | 3132 | } |
|
2545 | 3133 | |
|
2546 | 3134 | /* Internal */ |
@@ -2551,37 +3139,44 b' size_t ZSTD_compress_advanced_internal(' | |||
|
2551 | 3139 | const void* dict,size_t dictSize, |
|
2552 | 3140 | ZSTD_CCtx_params params) |
|
2553 | 3141 | { |
|
2554 | DEBUGLOG(4, "ZSTD_compress_advanced_internal (srcSize:%u)", | |
|
2555 | (U32)srcSize); | |
|
2556 | CHECK_F( ZSTD_compressBegin_internal(cctx, dict, dictSize, ZSTD_dct_auto, NULL, | |
|
2557 | params, srcSize, ZSTDb_not_buffered) ); | |

3142 | DEBUGLOG(4, "ZSTD_compress_advanced_internal (srcSize:%u)", (U32)srcSize); | |
|
3143 | CHECK_F( ZSTD_compressBegin_internal(cctx, | |
|
3144 | dict, dictSize, ZSTD_dct_auto, ZSTD_dtlm_fast, NULL, | |
|
3145 | params, srcSize, ZSTDb_not_buffered) ); | |
|
2558 | 3146 | return ZSTD_compressEnd(cctx, dst, dstCapacity, src, srcSize); |
|
2559 | 3147 | } |
|
2560 | 3148 | |
|
2561 | size_t ZSTD_compress_usingDict(ZSTD_CCtx* cctx, | |

2562 |

3149 | size_t ZSTD_compress_usingDict(ZSTD_CCtx* cctx, | |
|
3150 | void* dst, size_t dstCapacity, | |
|
3151 | const void* src, size_t srcSize, | |
|
3152 | const void* dict, size_t dictSize, | |
|
3153 | int compressionLevel) | |
|
2563 | 3154 | { |
|
2564 | ZSTD_parameters const params = ZSTD_getParams(compressionLevel, srcSize, dict ? dictSize : 0); | |

3155 | ZSTD_parameters const params = ZSTD_getParams(compressionLevel, srcSize + (!srcSize), dict ? dictSize : 0); | |
|
2565 | 3156 | ZSTD_CCtx_params cctxParams = ZSTD_assignParamsToCCtxParams(cctx->requestedParams, params); |
|
2566 | 3157 | assert(params.fParams.contentSizeFlag == 1); |
|
2567 | ZSTD_CCtxParam_setParameter(&cctxParams, ZSTD_p_compressLiterals, compressionLevel>=0); | |
|
2568 | 3158 | return ZSTD_compress_advanced_internal(cctx, dst, dstCapacity, src, srcSize, dict, dictSize, cctxParams); |
|
2569 | 3159 | } |
|
2570 | 3160 | |
|
2571 | size_t ZSTD_compressCCtx (ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize, int compressionLevel) | |
|
3161 | size_t ZSTD_compressCCtx(ZSTD_CCtx* cctx, | |
|
3162 | void* dst, size_t dstCapacity, | |
|
3163 | const void* src, size_t srcSize, | |
|
3164 | int compressionLevel) | |
|
2572 | 3165 | { |
|
2573 | 3166 | DEBUGLOG(4, "ZSTD_compressCCtx (srcSize=%u)", (U32)srcSize); |
|
3167 | assert(cctx != NULL); | |
|
2574 | 3168 | return ZSTD_compress_usingDict(cctx, dst, dstCapacity, src, srcSize, NULL, 0, compressionLevel); |
|
2575 | 3169 | } |
|
2576 | 3170 | |
|
2577 | size_t ZSTD_compress(void* dst, size_t dstCapacity, | |

3171 | size_t ZSTD_compress(void* dst, size_t dstCapacity, | |
|
3172 | const void* src, size_t srcSize, | |
|
3173 | int compressionLevel) | |
|
2578 | 3174 | { |
|
2579 | 3175 | size_t result; |
|
2580 | 3176 | ZSTD_CCtx ctxBody; |
|
2581 | memset(&ctxBody, 0, sizeof(ctxBody)); | |
|
2582 | ctxBody.customMem = ZSTD_defaultCMem; | |
|
3177 | ZSTD_initCCtx(&ctxBody, ZSTD_defaultCMem); | |
|
2583 | 3178 | result = ZSTD_compressCCtx(&ctxBody, dst, dstCapacity, src, srcSize, compressionLevel); |
|
2584 | ZSTD_free(ctxBody.workSpace, ZSTD_defaultCMem); /* can't free ctxBody itself, as it's on stack */ | |

3179 | ZSTD_freeCCtxContent(&ctxBody); /* can't free ctxBody itself, as it's on stack; free only heap content */ | |
|
2585 | 3180 | return result; |
|
2586 | 3181 | } |
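ZSTD_compress() keeps its context on the stack, so the rewritten cleanup matters: ZSTD_initCCtx() replaces the manual memset/customMem setup, and ZSTD_freeCCtxContent() releases only the heap-owned members, never the struct itself. The ownership pattern, sketched from the lines above:

    ZSTD_CCtx ctxBody;                          /* whole struct on the stack */
    ZSTD_initCCtx(&ctxBody, ZSTD_defaultCMem);  /* zero it, record allocator */
    /* ... compress with &ctxBody ... */
    ZSTD_freeCCtxContent(&ctxBody);             /* free heap content only;
                                                   freeing &ctxBody would be a bug */
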
|
2587 | 3182 | |
@@ -2619,9 +3214,9 b' static size_t ZSTD_initCDict_internal(' | |||
|
2619 | 3214 | ZSTD_dictContentType_e dictContentType, |
|
2620 | 3215 | ZSTD_compressionParameters cParams) |
|
2621 | 3216 | { |
|
2622 | DEBUGLOG(3, "ZSTD_initCDict_internal | |

3217 | DEBUGLOG(3, "ZSTD_initCDict_internal (dictContentType:%u)", (U32)dictContentType); | |
|
2623 | 3218 | assert(!ZSTD_checkCParams(cParams)); |
|
2624 | cdict->cParams = cParams; | |
|
3219 | cdict->matchState.cParams = cParams; | |
|
2625 | 3220 | if ((dictLoadMethod == ZSTD_dlm_byRef) || (!dictBuffer) || (!dictSize)) { |
|
2626 | 3221 | cdict->dictBuffer = NULL; |
|
2627 | 3222 | cdict->dictContent = dictBuffer; |
@@ -2654,7 +3249,7 b' static size_t ZSTD_initCDict_internal(' | |||
|
2654 | 3249 | { size_t const dictID = ZSTD_compress_insertDictionary( |
|
2655 | 3250 | &cdict->cBlockState, &cdict->matchState, ¶ms, |
|
2656 | 3251 | cdict->dictContent, cdict->dictContentSize, |
|
2657 | dictContentType, cdict->workspace); | |
|
3252 | dictContentType, ZSTD_dtlm_full, cdict->workspace); | |
|
2658 | 3253 | if (ZSTD_isError(dictID)) return dictID; |
|
2659 | 3254 | assert(dictID <= (size_t)(U32)-1); |
|
2660 | 3255 | cdict->dictID = (U32)dictID; |
@@ -2775,7 +3370,7 b' const ZSTD_CDict* ZSTD_initStaticCDict(' | |||
|
2775 | 3370 | ZSTD_compressionParameters ZSTD_getCParamsFromCDict(const ZSTD_CDict* cdict) |
|
2776 | 3371 | { |
|
2777 | 3372 | assert(cdict != NULL); |
|
2778 | return cdict->cParams; | |
|
3373 | return cdict->matchState.cParams; | |
|
2779 | 3374 | } |
|
2780 | 3375 | |
|
2781 | 3376 | /* ZSTD_compressBegin_usingCDict_advanced() : |
@@ -2799,7 +3394,7 b' size_t ZSTD_compressBegin_usingCDict_adv' | |||
|
2799 | 3394 | } |
|
2800 | 3395 | params.fParams = fParams; |
|
2801 | 3396 | return ZSTD_compressBegin_internal(cctx, |
|
2802 | NULL, 0, ZSTD_dct_auto, | |
|
3397 | NULL, 0, ZSTD_dct_auto, ZSTD_dtlm_fast, | |
|
2803 | 3398 | cdict, |
|
2804 | 3399 | params, pledgedSrcSize, |
|
2805 | 3400 | ZSTDb_not_buffered); |
@@ -2813,7 +3408,7 b' size_t ZSTD_compressBegin_usingCDict(ZST' | |||
|
2813 | 3408 | { |
|
2814 | 3409 | ZSTD_frameParameters const fParams = { 0 /*content*/, 0 /*checksum*/, 0 /*noDictID*/ }; |
|
2815 | 3410 | DEBUGLOG(4, "ZSTD_compressBegin_usingCDict : dictIDFlag == %u", !fParams.noDictIDFlag); |
|
2816 | return ZSTD_compressBegin_usingCDict_advanced(cctx, cdict, fParams, | |

3411 | return ZSTD_compressBegin_usingCDict_advanced(cctx, cdict, fParams, ZSTD_CONTENTSIZE_UNKNOWN); | |
|
2817 | 3412 | } |
|
2818 | 3413 | |
|
2819 | 3414 | size_t ZSTD_compress_usingCDict_advanced(ZSTD_CCtx* cctx, |
@@ -2880,16 +3475,17 b' size_t ZSTD_CStreamOutSize(void)' | |||
|
2880 | 3475 | static size_t ZSTD_resetCStream_internal(ZSTD_CStream* cctx, |
|
2881 | 3476 | const void* const dict, size_t const dictSize, ZSTD_dictContentType_e const dictContentType, |
|
2882 | 3477 | const ZSTD_CDict* const cdict, |
|
2883 | ZSTD_CCtx_params const params, unsigned long long const pledgedSrcSize) | |

3478 | ZSTD_CCtx_params params, unsigned long long const pledgedSrcSize) | |
|
2884 | 3479 | { |
|
2885 | DEBUGLOG(4, "ZSTD_resetCStream_internal (disableLiteralCompression=%i)", | |

2886 | params.disableLiteralCompression); | |
|
3480 | DEBUGLOG(4, "ZSTD_resetCStream_internal"); | |
|
3481 | /* Finalize the compression parameters */ | |
|
3482 | params.cParams = ZSTD_getCParamsFromCCtxParams(¶ms, pledgedSrcSize, dictSize); | |
|
2887 | 3483 | /* params are supposed to be fully validated at this point */ |
|
2888 | 3484 | assert(!ZSTD_isError(ZSTD_checkCParams(params.cParams))); |
|
2889 | 3485 | assert(!((dict) && (cdict))); /* either dict or cdict, not both */ |
|
2890 | 3486 | |
|
2891 | 3487 | CHECK_F( ZSTD_compressBegin_internal(cctx, |
|
2892 | dict, dictSize, dictContentType, | |
|
3488 | dict, dictSize, dictContentType, ZSTD_dtlm_fast, | |
|
2893 | 3489 | cdict, |
|
2894 | 3490 | params, pledgedSrcSize, |
|
2895 | 3491 | ZSTDb_buffered) ); |
@@ -2912,7 +3508,6 b' size_t ZSTD_resetCStream(ZSTD_CStream* z' | |||
|
2912 | 3508 | DEBUGLOG(4, "ZSTD_resetCStream: pledgedSrcSize = %u", (U32)pledgedSrcSize); |
|
2913 | 3509 | if (pledgedSrcSize==0) pledgedSrcSize = ZSTD_CONTENTSIZE_UNKNOWN; |
|
2914 | 3510 | params.fParams.contentSizeFlag = 1; |
|
2915 | params.cParams = ZSTD_getCParamsFromCCtxParams(¶ms, pledgedSrcSize, 0); | |
|
2916 | 3511 | return ZSTD_resetCStream_internal(zcs, NULL, 0, ZSTD_dct_auto, zcs->cdict, params, pledgedSrcSize); |
|
2917 | 3512 | } |
|
2918 | 3513 | |
@@ -2925,6 +3520,7 b' size_t ZSTD_initCStream_internal(ZSTD_CS' | |||
|
2925 | 3520 | ZSTD_CCtx_params params, unsigned long long pledgedSrcSize) |
|
2926 | 3521 | { |
|
2927 | 3522 | DEBUGLOG(4, "ZSTD_initCStream_internal"); |
|
3523 | params.cParams = ZSTD_getCParamsFromCCtxParams(¶ms, pledgedSrcSize, dictSize); | |
|
2928 | 3524 | assert(!ZSTD_isError(ZSTD_checkCParams(params.cParams))); |
|
2929 | 3525 | assert(!((dict) && (cdict))); /* either dict or cdict, not both */ |
|
2930 | 3526 | |
@@ -2991,25 +3587,21 b' size_t ZSTD_initCStream_advanced(ZSTD_CS' | |||
|
2991 | 3587 | (U32)pledgedSrcSize, params.fParams.contentSizeFlag); |
|
2992 | 3588 | CHECK_F( ZSTD_checkCParams(params.cParams) ); |
|
2993 | 3589 | if ((pledgedSrcSize==0) && (params.fParams.contentSizeFlag==0)) pledgedSrcSize = ZSTD_CONTENTSIZE_UNKNOWN; /* for compatibility with older programs relying on this behavior. Users should now specify ZSTD_CONTENTSIZE_UNKNOWN. This line will be removed in the future. */ |
|
2994 |

2995 |

2996 | } | |
|
3590 | zcs->requestedParams = ZSTD_assignParamsToCCtxParams(zcs->requestedParams, params); | |
|
3591 | return ZSTD_initCStream_internal(zcs, dict, dictSize, NULL /*cdict*/, zcs->requestedParams, pledgedSrcSize); | |
|
2997 | 3592 | } |
|
2998 | 3593 | |
|
2999 | 3594 | size_t ZSTD_initCStream_usingDict(ZSTD_CStream* zcs, const void* dict, size_t dictSize, int compressionLevel) |
|
3000 | 3595 | { |
|
3001 | ZSTD_parameters const params = ZSTD_getParams(compressionLevel, 0, dictSize); | |
|
3002 | ZSTD_CCtx_params const cctxParams = | |
|
3003 | ZSTD_assignParamsToCCtxParams(zcs->requestedParams, params); | |
|
3004 | return ZSTD_initCStream_internal(zcs, dict, dictSize, NULL, cctxParams, ZSTD_CONTENTSIZE_UNKNOWN); | |
|
3596 | ZSTD_CCtxParams_init(&zcs->requestedParams, compressionLevel); | |
|
3597 | return ZSTD_initCStream_internal(zcs, dict, dictSize, NULL, zcs->requestedParams, ZSTD_CONTENTSIZE_UNKNOWN); | |
|
3005 | 3598 | } |
|
3006 | 3599 | |
|
3007 | 3600 | size_t ZSTD_initCStream_srcSize(ZSTD_CStream* zcs, int compressionLevel, unsigned long long pss) |
|
3008 | 3601 | { |
|
3009 | 3602 | U64 const pledgedSrcSize = (pss==0) ? ZSTD_CONTENTSIZE_UNKNOWN : pss; /* temporary : 0 interpreted as "unknown" during transition period. Users willing to specify "unknown" **must** use ZSTD_CONTENTSIZE_UNKNOWN. `0` will be interpreted as "empty" in the future */ |
|
3010 | ZSTD_parameters const params = ZSTD_getParams(compressionLevel, pledgedSrcSize, 0); | |
|
3011 | ZSTD_CCtx_params const cctxParams = ZSTD_assignParamsToCCtxParams(zcs->requestedParams, params); | |
|
3012 | return ZSTD_initCStream_internal(zcs, NULL, 0, NULL, cctxParams, pledgedSrcSize); | |
|
3603 | ZSTD_CCtxParams_init(&zcs->requestedParams, compressionLevel); | |
|
3604 | return ZSTD_initCStream_internal(zcs, NULL, 0, NULL, zcs->requestedParams, pledgedSrcSize); | |
|
3013 | 3605 | } |
|
3014 | 3606 | |
|
3015 | 3607 | size_t ZSTD_initCStream(ZSTD_CStream* zcs, int compressionLevel) |
@@ -3073,7 +3665,7 b' size_t ZSTD_compressStream_generic(ZSTD_' | |||
|
3073 | 3665 | ip = iend; |
|
3074 | 3666 | op += cSize; |
|
3075 | 3667 | zcs->frameEnded = 1; |
|
3076 | ZSTD_startNewCompression(zcs); | |

3668 | ZSTD_CCtx_reset(zcs); | |
|
3077 | 3669 | someMoreWork = 0; break; |
|
3078 | 3670 | } |
|
3079 | 3671 | /* complete loading into inBuffer */ |
@@ -3126,7 +3718,7 b' size_t ZSTD_compressStream_generic(ZSTD_' | |||
|
3126 | 3718 | if (zcs->frameEnded) { |
|
3127 | 3719 | DEBUGLOG(5, "Frame completed directly in outBuffer"); |
|
3128 | 3720 | someMoreWork = 0; |
|
3129 | ZSTD_startNewCompression(zcs); | |

3721 | ZSTD_CCtx_reset(zcs); | |
|
3130 | 3722 | } |
|
3131 | 3723 | break; |
|
3132 | 3724 | } |
@@ -3154,7 +3746,7 b' size_t ZSTD_compressStream_generic(ZSTD_' | |||
|
3154 | 3746 | if (zcs->frameEnded) { |
|
3155 | 3747 | DEBUGLOG(5, "Frame completed on flush"); |
|
3156 | 3748 | someMoreWork = 0; |
|
3157 | ZSTD_startNewCompression(zcs); | |

3749 | ZSTD_CCtx_reset(zcs); | |
|
3158 | 3750 | break; |
|
3159 | 3751 | } |
|
3160 | 3752 | zcs->streamStage = zcss_load; |
@@ -3207,19 +3799,16 b' size_t ZSTD_compress_generic (ZSTD_CCtx*' | |||
|
3207 | 3799 | params.cParams = ZSTD_getCParamsFromCCtxParams( |
|
3208 | 3800 | &cctx->requestedParams, cctx->pledgedSrcSizePlusOne-1, 0 /*dictSize*/); |
|
3209 | 3801 | |
|
3802 | ||
|
3210 | 3803 | #ifdef ZSTD_MULTITHREAD |
|
3211 | 3804 | if ((cctx->pledgedSrcSizePlusOne-1) <= ZSTDMT_JOBSIZE_MIN) { |
|
3212 | 3805 | params.nbWorkers = 0; /* do not invoke multi-threading when src size is too small */ |
|
3213 | 3806 | } |
|
3214 | 3807 | if (params.nbWorkers > 0) { |
|
3215 | 3808 | /* mt context creation */ |
|
3216 | if (cctx->mtctx == NULL || (params.nbWorkers != ZSTDMT_getNbWorkers(cctx->mtctx))) { | |
|
3809 | if (cctx->mtctx == NULL) { | |
|
3217 | 3810 | DEBUGLOG(4, "ZSTD_compress_generic: creating new mtctx for nbWorkers=%u", |
|
3218 | 3811 | params.nbWorkers); |
|
3219 | if (cctx->mtctx != NULL) | |
|
3220 | DEBUGLOG(4, "ZSTD_compress_generic: previous nbWorkers was %u", | |
|
3221 | ZSTDMT_getNbWorkers(cctx->mtctx)); | |
|
3222 | ZSTDMT_freeCCtx(cctx->mtctx); | |
|
3223 | 3812 | cctx->mtctx = ZSTDMT_createCCtx_advanced(params.nbWorkers, cctx->customMem); |
|
3224 | 3813 | if (cctx->mtctx == NULL) return ERROR(memory_allocation); |
|
3225 | 3814 | } |
@@ -3251,8 +3840,9 b' size_t ZSTD_compress_generic (ZSTD_CCtx*' | |||
|
3251 | 3840 | { size_t const flushMin = ZSTDMT_compressStream_generic(cctx->mtctx, output, input, endOp); |
|
3252 | 3841 | if ( ZSTD_isError(flushMin) |
|
3253 | 3842 | || (endOp == ZSTD_e_end && flushMin == 0) ) { /* compression completed */ |
|
3254 | ZSTD_startNewCompression(cctx); | |

3843 | ZSTD_CCtx_reset(cctx); | |
|
3255 | 3844 | } |
|
3845 | DEBUGLOG(5, "completed ZSTD_compress_generic delegating to ZSTDMT_compressStream_generic"); | |
|
3256 | 3846 | return flushMin; |
|
3257 | 3847 | } } |
|
3258 | 3848 | #endif |
@@ -3308,82 +3898,83 b' size_t ZSTD_endStream(ZSTD_CStream* zcs,' | |||
|
3308 | 3898 | |
|
3309 | 3899 | #define ZSTD_MAX_CLEVEL 22 |
|
3310 | 3900 | int ZSTD_maxCLevel(void) { return ZSTD_MAX_CLEVEL; } |
|
3901 | int ZSTD_minCLevel(void) { return (int)-ZSTD_TARGETLENGTH_MAX; } | |
|
3311 | 3902 | |
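ZSTD_minCLevel() is new alongside ZSTD_maxCLevel(): it advertises the fast, negative end of the level range, bounded by ZSTD_TARGETLENGTH_MAX because a negative level acts as an acceleration factor applied on top of the "base for negative levels" row of the tables below. A sketch of the mapping, stated as an assumption since the clamping code sits outside this hunk:

    /* hypothetical sketch of negative-level handling */
    ZSTD_compressionParameters cp = ZSTD_defaultCParameters[tableID][0]; /* base row */
    if (compressionLevel < 0)
        cp.targetLength = (unsigned)(-compressionLevel);  /* larger = faster */
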
|
3312 | 3903 | static const ZSTD_compressionParameters ZSTD_defaultCParameters[4][ZSTD_MAX_CLEVEL+1] = { |
|
3313 | 3904 | { /* "default" - guarantees a monotonically increasing memory budget */ |
|
3314 | 3905 | /* W, C, H, S, L, TL, strat */ |
|
3315 | 3906 | { 19, 12, 13, 1, 6, 1, ZSTD_fast }, /* base for negative levels */ |
|
3316 | { 19, 13, 14, 1, 7, | |

3317 | { 19, 15, 16, 1, 6, | |

3318 | { 20, 16, 17, 1, 5, | |

3319 | { 20, 1 | |

3320 | { 20, 1 | |

3321 | { 21, 1 | |

3322 | { 21, 18, 19, 3, 5, | |

3323 | { 21, 1 | |

3324 | { 21, 19, 20, | |

3325 | { 21, | |

3326 | { 2 | |

3907 | { 19, 13, 14, 1, 7, 0, ZSTD_fast }, /* level 1 */ | |
|
3908 | { 19, 15, 16, 1, 6, 0, ZSTD_fast }, /* level 2 */ | |
|
3909 | { 20, 16, 17, 1, 5, 1, ZSTD_dfast }, /* level 3 */ | |
|
3910 | { 20, 18, 18, 1, 5, 1, ZSTD_dfast }, /* level 4 */ | |
|
3911 | { 20, 18, 18, 2, 5, 2, ZSTD_greedy }, /* level 5 */ | |
|
3912 | { 21, 18, 19, 2, 5, 4, ZSTD_lazy }, /* level 6 */ | |
|
3913 | { 21, 18, 19, 3, 5, 8, ZSTD_lazy2 }, /* level 7 */ | |
|
3914 | { 21, 19, 19, 3, 5, 16, ZSTD_lazy2 }, /* level 8 */ | |
|
3915 | { 21, 19, 20, 4, 5, 16, ZSTD_lazy2 }, /* level 9 */ | |
|
3916 | { 21, 20, 21, 4, 5, 16, ZSTD_lazy2 }, /* level 10 */ | |
|
3917 | { 21, 21, 22, 4, 5, 16, ZSTD_lazy2 }, /* level 11 */ | |
|
3327 | 3918 | { 22, 20, 22, 5, 5, 16, ZSTD_lazy2 }, /* level 12 */ |
|
3328 | 3919 | { 22, 21, 22, 4, 5, 32, ZSTD_btlazy2 }, /* level 13 */ |
|
3329 | 3920 | { 22, 21, 22, 5, 5, 32, ZSTD_btlazy2 }, /* level 14 */ |
|
3330 | 3921 | { 22, 22, 22, 6, 5, 32, ZSTD_btlazy2 }, /* level 15 */ |
|
3331 | 3922 | { 22, 21, 22, 4, 5, 48, ZSTD_btopt }, /* level 16 */ |
|
3332 | { 23, 22, 22, 4, 4, 4 | |

3333 | { 23, 2 | |

3334 | { 23, 2 | |

3335 | { 25, 25, 23, 7, 3, | |

3336 | { 26, 26, 24, 7, 3, | |

3337 | { 27, 27, 25, 9, 3, | |

3923 | { 23, 22, 22, 4, 4, 64, ZSTD_btopt }, /* level 17 */ | |
|
3924 | { 23, 23, 22, 6, 3,256, ZSTD_btopt }, /* level 18 */ | |
|
3925 | { 23, 24, 22, 7, 3,256, ZSTD_btultra }, /* level 19 */ | |
|
3926 | { 25, 25, 23, 7, 3,256, ZSTD_btultra }, /* level 20 */ | |
|
3927 | { 26, 26, 24, 7, 3,512, ZSTD_btultra }, /* level 21 */ | |
|
3928 | { 27, 27, 25, 9, 3,999, ZSTD_btultra }, /* level 22 */ | |
|
3338 | 3929 | }, |
|
3339 | 3930 | { /* for srcSize <= 256 KB */ |
|
3340 | 3931 | /* W, C, H, S, L, T, strat */ |
|
3341 | 3932 | { 18, 12, 13, 1, 5, 1, ZSTD_fast }, /* base for negative levels */ |
|
3342 | { 18, 13, 14, 1, 6, | |

3343 | { 18, 14, 1 | |

3344 | { 18, 16, 1 | |

3345 | { 18, 1 | |

3346 | { 18, 1 | |

3347 | { 18, 1 | |

3348 | { 18, 1 | |

3349 | { 18, 1 | |

3350 | { 18, 1 | |

3351 | { 18, 1 | |

3352 | { 18, 18, 1 | |

3353 | { 18, 1 | |

3354 | { 18, 19, 1 | |

3355 | { 18, 18, 1 | |

3356 | { 18, 18, 1 | |

3357 | { 18, 19, 1 | |

3358 | { 18, 19, 1 | |

3359 | { 18, 19, 1 | |

3360 | { 18, 19, 1 | |

3361 | { 18, 19, 1 | |

3362 | { 18, 19, 1 | |

3363 | { 18, 19, 1 | |

3933 | { 18, 13, 14, 1, 6, 0, ZSTD_fast }, /* level 1 */ | |
|
3934 | { 18, 14, 14, 1, 5, 1, ZSTD_dfast }, /* level 2 */ | |
|
3935 | { 18, 16, 16, 1, 4, 1, ZSTD_dfast }, /* level 3 */ | |
|
3936 | { 18, 16, 17, 2, 5, 2, ZSTD_greedy }, /* level 4.*/ | |
|
3937 | { 18, 18, 18, 3, 5, 2, ZSTD_greedy }, /* level 5.*/ | |
|
3938 | { 18, 18, 19, 3, 5, 4, ZSTD_lazy }, /* level 6.*/ | |
|
3939 | { 18, 18, 19, 4, 4, 4, ZSTD_lazy }, /* level 7 */ | |
|
3940 | { 18, 18, 19, 4, 4, 8, ZSTD_lazy2 }, /* level 8 */ | |
|
3941 | { 18, 18, 19, 5, 4, 8, ZSTD_lazy2 }, /* level 9 */ | |
|
3942 | { 18, 18, 19, 6, 4, 8, ZSTD_lazy2 }, /* level 10 */ | |
|
3943 | { 18, 18, 19, 5, 4, 16, ZSTD_btlazy2 }, /* level 11.*/ | |
|
3944 | { 18, 19, 19, 6, 4, 16, ZSTD_btlazy2 }, /* level 12.*/ | |
|
3945 | { 18, 19, 19, 8, 4, 16, ZSTD_btlazy2 }, /* level 13 */ | |
|
3946 | { 18, 18, 19, 4, 4, 24, ZSTD_btopt }, /* level 14.*/ | |
|
3947 | { 18, 18, 19, 4, 3, 24, ZSTD_btopt }, /* level 15.*/ | |
|
3948 | { 18, 19, 19, 6, 3, 64, ZSTD_btopt }, /* level 16.*/ | |
|
3949 | { 18, 19, 19, 8, 3,128, ZSTD_btopt }, /* level 17.*/ | |
|
3950 | { 18, 19, 19, 10, 3,256, ZSTD_btopt }, /* level 18.*/ | |
|
3951 | { 18, 19, 19, 10, 3,256, ZSTD_btultra }, /* level 19.*/ | |
|
3952 | { 18, 19, 19, 11, 3,512, ZSTD_btultra }, /* level 20.*/ | |
|
3953 | { 18, 19, 19, 12, 3,512, ZSTD_btultra }, /* level 21.*/ | |
|
3954 | { 18, 19, 19, 13, 3,999, ZSTD_btultra }, /* level 22.*/ | |
|
3364 | 3955 | }, |
|
3365 | 3956 | { /* for srcSize <= 128 KB */ |
|
3366 | 3957 | /* W, C, H, S, L, T, strat */ |
|
3367 | { 17, 12, 12, 1, 5, 1, ZSTD_fast }, /* | |

3368 | { 17, 12, 13, 1, 6, | |

3369 | { 17, 13, 1 | |

3370 | { 17, 1 | |

3371 | { 17, 1 | |

3372 | { 17, 1 | |

3373 | { 17, 1 | |

3374 | { 17, 1 | |

3958 | { 17, 12, 12, 1, 5, 1, ZSTD_fast }, /* base for negative levels */ | |
|
3959 | { 17, 12, 13, 1, 6, 0, ZSTD_fast }, /* level 1 */ | |
|
3960 | { 17, 13, 15, 1, 5, 0, ZSTD_fast }, /* level 2 */ | |
|
3961 | { 17, 15, 16, 2, 5, 1, ZSTD_dfast }, /* level 3 */ | |
|
3962 | { 17, 17, 17, 2, 4, 1, ZSTD_dfast }, /* level 4 */ | |
|
3963 | { 17, 16, 17, 3, 4, 2, ZSTD_greedy }, /* level 5 */ | |
|
3964 | { 17, 17, 17, 3, 4, 4, ZSTD_lazy }, /* level 6 */ | |
|
3965 | { 17, 17, 17, 3, 4, 8, ZSTD_lazy2 }, /* level 7 */ | |
|
3375 | 3966 | { 17, 17, 17, 4, 4, 8, ZSTD_lazy2 }, /* level 8 */ |
|
3376 | 3967 | { 17, 17, 17, 5, 4, 8, ZSTD_lazy2 }, /* level 9 */ |
|
3377 | 3968 | { 17, 17, 17, 6, 4, 8, ZSTD_lazy2 }, /* level 10 */ |
|
3378 | 3969 | { 17, 17, 17, 7, 4, 8, ZSTD_lazy2 }, /* level 11 */ |
|
3379 | { 17, 1 | |

3380 | { 17, 18, 17, | |

3381 | { 17, 1 | |

3382 | { 17, 1 | |

3383 | { 17, 18, 17, 7, 3, | |

3384 | { 17, 18, 17, 7, 3, | |

3385 | { 17, 18, 17, | |

3386 | { 17, 18, 17, 8, 3,256, ZSTD_bt | |

3970 | { 17, 18, 17, 6, 4, 16, ZSTD_btlazy2 }, /* level 12 */ | |
|
3971 | { 17, 18, 17, 8, 4, 16, ZSTD_btlazy2 }, /* level 13.*/ | |
|
3972 | { 17, 18, 17, 4, 4, 32, ZSTD_btopt }, /* level 14.*/ | |
|
3973 | { 17, 18, 17, 6, 3, 64, ZSTD_btopt }, /* level 15.*/ | |
|
3974 | { 17, 18, 17, 7, 3,128, ZSTD_btopt }, /* level 16.*/ | |
|
3975 | { 17, 18, 17, 7, 3,256, ZSTD_btopt }, /* level 17.*/ | |
|
3976 | { 17, 18, 17, 8, 3,256, ZSTD_btopt }, /* level 18.*/ | |
|
3977 | { 17, 18, 17, 8, 3,256, ZSTD_btultra }, /* level 19.*/ | |
|
3387 | 3978 | { 17, 18, 17, 9, 3,256, ZSTD_btultra }, /* level 20.*/ |
|
3388 | 3979 | { 17, 18, 17, 10, 3,256, ZSTD_btultra }, /* level 21.*/ |
|
3389 | 3980 | { 17, 18, 17, 11, 3,512, ZSTD_btultra }, /* level 22.*/ |
@@ -3391,28 +3982,28 b' static const ZSTD_compressionParameters ' | |||
|
3391 | 3982 | { /* for srcSize <= 16 KB */ |
|
3392 | 3983 | /* W, C, H, S, L, T, strat */ |
|
3393 | 3984 | { 14, 12, 13, 1, 5, 1, ZSTD_fast }, /* base for negative levels */ |
|
3394 | { 14, 14, 1 | |

3395 | { 14, 14, 1 | |

3396 | { 14, 14, 14, | |

3397 | { 14, 14, 14, 4, 4, | |

3398 | { 14, 14, 14, 3, 4, | |

3399 | { 14, 14, 14, 4, 4, | |

3400 | { 14, 14, 14, | |

3401 | { 14, 14, 14, | |

3402 | { 14, 15, 14, | |

3403 | { 14, 15, 14, | |

3404 | { 14, 15, 14, | |

3985 | { 14, 14, 15, 1, 5, 0, ZSTD_fast }, /* level 1 */ | |
|
3986 | { 14, 14, 15, 1, 4, 0, ZSTD_fast }, /* level 2 */ | |
|
3987 | { 14, 14, 14, 2, 4, 1, ZSTD_dfast }, /* level 3.*/ | |
|
3988 | { 14, 14, 14, 4, 4, 2, ZSTD_greedy }, /* level 4.*/ | |
|
3989 | { 14, 14, 14, 3, 4, 4, ZSTD_lazy }, /* level 5.*/ | |
|
3990 | { 14, 14, 14, 4, 4, 8, ZSTD_lazy2 }, /* level 6 */ | |
|
3991 | { 14, 14, 14, 6, 4, 8, ZSTD_lazy2 }, /* level 7 */ | |
|
3992 | { 14, 14, 14, 8, 4, 8, ZSTD_lazy2 }, /* level 8.*/ | |
|
3993 | { 14, 15, 14, 5, 4, 8, ZSTD_btlazy2 }, /* level 9.*/ | |
|
3994 | { 14, 15, 14, 9, 4, 8, ZSTD_btlazy2 }, /* level 10.*/ | |
|
3995 | { 14, 15, 14, 3, 4, 12, ZSTD_btopt }, /* level 11.*/ | |
|
3405 | 3996 | { 14, 15, 14, 6, 3, 16, ZSTD_btopt }, /* level 12.*/ |
|
3406 | 3997 | { 14, 15, 14, 6, 3, 24, ZSTD_btopt }, /* level 13.*/ |
|
3407 | 3998 | { 14, 15, 15, 6, 3, 48, ZSTD_btopt }, /* level 14.*/ |
|
3408 | 3999 | { 14, 15, 15, 6, 3, 64, ZSTD_btopt }, /* level 15.*/ |
|
3409 | 4000 | { 14, 15, 15, 6, 3, 96, ZSTD_btopt }, /* level 16.*/ |
|
3410 | 4001 | { 14, 15, 15, 6, 3,128, ZSTD_btopt }, /* level 17.*/ |
|
3411 | { 14, 15, 15, | |

3412 | { 14, 15, 15, | |

4002 | { 14, 15, 15, 8, 3,256, ZSTD_btopt }, /* level 18.*/ | |
|
4003 | { 14, 15, 15, 6, 3,256, ZSTD_btultra }, /* level 19.*/ | |
|
3413 | 4004 | { 14, 15, 15, 8, 3,256, ZSTD_btultra }, /* level 20.*/ |
|
3414 | 4005 | { 14, 15, 15, 9, 3,256, ZSTD_btultra }, /* level 21.*/ |
|
3415 | { 14, 15, 15, 10, 3, | |

4006 | { 14, 15, 15, 10, 3,512, ZSTD_btultra }, /* level 22.*/ | |
|
3416 | 4007 | }, |
|
3417 | 4008 | }; |
|
3418 | 4009 |
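The four tables are selected by a source-size bucket, then indexed by level. A minimal selection sketch (assumption: this mirrors ZSTD_getCParams(), which this diff does not show; the thresholds come from the table comments above):

    /* 0 = default, 1 = srcSize <= 256 KB, 2 = <= 128 KB, 3 = <= 16 KB */
    static unsigned cParams_tableID(unsigned long long srcSizeHint)
    {
        if (srcSizeHint == 0)          return 0;  /* unknown size: default table */
        if (srcSizeHint <= (16u<<10))  return 3;
        if (srcSizeHint <= (128u<<10)) return 2;
        if (srcSizeHint <= (256u<<10)) return 1;
        return 0;
    }
    /* then: ZSTD_defaultCParameters[cParams_tableID(hint)][clampedLevel] */
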
@@ -27,6 +27,7 b'' | |||
|
27 | 27 | extern "C" { |
|
28 | 28 | #endif |
|
29 | 29 | |
|
30 | ||
|
30 | 31 | /*-************************************* |
|
31 | 32 | * Constants |
|
32 | 33 | ***************************************/ |
@@ -37,7 +38,8 b' extern "C" {' | |||
|
37 | 38 | It's not a big deal though : candidate will just be sorted again. |
|
38 | 39 | Additionnally, candidate position 1 will be lost. |
|
39 | 40 | But candidate 1 cannot hide a large tree of candidates, so it's a minimal loss. |
|
40 | The benefit is that ZSTD_DUBT_UNSORTED_MARK cannot be misdhandled after table re-use with a different strategy | |

41 | The benefit is that ZSTD_DUBT_UNSORTED_MARK cannot be misdhandled after table re-use with a different strategy | |
|
42 | Constant required by ZSTD_compressBlock_btlazy2() and ZSTD_reduceTable_internal() */ | |
|
41 | 43 | |
|
42 | 44 | |
|
43 | 45 | /*-************************************* |
@@ -46,6 +48,12 b' extern "C" {' | |||
|
46 | 48 | typedef enum { ZSTDcs_created=0, ZSTDcs_init, ZSTDcs_ongoing, ZSTDcs_ending } ZSTD_compressionStage_e; |
|
47 | 49 | typedef enum { zcss_init=0, zcss_load, zcss_flush } ZSTD_cStreamStage; |
|
48 | 50 | |
|
51 | typedef enum { | |
|
52 | ZSTD_dictDefaultAttach = 0, | |
|
53 | ZSTD_dictForceAttach = 1, | |
|
54 | ZSTD_dictForceCopy = -1, | |
|
55 | } ZSTD_dictAttachPref_e; | |
|
56 | ||
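ZSTD_dictAttachPref_e is groundwork for choosing between referencing a CDict's match state directly (cheap context reset, via the dictMatchState machinery added below) and copying its tables into the CCtx (slower start, faster search). A sketch of how a decision function might consume it; the real logic lives in ZSTD_resetCCtx_usingCDict(), outside this diff, and the threshold here is purely illustrative:

    static int shouldAttachDict_sketch(ZSTD_dictAttachPref_e pref, size_t dictSize)
    {
        if (pref == ZSTD_dictForceCopy)   return 0;  /* always copy tables */
        if (pref == ZSTD_dictForceAttach) return 1;  /* always reference   */
        return dictSize > (8u << 10);                /* default: attach only large dicts */
    }
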
|
49 | 57 | typedef struct ZSTD_prefixDict_s { |
|
50 | 58 | const void* dict; |
|
51 | 59 | size_t dictSize; |
@@ -53,14 +61,22 b' typedef struct ZSTD_prefixDict_s {' | |||
|
53 | 61 | } ZSTD_prefixDict; |
|
54 | 62 | |
|
55 | 63 | typedef struct { |
|
56 | U32 hufCTable[HUF_CTABLE_SIZE_U32(255)]; | |

64 | U32 CTable[HUF_CTABLE_SIZE_U32(255)]; | |
|
65 | HUF_repeat repeatMode; | |
|
66 | } ZSTD_hufCTables_t; | |
|
67 | ||
|
68 | typedef struct { | |
|
57 | 69 | FSE_CTable offcodeCTable[FSE_CTABLE_SIZE_U32(OffFSELog, MaxOff)]; |
|
58 | 70 | FSE_CTable matchlengthCTable[FSE_CTABLE_SIZE_U32(MLFSELog, MaxML)]; |
|
59 | 71 | FSE_CTable litlengthCTable[FSE_CTABLE_SIZE_U32(LLFSELog, MaxLL)]; |
|
60 | HUF_repeat hufCTable_repeatMode; | |
|
61 | 72 | FSE_repeat offcode_repeatMode; |
|
62 | 73 | FSE_repeat matchlength_repeatMode; |
|
63 | 74 | FSE_repeat litlength_repeatMode; |
|
75 | } ZSTD_fseCTables_t; | |
|
76 | ||
|
77 | typedef struct { | |
|
78 | ZSTD_hufCTables_t huf; | |
|
79 | ZSTD_fseCTables_t fse; | |
|
64 | 80 | } ZSTD_entropyCTables_t; |
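The flat entropy struct is split into a Huffman part (literals) and an FSE part (sequence codes); this is the rename behind every bs->entropy access changed earlier in zstd_compress.c. The field mapping, in brief:

    /* old (flat)                         new (nested)                      */
    /* entropy.hufCTable              ->  entropy.huf.CTable                */
    /* entropy.hufCTable_repeatMode   ->  entropy.huf.repeatMode            */
    /* entropy.offcodeCTable          ->  entropy.fse.offcodeCTable         */
    /* entropy.{offcode,matchlength,litlength}_repeatMode
                                      ->  entropy.fse.*_repeatMode          */
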
|
65 | 81 | |
|
66 | 82 | typedef struct { |
@@ -76,26 +92,27 b' typedef struct {' | |||
|
76 | 92 | U32 rep[ZSTD_REP_NUM]; |
|
77 | 93 | } ZSTD_optimal_t; |
|
78 | 94 | |
|
95 | typedef enum { zop_dynamic=0, zop_predef } ZSTD_OptPrice_e; | |
|
96 | ||
|
79 | 97 | typedef struct { |
|
80 | 98 | /* All tables are allocated inside cctx->workspace by ZSTD_resetCCtx_internal() */ |
|
81 | U32* litFreq; /* table of literals statistics, of size 256 */ | |
|
82 | U32* litLengthFreq; /* table of litLength statistics, of size (MaxLL+1) */ | |
|
83 | U32* matchLengthFreq; /* table of matchLength statistics, of size (MaxML+1) */ | |
|
84 | U32* offCodeFreq; /* table of offCode statistics, of size (MaxOff+1) */ | |
|
85 | ZSTD_match_t* matchTable; /* list of found matches, of size ZSTD_OPT_NUM+1 */ | |
|
86 | ZSTD_optimal_t* priceTable; /* All positions tracked by optimal parser, of size ZSTD_OPT_NUM+1 */ | |
|
99 | U32* litFreq; /* table of literals statistics, of size 256 */ | |
|
100 | U32* litLengthFreq; /* table of litLength statistics, of size (MaxLL+1) */ | |
|
101 | U32* matchLengthFreq; /* table of matchLength statistics, of size (MaxML+1) */ | |
|
102 | U32* offCodeFreq; /* table of offCode statistics, of size (MaxOff+1) */ | |
|
103 | ZSTD_match_t* matchTable; /* list of found matches, of size ZSTD_OPT_NUM+1 */ | |
|
104 | ZSTD_optimal_t* priceTable; /* All positions tracked by optimal parser, of size ZSTD_OPT_NUM+1 */ | |
|
87 | 105 | |
|
88 | 106 | U32 litSum; /* nb of literals */ |
|
89 | 107 | U32 litLengthSum; /* nb of litLength codes */ |
|
90 | 108 | U32 matchLengthSum; /* nb of matchLength codes */ |
|
91 | 109 | U32 offCodeSum; /* nb of offset codes */ |
|
92 | /* begin updated by ZSTD_setLog2Prices */ | |
|
93 | U32 log2litSum; /* pow2 to compare log2(litfreq) to */ | |

94 | U32 log2litLengthSum; /* pow2 to compare log2(llfreq) to */ | |

95 | U32 log2matchLengthSum; /* pow2 to compare log2(mlfreq) to */ | |

96 | U32 log2offCodeSum; /* pow2 to compare log2(offreq) to */ | |
|
97 | /* end : updated by ZSTD_setLog2Prices */ | |
|
98 | U32 staticPrices; /* prices follow a pre-defined cost structure, statistics are irrelevant */ | |
|
110 | U32 litSumBasePrice; /* to compare to log2(litfreq) */ | |
|
111 | U32 litLengthSumBasePrice; /* to compare to log2(llfreq) */ | |
|
112 | U32 matchLengthSumBasePrice;/* to compare to log2(mlfreq) */ | |
|
113 | U32 offCodeSumBasePrice; /* to compare to log2(offreq) */ | |
|
114 | ZSTD_OptPrice_e priceType; /* prices can be determined dynamically, or follow a pre-defined cost structure */ | |
|
115 | const ZSTD_entropyCTables_t* symbolCosts; /* pre-calculated dictionary statistics */ | |
|
99 | 116 | } optState_t; |
|
100 | 117 | |
|
101 | 118 | typedef struct { |
@@ -111,17 +128,20 b' typedef struct {' | |||
|
111 | 128 | U32 lowLimit; /* below that point, no more data */ |
|
112 | 129 | } ZSTD_window_t; |
|
113 | 130 | |
|
114 | typedef struct { | |
|
115 | ZSTD_window_t window; /* State for window round buffer management */ | |
|
116 | U32 loadedDictEnd; /* index of end of dictionary */ | |
|
117 | U32 nextToUpdate; /* index from which to continue table update */ | |
|
118 | U32 nextToUpdate3; /* index from which to continue table update */ | |

119 | U32 hashLog3; /* dispatch table : larger == faster, more memory */ | |
|
131 | typedef struct ZSTD_matchState_t ZSTD_matchState_t; | |
|
132 | struct ZSTD_matchState_t { | |
|
133 | ZSTD_window_t window; /* State for window round buffer management */ | |
|
134 | U32 loadedDictEnd; /* index of end of dictionary */ | |
|
135 | U32 nextToUpdate; /* index from which to continue table update */ | |
|
136 | U32 nextToUpdate3; /* index from which to continue table update */ | |
|
137 | U32 hashLog3; /* dispatch table : larger == faster, more memory */ | |
|
120 | 138 | U32* hashTable; |
|
121 | 139 | U32* hashTable3; |
|
122 | 140 | U32* chainTable; |
|
123 | 141 | optState_t opt; /* optimal parser state */ |
|
124 | } ZSTD_matchState_t; | |
|
142 | const ZSTD_matchState_t *dictMatchState; | |
|
143 | ZSTD_compressionParameters cParams; | |
|
144 | }; | |
|
125 | 145 | |
|
126 | 146 | typedef struct { |
|
127 | 147 | ZSTD_compressedBlockState_t* prevCBlock; |
@@ -161,7 +181,7 b' typedef struct {' | |||
|
161 | 181 | rawSeq* seq; /* The start of the sequences */ |
|
162 | 182 | size_t pos; /* The position where reading stopped. <= size. */ |
|
163 | 183 | size_t size; /* The number of sequences. <= capacity. */ |
|
164 | size_t capacity; /* The capacity | |

184 | size_t capacity; /* The capacity starting from `seq` pointer */ | |
|
165 | 185 | } rawSeqStore_t; |
|
166 | 186 | |
|
167 | 187 | struct ZSTD_CCtx_params_s { |
@@ -170,10 +190,11 b' struct ZSTD_CCtx_params_s {' | |||
|
170 | 190 | ZSTD_frameParameters fParams; |
|
171 | 191 | |
|
172 | 192 | int compressionLevel; |
|
173 | int disableLiteralCompression; | |
|
174 | 193 | int forceWindow; /* force back-references to respect limit of |
|
175 | 194 | * 1<<wLog, even for dictionary */ |
|
176 | 195 | |
|
196 | ZSTD_dictAttachPref_e attachDictPref; | |
|
197 | ||
|
177 | 198 | /* Multithreading: used to pass parameters to mtctx */ |
|
178 | 199 | unsigned nbWorkers; |
|
179 | 200 | unsigned jobSize; |
@@ -193,6 +214,8 b' struct ZSTD_CCtx_s {' | |||
|
193 | 214 | ZSTD_CCtx_params requestedParams; |
|
194 | 215 | ZSTD_CCtx_params appliedParams; |
|
195 | 216 | U32 dictID; |
|
217 | ||
|
218 | int workSpaceOversizedDuration; | |
|
196 | 219 | void* workSpace; |
|
197 | 220 | size_t workSpaceSize; |
|
198 | 221 | size_t blockSize; |
@@ -235,11 +258,15 b' struct ZSTD_CCtx_s {' | |||
|
235 | 258 | #endif |
|
236 | 259 | }; |
|
237 | 260 | |
|
261 | typedef enum { ZSTD_dtlm_fast, ZSTD_dtlm_full } ZSTD_dictTableLoadMethod_e; | |
|
262 | ||
|
263 | typedef enum { ZSTD_noDict = 0, ZSTD_extDict = 1, ZSTD_dictMatchState = 2 } ZSTD_dictMode_e; | |
|
264 | ||
|
238 | 265 | |
|
239 | 266 | typedef size_t (*ZSTD_blockCompressor) ( |
|
240 | 267 | ZSTD_matchState_t* bs, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
241 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); | |

242 | ZSTD_blockCompressor ZSTD_selectBlockCompressor(ZSTD_strategy strat, int extDict); | |

268 | void const* src, size_t srcSize); | |
|
269 | ZSTD_blockCompressor ZSTD_selectBlockCompressor(ZSTD_strategy strat, ZSTD_dictMode_e dictMode); | |
|
243 | 270 | |
|
244 | 271 | |
|
245 | 272 | MEM_STATIC U32 ZSTD_LLcode(U32 litLength) |
@@ -280,16 +307,18 b' MEM_STATIC U32 ZSTD_MLcode(U32 mlBase)' | |||
|
280 | 307 | */ |
|
281 | 308 | MEM_STATIC void ZSTD_storeSeq(seqStore_t* seqStorePtr, size_t litLength, const void* literals, U32 offsetCode, size_t mlBase) |
|
282 | 309 | { |
|
283 | #if defined(ZSTD_DEBUG) && (ZSTD_DEBUG >= 6) | |

310 | #if defined(DEBUGLEVEL) && (DEBUGLEVEL >= 6) | |
|
284 | 311 | static const BYTE* g_start = NULL; |
|
285 | 312 | if (g_start==NULL) g_start = (const BYTE*)literals; /* note : index only works for compression within a single segment */ |
|
286 | 313 | { U32 const pos = (U32)((const BYTE*)literals - g_start); |
|
287 | DEBUGLOG(6, "Cpos%7u :%3u literals, match% | |

314 | DEBUGLOG(6, "Cpos%7u :%3u literals, match%4u bytes at offCode%7u", | |
|
288 | 315 | pos, (U32)litLength, (U32)mlBase+MINMATCH, (U32)offsetCode); |
|
289 | 316 | } |
|
290 | 317 | #endif |
|
318 | assert((size_t)(seqStorePtr->sequences - seqStorePtr->sequencesStart) < seqStorePtr->maxNbSeq); | |
|
291 | 319 | /* copy Literals */ |
|
292 | assert(seqStorePtr-> | |

320 | assert(seqStorePtr->maxNbLit <= 128 KB); | |
|
321 | assert(seqStorePtr->lit + litLength <= seqStorePtr->litStart + seqStorePtr->maxNbLit); | |
|
293 | 322 | ZSTD_wildcopy(seqStorePtr->lit, literals, litLength); |
|
294 | 323 | seqStorePtr->lit += litLength; |
|
295 | 324 | |
@@ -420,6 +449,11 b' ZSTD_count_2segments(const BYTE* ip, con' | |||
|
420 | 449 | const BYTE* const vEnd = MIN( ip + (mEnd - match), iEnd); |
|
421 | 450 | size_t const matchLength = ZSTD_count(ip, match, vEnd); |
|
422 | 451 | if (match + matchLength != mEnd) return matchLength; |
|
452 | DEBUGLOG(7, "ZSTD_count_2segments: found a 2-parts match (current length==%zu)", matchLength); | |
|
453 | DEBUGLOG(7, "distance from match beginning to end dictionary = %zi", mEnd - match); | |
|
454 | DEBUGLOG(7, "distance from current pos to end buffer = %zi", iEnd - ip); | |
|
455 | DEBUGLOG(7, "next byte : ip==%02X, istart==%02X", ip[matchLength], *iStart); | |
|
456 | DEBUGLOG(7, "final match length = %zu", matchLength + ZSTD_count(ip+matchLength, iStart, iEnd)); | |
|
423 | 457 | return matchLength + ZSTD_count(ip+matchLength, iStart, iEnd); |
|
424 | 458 | } |
|
425 | 459 | |
@@ -497,6 +531,20 b' MEM_STATIC U32 ZSTD_window_hasExtDict(ZS' | |||
|
497 | 531 | } |
|
498 | 532 | |
|
499 | 533 | /** |
|
534 | * ZSTD_matchState_dictMode(): | |
|
535 | * Inspects the provided matchState and figures out what dictMode should be | |
|
536 | * passed to the compressor. | |
|
537 | */ | |
|
538 | MEM_STATIC ZSTD_dictMode_e ZSTD_matchState_dictMode(const ZSTD_matchState_t *ms) | |
|
539 | { | |
|
540 | return ZSTD_window_hasExtDict(ms->window) ? | |
|
541 | ZSTD_extDict : | |
|
542 | ms->dictMatchState != NULL ? | |
|
543 | ZSTD_dictMatchState : | |
|
544 | ZSTD_noDict; | |
|
545 | } | |
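ZSTD_matchState_dictMode() replaces the old boolean extDict flag with a three-way mode, matching the re-typed ZSTD_selectBlockCompressor() above. A sketch of the intended pairing (illustrative wrapper, not code from this patch):

    static size_t compressBlock_sketch(ZSTD_matchState_t* ms, seqStore_t* seqStore,
                                       U32 rep[ZSTD_REP_NUM], ZSTD_strategy strat,
                                       void const* src, size_t srcSize)
    {
        ZSTD_blockCompressor const bc =
            ZSTD_selectBlockCompressor(strat, ZSTD_matchState_dictMode(ms));
        return bc(ms, seqStore, rep, src, srcSize);
    }
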
|
546 | ||
|
547 | /** | |
|
500 | 548 | * ZSTD_window_needOverflowCorrection(): |
|
501 | 549 | * Returns non-zero if the indices are getting too large and need overflow |
|
502 | 550 | * protection. |
@@ -563,31 +611,41 b' MEM_STATIC U32 ZSTD_window_correctOverfl' | |||
|
563 | 611 | * ZSTD_window_enforceMaxDist(): |
|
564 | 612 | * Updates lowLimit so that: |
|
565 | 613 | * (srcEnd - base) - lowLimit == maxDist + loadedDictEnd |
|
614 | * | |
|
566 | 615 | * This allows a simple check that index >= lowLimit to see if index is valid. |
|
567 | 616 | * This must be called before a block compression call, with srcEnd as the block |
|
568 | 617 | * source end. |
|
618 | * | |
|
569 | 619 | * If loadedDictEndPtr is not NULL, we set it to zero once we update lowLimit. |
|
570 | 620 | * This is because dictionaries are allowed to be referenced as long as the last |
|
571 | 621 | * byte of the dictionary is in the window, but once they are out of range, |
|
572 | 622 | * they cannot be referenced. If loadedDictEndPtr is NULL, we use |
|
573 | 623 | * loadedDictEnd == 0. |
|
624 | * | |
|
625 | * In normal dict mode, the dict is between lowLimit and dictLimit. In | |
|
626 | * dictMatchState mode, lowLimit and dictLimit are the same, and the dictionary | |
|
627 | * is below them. forceWindow and dictMatchState are therefore incompatible. | |
|
574 | 628 | */ |
|
575 | 629 | MEM_STATIC void ZSTD_window_enforceMaxDist(ZSTD_window_t* window, |
|
576 | 630 | void const* srcEnd, U32 maxDist, |
|
577 | U32* loadedDictEndPtr) | |

631 | U32* loadedDictEndPtr, | |
|
632 | const ZSTD_matchState_t** dictMatchStatePtr) | |
|
578 | 633 | { |
|
579 | 634 | U32 const current = (U32)((BYTE const*)srcEnd - window->base); |
|
580 | 635 | U32 loadedDictEnd = loadedDictEndPtr != NULL ? *loadedDictEndPtr : 0; |
|
636 | DEBUGLOG(5, "ZSTD_window_enforceMaxDist: current=%u, maxDist=%u", current, maxDist); | |
|
581 | 637 | if (current > maxDist + loadedDictEnd) { |
|
582 | 638 | U32 const newLowLimit = current - maxDist; |
|
583 | 639 | if (window->lowLimit < newLowLimit) window->lowLimit = newLowLimit; |
|
584 | 640 | if (window->dictLimit < window->lowLimit) { |
|
585 | DEBUGLOG(5, "Update dictLimit from %u to %u", window->dictLimit, | |

586 | window->lowLimit); | |
|
641 | DEBUGLOG(5, "Update dictLimit to match lowLimit, from %u to %u", | |
|
642 | window->dictLimit, window->lowLimit); | |
|
587 | 643 | window->dictLimit = window->lowLimit; |
|
588 | 644 | } |
|
589 | 645 | if (loadedDictEndPtr) |
|
590 | 646 | *loadedDictEndPtr = 0; |
|
647 | if (dictMatchStatePtr) | |
|
648 | *dictMatchStatePtr = NULL; | |
|
591 | 649 | } |
|
592 | 650 | } |
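A worked example of the invariant this function restores (numbers illustrative): with current == 1000, maxDist == 512 and loadedDictEnd == 0, newLowLimit == 1000 - 512 == 488, so:

    /* lowLimit:  0   -> 488  (indices below 488 are now out of the window) */
    /* dictLimit: 300 -> 488  (pulled up to lowLimit; dictionary dropped)   */
    /* *loadedDictEndPtr = 0; *dictMatchStatePtr = NULL;  (dict unusable)   */
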
|
593 | 651 | |
@@ -603,12 +661,12 b' MEM_STATIC U32 ZSTD_window_update(ZSTD_w' | |||
|
603 | 661 | { |
|
604 | 662 | BYTE const* const ip = (BYTE const*)src; |
|
605 | 663 | U32 contiguous = 1; |
|
664 | DEBUGLOG(5, "ZSTD_window_update"); | |
|
606 | 665 | /* Check if blocks follow each other */ |
|
607 | 666 | if (src != window->nextSrc) { |
|
608 | 667 | /* not contiguous */ |
|
609 | 668 | size_t const distanceFromBase = (size_t)(window->nextSrc - window->base); |
|
610 | DEBUGLOG(5, "Non contiguous blocks, new segment starts at %u", | |
|
611 | window->dictLimit); | |
|
669 | DEBUGLOG(5, "Non contiguous blocks, new segment starts at %u", window->dictLimit); | |
|
612 | 670 | window->lowLimit = window->dictLimit; |
|
613 | 671 | assert(distanceFromBase == (size_t)(U32)distanceFromBase); /* should never overflow */ |
|
614 | 672 | window->dictLimit = (U32)distanceFromBase; |
@@ -625,10 +683,38 b' MEM_STATIC U32 ZSTD_window_update(ZSTD_w' | |||
|
625 | 683 | ptrdiff_t const highInputIdx = (ip + srcSize) - window->dictBase; |
|
626 | 684 | U32 const lowLimitMax = (highInputIdx > (ptrdiff_t)window->dictLimit) ? window->dictLimit : (U32)highInputIdx; |
|
627 | 685 | window->lowLimit = lowLimitMax; |
|
686 | DEBUGLOG(5, "Overlapping extDict and input : new lowLimit = %u", window->lowLimit); | |
|
628 | 687 | } |
|
629 | 688 | return contiguous; |
|
630 | 689 | } |
|
631 | 690 | |
|
691 | ||
|
692 | /* debug functions */ | |
|
693 | ||
|
694 | MEM_STATIC double ZSTD_fWeight(U32 rawStat) | |
|
695 | { | |
|
696 | U32 const fp_accuracy = 8; | |
|
697 | U32 const fp_multiplier = (1 << fp_accuracy); | |
|
698 | U32 const stat = rawStat + 1; | |
|
699 | U32 const hb = ZSTD_highbit32(stat); | |
|
700 | U32 const BWeight = hb * fp_multiplier; | |
|
701 | U32 const FWeight = (stat << fp_accuracy) >> hb; | |
|
702 | U32 const weight = BWeight + FWeight; | |
|
703 | assert(hb + fp_accuracy < 31); | |
|
704 | return (double)weight / fp_multiplier; | |
|
705 | } | |
|
706 | ||
|
707 | MEM_STATIC void ZSTD_debugTable(const U32* table, U32 max) | |
|
708 | { | |
|
709 | unsigned u, sum; | |
|
710 | for (u=0, sum=0; u<=max; u++) sum += table[u]; | |
|
711 | DEBUGLOG(2, "total nb elts: %u", sum); | |
|
712 | for (u=0; u<=max; u++) { | |
|
713 | DEBUGLOG(2, "%2u: %5u (%.2f)", | |
|
714 | u, table[u], ZSTD_fWeight(sum) - ZSTD_fWeight(table[u]) ); | |
|
715 | } | |
|
716 | } | |
|
717 | ||
|
632 | 718 | #if defined (__cplusplus) |
|
633 | 719 | } |
|
634 | 720 | #endif |
@@ -640,7 +726,7 b' MEM_STATIC U32 ZSTD_window_update(ZSTD_w' | |||
|
640 | 726 | * ============================================================== */ |
|
641 | 727 | |
|
642 | 728 | /* ZSTD_getCParamsFromCCtxParams() : |
|
643 | * cParams are built depending on compressionLevel, src size hints, | |

729 | * cParams are built depending on compressionLevel, src size hints, | |
|
644 | 730 | * LDM and manually set compression parameters. |
|
645 | 731 | */ |
|
646 | 732 | ZSTD_compressionParameters ZSTD_getCParamsFromCCtxParams( |
@@ -656,6 +742,8 b' size_t ZSTD_initCStream_internal(ZSTD_CS' | |||
|
656 | 742 | const ZSTD_CDict* cdict, |
|
657 | 743 | ZSTD_CCtx_params params, unsigned long long pledgedSrcSize); |
|
658 | 744 | |
|
745 | void ZSTD_resetSeqStore(seqStore_t* ssPtr); | |
|
746 | ||
|
659 | 747 | /*! ZSTD_compressStream_generic() : |
|
660 | 748 | * Private use only. To be called from zstdmt_compress.c in single-thread mode. */ |
|
661 | 749 | size_t ZSTD_compressStream_generic(ZSTD_CStream* zcs, |
@@ -672,6 +760,7 b' ZSTD_compressionParameters ZSTD_getCPara' | |||
|
672 | 760 | size_t ZSTD_compressBegin_advanced_internal(ZSTD_CCtx* cctx, |
|
673 | 761 | const void* dict, size_t dictSize, |
|
674 | 762 | ZSTD_dictContentType_e dictContentType, |
|
763 | ZSTD_dictTableLoadMethod_e dtlm, | |
|
675 | 764 | const ZSTD_CDict* cdict, |
|
676 | 765 | ZSTD_CCtx_params params, |
|
677 | 766 | unsigned long long pledgedSrcSize); |
@@ -13,9 +13,9 b'' | |||
|
13 | 13 | |
|
14 | 14 | |
|
15 | 15 | void ZSTD_fillDoubleHashTable(ZSTD_matchState_t* ms, |
|
16 | ZSTD_compressionParameters const* cParams, | |
|
17 | void const* end) | |
|
16 | void const* end, ZSTD_dictTableLoadMethod_e dtlm) | |
|
18 | 17 | { |
|
18 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
19 | 19 | U32* const hashLarge = ms->hashTable; |
|
20 | 20 | U32 const hBitsL = cParams->hashLog; |
|
21 | 21 | U32 const mls = cParams->searchLength; |
@@ -40,6 +40,9 b' void ZSTD_fillDoubleHashTable(ZSTD_match' | |||
|
40 | 40 | hashSmall[smHash] = current + i; |
|
41 | 41 | if (i == 0 || hashLarge[lgHash] == 0) |
|
42 | 42 | hashLarge[lgHash] = current + i; |
|
43 | /* Only load extra positions for ZSTD_dtlm_full */ | |
|
44 | if (dtlm == ZSTD_dtlm_fast) | |
|
45 | break; | |
|
43 | 46 | } |
|
44 | 47 | } |
|
45 | 48 | } |
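The early break above is the entire difference between the two load methods: ZSTD_dtlm_fast inserts only the first position of each fill step, while ZSTD_dtlm_full keeps iterating and indexes every position, which is what CDict construction asks for. Schematically (a sketch of the loop's effect, not the literal code):

    for (pos = 0; pos + HASH_READ_SIZE <= end; pos += fastHashFillStep)
        for (i = 0; i < fastHashFillStep; ++i) {
            insertPosition(pos + i);              /* hashSmall/hashLarge update */
            if (dtlm == ZSTD_dtlm_fast) break;    /* fast: one entry per step   */
        }                                         /* full: every position       */
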
@@ -48,9 +51,10 b' void ZSTD_fillDoubleHashTable(ZSTD_match' | |||
|
48 | 51 | FORCE_INLINE_TEMPLATE |
|
49 | 52 | size_t ZSTD_compressBlock_doubleFast_generic( |
|
50 | 53 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
51 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize, | |

52 | U32 const mls /* template */) | |
|
54 | void const* src, size_t srcSize, | |
|
55 | U32 const mls /* template */, ZSTD_dictMode_e const dictMode) | |
|
53 | 56 | { |
|
57 | ZSTD_compressionParameters const* cParams = &ms->cParams; | |
|
54 | 58 | U32* const hashLong = ms->hashTable; |
|
55 | 59 | const U32 hBitsL = cParams->hashLog; |
|
56 | 60 | U32* const hashSmall = ms->chainTable; |
@@ -59,70 +63,188 b' size_t ZSTD_compressBlock_doubleFast_gen' | |||
|
59 | 63 | const BYTE* const istart = (const BYTE*)src; |
|
60 | 64 | const BYTE* ip = istart; |
|
61 | 65 | const BYTE* anchor = istart; |
|
62 | const U32 lowestIndex = ms->window.dictLimit; | |

63 | const BYTE* const lowest = base + lowestIndex; | |

66 | const U32 prefixLowestIndex = ms->window.dictLimit; | |
|
67 | const BYTE* const prefixLowest = base + prefixLowestIndex; | |
|
64 | 68 | const BYTE* const iend = istart + srcSize; |
|
65 | 69 | const BYTE* const ilimit = iend - HASH_READ_SIZE; |
|
66 | 70 | U32 offset_1=rep[0], offset_2=rep[1]; |
|
67 | 71 | U32 offsetSaved = 0; |
|
68 | 72 | |
|
73 | const ZSTD_matchState_t* const dms = ms->dictMatchState; | |
|
74 | const ZSTD_compressionParameters* const dictCParams = | |
|
75 | dictMode == ZSTD_dictMatchState ? | |
|
76 | &dms->cParams : NULL; | |
|
77 | const U32* const dictHashLong = dictMode == ZSTD_dictMatchState ? | |
|
78 | dms->hashTable : NULL; | |
|
79 | const U32* const dictHashSmall = dictMode == ZSTD_dictMatchState ? | |
|
80 | dms->chainTable : NULL; | |
|
81 | const U32 dictStartIndex = dictMode == ZSTD_dictMatchState ? | |
|
82 | dms->window.dictLimit : 0; | |
|
83 | const BYTE* const dictBase = dictMode == ZSTD_dictMatchState ? | |
|
84 | dms->window.base : NULL; | |
|
85 | const BYTE* const dictStart = dictMode == ZSTD_dictMatchState ? | |
|
86 | dictBase + dictStartIndex : NULL; | |
|
87 | const BYTE* const dictEnd = dictMode == ZSTD_dictMatchState ? | |
|
88 | dms->window.nextSrc : NULL; | |
|
89 | const U32 dictIndexDelta = dictMode == ZSTD_dictMatchState ? | |
|
90 | prefixLowestIndex - (U32)(dictEnd - dictBase) : | |
|
91 | 0; | |
|
92 | const U32 dictHBitsL = dictMode == ZSTD_dictMatchState ? | |
|
93 | dictCParams->hashLog : hBitsL; | |
|
94 | const U32 dictHBitsS = dictMode == ZSTD_dictMatchState ? | |
|
95 | dictCParams->chainLog : hBitsS; | |
|
96 | const U32 dictAndPrefixLength = (U32)(ip - prefixLowest + dictEnd - dictStart); | |
|
97 | ||
|
98 | assert(dictMode == ZSTD_noDict || dictMode == ZSTD_dictMatchState); | |
|
99 | ||
|
69 | 100 | /* init */ |
|
70 | ip += (ip==lowest); | |
|
71 | { U32 const maxRep = (U32)(ip-lowest); | |
|
101 | ip += (dictAndPrefixLength == 0); | |
|
102 | if (dictMode == ZSTD_noDict) { | |
|
103 | U32 const maxRep = (U32)(ip - prefixLowest); | |
|
72 | 104 | if (offset_2 > maxRep) offsetSaved = offset_2, offset_2 = 0; |
|
73 | 105 | if (offset_1 > maxRep) offsetSaved = offset_1, offset_1 = 0; |
|
74 | 106 | } |
|
107 | if (dictMode == ZSTD_dictMatchState) { | |
|
108 | /* dictMatchState repCode checks don't currently handle repCode == 0 | |
|
109 | * disabling. */ | |
|
110 | assert(offset_1 <= dictAndPrefixLength); | |
|
111 | assert(offset_2 <= dictAndPrefixLength); | |
|
112 | } | |
|
75 | 113 | |
|
76 | 114 | /* Main Search Loop */ |
|
77 | 115 | while (ip < ilimit) { /* < instead of <=, because repcode check at (ip+1) */ |
|
78 | 116 | size_t mLength; |
|
117 | U32 offset; | |
|
79 | 118 | size_t const h2 = ZSTD_hashPtr(ip, hBitsL, 8); |
|
80 | 119 | size_t const h = ZSTD_hashPtr(ip, hBitsS, mls); |
|
120 | size_t const dictHL = ZSTD_hashPtr(ip, dictHBitsL, 8); | |
|
121 | size_t const dictHS = ZSTD_hashPtr(ip, dictHBitsS, mls); | |
|
81 | 122 | U32 const current = (U32)(ip-base); |
|
82 | 123 | U32 const matchIndexL = hashLong[h2]; |
|
83 | U32 const matchIndexS = hashSmall[h]; | |

124 | U32 matchIndexS = hashSmall[h]; | |
|
84 | 125 | const BYTE* matchLong = base + matchIndexL; |
|
85 | 126 | const BYTE* match = base + matchIndexS; |
|
127 | const U32 repIndex = current + 1 - offset_1; | |
|
128 | const BYTE* repMatch = (dictMode == ZSTD_dictMatchState | |
|
129 | && repIndex < prefixLowestIndex) ? | |
|
130 | dictBase + (repIndex - dictIndexDelta) : | |
|
131 | base + repIndex; | |
|
86 | 132 | hashLong[h2] = hashSmall[h] = current; /* update hash tables */ |
|
87 | 133 | |
|
88 | assert(offset_1 <= current); /* supposed guaranteed by construction */ | |
|
89 | if ((offset_1 > 0) & (MEM_read32(ip+1-offset_1) == MEM_read32(ip+1))) { | |
|
90 | /* favor repcode */ | |
|
134 | /* check dictMatchState repcode */ | |
|
135 | if (dictMode == ZSTD_dictMatchState | |
|
136 | && ((U32)((prefixLowestIndex-1) - repIndex) >= 3 /* intentional underflow */) | |
|
137 | && (MEM_read32(repMatch) == MEM_read32(ip+1)) ) { | |
|
138 | const BYTE* repMatchEnd = repIndex < prefixLowestIndex ? dictEnd : iend; | |
|
139 | mLength = ZSTD_count_2segments(ip+1+4, repMatch+4, iend, repMatchEnd, prefixLowest) + 4; | |
|
140 | ip++; | |
|
141 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, 0, mLength-MINMATCH); | |
|
142 | goto _match_stored; | |
|
143 | } | |
|
144 | ||
|
145 | /* check noDict repcode */ | |
|
146 | if ( dictMode == ZSTD_noDict | |
|
147 | && ((offset_1 > 0) & (MEM_read32(ip+1-offset_1) == MEM_read32(ip+1)))) { | |
|
91 | 148 | mLength = ZSTD_count(ip+1+4, ip+1+4-offset_1, iend) + 4; |
|
92 | 149 | ip++; |
|
93 | 150 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, 0, mLength-MINMATCH); |
|
94 | } else { | |
|
95 | U32 offset; | |
|
96 | if ( (matchIndexL > lowestIndex) && (MEM_read64(matchLong) == MEM_read64(ip)) ) { | |
|
151 | goto _match_stored; | |
|
152 | } | |
|
153 | ||
|
154 | if (matchIndexL > prefixLowestIndex) { | |
|
155 | /* check prefix long match */ | |
|
156 | if (MEM_read64(matchLong) == MEM_read64(ip)) { | |
|
97 | 157 | mLength = ZSTD_count(ip+8, matchLong+8, iend) + 8; |
|
98 | 158 | offset = (U32)(ip-matchLong); |
|
99 | while (((ip>anchor) & (matchLong>lowest)) && (ip[-1] == matchLong[-1])) { ip--; matchLong--; mLength++; } /* catch up */ | |
|
100 | } else if ( (matchIndexS > lowestIndex) && (MEM_read32(match) == MEM_read32(ip)) ) { | |
|
101 | size_t const hl3 = ZSTD_hashPtr(ip+1, hBitsL, 8); | |
|
102 | U32 const matchIndexL3 = hashLong[hl3]; | |
|
103 | const BYTE* matchL3 = base + matchIndexL3; | |
|
104 | hashLong[hl3] = current + 1; | |
|
105 | if ( (matchIndexL3 > lowestIndex) && (MEM_read64(matchL3) == MEM_read64(ip+1)) ) { | |
|
159 | while (((ip>anchor) & (matchLong>prefixLowest)) && (ip[-1] == matchLong[-1])) { ip--; matchLong--; mLength++; } /* catch up */ | |
|
160 | goto _match_found; | |
|
161 | } | |
|
162 | } else if (dictMode == ZSTD_dictMatchState) { | |
|
163 | /* check dictMatchState long match */ | |
|
164 | U32 const dictMatchIndexL = dictHashLong[dictHL]; | |
|
165 | const BYTE* dictMatchL = dictBase + dictMatchIndexL; | |
|
166 | assert(dictMatchL < dictEnd); | |
|
167 | ||
|
168 | if (dictMatchL > dictStart && MEM_read64(dictMatchL) == MEM_read64(ip)) { | |
|
169 | mLength = ZSTD_count_2segments(ip+8, dictMatchL+8, iend, dictEnd, prefixLowest) + 8; | |
|
170 | offset = (U32)(current - dictMatchIndexL - dictIndexDelta); | |
|
171 | while (((ip>anchor) & (dictMatchL>dictStart)) && (ip[-1] == dictMatchL[-1])) { ip--; dictMatchL--; mLength++; } /* catch up */ | |
|
172 | goto _match_found; | |
|
173 | } | |
|
174 | } | |
|
175 | ||
|
176 | if (matchIndexS > prefixLowestIndex) { | |
|
177 | /* check prefix short match */ | |
|
178 | if (MEM_read32(match) == MEM_read32(ip)) { | |
|
179 | goto _search_next_long; | |
|
180 | } | |
|
181 | } else if (dictMode == ZSTD_dictMatchState) { | |
|
182 | /* check dictMatchState short match */ | |
|
183 | U32 const dictMatchIndexS = dictHashSmall[dictHS]; | |
|
184 | match = dictBase + dictMatchIndexS; | |
|
185 | matchIndexS = dictMatchIndexS + dictIndexDelta; | |
|
186 | ||
|
187 | if (match > dictStart && MEM_read32(match) == MEM_read32(ip)) { | |
|
188 | goto _search_next_long; | |
|
189 | } | |
|
190 | } | |
|
191 | ||
|
192 | ip += ((ip-anchor) >> kSearchStrength) + 1; | |
|
193 | continue; | |
|
194 | ||
|
195 | _search_next_long: | |
|
196 | ||
|
197 | { | |
|
198 | size_t const hl3 = ZSTD_hashPtr(ip+1, hBitsL, 8); | |
|
199 | size_t const dictHLNext = ZSTD_hashPtr(ip+1, dictHBitsL, 8); | |
|
200 | U32 const matchIndexL3 = hashLong[hl3]; | |
|
201 | const BYTE* matchL3 = base + matchIndexL3; | |
|
202 | hashLong[hl3] = current + 1; | |
|
203 | ||
|
204 | /* check prefix long +1 match */ | |
|
205 | if (matchIndexL3 > prefixLowestIndex) { | |
|
206 | if (MEM_read64(matchL3) == MEM_read64(ip+1)) { | |
|
106 | 207 | mLength = ZSTD_count(ip+9, matchL3+8, iend) + 8; |
|
107 | 208 | ip++; |
|
108 | 209 | offset = (U32)(ip-matchL3); |
|
109 | while (((ip>anchor) & (matchL3>lowest)) && (ip[-1] == matchL3[-1])) { ip--; matchL3--; mLength++; } /* catch up */ | |
|
110 | } else { | |
|
111 | mLength = ZSTD_count(ip+4, match+4, iend) + 4; | |
|
112 | offset = (U32)(ip-match); | |
|
113 | while (((ip>anchor) & (match>lowest)) && (ip[-1] == match[-1])) { ip--; match--; mLength++; } /* catch up */ | |
|
210 | while (((ip>anchor) & (matchL3>prefixLowest)) && (ip[-1] == matchL3[-1])) { ip--; matchL3--; mLength++; } /* catch up */ | |
|
211 | goto _match_found; | |
|
114 | 212 | } |
|
115 | } else { | |
|
116 | ip += ((ip-anchor) >> kSearchStrength) + 1; | |
|
117 | continue; | |
|
213 | } else if (dictMode == ZSTD_dictMatchState) { | |
|
214 | /* check dict long +1 match */ | |
|
215 | U32 const dictMatchIndexL3 = dictHashLong[dictHLNext]; | |
|
216 | const BYTE* dictMatchL3 = dictBase + dictMatchIndexL3; | |
|
217 | assert(dictMatchL3 < dictEnd); | |
|
218 | if (dictMatchL3 > dictStart && MEM_read64(dictMatchL3) == MEM_read64(ip+1)) { | |
|
219 | mLength = ZSTD_count_2segments(ip+1+8, dictMatchL3+8, iend, dictEnd, prefixLowest) + 8; | |
|
220 | ip++; | |
|
221 | offset = (U32)(current + 1 - dictMatchIndexL3 - dictIndexDelta); | |
|
222 | while (((ip>anchor) & (dictMatchL3>dictStart)) && (ip[-1] == dictMatchL3[-1])) { ip--; dictMatchL3--; mLength++; } /* catch up */ | |
|
223 | goto _match_found; | |
|
224 | } | |
|
118 | 225 | } |
|
119 | ||
|
120 | offset_2 = offset_1; | |
|
121 | offset_1 = offset; | |
|
122 | ||
|
123 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, offset + ZSTD_REP_MOVE, mLength-MINMATCH); | |
|
124 | 226 | } |
|
125 | 227 | |
|
228 | /* if no long +1 match, explore the short match we found */ | |
|
229 | if (dictMode == ZSTD_dictMatchState && matchIndexS < prefixLowestIndex) { | |
|
230 | mLength = ZSTD_count_2segments(ip+4, match+4, iend, dictEnd, prefixLowest) + 4; | |
|
231 | offset = (U32)(current - matchIndexS); | |
|
232 | while (((ip>anchor) & (match>dictStart)) && (ip[-1] == match[-1])) { ip--; match--; mLength++; } /* catch up */ | |
|
233 | } else { | |
|
234 | mLength = ZSTD_count(ip+4, match+4, iend) + 4; | |
|
235 | offset = (U32)(ip - match); | |
|
236 | while (((ip>anchor) & (match>prefixLowest)) && (ip[-1] == match[-1])) { ip--; match--; mLength++; } /* catch up */ | |
|
237 | } | |
|
238 | ||
|
239 | /* fall-through */ | |
|
240 | ||
|
241 | _match_found: | |
|
242 | offset_2 = offset_1; | |
|
243 | offset_1 = offset; | |
|
244 | ||
|
245 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, offset + ZSTD_REP_MOVE, mLength-MINMATCH); | |
|
246 | ||
|
247 | _match_stored: | |
|
126 | 248 | /* match found */ |
|
127 | 249 | ip += mLength; |
|
128 | 250 | anchor = ip; |
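The hunk above is the heart of the double-fast search loop. As background, the strategy keeps two hash tables over the same window: a long-range table keyed on 8-byte reads and a short one keyed on mls-byte reads, with the long candidate tried first. A hedged, self-contained sketch of that core idea (toy hash constants and table sizes, not zstd's real ones; position 0 doubles as "empty" here, which the sketch simply skips):

    #include <stdint.h>
    #include <string.h>
    #include <stdio.h>

    #define HLOG_LONG  10
    #define HLOG_SHORT 10

    static uint64_t read64(const uint8_t* p) { uint64_t v; memcpy(&v, p, 8); return v; }
    static uint32_t read32(const uint8_t* p) { uint32_t v; memcpy(&v, p, 4); return v; }

    /* toy multiplicative hashes; zstd uses tuned prime constants */
    static uint32_t hash8(const uint8_t* p, int bits) { return (uint32_t)((read64(p) * 0x9E3779B185EBCA87ULL) >> (64 - bits)); }
    static uint32_t hash4(const uint8_t* p, int bits) { return (read32(p) * 2654435761U) >> (32 - bits); }

    int main(void) {
        static const uint8_t src[] = "XXabcdefgh--abcdefgh";
        uint32_t tblLong[1 << HLOG_LONG] = {0};
        uint32_t tblShort[1 << HLOG_SHORT] = {0};
        size_t n = sizeof(src) - 1;
        for (size_t i = 0; i + 8 <= n; i++) {
            uint32_t hL = hash8(src + i, HLOG_LONG);
            uint32_t hS = hash4(src + i, HLOG_SHORT);
            uint32_t candL = tblLong[hL], candS = tblShort[hS];
            /* prefer the long-table candidate: an 8-byte agreement almost
             * always yields a longer match than a 4-byte one */
            if (candL && read64(src + candL) == read64(src + i))
                printf("pos %zu: long match with pos %u\n", i, candL);
            else if (candS && read32(src + candS) == read32(src + i))
                printf("pos %zu: short match with pos %u\n", i, candS);
            tblLong[hL] = tblShort[hS] = (uint32_t)i;  /* update both tables */
        }
        return 0;
    }

Run on the toy input, this reports the 8-byte repeat at position 12 against position 2, the same shape of hit the real loop turns into a stored sequence.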
@@ -135,19 +257,44 @@ size_t ZSTD_compressBlock_doubleFast_gen
|
135 | 257 | hashSmall[ZSTD_hashPtr(ip-2, hBitsS, mls)] = (U32)(ip-2-base); |
|
136 | 258 | |
|
137 | 259 | /* check immediate repcode */ |
|
138 | while ( (ip <= ilimit) | |
|
139 | && ( (offset_2>0) | |
|
140 | & (MEM_read32(ip) == MEM_read32(ip - offset_2)) )) { | |
|
141 | /* store sequence */ | |
|
142 | size_t const rLength = ZSTD_count(ip+4, ip+4-offset_2, iend) + 4; | |
|
143 | { U32 const tmpOff = offset_2; offset_2 = offset_1; offset_1 = tmpOff; } /* swap offset_2 <=> offset_1 */ | |
|
144 | hashSmall[ZSTD_hashPtr(ip, hBitsS, mls)] = (U32)(ip-base); | |
|
145 | hashLong[ZSTD_hashPtr(ip, hBitsL, 8)] = (U32)(ip-base); | |
|
146 | ZSTD_storeSeq(seqStore, 0, anchor, 0, rLength-MINMATCH); | |
|
147 | ip += rLength; | |
|
148 | anchor = ip; | |
|
149 | continue; /* faster when present ... (?) */ | |
|
150 | } } } | |
|
260 | if (dictMode == ZSTD_dictMatchState) { | |
|
261 | while (ip <= ilimit) { | |
|
262 | U32 const current2 = (U32)(ip-base); | |
|
263 | U32 const repIndex2 = current2 - offset_2; | |
|
264 | const BYTE* repMatch2 = dictMode == ZSTD_dictMatchState | |
|
265 | && repIndex2 < prefixLowestIndex ? | |
|
266 | dictBase - dictIndexDelta + repIndex2 : | |
|
267 | base + repIndex2; | |
|
268 | if ( ((U32)((prefixLowestIndex-1) - (U32)repIndex2) >= 3 /* intentional overflow */) | |
|
269 | && (MEM_read32(repMatch2) == MEM_read32(ip)) ) { | |
|
270 | const BYTE* const repEnd2 = repIndex2 < prefixLowestIndex ? dictEnd : iend; | |
|
271 | size_t const repLength2 = ZSTD_count_2segments(ip+4, repMatch2+4, iend, repEnd2, prefixLowest) + 4; | |
|
272 | U32 tmpOffset = offset_2; offset_2 = offset_1; offset_1 = tmpOffset; /* swap offset_2 <=> offset_1 */ | |
|
273 | ZSTD_storeSeq(seqStore, 0, anchor, 0, repLength2-MINMATCH); | |
|
274 | hashSmall[ZSTD_hashPtr(ip, hBitsS, mls)] = current2; | |
|
275 | hashLong[ZSTD_hashPtr(ip, hBitsL, 8)] = current2; | |
|
276 | ip += repLength2; | |
|
277 | anchor = ip; | |
|
278 | continue; | |
|
279 | } | |
|
280 | break; | |
|
281 | } | |
|
282 | } | |
|
283 | ||
|
284 | if (dictMode == ZSTD_noDict) { | |
|
285 | while ( (ip <= ilimit) | |
|
286 | && ( (offset_2>0) | |
|
287 | & (MEM_read32(ip) == MEM_read32(ip - offset_2)) )) { | |
|
288 | /* store sequence */ | |
|
289 | size_t const rLength = ZSTD_count(ip+4, ip+4-offset_2, iend) + 4; | |
|
290 | U32 const tmpOff = offset_2; offset_2 = offset_1; offset_1 = tmpOff; /* swap offset_2 <=> offset_1 */ | |
|
291 | hashSmall[ZSTD_hashPtr(ip, hBitsS, mls)] = (U32)(ip-base); | |
|
292 | hashLong[ZSTD_hashPtr(ip, hBitsL, 8)] = (U32)(ip-base); | |
|
293 | ZSTD_storeSeq(seqStore, 0, anchor, 0, rLength-MINMATCH); | |
|
294 | ip += rLength; | |
|
295 | anchor = ip; | |
|
296 | continue; /* faster when present ... (?) */ | |
|
297 | } } } } | |
|
151 | 298 | |
|
152 | 299 | /* save reps for next block */ |
|
153 | 300 | rep[0] = offset_1 ? offset_1 : offsetSaved; |
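A note on the `(U32)((prefixLowestIndex-1) - repIndex) >= 3` guard used by the repcode paths above: the unsigned subtraction is allowed to wrap, so one comparison rejects exactly the three indices whose 4-byte read would straddle the dictionary/prefix boundary, while accepting candidates on either side. A minimal demonstration with invented constants:

    #include <stdint.h>
    #include <stdio.h>

    int main(void) {
        const uint32_t prefixStartIndex = 100;
        for (uint32_t repIndex = 94; repIndex <= 103; repIndex++) {
            /* relies on well-defined unsigned wraparound: repIndex values at
             * or above prefixStartIndex underflow to a huge number and pass */
            int ok = (uint32_t)((prefixStartIndex - 1) - repIndex) >= 3;
            printf("repIndex=%3u -> %s\n", repIndex,
                   ok ? "usable" : "straddles boundary, rejected");
        }
        /* prints "rejected" exactly for repIndex 97, 98, 99 */
        return 0;
    }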
@@ -160,102 +307,126 @@ size_t ZSTD_compressBlock_doubleFast_gen
|
160 | 307 | |
|
161 | 308 | size_t ZSTD_compressBlock_doubleFast( |
|
162 | 309 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
163 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize) | |
|
310 | void const* src, size_t srcSize) | |
|
164 | 311 | { |
|
165 | const U32 mls = cParams->searchLength; | |
|
312 | const U32 mls = ms->cParams.searchLength; | |
|
166 | 313 | switch(mls) |
|
167 | 314 | { |
|
168 | 315 | default: /* includes case 3 */ |
|
169 | 316 | case 4 : |
|
170 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, cParams, src, srcSize, 4); | |
|
317 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, src, srcSize, 4, ZSTD_noDict); | |
|
171 | 318 | case 5 : |
|
172 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, cParams, src, srcSize, 5); | |
|
319 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, src, srcSize, 5, ZSTD_noDict); | |
|
173 | 320 | case 6 : |
|
174 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, cParams, src, srcSize, 6); | |
|
321 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, src, srcSize, 6, ZSTD_noDict); | |
|
175 | 322 | case 7 : |
|
176 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, cParams, src, srcSize, 7); | |
|
323 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, src, srcSize, 7, ZSTD_noDict); | |
|
324 | } | |
|
325 | } | |
|
326 | ||
|
327 | ||
|
328 | size_t ZSTD_compressBlock_doubleFast_dictMatchState( | |
|
329 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
330 | void const* src, size_t srcSize) | |
|
331 | { | |
|
332 | const U32 mls = ms->cParams.searchLength; | |
|
333 | switch(mls) | |
|
334 | { | |
|
335 | default: /* includes case 3 */ | |
|
336 | case 4 : | |
|
337 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, src, srcSize, 4, ZSTD_dictMatchState); | |
|
338 | case 5 : | |
|
339 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, src, srcSize, 5, ZSTD_dictMatchState); | |
|
340 | case 6 : | |
|
341 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, src, srcSize, 6, ZSTD_dictMatchState); | |
|
342 | case 7 : | |
|
343 | return ZSTD_compressBlock_doubleFast_generic(ms, seqStore, rep, src, srcSize, 7, ZSTD_dictMatchState); | |
|
177 | 344 | } |
|
178 | 345 | } |
|
179 | 346 | |
|
180 | 347 | |
|
181 | 348 | static size_t ZSTD_compressBlock_doubleFast_extDict_generic( |
|
182 | 349 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
183 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize, | |
|
350 | void const* src, size_t srcSize, | |
|
184 | 351 | U32 const mls /* template */) |
|
185 | 352 | { |
|
353 | ZSTD_compressionParameters const* cParams = &ms->cParams; | |
|
186 | 354 | U32* const hashLong = ms->hashTable; |
|
187 | 355 | U32 const hBitsL = cParams->hashLog; |
|
188 | 356 | U32* const hashSmall = ms->chainTable; |
|
189 | 357 | U32 const hBitsS = cParams->chainLog; |
|
190 | const BYTE* const base = ms->window.base; | |
|
191 | const BYTE* const dictBase = ms->window.dictBase; | |
|
192 | 358 | const BYTE* const istart = (const BYTE*)src; |
|
193 | 359 | const BYTE* ip = istart; |
|
194 | 360 | const BYTE* anchor = istart; |
|
195 | const U32 lowestIndex = ms->window.lowLimit; | |
|
196 | const BYTE* const dictStart = dictBase + lowestIndex; | |
|
197 | const U32 dictLimit = ms->window.dictLimit; | |
|
198 | const BYTE* const lowPrefixPtr = base + dictLimit; | |
|
199 | const BYTE* const dictEnd = dictBase + dictLimit; | |
|
200 | 361 | const BYTE* const iend = istart + srcSize; |
|
201 | 362 | const BYTE* const ilimit = iend - 8; |
|
363 | const U32 prefixStartIndex = ms->window.dictLimit; | |
|
364 | const BYTE* const base = ms->window.base; | |
|
365 | const BYTE* const prefixStart = base + prefixStartIndex; | |
|
366 | const U32 dictStartIndex = ms->window.lowLimit; | |
|
367 | const BYTE* const dictBase = ms->window.dictBase; | |
|
368 | const BYTE* const dictStart = dictBase + dictStartIndex; | |
|
369 | const BYTE* const dictEnd = dictBase + prefixStartIndex; | |
|
202 | 370 | U32 offset_1=rep[0], offset_2=rep[1]; |
|
203 | 371 | |
|
372 | DEBUGLOG(5, "ZSTD_compressBlock_doubleFast_extDict_generic (srcSize=%zu)", srcSize); | |
|
373 | ||
|
204 | 374 | /* Search Loop */ |
|
205 | 375 | while (ip < ilimit) { /* < instead of <=, because (ip+1) */ |
|
206 | 376 | const size_t hSmall = ZSTD_hashPtr(ip, hBitsS, mls); |
|
207 | 377 | const U32 matchIndex = hashSmall[hSmall]; |
|
208 | const BYTE* matchBase = matchIndex < dictLimit ? dictBase : base; | |
|
378 | const BYTE* const matchBase = matchIndex < prefixStartIndex ? dictBase : base; | |
|
209 | 379 | const BYTE* match = matchBase + matchIndex; |
|
210 | 380 | |
|
211 | 381 | const size_t hLong = ZSTD_hashPtr(ip, hBitsL, 8); |
|
212 | 382 | const U32 matchLongIndex = hashLong[hLong]; |
|
213 | const BYTE* matchLongBase = matchLongIndex < dictLimit ? dictBase : base; | |
|
383 | const BYTE* const matchLongBase = matchLongIndex < prefixStartIndex ? dictBase : base; | |
|
214 | 384 | const BYTE* matchLong = matchLongBase + matchLongIndex; |
|
215 | 385 | |
|
216 | 386 | const U32 current = (U32)(ip-base); |
|
217 | 387 | const U32 repIndex = current + 1 - offset_1; /* offset_1 expected <= current +1 */ |
|
218 | const BYTE* repBase = repIndex < dictLimit ? dictBase : base; | |
|
219 | const BYTE* repMatch = repBase + repIndex; | |
|
388 | const BYTE* const repBase = repIndex < prefixStartIndex ? dictBase : base; | |
|
389 | const BYTE* const repMatch = repBase + repIndex; | |
|
220 | 390 | size_t mLength; |
|
221 | 391 | hashSmall[hSmall] = hashLong[hLong] = current; /* update hash table */ |
|
222 | 392 | |
|
223 | if ( (((U32)((dictLimit-1) - repIndex) >= 3) /* intentional underflow */ & (repIndex > lowestIndex)) | |
|
224 | && (MEM_read32(repMatch) == MEM_read32(ip+1)) ) { | |
|
225 | const BYTE* repMatchEnd = repIndex < dictLimit ? dictEnd : iend; | |
|
226 | mLength = ZSTD_count_2segments(ip+1+4, repMatch+4, iend, repMatchEnd, lowPrefixPtr) + 4; | |
|
393 | if ((((U32)((prefixStartIndex-1) - repIndex) >= 3) /* intentional underflow : ensure repIndex doesn't overlap dict + prefix */ | |
|
394 | & (repIndex > dictStartIndex)) | |
|
395 | && (MEM_read32(repMatch) == MEM_read32(ip+1)) ) { | |
|
396 | const BYTE* repMatchEnd = repIndex < prefixStartIndex ? dictEnd : iend; | |
|
397 | mLength = ZSTD_count_2segments(ip+1+4, repMatch+4, iend, repMatchEnd, prefixStart) + 4; | |
|
227 | 398 | ip++; |
|
228 | 399 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, 0, mLength-MINMATCH); |
|
229 | 400 | } else { |
|
230 | if ((matchLongIndex > lowestIndex) && (MEM_read64(matchLong) == MEM_read64(ip))) { | |
|
231 | const BYTE* matchEnd = matchLongIndex < dictLimit ? dictEnd : iend; | |
|
232 | const BYTE* lowMatchPtr = matchLongIndex < dictLimit ? dictStart : lowPrefixPtr; | |
|
401 | if ((matchLongIndex > dictStartIndex) && (MEM_read64(matchLong) == MEM_read64(ip))) { | |
|
402 | const BYTE* const matchEnd = matchLongIndex < prefixStartIndex ? dictEnd : iend; | |
|
403 | const BYTE* const lowMatchPtr = matchLongIndex < prefixStartIndex ? dictStart : prefixStart; | |
|
233 | 404 | U32 offset; |
|
234 | mLength = ZSTD_count_2segments(ip+8, matchLong+8, iend, matchEnd, lowPrefixPtr) + 8; | |
|
405 | mLength = ZSTD_count_2segments(ip+8, matchLong+8, iend, matchEnd, prefixStart) + 8; | |
|
235 | 406 | offset = current - matchLongIndex; |
|
236 | 407 | while (((ip>anchor) & (matchLong>lowMatchPtr)) && (ip[-1] == matchLong[-1])) { ip--; matchLong--; mLength++; } /* catch up */ |
|
237 | 408 | offset_2 = offset_1; |
|
238 | 409 | offset_1 = offset; |
|
239 | 410 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, offset + ZSTD_REP_MOVE, mLength-MINMATCH); |
|
240 | 411 | |
|
241 | } else if ((matchIndex > lowestIndex) && (MEM_read32(match) == MEM_read32(ip))) { | |
|
412 | } else if ((matchIndex > dictStartIndex) && (MEM_read32(match) == MEM_read32(ip))) { | |
|
242 | 413 | size_t const h3 = ZSTD_hashPtr(ip+1, hBitsL, 8); |
|
243 | 414 | U32 const matchIndex3 = hashLong[h3]; |
|
244 | const BYTE* const match3Base = matchIndex3 < dictLimit ? dictBase : base; | |
|
415 | const BYTE* const match3Base = matchIndex3 < prefixStartIndex ? dictBase : base; | |
|
245 | 416 | const BYTE* match3 = match3Base + matchIndex3; |
|
246 | 417 | U32 offset; |
|
247 | 418 | hashLong[h3] = current + 1; |
|
248 | if ( (matchIndex3 > lowestIndex) && (MEM_read64(match3) == MEM_read64(ip+1)) ) { | |
|
249 | const BYTE* matchEnd = matchIndex3 < dictLimit ? dictEnd : iend; | |
|
250 | const BYTE* lowMatchPtr = matchIndex3 < dictLimit ? dictStart : lowPrefixPtr; | |
|
251 | mLength = ZSTD_count_2segments(ip+9, match3+8, iend, matchEnd, lowPrefixPtr) + 8; | |
|
419 | if ( (matchIndex3 > dictStartIndex) && (MEM_read64(match3) == MEM_read64(ip+1)) ) { | |
|
420 | const BYTE* const matchEnd = matchIndex3 < prefixStartIndex ? dictEnd : iend; | |
|
421 | const BYTE* const lowMatchPtr = matchIndex3 < prefixStartIndex ? dictStart : prefixStart; | |
|
422 | mLength = ZSTD_count_2segments(ip+9, match3+8, iend, matchEnd, prefixStart) + 8; | |
|
252 | 423 | ip++; |
|
253 | 424 | offset = current+1 - matchIndex3; |
|
254 | 425 | while (((ip>anchor) & (match3>lowMatchPtr)) && (ip[-1] == match3[-1])) { ip--; match3--; mLength++; } /* catch up */ |
|
255 | 426 | } else { |
|
256 | const BYTE* matchEnd = matchIndex < dictLimit ? dictEnd : iend; | |
|
257 | const BYTE* lowMatchPtr = matchIndex < dictLimit ? dictStart : lowPrefixPtr; | |
|
258 | mLength = ZSTD_count_2segments(ip+4, match+4, iend, matchEnd, lowPrefixPtr) + 4; | |
|
427 | const BYTE* const matchEnd = matchIndex < prefixStartIndex ? dictEnd : iend; | |
|
428 | const BYTE* const lowMatchPtr = matchIndex < prefixStartIndex ? dictStart : prefixStart; | |
|
429 | mLength = ZSTD_count_2segments(ip+4, match+4, iend, matchEnd, prefixStart) + 4; | |
|
259 | 430 | offset = current - matchIndex; |
|
260 | 431 | while (((ip>anchor) & (match>lowMatchPtr)) && (ip[-1] == match[-1])) { ip--; match--; mLength++; } /* catch up */ |
|
261 | 432 | } |
@@ -282,12 +453,13 @@ static size_t ZSTD_compressBlock_doubleF
|
282 | 453 | while (ip <= ilimit) { |
|
283 | 454 | U32 const current2 = (U32)(ip-base); |
|
284 | 455 | U32 const repIndex2 = current2 - offset_2; |
|
285 | const BYTE* repMatch2 = repIndex2 < dictLimit ? dictBase + repIndex2 : base + repIndex2; | |
|
286 | if ( (((U32)((dictLimit-1) - repIndex2) >= 3) & (repIndex2 > lowestIndex)) /* intentional overflow */ | |
|
287 | && (MEM_read32(repMatch2) == MEM_read32(ip)) ) { | |
|
288 | const BYTE* const repEnd2 = repIndex2 < dictLimit ? dictEnd : iend; | |
|
289 | size_t const repLength2 = ZSTD_count_2segments(ip+4, repMatch2+4, iend, repEnd2, lowPrefixPtr) + 4; | |
|
290 | U32 tmpOffset = offset_2; offset_2 = offset_1; offset_1 = tmpOffset; /* swap offset_2 <=> offset_1 */ | |
|
456 | const BYTE* repMatch2 = repIndex2 < prefixStartIndex ? dictBase + repIndex2 : base + repIndex2; | |
|
457 | if ( (((U32)((prefixStartIndex-1) - repIndex2) >= 3) /* intentional overflow : ensure repIndex2 doesn't overlap dict + prefix */ | |
|
458 | & (repIndex2 > dictStartIndex)) | |
|
459 | && (MEM_read32(repMatch2) == MEM_read32(ip)) ) { | |
|
460 | const BYTE* const repEnd2 = repIndex2 < prefixStartIndex ? dictEnd : iend; | |
|
461 | size_t const repLength2 = ZSTD_count_2segments(ip+4, repMatch2+4, iend, repEnd2, prefixStart) + 4; | |
|
462 | U32 const tmpOffset = offset_2; offset_2 = offset_1; offset_1 = tmpOffset; /* swap offset_2 <=> offset_1 */ | |
|
291 | 463 | ZSTD_storeSeq(seqStore, 0, anchor, 0, repLength2-MINMATCH); |
|
292 | 464 | hashSmall[ZSTD_hashPtr(ip, hBitsS, mls)] = current2; |
|
293 | 465 | hashLong[ZSTD_hashPtr(ip, hBitsL, 8)] = current2; |
@@ -309,19 +481,19 @@ static size_t ZSTD_compressBlock_doubleF
|
309 | 481 | |
|
310 | 482 | size_t ZSTD_compressBlock_doubleFast_extDict( |
|
311 | 483 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
312 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize) | |
|
484 | void const* src, size_t srcSize) | |
|
313 | 485 | { |
|
314 | U32 const mls = cParams->searchLength; | |
|
486 | U32 const mls = ms->cParams.searchLength; | |
|
315 | 487 | switch(mls) |
|
316 | 488 | { |
|
317 | 489 | default: /* includes case 3 */ |
|
318 | 490 | case 4 : |
|
319 | return ZSTD_compressBlock_doubleFast_extDict_generic(ms, seqStore, rep, cParams, src, srcSize, 4); | |
|
491 | return ZSTD_compressBlock_doubleFast_extDict_generic(ms, seqStore, rep, src, srcSize, 4); | |
|
320 | 492 | case 5 : |
|
321 | return ZSTD_compressBlock_doubleFast_extDict_generic(ms, seqStore, rep, cParams, src, srcSize, 5); | |
|
493 | return ZSTD_compressBlock_doubleFast_extDict_generic(ms, seqStore, rep, src, srcSize, 5); | |
|
322 | 494 | case 6 : |
|
323 | return ZSTD_compressBlock_doubleFast_extDict_generic(ms, seqStore, rep, cParams, src, srcSize, 6); | |
|
495 | return ZSTD_compressBlock_doubleFast_extDict_generic(ms, seqStore, rep, src, srcSize, 6); | |
|
324 | 496 | case 7 : |
|
325 | return ZSTD_compressBlock_doubleFast_extDict_generic(ms, seqStore, rep, cParams, src, srcSize, 7); | |
|
497 | return ZSTD_compressBlock_doubleFast_extDict_generic(ms, seqStore, rep, src, srcSize, 7); | |
|
326 | 498 | } |
|
327 | 499 | } |
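These mls-dispatch wrappers all follow zstd's template-emulation pattern: the `_generic` worker takes `mls` and the dict mode as parameters, and each `case` passes compile-time constants so the compiler can specialize the body and fold the `dictMode` branches away. A hedged sketch of the pattern, with illustrative names rather than the real API:

    #include <stddef.h>
    #include <stdint.h>

    typedef enum { MODE_NODICT, MODE_DICT } dict_mode_e;

    /* inlined per call site, so each instantiation below becomes its own
     * specialized loop with 'mls' and 'mode' treated as constants */
    static inline size_t worker_generic(const uint8_t* src, size_t n,
                                        unsigned mls, dict_mode_e mode) {
        size_t score = 0;
        for (size_t i = 0; i + mls <= n; i++) {
            score += src[i] & (mls - 1);    /* stand-in for real matching work */
            if (mode == MODE_DICT) score++; /* constant-folded away when NODICT */
        }
        return score;
    }

    size_t worker(const uint8_t* src, size_t n, unsigned mls) {
        switch (mls) {
        default: /* includes 3 */
        case 4: return worker_generic(src, n, 4, MODE_NODICT);
        case 5: return worker_generic(src, n, 5, MODE_NODICT);
        case 6: return worker_generic(src, n, 6, MODE_NODICT);
        case 7: return worker_generic(src, n, 7, MODE_NODICT);
        }
    }

    int main(void) {
        static const uint8_t data[32] = {1, 2, 3};
        return (int)(worker(data, sizeof data, 4) & 0x7f);
    }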
@@ -19,14 +19,16 @@ extern "C" {
|
19 | 19 | #include "zstd_compress_internal.h" /* ZSTD_CCtx, size_t */ |
|
20 | 20 | |
|
21 | 21 | void ZSTD_fillDoubleHashTable(ZSTD_matchState_t* ms, |
|
22 | ZSTD_compressionParameters const* cParams, | |
|
23 | void const* end); | |
|
22 | void const* end, ZSTD_dictTableLoadMethod_e dtlm); | |
|
24 | 23 | size_t ZSTD_compressBlock_doubleFast( |
|
25 | 24 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
26 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); | |
|
25 | void const* src, size_t srcSize); | |
|
26 | size_t ZSTD_compressBlock_doubleFast_dictMatchState( | |
|
27 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
28 | void const* src, size_t srcSize); | |
|
27 | 29 | size_t ZSTD_compressBlock_doubleFast_extDict( |
|
28 | 30 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
29 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); | |
|
31 | void const* src, size_t srcSize); | |
|
30 | 32 | |
|
31 | 33 | |
|
32 | 34 | #if defined (__cplusplus) |
@@ -13,9 +13,9 @@
|
13 | 13 | |
|
14 | 14 | |
|
15 | 15 | void ZSTD_fillHashTable(ZSTD_matchState_t* ms, |
|
16 | ZSTD_compressionParameters const* cParams, | |
|
17 | void const* end) | |
|
16 | void const* end, ZSTD_dictTableLoadMethod_e dtlm) | |
|
18 | 17 | { |
|
18 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
19 | 19 | U32* const hashTable = ms->hashTable; |
|
20 | 20 | U32 const hBits = cParams->hashLog; |
|
21 | 21 | U32 const mls = cParams->searchLength; |
@@ -34,6 +34,9 @@ void ZSTD_fillHashTable(ZSTD_matchState_
|
34 | 34 | size_t const hash = ZSTD_hashPtr(ip + i, hBits, mls); |
|
35 | 35 | if (i == 0 || hashTable[hash] == 0) |
|
36 | 36 | hashTable[hash] = current + i; |
|
37 | /* Only load extra positions for ZSTD_dtlm_full */ | |
|
38 | if (dtlm == ZSTD_dtlm_fast) | |
|
39 | break; | |
|
37 | 40 | } |
|
38 | 41 | } |
|
39 | 42 | } |
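The new `dtlm` parameter trades dictionary-load time against match coverage: `ZSTD_dtlm_fast` indexes only the first position of each group, while full loading also fills empty slots for the extra positions. A toy sketch of that shape (invented names and hash):

    #include <stdint.h>
    #include <stddef.h>

    typedef enum { DTLM_FAST, DTLM_FULL } dtlm_e;

    /* for each anchor p, optionally index a few following positions too:
     * the anchor always overwrites its slot, extras only fill empty slots,
     * and DTLM_FAST breaks out after the anchor */
    static void fill_table(uint32_t* table, uint32_t mask, const uint8_t* base,
                           size_t end, size_t fanout, dtlm_e dtlm) {
        for (size_t p = 0; p < end; p += fanout) {
            for (size_t i = 0; i < fanout && p + i < end; i++) {
                uint32_t h = ((uint32_t)base[p + i] * 2654435761U) & mask; /* toy hash */
                if (i == 0 || table[h] == 0)
                    table[h] = (uint32_t)(p + i);
                if (dtlm == DTLM_FAST)
                    break;   /* only load extra positions for DTLM_FULL */
            }
        }
    }

    int main(void) {
        static const uint8_t dict[64] = {1, 2, 3};
        uint32_t table[256] = {0};
        fill_table(table, 255, dict, sizeof dict, 4, DTLM_FAST);
        return 0;
    }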
@@ -42,26 +45,65 @@ FORCE_INLINE_TEMPLATE
|
42 | 45 | size_t ZSTD_compressBlock_fast_generic( |
|
43 | 46 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
44 | 47 | void const* src, size_t srcSize, |
|
45 | U32 const hlog, U32 const stepSize, U32 const mls) | |
|
48 | U32 const mls, ZSTD_dictMode_e const dictMode) | |
|
46 | 49 | { |
|
50 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
47 | 51 | U32* const hashTable = ms->hashTable; |
|
52 | U32 const hlog = cParams->hashLog; | |
|
53 | /* support stepSize of 0 */ | |
|
54 | U32 const stepSize = cParams->targetLength + !(cParams->targetLength); | |
|
48 | 55 | const BYTE* const base = ms->window.base; |
|
49 | 56 | const BYTE* const istart = (const BYTE*)src; |
|
50 | 57 | const BYTE* ip = istart; |
|
51 | 58 | const BYTE* anchor = istart; |
|
52 | const U32 lowestIndex = ms->window.dictLimit; | |
|
53 | const BYTE* const lowest = base + lowestIndex; | |
|
59 | const U32 prefixStartIndex = ms->window.dictLimit; | |
|
60 | const BYTE* const prefixStart = base + prefixStartIndex; | |
|
54 | 61 | const BYTE* const iend = istart + srcSize; |
|
55 | 62 | const BYTE* const ilimit = iend - HASH_READ_SIZE; |
|
56 | 63 | U32 offset_1=rep[0], offset_2=rep[1]; |
|
57 | 64 | U32 offsetSaved = 0; |
|
58 | 65 | |
|
66 | const ZSTD_matchState_t* const dms = ms->dictMatchState; | |
|
67 | const ZSTD_compressionParameters* const dictCParams = | |
|
68 | dictMode == ZSTD_dictMatchState ? | |
|
69 | &dms->cParams : NULL; | |
|
70 | const U32* const dictHashTable = dictMode == ZSTD_dictMatchState ? | |
|
71 | dms->hashTable : NULL; | |
|
72 | const U32 dictStartIndex = dictMode == ZSTD_dictMatchState ? | |
|
73 | dms->window.dictLimit : 0; | |
|
74 | const BYTE* const dictBase = dictMode == ZSTD_dictMatchState ? | |
|
75 | dms->window.base : NULL; | |
|
76 | const BYTE* const dictStart = dictMode == ZSTD_dictMatchState ? | |
|
77 | dictBase + dictStartIndex : NULL; | |
|
78 | const BYTE* const dictEnd = dictMode == ZSTD_dictMatchState ? | |
|
79 | dms->window.nextSrc : NULL; | |
|
80 | const U32 dictIndexDelta = dictMode == ZSTD_dictMatchState ? | |
|
81 | prefixStartIndex - (U32)(dictEnd - dictBase) : | |
|
82 | 0; | |
|
83 | const U32 dictAndPrefixLength = (U32)(ip - prefixStart + dictEnd - dictStart); | |
|
84 | const U32 dictHLog = dictMode == ZSTD_dictMatchState ? | |
|
85 | dictCParams->hashLog : hlog; | |
|
86 | ||
|
87 | assert(dictMode == ZSTD_noDict || dictMode == ZSTD_dictMatchState); | |
|
88 | ||
|
89 | /* otherwise, we would get index underflow when translating a dict index | |
|
90 | * into a local index */ | |
|
91 | assert(dictMode != ZSTD_dictMatchState | |
|
92 | || prefixStartIndex >= (U32)(dictEnd - dictBase)); | |
|
93 | ||
|
59 | 94 | /* init */ |
|
60 | ip += (ip==lowest); | |
|
61 | { U32 const maxRep = (U32)(ip-lowest); | |
|
95 | ip += (dictAndPrefixLength == 0); | |
|
96 | if (dictMode == ZSTD_noDict) { | |
|
97 | U32 const maxRep = (U32)(ip - prefixStart); | |
|
62 | 98 | if (offset_2 > maxRep) offsetSaved = offset_2, offset_2 = 0; |
|
63 | 99 | if (offset_1 > maxRep) offsetSaved = offset_1, offset_1 = 0; |
|
64 | 100 | } |
|
101 | if (dictMode == ZSTD_dictMatchState) { | |
|
102 | /* dictMatchState repCode checks don't currently handle repCode == 0 | |
|
103 | * disabling. */ | |
|
104 | assert(offset_1 <= dictAndPrefixLength); | |
|
105 | assert(offset_2 <= dictAndPrefixLength); | |
|
106 | } | |
|
65 | 107 | |
|
66 | 108 | /* Main Search Loop */ |
|
67 | 109 | while (ip < ilimit) { /* < instead of <=, because repcode check at (ip+1) */ |
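The `dictIndexDelta` computed above maps indices from the dictionary's window into the current window's index space, so that `current - matchIndex` offsets remain meaningful for matches found in the dictionary; the real code does this in U32 arithmetic, relying on wraparound when the delta would be negative. A small worked example with invented numbers:

    #include <stdint.h>
    #include <stdio.h>

    int main(void) {
        /* invented geometry: the dictionary's own indices run up to
         * dictEndIndex; the current window's prefix starts at
         * prefixStartIndex; the delta glues the dictionary right below
         * the prefix in one shared index space */
        const uint32_t dictEndIndex     = 4096;   /* (U32)(dictEnd - dictBase) */
        const uint32_t prefixStartIndex = 8192;
        const uint32_t dictIndexDelta   = prefixStartIndex - dictEndIndex;

        const uint32_t dictMatchIndex = 1000;     /* candidate from the dict table */
        const uint32_t matchIndex = dictMatchIndex + dictIndexDelta; /* translated */

        const uint32_t current = 9000;            /* position in current window */
        printf("offset = %u\n", current - matchIndex);  /* prints: offset = 3904 */
        return 0;
    }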
@@ -70,26 +112,67 @@ size_t ZSTD_compressBlock_fast_generic(
|
70 | 112 | U32 const current = (U32)(ip-base); |
|
71 | 113 | U32 const matchIndex = hashTable[h]; |
|
72 | 114 | const BYTE* match = base + matchIndex; |
|
115 | const U32 repIndex = current + 1 - offset_1; | |
|
116 | const BYTE* repMatch = (dictMode == ZSTD_dictMatchState | |
|
117 | && repIndex < prefixStartIndex) ? | |
|
118 | dictBase + (repIndex - dictIndexDelta) : | |
|
119 | base + repIndex; | |
|
73 | 120 | hashTable[h] = current; /* update hash table */ |
|
74 | 121 | |
|
75 | if ((offset_1 > 0) & (MEM_read32(ip+1-offset_1) == MEM_read32(ip+1))) { | |
|
122 | if ( (dictMode == ZSTD_dictMatchState) | |
|
123 | && ((U32)((prefixStartIndex-1) - repIndex) >= 3) /* intentional underflow : ensure repIndex isn't overlapping dict + prefix */ | |
|
124 | && (MEM_read32(repMatch) == MEM_read32(ip+1)) ) { | |
|
125 | const BYTE* const repMatchEnd = repIndex < prefixStartIndex ? dictEnd : iend; | |
|
126 | mLength = ZSTD_count_2segments(ip+1+4, repMatch+4, iend, repMatchEnd, prefixStart) + 4; | |
|
127 | ip++; | |
|
128 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, 0, mLength-MINMATCH); | |
|
129 | } else if ( dictMode == ZSTD_noDict | |
|
130 | && ((offset_1 > 0) & (MEM_read32(ip+1-offset_1) == MEM_read32(ip+1)))) { | |
|
76 | 131 | mLength = ZSTD_count(ip+1+4, ip+1+4-offset_1, iend) + 4; |
|
77 | 132 | ip++; |
|
78 | 133 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, 0, mLength-MINMATCH); |
|
79 | } else { | |
|
80 | if ( (matchIndex <= lowestIndex) | |
|
81 | || (MEM_read32(match) != MEM_read32(ip)) ) { | |
|
134 | } else if ( (matchIndex <= prefixStartIndex) ) { | |
|
135 | if (dictMode == ZSTD_dictMatchState) { | |
|
136 | size_t const dictHash = ZSTD_hashPtr(ip, dictHLog, mls); | |
|
137 | U32 const dictMatchIndex = dictHashTable[dictHash]; | |
|
138 | const BYTE* dictMatch = dictBase + dictMatchIndex; | |
|
139 | if (dictMatchIndex <= dictStartIndex || | |
|
140 | MEM_read32(dictMatch) != MEM_read32(ip)) { | |
|
141 | assert(stepSize >= 1); | |
|
142 | ip += ((ip-anchor) >> kSearchStrength) + stepSize; | |
|
143 | continue; | |
|
144 | } else { | |
|
145 | /* found a dict match */ | |
|
146 | U32 const offset = (U32)(current-dictMatchIndex-dictIndexDelta); | |
|
147 | mLength = ZSTD_count_2segments(ip+4, dictMatch+4, iend, dictEnd, prefixStart) + 4; | |
|
148 | while (((ip>anchor) & (dictMatch>dictStart)) | |
|
149 | && (ip[-1] == dictMatch[-1])) { | |
|
150 | ip--; dictMatch--; mLength++; | |
|
151 | } /* catch up */ | |
|
152 | offset_2 = offset_1; | |
|
153 | offset_1 = offset; | |
|
154 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, offset + ZSTD_REP_MOVE, mLength-MINMATCH); | |
|
155 | } | |
|
156 | } else { | |
|
82 | 157 | assert(stepSize >= 1); |
|
83 | 158 | ip += ((ip-anchor) >> kSearchStrength) + stepSize; |
|
84 | 159 | continue; |
|
85 | 160 | } |
|
161 | } else if (MEM_read32(match) != MEM_read32(ip)) { | |
|
162 | /* it's not a match, and we're not going to check the dictionary */ | |
|
163 | assert(stepSize >= 1); | |
|
164 | ip += ((ip-anchor) >> kSearchStrength) + stepSize; | |
|
165 | continue; | |
|
166 | } else { | |
|
167 | /* found a regular match */ | |
|
168 | U32 const offset = (U32)(ip-match); | |
|
86 | 169 | mLength = ZSTD_count(ip+4, match+4, iend) + 4; |
|
87 | { U32 const offset = (U32)(ip-match); | |
|
88 | while (((ip>anchor) & (match>lowest)) && (ip[-1] == match[-1])) { ip--; match--; mLength++; } /* catch up */ | |
|
89 | offset_2 = offset_1; | |
|
90 | offset_1 = offset; | |
|
91 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, offset + ZSTD_REP_MOVE, mLength-MINMATCH); | |
|
92 | } } | |
|
170 | while (((ip>anchor) & (match>prefixStart)) | |
|
171 | && (ip[-1] == match[-1])) { ip--; match--; mLength++; } /* catch up */ | |
|
172 | offset_2 = offset_1; | |
|
173 | offset_1 = offset; | |
|
174 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, offset + ZSTD_REP_MOVE, mLength-MINMATCH); | |
|
175 | } | |
|
93 | 176 | |
|
94 | 177 | /* match found */ |
|
95 | 178 | ip += mLength; |
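The `while (((ip>anchor) & (match>prefixStart)) && (ip[-1] == match[-1])) { ip--; match--; mLength++; }` idiom that recurs in these loops is the "catch up" step: the hash only proves agreement from the probed position forward, so the match is extended backwards as long as the preceding bytes also agree. A standalone illustration:

    #include <stdio.h>
    #include <string.h>

    int main(void) {
        const char* buf   = "yyabcdefxxabcdef";
        const char* start = buf;           /* lowest position we may touch */
        const char* match = buf + 4;       /* candidate found at 'c' ... */
        const char* ip    = buf + 12;      /* ... matching 'c' here */
        size_t mLength = 4;                /* forward match already counted */

        /* extend backwards while the previous bytes also agree */
        while (ip > start && match > start && ip[-1] == match[-1]) {
            ip--; match--; mLength++;
        }
        printf("match starts at offset %td, length %zu\n", ip - buf, mLength);
        /* prints: match starts at offset 10, length 6 */
        return 0;
    }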
@@ -97,21 +180,46 @@ size_t ZSTD_compressBlock_fast_generic(
|
97 | 180 | |
|
98 | 181 | if (ip <= ilimit) { |
|
99 | 182 | /* Fill Table */ |
|
183 | assert(base+current+2 > istart); /* check base overflow */ | |
|
100 | 184 | hashTable[ZSTD_hashPtr(base+current+2, hlog, mls)] = current+2; /* here because current+2 could be > iend-8 */ |
|
101 | 185 | hashTable[ZSTD_hashPtr(ip-2, hlog, mls)] = (U32)(ip-2-base); |
|
186 | ||
|
102 | 187 | /* check immediate repcode */ |
|
103 | while ( (ip <= ilimit) | |
|
104 | && ( (offset_2>0) | |
|
105 | & (MEM_read32(ip) == MEM_read32(ip - offset_2)) )) { | |
|
106 | /* store sequence */ | |
|
107 | size_t const rLength = ZSTD_count(ip+4, ip+4-offset_2, iend) + 4; | |
|
108 | { U32 const tmpOff = offset_2; offset_2 = offset_1; offset_1 = tmpOff; } /* swap offset_2 <=> offset_1 */ | |
|
109 | hashTable[ZSTD_hashPtr(ip, hlog, mls)] = (U32)(ip-base); | |
|
110 | ZSTD_storeSeq(seqStore, 0, anchor, 0, rLength-MINMATCH); | |
|
111 | ip += rLength; | |
|
112 | anchor = ip; | |
|
113 | continue; /* faster when present ... (?) */ | |
|
114 | } } } | |
|
188 | if (dictMode == ZSTD_dictMatchState) { | |
|
189 | while (ip <= ilimit) { | |
|
190 | U32 const current2 = (U32)(ip-base); | |
|
191 | U32 const repIndex2 = current2 - offset_2; | |
|
192 | const BYTE* repMatch2 = repIndex2 < prefixStartIndex ? | |
|
193 | dictBase - dictIndexDelta + repIndex2 : | |
|
194 | base + repIndex2; | |
|
195 | if ( ((U32)((prefixStartIndex-1) - (U32)repIndex2) >= 3 /* intentional overflow */) | |
|
196 | && (MEM_read32(repMatch2) == MEM_read32(ip)) ) { | |
|
197 | const BYTE* const repEnd2 = repIndex2 < prefixStartIndex ? dictEnd : iend; | |
|
198 | size_t const repLength2 = ZSTD_count_2segments(ip+4, repMatch2+4, iend, repEnd2, prefixStart) + 4; | |
|
199 | U32 tmpOffset = offset_2; offset_2 = offset_1; offset_1 = tmpOffset; /* swap offset_2 <=> offset_1 */ | |
|
200 | ZSTD_storeSeq(seqStore, 0, anchor, 0, repLength2-MINMATCH); | |
|
201 | hashTable[ZSTD_hashPtr(ip, hlog, mls)] = current2; | |
|
202 | ip += repLength2; | |
|
203 | anchor = ip; | |
|
204 | continue; | |
|
205 | } | |
|
206 | break; | |
|
207 | } | |
|
208 | } | |
|
209 | ||
|
210 | if (dictMode == ZSTD_noDict) { | |
|
211 | while ( (ip <= ilimit) | |
|
212 | && ( (offset_2>0) | |
|
213 | & (MEM_read32(ip) == MEM_read32(ip - offset_2)) )) { | |
|
214 | /* store sequence */ | |
|
215 | size_t const rLength = ZSTD_count(ip+4, ip+4-offset_2, iend) + 4; | |
|
216 | U32 const tmpOff = offset_2; offset_2 = offset_1; offset_1 = tmpOff; /* swap offset_2 <=> offset_1 */ | |
|
217 | hashTable[ZSTD_hashPtr(ip, hlog, mls)] = (U32)(ip-base); | |
|
218 | ZSTD_storeSeq(seqStore, 0, anchor, 0, rLength-MINMATCH); | |
|
219 | ip += rLength; | |
|
220 | anchor = ip; | |
|
221 | continue; /* faster when present ... (?) */ | |
|
222 | } } } } | |
|
115 | 223 | |
|
116 | 224 | /* save reps for next block */ |
|
117 | 225 | rep[0] = offset_1 ? offset_1 : offsetSaved; |
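The repcode tails above maintain a two-slot history of recent offsets, swapping the slots whenever the older offset is the one that matched. A compact sketch of that bookkeeping, pulled out of the inline swap-and-store sequence (the real code performs only the swap case here; the general update is an extrapolation):

    #include <stdint.h>
    #include <stdio.h>

    /* two-slot repeat-offset history, as used by the repcode checks above */
    typedef struct { uint32_t rep1, rep2; } rep_history;

    /* a match was emitted with offset 'off'; update the history */
    static void push_offset(rep_history* h, uint32_t off) {
        if (off == h->rep2) {            /* repcode 2 hit: swap the slots */
            uint32_t tmp = h->rep2; h->rep2 = h->rep1; h->rep1 = tmp;
        } else if (off != h->rep1) {     /* brand new offset: shift it in */
            h->rep2 = h->rep1; h->rep1 = off;
        }                                /* repcode 1 hit: nothing to do */
    }

    int main(void) {
        rep_history h = {4, 8};
        push_offset(&h, 8);              /* rep2 used -> history becomes {8, 4} */
        printf("rep1=%u rep2=%u\n", h.rep1, h.rep2);
        return 0;
    }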
@@ -124,42 +232,66 @@ size_t ZSTD_compressBlock_fast_generic(
|
124 | 232 | |
|
125 | 233 | size_t ZSTD_compressBlock_fast( |
|
126 | 234 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
127 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize) | |
|
235 | void const* src, size_t srcSize) | |
|
128 | 236 | { |
|
129 | U32 const hlog = cParams->hashLog; | |
|
237 | ZSTD_compressionParameters const* cParams = &ms->cParams; | |
|
130 | 238 | U32 const mls = cParams->searchLength; |
|
131 | U32 const stepSize = cParams->targetLength; | |
|
239 | assert(ms->dictMatchState == NULL); | |
|
132 | 240 | switch(mls) |
|
133 | 241 | { |
|
134 | 242 | default: /* includes case 3 */ |
|
135 | 243 | case 4 : |
|
136 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, hlog, stepSize, 4); | |
|
244 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, 4, ZSTD_noDict); | |
|
137 | 245 | case 5 : |
|
138 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, hlog, stepSize, 5); | |
|
246 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, 5, ZSTD_noDict); | |
|
139 | 247 | case 6 : |
|
140 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, hlog, stepSize, 6); | |
|
248 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, 6, ZSTD_noDict); | |
|
141 | 249 | case 7 : |
|
142 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, hlog, stepSize, 7); | |
|
250 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, 7, ZSTD_noDict); | |
|
251 | } | |
|
252 | } | |
|
253 | ||
|
254 | size_t ZSTD_compressBlock_fast_dictMatchState( | |
|
255 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
256 | void const* src, size_t srcSize) | |
|
257 | { | |
|
258 | ZSTD_compressionParameters const* cParams = &ms->cParams; | |
|
259 | U32 const mls = cParams->searchLength; | |
|
260 | assert(ms->dictMatchState != NULL); | |
|
261 | switch(mls) | |
|
262 | { | |
|
263 | default: /* includes case 3 */ | |
|
264 | case 4 : | |
|
265 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, 4, ZSTD_dictMatchState); | |
|
266 | case 5 : | |
|
267 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, 5, ZSTD_dictMatchState); | |
|
268 | case 6 : | |
|
269 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, 6, ZSTD_dictMatchState); | |
|
270 | case 7 : | |
|
271 | return ZSTD_compressBlock_fast_generic(ms, seqStore, rep, src, srcSize, 7, ZSTD_dictMatchState); | |
|
143 | 272 | } |
|
144 | 273 | } |
|
145 | 274 | |
|
146 | 275 | |
|
147 | 276 | static size_t ZSTD_compressBlock_fast_extDict_generic( |
|
148 | 277 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
149 | void const* src, size_t srcSize, | |
|
150 | U32 const hlog, U32 const stepSize, U32 const mls) | |
|
278 | void const* src, size_t srcSize, U32 const mls) | |
|
151 | 279 | { |
|
152 | U32* hashTable = ms->hashTable; | |
|
280 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
281 | U32* const hashTable = ms->hashTable; | |
|
282 | U32 const hlog = cParams->hashLog; | |
|
283 | /* support stepSize of 0 */ | |
|
284 | U32 const stepSize = cParams->targetLength + !(cParams->targetLength); | |
|
153 | 285 | const BYTE* const base = ms->window.base; |
|
154 | 286 | const BYTE* const dictBase = ms->window.dictBase; |
|
155 | 287 | const BYTE* const istart = (const BYTE*)src; |
|
156 | 288 | const BYTE* ip = istart; |
|
157 | 289 | const BYTE* anchor = istart; |
|
158 | const U32 lowestIndex = ms->window.lowLimit; | |
|
159 | const BYTE* const dictStart = dictBase + lowestIndex; | |
|
160 | const U32 dictLimit = ms->window.dictLimit; | |
|
161 | const BYTE* const lowPrefixPtr = base + dictLimit; | |
|
162 | const BYTE* const dictEnd = dictBase + dictLimit; | |
|
290 | const U32 dictStartIndex = ms->window.lowLimit; | |
|
291 | const BYTE* const dictStart = dictBase + dictStartIndex; | |
|
292 | const U32 prefixStartIndex = ms->window.dictLimit; | |
|
293 | const BYTE* const prefixStart = base + prefixStartIndex; | |
|
294 | const BYTE* const dictEnd = dictBase + prefixStartIndex; | |
|
163 | 295 | const BYTE* const iend = istart + srcSize; |
|
164 | 296 | const BYTE* const ilimit = iend - 8; |
|
165 | 297 | U32 offset_1=rep[0], offset_2=rep[1]; |
@@ -167,33 +299,34 @@ static size_t ZSTD_compressBlock_fast_ex
|
167 | 299 | /* Search Loop */ |
|
168 | 300 | while (ip < ilimit) { /* < instead of <=, because (ip+1) */ |
|
169 | 301 | const size_t h = ZSTD_hashPtr(ip, hlog, mls); |
|
170 | const U32 matchIndex = hashTable[h]; | |
|
171 | const BYTE* matchBase = matchIndex < dictLimit ? dictBase : base; | |
|
172 | const BYTE* match = matchBase + matchIndex; | |
|
173 | const U32 current = (U32)(ip-base); | |
|
174 | const U32 repIndex = current + 1 - offset_1; /* offset_1 expected <= current +1 */ | |
|
175 | const BYTE* repBase = repIndex < dictLimit ? dictBase : base; | |
|
176 | const BYTE* repMatch = repBase + repIndex; | |
|
302 | const U32 matchIndex = hashTable[h]; | |
|
303 | const BYTE* const matchBase = matchIndex < prefixStartIndex ? dictBase : base; | |
|
304 | const BYTE* match = matchBase + matchIndex; | |
|
305 | const U32 current = (U32)(ip-base); | |
|
306 | const U32 repIndex = current + 1 - offset_1; | |
|
307 | const BYTE* const repBase = repIndex < prefixStartIndex ? dictBase : base; | |
|
308 | const BYTE* const repMatch = repBase + repIndex; | |
|
177 | 309 | size_t mLength; |
|
178 | 310 | hashTable[h] = current; /* update hash table */ |
|
311 | assert(offset_1 <= current +1); /* check repIndex */ | |
|
179 | 312 | |
|
180 | if ( (((U32)((dictLimit-1) - repIndex) >= 3) /* intentional underflow */ & (repIndex > lowestIndex)) | |
|
313 | if ( (((U32)((prefixStartIndex-1) - repIndex) >= 3) /* intentional underflow */ & (repIndex > dictStartIndex)) | |
|
181 | 314 | && (MEM_read32(repMatch) == MEM_read32(ip+1)) ) { |
|
182 | const BYTE* repMatchEnd = repIndex < dictLimit ? dictEnd : iend; | |
|
183 | mLength = ZSTD_count_2segments(ip+1+4, repMatch+4, iend, repMatchEnd, lowPrefixPtr) + 4; | |
|
315 | const BYTE* repMatchEnd = repIndex < prefixStartIndex ? dictEnd : iend; | |
|
316 | mLength = ZSTD_count_2segments(ip+1+4, repMatch+4, iend, repMatchEnd, prefixStart) + 4; | |
|
184 | 317 | ip++; |
|
185 | 318 | ZSTD_storeSeq(seqStore, ip-anchor, anchor, 0, mLength-MINMATCH); |
|
186 | 319 | } else { |
|
187 | if ( (matchIndex < lowestIndex) || | |
|
320 | if ( (matchIndex < dictStartIndex) || | |
|
188 | 321 | (MEM_read32(match) != MEM_read32(ip)) ) { |
|
189 | 322 | assert(stepSize >= 1); |
|
190 | 323 | ip += ((ip-anchor) >> kSearchStrength) + stepSize; |
|
191 | 324 | continue; |
|
192 | 325 | } |
|
193 | { const BYTE* matchEnd = matchIndex < dictLimit ? dictEnd : iend; | |
|
194 | const BYTE* lowMatchPtr = matchIndex < dictLimit ? dictStart : lowPrefixPtr; | |
|
326 | { const BYTE* matchEnd = matchIndex < prefixStartIndex ? dictEnd : iend; | |
|
327 | const BYTE* lowMatchPtr = matchIndex < prefixStartIndex ? dictStart : prefixStart; | |
|
195 | 328 | U32 offset; |
|
196 | mLength = ZSTD_count_2segments(ip+4, match+4, iend, matchEnd, lowPrefixPtr) + 4; | |
|
329 | mLength = ZSTD_count_2segments(ip+4, match+4, iend, matchEnd, prefixStart) + 4; | |
|
197 | 330 | while (((ip>anchor) & (match>lowMatchPtr)) && (ip[-1] == match[-1])) { ip--; match--; mLength++; } /* catch up */ |
|
198 | 331 | offset = current - matchIndex; |
|
199 | 332 | offset_2 = offset_1; |
@@ -213,11 +346,11 @@ static size_t ZSTD_compressBlock_fast_ex
|
213 | 346 | while (ip <= ilimit) { |
|
214 | 347 | U32 const current2 = (U32)(ip-base); |
|
215 | 348 | U32 const repIndex2 = current2 - offset_2; |
|
216 | const BYTE* repMatch2 = repIndex2 < dictLimit ? dictBase + repIndex2 : base + repIndex2; | |
|
217 | if ( (((U32)((dictLimit-1) - repIndex2) >= 3) & (repIndex2 > lowestIndex)) /* intentional overflow */ | |
|
349 | const BYTE* repMatch2 = repIndex2 < prefixStartIndex ? dictBase + repIndex2 : base + repIndex2; | |
|
350 | if ( (((U32)((prefixStartIndex-1) - repIndex2) >= 3) & (repIndex2 > dictStartIndex)) /* intentional overflow */ | |
|
218 | 351 | && (MEM_read32(repMatch2) == MEM_read32(ip)) ) { |
|
219 | const BYTE* const repEnd2 = repIndex2 < dictLimit ? dictEnd : iend; | |
|
220 | size_t const repLength2 = ZSTD_count_2segments(ip+4, repMatch2+4, iend, repEnd2, lowPrefixPtr) + 4; | |
|
352 | const BYTE* const repEnd2 = repIndex2 < prefixStartIndex ? dictEnd : iend; | |
|
353 | size_t const repLength2 = ZSTD_count_2segments(ip+4, repMatch2+4, iend, repEnd2, prefixStart) + 4; | |
|
221 | 354 | U32 tmpOffset = offset_2; offset_2 = offset_1; offset_1 = tmpOffset; /* swap offset_2 <=> offset_1 */ |
|
222 | 355 | ZSTD_storeSeq(seqStore, 0, anchor, 0, repLength2-MINMATCH); |
|
223 | 356 | hashTable[ZSTD_hashPtr(ip, hlog, mls)] = current2; |
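`ZSTD_count_2segments`, used throughout these extDict paths, measures a match that may start in the old (dictionary) segment and continue into the current prefix. A hedged standalone equivalent with a simplified signature:

    #include <stddef.h>
    #include <stdio.h>

    /* count how far p and q agree, with q allowed to run off the end of its
     * first segment (seg1End) and resume at seg2; the p-side bound suffices
     * in this toy because the mismatch arrives before any overrun */
    static size_t count_2segments(const char* p, const char* pEnd,
                                  const char* q, const char* seg1End,
                                  const char* seg2) {
        size_t n = 0;
        while (p < pEnd && q < seg1End && *p == *q) { p++; q++; n++; }
        if (q == seg1End) {              /* continue matching in segment 2 */
            q = seg2;
            while (p < pEnd && *p == *q) { p++; q++; n++; }
        }
        return n;
    }

    int main(void) {
        const char* dict   = "world";    /* tail of the old segment */
        const char* prefix = "!!hello";  /* the current segment */
        const char* input  = "world!!hX";
        size_t n = count_2segments(input, input + 9, dict, dict + 5, prefix);
        printf("matched %zu bytes across the segment boundary\n", n);  /* 8 */
        return 0;
    }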
@@ -239,21 +372,20 @@ static size_t ZSTD_compressBlock_fast_ex
|
239 | 372 | |
|
240 | 373 | size_t ZSTD_compressBlock_fast_extDict( |
|
241 | 374 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
242 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize) | |
|
375 | void const* src, size_t srcSize) | |
|
243 | 376 | { |
|
244 | U32 const hlog = cParams->hashLog; | |
|
377 | ZSTD_compressionParameters const* cParams = &ms->cParams; | |
|
245 | 378 | U32 const mls = cParams->searchLength; |
|
246 | U32 const stepSize = cParams->targetLength; | |
|
247 | 379 | switch(mls) |
|
248 | 380 | { |
|
249 | 381 | default: /* includes case 3 */ |
|
250 | 382 | case 4 : |
|
251 | return ZSTD_compressBlock_fast_extDict_generic(ms, seqStore, rep, src, srcSize, hlog, stepSize, 4); | |
|
383 | return ZSTD_compressBlock_fast_extDict_generic(ms, seqStore, rep, src, srcSize, 4); | |
|
252 | 384 | case 5 : |
|
253 | return ZSTD_compressBlock_fast_extDict_generic(ms, seqStore, rep, src, srcSize, hlog, stepSize, 5); | |
|
385 | return ZSTD_compressBlock_fast_extDict_generic(ms, seqStore, rep, src, srcSize, 5); | |
|
254 | 386 | case 6 : |
|
255 | return ZSTD_compressBlock_fast_extDict_generic(ms, seqStore, rep, src, srcSize, hlog, stepSize, 6); | |
|
387 | return ZSTD_compressBlock_fast_extDict_generic(ms, seqStore, rep, src, srcSize, 6); | |
|
256 | 388 | case 7 : |
|
257 | return ZSTD_compressBlock_fast_extDict_generic(ms, seqStore, rep, src, srcSize, hlog, stepSize, 7); | |
|
389 | return ZSTD_compressBlock_fast_extDict_generic(ms, seqStore, rep, src, srcSize, 7); | |
|
258 | 390 | } |
|
259 | 391 | } |
@@ -19,14 +19,16 @@ extern "C" {
|
19 | 19 | #include "zstd_compress_internal.h" |
|
20 | 20 | |
|
21 | 21 | void ZSTD_fillHashTable(ZSTD_matchState_t* ms, |
|
22 | ZSTD_compressionParameters const* cParams, | |
|
23 | void const* end); | |
|
22 | void const* end, ZSTD_dictTableLoadMethod_e dtlm); | |
|
24 | 23 | size_t ZSTD_compressBlock_fast( |
|
25 | 24 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
26 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); | |
|
25 | void const* src, size_t srcSize); | |
|
26 | size_t ZSTD_compressBlock_fast_dictMatchState( | |
|
27 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
28 | void const* src, size_t srcSize); | |
|
27 | 29 | size_t ZSTD_compressBlock_fast_extDict( |
|
28 | 30 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
29 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); | |
|
31 | void const* src, size_t srcSize); | |
|
30 | 32 | |
|
31 | 33 | #if defined (__cplusplus) |
|
32 | 34 | } |
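One detail shared by the fast loops in both files: on a miss they advance by `((ip-anchor) >> kSearchStrength) + stepSize`, so the skip distance grows the longer the loop goes without finding a match, and the new `targetLength + !(targetLength)` expression keeps stepSize at a minimum of 1. A toy run:

    #include <stdio.h>

    #define kSearchStrength 8            /* constant used by the loops above */

    int main(void) {
        unsigned targetLength = 0;
        unsigned stepSize = targetLength + !(targetLength);  /* clamp 0 -> 1 */
        unsigned anchor = 0, ip = 0, misses = 0;

        while (ip < 4096) {              /* simulate a long stretch of misses */
            ip += ((ip - anchor) >> kSearchStrength) + stepSize;
            misses++;
        }
        /* steps stay at 1 until ip-anchor reaches 256, then accelerate */
        printf("covered %u positions in %u probes\n", ip, misses);
        return 0;
    }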
This diff has been collapsed as it changes many lines (522 lines changed).
@@ -16,11 +16,12 @@
|
16 | 16 | * Binary Tree search |
|
17 | 17 | ***************************************/ |
|
18 | 18 | |
|
19 | void ZSTD_updateDUBT( | |
|
20 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
19 | static void | |
|
20 | ZSTD_updateDUBT(ZSTD_matchState_t* ms, | |
|
21 | 21 | const BYTE* ip, const BYTE* iend, |
|
22 | 22 | U32 mls) |
|
23 | 23 | { |
|
24 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
24 | 25 | U32* const hashTable = ms->hashTable; |
|
25 | 26 | U32 const hashLog = cParams->hashLog; |
|
26 | 27 | |
@@ -59,11 +60,12 @@ void ZSTD_updateDUBT(
|
59 | 60 | * sort one already inserted but unsorted position |
|
60 | 61 | * assumption : current >= btlow == (current - btmask) |
|
61 | 62 | * doesn't fail */ |
|
62 | static void ZSTD_insertDUBT1( | |
|
63 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
63 | static void | |
|
64 | ZSTD_insertDUBT1(ZSTD_matchState_t* ms, | |
|
64 | 65 | U32 current, const BYTE* inputEnd, |
|
65 | U32 nbCompares, U32 btLow, int extDict) | |
|
66 | U32 nbCompares, U32 btLow, const ZSTD_dictMode_e dictMode) | |
|
66 | 67 | { |
|
68 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
67 | 69 | U32* const bt = ms->chainTable; |
|
68 | 70 | U32 const btLog = cParams->chainLog - 1; |
|
69 | 71 | U32 const btMask = (1 << btLog) - 1; |
@@ -92,10 +94,12 @@ static void ZSTD_insertDUBT1(
|
92 | 94 | size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */ |
|
93 | 95 | assert(matchIndex < current); |
|
94 | 96 | |
|
95 | if ( (!extDict) | |
|
97 | if ( (dictMode != ZSTD_extDict) | |
|
96 | 98 | || (matchIndex+matchLength >= dictLimit) /* both in current segment*/ |
|
97 | 99 | || (current < dictLimit) /* both in extDict */) { |
|
98 | const BYTE* const mBase = !extDict || ((matchIndex+matchLength) >= dictLimit) ? base : dictBase; | |
|
100 | const BYTE* const mBase = ( (dictMode != ZSTD_extDict) | |
|
101 | || (matchIndex+matchLength >= dictLimit)) ? | |
|
102 | base : dictBase; | |
|
99 | 103 | assert( (matchIndex+matchLength >= dictLimit) /* might be wrong if extDict is incorrectly set to 0 */ |
|
100 | 104 | || (current < dictLimit) ); |
|
101 | 105 | match = mBase + matchIndex; |
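The `bt + 2*(matchIndex & btMask)` addressing in this function stores the binary search tree inside a flat U32 array: each position owns two consecutive slots holding the indices of its smaller-side and larger-side subtrees, with 0 doubling as "no child". A structural sketch:

    #include <stdint.h>
    #include <stdio.h>

    #define BT_LOG  4
    #define BT_MASK ((1u << BT_LOG) - 1)

    /* each position idx owns slots bt[2*(idx & BT_MASK)] (smaller child) and
     * bt[2*(idx & BT_MASK) + 1] (larger child) */
    static uint32_t bt[2 << BT_LOG];

    static void set_children(uint32_t idx, uint32_t smaller, uint32_t larger) {
        uint32_t* node = bt + 2 * (idx & BT_MASK);
        node[0] = smaller;
        node[1] = larger;
    }

    int main(void) {
        set_children(35, 20, 41);        /* node 35 -> children 20 and 41 */
        uint32_t* node = bt + 2 * (35 & BT_MASK);
        printf("smaller=%u larger=%u\n", node[0], node[1]);
        return 0;
    }

Because the array is indexed modulo the table size, older positions are silently recycled as the window advances, which is why the searches also carry explicit `btLow` bounds.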
@@ -138,13 +142,95 @@ static void ZSTD_insertDUBT1(
|
138 | 142 | } |
|
139 | 143 | |
|
140 | 144 | |
|
141 | static size_t ZSTD_DUBT_findBestMatch ( | |
|
142 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
143 | const BYTE* const ip, const BYTE* const iend, | |
|
144 | size_t* offsetPtr, | |
|
145 | U32 const mls, | |
|
146 | U32 const extDict) | |
|
145 | static size_t | |
|
146 | ZSTD_DUBT_findBetterDictMatch ( | |
|
147 | ZSTD_matchState_t* ms, | |
|
148 | const BYTE* const ip, const BYTE* const iend, | |
|
149 | size_t* offsetPtr, | |
|
150 | U32 nbCompares, | |
|
151 | U32 const mls, | |
|
152 | const ZSTD_dictMode_e dictMode) | |
|
147 | 153 | { |
|
154 | const ZSTD_matchState_t * const dms = ms->dictMatchState; | |
|
155 | const ZSTD_compressionParameters* const dmsCParams = &dms->cParams; | |
|
156 | const U32 * const dictHashTable = dms->hashTable; | |
|
157 | U32 const hashLog = dmsCParams->hashLog; | |
|
158 | size_t const h = ZSTD_hashPtr(ip, hashLog, mls); | |
|
159 | U32 dictMatchIndex = dictHashTable[h]; | |
|
160 | ||
|
161 | const BYTE* const base = ms->window.base; | |
|
162 | const BYTE* const prefixStart = base + ms->window.dictLimit; | |
|
163 | U32 const current = (U32)(ip-base); | |
|
164 | const BYTE* const dictBase = dms->window.base; | |
|
165 | const BYTE* const dictEnd = dms->window.nextSrc; | |
|
166 | U32 const dictHighLimit = (U32)(dms->window.nextSrc - dms->window.base); | |
|
167 | U32 const dictLowLimit = dms->window.lowLimit; | |
|
168 | U32 const dictIndexDelta = ms->window.lowLimit - dictHighLimit; | |
|
169 | ||
|
170 | U32* const dictBt = dms->chainTable; | |
|
171 | U32 const btLog = dmsCParams->chainLog - 1; | |
|
172 | U32 const btMask = (1 << btLog) - 1; | |
|
173 | U32 const btLow = (btMask >= dictHighLimit - dictLowLimit) ? dictLowLimit : dictHighLimit - btMask; | |
|
174 | ||
|
175 | size_t commonLengthSmaller=0, commonLengthLarger=0, bestLength=0; | |
|
176 | U32 matchEndIdx = current+8+1; | |
|
177 | ||
|
178 | (void)dictMode; | |
|
179 | assert(dictMode == ZSTD_dictMatchState); | |
|
180 | ||
|
181 | while (nbCompares-- && (dictMatchIndex > dictLowLimit)) { | |
|
182 | U32* const nextPtr = dictBt + 2*(dictMatchIndex & btMask); | |
|
183 | size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */ | |
|
184 | const BYTE* match = dictBase + dictMatchIndex; | |
|
185 | matchLength += ZSTD_count_2segments(ip+matchLength, match+matchLength, iend, dictEnd, prefixStart); | |
|
186 | if (dictMatchIndex+matchLength >= dictHighLimit) | |
|
187 | match = base + dictMatchIndex + dictIndexDelta; /* to prepare for next usage of match[matchLength] */ | |
|
188 | ||
|
189 | if (matchLength > bestLength) { | |
|
190 | U32 matchIndex = dictMatchIndex + dictIndexDelta; | |
|
191 | if (matchLength > matchEndIdx - matchIndex) | |
|
192 | matchEndIdx = matchIndex + (U32)matchLength; | |
|
193 | if ( (4*(int)(matchLength-bestLength)) > (int)(ZSTD_highbit32(current-matchIndex+1) - ZSTD_highbit32((U32)offsetPtr[0]+1)) ) { | |
|
194 | DEBUGLOG(2, "ZSTD_DUBT_findBestDictMatch(%u) : found better match length %u -> %u and offsetCode %u -> %u (dictMatchIndex %u, matchIndex %u)", | |
|
195 | current, (U32)bestLength, (U32)matchLength, (U32)*offsetPtr, ZSTD_REP_MOVE + current - matchIndex, dictMatchIndex, matchIndex); | |
|
196 | bestLength = matchLength, *offsetPtr = ZSTD_REP_MOVE + current - matchIndex; | |
|
197 | } | |
|
198 | if (ip+matchLength == iend) { /* reached end of input : ip[matchLength] is not valid, no way to know if it's larger or smaller than match */ | |
|
199 | break; /* drop, to guarantee consistency (miss a little bit of compression) */ | |
|
200 | } | |
|
201 | } | |
|
202 | ||
|
203 | DEBUGLOG(2, "matchLength:%6zu, match:%p, prefixStart:%p, ip:%p", matchLength, match, prefixStart, ip); | |
|
204 | if (match[matchLength] < ip[matchLength]) { | |
|
205 | if (dictMatchIndex <= btLow) { break; } /* beyond tree size, stop the search */ | |
|
206 | commonLengthSmaller = matchLength; /* all smaller will now have at least this guaranteed common length */ | |
|
207 | dictMatchIndex = nextPtr[1]; /* new matchIndex larger than previous (closer to current) */ | |
|
208 | } else { | |
|
209 | /* match is larger than current */ | |
|
210 | if (dictMatchIndex <= btLow) { break; } /* beyond tree size, stop the search */ | |
|
211 | commonLengthLarger = matchLength; | |
|
212 | dictMatchIndex = nextPtr[0]; | |
|
213 | } | |
|
214 | } | |
|
215 | ||
|
216 | if (bestLength >= MINMATCH) { | |
|
217 | U32 const mIndex = current - ((U32)*offsetPtr - ZSTD_REP_MOVE); (void)mIndex; | |
|
218 | DEBUGLOG(2, "ZSTD_DUBT_findBestDictMatch(%u) : found match of length %u and offsetCode %u (pos %u)", | |
|
219 | current, (U32)bestLength, (U32)*offsetPtr, mIndex); | |
|
220 | } | |
|
221 | return bestLength; | |
|
222 | ||
|
223 | } | |
|
224 | ||
|
225 | ||
|
226 | static size_t | |
|
227 | ZSTD_DUBT_findBestMatch(ZSTD_matchState_t* ms, | |
|
228 | const BYTE* const ip, const BYTE* const iend, | |
|
229 | size_t* offsetPtr, | |
|
230 | U32 const mls, | |
|
231 | const ZSTD_dictMode_e dictMode) | |
|
232 | { | |
|
233 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
148 | 234 | U32* const hashTable = ms->hashTable; |
|
149 | 235 | U32 const hashLog = cParams->hashLog; |
|
150 | 236 | size_t const h = ZSTD_hashPtr(ip, hashLog, mls); |
@@ -195,8 +281,8 @@ static size_t ZSTD_DUBT_findBestMatch (
|
195 | 281 | while (matchIndex) { /* will end on matchIndex == 0 */ |
|
196 | 282 | U32* const nextCandidateIdxPtr = bt + 2*(matchIndex&btMask) + 1; |
|
197 | 283 | U32 const nextCandidateIdx = *nextCandidateIdxPtr; |
|
198 | ZSTD_insertDUBT1(ms, cParams, matchIndex, iend, | |
|
199 | nbCandidates, unsortLimit, extDict); | |
|
284 | ZSTD_insertDUBT1(ms, matchIndex, iend, | |
|
285 | nbCandidates, unsortLimit, dictMode); | |
|
200 | 286 | matchIndex = nextCandidateIdx; |
|
201 | 287 | nbCandidates++; |
|
202 | 288 | } |
@@ -221,7 +307,7 @@ static size_t ZSTD_DUBT_findBestMatch (
|
221 | 307 | size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */ |
|
222 | 308 | const BYTE* match; |
|
223 | 309 | |
|
224 | if ((!extDict) || (matchIndex+matchLength >= dictLimit)) { | |
|
310 | if ((dictMode != ZSTD_extDict) || (matchIndex+matchLength >= dictLimit)) { | |
|
225 | 311 | match = base + matchIndex; |
|
226 | 312 | matchLength += ZSTD_count(ip+matchLength, match+matchLength, iend); |
|
227 | 313 | } else { |
@@ -259,6 +345,10 @@ static size_t ZSTD_DUBT_findBestMatch (
|
259 | 345 | |
|
260 | 346 | *smallerPtr = *largerPtr = 0; |
|
261 | 347 | |
|
348 | if (dictMode == ZSTD_dictMatchState && nbCompares) { | |
|
349 | bestLength = ZSTD_DUBT_findBetterDictMatch(ms, ip, iend, offsetPtr, nbCompares, mls, dictMode); | |
|
350 | } | |
|
351 | ||
|
262 | 352 | assert(matchEndIdx > current+8); /* ensure nextToUpdate is increased */ |
|
263 | 353 | ms->nextToUpdate = matchEndIdx - 8; /* skip repetitive patterns */ |
|
264 | 354 | if (bestLength >= MINMATCH) { |
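The acceptance test used in `ZSTD_DUBT_findBetterDictMatch` above, `4*(matchLength-bestLength) > highbit32(newOffset+1) - highbit32(oldOffset+1)`, prices offsets at roughly their bit cost: a candidate must gain about one byte of match length per four extra bits of offset. A worked example with a portable stand-in for ZSTD_highbit32:

    #include <stdint.h>
    #include <stdio.h>

    /* position of the highest set bit, i.e. floor(log2(v)) for v > 0;
     * a portable stand-in for ZSTD_highbit32 */
    static unsigned highbit32(uint32_t v) {
        unsigned r = 0;
        while (v >>= 1) r++;
        return r;
    }

    int main(void) {
        uint32_t bestLength = 8,  oldOffset = 512;
        uint32_t newLength  = 10, newOffset = 65536;

        /* is +2 bytes of length worth paying ~7 more bits of offset? */
        int better = (int)(4 * (newLength - bestLength))
                   > (int)(highbit32(newOffset + 1) - highbit32(oldOffset + 1));
        printf("take the longer match: %s\n", better ? "yes" : "no");
        /* 4*2 = 8 > 16 - 9 = 7 -> yes, barely */
        return 0;
    }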
@@ -272,61 +362,64 @@ static size_t ZSTD_DUBT_findBestMatch (
|
272 | 362 | |
|
273 | 363 | |
|
274 | 364 | /** ZSTD_BtFindBestMatch() : Tree updater, providing best match */ |
|
275 | static size_t ZSTD_BtFindBestMatch ( | |
|
276 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
277 | const BYTE* const ip, const BYTE* const iLimit, | |
|
278 | size_t* offsetPtr, | |
|
279 | const U32 mls /* template */) | |
|
365 | FORCE_INLINE_TEMPLATE size_t | |
|
366 | ZSTD_BtFindBestMatch( ZSTD_matchState_t* ms, | |
|
367 | const BYTE* const ip, const BYTE* const iLimit, | |
|
368 | size_t* offsetPtr, | |
|
369 | const U32 mls /* template */, | |
|
370 | const ZSTD_dictMode_e dictMode) | |
|
280 | 371 | { |
|
281 | 372 | DEBUGLOG(7, "ZSTD_BtFindBestMatch"); |
|
282 | 373 | if (ip < ms->window.base + ms->nextToUpdate) return 0; /* skipped area */ |
|
283 | ZSTD_updateDUBT(ms, cParams, ip, iLimit, mls); | |
|
284 | return ZSTD_DUBT_findBestMatch(ms, cParams, ip, iLimit, offsetPtr, mls, 0); | |
|
374 | ZSTD_updateDUBT(ms, ip, iLimit, mls); | |
|
375 | return ZSTD_DUBT_findBestMatch(ms, ip, iLimit, offsetPtr, mls, dictMode); | |
|
285 | 376 | } |
|
286 | 377 | |
|
287 | 378 | |
|
288 | static size_t ZSTD_BtFindBestMatch_selectMLS ( | |
|
289 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
290 | const BYTE* ip, const BYTE* const iLimit, | |
|
291 | size_t* offsetPtr) | |
|
379 | static size_t | |
|
380 | ZSTD_BtFindBestMatch_selectMLS ( ZSTD_matchState_t* ms, | |
|
381 | const BYTE* ip, const BYTE* const iLimit, | |
|
382 | size_t* offsetPtr) | |
|
292 | 383 | { |
|
293 | switch(cParams->searchLength) | |
|
384 | switch(ms->cParams.searchLength) | |
|
294 | 385 | { |
|
295 | 386 | default : /* includes case 3 */ |
|
296 | case 4 : return ZSTD_BtFindBestMatch(ms, cParams, ip, iLimit, offsetPtr, 4); | |
|
297 | case 5 : return ZSTD_BtFindBestMatch(ms, cParams, ip, iLimit, offsetPtr, 5); | |
|
387 | case 4 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 4, ZSTD_noDict); | |
|
388 | case 5 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 5, ZSTD_noDict); | |
|
298 | 389 | case 7 : |
|
299 | case 6 : return ZSTD_BtFindBestMatch(ms, cParams, ip, iLimit, offsetPtr, 6); | |
|
390 | case 6 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 6, ZSTD_noDict); | |
|
300 | 391 | } |
|
301 | 392 | } |
|
302 | 393 | |
|
303 | 394 | |
|
304 | /** Tree updater, providing best match */ | |
|
305 | static size_t ZSTD_BtFindBestMatch_extDict ( | |
|
306 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
307 | const BYTE* const ip, const BYTE* const iLimit, | |
|
308 | size_t* offsetPtr, | |
|
309 | const U32 mls) | |
|
395 | static size_t ZSTD_BtFindBestMatch_dictMatchState_selectMLS ( | |
|
396 | ZSTD_matchState_t* ms, | |
|
397 | const BYTE* ip, const BYTE* const iLimit, | |
|
398 | size_t* offsetPtr) | |
|
310 | 399 | { |
|
311 | DEBUGLOG(7, "ZSTD_BtFindBestMatch_extDict"); | |
|
312 | if (ip < ms->window.base + ms->nextToUpdate) return 0; /* skipped area */ | |
|
313 | ZSTD_updateDUBT(ms, cParams, ip, iLimit, mls); | |
|
314 |
return ZSTD_ |
|
|
400 | switch(ms->cParams.searchLength) | |
|
401 | { | |
|
402 | default : /* includes case 3 */ | |
|
403 | case 4 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 4, ZSTD_dictMatchState); | |
|
404 | case 5 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 5, ZSTD_dictMatchState); | |
|
405 | case 7 : | |
|
406 | case 6 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 6, ZSTD_dictMatchState); | |
|
407 | } | |
|
315 | 408 | } |
|
316 | 409 | |
|
317 | 410 | |
|
318 |
static size_t ZSTD_BtFindBestMatch_selectMLS |
|
|
319 |
ZSTD_matchState_t* ms, |
|
|
411 | static size_t ZSTD_BtFindBestMatch_extDict_selectMLS ( | |
|
412 | ZSTD_matchState_t* ms, | |
|
320 | 413 | const BYTE* ip, const BYTE* const iLimit, |
|
321 | 414 | size_t* offsetPtr) |
|
322 | 415 | { |
|
323 |
switch( |
|
|
416 | switch(ms->cParams.searchLength) | |
|
324 | 417 | { |
|
325 | 418 | default : /* includes case 3 */ |
|
326 |
case 4 : return ZSTD_BtFindBestMatch |
|
|
327 |
case 5 : return ZSTD_BtFindBestMatch |
|
|
419 | case 4 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 4, ZSTD_extDict); | |
|
420 | case 5 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 5, ZSTD_extDict); | |
|
328 | 421 | case 7 : |
|
329 |
case 6 : return ZSTD_BtFindBestMatch |
|
|
422 | case 6 : return ZSTD_BtFindBestMatch(ms, ip, iLimit, offsetPtr, 6, ZSTD_extDict); | |
|
330 | 423 | } |
|
331 | 424 | } |
|
332 | 425 | |
@@ -340,7 +433,8 b' static size_t ZSTD_BtFindBestMatch_selec' | |||
|
340 | 433 | /* Update chains up to ip (excluded) |
|
341 | 434 | Assumption : always within prefix (i.e. not within extDict) */ |
|
342 | 435 | static U32 ZSTD_insertAndFindFirstIndex_internal( |
|
343 |
ZSTD_matchState_t* ms, |
|
|
436 | ZSTD_matchState_t* ms, | |
|
437 | const ZSTD_compressionParameters* const cParams, | |
|
344 | 438 | const BYTE* ip, U32 const mls) |
|
345 | 439 | { |
|
346 | 440 | U32* const hashTable = ms->hashTable; |
@@ -362,22 +456,21 b' static U32 ZSTD_insertAndFindFirstIndex_' | |||
|
362 | 456 | return hashTable[ZSTD_hashPtr(ip, hashLog, mls)]; |
|
363 | 457 | } |
|
364 | 458 | |
|
365 | U32 ZSTD_insertAndFindFirstIndex( | |
|
366 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
367 | const BYTE* ip) | |
|
368 | { | |
|
369 | return ZSTD_insertAndFindFirstIndex_internal(ms, cParams, ip, cParams->searchLength); | |
|
459 | U32 ZSTD_insertAndFindFirstIndex(ZSTD_matchState_t* ms, const BYTE* ip) { | |
|
460 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
461 | return ZSTD_insertAndFindFirstIndex_internal(ms, cParams, ip, ms->cParams.searchLength); | |
|
370 | 462 | } |
|
371 | 463 | |
|
372 | 464 | |
|
373 | 465 | /* inlining is important to hardwire a hot branch (template emulation) */ |
|
374 | 466 | FORCE_INLINE_TEMPLATE |
|
375 | 467 | size_t ZSTD_HcFindBestMatch_generic ( |
|
376 |
ZSTD_matchState_t* ms, |
|
|
468 | ZSTD_matchState_t* ms, | |
|
377 | 469 | const BYTE* const ip, const BYTE* const iLimit, |
|
378 | 470 | size_t* offsetPtr, |
|
379 |
const U32 mls, const |
|
|
471 | const U32 mls, const ZSTD_dictMode_e dictMode) | |
|
380 | 472 | { |
|
473 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
381 | 474 | U32* const chainTable = ms->chainTable; |
|
382 | 475 | const U32 chainSize = (1 << cParams->chainLog); |
|
383 | 476 | const U32 chainMask = chainSize-1; |
@@ -397,7 +490,7 b' size_t ZSTD_HcFindBestMatch_generic (' | |||
|
397 | 490 | |
|
398 | 491 | for ( ; (matchIndex>lowLimit) & (nbAttempts>0) ; nbAttempts--) { |
|
399 | 492 | size_t currentMl=0; |
|
400 | if ((!extDict) || matchIndex >= dictLimit) { | |
|
493 | if ((dictMode != ZSTD_extDict) || matchIndex >= dictLimit) { | |
|
401 | 494 | const BYTE* const match = base + matchIndex; |
|
402 | 495 | if (match[ml] == ip[ml]) /* potentially better */ |
|
403 | 496 | currentMl = ZSTD_count(ip, match, iLimit); |
@@ -419,38 +512,87 b' size_t ZSTD_HcFindBestMatch_generic (' | |||
|
419 | 512 | matchIndex = NEXT_IN_CHAIN(matchIndex, chainMask); |
|
420 | 513 | } |
|
421 | 514 | |
|
515 | if (dictMode == ZSTD_dictMatchState) { | |
|
516 | const ZSTD_matchState_t* const dms = ms->dictMatchState; | |
|
517 | const U32* const dmsChainTable = dms->chainTable; | |
|
518 | const U32 dmsChainSize = (1 << dms->cParams.chainLog); | |
|
519 | const U32 dmsChainMask = dmsChainSize - 1; | |
|
520 | const U32 dmsLowestIndex = dms->window.dictLimit; | |
|
521 | const BYTE* const dmsBase = dms->window.base; | |
|
522 | const BYTE* const dmsEnd = dms->window.nextSrc; | |
|
523 | const U32 dmsSize = (U32)(dmsEnd - dmsBase); | |
|
524 | const U32 dmsIndexDelta = dictLimit - dmsSize; | |
|
525 | const U32 dmsMinChain = dmsSize > dmsChainSize ? dmsSize - dmsChainSize : 0; | |
|
526 | ||
|
527 | matchIndex = dms->hashTable[ZSTD_hashPtr(ip, dms->cParams.hashLog, mls)]; | |
|
528 | ||
|
529 | for ( ; (matchIndex>dmsLowestIndex) & (nbAttempts>0) ; nbAttempts--) { | |
|
530 | size_t currentMl=0; | |
|
531 | const BYTE* const match = dmsBase + matchIndex; | |
|
532 | assert(match+4 <= dmsEnd); | |
|
533 | if (MEM_read32(match) == MEM_read32(ip)) /* assumption : matchIndex <= dictLimit-4 (by table construction) */ | |
|
534 | currentMl = ZSTD_count_2segments(ip+4, match+4, iLimit, dmsEnd, prefixStart) + 4; | |
|
535 | ||
|
536 | /* save best solution */ | |
|
537 | if (currentMl > ml) { | |
|
538 | ml = currentMl; | |
|
539 | *offsetPtr = current - (matchIndex + dmsIndexDelta) + ZSTD_REP_MOVE; | |
|
540 | if (ip+currentMl == iLimit) break; /* best possible, avoids read overflow on next attempt */ | |
|
541 | } | |
|
542 | ||
|
543 | if (matchIndex <= dmsMinChain) break; | |
|
544 | matchIndex = dmsChainTable[matchIndex & dmsChainMask]; | |
|
545 | } | |
|
546 | } | |
|
547 | ||
|
422 | 548 | return ml; |
|
423 | 549 | } |
|
424 | 550 | |
|
425 | 551 | |
|
426 | 552 | FORCE_INLINE_TEMPLATE size_t ZSTD_HcFindBestMatch_selectMLS ( |
|
427 |
ZSTD_matchState_t* ms, |
|
|
553 | ZSTD_matchState_t* ms, | |
|
428 | 554 | const BYTE* ip, const BYTE* const iLimit, |
|
429 | 555 | size_t* offsetPtr) |
|
430 | 556 | { |
|
431 |
switch( |
|
|
557 | switch(ms->cParams.searchLength) | |
|
432 | 558 | { |
|
433 | 559 | default : /* includes case 3 */ |
|
434 |
case 4 : return ZSTD_HcFindBestMatch_generic(ms, |
|
|
435 |
case 5 : return ZSTD_HcFindBestMatch_generic(ms, |
|
|
560 | case 4 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 4, ZSTD_noDict); | |
|
561 | case 5 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 5, ZSTD_noDict); | |
|
436 | 562 | case 7 : |
|
437 |
case 6 : return ZSTD_HcFindBestMatch_generic(ms, |
|
|
563 | case 6 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 6, ZSTD_noDict); | |
|
564 | } | |
|
565 | } | |
|
566 | ||
|
567 | ||
|
568 | static size_t ZSTD_HcFindBestMatch_dictMatchState_selectMLS ( | |
|
569 | ZSTD_matchState_t* ms, | |
|
570 | const BYTE* ip, const BYTE* const iLimit, | |
|
571 | size_t* offsetPtr) | |
|
572 | { | |
|
573 | switch(ms->cParams.searchLength) | |
|
574 | { | |
|
575 | default : /* includes case 3 */ | |
|
576 | case 4 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 4, ZSTD_dictMatchState); | |
|
577 | case 5 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 5, ZSTD_dictMatchState); | |
|
578 | case 7 : | |
|
579 | case 6 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 6, ZSTD_dictMatchState); | |
|
438 | 580 | } |
|
439 | 581 | } |
|
440 | 582 | |
|
441 | 583 | |
|
442 | 584 | FORCE_INLINE_TEMPLATE size_t ZSTD_HcFindBestMatch_extDict_selectMLS ( |
|
443 |
ZSTD_matchState_t* ms, |
|
|
585 | ZSTD_matchState_t* ms, | |
|
444 | 586 | const BYTE* ip, const BYTE* const iLimit, |
|
445 |
size_t* |
|
|
587 | size_t* offsetPtr) | |
|
446 | 588 | { |
|
447 |
switch( |
|
|
589 | switch(ms->cParams.searchLength) | |
|
448 | 590 | { |
|
449 | 591 | default : /* includes case 3 */ |
|
450 |
case 4 : return ZSTD_HcFindBestMatch_generic(ms, |
|
|
451 |
case 5 : return ZSTD_HcFindBestMatch_generic(ms, |
|
|
592 | case 4 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 4, ZSTD_extDict); | |
|
593 | case 5 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 5, ZSTD_extDict); | |
|
452 | 594 | case 7 : |
|
453 |
case 6 : return ZSTD_HcFindBestMatch_generic(ms, |
|
|
595 | case 6 : return ZSTD_HcFindBestMatch_generic(ms, ip, iLimit, offsetPtr, 6, ZSTD_extDict); | |
|
454 | 596 | } |
|
455 | 597 | } |
|
456 | 598 | |
@@ -462,30 +604,55 b' FORCE_INLINE_TEMPLATE' | |||
|
462 | 604 | size_t ZSTD_compressBlock_lazy_generic( |
|
463 | 605 | ZSTD_matchState_t* ms, seqStore_t* seqStore, |
|
464 | 606 | U32 rep[ZSTD_REP_NUM], |
|
465 | ZSTD_compressionParameters const* cParams, | |
|
466 | 607 | const void* src, size_t srcSize, |
|
467 |
const U32 searchMethod, const U32 depth |
|
|
608 | const U32 searchMethod, const U32 depth, | |
|
609 | ZSTD_dictMode_e const dictMode) | |
|
468 | 610 | { |
|
469 | 611 | const BYTE* const istart = (const BYTE*)src; |
|
470 | 612 | const BYTE* ip = istart; |
|
471 | 613 | const BYTE* anchor = istart; |
|
472 | 614 | const BYTE* const iend = istart + srcSize; |
|
473 | 615 | const BYTE* const ilimit = iend - 8; |
|
474 |
const BYTE* const base = ms->window.base |
|
|
616 | const BYTE* const base = ms->window.base; | |
|
617 | const U32 prefixLowestIndex = ms->window.dictLimit; | |
|
618 | const BYTE* const prefixLowest = base + prefixLowestIndex; | |
|
475 | 619 | |
|
476 | 620 | typedef size_t (*searchMax_f)( |
|
477 |
ZSTD_matchState_t* ms, |
|
|
621 | ZSTD_matchState_t* ms, | |
|
478 | 622 | const BYTE* ip, const BYTE* iLimit, size_t* offsetPtr); |
|
479 |
searchMax_f const searchMax = |
|
|
623 | searchMax_f const searchMax = dictMode == ZSTD_dictMatchState ? | |
|
624 | (searchMethod ? ZSTD_BtFindBestMatch_dictMatchState_selectMLS : ZSTD_HcFindBestMatch_dictMatchState_selectMLS) : | |
|
625 | (searchMethod ? ZSTD_BtFindBestMatch_selectMLS : ZSTD_HcFindBestMatch_selectMLS); | |
|
480 | 626 | U32 offset_1 = rep[0], offset_2 = rep[1], savedOffset=0; |
|
481 | 627 | |
|
628 | const ZSTD_matchState_t* const dms = ms->dictMatchState; | |
|
629 | const U32 dictLowestIndex = dictMode == ZSTD_dictMatchState ? | |
|
630 | dms->window.dictLimit : 0; | |
|
631 | const BYTE* const dictBase = dictMode == ZSTD_dictMatchState ? | |
|
632 | dms->window.base : NULL; | |
|
633 | const BYTE* const dictLowest = dictMode == ZSTD_dictMatchState ? | |
|
634 | dictBase + dictLowestIndex : NULL; | |
|
635 | const BYTE* const dictEnd = dictMode == ZSTD_dictMatchState ? | |
|
636 | dms->window.nextSrc : NULL; | |
|
637 | const U32 dictIndexDelta = dictMode == ZSTD_dictMatchState ? | |
|
638 | prefixLowestIndex - (U32)(dictEnd - dictBase) : | |
|
639 | 0; | |
|
640 | const U32 dictAndPrefixLength = (U32)(ip - prefixLowest + dictEnd - dictLowest); | |
|
641 | ||
|
482 | 642 | /* init */ |
|
483 | ip += (ip==base); | |
|
643 | ip += (dictAndPrefixLength == 0); | |
|
484 | 644 | ms->nextToUpdate3 = ms->nextToUpdate; |
|
485 | { U32 const maxRep = (U32)(ip-base); | |
|
645 | if (dictMode == ZSTD_noDict) { | |
|
646 | U32 const maxRep = (U32)(ip - prefixLowest); | |
|
486 | 647 | if (offset_2 > maxRep) savedOffset = offset_2, offset_2 = 0; |
|
487 | 648 | if (offset_1 > maxRep) savedOffset = offset_1, offset_1 = 0; |
|
488 | 649 | } |
|
650 | if (dictMode == ZSTD_dictMatchState) { | |
|
651 | /* dictMatchState repCode checks don't currently handle repCode == 0 | |
|
652 | * disabling. */ | |
|
653 | assert(offset_1 <= dictAndPrefixLength); | |
|
654 | assert(offset_2 <= dictAndPrefixLength); | |
|
655 | } | |
|
489 | 656 | |
|
490 | 657 | /* Match Loop */ |
|
491 | 658 | while (ip < ilimit) { |
@@ -494,15 +661,28 b' size_t ZSTD_compressBlock_lazy_generic(' | |||
|
494 | 661 | const BYTE* start=ip+1; |
|
495 | 662 | |
|
496 | 663 | /* check repCode */ |
|
497 | if ((offset_1>0) & (MEM_read32(ip+1) == MEM_read32(ip+1 - offset_1))) { | |
|
498 | /* repcode : we take it */ | |
|
664 | if (dictMode == ZSTD_dictMatchState) { | |
|
665 | const U32 repIndex = (U32)(ip - base) + 1 - offset_1; | |
|
666 | const BYTE* repMatch = (dictMode == ZSTD_dictMatchState | |
|
667 | && repIndex < prefixLowestIndex) ? | |
|
668 | dictBase + (repIndex - dictIndexDelta) : | |
|
669 | base + repIndex; | |
|
670 | if (((U32)((prefixLowestIndex-1) - repIndex) >= 3 /* intentional underflow */) | |
|
671 | && (MEM_read32(repMatch) == MEM_read32(ip+1)) ) { | |
|
672 | const BYTE* repMatchEnd = repIndex < prefixLowestIndex ? dictEnd : iend; | |
|
673 | matchLength = ZSTD_count_2segments(ip+1+4, repMatch+4, iend, repMatchEnd, prefixLowest) + 4; | |
|
674 | if (depth==0) goto _storeSequence; | |
|
675 | } | |
|
676 | } | |
|
677 | if ( dictMode == ZSTD_noDict | |
|
678 | && ((offset_1 > 0) & (MEM_read32(ip+1-offset_1) == MEM_read32(ip+1)))) { | |
|
499 | 679 | matchLength = ZSTD_count(ip+1+4, ip+1+4-offset_1, iend) + 4; |
|
500 | 680 | if (depth==0) goto _storeSequence; |
|
501 | 681 | } |
|
502 | 682 | |
|
503 | 683 | /* first search (depth 0) */ |
|
504 | { size_t offsetFound = 99999999; | |
|
505 |
size_t const ml2 = searchMax(ms, |
|
|
684 | { size_t offsetFound = 999999999; | |
|
685 | size_t const ml2 = searchMax(ms, ip, iend, &offsetFound); | |
|
506 | 686 | if (ml2 > matchLength) |
|
507 | 687 | matchLength = ml2, start = ip, offset=offsetFound; |
|
508 | 688 | } |
@@ -516,15 +696,31 b' size_t ZSTD_compressBlock_lazy_generic(' | |||
|
516 | 696 | if (depth>=1) |
|
517 | 697 | while (ip<ilimit) { |
|
518 | 698 | ip ++; |
|
519 | if ((offset) && ((offset_1>0) & (MEM_read32(ip) == MEM_read32(ip - offset_1)))) { | |
|
699 | if ( (dictMode == ZSTD_noDict) | |
|
700 | && (offset) && ((offset_1>0) & (MEM_read32(ip) == MEM_read32(ip - offset_1)))) { | |
|
520 | 701 | size_t const mlRep = ZSTD_count(ip+4, ip+4-offset_1, iend) + 4; |
|
521 | 702 | int const gain2 = (int)(mlRep * 3); |
|
522 | 703 | int const gain1 = (int)(matchLength*3 - ZSTD_highbit32((U32)offset+1) + 1); |
|
523 | 704 | if ((mlRep >= 4) && (gain2 > gain1)) |
|
524 | 705 | matchLength = mlRep, offset = 0, start = ip; |
|
525 | 706 | } |
|
526 | { size_t offset2=99999999; | |
|
527 | size_t const ml2 = searchMax(ms, cParams, ip, iend, &offset2); | |
|
707 | if (dictMode == ZSTD_dictMatchState) { | |
|
708 | const U32 repIndex = (U32)(ip - base) - offset_1; | |
|
709 | const BYTE* repMatch = repIndex < prefixLowestIndex ? | |
|
710 | dictBase + (repIndex - dictIndexDelta) : | |
|
711 | base + repIndex; | |
|
712 | if (((U32)((prefixLowestIndex-1) - repIndex) >= 3 /* intentional underflow */) | |
|
713 | && (MEM_read32(repMatch) == MEM_read32(ip)) ) { | |
|
714 | const BYTE* repMatchEnd = repIndex < prefixLowestIndex ? dictEnd : iend; | |
|
715 | size_t const mlRep = ZSTD_count_2segments(ip+4, repMatch+4, iend, repMatchEnd, prefixLowest) + 4; | |
|
716 | int const gain2 = (int)(mlRep * 3); | |
|
717 | int const gain1 = (int)(matchLength*3 - ZSTD_highbit32((U32)offset+1) + 1); | |
|
718 | if ((mlRep >= 4) && (gain2 > gain1)) | |
|
719 | matchLength = mlRep, offset = 0, start = ip; | |
|
720 | } | |
|
721 | } | |
|
722 | { size_t offset2=999999999; | |
|
723 | size_t const ml2 = searchMax(ms, ip, iend, &offset2); | |
|
528 | 724 | int const gain2 = (int)(ml2*4 - ZSTD_highbit32((U32)offset2+1)); /* raw approx */ |
|
529 | 725 | int const gain1 = (int)(matchLength*4 - ZSTD_highbit32((U32)offset+1) + 4); |
|
530 | 726 | if ((ml2 >= 4) && (gain2 > gain1)) { |
@@ -535,15 +731,31 b' size_t ZSTD_compressBlock_lazy_generic(' | |||
|
535 | 731 | /* let's find an even better one */ |
|
536 | 732 | if ((depth==2) && (ip<ilimit)) { |
|
537 | 733 | ip ++; |
|
538 | if ((offset) && ((offset_1>0) & (MEM_read32(ip) == MEM_read32(ip - offset_1)))) { | |
|
539 | size_t const ml2 = ZSTD_count(ip+4, ip+4-offset_1, iend) + 4; | |
|
540 | int const gain2 = (int)(ml2 * 4); | |
|
734 | if ( (dictMode == ZSTD_noDict) | |
|
735 | && (offset) && ((offset_1>0) & (MEM_read32(ip) == MEM_read32(ip - offset_1)))) { | |
|
736 | size_t const mlRep = ZSTD_count(ip+4, ip+4-offset_1, iend) + 4; | |
|
737 | int const gain2 = (int)(mlRep * 4); | |
|
541 | 738 | int const gain1 = (int)(matchLength*4 - ZSTD_highbit32((U32)offset+1) + 1); |
|
542 |
if ((ml |
|
|
543 |
matchLength = ml |
|
|
739 | if ((mlRep >= 4) && (gain2 > gain1)) | |
|
740 | matchLength = mlRep, offset = 0, start = ip; | |
|
544 | 741 | } |
|
545 | { size_t offset2=99999999; | |
|
546 | size_t const ml2 = searchMax(ms, cParams, ip, iend, &offset2); | |
|
742 | if (dictMode == ZSTD_dictMatchState) { | |
|
743 | const U32 repIndex = (U32)(ip - base) - offset_1; | |
|
744 | const BYTE* repMatch = repIndex < prefixLowestIndex ? | |
|
745 | dictBase + (repIndex - dictIndexDelta) : | |
|
746 | base + repIndex; | |
|
747 | if (((U32)((prefixLowestIndex-1) - repIndex) >= 3 /* intentional underflow */) | |
|
748 | && (MEM_read32(repMatch) == MEM_read32(ip)) ) { | |
|
749 | const BYTE* repMatchEnd = repIndex < prefixLowestIndex ? dictEnd : iend; | |
|
750 | size_t const mlRep = ZSTD_count_2segments(ip+4, repMatch+4, iend, repMatchEnd, prefixLowest) + 4; | |
|
751 | int const gain2 = (int)(mlRep * 4); | |
|
752 | int const gain1 = (int)(matchLength*4 - ZSTD_highbit32((U32)offset+1) + 1); | |
|
753 | if ((mlRep >= 4) && (gain2 > gain1)) | |
|
754 | matchLength = mlRep, offset = 0, start = ip; | |
|
755 | } | |
|
756 | } | |
|
757 | { size_t offset2=999999999; | |
|
758 | size_t const ml2 = searchMax(ms, ip, iend, &offset2); | |
|
547 | 759 | int const gain2 = (int)(ml2*4 - ZSTD_highbit32((U32)offset2+1)); /* raw approx */ |
|
548 | 760 | int const gain1 = (int)(matchLength*4 - ZSTD_highbit32((U32)offset+1) + 7); |
|
549 | 761 | if ((ml2 >= 4) && (gain2 > gain1)) { |
@@ -560,9 +772,17 b' size_t ZSTD_compressBlock_lazy_generic(' | |||
|
560 | 772 | */ |
|
561 | 773 | /* catch up */ |
|
562 | 774 | if (offset) { |
|
563 | while ( ((start > anchor) & (start - (offset-ZSTD_REP_MOVE) > base)) | |
|
564 | && (start[-1] == (start-(offset-ZSTD_REP_MOVE))[-1]) ) /* only search for offset within prefix */ | |
|
565 | { start--; matchLength++; } | |
|
775 | if (dictMode == ZSTD_noDict) { | |
|
776 | while ( ((start > anchor) & (start - (offset-ZSTD_REP_MOVE) > prefixLowest)) | |
|
777 | && (start[-1] == (start-(offset-ZSTD_REP_MOVE))[-1]) ) /* only search for offset within prefix */ | |
|
778 | { start--; matchLength++; } | |
|
779 | } | |
|
780 | if (dictMode == ZSTD_dictMatchState) { | |
|
781 | U32 const matchIndex = (U32)((start-base) - (offset - ZSTD_REP_MOVE)); | |
|
782 | const BYTE* match = (matchIndex < prefixLowestIndex) ? dictBase + matchIndex - dictIndexDelta : base + matchIndex; | |
|
783 | const BYTE* const mStart = (matchIndex < prefixLowestIndex) ? dictLowest : prefixLowest; | |
|
784 | while ((start>anchor) && (match>mStart) && (start[-1] == match[-1])) { start--; match--; matchLength++; } /* catch up */ | |
|
785 | } | |
|
566 | 786 | offset_2 = offset_1; offset_1 = (U32)(offset - ZSTD_REP_MOVE); |
|
567 | 787 | } |
|
568 | 788 | /* store sequence */ |
@@ -573,16 +793,39 b' size_t ZSTD_compressBlock_lazy_generic(' | |||
|
573 | 793 | } |
|
574 | 794 | |
|
575 | 795 | /* check immediate repcode */ |
|
576 | while ( ((ip <= ilimit) & (offset_2>0)) | |
|
577 | && (MEM_read32(ip) == MEM_read32(ip - offset_2)) ) { | |
|
578 | /* store sequence */ | |
|
579 | matchLength = ZSTD_count(ip+4, ip+4-offset_2, iend) + 4; | |
|
580 | offset = offset_2; offset_2 = offset_1; offset_1 = (U32)offset; /* swap repcodes */ | |
|
581 | ZSTD_storeSeq(seqStore, 0, anchor, 0, matchLength-MINMATCH); | |
|
582 | ip += matchLength; | |
|
583 | anchor = ip; | |
|
584 | continue; /* faster when present ... (?) */ | |
|
585 | } } | |
|
796 | if (dictMode == ZSTD_dictMatchState) { | |
|
797 | while (ip <= ilimit) { | |
|
798 | U32 const current2 = (U32)(ip-base); | |
|
799 | U32 const repIndex = current2 - offset_2; | |
|
800 | const BYTE* repMatch = dictMode == ZSTD_dictMatchState | |
|
801 | && repIndex < prefixLowestIndex ? | |
|
802 | dictBase - dictIndexDelta + repIndex : | |
|
803 | base + repIndex; | |
|
804 | if ( ((U32)((prefixLowestIndex-1) - (U32)repIndex) >= 3 /* intentional overflow */) | |
|
805 | && (MEM_read32(repMatch) == MEM_read32(ip)) ) { | |
|
806 | const BYTE* const repEnd2 = repIndex < prefixLowestIndex ? dictEnd : iend; | |
|
807 | matchLength = ZSTD_count_2segments(ip+4, repMatch+4, iend, repEnd2, prefixLowest) + 4; | |
|
808 | offset = offset_2; offset_2 = offset_1; offset_1 = (U32)offset; /* swap offset_2 <=> offset_1 */ | |
|
809 | ZSTD_storeSeq(seqStore, 0, anchor, 0, matchLength-MINMATCH); | |
|
810 | ip += matchLength; | |
|
811 | anchor = ip; | |
|
812 | continue; | |
|
813 | } | |
|
814 | break; | |
|
815 | } | |
|
816 | } | |
|
817 | ||
|
818 | if (dictMode == ZSTD_noDict) { | |
|
819 | while ( ((ip <= ilimit) & (offset_2>0)) | |
|
820 | && (MEM_read32(ip) == MEM_read32(ip - offset_2)) ) { | |
|
821 | /* store sequence */ | |
|
822 | matchLength = ZSTD_count(ip+4, ip+4-offset_2, iend) + 4; | |
|
823 | offset = offset_2; offset_2 = offset_1; offset_1 = (U32)offset; /* swap repcodes */ | |
|
824 | ZSTD_storeSeq(seqStore, 0, anchor, 0, matchLength-MINMATCH); | |
|
825 | ip += matchLength; | |
|
826 | anchor = ip; | |
|
827 | continue; /* faster when present ... (?) */ | |
|
828 | } } } | |
|
586 | 829 | |
|
587 | 830 | /* Save reps for next block */ |
|
588 | 831 | rep[0] = offset_1 ? offset_1 : savedOffset; |
@@ -595,30 +838,58 b' size_t ZSTD_compressBlock_lazy_generic(' | |||
|
595 | 838 | |
|
596 | 839 | size_t ZSTD_compressBlock_btlazy2( |
|
597 | 840 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
598 |
|
|
|
841 | void const* src, size_t srcSize) | |
|
599 | 842 | { |
|
600 |
return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, |
|
|
843 | return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, src, srcSize, 1, 2, ZSTD_noDict); | |
|
601 | 844 | } |
|
602 | 845 | |
|
603 | 846 | size_t ZSTD_compressBlock_lazy2( |
|
604 | 847 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
605 |
|
|
|
848 | void const* src, size_t srcSize) | |
|
606 | 849 | { |
|
607 |
return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, |
|
|
850 | return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, src, srcSize, 0, 2, ZSTD_noDict); | |
|
608 | 851 | } |
|
609 | 852 | |
|
610 | 853 | size_t ZSTD_compressBlock_lazy( |
|
611 | 854 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
612 |
|
|
|
855 | void const* src, size_t srcSize) | |
|
613 | 856 | { |
|
614 |
return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, |
|
|
857 | return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, src, srcSize, 0, 1, ZSTD_noDict); | |
|
615 | 858 | } |
|
616 | 859 | |
|
617 | 860 | size_t ZSTD_compressBlock_greedy( |
|
618 | 861 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
619 |
|
|
|
862 | void const* src, size_t srcSize) | |
|
863 | { | |
|
864 | return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, src, srcSize, 0, 0, ZSTD_noDict); | |
|
865 | } | |
|
866 | ||
|
867 | size_t ZSTD_compressBlock_btlazy2_dictMatchState( | |
|
868 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
869 | void const* src, size_t srcSize) | |
|
870 | { | |
|
871 | return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, src, srcSize, 1, 2, ZSTD_dictMatchState); | |
|
872 | } | |
|
873 | ||
|
874 | size_t ZSTD_compressBlock_lazy2_dictMatchState( | |
|
875 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
876 | void const* src, size_t srcSize) | |
|
620 | 877 | { |
|
621 |
return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, |
|
|
878 | return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, src, srcSize, 0, 2, ZSTD_dictMatchState); | |
|
879 | } | |
|
880 | ||
|
881 | size_t ZSTD_compressBlock_lazy_dictMatchState( | |
|
882 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
883 | void const* src, size_t srcSize) | |
|
884 | { | |
|
885 | return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, src, srcSize, 0, 1, ZSTD_dictMatchState); | |
|
886 | } | |
|
887 | ||
|
888 | size_t ZSTD_compressBlock_greedy_dictMatchState( | |
|
889 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
890 | void const* src, size_t srcSize) | |
|
891 | { | |
|
892 | return ZSTD_compressBlock_lazy_generic(ms, seqStore, rep, src, srcSize, 0, 0, ZSTD_dictMatchState); | |
|
622 | 893 | } |
|
623 | 894 | |
|
624 | 895 | |
@@ -626,7 +897,6 b' FORCE_INLINE_TEMPLATE' | |||
|
626 | 897 | size_t ZSTD_compressBlock_lazy_extDict_generic( |
|
627 | 898 | ZSTD_matchState_t* ms, seqStore_t* seqStore, |
|
628 | 899 | U32 rep[ZSTD_REP_NUM], |
|
629 | ZSTD_compressionParameters const* cParams, | |
|
630 | 900 | const void* src, size_t srcSize, |
|
631 | 901 | const U32 searchMethod, const U32 depth) |
|
632 | 902 | { |
@@ -644,9 +914,9 b' size_t ZSTD_compressBlock_lazy_extDict_g' | |||
|
644 | 914 | const BYTE* const dictStart = dictBase + lowestIndex; |
|
645 | 915 | |
|
646 | 916 | typedef size_t (*searchMax_f)( |
|
647 |
ZSTD_matchState_t* ms, |
|
|
917 | ZSTD_matchState_t* ms, | |
|
648 | 918 | const BYTE* ip, const BYTE* iLimit, size_t* offsetPtr); |
|
649 |
searchMax_f searchMax = searchMethod ? ZSTD_BtFindBestMatch_selectMLS |
|
|
919 | searchMax_f searchMax = searchMethod ? ZSTD_BtFindBestMatch_extDict_selectMLS : ZSTD_HcFindBestMatch_extDict_selectMLS; | |
|
650 | 920 | |
|
651 | 921 | U32 offset_1 = rep[0], offset_2 = rep[1]; |
|
652 | 922 | |
@@ -674,8 +944,8 b' size_t ZSTD_compressBlock_lazy_extDict_g' | |||
|
674 | 944 | } } |
|
675 | 945 | |
|
676 | 946 | /* first search (depth 0) */ |
|
677 | { size_t offsetFound = 99999999; | |
|
678 |
size_t const ml2 = searchMax(ms, |
|
|
947 | { size_t offsetFound = 999999999; | |
|
948 | size_t const ml2 = searchMax(ms, ip, iend, &offsetFound); | |
|
679 | 949 | if (ml2 > matchLength) |
|
680 | 950 | matchLength = ml2, start = ip, offset=offsetFound; |
|
681 | 951 | } |
@@ -707,8 +977,8 b' size_t ZSTD_compressBlock_lazy_extDict_g' | |||
|
707 | 977 | } } |
|
708 | 978 | |
|
709 | 979 | /* search match, depth 1 */ |
|
710 | { size_t offset2=99999999; | |
|
711 |
size_t const ml2 = searchMax(ms, |
|
|
980 | { size_t offset2=999999999; | |
|
981 | size_t const ml2 = searchMax(ms, ip, iend, &offset2); | |
|
712 | 982 | int const gain2 = (int)(ml2*4 - ZSTD_highbit32((U32)offset2+1)); /* raw approx */ |
|
713 | 983 | int const gain1 = (int)(matchLength*4 - ZSTD_highbit32((U32)offset+1) + 4); |
|
714 | 984 | if ((ml2 >= 4) && (gain2 > gain1)) { |
@@ -737,8 +1007,8 b' size_t ZSTD_compressBlock_lazy_extDict_g' | |||
|
737 | 1007 | } } |
|
738 | 1008 | |
|
739 | 1009 | /* search match, depth 2 */ |
|
740 | { size_t offset2=99999999; | |
|
741 |
size_t const ml2 = searchMax(ms, |
|
|
1010 | { size_t offset2=999999999; | |
|
1011 | size_t const ml2 = searchMax(ms, ip, iend, &offset2); | |
|
742 | 1012 | int const gain2 = (int)(ml2*4 - ZSTD_highbit32((U32)offset2+1)); /* raw approx */ |
|
743 | 1013 | int const gain1 = (int)(matchLength*4 - ZSTD_highbit32((U32)offset+1) + 7); |
|
744 | 1014 | if ((ml2 >= 4) && (gain2 > gain1)) { |
@@ -794,31 +1064,31 b' size_t ZSTD_compressBlock_lazy_extDict_g' | |||
|
794 | 1064 | |
|
795 | 1065 | size_t ZSTD_compressBlock_greedy_extDict( |
|
796 | 1066 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
797 |
|
|
|
1067 | void const* src, size_t srcSize) | |
|
798 | 1068 | { |
|
799 |
return ZSTD_compressBlock_lazy_extDict_generic(ms, seqStore, rep, |
|
|
1069 | return ZSTD_compressBlock_lazy_extDict_generic(ms, seqStore, rep, src, srcSize, 0, 0); | |
|
800 | 1070 | } |
|
801 | 1071 | |
|
802 | 1072 | size_t ZSTD_compressBlock_lazy_extDict( |
|
803 | 1073 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
804 |
|
|
|
1074 | void const* src, size_t srcSize) | |
|
805 | 1075 | |
|
806 | 1076 | { |
|
807 |
return ZSTD_compressBlock_lazy_extDict_generic(ms, seqStore, rep, |
|
|
1077 | return ZSTD_compressBlock_lazy_extDict_generic(ms, seqStore, rep, src, srcSize, 0, 1); | |
|
808 | 1078 | } |
|
809 | 1079 | |
|
810 | 1080 | size_t ZSTD_compressBlock_lazy2_extDict( |
|
811 | 1081 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
812 |
|
|
|
1082 | void const* src, size_t srcSize) | |
|
813 | 1083 | |
|
814 | 1084 | { |
|
815 |
return ZSTD_compressBlock_lazy_extDict_generic(ms, seqStore, rep, |
|
|
1085 | return ZSTD_compressBlock_lazy_extDict_generic(ms, seqStore, rep, src, srcSize, 0, 2); | |
|
816 | 1086 | } |
|
817 | 1087 | |
|
818 | 1088 | size_t ZSTD_compressBlock_btlazy2_extDict( |
|
819 | 1089 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
820 |
|
|
|
1090 | void const* src, size_t srcSize) | |
|
821 | 1091 | |
|
822 | 1092 | { |
|
823 |
return ZSTD_compressBlock_lazy_extDict_generic(ms, seqStore, rep, |
|
|
1093 | return ZSTD_compressBlock_lazy_extDict_generic(ms, seqStore, rep, src, srcSize, 1, 2); | |
|
824 | 1094 | } |
@@ -17,37 +17,48 b' extern "C" {' | |||
|
17 | 17 | |
|
18 | 18 | #include "zstd_compress_internal.h" |
|
19 | 19 | |
|
20 | U32 ZSTD_insertAndFindFirstIndex( | |
|
21 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
22 | const BYTE* ip); | |
|
20 | U32 ZSTD_insertAndFindFirstIndex(ZSTD_matchState_t* ms, const BYTE* ip); | |
|
23 | 21 | |
|
24 | 22 | void ZSTD_preserveUnsortedMark (U32* const table, U32 const size, U32 const reducerValue); /*! used in ZSTD_reduceIndex(). pre-emptively increase value of ZSTD_DUBT_UNSORTED_MARK */ |
|
25 | 23 | |
|
26 | 24 | size_t ZSTD_compressBlock_btlazy2( |
|
27 | 25 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
28 |
|
|
|
26 | void const* src, size_t srcSize); | |
|
29 | 27 | size_t ZSTD_compressBlock_lazy2( |
|
30 | 28 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
31 |
|
|
|
29 | void const* src, size_t srcSize); | |
|
32 | 30 | size_t ZSTD_compressBlock_lazy( |
|
33 | 31 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
34 |
|
|
|
32 | void const* src, size_t srcSize); | |
|
35 | 33 | size_t ZSTD_compressBlock_greedy( |
|
36 | 34 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
37 |
|
|
|
35 | void const* src, size_t srcSize); | |
|
36 | ||
|
37 | size_t ZSTD_compressBlock_btlazy2_dictMatchState( | |
|
38 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
39 | void const* src, size_t srcSize); | |
|
40 | size_t ZSTD_compressBlock_lazy2_dictMatchState( | |
|
41 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
42 | void const* src, size_t srcSize); | |
|
43 | size_t ZSTD_compressBlock_lazy_dictMatchState( | |
|
44 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
45 | void const* src, size_t srcSize); | |
|
46 | size_t ZSTD_compressBlock_greedy_dictMatchState( | |
|
47 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
48 | void const* src, size_t srcSize); | |
|
38 | 49 | |
|
39 | 50 | size_t ZSTD_compressBlock_greedy_extDict( |
|
40 | 51 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
41 |
|
|
|
52 | void const* src, size_t srcSize); | |
|
42 | 53 | size_t ZSTD_compressBlock_lazy_extDict( |
|
43 | 54 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
44 |
|
|
|
55 | void const* src, size_t srcSize); | |
|
45 | 56 | size_t ZSTD_compressBlock_lazy2_extDict( |
|
46 | 57 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
47 |
|
|
|
58 | void const* src, size_t srcSize); | |
|
48 | 59 | size_t ZSTD_compressBlock_btlazy2_extDict( |
|
49 | 60 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
50 |
|
|
|
61 | void const* src, size_t srcSize); | |
|
51 | 62 | |
|
52 | 63 | #if defined (__cplusplus) |
|
53 | 64 | } |
@@ -9,6 +9,7 b'' | |||
|
9 | 9 | |
|
10 | 10 | #include "zstd_ldm.h" |
|
11 | 11 | |
|
12 | #include "debug.h" | |
|
12 | 13 | #include "zstd_fast.h" /* ZSTD_fillHashTable() */ |
|
13 | 14 | #include "zstd_double_fast.h" /* ZSTD_fillDoubleHashTable() */ |
|
14 | 15 | |
@@ -20,7 +21,7 b'' | |||
|
20 | 21 | void ZSTD_ldm_adjustParameters(ldmParams_t* params, |
|
21 | 22 | ZSTD_compressionParameters const* cParams) |
|
22 | 23 | { |
|
23 |
|
|
|
24 | params->windowLog = cParams->windowLog; | |
|
24 | 25 | ZSTD_STATIC_ASSERT(LDM_BUCKET_SIZE_LOG <= ZSTD_LDM_BUCKETSIZELOG_MAX); |
|
25 | 26 | DEBUGLOG(4, "ZSTD_ldm_adjustParameters"); |
|
26 | 27 | if (!params->bucketSizeLog) params->bucketSizeLog = LDM_BUCKET_SIZE_LOG; |
@@ -33,12 +34,13 b' void ZSTD_ldm_adjustParameters(ldmParams' | |||
|
33 | 34 | params->minMatchLength = minMatch; |
|
34 | 35 | } |
|
35 | 36 | if (params->hashLog == 0) { |
|
36 | params->hashLog = MAX(ZSTD_HASHLOG_MIN, windowLog - LDM_HASH_RLOG); | |
|
37 | params->hashLog = MAX(ZSTD_HASHLOG_MIN, params->windowLog - LDM_HASH_RLOG); | |
|
37 | 38 | assert(params->hashLog <= ZSTD_HASHLOG_MAX); |
|
38 | 39 | } |
|
39 | 40 | if (params->hashEveryLog == 0) { |
|
40 | params->hashEveryLog = | |
|
41 | windowLog < params->hashLog ? 0 : windowLog - params->hashLog; | |
|
41 | params->hashEveryLog = params->windowLog < params->hashLog | |
|
42 | ? 0 | |
|
43 | : params->windowLog - params->hashLog; | |
|
42 | 44 | } |
|
43 | 45 | params->bucketSizeLog = MIN(params->bucketSizeLog, params->hashLog); |
|
44 | 46 | } |
@@ -216,21 +218,18 b' static size_t ZSTD_ldm_countBackwardsMat' | |||
|
216 | 218 | * The tables for the other strategies are filled within their |
|
217 | 219 | * block compressors. */ |
|
218 | 220 | static size_t ZSTD_ldm_fillFastTables(ZSTD_matchState_t* ms, |
|
219 | ZSTD_compressionParameters const* cParams, | |
|
220 | 221 | void const* end) |
|
221 | 222 | { |
|
222 | 223 | const BYTE* const iend = (const BYTE*)end; |
|
223 | 224 | |
|
224 |
switch( |
|
|
225 | switch(ms->cParams.strategy) | |
|
225 | 226 | { |
|
226 | 227 | case ZSTD_fast: |
|
227 |
ZSTD_fillHashTable(ms, |
|
|
228 | ms->nextToUpdate = (U32)(iend - ms->window.base); | |
|
228 | ZSTD_fillHashTable(ms, iend, ZSTD_dtlm_fast); | |
|
229 | 229 | break; |
|
230 | 230 | |
|
231 | 231 | case ZSTD_dfast: |
|
232 |
ZSTD_fillDoubleHashTable(ms, |
|
|
233 | ms->nextToUpdate = (U32)(iend - ms->window.base); | |
|
232 | ZSTD_fillDoubleHashTable(ms, iend, ZSTD_dtlm_fast); | |
|
234 | 233 | break; |
|
235 | 234 | |
|
236 | 235 | case ZSTD_greedy: |
@@ -508,7 +507,7 b' size_t ZSTD_ldm_generateSequences(' | |||
|
508 | 507 | * * Try invalidation after the sequence generation and test the |
|
509 | 508 | * the offset against maxDist directly. |
|
510 | 509 | */ |
|
511 | ZSTD_window_enforceMaxDist(&ldmState->window, chunkEnd, maxDist, NULL); | |
|
510 | ZSTD_window_enforceMaxDist(&ldmState->window, chunkEnd, maxDist, NULL, NULL); | |
|
512 | 511 | /* 3. Generate the sequences for the chunk, and get newLeftoverSize. */ |
|
513 | 512 | newLeftoverSize = ZSTD_ldm_generateSequences_internal( |
|
514 | 513 | ldmState, sequences, params, chunkStart, chunkSize); |
@@ -591,19 +590,19 b' static rawSeq maybeSplitSequence(rawSeqS' | |||
|
591 | 590 | |
|
592 | 591 | size_t ZSTD_ldm_blockCompress(rawSeqStore_t* rawSeqStore, |
|
593 | 592 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
594 |
|
|
|
595 | int const extDict) | |
|
593 | void const* src, size_t srcSize) | |
|
596 | 594 | { |
|
595 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
597 | 596 | unsigned const minMatch = cParams->searchLength; |
|
598 | 597 | ZSTD_blockCompressor const blockCompressor = |
|
599 |
ZSTD_selectBlockCompressor(cParams->strategy, |
|
|
600 | BYTE const* const base = ms->window.base; | |
|
598 | ZSTD_selectBlockCompressor(cParams->strategy, ZSTD_matchState_dictMode(ms)); | |
|
601 | 599 | /* Input bounds */ |
|
602 | 600 | BYTE const* const istart = (BYTE const*)src; |
|
603 | 601 | BYTE const* const iend = istart + srcSize; |
|
604 | 602 | /* Input positions */ |
|
605 | 603 | BYTE const* ip = istart; |
|
606 | 604 | |
|
605 | DEBUGLOG(5, "ZSTD_ldm_blockCompress: srcSize=%zu", srcSize); | |
|
607 | 606 | assert(rawSeqStore->pos <= rawSeqStore->size); |
|
608 | 607 | assert(rawSeqStore->size <= rawSeqStore->capacity); |
|
609 | 608 | /* Loop through each sequence and apply the block compressor to the lits */ |
@@ -621,14 +620,13 b' size_t ZSTD_ldm_blockCompress(rawSeqStor' | |||
|
621 | 620 | |
|
622 | 621 | /* Fill tables for block compressor */ |
|
623 | 622 | ZSTD_ldm_limitTableUpdate(ms, ip); |
|
624 |
ZSTD_ldm_fillFastTables(ms, |
|
|
623 | ZSTD_ldm_fillFastTables(ms, ip); | |
|
625 | 624 | /* Run the block compressor */ |
|
625 | DEBUGLOG(5, "calling block compressor on segment of size %u", sequence.litLength); | |
|
626 | 626 | { |
|
627 | 627 | size_t const newLitLength = |
|
628 |
blockCompressor(ms, seqStore, rep, |
|
|
629 | sequence.litLength); | |
|
628 | blockCompressor(ms, seqStore, rep, ip, sequence.litLength); | |
|
630 | 629 | ip += sequence.litLength; |
|
631 | ms->nextToUpdate = (U32)(ip - base); | |
|
632 | 630 | /* Update the repcodes */ |
|
633 | 631 | for (i = ZSTD_REP_NUM - 1; i > 0; i--) |
|
634 | 632 | rep[i] = rep[i-1]; |
@@ -642,12 +640,7 b' size_t ZSTD_ldm_blockCompress(rawSeqStor' | |||
|
642 | 640 | } |
|
643 | 641 | /* Fill the tables for the block compressor */ |
|
644 | 642 | ZSTD_ldm_limitTableUpdate(ms, ip); |
|
645 |
ZSTD_ldm_fillFastTables(ms, |
|
|
643 | ZSTD_ldm_fillFastTables(ms, ip); | |
|
646 | 644 | /* Compress the last literals */ |
|
647 | { | |
|
648 | size_t const lastLiterals = blockCompressor(ms, seqStore, rep, cParams, | |
|
649 | ip, iend - ip); | |
|
650 | ms->nextToUpdate = (U32)(iend - base); | |
|
651 | return lastLiterals; | |
|
652 | } | |
|
645 | return blockCompressor(ms, seqStore, rep, ip, iend - ip); | |
|
653 | 646 | } |
@@ -61,9 +61,7 b' size_t ZSTD_ldm_generateSequences(' | |||
|
61 | 61 | */ |
|
62 | 62 | size_t ZSTD_ldm_blockCompress(rawSeqStore_t* rawSeqStore, |
|
63 | 63 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
64 | ZSTD_compressionParameters const* cParams, | |
|
65 | void const* src, size_t srcSize, | |
|
66 | int const extDict); | |
|
64 | void const* src, size_t srcSize); | |
|
67 | 65 | |
|
68 | 66 | /** |
|
69 | 67 | * ZSTD_ldm_skipSequences(): |
This diff has been collapsed as it changes many lines, (813 lines changed) Show them Hide them | |||
@@ -9,10 +9,11 b'' | |||
|
9 | 9 | */ |
|
10 | 10 | |
|
11 | 11 | #include "zstd_compress_internal.h" |
|
12 | #include "hist.h" | |
|
12 | 13 | #include "zstd_opt.h" |
|
13 | 14 | |
|
14 | 15 | |
|
15 |
#define ZSTD_LITFREQ_ADD 2 /* scaling factor for litFreq, so that frequencies adapt faster to new stats |
|
|
16 | #define ZSTD_LITFREQ_ADD 2 /* scaling factor for litFreq, so that frequencies adapt faster to new stats */ | |
|
16 | 17 | #define ZSTD_FREQ_DIV 4 /* log factor when using previous stats to init next stats */ |
|
17 | 18 | #define ZSTD_MAX_PRICE (1<<30) |
|
18 | 19 | |
@@ -20,128 +21,210 b'' | |||
|
20 | 21 | /*-************************************* |
|
21 | 22 | * Price functions for optimal parser |
|
22 | 23 | ***************************************/ |
|
23 | static void ZSTD_setLog2Prices(optState_t* optPtr) | |
|
24 | ||
|
25 | #if 0 /* approximation at bit level */ | |
|
26 | # define BITCOST_ACCURACY 0 | |
|
27 | # define BITCOST_MULTIPLIER (1 << BITCOST_ACCURACY) | |
|
28 | # define WEIGHT(stat) ((void)opt, ZSTD_bitWeight(stat)) | |
|
29 | #elif 0 /* fractional bit accuracy */ | |
|
30 | # define BITCOST_ACCURACY 8 | |
|
31 | # define BITCOST_MULTIPLIER (1 << BITCOST_ACCURACY) | |
|
32 | # define WEIGHT(stat,opt) ((void)opt, ZSTD_fracWeight(stat)) | |
|
33 | #else /* opt==approx, ultra==accurate */ | |
|
34 | # define BITCOST_ACCURACY 8 | |
|
35 | # define BITCOST_MULTIPLIER (1 << BITCOST_ACCURACY) | |
|
36 | # define WEIGHT(stat,opt) (opt ? ZSTD_fracWeight(stat) : ZSTD_bitWeight(stat)) | |
|
37 | #endif | |
|
38 | ||
|
39 | MEM_STATIC U32 ZSTD_bitWeight(U32 stat) | |
|
40 | { | |
|
41 | return (ZSTD_highbit32(stat+1) * BITCOST_MULTIPLIER); | |
|
42 | } | |
|
43 | ||
|
44 | MEM_STATIC U32 ZSTD_fracWeight(U32 rawStat) | |
|
24 | 45 | { |
|
25 | optPtr->log2litSum = ZSTD_highbit32(optPtr->litSum+1); | |
|
26 | optPtr->log2litLengthSum = ZSTD_highbit32(optPtr->litLengthSum+1); | |
|
27 | optPtr->log2matchLengthSum = ZSTD_highbit32(optPtr->matchLengthSum+1); | |
|
28 | optPtr->log2offCodeSum = ZSTD_highbit32(optPtr->offCodeSum+1); | |
|
46 | U32 const stat = rawStat + 1; | |
|
47 | U32 const hb = ZSTD_highbit32(stat); | |
|
48 | U32 const BWeight = hb * BITCOST_MULTIPLIER; | |
|
49 | U32 const FWeight = (stat << BITCOST_ACCURACY) >> hb; | |
|
50 | U32 const weight = BWeight + FWeight; | |
|
51 | assert(hb + BITCOST_ACCURACY < 31); | |
|
52 | return weight; | |
|
53 | } | |
|
54 | ||
|
55 | /* debugging function, @return price in bytes */ | |
|
56 | MEM_STATIC double ZSTD_fCost(U32 price) | |
|
57 | { | |
|
58 | return (double)price / (BITCOST_MULTIPLIER*8); | |
|
59 | } | |
|
60 | ||
|
61 | static void ZSTD_setBasePrices(optState_t* optPtr, int optLevel) | |
|
62 | { | |
|
63 | optPtr->litSumBasePrice = WEIGHT(optPtr->litSum, optLevel); | |
|
64 | optPtr->litLengthSumBasePrice = WEIGHT(optPtr->litLengthSum, optLevel); | |
|
65 | optPtr->matchLengthSumBasePrice = WEIGHT(optPtr->matchLengthSum, optLevel); | |
|
66 | optPtr->offCodeSumBasePrice = WEIGHT(optPtr->offCodeSum, optLevel); | |
|
29 | 67 | } |
|
30 | 68 | |
|
31 | 69 | |
|
70 | static U32 ZSTD_downscaleStat(U32* table, U32 lastEltIndex, int malus) | |
|
71 | { | |
|
72 | U32 s, sum=0; | |
|
73 | assert(ZSTD_FREQ_DIV+malus > 0 && ZSTD_FREQ_DIV+malus < 31); | |
|
74 | for (s=0; s<=lastEltIndex; s++) { | |
|
75 | table[s] = 1 + (table[s] >> (ZSTD_FREQ_DIV+malus)); | |
|
76 | sum += table[s]; | |
|
77 | } | |
|
78 | return sum; | |
|
79 | } | |
|
80 | ||
|
32 | 81 | static void ZSTD_rescaleFreqs(optState_t* const optPtr, |
|
33 |
const BYTE* const src, size_t const srcSize |
|
|
82 | const BYTE* const src, size_t const srcSize, | |
|
83 | int optLevel) | |
|
34 | 84 | { |
|
35 |
optPtr-> |
|
|
85 | optPtr->priceType = zop_dynamic; | |
|
86 | ||
|
87 | if (optPtr->litLengthSum == 0) { /* first block : init */ | |
|
88 | if (srcSize <= 1024) /* heuristic */ | |
|
89 | optPtr->priceType = zop_predef; | |
|
90 | ||
|
91 | assert(optPtr->symbolCosts != NULL); | |
|
92 | if (optPtr->symbolCosts->huf.repeatMode == HUF_repeat_valid) { /* huffman table presumed generated by dictionary */ | |
|
93 | optPtr->priceType = zop_dynamic; | |
|
36 | 94 | |
|
37 | if (optPtr->litLengthSum == 0) { /* first init */ | |
|
38 | unsigned u; | |
|
39 | if (srcSize <= 1024) optPtr->staticPrices = 1; | |
|
95 | assert(optPtr->litFreq != NULL); | |
|
96 | optPtr->litSum = 0; | |
|
97 | { unsigned lit; | |
|
98 | for (lit=0; lit<=MaxLit; lit++) { | |
|
99 | U32 const scaleLog = 11; /* scale to 2K */ | |
|
100 | U32 const bitCost = HUF_getNbBits(optPtr->symbolCosts->huf.CTable, lit); | |
|
101 | assert(bitCost <= scaleLog); | |
|
102 | optPtr->litFreq[lit] = bitCost ? 1 << (scaleLog-bitCost) : 1 /*minimum to calculate cost*/; | |
|
103 | optPtr->litSum += optPtr->litFreq[lit]; | |
|
104 | } } | |
|
105 | ||
|
106 | { unsigned ll; | |
|
107 | FSE_CState_t llstate; | |
|
108 | FSE_initCState(&llstate, optPtr->symbolCosts->fse.litlengthCTable); | |
|
109 | optPtr->litLengthSum = 0; | |
|
110 | for (ll=0; ll<=MaxLL; ll++) { | |
|
111 | U32 const scaleLog = 10; /* scale to 1K */ | |
|
112 | U32 const bitCost = FSE_getMaxNbBits(llstate.symbolTT, ll); | |
|
113 | assert(bitCost < scaleLog); | |
|
114 | optPtr->litLengthFreq[ll] = bitCost ? 1 << (scaleLog-bitCost) : 1 /*minimum to calculate cost*/; | |
|
115 | optPtr->litLengthSum += optPtr->litLengthFreq[ll]; | |
|
116 | } } | |
|
40 | 117 | |
|
41 | assert(optPtr->litFreq!=NULL); | |
|
42 | for (u=0; u<=MaxLit; u++) | |
|
43 | optPtr->litFreq[u] = 0; | |
|
44 | for (u=0; u<srcSize; u++) | |
|
45 | optPtr->litFreq[src[u]]++; | |
|
46 | optPtr->litSum = 0; | |
|
47 | for (u=0; u<=MaxLit; u++) { | |
|
48 | optPtr->litFreq[u] = 1 + (optPtr->litFreq[u] >> ZSTD_FREQ_DIV); | |
|
49 | optPtr->litSum += optPtr->litFreq[u]; | |
|
118 | { unsigned ml; | |
|
119 | FSE_CState_t mlstate; | |
|
120 | FSE_initCState(&mlstate, optPtr->symbolCosts->fse.matchlengthCTable); | |
|
121 | optPtr->matchLengthSum = 0; | |
|
122 | for (ml=0; ml<=MaxML; ml++) { | |
|
123 | U32 const scaleLog = 10; | |
|
124 | U32 const bitCost = FSE_getMaxNbBits(mlstate.symbolTT, ml); | |
|
125 | assert(bitCost < scaleLog); | |
|
126 | optPtr->matchLengthFreq[ml] = bitCost ? 1 << (scaleLog-bitCost) : 1 /*minimum to calculate cost*/; | |
|
127 | optPtr->matchLengthSum += optPtr->matchLengthFreq[ml]; | |
|
128 | } } | |
|
129 | ||
|
130 | { unsigned of; | |
|
131 | FSE_CState_t ofstate; | |
|
132 | FSE_initCState(&ofstate, optPtr->symbolCosts->fse.offcodeCTable); | |
|
133 | optPtr->offCodeSum = 0; | |
|
134 | for (of=0; of<=MaxOff; of++) { | |
|
135 | U32 const scaleLog = 10; | |
|
136 | U32 const bitCost = FSE_getMaxNbBits(ofstate.symbolTT, of); | |
|
137 | assert(bitCost < scaleLog); | |
|
138 | optPtr->offCodeFreq[of] = bitCost ? 1 << (scaleLog-bitCost) : 1 /*minimum to calculate cost*/; | |
|
139 | optPtr->offCodeSum += optPtr->offCodeFreq[of]; | |
|
140 | } } | |
|
141 | ||
|
142 | } else { /* not a dictionary */ | |
|
143 | ||
|
144 | assert(optPtr->litFreq != NULL); | |
|
145 | { unsigned lit = MaxLit; | |
|
146 | HIST_count_simple(optPtr->litFreq, &lit, src, srcSize); /* use raw first block to init statistics */ | |
|
147 | } | |
|
148 | optPtr->litSum = ZSTD_downscaleStat(optPtr->litFreq, MaxLit, 1); | |
|
149 | ||
|
150 | { unsigned ll; | |
|
151 | for (ll=0; ll<=MaxLL; ll++) | |
|
152 | optPtr->litLengthFreq[ll] = 1; | |
|
153 | } | |
|
154 | optPtr->litLengthSum = MaxLL+1; | |
|
155 | ||
|
156 | { unsigned ml; | |
|
157 | for (ml=0; ml<=MaxML; ml++) | |
|
158 | optPtr->matchLengthFreq[ml] = 1; | |
|
159 | } | |
|
160 | optPtr->matchLengthSum = MaxML+1; | |
|
161 | ||
|
162 | { unsigned of; | |
|
163 | for (of=0; of<=MaxOff; of++) | |
|
164 | optPtr->offCodeFreq[of] = 1; | |
|
165 | } | |
|
166 | optPtr->offCodeSum = MaxOff+1; | |
|
167 | ||
|
50 | 168 | } |
|
51 | 169 | |
|
52 | for (u=0; u<=MaxLL; u++) | |
|
53 | optPtr->litLengthFreq[u] = 1; | |
|
54 | optPtr->litLengthSum = MaxLL+1; | |
|
55 | for (u=0; u<=MaxML; u++) | |
|
56 | optPtr->matchLengthFreq[u] = 1; | |
|
57 | optPtr->matchLengthSum = MaxML+1; | |
|
58 | for (u=0; u<=MaxOff; u++) | |
|
59 | optPtr->offCodeFreq[u] = 1; | |
|
60 | optPtr->offCodeSum = (MaxOff+1); | |
|
61 | ||
|
62 | } else { | |
|
63 | unsigned u; | |
|
170 | } else { /* new block : re-use previous statistics, scaled down */ | |
|
64 | 171 | |
|
65 | optPtr->litSum = 0; | |
|
66 | for (u=0; u<=MaxLit; u++) { | |
|
67 | optPtr->litFreq[u] = 1 + (optPtr->litFreq[u] >> (ZSTD_FREQ_DIV+1)); | |
|
68 | optPtr->litSum += optPtr->litFreq[u]; | |
|
69 | } | |
|
70 | optPtr->litLengthSum = 0; | |
|
71 | for (u=0; u<=MaxLL; u++) { | |
|
72 | optPtr->litLengthFreq[u] = 1 + (optPtr->litLengthFreq[u]>>(ZSTD_FREQ_DIV+1)); | |
|
73 | optPtr->litLengthSum += optPtr->litLengthFreq[u]; | |
|
74 | } | |
|
75 | optPtr->matchLengthSum = 0; | |
|
76 | for (u=0; u<=MaxML; u++) { | |
|
77 | optPtr->matchLengthFreq[u] = 1 + (optPtr->matchLengthFreq[u]>>ZSTD_FREQ_DIV); | |
|
78 | optPtr->matchLengthSum += optPtr->matchLengthFreq[u]; | |
|
79 | } | |
|
80 | optPtr->offCodeSum = 0; | |
|
81 | for (u=0; u<=MaxOff; u++) { | |
|
82 | optPtr->offCodeFreq[u] = 1 + (optPtr->offCodeFreq[u]>>ZSTD_FREQ_DIV); | |
|
83 | optPtr->offCodeSum += optPtr->offCodeFreq[u]; | |
|
84 | } | |
|
172 | optPtr->litSum = ZSTD_downscaleStat(optPtr->litFreq, MaxLit, 1); | |
|
173 | optPtr->litLengthSum = ZSTD_downscaleStat(optPtr->litLengthFreq, MaxLL, 0); | |
|
174 | optPtr->matchLengthSum = ZSTD_downscaleStat(optPtr->matchLengthFreq, MaxML, 0); | |
|
175 | optPtr->offCodeSum = ZSTD_downscaleStat(optPtr->offCodeFreq, MaxOff, 0); | |
|
85 | 176 | } |
|
86 | 177 | |
|
87 |
ZSTD_set |
|
|
178 | ZSTD_setBasePrices(optPtr, optLevel); | |
|
88 | 179 | } |
|
89 | 180 | |
|
90 | ||
|
91 | 181 | /* ZSTD_rawLiteralsCost() : |
|
92 |
* |
|
|
93 |
* does not include |
|
|
182 | * price of literals (only) in specified segment (which length can be 0). | |
|
183 | * does not include price of literalLength symbol */ | |
|
94 | 184 | static U32 ZSTD_rawLiteralsCost(const BYTE* const literals, U32 const litLength, |
|
95 |
const optState_t* const optPtr |
|
|
185 | const optState_t* const optPtr, | |
|
186 | int optLevel) | |
|
96 | 187 | { |
|
97 | if (optPtr->staticPrices) return (litLength*6); /* 6 bit per literal - no statistic used */ | |
|
98 | 188 | if (litLength == 0) return 0; |
|
189 | if (optPtr->priceType == zop_predef) | |
|
190 | return (litLength*6) * BITCOST_MULTIPLIER; /* 6 bit per literal - no statistic used */ | |
|
99 | 191 | |
|
100 |
/* |
|
|
101 | { U32 u; | |
|
102 | U32 cost = litLength * optPtr->log2litSum; | |
|
103 | for (u=0; u < litLength; u++) | |
|
104 | cost -= ZSTD_highbit32(optPtr->litFreq[literals[u]]+1); | |
|
105 | return cost; | |
|
192 | /* dynamic statistics */ | |
|
193 | { U32 price = litLength * optPtr->litSumBasePrice; | |
|
194 | U32 u; | |
|
195 | for (u=0; u < litLength; u++) { | |
|
196 | assert(WEIGHT(optPtr->litFreq[literals[u]], optLevel) <= optPtr->litSumBasePrice); /* literal cost should never be negative */ | |
|
197 | price -= WEIGHT(optPtr->litFreq[literals[u]], optLevel); | |
|
198 | } | |
|
199 | return price; | |
|
106 | 200 | } |
|
107 | 201 | } |
|
108 | 202 | |
|
109 | 203 | /* ZSTD_litLengthPrice() : |
|
110 | 204 | * cost of literalLength symbol */ |
|
111 | static U32 ZSTD_litLengthPrice(U32 const litLength, const optState_t* const optPtr) | |
|
205 | static U32 ZSTD_litLengthPrice(U32 const litLength, const optState_t* const optPtr, int optLevel) | |
|
112 | 206 | { |
|
113 | if (optPtr->staticPrices) return ZSTD_highbit32((U32)litLength+1); | |
|
207 | if (optPtr->priceType == zop_predef) return WEIGHT(litLength, optLevel); | |
|
114 | 208 | |
|
115 | /* literal Length */ | |
|
209 | /* dynamic statistics */ | |
|
116 | 210 | { U32 const llCode = ZSTD_LLcode(litLength); |
|
117 |
|
|
|
118 | return price; | |
|
211 | return (LL_bits[llCode] * BITCOST_MULTIPLIER) + (optPtr->litLengthSumBasePrice - WEIGHT(optPtr->litLengthFreq[llCode], optLevel)); | |
|
119 | 212 | } |
|
120 | 213 | } |
|
121 | 214 | |
|
122 | /* ZSTD_litLengthPrice() : | |
|
123 | * cost of the literal part of a sequence, | |
|
124 | * including literals themselves, and literalLength symbol */ | |
|
125 | static U32 ZSTD_fullLiteralsCost(const BYTE* const literals, U32 const litLength, | |
|
126 | const optState_t* const optPtr) | |
|
127 | { | |
|
128 | return ZSTD_rawLiteralsCost(literals, litLength, optPtr) | |
|
129 | + ZSTD_litLengthPrice(litLength, optPtr); | |
|
130 | } | |
|
131 | ||
|
132 | 215 | /* ZSTD_litLengthContribution() : |
|
133 | 216 | * @return ( cost(litlength) - cost(0) ) |
|
134 | 217 | * this value can then be added to rawLiteralsCost() |
|
135 | 218 | * to provide a cost which is directly comparable to a match ending at same position */ |
|
136 | static int ZSTD_litLengthContribution(U32 const litLength, const optState_t* const optPtr) | |
|
219 | static int ZSTD_litLengthContribution(U32 const litLength, const optState_t* const optPtr, int optLevel) | |
|
137 | 220 | { |
|
138 | if (optPtr->staticPrices) return ZSTD_highbit32(litLength+1); | |
|
221 | if (optPtr->priceType >= zop_predef) return WEIGHT(litLength, optLevel); | |
|
139 | 222 | |
|
140 | /* literal Length */ | |
|
223 | /* dynamic statistics */ | |
|
141 | 224 | { U32 const llCode = ZSTD_LLcode(litLength); |
|
142 | int const contribution = LL_bits[llCode] | |
|
143 | + ZSTD_highbit32(optPtr->litLengthFreq[0]+1) | |
|
144 |
- |
|
|
225 | int const contribution = (LL_bits[llCode] * BITCOST_MULTIPLIER) | |
|
226 | + WEIGHT(optPtr->litLengthFreq[0], optLevel) /* note: log2litLengthSum cancel out */ | |
|
227 | - WEIGHT(optPtr->litLengthFreq[llCode], optLevel); | |
|
145 | 228 | #if 1 |
|
146 | 229 | return contribution; |
|
147 | 230 | #else |
@@ -155,10 +238,11 b' static int ZSTD_litLengthContribution(U3' | |||
|
155 | 238 | * which can be compared to the ending cost of a match |
|
156 | 239 | * should a new match start at this position */ |
|
157 | 240 | static int ZSTD_literalsContribution(const BYTE* const literals, U32 const litLength, |
|
158 |
const optState_t* const optPtr |
|
|
241 | const optState_t* const optPtr, | |
|
242 | int optLevel) | |
|
159 | 243 | { |
|
160 | int const contribution = ZSTD_rawLiteralsCost(literals, litLength, optPtr) | |
|
161 | + ZSTD_litLengthContribution(litLength, optPtr); | |
|
244 | int const contribution = ZSTD_rawLiteralsCost(literals, litLength, optPtr, optLevel) | |
|
245 | + ZSTD_litLengthContribution(litLength, optPtr, optLevel); | |
|
162 | 246 | return contribution; |
|
163 | 247 | } |
|
164 | 248 | |
@@ -166,31 +250,38 b' static int ZSTD_literalsContribution(con' | |||
|
166 | 250 | * Provides the cost of the match part (offset + matchLength) of a sequence |
|
167 | 251 | * Must be combined with ZSTD_fullLiteralsCost() to get the full cost of a sequence. |
|
168 | 252 | * optLevel: when <2, favors small offset for decompression speed (improved cache efficiency) */ |
|
169 |
FORCE_INLINE_TEMPLATE U32 |
|
|
170 | U32 const offset, U32 const matchLength, | |
|
171 | const optState_t* const optPtr, | |
|
172 | int const optLevel) | |
|
253 | FORCE_INLINE_TEMPLATE U32 | |
|
254 | ZSTD_getMatchPrice(U32 const offset, | |
|
255 | U32 const matchLength, | |
|
256 | const optState_t* const optPtr, | |
|
257 | int const optLevel) | |
|
173 | 258 | { |
|
174 | 259 | U32 price; |
|
175 | 260 | U32 const offCode = ZSTD_highbit32(offset+1); |
|
176 | 261 | U32 const mlBase = matchLength - MINMATCH; |
|
177 | 262 | assert(matchLength >= MINMATCH); |
|
178 | 263 | |
|
179 |
if (optPtr-> |
|
|
180 | return ZSTD_highbit32((U32)mlBase+1) + 16 + offCode; | |
|
264 | if (optPtr->priceType == zop_predef) /* fixed scheme, do not use statistics */ | |
|
265 | return WEIGHT(mlBase, optLevel) + ((16 + offCode) * BITCOST_MULTIPLIER); | |
|
181 | 266 | |
|
182 | price = offCode + optPtr->log2offCodeSum - ZSTD_highbit32(optPtr->offCodeFreq[offCode]+1); | |
|
183 | if ((optLevel<2) /*static*/ && offCode >= 20) price += (offCode-19)*2; /* handicap for long distance offsets, favor decompression speed */ | |
|
267 | /* dynamic statistics */ | |
|
268 | price = (offCode * BITCOST_MULTIPLIER) + (optPtr->offCodeSumBasePrice - WEIGHT(optPtr->offCodeFreq[offCode], optLevel)); | |
|
269 | if ((optLevel<2) /*static*/ && offCode >= 20) | |
|
270 | price += (offCode-19)*2 * BITCOST_MULTIPLIER; /* handicap for long distance offsets, favor decompression speed */ | |
|
184 | 271 | |
|
185 | 272 | /* match Length */ |
|
186 | 273 | { U32 const mlCode = ZSTD_MLcode(mlBase); |
|
187 |
price += ML_bits[mlCode] + optPtr-> |
|
|
274 | price += (ML_bits[mlCode] * BITCOST_MULTIPLIER) + (optPtr->matchLengthSumBasePrice - WEIGHT(optPtr->matchLengthFreq[mlCode], optLevel)); | |
|
188 | 275 | } |
|
189 | 276 | |
|
277 | price += BITCOST_MULTIPLIER / 5; /* heuristic : make matches a bit more costly to favor less sequences -> faster decompression speed */ | |
|
278 | ||
|
190 | 279 | DEBUGLOG(8, "ZSTD_getMatchPrice(ml:%u) = %u", matchLength, price); |
|
191 | 280 | return price; |
|
192 | 281 | } |
|
193 | 282 | |
|
283 | /* ZSTD_updateStats() : | |
|
284 | * assumption : literals + litLengtn <= iend */ | |
|
194 | 285 | static void ZSTD_updateStats(optState_t* const optPtr, |
|
195 | 286 | U32 litLength, const BYTE* literals, |
|
196 | 287 | U32 offsetCode, U32 matchLength) |
@@ -269,10 +360,11 b' static U32 ZSTD_insertAndFindFirstIndexH' | |||
|
269 | 360 | * ip : assumed <= iend-8 . |
|
270 | 361 | * @return : nb of positions added */ |
|
271 | 362 | static U32 ZSTD_insertBt1( |
|
272 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, |
|
|
363 | ZSTD_matchState_t* ms, | |
|
273 | 364 | const BYTE* const ip, const BYTE* const iend, |
|
274 | U32 const mls, U32 const extDict) |
|
|
365 | U32 const mls, const int extDict) | |
|
275 | 366 | { |
|
367 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
276 | 368 | U32* const hashTable = ms->hashTable; |
|
277 | 369 | U32 const hashLog = cParams->hashLog; |
|
278 | 370 | size_t const h = ZSTD_hashPtr(ip, hashLog, mls); |
@@ -293,6 +385,7 b' static U32 ZSTD_insertBt1(' | |||
|
293 | 385 | U32* largerPtr = smallerPtr + 1; |
|
294 | 386 | U32 dummy32; /* to be nullified at the end */ |
|
295 | 387 | U32 const windowLow = ms->window.lowLimit; |
|
388 | U32 const matchLow = windowLow ? windowLow : 1; | |
|
296 | 389 | U32 matchEndIdx = current+8+1; |
|
297 | 390 | size_t bestLength = 8; |
|
298 | 391 | U32 nbCompares = 1U << cParams->searchLog; |
@@ -308,7 +401,7 b' static U32 ZSTD_insertBt1(' | |||
|
308 | 401 | assert(ip <= iend-8); /* required for h calculation */ |
|
309 | 402 | hashTable[h] = current; /* Update Hash Table */ |
|
310 | 403 | |
|
311 | while (nbCompares-- && (matchIndex > windowLow)) { |
|
|
404 | while (nbCompares-- && (matchIndex >= matchLow)) { | |
|
312 | 405 | U32* const nextPtr = bt + 2*(matchIndex & btMask); |
|
313 | 406 | size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */ |
|
314 | 407 | assert(matchIndex < current); |
@@ -334,8 +427,8 b' static U32 ZSTD_insertBt1(' | |||
|
334 | 427 | } |
|
335 | 428 | #endif |
|
336 | 429 | |
|
337 | if ( (!extDict) || (matchIndex+matchLength >= dictLimit)) { |
|
|
338 | assert(matchIndex+matchLength >= dictLimit); /* might be wrong if extDict is incorrectly set to 0 */ |
|
|
430 | if (!extDict || (matchIndex+matchLength >= dictLimit)) { | |
|
431 | assert(matchIndex+matchLength >= dictLimit); /* might be wrong if actually extDict */ | |
|
339 | 432 | match = base + matchIndex; |
|
340 | 433 | matchLength += ZSTD_count(ip+matchLength, match+matchLength, iend); |
|
341 | 434 | } else { |
@@ -379,35 +472,33 b' static U32 ZSTD_insertBt1(' | |||
|
379 | 472 | |
|
380 | 473 | FORCE_INLINE_TEMPLATE |
|
381 | 474 | void ZSTD_updateTree_internal( |
|
382 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, |
|
|
475 | ZSTD_matchState_t* ms, | |
|
383 | 476 | const BYTE* const ip, const BYTE* const iend, |
|
384 | const U32 mls, const U32 extDict) |
|
|
477 | const U32 mls, const ZSTD_dictMode_e dictMode) | |
|
385 | 478 | { |
|
386 | 479 | const BYTE* const base = ms->window.base; |
|
387 | 480 | U32 const target = (U32)(ip - base); |
|
388 | 481 | U32 idx = ms->nextToUpdate; |
|
389 | DEBUGLOG(5, "ZSTD_updateTree_internal, from %u to %u (extDict:%u)", |
|
|
390 | idx, target, extDict); |
|
|
482 | DEBUGLOG(5, "ZSTD_updateTree_internal, from %u to %u (dictMode:%u)", | |
|
483 | idx, target, dictMode); | |
|
391 | 484 | |
|
392 | 485 | while(idx < target) |
|
393 | idx += ZSTD_insertBt1(ms, cParams, base+idx, iend, mls, extDict); |
|
|
486 | idx += ZSTD_insertBt1(ms, base+idx, iend, mls, dictMode == ZSTD_extDict); | |
|
394 | 487 | ms->nextToUpdate = target; |
|
395 | 488 | } |
|
396 | 489 | |
|
397 | void ZSTD_updateTree( | |
|
398 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
399 | const BYTE* ip, const BYTE* iend) | |
|
400 | { | |
|
401 | ZSTD_updateTree_internal(ms, cParams, ip, iend, cParams->searchLength, 0 /*extDict*/); | |
|
490 | void ZSTD_updateTree(ZSTD_matchState_t* ms, const BYTE* ip, const BYTE* iend) { | |
|
491 | ZSTD_updateTree_internal(ms, ip, iend, ms->cParams.searchLength, ZSTD_noDict); | |
|
402 | 492 | } |
|
403 | 493 | |
|
404 | 494 | FORCE_INLINE_TEMPLATE |
|
405 | 495 | U32 ZSTD_insertBtAndGetAllMatches ( |
|
406 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, |
|
|
407 | const BYTE* const ip, const BYTE* const iLimit, int const extDict, |
|
|
496 | ZSTD_matchState_t* ms, | |
|
497 | const BYTE* const ip, const BYTE* const iLimit, const ZSTD_dictMode_e dictMode, | |
|
408 | 498 | U32 rep[ZSTD_REP_NUM], U32 const ll0, |
|
409 | 499 | ZSTD_match_t* matches, const U32 lengthToBeat, U32 const mls /* template */) |
|
410 | 500 | { |
|
501 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
411 | 502 | U32 const sufficient_len = MIN(cParams->targetLength, ZSTD_OPT_NUM -1); |
|
412 | 503 | const BYTE* const base = ms->window.base; |
|
413 | 504 | U32 const current = (U32)(ip-base); |
@@ -426,6 +517,7 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
426 | 517 | const BYTE* const prefixStart = base + dictLimit; |
|
427 | 518 | U32 const btLow = btMask >= current ? 0 : current - btMask; |
|
428 | 519 | U32 const windowLow = ms->window.lowLimit; |
|
520 | U32 const matchLow = windowLow ? windowLow : 1; | |
|
429 | 521 | U32* smallerPtr = bt + 2*(current&btMask); |
|
430 | 522 | U32* largerPtr = bt + 2*(current&btMask) + 1; |
|
431 | 523 | U32 matchEndIdx = current+8+1; /* farthest referenced position of any match => detects repetitive patterns */ |
@@ -433,8 +525,21 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
433 | 525 | U32 mnum = 0; |
|
434 | 526 | U32 nbCompares = 1U << cParams->searchLog; |
|
435 | 527 | |
|
528 | const ZSTD_matchState_t* dms = dictMode == ZSTD_dictMatchState ? ms->dictMatchState : NULL; | |
|
529 | const ZSTD_compressionParameters* const dmsCParams = | |
|
530 | dictMode == ZSTD_dictMatchState ? &dms->cParams : NULL; | |
|
531 | const BYTE* const dmsBase = dictMode == ZSTD_dictMatchState ? dms->window.base : NULL; | |
|
532 | const BYTE* const dmsEnd = dictMode == ZSTD_dictMatchState ? dms->window.nextSrc : NULL; | |
|
533 | U32 const dmsHighLimit = dictMode == ZSTD_dictMatchState ? (U32)(dmsEnd - dmsBase) : 0; | |
|
534 | U32 const dmsLowLimit = dictMode == ZSTD_dictMatchState ? dms->window.lowLimit : 0; | |
|
535 | U32 const dmsIndexDelta = dictMode == ZSTD_dictMatchState ? windowLow - dmsHighLimit : 0; | |
|
536 | U32 const dmsHashLog = dictMode == ZSTD_dictMatchState ? dmsCParams->hashLog : hashLog; | |
|
537 | U32 const dmsBtLog = dictMode == ZSTD_dictMatchState ? dmsCParams->chainLog - 1 : btLog; | |
|
538 | U32 const dmsBtMask = dictMode == ZSTD_dictMatchState ? (1U << dmsBtLog) - 1 : 0; | |
|
539 | U32 const dmsBtLow = dictMode == ZSTD_dictMatchState && dmsBtMask < dmsHighLimit - dmsLowLimit ? dmsHighLimit - dmsBtMask : dmsLowLimit; | |
|
540 | ||
|
436 | 541 | size_t bestLength = lengthToBeat-1; |
|
437 | DEBUGLOG(7, "ZSTD_insertBtAndGetAllMatches: current=%u", current); |
|
|
542 | DEBUGLOG(8, "ZSTD_insertBtAndGetAllMatches: current=%u", current); | |
|
438 | 543 | |
|
439 | 544 | /* check repCode */ |
|
440 | 545 | { U32 const lastR = ZSTD_REP_NUM + ll0; |
@@ -449,18 +554,26 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
449 | 554 | repLen = (U32)ZSTD_count(ip+minMatch, ip+minMatch-repOffset, iLimit) + minMatch; |
|
450 | 555 | } |
|
451 | 556 | } else { /* repIndex < dictLimit || repIndex >= current */ |
|
452 | const BYTE* const repMatch = dictBase + repIndex; |
|
|
557 | const BYTE* const repMatch = dictMode == ZSTD_dictMatchState ? | |
|
558 | dmsBase + repIndex - dmsIndexDelta : | |
|
559 | dictBase + repIndex; | |
|
453 | 560 | assert(current >= windowLow); |
|
454 | if ( extDict /* this case only valid in extDict mode */ | |
|
561 | if ( dictMode == ZSTD_extDict | |
|
455 | 562 | && ( ((repOffset-1) /*intentional overflow*/ < current - windowLow) /* equivalent to `current > repIndex >= windowLow` */ |
|
456 | 563 | & (((U32)((dictLimit-1) - repIndex) >= 3) ) /* intentional overflow : do not test positions overlapping 2 memory segments */) |
|
457 | 564 | && (ZSTD_readMINMATCH(ip, minMatch) == ZSTD_readMINMATCH(repMatch, minMatch)) ) { |
|
458 | 565 | repLen = (U32)ZSTD_count_2segments(ip+minMatch, repMatch+minMatch, iLimit, dictEnd, prefixStart) + minMatch; |
|
566 | } | |
|
567 | if (dictMode == ZSTD_dictMatchState | |
|
568 | && ( ((repOffset-1) /*intentional overflow*/ < current - (dmsLowLimit + dmsIndexDelta)) /* equivalent to `current > repIndex >= dmsLowLimit` */ | |
|
569 | & ((U32)((dictLimit-1) - repIndex) >= 3) ) /* intentional overflow : do not test positions overlapping 2 memory segments */ | |
|
570 | && (ZSTD_readMINMATCH(ip, minMatch) == ZSTD_readMINMATCH(repMatch, minMatch)) ) { | |
|
571 | repLen = (U32)ZSTD_count_2segments(ip+minMatch, repMatch+minMatch, iLimit, dmsEnd, prefixStart) + minMatch; | |
|
459 | 572 | } } |
|
460 | 573 | /* save longer solution */ |
|
461 | 574 | if (repLen > bestLength) { |
|
462 | DEBUGLOG(8, "found rep-match %u of length %u", |
|
|
463 | repCode - ll0, (U32)repLen); |
|
|
575 | DEBUGLOG(8, "found repCode %u (ll0:%u, offset:%u) of length %u", | |
|
576 | repCode, ll0, repOffset, repLen); | |
|
464 | 577 | bestLength = repLen; |
|
465 | 578 | matches[mnum].off = repCode - ll0; |
|
466 | 579 | matches[mnum].len = (U32)repLen; |
@@ -473,10 +586,10 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
473 | 586 | /* HC3 match finder */ |
|
474 | 587 | if ((mls == 3) /*static*/ && (bestLength < mls)) { |
|
475 | 588 | U32 const matchIndex3 = ZSTD_insertAndFindFirstIndexHash3(ms, ip); |
|
476 | if ((matchIndex3 > windowLow) |
|
|
589 | if ((matchIndex3 >= matchLow) | |
|
477 | 590 | & (current - matchIndex3 < (1<<18)) /*heuristic : longer distance likely too expensive*/ ) { |
|
478 | 591 | size_t mlen; |
|
479 | if ((!extDict) /*static*/ || (matchIndex3 >= dictLimit)) { |
|
|
592 | if ((dictMode == ZSTD_noDict) /*static*/ || (dictMode == ZSTD_dictMatchState) /*static*/ || (matchIndex3 >= dictLimit)) { | |
|
480 | 593 | const BYTE* const match = base + matchIndex3; |
|
481 | 594 | mlen = ZSTD_count(ip, match, iLimit); |
|
482 | 595 | } else { |
@@ -498,17 +611,21 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
498 | 611 | (ip+mlen == iLimit) ) { /* best possible length */ |
|
499 | 612 | ms->nextToUpdate = current+1; /* skip insertion */ |
|
500 | 613 | return 1; |
|
501 | } } } } | |
|
614 | } | |
|
615 | } | |
|
616 | } | |
|
617 | /* no dictMatchState lookup: dicts don't have a populated HC3 table */ | |
|
618 | } | |
|
502 | 619 | |
|
503 | 620 | hashTable[h] = current; /* Update Hash Table */ |
|
504 | 621 | |
|
505 | while (nbCompares-- && (matchIndex > windowLow)) { |
|
|
622 | while (nbCompares-- && (matchIndex >= matchLow)) { | |
|
506 | 623 | U32* const nextPtr = bt + 2*(matchIndex & btMask); |
|
507 | 624 | size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */ |
|
508 | 625 | const BYTE* match; |
|
509 | 626 | assert(current > matchIndex); |
|
510 | 627 | |
|
511 | if ((!extDict) || (matchIndex+matchLength >= dictLimit)) { |
|
|
628 | if ((dictMode == ZSTD_noDict) || (dictMode == ZSTD_dictMatchState) || (matchIndex+matchLength >= dictLimit)) { | |
|
512 | 629 | assert(matchIndex+matchLength >= dictLimit); /* ensure the condition is correct when !extDict */ |
|
513 | 630 | match = base + matchIndex; |
|
514 | 631 | matchLength += ZSTD_count(ip+matchLength, match+matchLength, iLimit); |
@@ -520,8 +637,8 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
520 | 637 | } |
|
521 | 638 | |
|
522 | 639 | if (matchLength > bestLength) { |
|
523 | DEBUGLOG(8, "found match of length %u at distance %u", | |
|
524 | (U32)matchLength, current - matchIndex); | |
|
640 | DEBUGLOG(8, "found match of length %u at distance %u (offCode=%u)", | |
|
641 | (U32)matchLength, current - matchIndex, current - matchIndex + ZSTD_REP_MOVE); | |
|
525 | 642 | assert(matchEndIdx > matchIndex); |
|
526 | 643 | if (matchLength > matchEndIdx - matchIndex) |
|
527 | 644 | matchEndIdx = matchIndex + (U32)matchLength; |
@@ -529,9 +646,10 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
529 | 646 | matches[mnum].off = (current - matchIndex) + ZSTD_REP_MOVE; |
|
530 | 647 | matches[mnum].len = (U32)matchLength; |
|
531 | 648 | mnum++; |
|
532 | if ( (matchLength > ZSTD_OPT_NUM) |
|
|
533 | | (ip+matchLength == iLimit) /* equal : no way to know if inf or sup */) { |
|
|
|
534 | break; /* drop, to preserve bt consistency (miss a little bit of compression) */ | |
|
649 | if ( (matchLength > ZSTD_OPT_NUM) | |
|
650 | | (ip+matchLength == iLimit) /* equal : no way to know if inf or sup */) { | |
|
651 | if (dictMode == ZSTD_dictMatchState) nbCompares = 0; /* break should also skip searching dms */ | |
|
652 | break; /* drop, to preserve bt consistency (miss a little bit of compression) */ | |
|
535 | 653 | } |
|
536 | 654 | } |
|
537 | 655 | |
@@ -552,6 +670,47 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
552 | 670 | |
|
553 | 671 | *smallerPtr = *largerPtr = 0; |
|
554 | 672 | |
|
673 | if (dictMode == ZSTD_dictMatchState && nbCompares) { | |
|
674 | size_t const dmsH = ZSTD_hashPtr(ip, dmsHashLog, mls); | |
|
675 | U32 dictMatchIndex = dms->hashTable[dmsH]; | |
|
676 | const U32* const dmsBt = dms->chainTable; | |
|
677 | commonLengthSmaller = commonLengthLarger = 0; | |
|
678 | while (nbCompares-- && (dictMatchIndex > dmsLowLimit)) { | |
|
679 | const U32* const nextPtr = dmsBt + 2*(dictMatchIndex & dmsBtMask); | |
|
680 | size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */ | |
|
681 | const BYTE* match = dmsBase + dictMatchIndex; | |
|
682 | matchLength += ZSTD_count_2segments(ip+matchLength, match+matchLength, iLimit, dmsEnd, prefixStart); | |
|
683 | if (dictMatchIndex+matchLength >= dmsHighLimit) | |
|
684 | match = base + dictMatchIndex + dmsIndexDelta; /* to prepare for next usage of match[matchLength] */ | |
|
685 | ||
|
686 | if (matchLength > bestLength) { | |
|
687 | matchIndex = dictMatchIndex + dmsIndexDelta; | |
|
688 | DEBUGLOG(8, "found dms match of length %u at distance %u (offCode=%u)", | |
|
689 | (U32)matchLength, current - matchIndex, current - matchIndex + ZSTD_REP_MOVE); | |
|
690 | if (matchLength > matchEndIdx - matchIndex) | |
|
691 | matchEndIdx = matchIndex + (U32)matchLength; | |
|
692 | bestLength = matchLength; | |
|
693 | matches[mnum].off = (current - matchIndex) + ZSTD_REP_MOVE; | |
|
694 | matches[mnum].len = (U32)matchLength; | |
|
695 | mnum++; | |
|
696 | if ( (matchLength > ZSTD_OPT_NUM) | |
|
697 | | (ip+matchLength == iLimit) /* equal : no way to know if inf or sup */) { | |
|
698 | break; /* drop, to guarantee consistency (miss a little bit of compression) */ | |
|
699 | } | |
|
700 | } | |
|
701 | ||
|
702 | if (dictMatchIndex <= dmsBtLow) { break; } /* beyond tree size, stop the search */ | |
|
703 | if (match[matchLength] < ip[matchLength]) { | |
|
704 | commonLengthSmaller = matchLength; /* all smaller will now have at least this guaranteed common length */ | |
|
705 | dictMatchIndex = nextPtr[1]; /* new matchIndex larger than previous (closer to current) */ | |
|
706 | } else { | |
|
707 | /* match is larger than current */ | |
|
708 | commonLengthLarger = matchLength; | |
|
709 | dictMatchIndex = nextPtr[0]; | |
|
710 | } | |
|
711 | } | |
|
712 | } | |
|
713 | ||
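
The dictMatchState block above searches a second, read-only tree whose indices live in the dictionary's own index space; dmsIndexDelta translates them into the current window's index space so offsets can be computed uniformly. A small worked example with invented values (the variable names follow the diff):

    #include <stdio.h>
    typedef unsigned U32;

    int main(void) {
        U32 const windowLow     = 1000;  /* lowest valid index of the current window */
        U32 const dmsHighLimit  = 400;   /* end of dictionary content, dict-local index */
        U32 const dmsIndexDelta = windowLow - dmsHighLimit;     /* = 600 */

        U32 const dictMatchIndex = 250;  /* a match found in the dictionary's tree */
        U32 const matchIndex = dictMatchIndex + dmsIndexDelta;  /* unified index 850 */

        U32 const current = 1500;        /* position being compressed */
        printf("distance = %u\n", current - matchIndex);  /* 650, as if one segment */
        return 0;
    }

The dictionary thus behaves as if it were mapped immediately below the window: dict index dmsHighLimit-1 becomes windowLow-1, and match distances stay monotonic across the segment boundary.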
|
555 | 714 | assert(matchEndIdx > current+8); |
|
556 | 715 | ms->nextToUpdate = matchEndIdx - 8; /* skip repetitive patterns */ |
|
557 | 716 | return mnum; |
@@ -559,23 +718,24 b' U32 ZSTD_insertBtAndGetAllMatches (' | |||
|
559 | 718 | |
|
560 | 719 | |
|
561 | 720 | FORCE_INLINE_TEMPLATE U32 ZSTD_BtGetAllMatches ( |
|
562 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, |
|
|
563 | const BYTE* ip, const BYTE* const iHighLimit, int const extDict, |
|
|
721 | ZSTD_matchState_t* ms, | |
|
722 | const BYTE* ip, const BYTE* const iHighLimit, const ZSTD_dictMode_e dictMode, | |
|
564 | 723 | U32 rep[ZSTD_REP_NUM], U32 const ll0, |
|
565 | 724 | ZSTD_match_t* matches, U32 const lengthToBeat) |
|
566 | 725 | { |
|
726 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
567 | 727 | U32 const matchLengthSearch = cParams->searchLength; |
|
568 | DEBUGLOG(7, "ZSTD_BtGetAllMatches"); |
|
|
728 | DEBUGLOG(8, "ZSTD_BtGetAllMatches"); | |
|
569 | 729 | if (ip < ms->window.base + ms->nextToUpdate) return 0; /* skipped area */ |
|
570 | ZSTD_updateTree_internal(ms, cParams, ip, iHighLimit, matchLengthSearch, extDict); |
|
|
730 | ZSTD_updateTree_internal(ms, ip, iHighLimit, matchLengthSearch, dictMode); | |
|
571 | 731 | switch(matchLengthSearch) |
|
572 | 732 | { |
|
573 | case 3 : return ZSTD_insertBtAndGetAllMatches(ms, cParams, ip, iHighLimit, extDict, rep, ll0, matches, lengthToBeat, 3); |
|
|
733 | case 3 : return ZSTD_insertBtAndGetAllMatches(ms, ip, iHighLimit, dictMode, rep, ll0, matches, lengthToBeat, 3); | |
|
574 | 734 | default : |
|
575 | case 4 : return ZSTD_insertBtAndGetAllMatches(ms, cParams, ip, iHighLimit, extDict, rep, ll0, matches, lengthToBeat, 4); |
|
|
576 | case 5 : return ZSTD_insertBtAndGetAllMatches(ms, cParams, ip, iHighLimit, extDict, rep, ll0, matches, lengthToBeat, 5); |
|
|
735 | case 4 : return ZSTD_insertBtAndGetAllMatches(ms, ip, iHighLimit, dictMode, rep, ll0, matches, lengthToBeat, 4); | |
|
736 | case 5 : return ZSTD_insertBtAndGetAllMatches(ms, ip, iHighLimit, dictMode, rep, ll0, matches, lengthToBeat, 5); | |
|
577 | 737 | case 7 : |
|
578 | case 6 : return ZSTD_insertBtAndGetAllMatches(ms, cParams, ip, iHighLimit, extDict, rep, ll0, matches, lengthToBeat, 6); |
|
|
738 | case 6 : return ZSTD_insertBtAndGetAllMatches(ms, ip, iHighLimit, dictMode, rep, ll0, matches, lengthToBeat, 6); | |
|
579 | 739 | } |
|
580 | 740 | } |
|
581 | 741 | |
@@ -587,7 +747,7 b' typedef struct repcodes_s {' | |||
|
587 | 747 | U32 rep[3]; |
|
588 | 748 | } repcodes_t; |
|
589 | 749 | |
|
590 | repcodes_t ZSTD_updateRep(U32 const rep[3], U32 const offset, U32 const ll0) | |
|
750 | static repcodes_t ZSTD_updateRep(U32 const rep[3], U32 const offset, U32 const ll0) | |
|
591 | 751 | { |
|
592 | 752 | repcodes_t newReps; |
|
593 | 753 | if (offset >= ZSTD_REP_NUM) { /* full offset */ |
@@ -609,65 +769,17 b' repcodes_t ZSTD_updateRep(U32 const rep[' | |||
|
609 | 769 | } |
|
610 | 770 | |
|
611 | 771 | |
|
612 | typedef struct { | |
|
613 | const BYTE* anchor; | |
|
614 | U32 litlen; | |
|
615 | U32 rawLitCost; | |
|
616 | } cachedLiteralPrice_t; | |
|
617 | ||
|
618 | static U32 ZSTD_rawLiteralsCost_cached( | |
|
619 | cachedLiteralPrice_t* const cachedLitPrice, | |
|
620 | const BYTE* const anchor, U32 const litlen, | |
|
621 | const optState_t* const optStatePtr) | |
|
772 | static U32 ZSTD_totalLen(ZSTD_optimal_t sol) | |
|
622 | 773 | { |
|
623 | U32 startCost; | |
|
624 | U32 remainingLength; | |
|
625 | const BYTE* startPosition; | |
|
626 | ||
|
627 | if (anchor == cachedLitPrice->anchor) { | |
|
628 | startCost = cachedLitPrice->rawLitCost; | |
|
629 | startPosition = anchor + cachedLitPrice->litlen; | |
|
630 | assert(litlen >= cachedLitPrice->litlen); | |
|
631 | remainingLength = litlen - cachedLitPrice->litlen; | |
|
632 | } else { | |
|
633 | startCost = 0; | |
|
634 | startPosition = anchor; | |
|
635 | remainingLength = litlen; | |
|
636 | } | |
|
637 | ||
|
638 | { U32 const rawLitCost = startCost + ZSTD_rawLiteralsCost(startPosition, remainingLength, optStatePtr); | |
|
639 | cachedLitPrice->anchor = anchor; | |
|
640 | cachedLitPrice->litlen = litlen; | |
|
641 | cachedLitPrice->rawLitCost = rawLitCost; | |
|
642 | return rawLitCost; | |
|
643 | } | |
|
774 | return sol.litlen + sol.mlen; | |
|
644 | 775 | } |
|
645 | 776 | |
|
646 | static U32 ZSTD_fullLiteralsCost_cached( | |
|
647 | cachedLiteralPrice_t* const cachedLitPrice, | |
|
648 | const BYTE* const anchor, U32 const litlen, |
|
|
|
649 | const optState_t* const optStatePtr) | |
|
650 | { | |
|
651 | return ZSTD_rawLiteralsCost_cached(cachedLitPrice, anchor, litlen, optStatePtr) | |
|
652 | + ZSTD_litLengthPrice(litlen, optStatePtr); | |
|
653 | } | |
|
654 | ||
|
655 | static int ZSTD_literalsContribution_cached( | |
|
656 | cachedLiteralPrice_t* const cachedLitPrice, | |
|
657 | const BYTE* const anchor, U32 const litlen, | |
|
658 | const optState_t* const optStatePtr) | |
|
659 | { | |
|
660 | int const contribution = ZSTD_rawLiteralsCost_cached(cachedLitPrice, anchor, litlen, optStatePtr) | |
|
661 | + ZSTD_litLengthContribution(litlen, optStatePtr); | |
|
662 | return contribution; | |
|
663 | } | |
|
664 | ||
|
665 | FORCE_INLINE_TEMPLATE | |
|
666 | size_t ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,seqStore_t* seqStore, | |
|
667 | U32 rep[ZSTD_REP_NUM], | |
|
668 | ZSTD_compressionParameters const* cParams, | |
|
669 | const void* src, size_t srcSize, | |
|
670 | const int optLevel, const int extDict) | |
|
777 | FORCE_INLINE_TEMPLATE size_t | |
|
778 | ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms, | |
|
779 | seqStore_t* seqStore, | |
|
780 | U32 rep[ZSTD_REP_NUM], | |
|
781 | const void* src, size_t srcSize, | |
|
782 | const int optLevel, const ZSTD_dictMode_e dictMode) | |
|
671 | 783 | { |
|
672 | 784 | optState_t* const optStatePtr = &ms->opt; |
|
673 | 785 | const BYTE* const istart = (const BYTE*)src; |
@@ -677,72 +789,76 b' size_t ZSTD_compressBlock_opt_generic(ZS' | |||
|
677 | 789 | const BYTE* const ilimit = iend - 8; |
|
678 | 790 | const BYTE* const base = ms->window.base; |
|
679 | 791 | const BYTE* const prefixStart = base + ms->window.dictLimit; |
|
792 | const ZSTD_compressionParameters* const cParams = &ms->cParams; | |
|
680 | 793 | |
|
681 | 794 | U32 const sufficient_len = MIN(cParams->targetLength, ZSTD_OPT_NUM -1); |
|
682 | 795 | U32 const minMatch = (cParams->searchLength == 3) ? 3 : 4; |
|
683 | 796 | |
|
684 | 797 | ZSTD_optimal_t* const opt = optStatePtr->priceTable; |
|
685 | 798 | ZSTD_match_t* const matches = optStatePtr->matchTable; |
|
686 | cachedLiteralPrice_t cachedLitPrice; | |
|
799 | ZSTD_optimal_t lastSequence; | |
|
687 | 800 | |
|
688 | 801 | /* init */ |
|
689 | 802 | DEBUGLOG(5, "ZSTD_compressBlock_opt_generic"); |
|
803 | assert(optLevel <= 2); | |
|
690 | 804 | ms->nextToUpdate3 = ms->nextToUpdate; |
|
691 | ZSTD_rescaleFreqs(optStatePtr, (const BYTE*)src, srcSize); | |
|
805 | ZSTD_rescaleFreqs(optStatePtr, (const BYTE*)src, srcSize, optLevel); | |
|
692 | 806 | ip += (ip==prefixStart); |
|
693 | memset(&cachedLitPrice, 0, sizeof(cachedLitPrice)); | |
|
694 | 807 | |
|
695 | 808 | /* Match Loop */ |
|
696 | 809 | while (ip < ilimit) { |
|
697 | 810 | U32 cur, last_pos = 0; |
|
698 | U32 best_mlen, best_off; | |
|
699 | 811 | |
|
700 | 812 | /* find first match */ |
|
701 | 813 | { U32 const litlen = (U32)(ip - anchor); |
|
702 | 814 | U32 const ll0 = !litlen; |
|
703 | U32 const nbMatches = ZSTD_BtGetAllMatches(ms, cParams, ip, iend, extDict, rep, ll0, matches, minMatch); |
|
|
815 | U32 const nbMatches = ZSTD_BtGetAllMatches(ms, ip, iend, dictMode, rep, ll0, matches, minMatch); | |
|
704 | 816 | if (!nbMatches) { ip++; continue; } |
|
705 | 817 | |
|
706 | 818 | /* initialize opt[0] */ |
|
707 | 819 | { U32 i ; for (i=0; i<ZSTD_REP_NUM; i++) opt[0].rep[i] = rep[i]; } |
|
708 | opt[0].mlen = 1; |
|
|
820 | opt[0].mlen = 0; /* means is_a_literal */ | |
|
709 | 821 | opt[0].litlen = litlen; |
|
822 | opt[0].price = ZSTD_literalsContribution(anchor, litlen, optStatePtr, optLevel); | |
|
710 | 823 | |
|
711 | 824 | /* large match -> immediate encoding */ |
|
712 | 825 | { U32 const maxML = matches[nbMatches-1].len; |
|
713 | DEBUGLOG(7, "found %u matches of maxLength=%u and offset=%u at cPos=%u => start new serie", | |
|
714 | nbMatches, maxML, matches[nbMatches-1].off, (U32)(ip-prefixStart)); | |
|
826 | U32 const maxOffset = matches[nbMatches-1].off; | |
|
827 | DEBUGLOG(6, "found %u matches of maxLength=%u and maxOffCode=%u at cPos=%u => start new serie", | |
|
828 | nbMatches, maxML, maxOffset, (U32)(ip-prefixStart)); | |
|
715 | 829 | |
|
716 | 830 | if (maxML > sufficient_len) { |
|
717 | best_mlen = maxML; |
|
|
|
718 | best_off = matches[nbMatches-1].off; | |
|
719 | DEBUGLOG(7, "large match (%u>%u), immediate encoding", | |
|
720 | best_mlen, sufficient_len); | |
|
831 | lastSequence.litlen = litlen; | |
|
832 | lastSequence.mlen = maxML; | |
|
833 | lastSequence.off = maxOffset; | |
|
834 | DEBUGLOG(6, "large match (%u>%u), immediate encoding", | |
|
835 | maxML, sufficient_len); | |
|
721 | 836 | cur = 0; |
|
722 | last_pos = best_mlen; |
|
|
837 | last_pos = ZSTD_totalLen(lastSequence); | |
|
723 | 838 | goto _shortestPath; |
|
724 | 839 | } } |
|
725 | 840 | |
|
726 | 841 | /* set prices for first matches starting position == 0 */ |
|
727 | { U32 const literalsPrice = ZSTD_fullLiteralsCost_cached(&cachedLitPrice, anchor, litlen, optStatePtr); |
|
|
842 | { U32 const literalsPrice = opt[0].price + ZSTD_litLengthPrice(0, optStatePtr, optLevel); | |
|
728 | 843 | U32 pos; |
|
729 | 844 | U32 matchNb; |
|
730 | for (pos = 0; pos < minMatch; pos++) { |
|
|
731 | opt[pos].mlen = 1; | |
|
732 | opt[pos].price = ZSTD_MAX_PRICE; | |
|
845 | for (pos = 1; pos < minMatch; pos++) { | |
|
846 | opt[pos].price = ZSTD_MAX_PRICE; /* mlen, litlen and price will be fixed during forward scanning */ | |
|
733 | 847 | } |
|
734 | 848 | for (matchNb = 0; matchNb < nbMatches; matchNb++) { |
|
735 | 849 | U32 const offset = matches[matchNb].off; |
|
736 | 850 | U32 const end = matches[matchNb].len; |
|
737 | 851 | repcodes_t const repHistory = ZSTD_updateRep(rep, offset, ll0); |
|
738 | 852 | for ( ; pos <= end ; pos++ ) { |
|
739 | U32 const matchPrice = literalsPrice + ZSTD_getMatchPrice(offset, pos, optStatePtr, optLevel); |
|
|
740 | DEBUGLOG(7, "rPos:%u => set initial price : %u", | |
|
741 | pos, matchPrice); | |
|
853 | U32 const matchPrice = ZSTD_getMatchPrice(offset, pos, optStatePtr, optLevel); | |
|
854 | U32 const sequencePrice = literalsPrice + matchPrice; | |
|
855 | DEBUGLOG(7, "rPos:%u => set initial price : %.2f", | |
|
856 | pos, ZSTD_fCost(sequencePrice)); | |
|
742 | 857 | opt[pos].mlen = pos; |
|
743 | 858 | opt[pos].off = offset; |
|
744 | 859 | opt[pos].litlen = litlen; |
|
745 | opt[pos].price = matchPrice; |
|
|
860 | opt[pos].price = sequencePrice; | |
|
861 | ZSTD_STATIC_ASSERT(sizeof(opt[pos].rep) == sizeof(repHistory)); | |
|
746 | 862 | memcpy(opt[pos].rep, &repHistory, sizeof(repHistory)); |
|
747 | 863 | } } |
|
748 | 864 | last_pos = pos-1; |
@@ -753,55 +869,67 b' size_t ZSTD_compressBlock_opt_generic(ZS' | |||
|
753 | 869 | for (cur = 1; cur <= last_pos; cur++) { |
|
754 | 870 | const BYTE* const inr = ip + cur; |
|
755 | 871 | assert(cur < ZSTD_OPT_NUM); |
|
872 | DEBUGLOG(7, "cPos:%zi==rPos:%u", inr-istart, cur) | |
|
756 | 873 | |
|
757 | 874 | /* Fix current position with one literal if cheaper */ |
|
758 | { U32 const litlen = (opt[cur-1].mlen == 1) ? opt[cur-1].litlen + 1 : 1; |
|
|
759 | int price; /* note : contribution can be negative */ | |
|
760 | if (cur > litlen) { | |
|
761 | price = opt[cur - litlen].price + ZSTD_literalsContribution(inr-litlen, litlen, optStatePtr); |
|
|
|
762 | } else { | |
|
763 | price = ZSTD_literalsContribution_cached(&cachedLitPrice, anchor, litlen, optStatePtr); | |
|
764 | } | |
|
875 | { U32 const litlen = (opt[cur-1].mlen == 0) ? opt[cur-1].litlen + 1 : 1; | |
|
876 | int const price = opt[cur-1].price | |
|
877 | + ZSTD_rawLiteralsCost(ip+cur-1, 1, optStatePtr, optLevel) | |
|
878 | + ZSTD_litLengthPrice(litlen, optStatePtr, optLevel) | |
|
879 | - ZSTD_litLengthPrice(litlen-1, optStatePtr, optLevel); | |
|
765 | 880 | assert(price < 1000000000); /* overflow check */ |
|
766 | 881 | if (price <= opt[cur].price) { |
|
767 | DEBUGLOG(7, "rPos:%u : better price (%u<=%u) using literal", |
|
|
768 | cur, price, opt[cur].price); |
|
|
769 | opt[cur].mlen = 1; | |
|
882 | DEBUGLOG(7, "cPos:%zi==rPos:%u : better price (%.2f<=%.2f) using literal (ll==%u) (hist:%u,%u,%u)", | |
|
883 | inr-istart, cur, ZSTD_fCost(price), ZSTD_fCost(opt[cur].price), litlen, | |
|
884 | opt[cur-1].rep[0], opt[cur-1].rep[1], opt[cur-1].rep[2]); | |
|
885 | opt[cur].mlen = 0; | |
|
770 | 886 | opt[cur].off = 0; |
|
771 | 887 | opt[cur].litlen = litlen; |
|
772 | 888 | opt[cur].price = price; |
|
773 | 889 | memcpy(opt[cur].rep, opt[cur-1].rep, sizeof(opt[cur].rep)); |
|
774 | } } |
|
|
890 | } else { | |
|
891 | DEBUGLOG(7, "cPos:%zi==rPos:%u : literal would cost more (%.2f>%.2f) (hist:%u,%u,%u)", | |
|
892 | inr-istart, cur, ZSTD_fCost(price), ZSTD_fCost(opt[cur].price), | |
|
893 | opt[cur].rep[0], opt[cur].rep[1], opt[cur].rep[2]); | |
|
894 | } | |
|
895 | } | |
|
775 | 896 | |
|
776 | 897 | /* last match must start at a minimum distance of 8 from oend */ |
|
777 | 898 | if (inr > ilimit) continue; |
|
778 | 899 | |
|
779 | 900 | if (cur == last_pos) break; |
|
780 | 901 | |
|
781 | if ( (optLevel==0) /*static*/ |
|
|
|
782 | && (opt[cur+1].price <= opt[cur].price) ) |
|
|
|
902 | if ( (optLevel==0) /*static_test*/ | |
|
903 | && (opt[cur+1].price <= opt[cur].price + (BITCOST_MULTIPLIER/2)) ) { | |
|
904 | DEBUGLOG(7, "move to next rPos:%u : price is <=", cur+1); | |
|
783 | 905 | continue; /* skip unpromising positions; about ~+6% speed, -0.01 ratio */ |
|
906 | } | |
|
784 | 907 | |
|
785 | { U32 const ll0 = (opt[cur].mlen != 1); |
|
|
786 | U32 const litlen = (opt[cur].mlen == 1) ? opt[cur].litlen : 0; |
|
|
787 | U32 const previousPrice = (cur > litlen) ? opt[cur-litlen].price : 0; |
|
|
788 | U32 const basePrice = previousPrice + ZSTD_fullLiteralsCost(inr-litlen, litlen, optStatePtr); |
|
|
789 | U32 const nbMatches = ZSTD_BtGetAllMatches(ms, cParams, inr, iend, extDict, opt[cur].rep, ll0, matches, minMatch); |
|
|
908 | { U32 const ll0 = (opt[cur].mlen != 0); | |
|
909 | U32 const litlen = (opt[cur].mlen == 0) ? opt[cur].litlen : 0; | |
|
910 | U32 const previousPrice = opt[cur].price; | |
|
911 | U32 const basePrice = previousPrice + ZSTD_litLengthPrice(0, optStatePtr, optLevel); | |
|
912 | U32 const nbMatches = ZSTD_BtGetAllMatches(ms, inr, iend, dictMode, opt[cur].rep, ll0, matches, minMatch); | |
|
790 | 913 | U32 matchNb; |
|
791 | if (!nbMatches) continue; |
|
|
914 | if (!nbMatches) { | |
|
915 | DEBUGLOG(7, "rPos:%u : no match found", cur); | |
|
916 | continue; | |
|
917 | } | |
|
792 | 918 | |
|
793 | 919 | { U32 const maxML = matches[nbMatches-1].len; |
|
794 | DEBUGLOG(7, "rPos:%u, found %u matches, of maxLength=%u", | |
|
795 | cur, nbMatches, maxML); | |
|
920 | DEBUGLOG(7, "cPos:%zi==rPos:%u, found %u matches, of maxLength=%u", | |
|
921 | inr-istart, cur, nbMatches, maxML); | |
|
796 | 922 | |
|
797 | 923 | if ( (maxML > sufficient_len) |
|
798 | || (cur + maxML >= ZSTD_OPT_NUM) ) { |
|
|
|
799 | best_mlen = maxML; |
|
|
|
800 | best_off = matches[nbMatches-1].off; |
|
|
|
801 | last_pos = cur + 1; |
|
|
924 | || (cur + maxML >= ZSTD_OPT_NUM) ) { | |
|
925 | lastSequence.mlen = maxML; | |
|
926 | lastSequence.off = matches[nbMatches-1].off; | |
|
927 | lastSequence.litlen = litlen; | |
|
928 | cur -= (opt[cur].mlen==0) ? opt[cur].litlen : 0; /* last sequence is actually only literals, fix cur to last match - note : may underflow, in which case, it's first sequence, and it's okay */ | |
|
929 | last_pos = cur + ZSTD_totalLen(lastSequence); | |
|
930 | if (cur > ZSTD_OPT_NUM) cur = 0; /* underflow => first match */ | |
|
802 | 931 | goto _shortestPath; |
|
803 | } |
|
|
|
804 | } | |
|
932 | } } | |
|
805 | 933 | |
|
806 | 934 | /* set prices using matches found at position == cur */ |
|
807 | 935 | for (matchNb = 0; matchNb < nbMatches; matchNb++) { |
@@ -811,81 +939,97 b' size_t ZSTD_compressBlock_opt_generic(ZS' | |||
|
811 | 939 | U32 const startML = (matchNb>0) ? matches[matchNb-1].len+1 : minMatch; |
|
812 | 940 | U32 mlen; |
|
813 | 941 | |
|
814 | DEBUGLOG(7, "testing match %u => offCode=%u, mlen=%u, llen=%u", | |
|
942 | DEBUGLOG(7, "testing match %u => offCode=%4u, mlen=%2u, llen=%2u", | |
|
815 | 943 | matchNb, matches[matchNb].off, lastML, litlen); |
|
816 | 944 | |
|
817 | for (mlen = lastML; mlen >= startML; mlen--) { | |
|
945 | for (mlen = lastML; mlen >= startML; mlen--) { /* scan downward */ | |
|
818 | 946 | U32 const pos = cur + mlen; |
|
819 | 947 | int const price = basePrice + ZSTD_getMatchPrice(offset, mlen, optStatePtr, optLevel); |
|
820 | 948 | |
|
821 | 949 | if ((pos > last_pos) || (price < opt[pos].price)) { |
|
822 | DEBUGLOG(7, "rPos:%u => new better price (%u<%u)", |
|
|
823 | pos, price, opt[pos].price); |
|
|
824 | while (last_pos < pos) { opt[last_pos+1].price = ZSTD_MAX_PRICE; last_pos++; } | |
|
950 | DEBUGLOG(7, "rPos:%u (ml=%2u) => new better price (%.2f<%.2f)", | |
|
951 | pos, mlen, ZSTD_fCost(price), ZSTD_fCost(opt[pos].price)); | |
|
952 | while (last_pos < pos) { opt[last_pos+1].price = ZSTD_MAX_PRICE; last_pos++; } /* fill empty positions */ | |
|
825 | 953 | opt[pos].mlen = mlen; |
|
826 | 954 | opt[pos].off = offset; |
|
827 | 955 | opt[pos].litlen = litlen; |
|
828 | 956 | opt[pos].price = price; |
|
957 | ZSTD_STATIC_ASSERT(sizeof(opt[pos].rep) == sizeof(repHistory)); | |
|
829 | 958 | memcpy(opt[pos].rep, &repHistory, sizeof(repHistory)); |
|
830 | 959 | } else { |
|
831 | if (optLevel==0) break; /* gets ~+10% speed for about -0.01 ratio loss */ | |
|
960 | DEBUGLOG(7, "rPos:%u (ml=%2u) => new price is worse (%.2f>=%.2f)", | |
|
961 | pos, mlen, ZSTD_fCost(price), ZSTD_fCost(opt[pos].price)); | |
|
962 | if (optLevel==0) break; /* early update abort; gets ~+10% speed for about -0.01 ratio loss */ | |
|
832 | 963 | } |
|
833 | 964 | } } } |
|
834 | 965 | } /* for (cur = 1; cur <= last_pos; cur++) */ |
|
835 | 966 | |
|
836 | best_mlen = opt[last_pos].mlen; |
|
|
|
837 | best_off = opt[last_pos].off; | |
|
838 | cur = last_pos - best_mlen; | |
|
967 | lastSequence = opt[last_pos]; | |
|
968 | cur = last_pos > ZSTD_totalLen(lastSequence) ? last_pos - ZSTD_totalLen(lastSequence) : 0; /* single sequence, and it starts before `ip` */ | |
|
969 | assert(cur < ZSTD_OPT_NUM); /* control overflow*/ | |
|
839 | 970 | |
|
840 | 971 | _shortestPath: /* cur, last_pos, best_mlen, best_off have to be set */ |
|
841 | assert(opt[0].mlen == 1); |
|
|
972 | assert(opt[0].mlen == 0); | |
|
973 | ||
|
974 | { U32 const storeEnd = cur + 1; | |
|
975 | U32 storeStart = storeEnd; | |
|
976 | U32 seqPos = cur; | |
|
842 | 977 | |
|
843 | /* reverse traversal */ | |
|
844 | DEBUGLOG(7, "start reverse traversal (last_pos:%u, cur:%u)", | |
|
845 | last_pos, cur); | |
|
846 | { U32 selectedMatchLength = best_mlen; | |
|
847 | U32 selectedOffset = best_off; | |
|
848 | U32 pos = cur; | |
|
849 | while (1) { |
|
|
850 | U32 const mlen = opt[pos].mlen; |
|
|
851 | U32 const off = opt[pos].off; | |
|
852 | opt[pos].mlen = selectedMatchLength; | |
|
853 | opt[pos].off = selectedOffset; | |
|
854 | selectedMatchLength = mlen; | |
|
855 | selectedOffset = off; | |
|
856 | if (mlen > pos) break; | |
|
857 | pos -= mlen; | |
|
858 | } } | |
|
978 | DEBUGLOG(6, "start reverse traversal (last_pos:%u, cur:%u)", | |
|
979 | last_pos, cur); (void)last_pos; | |
|
980 | assert(storeEnd < ZSTD_OPT_NUM); | |
|
981 | DEBUGLOG(6, "last sequence copied into pos=%u (llen=%u,mlen=%u,ofc=%u)", | |
|
982 | storeEnd, lastSequence.litlen, lastSequence.mlen, lastSequence.off); | |
|
983 | opt[storeEnd] = lastSequence; | |
|
984 | while (seqPos > 0) { | |
|
985 | U32 const backDist = ZSTD_totalLen(opt[seqPos]); | |
|
986 | storeStart--; | |
|
987 | DEBUGLOG(6, "sequence from rPos=%u copied into pos=%u (llen=%u,mlen=%u,ofc=%u)", | |
|
988 | seqPos, storeStart, opt[seqPos].litlen, opt[seqPos].mlen, opt[seqPos].off); | |
|
989 | opt[storeStart] = opt[seqPos]; | |
|
990 | seqPos = (seqPos > backDist) ? seqPos - backDist : 0; | |
|
991 | } | |
|
859 | 992 | |
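
The loop above replaces the old in-place reverse traversal: each opt[] cell remembers the (litlen, mlen) step that reached it, so walking back by litlen+mlen recovers the chosen chain, which is copied to the top of the table for forward emission. A toy reconstruction of that walk, with invented positions and a simplified struct:

    #include <stdio.h>
    typedef unsigned U32;
    typedef struct { U32 litlen, mlen; } Step;   /* toy stand-in for ZSTD_optimal_t */

    int main(void) {
        Step opt[16];
        Step store[16];
        Step lastSequence;
        U32 const storeEnd = 15;
        U32 storeStart = storeEnd;
        U32 seqPos = 5;   /* "cur": where the last sequence starts */
        U32 i;

        /* suppose the forward pass reached rPos 9 in two steps:
         * (2 literals + 3-byte match) ending at 5, then (0 + 4) ending at 9 */
        opt[5].litlen = 2; opt[5].mlen = 3;
        lastSequence.litlen = 0; lastSequence.mlen = 4;

        store[storeEnd] = lastSequence;              /* last sequence goes in first */
        while (seqPos > 0) {
            U32 const backDist = opt[seqPos].litlen + opt[seqPos].mlen;
            store[--storeStart] = opt[seqPos];
            seqPos = (seqPos > backDist) ? seqPos - backDist : 0;
        }
        for (i = storeStart; i <= storeEnd; i++)     /* emit in forward order */
            printf("seq: litlen=%u mlen=%u\n", store[i].litlen, store[i].mlen);
        return 0;
    }

Copying into the unused top of the same table is safe because seqPos falls back by at least a whole sequence per step while storeStart only falls by one slot, so the writes can never catch up with entries still waiting to be read.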
|
860 | /* save sequences */ | |
|
861 | { U32 pos; | |
|
862 | for (pos=0; pos < last_pos; ) { | |
|
863 | U32 const llen = (U32)(ip - anchor); | |
|
864 | U32 const mlen = opt[pos].mlen; |
|
|
865 | U32 const offset = opt[pos].off; |
|
|
866 | if (mlen == 1) { ip++; pos++; continue; } /* literal position => move on */ | |
|
867 | pos += mlen; ip += mlen; | |
|
993 | /* save sequences */ | |
|
994 | DEBUGLOG(6, "sending selected sequences into seqStore") | |
|
995 | { U32 storePos; | |
|
996 | for (storePos=storeStart; storePos <= storeEnd; storePos++) { | |
|
997 | U32 const llen = opt[storePos].litlen; | |
|
998 | U32 const mlen = opt[storePos].mlen; | |
|
999 | U32 const offCode = opt[storePos].off; | |
|
1000 | U32 const advance = llen + mlen; | |
|
1001 | DEBUGLOG(6, "considering seq starting at %zi, llen=%u, mlen=%u", | |
|
1002 | anchor - istart, llen, mlen); | |
|
1003 | ||
|
1004 | if (mlen==0) { /* only literals => must be last "sequence", actually starting a new stream of sequences */ | |
|
1005 | assert(storePos == storeEnd); /* must be last sequence */ | |
|
1006 | ip = anchor + llen; /* last "sequence" is a bunch of literals => don't progress anchor */ | |
|
1007 | continue; /* will finish */ | |
|
1008 | } | |
|
868 | 1009 | |
|
869 | /* repcodes update : like ZSTD_updateRep(), but update in place */ | |
|
870 | if (offset >= ZSTD_REP_NUM) { /* full offset */ |
|
|
871 | rep[2] = rep[1]; | |
|
872 | rep[1] = rep[0]; | |
|
873 | rep[0] = offset - ZSTD_REP_MOVE; | |
|
874 | } else { /* repcode */ | |
|
875 | U32 const repCode = offset + (llen==0); | |
|
876 | if (repCode) { /* note : if repCode==0, no change */ | |
|
877 | U32 const currentOffset = (repCode==ZSTD_REP_NUM) ? (rep[0] - 1) : rep[repCode]; | |
|
878 | if (repCode >= 2) rep[2] = rep[1]; | |
|
1010 | /* repcodes update : like ZSTD_updateRep(), but update in place */ | |
|
1011 | if (offCode >= ZSTD_REP_NUM) { /* full offset */ | |
|
1012 | rep[2] = rep[1]; | |
|
879 | 1013 | rep[1] = rep[0]; |
|
880 | rep[0] = currentOffset; |
|
|
881 | } | |
|
882 | } | |
|
1014 | rep[0] = offCode - ZSTD_REP_MOVE; | |
|
1015 | } else { /* repcode */ | |
|
1016 | U32 const repCode = offCode + (llen==0); | |
|
1017 | if (repCode) { /* note : if repCode==0, no change */ | |
|
1018 | U32 const currentOffset = (repCode==ZSTD_REP_NUM) ? (rep[0] - 1) : rep[repCode]; | |
|
1019 | if (repCode >= 2) rep[2] = rep[1]; | |
|
1020 | rep[1] = rep[0]; | |
|
1021 | rep[0] = currentOffset; | |
|
1022 | } } | |
|
883 | 1023 | |
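
The in-place update just above mirrors ZSTD_updateRep(): an offCode at or above ZSTD_REP_NUM encodes a fresh offset (shift the history down), while a smaller offCode selects a recent-offset slot, shifted by one when the sequence carries no literals. A compilable walk-through of the same branches (ZSTD_REP_MOVE is ZSTD_REP_NUM-1 in the sources shown here; the values fed in below are invented):

    #include <stdio.h>
    typedef unsigned U32;
    #define ZSTD_REP_NUM  3
    #define ZSTD_REP_MOVE (ZSTD_REP_NUM - 1)

    /* same logic as the diff above, extracted into a helper */
    static void updateRepInPlace(U32 rep[3], U32 offCode, U32 llen) {
        if (offCode >= ZSTD_REP_NUM) {             /* full offset */
            rep[2] = rep[1];
            rep[1] = rep[0];
            rep[0] = offCode - ZSTD_REP_MOVE;
        } else {                                   /* repcode */
            U32 const repCode = offCode + (llen == 0);
            if (repCode) {                         /* repCode==0 : no change */
                U32 const currentOffset =
                    (repCode == ZSTD_REP_NUM) ? (rep[0] - 1) : rep[repCode];
                if (repCode >= 2) rep[2] = rep[1];
                rep[1] = rep[0];
                rep[0] = currentOffset;
            }
        }
    }

    int main(void) {
        U32 rep[3] = {1, 4, 8};
        updateRepInPlace(rep, 1, 5);       /* repcode with literals: promote rep[1] */
        printf("%u %u %u\n", rep[0], rep[1], rep[2]);   /* 4 1 8 */
        updateRepInPlace(rep, 100 + ZSTD_REP_MOVE, 7);  /* real offset 100 */
        printf("%u %u %u\n", rep[0], rep[1], rep[2]);   /* 100 4 1 */
        return 0;
    }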
|
884 | ZSTD_updateStats(optStatePtr, llen, anchor, offset, mlen); | |
|
885 | ZSTD_storeSeq(seqStore, llen, anchor, offset, mlen-MINMATCH); |
|
|
|
886 | anchor = ip; | |
|
887 | } } | |
|
888 | ZSTD_setLog2Prices(optStatePtr); | |
|
1024 | assert(anchor + llen <= iend); | |
|
1025 | ZSTD_updateStats(optStatePtr, llen, anchor, offCode, mlen); | |
|
1026 | ZSTD_storeSeq(seqStore, llen, anchor, offCode, mlen-MINMATCH); | |
|
1027 | anchor += advance; | |
|
1028 | ip = anchor; | |
|
1029 | } } | |
|
1030 | ZSTD_setBasePrices(optStatePtr, optLevel); | |
|
1031 | } | |
|
1032 | ||
|
889 | 1033 | } /* while (ip < ilimit) */ |
|
890 | 1034 | |
|
891 | 1035 | /* Return the last literals size */ |
@@ -895,29 +1039,94 b' size_t ZSTD_compressBlock_opt_generic(ZS' | |||
|
895 | 1039 | |
|
896 | 1040 | size_t ZSTD_compressBlock_btopt( |
|
897 | 1041 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
898 | ZSTD_compressionParameters const* cParams, const void* src, size_t srcSize) |
|
|
|
1042 | const void* src, size_t srcSize) | |
|
899 | 1043 | { |
|
900 | 1044 | DEBUGLOG(5, "ZSTD_compressBlock_btopt"); |
|
901 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, cParams, src, srcSize, 0 /*optLevel*/, 0 /*extDict*/); |
|
|
1045 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, src, srcSize, 0 /*optLevel*/, ZSTD_noDict); | |
|
1046 | } | |
|
1047 | ||
|
1048 | ||
|
1049 | /* used in 2-pass strategy */ | |
|
1050 | static U32 ZSTD_upscaleStat(U32* table, U32 lastEltIndex, int bonus) | |
|
1051 | { | |
|
1052 | U32 s, sum=0; | |
|
1053 | assert(ZSTD_FREQ_DIV+bonus > 0); | |
|
1054 | for (s=0; s<=lastEltIndex; s++) { | |
|
1055 | table[s] <<= ZSTD_FREQ_DIV+bonus; | |
|
1056 | table[s]--; | |
|
1057 | sum += table[s]; | |
|
1058 | } | |
|
1059 | return sum; | |
|
1060 | } | |
|
1061 | ||
|
1062 | /* used in 2-pass strategy */ | |
|
1063 | MEM_STATIC void ZSTD_upscaleStats(optState_t* optPtr) | |
|
1064 | { | |
|
1065 | optPtr->litSum = ZSTD_upscaleStat(optPtr->litFreq, MaxLit, 0); | |
|
1066 | optPtr->litLengthSum = ZSTD_upscaleStat(optPtr->litLengthFreq, MaxLL, 1); | |
|
1067 | optPtr->matchLengthSum = ZSTD_upscaleStat(optPtr->matchLengthFreq, MaxML, 1); | |
|
1068 | optPtr->offCodeSum = ZSTD_upscaleStat(optPtr->offCodeFreq, MaxOff, 1); | |
|
902 | 1069 | } |
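
ZSTD_upscaleStat() re-inflates the frequency tables collected by the first pass so they dominate the fresh counts of the second pass. A tiny numeric check, assuming ZSTD_FREQ_DIV is 4 (the real constant is defined elsewhere in the library and may differ); counts are taken as >= 1, since a zero entry would wrap when decremented:

    #include <stdio.h>
    typedef unsigned U32;
    #define ZSTD_FREQ_DIV 4   /* assumed value for this sketch */

    static U32 upscaleStat(U32* table, U32 lastEltIndex, int bonus) {
        U32 s, sum = 0;
        for (s = 0; s <= lastEltIndex; s++) {
            table[s] <<= ZSTD_FREQ_DIV + bonus;   /* scale the count up */
            table[s]--;                            /* shave 1, as in the diff */
            sum += table[s];
        }
        return sum;
    }

    int main(void) {
        U32 freq[4] = {1, 2, 5, 8};
        U32 const sum = upscaleStat(freq, 3, 1);   /* shift by 4+1 = 5 bits */
        /* (1<<5)-1=31, (2<<5)-1=63, (5<<5)-1=159, (8<<5)-1=255 */
        printf("sum=%u (expected 31+63+159+255=508)\n", sum);
        return 0;
    }

The bonus parameter lets the caller weight length and offset statistics slightly more heavily than raw literal counts, matching the ZSTD_upscaleStats() calls just above (bonus 0 for literals, 1 for the others).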
|
903 | 1070 | |
|
904 | 1071 | size_t ZSTD_compressBlock_btultra( |
|
905 | 1072 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
906 | ZSTD_compressionParameters const* cParams, const void* src, size_t srcSize) |
|
|
|
1073 | const void* src, size_t srcSize) | |
|
907 | 1074 | { |
|
908 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, cParams, src, srcSize, 2 /*optLevel*/, 0 /*extDict*/); | |
|
1075 | DEBUGLOG(5, "ZSTD_compressBlock_btultra (srcSize=%zu)", srcSize); | |
|
1076 | #if 0 | |
|
1077 | /* 2-pass strategy (disabled) | |
|
1078 | * this strategy makes a first pass over first block to collect statistics | |
|
1079 | * and seed next round's statistics with it. | |
|
1080 | * The compression ratio gain is generally small (~0.5% on first block), | |
|
1081 | * the cost is 2x cpu time on first block. */ | |
|
1082 | assert(srcSize <= ZSTD_BLOCKSIZE_MAX); | |
|
1083 | if ( (ms->opt.litLengthSum==0) /* first block */ | |
|
1084 | && (seqStore->sequences == seqStore->sequencesStart) /* no ldm */ | |
|
1085 | && (ms->window.dictLimit == ms->window.lowLimit) ) { /* no dictionary */ | |
|
1086 | U32 tmpRep[ZSTD_REP_NUM]; | |
|
1087 | DEBUGLOG(5, "ZSTD_compressBlock_btultra: first block: collecting statistics"); | |
|
1088 | assert(ms->nextToUpdate >= ms->window.dictLimit | |
|
1089 | && ms->nextToUpdate <= ms->window.dictLimit + 1); | |
|
1090 | memcpy(tmpRep, rep, sizeof(tmpRep)); | |
|
1091 | ZSTD_compressBlock_opt_generic(ms, seqStore, tmpRep, src, srcSize, 2 /*optLevel*/, ZSTD_noDict); /* generate stats into ms->opt*/ | |
|
1092 | ZSTD_resetSeqStore(seqStore); | |
|
1093 | /* invalidate first scan from history */ | |
|
1094 | ms->window.base -= srcSize; | |
|
1095 | ms->window.dictLimit += (U32)srcSize; | |
|
1096 | ms->window.lowLimit = ms->window.dictLimit; | |
|
1097 | ms->nextToUpdate = ms->window.dictLimit; | |
|
1098 | ms->nextToUpdate3 = ms->window.dictLimit; | |
|
1099 | /* reinforce weight of collected statistics */ |
|
1100 | ZSTD_upscaleStats(&ms->opt); | |
|
1101 | } | |
|
1102 | #endif | |
|
1103 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, src, srcSize, 2 /*optLevel*/, ZSTD_noDict); | |
|
1104 | } | |
|
1105 | ||
|
1106 | size_t ZSTD_compressBlock_btopt_dictMatchState( | |
|
1107 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
1108 | const void* src, size_t srcSize) | |
|
1109 | { | |
|
1110 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, src, srcSize, 0 /*optLevel*/, ZSTD_dictMatchState); | |
|
1111 | } | |
|
1112 | ||
|
1113 | size_t ZSTD_compressBlock_btultra_dictMatchState( | |
|
1114 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
1115 | const void* src, size_t srcSize) | |
|
1116 | { | |
|
1117 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, src, srcSize, 2 /*optLevel*/, ZSTD_dictMatchState); | |
|
909 | 1118 | } |
|
910 | 1119 | |
|
911 | 1120 | size_t ZSTD_compressBlock_btopt_extDict( |
|
912 | 1121 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
913 | ZSTD_compressionParameters const* cParams, const void* src, size_t srcSize) |
|
|
|
1122 | const void* src, size_t srcSize) | |
|
914 | 1123 | { |
|
915 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, cParams, src, srcSize, 0 /*optLevel*/, 1 /*extDict*/); |
|
|
1124 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, src, srcSize, 0 /*optLevel*/, ZSTD_extDict); | |
|
916 | 1125 | } |
|
917 | 1126 | |
|
918 | 1127 | size_t ZSTD_compressBlock_btultra_extDict( |
|
919 | 1128 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
920 | ZSTD_compressionParameters const* cParams, const void* src, size_t srcSize) |
|
|
|
1129 | const void* src, size_t srcSize) | |
|
921 | 1130 | { |
|
922 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, cParams, src, srcSize, 2 /*optLevel*/, 1 /*extDict*/); |
|
|
1131 | return ZSTD_compressBlock_opt_generic(ms, seqStore, rep, src, srcSize, 2 /*optLevel*/, ZSTD_extDict); | |
|
923 | 1132 | } |
@@ -17,23 +17,29 b' extern "C" {' | |||
|
17 | 17 | |
|
18 | 18 | #include "zstd_compress_internal.h" |
|
19 | 19 | |
|
20 | void ZSTD_updateTree( | |
|
21 | ZSTD_matchState_t* ms, ZSTD_compressionParameters const* cParams, | |
|
22 | const BYTE* ip, const BYTE* iend); /* used in ZSTD_loadDictionaryContent() */ | |
|
20 | /* used in ZSTD_loadDictionaryContent() */ | |
|
21 | void ZSTD_updateTree(ZSTD_matchState_t* ms, const BYTE* ip, const BYTE* iend); | |
|
23 | 22 | |
|
24 | 23 | size_t ZSTD_compressBlock_btopt( |
|
25 | 24 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
26 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); |
|
|
|
25 | void const* src, size_t srcSize); | |
|
27 | 26 | size_t ZSTD_compressBlock_btultra( |
|
28 | 27 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
29 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); |
|
|
|
28 | void const* src, size_t srcSize); | |
|
29 | ||
|
30 | size_t ZSTD_compressBlock_btopt_dictMatchState( | |
|
31 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
32 | void const* src, size_t srcSize); | |
|
33 | size_t ZSTD_compressBlock_btultra_dictMatchState( | |
|
34 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], | |
|
35 | void const* src, size_t srcSize); | |
|
30 | 36 | |
|
31 | 37 | size_t ZSTD_compressBlock_btopt_extDict( |
|
32 | 38 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
33 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); |
|
|
|
39 | void const* src, size_t srcSize); | |
|
34 | 40 | size_t ZSTD_compressBlock_btultra_extDict( |
|
35 | 41 | ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], |
|
36 | ZSTD_compressionParameters const* cParams, void const* src, size_t srcSize); |
|
|
|
42 | void const* src, size_t srcSize); | |
|
37 | 43 | |
|
38 | 44 | #if defined (__cplusplus) |
|
39 | 45 | } |
|