123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501 |
- /**
- * Copyright (c) 2016-present, Gregory Szorc
- * All rights reserved.
- *
- * This software may be modified and distributed under the terms
- * of the BSD license. See the LICENSE file for details.
- */
- #include "python-zstandard.h"
- extern PyObject *ZstdError;
- int set_parameter(ZSTD_CCtx_params *params, ZSTD_cParameter param, int value) {
- size_t zresult = ZSTD_CCtxParams_setParameter(params, param, value);
- if (ZSTD_isError(zresult)) {
- PyErr_Format(ZstdError,
- "unable to set compression context parameter: %s",
- ZSTD_getErrorName(zresult));
- return 1;
- }
- return 0;
- }
/* Set one parameter through set_parameter() and return -1 from the enclosing
 * function if that fails (set_parameter() has already set the Python
 * exception). The do/while(0) wrapper makes the expansion a single statement
 * so the macro is safe inside unbraced if/else bodies; callers terminate it
 * with a semicolon. */
#define TRY_SET_PARAMETER(params, param, value)                                \
    do {                                                                       \
        if (set_parameter((params), (param), (value))) {                       \
            return -1;                                                         \
        }                                                                      \
    } while (0)
- #define TRY_COPY_PARAMETER(source, dest, param) \
- { \
- int result; \
- size_t zresult = ZSTD_CCtxParams_getParameter(source, param, &result); \
- if (ZSTD_isError(zresult)) { \
- return 1; \
- } \
- zresult = ZSTD_CCtxParams_setParameter(dest, param, result); \
- if (ZSTD_isError(zresult)) { \
- return 1; \
- } \
- }
- int set_parameters(ZSTD_CCtx_params *params,
- ZstdCompressionParametersObject *obj) {
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_nbWorkers);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_format);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_compressionLevel);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_windowLog);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_hashLog);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_chainLog);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_searchLog);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_minMatch);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_targetLength);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_strategy);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_contentSizeFlag);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_checksumFlag);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_dictIDFlag);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_jobSize);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_overlapLog);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_forceMaxWindow);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_enableLongDistanceMatching);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_ldmHashLog);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_ldmMinMatch);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_ldmBucketSizeLog);
- TRY_COPY_PARAMETER(obj->params, params, ZSTD_c_ldmHashRateLog);
- return 0;
- }
- int reset_params(ZstdCompressionParametersObject *params) {
- if (params->params) {
- ZSTD_CCtxParams_reset(params->params);
- }
- else {
- params->params = ZSTD_createCCtxParams();
- if (!params->params) {
- PyErr_NoMemory();
- return 1;
- }
- }
- return set_parameters(params->params, params);
- }
- #define TRY_GET_PARAMETER(params, param, value) \
- { \
- size_t zresult = ZSTD_CCtxParams_getParameter(params, param, value); \
- if (ZSTD_isError(zresult)) { \
- PyErr_Format(ZstdError, "unable to retrieve parameter: %s", \
- ZSTD_getErrorName(zresult)); \
- return 1; \
- } \
- }
- int to_cparams(ZstdCompressionParametersObject *params,
- ZSTD_compressionParameters *cparams) {
- int value;
- TRY_GET_PARAMETER(params->params, ZSTD_c_windowLog, &value);
- cparams->windowLog = value;
- TRY_GET_PARAMETER(params->params, ZSTD_c_chainLog, &value);
- cparams->chainLog = value;
- TRY_GET_PARAMETER(params->params, ZSTD_c_hashLog, &value);
- cparams->hashLog = value;
- TRY_GET_PARAMETER(params->params, ZSTD_c_searchLog, &value);
- cparams->searchLog = value;
- TRY_GET_PARAMETER(params->params, ZSTD_c_minMatch, &value);
- cparams->minMatch = value;
- TRY_GET_PARAMETER(params->params, ZSTD_c_targetLength, &value);
- cparams->targetLength = value;
- TRY_GET_PARAMETER(params->params, ZSTD_c_strategy, &value);
- cparams->strategy = value;
- return 0;
- }
- static int ZstdCompressionParameters_init(ZstdCompressionParametersObject *self,
- PyObject *args, PyObject *kwargs) {
- static char *kwlist[] = {"format",
- "compression_level",
- "window_log",
- "hash_log",
- "chain_log",
- "search_log",
- "min_match",
- "target_length",
- "strategy",
- "write_content_size",
- "write_checksum",
- "write_dict_id",
- "job_size",
- "overlap_log",
- "force_max_window",
- "enable_ldm",
- "ldm_hash_log",
- "ldm_min_match",
- "ldm_bucket_size_log",
- "ldm_hash_rate_log",
- "threads",
- NULL};
- int format = 0;
- int compressionLevel = 0;
- int windowLog = 0;
- int hashLog = 0;
- int chainLog = 0;
- int searchLog = 0;
- int minMatch = 0;
- int targetLength = 0;
- int strategy = -1;
- int contentSizeFlag = 1;
- int checksumFlag = 0;
- int dictIDFlag = 0;
- int jobSize = 0;
- int overlapLog = -1;
- int forceMaxWindow = 0;
- int enableLDM = 0;
- int ldmHashLog = 0;
- int ldmMinMatch = 0;
- int ldmBucketSizeLog = 0;
- int ldmHashRateLog = -1;
- int threads = 0;
- if (!PyArg_ParseTupleAndKeywords(
- args, kwargs, "|iiiiiiiiiiiiiiiiiiiii:ZstdCompressionParameters",
- kwlist, &format, &compressionLevel, &windowLog, &hashLog, &chainLog,
- &searchLog, &minMatch, &targetLength, &strategy, &contentSizeFlag,
- &checksumFlag, &dictIDFlag, &jobSize, &overlapLog, &forceMaxWindow,
- &enableLDM, &ldmHashLog, &ldmMinMatch, &ldmBucketSizeLog,
- &ldmHashRateLog, &threads)) {
- return -1;
- }
- if (reset_params(self)) {
- return -1;
- }
- if (threads < 0) {
- threads = cpu_count();
- }
- /* We need to set ZSTD_c_nbWorkers before ZSTD_c_jobSize and
- * ZSTD_c_overlapLog because setting ZSTD_c_nbWorkers resets the other
- * parameters. */
- TRY_SET_PARAMETER(self->params, ZSTD_c_nbWorkers, threads);
- TRY_SET_PARAMETER(self->params, ZSTD_c_format, format);
- TRY_SET_PARAMETER(self->params, ZSTD_c_compressionLevel, compressionLevel);
- TRY_SET_PARAMETER(self->params, ZSTD_c_windowLog, windowLog);
- TRY_SET_PARAMETER(self->params, ZSTD_c_hashLog, hashLog);
- TRY_SET_PARAMETER(self->params, ZSTD_c_chainLog, chainLog);
- TRY_SET_PARAMETER(self->params, ZSTD_c_searchLog, searchLog);
- TRY_SET_PARAMETER(self->params, ZSTD_c_minMatch, minMatch);
- TRY_SET_PARAMETER(self->params, ZSTD_c_targetLength, targetLength);
- if (strategy == -1) {
- strategy = 0;
- }
- TRY_SET_PARAMETER(self->params, ZSTD_c_strategy, strategy);
- TRY_SET_PARAMETER(self->params, ZSTD_c_contentSizeFlag, contentSizeFlag);
- TRY_SET_PARAMETER(self->params, ZSTD_c_checksumFlag, checksumFlag);
- TRY_SET_PARAMETER(self->params, ZSTD_c_dictIDFlag, dictIDFlag);
- TRY_SET_PARAMETER(self->params, ZSTD_c_jobSize, jobSize);
- if (overlapLog == -1) {
- overlapLog = 0;
- }
- TRY_SET_PARAMETER(self->params, ZSTD_c_overlapLog, overlapLog);
- TRY_SET_PARAMETER(self->params, ZSTD_c_forceMaxWindow, forceMaxWindow);
- TRY_SET_PARAMETER(self->params, ZSTD_c_enableLongDistanceMatching,
- enableLDM);
- TRY_SET_PARAMETER(self->params, ZSTD_c_ldmHashLog, ldmHashLog);
- TRY_SET_PARAMETER(self->params, ZSTD_c_ldmMinMatch, ldmMinMatch);
- TRY_SET_PARAMETER(self->params, ZSTD_c_ldmBucketSizeLog, ldmBucketSizeLog);
- if (ldmHashRateLog == -1) {
- ldmHashRateLog = 0;
- }
- TRY_SET_PARAMETER(self->params, ZSTD_c_ldmHashRateLog, ldmHashRateLog);
- return 0;
- }
- ZstdCompressionParametersObject *
- CompressionParameters_from_level(PyObject *undef, PyObject *args,
- PyObject *kwargs) {
- int managedKwargs = 0;
- int level;
- PyObject *sourceSize = NULL;
- PyObject *dictSize = NULL;
- unsigned PY_LONG_LONG iSourceSize = 0;
- Py_ssize_t iDictSize = 0;
- PyObject *val;
- ZSTD_compressionParameters params;
- ZstdCompressionParametersObject *result = NULL;
- int res;
- if (!PyArg_ParseTuple(args, "i:from_level", &level)) {
- return NULL;
- }
- if (!kwargs) {
- kwargs = PyDict_New();
- if (!kwargs) {
- return NULL;
- }
- managedKwargs = 1;
- }
- sourceSize = PyDict_GetItemString(kwargs, "source_size");
- if (sourceSize) {
- iSourceSize = PyLong_AsUnsignedLongLong(sourceSize);
- if (iSourceSize == (unsigned PY_LONG_LONG)(-1)) {
- goto cleanup;
- }
- PyDict_DelItemString(kwargs, "source_size");
- }
- dictSize = PyDict_GetItemString(kwargs, "dict_size");
- if (dictSize) {
- iDictSize = PyLong_AsSsize_t(dictSize);
- if (iDictSize == -1) {
- goto cleanup;
- }
- PyDict_DelItemString(kwargs, "dict_size");
- }
- params = ZSTD_getCParams(level, iSourceSize, iDictSize);
- /* Values derived from the input level and sizes are passed along to the
- constructor. But only if a value doesn't already exist. */
- val = PyDict_GetItemString(kwargs, "window_log");
- if (!val) {
- val = PyLong_FromUnsignedLong(params.windowLog);
- if (!val) {
- goto cleanup;
- }
- PyDict_SetItemString(kwargs, "window_log", val);
- Py_DECREF(val);
- }
- val = PyDict_GetItemString(kwargs, "chain_log");
- if (!val) {
- val = PyLong_FromUnsignedLong(params.chainLog);
- if (!val) {
- goto cleanup;
- }
- PyDict_SetItemString(kwargs, "chain_log", val);
- Py_DECREF(val);
- }
- val = PyDict_GetItemString(kwargs, "hash_log");
- if (!val) {
- val = PyLong_FromUnsignedLong(params.hashLog);
- if (!val) {
- goto cleanup;
- }
- PyDict_SetItemString(kwargs, "hash_log", val);
- Py_DECREF(val);
- }
- val = PyDict_GetItemString(kwargs, "search_log");
- if (!val) {
- val = PyLong_FromUnsignedLong(params.searchLog);
- if (!val) {
- goto cleanup;
- }
- PyDict_SetItemString(kwargs, "search_log", val);
- Py_DECREF(val);
- }
- val = PyDict_GetItemString(kwargs, "min_match");
- if (!val) {
- val = PyLong_FromUnsignedLong(params.minMatch);
- if (!val) {
- goto cleanup;
- }
- PyDict_SetItemString(kwargs, "min_match", val);
- Py_DECREF(val);
- }
- val = PyDict_GetItemString(kwargs, "target_length");
- if (!val) {
- val = PyLong_FromUnsignedLong(params.targetLength);
- if (!val) {
- goto cleanup;
- }
- PyDict_SetItemString(kwargs, "target_length", val);
- Py_DECREF(val);
- }
- val = PyDict_GetItemString(kwargs, "strategy");
- if (!val) {
- val = PyLong_FromUnsignedLong(params.strategy);
- if (!val) {
- goto cleanup;
- }
- PyDict_SetItemString(kwargs, "strategy", val);
- Py_DECREF(val);
- }
- result = PyObject_New(ZstdCompressionParametersObject,
- ZstdCompressionParametersType);
- if (!result) {
- goto cleanup;
- }
- result->params = NULL;
- val = PyTuple_New(0);
- if (!val) {
- Py_CLEAR(result);
- goto cleanup;
- }
- res = ZstdCompressionParameters_init(result, val, kwargs);
- Py_DECREF(val);
- if (res) {
- Py_CLEAR(result);
- goto cleanup;
- }
- cleanup:
- if (managedKwargs) {
- Py_DECREF(kwargs);
- }
- return result;
- }
- PyObject *ZstdCompressionParameters_estimated_compression_context_size(
- ZstdCompressionParametersObject *self) {
- return PyLong_FromSize_t(
- ZSTD_estimateCCtxSize_usingCCtxParams(self->params));
- }
- static void
- ZstdCompressionParameters_dealloc(ZstdCompressionParametersObject *self) {
- if (self->params) {
- ZSTD_freeCCtxParams(self->params);
- self->params = NULL;
- }
- PyObject_Del(self);
- }
- #define PARAM_GETTER(name, param) \
- PyObject *ZstdCompressionParameters_get_##name(PyObject *self, \
- void *unused) { \
- int result; \
- size_t zresult; \
- ZstdCompressionParametersObject *p = \
- (ZstdCompressionParametersObject *)(self); \
- zresult = ZSTD_CCtxParams_getParameter(p->params, param, &result); \
- if (ZSTD_isError(zresult)) { \
- PyErr_Format(ZstdError, "unable to get compression parameter: %s", \
- ZSTD_getErrorName(zresult)); \
- return NULL; \
- } \
- return PyLong_FromLong(result); \
- }
- PARAM_GETTER(format, ZSTD_c_format)
- PARAM_GETTER(compression_level, ZSTD_c_compressionLevel)
- PARAM_GETTER(window_log, ZSTD_c_windowLog)
- PARAM_GETTER(hash_log, ZSTD_c_hashLog)
- PARAM_GETTER(chain_log, ZSTD_c_chainLog)
- PARAM_GETTER(search_log, ZSTD_c_searchLog)
- PARAM_GETTER(min_match, ZSTD_c_minMatch)
- PARAM_GETTER(target_length, ZSTD_c_targetLength)
- PARAM_GETTER(strategy, ZSTD_c_strategy)
- PARAM_GETTER(write_content_size, ZSTD_c_contentSizeFlag)
- PARAM_GETTER(write_checksum, ZSTD_c_checksumFlag)
- PARAM_GETTER(write_dict_id, ZSTD_c_dictIDFlag)
- PARAM_GETTER(job_size, ZSTD_c_jobSize)
- PARAM_GETTER(overlap_log, ZSTD_c_overlapLog)
- PARAM_GETTER(force_max_window, ZSTD_c_forceMaxWindow)
- PARAM_GETTER(enable_ldm, ZSTD_c_enableLongDistanceMatching)
- PARAM_GETTER(ldm_hash_log, ZSTD_c_ldmHashLog)
- PARAM_GETTER(ldm_min_match, ZSTD_c_ldmMinMatch)
- PARAM_GETTER(ldm_bucket_size_log, ZSTD_c_ldmBucketSizeLog)
- PARAM_GETTER(ldm_hash_rate_log, ZSTD_c_ldmHashRateLog)
- PARAM_GETTER(threads, ZSTD_c_nbWorkers)
- static PyMethodDef ZstdCompressionParameters_methods[] = {
- {"from_level", (PyCFunction)CompressionParameters_from_level,
- METH_VARARGS | METH_KEYWORDS | METH_STATIC, NULL},
- {"estimated_compression_context_size",
- (PyCFunction)ZstdCompressionParameters_estimated_compression_context_size,
- METH_NOARGS, NULL},
- {NULL, NULL}};
- #define GET_SET_ENTRY(name) \
- { #name, ZstdCompressionParameters_get_##name, NULL, NULL, NULL }
- static PyGetSetDef ZstdCompressionParameters_getset[] = {
- GET_SET_ENTRY(format),
- GET_SET_ENTRY(compression_level),
- GET_SET_ENTRY(window_log),
- GET_SET_ENTRY(hash_log),
- GET_SET_ENTRY(chain_log),
- GET_SET_ENTRY(search_log),
- GET_SET_ENTRY(min_match),
- GET_SET_ENTRY(target_length),
- GET_SET_ENTRY(strategy),
- GET_SET_ENTRY(write_content_size),
- GET_SET_ENTRY(write_checksum),
- GET_SET_ENTRY(write_dict_id),
- GET_SET_ENTRY(threads),
- GET_SET_ENTRY(job_size),
- GET_SET_ENTRY(overlap_log),
- GET_SET_ENTRY(force_max_window),
- GET_SET_ENTRY(enable_ldm),
- GET_SET_ENTRY(ldm_hash_log),
- GET_SET_ENTRY(ldm_min_match),
- GET_SET_ENTRY(ldm_bucket_size_log),
- GET_SET_ENTRY(ldm_hash_rate_log),
- {NULL}};
- PyType_Slot ZstdCompressionParametersSlots[] = {
- {Py_tp_dealloc, ZstdCompressionParameters_dealloc},
- {Py_tp_methods, ZstdCompressionParameters_methods},
- {Py_tp_getset, ZstdCompressionParameters_getset},
- {Py_tp_init, ZstdCompressionParameters_init},
- {Py_tp_new, PyType_GenericNew},
- {0, NULL},
- };
- PyType_Spec ZstdCompressionParametersSpec = {
- "zstd.ZstdCompressionParameters",
- sizeof(ZstdCompressionParametersObject),
- 0,
- Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE,
- ZstdCompressionParametersSlots,
- };
- PyTypeObject *ZstdCompressionParametersType;
- void compressionparams_module_init(PyObject *mod) {
- ZstdCompressionParametersType =
- (PyTypeObject *)PyType_FromSpec(&ZstdCompressionParametersSpec);
- if (PyType_Ready(ZstdCompressionParametersType) < 0) {
- return;
- }
- Py_INCREF(ZstdCompressionParametersType);
- PyModule_AddObject(mod, "ZstdCompressionParameters",
- (PyObject *)ZstdCompressionParametersType);
- }
|