inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 1 | /* |
Yann Collet | 4ded9e5 | 2016-08-30 10:04:33 -0700 | [diff] [blame] | 2 | * Copyright (c) 2016-present, Yann Collet, Facebook, Inc. |
| 3 | * All rights reserved. |
| 4 | * |
| 5 | * This source code is licensed under the BSD-style license found in the |
| 6 | * LICENSE file in the root directory of this source tree. An additional grant |
| 7 | * of patent rights can be found in the PATENTS file in the same directory. |
| 8 | */ |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 9 | |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 10 | #if defined (__cplusplus) |
| 11 | extern "C" { |
| 12 | #endif |
| 13 | |
Nick Terrell | 05c00f2 | 2016-11-29 11:46:37 -0800 | [diff] [blame] | 14 | #ifndef ZSTD_H_235446 |
| 15 | #define ZSTD_H_235446 |
| 16 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 17 | /* ====== Dependency ======*/ |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 18 | #include <stddef.h> /* size_t */ |
| 19 | |
| 20 | |
Yann Collet | 426a9d4 | 2016-12-07 16:39:34 -0800 | [diff] [blame] | 21 | /* ===== ZSTDLIB_API : control library symbols visibility ===== */ |
| 22 | #if defined(__GNUC__) && (__GNUC__ >= 4) |
Nick Terrell | 8de46ab | 2016-12-16 13:27:30 -0800 | [diff] [blame] | 23 | # define ZSTDLIB_VISIBILITY __attribute__ ((visibility ("default"))) |
Christophe Chevalier | c6e8453 | 2015-12-07 17:44:09 +0100 | [diff] [blame] | 24 | #else |
Nick Terrell | 8de46ab | 2016-12-16 13:27:30 -0800 | [diff] [blame] | 25 | # define ZSTDLIB_VISIBILITY |
| 26 | #endif |
| 27 | #if defined(ZSTD_DLL_EXPORT) && (ZSTD_DLL_EXPORT==1) |
| 28 | # define ZSTDLIB_API __declspec(dllexport) ZSTDLIB_VISIBILITY |
| 29 | #elif defined(ZSTD_DLL_IMPORT) && (ZSTD_DLL_IMPORT==1) |
| 30 | # define ZSTDLIB_API __declspec(dllimport) ZSTDLIB_VISIBILITY /* It isn't required but allows to generate better code, saving a function pointer load from the IAT and an indirect jump.*/ |
| 31 | #else |
| 32 | # define ZSTDLIB_API ZSTDLIB_VISIBILITY |
Christophe Chevalier | c6e8453 | 2015-12-07 17:44:09 +0100 | [diff] [blame] | 33 | #endif |
| 34 | |
| 35 | |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 36 | /******************************************************************************************************* |
| 37 | Introduction |
| 38 | |
Yann Collet | 37d1300 | 2016-10-24 17:22:12 -0700 | [diff] [blame] | 39 | zstd, short for Zstandard, is a fast lossless compression algorithm, targeting real-time compression scenarios |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 40 | at zlib-level and better compression ratios. The zstd compression library provides in-memory compression and |
| 41 | decompression functions. The library supports compression levels from 1 up to ZSTD_maxCLevel() which is 22. |
Anders Oleson | 517577b | 2017-02-20 12:08:59 -0800 | [diff] [blame] | 42 | Levels >= 20, labeled `--ultra`, should be used with caution, as they require more memory. |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 43 | Compression can be done in: |
| 44 | - a single step (described as Simple API) |
| 45 | - a single step, reusing a context (described as Explicit memory management) |
Yann Collet | 37d1300 | 2016-10-24 17:22:12 -0700 | [diff] [blame] | 46 | - unbounded multiple steps (described as Streaming compression) |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 47 | The compression ratio achievable on small data can be highly improved using compression with a dictionary in: |
| 48 | - a single step (described as Simple dictionary API) |
Przemyslaw Skibinski | 984b66c | 2016-10-24 15:59:51 +0200 | [diff] [blame] | 49 | - a single step, reusing a dictionary (described as Fast dictionary API) |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 50 | |
Yann Collet | 37d1300 | 2016-10-24 17:22:12 -0700 | [diff] [blame] | 51 | Advanced experimental functions can be accessed using #define ZSTD_STATIC_LINKING_ONLY before including zstd.h. |
| 52 | These APIs shall never be used with a dynamic library. |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 53 | They are not "stable", their definition may change in the future. Only static linking is allowed. |
| 54 | *********************************************************************************************************/ |
| 55 | |
| 56 | /*------ Version ------*/ |
Yann Collet | 901e85f | 2016-08-31 07:51:25 -0700 | [diff] [blame] | 57 | #define ZSTD_VERSION_MAJOR 1 |
Yann Collet | 1eb2fdc | 2016-09-18 12:21:47 +0200 | [diff] [blame] | 58 | #define ZSTD_VERSION_MINOR 1 |
Yann Collet | f3dfcdc | 2017-03-21 12:18:28 -0700 | [diff] [blame] | 59 | #define ZSTD_VERSION_RELEASE 5 |
Yann Collet | e02808f | 2016-04-20 22:46:16 +0200 | [diff] [blame] | 60 | |
| 61 | #define ZSTD_LIB_VERSION ZSTD_VERSION_MAJOR.ZSTD_VERSION_MINOR.ZSTD_VERSION_RELEASE |
| 62 | #define ZSTD_QUOTE(str) #str |
| 63 | #define ZSTD_EXPAND_AND_QUOTE(str) ZSTD_QUOTE(str) |
| 64 | #define ZSTD_VERSION_STRING ZSTD_EXPAND_AND_QUOTE(ZSTD_LIB_VERSION) |
| 65 | |
Yann Collet | 213089c | 2015-06-18 07:43:16 -0800 | [diff] [blame] | 66 | #define ZSTD_VERSION_NUMBER (ZSTD_VERSION_MAJOR *100*100 + ZSTD_VERSION_MINOR *100 + ZSTD_VERSION_RELEASE) |
Yann Collet | 379908b | 2016-12-06 10:36:15 -0800 | [diff] [blame] | 67 | ZSTDLIB_API unsigned ZSTD_versionNumber(void); /**< library version number; to be used when checking dll version */ |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 68 | |
| 69 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 70 | /*************************************** |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 71 | * Simple API |
Yann Collet | 7010c27 | 2015-10-21 09:07:25 +0100 | [diff] [blame] | 72 | ***************************************/ |
Yann Collet | 953ce72 | 2016-02-04 15:28:14 +0100 | [diff] [blame] | 73 | /*! ZSTD_compress() : |
Yann Collet | 71ddeb6 | 2017-04-20 22:54:54 -0700 | [diff] [blame] | 74 | * Compresses `src` content as a single zstd compressed frame into already allocated `dst`. |
| 75 | * Hint : compression runs faster if `dstCapacity` >= `ZSTD_compressBound(srcSize)`. |
| 76 | * @return : compressed size written into `dst` (<= `dstCapacity`), |
| 77 | * or an error code if it fails (which can be tested using ZSTD_isError()). */ |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 78 | ZSTDLIB_API size_t ZSTD_compress( void* dst, size_t dstCapacity, |
| 79 | const void* src, size_t srcSize, |
| 80 | int compressionLevel); |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 81 | |
Yann Collet | 953ce72 | 2016-02-04 15:28:14 +0100 | [diff] [blame] | 82 | /*! ZSTD_decompress() : |
Yann Collet | 71ddeb6 | 2017-04-20 22:54:54 -0700 | [diff] [blame] | 83 | * `compressedSize` : must be the _exact_ size of some number of compressed and/or skippable frames. |
| 84 | * `dstCapacity` is an upper bound of originalSize. |
| 85 | * If the user cannot determine an upper bound, it's better to use streaming mode to decompress data. |
| 86 | * @return : the number of bytes decompressed into `dst` (<= `dstCapacity`), |
| 87 | * or an error code if it fails (which can be tested using ZSTD_isError()). */ |
Yann Collet | 7d968c7 | 2016-02-03 02:11:32 +0100 | [diff] [blame] | 88 | ZSTDLIB_API size_t ZSTD_decompress( void* dst, size_t dstCapacity, |
Christophe Chevalier | c6e8453 | 2015-12-07 17:44:09 +0100 | [diff] [blame] | 89 | const void* src, size_t compressedSize); |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 90 | |
Yann Collet | ac175d4 | 2016-09-13 00:51:47 +0200 | [diff] [blame] | 91 | /*! ZSTD_getDecompressedSize() : |
Yann Collet | 71ddeb6 | 2017-04-20 22:54:54 -0700 | [diff] [blame] | 92 | * NOTE: This function is planned to be obsolete, in favour of ZSTD_getFrameContentSize. |
| 93 | * ZSTD_getFrameContentSize functions the same way, returning the decompressed size of a single |
| 94 | * frame, but distinguishes empty frames from frames with an unknown size, or errors. |
| 95 | * |
| 96 | * Additionally, ZSTD_findDecompressedSize can be used instead. It can handle multiple |
| 97 | * concatenated frames in one buffer, and so is more general. |
| 98 | * As a result however, it requires more computation and entire frames to be passed to it, |
| 99 | * as opposed to ZSTD_getFrameContentSize which requires only a single frame's header. |
| 100 | * |
| 101 | * 'src' is the start of a zstd compressed frame. |
| 102 | * @return : content size to be decompressed, as a 64-bit value _if known_, 0 otherwise. |
| 103 | * note 1 : decompressed size is an optional field, that may not be present, especially in streaming mode. |
| 104 | * When `return==0`, data to decompress could be any size. |
| 105 | * In which case, it's necessary to use streaming mode to decompress data. |
| 106 | * Optionally, application can still use ZSTD_decompress() while relying on implied limits. |
| 107 | * (For example, data may be necessarily cut into blocks <= 16 KB). |
| 108 | * note 2 : decompressed size is always present when compression is done with ZSTD_compress() |
| 109 | * note 3 : decompressed size can be very large (64-bit value), |
| 110 | * potentially larger than what local system can handle as a single memory segment. |
| 111 | * In which case, it's necessary to use streaming mode to decompress data. |
| 112 | * note 4 : If source is untrusted, decompressed size could be wrong or intentionally modified. |
| 113 | * Always ensure result fits within application's authorized limits. |
| 114 | * Each application can set its own limits. |
| 115 | * note 5 : when `return==0`, if precise failure cause is needed, use ZSTD_getFrameParams() to know more. */ |
Yann Collet | ac175d4 | 2016-09-13 00:51:47 +0200 | [diff] [blame] | 116 | ZSTDLIB_API unsigned long long ZSTD_getDecompressedSize(const void* src, size_t srcSize); |
| 117 | |
Yann Collet | 4110534 | 2016-07-27 15:09:11 +0200 | [diff] [blame] | 118 | |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 119 | /*====== Helper functions ======*/ |
Yann Collet | 4110534 | 2016-07-27 15:09:11 +0200 | [diff] [blame] | 120 | ZSTDLIB_API int ZSTD_maxCLevel(void); /*!< maximum compression level available */ |
| 121 | ZSTDLIB_API size_t ZSTD_compressBound(size_t srcSize); /*!< maximum compressed size in worst case scenario */ |
Yann Collet | 953ce72 | 2016-02-04 15:28:14 +0100 | [diff] [blame] | 122 | ZSTDLIB_API unsigned ZSTD_isError(size_t code); /*!< tells if a `size_t` function result is an error code */ |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 123 | ZSTDLIB_API const char* ZSTD_getErrorName(size_t code); /*!< provides readable string from an error code */ |
Yann Collet | 7010c27 | 2015-10-21 09:07:25 +0100 | [diff] [blame] | 124 | |
| 125 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 126 | /*************************************** |
Yann Collet | 7d968c7 | 2016-02-03 02:11:32 +0100 | [diff] [blame] | 127 | * Explicit memory management |
Yann Collet | 7010c27 | 2015-10-21 09:07:25 +0100 | [diff] [blame] | 128 | ***************************************/ |
Yann Collet | 37d1300 | 2016-10-24 17:22:12 -0700 | [diff] [blame] | 129 | /*= Compression context |
Yann Collet | 71ddeb6 | 2017-04-20 22:54:54 -0700 | [diff] [blame] | 130 | * When compressing many times, |
| 131 | * it is recommended to allocate a context just once, and re-use it for each successive compression operation. |
| 132 | * This will make workload friendlier for system's memory. |
| 133 | * Use one context per thread for parallel execution in multi-threaded environments. */ |
Yann Collet | 87c18b2 | 2016-08-26 01:43:47 +0200 | [diff] [blame] | 134 | typedef struct ZSTD_CCtx_s ZSTD_CCtx; |
Christophe Chevalier | c6e8453 | 2015-12-07 17:44:09 +0100 | [diff] [blame] | 135 | ZSTDLIB_API ZSTD_CCtx* ZSTD_createCCtx(void); |
Yann Collet | d469a98 | 2016-07-28 03:47:45 +0200 | [diff] [blame] | 136 | ZSTDLIB_API size_t ZSTD_freeCCtx(ZSTD_CCtx* cctx); |
Yann Collet | 7010c27 | 2015-10-21 09:07:25 +0100 | [diff] [blame] | 137 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 138 | /*! ZSTD_compressCCtx() : |
Yann Collet | 71ddeb6 | 2017-04-20 22:54:54 -0700 | [diff] [blame] | 139 | * Same as ZSTD_compress(), requires an allocated ZSTD_CCtx (see ZSTD_createCCtx()). */ |
Yann Collet | 7d968c7 | 2016-02-03 02:11:32 +0100 | [diff] [blame] | 140 | ZSTDLIB_API size_t ZSTD_compressCCtx(ZSTD_CCtx* ctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize, int compressionLevel); |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 141 | |
Sean Purcell | dec2b96 | 2017-03-14 11:24:09 -0700 | [diff] [blame] | 142 | /*= Decompression context |
Yann Collet | 71ddeb6 | 2017-04-20 22:54:54 -0700 | [diff] [blame] | 143 | * When decompressing many times, |
| 144 | * it is recommended to allocate a context just once, and re-use it for each successive decompression operation. |
| 145 | * This will make workload friendlier for system's memory. |
| 146 | * Use one context per thread for parallel execution in multi-threaded environments. */ |
Yann Collet | 87c18b2 | 2016-08-26 01:43:47 +0200 | [diff] [blame] | 147 | typedef struct ZSTD_DCtx_s ZSTD_DCtx; |
Yann Collet | ecd651b | 2016-01-07 15:35:18 +0100 | [diff] [blame] | 148 | ZSTDLIB_API ZSTD_DCtx* ZSTD_createDCtx(void); |
Yann Collet | d469a98 | 2016-07-28 03:47:45 +0200 | [diff] [blame] | 149 | ZSTDLIB_API size_t ZSTD_freeDCtx(ZSTD_DCtx* dctx); |
Yann Collet | ecd651b | 2016-01-07 15:35:18 +0100 | [diff] [blame] | 150 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 151 | /*! ZSTD_decompressDCtx() : |
Yann Collet | 71ddeb6 | 2017-04-20 22:54:54 -0700 | [diff] [blame] | 152 | * Same as ZSTD_decompress(), requires an allocated ZSTD_DCtx (see ZSTD_createDCtx()). */ |
Yann Collet | 7d968c7 | 2016-02-03 02:11:32 +0100 | [diff] [blame] | 153 | ZSTDLIB_API size_t ZSTD_decompressDCtx(ZSTD_DCtx* ctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); |
| 154 | |
| 155 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 156 | /************************** |
Yann Collet | 302fb53 | 2016-06-07 12:16:49 +0200 | [diff] [blame] | 157 | * Simple dictionary API |
| 158 | ***************************/ |
Yann Collet | 953ce72 | 2016-02-04 15:28:14 +0100 | [diff] [blame] | 159 | /*! ZSTD_compress_usingDict() : |
Yann Collet | d469a98 | 2016-07-28 03:47:45 +0200 | [diff] [blame] | 160 | * Compression using a predefined Dictionary (see dictBuilder/zdict.h). |
Nick Terrell | d82efd8 | 2016-11-02 16:47:53 -0700 | [diff] [blame] | 161 | * Note : This function loads the dictionary, resulting in significant startup delay. |
| 162 | * Note : When `dict == NULL || dictSize < 8` no dictionary is used. */ |
Yann Collet | 7d968c7 | 2016-02-03 02:11:32 +0100 | [diff] [blame] | 163 | ZSTDLIB_API size_t ZSTD_compress_usingDict(ZSTD_CCtx* ctx, |
| 164 | void* dst, size_t dstCapacity, |
| 165 | const void* src, size_t srcSize, |
| 166 | const void* dict,size_t dictSize, |
| 167 | int compressionLevel); |
| 168 | |
Yann Collet | 953ce72 | 2016-02-04 15:28:14 +0100 | [diff] [blame] | 169 | /*! ZSTD_decompress_usingDict() : |
Yann Collet | d469a98 | 2016-07-28 03:47:45 +0200 | [diff] [blame] | 170 | * Decompression using a predefined Dictionary (see dictBuilder/zdict.h). |
Yann Collet | 81e13ef | 2016-06-07 00:51:51 +0200 | [diff] [blame] | 171 | * Dictionary must be identical to the one used during compression. |
Nick Terrell | d82efd8 | 2016-11-02 16:47:53 -0700 | [diff] [blame] | 172 | * Note : This function loads the dictionary, resulting in significant startup delay. |
| 173 | * Note : When `dict == NULL || dictSize < 8` no dictionary is used. */ |
Yann Collet | 7d968c7 | 2016-02-03 02:11:32 +0100 | [diff] [blame] | 174 | ZSTDLIB_API size_t ZSTD_decompress_usingDict(ZSTD_DCtx* dctx, |
| 175 | void* dst, size_t dstCapacity, |
| 176 | const void* src, size_t srcSize, |
| 177 | const void* dict,size_t dictSize); |
Yann Collet | ecd651b | 2016-01-07 15:35:18 +0100 | [diff] [blame] | 178 | |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 179 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 180 | /**************************** |
Przemyslaw Skibinski | 984b66c | 2016-10-24 15:59:51 +0200 | [diff] [blame] | 181 | * Fast dictionary API |
Yann Collet | 302fb53 | 2016-06-07 12:16:49 +0200 | [diff] [blame] | 182 | ****************************/ |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 183 | typedef struct ZSTD_CDict_s ZSTD_CDict; |
| 184 | |
Yann Collet | 302fb53 | 2016-06-07 12:16:49 +0200 | [diff] [blame] | 185 | /*! ZSTD_createCDict() : |
Yann Collet | 37d1300 | 2016-10-24 17:22:12 -0700 | [diff] [blame] | 186 | * When compressing multiple messages / blocks with the same dictionary, it's recommended to load it just once. |
| 187 | * ZSTD_createCDict() will create a digested dictionary, ready to start future compression operations without startup delay. |
| 188 | * ZSTD_CDict can be created once and used by multiple threads concurrently, as its usage is read-only. |
Yann Collet | 1f57c2e | 2016-12-21 16:20:11 +0100 | [diff] [blame] | 189 | * `dictBuffer` can be released after ZSTD_CDict creation, as its content is copied within CDict */ |
| 190 | ZSTDLIB_API ZSTD_CDict* ZSTD_createCDict(const void* dictBuffer, size_t dictSize, int compressionLevel); |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 191 | |
| 192 | /*! ZSTD_freeCDict() : |
Nick Terrell | d82efd8 | 2016-11-02 16:47:53 -0700 | [diff] [blame] | 193 | * Function frees memory allocated by ZSTD_createCDict(). */ |
Yann Collet | 302fb53 | 2016-06-07 12:16:49 +0200 | [diff] [blame] | 194 | ZSTDLIB_API size_t ZSTD_freeCDict(ZSTD_CDict* CDict); |
| 195 | |
| 196 | /*! ZSTD_compress_usingCDict() : |
Yann Collet | 4f81818 | 2017-04-17 17:57:35 -0700 | [diff] [blame] | 197 | * Compression using a digested Dictionary. |
| 198 | * Faster startup than ZSTD_compress_usingDict(), recommended when same dictionary is used multiple times. |
| 199 | * Note that compression level is decided during dictionary creation. |
| 200 | * Frame parameters are hardcoded (dictID=yes, contentSize=yes, checksum=no) */ |
Yann Collet | 302fb53 | 2016-06-07 12:16:49 +0200 | [diff] [blame] | 201 | ZSTDLIB_API size_t ZSTD_compress_usingCDict(ZSTD_CCtx* cctx, |
| 202 | void* dst, size_t dstCapacity, |
| 203 | const void* src, size_t srcSize, |
| 204 | const ZSTD_CDict* cdict); |
| 205 | |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 206 | |
| 207 | typedef struct ZSTD_DDict_s ZSTD_DDict; |
| 208 | |
Yann Collet | 302fb53 | 2016-06-07 12:16:49 +0200 | [diff] [blame] | 209 | /*! ZSTD_createDDict() : |
| 210 | * Create a digested dictionary, ready to start decompression operation without startup delay. |
Yann Collet | 4e5eea6 | 2016-12-21 16:44:35 +0100 | [diff] [blame] | 211 | * dictBuffer can be released after DDict creation, as its content is copied inside DDict */ |
| 212 | ZSTDLIB_API ZSTD_DDict* ZSTD_createDDict(const void* dictBuffer, size_t dictSize); |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 213 | |
| 214 | /*! ZSTD_freeDDict() : |
| 215 | * Function frees memory allocated with ZSTD_createDDict() */ |
Yann Collet | 302fb53 | 2016-06-07 12:16:49 +0200 | [diff] [blame] | 216 | ZSTDLIB_API size_t ZSTD_freeDDict(ZSTD_DDict* ddict); |
| 217 | |
| 218 | /*! ZSTD_decompress_usingDDict() : |
Nick Terrell | d82efd8 | 2016-11-02 16:47:53 -0700 | [diff] [blame] | 219 | * Decompression using a digested Dictionary. |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 220 | * Faster startup than ZSTD_decompress_usingDict(), recommended when same dictionary is used multiple times. */ |
Yann Collet | 302fb53 | 2016-06-07 12:16:49 +0200 | [diff] [blame] | 221 | ZSTDLIB_API size_t ZSTD_decompress_usingDDict(ZSTD_DCtx* dctx, |
| 222 | void* dst, size_t dstCapacity, |
| 223 | const void* src, size_t srcSize, |
| 224 | const ZSTD_DDict* ddict); |
| 225 | |
| 226 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 227 | /**************************** |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 228 | * Streaming |
| 229 | ****************************/ |
| 230 | |
| 231 | typedef struct ZSTD_inBuffer_s { |
| 232 | const void* src; /**< start of input buffer */ |
| 233 | size_t size; /**< size of input buffer */ |
| 234 | size_t pos; /**< position where reading stopped. Will be updated. Necessarily 0 <= pos <= size */ |
| 235 | } ZSTD_inBuffer; |
| 236 | |
| 237 | typedef struct ZSTD_outBuffer_s { |
| 238 | void* dst; /**< start of output buffer */ |
| 239 | size_t size; /**< size of output buffer */ |
| 240 | size_t pos; /**< position where writing stopped. Will be updated. Necessarily 0 <= pos <= size */ |
| 241 | } ZSTD_outBuffer; |
| 242 | |
| 243 | |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 244 | |
inikep | ba1db37 | 2016-10-06 14:22:48 +0200 | [diff] [blame] | 245 | /*-*********************************************************************** |
Przemyslaw Skibinski | 984b66c | 2016-10-24 15:59:51 +0200 | [diff] [blame] | 246 | * Streaming compression - HowTo |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 247 | * |
| 248 | * A ZSTD_CStream object is required to track streaming operation. |
| 249 | * Use ZSTD_createCStream() and ZSTD_freeCStream() to create/release resources. |
| 250 | * ZSTD_CStream objects can be reused multiple times on consecutive compression operations. |
Yann Collet | 37d1300 | 2016-10-24 17:22:12 -0700 | [diff] [blame] | 251 | * It is recommended to re-use ZSTD_CStream in situations where many streaming operations will be performed consecutively, |
| 252 | * since it will play nicer with system's memory, by re-using already allocated memory. |
| 253 | * Use one separate ZSTD_CStream per thread for parallel execution. |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 254 | * |
Yann Collet | 37d1300 | 2016-10-24 17:22:12 -0700 | [diff] [blame] | 255 | * Start a new compression by initializing ZSTD_CStream. |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 256 | * Use ZSTD_initCStream() to start a new compression operation. |
Yann Collet | e795c8a | 2016-12-13 16:39:36 +0100 | [diff] [blame] | 257 | * Use ZSTD_initCStream_usingDict() or ZSTD_initCStream_usingCDict() for a compression which requires a dictionary (experimental section) |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 258 | * |
| 259 | * Use ZSTD_compressStream() repetitively to consume input stream. |
Yann Collet | fa72f6b | 2016-09-05 17:39:56 +0200 | [diff] [blame] | 260 | * The function will automatically update both `pos` fields. |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 261 | * Note that it may not consume the entire input, in which case `pos < size`, |
| 262 | * and it's up to the caller to present again remaining data. |
Yann Collet | 4bf317d | 2016-08-28 07:43:34 -0700 | [diff] [blame] | 263 | * @return : a size hint, preferred nb of bytes to use as input for next function call |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 264 | * or an error code, which can be tested using ZSTD_isError(). |
Yann Collet | e795c8a | 2016-12-13 16:39:36 +0100 | [diff] [blame] | 265 | * Note 1 : it's just a hint, to help latency a little, any other value will work fine. |
| 266 | * Note 2 : size hint is guaranteed to be <= ZSTD_CStreamInSize() |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 267 | * |
Yann Collet | e795c8a | 2016-12-13 16:39:36 +0100 | [diff] [blame] | 268 | * At any moment, it's possible to flush whatever data remains within internal buffer, using ZSTD_flushStream(). |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 269 | * `output->pos` will be updated. |
Yann Collet | e795c8a | 2016-12-13 16:39:36 +0100 | [diff] [blame] | 270 | * Note that some content might still be left within internal buffer if `output->size` is too small. |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 271 | * @return : nb of bytes still present within internal buffer (0 if it's empty) |
| 272 | * or an error code, which can be tested using ZSTD_isError(). |
| 273 | * |
| 274 | * ZSTD_endStream() instructs to finish a frame. |
| 275 | * It will perform a flush and write frame epilogue. |
| 276 | * The epilogue is required for decoders to consider a frame completed. |
| 277 | * Similar to ZSTD_flushStream(), it may not be able to flush the full content if `output->size` is too small. |
| 278 | * In which case, call again ZSTD_endStream() to complete the flush. |
Yann Collet | e795c8a | 2016-12-13 16:39:36 +0100 | [diff] [blame] | 279 | * @return : nb of bytes still present within internal buffer (0 if it's empty, hence compression completed) |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 280 | * or an error code, which can be tested using ZSTD_isError(). |
| 281 | * |
| 282 | * *******************************************************************/ |
| 283 | |
| 284 | typedef struct ZSTD_CStream_s ZSTD_CStream; |
Sean Purcell | dec2b96 | 2017-03-14 11:24:09 -0700 | [diff] [blame] | 285 | /*===== ZSTD_CStream management functions =====*/ |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 286 | ZSTDLIB_API ZSTD_CStream* ZSTD_createCStream(void); |
| 287 | ZSTDLIB_API size_t ZSTD_freeCStream(ZSTD_CStream* zcs); |
Yann Collet | e795c8a | 2016-12-13 16:39:36 +0100 | [diff] [blame] | 288 | |
Sean Purcell | dec2b96 | 2017-03-14 11:24:09 -0700 | [diff] [blame] | 289 | /*===== Streaming compression functions =====*/ |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 290 | ZSTDLIB_API size_t ZSTD_initCStream(ZSTD_CStream* zcs, int compressionLevel); |
| 291 | ZSTDLIB_API size_t ZSTD_compressStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output, ZSTD_inBuffer* input); |
| 292 | ZSTDLIB_API size_t ZSTD_flushStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output); |
| 293 | ZSTDLIB_API size_t ZSTD_endStream(ZSTD_CStream* zcs, ZSTD_outBuffer* output); |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 294 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 295 | ZSTDLIB_API size_t ZSTD_CStreamInSize(void); /**< recommended size for input buffer */ |
| 296 | ZSTDLIB_API size_t ZSTD_CStreamOutSize(void); /**< recommended size for output buffer. Guaranteed to successfully flush at least one complete compressed block in all circumstances. */ |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 297 | |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 298 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 299 | |
inikep | ba1db37 | 2016-10-06 14:22:48 +0200 | [diff] [blame] | 300 | /*-*************************************************************************** |
Przemyslaw Skibinski | 984b66c | 2016-10-24 15:59:51 +0200 | [diff] [blame] | 301 | * Streaming decompression - HowTo |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 302 | * |
| 303 | * A ZSTD_DStream object is required to track streaming operations. |
| 304 | * Use ZSTD_createDStream() and ZSTD_freeDStream() to create/release resources. |
Yann Collet | 17e482e | 2016-08-23 16:58:10 +0200 | [diff] [blame] | 305 | * ZSTD_DStream objects can be re-used multiple times. |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 306 | * |
| 307 | * Use ZSTD_initDStream() to start a new decompression operation, |
| 308 | * or ZSTD_initDStream_usingDict() if decompression requires a dictionary. |
Yann Collet | 7c83dfd | 2016-09-05 19:47:43 +0200 | [diff] [blame] | 309 | * @return : recommended first input size |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 310 | * |
| 311 | * Use ZSTD_decompressStream() repetitively to consume your input. |
Yann Collet | fa72f6b | 2016-09-05 17:39:56 +0200 | [diff] [blame] | 312 | * The function will update both `pos` fields. |
Yann Collet | b3060f7 | 2016-09-09 16:44:16 +0200 | [diff] [blame] | 313 | * If `input.pos < input.size`, some input has not been consumed. |
Yann Collet | 1d4208c | 2016-09-06 05:16:40 +0200 | [diff] [blame] | 314 | * It's up to the caller to present again remaining data. |
Yann Collet | b3060f7 | 2016-09-09 16:44:16 +0200 | [diff] [blame] | 315 | * If `output.pos < output.size`, decoder has flushed everything it could. |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 316 | * @return : 0 when a frame is completely decoded and fully flushed, |
Yann Collet | fa72f6b | 2016-09-05 17:39:56 +0200 | [diff] [blame] | 317 | * an error code, which can be tested using ZSTD_isError(), |
Yann Collet | 9ffbeea | 2016-12-02 18:37:38 -0800 | [diff] [blame] | 318 | * any other value > 0, which means there is still some decoding to do to complete current frame. |
| 319 | * The return value is a suggested next input size (a hint to improve latency) that will never load more than the current frame. |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 320 | * *******************************************************************************/ |
| 321 | |
| 322 | typedef struct ZSTD_DStream_s ZSTD_DStream; |
Sean Purcell | dec2b96 | 2017-03-14 11:24:09 -0700 | [diff] [blame] | 323 | /*===== ZSTD_DStream management functions =====*/ |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 324 | ZSTDLIB_API ZSTD_DStream* ZSTD_createDStream(void); |
| 325 | ZSTDLIB_API size_t ZSTD_freeDStream(ZSTD_DStream* zds); |
Yann Collet | e795c8a | 2016-12-13 16:39:36 +0100 | [diff] [blame] | 326 | |
Sean Purcell | dec2b96 | 2017-03-14 11:24:09 -0700 | [diff] [blame] | 327 | /*===== Streaming decompression functions =====*/ |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 328 | ZSTDLIB_API size_t ZSTD_initDStream(ZSTD_DStream* zds); |
| 329 | ZSTDLIB_API size_t ZSTD_decompressStream(ZSTD_DStream* zds, ZSTD_outBuffer* output, ZSTD_inBuffer* input); |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 330 | |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 331 | ZSTDLIB_API size_t ZSTD_DStreamInSize(void); /*!< recommended size for input buffer */ |
Yann Collet | 01c1992 | 2016-09-08 19:29:04 +0200 | [diff] [blame] | 332 | ZSTDLIB_API size_t ZSTD_DStreamOutSize(void); /*!< recommended size for output buffer. Guaranteed to successfully flush at least one complete block in all circumstances. */ |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 333 | |
Nick Terrell | 05c00f2 | 2016-11-29 11:46:37 -0800 | [diff] [blame] | 334 | #endif /* ZSTD_H_235446 */ |
Yann Collet | 7be46bf | 2016-08-19 18:39:36 +0200 | [diff] [blame] | 335 | |
| 336 | |
Nick Terrell | 05c00f2 | 2016-11-29 11:46:37 -0800 | [diff] [blame] | 337 | #if defined(ZSTD_STATIC_LINKING_ONLY) && !defined(ZSTD_H_ZSTD_STATIC_LINKING_ONLY) |
| 338 | #define ZSTD_H_ZSTD_STATIC_LINKING_ONLY |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 339 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 340 | /**************************************************************************************** |
inikep | 2d26133 | 2016-10-06 16:28:21 +0200 | [diff] [blame] | 341 | * START OF ADVANCED AND EXPERIMENTAL FUNCTIONS |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 342 | * The definitions in this section are considered experimental. |
Yann Collet | a49e066 | 2016-06-21 11:54:03 +0200 | [diff] [blame] | 343 | * They should never be used with a dynamic library, as they may change in the future. |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 344 | * They are provided for advanced usages. |
| 345 | * Use them only in association with static linking. |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 346 | * ***************************************************************************************/ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 347 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 348 | /* --- Constants ---*/ |
Yann Collet | 4e5eea6 | 2016-12-21 16:44:35 +0100 | [diff] [blame] | 349 | #define ZSTD_MAGICNUMBER 0xFD2FB528 /* >= v0.8.0 */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 350 | #define ZSTD_MAGIC_SKIPPABLE_START 0x184D2A50U |
| 351 | |
Sean Purcell | 2db7249 | 2017-02-09 10:50:43 -0800 | [diff] [blame] | 352 | #define ZSTD_CONTENTSIZE_UNKNOWN (0ULL - 1) |
| 353 | #define ZSTD_CONTENTSIZE_ERROR (0ULL - 2) |
| 354 | |
Sean Purcell | d44703d | 2017-03-01 14:36:25 -0800 | [diff] [blame] | 355 | #define ZSTD_WINDOWLOG_MAX_32 27 |
Yann Collet | ed3845d | 2016-07-08 12:57:10 +0200 | [diff] [blame] | 356 | #define ZSTD_WINDOWLOG_MAX_64 27 |
Nick Terrell | e65aab8 | 2017-03-08 15:40:13 -0800 | [diff] [blame] | 357 | #define ZSTD_WINDOWLOG_MAX ((unsigned)(sizeof(size_t) == 4 ? ZSTD_WINDOWLOG_MAX_32 : ZSTD_WINDOWLOG_MAX_64)) |
Yann Collet | cf409a7 | 2016-09-26 16:41:05 +0200 | [diff] [blame] | 358 | #define ZSTD_WINDOWLOG_MIN 10 |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 359 | #define ZSTD_HASHLOG_MAX ZSTD_WINDOWLOG_MAX |
Yann Collet | cf409a7 | 2016-09-26 16:41:05 +0200 | [diff] [blame] | 360 | #define ZSTD_HASHLOG_MIN 6 |
| 361 | #define ZSTD_CHAINLOG_MAX (ZSTD_WINDOWLOG_MAX+1) |
| 362 | #define ZSTD_CHAINLOG_MIN ZSTD_HASHLOG_MIN |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 363 | #define ZSTD_HASHLOG3_MAX 17 |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 364 | #define ZSTD_SEARCHLOG_MAX (ZSTD_WINDOWLOG_MAX-1) |
| 365 | #define ZSTD_SEARCHLOG_MIN 1 |
Yann Collet | 0e07bf3 | 2016-09-07 06:33:02 +0200 | [diff] [blame] | 366 | #define ZSTD_SEARCHLENGTH_MAX 7 /* only for ZSTD_fast, other strategies are limited to 6 */ |
| 367 | #define ZSTD_SEARCHLENGTH_MIN 3 /* only for ZSTD_btopt, other strategies are limited to 4 */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 368 | #define ZSTD_TARGETLENGTH_MIN 4 |
| 369 | #define ZSTD_TARGETLENGTH_MAX 999 |
| 370 | |
Yann Collet | 673f0d7 | 2016-06-06 00:26:38 +0200 | [diff] [blame] | 371 | #define ZSTD_FRAMEHEADERSIZE_MAX 18 /* for static allocation */ |
Yann Collet | ba75e9d | 2016-12-21 19:57:18 +0100 | [diff] [blame] | 372 | #define ZSTD_FRAMEHEADERSIZE_MIN 6 |
Yann Collet | 7c83dfd | 2016-09-05 19:47:43 +0200 | [diff] [blame] | 373 | static const size_t ZSTD_frameHeaderSize_prefix = 5; |
Yann Collet | ba75e9d | 2016-12-21 19:57:18 +0100 | [diff] [blame] | 374 | static const size_t ZSTD_frameHeaderSize_min = ZSTD_FRAMEHEADERSIZE_MIN; |
Yann Collet | 673f0d7 | 2016-06-06 00:26:38 +0200 | [diff] [blame] | 375 | static const size_t ZSTD_frameHeaderSize_max = ZSTD_FRAMEHEADERSIZE_MAX; |
| 376 | static const size_t ZSTD_skippableHeaderSize = 8; /* magic number + skippable frame length */ |
| 377 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 378 | |
Przemyslaw Skibinski | 984b66c | 2016-10-24 15:59:51 +0200 | [diff] [blame] | 379 | /*--- Advanced types ---*/ |
Przemyslaw Skibinski | 5c5f01f | 2016-10-25 12:25:07 +0200 | [diff] [blame] | 380 | typedef enum { ZSTD_fast, ZSTD_dfast, ZSTD_greedy, ZSTD_lazy, ZSTD_lazy2, ZSTD_btlazy2, ZSTD_btopt, ZSTD_btopt2 } ZSTD_strategy; /* from faster to stronger */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 381 | |
| 382 | typedef struct { |
Yann Collet | 655393c | 2016-08-14 00:16:20 +0200 | [diff] [blame] | 383 | unsigned windowLog; /**< largest match distance : larger == more compression, more memory needed during decompression */ |
| 384 | unsigned chainLog; /**< fully searched segment : larger == more compression, slower, more memory (useless for fast) */ |
| 385 | unsigned hashLog; /**< dispatch table : larger == faster, more memory */ |
| 386 | unsigned searchLog; /**< nb of searches : larger == more compression, slower */ |
| 387 | unsigned searchLength; /**< match length searched : larger == faster decompression, sometimes less compression */ |
| 388 | unsigned targetLength; /**< acceptable match size for optimal parser (only) : larger == more compression, slower */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 389 | ZSTD_strategy strategy; |
| 390 | } ZSTD_compressionParameters; |
| 391 | |
| 392 | typedef struct { |
Yann Collet | 0ec6a95 | 2017-01-02 00:49:42 +0100 | [diff] [blame] | 393 | unsigned contentSizeFlag; /**< 1: content size will be in frame header (when known) */ |
| 394 | unsigned checksumFlag; /**< 1: generate a 32-bits checksum at end of frame, for error detection */ |
| 395 | unsigned noDictIDFlag; /**< 1: no dictID will be saved into frame header (if dictionary compression) */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 396 | } ZSTD_frameParameters; |
| 397 | |
| 398 | typedef struct { |
| 399 | ZSTD_compressionParameters cParams; |
| 400 | ZSTD_frameParameters fParams; |
| 401 | } ZSTD_parameters; |
| 402 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 403 | /*= Custom memory allocation functions */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 404 | typedef void* (*ZSTD_allocFunction) (void* opaque, size_t size); |
| 405 | typedef void (*ZSTD_freeFunction) (void* opaque, void* address); |
| 406 | typedef struct { ZSTD_allocFunction customAlloc; ZSTD_freeFunction customFree; void* opaque; } ZSTD_customMem; |
| 407 | |
Sean Purcell | 2db7249 | 2017-02-09 10:50:43 -0800 | [diff] [blame] | 408 | /*************************************** |
Sean Purcell | d7bfcac | 2017-02-10 11:38:57 -0800 | [diff] [blame] | 409 | * Compressed size functions |
| 410 | ***************************************/ |
| 411 | |
Sean Purcell | 9050e19 | 2017-02-22 12:12:32 -0800 | [diff] [blame] | 412 | /*! ZSTD_findFrameCompressedSize() : |
Sean Purcell | 9757cc8 | 2017-02-22 12:27:15 -0800 | [diff] [blame] | 413 | * `src` should point to the start of a ZSTD encoded frame or skippable frame |
Sean Purcell | d7bfcac | 2017-02-10 11:38:57 -0800 | [diff] [blame] | 414 | * `srcSize` must be at least as large as the frame |
| 415 | * @return : the compressed size of the frame pointed to by `src`, suitable to pass to |
| 416 | * `ZSTD_decompress` or similar, or an error code if given invalid input. */ |
Sean Purcell | 9050e19 | 2017-02-22 12:12:32 -0800 | [diff] [blame] | 417 | ZSTDLIB_API size_t ZSTD_findFrameCompressedSize(const void* src, size_t srcSize); |
Sean Purcell | d7bfcac | 2017-02-10 11:38:57 -0800 | [diff] [blame] | 418 | |
| 419 | /*************************************** |
Sean Purcell | 2db7249 | 2017-02-09 10:50:43 -0800 | [diff] [blame] | 420 | * Decompressed size functions |
| 421 | ***************************************/ |
| 422 | /*! ZSTD_getFrameContentSize() : |
| 423 | * `src` should point to the start of a ZSTD encoded frame |
Sean Purcell | 269b2cd | 2017-02-09 13:25:30 -0800 | [diff] [blame] | 424 | * `srcSize` must be at least as large as the frame header. A value greater than or equal |
| 425 | * to `ZSTD_frameHeaderSize_max` is guaranteed to be large enough in all cases. |
Sean Purcell | 2db7249 | 2017-02-09 10:50:43 -0800 | [diff] [blame] | 426 | * @return : decompressed size of the frame pointed to by `src` if known, otherwise |
| 427 | * - ZSTD_CONTENTSIZE_UNKNOWN if the size cannot be determined |
Anders Oleson | 517577b | 2017-02-20 12:08:59 -0800 | [diff] [blame] | 428 | * - ZSTD_CONTENTSIZE_ERROR if an error occurred (e.g. invalid magic number, srcSize too small) */ |
Sean Purcell | 2db7249 | 2017-02-09 10:50:43 -0800 | [diff] [blame] | 429 | ZSTDLIB_API unsigned long long ZSTD_getFrameContentSize(const void *src, size_t srcSize); |
| 430 | |
| 431 | /*! ZSTD_findDecompressedSize() : |
| 432 | * `src` should point to the start of a series of ZSTD encoded and/or skippable frames |
| 433 | * `srcSize` must be the _exact_ size of this series |
| 434 | * (i.e. there should be a frame boundary exactly `srcSize` bytes after `src`) |
| 435 | * @return : the decompressed size of all data in the contained frames, as a 64-bit value _if known_ |
| 436 | * - if the decompressed size cannot be determined: ZSTD_CONTENTSIZE_UNKNOWN |
| 437 | * - if an error occurred: ZSTD_CONTENTSIZE_ERROR |
| 438 | * |
| 439 | * note 1 : decompressed size is an optional field, that may not be present, especially in streaming mode. |
| 440 | * When `return==ZSTD_CONTENTSIZE_UNKNOWN`, data to decompress could be any size. |
| 441 | * In which case, it's necessary to use streaming mode to decompress data. |
| 442 | * Optionally, application can still use ZSTD_decompress() while relying on implied limits. |
| 443 | * (For example, data may be necessarily cut into blocks <= 16 KB). |
| 444 | * note 2 : decompressed size is always present when compression is done with ZSTD_compress() |
| 445 | * note 3 : decompressed size can be very large (64-bits value), |
| 446 | * potentially larger than what local system can handle as a single memory segment. |
| 447 | * In which case, it's necessary to use streaming mode to decompress data. |
| 448 | * note 4 : If source is untrusted, decompressed size could be wrong or intentionally modified. |
| 449 | * Always ensure result fits within application's authorized limits. |
| 450 | * Each application can set its own limits. |
| 451 | * note 5 : ZSTD_findDecompressedSize handles multiple frames, and so it must traverse the input to |
| 452 | * read each contained frame header. This is efficient as most of the data is skipped, |
| 453 | * however it does mean that all frame data must be present and valid. */ |
| 454 | ZSTDLIB_API unsigned long long ZSTD_findDecompressedSize(const void* src, size_t srcSize); |
| 455 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 456 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 457 | /*************************************** |
Yann Collet | 81e13ef | 2016-06-07 00:51:51 +0200 | [diff] [blame] | 458 | * Advanced compression functions |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 459 | ***************************************/ |
Yann Collet | 3ae543c | 2016-07-11 03:12:17 +0200 | [diff] [blame] | 460 | /*! ZSTD_estimateCCtxSize() : |
| 461 | * Gives the amount of memory allocated for a ZSTD_CCtx given a set of compression parameters. |
| 462 | * `frameContentSize` is an optional parameter, provide `0` if unknown */ |
Yann Collet | 8847238 | 2016-07-14 17:05:38 +0200 | [diff] [blame] | 463 | ZSTDLIB_API size_t ZSTD_estimateCCtxSize(ZSTD_compressionParameters cParams); |
Yann Collet | 3ae543c | 2016-07-11 03:12:17 +0200 | [diff] [blame] | 464 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 465 | /*! ZSTD_createCCtx_advanced() : |
| 466 | * Create a ZSTD compression context using external alloc and free functions */ |
| 467 | ZSTDLIB_API ZSTD_CCtx* ZSTD_createCCtx_advanced(ZSTD_customMem customMem); |
| 468 | |
Yann Collet | d7c6589 | 2016-09-15 02:50:27 +0200 | [diff] [blame] | 469 | /*! ZSTD_sizeof_CCtx() : |
| 470 | * Gives the amount of memory used by a given ZSTD_CCtx */ |
| 471 | ZSTDLIB_API size_t ZSTD_sizeof_CCtx(const ZSTD_CCtx* cctx); |
| 472 | |
Yann Collet | 06e7697 | 2017-01-25 16:39:03 -0800 | [diff] [blame] | 473 | typedef enum { |
Yann Collet | 14312d8 | 2017-02-23 23:42:12 -0800 | [diff] [blame] | 474 | ZSTD_p_forceWindow, /* Force back-references to remain < windowSize, even when referencing Dictionary content (default:0) */ |
| 475 | ZSTD_p_forceRawDict /* Force loading dictionary in "content-only" mode (no header analysis) */ |
Yann Collet | 06e7697 | 2017-01-25 16:39:03 -0800 | [diff] [blame] | 476 | } ZSTD_CCtxParameter; |
Yann Collet | 4a62f79 | 2017-01-26 09:16:56 -0800 | [diff] [blame] | 477 | /*! ZSTD_setCCtxParameter() : |
| 478 | * Set advanced parameters, selected through enum ZSTD_CCtxParameter |
| 479 | * @result : 0, or an error code (which can be tested with ZSTD_isError()) */ |
Yann Collet | ef33d00 | 2017-01-26 12:24:21 -0800 | [diff] [blame] | 480 | ZSTDLIB_API size_t ZSTD_setCCtxParameter(ZSTD_CCtx* cctx, ZSTD_CCtxParameter param, unsigned value); |
Yann Collet | bb00274 | 2017-01-25 16:25:38 -0800 | [diff] [blame] | 481 | |
Yann Collet | 1f57c2e | 2016-12-21 16:20:11 +0100 | [diff] [blame] | 482 | /*! ZSTD_createCDict_byReference() : |
| 483 | * Create a digested dictionary for compression |
| 484 | * Dictionary content is simply referenced, and therefore stays in dictBuffer. |
| 485 | * It is important that dictBuffer outlives CDict, it must remain read accessible throughout the lifetime of CDict */ |
| 486 | ZSTDLIB_API ZSTD_CDict* ZSTD_createCDict_byReference(const void* dictBuffer, size_t dictSize, int compressionLevel); |
| 487 | |
Yann Collet | 81e13ef | 2016-06-07 00:51:51 +0200 | [diff] [blame] | 488 | /*! ZSTD_createCDict_advanced() : |
| 489 | * Create a ZSTD_CDict using external alloc and free, and customized compression parameters */ |
Yann Collet | 1f57c2e | 2016-12-21 16:20:11 +0100 | [diff] [blame] | 490 | ZSTDLIB_API ZSTD_CDict* ZSTD_createCDict_advanced(const void* dict, size_t dictSize, unsigned byReference, |
Yann Collet | 31533ba | 2017-04-27 00:29:04 -0700 | [diff] [blame] | 491 | ZSTD_compressionParameters cParams, ZSTD_customMem customMem); |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 492 | |
Yann Collet | d7c6589 | 2016-09-15 02:50:27 +0200 | [diff] [blame] | 493 | /*! ZSTD_sizeof_CDict() : |
| 494 | * Gives the amount of memory used by a given ZSTD_CDict */ |
| 495 | ZSTDLIB_API size_t ZSTD_sizeof_CDict(const ZSTD_CDict* cdict); |
Yann Collet | 8e0ee68 | 2016-07-11 13:09:52 +0200 | [diff] [blame] | 496 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 497 | /*! ZSTD_getCParams() : |
Yann Collet | 2b36b23 | 2016-12-13 17:59:55 +0100 | [diff] [blame] | 498 | * @return ZSTD_compressionParameters structure for a selected compression level and estimated srcSize. |
| 499 | * `estimatedSrcSize` value is optional, select 0 if not known */ |
| 500 | ZSTDLIB_API ZSTD_compressionParameters ZSTD_getCParams(int compressionLevel, unsigned long long estimatedSrcSize, size_t dictSize); |
| 501 | |
| 502 | /*! ZSTD_getParams() : |
| 503 | * same as ZSTD_getCParams(), but @return a full `ZSTD_parameters` object instead of sub-component `ZSTD_compressionParameters`. |
| 504 | * All fields of `ZSTD_frameParameters` are set to default (0) */ |
| 505 | ZSTDLIB_API ZSTD_parameters ZSTD_getParams(int compressionLevel, unsigned long long estimatedSrcSize, size_t dictSize); |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 506 | |
Yann Collet | 3d2cd7f | 2016-06-27 15:12:26 +0200 | [diff] [blame] | 507 | /*! ZSTD_checkCParams() : |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 508 | * Ensure param values remain within authorized range */ |
| 509 | ZSTDLIB_API size_t ZSTD_checkCParams(ZSTD_compressionParameters params); |
| 510 | |
Yann Collet | 3d2cd7f | 2016-06-27 15:12:26 +0200 | [diff] [blame] | 511 | /*! ZSTD_adjustCParams() : |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 512 | * optimize params for a given `srcSize` and `dictSize`. |
| 513 | * both values are optional, select `0` if unknown. */ |
Yann Collet | 52c04fe | 2016-07-07 11:53:18 +0200 | [diff] [blame] | 514 | ZSTDLIB_API ZSTD_compressionParameters ZSTD_adjustCParams(ZSTD_compressionParameters cPar, unsigned long long srcSize, size_t dictSize); |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 515 | |
| 516 | /*! ZSTD_compress_advanced() : |
Yann Collet | f4bd857 | 2017-04-27 11:31:55 -0700 | [diff] [blame] | 517 | * Same as ZSTD_compress_usingDict(), with fine-tune control over each compression parameter */ |
| 518 | ZSTDLIB_API size_t ZSTD_compress_advanced (ZSTD_CCtx* cctx, |
| 519 | void* dst, size_t dstCapacity, |
| 520 | const void* src, size_t srcSize, |
| 521 | const void* dict,size_t dictSize, |
| 522 | ZSTD_parameters params); |
| 523 | |
| 524 | /*! ZSTD_compress_usingCDict_advanced() : |
| 525 | * Same as ZSTD_compress_usingCDict(), with fine-tune control over frame parameters */ |
| 526 | ZSTDLIB_API size_t ZSTD_compress_usingCDict_advanced(ZSTD_CCtx* cctx, |
| 527 | void* dst, size_t dstCapacity, |
| 528 | const void* src, size_t srcSize, |
| 529 | const ZSTD_CDict* cdict, ZSTD_frameParameters fParams); |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 530 | |
Yann Collet | 45c03c5 | 2016-06-14 13:46:11 +0200 | [diff] [blame] | 531 | |
Przemyslaw Skibinski | 984b66c | 2016-10-24 15:59:51 +0200 | [diff] [blame] | 532 | /*--- Advanced decompression functions ---*/ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 533 | |
Yann Collet | 179b197 | 2016-11-02 17:30:49 -0700 | [diff] [blame] | 534 | /*! ZSTD_isFrame() : |
| 535 | * Tells if the content of `buffer` starts with a valid Frame Identifier. |
| 536 | * Note : Frame Identifier is 4 bytes. If `size < 4`, @return will always be 0. |
| 537 | * Note 2 : Legacy Frame Identifiers are considered valid only if Legacy Support is enabled. |
| 538 | * Note 3 : Skippable Frame Identifiers are considered valid. */ |
| 539 | ZSTDLIB_API unsigned ZSTD_isFrame(const void* buffer, size_t size); |
| 540 | |
Yann Collet | d158c35 | 2016-07-11 13:46:25 +0200 | [diff] [blame] | 541 | /*! ZSTD_estimateDCtxSize() : |
| 542 | * Gives the potential amount of memory allocated to create a ZSTD_DCtx */ |
| 543 | ZSTDLIB_API size_t ZSTD_estimateDCtxSize(void); |
| 544 | |
Yann Collet | 81e13ef | 2016-06-07 00:51:51 +0200 | [diff] [blame] | 545 | /*! ZSTD_createDCtx_advanced() : |
| 546 | * Create a ZSTD decompression context using external alloc and free functions */ |
| 547 | ZSTDLIB_API ZSTD_DCtx* ZSTD_createDCtx_advanced(ZSTD_customMem customMem); |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 548 | |
Yann Collet | d7c6589 | 2016-09-15 02:50:27 +0200 | [diff] [blame] | 549 | /*! ZSTD_sizeof_DCtx() : |
Yann Collet | d158c35 | 2016-07-11 13:46:25 +0200 | [diff] [blame] | 550 | * Gives the amount of memory used by a given ZSTD_DCtx */ |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 551 | ZSTDLIB_API size_t ZSTD_sizeof_DCtx(const ZSTD_DCtx* dctx); |
Yann Collet | 8e0ee68 | 2016-07-11 13:09:52 +0200 | [diff] [blame] | 552 | |
Yann Collet | 4e5eea6 | 2016-12-21 16:44:35 +0100 | [diff] [blame] | 553 | /*! ZSTD_createDDict_byReference() : |
| 554 | * Create a digested dictionary, ready to start decompression operation without startup delay. |
| 555 | * Dictionary content is simply referenced, and therefore stays in dictBuffer. |
| 556 | * It is important that dictBuffer outlives DDict, it must remain read accessible throughout the lifetime of DDict */ |
| 557 | ZSTDLIB_API ZSTD_DDict* ZSTD_createDDict_byReference(const void* dictBuffer, size_t dictSize); |
| 558 | |
Sean Purcell | dec2b96 | 2017-03-14 11:24:09 -0700 | [diff] [blame] | 559 | /*! ZSTD_createDDict_advanced() : |
| 560 | * Create a ZSTD_DDict using external alloc and free, optionally by reference */ |
Yann Collet | 4e5eea6 | 2016-12-21 16:44:35 +0100 | [diff] [blame] | 561 | ZSTDLIB_API ZSTD_DDict* ZSTD_createDDict_advanced(const void* dict, size_t dictSize, |
| 562 | unsigned byReference, ZSTD_customMem customMem); |
| 563 | |
Yann Collet | e91c4b4 | 2016-09-14 16:55:44 +0200 | [diff] [blame] | 564 | /*! ZSTD_sizeof_DDict() : |
| 565 | * Gives the amount of memory used by a given ZSTD_DDict */ |
| 566 | ZSTDLIB_API size_t ZSTD_sizeof_DDict(const ZSTD_DDict* ddict); |
| 567 | |
Yann Collet | e7a41a5 | 2016-12-05 16:21:06 -0800 | [diff] [blame] | 568 | /*! ZSTD_getDictID_fromDict() : |
| 569 | * Provides the dictID stored within dictionary. |
| 570 | * if @return == 0, the dictionary is not conformant with Zstandard specification. |
| 571 | * It can still be loaded, but as a content-only dictionary. */ |
Nick Terrell | 8de46ab | 2016-12-16 13:27:30 -0800 | [diff] [blame] | 572 | ZSTDLIB_API unsigned ZSTD_getDictID_fromDict(const void* dict, size_t dictSize); |
Yann Collet | e7a41a5 | 2016-12-05 16:21:06 -0800 | [diff] [blame] | 573 | |
| 574 | /*! ZSTD_getDictID_fromDDict() : |
| 575 | * Provides the dictID of the dictionary loaded into `ddict`. |
| 576 | * If @return == 0, the dictionary is not conformant to Zstandard specification, or empty. |
| 577 | * Non-conformant dictionaries can still be loaded, but as content-only dictionaries. */ |
Nick Terrell | 8de46ab | 2016-12-16 13:27:30 -0800 | [diff] [blame] | 578 | ZSTDLIB_API unsigned ZSTD_getDictID_fromDDict(const ZSTD_DDict* ddict); |
Yann Collet | e7a41a5 | 2016-12-05 16:21:06 -0800 | [diff] [blame] | 579 | |
| 580 | /*! ZSTD_getDictID_fromFrame() : |
| 581 | * Provides the dictID required to decompress the frame stored within `src`. |
| 582 | * If @return == 0, the dictID could not be decoded. |
| 583 | * This could be for one of the following reasons : |
| 584 | * - The frame does not require a dictionary to be decoded (most common case). |
| 585 | * - The frame was built with dictID intentionally removed. Whatever dictionary is necessary is a hidden information. |
| 586 | * Note : this use case also happens when using a non-conformant dictionary. |
| 587 | * - `srcSize` is too small, and as a result, the frame header could not be decoded (only possible if `srcSize < ZSTD_FRAMEHEADERSIZE_MAX`). |
| 588 | * - This is not a Zstandard frame. |
| 589 | * When identifying the exact failure cause, it's possible to use ZSTD_getFrameParams(), which will provide a more precise error code. */ |
Nick Terrell | 8de46ab | 2016-12-16 13:27:30 -0800 | [diff] [blame] | 590 | ZSTDLIB_API unsigned ZSTD_getDictID_fromFrame(const void* src, size_t srcSize); |
Yann Collet | e7a41a5 | 2016-12-05 16:21:06 -0800 | [diff] [blame] | 591 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 592 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 593 | /******************************************************************** |
Przemyslaw Skibinski | 984b66c | 2016-10-24 15:59:51 +0200 | [diff] [blame] | 594 | * Advanced streaming functions |
Yann Collet | 5a0c8e2 | 2016-08-12 01:20:36 +0200 | [diff] [blame] | 595 | ********************************************************************/ |
| 596 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 597 | /*===== Advanced Streaming compression functions =====*/ |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 598 | ZSTDLIB_API ZSTD_CStream* ZSTD_createCStream_advanced(ZSTD_customMem customMem); |
Yann Collet | 36c2a03 | 2017-04-05 22:06:21 -0700 | [diff] [blame] | 599 | ZSTDLIB_API size_t ZSTD_sizeof_CStream(const ZSTD_CStream* zcs); /**< size of CStream is variable, depending primarily on compression level */ |
Sean Purcell | 2db7249 | 2017-02-09 10:50:43 -0800 | [diff] [blame] | 600 | ZSTDLIB_API size_t ZSTD_initCStream_srcSize(ZSTD_CStream* zcs, int compressionLevel, unsigned long long pledgedSrcSize); /**< pledgedSrcSize must be correct, a size of 0 means unknown. for a frame size of 0 use initCStream_advanced */ |
Sean Purcell | 0b5370a | 2017-01-18 13:44:43 -0800 | [diff] [blame] | 601 | ZSTDLIB_API size_t ZSTD_initCStream_usingDict(ZSTD_CStream* zcs, const void* dict, size_t dictSize, int compressionLevel); /**< note: a dict will not be used if dict == NULL or dictSize < 8 */ |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 602 | ZSTDLIB_API size_t ZSTD_initCStream_advanced(ZSTD_CStream* zcs, const void* dict, size_t dictSize, |
Sean Purcell | 0f5c95a | 2017-02-07 16:33:48 -0800 | [diff] [blame] | 603 | ZSTD_parameters params, unsigned long long pledgedSrcSize); /**< pledgedSrcSize is optional and can be 0 (meaning unknown). note: if the contentSizeFlag is set, pledgedSrcSize == 0 means the source size is actually 0 */ |
Yann Collet | 9516234 | 2016-10-25 16:19:52 -0700 | [diff] [blame] | 604 | ZSTDLIB_API size_t ZSTD_initCStream_usingCDict(ZSTD_CStream* zcs, const ZSTD_CDict* cdict); /**< note : cdict will just be referenced, and must outlive compression session */ |
Yann Collet | 77bf59e | 2017-04-27 11:43:04 -0700 | [diff] [blame^] | 605 | ZSTDLIB_API size_t ZSTD_initCStream_usingCDict_advanced(ZSTD_CStream* zcs, const ZSTD_CDict* cdict, unsigned long long pledgedSrcSize, ZSTD_frameParameters fParams); /**< same as ZSTD_initCStream_usingCDict(), with control over frame parameters */ |
Yann Collet | 36c2a03 | 2017-04-05 22:06:21 -0700 | [diff] [blame] | 606 | |
| 607 | /*! ZSTD_resetCStream() : |
| 608 | * start a new compression job, using same parameters from previous job. |
| 609 | * This is typically useful to skip dictionary loading stage, since it will re-use it in-place. |
| 610 | * Note that zcs must be init at least once before using ZSTD_resetCStream(). |
| 611 | * pledgedSrcSize==0 means "srcSize unknown". |
| 612 | * If pledgedSrcSize > 0, its value must be correct, as it will be written in header, and controlled at the end. |
| 613 | * @return : 0, or an error code (which can be tested using ZSTD_isError()) */ |
| 614 | ZSTDLIB_API size_t ZSTD_resetCStream(ZSTD_CStream* zcs, unsigned long long pledgedSrcSize); |
Yann Collet | cb32763 | 2016-08-23 00:30:31 +0200 | [diff] [blame] | 615 | |
Yann Collet | 5a0c8e2 | 2016-08-12 01:20:36 +0200 | [diff] [blame] | 616 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 617 | /*===== Advanced Streaming decompression functions =====*/ |
Yann Collet | bb00274 | 2017-01-25 16:25:38 -0800 | [diff] [blame] | 618 | typedef enum { DStream_p_maxWindowSize } ZSTD_DStreamParameter_e; |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 619 | ZSTDLIB_API ZSTD_DStream* ZSTD_createDStream_advanced(ZSTD_customMem customMem); |
Sean Purcell | 0b5370a | 2017-01-18 13:44:43 -0800 | [diff] [blame] | 620 | ZSTDLIB_API size_t ZSTD_initDStream_usingDict(ZSTD_DStream* zds, const void* dict, size_t dictSize); /**< note: a dict will not be used if dict == NULL or dictSize < 8 */ |
Yann Collet | 17e482e | 2016-08-23 16:58:10 +0200 | [diff] [blame] | 621 | ZSTDLIB_API size_t ZSTD_setDStreamParameter(ZSTD_DStream* zds, ZSTD_DStreamParameter_e paramType, unsigned paramValue); |
Yann Collet | 9516234 | 2016-10-25 16:19:52 -0700 | [diff] [blame] | 622 | ZSTDLIB_API size_t ZSTD_initDStream_usingDDict(ZSTD_DStream* zds, const ZSTD_DDict* ddict); /**< note : ddict will just be referenced, and must outlive decompression session */ |
Yann Collet | 4cb2129 | 2016-09-15 14:54:07 +0200 | [diff] [blame] | 623 | ZSTDLIB_API size_t ZSTD_resetDStream(ZSTD_DStream* zds); /**< re-use decompression parameters from previous init; saves dictionary loading */ |
Yann Collet | 70e3b31 | 2016-08-23 01:18:06 +0200 | [diff] [blame] | 624 | ZSTDLIB_API size_t ZSTD_sizeof_DStream(const ZSTD_DStream* zds); |
Yann Collet | 5a0c8e2 | 2016-08-12 01:20:36 +0200 | [diff] [blame] | 625 | |
| 626 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 627 | /********************************************************************* |
Yann Collet | 5a0c8e2 | 2016-08-12 01:20:36 +0200 | [diff] [blame] | 628 | * Buffer-less and synchronous inner streaming functions |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 629 | * |
| 630 | * This is an advanced API, giving full control over buffer management, for users which need direct control over memory. |
Yann Collet | 655393c | 2016-08-14 00:16:20 +0200 | [diff] [blame] | 631 | * But it's also a complex one, with many restrictions (documented below). |
Yann Collet | 37d1300 | 2016-10-24 17:22:12 -0700 | [diff] [blame] | 632 | * Prefer using normal streaming API for an easier experience |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 633 | ********************************************************************* */ |
Yann Collet | 60ba31c | 2016-07-28 19:55:09 +0200 | [diff] [blame] | 634 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 635 | /** |
| 636 | Buffer-less streaming compression (synchronous mode) |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 637 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 638 | A ZSTD_CCtx object is required to track streaming operations. |
Yann Collet | 45c03c5 | 2016-06-14 13:46:11 +0200 | [diff] [blame] | 639 | Use ZSTD_createCCtx() / ZSTD_freeCCtx() to manage resource. |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 640 | ZSTD_CCtx object can be re-used multiple times within successive compression operations. |
| 641 | |
| 642 | Start by initializing a context. |
| 643 | Use ZSTD_compressBegin(), or ZSTD_compressBegin_usingDict() for dictionary compression, |
| 644 | or ZSTD_compressBegin_advanced(), for finer parameter control. |
| 645 | It's also possible to duplicate a reference context which has already been initialized, using ZSTD_copyCCtx() |
| 646 | |
| 647 | Then, consume your input using ZSTD_compressContinue(). |
Yann Collet | a49e066 | 2016-06-21 11:54:03 +0200 | [diff] [blame] | 648 | There are some important considerations to keep in mind when using this advanced function : |
| 649 | - ZSTD_compressContinue() has no internal buffer. It uses externally provided buffer only. |
Yann Collet | 62470b4 | 2016-07-28 15:29:08 +0200 | [diff] [blame] | 650 | - Interface is synchronous : input is consumed entirely and produces 1 (or more) compressed blocks. |
Yann Collet | a49e066 | 2016-06-21 11:54:03 +0200 | [diff] [blame] | 651 | - Caller must ensure there is enough space in `dst` to store compressed data under worst case scenario. |
| 652 | Worst case evaluation is provided by ZSTD_compressBound(). |
| 653 | ZSTD_compressContinue() doesn't guarantee recovery after a failed compression. |
| 654 | - ZSTD_compressContinue() presumes prior input ***is still accessible and unmodified*** (up to maximum distance size, see WindowLog). |
| 655 | It remembers all previous contiguous blocks, plus one separated memory segment (which can itself consist of multiple contiguous blocks) |
| 656 | - ZSTD_compressContinue() detects that prior input has been overwritten when `src` buffer overlaps. |
| 657 | In which case, it will "discard" the relevant memory section from its history. |
| 658 | |
Yann Collet | 62470b4 | 2016-07-28 15:29:08 +0200 | [diff] [blame] | 659 | Finish a frame with ZSTD_compressEnd(), which will write the last block(s) and optional checksum. |
Yann Collet | 5eb749e | 2017-01-11 18:21:25 +0100 | [diff] [blame] | 660 | It's possible to use srcSize==0, in which case, it will write a final empty block to end the frame. |
| 661 | Without last block mark, frames will be considered unfinished (corrupted) by decoders. |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 662 | |
Yann Collet | 5eb749e | 2017-01-11 18:21:25 +0100 | [diff] [blame] | 663 | `ZSTD_CCtx` object can be re-used (ZSTD_compressBegin()) to compress some new frame. |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 664 | */ |
| 665 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 666 | /*===== Buffer-less streaming compression functions =====*/ |
| 667 | ZSTDLIB_API size_t ZSTD_compressBegin(ZSTD_CCtx* cctx, int compressionLevel); /**< starts a new frame; a `ZSTD_CCtx` can be re-used this way to compress successive frames */ |
| 668 | ZSTDLIB_API size_t ZSTD_compressBegin_usingDict(ZSTD_CCtx* cctx, const void* dict, size_t dictSize, int compressionLevel); /**< same as ZSTD_compressBegin(), with a dictionary provided as `dict` / `dictSize` */ |
Sean Purcell | 0f5c95a | 2017-02-07 16:33:48 -0800 | [diff] [blame] | 669 | ZSTDLIB_API size_t ZSTD_compressBegin_advanced(ZSTD_CCtx* cctx, const void* dict, size_t dictSize, ZSTD_parameters params, unsigned long long pledgedSrcSize); /**< pledgedSrcSize is optional and can be 0 (meaning unknown). note: if the contentSizeFlag is set, pledgedSrcSize == 0 means the source size is actually 0 */ |
Yann Collet | 768df12 | 2017-04-26 15:42:10 -0700 | [diff] [blame] | 670 | ZSTDLIB_API size_t ZSTD_compressBegin_usingCDict(ZSTD_CCtx* cctx, const ZSTD_CDict* cdict); /**< note: fails if cdict==NULL */ |
Yann Collet | 715b9aa | 2017-04-18 13:55:53 -0700 | [diff] [blame] | 671 | ZSTDLIB_API size_t ZSTD_compressBegin_usingCDict_advanced(ZSTD_CCtx* const cctx, const ZSTD_CDict* const cdict, ZSTD_frameParameters const fParams, unsigned long long const pledgedSrcSize); /**< compression parameters are already set within cdict. pledgedSrcSize=0 means null-size */ |
| 672 | ZSTDLIB_API size_t ZSTD_copyCCtx(ZSTD_CCtx* cctx, const ZSTD_CCtx* preparedCCtx, unsigned long long pledgedSrcSize); /**< note: pledgedSrcSize can be 0, indicating unknown size. If it is non-zero, it must be accurate. For 0 size frames, use compressBegin_advanced */ |
| 673 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 674 | ZSTDLIB_API size_t ZSTD_compressContinue(ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); /**< presumes prior input is still accessible and unmodified (up to maximum distance size) */ |
| 675 | ZSTDLIB_API size_t ZSTD_compressEnd(ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); /**< finishes the frame : writes the last block(s) and optional checksum. srcSize==0 is allowed (writes a final empty block) */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 676 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 677 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 678 | |
inikep | ba1db37 | 2016-10-06 14:22:48 +0200 | [diff] [blame] | 679 | /*- |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 680 | Buffer-less streaming decompression (synchronous mode) |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 681 | |
| 682 | A ZSTD_DCtx object is required to track streaming operations. |
| 683 | Use ZSTD_createDCtx() / ZSTD_freeDCtx() to manage it. |
| 684 | A ZSTD_DCtx object can be re-used multiple times. |
| 685 | |
Yann Collet | 6b615d3 | 2016-07-29 19:40:37 +0200 | [diff] [blame] | 686 | First typical operation is to retrieve frame parameters, using ZSTD_getFrameParams(). |
| 687 | It fills a ZSTD_frameParams structure which provides important information to correctly decode the frame, |
| 688 | such as the minimum rolling buffer size to allocate to decompress data (`windowSize`), |
| 689 | and the dictionary ID used. |
| 690 | (Note : content size is optional, it may not be present. 0 means : content size unknown). |
| 691 | Note that these values could be wrong, either because of data malformation, or because an attacker is deliberately spoofing false information. |
| 692 | As a consequence, check that values remain within valid application range, especially `windowSize`, before allocation. |
| 693 | Each application can set its own limit, depending on local restrictions. For extended interoperability, it is recommended to support at least 8 MB. |
| 694 | Frame parameters are extracted from the beginning of the compressed frame. |
| 695 | Data fragment must be large enough to ensure successful decoding, typically `ZSTD_frameHeaderSize_max` bytes. |
| 696 | @result : 0 : successful decoding, the `ZSTD_frameParams` structure is correctly filled. |
| 697 | >0 : `srcSize` is too small, please provide at least @result bytes on next attempt. |
Yann Collet | d469a98 | 2016-07-28 03:47:45 +0200 | [diff] [blame] | 698 | errorCode, which can be tested using ZSTD_isError(). |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 699 | |
| 700 | Start decompression, with ZSTD_decompressBegin() or ZSTD_decompressBegin_usingDict(). |
| 701 | Alternatively, you can copy a prepared context, using ZSTD_copyDCtx(). |
| 702 | |
| 703 | Then use ZSTD_nextSrcSizeToDecompress() and ZSTD_decompressContinue() alternately. |
Yann Collet | 6b615d3 | 2016-07-29 19:40:37 +0200 | [diff] [blame] | 704 | ZSTD_nextSrcSizeToDecompress() tells how many bytes to provide as 'srcSize' to ZSTD_decompressContinue(). |
| 705 | ZSTD_decompressContinue() requires this _exact_ amount of bytes, or it will fail. |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 706 | |
Yann Collet | 49bb004 | 2016-06-04 20:17:38 +0200 | [diff] [blame] | 707 | @result of ZSTD_decompressContinue() is the number of bytes regenerated within 'dst' (necessarily <= dstCapacity). |
Yann Collet | 6b615d3 | 2016-07-29 19:40:37 +0200 | [diff] [blame] | 708 | It can be zero, which is not an error; it just means ZSTD_decompressContinue() has decoded some metadata item. |
| 709 | It can also be an error code, which can be tested with ZSTD_isError(). |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 710 | |
Yann Collet | 3b6ae77 | 2016-07-08 23:42:22 +0200 | [diff] [blame] | 711 | ZSTD_decompressContinue() needs previous data blocks during decompression, up to `windowSize`. |
| 712 | They should preferably be located contiguously, prior to current block. |
| 713 | Alternatively, a round buffer of sufficient size is also possible. Sufficient size is determined by frame parameters. |
| 714 | ZSTD_decompressContinue() is very sensitive to contiguity, |
| 715 | if 2 blocks don't follow each other, make sure that either the compressor breaks contiguity at the same place, |
Yann Collet | d469a98 | 2016-07-28 03:47:45 +0200 | [diff] [blame] | 716 | or that previous contiguous segment is large enough to properly handle maximum back-reference. |
Yann Collet | 3b6ae77 | 2016-07-08 23:42:22 +0200 | [diff] [blame] | 717 | |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 718 | A frame is fully decoded when ZSTD_nextSrcSizeToDecompress() returns zero. |
| 719 | Context can then be reset to start a new decompression. |
| 720 | |
Yann Collet | 4c5bbf6 | 2016-07-28 20:30:25 +0200 | [diff] [blame] | 721 | Note : it's possible to know if next input to present is a header or a block, using ZSTD_nextInputType(). |
Yann Collet | 6b615d3 | 2016-07-29 19:40:37 +0200 | [diff] [blame] | 722 | This information is not required to properly decode a frame. |
Yann Collet | 3b6ae77 | 2016-07-08 23:42:22 +0200 | [diff] [blame] | 723 | |
Yann Collet | e795c8a | 2016-12-13 16:39:36 +0100 | [diff] [blame] | 724 | == Special case : skippable frames == |
Yann Collet | 3b6ae77 | 2016-07-08 23:42:22 +0200 | [diff] [blame] | 725 | |
Yann Collet | d469a98 | 2016-07-28 03:47:45 +0200 | [diff] [blame] | 726 | Skippable frames allow integration of user-defined data into a flow of concatenated frames. |
Yann Collet | 5b56739 | 2016-07-28 01:17:22 +0200 | [diff] [blame] | 727 | Skippable frames will be ignored (skipped) by a decompressor. The format of skippable frames is as follows : |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 728 | a) Skippable frame ID - 4 Bytes, Little endian format, any value from 0x184D2A50 to 0x184D2A5F |
| 729 | b) Frame Size - 4 Bytes, Little endian format, unsigned 32-bits |
| 730 | c) Frame Content - any content (User Data) of length equal to Frame Size |
| 731 | For skippable frames ZSTD_decompressContinue() always returns 0. |
| 732 | For skippable frames ZSTD_getFrameParams() returns fparamsPtr->windowSize==0, which means that the frame is skippable. |
Sean Purcell | 64417cd | 2017-02-22 13:29:01 -0800 | [diff] [blame] | 733 | Note : If fparamsPtr->frameContentSize==0, it is ambiguous: the frame might actually be a Zstd encoded frame with no content. |
| 734 | For purposes of decompression, it is valid in both cases to skip the frame using |
| 735 | ZSTD_findFrameCompressedSize to find its size in bytes. |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 736 | For skippable frames, ZSTD_getFrameParams() also returns Frame Size as fparamsPtr->frameContentSize. |
| 737 | */ |
| 738 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 739 | typedef struct { /* frame parameters, as filled by ZSTD_getFrameParams() */ |
| 740 | unsigned long long frameContentSize; /* optional, may not be present : 0 means content size unknown. For skippable frames, holds Frame Size */ |
| 741 | unsigned windowSize; /* minimum rolling buffer size to allocate to decompress data; check it against an application limit before allocation */ |
| 742 | unsigned dictID; /* ID of the dictionary used */ |
| 743 | unsigned checksumFlag; /* NOTE(review): presumably non-zero when the frame carries a checksum - confirm */ |
| 744 | } ZSTD_frameParams; |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 745 | |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 746 | /*===== Buffer-less streaming decompression functions =====*/ |
| 747 | ZSTDLIB_API size_t ZSTD_getFrameParams(ZSTD_frameParams* fparamsPtr, const void* src, size_t srcSize); /**< doesn't consume input, see details above */ |
| 748 | ZSTDLIB_API size_t ZSTD_decompressBegin(ZSTD_DCtx* dctx); |
| 749 | ZSTDLIB_API size_t ZSTD_decompressBegin_usingDict(ZSTD_DCtx* dctx, const void* dict, size_t dictSize); |
| 750 | ZSTDLIB_API void ZSTD_copyDCtx(ZSTD_DCtx* dctx, const ZSTD_DCtx* preparedDCtx); /**< alternative to ZSTD_decompressBegin*() : copies a prepared context */ |
| 751 | ZSTDLIB_API size_t ZSTD_nextSrcSizeToDecompress(ZSTD_DCtx* dctx); /**< nb of bytes to provide as `srcSize` to ZSTD_decompressContinue(); zero means the frame is fully decoded */ |
| 752 | ZSTDLIB_API size_t ZSTD_decompressContinue(ZSTD_DCtx* dctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); /**< requires exactly the `srcSize` given by ZSTD_nextSrcSizeToDecompress(). @return : nb of bytes regenerated within `dst` (can be zero), or an error code, testable with ZSTD_isError() */ |
| 753 | typedef enum { ZSTDnit_frameHeader, ZSTDnit_blockHeader, ZSTDnit_block, ZSTDnit_lastBlock, ZSTDnit_checksum, ZSTDnit_skippableFrame } ZSTD_nextInputType_e; |
| 754 | ZSTDLIB_API ZSTD_nextInputType_e ZSTD_nextInputType(ZSTD_DCtx* dctx); /**< tells if next input to present is a header or a block; not required to properly decode a frame */ |
| 755 | |
| 756 | /** |
| 757 | Block functions |
| 758 | |
| 759 | Block functions produce and decode raw zstd blocks, without frame metadata. |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 760 | Frame metadata cost is typically ~18 bytes, which can be non-negligible for very small blocks (< 100 bytes). |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 761 | User is responsible for keeping track of the information required to regenerate data, such as compressed and content sizes. |
| 762 | |
| 763 | A few rules to respect : |
Yann Collet | f246cf5 | 2016-07-06 20:30:52 +0200 | [diff] [blame] | 764 | - Compressing and decompressing require a context structure |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 765 | + Use ZSTD_createCCtx() and ZSTD_createDCtx() |
| 766 | - It is necessary to init context before starting |
Yann Collet | af4f45b | 2017-04-18 03:17:44 -0700 | [diff] [blame] | 767 | + compression : any ZSTD_compressBegin*() variant, including with dictionary |
| 768 | + decompression : any ZSTD_decompressBegin*() variant, including with dictionary |
| 769 | + copyCCtx() and copyDCtx() can be used too |
| 770 | - Block size is limited, it must be <= ZSTD_getBlockSizeMax() <= ZSTD_BLOCKSIZE_ABSOLUTEMAX |
| 771 | + If input is larger than a block size, it's necessary to split input data into multiple blocks |
| 772 | + For inputs larger than a single block size, consider using the regular ZSTD_compress() instead. |
| 773 | Frame metadata is not that costly, and quickly becomes negligible as source size grows larger. |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 774 | - When a block is considered not compressible enough, ZSTD_compressBlock() result will be zero. |
| 775 | In which case, nothing is produced into `dst`. |
| 776 | + User must test for such outcome and deal directly with uncompressed data |
Yann Collet | f246cf5 | 2016-07-06 20:30:52 +0200 | [diff] [blame] | 777 | + ZSTD_decompressBlock() doesn't accept uncompressed data as input !!! |
Yann Collet | af4f45b | 2017-04-18 03:17:44 -0700 | [diff] [blame] | 778 | + In case of multiple successive blocks, should some of them be uncompressed, |
| 779 | decoder must be informed of their existence in order to follow proper history. |
| 780 | Use ZSTD_insertBlock() for such a case. |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 781 | */ |
| 782 | |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 783 | #define ZSTD_BLOCKSIZE_ABSOLUTEMAX (128 * 1024) /* upper bound of ZSTD_getBlockSizeMax(); provided as a define, for static allocation */ |
inikep | 82057aa | 2016-10-06 13:23:52 +0200 | [diff] [blame] | 784 | /*===== Raw zstd block functions =====*/ |
Yann Collet | cf05b9d | 2016-07-18 16:52:10 +0200 | [diff] [blame] | 785 | ZSTDLIB_API size_t ZSTD_getBlockSizeMax(ZSTD_CCtx* cctx); /**< block size limit; always <= ZSTD_BLOCKSIZE_ABSOLUTEMAX */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 786 | ZSTDLIB_API size_t ZSTD_compressBlock (ZSTD_CCtx* cctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); /**< result is zero when the block is considered not compressible enough, in which case nothing is produced into `dst` */ |
| 787 | ZSTDLIB_API size_t ZSTD_decompressBlock(ZSTD_DCtx* dctx, void* dst, size_t dstCapacity, const void* src, size_t srcSize); /**< doesn't accept uncompressed data as input */ |
Yann Collet | d5c5a77 | 2016-07-19 15:06:55 +0200 | [diff] [blame] | 788 | ZSTDLIB_API size_t ZSTD_insertBlock(ZSTD_DCtx* dctx, const void* blockStart, size_t blockSize); /**< insert block into `dctx` history. Useful for uncompressed blocks */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 789 | |
| 790 | |
Nick Terrell | 05c00f2 | 2016-11-29 11:46:37 -0800 | [diff] [blame] | 791 | #endif /* ZSTD_H_ZSTD_STATIC_LINKING_ONLY */ |
Yann Collet | d3b7f8d | 2016-06-04 19:47:02 +0200 | [diff] [blame] | 792 | |
Yann Collet | 4856a00 | 2015-01-24 01:58:16 +0100 | [diff] [blame] | 793 | #if defined (__cplusplus) |
| 794 | } |
| 795 | #endif |