mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-04 20:19:47 +08:00 
			
		
		
		
	 73f3d1b48f
			
		
	
	
		73f3d1b48f
		
	
	
	
	
		
			
			Add zstd compression and decompression kernel modules.
zstd offers a wide varity of compression speed and quality trade-offs.
It can compress at speeds approaching lz4, and quality approaching lzma.
zstd decompressions at speeds more than twice as fast as zlib, and
decompression speed remains roughly the same across all compression levels.
The code was ported from the upstream zstd source repository. The
`linux/zstd.h` header was modified to match linux kernel style.
The cross-platform and allocation code was stripped out. Instead zstd
requires the caller to pass a preallocated workspace. The source files
were clang-formatted [1] to match the Linux Kernel style as much as
possible. Otherwise, the code was unmodified. We would like to avoid
as much further manual modification to the source code as possible, so it
will be easier to keep the kernel zstd up to date.
I benchmarked zstd compression as a special character device. I ran zstd
and zlib compression at several levels, as well as performing no
compression, which measure the time spent copying the data to kernel space.
Data is passed to the compresser 4096 B at a time. The benchmark file is
located in the upstream zstd source repository under
`contrib/linux-kernel/zstd_compress_test.c` [2].
I ran the benchmarks on a Ubuntu 14.04 VM with 2 cores and 4 GiB of RAM.
The VM is running on a MacBook Pro with a 3.1 GHz Intel Core i7 processor,
16 GB of RAM, and a SSD. I benchmarked using `silesia.tar` [3], which is
211,988,480 B large. Run the following commands for the benchmark:
    sudo modprobe zstd_compress_test
    sudo mknod zstd_compress_test c 245 0
    sudo cp silesia.tar zstd_compress_test
The time is reported by the time of the userland `cp`.
The MB/s is computed with
    1,536,217,008 B / time(buffer size, hash)
which includes the time to copy from userland.
The Adjusted MB/s is computed with
    1,536,217,088 B / (time(buffer size, hash) - time(buffer size, none)).
The memory reported is the amount of memory the compressor requests.
| Method   | Size (B) | Time (s) | Ratio | MB/s    | Adj MB/s | Mem (MB) |
|----------|----------|----------|-------|---------|----------|----------|
| none     | 11988480 |    0.100 |     1 | 2119.88 |        - |        - |
| zstd -1  | 73645762 |    1.044 | 2.878 |  203.05 |   224.56 |     1.23 |
| zstd -3  | 66988878 |    1.761 | 3.165 |  120.38 |   127.63 |     2.47 |
| zstd -5  | 65001259 |    2.563 | 3.261 |   82.71 |    86.07 |     2.86 |
| zstd -10 | 60165346 |   13.242 | 3.523 |   16.01 |    16.13 |    13.22 |
| zstd -15 | 58009756 |   47.601 | 3.654 |    4.45 |     4.46 |    21.61 |
| zstd -19 | 54014593 |  102.835 | 3.925 |    2.06 |     2.06 |    60.15 |
| zlib -1  | 77260026 |    2.895 | 2.744 |   73.23 |    75.85 |     0.27 |
| zlib -3  | 72972206 |    4.116 | 2.905 |   51.50 |    52.79 |     0.27 |
| zlib -6  | 68190360 |    9.633 | 3.109 |   22.01 |    22.24 |     0.27 |
| zlib -9  | 67613382 |   22.554 | 3.135 |    9.40 |     9.44 |     0.27 |
I benchmarked zstd decompression using the same method on the same machine.
The benchmark file is located in the upstream zstd repo under
`contrib/linux-kernel/zstd_decompress_test.c` [4]. The memory reported is
the amount of memory required to decompress data compressed with the given
compression level. If you know the maximum size of your input, you can
reduce the memory usage of decompression irrespective of the compression
level.
| Method   | Time (s) | MB/s    | Adjusted MB/s | Memory (MB) |
|----------|----------|---------|---------------|-------------|
| none     |    0.025 | 8479.54 |             - |           - |
| zstd -1  |    0.358 |  592.15 |        636.60 |        0.84 |
| zstd -3  |    0.396 |  535.32 |        571.40 |        1.46 |
| zstd -5  |    0.396 |  535.32 |        571.40 |        1.46 |
| zstd -10 |    0.374 |  566.81 |        607.42 |        2.51 |
| zstd -15 |    0.379 |  559.34 |        598.84 |        4.61 |
| zstd -19 |    0.412 |  514.54 |        547.77 |        8.80 |
| zlib -1  |    0.940 |  225.52 |        231.68 |        0.04 |
| zlib -3  |    0.883 |  240.08 |        247.07 |        0.04 |
| zlib -6  |    0.844 |  251.17 |        258.84 |        0.04 |
| zlib -9  |    0.837 |  253.27 |        287.64 |        0.04 |
Tested in userland using the test-suite in the zstd repo under
`contrib/linux-kernel/test/UserlandTest.cpp` [5] by mocking the kernel
functions. Fuzz tested using libfuzzer [6] with the fuzz harnesses under
`contrib/linux-kernel/test/{RoundTripCrash.c,DecompressCrash.c}` [7] [8]
with ASAN, UBSAN, and MSAN. Additionaly, it was tested while testing the
BtrFS and SquashFS patches coming next.
[1] https://clang.llvm.org/docs/ClangFormat.html
[2] https://github.com/facebook/zstd/blob/dev/contrib/linux-kernel/zstd_compress_test.c
[3] http://sun.aei.polsl.pl/~sdeor/index.php?page=silesia
[4] https://github.com/facebook/zstd/blob/dev/contrib/linux-kernel/zstd_decompress_test.c
[5] https://github.com/facebook/zstd/blob/dev/contrib/linux-kernel/test/UserlandTest.cpp
[6] http://llvm.org/docs/LibFuzzer.html
[7] https://github.com/facebook/zstd/blob/dev/contrib/linux-kernel/test/RoundTripCrash.c
[8] https://github.com/facebook/zstd/blob/dev/contrib/linux-kernel/test/DecompressCrash.c
zstd source repository: https://github.com/facebook/zstd
Signed-off-by: Nick Terrell <terrelln@fb.com>
Signed-off-by: Chris Mason <clm@fb.com>
		
	
			
		
			
				
	
	
		
			213 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			213 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Huffman coder, part of New Generation Entropy library
 | |
|  * header file
 | |
|  * Copyright (C) 2013-2016, Yann Collet.
 | |
|  *
 | |
|  * BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
 | |
|  *
 | |
|  * Redistribution and use in source and binary forms, with or without
 | |
|  * modification, are permitted provided that the following conditions are
 | |
|  * met:
 | |
|  *
 | |
|  *   * Redistributions of source code must retain the above copyright
 | |
|  * notice, this list of conditions and the following disclaimer.
 | |
|  *   * Redistributions in binary form must reproduce the above
 | |
|  * copyright notice, this list of conditions and the following disclaimer
 | |
|  * in the documentation and/or other materials provided with the
 | |
|  * distribution.
 | |
|  *
 | |
|  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 | |
|  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 | |
|  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 | |
|  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 | |
|  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 | |
|  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 | |
|  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 | |
|  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 | |
|  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 | |
|  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 | |
|  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify it under
 | |
|  * the terms of the GNU General Public License version 2 as published by the
 | |
|  * Free Software Foundation. This program is dual-licensed; you may select
 | |
|  * either version 2 of the GNU General Public License ("GPL") or BSD license
 | |
|  * ("BSD").
 | |
|  *
 | |
|  * You can contact the author at :
 | |
|  * - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
 | |
|  */
 | |
| #ifndef HUF_H_298734234
 | |
| #define HUF_H_298734234
 | |
| 
 | |
| /* *** Dependencies *** */
 | |
| #include <linux/types.h> /* size_t */
 | |
| 
 | |
| /* ***   Tool functions *** */
 | |
| #define HUF_BLOCKSIZE_MAX (128 * 1024) /**< maximum input size for a single block compressed with HUF_compress */
 | |
| size_t HUF_compressBound(size_t size); /**< maximum compressed size (worst case) */
 | |
| 
 | |
| /* Error Management */
 | |
| unsigned HUF_isError(size_t code); /**< tells if a return value is an error code */
 | |
| 
 | |
| /* ***   Advanced function   *** */
 | |
| 
 | |
| /** HUF_compress4X_wksp() :
 | |
| *   Same as HUF_compress2(), but uses externally allocated `workSpace`, which must be a table of >= 1024 unsigned */
 | |
| size_t HUF_compress4X_wksp(void *dst, size_t dstSize, const void *src, size_t srcSize, unsigned maxSymbolValue, unsigned tableLog, void *workSpace,
 | |
| 			   size_t wkspSize); /**< `workSpace` must be a table of at least HUF_COMPRESS_WORKSPACE_SIZE_U32 unsigned */
 | |
| 
 | |
| /* *** Dependencies *** */
 | |
| #include "mem.h" /* U32 */
 | |
| 
 | |
| /* *** Constants *** */
 | |
| #define HUF_TABLELOG_MAX 12     /* max configured tableLog (for static allocation); can be modified up to HUF_ABSOLUTEMAX_TABLELOG */
 | |
| #define HUF_TABLELOG_DEFAULT 11 /* tableLog by default, when not specified */
 | |
| #define HUF_SYMBOLVALUE_MAX 255
 | |
| 
 | |
| #define HUF_TABLELOG_ABSOLUTEMAX 15 /* absolute limit of HUF_MAX_TABLELOG. Beyond that value, code does not work */
 | |
| #if (HUF_TABLELOG_MAX > HUF_TABLELOG_ABSOLUTEMAX)
 | |
| #error "HUF_TABLELOG_MAX is too large !"
 | |
| #endif
 | |
| 
 | |
| /* ****************************************
 | |
| *  Static allocation
 | |
| ******************************************/
 | |
| /* HUF buffer bounds */
 | |
| #define HUF_CTABLEBOUND 129
 | |
| #define HUF_BLOCKBOUND(size) (size + (size >> 8) + 8)			 /* only true if incompressible pre-filtered with fast heuristic */
 | |
| #define HUF_COMPRESSBOUND(size) (HUF_CTABLEBOUND + HUF_BLOCKBOUND(size)) /* Macro version, useful for static allocation */
 | |
| 
 | |
| /* static allocation of HUF's Compression Table */
 | |
| #define HUF_CREATE_STATIC_CTABLE(name, maxSymbolValue) \
 | |
| 	U32 name##hb[maxSymbolValue + 1];              \
 | |
| 	void *name##hv = &(name##hb);                  \
 | |
| 	HUF_CElt *name = (HUF_CElt *)(name##hv) /* no final ; */
 | |
| 
 | |
| /* static allocation of HUF's DTable */
 | |
| typedef U32 HUF_DTable;
 | |
| #define HUF_DTABLE_SIZE(maxTableLog) (1 + (1 << (maxTableLog)))
 | |
| #define HUF_CREATE_STATIC_DTABLEX2(DTable, maxTableLog) HUF_DTable DTable[HUF_DTABLE_SIZE((maxTableLog)-1)] = {((U32)((maxTableLog)-1) * 0x01000001)}
 | |
| #define HUF_CREATE_STATIC_DTABLEX4(DTable, maxTableLog) HUF_DTable DTable[HUF_DTABLE_SIZE(maxTableLog)] = {((U32)(maxTableLog)*0x01000001)}
 | |
| 
 | |
| /* The workspace must have alignment at least 4 and be at least this large */
 | |
| #define HUF_COMPRESS_WORKSPACE_SIZE (6 << 10)
 | |
| #define HUF_COMPRESS_WORKSPACE_SIZE_U32 (HUF_COMPRESS_WORKSPACE_SIZE / sizeof(U32))
 | |
| 
 | |
| /* The workspace must have alignment at least 4 and be at least this large */
 | |
| #define HUF_DECOMPRESS_WORKSPACE_SIZE (3 << 10)
 | |
| #define HUF_DECOMPRESS_WORKSPACE_SIZE_U32 (HUF_DECOMPRESS_WORKSPACE_SIZE / sizeof(U32))
 | |
| 
 | |
| /* ****************************************
 | |
| *  Advanced decompression functions
 | |
| ******************************************/
 | |
| size_t HUF_decompress4X_DCtx_wksp(HUF_DTable *dctx, void *dst, size_t dstSize, const void *cSrc, size_t cSrcSize, void *workspace, size_t workspaceSize); /**< decodes RLE and uncompressed */
 | |
| size_t HUF_decompress4X_hufOnly_wksp(HUF_DTable *dctx, void *dst, size_t dstSize, const void *cSrc, size_t cSrcSize, void *workspace,
 | |
| 				size_t workspaceSize);							       /**< considers RLE and uncompressed as errors */
 | |
| size_t HUF_decompress4X2_DCtx_wksp(HUF_DTable *dctx, void *dst, size_t dstSize, const void *cSrc, size_t cSrcSize, void *workspace,
 | |
| 				   size_t workspaceSize); /**< single-symbol decoder */
 | |
| size_t HUF_decompress4X4_DCtx_wksp(HUF_DTable *dctx, void *dst, size_t dstSize, const void *cSrc, size_t cSrcSize, void *workspace,
 | |
| 				   size_t workspaceSize); /**< double-symbols decoder */
 | |
| 
 | |
| /* ****************************************
 | |
| *  HUF detailed API
 | |
| ******************************************/
 | |
| /*!
 | |
| HUF_compress() does the following:
 | |
| 1. count symbol occurrence from source[] into table count[] using FSE_count()
 | |
| 2. (optional) refine tableLog using HUF_optimalTableLog()
 | |
| 3. build Huffman table from count using HUF_buildCTable()
 | |
| 4. save Huffman table to memory buffer using HUF_writeCTable_wksp()
 | |
| 5. encode the data stream using HUF_compress4X_usingCTable()
 | |
| 
 | |
| The following API allows targeting specific sub-functions for advanced tasks.
 | |
| For example, it's possible to compress several blocks using the same 'CTable',
 | |
| or to save and regenerate 'CTable' using external methods.
 | |
| */
 | |
| /* FSE_count() : find it within "fse.h" */
 | |
| unsigned HUF_optimalTableLog(unsigned maxTableLog, size_t srcSize, unsigned maxSymbolValue);
 | |
| typedef struct HUF_CElt_s HUF_CElt; /* incomplete type */
 | |
| size_t HUF_writeCTable_wksp(void *dst, size_t maxDstSize, const HUF_CElt *CTable, unsigned maxSymbolValue, unsigned huffLog, void *workspace, size_t workspaceSize);
 | |
| size_t HUF_compress4X_usingCTable(void *dst, size_t dstSize, const void *src, size_t srcSize, const HUF_CElt *CTable);
 | |
| 
 | |
| typedef enum {
 | |
| 	HUF_repeat_none,  /**< Cannot use the previous table */
 | |
| 	HUF_repeat_check, /**< Can use the previous table but it must be checked. Note : The previous table must have been constructed by HUF_compress{1,
 | |
| 			     4}X_repeat */
 | |
| 	HUF_repeat_valid  /**< Can use the previous table and it is asumed to be valid */
 | |
| } HUF_repeat;
 | |
| /** HUF_compress4X_repeat() :
 | |
| *   Same as HUF_compress4X_wksp(), but considers using hufTable if *repeat != HUF_repeat_none.
 | |
| *   If it uses hufTable it does not modify hufTable or repeat.
 | |
| *   If it doesn't, it sets *repeat = HUF_repeat_none, and it sets hufTable to the table used.
 | |
| *   If preferRepeat then the old table will always be used if valid. */
 | |
| size_t HUF_compress4X_repeat(void *dst, size_t dstSize, const void *src, size_t srcSize, unsigned maxSymbolValue, unsigned tableLog, void *workSpace,
 | |
| 			     size_t wkspSize, HUF_CElt *hufTable, HUF_repeat *repeat,
 | |
| 			     int preferRepeat); /**< `workSpace` must be a table of at least HUF_COMPRESS_WORKSPACE_SIZE_U32 unsigned */
 | |
| 
 | |
| /** HUF_buildCTable_wksp() :
 | |
|  *  Same as HUF_buildCTable(), but using externally allocated scratch buffer.
 | |
|  *  `workSpace` must be aligned on 4-bytes boundaries, and be at least as large as a table of 1024 unsigned.
 | |
|  */
 | |
| size_t HUF_buildCTable_wksp(HUF_CElt *tree, const U32 *count, U32 maxSymbolValue, U32 maxNbBits, void *workSpace, size_t wkspSize);
 | |
| 
 | |
| /*! HUF_readStats() :
 | |
| 	Read compact Huffman tree, saved by HUF_writeCTable().
 | |
| 	`huffWeight` is destination buffer.
 | |
| 	@return : size read from `src` , or an error Code .
 | |
| 	Note : Needed by HUF_readCTable() and HUF_readDTableXn() . */
 | |
| size_t HUF_readStats_wksp(BYTE *huffWeight, size_t hwSize, U32 *rankStats, U32 *nbSymbolsPtr, U32 *tableLogPtr, const void *src, size_t srcSize,
 | |
| 			  void *workspace, size_t workspaceSize);
 | |
| 
 | |
| /** HUF_readCTable() :
 | |
| *   Loading a CTable saved with HUF_writeCTable() */
 | |
| size_t HUF_readCTable_wksp(HUF_CElt *CTable, unsigned maxSymbolValue, const void *src, size_t srcSize, void *workspace, size_t workspaceSize);
 | |
| 
 | |
| /*
 | |
| HUF_decompress() does the following:
 | |
| 1. select the decompression algorithm (X2, X4) based on pre-computed heuristics
 | |
| 2. build Huffman table from save, using HUF_readDTableXn()
 | |
| 3. decode 1 or 4 segments in parallel using HUF_decompressSXn_usingDTable
 | |
| */
 | |
| 
 | |
| /** HUF_selectDecoder() :
 | |
| *   Tells which decoder is likely to decode faster,
 | |
| *   based on a set of pre-determined metrics.
 | |
| *   @return : 0==HUF_decompress4X2, 1==HUF_decompress4X4 .
 | |
| *   Assumption : 0 < cSrcSize < dstSize <= 128 KB */
 | |
| U32 HUF_selectDecoder(size_t dstSize, size_t cSrcSize);
 | |
| 
 | |
| size_t HUF_readDTableX2_wksp(HUF_DTable *DTable, const void *src, size_t srcSize, void *workspace, size_t workspaceSize);
 | |
| size_t HUF_readDTableX4_wksp(HUF_DTable *DTable, const void *src, size_t srcSize, void *workspace, size_t workspaceSize);
 | |
| 
 | |
| size_t HUF_decompress4X_usingDTable(void *dst, size_t maxDstSize, const void *cSrc, size_t cSrcSize, const HUF_DTable *DTable);
 | |
| size_t HUF_decompress4X2_usingDTable(void *dst, size_t maxDstSize, const void *cSrc, size_t cSrcSize, const HUF_DTable *DTable);
 | |
| size_t HUF_decompress4X4_usingDTable(void *dst, size_t maxDstSize, const void *cSrc, size_t cSrcSize, const HUF_DTable *DTable);
 | |
| 
 | |
| /* single stream variants */
 | |
| 
 | |
| size_t HUF_compress1X_wksp(void *dst, size_t dstSize, const void *src, size_t srcSize, unsigned maxSymbolValue, unsigned tableLog, void *workSpace,
 | |
| 			   size_t wkspSize); /**< `workSpace` must be a table of at least HUF_COMPRESS_WORKSPACE_SIZE_U32 unsigned */
 | |
| size_t HUF_compress1X_usingCTable(void *dst, size_t dstSize, const void *src, size_t srcSize, const HUF_CElt *CTable);
 | |
| /** HUF_compress1X_repeat() :
 | |
| *   Same as HUF_compress1X_wksp(), but considers using hufTable if *repeat != HUF_repeat_none.
 | |
| *   If it uses hufTable it does not modify hufTable or repeat.
 | |
| *   If it doesn't, it sets *repeat = HUF_repeat_none, and it sets hufTable to the table used.
 | |
| *   If preferRepeat then the old table will always be used if valid. */
 | |
| size_t HUF_compress1X_repeat(void *dst, size_t dstSize, const void *src, size_t srcSize, unsigned maxSymbolValue, unsigned tableLog, void *workSpace,
 | |
| 			     size_t wkspSize, HUF_CElt *hufTable, HUF_repeat *repeat,
 | |
| 			     int preferRepeat); /**< `workSpace` must be a table of at least HUF_COMPRESS_WORKSPACE_SIZE_U32 unsigned */
 | |
| 
 | |
| size_t HUF_decompress1X_DCtx_wksp(HUF_DTable *dctx, void *dst, size_t dstSize, const void *cSrc, size_t cSrcSize, void *workspace, size_t workspaceSize);
 | |
| size_t HUF_decompress1X2_DCtx_wksp(HUF_DTable *dctx, void *dst, size_t dstSize, const void *cSrc, size_t cSrcSize, void *workspace,
 | |
| 				   size_t workspaceSize); /**< single-symbol decoder */
 | |
| size_t HUF_decompress1X4_DCtx_wksp(HUF_DTable *dctx, void *dst, size_t dstSize, const void *cSrc, size_t cSrcSize, void *workspace,
 | |
| 				   size_t workspaceSize); /**< double-symbols decoder */
 | |
| 
 | |
| size_t HUF_decompress1X_usingDTable(void *dst, size_t maxDstSize, const void *cSrc, size_t cSrcSize,
 | |
| 				    const HUF_DTable *DTable); /**< automatic selection of sing or double symbol decoder, based on DTable */
 | |
| size_t HUF_decompress1X2_usingDTable(void *dst, size_t maxDstSize, const void *cSrc, size_t cSrcSize, const HUF_DTable *DTable);
 | |
| size_t HUF_decompress1X4_usingDTable(void *dst, size_t maxDstSize, const void *cSrc, size_t cSrcSize, const HUF_DTable *DTable);
 | |
| 
 | |
| #endif /* HUF_H_298734234 */
 |