1*f739fcd8STom Rini // SPDX-License-Identifier: BSD-2-Clause
2027b728dSJulius Werner /*
3027b728dSJulius Werner LZ4 - Fast LZ compression algorithm
4027b728dSJulius Werner Copyright (C) 2011-2015, Yann Collet.
5027b728dSJulius Werner
6027b728dSJulius Werner You can contact the author at :
7027b728dSJulius Werner - LZ4 source repository : https://github.com/Cyan4973/lz4
8027b728dSJulius Werner - LZ4 public forum : https://groups.google.com/forum/#!forum/lz4c
9027b728dSJulius Werner */
10027b728dSJulius Werner
11027b728dSJulius Werner
12027b728dSJulius Werner /**************************************
13027b728dSJulius Werner * Reading and writing into memory
14027b728dSJulius Werner **************************************/
15027b728dSJulius Werner
16027b728dSJulius Werner /* customized version of memcpy, which may overwrite up to 7 bytes beyond dstEnd */
LZ4_wildCopy(void * dstPtr,const void * srcPtr,void * dstEnd)17027b728dSJulius Werner static void LZ4_wildCopy(void* dstPtr, const void* srcPtr, void* dstEnd)
18027b728dSJulius Werner {
19027b728dSJulius Werner BYTE* d = (BYTE*)dstPtr;
20027b728dSJulius Werner const BYTE* s = (const BYTE*)srcPtr;
21027b728dSJulius Werner BYTE* e = (BYTE*)dstEnd;
22027b728dSJulius Werner do { LZ4_copy8(d,s); d+=8; s+=8; } while (d<e);
23027b728dSJulius Werner }
24027b728dSJulius Werner
25027b728dSJulius Werner
26027b728dSJulius Werner /**************************************
27027b728dSJulius Werner * Common Constants
28027b728dSJulius Werner **************************************/
29027b728dSJulius Werner #define MINMATCH 4
30027b728dSJulius Werner
31027b728dSJulius Werner #define COPYLENGTH 8
32027b728dSJulius Werner #define LASTLITERALS 5
33027b728dSJulius Werner #define MFLIMIT (COPYLENGTH+MINMATCH)
34027b728dSJulius Werner static const int LZ4_minLength = (MFLIMIT+1);
35027b728dSJulius Werner
36027b728dSJulius Werner #define KB *(1 <<10)
37027b728dSJulius Werner #define MB *(1 <<20)
38027b728dSJulius Werner #define GB *(1U<<30)
39027b728dSJulius Werner
40027b728dSJulius Werner #define MAXD_LOG 16
41027b728dSJulius Werner #define MAX_DISTANCE ((1 << MAXD_LOG) - 1)
42027b728dSJulius Werner
43027b728dSJulius Werner #define ML_BITS 4
44027b728dSJulius Werner #define ML_MASK ((1U<<ML_BITS)-1)
45027b728dSJulius Werner #define RUN_BITS (8-ML_BITS)
46027b728dSJulius Werner #define RUN_MASK ((1U<<RUN_BITS)-1)
47027b728dSJulius Werner
48027b728dSJulius Werner
49027b728dSJulius Werner /**************************************
50027b728dSJulius Werner * Local Structures and types
51027b728dSJulius Werner **************************************/
52027b728dSJulius Werner typedef enum { noDict = 0, withPrefix64k, usingExtDict } dict_directive;
53027b728dSJulius Werner typedef enum { endOnOutputSize = 0, endOnInputSize = 1 } endCondition_directive;
54027b728dSJulius Werner typedef enum { full = 0, partial = 1 } earlyEnd_directive;
55027b728dSJulius Werner
56027b728dSJulius Werner
57027b728dSJulius Werner
58027b728dSJulius Werner /*******************************
59027b728dSJulius Werner * Decompression functions
60027b728dSJulius Werner *******************************/
61027b728dSJulius Werner /*
62027b728dSJulius Werner * This generic decompression function cover all use cases.
63027b728dSJulius Werner * It shall be instantiated several times, using different sets of directives
64027b728dSJulius Werner * Note that it is essential this generic function is really inlined,
65027b728dSJulius Werner * in order to remove useless branches during compilation optimization.
66027b728dSJulius Werner */
LZ4_decompress_generic(const char * const source,char * const dest,int inputSize,int outputSize,int endOnInput,int partialDecoding,int targetOutputSize,int dict,const BYTE * const lowPrefix,const BYTE * const dictStart,const size_t dictSize)67027b728dSJulius Werner FORCE_INLINE int LZ4_decompress_generic(
68027b728dSJulius Werner const char* const source,
69027b728dSJulius Werner char* const dest,
70027b728dSJulius Werner int inputSize,
71027b728dSJulius Werner int outputSize, /* If endOnInput==endOnInputSize, this value is the max size of Output Buffer. */
72027b728dSJulius Werner
73027b728dSJulius Werner int endOnInput, /* endOnOutputSize, endOnInputSize */
74027b728dSJulius Werner int partialDecoding, /* full, partial */
75027b728dSJulius Werner int targetOutputSize, /* only used if partialDecoding==partial */
76027b728dSJulius Werner int dict, /* noDict, withPrefix64k, usingExtDict */
77027b728dSJulius Werner const BYTE* const lowPrefix, /* == dest if dict == noDict */
78027b728dSJulius Werner const BYTE* const dictStart, /* only if dict==usingExtDict */
79027b728dSJulius Werner const size_t dictSize /* note : = 0 if noDict */
80027b728dSJulius Werner )
81027b728dSJulius Werner {
82027b728dSJulius Werner /* Local Variables */
83027b728dSJulius Werner const BYTE* ip = (const BYTE*) source;
84027b728dSJulius Werner const BYTE* const iend = ip + inputSize;
85027b728dSJulius Werner
86027b728dSJulius Werner BYTE* op = (BYTE*) dest;
87027b728dSJulius Werner BYTE* const oend = op + outputSize;
88027b728dSJulius Werner BYTE* cpy;
89027b728dSJulius Werner BYTE* oexit = op + targetOutputSize;
90027b728dSJulius Werner const BYTE* const lowLimit = lowPrefix - dictSize;
91027b728dSJulius Werner
92027b728dSJulius Werner const BYTE* const dictEnd = (const BYTE*)dictStart + dictSize;
93027b728dSJulius Werner const size_t dec32table[] = {4, 1, 2, 1, 4, 4, 4, 4};
94027b728dSJulius Werner const size_t dec64table[] = {0, 0, 0, (size_t)-1, 0, 1, 2, 3};
95027b728dSJulius Werner
96027b728dSJulius Werner const int safeDecode = (endOnInput==endOnInputSize);
97027b728dSJulius Werner const int checkOffset = ((safeDecode) && (dictSize < (int)(64 KB)));
98027b728dSJulius Werner
99027b728dSJulius Werner
100027b728dSJulius Werner /* Special cases */
101027b728dSJulius Werner if ((partialDecoding) && (oexit> oend-MFLIMIT)) oexit = oend-MFLIMIT; /* targetOutputSize too high => decode everything */
102027b728dSJulius Werner if ((endOnInput) && (unlikely(outputSize==0))) return ((inputSize==1) && (*ip==0)) ? 0 : -1; /* Empty output buffer */
103027b728dSJulius Werner if ((!endOnInput) && (unlikely(outputSize==0))) return (*ip==0?1:-1);
104027b728dSJulius Werner
105027b728dSJulius Werner
106027b728dSJulius Werner /* Main Loop */
107027b728dSJulius Werner while (1)
108027b728dSJulius Werner {
109027b728dSJulius Werner unsigned token;
110027b728dSJulius Werner size_t length;
111027b728dSJulius Werner const BYTE* match;
112027b728dSJulius Werner
113027b728dSJulius Werner /* get literal length */
114027b728dSJulius Werner token = *ip++;
115027b728dSJulius Werner if ((length=(token>>ML_BITS)) == RUN_MASK)
116027b728dSJulius Werner {
117027b728dSJulius Werner unsigned s;
118027b728dSJulius Werner do
119027b728dSJulius Werner {
120027b728dSJulius Werner s = *ip++;
121027b728dSJulius Werner length += s;
122027b728dSJulius Werner }
123027b728dSJulius Werner while (likely((endOnInput)?ip<iend-RUN_MASK:1) && (s==255));
124027b728dSJulius Werner if ((safeDecode) && unlikely((size_t)(op+length)<(size_t)(op))) goto _output_error; /* overflow detection */
125027b728dSJulius Werner if ((safeDecode) && unlikely((size_t)(ip+length)<(size_t)(ip))) goto _output_error; /* overflow detection */
126027b728dSJulius Werner }
127027b728dSJulius Werner
128027b728dSJulius Werner /* copy literals */
129027b728dSJulius Werner cpy = op+length;
130027b728dSJulius Werner if (((endOnInput) && ((cpy>(partialDecoding?oexit:oend-MFLIMIT)) || (ip+length>iend-(2+1+LASTLITERALS))) )
131027b728dSJulius Werner || ((!endOnInput) && (cpy>oend-COPYLENGTH)))
132027b728dSJulius Werner {
133027b728dSJulius Werner if (partialDecoding)
134027b728dSJulius Werner {
135027b728dSJulius Werner if (cpy > oend) goto _output_error; /* Error : write attempt beyond end of output buffer */
136027b728dSJulius Werner if ((endOnInput) && (ip+length > iend)) goto _output_error; /* Error : read attempt beyond end of input buffer */
137027b728dSJulius Werner }
138027b728dSJulius Werner else
139027b728dSJulius Werner {
140027b728dSJulius Werner if ((!endOnInput) && (cpy != oend)) goto _output_error; /* Error : block decoding must stop exactly there */
141027b728dSJulius Werner if ((endOnInput) && ((ip+length != iend) || (cpy > oend))) goto _output_error; /* Error : input must be consumed */
142027b728dSJulius Werner }
143027b728dSJulius Werner memcpy(op, ip, length);
144027b728dSJulius Werner ip += length;
145027b728dSJulius Werner op += length;
146027b728dSJulius Werner break; /* Necessarily EOF, due to parsing restrictions */
147027b728dSJulius Werner }
148027b728dSJulius Werner LZ4_wildCopy(op, ip, cpy);
149027b728dSJulius Werner ip += length; op = cpy;
150027b728dSJulius Werner
151027b728dSJulius Werner /* get offset */
152027b728dSJulius Werner match = cpy - LZ4_readLE16(ip); ip+=2;
153027b728dSJulius Werner if ((checkOffset) && (unlikely(match < lowLimit))) goto _output_error; /* Error : offset outside destination buffer */
154027b728dSJulius Werner
155027b728dSJulius Werner /* get matchlength */
156027b728dSJulius Werner length = token & ML_MASK;
157027b728dSJulius Werner if (length == ML_MASK)
158027b728dSJulius Werner {
159027b728dSJulius Werner unsigned s;
160027b728dSJulius Werner do
161027b728dSJulius Werner {
162027b728dSJulius Werner if ((endOnInput) && (ip > iend-LASTLITERALS)) goto _output_error;
163027b728dSJulius Werner s = *ip++;
164027b728dSJulius Werner length += s;
165027b728dSJulius Werner } while (s==255);
166027b728dSJulius Werner if ((safeDecode) && unlikely((size_t)(op+length)<(size_t)op)) goto _output_error; /* overflow detection */
167027b728dSJulius Werner }
168027b728dSJulius Werner length += MINMATCH;
169027b728dSJulius Werner
170027b728dSJulius Werner /* check external dictionary */
171027b728dSJulius Werner if ((dict==usingExtDict) && (match < lowPrefix))
172027b728dSJulius Werner {
173027b728dSJulius Werner if (unlikely(op+length > oend-LASTLITERALS)) goto _output_error; /* doesn't respect parsing restriction */
174027b728dSJulius Werner
175027b728dSJulius Werner if (length <= (size_t)(lowPrefix-match))
176027b728dSJulius Werner {
177027b728dSJulius Werner /* match can be copied as a single segment from external dictionary */
178027b728dSJulius Werner match = dictEnd - (lowPrefix-match);
179027b728dSJulius Werner memmove(op, match, length); op += length;
180027b728dSJulius Werner }
181027b728dSJulius Werner else
182027b728dSJulius Werner {
183027b728dSJulius Werner /* match encompass external dictionary and current segment */
184027b728dSJulius Werner size_t copySize = (size_t)(lowPrefix-match);
185027b728dSJulius Werner memcpy(op, dictEnd - copySize, copySize);
186027b728dSJulius Werner op += copySize;
187027b728dSJulius Werner copySize = length - copySize;
188027b728dSJulius Werner if (copySize > (size_t)(op-lowPrefix)) /* overlap within current segment */
189027b728dSJulius Werner {
190027b728dSJulius Werner BYTE* const endOfMatch = op + copySize;
191027b728dSJulius Werner const BYTE* copyFrom = lowPrefix;
192027b728dSJulius Werner while (op < endOfMatch) *op++ = *copyFrom++;
193027b728dSJulius Werner }
194027b728dSJulius Werner else
195027b728dSJulius Werner {
196027b728dSJulius Werner memcpy(op, lowPrefix, copySize);
197027b728dSJulius Werner op += copySize;
198027b728dSJulius Werner }
199027b728dSJulius Werner }
200027b728dSJulius Werner continue;
201027b728dSJulius Werner }
202027b728dSJulius Werner
203027b728dSJulius Werner /* copy repeated sequence */
204027b728dSJulius Werner cpy = op + length;
205027b728dSJulius Werner if (unlikely((op-match)<8))
206027b728dSJulius Werner {
207027b728dSJulius Werner const size_t dec64 = dec64table[op-match];
208027b728dSJulius Werner op[0] = match[0];
209027b728dSJulius Werner op[1] = match[1];
210027b728dSJulius Werner op[2] = match[2];
211027b728dSJulius Werner op[3] = match[3];
212027b728dSJulius Werner match += dec32table[op-match];
213027b728dSJulius Werner LZ4_copy4(op+4, match);
214027b728dSJulius Werner op += 8; match -= dec64;
215027b728dSJulius Werner } else { LZ4_copy8(op, match); op+=8; match+=8; }
216027b728dSJulius Werner
217027b728dSJulius Werner if (unlikely(cpy>oend-12))
218027b728dSJulius Werner {
219027b728dSJulius Werner if (cpy > oend-LASTLITERALS) goto _output_error; /* Error : last LASTLITERALS bytes must be literals */
220027b728dSJulius Werner if (op < oend-8)
221027b728dSJulius Werner {
222027b728dSJulius Werner LZ4_wildCopy(op, match, oend-8);
223027b728dSJulius Werner match += (oend-8) - op;
224027b728dSJulius Werner op = oend-8;
225027b728dSJulius Werner }
226027b728dSJulius Werner while (op<cpy) *op++ = *match++;
227027b728dSJulius Werner }
228027b728dSJulius Werner else
229027b728dSJulius Werner LZ4_wildCopy(op, match, cpy);
230027b728dSJulius Werner op=cpy; /* correction */
231027b728dSJulius Werner }
232027b728dSJulius Werner
233027b728dSJulius Werner /* end of decoding */
234027b728dSJulius Werner if (endOnInput)
235027b728dSJulius Werner return (int) (((char*)op)-dest); /* Nb of output bytes decoded */
236027b728dSJulius Werner else
237027b728dSJulius Werner return (int) (((const char*)ip)-source); /* Nb of input bytes read */
238027b728dSJulius Werner
239027b728dSJulius Werner /* Overflow error detected */
240027b728dSJulius Werner _output_error:
241027b728dSJulius Werner return (int) (-(((const char*)ip)-source))-1;
242027b728dSJulius Werner }
243