1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43#define FORCE_INLINE static __always_inline
44
45
46
47
48#include "bitstream.h"
49#include "fse.h"
50#include "zstd_internal.h"
51#include <linux/compiler.h>
52#include <linux/kernel.h>
53#include <linux/string.h>
54
55
56
57
58#define FSE_isError ERR_isError
59#define FSE_STATIC_ASSERT(c) \
60 { \
61 enum { FSE_static_assert = 1 / (int)(!!(c)) }; \
62 }
63
64
65
66
67
68
69
70
71
72
73
74#ifndef FSE_FUNCTION_EXTENSION
75#error "FSE_FUNCTION_EXTENSION must be defined"
76#endif
77#ifndef FSE_FUNCTION_TYPE
78#error "FSE_FUNCTION_TYPE must be defined"
79#endif
80
81
82#define FSE_CAT(X, Y) X##Y
83#define FSE_FUNCTION_NAME(X, Y) FSE_CAT(X, Y)
84#define FSE_TYPE_NAME(X, Y) FSE_CAT(X, Y)
85
86
87
88size_t FSE_buildDTable_wksp(FSE_DTable *dt, const short *normalizedCounter, unsigned maxSymbolValue, unsigned tableLog, void *workspace, size_t workspaceSize)
89{
90 void *const tdPtr = dt + 1;
91 FSE_DECODE_TYPE *const tableDecode = (FSE_DECODE_TYPE *)(tdPtr);
92 U16 *symbolNext = (U16 *)workspace;
93
94 U32 const maxSV1 = maxSymbolValue + 1;
95 U32 const tableSize = 1 << tableLog;
96 U32 highThreshold = tableSize - 1;
97
98
99 if (workspaceSize < sizeof(U16) * (FSE_MAX_SYMBOL_VALUE + 1))
100 return ERROR(tableLog_tooLarge);
101 if (maxSymbolValue > FSE_MAX_SYMBOL_VALUE)
102 return ERROR(maxSymbolValue_tooLarge);
103 if (tableLog > FSE_MAX_TABLELOG)
104 return ERROR(tableLog_tooLarge);
105
106
107 {
108 FSE_DTableHeader DTableH;
109 DTableH.tableLog = (U16)tableLog;
110 DTableH.fastMode = 1;
111 {
112 S16 const largeLimit = (S16)(1 << (tableLog - 1));
113 U32 s;
114 for (s = 0; s < maxSV1; s++) {
115 if (normalizedCounter[s] == -1) {
116 tableDecode[highThreshold--].symbol = (FSE_FUNCTION_TYPE)s;
117 symbolNext[s] = 1;
118 } else {
119 if (normalizedCounter[s] >= largeLimit)
120 DTableH.fastMode = 0;
121 symbolNext[s] = normalizedCounter[s];
122 }
123 }
124 }
125 memcpy(dt, &DTableH, sizeof(DTableH));
126 }
127
128
129 {
130 U32 const tableMask = tableSize - 1;
131 U32 const step = FSE_TABLESTEP(tableSize);
132 U32 s, position = 0;
133 for (s = 0; s < maxSV1; s++) {
134 int i;
135 for (i = 0; i < normalizedCounter[s]; i++) {
136 tableDecode[position].symbol = (FSE_FUNCTION_TYPE)s;
137 position = (position + step) & tableMask;
138 while (position > highThreshold)
139 position = (position + step) & tableMask;
140 }
141 }
142 if (position != 0)
143 return ERROR(GENERIC);
144 }
145
146
147 {
148 U32 u;
149 for (u = 0; u < tableSize; u++) {
150 FSE_FUNCTION_TYPE const symbol = (FSE_FUNCTION_TYPE)(tableDecode[u].symbol);
151 U16 nextState = symbolNext[symbol]++;
152 tableDecode[u].nbBits = (BYTE)(tableLog - BIT_highbit32((U32)nextState));
153 tableDecode[u].newState = (U16)((nextState << tableDecode[u].nbBits) - tableSize);
154 }
155 }
156
157 return 0;
158}
159
160
161
162
163size_t FSE_buildDTable_rle(FSE_DTable *dt, BYTE symbolValue)
164{
165 void *ptr = dt;
166 FSE_DTableHeader *const DTableH = (FSE_DTableHeader *)ptr;
167 void *dPtr = dt + 1;
168 FSE_decode_t *const cell = (FSE_decode_t *)dPtr;
169
170 DTableH->tableLog = 0;
171 DTableH->fastMode = 0;
172
173 cell->newState = 0;
174 cell->symbol = symbolValue;
175 cell->nbBits = 0;
176
177 return 0;
178}
179
180size_t FSE_buildDTable_raw(FSE_DTable *dt, unsigned nbBits)
181{
182 void *ptr = dt;
183 FSE_DTableHeader *const DTableH = (FSE_DTableHeader *)ptr;
184 void *dPtr = dt + 1;
185 FSE_decode_t *const dinfo = (FSE_decode_t *)dPtr;
186 const unsigned tableSize = 1 << nbBits;
187 const unsigned tableMask = tableSize - 1;
188 const unsigned maxSV1 = tableMask + 1;
189 unsigned s;
190
191
192 if (nbBits < 1)
193 return ERROR(GENERIC);
194
195
196 DTableH->tableLog = (U16)nbBits;
197 DTableH->fastMode = 1;
198 for (s = 0; s < maxSV1; s++) {
199 dinfo[s].newState = 0;
200 dinfo[s].symbol = (BYTE)s;
201 dinfo[s].nbBits = (BYTE)nbBits;
202 }
203
204 return 0;
205}
206
207FORCE_INLINE size_t FSE_decompress_usingDTable_generic(void *dst, size_t maxDstSize, const void *cSrc, size_t cSrcSize, const FSE_DTable *dt,
208 const unsigned fast)
209{
210 BYTE *const ostart = (BYTE *)dst;
211 BYTE *op = ostart;
212 BYTE *const omax = op + maxDstSize;
213 BYTE *const olimit = omax - 3;
214
215 BIT_DStream_t bitD;
216 FSE_DState_t state1;
217 FSE_DState_t state2;
218
219
220 CHECK_F(BIT_initDStream(&bitD, cSrc, cSrcSize));
221
222 FSE_initDState(&state1, &bitD, dt);
223 FSE_initDState(&state2, &bitD, dt);
224
225#define FSE_GETSYMBOL(statePtr) fast ? FSE_decodeSymbolFast(statePtr, &bitD) : FSE_decodeSymbol(statePtr, &bitD)
226
227
228 for (; (BIT_reloadDStream(&bitD) == BIT_DStream_unfinished) & (op < olimit); op += 4) {
229 op[0] = FSE_GETSYMBOL(&state1);
230
231 if (FSE_MAX_TABLELOG * 2 + 7 > sizeof(bitD.bitContainer) * 8)
232 BIT_reloadDStream(&bitD);
233
234 op[1] = FSE_GETSYMBOL(&state2);
235
236 if (FSE_MAX_TABLELOG * 4 + 7 > sizeof(bitD.bitContainer) * 8)
237 {
238 if (BIT_reloadDStream(&bitD) > BIT_DStream_unfinished) {
239 op += 2;
240 break;
241 }
242 }
243
244 op[2] = FSE_GETSYMBOL(&state1);
245
246 if (FSE_MAX_TABLELOG * 2 + 7 > sizeof(bitD.bitContainer) * 8)
247 BIT_reloadDStream(&bitD);
248
249 op[3] = FSE_GETSYMBOL(&state2);
250 }
251
252
253
254 while (1) {
255 if (op > (omax - 2))
256 return ERROR(dstSize_tooSmall);
257 *op++ = FSE_GETSYMBOL(&state1);
258 if (BIT_reloadDStream(&bitD) == BIT_DStream_overflow) {
259 *op++ = FSE_GETSYMBOL(&state2);
260 break;
261 }
262
263 if (op > (omax - 2))
264 return ERROR(dstSize_tooSmall);
265 *op++ = FSE_GETSYMBOL(&state2);
266 if (BIT_reloadDStream(&bitD) == BIT_DStream_overflow) {
267 *op++ = FSE_GETSYMBOL(&state1);
268 break;
269 }
270 }
271
272 return op - ostart;
273}
274
275size_t FSE_decompress_usingDTable(void *dst, size_t originalSize, const void *cSrc, size_t cSrcSize, const FSE_DTable *dt)
276{
277 const void *ptr = dt;
278 const FSE_DTableHeader *DTableH = (const FSE_DTableHeader *)ptr;
279 const U32 fastMode = DTableH->fastMode;
280
281
282 if (fastMode)
283 return FSE_decompress_usingDTable_generic(dst, originalSize, cSrc, cSrcSize, dt, 1);
284 return FSE_decompress_usingDTable_generic(dst, originalSize, cSrc, cSrcSize, dt, 0);
285}
286
287size_t FSE_decompress_wksp(void *dst, size_t dstCapacity, const void *cSrc, size_t cSrcSize, unsigned maxLog, void *workspace, size_t workspaceSize)
288{
289 const BYTE *const istart = (const BYTE *)cSrc;
290 const BYTE *ip = istart;
291 unsigned tableLog;
292 unsigned maxSymbolValue = FSE_MAX_SYMBOL_VALUE;
293 size_t NCountLength;
294
295 FSE_DTable *dt;
296 short *counting;
297 size_t spaceUsed32 = 0;
298
299 FSE_STATIC_ASSERT(sizeof(FSE_DTable) == sizeof(U32));
300
301 dt = (FSE_DTable *)((U32 *)workspace + spaceUsed32);
302 spaceUsed32 += FSE_DTABLE_SIZE_U32(maxLog);
303 counting = (short *)((U32 *)workspace + spaceUsed32);
304 spaceUsed32 += ALIGN(sizeof(short) * (FSE_MAX_SYMBOL_VALUE + 1), sizeof(U32)) >> 2;
305
306 if ((spaceUsed32 << 2) > workspaceSize)
307 return ERROR(tableLog_tooLarge);
308 workspace = (U32 *)workspace + spaceUsed32;
309 workspaceSize -= (spaceUsed32 << 2);
310
311
312 NCountLength = FSE_readNCount(counting, &maxSymbolValue, &tableLog, istart, cSrcSize);
313 if (FSE_isError(NCountLength))
314 return NCountLength;
315
316
317 if (tableLog > maxLog)
318 return ERROR(tableLog_tooLarge);
319 ip += NCountLength;
320 cSrcSize -= NCountLength;
321
322 CHECK_F(FSE_buildDTable_wksp(dt, counting, maxSymbolValue, tableLog, workspace, workspaceSize));
323
324 return FSE_decompress_usingDTable(dst, dstCapacity, ip, cSrcSize, dt);
325}
326