blob: 9d3c694e4431ebfb618706709b711012f816017c [file] [log] [blame]
/* LzFind.c -- Match finder for LZ algorithms
2009-04-22 : Igor Pavlov : Public domain */
3
4#include <string.h>
5
6#include "LzFind.h"
7#include "LzHash.h"
8
/* Value written into hash/son slots that hold no position. */
#define kEmptyHashValue 0
/* When p->pos reaches this value, MatchFinder_CheckLimits normalizes offsets. */
#define kMaxValForNormalize ((uint32_t)0xFFFFFFFF)
#define kNormalizeStepMin (1 << 10) /* it must be power of 2 */
/* Rounds the normalization amount down to a multiple of kNormalizeStepMin. */
#define kNormalizeMask (~(kNormalizeStepMin - 1))
/* MatchFinder_Create rejects history sizes larger than this. */
#define kMaxHistorySize ((uint32_t)3 << 30)

#define kStartMaxLen 3
16
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -060017static void LzInWindow_Free(struct CMatchFinder *p, struct ISzAlloc *alloc)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070018{
19 if (!p->directInput)
20 {
21 alloc->Free(alloc, p->bufferBase);
22 p->bufferBase = 0;
23 }
24}
25
26/* keepSizeBefore + keepSizeAfter + keepSizeReserv must be < 4G) */
27
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -060028static int LzInWindow_Create(struct CMatchFinder *p, uint32_t keepSizeReserv, struct ISzAlloc *alloc)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070029{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -060030 uint32_t blockSize = p->keepSizeBefore + p->keepSizeAfter + keepSizeReserv;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070031 if (p->directInput)
32 {
33 p->blockSize = blockSize;
34 return 1;
35 }
36 if (p->bufferBase == 0 || p->blockSize != blockSize)
37 {
38 LzInWindow_Free(p, alloc);
39 p->blockSize = blockSize;
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -060040 p->bufferBase = (uint8_t *)alloc->Alloc(alloc, (size_t)blockSize);
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070041 }
42 return (p->bufferBase != 0);
43}
44
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -060045uint8_t *MatchFinder_GetPointerToCurrentPos(struct CMatchFinder *p) { return p->buffer; }
46static uint8_t MatchFinder_GetIndexByte(struct CMatchFinder *p, int32_t bindex) { return p->buffer[bindex]; }
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070047
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -060048static uint32_t MatchFinder_GetNumAvailableBytes(struct CMatchFinder *p) { return p->streamPos - p->pos; }
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070049
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -060050void MatchFinder_ReduceOffsets(struct CMatchFinder *p, uint32_t subValue)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070051{
52 p->posLimit -= subValue;
53 p->pos -= subValue;
54 p->streamPos -= subValue;
55}
56
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -060057static void MatchFinder_ReadBlock(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070058{
59 if (p->streamEndWasReached || p->result != SZ_OK)
60 return;
61 if (p->directInput)
62 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -060063 uint32_t curSize = 0xFFFFFFFF - p->streamPos;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070064 if (curSize > p->directInputRem)
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -060065 curSize = (uint32_t)p->directInputRem;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070066 p->directInputRem -= curSize;
67 p->streamPos += curSize;
68 if (p->directInputRem == 0)
69 p->streamEndWasReached = 1;
70 return;
71 }
72 for (;;)
73 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -060074 uint8_t *dest = p->buffer + (p->streamPos - p->pos);
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070075 size_t size = (p->bufferBase + p->blockSize - dest);
76 if (size == 0)
77 return;
78 p->result = p->stream->Read(p->stream, dest, &size);
79 if (p->result != SZ_OK)
80 return;
81 if (size == 0)
82 {
83 p->streamEndWasReached = 1;
84 return;
85 }
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -060086 p->streamPos += (uint32_t)size;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070087 if (p->streamPos - p->pos > p->keepSizeAfter)
88 return;
89 }
90}
91
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -060092void MatchFinder_MoveBlock(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -070093{
94 memmove(p->bufferBase,
95 p->buffer - p->keepSizeBefore,
96 (size_t)(p->streamPos - p->pos + p->keepSizeBefore));
97 p->buffer = p->bufferBase + p->keepSizeBefore;
98}
99
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600100int MatchFinder_NeedMove(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700101{
102 if (p->directInput)
103 return 0;
104 /* if (p->streamEndWasReached) return 0; */
105 return ((size_t)(p->bufferBase + p->blockSize - p->buffer) <= p->keepSizeAfter);
106}
107
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600108void MatchFinder_ReadIfRequired(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700109{
110 if (p->streamEndWasReached)
111 return;
112 if (p->keepSizeAfter >= p->streamPos - p->pos)
113 MatchFinder_ReadBlock(p);
114}
115
/* Moves the window to the front of the block if MatchFinder_NeedMove says so,
   then reads more input. */
static void MatchFinder_CheckAndMoveAndRead(struct CMatchFinder *p)
{
  const int mustMove = MatchFinder_NeedMove(p);

  if (mustMove)
    MatchFinder_MoveBlock(p);
  MatchFinder_ReadBlock(p);
}
122
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600123static void MatchFinder_SetDefaultSettings(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700124{
125 p->cutValue = 32;
126 p->btMode = 1;
127 p->numHashBytes = 4;
128 p->bigHash = 0;
129}
130
131#define kCrcPoly 0xEDB88320
132
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600133void MatchFinder_Construct(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700134{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600135 uint32_t i;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700136 p->bufferBase = 0;
137 p->directInput = 0;
138 p->hash = 0;
139 MatchFinder_SetDefaultSettings(p);
140
141 for (i = 0; i < 256; i++)
142 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600143 uint32_t r = i;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700144 int j;
145 for (j = 0; j < 8; j++)
146 r = (r >> 1) ^ (kCrcPoly & ~((r & 1) - 1));
147 p->crc[i] = r;
148 }
149}
150
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600151static void MatchFinder_FreeThisClassMemory(struct CMatchFinder *p, struct ISzAlloc *alloc)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700152{
153 alloc->Free(alloc, p->hash);
154 p->hash = 0;
155}
156
/* Releases everything the match finder allocated: first the hash table,
   then the input window buffer. */
void MatchFinder_Free(struct CMatchFinder *p, struct ISzAlloc *alloc)
{
  /* hash table */
  MatchFinder_FreeThisClassMemory(p, alloc);
  /* window buffer (skipped internally for direct input) */
  LzInWindow_Free(p, alloc);
}
162
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600163static CLzRef* AllocRefs(uint32_t num, struct ISzAlloc *alloc)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700164{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600165 size_t sizeInuint8_ts = (size_t)num * sizeof(CLzRef);
166 if (sizeInuint8_ts / sizeof(CLzRef) != num)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700167 return 0;
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600168 return (CLzRef *)alloc->Alloc(alloc, sizeInuint8_ts);
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700169}
170
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600171int MatchFinder_Create(struct CMatchFinder *p, uint32_t historySize,
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600172 uint32_t keepAddBufferBefore, uint32_t matchMaxLen, uint32_t keepAddBufferAfter,
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600173 struct ISzAlloc *alloc)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700174{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600175 uint32_t sizeReserv;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700176 if (historySize > kMaxHistorySize)
177 {
178 MatchFinder_Free(p, alloc);
179 return 0;
180 }
181 sizeReserv = historySize >> 1;
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600182 if (historySize > ((uint32_t)2 << 30))
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700183 sizeReserv = historySize >> 2;
184 sizeReserv += (keepAddBufferBefore + matchMaxLen + keepAddBufferAfter) / 2 + (1 << 19);
185
186 p->keepSizeBefore = historySize + keepAddBufferBefore + 1;
187 p->keepSizeAfter = matchMaxLen + keepAddBufferAfter;
188 /* we need one additional byte, since we use MoveBlock after pos++ and before dictionary using */
189 if (LzInWindow_Create(p, sizeReserv, alloc))
190 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600191 uint32_t newCyclicBufferSize = historySize + 1;
192 uint32_t hs;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700193 p->matchMaxLen = matchMaxLen;
194 {
195 p->fixedHashSize = 0;
196 if (p->numHashBytes == 2)
197 hs = (1 << 16) - 1;
198 else
199 {
200 hs = historySize - 1;
201 hs |= (hs >> 1);
202 hs |= (hs >> 2);
203 hs |= (hs >> 4);
204 hs |= (hs >> 8);
205 hs >>= 1;
206 hs |= 0xFFFF; /* don't change it! It's required for Deflate */
207 if (hs > (1 << 24))
208 {
209 if (p->numHashBytes == 3)
210 hs = (1 << 24) - 1;
211 else
212 hs >>= 1;
213 }
214 }
215 p->hashMask = hs;
216 hs++;
217 if (p->numHashBytes > 2) p->fixedHashSize += kHash2Size;
218 if (p->numHashBytes > 3) p->fixedHashSize += kHash3Size;
219 if (p->numHashBytes > 4) p->fixedHashSize += kHash4Size;
220 hs += p->fixedHashSize;
221 }
222
223 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600224 uint32_t prevSize = p->hashSizeSum + p->numSons;
225 uint32_t newSize;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700226 p->historySize = historySize;
227 p->hashSizeSum = hs;
228 p->cyclicBufferSize = newCyclicBufferSize;
229 p->numSons = (p->btMode ? newCyclicBufferSize * 2 : newCyclicBufferSize);
230 newSize = p->hashSizeSum + p->numSons;
231 if (p->hash != 0 && prevSize == newSize)
232 return 1;
233 MatchFinder_FreeThisClassMemory(p, alloc);
234 p->hash = AllocRefs(newSize, alloc);
235 if (p->hash != 0)
236 {
237 p->son = p->hash + p->hashSizeSum;
238 return 1;
239 }
240 }
241 }
242 MatchFinder_Free(p, alloc);
243 return 0;
244}
245
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600246static void MatchFinder_SetLimits(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700247{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600248 uint32_t limit = kMaxValForNormalize - p->pos;
249 uint32_t limit2 = p->cyclicBufferSize - p->cyclicBufferPos;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700250 if (limit2 < limit)
251 limit = limit2;
252 limit2 = p->streamPos - p->pos;
253 if (limit2 <= p->keepSizeAfter)
254 {
255 if (limit2 > 0)
256 limit2 = 1;
257 }
258 else
259 limit2 -= p->keepSizeAfter;
260 if (limit2 < limit)
261 limit = limit2;
262 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600263 uint32_t lenLimit = p->streamPos - p->pos;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700264 if (lenLimit > p->matchMaxLen)
265 lenLimit = p->matchMaxLen;
266 p->lenLimit = lenLimit;
267 }
268 p->posLimit = p->pos + limit;
269}
270
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600271void MatchFinder_Init(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700272{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600273 uint32_t i;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700274 for (i = 0; i < p->hashSizeSum; i++)
275 p->hash[i] = kEmptyHashValue;
276 p->cyclicBufferPos = 0;
277 p->buffer = p->bufferBase;
278 p->pos = p->streamPos = p->cyclicBufferSize;
279 p->result = SZ_OK;
280 p->streamEndWasReached = 0;
281 MatchFinder_ReadBlock(p);
282 MatchFinder_SetLimits(p);
283}
284
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600285static uint32_t MatchFinder_GetSubValue(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700286{
287 return (p->pos - p->historySize - 1) & kNormalizeMask;
288}
289
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600290void MatchFinder_Normalize3(uint32_t subValue, CLzRef *items, uint32_t numItems)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700291{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600292 uint32_t i;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700293 for (i = 0; i < numItems; i++)
294 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600295 uint32_t value = items[i];
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700296 if (value <= subValue)
297 value = kEmptyHashValue;
298 else
299 value -= subValue;
300 items[i] = value;
301 }
302}
303
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600304static void MatchFinder_Normalize(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700305{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600306 uint32_t subValue = MatchFinder_GetSubValue(p);
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700307 MatchFinder_Normalize3(subValue, p->hash, p->hashSizeSum + p->numSons);
308 MatchFinder_ReduceOffsets(p, subValue);
309}
310
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600311static void MatchFinder_CheckLimits(struct CMatchFinder *p)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700312{
313 if (p->pos == kMaxValForNormalize)
314 MatchFinder_Normalize(p);
315 if (!p->streamEndWasReached && p->keepSizeAfter == p->streamPos - p->pos)
316 MatchFinder_CheckAndMoveAndRead(p);
317 if (p->cyclicBufferPos == p->cyclicBufferSize)
318 p->cyclicBufferPos = 0;
319 MatchFinder_SetLimits(p);
320}
321
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600322static uint32_t * Hc_GetMatchesSpec(uint32_t lenLimit, uint32_t curMatch, uint32_t pos, const uint8_t *cur, CLzRef *son,
323 uint32_t _cyclicBufferPos, uint32_t _cyclicBufferSize, uint32_t cutValue,
324 uint32_t *distances, uint32_t maxLen)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700325{
326 son[_cyclicBufferPos] = curMatch;
327 for (;;)
328 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600329 uint32_t delta = pos - curMatch;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700330 if (cutValue-- == 0 || delta >= _cyclicBufferSize)
331 return distances;
332 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600333 const uint8_t *pb = cur - delta;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700334 curMatch = son[_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)];
335 if (pb[maxLen] == cur[maxLen] && *pb == *cur)
336 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600337 uint32_t len = 0;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700338 while (++len != lenLimit)
339 if (pb[len] != cur[len])
340 break;
341 if (maxLen < len)
342 {
343 *distances++ = maxLen = len;
344 *distances++ = delta - 1;
345 if (len == lenLimit)
346 return distances;
347 }
348 }
349 }
350 }
351}
352
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600353uint32_t * GetMatchesSpec1(uint32_t lenLimit, uint32_t curMatch, uint32_t pos, const uint8_t *cur, CLzRef *son,
354 uint32_t _cyclicBufferPos, uint32_t _cyclicBufferSize, uint32_t cutValue,
355 uint32_t *distances, uint32_t maxLen)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700356{
357 CLzRef *ptr0 = son + (_cyclicBufferPos << 1) + 1;
358 CLzRef *ptr1 = son + (_cyclicBufferPos << 1);
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600359 uint32_t len0 = 0, len1 = 0;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700360 for (;;)
361 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600362 uint32_t delta = pos - curMatch;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700363 if (cutValue-- == 0 || delta >= _cyclicBufferSize)
364 {
365 *ptr0 = *ptr1 = kEmptyHashValue;
366 return distances;
367 }
368 {
369 CLzRef *pair = son + ((_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)) << 1);
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600370 const uint8_t *pb = cur - delta;
371 uint32_t len = (len0 < len1 ? len0 : len1);
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700372 if (pb[len] == cur[len])
373 {
374 if (++len != lenLimit && pb[len] == cur[len])
375 while (++len != lenLimit)
376 if (pb[len] != cur[len])
377 break;
378 if (maxLen < len)
379 {
380 *distances++ = maxLen = len;
381 *distances++ = delta - 1;
382 if (len == lenLimit)
383 {
384 *ptr1 = pair[0];
385 *ptr0 = pair[1];
386 return distances;
387 }
388 }
389 }
390 if (pb[len] < cur[len])
391 {
392 *ptr1 = curMatch;
393 ptr1 = pair + 1;
394 curMatch = *ptr1;
395 len1 = len;
396 }
397 else
398 {
399 *ptr0 = curMatch;
400 ptr0 = pair;
401 curMatch = *ptr0;
402 len0 = len;
403 }
404 }
405 }
406}
407
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600408static void SkipMatchesSpec(uint32_t lenLimit, uint32_t curMatch, uint32_t pos, const uint8_t *cur, CLzRef *son,
409 uint32_t _cyclicBufferPos, uint32_t _cyclicBufferSize, uint32_t cutValue)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700410{
411 CLzRef *ptr0 = son + (_cyclicBufferPos << 1) + 1;
412 CLzRef *ptr1 = son + (_cyclicBufferPos << 1);
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600413 uint32_t len0 = 0, len1 = 0;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700414 for (;;)
415 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600416 uint32_t delta = pos - curMatch;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700417 if (cutValue-- == 0 || delta >= _cyclicBufferSize)
418 {
419 *ptr0 = *ptr1 = kEmptyHashValue;
420 return;
421 }
422 {
423 CLzRef *pair = son + ((_cyclicBufferPos - delta + ((delta > _cyclicBufferPos) ? _cyclicBufferSize : 0)) << 1);
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600424 const uint8_t *pb = cur - delta;
425 uint32_t len = (len0 < len1 ? len0 : len1);
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700426 if (pb[len] == cur[len])
427 {
428 while (++len != lenLimit)
429 if (pb[len] != cur[len])
430 break;
431 {
432 if (len == lenLimit)
433 {
434 *ptr1 = pair[0];
435 *ptr0 = pair[1];
436 return;
437 }
438 }
439 }
440 if (pb[len] < cur[len])
441 {
442 *ptr1 = curMatch;
443 ptr1 = pair + 1;
444 curMatch = *ptr1;
445 len1 = len;
446 }
447 else
448 {
449 *ptr0 = curMatch;
450 ptr0 = pair;
451 curMatch = *ptr0;
452 len0 = len;
453 }
454 }
455 }
456}
457
/* Advances the match finder `p` (taken from the enclosing scope) by one byte:
   bumps cyclicBufferPos, buffer and pos, and runs MatchFinder_CheckLimits
   when pos reaches posLimit.
   NOTE: expands to several statements, the last one an unbraced `if`; use it
   only as a standalone statement inside a braced block. */
#define MOVE_POS \
  ++p->cyclicBufferPos; \
  p->buffer++; \
  if (++p->pos == p->posLimit) MatchFinder_CheckLimits(p);

/* MOVE_POS followed by `return offset;` (`offset` comes from the enclosing scope). */
#define MOVE_POS_RET MOVE_POS return offset;
464
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600465static void MatchFinder_MovePos(struct CMatchFinder *p) { MOVE_POS; }
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700466
/* Common prologue of the GetMatches/Skip functions. Declares lenLimit,
   hashValue, cur and curMatch in the enclosing scope. If fewer than minLen
   bytes are available it just advances one position and executes ret_op;
   otherwise cur is set to the current buffer position. */
#define GET_MATCHES_HEADER2(minLen, ret_op) \
  uint32_t lenLimit; uint32_t hashValue; const uint8_t *cur; uint32_t curMatch; \
  lenLimit = p->lenLimit; { if (lenLimit < minLen) { MatchFinder_MovePos(p); ret_op; }} \
  cur = p->buffer;

/* Prologue for GetMatches functions: returns 0 matches when input is too short. */
#define GET_MATCHES_HEADER(minLen) GET_MATCHES_HEADER2(minLen, return 0)
/* Prologue for Skip functions: moves on to the next loop iteration instead. */
#define SKIP_HEADER(minLen) GET_MATCHES_HEADER2(minLen, continue)

/* The middle arguments shared by the *MatchesSpec helpers. */
#define MF_PARAMS(p) p->pos, p->buffer, p->son, p->cyclicBufferPos, p->cyclicBufferSize, p->cutValue

/* Epilogue for the Bt GetMatches functions: runs GetMatchesSpec1, stores the
   number of values written to distances in offset, advances and returns. */
#define GET_MATCHES_FOOTER(offset, maxLen) \
  offset = (uint32_t)(GetMatchesSpec1(lenLimit, curMatch, MF_PARAMS(p), \
  distances + offset, maxLen) - distances); MOVE_POS_RET;

/* Epilogue for the Bt Skip functions: inserts the position and advances. */
#define SKIP_FOOTER \
  SkipMatchesSpec(lenLimit, curMatch, MF_PARAMS(p)); MOVE_POS;
483
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600484static uint32_t Bt2_MatchFinder_GetMatches(struct CMatchFinder *p, uint32_t *distances)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700485{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600486 uint32_t offset;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700487 GET_MATCHES_HEADER(2)
488 HASH2_CALC;
489 curMatch = p->hash[hashValue];
490 p->hash[hashValue] = p->pos;
491 offset = 0;
492 GET_MATCHES_FOOTER(offset, 1)
493}
494
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600495uint32_t Bt3Zip_MatchFinder_GetMatches(struct CMatchFinder *p, uint32_t *distances)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700496{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600497 uint32_t offset;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700498 GET_MATCHES_HEADER(3)
499 HASH_ZIP_CALC;
500 curMatch = p->hash[hashValue];
501 p->hash[hashValue] = p->pos;
502 offset = 0;
503 GET_MATCHES_FOOTER(offset, 2)
504}
505
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600506static uint32_t Bt3_MatchFinder_GetMatches(struct CMatchFinder *p, uint32_t *distances)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700507{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600508 uint32_t hash2Value, delta2, maxLen, offset;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700509 GET_MATCHES_HEADER(3)
510
511 HASH3_CALC;
512
513 delta2 = p->pos - p->hash[hash2Value];
514 curMatch = p->hash[kFix3HashSize + hashValue];
Kyösti Mälkkiecd84242013-09-13 07:57:49 +0300515
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700516 p->hash[hash2Value] =
517 p->hash[kFix3HashSize + hashValue] = p->pos;
518
519
520 maxLen = 2;
521 offset = 0;
522 if (delta2 < p->cyclicBufferSize && *(cur - delta2) == *cur)
523 {
524 for (; maxLen != lenLimit; maxLen++)
525 if (cur[(ptrdiff_t)maxLen - delta2] != cur[maxLen])
526 break;
527 distances[0] = maxLen;
528 distances[1] = delta2 - 1;
529 offset = 2;
530 if (maxLen == lenLimit)
531 {
532 SkipMatchesSpec(lenLimit, curMatch, MF_PARAMS(p));
533 MOVE_POS_RET;
534 }
535 }
536 GET_MATCHES_FOOTER(offset, maxLen)
537}
538
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600539static uint32_t Bt4_MatchFinder_GetMatches(struct CMatchFinder *p, uint32_t *distances)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700540{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600541 uint32_t hash2Value, hash3Value, delta2, delta3, maxLen, offset;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700542 GET_MATCHES_HEADER(4)
543
544 HASH4_CALC;
545
546 delta2 = p->pos - p->hash[ hash2Value];
547 delta3 = p->pos - p->hash[kFix3HashSize + hash3Value];
548 curMatch = p->hash[kFix4HashSize + hashValue];
Kyösti Mälkkiecd84242013-09-13 07:57:49 +0300549
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700550 p->hash[ hash2Value] =
551 p->hash[kFix3HashSize + hash3Value] =
552 p->hash[kFix4HashSize + hashValue] = p->pos;
553
554 maxLen = 1;
555 offset = 0;
556 if (delta2 < p->cyclicBufferSize && *(cur - delta2) == *cur)
557 {
558 distances[0] = maxLen = 2;
559 distances[1] = delta2 - 1;
560 offset = 2;
561 }
562 if (delta2 != delta3 && delta3 < p->cyclicBufferSize && *(cur - delta3) == *cur)
563 {
564 maxLen = 3;
565 distances[offset + 1] = delta3 - 1;
566 offset += 2;
567 delta2 = delta3;
568 }
569 if (offset != 0)
570 {
571 for (; maxLen != lenLimit; maxLen++)
572 if (cur[(ptrdiff_t)maxLen - delta2] != cur[maxLen])
573 break;
574 distances[offset - 2] = maxLen;
575 if (maxLen == lenLimit)
576 {
577 SkipMatchesSpec(lenLimit, curMatch, MF_PARAMS(p));
578 MOVE_POS_RET;
579 }
580 }
581 if (maxLen < 3)
582 maxLen = 3;
583 GET_MATCHES_FOOTER(offset, maxLen)
584}
585
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600586static uint32_t Hc4_MatchFinder_GetMatches(struct CMatchFinder *p, uint32_t *distances)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700587{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600588 uint32_t hash2Value, hash3Value, delta2, delta3, maxLen, offset;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700589 GET_MATCHES_HEADER(4)
590
591 HASH4_CALC;
592
593 delta2 = p->pos - p->hash[ hash2Value];
594 delta3 = p->pos - p->hash[kFix3HashSize + hash3Value];
595 curMatch = p->hash[kFix4HashSize + hashValue];
596
597 p->hash[ hash2Value] =
598 p->hash[kFix3HashSize + hash3Value] =
599 p->hash[kFix4HashSize + hashValue] = p->pos;
600
601 maxLen = 1;
602 offset = 0;
603 if (delta2 < p->cyclicBufferSize && *(cur - delta2) == *cur)
604 {
605 distances[0] = maxLen = 2;
606 distances[1] = delta2 - 1;
607 offset = 2;
608 }
609 if (delta2 != delta3 && delta3 < p->cyclicBufferSize && *(cur - delta3) == *cur)
610 {
611 maxLen = 3;
612 distances[offset + 1] = delta3 - 1;
613 offset += 2;
614 delta2 = delta3;
615 }
616 if (offset != 0)
617 {
618 for (; maxLen != lenLimit; maxLen++)
619 if (cur[(ptrdiff_t)maxLen - delta2] != cur[maxLen])
620 break;
621 distances[offset - 2] = maxLen;
622 if (maxLen == lenLimit)
623 {
624 p->son[p->cyclicBufferPos] = curMatch;
625 MOVE_POS_RET;
626 }
627 }
628 if (maxLen < 3)
629 maxLen = 3;
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600630 offset = (uint32_t)(Hc_GetMatchesSpec(lenLimit, curMatch, MF_PARAMS(p),
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700631 distances + offset, maxLen) - (distances));
632 MOVE_POS_RET
633}
634
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600635uint32_t Hc3Zip_MatchFinder_GetMatches(struct CMatchFinder *p, uint32_t *distances)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700636{
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600637 uint32_t offset;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700638 GET_MATCHES_HEADER(3)
639 HASH_ZIP_CALC;
640 curMatch = p->hash[hashValue];
641 p->hash[hashValue] = p->pos;
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600642 offset = (uint32_t)(Hc_GetMatchesSpec(lenLimit, curMatch, MF_PARAMS(p),
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700643 distances, 2) - (distances));
644 MOVE_POS_RET
645}
646
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600647static void Bt2_MatchFinder_Skip(struct CMatchFinder *p, uint32_t num)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700648{
649 do
650 {
651 SKIP_HEADER(2)
652 HASH2_CALC;
653 curMatch = p->hash[hashValue];
654 p->hash[hashValue] = p->pos;
655 SKIP_FOOTER
656 }
657 while (--num != 0);
658}
659
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600660void Bt3Zip_MatchFinder_Skip(struct CMatchFinder *p, uint32_t num)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700661{
662 do
663 {
664 SKIP_HEADER(3)
665 HASH_ZIP_CALC;
666 curMatch = p->hash[hashValue];
667 p->hash[hashValue] = p->pos;
668 SKIP_FOOTER
669 }
670 while (--num != 0);
671}
672
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600673static void Bt3_MatchFinder_Skip(struct CMatchFinder *p, uint32_t num)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700674{
675 do
676 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600677 uint32_t hash2Value;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700678 SKIP_HEADER(3)
679 HASH3_CALC;
680 curMatch = p->hash[kFix3HashSize + hashValue];
681 p->hash[hash2Value] =
682 p->hash[kFix3HashSize + hashValue] = p->pos;
683 SKIP_FOOTER
684 }
685 while (--num != 0);
686}
687
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600688static void Bt4_MatchFinder_Skip(struct CMatchFinder *p, uint32_t num)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700689{
690 do
691 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600692 uint32_t hash2Value, hash3Value;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700693 SKIP_HEADER(4)
694 HASH4_CALC;
695 curMatch = p->hash[kFix4HashSize + hashValue];
696 p->hash[ hash2Value] =
697 p->hash[kFix3HashSize + hash3Value] = p->pos;
698 p->hash[kFix4HashSize + hashValue] = p->pos;
699 SKIP_FOOTER
700 }
701 while (--num != 0);
702}
703
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600704static void Hc4_MatchFinder_Skip(struct CMatchFinder *p, uint32_t num)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700705{
706 do
707 {
Alexandru Gagniuc91e9f272014-01-26 22:55:01 -0600708 uint32_t hash2Value, hash3Value;
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700709 SKIP_HEADER(4)
710 HASH4_CALC;
711 curMatch = p->hash[kFix4HashSize + hashValue];
712 p->hash[ hash2Value] =
713 p->hash[kFix3HashSize + hash3Value] =
714 p->hash[kFix4HashSize + hashValue] = p->pos;
715 p->son[p->cyclicBufferPos] = curMatch;
716 MOVE_POS
717 }
718 while (--num != 0);
719}
720
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600721void Hc3Zip_MatchFinder_Skip(struct CMatchFinder *p, uint32_t num)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700722{
723 do
724 {
725 SKIP_HEADER(3)
726 HASH_ZIP_CALC;
727 curMatch = p->hash[hashValue];
728 p->hash[hashValue] = p->pos;
729 p->son[p->cyclicBufferPos] = curMatch;
730 MOVE_POS
731 }
732 while (--num != 0);
733}
734
Alexandru Gagniuc9ad52fe2014-01-27 20:57:54 -0600735void MatchFinder_CreateVTable(struct CMatchFinder *p, struct IMatchFinder *vTable)
Stefan Reinauer2e200cd2012-10-30 14:02:45 -0700736{
737 vTable->Init = (Mf_Init_Func)MatchFinder_Init;
738 vTable->GetIndexByte = (Mf_GetIndexByte_Func)MatchFinder_GetIndexByte;
739 vTable->GetNumAvailableBytes = (Mf_GetNumAvailableBytes_Func)MatchFinder_GetNumAvailableBytes;
740 vTable->GetPointerToCurrentPos = (Mf_GetPointerToCurrentPos_Func)MatchFinder_GetPointerToCurrentPos;
741 if (!p->btMode)
742 {
743 vTable->GetMatches = (Mf_GetMatches_Func)Hc4_MatchFinder_GetMatches;
744 vTable->Skip = (Mf_Skip_Func)Hc4_MatchFinder_Skip;
745 }
746 else if (p->numHashBytes == 2)
747 {
748 vTable->GetMatches = (Mf_GetMatches_Func)Bt2_MatchFinder_GetMatches;
749 vTable->Skip = (Mf_Skip_Func)Bt2_MatchFinder_Skip;
750 }
751 else if (p->numHashBytes == 3)
752 {
753 vTable->GetMatches = (Mf_GetMatches_Func)Bt3_MatchFinder_GetMatches;
754 vTable->Skip = (Mf_Skip_Func)Bt3_MatchFinder_Skip;
755 }
756 else
757 {
758 vTable->GetMatches = (Mf_GetMatches_Func)Bt4_MatchFinder_GetMatches;
759 vTable->Skip = (Mf_Skip_Func)Bt4_MatchFinder_Skip;
760 }
761}