xref: /freebsd/contrib/libarchive/libarchive/archive_ppmd7.c (revision 2e113ef82465598b8c26e0ca415fbe90677fbd47)
1 /* Ppmd7.c -- PPMdH codec
2 2010-03-12 : Igor Pavlov : Public domain
3 This code is based on PPMd var.H (2001): Dmitry Shkarin : Public domain */
4 
5 #include "archive_platform.h"
6 
7 #include <stdlib.h>
8 
9 #include "archive_ppmd7_private.h"
10 
/*
 * Accessors that turn a stored reference into a usable pointer.
 * When PPMD_32BIT is defined a reference is used as-is (it already is a
 * pointer); otherwise a reference is a byte offset that is added to
 * p->Base.
 */
#ifdef PPMD_32BIT
  #define Ppmd7_GetPtr(p, ptr) (ptr)
  #define Ppmd7_GetContext(p, ptr) (ptr)
  #define Ppmd7_GetStats(p, ctx) ((ctx)->Stats)
#else
  #define Ppmd7_GetPtr(p, offs) ((void *)((p)->Base + (offs)))
  #define Ppmd7_GetContext(p, offs) ((CPpmd7_Context *)Ppmd7_GetPtr((p), (offs)))
  #define Ppmd7_GetStats(p, ctx) ((CPpmd_State *)Ppmd7_GetPtr((p), ((ctx)->Stats)))
#endif

/*
 * Address of the BinSumm entry used while p->MinContext holds a single
 * state.  The row is that state's Freq - 1.  The column is the sum of
 * p->PrevSuccess, the NS2BSIndx entry for the suffix context's NumStats,
 * the HB2Flag of p->FoundState's symbol, twice the HB2Flag of the single
 * state's symbol, and 0x20 when bit 31 of p->RunLength is set
 * ((RunLength >> 26) & 0x20).
 *
 * Side effect: p->HiBitsFlag is assigned inside the expression.
 * The argument is not parenthesised, so pass a plain identifier.
 */
#define Ppmd7_GetBinSumm(p) \
    &p->BinSumm[Ppmd7Context_OneState(p->MinContext)->Freq - 1][p->PrevSuccess + \
    p->NS2BSIndx[Ppmd7_GetContext(p, p->MinContext->Suffix)->NumStats - 1] + \
    (p->HiBitsFlag = p->HB2Flag[p->FoundState->Symbol]) + \
    2 * p->HB2Flag[Ppmd7Context_OneState(p->MinContext)->Symbol] + \
    ((p->RunLength >> 26) & 0x20)]
27 
/* Threshold compared against in the range coder's normalisation loops. */
#define kTopValue (1 << 24)
/* A state's Freq exceeding this value triggers Rescale(). */
#define MAX_FREQ 124
/* Size in bytes of one allocation unit of the model arena. */
#define UNIT_SIZE 12

/* Unit count -> byte count. */
#define U2B(nu) ((UInt32)(nu) * UNIT_SIZE)
/* Unit count -> free-list index; requires a CPpmd7 pointer named `p` in scope. */
#define U2I(nu) (p->Units2Indx[(nu) - 1])
/* Free-list index -> unit count; requires a CPpmd7 pointer named `p` in scope. */
#define I2U(indx) (p->Indx2Units[indx])

/*
 * Pointer -> stored reference.  With PPMD_32BIT the pointer itself is the
 * reference; otherwise it is the byte distance from p->Base truncated to
 * UInt32.
 */
#ifdef PPMD_32BIT
  #define REF(ptr) (ptr)
#else
  #define REF(ptr) ((UInt32)((Byte *)(ptr) - (p)->Base))
#endif

#define STATS_REF(ptr) ((CPpmd_State_Ref)REF(ptr))

/* Shorthands that all rely on a CPpmd7 pointer named `p` being in scope. */
#define CTX(ref) ((CPpmd7_Context *)Ppmd7_GetContext(p, ref))
#define STATS(ctx) Ppmd7_GetStats(p, ctx)
#define ONE_STATE(ctx) Ppmd7Context_OneState(ctx)
#define SUFFIX(ctx) CTX((ctx)->Suffix)
48 
/* Per-column seeds; RestartModel() stores PPMD_BIN_SCALE - kInitBinEsc[k] / (i + 2) into BinSumm. */
static const UInt16 kInitBinEsc[] = { 0x3CDD, 0x1F3F, 0x59BF, 0x48F3, 0x64A1, 0x5ABC, 0x6632, 0x6051};
/* Indexed by (*prob >> 10) after a binary-context escape to obtain p->InitEsc. */
static const Byte PPMD7_kExpEscape[16] = { 25, 14, 9, 7, 5, 5, 4, 4, 4, 3, 3, 3, 2, 2, 2, 2 };
51 
typedef CPpmd7_Context * CTX_PTR;

struct CPpmd7_Node_;

/* Reference to a free-block node: a pointer with PPMD_32BIT, else a UInt32 offset from p->Base. */
typedef
  #ifdef PPMD_32BIT
    struct CPpmd7_Node_ *
  #else
    UInt32
  #endif
  CPpmd7_Node_Ref;

/*
 * Header overlaid on a free block while GlueFreeBlocks() links the free
 * blocks into a doubly-linked list.
 */
typedef struct CPpmd7_Node_
{
  UInt16 Stamp; /* must be at offset 0 as CPpmd7_Context::NumStats. Stamp=0 means free */
  UInt16 NU;    /* size of the block in units */
  CPpmd7_Node_Ref Next; /* must be at offset >= 4 */
  CPpmd7_Node_Ref Prev;
} CPpmd7_Node;

/* Node reference -> node pointer; the offset form requires `p` in scope. */
#ifdef PPMD_32BIT
  #define NODE(ptr) (ptr)
#else
  #define NODE(offs) ((CPpmd7_Node *)(p->Base + (offs)))
#endif
77 
/*
 * Forward declarations for functions defined further down in this file.
 * Note: the third parameter of Ppmd7_MakeEscFreq is called `scale` here
 * and `escFreq` in the definition; both name the same output value.
 */
static void Ppmd7_Update1(CPpmd7 *p);
static void Ppmd7_Update1_0(CPpmd7 *p);
static void Ppmd7_Update2(CPpmd7 *p);
static void Ppmd7_UpdateBin(CPpmd7 *p);
static CPpmd_See *Ppmd7_MakeEscFreq(CPpmd7 *p, unsigned numMasked,
                                    UInt32 *scale);
84 
85 /* ----------- Base ----------- */
86 
/*
 * Ppmd7_Construct -- fill the constant lookup tables held in *p.
 *
 * No arena is allocated here; p->Base is cleared so that a later
 * Ppmd7_Alloc() knows there is nothing to reuse.  The tables written are
 * Units2Indx, Indx2Units, NS2BSIndx, NS2Indx and HB2Flag.
 */
static void Ppmd7_Construct(CPpmd7 *p)
{
  unsigned idx, units, level, run;

  p->Base = 0;

  /* Size classes 0..3 grow by 1 unit each, 4..7 by 2, 8..11 by 3,
     every later class by 4. */
  units = 0;
  for (idx = 0; idx < PPMD_NUM_INDEXES; idx++)
  {
    unsigned span = (idx >= 12) ? 4 : (idx >> 2) + 1;
    while (span-- != 0)
      p->Units2Indx[units++] = (Byte)idx;
    p->Indx2Units[idx] = (Byte)units;
  }

  /* NS2BSIndx: entry 0 -> 0, entry 1 -> 2, entries 2..10 -> 4, rest -> 6. */
  p->NS2BSIndx[0] = 0;
  p->NS2BSIndx[1] = 2;
  memset(&p->NS2BSIndx[2], 4, 9);
  memset(&p->NS2BSIndx[11], 6, 256 - 11);

  /* NS2Indx: identity for 0..2, afterwards runs of length 1, 2, 3, ...
     each mapped to the next value. */
  for (idx = 0; idx < 3; idx++)
    p->NS2Indx[idx] = (Byte)idx;
  level = 3;
  run = 1;
  while (idx < 256)
  {
    p->NS2Indx[idx++] = (Byte)level;
    run--;
    if (run == 0)
    {
      level++;
      run = level - 2;
    }
  }

  /* HB2Flag: 0 for symbols below 0x40, 8 for the rest. */
  memset(&p->HB2Flag[0], 0, 0x40);
  memset(&p->HB2Flag[0x40], 8, 0x100 - 0x40);
}
117 
/*
 * Ppmd7_Free -- release the model arena and mark *p as owning none.
 * Safe to call when p->Base is already 0 (free(NULL) is a no-op).
 */
static void Ppmd7_Free(CPpmd7 *p)
{
  free(p->Base);
  p->Base = 0;
  p->Size = 0;
}
124 
Ppmd7_Alloc(CPpmd7 * p,UInt32 size)125 static Bool Ppmd7_Alloc(CPpmd7 *p, UInt32 size)
126 {
127   if (p->Base == 0 || p->Size != size)
128   {
129     /* RestartModel() below assumes that p->Size >= UNIT_SIZE
130        (see the calculation of m->MinContext). */
131     if (size < UNIT_SIZE) {
132       return False;
133     }
134     Ppmd7_Free(p);
135     p->AlignOffset =
136       #ifdef PPMD_32BIT
137         (4 - size) & 3;
138       #else
139         4 - (size & 3);
140       #endif
141     if ((p->Base = malloc(p->AlignOffset + size
142         #ifndef PPMD_32BIT
143         + UNIT_SIZE
144         #endif
145         )) == 0)
146       return False;
147     p->Size = size;
148   }
149   return True;
150 }
151 
/*
 * InsertNode -- push the block at `node` onto free list `indx`.
 * The first bytes of the block are overwritten with the previous list
 * head, and the list head becomes a reference to the block.
 */
static void InsertNode(CPpmd7 *p, void *node, unsigned indx)
{
  CPpmd_Void_Ref *link = (CPpmd_Void_Ref *)node;

  *link = p->FreeList[indx];
  p->FreeList[indx] = REF(node);
}
157 
/*
 * RemoveNode -- pop and return the first block of free list `indx`.
 * The caller must have checked that the list is not empty; no check is
 * made here.
 */
static void *RemoveNode(CPpmd7 *p, unsigned indx)
{
  CPpmd_Void_Ref *first = (CPpmd_Void_Ref *)Ppmd7_GetPtr(p, p->FreeList[indx]);
  CPpmd_Void_Ref following = *first;

  p->FreeList[indx] = following;
  return first;
}
164 
/*
 * SplitBlock -- keep the first I2U(newIndx) units of the block at `ptr`
 * (whose size class is oldIndx) and return the rest to the free lists.
 *
 * When the leftover unit count is not itself an exact size class, it is
 * filed as two pieces: the largest smaller class at the front, and the
 * remaining units behind it.
 */
static void SplitBlock(CPpmd7 *p, void *ptr, unsigned oldIndx, unsigned newIndx)
{
  unsigned keepUnits = I2U(newIndx);
  unsigned spare = I2U(oldIndx) - keepUnits;
  Byte *tail = (Byte *)ptr + U2B(keepUnits);
  unsigned cls = U2I(spare);

  if (I2U(cls) != spare)
  {
    unsigned lower;

    cls--;
    lower = I2U(cls);
    /* the (spare - lower) trailing units go to list spare - lower - 1 */
    InsertNode(p, tail + U2B(lower), spare - lower - 1);
  }
  InsertNode(p, tail, cls);
}
176 
/*
 * GlueFreeBlocks -- merge physically adjacent free blocks and rebuild the
 * free lists from the merged result.
 *
 * Works in three passes (marked below): thread every free block onto one
 * doubly-linked list, merge each block with the free blocks that follow
 * it in memory, then re-file the merged blocks.  Also resets
 * p->GlueCount to 255.
 *
 * The list is anchored by a sentinel `head`.  With PPMD_32BIT it is a
 * local node; otherwise it is the offset AlignOffset + Size, i.e. the
 * spare unit that Ppmd7_Alloc() allocates past the end of the arena.
 */
static void GlueFreeBlocks(CPpmd7 *p)
{
  #ifdef PPMD_32BIT
  CPpmd7_Node headItem;
  CPpmd7_Node_Ref head = &headItem;
  #else
  CPpmd7_Node_Ref head = p->AlignOffset + p->Size;
  #endif

  CPpmd7_Node_Ref n = head;
  unsigned i;

  p->GlueCount = 255;

  /* create doubly-linked list of free blocks */
  for (i = 0; i < PPMD_NUM_INDEXES; i++)
  {
    UInt16 nu = I2U(i);
    CPpmd7_Node_Ref next = (CPpmd7_Node_Ref)p->FreeList[i];
    p->FreeList[i] = 0;
    while (next != 0)
    {
      CPpmd7_Node *node = NODE(next);
      node->Next = n;
      n = NODE(n)->Prev = next;
      /* the free-list link lives at offset 0 of the block; read it
         before Stamp/NU overwrite those bytes */
      next = *(const CPpmd7_Node_Ref *)node;
      node->Stamp = 0;
      node->NU = (UInt16)nu;
    }
  }
  /* close the ring through the sentinel; a non-zero Stamp stops merging */
  NODE(head)->Stamp = 1;
  NODE(head)->Next = n;
  NODE(n)->Prev = head;
  /* mark the start of the LoUnit..HiUnit gap as not free so that merging
     does not run into it */
  if (p->LoUnit != p->HiUnit)
    ((CPpmd7_Node *)p->LoUnit)->Stamp = 1;

  /* Glue free blocks */
  while (n != head)
  {
    CPpmd7_Node *node = NODE(n);
    UInt32 nu = (UInt32)node->NU;
    for (;;)
    {
      /* node2 is whatever starts right after the current (merged) block;
         the pointer arithmetic advances in units of sizeof(CPpmd7_Node) */
      CPpmd7_Node *node2 = NODE(n) + nu;
      nu += node2->NU;
      /* stop at a non-free neighbour, or when the merged size would no
         longer fit the 16-bit NU field */
      if (node2->Stamp != 0 || nu >= 0x10000)
        break;
      /* unlink the neighbour and absorb it */
      NODE(node2->Prev)->Next = node2->Next;
      NODE(node2->Next)->Prev = node2->Prev;
      node->NU = (UInt16)nu;
    }
    n = node->Next;
  }

  /* Fill lists of free blocks */
  for (n = NODE(head)->Next; n != head;)
  {
    CPpmd7_Node *node = NODE(n);
    unsigned nu;
    /* saved first: InsertNode() overwrites the start of the node */
    CPpmd7_Node_Ref next = node->Next;
    /* cut off 128-unit pieces for the last list while more than 128
       units remain */
    for (nu = node->NU; nu > 128; nu -= 128, node += 128)
      InsertNode(p, node, PPMD_NUM_INDEXES - 1);
    /* remainder that is not an exact size class is filed as two pieces */
    if (I2U(i = U2I(nu)) != nu)
    {
      unsigned k = I2U(--i);
      InsertNode(p, node + k, nu - k - 1);
    }
    InsertNode(p, node, i);
    n = next;
  }
}
248 
/*
 * AllocUnitsRare -- slow path for allocating a block of size class `indx`.
 *
 * 1. If p->GlueCount has reached 0, merge free blocks and retry the exact
 *    list.
 * 2. Otherwise take the first non-empty larger list, split the block and
 *    return its front part.
 * 3. If no larger block exists, decrement p->GlueCount and carve the
 *    block from below p->UnitsStart, provided more than the requested
 *    byte count lies between p->Text and p->UnitsStart.
 *
 * Returns NULL when nothing can be allocated.
 */
static void *AllocUnitsRare(CPpmd7 *p, unsigned indx)
{
  unsigned donor;

  if (p->GlueCount == 0)
  {
    GlueFreeBlocks(p);
    if (p->FreeList[indx] != 0)
      return RemoveNode(p, indx);
  }

  for (donor = indx + 1; donor != PPMD_NUM_INDEXES; donor++)
  {
    if (p->FreeList[donor] != 0)
    {
      void *block = RemoveNode(p, donor);
      SplitBlock(p, block, donor, indx);
      return block;
    }
  }

  /* no larger free block: fall back to the space above the text */
  {
    UInt32 numBytes = U2B(I2U(indx));

    p->GlueCount--;
    if ((UInt32)(p->UnitsStart - p->Text) > numBytes)
    {
      p->UnitsStart -= numBytes;
      return p->UnitsStart;
    }
    return NULL;
  }
}
274 
/*
 * AllocUnits -- allocate a block of size class `indx`.
 * Order of preference: the matching free list, then the untouched gap
 * between p->LoUnit and p->HiUnit, then AllocUnitsRare().
 * May return NULL (only via AllocUnitsRare()).
 */
static void *AllocUnits(CPpmd7 *p, unsigned indx)
{
  if (p->FreeList[indx] == 0)
  {
    UInt32 need = U2B(I2U(indx));

    if ((UInt32)(p->HiUnit - p->LoUnit) < need)
      return AllocUnitsRare(p, indx);
    {
      void *fresh = p->LoUnit;
      p->LoUnit += need;
      return fresh;
    }
  }
  return RemoveNode(p, indx);
}
289 
/*
 * MyMem12Cpy -- copy `num` blocks of three UInt32 words each from src to
 * dest.  The body runs at least once, so `num` must not be 0.
 * The macro declares locals named d, s and n; arguments are not
 * parenthesised and must not use those names.
 */
#define MyMem12Cpy(dest, src, num) do {					\
	UInt32 *d = (UInt32 *)dest;					\
	const UInt32 *s = (const UInt32 *)src;				\
	UInt32 n = num;							\
	do {								\
		d[0] = s[0]; d[1] = s[1]; d[2] = s[2]; s += 3; d += 3;	\
	} while(--n);							\
} while (0)
298 
/*
 * ShrinkUnits -- reduce a block from oldNU to newNU units.
 *
 * If both counts fall in the same size class nothing happens.  If a free
 * block of the smaller class exists, the first newNU units are copied
 * into it and the old block is freed.  Otherwise the old block is split
 * in place.  Returns the address where the data now lives.
 */
static void *ShrinkUnits(CPpmd7 *p, void *oldPtr, unsigned oldNU, unsigned newNU)
{
  unsigned oldClass = U2I(oldNU);
  unsigned newClass = U2I(newNU);
  void *moved;

  if (oldClass == newClass)
    return oldPtr;

  if (p->FreeList[newClass] == 0)
  {
    SplitBlock(p, oldPtr, oldClass, newClass);
    return oldPtr;
  }

  moved = RemoveNode(p, newClass);
  MyMem12Cpy(moved, oldPtr, newNU);
  InsertNode(p, oldPtr, oldClass);
  return moved;
}
315 
316 #define SUCCESSOR(p) ((CPpmd_Void_Ref)((p)->SuccessorLow | ((UInt32)(p)->SuccessorHigh << 16)))
317 
SetSuccessor(CPpmd_State * p,CPpmd_Void_Ref v)318 static void SetSuccessor(CPpmd_State *p, CPpmd_Void_Ref v)
319 {
320   (p)->SuccessorLow = (UInt16)((UInt32)(v) & 0xFFFF);
321   (p)->SuccessorHigh = (UInt16)(((UInt32)(v) >> 16) & 0xFFFF);
322 }
323 
/*
 * RestartModel -- reset the model to its initial state inside the
 * already allocated arena.
 *
 * Empties the free lists, re-derives the arena pointers, creates the
 * root context with 256 states of frequency 1, and re-seeds the BinSumm
 * and See tables.  p->MaxOrder must have been set beforehand.
 */
static void RestartModel(CPpmd7 *p)
{
  unsigned row, col, step, sym;
  Int32 cappedOrder;
  CTX_PTR root;
  CPpmd_State *table;

  memset(p->FreeList, 0, sizeof(p->FreeList));

  /* arena layout: text grows up from Text, units live in the top part */
  p->Text = p->Base + p->AlignOffset;
  p->HiUnit = p->Text + p->Size;
  p->UnitsStart = p->HiUnit - p->Size / 8 / UNIT_SIZE * 7 * UNIT_SIZE;
  p->LoUnit = p->UnitsStart;
  p->GlueCount = 0;

  p->OrderFall = p->MaxOrder;
  cappedOrder = (Int32)((p->MaxOrder < 12) ? p->MaxOrder : 12);
  p->InitRL = -cappedOrder - 1;
  p->RunLength = p->InitRL;
  p->PrevSuccess = 0;

  /* root context: one unit taken from the top of the arena */
  p->HiUnit -= UNIT_SIZE;
  root = (CTX_PTR)p->HiUnit;
  p->MaxContext = root;
  p->MinContext = root;
  root->Suffix = 0;
  root->NumStats = 256;
  root->SummFreq = 256 + 1;

  /* its 256 states: 128 units taken from the bottom of the unit area */
  table = (CPpmd_State *)p->LoUnit;
  p->FoundState = table;
  p->LoUnit += U2B(256 / 2);
  root->Stats = REF(table);
  for (sym = 0; sym < 256; sym++)
  {
    table[sym].Symbol = (Byte)sym;
    table[sym].Freq = 1;
    SetSuccessor(&table[sym], 0);
  }

  /* every 8th entry of a BinSumm row shares the same seed */
  for (row = 0; row < 128; row++)
  {
    for (col = 0; col < 8; col++)
    {
      UInt16 seed = (UInt16)(PPMD_BIN_SCALE - kInitBinEsc[col] / (row + 2));
      for (step = 0; step < 64; step += 8)
        p->BinSumm[row][col + step] = seed;
    }
  }

  for (row = 0; row < 25; row++)
  {
    for (col = 0; col < 16; col++)
    {
      CPpmd_See *see = &p->See[row][col];
      see->Shift = PPMD_PERIOD_BITS - 4;
      see->Summ = (UInt16)((5 * row + 10) << see->Shift);
      see->Count = 4;
    }
  }
}
370 
/*
 * Ppmd7_Init -- start a fresh model of order `maxOrder`.
 * The arena must already have been allocated, since RestartModel()
 * writes into it.
 */
static void Ppmd7_Init(CPpmd7 *p, unsigned maxOrder)
{
  p->MaxOrder = maxOrder;
  RestartModel(p);

  /* DummySee is what Ppmd7_MakeEscFreq() hands out for a 256-state context */
  p->DummySee.Summ = 0; /* unused */
  p->DummySee.Count = 64; /* unused */
  p->DummySee.Shift = PPMD_PERIOD_BITS;
}
379 
/*
 * CreateSuccessors -- build the chain of single-state child contexts that
 * follows p->FoundState.
 *
 * Starting at p->MinContext the suffix chain is walked.  In every suffix
 * context the state for FoundState's symbol is looked up; as long as its
 * successor equals FoundState's own successor (upBranch) the state is
 * remembered in ps[].  The walk ends at the first state whose successor
 * differs (that successor becomes the base context) or at the end of the
 * chain.  When `skip` is False, p->FoundState itself is remembered first.
 *
 * Afterwards one new context per remembered state is created, each
 * holding the single state `upState` and linked through Suffix to the
 * context created before it.
 *
 * Returns the last context created (or the base context if nothing had
 * to be created), or NULL when AllocUnitsRare() fails.
 */
static CTX_PTR CreateSuccessors(CPpmd7 *p, Bool skip)
{
  CPpmd_State upState;
  CTX_PTR c = p->MinContext;
  CPpmd_Byte_Ref upBranch = (CPpmd_Byte_Ref)SUCCESSOR(p->FoundState);
  CPpmd_State *ps[PPMD7_MAX_ORDER];
  unsigned numPs = 0;

  if (!skip)
    ps[numPs++] = p->FoundState;

  while (c->Suffix)
  {
    CPpmd_Void_Ref successor;
    CPpmd_State *s;
    c = SUFFIX(c);
    if (c->NumStats != 1)
    {
      /* linear search; the symbol is expected to be present (no bound check) */
      for (s = STATS(c); s->Symbol != p->FoundState->Symbol; s++);
    }
    else
      s = ONE_STATE(c);
    successor = SUCCESSOR(s);
    if (successor != upBranch)
    {
      c = CTX(successor);
      if (numPs == 0)
        return c;
      break;
    }
    ps[numPs++] = s;
  }

  /* the new contexts' single state: symbol is the byte upBranch refers
     to, successor is the position right after it */
  upState.Symbol = *(const Byte *)Ppmd7_GetPtr(p, upBranch);
  SetSuccessor(&upState, upBranch + 1);

  if (c->NumStats == 1)
    upState.Freq = ONE_STATE(c)->Freq;
  else
  {
    UInt32 cf, s0;
    CPpmd_State *s;
    for (s = STATS(c); s->Symbol != upState.Symbol; s++);
    /* initial frequency derived from the symbol's share in context c */
    cf = s->Freq - 1;
    s0 = c->SummFreq - c->NumStats - cf;
    upState.Freq = (Byte)(1 + ((2 * cf <= s0) ? (5 * cf > s0) : ((2 * cf + 3 * s0 - 1) / (2 * s0))));
  }

  while (numPs != 0)
  {
    /* Create Child */
    CTX_PTR c1; /* = AllocContext(p); */
    if (p->HiUnit != p->LoUnit)
      c1 = (CTX_PTR)(p->HiUnit -= UNIT_SIZE);
    else if (p->FreeList[0] != 0)
      c1 = (CTX_PTR)RemoveNode(p, 0);
    else
    {
      c1 = (CTX_PTR)AllocUnitsRare(p, 0);
      if (!c1)
        return NULL;
    }
    c1->NumStats = 1;
    *ONE_STATE(c1) = upState;
    c1->Suffix = REF(c);
    /* the remembered state now leads to the new context */
    SetSuccessor(ps[--numPs], REF(c1));
    c = c1;
  }

  return c;
}
451 
/* SwapStates -- exchange the contents of the two states. */
static void SwapStates(CPpmd_State *t1, CPpmd_State *t2)
{
  CPpmd_State held = *t2;

  *t2 = *t1;
  *t1 = held;
}
458 
/*
 * UpdateModel -- update the context tree after p->FoundState has been
 * coded in p->MinContext.
 *
 * Steps, in order:
 *  1. If FoundState's frequency is small and MinContext has a suffix,
 *     bump the same symbol's frequency in the suffix context.
 *  2. If p->OrderFall is 0, only create successors and move on.
 *  3. Append the symbol to the text area; restart the model if the text
 *     would reach p->UnitsStart.
 *  4. Work out `successor` (what new states will point at) and
 *     `fSuccessor` (the context to continue in).
 *  5. Add a state for the symbol to every context from p->MaxContext
 *     down to, but excluding, p->MinContext.
 *  6. Continue in CTX(fSuccessor).
 *
 * Whenever an allocation fails the whole model is restarted via
 * RestartModel() and the function returns.
 */
static void UpdateModel(CPpmd7 *p)
{
  CPpmd_Void_Ref successor, fSuccessor = SUCCESSOR(p->FoundState);
  CTX_PTR c;
  unsigned s0, ns;

  if (p->FoundState->Freq < MAX_FREQ / 4 && p->MinContext->Suffix != 0)
  {
    c = SUFFIX(p->MinContext);

    if (c->NumStats == 1)
    {
      CPpmd_State *s = ONE_STATE(c);
      if (s->Freq < 32)
        s->Freq++;
    }
    else
    {
      CPpmd_State *s = STATS(c);
      if (s->Symbol != p->FoundState->Symbol)
      {
        do { s++; } while (s->Symbol != p->FoundState->Symbol);
        /* move the state one slot towards the front if it is at least
           as frequent as its predecessor */
        if (s[0].Freq >= s[-1].Freq)
        {
          SwapStates(&s[0], &s[-1]);
          s--;
        }
      }
      if (s->Freq < MAX_FREQ - 9)
      {
        s->Freq += 2;
        c->SummFreq += 2;
      }
    }
  }

  if (p->OrderFall == 0)
  {
    p->MinContext = p->MaxContext = CreateSuccessors(p, True);
    if (p->MinContext == 0)
    {
      RestartModel(p);
      return;
    }
    SetSuccessor(p->FoundState, REF(p->MinContext));
    return;
  }

  *p->Text++ = p->FoundState->Symbol;
  successor = REF(p->Text);
  if (p->Text >= p->UnitsStart)
  {
    RestartModel(p);
    return;
  }

  if (fSuccessor)
  {
    /* a successor not above the current text position is not yet a real
       context; build the contexts for it */
    if (fSuccessor <= successor)
    {
      CTX_PTR cs = CreateSuccessors(p, False);
      if (cs == NULL)
      {
        RestartModel(p);
        return;
      }
      fSuccessor = REF(cs);
    }
    if (--p->OrderFall == 0)
    {
      successor = fSuccessor;
      /* give the text byte back unless new states will be added below */
      p->Text -= (p->MaxContext != p->MinContext);
    }
  }
  else
  {
    SetSuccessor(p->FoundState, successor);
    fSuccessor = REF(p->MinContext);
  }

  /* s0: MinContext's SummFreq minus its state count and minus
     (FoundState->Freq - 1) */
  s0 = p->MinContext->SummFreq - (ns = p->MinContext->NumStats) - (p->FoundState->Freq - 1);

  for (c = p->MaxContext; c != p->MinContext; c = SUFFIX(c))
  {
    unsigned ns1;
    UInt32 cf, sf;
    if ((ns1 = c->NumStats) != 1)
    {
      /* an even state count means the current units are full (two
         states per unit) */
      if ((ns1 & 1) == 0)
      {
        /* Expand for one UNIT */
        unsigned oldNU = ns1 >> 1;
        unsigned i = U2I(oldNU);
        /* move only when one more unit falls into the next size class */
        if (i != U2I(oldNU + 1))
        {
          void *ptr = AllocUnits(p, i + 1);
          void *oldPtr;
          if (!ptr)
          {
            RestartModel(p);
            return;
          }
          oldPtr = STATS(c);
          MyMem12Cpy(ptr, oldPtr, oldNU);
          InsertNode(p, oldPtr, i);
          c->Stats = STATS_REF(ptr);
        }
      }
      c->SummFreq = (UInt16)(c->SummFreq + (2 * ns1 < ns) + 2 * ((4 * ns1 <= ns) & (c->SummFreq <= 8 * ns1)));
    }
    else
    {
      /* single-state context: move the embedded state into a freshly
         allocated unit so that a second state can follow it */
      CPpmd_State *s = (CPpmd_State*)AllocUnits(p, 0);
      if (!s)
      {
        RestartModel(p);
        return;
      }
      *s = *ONE_STATE(c);
      c->Stats = REF(s);
      if (s->Freq < MAX_FREQ / 4 - 1)
        s->Freq <<= 1;
      else
        s->Freq = MAX_FREQ - 4;
      c->SummFreq = (UInt16)(s->Freq + p->InitEsc + (ns > 3));
    }
    /* choose the new state's initial frequency (cf) and raise SummFreq
       accordingly */
    cf = 2 * (UInt32)p->FoundState->Freq * (c->SummFreq + 6);
    sf = (UInt32)s0 + c->SummFreq;
    if (cf < 6 * sf)
    {
      cf = 1 + (cf > sf) + (cf >= 4 * sf);
      c->SummFreq += 3;
    }
    else
    {
      cf = 4 + (cf >= 9 * sf) + (cf >= 12 * sf) + (cf >= 15 * sf);
      c->SummFreq = (UInt16)(c->SummFreq + cf);
    }
    {
      /* append the new state after the existing ns1 states */
      CPpmd_State *s = STATS(c) + ns1;
      SetSuccessor(s, successor);
      s->Symbol = p->FoundState->Symbol;
      s->Freq = (Byte)cf;
      c->NumStats = (UInt16)(ns1 + 1);
    }
  }
  p->MaxContext = p->MinContext = CTX(fSuccessor);
}
607 
/*
 * Rescale -- halve the frequencies of all states in p->MinContext.
 *
 * p->FoundState is first moved to the front of the state array.  Every
 * frequency is then replaced by (Freq + adder) >> 1, where adder is 1
 * unless p->OrderFall is 0, and the array is kept sorted by descending
 * frequency.  States whose frequency dropped to 0 are removed from the
 * tail.  If only one state is left the context becomes a single-state
 * context and the state array is freed.  Otherwise the array is shrunk
 * when fewer units are needed and SummFreq is recomputed.
 *
 * On return p->FoundState points at the first state (or at the embedded
 * single state).
 */
static void Rescale(CPpmd7 *p)
{
  unsigned i, adder, sumFreq, escFreq;
  CPpmd_State *stats = STATS(p->MinContext);
  CPpmd_State *s = p->FoundState;
  {
    /* rotate FoundState to the front */
    CPpmd_State tmp = *s;
    for (; s != stats; s--)
      s[0] = s[-1];
    *s = tmp;
  }
  /* escFreq starts as SummFreq minus all state frequencies (the rest are
     subtracted in the loop below) */
  escFreq = p->MinContext->SummFreq - s->Freq;
  s->Freq += 4;
  adder = (p->OrderFall != 0);
  s->Freq = (Byte)((s->Freq + adder) >> 1);
  sumFreq = s->Freq;

  i = p->MinContext->NumStats - 1;
  do
  {
    escFreq -= (++s)->Freq;
    s->Freq = (Byte)((s->Freq + adder) >> 1);
    sumFreq += s->Freq;
    /* insertion step: keep the array ordered by descending frequency */
    if (s[0].Freq > s[-1].Freq)
    {
      CPpmd_State *s1 = s;
      CPpmd_State tmp = *s1;
      do
        s1[0] = s1[-1];
      while (--s1 != stats && tmp.Freq > s1[-1].Freq);
      *s1 = tmp;
    }
  }
  while (--i);

  /* i is 0 here; s is the last state */
  if (s->Freq == 0)
  {
    unsigned numStats = p->MinContext->NumStats;
    unsigned n0, n1;
    /* count the trailing zero-frequency states */
    do { i++; } while ((--s)->Freq == 0);
    escFreq += i;
    p->MinContext->NumStats = (UInt16)(p->MinContext->NumStats - i);
    if (p->MinContext->NumStats == 1)
    {
      CPpmd_State tmp = *stats;
      do
      {
        tmp.Freq = (Byte)(tmp.Freq - (tmp.Freq >> 1));
        escFreq >>= 1;
      }
      while (escFreq > 1);
      /* free the array and keep the survivor inside the context */
      InsertNode(p, stats, U2I(((numStats + 1) >> 1)));
      *(p->FoundState = ONE_STATE(p->MinContext)) = tmp;
      return;
    }
    /* unit counts before and after (two states per unit) */
    n0 = (numStats + 1) >> 1;
    n1 = (p->MinContext->NumStats + 1) >> 1;
    if (n0 != n1)
      p->MinContext->Stats = STATS_REF(ShrinkUnits(p, stats, n0, n1));
  }
  p->MinContext->SummFreq = (UInt16)(sumFreq + escFreq - (escFreq >> 1));
  p->FoundState = STATS(p->MinContext);
}
671 
Ppmd7_MakeEscFreq(CPpmd7 * p,unsigned numMasked,UInt32 * escFreq)672 static CPpmd_See *Ppmd7_MakeEscFreq(CPpmd7 *p, unsigned numMasked, UInt32 *escFreq)
673 {
674   CPpmd_See *see;
675   unsigned nonMasked = p->MinContext->NumStats - numMasked;
676   if (p->MinContext->NumStats != 256)
677   {
678     see = p->See[p->NS2Indx[nonMasked - 1]] +
679         (nonMasked < (unsigned)SUFFIX(p->MinContext)->NumStats - p->MinContext->NumStats) +
680         2 * (p->MinContext->SummFreq < 11 * p->MinContext->NumStats) +
681         4 * (numMasked > nonMasked) +
682         p->HiBitsFlag;
683     {
684       unsigned r = (see->Summ >> see->Shift);
685       see->Summ = (UInt16)(see->Summ - r);
686       *escFreq = r + (r == 0);
687     }
688   }
689   else
690   {
691     see = &p->DummySee;
692     *escFreq = 1;
693   }
694   return see;
695 }
696 
/*
 * NextContext -- move on after a symbol has been coded.
 * When p->OrderFall is 0 and FoundState's successor lies above the
 * current text position, it is adopted directly as the new context;
 * in every other case UpdateModel() does the work.
 */
static void NextContext(CPpmd7 *p)
{
  CTX_PTR next = CTX(SUCCESSOR(p->FoundState));

  if (p->OrderFall != 0 || (Byte *)next <= p->Text)
  {
    UpdateModel(p);
    return;
  }
  p->MinContext = p->MaxContext = next;
}
705 
/*
 * Ppmd7_Update1 -- bookkeeping after coding a state other than the first
 * one of a multi-state context.  Adds 4 to the state's frequency and to
 * SummFreq, swaps the state with its predecessor if it is now more
 * frequent (rescaling if it exceeds MAX_FREQ), then advances the context.
 */
static void Ppmd7_Update1(CPpmd7 *p)
{
  CPpmd_State *cur = p->FoundState;
  CPpmd_State *prev = cur - 1;

  cur->Freq += 4;
  p->MinContext->SummFreq += 4;
  if (cur->Freq > prev->Freq)
  {
    SwapStates(cur, prev);
    p->FoundState = prev;
    if (prev->Freq > MAX_FREQ)
      Rescale(p);
  }
  NextContext(p);
}
720 
/*
 * Ppmd7_Update1_0 -- bookkeeping after coding the first state of a
 * multi-state context.  PrevSuccess records whether the state held more
 * than half of SummFreq (measured before the update) and is added to
 * RunLength.
 */
static void Ppmd7_Update1_0(CPpmd7 *p)
{
  CPpmd_State *found = p->FoundState;
  CTX_PTR mc = p->MinContext;

  p->PrevSuccess = (2 * found->Freq > mc->SummFreq);
  p->RunLength += p->PrevSuccess;
  mc->SummFreq += 4;
  found->Freq += 4;
  if (found->Freq > MAX_FREQ)
    Rescale(p);
  NextContext(p);
}
730 
/*
 * Ppmd7_UpdateBin -- bookkeeping after the single state of a binary
 * context was coded: its frequency grows by one (capped at 128),
 * PrevSuccess is set and RunLength incremented.
 */
static void Ppmd7_UpdateBin(CPpmd7 *p)
{
  CPpmd_State *only = p->FoundState;

  if (only->Freq < 128)
    only->Freq++;
  p->PrevSuccess = 1;
  p->RunLength++;
  NextContext(p);
}
738 
/*
 * Ppmd7_Update2 -- bookkeeping after a symbol was coded following at
 * least one escape.  RunLength is reset to InitRL and the model is
 * always updated through UpdateModel().
 */
static void Ppmd7_Update2(CPpmd7 *p)
{
  CPpmd_State *found = p->FoundState;

  p->MinContext->SummFreq += 4;
  found->Freq += 4;
  if (found->Freq > MAX_FREQ)
    Rescale(p);
  p->RunLength = p->InitRL;
  UpdateModel(p);
}
747 
748 /* ---------- Decode ---------- */
749 
Ppmd_RangeDec_Init(CPpmd7z_RangeDec * p)750 static Bool Ppmd_RangeDec_Init(CPpmd7z_RangeDec *p)
751 {
752   unsigned i;
753   p->Low = p->Bottom = 0;
754   p->Range = 0xFFFFFFFF;
755   for (i = 0; i < 4; i++)
756     p->Code = (p->Code << 8) | p->Stream->Read((void *)p->Stream);
757   return (p->Code < 0xFFFFFFFF);
758 }
759 
Ppmd7z_RangeDec_Init(CPpmd7z_RangeDec * p)760 static Bool Ppmd7z_RangeDec_Init(CPpmd7z_RangeDec *p)
761 {
762   if (p->Stream->Read((void *)p->Stream) != 0)
763     return False;
764   return Ppmd_RangeDec_Init(p);
765 }
766 
PpmdRAR_RangeDec_Init(CPpmd7z_RangeDec * p)767 static Bool PpmdRAR_RangeDec_Init(CPpmd7z_RangeDec *p)
768 {
769   if (!Ppmd_RangeDec_Init(p))
770     return False;
771   p->Bottom = 0x8000;
772   return True;
773 }
774 
/*
 * Range_GetThreshold -- divide Range by `total` (stored back into Range)
 * and return (Code - Low) divided by the new Range.
 * `pp` is the CPpmd7z_RangeDec.  No guard against a zero divisor is made
 * here.
 */
static UInt32 Range_GetThreshold(void *pp, UInt32 total)
{
  CPpmd7z_RangeDec *rd = (CPpmd7z_RangeDec *)pp;

  rd->Range /= total;
  return (rd->Code - rd->Low) / rd->Range;
}
780 
/*
 * Range_Normalize -- shift in stream bytes until the decoder state is
 * normalised again.
 *
 * The loop ends once Low and Low + Range differ at or above kTopValue
 * and Range is at least Bottom.  If they differ there but Range is below
 * Bottom, Range is first clamped to (-Low) & (Bottom - 1).  Every round
 * shifts Code, Range and Low left by 8 bits and reads one byte into
 * Code.
 */
static void Range_Normalize(CPpmd7z_RangeDec *p)
{
  for (;;)
  {
    int topDiffers = ((p->Low ^ (p->Low + p->Range)) >= kTopValue);

    if (topDiffers && p->Range >= p->Bottom)
      return;
    if (topDiffers)
      p->Range = ((uint32_t)(-(int32_t)p->Low)) & (p->Bottom - 1);

    p->Code = (p->Code << 8) | p->Stream->Read((void *)p->Stream);
    p->Range <<= 8;
    p->Low <<= 8;
  }
}
797 
/*
 * Range_Decode_7z -- consume the interval [start, start + size) in the
 * 7z variant: Code is lowered by start * Range, Range is multiplied by
 * size, then the state is normalised.
 */
static void Range_Decode_7z(void *pp, UInt32 start, UInt32 size)
{
  CPpmd7z_RangeDec *rd = (CPpmd7z_RangeDec *)pp;

  rd->Code -= start * rd->Range;
  rd->Range *= size;
  Range_Normalize(rd);
}
805 
/*
 * Range_Decode_RAR -- consume the interval [start, start + size) in the
 * RAR variant: Low is raised by start * Range (Code is left alone),
 * Range is multiplied by size, then the state is normalised.
 */
static void Range_Decode_RAR(void *pp, UInt32 start, UInt32 size)
{
  CPpmd7z_RangeDec *rd = (CPpmd7z_RangeDec *)pp;

  rd->Low += start * rd->Range;
  rd->Range *= size;
  Range_Normalize(rd);
}
813 
/*
 * Range_DecodeBit_7z -- decode one binary decision in the 7z variant.
 * The bound is (Range >> 14) * size0; a Code below it yields 0,
 * anything else yields 1.
 */
static UInt32 Range_DecodeBit_7z(void *pp, UInt32 size0)
{
  CPpmd7z_RangeDec *rd = (CPpmd7z_RangeDec *)pp;
  UInt32 bound = (rd->Range >> 14) * size0;
  UInt32 bit = (rd->Code >= bound);

  if (bit)
  {
    rd->Code -= bound;
    rd->Range -= bound;
  }
  else
    rd->Range = bound;

  Range_Normalize(rd);
  return bit;
}
833 
/*
 * Range_DecodeBit_RAR -- decode one binary decision in the RAR variant,
 * expressed through the generic GetThreshold/Decode callbacks with a
 * total of PPMD_BIN_SCALE.
 */
static UInt32 Range_DecodeBit_RAR(void *pp, UInt32 size0)
{
  CPpmd7z_RangeDec *rd = (CPpmd7z_RangeDec *)pp;
  UInt32 value = rd->p.GetThreshold(rd, PPMD_BIN_SCALE);

  if (value >= size0)
  {
    rd->p.Decode(rd, size0, PPMD_BIN_SCALE - size0);
    return 1;
  }
  rd->p.Decode(rd, 0, size0);
  return 0;
}
850 
/* Ppmd7z_RangeDec_CreateVTable -- install the 7z decoder callbacks in p->p. */
static void Ppmd7z_RangeDec_CreateVTable(CPpmd7z_RangeDec *p)
{
  p->p.DecodeBit = Range_DecodeBit_7z;
  p->p.Decode = Range_Decode_7z;
  p->p.GetThreshold = Range_GetThreshold;
}
857 
/* PpmdRAR_RangeDec_CreateVTable -- install the RAR decoder callbacks in p->p. */
static void PpmdRAR_RangeDec_CreateVTable(CPpmd7z_RangeDec *p)
{
  p->p.DecodeBit = Range_DecodeBit_RAR;
  p->p.Decode = Range_Decode_RAR;
  p->p.GetThreshold = Range_GetThreshold;
}
864 
/* Byte-wise view of the local `charMask` array, indexed by symbol. */
#define MASK(sym) ((signed char *)charMask)[sym]

/*
 * Ppmd7_DecodeSymbol -- decode the next symbol using range decoder `rc`
 * and update the model.
 *
 * Returns the symbol value on success, -1 when an escape is decoded in a
 * context that has no suffix, and -2 when the value obtained from the
 * range decoder lies outside the expected total.
 *
 * charMask holds one byte per symbol; a byte is cleared for every symbol
 * that has already been ruled out by an escape.
 */
static int Ppmd7_DecodeSymbol(CPpmd7 *p, IPpmd7_RangeDec *rc)
{
  size_t charMask[256 / sizeof(size_t)];
  if (p->MinContext->NumStats != 1)
  {
    /* context with several states */
    CPpmd_State *s = Ppmd7_GetStats(p, p->MinContext);
    unsigned i;
    UInt32 count, hiCnt;
    /* first state is checked separately */
    if ((count = rc->GetThreshold(rc, p->MinContext->SummFreq)) < (hiCnt = s->Freq))
    {
      Byte symbol;
      rc->Decode(rc, 0, s->Freq);
      p->FoundState = s;
      symbol = s->Symbol;
      Ppmd7_Update1_0(p);
      return symbol;
    }
    p->PrevSuccess = 0;
    i = p->MinContext->NumStats - 1;
    do
    {
      /* hiCnt is the cumulative frequency including the current state */
      if ((hiCnt += (++s)->Freq) > count)
      {
        Byte symbol;
        rc->Decode(rc, hiCnt - s->Freq, s->Freq);
        p->FoundState = s;
        symbol = s->Symbol;
        Ppmd7_Update1(p);
        return symbol;
      }
    }
    while (--i);
    if (count >= p->MinContext->SummFreq)
      return -2;
    /* escape: consume the remaining interval and mask every symbol of
       this context */
    p->HiBitsFlag = p->HB2Flag[p->FoundState->Symbol];
    rc->Decode(rc, hiCnt, p->MinContext->SummFreq - hiCnt);
    PPMD_SetAllBitsIn256Bytes(charMask);
    MASK(s->Symbol) = 0;
    i = p->MinContext->NumStats - 1;
    do { MASK((--s)->Symbol) = 0; } while (--i);
  }
  else
  {
    /* single-state context: one binary decision */
    UInt16 *prob = Ppmd7_GetBinSumm(p);
    if (rc->DecodeBit(rc, *prob) == 0)
    {
      Byte symbol;
      *prob = (UInt16)PPMD_UPDATE_PROB_0(*prob);
      symbol = (p->FoundState = Ppmd7Context_OneState(p->MinContext))->Symbol;
      Ppmd7_UpdateBin(p);
      return symbol;
    }
    /* escape */
    *prob = (UInt16)PPMD_UPDATE_PROB_1(*prob);
    p->InitEsc = PPMD7_kExpEscape[*prob >> 10];
    PPMD_SetAllBitsIn256Bytes(charMask);
    MASK(Ppmd7Context_OneState(p->MinContext)->Symbol) = 0;
    p->PrevSuccess = 0;
  }
  /* after an escape: retry in suffix contexts, skipping masked symbols */
  for (;;)
  {
    CPpmd_State *ps[256], *s;
    UInt32 freqSum, count, hiCnt;
    CPpmd_See *see;
    unsigned i, num, numMasked = p->MinContext->NumStats;
    /* climb until a context with more states than are masked is found */
    do
    {
      p->OrderFall++;
      if (!p->MinContext->Suffix)
        return -1;
      p->MinContext = Ppmd7_GetContext(p, p->MinContext->Suffix);
    }
    while (p->MinContext->NumStats == numMasked);
    hiCnt = 0;
    s = Ppmd7_GetStats(p, p->MinContext);
    i = 0;
    num = p->MinContext->NumStats - numMasked;
    /* collect the num non-masked states in ps[] and sum their
       frequencies.  k is the mask byte as a signed value; the code relies
       on it being 0 (masked) or -1 (not masked), so `Freq & k` keeps or
       drops the frequency and `i -= k` counts only non-masked states */
    do
    {
      int k = (int)(MASK(s->Symbol));
      hiCnt += (s->Freq & k);
      ps[i] = s++;
      i -= k;
    }
    while (i != num);

    see = Ppmd7_MakeEscFreq(p, numMasked, &freqSum);
    freqSum += hiCnt;
    count = rc->GetThreshold(rc, freqSum);

    if (count < hiCnt)
    {
      Byte symbol;
      CPpmd_State **pps = ps;
      /* find the state whose cumulative interval contains count */
      for (hiCnt = 0; (hiCnt += (*pps)->Freq) <= count; pps++);
      s = *pps;
      rc->Decode(rc, hiCnt - s->Freq, s->Freq);
      Ppmd_See_Update(see);
      p->FoundState = s;
      symbol = s->Symbol;
      Ppmd7_Update2(p);
      return symbol;
    }
    if (count >= freqSum)
      return -2;
    /* another escape: consume it, update the SEE slot and mask the
       states collected in this round */
    rc->Decode(rc, hiCnt, freqSum - hiCnt);
    see->Summ = (UInt16)(see->Summ + freqSum);
    do { MASK(ps[--i]->Symbol) = 0; } while (i != 0);
  }
}
976 
977 /* ---------- Encode ---------- Ppmd7Enc.c */
978 
979 #define kTopValue (1 << 24)
980 
Ppmd7z_RangeEnc_Init(CPpmd7z_RangeEnc * p)981 static void Ppmd7z_RangeEnc_Init(CPpmd7z_RangeEnc *p)
982 {
983   p->Low = 0;
984   p->Range = 0xFFFFFFFF;
985   p->Cache = 0;
986   p->CacheSize = 1;
987 }
988 
/*
 * RangeEnc_ShiftLow -- move the top byte of Low towards the output.
 *
 * Bytes are only written once the carry is settled, i.e. when the low 32
 * bits are below 0xFF000000 or bits above bit 31 are set.  In that case
 * the cached byte plus CacheSize - 1 bytes of 0xFF are written, each
 * with the carry added, and the current top byte becomes the new cache.
 * Low is then shifted left by 8 and truncated to 32 bits.
 */
static void RangeEnc_ShiftLow(CPpmd7z_RangeEnc *p)
{
  UInt32 low32 = (UInt32)p->Low;
  unsigned carry = (unsigned)(p->Low >> 32);

  if (low32 < (UInt32)0xFF000000 || carry != 0)
  {
    Byte pending = p->Cache;

    do
    {
      p->Stream->Write(p->Stream, (Byte)(pending + (Byte)carry));
      pending = 0xFF;
    }
    while (--p->CacheSize != 0);
    p->Cache = (Byte)(low32 >> 24);
  }
  p->CacheSize++;
  p->Low = (low32 << 8) & 0xFFFFFFFF;
}
1005 
/*
 * RangeEnc_Encode -- encode the interval [start, start + size) out of
 * `total`, then emit bytes while Range is below kTopValue.
 */
static void RangeEnc_Encode(CPpmd7z_RangeEnc *p, UInt32 start, UInt32 size, UInt32 total)
{
  p->Range /= total;
  p->Low += (UInt64)start * (UInt64)p->Range;
  p->Range *= size;

  for (; p->Range < kTopValue; RangeEnc_ShiftLow(p))
    p->Range <<= 8;
}
1016 
/*
 * RangeEnc_EncodeBit_0 -- encode a binary 0: Range shrinks to
 * (Range >> 14) * size0 and Low is unchanged; bytes are emitted while
 * Range is below kTopValue.
 */
static void RangeEnc_EncodeBit_0(CPpmd7z_RangeEnc *p, UInt32 size0)
{
  UInt32 bound = (p->Range >> 14) * size0;

  p->Range = bound;
  for (; p->Range < kTopValue; RangeEnc_ShiftLow(p))
    p->Range <<= 8;
}
1026 
/*
 * RangeEnc_EncodeBit_1 -- encode a binary 1: Low moves up by
 * (Range >> 14) * size0 and Range shrinks by the same amount; bytes are
 * emitted while Range is below kTopValue.
 */
static void RangeEnc_EncodeBit_1(CPpmd7z_RangeEnc *p, UInt32 size0)
{
  UInt32 bound = (p->Range >> 14) * size0;

  p->Range -= bound;
  p->Low += bound;
  for (; p->Range < kTopValue; RangeEnc_ShiftLow(p))
    p->Range <<= 8;
}
1038 
/*
 * Ppmd7z_RangeEnc_FlushData -- push the encoder's pending state to the
 * stream by shifting Low out five times.
 */
static void Ppmd7z_RangeEnc_FlushData(CPpmd7z_RangeEnc *p)
{
  unsigned remaining = 5;

  while (remaining-- != 0)
    RangeEnc_ShiftLow(p);
}
1045 
1046 
/* Byte-wise view of the local `charMask` array, indexed by symbol
   (identical to the definition used by the decoder above). */
#define MASK(sym) ((signed char *)charMask)[sym]

/*
 * Ppmd7_EncodeSymbol -- encode `symbol` with range encoder `rc` and
 * update the model.
 *
 * The symbol is looked up in p->MinContext; if it is absent an escape is
 * encoded and the search continues in the suffix contexts, with the
 * symbols already seen masked out through charMask.  If the suffix chain
 * ends without a match (as happens for the end marker, symbol = -1) the
 * function simply returns after the last escape.
 */
static void Ppmd7_EncodeSymbol(CPpmd7 *p, CPpmd7z_RangeEnc *rc, int symbol)
{
  size_t charMask[256 / sizeof(size_t)];
  if (p->MinContext->NumStats != 1)
  {
    /* context with several states */
    CPpmd_State *s = Ppmd7_GetStats(p, p->MinContext);
    UInt32 sum;
    unsigned i;
    /* first state is checked separately */
    if (s->Symbol == symbol)
    {
      RangeEnc_Encode(rc, 0, s->Freq, p->MinContext->SummFreq);
      p->FoundState = s;
      Ppmd7_Update1_0(p);
      return;
    }
    p->PrevSuccess = 0;
    /* sum: cumulative frequency of the states before the current one */
    sum = s->Freq;
    i = p->MinContext->NumStats - 1;
    do
    {
      if ((++s)->Symbol == symbol)
      {
        RangeEnc_Encode(rc, sum, s->Freq, p->MinContext->SummFreq);
        p->FoundState = s;
        Ppmd7_Update1(p);
        return;
      }
      sum += s->Freq;
    }
    while (--i);

    /* not found: mask every symbol of this context and encode an escape */
    p->HiBitsFlag = p->HB2Flag[p->FoundState->Symbol];
    PPMD_SetAllBitsIn256Bytes(charMask);
    MASK(s->Symbol) = 0;
    i = p->MinContext->NumStats - 1;
    do { MASK((--s)->Symbol) = 0; } while (--i);
    RangeEnc_Encode(rc, sum, p->MinContext->SummFreq - sum, p->MinContext->SummFreq);
  }
  else
  {
    /* single-state context: one binary decision */
    UInt16 *prob = Ppmd7_GetBinSumm(p);
    CPpmd_State *s = Ppmd7Context_OneState(p->MinContext);
    if (s->Symbol == symbol)
    {
      RangeEnc_EncodeBit_0(rc, *prob);
      *prob = (UInt16)PPMD_UPDATE_PROB_0(*prob);
      p->FoundState = s;
      Ppmd7_UpdateBin(p);
      return;
    }
    else
    {
      /* escape */
      RangeEnc_EncodeBit_1(rc, *prob);
      *prob = (UInt16)PPMD_UPDATE_PROB_1(*prob);
      p->InitEsc = PPMD7_kExpEscape[*prob >> 10];
      PPMD_SetAllBitsIn256Bytes(charMask);
      MASK(s->Symbol) = 0;
      p->PrevSuccess = 0;
    }
  }
  /* after an escape: retry in suffix contexts, skipping masked symbols */
  for (;;)
  {
    UInt32 escFreq;
    CPpmd_See *see;
    CPpmd_State *s;
    UInt32 sum;
    unsigned i, numMasked = p->MinContext->NumStats;
    /* climb until a context with more states than are masked is found */
    do
    {
      p->OrderFall++;
      if (!p->MinContext->Suffix)
        return; /* EndMarker (symbol = -1) */
      p->MinContext = Ppmd7_GetContext(p, p->MinContext->Suffix);
    }
    while (p->MinContext->NumStats == numMasked);

    see = Ppmd7_MakeEscFreq(p, numMasked, &escFreq);
    s = Ppmd7_GetStats(p, p->MinContext);
    sum = 0;
    i = p->MinContext->NumStats;
    do
    {
      int cur = s->Symbol;
      if (cur == symbol)
      {
        /* found: `low` is the cumulative frequency before this state;
           keep summing the remaining non-masked states to get the total */
        UInt32 low = sum;
        CPpmd_State *s1 = s;
        do
        {
          sum += (s->Freq & (int)(MASK(s->Symbol)));
          s++;
        }
        while (--i);
        RangeEnc_Encode(rc, low, s1->Freq, sum + escFreq);
        Ppmd_See_Update(see);
        p->FoundState = s1;
        Ppmd7_Update2(p);
        return;
      }
      /* the mask byte as a signed value is relied on to be 0 (masked) or
         -1 (not masked), so the AND keeps or drops the frequency; the
         symbol is masked for the next round as it is passed */
      sum += (s->Freq & (int)(MASK(cur)));
      MASK(cur) = 0;
      s++;
    }
    while (--i);

    /* not in this context either: encode another escape */
    RangeEnc_Encode(rc, sum, escFreq, sum + escFreq);
    see->Summ = (UInt16)(see->Summ + sum + escFreq);
  }
}
1158 
1159 const IPpmd7 __archive_ppmd7_functions =
1160 {
1161   &Ppmd7_Construct,
1162   &Ppmd7_Alloc,
1163   &Ppmd7_Free,
1164   &Ppmd7_Init,
1165   &Ppmd7z_RangeDec_CreateVTable,
1166   &PpmdRAR_RangeDec_CreateVTable,
1167   &Ppmd7z_RangeDec_Init,
1168   &PpmdRAR_RangeDec_Init,
1169   &Ppmd7_DecodeSymbol,
1170   &Ppmd7z_RangeEnc_Init,
1171   &Ppmd7z_RangeEnc_FlushData,
1172   &Ppmd7_EncodeSymbol
1173 };
1174