1 /* Ppmd8.c -- PPMdI codec 2 2016-05-21 : Igor Pavlov : Public domain 3 This code is based on PPMd var.I (2002): Dmitry Shkarin : Public domain */ 4 5 #include "archive_platform.h" 6 7 #include <string.h> 8 9 #include "archive_ppmd8_private.h" 10 11 const Byte PPMD8_kExpEscape[16] = { 25, 14, 9, 7, 5, 5, 4, 4, 4, 3, 3, 3, 2, 2, 2, 2 }; 12 static const UInt16 kInitBinEsc[] = { 0x3CDD, 0x1F3F, 0x59BF, 0x48F3, 0x64A1, 0x5ABC, 0x6632, 0x6051}; 13 14 #define MAX_FREQ 124 15 #define UNIT_SIZE 12 16 17 #define U2B(nu) ((UInt32)(nu) * UNIT_SIZE) 18 #define U2I(nu) (p->Units2Indx[(nu) - 1]) 19 #define I2U(indx) (p->Indx2Units[indx]) 20 21 #ifdef PPMD_32BIT 22 #define REF(ptr) (ptr) 23 #else 24 #define REF(ptr) ((UInt32)((Byte *)(ptr) - (p)->Base)) 25 #endif 26 27 #define STATS_REF(ptr) ((CPpmd_State_Ref)REF(ptr)) 28 29 #define CTX(ref) ((CPpmd8_Context *)Ppmd8_GetContext(p, ref)) 30 #define STATS(ctx) Ppmd8_GetStats(p, ctx) 31 #define ONE_STATE(ctx) Ppmd8Context_OneState(ctx) 32 #define SUFFIX(ctx) CTX((ctx)->Suffix) 33 34 #define kTop (1 << 24) 35 #define kBot (1 << 15) 36 37 typedef CPpmd8_Context * CTX_PTR; 38 39 struct CPpmd8_Node_; 40 41 typedef 42 #ifdef PPMD_32BIT 43 struct CPpmd8_Node_ * 44 #else 45 UInt32 46 #endif 47 CPpmd8_Node_Ref; 48 49 typedef struct CPpmd8_Node_ 50 { 51 UInt32 Stamp; 52 CPpmd8_Node_Ref Next; 53 UInt32 NU; 54 } CPpmd8_Node; 55 56 #ifdef PPMD_32BIT 57 #define NODE(ptr) (ptr) 58 #else 59 #define NODE(offs) ((CPpmd8_Node *)(p->Base + (offs))) 60 #endif 61 62 #define EMPTY_NODE 0xFFFFFFFF 63 64 void Ppmd8_Construct(CPpmd8 *p) 65 { 66 unsigned i, k, m; 67 68 p->Base = 0; 69 70 for (i = 0, k = 0; i < PPMD_NUM_INDEXES; i++) 71 { 72 unsigned step = (i >= 12 ? 4 : (i >> 2) + 1); 73 do { p->Units2Indx[k++] = (Byte)i; } while (--step); 74 p->Indx2Units[i] = (Byte)k; 75 } 76 77 p->NS2BSIndx[0] = (0 << 1); 78 p->NS2BSIndx[1] = (1 << 1); 79 memset(p->NS2BSIndx + 2, (2 << 1), 9); 80 memset(p->NS2BSIndx + 11, (3 << 1), 256 - 11); 81 82 for (i = 0; i < 5; i++) 83 p->NS2Indx[i] = (Byte)i; 84 for (m = i, k = 1; i < 260; i++) 85 { 86 p->NS2Indx[i] = (Byte)m; 87 if (--k == 0) 88 k = (++m) - 4; 89 } 90 } 91 92 void Ppmd8_Free(CPpmd8 *p) 93 { 94 free(p->Base); 95 p->Size = 0; 96 p->Base = 0; 97 } 98 99 Bool Ppmd8_Alloc(CPpmd8 *p, UInt32 size) 100 { 101 if (p->Base == 0 || p->Size != size) 102 { 103 Ppmd8_Free(p); 104 p->AlignOffset = 105 #ifdef PPMD_32BIT 106 (4 - size) & 3; 107 #else 108 4 - (size & 3); 109 #endif 110 if ((p->Base = malloc(p->AlignOffset + size)) == 0) 111 return False; 112 p->Size = size; 113 } 114 return True; 115 } 116 117 static void InsertNode(CPpmd8 *p, void *node, unsigned indx) 118 { 119 ((CPpmd8_Node *)node)->Stamp = EMPTY_NODE; 120 ((CPpmd8_Node *)node)->Next = (CPpmd8_Node_Ref)p->FreeList[indx]; 121 ((CPpmd8_Node *)node)->NU = I2U(indx); 122 p->FreeList[indx] = REF(node); 123 p->Stamps[indx]++; 124 } 125 126 static void *RemoveNode(CPpmd8 *p, unsigned indx) 127 { 128 CPpmd8_Node *node = NODE((CPpmd8_Node_Ref)p->FreeList[indx]); 129 p->FreeList[indx] = node->Next; 130 p->Stamps[indx]--; 131 return node; 132 } 133 134 static void SplitBlock(CPpmd8 *p, void *ptr, unsigned oldIndx, unsigned newIndx) 135 { 136 unsigned i, nu = I2U(oldIndx) - I2U(newIndx); 137 ptr = (Byte *)ptr + U2B(I2U(newIndx)); 138 if (I2U(i = U2I(nu)) != nu) 139 { 140 unsigned k = I2U(--i); 141 InsertNode(p, ((Byte *)ptr) + U2B(k), nu - k - 1); 142 } 143 InsertNode(p, ptr, i); 144 } 145 146 static void GlueFreeBlocks(CPpmd8 *p) 147 { 148 CPpmd8_Node_Ref head = 0; 149 CPpmd8_Node_Ref *prev = &head; 150 unsigned i; 151 152 p->GlueCount = 1 << 13; 153 memset(p->Stamps, 0, sizeof(p->Stamps)); 154 155 /* Order-0 context is always at top UNIT, so we don't need guard NODE at the end. 156 All blocks up to p->LoUnit can be free, so we need guard NODE at LoUnit. */ 157 if (p->LoUnit != p->HiUnit) 158 ((CPpmd8_Node *)p->LoUnit)->Stamp = 0; 159 160 /* Glue free blocks */ 161 for (i = 0; i < PPMD_NUM_INDEXES; i++) 162 { 163 CPpmd8_Node_Ref next = (CPpmd8_Node_Ref)p->FreeList[i]; 164 p->FreeList[i] = 0; 165 while (next != 0) 166 { 167 CPpmd8_Node *node = NODE(next); 168 if (node->NU != 0) 169 { 170 CPpmd8_Node *node2; 171 *prev = next; 172 prev = &(node->Next); 173 while ((node2 = node + node->NU)->Stamp == EMPTY_NODE) 174 { 175 node->NU += node2->NU; 176 node2->NU = 0; 177 } 178 } 179 next = node->Next; 180 } 181 } 182 *prev = 0; 183 184 /* Fill lists of free blocks */ 185 while (head != 0) 186 { 187 CPpmd8_Node *node = NODE(head); 188 unsigned nu; 189 head = node->Next; 190 nu = node->NU; 191 if (nu == 0) 192 continue; 193 for (; nu > 128; nu -= 128, node += 128) 194 InsertNode(p, node, PPMD_NUM_INDEXES - 1); 195 if (I2U(i = U2I(nu)) != nu) 196 { 197 unsigned k = I2U(--i); 198 InsertNode(p, node + k, nu - k - 1); 199 } 200 InsertNode(p, node, i); 201 } 202 } 203 204 static void *AllocUnitsRare(CPpmd8 *p, unsigned indx) 205 { 206 unsigned i; 207 void *retVal; 208 if (p->GlueCount == 0) 209 { 210 GlueFreeBlocks(p); 211 if (p->FreeList[indx] != 0) 212 return RemoveNode(p, indx); 213 } 214 i = indx; 215 do 216 { 217 if (++i == PPMD_NUM_INDEXES) 218 { 219 UInt32 numBytes = U2B(I2U(indx)); 220 p->GlueCount--; 221 return ((UInt32)(p->UnitsStart - p->Text) > numBytes) ? (p->UnitsStart -= numBytes) : (NULL); 222 } 223 } 224 while (p->FreeList[i] == 0); 225 retVal = RemoveNode(p, i); 226 SplitBlock(p, retVal, i, indx); 227 return retVal; 228 } 229 230 static void *AllocUnits(CPpmd8 *p, unsigned indx) 231 { 232 UInt32 numBytes; 233 if (p->FreeList[indx] != 0) 234 return RemoveNode(p, indx); 235 numBytes = U2B(I2U(indx)); 236 if (numBytes <= (UInt32)(p->HiUnit - p->LoUnit)) 237 { 238 void *retVal = p->LoUnit; 239 p->LoUnit += numBytes; 240 return retVal; 241 } 242 return AllocUnitsRare(p, indx); 243 } 244 245 #define MyMem12Cpy(dest, src, num) \ 246 { UInt32 *d = (UInt32 *)dest; const UInt32 *z = (const UInt32 *)src; UInt32 n = num; \ 247 do { d[0] = z[0]; d[1] = z[1]; d[2] = z[2]; z += 3; d += 3; } while (--n); } 248 249 static void *ShrinkUnits(CPpmd8 *p, void *oldPtr, unsigned oldNU, unsigned newNU) 250 { 251 unsigned i0 = U2I(oldNU); 252 unsigned i1 = U2I(newNU); 253 if (i0 == i1) 254 return oldPtr; 255 if (p->FreeList[i1] != 0) 256 { 257 void *ptr = RemoveNode(p, i1); 258 MyMem12Cpy(ptr, oldPtr, newNU); 259 InsertNode(p, oldPtr, i0); 260 return ptr; 261 } 262 SplitBlock(p, oldPtr, i0, i1); 263 return oldPtr; 264 } 265 266 static void FreeUnits(CPpmd8 *p, void *ptr, unsigned nu) 267 { 268 InsertNode(p, ptr, U2I(nu)); 269 } 270 271 static void SpecialFreeUnit(CPpmd8 *p, void *ptr) 272 { 273 if ((Byte *)ptr != p->UnitsStart) 274 InsertNode(p, ptr, 0); 275 else 276 { 277 #ifdef PPMD8_FREEZE_SUPPORT 278 *(UInt32 *)ptr = EMPTY_NODE; /* it's used for (Flags == 0xFF) check in RemoveBinContexts */ 279 #endif 280 p->UnitsStart += UNIT_SIZE; 281 } 282 } 283 284 static void *MoveUnitsUp(CPpmd8 *p, void *oldPtr, unsigned nu) 285 { 286 unsigned indx = U2I(nu); 287 void *ptr; 288 if ((Byte *)oldPtr > p->UnitsStart + 16 * 1024 || REF(oldPtr) > p->FreeList[indx]) 289 return oldPtr; 290 ptr = RemoveNode(p, indx); 291 MyMem12Cpy(ptr, oldPtr, nu); 292 if ((Byte*)oldPtr != p->UnitsStart) 293 InsertNode(p, oldPtr, indx); 294 else 295 p->UnitsStart += U2B(I2U(indx)); 296 return ptr; 297 } 298 299 static void ExpandTextArea(CPpmd8 *p) 300 { 301 UInt32 count[PPMD_NUM_INDEXES]; 302 unsigned i; 303 memset(count, 0, sizeof(count)); 304 if (p->LoUnit != p->HiUnit) 305 ((CPpmd8_Node *)p->LoUnit)->Stamp = 0; 306 307 { 308 CPpmd8_Node *node = (CPpmd8_Node *)p->UnitsStart; 309 for (; node->Stamp == EMPTY_NODE; node += node->NU) 310 { 311 node->Stamp = 0; 312 count[U2I(node->NU)]++; 313 } 314 p->UnitsStart = (Byte *)node; 315 } 316 317 for (i = 0; i < PPMD_NUM_INDEXES; i++) 318 { 319 CPpmd8_Node_Ref *next = (CPpmd8_Node_Ref *)&p->FreeList[i]; 320 while (count[i] != 0) 321 { 322 CPpmd8_Node *node = NODE(*next); 323 while (node->Stamp == 0) 324 { 325 *next = node->Next; 326 node = NODE(*next); 327 p->Stamps[i]--; 328 if (--count[i] == 0) 329 break; 330 } 331 next = &node->Next; 332 } 333 } 334 } 335 336 #define SUCCESSOR(p) ((CPpmd_Void_Ref)((p)->SuccessorLow | ((UInt32)(p)->SuccessorHigh << 16))) 337 338 static void SetSuccessor(CPpmd_State *p, CPpmd_Void_Ref v) 339 { 340 (p)->SuccessorLow = (UInt16)((UInt32)(v) & 0xFFFF); 341 (p)->SuccessorHigh = (UInt16)(((UInt32)(v) >> 16) & 0xFFFF); 342 } 343 344 #define RESET_TEXT(offs) { p->Text = p->Base + p->AlignOffset + (offs); } 345 346 static void RestartModel(CPpmd8 *p) 347 { 348 unsigned i, k, m, r; 349 350 memset(p->FreeList, 0, sizeof(p->FreeList)); 351 memset(p->Stamps, 0, sizeof(p->Stamps)); 352 RESET_TEXT(0); 353 p->HiUnit = p->Text + p->Size; 354 p->LoUnit = p->UnitsStart = p->HiUnit - p->Size / 8 / UNIT_SIZE * 7 * UNIT_SIZE; 355 p->GlueCount = 0; 356 357 p->OrderFall = p->MaxOrder; 358 p->RunLength = p->InitRL = -(Int32)((p->MaxOrder < 12) ? p->MaxOrder : 12) - 1; 359 p->PrevSuccess = 0; 360 361 p->MinContext = p->MaxContext = (CTX_PTR)(p->HiUnit -= UNIT_SIZE); /* AllocContext(p); */ 362 p->MinContext->Suffix = 0; 363 p->MinContext->NumStats = 255; 364 p->MinContext->Flags = 0; 365 p->MinContext->SummFreq = 256 + 1; 366 p->FoundState = (CPpmd_State *)p->LoUnit; /* AllocUnits(p, PPMD_NUM_INDEXES - 1); */ 367 p->LoUnit += U2B(256 / 2); 368 p->MinContext->Stats = REF(p->FoundState); 369 for (i = 0; i < 256; i++) 370 { 371 CPpmd_State *s = &p->FoundState[i]; 372 s->Symbol = (Byte)i; 373 s->Freq = 1; 374 SetSuccessor(s, 0); 375 } 376 377 for (i = m = 0; m < 25; m++) 378 { 379 while (p->NS2Indx[i] == m) 380 i++; 381 for (k = 0; k < 8; k++) 382 { 383 UInt16 val = (UInt16)(PPMD_BIN_SCALE - kInitBinEsc[k] / (i + 1)); 384 UInt16 *dest = p->BinSumm[m] + k; 385 for (r = 0; r < 64; r += 8) 386 dest[r] = val; 387 } 388 } 389 390 for (i = m = 0; m < 24; m++) 391 { 392 while (p->NS2Indx[i + 3] == m + 3) 393 i++; 394 for (k = 0; k < 32; k++) 395 { 396 CPpmd_See *s = &p->See[m][k]; 397 s->Summ = (UInt16)((2 * i + 5) << (s->Shift = PPMD_PERIOD_BITS - 4)); 398 s->Count = 7; 399 } 400 } 401 } 402 403 void Ppmd8_Init(CPpmd8 *p, unsigned maxOrder, unsigned restoreMethod) 404 { 405 p->MaxOrder = maxOrder; 406 p->RestoreMethod = restoreMethod; 407 RestartModel(p); 408 p->DummySee.Shift = PPMD_PERIOD_BITS; 409 p->DummySee.Summ = 0; /* unused */ 410 p->DummySee.Count = 64; /* unused */ 411 } 412 413 static void Refresh(CPpmd8 *p, CTX_PTR ctx, unsigned oldNU, unsigned scale) 414 { 415 unsigned i = ctx->NumStats, escFreq, sumFreq, flags; 416 CPpmd_State *s = (CPpmd_State *)ShrinkUnits(p, STATS(ctx), oldNU, (i + 2) >> 1); 417 ctx->Stats = REF(s); 418 #ifdef PPMD8_FREEZE_SUPPORT 419 /* fixed over Shkarin's code. Fixed code is not compatible with original code for some files in FREEZE mode. */ 420 scale |= (ctx->SummFreq >= ((UInt32)1 << 15)); 421 #endif 422 flags = (ctx->Flags & (0x10 + 0x04 * scale)) + 0x08 * (s->Symbol >= 0x40); 423 escFreq = ctx->SummFreq - s->Freq; 424 sumFreq = (s->Freq = (Byte)((s->Freq + scale) >> scale)); 425 do 426 { 427 escFreq -= (++s)->Freq; 428 sumFreq += (s->Freq = (Byte)((s->Freq + scale) >> scale)); 429 flags |= 0x08 * (s->Symbol >= 0x40); 430 } 431 while (--i); 432 ctx->SummFreq = (UInt16)(sumFreq + ((escFreq + scale) >> scale)); 433 ctx->Flags = (Byte)flags; 434 } 435 436 static void SwapStates(CPpmd_State *t1, CPpmd_State *t2) 437 { 438 CPpmd_State tmp = *t1; 439 *t1 = *t2; 440 *t2 = tmp; 441 } 442 443 static CPpmd_Void_Ref CutOff(CPpmd8 *p, CTX_PTR ctx, unsigned order) 444 { 445 int i; 446 unsigned tmp; 447 CPpmd_State *s; 448 449 if (!ctx->NumStats) 450 { 451 s = ONE_STATE(ctx); 452 if ((Byte *)Ppmd8_GetPtr(p, SUCCESSOR(s)) >= p->UnitsStart) 453 { 454 if (order < p->MaxOrder) 455 SetSuccessor(s, CutOff(p, CTX(SUCCESSOR(s)), order + 1)); 456 else 457 SetSuccessor(s, 0); 458 if (SUCCESSOR(s) || order <= 9) /* O_BOUND */ 459 return REF(ctx); 460 } 461 SpecialFreeUnit(p, ctx); 462 return 0; 463 } 464 465 ctx->Stats = STATS_REF(MoveUnitsUp(p, STATS(ctx), tmp = ((unsigned)ctx->NumStats + 2) >> 1)); 466 467 for (s = STATS(ctx) + (i = ctx->NumStats); s >= STATS(ctx); s--) 468 if ((Byte *)Ppmd8_GetPtr(p, SUCCESSOR(s)) < p->UnitsStart) 469 { 470 CPpmd_State *s2 = STATS(ctx) + (i--); 471 SetSuccessor(s, 0); 472 SwapStates(s, s2); 473 } 474 else if (order < p->MaxOrder) 475 SetSuccessor(s, CutOff(p, CTX(SUCCESSOR(s)), order + 1)); 476 else 477 SetSuccessor(s, 0); 478 479 if (i != ctx->NumStats && order) 480 { 481 ctx->NumStats = (Byte)i; 482 s = STATS(ctx); 483 if (i < 0) 484 { 485 FreeUnits(p, s, tmp); 486 SpecialFreeUnit(p, ctx); 487 return 0; 488 } 489 if (i == 0) 490 { 491 ctx->Flags = (Byte)((ctx->Flags & 0x10) + 0x08 * (s->Symbol >= 0x40)); 492 *ONE_STATE(ctx) = *s; 493 FreeUnits(p, s, tmp); 494 /* 9.31: the code was fixed. It's was not BUG, if Freq <= MAX_FREQ = 124 */ 495 ONE_STATE(ctx)->Freq = (Byte)(((unsigned)ONE_STATE(ctx)->Freq + 11) >> 3); 496 } 497 else 498 Refresh(p, ctx, tmp, ctx->SummFreq > 16 * i); 499 } 500 return REF(ctx); 501 } 502 503 #ifdef PPMD8_FREEZE_SUPPORT 504 static CPpmd_Void_Ref RemoveBinContexts(CPpmd8 *p, CTX_PTR ctx, unsigned order) 505 { 506 CPpmd_State *s; 507 if (!ctx->NumStats) 508 { 509 s = ONE_STATE(ctx); 510 if ((Byte *)Ppmd8_GetPtr(p, SUCCESSOR(s)) >= p->UnitsStart && order < p->MaxOrder) 511 SetSuccessor(s, RemoveBinContexts(p, CTX(SUCCESSOR(s)), order + 1)); 512 else 513 SetSuccessor(s, 0); 514 /* Suffix context can be removed already, since different (high-order) 515 Successors may refer to same context. So we check Flags == 0xFF (Stamp == EMPTY_NODE) */ 516 if (!SUCCESSOR(s) && (!SUFFIX(ctx)->NumStats || SUFFIX(ctx)->Flags == 0xFF)) 517 { 518 FreeUnits(p, ctx, 1); 519 return 0; 520 } 521 else 522 return REF(ctx); 523 } 524 525 for (s = STATS(ctx) + ctx->NumStats; s >= STATS(ctx); s--) 526 if ((Byte *)Ppmd8_GetPtr(p, SUCCESSOR(s)) >= p->UnitsStart && order < p->MaxOrder) 527 SetSuccessor(s, RemoveBinContexts(p, CTX(SUCCESSOR(s)), order + 1)); 528 else 529 SetSuccessor(s, 0); 530 531 return REF(ctx); 532 } 533 #endif 534 535 static UInt32 GetUsedMemory(const CPpmd8 *p) 536 { 537 UInt32 v = 0; 538 unsigned i; 539 for (i = 0; i < PPMD_NUM_INDEXES; i++) 540 v += p->Stamps[i] * I2U(i); 541 return p->Size - (UInt32)(p->HiUnit - p->LoUnit) - (UInt32)(p->UnitsStart - p->Text) - U2B(v); 542 } 543 544 #ifdef PPMD8_FREEZE_SUPPORT 545 #define RESTORE_MODEL(c1, fSuccessor) RestoreModel(p, c1, fSuccessor) 546 #else 547 #define RESTORE_MODEL(c1, fSuccessor) RestoreModel(p, c1) 548 #endif 549 550 static void RestoreModel(CPpmd8 *p, CTX_PTR c1 551 #ifdef PPMD8_FREEZE_SUPPORT 552 , CTX_PTR fSuccessor 553 #endif 554 ) 555 { 556 CTX_PTR c; 557 CPpmd_State *s; 558 RESET_TEXT(0); 559 for (c = p->MaxContext; c != c1; c = SUFFIX(c)) 560 if (--(c->NumStats) == 0) 561 { 562 s = STATS(c); 563 c->Flags = (Byte)((c->Flags & 0x10) + 0x08 * (s->Symbol >= 0x40)); 564 *ONE_STATE(c) = *s; 565 SpecialFreeUnit(p, s); 566 ONE_STATE(c)->Freq = (Byte)(((unsigned)ONE_STATE(c)->Freq + 11) >> 3); 567 } 568 else 569 Refresh(p, c, (c->NumStats+3) >> 1, 0); 570 571 for (; c != p->MinContext; c = SUFFIX(c)) 572 if (!c->NumStats) 573 ONE_STATE(c)->Freq = (Byte)(ONE_STATE(c)->Freq - (ONE_STATE(c)->Freq >> 1)); 574 else if ((c->SummFreq += 4) > 128 + 4 * c->NumStats) 575 Refresh(p, c, (c->NumStats + 2) >> 1, 1); 576 577 #ifdef PPMD8_FREEZE_SUPPORT 578 if (p->RestoreMethod > PPMD8_RESTORE_METHOD_FREEZE) 579 { 580 p->MaxContext = fSuccessor; 581 p->GlueCount += !(p->Stamps[1] & 1); 582 } 583 else if (p->RestoreMethod == PPMD8_RESTORE_METHOD_FREEZE) 584 { 585 while (p->MaxContext->Suffix) 586 p->MaxContext = SUFFIX(p->MaxContext); 587 RemoveBinContexts(p, p->MaxContext, 0); 588 p->RestoreMethod++; 589 p->GlueCount = 0; 590 p->OrderFall = p->MaxOrder; 591 } 592 else 593 #endif 594 if (p->RestoreMethod == PPMD8_RESTORE_METHOD_RESTART || GetUsedMemory(p) < (p->Size >> 1)) 595 RestartModel(p); 596 else 597 { 598 while (p->MaxContext->Suffix) 599 p->MaxContext = SUFFIX(p->MaxContext); 600 do 601 { 602 CutOff(p, p->MaxContext, 0); 603 ExpandTextArea(p); 604 } 605 while (GetUsedMemory(p) > 3 * (p->Size >> 2)); 606 p->GlueCount = 0; 607 p->OrderFall = p->MaxOrder; 608 } 609 } 610 611 static CTX_PTR CreateSuccessors(CPpmd8 *p, Bool skip, CPpmd_State *s1, CTX_PTR c) 612 { 613 CPpmd_State upState; 614 Byte flags; 615 CPpmd_Byte_Ref upBranch = (CPpmd_Byte_Ref)SUCCESSOR(p->FoundState); 616 /* fixed over Shkarin's code. Maybe it could work without + 1 too. */ 617 CPpmd_State *ps[PPMD8_MAX_ORDER + 1]; 618 unsigned numPs = 0; 619 620 if (!skip) 621 ps[numPs++] = p->FoundState; 622 623 while (c->Suffix) 624 { 625 CPpmd_Void_Ref successor; 626 CPpmd_State *s; 627 c = SUFFIX(c); 628 if (s1) 629 { 630 s = s1; 631 s1 = NULL; 632 } 633 else if (c->NumStats != 0) 634 { 635 for (s = STATS(c); s->Symbol != p->FoundState->Symbol; s++); 636 if (s->Freq < MAX_FREQ - 9) 637 { 638 s->Freq++; 639 c->SummFreq++; 640 } 641 } 642 else 643 { 644 s = ONE_STATE(c); 645 s->Freq = (Byte)(s->Freq + (!SUFFIX(c)->NumStats & (s->Freq < 24))); 646 } 647 successor = SUCCESSOR(s); 648 if (successor != upBranch) 649 { 650 c = CTX(successor); 651 if (numPs == 0) 652 return c; 653 break; 654 } 655 ps[numPs++] = s; 656 } 657 658 upState.Symbol = *(const Byte *)Ppmd8_GetPtr(p, upBranch); 659 SetSuccessor(&upState, upBranch + 1); 660 flags = (Byte)(0x10 * (p->FoundState->Symbol >= 0x40) + 0x08 * (upState.Symbol >= 0x40)); 661 662 if (c->NumStats == 0) 663 upState.Freq = ONE_STATE(c)->Freq; 664 else 665 { 666 UInt32 cf, s0; 667 CPpmd_State *s; 668 for (s = STATS(c); s->Symbol != upState.Symbol; s++); 669 cf = s->Freq - 1; 670 s0 = c->SummFreq - c->NumStats - cf; 671 upState.Freq = (Byte)(1 + ((2 * cf <= s0) ? (5 * cf > s0) : ((cf + 2 * s0 - 3) / s0))); 672 } 673 674 while (numPs != 0) 675 { 676 /* Create Child */ 677 CTX_PTR c1; /* = AllocContext(p); */ 678 if (p->HiUnit != p->LoUnit) 679 c1 = (CTX_PTR)(p->HiUnit -= UNIT_SIZE); 680 else if (p->FreeList[0] != 0) 681 c1 = (CTX_PTR)RemoveNode(p, 0); 682 else 683 { 684 c1 = (CTX_PTR)AllocUnitsRare(p, 0); 685 if (!c1) 686 return NULL; 687 } 688 c1->NumStats = 0; 689 c1->Flags = flags; 690 *ONE_STATE(c1) = upState; 691 c1->Suffix = REF(c); 692 SetSuccessor(ps[--numPs], REF(c1)); 693 c = c1; 694 } 695 696 return c; 697 } 698 699 static CTX_PTR ReduceOrder(CPpmd8 *p, CPpmd_State *s1, CTX_PTR c) 700 { 701 CPpmd_State *s = NULL; 702 CTX_PTR c1 = c; 703 CPpmd_Void_Ref upBranch = REF(p->Text); 704 705 #ifdef PPMD8_FREEZE_SUPPORT 706 /* The BUG in Shkarin's code was fixed: ps could overflow in CUT_OFF mode. */ 707 CPpmd_State *ps[PPMD8_MAX_ORDER + 1]; 708 unsigned numPs = 0; 709 ps[numPs++] = p->FoundState; 710 #endif 711 712 SetSuccessor(p->FoundState, upBranch); 713 p->OrderFall++; 714 715 for (;;) 716 { 717 if (s1) 718 { 719 c = SUFFIX(c); 720 s = s1; 721 s1 = NULL; 722 } 723 else 724 { 725 if (!c->Suffix) 726 { 727 #ifdef PPMD8_FREEZE_SUPPORT 728 if (p->RestoreMethod > PPMD8_RESTORE_METHOD_FREEZE) 729 { 730 do { SetSuccessor(ps[--numPs], REF(c)); } while (numPs); 731 RESET_TEXT(1); 732 p->OrderFall = 1; 733 } 734 #endif 735 return c; 736 } 737 c = SUFFIX(c); 738 if (c->NumStats) 739 { 740 if ((s = STATS(c))->Symbol != p->FoundState->Symbol) 741 do { s++; } while (s->Symbol != p->FoundState->Symbol); 742 if (s->Freq < MAX_FREQ - 9) 743 { 744 s->Freq += 2; 745 c->SummFreq += 2; 746 } 747 } 748 else 749 { 750 s = ONE_STATE(c); 751 s->Freq = (Byte)(s->Freq + (s->Freq < 32)); 752 } 753 } 754 if (SUCCESSOR(s)) 755 break; 756 #ifdef PPMD8_FREEZE_SUPPORT 757 ps[numPs++] = s; 758 #endif 759 SetSuccessor(s, upBranch); 760 p->OrderFall++; 761 } 762 763 #ifdef PPMD8_FREEZE_SUPPORT 764 if (p->RestoreMethod > PPMD8_RESTORE_METHOD_FREEZE) 765 { 766 c = CTX(SUCCESSOR(s)); 767 do { SetSuccessor(ps[--numPs], REF(c)); } while (numPs); 768 RESET_TEXT(1); 769 p->OrderFall = 1; 770 return c; 771 } 772 else 773 #endif 774 if (SUCCESSOR(s) <= upBranch) 775 { 776 CTX_PTR successor; 777 CPpmd_State *s2 = p->FoundState; 778 p->FoundState = s; 779 780 successor = CreateSuccessors(p, False, NULL, c); 781 if (successor == NULL) 782 SetSuccessor(s, 0); 783 else 784 SetSuccessor(s, REF(successor)); 785 p->FoundState = s2; 786 } 787 788 if (p->OrderFall == 1 && c1 == p->MaxContext) 789 { 790 SetSuccessor(p->FoundState, SUCCESSOR(s)); 791 p->Text--; 792 } 793 if (SUCCESSOR(s) == 0) 794 return NULL; 795 return CTX(SUCCESSOR(s)); 796 } 797 798 static void UpdateModel(CPpmd8 *p) 799 { 800 CPpmd_Void_Ref successor, fSuccessor = SUCCESSOR(p->FoundState); 801 CTX_PTR c; 802 unsigned s0, ns, fFreq = p->FoundState->Freq; 803 Byte flag, fSymbol = p->FoundState->Symbol; 804 CPpmd_State *s = NULL; 805 806 if (p->FoundState->Freq < MAX_FREQ / 4 && p->MinContext->Suffix != 0) 807 { 808 c = SUFFIX(p->MinContext); 809 810 if (c->NumStats == 0) 811 { 812 s = ONE_STATE(c); 813 if (s->Freq < 32) 814 s->Freq++; 815 } 816 else 817 { 818 s = STATS(c); 819 if (s->Symbol != p->FoundState->Symbol) 820 { 821 do { s++; } while (s->Symbol != p->FoundState->Symbol); 822 if (s[0].Freq >= s[-1].Freq) 823 { 824 SwapStates(&s[0], &s[-1]); 825 s--; 826 } 827 } 828 if (s->Freq < MAX_FREQ - 9) 829 { 830 s->Freq += 2; 831 c->SummFreq += 2; 832 } 833 } 834 } 835 836 c = p->MaxContext; 837 if (p->OrderFall == 0 && fSuccessor) 838 { 839 CTX_PTR cs = CreateSuccessors(p, True, s, p->MinContext); 840 if (cs == 0) 841 { 842 SetSuccessor(p->FoundState, 0); 843 RESTORE_MODEL(c, CTX(fSuccessor)); 844 } 845 else 846 { 847 SetSuccessor(p->FoundState, REF(cs)); 848 p->MaxContext = cs; 849 } 850 return; 851 } 852 853 *p->Text++ = p->FoundState->Symbol; 854 successor = REF(p->Text); 855 if (p->Text >= p->UnitsStart) 856 { 857 RESTORE_MODEL(c, CTX(fSuccessor)); /* check it */ 858 return; 859 } 860 861 if (!fSuccessor) 862 { 863 CTX_PTR cs = ReduceOrder(p, s, p->MinContext); 864 if (cs == NULL) 865 { 866 RESTORE_MODEL(c, 0); 867 return; 868 } 869 fSuccessor = REF(cs); 870 } 871 else if ((Byte *)Ppmd8_GetPtr(p, fSuccessor) < p->UnitsStart) 872 { 873 CTX_PTR cs = CreateSuccessors(p, False, s, p->MinContext); 874 if (cs == NULL) 875 { 876 RESTORE_MODEL(c, 0); 877 return; 878 } 879 fSuccessor = REF(cs); 880 } 881 882 if (--p->OrderFall == 0) 883 { 884 successor = fSuccessor; 885 p->Text -= (p->MaxContext != p->MinContext); 886 } 887 #ifdef PPMD8_FREEZE_SUPPORT 888 else if (p->RestoreMethod > PPMD8_RESTORE_METHOD_FREEZE) 889 { 890 successor = fSuccessor; 891 RESET_TEXT(0); 892 p->OrderFall = 0; 893 } 894 #endif 895 896 s0 = p->MinContext->SummFreq - (ns = p->MinContext->NumStats) - fFreq; 897 flag = (Byte)(0x08 * (fSymbol >= 0x40)); 898 899 for (; c != p->MinContext; c = SUFFIX(c)) 900 { 901 unsigned ns1; 902 UInt32 cf, sf; 903 if ((ns1 = c->NumStats) != 0) 904 { 905 if ((ns1 & 1) != 0) 906 { 907 /* Expand for one UNIT */ 908 unsigned oldNU = (ns1 + 1) >> 1; 909 unsigned i = U2I(oldNU); 910 if (i != U2I(oldNU + 1)) 911 { 912 void *ptr = AllocUnits(p, i + 1); 913 void *oldPtr; 914 if (!ptr) 915 { 916 RESTORE_MODEL(c, CTX(fSuccessor)); 917 return; 918 } 919 oldPtr = STATS(c); 920 MyMem12Cpy(ptr, oldPtr, oldNU); 921 InsertNode(p, oldPtr, i); 922 c->Stats = STATS_REF(ptr); 923 } 924 } 925 c->SummFreq = (UInt16)(c->SummFreq + (3 * ns1 + 1 < ns)); 926 } 927 else 928 { 929 CPpmd_State *s2 = (CPpmd_State*)AllocUnits(p, 0); 930 if (!s2) 931 { 932 RESTORE_MODEL(c, CTX(fSuccessor)); 933 return; 934 } 935 *s2 = *ONE_STATE(c); 936 c->Stats = REF(s2); 937 if (s2->Freq < MAX_FREQ / 4 - 1) 938 s2->Freq <<= 1; 939 else 940 s2->Freq = MAX_FREQ - 4; 941 c->SummFreq = (UInt16)(s2->Freq + p->InitEsc + (ns > 2)); 942 } 943 cf = 2 * fFreq * (c->SummFreq + 6); 944 sf = (UInt32)s0 + c->SummFreq; 945 if (cf < 6 * sf) 946 { 947 cf = 1 + (cf > sf) + (cf >= 4 * sf); 948 c->SummFreq += 4; 949 } 950 else 951 { 952 cf = 4 + (cf > 9 * sf) + (cf > 12 * sf) + (cf > 15 * sf); 953 c->SummFreq = (UInt16)(c->SummFreq + cf); 954 } 955 { 956 CPpmd_State *s2 = STATS(c) + ns1 + 1; 957 SetSuccessor(s2, successor); 958 s2->Symbol = fSymbol; 959 s2->Freq = (Byte)cf; 960 c->Flags |= flag; 961 c->NumStats = (Byte)(ns1 + 1); 962 } 963 } 964 p->MaxContext = p->MinContext = CTX(fSuccessor); 965 } 966 967 static void Rescale(CPpmd8 *p) 968 { 969 unsigned i, adder, sumFreq, escFreq; 970 CPpmd_State *stats = STATS(p->MinContext); 971 CPpmd_State *s = p->FoundState; 972 { 973 CPpmd_State tmp = *s; 974 for (; s != stats; s--) 975 s[0] = s[-1]; 976 *s = tmp; 977 } 978 escFreq = p->MinContext->SummFreq - s->Freq; 979 s->Freq += 4; 980 adder = (p->OrderFall != 0 981 #ifdef PPMD8_FREEZE_SUPPORT 982 || p->RestoreMethod > PPMD8_RESTORE_METHOD_FREEZE 983 #endif 984 ); 985 s->Freq = (Byte)((s->Freq + adder) >> 1); 986 sumFreq = s->Freq; 987 988 i = p->MinContext->NumStats; 989 do 990 { 991 escFreq -= (++s)->Freq; 992 s->Freq = (Byte)((s->Freq + adder) >> 1); 993 sumFreq += s->Freq; 994 if (s[0].Freq > s[-1].Freq) 995 { 996 CPpmd_State *s1 = s; 997 CPpmd_State tmp = *s1; 998 do 999 s1[0] = s1[-1]; 1000 while (--s1 != stats && tmp.Freq > s1[-1].Freq); 1001 *s1 = tmp; 1002 } 1003 } 1004 while (--i); 1005 1006 if (s->Freq == 0) 1007 { 1008 unsigned numStats = p->MinContext->NumStats; 1009 unsigned n0, n1; 1010 do { i++; } while ((--s)->Freq == 0); 1011 escFreq += i; 1012 p->MinContext->NumStats = (Byte)(p->MinContext->NumStats - i); 1013 if (p->MinContext->NumStats == 0) 1014 { 1015 CPpmd_State tmp = *stats; 1016 tmp.Freq = (Byte)((2 * tmp.Freq + escFreq - 1) / escFreq); 1017 if (tmp.Freq > MAX_FREQ / 3) 1018 tmp.Freq = MAX_FREQ / 3; 1019 InsertNode(p, stats, U2I((numStats + 2) >> 1)); 1020 p->MinContext->Flags = (Byte)((p->MinContext->Flags & 0x10) + 0x08 * (tmp.Symbol >= 0x40)); 1021 *(p->FoundState = ONE_STATE(p->MinContext)) = tmp; 1022 return; 1023 } 1024 n0 = (numStats + 2) >> 1; 1025 n1 = (p->MinContext->NumStats + 2) >> 1; 1026 if (n0 != n1) 1027 p->MinContext->Stats = STATS_REF(ShrinkUnits(p, stats, n0, n1)); 1028 p->MinContext->Flags &= ~0x08; 1029 p->MinContext->Flags |= 0x08 * ((s = STATS(p->MinContext))->Symbol >= 0x40); 1030 i = p->MinContext->NumStats; 1031 do { p->MinContext->Flags |= 0x08*((++s)->Symbol >= 0x40); } while (--i); 1032 } 1033 p->MinContext->SummFreq = (UInt16)(sumFreq + escFreq - (escFreq >> 1)); 1034 p->MinContext->Flags |= 0x4; 1035 p->FoundState = STATS(p->MinContext); 1036 } 1037 1038 CPpmd_See *Ppmd8_MakeEscFreq(CPpmd8 *p, unsigned numMasked1, UInt32 *escFreq) 1039 { 1040 CPpmd_See *see; 1041 if (p->MinContext->NumStats != 0xFF) 1042 { 1043 see = p->See[(unsigned)p->NS2Indx[(unsigned)p->MinContext->NumStats + 2] - 3] + 1044 (p->MinContext->SummFreq > 11 * ((unsigned)p->MinContext->NumStats + 1)) + 1045 2 * (unsigned)(2 * (unsigned)p->MinContext->NumStats < 1046 ((unsigned)SUFFIX(p->MinContext)->NumStats + numMasked1)) + 1047 p->MinContext->Flags; 1048 { 1049 unsigned r = (see->Summ >> see->Shift); 1050 see->Summ = (UInt16)(see->Summ - r); 1051 *escFreq = r + (r == 0); 1052 } 1053 } 1054 else 1055 { 1056 see = &p->DummySee; 1057 *escFreq = 1; 1058 } 1059 return see; 1060 } 1061 1062 static void NextContext(CPpmd8 *p) 1063 { 1064 CTX_PTR c = CTX(SUCCESSOR(p->FoundState)); 1065 if (p->OrderFall == 0 && (Byte *)c >= p->UnitsStart) 1066 p->MinContext = p->MaxContext = c; 1067 else 1068 { 1069 UpdateModel(p); 1070 p->MinContext = p->MaxContext; 1071 } 1072 } 1073 1074 void Ppmd8_Update1(CPpmd8 *p) 1075 { 1076 CPpmd_State *s = p->FoundState; 1077 s->Freq += 4; 1078 p->MinContext->SummFreq += 4; 1079 if (s[0].Freq > s[-1].Freq) 1080 { 1081 SwapStates(&s[0], &s[-1]); 1082 p->FoundState = --s; 1083 if (s->Freq > MAX_FREQ) 1084 Rescale(p); 1085 } 1086 NextContext(p); 1087 } 1088 1089 void Ppmd8_Update1_0(CPpmd8 *p) 1090 { 1091 p->PrevSuccess = (2 * p->FoundState->Freq >= p->MinContext->SummFreq); 1092 p->RunLength += p->PrevSuccess; 1093 p->MinContext->SummFreq += 4; 1094 if ((p->FoundState->Freq += 4) > MAX_FREQ) 1095 Rescale(p); 1096 NextContext(p); 1097 } 1098 1099 void Ppmd8_UpdateBin(CPpmd8 *p) 1100 { 1101 p->FoundState->Freq = (Byte)(p->FoundState->Freq + (p->FoundState->Freq < 196)); 1102 p->PrevSuccess = 1; 1103 p->RunLength++; 1104 NextContext(p); 1105 } 1106 1107 void Ppmd8_Update2(CPpmd8 *p) 1108 { 1109 p->MinContext->SummFreq += 4; 1110 if ((p->FoundState->Freq += 4) > MAX_FREQ) 1111 Rescale(p); 1112 p->RunLength = p->InitRL; 1113 UpdateModel(p); 1114 p->MinContext = p->MaxContext; 1115 } 1116 1117 /* Ppmd8Dec.c -- PPMdI Decoder 1118 2010-04-16 : Igor Pavlov : Public domain 1119 This code is based on: 1120 PPMd var.I (2002): Dmitry Shkarin : Public domain 1121 Carryless rangecoder (1999): Dmitry Subbotin : Public domain */ 1122 1123 Bool Ppmd8_RangeDec_Init(CPpmd8 *p) 1124 { 1125 unsigned i; 1126 p->Low = 0; 1127 p->Range = 0xFFFFFFFF; 1128 p->Code = 0; 1129 for (i = 0; i < 4; i++) 1130 p->Code = (p->Code << 8) | p->Stream.In->Read(p->Stream.In); 1131 return (p->Code < 0xFFFFFFFF); 1132 } 1133 1134 static UInt32 RangeDec_GetThreshold(CPpmd8 *p, UInt32 total) 1135 { 1136 return p->Code / (p->Range /= total); 1137 } 1138 1139 static void RangeDec_Decode(CPpmd8 *p, UInt32 start, UInt32 size) 1140 { 1141 start *= p->Range; 1142 p->Low += start; 1143 p->Code -= start; 1144 p->Range *= size; 1145 1146 while ((p->Low ^ (p->Low + p->Range)) < kTop || 1147 (p->Range < kBot && ((p->Range = (0 - p->Low) & (kBot - 1)), 1))) 1148 { 1149 p->Code = (p->Code << 8) | p->Stream.In->Read(p->Stream.In); 1150 p->Range <<= 8; 1151 p->Low <<= 8; 1152 } 1153 } 1154 1155 #define MASK(sym) ((signed char *)charMask)[sym] 1156 1157 int Ppmd8_DecodeSymbol(CPpmd8 *p) 1158 { 1159 size_t charMask[256 / sizeof(size_t)]; 1160 if (p->MinContext->NumStats != 0) 1161 { 1162 CPpmd_State *s = Ppmd8_GetStats(p, p->MinContext); 1163 unsigned i; 1164 UInt32 count, hiCnt; 1165 if ((count = RangeDec_GetThreshold(p, p->MinContext->SummFreq)) < (hiCnt = s->Freq)) 1166 { 1167 Byte symbol; 1168 RangeDec_Decode(p, 0, s->Freq); 1169 p->FoundState = s; 1170 symbol = s->Symbol; 1171 Ppmd8_Update1_0(p); 1172 return symbol; 1173 } 1174 p->PrevSuccess = 0; 1175 i = p->MinContext->NumStats; 1176 do 1177 { 1178 if ((hiCnt += (++s)->Freq) > count) 1179 { 1180 Byte symbol; 1181 RangeDec_Decode(p, hiCnt - s->Freq, s->Freq); 1182 p->FoundState = s; 1183 symbol = s->Symbol; 1184 Ppmd8_Update1(p); 1185 return symbol; 1186 } 1187 } 1188 while (--i); 1189 if (count >= p->MinContext->SummFreq) 1190 return -2; 1191 RangeDec_Decode(p, hiCnt, p->MinContext->SummFreq - hiCnt); 1192 PPMD_SetAllBitsIn256Bytes(charMask); 1193 MASK(s->Symbol) = 0; 1194 i = p->MinContext->NumStats; 1195 do { MASK((--s)->Symbol) = 0; } while (--i); 1196 } 1197 else 1198 { 1199 UInt16 *prob = Ppmd8_GetBinSumm(p); 1200 if (((p->Code / (p->Range >>= 14)) < *prob)) 1201 { 1202 Byte symbol; 1203 RangeDec_Decode(p, 0, *prob); 1204 *prob = (UInt16)PPMD_UPDATE_PROB_0(*prob); 1205 symbol = (p->FoundState = Ppmd8Context_OneState(p->MinContext))->Symbol; 1206 Ppmd8_UpdateBin(p); 1207 return symbol; 1208 } 1209 RangeDec_Decode(p, *prob, (1 << 14) - *prob); 1210 *prob = (UInt16)PPMD_UPDATE_PROB_1(*prob); 1211 p->InitEsc = PPMD8_kExpEscape[*prob >> 10]; 1212 PPMD_SetAllBitsIn256Bytes(charMask); 1213 MASK(Ppmd8Context_OneState(p->MinContext)->Symbol) = 0; 1214 p->PrevSuccess = 0; 1215 } 1216 for (;;) 1217 { 1218 CPpmd_State *ps[256], *s; 1219 UInt32 freqSum, count, hiCnt; 1220 CPpmd_See *see; 1221 unsigned i, num, numMasked = p->MinContext->NumStats; 1222 do 1223 { 1224 p->OrderFall++; 1225 if (!p->MinContext->Suffix) 1226 return -1; 1227 p->MinContext = Ppmd8_GetContext(p, p->MinContext->Suffix); 1228 } 1229 while (p->MinContext->NumStats == numMasked); 1230 hiCnt = 0; 1231 s = Ppmd8_GetStats(p, p->MinContext); 1232 i = 0; 1233 num = p->MinContext->NumStats - numMasked; 1234 do 1235 { 1236 int k = (int)(MASK(s->Symbol)); 1237 hiCnt += (s->Freq & k); 1238 ps[i] = s++; 1239 i -= k; 1240 } 1241 while (i != num); 1242 1243 see = Ppmd8_MakeEscFreq(p, numMasked, &freqSum); 1244 freqSum += hiCnt; 1245 count = RangeDec_GetThreshold(p, freqSum); 1246 1247 if (count < hiCnt) 1248 { 1249 Byte symbol; 1250 CPpmd_State **pps = ps; 1251 for (hiCnt = 0; (hiCnt += (*pps)->Freq) <= count; pps++); 1252 s = *pps; 1253 RangeDec_Decode(p, hiCnt - s->Freq, s->Freq); 1254 Ppmd_See_Update(see); 1255 p->FoundState = s; 1256 symbol = s->Symbol; 1257 Ppmd8_Update2(p); 1258 return symbol; 1259 } 1260 if (count >= freqSum) 1261 return -2; 1262 RangeDec_Decode(p, hiCnt, freqSum - hiCnt); 1263 see->Summ = (UInt16)(see->Summ + freqSum); 1264 do { MASK(ps[--i]->Symbol) = 0; } while (i != 0); 1265 } 1266 } 1267 1268 /* H->I changes: 1269 NS2Indx 1270 GlewCount, and Glue method 1271 BinSum 1272 See / EscFreq 1273 CreateSuccessors updates more suffix contexts 1274 UpdateModel consts. 1275 PrevSuccess Update 1276 */ 1277 1278 const IPpmd8 __archive_ppmd8_functions = 1279 { 1280 &Ppmd8_Construct, 1281 &Ppmd8_Alloc, 1282 &Ppmd8_Free, 1283 &Ppmd8_Init, 1284 &Ppmd8_RangeDec_Init, 1285 &Ppmd8_DecodeSymbol, 1286 }; 1287