wok-tiny annotate plop/stuff/unlzma.S @ rev 169

memtest,plop: tune lzma compression
author Pascal Bellard <pascal.bellard@slitaz.org>
date Thu May 06 12:57:42 2021 +0000 (2021-05-06)
parents 7efc88318579
children 7a5d5860f3ea
rev   line source
pascal@152 1 // #define RC_NORMALIZE if (Range < kTopValue) { Range <<= 8; Code = (Code << 8) | RC_READ_BYTE; }
pascal@152 2 //
pascal@152 3 // #define IfBit0(p) RC_NORMALIZE; bound = (Range >> kNumBitModelTotalBits) * *(p); if (Code < bound)
pascal@152 4 // #define UpdateBit0(p) Range = bound; *(p) += (kBitModelTotal - *(p)) >> kNumMoveBits;
pascal@152 5 // #define UpdateBit1(p) Range -= bound; Code -= bound; *(p) -= (*(p)) >> kNumMoveBits;
pascal@152 6 //
pascal@152 7 //#define RC_GET_BIT2(p, mi, A0, A1) IfBit0(p) \
pascal@152 8 // { UpdateBit0(p); mi <<= 1; A0; } else \
pascal@152 9 // { UpdateBit1(p); mi = (mi + mi) + 1; A1; }
pascal@152 10 //
pascal@152 11 // #define RC_GET_BIT(p, mi) RC_GET_BIT2(p, mi, ; , ;)
pascal@152 12 //
pascal@152 13 // #define RangeDecoderBitTreeDecode(probs, numLevels, res) \
pascal@152 14 // { int i = numLevels; res = 1; \
pascal@152 15 // do { CProb *p = probs + res; RC_GET_BIT(p, res) } while(--i != 0); \
pascal@152 16 // res -= (1 << numLevels); }
pascal@152 17 /*
pascal@152 18 * Compression with : lzma e src dst -eos -pb0 -lp0 -lc0 (must match PROP_PB / PROP_LP / PROP_LC below)
pascal@152 19 */
pascal@152 20
pascal@169 21 //#define PROP_PB 2
pascal@169 22 #define PROP_PB 0
pascal@152 23 #define PROP_LP 0
pascal@169 24 //#define PROP_LC 3
pascal@169 25 #define PROP_LC 0
pascal@152 26 #define PROPS (PROP_LC+(PROP_LP*9)+(PROP_PB*45))
pascal@152 27
pascal@152 28 // static const Byte *Buffer;
pascal@152 29 // static UInt32 bound, Code, Range;
pascal@152 30
pascal@152 31 /*
pascal@152 32 * Buffer register DS:SI
pascal@152 33 * all var based ws=ss:bp
pascal@152 34 */
pascal@152 35
pascal@152 36 rep0 = -4 // long at BP-4; all locals are addressed relative to BP
pascal@152 37 rep1 = rep0-4 // long at BP-8
pascal@152 38 rep2 = rep0-8 // long at BP-12
pascal@152 39 rep3 = rep0-12 // long at BP-16
pascal@152 40 state = -17 // byte, 0..11 (top byte of the dword at BP-20)
pascal@152 41 posState = state-1 // byte, 0..15, at BP-18
pascal@152 42 posState2 = posState-1 // byte, 0..15, at BP-19
pascal@152 43 scratched = rep0-16 // byte = 1: low byte of the dword at BP-20, which the init pushes as 1
pascal@152 44 Code = -24 // long at BP-24
pascal@152 45 outStream = -28 // long at BP-28
pascal@152 46 nowPos = outStream // long: same slot as outStream (alias)
pascal@152 47 Range = Code-8 // long at BP-32
pascal@152 48 #define LOCALS 32
pascal@152 49
pascal@152 50 // int LzmaDecode(CLzmaDecoderState *vs,
pascal@152 51 // const unsigned char *inStream,
pascal@152 52 // unsigned char *outStream)
pascal@152 53 // {
pascal@152 54 // CProb *p = vs->Probs;
pascal@152 55 // SizeT nowPos = 0;
pascal@152 56 // #define posStateMask = (1 << (vs->Properties.pb)) - 1;
pascal@152 57 // #define literalPosMask = (1 << (vs->Properties.lp)) - 1;
pascal@152 58 // int lc = vs->Properties.lc, state = 0, len = 0;
pascal@152 59 // UInt32 rep0 = 1, rep1 = 1, rep2 = 1, rep3 = 1;
pascal@152 60 //
pascal@152 61 // {
pascal@152 62 // UInt32 i, numProbs = Literal /*1846*/
pascal@152 63 // + ((UInt32)LZMA_LIT_SIZE /*768*/ << (lc + vs->Properties.lp));
pascal@152 64 // for (i = 0; i < numProbs; i++) p[i] = kBitModelTotal /*2048*/ >> 1;
pascal@152 65
pascal@152 66 #define WS (1846+(768<<(PROP_LC+PROP_LP)))
pascal@152 67 #if (WS+WS+LOCALS) >= 65000
pascal@152 68 /* MAX WS = (1846+(768<<(8+4))) > 3MB! */
pascal@152 69 #error invalid (lc,lp,pb) : out of memory
pascal@152 70 #endif
pascal@152 71
pascal@152 72 ws1 = WS
pascal@152 73 ws2 = ws1*2
pascal@152 74 ws = ws2+LOCALS+15
pascal@152 75
pascal@152 76 #ifndef FLAT32
pascal@152 77 #define AX %ax
pascal@152 78 #define BX %bx
pascal@152 79 #define CX %cx
pascal@152 80 #define DX %dx
pascal@152 81 #define SI %si
pascal@152 82 #define DI %di
pascal@152 83 #define BP %bp
pascal@152 84 #define SP %sp
pascal@152 85 #define CWD cwd
pascal@152 86 #else
pascal@152 87 #define AX %eax
pascal@152 88 #define BX %ebx
pascal@152 89 #define CX %ecx
pascal@152 90 #define DX %edx
pascal@152 91 #define SI %esi
pascal@152 92 #define DI %edi
pascal@152 93 #define BP %ebp
pascal@152 94 #define SP %esp
pascal@152 95 #define CWD cdq
pascal@152 96 #endif
pascal@152 97 /*
pascal@152 98 * LzmaDecode:
pascal@152 99 #ifndef FLAT32
pascal@152 100 * input ds:si=inStream, es:di=outStream
pascal@152 101 * output outStream[], ds:si, es:di
pascal@152 102 .code 16
pascal@152 103 #else
pascal@152 104 * input esi=inStream, edi=outStream
pascal@152 105 * output outStream[], esi, edi
pascal@152 106 .code 32
pascal@152 107 #endif
pascal@152 108 */
pascal@152 109
pascal@152 110 mov $ws1, CX // CX = WS: number of 16-bit probability slots to push
pascal@152 111 #ifdef ONLY8086
pascal@152 112 movw $2048/2, %ax
pascal@152 113 lzd1:
pascal@152 114 pushw %ax
pascal@152 115 #else
pascal@152 116 lzd1:
pascal@152 117 pushw $2048/2 // p[i] = kBitModelTotal /*2048*/ >> 1
pascal@152 118 #endif
pascal@152 119 loop lzd1
pascal@152 120 mov SP, BP // BP = lowest address of the probability table; locals go below it
pascal@152 121 movb $((LOCALS+3)/4)*2, %cl // CX is 0 after the loop above, so this is the dword push count
pascal@152 122 #ifdef ONLY8086
pascal@152 123 movw $1, %ax
pascal@152 124 cwd
pascal@152 125 initlocals:
pascal@152 126 pushw %dx
pascal@152 127 pushw %ax
pascal@152 128 #else
pascal@152 129 initlocals:
pascal@152 130 pushl $1 // every local dword starts as 1 (rep0..rep3 = 1, state/posState bytes = 0)
pascal@152 131 #endif
pascal@152 132 loop initlocals
pascal@152 133
pascal@152 134 #if !defined(FLAT32) && !defined(FLAT16OUT)
pascal@152 135 movb $4, %cl
pascal@152 136 movw %es, %bx
pascal@152 137 shrw %cl, %bx // bh = es >> 12
pascal@152 138 movw %es, %dx
pascal@152 139 shlw %cl, %dx // dx = low 16 bits of es * 16
pascal@152 140 addw %dx, %di
pascal@152 141 movw %di, outStream(%bp) // low word of the linear output address es*16 + di
pascal@152 142 adcb %bh, outStream+2(%bp) // add bh plus the carry of the low-word add into the third byte
pascal@152 143 incw %cx // cl = 5: loop count for setrep below
pascal@152 144 #else
pascal@152 145 movb $5, %cl // 5: loop count for setrep below
pascal@152 146 mov DI, outStream(BP)
pascal@152 147 #endif
pascal@152 148
pascal@152 149 // Byte previousByte = 0;
pascal@152 150 xor BX, BX
pascal@152 151
pascal@152 152 // #define RC_INIT(buffer)
pascal@152 153 // Buffer = buffer; Code = 0; Range = 0xFFFFFFFF;
pascal@152 154 // { int i; for(i=0; i<5; i++) { Code = (Code<<8) | RC_READ_BYTE; }}
pascal@152 155 // }
pascal@152 156 // RC_INIT(inStream);
pascal@152 157
pascal@152 158 #ifndef NO_LZMA_HEADER
pascal@152 159 #ifdef CHECK_LZMA_HEADER
pascal@152 160 cmp.w $0x5A4C, (SI) // lzip header ('LZIP' version:1 dicobits:1)
pascal@152 161 je lzip_header
pascal@152 162 cmp.w $0x5D, (SI) // lzma header (0x5D dicosz:4 orgsz:8); word compare, so the next byte must be 0
pascal@152 163 jne no_header
pascal@152 164 add $13-6, SI // skip lzma header (the remaining 6 bytes are skipped below)
pascal@152 165 lzip_header:
pascal@152 166 add $6, SI // skip lzip header
pascal@152 167 no_header:
pascal@152 168 #else
pascal@152 169 add $13, SI // skip lzma header (0x5D dicosz:4 orgsz:8)
pascal@152 170 #endif
pascal@152 171 #endif
pascal@152 172 setrep:
pascal@152 173 call RC_LOAD_BYTE // Range <<= 8; Code = (Code << 8) | next input byte
pascal@152 174 decb Range(BP) // low byte 0x00 -> 0xFF; after the 5 passes Range = 0xFFFFFFFF
pascal@152 175 loop setrep
pascal@152 176
pascal@152 177 lzdmainlp:
pascal@152 178 // while(1) {
pascal@152 179 // CProb *prob;
pascal@152 180 // int posState = (int)((nowPos) & posStateMask);
pascal@152 181 //
pascal@152 182 // prob = p + IsMatch /*0*/ + (state << kNumPosBitsMax /*4*/) + posState;
pascal@152 183 // if (Bit0(prob)) { /* char */
pascal@152 184 // On entry bl = previousByte (left there by outchar).
pascal@152 185 xor DX, DX
pascal@152 186 call Bit1state // Bit1(dx + (state << kNumPosBitsMax /*4*/) + posState)
pascal@152 187 mov $state, DI // mov leaves the carry from Bit1 intact
pascal@152 188 jc lzdstring // bit 1: match / rep; bit 0: literal, and ax = 0 here
pascal@152 189
pascal@152 190 // prob = p + Literal /*1846*/ + (LZMA_LIT_SIZE /*768*/ *
pascal@152 191 // ((((nowPos) & literalPosMask) << lc) + (previousByte >> (8 - lc))));
pascal@152 192 // bl = previousByte >> (8 - lc). Only lc == 8 makes the shift a no-op; for lc == 0 it must run (shift by 8) so that bl = 0.
pascal@152 193 #if PROP_LC != 8
pascal@152 194 # ifdef ONLY8086
pascal@152 195 movb $8-PROP_LC, %cl
pascal@152 196 shrb %cl, %bl
pascal@152 197 # else
pascal@152 198 shrb $8-PROP_LC, %bl
pascal@152 199 # endif
pascal@152 200 #endif
pascal@152 201
pascal@152 202 #if PROP_LP != 0
pascal@152 203 movb posState2(BP), %dl
pascal@152 204 # ifdef ONLY8086
pascal@152 205 movb $PROP_LC, %cl
pascal@152 206 shl %cl, DX
pascal@152 207 # else
pascal@152 208 shl $PROP_LC, DX
pascal@152 209 # endif
pascal@152 210 movb $0, %bh
pascal@152 211 add BX, DX
pascal@152 212 #endif
pascal@152 213 // NOTE(review): with PROP_LP != 0 the context sum is left in DX but the mul below multiplies by BX - confirm before enabling lp.
pascal@152 214 movb $3, %ah // al = 0 from Bit1, so ax = 0x300 = LZMA_LIT_SIZE /*768*/
pascal@152 215 mul BX // ax = 768 * bx (low word); dx is clobbered and reloaded by CWD below
pascal@152 216 add $1846, AX
pascal@152 217
pascal@152 218 // int symbol = 1;
pascal@152 219
pascal@152 220 CWD
pascal@152 221 inc DX // symbol = 1
pascal@152 222 xchg AX, CX // save prob
pascal@152 223
pascal@152 224 // if (state >= kNumLitStates /*7*/) { /* previous was string */
pascal@152 225 // if (state < 4) state = 0;
pascal@152 226 // DI = $state here; the loop below subtracts 3 once or twice.
pascal@152 227 lzd6z:
pascal@152 228 subb $3, (BP, DI)
pascal@152 229
pascal@152 230 // if (state < 4) state = 0;
pascal@152 231
pascal@152 232 jnc lzd6
pascal@152 233 movb %dh, (BP, DI) // %dh = 0
pascal@152 234
pascal@152 235 lzd6:
pascal@152 236 // else if (state < 10) state -= 3;
pascal@152 237
pascal@152 238 cmpb $10-3, (BP, DI)
pascal@152 239
pascal@152 240 // else state -= 6;
pascal@152 241
pascal@152 242 jnb lzd6z // still >= 7 after one subtraction: original state was >= 10
pascal@152 243 cmpb $7-3-1, (BP, DI)
pascal@152 244 jbe lzd3 // new state <= 3: previous symbol was a literal, no match byte
pascal@152 245
pascal@152 246 // int matchByte = outStream[nowPos - rep0];
pascal@152 247
pascal@152 248 call DicoRep02ESDI // %bl = outStream[nowPos - rep0];
pascal@152 249
pascal@152 250 // do {
pascal@152 251 // int bit;
pascal@152 252 // CProb *probLit;
pascal@152 253 // matchByte <<= 1; bit = (matchByte & 0x100);
pascal@152 254
pascal@152 255 movb $1, %bh // bh = 1 selects the matched table (+0x100); bh = 0 the plain one
pascal@152 256 lzd4:
pascal@152 257 shlb $1, %bl // matchByte <<= 1
pascal@152 258 sbb DI, DI // save bit=C (DI = 0 or -1, carry unchanged)
pascal@152 259
pascal@152 260 // probLit = prob + 0x100 + bit + symbol;
pascal@152 261
pascal@152 262 mov CX, AX // restore prob
pascal@152 263 adcb %bh, %ah // + bit + 0x100
pascal@152 264
pascal@152 265 // RC_GET_BIT2(probLit, symbol, if (bit) break, if (!bit) break)
pascal@152 266
pascal@152 267 call Bit1axdx // C,%ax = Bit1(prob+%ax)
pascal@152 268 rclb $1, %dl // symbol <<= 1; symbol |= C
pascal@152 269 jc lzd5 // if symbol >= 0x100
pascal@152 270 cmp DI, AX // both are 0 or -1
pascal@152 271 jz lzd4 // if bit == Bit1(prob+%ax)
pascal@152 272
pascal@152 273 // } while (symbol < 0x100);
pascal@152 274 // }
pascal@152 275 lzd3:
pascal@152 276 // while (symbol < 0x100) {
pascal@152 277 // CProb *probLit = prob + symbol;
pascal@152 278 // RC_GET_BIT(probLit, symbol)
pascal@152 279 // }
pascal@152 280
pascal@152 281 xor BX, BX // bh = bl = 0: lzd4 now always sees bit = 0 and adds no 0x100
pascal@152 282 jmp lzd4
pascal@152 283 lzd5:
pascal@152 284
pascal@152 285 // outStream[nowPos++] = previousByte = (Byte)symbol;
pascal@152 286
pascal@152 287 xchg AX, DX // al = decoded byte (the leading 1 was shifted out of dl)
pascal@152 288 call outchar // %bl = outStream[nowPos++] = %al;
pascal@152 289 jmp lzdmainlp
pascal@152 290
pascal@152 291 // }
pascal@152 292
pascal@152 293 lzdstring:
pascal@152 294 mov $1, CX // cx = rep slot index, refined below (1, 2 or 3)
pascal@152 295
pascal@152 296 // else { /* string */
pascal@152 297 // prob = p + IsRep /*192*/ + state;
pascal@152 298
pascal@152 299 movb $192, %dl
pascal@152 300 addb (BP, DI), %dl // DI = $state on entry
pascal@152 301 mov $rep0, DI
pascal@152 302
pascal@152 303 // if (Bit0(prob)) {
pascal@152 304
pascal@152 305 call Bit1dx // Bit1(prob)
pascal@152 306 jc lzd8
pascal@152 307
pascal@152 308 // rep3 = rep2; rep2 = rep1; rep1 = rep0;
pascal@152 309 // state = (state < kNumLitStates /*7*/) ? 0 : 3;
pascal@152 310
pascal@152 311 stc // carry in for lzd11a: cl becomes 3, so all three older reps shift
pascal@152 312
pascal@152 313 // prob = p + LenCoder /*818*/;
pascal@152 314
pascal@152 315 mov $818, DX // dh != 0 also marks "new match" for the test after rotreplp
pascal@152 316
pascal@152 317 // }
pascal@152 318
pascal@152 319 jmp lzd11a
pascal@152 320
pascal@152 321 // else {
pascal@152 322 lzd8:
pascal@152 323 // prob += kNumStates /*12*/;
pascal@152 324 // if (Bit0(prob)) {
pascal@152 325 call Bit1dx12 // prob += 12; Bit1(prob)
pascal@152 326 jc lzd11
pascal@152 327 // prob = p + IsRep0Long /*240*/ + (state << kNumPosBitsMax /*4*/)
pascal@152 328 // + posState;
pascal@152 329 movb $240, %dl // dh=0
pascal@152 330
pascal@152 331 // if (Bit0(prob)) {
pascal@152 332
pascal@152 333 call Bit1state // Bit1(dx + (state << kNumPosBitsMax /*4*/) + posState)
pascal@152 334 jc lzd12
pascal@152 335
pascal@152 336 // // if (nowPos == 0) return LZMA_RESULT_DATA_ERROR;
pascal@152 337 // state = (state < kNumLitStates /*7*/) ? 9 : 11;
pascal@152 338
pascal@152 339 movb $9, %dl // lzd13string turns this into 9 or 11
pascal@152 340
pascal@152 341 // len++; goto string;
pascal@152 342 jmp lzd13string // ax = 0
pascal@152 343 // }
pascal@152 344 // }
pascal@152 345 // else {
pascal@152 346 lzd11:
pascal@152 347 // UInt32 distance = rep1;
pascal@152 348 // prob += kNumStates /*12*/;
pascal@152 349 // if (!Bit0(prob)) {
pascal@152 350
pascal@152 351 call Bit1dx12 // prob += 12; Bit1(prob)
pascal@152 352 jnc lzd11z // bit 0: cx stays 1 (distance = rep1)
pascal@152 353
pascal@152 354 // prob += kNumStates /*12*/;
pascal@152 355 // if (Bit0(prob)) distance = rep2;
pascal@152 356
pascal@152 357 call Bit1dx12 // prob += 12; Bit1(prob)
pascal@152 358 lzd11a:
pascal@152 359 adcb %cl, %cl // cl = 2*cl + C: 2 (rep2) or 3 (rep3, or new match)
pascal@152 360
pascal@152 361 // else { distance = rep3; rep3 = rep2; }
pascal@152 362 // rep2 = rep1;
pascal@152 363 // }
pascal@152 364 // rep1 = rep0; rep0 = distance;
pascal@152 365
pascal@152 366 lzd11z:
pascal@152 367 # ifdef ONLY8086
pascal@152 368 shl $1, CX
pascal@152 369 shl $1, CX // 8->32 bits
pascal@152 370 sub CX, DI // &rep[cx]
pascal@152 371 movw (BP, DI), %ax
pascal@152 372 pushw 2(BP, DI)
pascal@152 373 rotreplp:
pascal@152 374 movb 4(BP, DI), %bl
pascal@152 375 movb %bl, (BP, DI)
pascal@152 376 inc DI
pascal@152 377 loop rotreplp
pascal@152 378 popw %bx
pascal@152 379 testb %dh, %dh
pascal@152 380 jnz lzd10
pascal@152 381 movw %ax, (BP, DI)
pascal@152 382 movw %bx, 2(BP, DI)
pascal@152 383 # else
pascal@152 384 shl $2, CX // 8->32 bits
pascal@152 385 sub CX, DI // &rep[cx]
pascal@152 386 movl (BP, DI), %eax // eax = selected rep, saved before it is overwritten
pascal@152 387 rotreplp:
pascal@152 388 movb 4(BP, DI), %bl // byte-wise move of rep[cx-1..0] down into rep[cx..1]
pascal@152 389 movb %bl, (BP, DI)
pascal@152 390 inc DI
pascal@152 391 loop rotreplp // leaves cx = 0 and DI = $rep0 again
pascal@152 392 testb %dh, %dh // dh != 0 only when dx = 818 (new match)
pascal@152 393 jnz lzd10 // new match: rep0 is filled in by the distance decoder
pascal@152 394 movl %eax, (BP, DI) // rep match: rep0 = selected distance
pascal@152 395 # endif
pascal@152 396
pascal@152 397 // }
pascal@152 398 lzd12:
pascal@152 399 // state = (state < kNumLitStates /*7*/) ? 8 : 11;
pascal@152 400
pascal@152 401 movb $0x08, %cl // cx = 8 (ch is 0 on both paths into lzd12)
pascal@152 402
pascal@152 403 // prob = p + RepLenCoder /*1332*/;
pascal@152 404
pascal@152 405 mov $1332, DX
pascal@152 406
pascal@152 407 // }
pascal@152 408 lzd10:
pascal@152 409 push CX // state base: 0 for a new match, 8 for a rep match (popped into DX below)
pascal@152 410
pascal@152 411 // { /* get len */
pascal@152 412 // int numBits, offset;
pascal@152 413 // CProb *probLen = prob + LenChoice /*0*/;
pascal@152 414 // numBits = kLenNumLowBits /*3*/;
pascal@152 415
pascal@152 416 movb $8, %cl // numBits : 3,3,8
pascal@152 417
pascal@152 418 // if (Bit0(probLen)) {
pascal@152 419
pascal@152 420 call Bit1dx // Bit1(prob)
pascal@152 421 xchg AX, BX // bx = 0 or -1; flags unchanged
pascal@152 422 inc DX // prob + LenChoice2; inc leaves the carry alone
pascal@152 423 jnc lzd15 // bx=0
pascal@152 424
pascal@152 425 // probLen = prob + LenLow/*2*/ + (posState << kLenNumLowBits/*3*/);
pascal@152 426 // offset = 0;
pascal@152 427 // }
pascal@152 428 // else {
pascal@152 429 // probLen = prob + LenChoice2 /*1*/;
pascal@152 430
pascal@152 431 call Bit1dx // Bit1(prob)
pascal@152 432 add AX, BX // bx = -1 or -2; carry set only for -2
pascal@152 433
pascal@152 434 #if PROP_PB != 0
pascal@152 435 inc AX // ah=0
pascal@152 436 #endif
pascal@152 437 jc lzd16 // %ax=0, %bx=-2
pascal@152 438 lzd15:
pascal@152 439 #if PROP_PB != 0
pascal@152 440 movb $8, %al
pascal@152 441 mulb posState(BP)
pascal@152 442 #endif
pascal@152 443
pascal@152 444 // if (Bit0(probLen)) {
pascal@152 445 // probLen = prob + LenMid/*130*/ + (posState << kLenNumMidBits/*3*/);
pascal@152 446
pascal@152 447 movb $3, %cl // numBits : 3,3,8
pascal@152 448 lzd16:
pascal@152 449 #if PROP_PB != 0
pascal@152 450 add $2-128-1, AX // probLen : 2,130,258
pascal@152 451 #else
pascal@152 452 mov $2-128-1, AX // probLen : 2,130,258
pascal@152 453 #endif
pascal@152 454 add DX, AX // dx = prob + 1, hence the extra -1 above
pascal@152 455 mov $-8+1, DX // offset : 0,8,16 (kept one too high; see the single inc CX before the copy loop)
pascal@152 456 lzdargslp:
pascal@152 457 add $8, DX
pascal@152 458 add $128, AX
pascal@152 459 inc BX // bx = 0 / -1 / -2 on entry gives 1 / 2 / 3 passes
pascal@152 460 jle lzdargslp // leave with bx=1
pascal@152 461
pascal@152 462 // offset = kLenNumLowSymbols /*8*/;
pascal@152 463 // //numBits = kLenNumMidBits /*3*/;
pascal@152 464 // }
pascal@152 465 // else {
pascal@152 466 // probLen = prob + LenHigh /*258*/;
pascal@152 467 // offset = kLenNumLowSymbols /*8*/ + kLenNumMidSymbols /*8*/;
pascal@152 468 // numBits = kLenNumHighBits /*8*/;
pascal@152 469 // }
pascal@152 470 // }
pascal@152 471 // RangeDecoderBitTreeDecode(probLen, numBits, len); len += offset;
pascal@152 472
pascal@152 473 push DX
pascal@152 474 call RangeDecoder // %ax=probs, %cx=numLevels, %ax=res
pascal@152 475 pop DX
pascal@152 476 add DX, AX // offset
pascal@152 477 pop DX // state base pushed at lzd10: 0 or 8
pascal@152 478 lzd13string:
pascal@152 479 push AX // len, popped into CX at lzd19
pascal@152 480
pascal@152 481 // state = (state < kNumLitStates /*7*/) ? dl : dl|3;
pascal@152 482
pascal@152 483 movb $7, %cl
pascal@152 484 cmpb %cl, state(BP)
pascal@152 485 jb new_state
pascal@152 486 orb $3, %dl
pascal@152 487 new_state:
pascal@152 488 movb %dl, state(BP)
pascal@152 489
pascal@152 490 // } /* get len */
pascal@152 491 // if (state < 4) {
pascal@152 492
pascal@152 493 cmpb $4-1, %dl
pascal@152 494 ja lzd19 // rep match (dl >= 8): distance already in rep0; ZF = 0 here
pascal@152 495
pascal@152 496 // int posSlot;
pascal@152 497 // state += kNumLitStates /*7*/;
pascal@152 498
pascal@152 499 addb %cl, state(BP)
pascal@152 500
pascal@152 501 // prob = p + PosSlot /*432*/ + (((len < kNumLenToPosStates /*4*/) ?
pascal@152 502 // len : kNumLenToPosStates - 1) << kNumPosSlotBits /*6*/);
pascal@152 503
pascal@152 504 cmp $4+1, AX // ax is len + 1 here, hence the +1 / -64 adjustments
pascal@152 505 jb lzd21
pascal@152 506 mov $3+1, AX
pascal@152 507
pascal@152 508 lzd21:
pascal@152 509
pascal@152 510 dec CX // cx = 6
pascal@152 511 shl %cl, AX
pascal@152 512 add $432-64, AX
pascal@152 513
pascal@152 514 // RangeDecoderBitTreeDecode(prob, kNumPosSlotBits /*6*/, posSlot);
pascal@152 515
pascal@152 516 call RangeDecoder // %ax=probs, %cx=numLevels, %ax=res
pascal@152 517
pascal@152 518 // if (posSlot >= kStartPosModelIndex /*4*/) {
pascal@152 519 // int numDirectBits = ((posSlot >> 1) - 1);
pascal@152 520
pascal@152 521 #ifndef FLAT32
pascal@152 522 movw %cx, 2(%bp, %di) // %cx = 0
pascal@152 523 #endif
pascal@152 524 mov AX, (BP, DI) // rep0 = posSlot (DI = $rep0)
pascal@152 525 mov AX, CX
pascal@152 526 shrw $1, CX
pascal@152 527 dec CX // cx = numDirectBits
pascal@152 528 cmpb $4, %al
pascal@152 529 jb lzd22
pascal@152 530
pascal@152 531 // rep0 = (2 | ((UInt32)posSlot & 1));
pascal@152 532
pascal@152 533 andb %bl, (BP, DI) // %bx=1
pascal@152 534 orb $2, (BP, DI)
pascal@152 535
pascal@152 536 // if (posSlot < kEndPosModelIndex /*14*/) {
pascal@152 537
pascal@152 538 cmpb $14, %al
pascal@152 539 jnb lzd23
pascal@152 540
pascal@152 541 // rep0 <<= numDirectBits;
pascal@152 542
pascal@152 543 neg AX // ax = -posSlot, rep0 is added below
pascal@152 544 # ifdef ONLY8086
pascal@152 545 pushw %cx
pascal@152 546 movb $0, %ch
pascal@152 547 shllrep0:
pascal@152 548 shlw $1, (BP, DI)
pascal@152 549 rclw $1, 2(BP, DI)
pascal@152 550 loop shllrep0
pascal@152 551 popw %cx
pascal@152 552 # else
pascal@152 553 shll %cl, (BP, DI)
pascal@152 554 # endif
pascal@152 555 add (BP, DI), AX
pascal@152 556
pascal@152 557 // prob = p + SpecPos /*688*/ + rep0 - posSlot - 1;
pascal@152 558
pascal@152 559 add $687, AX
pascal@152 560 jmp lzd24
pascal@152 561
pascal@152 562 // }
pascal@152 563 // else {
pascal@152 564 lzd23:
pascal@152 565 // numDirectBits -= kNumAlignBits /*4*/;
pascal@152 566 // do {
pascal@152 567 // RC_NORMALIZE; Range >>= 1; rep0 <<= 1;
pascal@152 568 // if (Code >= Range) { Code -= Range; rep0 |= 1; }
pascal@152 569
pascal@152 570 lzd23z:
pascal@152 571 call RC_NORMALIZE
pascal@152 572 # ifdef ONLY8086
pascal@152 573 pushw %dx
pascal@152 574 shrw $1, Range+2(BP)
pascal@152 575 rcrw $1, Range(BP)
pascal@152 576 movw Range(BP), %ax
pascal@152 577 movw Range+2(BP), %dx
pascal@152 578 cmpw Code+2(BP), %dx
pascal@152 579 ja lzd25
pascal@152 580 jb lzd25x
pascal@152 581 cmpw Code(BP), %ax
pascal@152 582 ja lzd25
pascal@152 583 lzd25x:
pascal@152 584 subw %ax, Code(BP)
pascal@152 585 sbbw %dx, Code+2(BP)
pascal@152 586 stc
pascal@152 587 lzd25:
pascal@152 588 popw %dx
pascal@152 589 rclw $1, (BP, DI)
pascal@152 590 rclw $1, 2(BP, DI)
pascal@152 591 # else
pascal@152 592 shrl $1, Range(BP)
pascal@152 593 movl Range(BP), %eax
pascal@152 594 cmpl Code(BP), %eax
pascal@152 595 ja lzd25 // Range > Code: carry is clear, a 0 bit is shifted in
pascal@152 596 subl %eax, Code(BP)
pascal@152 597 stc
pascal@152 598 lzd25:
pascal@152 599 rcll $1, (BP, DI) // rep0 = (rep0 << 1) | C
pascal@152 600 # endif
pascal@152 601
pascal@152 602 // } while (--numDirectBits != 0);
pascal@152 603
pascal@152 604 cmpb $4+1, %cl
pascal@152 605 loopne lzd23z // stop once cl was 5, leaving cx = 4 (kNumAlignBits)
pascal@152 606
pascal@152 607 // prob = p + Align /* 802 */; numDirectBits = kNumAlignBits /*4*/;
pascal@152 608 // rep0 <<= numDirectBits;
pascal@152 609
pascal@152 610 # ifdef ONLY8086
pascal@152 611 pushw %cx
pascal@152 612 movb $0, %ch
pascal@152 613 shlrep0:
pascal@152 614 shlw $1, (BP, DI)
pascal@152 615 rclw $1, 2(BP, DI)
pascal@152 616 loop shlrep0
pascal@152 617 popw %cx
pascal@152 618 # else
pascal@152 619 shll %cl, (BP, DI)
pascal@152 620 # endif
pascal@152 621 mov $802, AX
pascal@152 622 // }
pascal@152 623
pascal@152 624 lzd24:
pascal@152 625 call RangeDecoder // %ax=probs, %cx=numLevels, %ax=res
pascal@152 626
pascal@152 627 // {
pascal@152 628 // int i = 1, mi = 1;
pascal@152 629 // do {
pascal@152 630 // CProb *prob3 = prob + mi;
pascal@152 631 // RC_GET_BIT2(prob3, mi, ; , rep0 |= i);
pascal@152 632
pascal@152 633 orb %dh, (BP, DI) // update rep0 with DirectBits
pascal@152 634
pascal@152 635 // i <<= 1;
pascal@152 636 // } while(--numDirectBits != 0);
pascal@152 637 // }
pascal@152 638 // } else rep0 = posSlot;
pascal@152 639 lzd22:
pascal@152 640 // if (++rep0 == (UInt32)(0)) break; /* EOF */
pascal@152 641
pascal@152 642 # ifdef ONLY8086
pascal@152 643 incw (BP, DI)
pascal@152 644 jnz lzd19
pascal@152 645 incw 2(BP, DI)
pascal@152 646 # else
pascal@152 647 incl (BP, DI) // ZF = 1 when rep0 wrapped to 0 (end marker)
pascal@152 648 # endif
pascal@152 649
pascal@152 650 lzd19:
pascal@152 651 pop CX // len; pop leaves the flags from the inc / cmpb above untouched
pascal@152 652 jz lzdone
pascal@152 653
pascal@152 654 // }
pascal@152 655 // len += kMatchMinLen;/*2*/
pascal@152 656
pascal@152 657 inc CX // second half of len += kMatchMinLen (the first +1 is folded into the length offset)
pascal@152 658
pascal@152 659 // string: // if (rep0 > nowPos) return LZMA_RESULT_DATA_ERROR;
pascal@152 660 // do {
pascal@152 661 lzd13z:
pascal@152 662 // previousByte = outStream[nowPos - rep0];
pascal@152 663 // outStream[nowPos++] = previousByte;
pascal@152 664
pascal@152 665 call outcharDico // %bl = outStream[nowPos++] = outStream[nowPos - rep0]
pascal@152 666
pascal@152 667 // } while(--len != 0);
pascal@152 668
pascal@152 669 loop lzd13z
pascal@152 670
pascal@152 671 // } /* char/string */
pascal@152 672 // }
pascal@152 673
pascal@152 674 jmp lzdmainlp
pascal@152 675
pascal@152 676 lzdone:
pascal@152 677 // //RC_NORMALIZE;
pascal@152 678 // //*inSizeProcessed = (SizeT)(Buffer - inStream); *outSizeProcessed = nowPos;
pascal@152 679 // return LZMA_RESULT_OK;
pascal@152 680 call Dico2ESDI // set es & di (rep0 = 0)
pascal@152 681 lea ws2(BP), SP // dealloc: SP = BP + 2*WS, just above the probability table
pascal@152 682 ret
pascal@152 683 // }
pascal@152 684
pascal@152 685 // al = outStream[nowPos - rep0];
pascal@152 686
pascal@152 687 /*
pascal@152 688 * output es:di, al
pascal@152 689 * scratch bh, cl, flags
pascal@152 690 */
pascal@152 691
pascal@152 692 DicoRep02ESDI:
pascal@152 693 stc // C = 1: address nowPos - rep0, then fall through
pascal@152 694
pascal@152 695 // bl = outStream[nowPos];
pascal@152 696
pascal@152 697 /*
pascal@152 698 * output es:di, bl
pascal@152 699 * scratch bh, cl, flags
pascal@152 700 */
pascal@152 701 // input: C = 0 -> address nowPos, C = 1 -> address nowPos - rep0
pascal@152 702 Dico2ESDI:
pascal@152 703 #if !defined(FLAT32) && !defined(FLAT16OUT)
pascal@152 704 # ifdef ONLY8086
pascal@152 705 pushw %ax
pascal@152 706 movw nowPos(%bp), %bx
pascal@152 707 movw nowPos+2(%bp), %ax
pascal@152 708 jnc Dico2ESDIz
pascal@152 709 subw rep0(%bp), %bx
pascal@152 710 sbbw rep0+2(%bp), %ax
pascal@152 711 Dico2ESDIz:
pascal@152 712 movw $0xF, %di
pascal@152 713 andw %bx, %di // di = low 4 bits of the linear address
pascal@152 714 pushw %cx
pascal@152 715 movb $4, %cl
pascal@152 716 shrw %cl, %bx
pascal@152 717 shlw %cl, %ax
pascal@152 718 popw %cx
pascal@152 719 addb %al, %bh // bx = linear address >> 4, used as the segment
pascal@152 720 popw %ax
pascal@152 721 # else
pascal@152 722 movl nowPos(%bp), %ebx
pascal@152 723 jnc Dico2ESDIz
pascal@152 724 subl rep0(%bp), %ebx
pascal@152 725 Dico2ESDIz:
pascal@152 726 movw %bx, %di // di = low 16 bits of the linear address
pascal@152 727 xorw %bx, %bx
pascal@152 728 shrl $4, %ebx // bx = (linear address >> 16) << 12, used as the segment
pascal@152 729 # endif
pascal@152 730 movw %bx, %es
pascal@152 731 #else
pascal@152 732 mov nowPos(BP), DI
pascal@152 733 jnc Dico2ESDIz
pascal@152 734 sub rep0(BP), DI
pascal@152 735 Dico2ESDIz:
pascal@152 736 #endif
pascal@152 737 #ifdef FLAT32
pascal@152 738 movb (DI), %bl
pascal@152 739 #else
pascal@152 740 movb %es:(%di), %bl
pascal@152 741 #endif
pascal@152 742 ret
pascal@152 743
pascal@152 744 outcharDico:
pascal@152 745
pascal@152 746 // bl = outStream[nowPos++] = outStream[nowPos - rep0]
pascal@152 747
pascal@152 748 /*
pascal@152 749 * output es:di, bl
pascal@152 750 * update nowPos
pascal@152 751 * scratch ax, dx, bh, cl, flags
pascal@152 752 */
pascal@152 753
pascal@152 754 call DicoRep02ESDI // %bl = outStream[nowPos - rep0]
pascal@152 755 xchg AX, BX // al = byte to copy, then fall through into outchar
pascal@152 756 outchar:
pascal@152 757
pascal@152 758 // bl = outStream[nowPos++] = previousByte = al;
pascal@152 759
pascal@152 760 /*
pascal@152 761 * output bl
pascal@152 762 * update nowPos
pascal@152 763 * scratch ax, dx, bh, di, cl, flags
pascal@152 764 */
pascal@152 765
pascal@152 766 clc // C = 0: Dico2ESDI addresses outStream[nowPos]
pascal@152 767 call Dico2ESDI
pascal@152 768 stosb
pascal@152 769 xchg AX, BX // previous byte
pascal@152 770
pascal@152 771 // int posState = (int)((nowPos) & posStateMask);
pascal@152 772
pascal@152 773 #if PROP_PB != 0 && PROP_LP != 0
pascal@152 774 addw $0x0101, posState2(BP) // bumps posState2 (low byte) and posState (high byte) together
pascal@152 775 andb $(((1 << PROP_PB) -1)<<8)+((1 << PROP_LP) -1), posState2(BP) // NOTE(review): byte-sized and with a 16-bit mask after a word add - confirm
pascal@152 776 #else
pascal@152 777 # if PROP_PB != 0
pascal@152 778 incb posState(BP)
pascal@152 779 andb $((1 << PROP_PB) -1), posState(BP)
pascal@152 780 # endif
pascal@152 781 # if PROP_LP != 0
pascal@152 782 incb posState2(BP)
pascal@152 783 andb $((1 << PROP_LP) -1), posState2(BP)
pascal@152 784 # endif
pascal@152 785 #endif
pascal@152 786 #ifdef ONLY8086
pascal@152 787 incw nowPos(BP)
pascal@152 788 jnz incnowPosDone
pascal@152 789 incw nowPos+2(BP)
pascal@152 790 incnowPosDone:
pascal@152 791 #else
pascal@152 792 incl nowPos(BP)
pascal@152 793 #endif
pascal@152 794 ret
pascal@152 795
pascal@152 796 //
pascal@152 797 // #define RC_NORMALIZE if (Range < kTopValue)
pascal@152 798 // { Range <<= 8; Code = (Code << 8) | RC_READ_BYTE; }
pascal@152 799
pascal@152 800 /*
pascal@152 801 * update Range, Code, ds:si
pascal@152 802 * scratch flags
pascal@152 803 */
pascal@152 804
pascal@152 805 RC_NORMALIZE:
pascal@152 806 cmpb $0, Range+3(BP) // top byte non-zero: Range >= 2^24, nothing to do
pascal@152 807 jne RC_NORMALIZE_1
pascal@152 808 RC_LOAD_BYTE: // also called directly by the setrep preload loop; AX is preserved
pascal@152 809 push AX
pascal@152 810 #ifdef ONLY8086
pascal@152 811 movw Range+1(BP), %ax
pascal@152 812 movw %ax, Range+2(BP)
pascal@152 813 movw Code+1(BP), %ax
pascal@152 814 movw %ax, Code+2(BP)
pascal@152 815 xorw %ax, %ax
pascal@152 816 movb Range(BP), %ah
pascal@152 817 movw %ax, Range(BP)
pascal@152 818 movb Code(BP), %ah
pascal@152 819 movw %ax, Code(BP)
pascal@152 820 #else
pascal@152 821 shll $8, Range(BP)
pascal@152 822 shll $8, Code(BP)
pascal@152 823 #endif
pascal@152 824 #if !defined(FLAT16) && !defined(FLAT32)
pascal@152 825 testw %si, %si
pascal@152 826 jns RC_READ_BYTE // si < 0x8000: no rebasing needed
pascal@152 827 movw %ds, %ax
pascal@152 828 incw %ax
pascal@152 829 movw %ax, %ds // ds += 1 paragraph (16 bytes) ...
pascal@152 830 addw $-16, %si // ... and si -= 16, so ds:si addresses the same byte
pascal@152 831 RC_READ_BYTE:
pascal@152 832 #endif
pascal@152 833 lodsb
pascal@152 834 movb %al, Code(BP) // new low byte of Code
pascal@152 835 pop AX
pascal@152 836 RC_NORMALIZE_1:
pascal@152 837 ret
pascal@152 838
pascal@152 839 // Bit1(dx + (state << kNumPosBitsMax /*4*/) + posState)
pascal@152 840
pascal@152 841 Bit1state:
pascal@152 842 movb $16, %al
pascal@152 843 mulb state(BP) // ax = state << 4
pascal@152 844 # if PROP_PB != 0
pascal@152 845 addb posState(BP), %al
pascal@152 846 # endif
pascal@152 847 Bit1axdx:
pascal@152 848 add DX, AX // p = ax + dx
pascal@152 849 jmp Bit1
pascal@152 850
pascal@152 851 // prob += 12; Bit1(prob)
pascal@152 852
pascal@152 853 Bit1dx12:
pascal@152 854 add $12, DX
pascal@152 855 Bit1dx:
pascal@152 856 mov DX, AX // p = dx
pascal@152 857
pascal@152 858 // static int Bit1(CProb *p)
pascal@152 859
pascal@152 860 Bit1:
pascal@152 861 /*
pascal@152 862 * input ax=p
pascal@152 863 * output C, ax
pascal@152 864 * update bound, Range, Code, ds:si
pascal@152 865 * scratch flags
pascal@152 866 */
pascal@152 867
pascal@152 868 // {
pascal@152 869 // RC_NORMALIZE;
pascal@152 870
pascal@152 871 call RC_NORMALIZE // preserves %ax, may advance %si
pascal@152 872
pascal@152 873 #ifdef ONLY8086
pascal@152 874 pushw %ax
pascal@152 875 pushw %cx
pascal@152 876 pushw %dx
pascal@152 877 pushw %di
pascal@152 878 #else
pascal@152 879 pushal
pascal@152 880 #endif
pascal@152 881
pascal@152 882 xchg AX, DI
pascal@152 883 add DI, DI // short *
pascal@152 884
pascal@152 885
pascal@152 886 // bound = (Range>>kNumBitModelTotalBits /*11*/) * *(p);
pascal@152 887
pascal@152 888 #ifdef ONLY8086
pascal@152 889 movw Range(BP), %dx
pascal@152 890 movw Range+2(BP), %ax
pascal@152 891 movw $11, %cx
pascal@152 892 shr11lp:
pascal@152 893 shrw $1, %ax
pascal@152 894 rcrw $1, %dx
pascal@152 895 loop shr11lp
pascal@152 896 movw %dx, %cx // ax:dx = Range >> 11 (ax high word, dx low word)
pascal@152 897 mulw (BP, DI) // high word * *p
pascal@152 898 xchgw %ax, %cx
pascal@152 899 mulw (BP, DI) // low word * *p
pascal@152 900 addw %cx, %dx // dx:ax = bound
pascal@152 901 #else
pascal@152 902 movl Range(BP), %eax
pascal@152 903 shrl $11, %eax
pascal@152 904 movzwl (BP, DI), %edx
pascal@152 905 mull %edx // eax = bound
pascal@152 906 #endif
pascal@152 907
pascal@152 908 // if (Code < bound) {
pascal@152 909
pascal@152 910 #ifdef ONLY8086
pascal@152 911 cmpw Code+2(BP), %dx
pascal@152 912 jb Bit1_1
pascal@152 913 ja Bit1_1x
pascal@152 914 cmpw Code(BP), %ax
pascal@152 915 jbe Bit1_1
pascal@152 916 Bit1_1x:
pascal@152 917
pascal@152 918 // Range = bound;
pascal@152 919
pascal@152 920 movw %ax, Range(BP)
pascal@152 921 movw %dx, Range+2(BP)
pascal@152 922 #else
pascal@152 923 cmpl Code(BP), %eax
pascal@152 924 jbe Bit1_1 // bound <= Code: decoded bit is 1
pascal@152 925
pascal@152 926 // Range = bound;
pascal@152 927
pascal@152 928 movl %eax, Range(BP)
pascal@152 929 #endif
pascal@152 930
pascal@152 931 // *(p) += (kBitModelTotal /*2048*/ - *(p)) >> kNumMoveBits /*5*/;
pascal@152 932
pascal@152 933 movw $2048, %ax
pascal@152 934
pascal@152 935 // return 0;
pascal@152 936
pascal@152 937 jmp Bit1_2 // carry is clear here (the branch above was not taken)
pascal@152 938
pascal@152 939 // }
pascal@152 940 // else {
pascal@152 941
pascal@152 942 Bit1_1:
pascal@152 943
pascal@152 944 // Range -= bound; Code -= bound;
pascal@152 945
pascal@152 946 #ifdef ONLY8086
pascal@152 947 subw %ax, Range(BP)
pascal@152 948 sbbw %dx, Range+2(BP)
pascal@152 949 subw %ax, Code(BP)
pascal@152 950 sbbw %dx, Code+2(BP)
pascal@152 951 #else
pascal@152 952 subl %eax, Range(BP)
pascal@152 953 subl %eax, Code(BP)
pascal@152 954 #endif
pascal@152 955
pascal@152 956 // *(p) -= (*(p)) >> kNumMoveBits /*5*/;
pascal@152 957
pascal@152 958 movw $31, %ax // (31 - *p) >> 5 (arithmetic) equals -(*p >> 5)
pascal@152 959
pascal@152 960 // return 1;
pascal@152 961
pascal@152 962 stc
pascal@152 963 Bit1_2:
pascal@152 964 pushf // keep the result bit (carry) across the update arithmetic
pascal@152 965 subw (BP, DI), %ax
pascal@152 966 #ifdef ONLY8086
pascal@152 967 movb $5, %cl
pascal@152 968 sarw %cl, %ax
pascal@152 969 #else
pascal@152 970 sarw $5, %ax
pascal@152 971 #endif
pascal@152 972 addw %ax, (BP, DI) // shared probability update for both outcomes
pascal@152 973 popf
pascal@152 974 #ifdef ONLY8086
pascal@152 975 popw %di
pascal@152 976 popw %dx
pascal@152 977 popw %cx
pascal@152 978 popw %ax
pascal@152 979 #else
pascal@152 980 popal
pascal@152 981 #endif
pascal@152 982 sbb AX, AX // ax = 0 or -1 according to the carry, which is left unchanged
pascal@152 983
pascal@152 984 // }
pascal@152 985 // }
pascal@152 986
pascal@152 987 ret
pascal@152 988
pascal@152 989 RangeDecoder:
pascal@152 990
pascal@152 991 /*
pascal@152 992 * input ax=probs cx=numLevels (< 8) bx=1
pascal@152 993 * output ax=res (backward), dh (forward)
pascal@152 994 * update bound, Range, Code, ds:si
pascal@152 995 * scratch flags, cx=0, dl
pascal@152 996 */
pascal@152 997
pascal@152 998 push BX
pascal@152 999
pascal@152 1000 // { int i = numLevels; res = 1;
pascal@152 1001 mov BX, DX // res = 1
pascal@152 1002
pascal@152 1003 // do { CProb *p = probs + res; RC_GET_BIT(p, res) } while(--i != 0);
pascal@152 1004
pascal@152 1005 RangeDecoder_1:
pascal@152 1006 push AX // keep probs: Bit1 returns the bit in ax
pascal@152 1007 call Bit1axdx // C,%ax = Bit1(prob+%ax)
pascal@152 1008 rclb $1, %dl // res <<= 1; res |= C
pascal@152 1009 andb %bl, %al // current bit
pascal@152 1010 orb %al, %bh // store in bh
pascal@152 1011 shlb $1, %bl // update max
pascal@152 1012 pop AX
pascal@152 1013 loop RangeDecoder_1
pascal@152 1014
pascal@152 1015 // res -= (1 << numLevels); }
pascal@152 1016
pascal@152 1017 xchg AX, BX // move bh to dh
pascal@152 1018 xchg AX, DX // and dl to al
pascal@152 1019 sub %dl, %al // sub max
pascal@152 1020 pop BX
pascal@152 1021 ret
pascal@152 1014
pascal@152 1015 // res -= (1 << numLevels); }
pascal@152 1016
pascal@152 1017 xchg AX, BX // move bh to dh
pascal@152 1018 xchg AX, DX // and dl to al
pascal@152 1019 sub %dl, %al // sub max
pascal@152 1020 pop BX
pascal@152 1021 ret