annotate src/bzip2-1.0.6/compress.c @ 83:ae30d91d2ffe

Replace these with versions built using an older toolset (so as to avoid ABI compatibilities when linking on Ubuntu 14.04 for packaging purposes)
author Chris Cannam
date Fri, 07 Feb 2020 11:51:13 +0000
parents e13257ea84a4
children
rev   line source
Chris@4 1
Chris@4 2 /*-------------------------------------------------------------*/
Chris@4 3 /*--- Compression machinery (not incl block sorting) ---*/
Chris@4 4 /*--- compress.c ---*/
Chris@4 5 /*-------------------------------------------------------------*/
Chris@4 6
Chris@4 7 /* ------------------------------------------------------------------
Chris@4 8 This file is part of bzip2/libbzip2, a program and library for
Chris@4 9 lossless, block-sorting data compression.
Chris@4 10
Chris@4 11 bzip2/libbzip2 version 1.0.6 of 6 September 2010
Chris@4 12 Copyright (C) 1996-2010 Julian Seward <jseward@bzip.org>
Chris@4 13
Chris@4 14 Please read the WARNING, DISCLAIMER and PATENTS sections in the
Chris@4 15 README file.
Chris@4 16
Chris@4 17 This program is released under the terms of the license contained
Chris@4 18 in the file LICENSE.
Chris@4 19 ------------------------------------------------------------------ */
Chris@4 20
Chris@4 21
Chris@4 22 /* CHANGES
Chris@4 23 0.9.0 -- original version.
Chris@4 24 0.9.0a/b -- no changes in this file.
Chris@4 25 0.9.0c -- changed setting of nGroups in sendMTFValues()
Chris@4 26 so as to do a bit better on small files
Chris@4 27 */
Chris@4 28
Chris@4 29 #include "bzlib_private.h"
Chris@4 30
Chris@4 31
Chris@4 32 /*---------------------------------------------------*/
Chris@4 33 /*--- Bit stream I/O ---*/
Chris@4 34 /*---------------------------------------------------*/
Chris@4 35
Chris@4 36 /*---------------------------------------------------*/
Chris@4 37 void BZ2_bsInitWrite ( EState* s )
Chris@4 38 {
Chris@4 39 s->bsLive = 0;
Chris@4 40 s->bsBuff = 0;
Chris@4 41 }
Chris@4 42
Chris@4 43
Chris@4 44 /*---------------------------------------------------*/
Chris@4 45 static
Chris@4 46 void bsFinishWrite ( EState* s )
Chris@4 47 {
Chris@4 48 while (s->bsLive > 0) {
Chris@4 49 s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
Chris@4 50 s->numZ++;
Chris@4 51 s->bsBuff <<= 8;
Chris@4 52 s->bsLive -= 8;
Chris@4 53 }
Chris@4 54 }
Chris@4 55
Chris@4 56
Chris@4 57 /*---------------------------------------------------*/
Chris@4 58 #define bsNEEDW(nz) \
Chris@4 59 { \
Chris@4 60 while (s->bsLive >= 8) { \
Chris@4 61 s->zbits[s->numZ] \
Chris@4 62 = (UChar)(s->bsBuff >> 24); \
Chris@4 63 s->numZ++; \
Chris@4 64 s->bsBuff <<= 8; \
Chris@4 65 s->bsLive -= 8; \
Chris@4 66 } \
Chris@4 67 }
Chris@4 68
Chris@4 69
Chris@4 70 /*---------------------------------------------------*/
Chris@4 71 static
Chris@4 72 __inline__
Chris@4 73 void bsW ( EState* s, Int32 n, UInt32 v )
Chris@4 74 {
Chris@4 75 bsNEEDW ( n );
Chris@4 76 s->bsBuff |= (v << (32 - s->bsLive - n));
Chris@4 77 s->bsLive += n;
Chris@4 78 }
Chris@4 79
Chris@4 80
Chris@4 81 /*---------------------------------------------------*/
Chris@4 82 static
Chris@4 83 void bsPutUInt32 ( EState* s, UInt32 u )
Chris@4 84 {
Chris@4 85 bsW ( s, 8, (u >> 24) & 0xffL );
Chris@4 86 bsW ( s, 8, (u >> 16) & 0xffL );
Chris@4 87 bsW ( s, 8, (u >> 8) & 0xffL );
Chris@4 88 bsW ( s, 8, u & 0xffL );
Chris@4 89 }
Chris@4 90
Chris@4 91
Chris@4 92 /*---------------------------------------------------*/
Chris@4 93 static
Chris@4 94 void bsPutUChar ( EState* s, UChar c )
Chris@4 95 {
Chris@4 96 bsW( s, 8, (UInt32)c );
Chris@4 97 }
Chris@4 98
Chris@4 99
Chris@4 100 /*---------------------------------------------------*/
Chris@4 101 /*--- The back end proper ---*/
Chris@4 102 /*---------------------------------------------------*/
Chris@4 103
Chris@4 104 /*---------------------------------------------------*/
Chris@4 105 static
Chris@4 106 void makeMaps_e ( EState* s )
Chris@4 107 {
Chris@4 108 Int32 i;
Chris@4 109 s->nInUse = 0;
Chris@4 110 for (i = 0; i < 256; i++)
Chris@4 111 if (s->inUse[i]) {
Chris@4 112 s->unseqToSeq[i] = s->nInUse;
Chris@4 113 s->nInUse++;
Chris@4 114 }
Chris@4 115 }
Chris@4 116
Chris@4 117
Chris@4 118 /*---------------------------------------------------*/
Chris@4 119 static
Chris@4 120 void generateMTFValues ( EState* s )
Chris@4 121 {
Chris@4 122 UChar yy[256];
Chris@4 123 Int32 i, j;
Chris@4 124 Int32 zPend;
Chris@4 125 Int32 wr;
Chris@4 126 Int32 EOB;
Chris@4 127
Chris@4 128 /*
Chris@4 129 After sorting (eg, here),
Chris@4 130 s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
Chris@4 131 and
Chris@4 132 ((UChar*)s->arr2) [ 0 .. s->nblock-1 ]
Chris@4 133 holds the original block data.
Chris@4 134
Chris@4 135 The first thing to do is generate the MTF values,
Chris@4 136 and put them in
Chris@4 137 ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
Chris@4 138 Because there are strictly fewer or equal MTF values
Chris@4 139 than block values, ptr values in this area are overwritten
Chris@4 140 with MTF values only when they are no longer needed.
Chris@4 141
Chris@4 142 The final compressed bitstream is generated into the
Chris@4 143 area starting at
Chris@4 144 (UChar*) (&((UChar*)s->arr2)[s->nblock])
Chris@4 145
Chris@4 146 These storage aliases are set up in bzCompressInit(),
Chris@4 147 except for the last one, which is arranged in
Chris@4 148 compressBlock().
Chris@4 149 */
Chris@4 150 UInt32* ptr = s->ptr;
Chris@4 151 UChar* block = s->block;
Chris@4 152 UInt16* mtfv = s->mtfv;
Chris@4 153
Chris@4 154 makeMaps_e ( s );
Chris@4 155 EOB = s->nInUse+1;
Chris@4 156
Chris@4 157 for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
Chris@4 158
Chris@4 159 wr = 0;
Chris@4 160 zPend = 0;
Chris@4 161 for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
Chris@4 162
Chris@4 163 for (i = 0; i < s->nblock; i++) {
Chris@4 164 UChar ll_i;
Chris@4 165 AssertD ( wr <= i, "generateMTFValues(1)" );
Chris@4 166 j = ptr[i]-1; if (j < 0) j += s->nblock;
Chris@4 167 ll_i = s->unseqToSeq[block[j]];
Chris@4 168 AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
Chris@4 169
Chris@4 170 if (yy[0] == ll_i) {
Chris@4 171 zPend++;
Chris@4 172 } else {
Chris@4 173
Chris@4 174 if (zPend > 0) {
Chris@4 175 zPend--;
Chris@4 176 while (True) {
Chris@4 177 if (zPend & 1) {
Chris@4 178 mtfv[wr] = BZ_RUNB; wr++;
Chris@4 179 s->mtfFreq[BZ_RUNB]++;
Chris@4 180 } else {
Chris@4 181 mtfv[wr] = BZ_RUNA; wr++;
Chris@4 182 s->mtfFreq[BZ_RUNA]++;
Chris@4 183 }
Chris@4 184 if (zPend < 2) break;
Chris@4 185 zPend = (zPend - 2) / 2;
Chris@4 186 };
Chris@4 187 zPend = 0;
Chris@4 188 }
Chris@4 189 {
Chris@4 190 register UChar rtmp;
Chris@4 191 register UChar* ryy_j;
Chris@4 192 register UChar rll_i;
Chris@4 193 rtmp = yy[1];
Chris@4 194 yy[1] = yy[0];
Chris@4 195 ryy_j = &(yy[1]);
Chris@4 196 rll_i = ll_i;
Chris@4 197 while ( rll_i != rtmp ) {
Chris@4 198 register UChar rtmp2;
Chris@4 199 ryy_j++;
Chris@4 200 rtmp2 = rtmp;
Chris@4 201 rtmp = *ryy_j;
Chris@4 202 *ryy_j = rtmp2;
Chris@4 203 };
Chris@4 204 yy[0] = rtmp;
Chris@4 205 j = ryy_j - &(yy[0]);
Chris@4 206 mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
Chris@4 207 }
Chris@4 208
Chris@4 209 }
Chris@4 210 }
Chris@4 211
Chris@4 212 if (zPend > 0) {
Chris@4 213 zPend--;
Chris@4 214 while (True) {
Chris@4 215 if (zPend & 1) {
Chris@4 216 mtfv[wr] = BZ_RUNB; wr++;
Chris@4 217 s->mtfFreq[BZ_RUNB]++;
Chris@4 218 } else {
Chris@4 219 mtfv[wr] = BZ_RUNA; wr++;
Chris@4 220 s->mtfFreq[BZ_RUNA]++;
Chris@4 221 }
Chris@4 222 if (zPend < 2) break;
Chris@4 223 zPend = (zPend - 2) / 2;
Chris@4 224 };
Chris@4 225 zPend = 0;
Chris@4 226 }
Chris@4 227
Chris@4 228 mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
Chris@4 229
Chris@4 230 s->nMTF = wr;
Chris@4 231 }
Chris@4 232
Chris@4 233
Chris@4 234 /*---------------------------------------------------*/
Chris@4 235 #define BZ_LESSER_ICOST 0
Chris@4 236 #define BZ_GREATER_ICOST 15
Chris@4 237
Chris@4 238 static
Chris@4 239 void sendMTFValues ( EState* s )
Chris@4 240 {
Chris@4 241 Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
Chris@4 242 Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
Chris@4 243 Int32 nGroups, nBytes;
Chris@4 244
Chris@4 245 /*--
Chris@4 246 UChar len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
Chris@4 247 is a global since the decoder also needs it.
Chris@4 248
Chris@4 249 Int32 code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
Chris@4 250 Int32 rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
Chris@4 251 are also globals only used in this proc.
Chris@4 252 Made global to keep stack frame size small.
Chris@4 253 --*/
Chris@4 254
Chris@4 255
Chris@4 256 UInt16 cost[BZ_N_GROUPS];
Chris@4 257 Int32 fave[BZ_N_GROUPS];
Chris@4 258
Chris@4 259 UInt16* mtfv = s->mtfv;
Chris@4 260
Chris@4 261 if (s->verbosity >= 3)
Chris@4 262 VPrintf3( " %d in block, %d after MTF & 1-2 coding, "
Chris@4 263 "%d+2 syms in use\n",
Chris@4 264 s->nblock, s->nMTF, s->nInUse );
Chris@4 265
Chris@4 266 alphaSize = s->nInUse+2;
Chris@4 267 for (t = 0; t < BZ_N_GROUPS; t++)
Chris@4 268 for (v = 0; v < alphaSize; v++)
Chris@4 269 s->len[t][v] = BZ_GREATER_ICOST;
Chris@4 270
Chris@4 271 /*--- Decide how many coding tables to use ---*/
Chris@4 272 AssertH ( s->nMTF > 0, 3001 );
Chris@4 273 if (s->nMTF < 200) nGroups = 2; else
Chris@4 274 if (s->nMTF < 600) nGroups = 3; else
Chris@4 275 if (s->nMTF < 1200) nGroups = 4; else
Chris@4 276 if (s->nMTF < 2400) nGroups = 5; else
Chris@4 277 nGroups = 6;
Chris@4 278
Chris@4 279 /*--- Generate an initial set of coding tables ---*/
Chris@4 280 {
Chris@4 281 Int32 nPart, remF, tFreq, aFreq;
Chris@4 282
Chris@4 283 nPart = nGroups;
Chris@4 284 remF = s->nMTF;
Chris@4 285 gs = 0;
Chris@4 286 while (nPart > 0) {
Chris@4 287 tFreq = remF / nPart;
Chris@4 288 ge = gs-1;
Chris@4 289 aFreq = 0;
Chris@4 290 while (aFreq < tFreq && ge < alphaSize-1) {
Chris@4 291 ge++;
Chris@4 292 aFreq += s->mtfFreq[ge];
Chris@4 293 }
Chris@4 294
Chris@4 295 if (ge > gs
Chris@4 296 && nPart != nGroups && nPart != 1
Chris@4 297 && ((nGroups-nPart) % 2 == 1)) {
Chris@4 298 aFreq -= s->mtfFreq[ge];
Chris@4 299 ge--;
Chris@4 300 }
Chris@4 301
Chris@4 302 if (s->verbosity >= 3)
Chris@4 303 VPrintf5( " initial group %d, [%d .. %d], "
Chris@4 304 "has %d syms (%4.1f%%)\n",
Chris@4 305 nPart, gs, ge, aFreq,
Chris@4 306 (100.0 * (float)aFreq) / (float)(s->nMTF) );
Chris@4 307
Chris@4 308 for (v = 0; v < alphaSize; v++)
Chris@4 309 if (v >= gs && v <= ge)
Chris@4 310 s->len[nPart-1][v] = BZ_LESSER_ICOST; else
Chris@4 311 s->len[nPart-1][v] = BZ_GREATER_ICOST;
Chris@4 312
Chris@4 313 nPart--;
Chris@4 314 gs = ge+1;
Chris@4 315 remF -= aFreq;
Chris@4 316 }
Chris@4 317 }
Chris@4 318
Chris@4 319 /*---
Chris@4 320 Iterate up to BZ_N_ITERS times to improve the tables.
Chris@4 321 ---*/
Chris@4 322 for (iter = 0; iter < BZ_N_ITERS; iter++) {
Chris@4 323
Chris@4 324 for (t = 0; t < nGroups; t++) fave[t] = 0;
Chris@4 325
Chris@4 326 for (t = 0; t < nGroups; t++)
Chris@4 327 for (v = 0; v < alphaSize; v++)
Chris@4 328 s->rfreq[t][v] = 0;
Chris@4 329
Chris@4 330 /*---
Chris@4 331 Set up an auxiliary length table which is used to fast-track
Chris@4 332 the common case (nGroups == 6).
Chris@4 333 ---*/
Chris@4 334 if (nGroups == 6) {
Chris@4 335 for (v = 0; v < alphaSize; v++) {
Chris@4 336 s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
Chris@4 337 s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
Chris@4 338 s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
Chris@4 339 }
Chris@4 340 }
Chris@4 341
Chris@4 342 nSelectors = 0;
Chris@4 343 totc = 0;
Chris@4 344 gs = 0;
Chris@4 345 while (True) {
Chris@4 346
Chris@4 347 /*--- Set group start & end marks. --*/
Chris@4 348 if (gs >= s->nMTF) break;
Chris@4 349 ge = gs + BZ_G_SIZE - 1;
Chris@4 350 if (ge >= s->nMTF) ge = s->nMTF-1;
Chris@4 351
Chris@4 352 /*--
Chris@4 353 Calculate the cost of this group as coded
Chris@4 354 by each of the coding tables.
Chris@4 355 --*/
Chris@4 356 for (t = 0; t < nGroups; t++) cost[t] = 0;
Chris@4 357
Chris@4 358 if (nGroups == 6 && 50 == ge-gs+1) {
Chris@4 359 /*--- fast track the common case ---*/
Chris@4 360 register UInt32 cost01, cost23, cost45;
Chris@4 361 register UInt16 icv;
Chris@4 362 cost01 = cost23 = cost45 = 0;
Chris@4 363
Chris@4 364 # define BZ_ITER(nn) \
Chris@4 365 icv = mtfv[gs+(nn)]; \
Chris@4 366 cost01 += s->len_pack[icv][0]; \
Chris@4 367 cost23 += s->len_pack[icv][1]; \
Chris@4 368 cost45 += s->len_pack[icv][2]; \
Chris@4 369
Chris@4 370 BZ_ITER(0); BZ_ITER(1); BZ_ITER(2); BZ_ITER(3); BZ_ITER(4);
Chris@4 371 BZ_ITER(5); BZ_ITER(6); BZ_ITER(7); BZ_ITER(8); BZ_ITER(9);
Chris@4 372 BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
Chris@4 373 BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
Chris@4 374 BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
Chris@4 375 BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
Chris@4 376 BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
Chris@4 377 BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
Chris@4 378 BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
Chris@4 379 BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
Chris@4 380
Chris@4 381 # undef BZ_ITER
Chris@4 382
Chris@4 383 cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
Chris@4 384 cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
Chris@4 385 cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
Chris@4 386
Chris@4 387 } else {
Chris@4 388 /*--- slow version which correctly handles all situations ---*/
Chris@4 389 for (i = gs; i <= ge; i++) {
Chris@4 390 UInt16 icv = mtfv[i];
Chris@4 391 for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
Chris@4 392 }
Chris@4 393 }
Chris@4 394
Chris@4 395 /*--
Chris@4 396 Find the coding table which is best for this group,
Chris@4 397 and record its identity in the selector table.
Chris@4 398 --*/
Chris@4 399 bc = 999999999; bt = -1;
Chris@4 400 for (t = 0; t < nGroups; t++)
Chris@4 401 if (cost[t] < bc) { bc = cost[t]; bt = t; };
Chris@4 402 totc += bc;
Chris@4 403 fave[bt]++;
Chris@4 404 s->selector[nSelectors] = bt;
Chris@4 405 nSelectors++;
Chris@4 406
Chris@4 407 /*--
Chris@4 408 Increment the symbol frequencies for the selected table.
Chris@4 409 --*/
Chris@4 410 if (nGroups == 6 && 50 == ge-gs+1) {
Chris@4 411 /*--- fast track the common case ---*/
Chris@4 412
Chris@4 413 # define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
Chris@4 414
Chris@4 415 BZ_ITUR(0); BZ_ITUR(1); BZ_ITUR(2); BZ_ITUR(3); BZ_ITUR(4);
Chris@4 416 BZ_ITUR(5); BZ_ITUR(6); BZ_ITUR(7); BZ_ITUR(8); BZ_ITUR(9);
Chris@4 417 BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
Chris@4 418 BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
Chris@4 419 BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
Chris@4 420 BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
Chris@4 421 BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
Chris@4 422 BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
Chris@4 423 BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
Chris@4 424 BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
Chris@4 425
Chris@4 426 # undef BZ_ITUR
Chris@4 427
Chris@4 428 } else {
Chris@4 429 /*--- slow version which correctly handles all situations ---*/
Chris@4 430 for (i = gs; i <= ge; i++)
Chris@4 431 s->rfreq[bt][ mtfv[i] ]++;
Chris@4 432 }
Chris@4 433
Chris@4 434 gs = ge+1;
Chris@4 435 }
Chris@4 436 if (s->verbosity >= 3) {
Chris@4 437 VPrintf2 ( " pass %d: size is %d, grp uses are ",
Chris@4 438 iter+1, totc/8 );
Chris@4 439 for (t = 0; t < nGroups; t++)
Chris@4 440 VPrintf1 ( "%d ", fave[t] );
Chris@4 441 VPrintf0 ( "\n" );
Chris@4 442 }
Chris@4 443
Chris@4 444 /*--
Chris@4 445 Recompute the tables based on the accumulated frequencies.
Chris@4 446 --*/
Chris@4 447 /* maxLen was changed from 20 to 17 in bzip2-1.0.3. See
Chris@4 448 comment in huffman.c for details. */
Chris@4 449 for (t = 0; t < nGroups; t++)
Chris@4 450 BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]),
Chris@4 451 alphaSize, 17 /*20*/ );
Chris@4 452 }
Chris@4 453
Chris@4 454
Chris@4 455 AssertH( nGroups < 8, 3002 );
Chris@4 456 AssertH( nSelectors < 32768 &&
Chris@4 457 nSelectors <= (2 + (900000 / BZ_G_SIZE)),
Chris@4 458 3003 );
Chris@4 459
Chris@4 460
Chris@4 461 /*--- Compute MTF values for the selectors. ---*/
Chris@4 462 {
Chris@4 463 UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
Chris@4 464 for (i = 0; i < nGroups; i++) pos[i] = i;
Chris@4 465 for (i = 0; i < nSelectors; i++) {
Chris@4 466 ll_i = s->selector[i];
Chris@4 467 j = 0;
Chris@4 468 tmp = pos[j];
Chris@4 469 while ( ll_i != tmp ) {
Chris@4 470 j++;
Chris@4 471 tmp2 = tmp;
Chris@4 472 tmp = pos[j];
Chris@4 473 pos[j] = tmp2;
Chris@4 474 };
Chris@4 475 pos[0] = tmp;
Chris@4 476 s->selectorMtf[i] = j;
Chris@4 477 }
Chris@4 478 };
Chris@4 479
Chris@4 480 /*--- Assign actual codes for the tables. --*/
Chris@4 481 for (t = 0; t < nGroups; t++) {
Chris@4 482 minLen = 32;
Chris@4 483 maxLen = 0;
Chris@4 484 for (i = 0; i < alphaSize; i++) {
Chris@4 485 if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
Chris@4 486 if (s->len[t][i] < minLen) minLen = s->len[t][i];
Chris@4 487 }
Chris@4 488 AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
Chris@4 489 AssertH ( !(minLen < 1), 3005 );
Chris@4 490 BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]),
Chris@4 491 minLen, maxLen, alphaSize );
Chris@4 492 }
Chris@4 493
Chris@4 494 /*--- Transmit the mapping table. ---*/
Chris@4 495 {
Chris@4 496 Bool inUse16[16];
Chris@4 497 for (i = 0; i < 16; i++) {
Chris@4 498 inUse16[i] = False;
Chris@4 499 for (j = 0; j < 16; j++)
Chris@4 500 if (s->inUse[i * 16 + j]) inUse16[i] = True;
Chris@4 501 }
Chris@4 502
Chris@4 503 nBytes = s->numZ;
Chris@4 504 for (i = 0; i < 16; i++)
Chris@4 505 if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
Chris@4 506
Chris@4 507 for (i = 0; i < 16; i++)
Chris@4 508 if (inUse16[i])
Chris@4 509 for (j = 0; j < 16; j++) {
Chris@4 510 if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
Chris@4 511 }
Chris@4 512
Chris@4 513 if (s->verbosity >= 3)
Chris@4 514 VPrintf1( " bytes: mapping %d, ", s->numZ-nBytes );
Chris@4 515 }
Chris@4 516
Chris@4 517 /*--- Now the selectors. ---*/
Chris@4 518 nBytes = s->numZ;
Chris@4 519 bsW ( s, 3, nGroups );
Chris@4 520 bsW ( s, 15, nSelectors );
Chris@4 521 for (i = 0; i < nSelectors; i++) {
Chris@4 522 for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
Chris@4 523 bsW(s,1,0);
Chris@4 524 }
Chris@4 525 if (s->verbosity >= 3)
Chris@4 526 VPrintf1( "selectors %d, ", s->numZ-nBytes );
Chris@4 527
Chris@4 528 /*--- Now the coding tables. ---*/
Chris@4 529 nBytes = s->numZ;
Chris@4 530
Chris@4 531 for (t = 0; t < nGroups; t++) {
Chris@4 532 Int32 curr = s->len[t][0];
Chris@4 533 bsW ( s, 5, curr );
Chris@4 534 for (i = 0; i < alphaSize; i++) {
Chris@4 535 while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
Chris@4 536 while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
Chris@4 537 bsW ( s, 1, 0 );
Chris@4 538 }
Chris@4 539 }
Chris@4 540
Chris@4 541 if (s->verbosity >= 3)
Chris@4 542 VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
Chris@4 543
Chris@4 544 /*--- And finally, the block data proper ---*/
Chris@4 545 nBytes = s->numZ;
Chris@4 546 selCtr = 0;
Chris@4 547 gs = 0;
Chris@4 548 while (True) {
Chris@4 549 if (gs >= s->nMTF) break;
Chris@4 550 ge = gs + BZ_G_SIZE - 1;
Chris@4 551 if (ge >= s->nMTF) ge = s->nMTF-1;
Chris@4 552 AssertH ( s->selector[selCtr] < nGroups, 3006 );
Chris@4 553
Chris@4 554 if (nGroups == 6 && 50 == ge-gs+1) {
Chris@4 555 /*--- fast track the common case ---*/
Chris@4 556 UInt16 mtfv_i;
Chris@4 557 UChar* s_len_sel_selCtr
Chris@4 558 = &(s->len[s->selector[selCtr]][0]);
Chris@4 559 Int32* s_code_sel_selCtr
Chris@4 560 = &(s->code[s->selector[selCtr]][0]);
Chris@4 561
Chris@4 562 # define BZ_ITAH(nn) \
Chris@4 563 mtfv_i = mtfv[gs+(nn)]; \
Chris@4 564 bsW ( s, \
Chris@4 565 s_len_sel_selCtr[mtfv_i], \
Chris@4 566 s_code_sel_selCtr[mtfv_i] )
Chris@4 567
Chris@4 568 BZ_ITAH(0); BZ_ITAH(1); BZ_ITAH(2); BZ_ITAH(3); BZ_ITAH(4);
Chris@4 569 BZ_ITAH(5); BZ_ITAH(6); BZ_ITAH(7); BZ_ITAH(8); BZ_ITAH(9);
Chris@4 570 BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
Chris@4 571 BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
Chris@4 572 BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
Chris@4 573 BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
Chris@4 574 BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
Chris@4 575 BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
Chris@4 576 BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
Chris@4 577 BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
Chris@4 578
Chris@4 579 # undef BZ_ITAH
Chris@4 580
Chris@4 581 } else {
Chris@4 582 /*--- slow version which correctly handles all situations ---*/
Chris@4 583 for (i = gs; i <= ge; i++) {
Chris@4 584 bsW ( s,
Chris@4 585 s->len [s->selector[selCtr]] [mtfv[i]],
Chris@4 586 s->code [s->selector[selCtr]] [mtfv[i]] );
Chris@4 587 }
Chris@4 588 }
Chris@4 589
Chris@4 590
Chris@4 591 gs = ge+1;
Chris@4 592 selCtr++;
Chris@4 593 }
Chris@4 594 AssertH( selCtr == nSelectors, 3007 );
Chris@4 595
Chris@4 596 if (s->verbosity >= 3)
Chris@4 597 VPrintf1( "codes %d\n", s->numZ-nBytes );
Chris@4 598 }
Chris@4 599
Chris@4 600
Chris@4 601 /*---------------------------------------------------*/
Chris@4 602 void BZ2_compressBlock ( EState* s, Bool is_last_block )
Chris@4 603 {
Chris@4 604 if (s->nblock > 0) {
Chris@4 605
Chris@4 606 BZ_FINALISE_CRC ( s->blockCRC );
Chris@4 607 s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
Chris@4 608 s->combinedCRC ^= s->blockCRC;
Chris@4 609 if (s->blockNo > 1) s->numZ = 0;
Chris@4 610
Chris@4 611 if (s->verbosity >= 2)
Chris@4 612 VPrintf4( " block %d: crc = 0x%08x, "
Chris@4 613 "combined CRC = 0x%08x, size = %d\n",
Chris@4 614 s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
Chris@4 615
Chris@4 616 BZ2_blockSort ( s );
Chris@4 617 }
Chris@4 618
Chris@4 619 s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]);
Chris@4 620
Chris@4 621 /*-- If this is the first block, create the stream header. --*/
Chris@4 622 if (s->blockNo == 1) {
Chris@4 623 BZ2_bsInitWrite ( s );
Chris@4 624 bsPutUChar ( s, BZ_HDR_B );
Chris@4 625 bsPutUChar ( s, BZ_HDR_Z );
Chris@4 626 bsPutUChar ( s, BZ_HDR_h );
Chris@4 627 bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
Chris@4 628 }
Chris@4 629
Chris@4 630 if (s->nblock > 0) {
Chris@4 631
Chris@4 632 bsPutUChar ( s, 0x31 ); bsPutUChar ( s, 0x41 );
Chris@4 633 bsPutUChar ( s, 0x59 ); bsPutUChar ( s, 0x26 );
Chris@4 634 bsPutUChar ( s, 0x53 ); bsPutUChar ( s, 0x59 );
Chris@4 635
Chris@4 636 /*-- Now the block's CRC, so it is in a known place. --*/
Chris@4 637 bsPutUInt32 ( s, s->blockCRC );
Chris@4 638
Chris@4 639 /*--
Chris@4 640 Now a single bit indicating (non-)randomisation.
Chris@4 641 As of version 0.9.5, we use a better sorting algorithm
Chris@4 642 which makes randomisation unnecessary. So always set
Chris@4 643 the randomised bit to 'no'. Of course, the decoder
Chris@4 644 still needs to be able to handle randomised blocks
Chris@4 645 so as to maintain backwards compatibility with
Chris@4 646 older versions of bzip2.
Chris@4 647 --*/
Chris@4 648 bsW(s,1,0);
Chris@4 649
Chris@4 650 bsW ( s, 24, s->origPtr );
Chris@4 651 generateMTFValues ( s );
Chris@4 652 sendMTFValues ( s );
Chris@4 653 }
Chris@4 654
Chris@4 655
Chris@4 656 /*-- If this is the last block, add the stream trailer. --*/
Chris@4 657 if (is_last_block) {
Chris@4 658
Chris@4 659 bsPutUChar ( s, 0x17 ); bsPutUChar ( s, 0x72 );
Chris@4 660 bsPutUChar ( s, 0x45 ); bsPutUChar ( s, 0x38 );
Chris@4 661 bsPutUChar ( s, 0x50 ); bsPutUChar ( s, 0x90 );
Chris@4 662 bsPutUInt32 ( s, s->combinedCRC );
Chris@4 663 if (s->verbosity >= 2)
Chris@4 664 VPrintf1( " final combined CRC = 0x%08x\n ", s->combinedCRC );
Chris@4 665 bsFinishWrite ( s );
Chris@4 666 }
Chris@4 667 }
Chris@4 668
Chris@4 669
Chris@4 670 /*-------------------------------------------------------------*/
Chris@4 671 /*--- end compress.c ---*/
Chris@4 672 /*-------------------------------------------------------------*/