annotate src/bzip2-1.0.6/compress.c @ 23:619f715526df sv_v2.1

Update Vamp plugin SDK to 2.5
author Chris Cannam
date Thu, 09 May 2013 10:52:46 +0100
parents e13257ea84a4
children
rev   line source
Chris@4 1
Chris@4 2 /*-------------------------------------------------------------*/
Chris@4 3 /*--- Compression machinery (not incl block sorting) ---*/
Chris@4 4 /*--- compress.c ---*/
Chris@4 5 /*-------------------------------------------------------------*/
Chris@4 6
Chris@4 7 /* ------------------------------------------------------------------
Chris@4 8 This file is part of bzip2/libbzip2, a program and library for
Chris@4 9 lossless, block-sorting data compression.
Chris@4 10
Chris@4 11 bzip2/libbzip2 version 1.0.6 of 6 September 2010
Chris@4 12 Copyright (C) 1996-2010 Julian Seward <jseward@bzip.org>
Chris@4 13
Chris@4 14 Please read the WARNING, DISCLAIMER and PATENTS sections in the
Chris@4 15 README file.
Chris@4 16
Chris@4 17 This program is released under the terms of the license contained
Chris@4 18 in the file LICENSE.
Chris@4 19 ------------------------------------------------------------------ */
Chris@4 20
Chris@4 21
Chris@4 22 /* CHANGES
Chris@4 23 0.9.0 -- original version.
Chris@4 24 0.9.0a/b -- no changes in this file.
Chris@4 25 0.9.0c -- changed setting of nGroups in sendMTFValues()
Chris@4 26 so as to do a bit better on small files
Chris@4 27 */
Chris@4 28
Chris@4 29 #include "bzlib_private.h"
Chris@4 30
Chris@4 31
Chris@4 32 /*---------------------------------------------------*/
Chris@4 33 /*--- Bit stream I/O ---*/
Chris@4 34 /*---------------------------------------------------*/
Chris@4 35
Chris@4 36 /*---------------------------------------------------*/
Chris@4 37 void BZ2_bsInitWrite ( EState* s )
Chris@4 38 {
Chris@4 39 s->bsLive = 0;
Chris@4 40 s->bsBuff = 0;
Chris@4 41 }
Chris@4 42
Chris@4 43
Chris@4 44 /*---------------------------------------------------*/
Chris@4 45 static
Chris@4 46 void bsFinishWrite ( EState* s )
Chris@4 47 {
Chris@4 48 while (s->bsLive > 0) {
Chris@4 49 s->zbits[s->numZ] = (UChar)(s->bsBuff >> 24);
Chris@4 50 s->numZ++;
Chris@4 51 s->bsBuff <<= 8;
Chris@4 52 s->bsLive -= 8;
Chris@4 53 }
Chris@4 54 }
Chris@4 55
Chris@4 56
Chris@4 57 /*---------------------------------------------------*/
Chris@4 58 #define bsNEEDW(nz) \
Chris@4 59 { \
Chris@4 60 while (s->bsLive >= 8) { \
Chris@4 61 s->zbits[s->numZ] \
Chris@4 62 = (UChar)(s->bsBuff >> 24); \
Chris@4 63 s->numZ++; \
Chris@4 64 s->bsBuff <<= 8; \
Chris@4 65 s->bsLive -= 8; \
Chris@4 66 } \
Chris@4 67 }
Chris@4 68
Chris@4 69
Chris@4 70 /*---------------------------------------------------*/
Chris@4 71 static
Chris@4 72 __inline__
Chris@4 73 void bsW ( EState* s, Int32 n, UInt32 v )
Chris@4 74 {
Chris@4 75 bsNEEDW ( n );
Chris@4 76 s->bsBuff |= (v << (32 - s->bsLive - n));
Chris@4 77 s->bsLive += n;
Chris@4 78 }
Chris@4 79
Chris@4 80
Chris@4 81 /*---------------------------------------------------*/
Chris@4 82 static
Chris@4 83 void bsPutUInt32 ( EState* s, UInt32 u )
Chris@4 84 {
Chris@4 85 bsW ( s, 8, (u >> 24) & 0xffL );
Chris@4 86 bsW ( s, 8, (u >> 16) & 0xffL );
Chris@4 87 bsW ( s, 8, (u >> 8) & 0xffL );
Chris@4 88 bsW ( s, 8, u & 0xffL );
Chris@4 89 }
Chris@4 90
Chris@4 91
Chris@4 92 /*---------------------------------------------------*/
Chris@4 93 static
Chris@4 94 void bsPutUChar ( EState* s, UChar c )
Chris@4 95 {
Chris@4 96 bsW( s, 8, (UInt32)c );
Chris@4 97 }
Chris@4 98
Chris@4 99
Chris@4 100 /*---------------------------------------------------*/
Chris@4 101 /*--- The back end proper ---*/
Chris@4 102 /*---------------------------------------------------*/
Chris@4 103
Chris@4 104 /*---------------------------------------------------*/
Chris@4 105 static
Chris@4 106 void makeMaps_e ( EState* s )
Chris@4 107 {
Chris@4 108 Int32 i;
Chris@4 109 s->nInUse = 0;
Chris@4 110 for (i = 0; i < 256; i++)
Chris@4 111 if (s->inUse[i]) {
Chris@4 112 s->unseqToSeq[i] = s->nInUse;
Chris@4 113 s->nInUse++;
Chris@4 114 }
Chris@4 115 }
Chris@4 116
Chris@4 117
Chris@4 118 /*---------------------------------------------------*/
Chris@4 119 static
Chris@4 120 void generateMTFValues ( EState* s )
Chris@4 121 {
Chris@4 122 UChar yy[256];
Chris@4 123 Int32 i, j;
Chris@4 124 Int32 zPend;
Chris@4 125 Int32 wr;
Chris@4 126 Int32 EOB;
Chris@4 127
Chris@4 128 /*
Chris@4 129 After sorting (eg, here),
Chris@4 130 s->arr1 [ 0 .. s->nblock-1 ] holds sorted order,
Chris@4 131 and
Chris@4 132 ((UChar*)s->arr2) [ 0 .. s->nblock-1 ]
Chris@4 133 holds the original block data.
Chris@4 134
Chris@4 135 The first thing to do is generate the MTF values,
Chris@4 136 and put them in
Chris@4 137 ((UInt16*)s->arr1) [ 0 .. s->nblock-1 ].
Chris@4 138 Because there are strictly fewer or equal MTF values
Chris@4 139 than block values, ptr values in this area are overwritten
Chris@4 140 with MTF values only when they are no longer needed.
Chris@4 141
Chris@4 142 The final compressed bitstream is generated into the
Chris@4 143 area starting at
Chris@4 144 (UChar*) (&((UChar*)s->arr2)[s->nblock])
Chris@4 145
Chris@4 146 These storage aliases are set up in bzCompressInit(),
Chris@4 147 except for the last one, which is arranged in
Chris@4 148 compressBlock().
Chris@4 149 */
Chris@4 150 UInt32* ptr = s->ptr;
Chris@4 151 UChar* block = s->block;
Chris@4 152 UInt16* mtfv = s->mtfv;
Chris@4 153
Chris@4 154 makeMaps_e ( s );
Chris@4 155 EOB = s->nInUse+1;
Chris@4 156
Chris@4 157 for (i = 0; i <= EOB; i++) s->mtfFreq[i] = 0;
Chris@4 158
Chris@4 159 wr = 0;
Chris@4 160 zPend = 0;
Chris@4 161 for (i = 0; i < s->nInUse; i++) yy[i] = (UChar) i;
Chris@4 162
Chris@4 163 for (i = 0; i < s->nblock; i++) {
Chris@4 164 UChar ll_i;
Chris@4 165 AssertD ( wr <= i, "generateMTFValues(1)" );
Chris@4 166 j = ptr[i]-1; if (j < 0) j += s->nblock;
Chris@4 167 ll_i = s->unseqToSeq[block[j]];
Chris@4 168 AssertD ( ll_i < s->nInUse, "generateMTFValues(2a)" );
Chris@4 169
Chris@4 170 if (yy[0] == ll_i) {
Chris@4 171 zPend++;
Chris@4 172 } else {
Chris@4 173
Chris@4 174 if (zPend > 0) {
Chris@4 175 zPend--;
Chris@4 176 while (True) {
Chris@4 177 if (zPend & 1) {
Chris@4 178 mtfv[wr] = BZ_RUNB; wr++;
Chris@4 179 s->mtfFreq[BZ_RUNB]++;
Chris@4 180 } else {
Chris@4 181 mtfv[wr] = BZ_RUNA; wr++;
Chris@4 182 s->mtfFreq[BZ_RUNA]++;
Chris@4 183 }
Chris@4 184 if (zPend < 2) break;
Chris@4 185 zPend = (zPend - 2) / 2;
Chris@4 186 };
Chris@4 187 zPend = 0;
Chris@4 188 }
Chris@4 189 {
Chris@4 190 register UChar rtmp;
Chris@4 191 register UChar* ryy_j;
Chris@4 192 register UChar rll_i;
Chris@4 193 rtmp = yy[1];
Chris@4 194 yy[1] = yy[0];
Chris@4 195 ryy_j = &(yy[1]);
Chris@4 196 rll_i = ll_i;
Chris@4 197 while ( rll_i != rtmp ) {
Chris@4 198 register UChar rtmp2;
Chris@4 199 ryy_j++;
Chris@4 200 rtmp2 = rtmp;
Chris@4 201 rtmp = *ryy_j;
Chris@4 202 *ryy_j = rtmp2;
Chris@4 203 };
Chris@4 204 yy[0] = rtmp;
Chris@4 205 j = ryy_j - &(yy[0]);
Chris@4 206 mtfv[wr] = j+1; wr++; s->mtfFreq[j+1]++;
Chris@4 207 }
Chris@4 208
Chris@4 209 }
Chris@4 210 }
Chris@4 211
Chris@4 212 if (zPend > 0) {
Chris@4 213 zPend--;
Chris@4 214 while (True) {
Chris@4 215 if (zPend & 1) {
Chris@4 216 mtfv[wr] = BZ_RUNB; wr++;
Chris@4 217 s->mtfFreq[BZ_RUNB]++;
Chris@4 218 } else {
Chris@4 219 mtfv[wr] = BZ_RUNA; wr++;
Chris@4 220 s->mtfFreq[BZ_RUNA]++;
Chris@4 221 }
Chris@4 222 if (zPend < 2) break;
Chris@4 223 zPend = (zPend - 2) / 2;
Chris@4 224 };
Chris@4 225 zPend = 0;
Chris@4 226 }
Chris@4 227
Chris@4 228 mtfv[wr] = EOB; wr++; s->mtfFreq[EOB]++;
Chris@4 229
Chris@4 230 s->nMTF = wr;
Chris@4 231 }
Chris@4 232
Chris@4 233
Chris@4 234 /*---------------------------------------------------*/
Chris@4 235 #define BZ_LESSER_ICOST 0
Chris@4 236 #define BZ_GREATER_ICOST 15
Chris@4 237
Chris@4 238 static
Chris@4 239 void sendMTFValues ( EState* s )
Chris@4 240 {
Chris@4 241 Int32 v, t, i, j, gs, ge, totc, bt, bc, iter;
Chris@4 242 Int32 nSelectors, alphaSize, minLen, maxLen, selCtr;
Chris@4 243 Int32 nGroups, nBytes;
Chris@4 244
Chris@4 245 /*--
Chris@4 246 UChar len [BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
Chris@4 247 is a global since the decoder also needs it.
Chris@4 248
Chris@4 249 Int32 code[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
Chris@4 250 Int32 rfreq[BZ_N_GROUPS][BZ_MAX_ALPHA_SIZE];
Chris@4 251 are also globals only used in this proc.
Chris@4 252 Made global to keep stack frame size small.
Chris@4 253 --*/
Chris@4 254
Chris@4 255
Chris@4 256 UInt16 cost[BZ_N_GROUPS];
Chris@4 257 Int32 fave[BZ_N_GROUPS];
Chris@4 258
Chris@4 259 UInt16* mtfv = s->mtfv;
Chris@4 260
Chris@4 261 if (s->verbosity >= 3)
Chris@4 262 VPrintf3( " %d in block, %d after MTF & 1-2 coding, "
Chris@4 263 "%d+2 syms in use\n",
Chris@4 264 s->nblock, s->nMTF, s->nInUse );
Chris@4 265
Chris@4 266 alphaSize = s->nInUse+2;
Chris@4 267 for (t = 0; t < BZ_N_GROUPS; t++)
Chris@4 268 for (v = 0; v < alphaSize; v++)
Chris@4 269 s->len[t][v] = BZ_GREATER_ICOST;
Chris@4 270
Chris@4 271 /*--- Decide how many coding tables to use ---*/
Chris@4 272 AssertH ( s->nMTF > 0, 3001 );
Chris@4 273 if (s->nMTF < 200) nGroups = 2; else
Chris@4 274 if (s->nMTF < 600) nGroups = 3; else
Chris@4 275 if (s->nMTF < 1200) nGroups = 4; else
Chris@4 276 if (s->nMTF < 2400) nGroups = 5; else
Chris@4 277 nGroups = 6;
Chris@4 278
Chris@4 279 /*--- Generate an initial set of coding tables ---*/
Chris@4 280 {
Chris@4 281 Int32 nPart, remF, tFreq, aFreq;
Chris@4 282
Chris@4 283 nPart = nGroups;
Chris@4 284 remF = s->nMTF;
Chris@4 285 gs = 0;
Chris@4 286 while (nPart > 0) {
Chris@4 287 tFreq = remF / nPart;
Chris@4 288 ge = gs-1;
Chris@4 289 aFreq = 0;
Chris@4 290 while (aFreq < tFreq && ge < alphaSize-1) {
Chris@4 291 ge++;
Chris@4 292 aFreq += s->mtfFreq[ge];
Chris@4 293 }
Chris@4 294
Chris@4 295 if (ge > gs
Chris@4 296 && nPart != nGroups && nPart != 1
Chris@4 297 && ((nGroups-nPart) % 2 == 1)) {
Chris@4 298 aFreq -= s->mtfFreq[ge];
Chris@4 299 ge--;
Chris@4 300 }
Chris@4 301
Chris@4 302 if (s->verbosity >= 3)
Chris@4 303 VPrintf5( " initial group %d, [%d .. %d], "
Chris@4 304 "has %d syms (%4.1f%%)\n",
Chris@4 305 nPart, gs, ge, aFreq,
Chris@4 306 (100.0 * (float)aFreq) / (float)(s->nMTF) );
Chris@4 307
Chris@4 308 for (v = 0; v < alphaSize; v++)
Chris@4 309 if (v >= gs && v <= ge)
Chris@4 310 s->len[nPart-1][v] = BZ_LESSER_ICOST; else
Chris@4 311 s->len[nPart-1][v] = BZ_GREATER_ICOST;
Chris@4 312
Chris@4 313 nPart--;
Chris@4 314 gs = ge+1;
Chris@4 315 remF -= aFreq;
Chris@4 316 }
Chris@4 317 }
Chris@4 318
Chris@4 319 /*---
Chris@4 320 Iterate up to BZ_N_ITERS times to improve the tables.
Chris@4 321 ---*/
Chris@4 322 for (iter = 0; iter < BZ_N_ITERS; iter++) {
Chris@4 323
Chris@4 324 for (t = 0; t < nGroups; t++) fave[t] = 0;
Chris@4 325
Chris@4 326 for (t = 0; t < nGroups; t++)
Chris@4 327 for (v = 0; v < alphaSize; v++)
Chris@4 328 s->rfreq[t][v] = 0;
Chris@4 329
Chris@4 330 /*---
Chris@4 331 Set up an auxiliary length table which is used to fast-track
Chris@4 332 the common case (nGroups == 6).
Chris@4 333 ---*/
Chris@4 334 if (nGroups == 6) {
Chris@4 335 for (v = 0; v < alphaSize; v++) {
Chris@4 336 s->len_pack[v][0] = (s->len[1][v] << 16) | s->len[0][v];
Chris@4 337 s->len_pack[v][1] = (s->len[3][v] << 16) | s->len[2][v];
Chris@4 338 s->len_pack[v][2] = (s->len[5][v] << 16) | s->len[4][v];
Chris@4 339 }
Chris@4 340 }
Chris@4 341
Chris@4 342 nSelectors = 0;
Chris@4 343 totc = 0;
Chris@4 344 gs = 0;
Chris@4 345 while (True) {
Chris@4 346
Chris@4 347 /*--- Set group start & end marks. --*/
Chris@4 348 if (gs >= s->nMTF) break;
Chris@4 349 ge = gs + BZ_G_SIZE - 1;
Chris@4 350 if (ge >= s->nMTF) ge = s->nMTF-1;
Chris@4 351
Chris@4 352 /*--
Chris@4 353 Calculate the cost of this group as coded
Chris@4 354 by each of the coding tables.
Chris@4 355 --*/
Chris@4 356 for (t = 0; t < nGroups; t++) cost[t] = 0;
Chris@4 357
Chris@4 358 if (nGroups == 6 && 50 == ge-gs+1) {
Chris@4 359 /*--- fast track the common case ---*/
Chris@4 360 register UInt32 cost01, cost23, cost45;
Chris@4 361 register UInt16 icv;
Chris@4 362 cost01 = cost23 = cost45 = 0;
Chris@4 363
Chris@4 364 # define BZ_ITER(nn) \
Chris@4 365 icv = mtfv[gs+(nn)]; \
Chris@4 366 cost01 += s->len_pack[icv][0]; \
Chris@4 367 cost23 += s->len_pack[icv][1]; \
Chris@4 368 cost45 += s->len_pack[icv][2]; \
Chris@4 369
Chris@4 370 BZ_ITER(0); BZ_ITER(1); BZ_ITER(2); BZ_ITER(3); BZ_ITER(4);
Chris@4 371 BZ_ITER(5); BZ_ITER(6); BZ_ITER(7); BZ_ITER(8); BZ_ITER(9);
Chris@4 372 BZ_ITER(10); BZ_ITER(11); BZ_ITER(12); BZ_ITER(13); BZ_ITER(14);
Chris@4 373 BZ_ITER(15); BZ_ITER(16); BZ_ITER(17); BZ_ITER(18); BZ_ITER(19);
Chris@4 374 BZ_ITER(20); BZ_ITER(21); BZ_ITER(22); BZ_ITER(23); BZ_ITER(24);
Chris@4 375 BZ_ITER(25); BZ_ITER(26); BZ_ITER(27); BZ_ITER(28); BZ_ITER(29);
Chris@4 376 BZ_ITER(30); BZ_ITER(31); BZ_ITER(32); BZ_ITER(33); BZ_ITER(34);
Chris@4 377 BZ_ITER(35); BZ_ITER(36); BZ_ITER(37); BZ_ITER(38); BZ_ITER(39);
Chris@4 378 BZ_ITER(40); BZ_ITER(41); BZ_ITER(42); BZ_ITER(43); BZ_ITER(44);
Chris@4 379 BZ_ITER(45); BZ_ITER(46); BZ_ITER(47); BZ_ITER(48); BZ_ITER(49);
Chris@4 380
Chris@4 381 # undef BZ_ITER
Chris@4 382
Chris@4 383 cost[0] = cost01 & 0xffff; cost[1] = cost01 >> 16;
Chris@4 384 cost[2] = cost23 & 0xffff; cost[3] = cost23 >> 16;
Chris@4 385 cost[4] = cost45 & 0xffff; cost[5] = cost45 >> 16;
Chris@4 386
Chris@4 387 } else {
Chris@4 388 /*--- slow version which correctly handles all situations ---*/
Chris@4 389 for (i = gs; i <= ge; i++) {
Chris@4 390 UInt16 icv = mtfv[i];
Chris@4 391 for (t = 0; t < nGroups; t++) cost[t] += s->len[t][icv];
Chris@4 392 }
Chris@4 393 }
Chris@4 394
Chris@4 395 /*--
Chris@4 396 Find the coding table which is best for this group,
Chris@4 397 and record its identity in the selector table.
Chris@4 398 --*/
Chris@4 399 bc = 999999999; bt = -1;
Chris@4 400 for (t = 0; t < nGroups; t++)
Chris@4 401 if (cost[t] < bc) { bc = cost[t]; bt = t; };
Chris@4 402 totc += bc;
Chris@4 403 fave[bt]++;
Chris@4 404 s->selector[nSelectors] = bt;
Chris@4 405 nSelectors++;
Chris@4 406
Chris@4 407 /*--
Chris@4 408 Increment the symbol frequencies for the selected table.
Chris@4 409 --*/
Chris@4 410 if (nGroups == 6 && 50 == ge-gs+1) {
Chris@4 411 /*--- fast track the common case ---*/
Chris@4 412
Chris@4 413 # define BZ_ITUR(nn) s->rfreq[bt][ mtfv[gs+(nn)] ]++
Chris@4 414
Chris@4 415 BZ_ITUR(0); BZ_ITUR(1); BZ_ITUR(2); BZ_ITUR(3); BZ_ITUR(4);
Chris@4 416 BZ_ITUR(5); BZ_ITUR(6); BZ_ITUR(7); BZ_ITUR(8); BZ_ITUR(9);
Chris@4 417 BZ_ITUR(10); BZ_ITUR(11); BZ_ITUR(12); BZ_ITUR(13); BZ_ITUR(14);
Chris@4 418 BZ_ITUR(15); BZ_ITUR(16); BZ_ITUR(17); BZ_ITUR(18); BZ_ITUR(19);
Chris@4 419 BZ_ITUR(20); BZ_ITUR(21); BZ_ITUR(22); BZ_ITUR(23); BZ_ITUR(24);
Chris@4 420 BZ_ITUR(25); BZ_ITUR(26); BZ_ITUR(27); BZ_ITUR(28); BZ_ITUR(29);
Chris@4 421 BZ_ITUR(30); BZ_ITUR(31); BZ_ITUR(32); BZ_ITUR(33); BZ_ITUR(34);
Chris@4 422 BZ_ITUR(35); BZ_ITUR(36); BZ_ITUR(37); BZ_ITUR(38); BZ_ITUR(39);
Chris@4 423 BZ_ITUR(40); BZ_ITUR(41); BZ_ITUR(42); BZ_ITUR(43); BZ_ITUR(44);
Chris@4 424 BZ_ITUR(45); BZ_ITUR(46); BZ_ITUR(47); BZ_ITUR(48); BZ_ITUR(49);
Chris@4 425
Chris@4 426 # undef BZ_ITUR
Chris@4 427
Chris@4 428 } else {
Chris@4 429 /*--- slow version which correctly handles all situations ---*/
Chris@4 430 for (i = gs; i <= ge; i++)
Chris@4 431 s->rfreq[bt][ mtfv[i] ]++;
Chris@4 432 }
Chris@4 433
Chris@4 434 gs = ge+1;
Chris@4 435 }
Chris@4 436 if (s->verbosity >= 3) {
Chris@4 437 VPrintf2 ( " pass %d: size is %d, grp uses are ",
Chris@4 438 iter+1, totc/8 );
Chris@4 439 for (t = 0; t < nGroups; t++)
Chris@4 440 VPrintf1 ( "%d ", fave[t] );
Chris@4 441 VPrintf0 ( "\n" );
Chris@4 442 }
Chris@4 443
Chris@4 444 /*--
Chris@4 445 Recompute the tables based on the accumulated frequencies.
Chris@4 446 --*/
Chris@4 447 /* maxLen was changed from 20 to 17 in bzip2-1.0.3. See
Chris@4 448 comment in huffman.c for details. */
Chris@4 449 for (t = 0; t < nGroups; t++)
Chris@4 450 BZ2_hbMakeCodeLengths ( &(s->len[t][0]), &(s->rfreq[t][0]),
Chris@4 451 alphaSize, 17 /*20*/ );
Chris@4 452 }
Chris@4 453
Chris@4 454
Chris@4 455 AssertH( nGroups < 8, 3002 );
Chris@4 456 AssertH( nSelectors < 32768 &&
Chris@4 457 nSelectors <= (2 + (900000 / BZ_G_SIZE)),
Chris@4 458 3003 );
Chris@4 459
Chris@4 460
Chris@4 461 /*--- Compute MTF values for the selectors. ---*/
Chris@4 462 {
Chris@4 463 UChar pos[BZ_N_GROUPS], ll_i, tmp2, tmp;
Chris@4 464 for (i = 0; i < nGroups; i++) pos[i] = i;
Chris@4 465 for (i = 0; i < nSelectors; i++) {
Chris@4 466 ll_i = s->selector[i];
Chris@4 467 j = 0;
Chris@4 468 tmp = pos[j];
Chris@4 469 while ( ll_i != tmp ) {
Chris@4 470 j++;
Chris@4 471 tmp2 = tmp;
Chris@4 472 tmp = pos[j];
Chris@4 473 pos[j] = tmp2;
Chris@4 474 };
Chris@4 475 pos[0] = tmp;
Chris@4 476 s->selectorMtf[i] = j;
Chris@4 477 }
Chris@4 478 };
Chris@4 479
Chris@4 480 /*--- Assign actual codes for the tables. --*/
Chris@4 481 for (t = 0; t < nGroups; t++) {
Chris@4 482 minLen = 32;
Chris@4 483 maxLen = 0;
Chris@4 484 for (i = 0; i < alphaSize; i++) {
Chris@4 485 if (s->len[t][i] > maxLen) maxLen = s->len[t][i];
Chris@4 486 if (s->len[t][i] < minLen) minLen = s->len[t][i];
Chris@4 487 }
Chris@4 488 AssertH ( !(maxLen > 17 /*20*/ ), 3004 );
Chris@4 489 AssertH ( !(minLen < 1), 3005 );
Chris@4 490 BZ2_hbAssignCodes ( &(s->code[t][0]), &(s->len[t][0]),
Chris@4 491 minLen, maxLen, alphaSize );
Chris@4 492 }
Chris@4 493
Chris@4 494 /*--- Transmit the mapping table. ---*/
Chris@4 495 {
Chris@4 496 Bool inUse16[16];
Chris@4 497 for (i = 0; i < 16; i++) {
Chris@4 498 inUse16[i] = False;
Chris@4 499 for (j = 0; j < 16; j++)
Chris@4 500 if (s->inUse[i * 16 + j]) inUse16[i] = True;
Chris@4 501 }
Chris@4 502
Chris@4 503 nBytes = s->numZ;
Chris@4 504 for (i = 0; i < 16; i++)
Chris@4 505 if (inUse16[i]) bsW(s,1,1); else bsW(s,1,0);
Chris@4 506
Chris@4 507 for (i = 0; i < 16; i++)
Chris@4 508 if (inUse16[i])
Chris@4 509 for (j = 0; j < 16; j++) {
Chris@4 510 if (s->inUse[i * 16 + j]) bsW(s,1,1); else bsW(s,1,0);
Chris@4 511 }
Chris@4 512
Chris@4 513 if (s->verbosity >= 3)
Chris@4 514 VPrintf1( " bytes: mapping %d, ", s->numZ-nBytes );
Chris@4 515 }
Chris@4 516
Chris@4 517 /*--- Now the selectors. ---*/
Chris@4 518 nBytes = s->numZ;
Chris@4 519 bsW ( s, 3, nGroups );
Chris@4 520 bsW ( s, 15, nSelectors );
Chris@4 521 for (i = 0; i < nSelectors; i++) {
Chris@4 522 for (j = 0; j < s->selectorMtf[i]; j++) bsW(s,1,1);
Chris@4 523 bsW(s,1,0);
Chris@4 524 }
Chris@4 525 if (s->verbosity >= 3)
Chris@4 526 VPrintf1( "selectors %d, ", s->numZ-nBytes );
Chris@4 527
Chris@4 528 /*--- Now the coding tables. ---*/
Chris@4 529 nBytes = s->numZ;
Chris@4 530
Chris@4 531 for (t = 0; t < nGroups; t++) {
Chris@4 532 Int32 curr = s->len[t][0];
Chris@4 533 bsW ( s, 5, curr );
Chris@4 534 for (i = 0; i < alphaSize; i++) {
Chris@4 535 while (curr < s->len[t][i]) { bsW(s,2,2); curr++; /* 10 */ };
Chris@4 536 while (curr > s->len[t][i]) { bsW(s,2,3); curr--; /* 11 */ };
Chris@4 537 bsW ( s, 1, 0 );
Chris@4 538 }
Chris@4 539 }
Chris@4 540
Chris@4 541 if (s->verbosity >= 3)
Chris@4 542 VPrintf1 ( "code lengths %d, ", s->numZ-nBytes );
Chris@4 543
Chris@4 544 /*--- And finally, the block data proper ---*/
Chris@4 545 nBytes = s->numZ;
Chris@4 546 selCtr = 0;
Chris@4 547 gs = 0;
Chris@4 548 while (True) {
Chris@4 549 if (gs >= s->nMTF) break;
Chris@4 550 ge = gs + BZ_G_SIZE - 1;
Chris@4 551 if (ge >= s->nMTF) ge = s->nMTF-1;
Chris@4 552 AssertH ( s->selector[selCtr] < nGroups, 3006 );
Chris@4 553
Chris@4 554 if (nGroups == 6 && 50 == ge-gs+1) {
Chris@4 555 /*--- fast track the common case ---*/
Chris@4 556 UInt16 mtfv_i;
Chris@4 557 UChar* s_len_sel_selCtr
Chris@4 558 = &(s->len[s->selector[selCtr]][0]);
Chris@4 559 Int32* s_code_sel_selCtr
Chris@4 560 = &(s->code[s->selector[selCtr]][0]);
Chris@4 561
Chris@4 562 # define BZ_ITAH(nn) \
Chris@4 563 mtfv_i = mtfv[gs+(nn)]; \
Chris@4 564 bsW ( s, \
Chris@4 565 s_len_sel_selCtr[mtfv_i], \
Chris@4 566 s_code_sel_selCtr[mtfv_i] )
Chris@4 567
Chris@4 568 BZ_ITAH(0); BZ_ITAH(1); BZ_ITAH(2); BZ_ITAH(3); BZ_ITAH(4);
Chris@4 569 BZ_ITAH(5); BZ_ITAH(6); BZ_ITAH(7); BZ_ITAH(8); BZ_ITAH(9);
Chris@4 570 BZ_ITAH(10); BZ_ITAH(11); BZ_ITAH(12); BZ_ITAH(13); BZ_ITAH(14);
Chris@4 571 BZ_ITAH(15); BZ_ITAH(16); BZ_ITAH(17); BZ_ITAH(18); BZ_ITAH(19);
Chris@4 572 BZ_ITAH(20); BZ_ITAH(21); BZ_ITAH(22); BZ_ITAH(23); BZ_ITAH(24);
Chris@4 573 BZ_ITAH(25); BZ_ITAH(26); BZ_ITAH(27); BZ_ITAH(28); BZ_ITAH(29);
Chris@4 574 BZ_ITAH(30); BZ_ITAH(31); BZ_ITAH(32); BZ_ITAH(33); BZ_ITAH(34);
Chris@4 575 BZ_ITAH(35); BZ_ITAH(36); BZ_ITAH(37); BZ_ITAH(38); BZ_ITAH(39);
Chris@4 576 BZ_ITAH(40); BZ_ITAH(41); BZ_ITAH(42); BZ_ITAH(43); BZ_ITAH(44);
Chris@4 577 BZ_ITAH(45); BZ_ITAH(46); BZ_ITAH(47); BZ_ITAH(48); BZ_ITAH(49);
Chris@4 578
Chris@4 579 # undef BZ_ITAH
Chris@4 580
Chris@4 581 } else {
Chris@4 582 /*--- slow version which correctly handles all situations ---*/
Chris@4 583 for (i = gs; i <= ge; i++) {
Chris@4 584 bsW ( s,
Chris@4 585 s->len [s->selector[selCtr]] [mtfv[i]],
Chris@4 586 s->code [s->selector[selCtr]] [mtfv[i]] );
Chris@4 587 }
Chris@4 588 }
Chris@4 589
Chris@4 590
Chris@4 591 gs = ge+1;
Chris@4 592 selCtr++;
Chris@4 593 }
Chris@4 594 AssertH( selCtr == nSelectors, 3007 );
Chris@4 595
Chris@4 596 if (s->verbosity >= 3)
Chris@4 597 VPrintf1( "codes %d\n", s->numZ-nBytes );
Chris@4 598 }
Chris@4 599
Chris@4 600
Chris@4 601 /*---------------------------------------------------*/
Chris@4 602 void BZ2_compressBlock ( EState* s, Bool is_last_block )
Chris@4 603 {
Chris@4 604 if (s->nblock > 0) {
Chris@4 605
Chris@4 606 BZ_FINALISE_CRC ( s->blockCRC );
Chris@4 607 s->combinedCRC = (s->combinedCRC << 1) | (s->combinedCRC >> 31);
Chris@4 608 s->combinedCRC ^= s->blockCRC;
Chris@4 609 if (s->blockNo > 1) s->numZ = 0;
Chris@4 610
Chris@4 611 if (s->verbosity >= 2)
Chris@4 612 VPrintf4( " block %d: crc = 0x%08x, "
Chris@4 613 "combined CRC = 0x%08x, size = %d\n",
Chris@4 614 s->blockNo, s->blockCRC, s->combinedCRC, s->nblock );
Chris@4 615
Chris@4 616 BZ2_blockSort ( s );
Chris@4 617 }
Chris@4 618
Chris@4 619 s->zbits = (UChar*) (&((UChar*)s->arr2)[s->nblock]);
Chris@4 620
Chris@4 621 /*-- If this is the first block, create the stream header. --*/
Chris@4 622 if (s->blockNo == 1) {
Chris@4 623 BZ2_bsInitWrite ( s );
Chris@4 624 bsPutUChar ( s, BZ_HDR_B );
Chris@4 625 bsPutUChar ( s, BZ_HDR_Z );
Chris@4 626 bsPutUChar ( s, BZ_HDR_h );
Chris@4 627 bsPutUChar ( s, (UChar)(BZ_HDR_0 + s->blockSize100k) );
Chris@4 628 }
Chris@4 629
Chris@4 630 if (s->nblock > 0) {
Chris@4 631
Chris@4 632 bsPutUChar ( s, 0x31 ); bsPutUChar ( s, 0x41 );
Chris@4 633 bsPutUChar ( s, 0x59 ); bsPutUChar ( s, 0x26 );
Chris@4 634 bsPutUChar ( s, 0x53 ); bsPutUChar ( s, 0x59 );
Chris@4 635
Chris@4 636 /*-- Now the block's CRC, so it is in a known place. --*/
Chris@4 637 bsPutUInt32 ( s, s->blockCRC );
Chris@4 638
Chris@4 639 /*--
Chris@4 640 Now a single bit indicating (non-)randomisation.
Chris@4 641 As of version 0.9.5, we use a better sorting algorithm
Chris@4 642 which makes randomisation unnecessary. So always set
Chris@4 643 the randomised bit to 'no'. Of course, the decoder
Chris@4 644 still needs to be able to handle randomised blocks
Chris@4 645 so as to maintain backwards compatibility with
Chris@4 646 older versions of bzip2.
Chris@4 647 --*/
Chris@4 648 bsW(s,1,0);
Chris@4 649
Chris@4 650 bsW ( s, 24, s->origPtr );
Chris@4 651 generateMTFValues ( s );
Chris@4 652 sendMTFValues ( s );
Chris@4 653 }
Chris@4 654
Chris@4 655
Chris@4 656 /*-- If this is the last block, add the stream trailer. --*/
Chris@4 657 if (is_last_block) {
Chris@4 658
Chris@4 659 bsPutUChar ( s, 0x17 ); bsPutUChar ( s, 0x72 );
Chris@4 660 bsPutUChar ( s, 0x45 ); bsPutUChar ( s, 0x38 );
Chris@4 661 bsPutUChar ( s, 0x50 ); bsPutUChar ( s, 0x90 );
Chris@4 662 bsPutUInt32 ( s, s->combinedCRC );
Chris@4 663 if (s->verbosity >= 2)
Chris@4 664 VPrintf1( " final combined CRC = 0x%08x\n ", s->combinedCRC );
Chris@4 665 bsFinishWrite ( s );
Chris@4 666 }
Chris@4 667 }
Chris@4 668
Chris@4 669
Chris@4 670 /*-------------------------------------------------------------*/
Chris@4 671 /*--- end compress.c ---*/
Chris@4 672 /*-------------------------------------------------------------*/