1*f071c501SMasahiro Yamada #include <config.h>
2*f071c501SMasahiro Yamada
3*f071c501SMasahiro Yamada /*-------------------------------------------------------------*/
4*f071c501SMasahiro Yamada /*--- Huffman coding low-level stuff ---*/
5*f071c501SMasahiro Yamada /*--- huffman.c ---*/
6*f071c501SMasahiro Yamada /*-------------------------------------------------------------*/
7*f071c501SMasahiro Yamada
8*f071c501SMasahiro Yamada /*--
9*f071c501SMasahiro Yamada This file is a part of bzip2 and/or libbzip2, a program and
10*f071c501SMasahiro Yamada library for lossless, block-sorting data compression.
11*f071c501SMasahiro Yamada
12*f071c501SMasahiro Yamada Copyright (C) 1996-2002 Julian R Seward. All rights reserved.
13*f071c501SMasahiro Yamada
14*f071c501SMasahiro Yamada Redistribution and use in source and binary forms, with or without
15*f071c501SMasahiro Yamada modification, are permitted provided that the following conditions
16*f071c501SMasahiro Yamada are met:
17*f071c501SMasahiro Yamada
18*f071c501SMasahiro Yamada 1. Redistributions of source code must retain the above copyright
19*f071c501SMasahiro Yamada notice, this list of conditions and the following disclaimer.
20*f071c501SMasahiro Yamada
21*f071c501SMasahiro Yamada 2. The origin of this software must not be misrepresented; you must
22*f071c501SMasahiro Yamada not claim that you wrote the original software. If you use this
23*f071c501SMasahiro Yamada software in a product, an acknowledgment in the product
24*f071c501SMasahiro Yamada documentation would be appreciated but is not required.
25*f071c501SMasahiro Yamada
26*f071c501SMasahiro Yamada 3. Altered source versions must be plainly marked as such, and must
27*f071c501SMasahiro Yamada not be misrepresented as being the original software.
28*f071c501SMasahiro Yamada
29*f071c501SMasahiro Yamada 4. The name of the author may not be used to endorse or promote
30*f071c501SMasahiro Yamada products derived from this software without specific prior written
31*f071c501SMasahiro Yamada permission.
32*f071c501SMasahiro Yamada
33*f071c501SMasahiro Yamada THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS
34*f071c501SMasahiro Yamada OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
35*f071c501SMasahiro Yamada WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
36*f071c501SMasahiro Yamada ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
37*f071c501SMasahiro Yamada DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
38*f071c501SMasahiro Yamada DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE
39*f071c501SMasahiro Yamada GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
40*f071c501SMasahiro Yamada INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
41*f071c501SMasahiro Yamada WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
42*f071c501SMasahiro Yamada NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
43*f071c501SMasahiro Yamada SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
44*f071c501SMasahiro Yamada
45*f071c501SMasahiro Yamada Julian Seward, Cambridge, UK.
46*f071c501SMasahiro Yamada jseward@acm.org
47*f071c501SMasahiro Yamada bzip2/libbzip2 version 1.0 of 21 March 2000
48*f071c501SMasahiro Yamada
49*f071c501SMasahiro Yamada This program is based on (at least) the work of:
50*f071c501SMasahiro Yamada Mike Burrows
51*f071c501SMasahiro Yamada David Wheeler
52*f071c501SMasahiro Yamada Peter Fenwick
53*f071c501SMasahiro Yamada Alistair Moffat
54*f071c501SMasahiro Yamada Radford Neal
55*f071c501SMasahiro Yamada Ian H. Witten
56*f071c501SMasahiro Yamada Robert Sedgewick
57*f071c501SMasahiro Yamada Jon L. Bentley
58*f071c501SMasahiro Yamada
59*f071c501SMasahiro Yamada For more information on these sources, see the manual.
60*f071c501SMasahiro Yamada --*/
61*f071c501SMasahiro Yamada
62*f071c501SMasahiro Yamada
63*f071c501SMasahiro Yamada #include "bzlib_private.h"
64*f071c501SMasahiro Yamada
65*f071c501SMasahiro Yamada /*---------------------------------------------------*/
/*--
   A node weight packs two fields into one integer: the top 24 bits
   hold the accumulated weight and the low 8 bits hold the depth of
   the subtree below the node.  WEIGHTOF and DEPTHOF extract the two
   fields; MYMAX is a plain two-argument maximum (arguments may be
   evaluated twice, so they must be free of side effects).
--*/
#define WEIGHTOF(zz0)  ((zz0) & 0xffffff00)
#define DEPTHOF(zz1)   ((zz1) & 0x000000ff)
#define MYMAX(zz2,zz3) ((zz2) > (zz3) ? (zz2) : (zz3))

/*--
   Weight of a node whose children weigh zw1 and zw2: the weight
   fields are added and the depth becomes one more than the deeper
   child.  The whole expansion is parenthesised so that it can be
   embedded safely in a larger expression.
--*/
#define ADDWEIGHTS(zw1,zw2)                           \
   ((WEIGHTOF(zw1)+WEIGHTOF(zw2)) |                   \
    (1 + MYMAX(DEPTHOF(zw1),DEPTHOF(zw2))))

/*--
   UPHEAP and DOWNHEAP operate on the variables `heap', `weight' and
   (DOWNHEAP only) `nHeap', which must be in scope where the macro is
   expanded.  heap[1..nHeap] is a binary min-heap of node numbers
   ordered by weight[].  Both macros are wrapped in do { } while (0)
   so that `UPHEAP(x);' is a single statement in every context.

   UPHEAP(z): move the entry at heap position z towards the root
   until its parent is no heavier.  The loop has no explicit bound
   check; it stops at the root only because position 0 holds a
   sentinel whose weight is not greater than any real weight.
--*/
#define UPHEAP(z)                                     \
do {                                                  \
   Int32 zz, tmp;                                     \
   zz = (z); tmp = heap[zz];                          \
   while (weight[tmp] < weight[heap[zz >> 1]]) {      \
      heap[zz] = heap[zz >> 1];                       \
      zz >>= 1;                                       \
   }                                                  \
   heap[zz] = tmp;                                    \
} while (0)

/*--
   DOWNHEAP(z): move the entry at heap position z towards the leaves,
   each time swapping with the lighter of its children, until it is
   lighter than both children or has none.
--*/
#define DOWNHEAP(z)                                   \
do {                                                  \
   Int32 zz, yy, tmp;                                 \
   zz = (z); tmp = heap[zz];                          \
   while (True) {                                     \
      yy = zz << 1;                                   \
      if (yy > nHeap) break;                          \
      if (yy < nHeap &&                               \
          weight[heap[yy+1]] < weight[heap[yy]])      \
         yy++;                                        \
      if (weight[tmp] < weight[heap[yy]]) break;      \
      heap[zz] = heap[yy];                            \
      zz = yy;                                        \
   }                                                  \
   heap[zz] = tmp;                                    \
} while (0)
101*f071c501SMasahiro Yamada
102*f071c501SMasahiro Yamada
103*f071c501SMasahiro Yamada /*---------------------------------------------------*/
/*--
   Compute Huffman code lengths, none longer than maxLen.

   len        (out) len[0 .. alphaSize-1] receives the code length
              of each symbol, i.e. its depth in the Huffman tree.
   freq       (in)  freq[0 .. alphaSize-1], the symbol frequencies.
              A frequency of zero is treated as 1, so every symbol
              is given a code.
   alphaSize  number of symbols; the local arrays are sized for at
              most BZ_MAX_ALPHA_SIZE of them.
   maxLen     longest code length that is acceptable.

   The tree is built by repeatedly joining the two lightest nodes,
   using a binary min-heap.  If any symbol ends up deeper than
   maxLen, all symbol weights are roughly halved (never going below
   1), which flattens the distribution, and the tree is rebuilt.
   This is repeated until every length fits.
--*/
void BZ2_hbMakeCodeLengths ( UChar *len,
                             Int32 *freq,
                             Int32 alphaSize,
                             Int32 maxLen )
{
   /*--
      Nodes and heap entries run from 1.  Entry 0
      for both the heap and nodes is a sentinel.
   --*/
   Int32 nNodes, nHeap, n1, n2, i, j, k;
   Bool  tooLong;

   Int32 heap   [ BZ_MAX_ALPHA_SIZE + 2 ];
   Int32 weight [ BZ_MAX_ALPHA_SIZE * 2 ];
   Int32 parent [ BZ_MAX_ALPHA_SIZE * 2 ];

   /* Symbol i is leaf node i+1.  The frequency goes in the upper
      24 bits; the low 8 bits (subtree depth) start at zero. */
   for (i = 0; i < alphaSize; i++)
      weight[i+1] = (freq[i] == 0 ? 1 : freq[i]) << 8;

   while (True) {

      nNodes = alphaSize;
      nHeap = 0;

      /* Sentinel: weight 0 at heap position 0 stops UPHEAP. */
      heap[0] = 0;
      weight[0] = 0;
      parent[0] = -2;

      /* Put every leaf into the heap. */
      for (i = 1; i <= alphaSize; i++) {
         parent[i] = -1;
         nHeap++;
         heap[nHeap] = i;
         UPHEAP(nHeap);
      }

      AssertH( nHeap < (BZ_MAX_ALPHA_SIZE+2), 2001 );

      /* Join the two lightest nodes under a new internal node
         until a single root is left. */
      while (nHeap > 1) {
         n1 = heap[1]; heap[1] = heap[nHeap]; nHeap--; DOWNHEAP(1);
         n2 = heap[1]; heap[1] = heap[nHeap]; nHeap--; DOWNHEAP(1);
         nNodes++;
         parent[n1] = parent[n2] = nNodes;
         weight[nNodes] = ADDWEIGHTS(weight[n1], weight[n2]);
         parent[nNodes] = -1;
         nHeap++;
         heap[nHeap] = nNodes;
         UPHEAP(nHeap);
      }

      AssertH( nNodes < (BZ_MAX_ALPHA_SIZE * 2), 2002 );

      /* A symbol's code length is the number of parent links
         between its leaf and the root (whose parent is -1). */
      tooLong = False;
      for (i = 1; i <= alphaSize; i++) {
         j = 0;
         k = i;
         while (parent[k] >= 0) { k = parent[k]; j++; }
         len[i-1] = j;
         if (j > maxLen) tooLong = True;
      }

      if (! tooLong) break;

      /* Some code is too long: halve every leaf weight (keeping it
         at least 1) and try again.  Leaf weights live in
         weight[1 .. alphaSize], so the bound must be inclusive; with
         'i < alphaSize' the last symbol was never rescaled. */
      for (i = 1; i <= alphaSize; i++) {
         j = weight[i] >> 8;
         j = 1 + (j / 2);
         weight[i] = j << 8;
      }
   }
}
173*f071c501SMasahiro Yamada
174*f071c501SMasahiro Yamada
175*f071c501SMasahiro Yamada /*---------------------------------------------------*/
/*--
   Hand out code values from a table of code lengths.

   code       (out) code[i] receives the code value of symbol i, for
              every symbol whose length lies in minLen .. maxLen.
   length     (in)  length[0 .. alphaSize-1], code length per symbol.
   minLen     shortest code length to process.
   maxLen     longest code length to process.
   alphaSize  number of symbols.

   Lengths are visited in increasing order.  Within one length the
   symbols get consecutive values in order of symbol index, and the
   running value is doubled each time the length goes up by one.
--*/
void BZ2_hbAssignCodes ( Int32 *code,
                         UChar *length,
                         Int32 minLen,
                         Int32 maxLen,
                         Int32 alphaSize )
{
   Int32 nextCode = 0;
   Int32 bits;
   Int32 sym;

   for (bits = minLen; bits <= maxLen; bits++) {
      for (sym = 0; sym < alphaSize; sym++) {
         if (length[sym] != bits) continue;
         code[sym] = nextCode;
         nextCode++;
      }
      /* Codes of the next length are one bit longer. */
      nextCode <<= 1;
   }
}
191*f071c501SMasahiro Yamada
192*f071c501SMasahiro Yamada
193*f071c501SMasahiro Yamada /*---------------------------------------------------*/
/*--
   Build the limit / base / perm tables for one set of code lengths.

   limit      (out) limit[i] is set, for i in minLen .. maxLen, to
              one less than the running code value after all codes
              of length i have been counted; the first
              BZ_MAX_CODE_LEN entries are cleared beforehand.
   base       (out) first used to count symbols per length; on exit,
              for i in minLen+1 .. maxLen, base[i] is the first code
              value of length i minus the number of symbols with a
              shorter length.
   perm       (out) the symbols ordered by increasing code length
              and, within one length, by increasing symbol index.
   length     (in)  length[0 .. alphaSize-1], code length per symbol.
   minLen     shortest code length in use.
   maxLen     longest code length in use.
   alphaSize  number of symbols.

   NOTE(review): presumably a decoder maps a code of length i to
   perm[code - base[i]]; the decoder is not part of this file, so
   confirm against it.
--*/
void BZ2_hbCreateDecodeTables ( Int32 *limit,
                                Int32 *base,
                                Int32 *perm,
                                UChar *length,
                                Int32 minLen,
                                Int32 maxLen,
                                Int32 alphaSize )
{
   Int32 nPerm = 0;
   Int32 running = 0;
   Int32 bits, sym, idx;

   /* Symbols sorted by code length. */
   for (bits = minLen; bits <= maxLen; bits++) {
      for (sym = 0; sym < alphaSize; sym++) {
         if (length[sym] == bits) {
            perm[nPerm] = sym;
            nPerm++;
         }
      }
   }

   /* base[n+1] = how many symbols have length n ... */
   for (idx = 0; idx < BZ_MAX_CODE_LEN; idx++) {
      base[idx] = 0;
   }
   for (sym = 0; sym < alphaSize; sym++) {
      base[length[sym]+1]++;
   }

   /* ... then base[n] = how many symbols are shorter than n. */
   for (idx = 1; idx < BZ_MAX_CODE_LEN; idx++) {
      base[idx] += base[idx-1];
   }

   for (idx = 0; idx < BZ_MAX_CODE_LEN; idx++) {
      limit[idx] = 0;
   }

   /* Walk the lengths the same way codes are assigned: add the
      number of codes of this length, note the last one, then
      double for the next length. */
   for (bits = minLen; bits <= maxLen; bits++) {
      running += (base[bits+1] - base[bits]);
      limit[bits] = running - 1;
      running <<= 1;
   }

   /* Turn the counts into offsets relative to the first code of
      each length. */
   for (bits = minLen + 1; bits <= maxLen; bits++) {
      base[bits] = ((limit[bits-1] + 1) << 1) - base[bits];
   }
}
225*f071c501SMasahiro Yamada
226*f071c501SMasahiro Yamada
227*f071c501SMasahiro Yamada /*-------------------------------------------------------------*/
228*f071c501SMasahiro Yamada /*--- end huffman.c ---*/
229*f071c501SMasahiro Yamada /*-------------------------------------------------------------*/
230