1 // Copyright 2012 Google Inc. All Rights Reserved.
2 //
3 // Use of this source code is governed by a BSD-style license
4 // that can be found in the COPYING file in the root of the source
5 // tree. An additional intellectual property rights grant can be found
6 // in the file PATENTS. All contributing project authors may
7 // be found in the AUTHORS file in the root of the source tree.
8 // -----------------------------------------------------------------------------
9 //
10 // Utilities for building and looking up Huffman trees.
11 //
12 // Author: Urvang Joshi (urvang@google.com)
13
14 #include <assert.h>
15 #include <stdlib.h>
16 #include <string.h>
17 #include "./huffman.h"
18 #include "../utils/utils.h"
19 #include "../webp/format_constants.h"
20
21 // Uncomment the following to use look-up table for ReverseBits()
22 // (might be faster on some platform)
23 // #define USE_LUT_REVERSE_BITS
24
25 // Huffman data read via DecodeImageStream is represented in two (red and green)
26 // bytes.
27 #define MAX_HTREE_GROUPS 0x10000
28 #define NON_EXISTENT_SYMBOL (-1)
29
TreeNodeInit(HuffmanTreeNode * const node)30 static void TreeNodeInit(HuffmanTreeNode* const node) {
31 node->children_ = -1; // means: 'unassigned so far'
32 }
33
NodeIsEmpty(const HuffmanTreeNode * const node)34 static int NodeIsEmpty(const HuffmanTreeNode* const node) {
35 return (node->children_ < 0);
36 }
37
IsFull(const HuffmanTree * const tree)38 static int IsFull(const HuffmanTree* const tree) {
39 return (tree->num_nodes_ == tree->max_nodes_);
40 }
41
AssignChildren(HuffmanTree * const tree,HuffmanTreeNode * const node)42 static void AssignChildren(HuffmanTree* const tree,
43 HuffmanTreeNode* const node) {
44 HuffmanTreeNode* const children = tree->root_ + tree->num_nodes_;
45 node->children_ = (int)(children - node);
46 assert(children - node == (int)(children - node));
47 tree->num_nodes_ += 2;
48 TreeNodeInit(children + 0);
49 TreeNodeInit(children + 1);
50 }
51
52 // A Huffman tree is a full binary tree; and in a full binary tree with L
53 // leaves, the total number of nodes N = 2 * L - 1.
HuffmanTreeMaxNodes(int num_leaves)54 static int HuffmanTreeMaxNodes(int num_leaves) {
55 return (2 * num_leaves - 1);
56 }
57
HuffmanTreeAllocate(HuffmanTree * const tree,int num_nodes)58 static int HuffmanTreeAllocate(HuffmanTree* const tree, int num_nodes) {
59 assert(tree != NULL);
60 tree->root_ =
61 (HuffmanTreeNode*)WebPSafeMalloc(num_nodes, sizeof(*tree->root_));
62 return (tree->root_ != NULL);
63 }
64
TreeInit(HuffmanTree * const tree,int num_leaves)65 static int TreeInit(HuffmanTree* const tree, int num_leaves) {
66 assert(tree != NULL);
67 if (num_leaves == 0) return 0;
68 tree->max_nodes_ = HuffmanTreeMaxNodes(num_leaves);
69 assert(tree->max_nodes_ < (1 << 16)); // limit for the lut_jump_ table
70 if (!HuffmanTreeAllocate(tree, tree->max_nodes_)) return 0;
71 TreeNodeInit(tree->root_); // Initialize root.
72 tree->num_nodes_ = 1;
73 memset(tree->lut_bits_, 255, sizeof(tree->lut_bits_));
74 memset(tree->lut_jump_, 0, sizeof(tree->lut_jump_));
75 return 1;
76 }
77
VP8LHuffmanTreeFree(HuffmanTree * const tree)78 void VP8LHuffmanTreeFree(HuffmanTree* const tree) {
79 if (tree != NULL) {
80 WebPSafeFree(tree->root_);
81 tree->root_ = NULL;
82 tree->max_nodes_ = 0;
83 tree->num_nodes_ = 0;
84 }
85 }
86
VP8LHtreeGroupsNew(int num_htree_groups)87 HTreeGroup* VP8LHtreeGroupsNew(int num_htree_groups) {
88 HTreeGroup* const htree_groups =
89 (HTreeGroup*)WebPSafeCalloc(num_htree_groups, sizeof(*htree_groups));
90 assert(num_htree_groups <= MAX_HTREE_GROUPS);
91 if (htree_groups == NULL) {
92 return NULL;
93 }
94 return htree_groups;
95 }
96
VP8LHtreeGroupsFree(HTreeGroup * htree_groups,int num_htree_groups)97 void VP8LHtreeGroupsFree(HTreeGroup* htree_groups, int num_htree_groups) {
98 if (htree_groups != NULL) {
99 int i, j;
100 for (i = 0; i < num_htree_groups; ++i) {
101 HuffmanTree* const htrees = htree_groups[i].htrees_;
102 for (j = 0; j < HUFFMAN_CODES_PER_META_CODE; ++j) {
103 VP8LHuffmanTreeFree(&htrees[j]);
104 }
105 }
106 WebPSafeFree(htree_groups);
107 }
108 }
109
VP8LHuffmanCodeLengthsToCodes(const int * const code_lengths,int code_lengths_size,int * const huff_codes)110 int VP8LHuffmanCodeLengthsToCodes(
111 const int* const code_lengths, int code_lengths_size,
112 int* const huff_codes) {
113 int symbol;
114 int code_len;
115 int code_length_hist[MAX_ALLOWED_CODE_LENGTH + 1] = { 0 };
116 int curr_code;
117 int next_codes[MAX_ALLOWED_CODE_LENGTH + 1] = { 0 };
118 int max_code_length = 0;
119
120 assert(code_lengths != NULL);
121 assert(code_lengths_size > 0);
122 assert(huff_codes != NULL);
123
124 // Calculate max code length.
125 for (symbol = 0; symbol < code_lengths_size; ++symbol) {
126 if (code_lengths[symbol] > max_code_length) {
127 max_code_length = code_lengths[symbol];
128 }
129 }
130 if (max_code_length > MAX_ALLOWED_CODE_LENGTH) return 0;
131
132 // Calculate code length histogram.
133 for (symbol = 0; symbol < code_lengths_size; ++symbol) {
134 ++code_length_hist[code_lengths[symbol]];
135 }
136 code_length_hist[0] = 0;
137
138 // Calculate the initial values of 'next_codes' for each code length.
139 // next_codes[code_len] denotes the code to be assigned to the next symbol
140 // of code length 'code_len'.
141 curr_code = 0;
142 next_codes[0] = -1; // Unused, as code length = 0 implies code doesn't exist.
143 for (code_len = 1; code_len <= max_code_length; ++code_len) {
144 curr_code = (curr_code + code_length_hist[code_len - 1]) << 1;
145 next_codes[code_len] = curr_code;
146 }
147
148 // Get symbols.
149 for (symbol = 0; symbol < code_lengths_size; ++symbol) {
150 if (code_lengths[symbol] > 0) {
151 huff_codes[symbol] = next_codes[code_lengths[symbol]]++;
152 } else {
153 huff_codes[symbol] = NON_EXISTENT_SYMBOL;
154 }
155 }
156 return 1;
157 }
158
159 #ifndef USE_LUT_REVERSE_BITS
160
ReverseBitsShort(int bits,int num_bits)161 static int ReverseBitsShort(int bits, int num_bits) {
162 int retval = 0;
163 int i;
164 assert(num_bits <= 8); // Not a hard requirement, just for coherency.
165 for (i = 0; i < num_bits; ++i) {
166 retval <<= 1;
167 retval |= bits & 1;
168 bits >>= 1;
169 }
170 return retval;
171 }
172
173 #else
174
175 static const uint8_t kReversedBits[16] = { // Pre-reversed 4-bit values.
176 0x0, 0x8, 0x4, 0xc, 0x2, 0xa, 0x6, 0xe,
177 0x1, 0x9, 0x5, 0xd, 0x3, 0xb, 0x7, 0xf
178 };
179
ReverseBitsShort(int bits,int num_bits)180 static int ReverseBitsShort(int bits, int num_bits) {
181 const uint8_t v = (kReversedBits[bits & 0xf] << 4) | kReversedBits[bits >> 4];
182 assert(num_bits <= 8);
183 return v >> (8 - num_bits);
184 }
185
186 #endif
187
TreeAddSymbol(HuffmanTree * const tree,int symbol,int code,int code_length)188 static int TreeAddSymbol(HuffmanTree* const tree,
189 int symbol, int code, int code_length) {
190 int step = HUFF_LUT_BITS;
191 int base_code;
192 HuffmanTreeNode* node = tree->root_;
193 const HuffmanTreeNode* const max_node = tree->root_ + tree->max_nodes_;
194 assert(symbol == (int16_t)symbol);
195 if (code_length <= HUFF_LUT_BITS) {
196 int i;
197 base_code = ReverseBitsShort(code, code_length);
198 for (i = 0; i < (1 << (HUFF_LUT_BITS - code_length)); ++i) {
199 const int idx = base_code | (i << code_length);
200 tree->lut_symbol_[idx] = (int16_t)symbol;
201 tree->lut_bits_[idx] = code_length;
202 }
203 } else {
204 base_code = ReverseBitsShort((code >> (code_length - HUFF_LUT_BITS)),
205 HUFF_LUT_BITS);
206 }
207 while (code_length-- > 0) {
208 if (node >= max_node) {
209 return 0;
210 }
211 if (NodeIsEmpty(node)) {
212 if (IsFull(tree)) return 0; // error: too many symbols.
213 AssignChildren(tree, node);
214 } else if (!HuffmanTreeNodeIsNotLeaf(node)) {
215 return 0; // leaf is already occupied.
216 }
217 node += node->children_ + ((code >> code_length) & 1);
218 if (--step == 0) {
219 tree->lut_jump_[base_code] = (int16_t)(node - tree->root_);
220 }
221 }
222 if (NodeIsEmpty(node)) {
223 node->children_ = 0; // turn newly created node into a leaf.
224 } else if (HuffmanTreeNodeIsNotLeaf(node)) {
225 return 0; // trying to assign a symbol to already used code.
226 }
227 node->symbol_ = symbol; // Add symbol in this node.
228 return 1;
229 }
230
VP8LHuffmanTreeBuildImplicit(HuffmanTree * const tree,const int * const code_lengths,int * const codes,int code_lengths_size)231 int VP8LHuffmanTreeBuildImplicit(HuffmanTree* const tree,
232 const int* const code_lengths,
233 int* const codes,
234 int code_lengths_size) {
235 int symbol;
236 int num_symbols = 0;
237 int root_symbol = 0;
238
239 assert(tree != NULL);
240 assert(code_lengths != NULL);
241
242 // Find out number of symbols and the root symbol.
243 for (symbol = 0; symbol < code_lengths_size; ++symbol) {
244 if (code_lengths[symbol] > 0) {
245 // Note: code length = 0 indicates non-existent symbol.
246 ++num_symbols;
247 root_symbol = symbol;
248 }
249 }
250
251 // Initialize the tree. Will fail for num_symbols = 0
252 if (!TreeInit(tree, num_symbols)) return 0;
253
254 // Build tree.
255 if (num_symbols == 1) { // Trivial case.
256 const int max_symbol = code_lengths_size;
257 if (root_symbol < 0 || root_symbol >= max_symbol) {
258 VP8LHuffmanTreeFree(tree);
259 return 0;
260 }
261 return TreeAddSymbol(tree, root_symbol, 0, 0);
262 } else { // Normal case.
263 int ok = 0;
264 memset(codes, 0, code_lengths_size * sizeof(*codes));
265
266 if (!VP8LHuffmanCodeLengthsToCodes(code_lengths, code_lengths_size,
267 codes)) {
268 goto End;
269 }
270
271 // Add symbols one-by-one.
272 for (symbol = 0; symbol < code_lengths_size; ++symbol) {
273 if (code_lengths[symbol] > 0) {
274 if (!TreeAddSymbol(tree, symbol, codes[symbol],
275 code_lengths[symbol])) {
276 goto End;
277 }
278 }
279 }
280 ok = 1;
281 End:
282 ok = ok && IsFull(tree);
283 if (!ok) VP8LHuffmanTreeFree(tree);
284 return ok;
285 }
286 }
287
VP8LHuffmanTreeBuildExplicit(HuffmanTree * const tree,const int * const code_lengths,const int * const codes,const int * const symbols,int max_symbol,int num_symbols)288 int VP8LHuffmanTreeBuildExplicit(HuffmanTree* const tree,
289 const int* const code_lengths,
290 const int* const codes,
291 const int* const symbols, int max_symbol,
292 int num_symbols) {
293 int ok = 0;
294 int i;
295 assert(tree != NULL);
296 assert(code_lengths != NULL);
297 assert(codes != NULL);
298 assert(symbols != NULL);
299
300 // Initialize the tree. Will fail if num_symbols = 0.
301 if (!TreeInit(tree, num_symbols)) return 0;
302
303 // Add symbols one-by-one.
304 for (i = 0; i < num_symbols; ++i) {
305 if (codes[i] != NON_EXISTENT_SYMBOL) {
306 if (symbols[i] < 0 || symbols[i] >= max_symbol) {
307 goto End;
308 }
309 if (!TreeAddSymbol(tree, symbols[i], codes[i], code_lengths[i])) {
310 goto End;
311 }
312 }
313 }
314 ok = 1;
315 End:
316 ok = ok && IsFull(tree);
317 if (!ok) VP8LHuffmanTreeFree(tree);
318 return ok;
319 }
320