• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Copyright 2012 Google Inc. All Rights Reserved.
2 //
3 // Use of this source code is governed by a BSD-style license
4 // that can be found in the COPYING file in the root of the source
5 // tree. An additional intellectual property rights grant can be found
6 // in the file PATENTS. All contributing project authors may
7 // be found in the AUTHORS file in the root of the source tree.
8 // -----------------------------------------------------------------------------
9 //
10 // Utilities for building and looking up Huffman trees.
11 //
12 // Author: Urvang Joshi (urvang@google.com)
13 
14 #include <assert.h>
15 #include <stdlib.h>
16 #include "./huffman.h"
17 #include "../utils/utils.h"
18 #include "webp/format_constants.h"
19 
20 #if defined(__cplusplus) || defined(c_plusplus)
21 extern "C" {
22 #endif
23 
24 #define NON_EXISTENT_SYMBOL (-1)
25 
TreeNodeInit(HuffmanTreeNode * const node)26 static void TreeNodeInit(HuffmanTreeNode* const node) {
27   node->children_ = -1;   // means: 'unassigned so far'
28 }
29 
NodeIsEmpty(const HuffmanTreeNode * const node)30 static int NodeIsEmpty(const HuffmanTreeNode* const node) {
31   return (node->children_ < 0);
32 }
33 
IsFull(const HuffmanTree * const tree)34 static int IsFull(const HuffmanTree* const tree) {
35   return (tree->num_nodes_ == tree->max_nodes_);
36 }
37 
AssignChildren(HuffmanTree * const tree,HuffmanTreeNode * const node)38 static void AssignChildren(HuffmanTree* const tree,
39                            HuffmanTreeNode* const node) {
40   HuffmanTreeNode* const children = tree->root_ + tree->num_nodes_;
41   node->children_ = (int)(children - node);
42   assert(children - node == (int)(children - node));
43   tree->num_nodes_ += 2;
44   TreeNodeInit(children + 0);
45   TreeNodeInit(children + 1);
46 }
47 
TreeInit(HuffmanTree * const tree,int num_leaves)48 static int TreeInit(HuffmanTree* const tree, int num_leaves) {
49   assert(tree != NULL);
50   if (num_leaves == 0) return 0;
51   // We allocate maximum possible nodes in the tree at once.
52   // Note that a Huffman tree is a full binary tree; and in a full binary tree
53   // with L leaves, the total number of nodes N = 2 * L - 1.
54   tree->max_nodes_ = 2 * num_leaves - 1;
55   tree->root_ = (HuffmanTreeNode*)WebPSafeMalloc((uint64_t)tree->max_nodes_,
56                                                  sizeof(*tree->root_));
57   if (tree->root_ == NULL) return 0;
58   TreeNodeInit(tree->root_);  // Initialize root.
59   tree->num_nodes_ = 1;
60   return 1;
61 }
62 
HuffmanTreeRelease(HuffmanTree * const tree)63 void HuffmanTreeRelease(HuffmanTree* const tree) {
64   if (tree != NULL) {
65     free(tree->root_);
66     tree->root_ = NULL;
67     tree->max_nodes_ = 0;
68     tree->num_nodes_ = 0;
69   }
70 }
71 
HuffmanCodeLengthsToCodes(const int * const code_lengths,int code_lengths_size,int * const huff_codes)72 int HuffmanCodeLengthsToCodes(const int* const code_lengths,
73                               int code_lengths_size, int* const huff_codes) {
74   int symbol;
75   int code_len;
76   int code_length_hist[MAX_ALLOWED_CODE_LENGTH + 1] = { 0 };
77   int curr_code;
78   int next_codes[MAX_ALLOWED_CODE_LENGTH + 1] = { 0 };
79   int max_code_length = 0;
80 
81   assert(code_lengths != NULL);
82   assert(code_lengths_size > 0);
83   assert(huff_codes != NULL);
84 
85   // Calculate max code length.
86   for (symbol = 0; symbol < code_lengths_size; ++symbol) {
87     if (code_lengths[symbol] > max_code_length) {
88       max_code_length = code_lengths[symbol];
89     }
90   }
91   if (max_code_length > MAX_ALLOWED_CODE_LENGTH) return 0;
92 
93   // Calculate code length histogram.
94   for (symbol = 0; symbol < code_lengths_size; ++symbol) {
95     ++code_length_hist[code_lengths[symbol]];
96   }
97   code_length_hist[0] = 0;
98 
99   // Calculate the initial values of 'next_codes' for each code length.
100   // next_codes[code_len] denotes the code to be assigned to the next symbol
101   // of code length 'code_len'.
102   curr_code = 0;
103   next_codes[0] = -1;  // Unused, as code length = 0 implies code doesn't exist.
104   for (code_len = 1; code_len <= max_code_length; ++code_len) {
105     curr_code = (curr_code + code_length_hist[code_len - 1]) << 1;
106     next_codes[code_len] = curr_code;
107   }
108 
109   // Get symbols.
110   for (symbol = 0; symbol < code_lengths_size; ++symbol) {
111     if (code_lengths[symbol] > 0) {
112       huff_codes[symbol] = next_codes[code_lengths[symbol]]++;
113     } else {
114       huff_codes[symbol] = NON_EXISTENT_SYMBOL;
115     }
116   }
117   return 1;
118 }
119 
TreeAddSymbol(HuffmanTree * const tree,int symbol,int code,int code_length)120 static int TreeAddSymbol(HuffmanTree* const tree,
121                          int symbol, int code, int code_length) {
122   HuffmanTreeNode* node = tree->root_;
123   const HuffmanTreeNode* const max_node = tree->root_ + tree->max_nodes_;
124   while (code_length-- > 0) {
125     if (node >= max_node) {
126       return 0;
127     }
128     if (NodeIsEmpty(node)) {
129       if (IsFull(tree)) return 0;    // error: too many symbols.
130       AssignChildren(tree, node);
131     } else if (HuffmanTreeNodeIsLeaf(node)) {
132       return 0;  // leaf is already occupied.
133     }
134     node += node->children_ + ((code >> code_length) & 1);
135   }
136   if (NodeIsEmpty(node)) {
137     node->children_ = 0;      // turn newly created node into a leaf.
138   } else if (!HuffmanTreeNodeIsLeaf(node)) {
139     return 0;   // trying to assign a symbol to already used code.
140   }
141   node->symbol_ = symbol;  // Add symbol in this node.
142   return 1;
143 }
144 
HuffmanTreeBuildImplicit(HuffmanTree * const tree,const int * const code_lengths,int code_lengths_size)145 int HuffmanTreeBuildImplicit(HuffmanTree* const tree,
146                              const int* const code_lengths,
147                              int code_lengths_size) {
148   int symbol;
149   int num_symbols = 0;
150   int root_symbol = 0;
151 
152   assert(tree != NULL);
153   assert(code_lengths != NULL);
154 
155   // Find out number of symbols and the root symbol.
156   for (symbol = 0; symbol < code_lengths_size; ++symbol) {
157     if (code_lengths[symbol] > 0) {
158       // Note: code length = 0 indicates non-existent symbol.
159       ++num_symbols;
160       root_symbol = symbol;
161     }
162   }
163 
164   // Initialize the tree. Will fail for num_symbols = 0
165   if (!TreeInit(tree, num_symbols)) return 0;
166 
167   // Build tree.
168   if (num_symbols == 1) {  // Trivial case.
169     const int max_symbol = code_lengths_size;
170     if (root_symbol < 0 || root_symbol >= max_symbol) {
171       HuffmanTreeRelease(tree);
172       return 0;
173     }
174     return TreeAddSymbol(tree, root_symbol, 0, 0);
175   } else {  // Normal case.
176     int ok = 0;
177 
178     // Get Huffman codes from the code lengths.
179     int* const codes =
180         (int*)WebPSafeMalloc((uint64_t)code_lengths_size, sizeof(*codes));
181     if (codes == NULL) goto End;
182 
183     if (!HuffmanCodeLengthsToCodes(code_lengths, code_lengths_size, codes)) {
184       goto End;
185     }
186 
187     // Add symbols one-by-one.
188     for (symbol = 0; symbol < code_lengths_size; ++symbol) {
189       if (code_lengths[symbol] > 0) {
190         if (!TreeAddSymbol(tree, symbol, codes[symbol], code_lengths[symbol])) {
191           goto End;
192         }
193       }
194     }
195     ok = 1;
196  End:
197     free(codes);
198     ok = ok && IsFull(tree);
199     if (!ok) HuffmanTreeRelease(tree);
200     return ok;
201   }
202 }
203 
HuffmanTreeBuildExplicit(HuffmanTree * const tree,const int * const code_lengths,const int * const codes,const int * const symbols,int max_symbol,int num_symbols)204 int HuffmanTreeBuildExplicit(HuffmanTree* const tree,
205                              const int* const code_lengths,
206                              const int* const codes,
207                              const int* const symbols, int max_symbol,
208                              int num_symbols) {
209   int ok = 0;
210   int i;
211 
212   assert(tree != NULL);
213   assert(code_lengths != NULL);
214   assert(codes != NULL);
215   assert(symbols != NULL);
216 
217   // Initialize the tree. Will fail if num_symbols = 0.
218   if (!TreeInit(tree, num_symbols)) return 0;
219 
220   // Add symbols one-by-one.
221   for (i = 0; i < num_symbols; ++i) {
222     if (codes[i] != NON_EXISTENT_SYMBOL) {
223       if (symbols[i] < 0 || symbols[i] >= max_symbol) {
224         goto End;
225       }
226       if (!TreeAddSymbol(tree, symbols[i], codes[i], code_lengths[i])) {
227         goto End;
228       }
229     }
230   }
231   ok = 1;
232  End:
233   ok = ok && IsFull(tree);
234   if (!ok) HuffmanTreeRelease(tree);
235   return ok;
236 }
237 
238 #if defined(__cplusplus) || defined(c_plusplus)
239 }    // extern "C"
240 #endif
241