sources/huffman/huffcodec.cpp

changeset 8
8b697d30c49f
equal deleted inserted replaced
7:01e4e9ae323a 8:8b697d30c49f
1 /*
2 * skulltag::HuffmanCodec class - Huffman encoder and decoder.
3 *
4 * Copyright 2009 Timothy Landers
5 * email: code.vortexcortex@gmail.com
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining a copy
8 * of this software and associated documentation files (the "Software"), to deal
9 * in the Software without restriction, including without limitation the rights
10 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
11 * copies of the Software, and to permit persons to whom the Software is
12 * furnished to do so, subject to the following conditions:
13 *
14 * The above copyright notice and this permission notice shall be included in
15 * all copies or substantial portions of the Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
20 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
23 * THE SOFTWARE.
24 */
25
26 #include "huffcodec.h"
27
28 /** Prevents naming convention problems via encapsulation. */
29 namespace skulltag {
30
31 // HuffmanCodec Implementation
32
33 /** Reverses the order of bits in a byte.
34 * EG: The statement <code>reverseMap[0xAF] == 0xF5</code> is <code>true</code>. <br>
35 * The index <code>10101111</code> stores the reverse value: <code>11110101</code>. <br>
36 * Note: One array lookup is much faster than Eight bit manipulating loop iterations. */
37 unsigned char const HuffmanCodec::reverseMap[] = {
38 0,128, 64,192, 32,160, 96,224, 16,144, 80,208, 48,176,112,240,
39 8,136, 72,200, 40,168,104,232, 24,152, 88,216, 56,184,120,248,
40 4,132, 68,196, 36,164,100,228, 20,148, 84,212, 52,180,116,244,
41 12,140, 76,204, 44,172,108,236, 28,156, 92,220, 60,188,124,252,
42 2,130, 66,194, 34,162, 98,226, 18,146, 82,210, 50,178,114,242,
43 10,138, 74,202, 42,170,106,234, 26,154, 90,218, 58,186,122,250,
44 6,134, 70,198, 38,166,102,230, 22,150, 86,214, 54,182,118,246,
45 14,142, 78,206, 46,174,110,238, 30,158, 94,222, 62,190,126,254,
46 1,129, 65,193, 33,161, 97,225, 17,145, 81,209, 49,177,113,241,
47 9,137, 73,201, 41,169,105,233, 25,153, 89,217, 57,185,121,249,
48 5,133, 69,197, 37,165,101,229, 21,149, 85,213, 53,181,117,245,
49 13,141, 77,205, 45,173,109,237, 29,157, 93,221, 61,189,125,253,
50 3,131, 67,195, 35,163, 99,227, 19,147, 83,211, 51,179,115,243,
51 11,139, 75,203, 43,171,107,235, 27,155, 91,219, 59,187,123,251,
52 7,135, 71,199, 39,167,103,231, 23,151, 87,215, 55,183,119,247,
53 15,143, 79,207, 47,175,111,239, 31,159, 95,223, 63,191,127,255
54 };
55
56 /** Creates a new HuffmanCodec
57 * @param treeData char array containing the tree data to use.
58 * @param dataLength number of chars in treeData. */
59 HuffmanCodec::HuffmanCodec(
60 unsigned char const * const treeData,
61 int dataLength
62 ) : Codec() {
63 init();
64 // init code table (256 pointers to Huffman Leaf Nodes.)
65 codeTable = new HuffmanNode*[256];
66 for (int i = 0; i < 256; i++) codeTable[i] = 0;
67 // build root node
68 root = new HuffmanNode;
69 root->bitCount = 0;
70 root->code = 0;
71 root->value = -1;
72 // recursive Huffman tree builder.
73 buildTree( root, treeData, 0, dataLength, codeTable, 256 );
74 huffResourceOwner = true;
75 }
76
77
78 /** Creates a new HuffmanCodec that uses the specified Huffman resources.
79 * @param treeRootNode The root node of a valid huffman tree.
80 * @param leafCodeTable A code lookup table where references to HuffmanNodes are stored with their array index equal to their value.
81 * Note: The tree nodes will not be released upon destruction of this HuffmanCodec. */
82 HuffmanCodec::HuffmanCodec(
83 HuffmanNode * treeRootNode,
84 HuffmanNode ** leafCodeTable
85 ){
86 init();
87 // assign values -- no table building or allocations.
88 root = treeRootNode;
89 codeTable = leafCodeTable;
90 huffResourceOwner = false;
91 }
92
93 /** Checks the ownership state of this HuffmanCodec's resources.
94 * @return true if the tree & code table will be released upon destruction of this HuffmanCodec. <br>
95 * A false return value means this HuffmanCodec is not responsible for deleting its resources. */
96 bool HuffmanCodec::huffmanResourceOwner(){
97 return huffResourceOwner;
98 }
99
100 /** Perform initialization procedures common to all constructors. */
101 void HuffmanCodec::init(){
102 writer = new BitWriter();
103 reverseBits = false;
104 expandable = true;
105 huffResourceOwner = false;
106 }
107
108 /** Increases a codeLength up to the longest Huffman code bit length found in the node or any of its children. <br>
109 * Set to Zero before calling to determine maximum code bit length.
110 * @param node in: The node to begin searching at.
111 * @param codeLength out: Variable to hold the longest code bit length found. */
112 void HuffmanCodec::maxCodeLength( HuffmanNode const * const node, int &codeLength ){
113 // [TL] We must walk each tree node since the codeTable may not contain the set of all leaf nodes.
114 // bail on NULL node (tree is corrupt).
115 if ( node == 0) return;
116 // Recurse across children if they exist.
117 if ( node->branch != 0 ){
118 maxCodeLength( &(node->branch[0]), codeLength );
119 maxCodeLength( &(node->branch[1]), codeLength );
120 } else if ( codeLength < node->bitCount ){
121 // set codeLength if it's smaller than current node's bitCount.
122 codeLength = node->bitCount;
123 }
124 }
125
126 /** Decreases a codeLength to the shortest Huffman code bit length found in the node or any of its children. <br>
127 * Set to Zero before calling to determine minimum code bit length.
128 * @param node in: The node to begin searching at.
129 * @param codeLength out: Variable to hold the longest code bit length found. */
130 void HuffmanCodec::minCodeLength( HuffmanNode const * const node, int &codeLength ){
131 /* [TL] Do not optimize under the assumption child nodes will have longer code Lengths!
132 * Future subclasses may have trees that diverge from Huffman specs. */
133 // bail on NULL node (tree is corrupt).
134 if ( node == 0 ) return;
135 // Recurse across children if they exist.
136 if ( node->branch != 0 ){
137 minCodeLength( &(node->branch[0]), codeLength );
138 minCodeLength( &(node->branch[1]), codeLength );
139 } else if ( (codeLength > node->bitCount) || (codeLength == 0) ) {
140 // set codeLength if it's Zero or larger than current node's bitCount.
141 codeLength = node->bitCount;
142 }
143 }
144
145 /** Recursively builds a Huffman Tree. <br>
146 * The initial root node should have the following field values: <br>
147 * <pre>
148 * bitCount : 0
149 * code : 0
150 * value : -1
151 * branch : 0 (NULL)
152 * </pre>
153 * @param node in/out: branch node of the Huffman Tree.
154 * @param treeData in: char array containing the Huffman Tree's byte representation.
155 * @param index in: Current array element to read the next tree node from.
156 * @param dataLength in: Length of treeData
157 * @param codeTable in/out: array of pointers to HuffmanNode structs.
158 * @param tableLength in: maximum index allowed in the codeTable.
159 * @return the next index to read from or -1 if an error occurs.
160 * */
161 int HuffmanCodec::buildTree(
162 HuffmanNode * node,
163 unsigned char const * const treeData,
164 int index,
165 int dataLength,
166 HuffmanNode ** const &codeTable,
167 int tableLength
168 ){
169 if ( index >= dataLength ) return -1;
170 // Read the branch description bit field
171 int desc = treeData[index];
172 index++;
173
174 // Create the array that will hold L/R child nodes of this branch.
175 node->branch = new HuffmanNode[2];
176
177 // Read the child Nodes for this branch.
178 for ( int i = 0; i < 2; i++ ){
179 // Increase bit count, and update huffman code to match the node's tree position.
180 node->branch[i].bitCount = node->bitCount + 1;
181 node->branch[i].code = (node->code << 1) | i; // appends a 0 or 1 depending on L/R branch.
182 node->branch[i].value = -1; // default value.
183
184 // Test a bit from the branch description (least significant bit == left)
185 if ( (desc & (1 << i)) == 0 ){
186 // Child node is a branch; Recurse.
187 if ( (index = buildTree( &(node->branch[i]), treeData, index, dataLength, codeTable, tableLength )) < 0 ) return -1;
188 // This means the entire left sub tree will be read before the right sub tree gets read.
189 } else {
190 // Read leaf value and map its value/index in the nodes array.
191 if ( index >= dataLength ) return -1;
192 // set the nodes huffman code values.
193 node->branch[i].code = (node->code << 1) | i;
194 node->branch[i].bitCount = node->bitCount+1;
195 node->branch[i].value = treeData[index] & 0xff;
196 // NULL the child node's branch to mark it as a leaf.
197 node->branch[i].branch = 0;
198 // buffer overflow check.
199 if ( (node->branch[i].value >= 0) && (node->branch[i].value <= tableLength ) )
200 // store a pointer to the leaf node into the code table at the location of its byte value.
201 codeTable[ node->branch[i].value ] = &node->branch[i];
202 index++;
203 }
204 }
205
206 return index;
207 }
208
209 /** Decodes data read from an input buffer and stores the result in the output buffer.
210 * @return number of bytes stored in the output buffer or -1 if an error occurs while encoding. */
211 int HuffmanCodec::encode(
212 unsigned char const * const input, /**< in: pointer to the first byte to encode. */
213 unsigned char * const output, /**< out: pointer to an output buffer to store data. */
214 int const &inLength, /**< in: number of bytes of input buffer to encoded. */
215 int const &outLength /**< in: maximum length of data to output. */
216 ) const {
217 // setup the bit buffer to output. if not expandable Limit output to input length.
218 if ( expandable ) writer->outputBuffer( output, outLength );
219 else writer->outputBuffer( output, ((inLength + 1) < outLength) ? inLength + 1 : outLength );
220
221 writer->put( (unsigned char)0 ); // reserve place for padding signal.
222
223 HuffmanNode * node; // temp ptr cache;
224 for ( int i = 0; i < inLength; i++ ){
225 node = codeTable[ 0xff & input[i] ]; //lookup node
226 // Put the huffman code into the bit buffer and bail if error occurs.
227 if ( !writer->put( node->code, node->bitCount ) ) return -1;
228 }
229 int bytesWritten, padding;
230 if ( writer->finish( bytesWritten, padding ) ){
231 // write padding signal byte to begining of stream.
232 output[0] = (unsigned char)padding;
233 } else return -1;
234
235 // Reverse the bit order of each byte (Old Huffman Compatibility Mode)
236 if ( reverseBits ) for ( int i = 1; i < bytesWritten; i++ ){
237 output[i] = reverseMap[ 0xff & output[i] ];
238 }
239
240 return bytesWritten;
241 } // end function encode
242
243 /** Decodes data read from an input buffer and stores the result in the output buffer.
244 * @return number of bytes stored in the output buffer or -1 if an error occurs while decoding. */
245 int HuffmanCodec::decode(
246 unsigned char const * const input, /**< in: pointer to data that needs decoding. */
247 unsigned char * const output, /**< out: pointer to output buffer to store decoded data. */
248 int const &inLength, /**< in: number of bytes of input buffer to read. */
249 int const &outLength /**< in: maximum length of data to output. */
250 ){
251 if ( inLength < 1 ) return 0;
252 int bitsAvailable = ((inLength-1) << 3) - (0xff & input[0]);
253 int rIndex = 1; // read index of input buffer.
254 int wIndex = 0; // write index of output buffer.
255 char byte = 0; // bits of the current byte.
256 int bitsLeft = 0; // bits left in byte;
257
258 HuffmanNode * node = root;
259
260 // Traverse the tree, output values.
261 while ( (bitsAvailable > 0) && (node != 0) ){
262
263 // Get the next byte if we've run out.
264 if ( bitsLeft <= 0 ){
265 byte = input[rIndex++];
266 if ( reverseBits ) byte = reverseMap[ 0xff & byte ];
267 bitsLeft = 8;
268 }
269
270 // Traverse the tree according to the most significant bit.
271 node = &(node->branch[ ((byte >> 7) & 0x01) ]);
272
273 // Is the node Non NULL, and a leaf?
274 if ( (node != 0) && (node->branch == 0) ){
275 // buffer overflow prevention
276 if ( wIndex >= outLength ) return wIndex;
277 // Output leaf node's value and restart traversal at root node.
278 output[ wIndex++ ] = (unsigned char)(node->value & 0xff);
279 node = root;
280 }
281
282 byte <<= 1; // cue up the next bit
283 bitsLeft--; // use up one bit of byte
284 bitsAvailable--; // decrement total bits left
285 }
286
287 return wIndex;
288 } // end function decode
289
290 /** Deletes all sub nodes of a HuffmanNode by traversing and deleting its child nodes.
291 * @param treeNode pointer to a HuffmanNode whos children will be deleted. */
292 void HuffmanCodec::deleteTree( HuffmanNode * treeNode ){
293 if ( treeNode == 0 ) return;
294 if ( treeNode->branch != 0 ){
295 deleteTree( &(treeNode->branch[0]) );
296 deleteTree( &(treeNode->branch[1]) );
297 delete treeNode->branch;
298 }
299 }
300
301 /** Destructor - frees resources. */
302 HuffmanCodec::~HuffmanCodec() {
303 delete writer;
304 //check for resource ownership before deletion
305 if ( huffmanResourceOwner() ){
306 delete codeTable;
307 deleteTree( root );
308 delete root;
309 }
310 }
311
312 /** Enables or Disables backwards bit ordering of bytes.
313 * @param backwards "true" enables reversed bit order bytes, "false" uses standard byte bit ordering. */
314 void HuffmanCodec::reversedBytes( bool backwards ){ reverseBits = backwards; }
315
316 /** Check the state of backwards bit ordering for bytes.
317 * @return true: bits within bytes are reversed. false: bits within bytes are normal. */
318 bool HuffmanCodec::reversedBytes(){ return reverseBits; }
319
320 /** Enable or Disable data expansion during encoding.
321 * @param expandingAllowed "true" allows encoding to expand data. "false" causes failure upon expansion. */
322 void HuffmanCodec::allowExpansion( bool expandingAllowed ){ expandable = expandingAllowed; }
323
324 /** Check the state of data expandability.
325 * @return true: data expansion is allowed. false: data is not allowed to expand. */
326 bool HuffmanCodec::allowExpansion(){ return expandable; }
327
328
329 }; // end namespace skulltag

mercurial