gem5  v21.0.0.0
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
huffman.cc
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2019, 2020 Inria
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions are
7  * met: redistributions of source code must retain the above copyright
8  * notice, this list of conditions and the following disclaimer;
9  * redistributions in binary form must reproduce the above copyright
10  * notice, this list of conditions and the following disclaimer in the
11  * documentation and/or other materials provided with the distribution;
12  * neither the name of the copyright holders nor the names of its
13  * contributors may be used to endorse or promote products derived from
14  * this software without specific prior written permission.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27  */
28 
30 
31 #include <cassert>
32 
33 #include "base/logging.hh"
34 
35 namespace Compressor {
36 namespace Encoder {
37 
38 Huffman::Huffman(uint64_t max_code_length)
39  : Base(), maxCodeLength(max_code_length)
40 {
42  "Code length cannot surpass its underlying container");
43 }
44 
45 void
46 Huffman::sample(uint64_t value, uint64_t frequency)
47 {
48  if (frequency != 0) {
49  trees.push(new Node(value, frequency));
50  }
51 }
52 
53 std::unique_ptr<Huffman::Node>
55 {
56  // Construct tree by assigning left and right nodes. The left path leads
57  // to the most frequent values
58  while (trees.size() > 1) {
59  Node* left = trees.top();
60  trees.pop();
61 
62  Node* right = trees.top();
63  trees.pop();
64 
65  Node* parent = new Node(left, right);
66  trees.push(parent);
67  }
68 
69  // All queue entries have been merged into a single entry containing
70  // the tree
71  Node* root = trees.top();
72  trees.pop();
73  return std::unique_ptr<Node>(root);
74 }
75 
76 void
78 {
79  valueToCode.clear();
80  codeToValue.clear();
81  generateCodes(buildTree().get(), Code());
82 }
83 
84 void
85 Huffman::generateCodes(const Node* node, const Code& current_code)
86 {
87  // Drop all entries with length greater than maxCodeLength
88  if (current_code.length > maxCodeLength) {
89  return;
90  }
91 
92  if (node->isLeaf()) {
93  valueToCode[node->getValue()] = current_code;
94  codeToValue[current_code.code] = node->getValue();
95  } else {
96  Code right_code = current_code;
97  right_code.code = (right_code.code << 1) + 1;
98  right_code.length++;
99  generateCodes(node->getRightSubTree(), right_code);
100 
101  Code left_code = current_code;
102  left_code.code = left_code.code << 1;
103  left_code.length++;
104  generateCodes(node->getLeftSubTree(), left_code);
105  }
106 }
107 
108 Code
109 Huffman::encode(const uint64_t val) const
110 {
111  auto it = valueToCode.find(val);
112  if (it == valueToCode.end()) {
113  // If the value is unknown, generate a dummy code with invalid
114  // length to let the caller know the encoding is invalid
115  Code dummy_code;
116  dummy_code.code = 0;
117  dummy_code.length = 65;
118  return dummy_code;
119  } else {
120  return it->second;
121  }
122 }
123 
124 uint64_t
125 Huffman::decode(const uint64_t code) const
126 {
127  // A code that does not exist cannot be decoded
128  auto it = codeToValue.find(code);
129  assert(it != codeToValue.end());
130  return it->second;
131 }
132 
133 } // namespace Encoder
134 } // namespace Compressor
Compressor::Encoder::Huffman::trees
std::priority_queue< Node *, std::vector< Node * >, NodeComparator > trees
Definition: huffman.hh:155
Compressor::Encoder::Huffman::maxCodeLength
const unsigned maxCodeLength
Maximum number of bits in a codeword.
Definition: huffman.hh:134
Compressor
Definition: base.cc:47
Compressor::Encoder::Huffman::Node::getLeftSubTree
const Node * getLeftSubTree() const
Definition: huffman.hh:126
Compressor::Encoder::Huffman::generateCodeMaps
void generateCodeMaps()
Generation of the code maps.
Definition: huffman.cc:77
Compressor::Encoder::Code::code
uint64_t code
Only the least-significant bits of the code are relevant.
Definition: base.hh:40
Compressor::Encoder::Huffman::sample
void sample(uint64_t value, uint64_t frequency)
Inserts the value-frequency pair in the tree.
Definition: huffman.cc:46
Compressor::Encoder::Huffman::Node::getValue
uint64_t getValue() const
Get the leaf's value.
Definition: huffman.hh:120
Compressor::Encoder::Huffman::buildTree
std::unique_ptr< Node > buildTree()
Build a Huffman tree using the values and their respective frequencies, which have been provided through sample().
Definition: huffman.cc:54
Compressor::Encoder::Huffman::decode
uint64_t decode(const uint64_t code) const override
Decode a value.
Definition: huffman.cc:125
Compressor::Encoder::Code
Definition: base.hh:37
Compressor::Encoder::Huffman::valueToCode
std::map< uint64_t, Code > valueToCode
Table containing the codewords and their respective lengths.
Definition: huffman.hh:140
X86ISA::val
Bitfield< 63 > val
Definition: misc.hh:769
Compressor::Encoder::Huffman::Node::getRightSubTree
const Node * getRightSubTree() const
Definition: huffman.hh:127
Compressor::Encoder::Huffman::Huffman
Huffman(uint64_t max_code_length)
Definition: huffman.cc:38
Compressor::Encoder::Huffman::Node::isLeaf
bool isLeaf() const
Determine if the node is a leaf node by checking if it does not have sub-trees.
Definition: huffman.hh:109
Compressor::Encoder::Code::length
unsigned length
Number of bits in the code.
Definition: base.hh:42
logging.hh
huffman.hh
Compressor::Encoder::Huffman::generateCodes
void generateCodes(const Node *node, const Code &current_code)
Recursive function that generates the huffman codes based on the tree provided.
Definition: huffman.cc:85
fatal_if
#define fatal_if(cond,...)
Conditional fatal macro that checks the supplied condition and only causes a fatal error if the condition is true.
Definition: logging.hh:219
Compressor::Encoder::Huffman::codeToValue
std::map< uint64_t, uint64_t > codeToValue
Definition: huffman.hh:141
Compressor::Encoder::Base
Base class for encoders.
Definition: base.hh:50
Compressor::Encoder::Huffman::encode
Code encode(const uint64_t val) const override
The function responsible for the generation of the alternative value.
Definition: huffman.cc:109
Compressor::Encoder::Huffman::Node
Node for the Huffman tree.
Definition: huffman.hh:70

Generated on Tue Mar 23 2021 19:41:27 for gem5 by doxygen 1.8.17