-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathHCTree.cpp
219 lines (210 loc) · 6.43 KB
/
HCTree.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
/**
* Christopher Yeh
* Implementation of a HCTree.
* Methods for numerous encode and decodes for a naive approach, also
* space efficient implementations, as well as building the tree.
*/
#include "HCTree.hpp"
/** Use the Huffman algorithm to build a Huffman coding trie.
* PRECONDITION: freqs is a vector of ints, such that freqs[i] is
* the frequency of occurrence of byte i in the message.
* POSTCONDITION: root points to the root of the trie,
* and leaves[i] points to the leaf node containing byte i.
* @param freqs vector of ascii values and their frequency.
*/
void HCTree::build(const vector<int>& freqs) {
// Create our priority queue as a min-heap and add our freqs to it.
priority_queue<HCNode*, vector<HCNode*>, HCNodePtrComp> q;
for (int i = 0; i < freqs.size(); i++) {
if (freqs[i] != 0) {
auto node = new HCNode(freqs[i], i);
q.push(node);
}
}
HCNode* n0;
HCNode* n1;
// Begin building the Huffman trie.
if (q.size() == 1) { // File contains one character.
root = new HCNode(1, q.top()->symbol);
}
while (q.size() > 1) {
n0 = q.top();
q.pop();
n1 = q.top();
q.pop();
root = new HCNode(n0->count + n1->count, '\0');
// Set pointers.
if (n0->c0 == nullptr && n0->c1 == nullptr) {
leaves[n0->symbol] = n0;
}
if (n1->c0 == nullptr && n1->c1 == nullptr) {
leaves[n1->symbol] = n1;
}
root->c0 = n0;
n0->p = root;
root->c1 = n1;
n1->p = root;
q.push(root);
}
// Get the codes for our leaves.
HCNode* curr;
HCNode* prev;
for (HCNode* leaf : leaves) {
string code;
if (leaf != nullptr) {
curr = leaf;
while (curr->p != nullptr) {
prev = curr;
curr = curr->p;
if (curr->c0 == prev) {
code.insert(0, "0"); // Prepend.
} else {
code.insert(0, "1"); // Prepend.
}
}
codes[leaf->symbol] = code;
// cout << leaf->count << " : " << codes.at(leaf->symbol) << endl;
}
}
}
/** Use our encoding to build a Huffman coding trie.
* PRECONDITION: a file was properly encoded.
* @param in our input stream for bits.
*/
void HCTree::buildFromEncoding(BitInputStream& in) {
int charsEncountered = 0;
int bit;
bit = in.readBit();
root = new HCNode(bit, '\0');
HCNode* curr = root;
while (true) {
// Get to a node where we can set its children.
while (curr->c0 != nullptr && curr->c1 != nullptr) {
curr = curr->p;
if (curr == nullptr) {
break;
}
}
if (curr == nullptr) {
break;
}
bit = in.readBit();
// Create new node.
if (bit == 0) {
HCNode* newNode = new HCNode(bit, '\0');
newNode->p = curr;
if (curr->c0 == nullptr) {
curr->c0 = newNode;
curr = curr->c0;
} else {
curr->c1 = newNode;
curr = curr->c1;
}
} else {
byte symbol = in.readByte();
HCNode* newNode = new HCNode(bit, symbol);
newNode->p = curr;
if (curr->c0 == nullptr) {
curr->c0 = newNode;
} else {
curr->c1 = newNode;
}
}
}
}
/** Encode this tree with pre-order traversal.
* PRECONDITION: build() has been called, to create the coding
* tree, and initialize root pointer and leaves vector.
* @param out our input stream for bits.
* @param numCharacters how many total characters there are.
* @param numUniqueChars how many different ascii values there are.
*/
void HCTree::writeHeader(BitOutputStream& out,
unsigned int numCharacters, unsigned int numUniqueChars) const
{
out.writeInt(numCharacters);
// One character case.
if (numUniqueChars == 1) {
out.writeBit(1);
out.writeByte(root->symbol);
} else {
out.writeBit(0);
writeHeaderHelper(out, root);
}
}
/** Helper for writeHeader.
* @param out our input stream for bits.
* @param parent root to be handed for recursion.
*/
void HCTree::writeHeaderHelper(BitOutputStream& out, HCNode* parent) const {
if (parent == nullptr) {
return;
} else if (parent->c0 == nullptr && parent->c1 == nullptr) { // Is a leaf:
// Flag we found a leaf.
out.writeBit(1);
// Encode the symbol at the leaf in 8 bits.
out.writeByte(parent->symbol);
} else {
// Flag we are at a non-leaf.
out.writeBit(0);
}
writeHeaderHelper(out, parent->c0);
writeHeaderHelper(out, parent->c1);
}
/** Write to the given BitOutputStream.
* the sequence of bits coding the given symbol.
* PRECONDITION: build() has been called, to create the coding
* tree, and initialize root pointer and leaves vector.
* @param symbol 8 bits to be encoded.
* @param out our output stream.
*/
void HCTree::encode(byte symbol, BitOutputStream& out) const {
string code = codes.at(symbol);
for (char& bit : code) {
out.writeBit((unsigned int) (bit - CHAR_TO_INT));
}
}
/** Make sure we get the last byte in.
* @param out our input stream for bits.
*/
void HCTree::pad(BitOutputStream& out) const {
out.pad();
}
/** Return symbol coded in the next sequence of bits from the stream.
* PRECONDITION: build() has been called, to create the coding
* tree, and initialize root pointer and leaves vector.
* @param in our input stream for bits.
* @return symbol of the 8 bits read.
*/
int HCTree::decode(BitInputStream& in) const {
int nextBit;
if (root == nullptr) { // Empty file case.
return 0;
}
// Else we have an ordinary file.
HCNode* curr = root; // TODO: Use leaves instead.
while (curr->c0 != nullptr && curr->c1 != nullptr) { // Not a leaf:
nextBit = in.readBit();
if (nextBit == 0) {
curr = curr->c0;
} else {
curr = curr->c1;
}
}
return curr->symbol;
}
/** Destructor */
HCTree::~HCTree() {
deleteAll(root);
}
/** Delete every note from root, post-order */
void HCTree::deleteAll(HCNode *start) {
HCNode* curr = start;
if (curr == nullptr) {
return;
}
deleteAll(curr->c0);
deleteAll(curr->c1);
delete curr;
}