naiveproxy/net/tools/huffman_trie/huffman/huffman_builder.cc
2018-12-09 21:59:24 -05:00

166 lines
4.6 KiB
C++

// Copyright (c) 2016 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "net/tools/huffman_trie/huffman/huffman_builder.h"
#include <algorithm>
#include "base/logging.h"
namespace net {
namespace huffman_trie {
namespace {
class HuffmanNode {
public:
HuffmanNode(uint8_t value,
uint32_t count,
std::unique_ptr<HuffmanNode> left,
std::unique_ptr<HuffmanNode> right)
: value_(value),
count_(count),
left_(std::move(left)),
right_(std::move(right)) {}
~HuffmanNode() = default;
bool IsLeaf() const {
return left_.get() == nullptr && right_.get() == nullptr;
}
uint8_t value() const { return value_; }
uint32_t count() const { return count_; }
const std::unique_ptr<HuffmanNode>& left() const { return left_; }
const std::unique_ptr<HuffmanNode>& right() const { return right_; }
private:
uint8_t value_;
uint32_t count_;
std::unique_ptr<HuffmanNode> left_;
std::unique_ptr<HuffmanNode> right_;
};
bool CompareNodes(const std::unique_ptr<HuffmanNode>& lhs,
const std::unique_ptr<HuffmanNode>& rhs) {
return lhs->count() < rhs->count();
}
} // namespace
HuffmanBuilder::HuffmanBuilder() = default;
HuffmanBuilder::~HuffmanBuilder() = default;
void HuffmanBuilder::RecordUsage(uint8_t character) {
DCHECK(character < 128);
counts_[character & 127] += 1;
}
HuffmanRepresentationTable HuffmanBuilder::ToTable() {
HuffmanRepresentationTable table;
std::unique_ptr<HuffmanNode> node(BuildTree());
TreeToTable(node.get(), 0, 0, &table);
return table;
}
void HuffmanBuilder::TreeToTable(HuffmanNode* node,
uint32_t bits,
uint32_t number_of_bits,
HuffmanRepresentationTable* table) {
if (node->IsLeaf()) {
HuffmanRepresentation item;
item.bits = bits;
item.number_of_bits = number_of_bits;
table->insert(HuffmanRepresentationPair(node->value(), item));
} else {
uint32_t new_bits = bits << 1;
TreeToTable(node->left().get(), new_bits, number_of_bits + 1, table);
TreeToTable(node->right().get(), new_bits | 1, number_of_bits + 1, table);
}
}
std::vector<uint8_t> HuffmanBuilder::ToVector() {
std::vector<uint8_t> bytes;
std::unique_ptr<HuffmanNode> node(BuildTree());
WriteToVector(node.get(), &bytes);
return bytes;
}
uint32_t HuffmanBuilder::WriteToVector(HuffmanNode* node,
std::vector<uint8_t>* vector) {
uint8_t left_value;
uint8_t right_value;
uint32_t child_position;
if (node->left()->IsLeaf()) {
left_value = 128 | node->left()->value();
} else {
child_position = WriteToVector(node->left().get(), vector);
DCHECK(child_position < 512) << "huffman tree too large";
left_value = child_position / 2;
}
if (node->right()->IsLeaf()) {
right_value = 128 | node->right()->value();
} else {
child_position = WriteToVector(node->right().get(), vector);
DCHECK(child_position < 512) << "huffman tree to large";
right_value = child_position / 2;
}
uint32_t position = static_cast<uint32_t>(vector->size());
vector->push_back(left_value);
vector->push_back(right_value);
return position;
}
std::unique_ptr<HuffmanNode> HuffmanBuilder::BuildTree() {
std::vector<std::unique_ptr<HuffmanNode>> nodes;
nodes.reserve(counts_.size());
for (const auto& item : counts_) {
nodes.push_back(std::make_unique<HuffmanNode>(item.first, item.second,
nullptr, nullptr));
}
// At least 2 entries are required for everything to work properly. Add
// arbitrary values to fill the tree.
for (uint8_t i = 0; nodes.size() < 2 && i < 2; ++i) {
for (const auto& node : nodes) {
if (node->value() == i) {
break;
}
}
nodes.push_back(std::make_unique<HuffmanNode>(i, 0, nullptr, nullptr));
}
std::stable_sort(nodes.begin(), nodes.end(), CompareNodes);
while (nodes.size() > 1) {
std::unique_ptr<HuffmanNode> a = std::move(nodes[0]);
std::unique_ptr<HuffmanNode> b = std::move(nodes[1]);
uint32_t count_a = a->count();
uint32_t count_b = b->count();
std::unique_ptr<HuffmanNode> parent(
new HuffmanNode(0, count_a + count_b, std::move(a), std::move(b)));
nodes.erase(nodes.begin());
nodes[0] = std::move(parent);
std::stable_sort(nodes.begin(), nodes.end(), CompareNodes);
}
return std::move(nodes[0]);
}
} // namespace huffman_trie
} // namespace net