mirror of
https://github.com/chylex/Brotli-Builder.git
synced 2025-01-08 02:42:50 +01:00
204 lines
7.5 KiB
C#
204 lines
7.5 KiB
C#
using System;
|
|
using System.Collections;
|
|
using System.Collections.Generic;
|
|
using System.Linq;
|
|
using BrotliLib.Brotli.Parameters;
|
|
using BrotliLib.Collections;
|
|
using BrotliLib.Collections.Huffman;
|
|
using BrotliLib.Markers.Serialization;
|
|
using BrotliLib.Numbers;
|
|
using BrotliLib.Serialization;
|
|
|
|
namespace BrotliLib.Brotli.Components.Header{
|
|
/// <summary>
|
|
/// Represents a Huffman tree with symbols from various alphabets in the Brotli format. Provides helper methods for iteration and lookups.
|
|
/// https://tools.ietf.org/html/rfc7932#section-3.2
|
|
/// </summary>
|
|
public sealed partial class HuffmanTree<T> : IEnumerable<KeyValuePair<T, BitPath>> where T : IComparable<T>{
|
|
public const int DefaultMaxDepth = 15;
|
|
|
|
/// <summary>
|
|
/// Generates a canonical depth-limited Huffman tree using the provided <paramref name="symbolFrequencies"/>, and default depth limit of 15.
|
|
/// </summary>
|
|
public static HuffmanTree<T> FromSymbols(FrequencyList<T> symbolFrequencies){
|
|
return FromSymbols(symbolFrequencies, DefaultMaxDepth);
|
|
}
|
|
|
|
/// <summary>
|
|
/// Generates a canonical depth-limited Huffman tree using the provided <paramref name="symbolFrequencies"/>.
|
|
/// </summary>
|
|
public static HuffmanTree<T> FromSymbols(FrequencyList<T> symbolFrequencies, byte maxDepth){
|
|
if (symbolFrequencies.Count == 0){
|
|
throw new ArgumentOutOfRangeException(nameof(symbolFrequencies), "Cannot generate a tree with no symbols.");
|
|
}
|
|
else if (symbolFrequencies.Count == 1){
|
|
return new HuffmanTree<T>(new HuffmanNode<T>.Leaf(symbolFrequencies.First()));
|
|
}
|
|
else{
|
|
return new HuffmanTree<T>(HuffmanGenerator<T>.FromFrequenciesCanonical(symbolFrequencies.HuffmanFreq.ToArray(), maxDepth));
|
|
}
|
|
}
|
|
|
|
// Data
|
|
|
|
/// <summary>
|
|
/// Root node of the tree.
|
|
/// </summary>
|
|
public HuffmanNode<T> Root { get; }
|
|
|
|
/// <summary>
|
|
/// Total amount of symbols in the tree.
|
|
/// </summary>
|
|
public int SymbolCount => ReverseLookup.Count;
|
|
|
|
/// <summary>
|
|
/// Length of the longest path in the tree.
|
|
/// </summary>
|
|
public int MaxDepth => ReverseLookup.Values.Max(stream => stream.Length);
|
|
|
|
private Dictionary<T, BitPath> ReverseLookup => reverseLookupCached ??= Root.GenerateValueMapOptimized();
|
|
private Dictionary<T, BitPath>? reverseLookupCached;
|
|
|
|
private T[] ValueList => valueListCached ??= ReverseLookup.Keys.ToArray();
|
|
private T[]? valueListCached;
|
|
|
|
public HuffmanTree(HuffmanNode<T> root){
|
|
this.Root = root;
|
|
}
|
|
|
|
// Search
|
|
|
|
public BitPath FindPath(T element){
|
|
return ReverseLookup[element];
|
|
}
|
|
|
|
public BitPath? FindPathOrNull(T element){
|
|
return ReverseLookup.TryGetValue(element, out BitPath path) ? path : (BitPath?)null;
|
|
}
|
|
|
|
public KeyValuePair<T, BitPath> FindShortest<A>(A param1, Func<T, A, bool> predicate){
|
|
foreach(var key in ValueList){
|
|
if (predicate(key, param1)){
|
|
return new KeyValuePair<T, BitPath>(key, ReverseLookup[key]);
|
|
}
|
|
}
|
|
|
|
throw new InvalidOperationException("No suitable entry found.");
|
|
}
|
|
|
|
public KeyValuePair<T, BitPath> FindShortest<A, B>(A param1, B param2, Func<T, A, B, bool> predicate){
|
|
foreach(var key in ValueList){
|
|
if (predicate(key, param1, param2)){
|
|
return new KeyValuePair<T, BitPath>(key, ReverseLookup[key]);
|
|
}
|
|
}
|
|
|
|
throw new InvalidOperationException("No suitable entry found.");
|
|
}
|
|
|
|
public KeyValuePair<T, BitPath> FindShortest<A, B>(A param1, B param2, Func<T, A, B, bool> predicate, Func<T, int> extraLength){
|
|
KeyValuePair<T, BitPath>? bestEntry = null;
|
|
int bestBits = int.MaxValue;
|
|
|
|
foreach(var key in ValueList){
|
|
if (predicate(key, param1, param2)){
|
|
var path = ReverseLookup[key];
|
|
int bits = path.Length + extraLength(key);
|
|
|
|
if (bits < bestBits){
|
|
bestEntry = new KeyValuePair<T, BitPath>(key, path);
|
|
bestBits = bits;
|
|
}
|
|
}
|
|
}
|
|
|
|
return bestEntry ?? throw new InvalidOperationException("No suitable entry found.");
|
|
}
|
|
|
|
// Enumerator
|
|
|
|
public IEnumerator<KeyValuePair<T, BitPath>> GetEnumerator(){
|
|
return ReverseLookup.GetEnumerator();
|
|
}
|
|
|
|
IEnumerator IEnumerable.GetEnumerator(){
|
|
return GetEnumerator();
|
|
}
|
|
|
|
// Object
|
|
|
|
public override bool Equals(object obj){
|
|
return obj is HuffmanTree<T> tree &&
|
|
ReverseLookup.SequenceEqual(tree.ReverseLookup);
|
|
}
|
|
|
|
public override int GetHashCode(){
|
|
int hash = ReverseLookup.Count * 17;
|
|
|
|
foreach(KeyValuePair<T, BitPath> kvp in this){
|
|
hash = unchecked((hash * 31) + kvp.Key.GetHashCode());
|
|
hash = unchecked((hash * 31) + kvp.Value.GetHashCode());
|
|
}
|
|
|
|
return hash;
|
|
}
|
|
|
|
// Context
|
|
|
|
public sealed class Context{
|
|
public AlphabetSize AlphabetSize { get; }
|
|
|
|
public Func<int, T> BitsToSymbol { get; }
|
|
public Func<T, int> SymbolToBits { get; }
|
|
|
|
internal int SkippedComplexCodeLengths { get; }
|
|
|
|
private Context(AlphabetSize alphabetSize, Func<int, T> bitsToSymbol, Func<T, int> symbolToBits, int skippedComplexCodeLengths){
|
|
this.AlphabetSize = alphabetSize;
|
|
this.BitsToSymbol = bitsToSymbol;
|
|
this.SymbolToBits = symbolToBits;
|
|
this.SkippedComplexCodeLengths = skippedComplexCodeLengths;
|
|
}
|
|
|
|
public Context(AlphabetSize alphabetSize, Func<int, T> bitsToSymbol, Func<T, int> symbolToBits) : this(alphabetSize, bitsToSymbol, symbolToBits, -1){}
|
|
|
|
internal Context ForComplexDeserialization(int skippedComplexCodeLengths){
|
|
return new Context(AlphabetSize, BitsToSymbol, SymbolToBits, skippedComplexCodeLengths);
|
|
}
|
|
}
|
|
|
|
// Serialization
|
|
|
|
public static readonly BitDeserializer<HuffmanTree<T>, Context> Deserialize = MarkedBitDeserializer.Wrap<HuffmanTree<T>, Context>(
|
|
(reader, context) => {
|
|
reader.MarkStart();
|
|
|
|
int type = reader.NextChunk(2, "HSKIP");
|
|
HuffmanTree<T> tree;
|
|
|
|
if (type == 1){
|
|
tree = Simple.Deserialize(reader, context);
|
|
reader.MarkEndTitle("Simple Huffman Tree");
|
|
}
|
|
else{
|
|
tree = Complex.Deserialize(reader, context.ForComplexDeserialization(type));
|
|
reader.MarkEndTitle("Complex Huffman Tree");
|
|
}
|
|
|
|
return tree;
|
|
}
|
|
);
|
|
|
|
public static readonly BitSerializer<HuffmanTree<T>, Context, BrotliSerializationParameters> Serialize = (writer, obj, context, parameters) => {
|
|
if (obj.SymbolCount <= 4){
|
|
writer.WriteChunk(2, 0b01);
|
|
Simple.Serialize(writer, obj, context);
|
|
}
|
|
else{
|
|
// type identifier is written by the serializer
|
|
Complex.Serialize(writer, obj, context, parameters);
|
|
}
|
|
};
|
|
}
|
|
}
|