1
// Copyright 2014 The Go Authors. All rights reserved.
2
// Use of this source code is governed by a BSD-style
3
// license that can be found in the LICENSE file.
14
var bufPool = sync.Pool{
15
New: func() interface{} { return new(bytes.Buffer) },
18
// HuffmanDecode decodes the string in v and writes the expanded
19
// result to w, returning the number of bytes written to w and the
20
// Write call's return value. At most one Write call is made.
21
func HuffmanDecode(w io.Writer, v []byte) (int, error) {
22
buf := bufPool.Get().(*bytes.Buffer)
24
defer bufPool.Put(buf)
25
if err := huffmanDecode(buf, 0, v); err != nil {
28
return w.Write(buf.Bytes())
31
// HuffmanDecodeToString decodes the string in v.
32
func HuffmanDecodeToString(v []byte) (string, error) {
33
buf := bufPool.Get().(*bytes.Buffer)
35
defer bufPool.Put(buf)
36
if err := huffmanDecode(buf, 0, v); err != nil {
39
return buf.String(), nil
42
// ErrInvalidHuffman is returned for errors found decoding
43
// Huffman-encoded strings.
44
var ErrInvalidHuffman = errors.New("hpack: invalid Huffman-encoded data")
46
// huffmanDecode decodes v to buf.
47
// If maxLen is greater than 0, attempts to write more to buf than
48
// maxLen bytes will return ErrStringLength.
49
func huffmanDecode(buf *bytes.Buffer, maxLen int, v []byte) error {
50
rootHuffmanNode := getRootHuffmanNode()
52
// cur is the bit buffer that has not been fed into n.
53
// cbits is the number of low order bits in cur that are valid.
54
// sbits is the number of bits of the symbol prefix being decoded.
55
cur, cbits, sbits := uint(0), uint8(0), uint8(0)
57
cur = cur<<8 | uint(b)
61
idx := byte(cur >> (cbits - 8))
64
return ErrInvalidHuffman
66
if n.children == nil {
67
if maxLen != 0 && buf.Len() == maxLen {
68
return ErrStringLength
80
n = n.children[byte(cur<<(8-cbits))]
82
return ErrInvalidHuffman
84
if n.children != nil || n.codeLen > cbits {
87
if maxLen != 0 && buf.Len() == maxLen {
88
return ErrStringLength
96
// Either there was an incomplete symbol, or overlong padding.
97
// Both are decoding errors per RFC 7541 section 5.2.
98
return ErrInvalidHuffman
100
if mask := uint(1<<cbits - 1); cur&mask != mask {
101
// Trailing bits must be a prefix of EOS per RFC 7541 section 5.2.
102
return ErrInvalidHuffman
108
// incomparable is a zero-width, non-comparable type. Adding it to a struct
109
// makes that struct also non-comparable, and generally doesn't add
110
// any size (as long as it's first).
111
type incomparable [0]func()
116
// children is non-nil for internal nodes
119
// The following are only valid if children is nil:
120
codeLen uint8 // number of bits that led to the output of sym
121
sym byte // output symbol
124
func newInternalNode() *node {
125
return &node{children: new([256]*node)}
129
buildRootOnce sync.Once
130
lazyRootHuffmanNode *node
133
func getRootHuffmanNode() *node {
134
buildRootOnce.Do(buildRootHuffmanNode)
135
return lazyRootHuffmanNode
138
func buildRootHuffmanNode() {
139
if len(huffmanCodes) != 256 {
140
panic("unexpected size")
142
lazyRootHuffmanNode = newInternalNode()
143
// allocate a leaf node for each of the 256 symbols
144
leaves := new([256]node)
146
for sym, code := range huffmanCodes {
147
codeLen := huffmanCodeLen[sym]
149
cur := lazyRootHuffmanNode
152
i := uint8(code >> codeLen)
153
if cur.children[i] == nil {
154
cur.children[i] = newInternalNode()
156
cur = cur.children[i]
159
start, end := int(uint8(code<<shift)), int(1<<shift)
161
leaves[sym].sym = byte(sym)
162
leaves[sym].codeLen = codeLen
163
for i := start; i < start+end; i++ {
164
cur.children[i] = &leaves[sym]
169
// AppendHuffmanString appends s, as encoded in Huffman codes, to dst
170
// and returns the extended buffer.
171
func AppendHuffmanString(dst []byte, s string) []byte {
172
// This relies on the maximum huffman code length being 30 (See tables.go huffmanCodeLen array)
173
// So if a uint64 buffer has less than 32 valid bits can always accommodate another huffmanCode.
176
n uint // number valid of bits present in x
178
for i := 0; i < len(s); i++ {
180
n += uint(huffmanCodeLen[c])
181
x <<= huffmanCodeLen[c] % 64
182
x |= uint64(huffmanCodes[c])
184
n %= 32 // Normally would be -= 32 but %= 32 informs compiler 0 <= n <= 31 for upcoming shift
185
y := uint32(x >> n) // Compiler doesn't combine memory writes if y isn't uint32
186
dst = append(dst, byte(y>>24), byte(y>>16), byte(y>>8), byte(y))
189
// Add padding bits if necessary
190
if over := n % 8; over > 0 {
194
eosPadByte = eosCode >> (eosNBits - 8)
197
x = (x << pad) | (eosPadByte >> over)
198
n += pad // 8 now divides into n exactly
200
// n in (0, 8, 16, 24, 32)
205
return append(dst, byte(x))
208
return append(dst, byte(y>>8), byte(y))
211
return append(dst, byte(y>>8), byte(y), byte(x))
215
return append(dst, byte(y>>24), byte(y>>16), byte(y>>8), byte(y))
218
// HuffmanEncodeLength returns the number of bytes required to encode
219
// s in Huffman codes. The result is round up to byte boundary.
220
func HuffmanEncodeLength(s string) uint64 {
222
for i := 0; i < len(s); i++ {
223
n += uint64(huffmanCodeLen[s[i]])