/*
* Huffman decoding and encoding for HPACK (RFC7541)
*
* Copyright (C) 2014-2017 Willy Tarreau <willy@haproxy.org>
* Copyright (C) 2017 HAProxy Technologies
*
* Permission is hereby granted, free of charge, to any person obtaining
* a copy of this software and associated documentation files (the
* "Software"), to deal in the Software without restriction, including
* without limitation the rights to use, copy, modify, merge, publish,
* distribute, sublicense, and/or sell copies of the Software, and to
* permit persons to whom the Software is furnished to do so, subject to
* the following conditions:
*
* The above copyright notice and this permission notice shall be
* included in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
* OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
* HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
* WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
* OTHER DEALINGS IN THE SOFTWARE.
*/
#include <stdio.h>
#include <inttypes.h>
#include <string.h>
#include <haproxy/api.h>
#include <haproxy/hpack-huff.h>
#include <haproxy/net_helper.h>
/* One entry of the huffman encoding table: the code assigned to a symbol and
 * the number of significant bits in that code.
 */
struct huff {
uint32_t c; /* code point, stored right-aligned (its <b> lowest bits) */
int b; /* number of significant bits in <c> */
};
/* huffman table as per RFC7541 appendix B. It is indexed by the symbol value:
 * 0..255 for the octets and 256 for EOS. Each entry holds the right-aligned
 * code in <c> and its length in bits in <b>.
 */
static const struct huff ht[257] = {
[ 0] = { .c = 0x00001ff8, .b = 13 },
[ 1] = { .c = 0x007fffd8, .b = 23 },
[ 2] = { .c = 0x0fffffe2, .b = 28 },
[ 3] = { .c = 0x0fffffe3, .b = 28 },
[ 4] = { .c = 0x0fffffe4, .b = 28 },
[ 5] = { .c = 0x0fffffe5, .b = 28 },
[ 6] = { .c = 0x0fffffe6, .b = 28 },
[ 7] = { .c = 0x0fffffe7, .b = 28 },
[ 8] = { .c = 0x0fffffe8, .b = 28 },
[ 9] = { .c = 0x00ffffea, .b = 24 },
[ 10] = { .c = 0x3ffffffc, .b = 30 },
[ 11] = { .c = 0x0fffffe9, .b = 28 },
[ 12] = { .c = 0x0fffffea, .b = 28 },
[ 13] = { .c = 0x3ffffffd, .b = 30 },
[ 14] = { .c = 0x0fffffeb, .b = 28 },
[ 15] = { .c = 0x0fffffec, .b = 28 },
[ 16] = { .c = 0x0fffffed, .b = 28 },
[ 17] = { .c = 0x0fffffee, .b = 28 },
[ 18] = { .c = 0x0fffffef, .b = 28 },
[ 19] = { .c = 0x0ffffff0, .b = 28 },
[ 20] = { .c = 0x0ffffff1, .b = 28 },
[ 21] = { .c = 0x0ffffff2, .b = 28 },
[ 22] = { .c = 0x3ffffffe, .b = 30 },
[ 23] = { .c = 0x0ffffff3, .b = 28 },
[ 24] = { .c = 0x0ffffff4, .b = 28 },
[ 25] = { .c = 0x0ffffff5, .b = 28 },
[ 26] = { .c = 0x0ffffff6, .b = 28 },
[ 27] = { .c = 0x0ffffff7, .b = 28 },
[ 28] = { .c = 0x0ffffff8, .b = 28 },
[ 29] = { .c = 0x0ffffff9, .b = 28 },
[ 30] = { .c = 0x0ffffffa, .b = 28 },
[ 31] = { .c = 0x0ffffffb, .b = 28 },
[ 32] = { .c = 0x00000014, .b = 6 },
[ 33] = { .c = 0x000003f8, .b = 10 },
[ 34] = { .c = 0x000003f9, .b = 10 },
[ 35] = { .c = 0x00000ffa, .b = 12 },
[ 36] = { .c = 0x00001ff9, .b = 13 },
[ 37] = { .c = 0x00000015, .b = 6 },
[ 38] = { .c = 0x000000f8, .b = 8 },
[ 39] = { .c = 0x000007fa, .b = 11 },
[ 40] = { .c = 0x000003fa, .b = 10 },
[ 41] = { .c = 0x000003fb, .b = 10 },
[ 42] = { .c = 0x000000f9, .b = 8 },
[ 43] = { .c = 0x000007fb, .b = 11 },
[ 44] = { .c = 0x000000fa, .b = 8 },
[ 45] = { .c = 0x00000016, .b = 6 },
[ 46] = { .c = 0x00000017, .b = 6 },
[ 47] = { .c = 0x00000018, .b = 6 },
[ 48] = { .c = 0x00000000, .b = 5 },
[ 49] = { .c = 0x00000001, .b = 5 },
[ 50] = { .c = 0x00000002, .b = 5 },
[ 51] = { .c = 0x00000019, .b = 6 },
[ 52] = { .c = 0x0000001a, .b = 6 },
[ 53] = { .c = 0x0000001b, .b = 6 },
[ 54] = { .c = 0x0000001c, .b = 6 },
[ 55] = { .c = 0x0000001d, .b = 6 },
[ 56] = { .c = 0x0000001e, .b = 6 },
[ 57] = { .c = 0x0000001f, .b = 6 },
[ 58] = { .c = 0x0000005c, .b = 7 },
[ 59] = { .c = 0x000000fb, .b = 8 },
[ 60] = { .c = 0x00007ffc, .b = 15 },
[ 61] = { .c = 0x00000020, .b = 6 },
[ 62] = { .c = 0x00000ffb, .b = 12 },
[ 63] = { .c = 0x000003fc, .b = 10 },
[ 64] = { .c = 0x00001ffa, .b = 13 },
[ 65] = { .c = 0x00000021, .b = 6 },
[ 66] = { .c = 0x0000005d, .b = 7 },
[ 67] = { .c = 0x0000005e, .b = 7 },
[ 68] = { .c = 0x0000005f, .b = 7 },
[ 69] = { .c = 0x00000060, .b = 7 },
[ 70] = { .c = 0x00000061, .b = 7 },
[ 71] = { .c = 0x00000062, .b = 7 },
[ 72] = { .c = 0x00000063, .b = 7 },
[ 73] = { .c = 0x00000064, .b = 7 },
[ 74] = { .c = 0x00000065, .b = 7 },
[ 75] = { .c = 0x00000066, .b = 7 },
[ 76] = { .c = 0x00000067, .b = 7 },
[ 77] = { .c = 0x00000068, .b = 7 },
[ 78] = { .c = 0x00000069, .b = 7 },
[ 79] = { .c = 0x0000006a, .b = 7 },
[ 80] = { .c = 0x0000006b, .b = 7 },
[ 81] = { .c = 0x0000006c, .b = 7 },
[ 82] = { .c = 0x0000006d, .b = 7 },
[ 83] = { .c = 0x0000006e, .b = 7 },
[ 84] = { .c = 0x0000006f, .b = 7 },
[ 85] = { .c = 0x00000070, .b = 7 },
[ 86] = { .c = 0x00000071, .b = 7 },
[ 87] = { .c = 0x00000072, .b = 7 },
[ 88] = { .c = 0x000000fc, .b = 8 },
[ 89] = { .c = 0x00000073, .b = 7 },
[ 90] = { .c = 0x000000fd, .b = 8 },
[ 91] = { .c = 0x00001ffb, .b = 13 },
[ 92] = { .c = 0x0007fff0, .b = 19 },
[ 93] = { .c = 0x00001ffc, .b = 13 },
[ 94] = { .c = 0x00003ffc, .b = 14 },
[ 95] = { .c = 0x00000022, .b = 6 },
[ 96] = { .c = 0x00007ffd, .b = 15 },
[ 97] = { .c = 0x00000003, .b = 5 },
[ 98] = { .c = 0x00000023, .b = 6 },
[ 99] = { .c = 0x00000004, .b = 5 },
[100] = { .c = 0x00000024, .b = 6 },
[101] = { .c = 0x00000005, .b = 5 },
[102] = { .c = 0x00000025, .b = 6 },
[103] = { .c = 0x00000026, .b = 6 },
[104] = { .c = 0x00000027, .b = 6 },
[105] = { .c = 0x00000006, .b = 5 },
[106] = { .c = 0x00000074, .b = 7 },
[107] = { .c = 0x00000075, .b = 7 },
[108] = { .c = 0x00000028, .b = 6 },
[109] = { .c = 0x00000029, .b = 6 },
[110] = { .c = 0x0000002a, .b = 6 },
[111] = { .c = 0x00000007, .b = 5 },
[112] = { .c = 0x0000002b, .b = 6 },
[113] = { .c = 0x00000076, .b = 7 },
[114] = { .c = 0x0000002c, .b = 6 },
[115] = { .c = 0x00000008, .b = 5 },
[116] = { .c = 0x00000009, .b = 5 },
[117] = { .c = 0x0000002d, .b = 6 },
[118] = { .c = 0x00000077, .b = 7 },
[119] = { .c = 0x00000078, .b = 7 },
[120] = { .c = 0x00000079, .b = 7 },
[121] = { .c = 0x0000007a, .b = 7 },
[122] = { .c = 0x0000007b, .b = 7 },
[123] = { .c = 0x00007ffe, .b = 15 },
[124] = { .c = 0x000007fc, .b = 11 },
[125] = { .c = 0x00003ffd, .b = 14 },
[126] = { .c = 0x00001ffd, .b = 13 },
[127] = { .c = 0x0ffffffc, .b = 28 },
[128] = { .c = 0x000fffe6, .b = 20 },
[129] = { .c = 0x003fffd2, .b = 22 },
[130] = { .c = 0x000fffe7, .b = 20 },
[131] = { .c = 0x000fffe8, .b = 20 },
[132] = { .c = 0x003fffd3, .b = 22 },
[133] = { .c = 0x003fffd4, .b = 22 },
[134] = { .c = 0x003fffd5, .b = 22 },
[135] = { .c = 0x007fffd9, .b = 23 },
[136] = { .c = 0x003fffd6, .b = 22 },
[137] = { .c = 0x007fffda, .b = 23 },
[138] = { .c = 0x007fffdb, .b = 23 },
[139] = { .c = 0x007fffdc, .b = 23 },
[140] = { .c = 0x007fffdd, .b = 23 },
[141] = { .c = 0x007fffde, .b = 23 },
[142] = { .c = 0x00ffffeb, .b = 24 },
[143] = { .c = 0x007fffdf, .b = 23 },
[144] = { .c = 0x00ffffec, .b = 24 },
[145] = { .c = 0x00ffffed, .b = 24 },
[146] = { .c = 0x003fffd7, .b = 22 },
[147] = { .c = 0x007fffe0, .b = 23 },
[148] = { .c = 0x00ffffee, .b = 24 },
[149] = { .c = 0x007fffe1, .b = 23 },
[150] = { .c = 0x007fffe2, .b = 23 },
[151] = { .c = 0x007fffe3, .b = 23 },
[152] = { .c = 0x007fffe4, .b = 23 },
[153] = { .c = 0x001fffdc, .b = 21 },
[154] = { .c = 0x003fffd8, .b = 22 },
[155] = { .c = 0x007fffe5, .b = 23 },
[156] = { .c = 0x003fffd9, .b = 22 },
[157] = { .c = 0x007fffe6, .b = 23 },
[158] = { .c = 0x007fffe7, .b = 23 },
[159] = { .c = 0x00ffffef, .b = 24 },
[160] = { .c = 0x003fffda, .b = 22 },
[161] = { .c = 0x001fffdd, .b = 21 },
[162] = { .c = 0x000fffe9, .b = 20 },
[163] = { .c = 0x003fffdb, .b = 22 },
[164] = { .c = 0x003fffdc, .b = 22 },
[165] = { .c = 0x007fffe8, .b = 23 },
[166] = { .c = 0x007fffe9, .b = 23 },
[167] = { .c = 0x001fffde, .b = 21 },
[168] = { .c = 0x007fffea, .b = 23 },
[169] = { .c = 0x003fffdd, .b = 22 },
[170] = { .c = 0x003fffde, .b = 22 },
[171] = { .c = 0x00fffff0, .b = 24 },
[172] = { .c = 0x001fffdf, .b = 21 },
[173] = { .c = 0x003fffdf, .b = 22 },
[174] = { .c = 0x007fffeb, .b = 23 },
[175] = { .c = 0x007fffec, .b = 23 },
[176] = { .c = 0x001fffe0, .b = 21 },
[177] = { .c = 0x001fffe1, .b = 21 },
[178] = { .c = 0x003fffe0, .b = 22 },
[179] = { .c = 0x001fffe2, .b = 21 },
[180] = { .c = 0x007fffed, .b = 23 },
[181] = { .c = 0x003fffe1, .b = 22 },
[182] = { .c = 0x007fffee, .b = 23 },
[183] = { .c = 0x007fffef, .b = 23 },
[184] = { .c = 0x000fffea, .b = 20 },
[185] = { .c = 0x003fffe2, .b = 22 },
[186] = { .c = 0x003fffe3, .b = 22 },
[187] = { .c = 0x003fffe4, .b = 22 },
[188] = { .c = 0x007ffff0, .b = 23 },
[189] = { .c = 0x003fffe5, .b = 22 },
[190] = { .c = 0x003fffe6, .b = 22 },
[191] = { .c = 0x007ffff1, .b = 23 },
[192] = { .c = 0x03ffffe0, .b = 26 },
[193] = { .c = 0x03ffffe1, .b = 26 },
[194] = { .c = 0x000fffeb, .b = 20 },
[195] = { .c = 0x0007fff1, .b = 19 },
[196] = { .c = 0x003fffe7, .b = 22 },
[197] = { .c = 0x007ffff2, .b = 23 },
[198] = { .c = 0x003fffe8, .b = 22 },
[199] = { .c = 0x01ffffec, .b = 25 },
[200] = { .c = 0x03ffffe2, .b = 26 },
[201] = { .c = 0x03ffffe3, .b = 26 },
[202] = { .c = 0x03ffffe4, .b = 26 },
[203] = { .c = 0x07ffffde, .b = 27 },
[204] = { .c = 0x07ffffdf, .b = 27 },
[205] = { .c = 0x03ffffe5, .b = 26 },
[206] = { .c = 0x00fffff1, .b = 24 },
[207] = { .c = 0x01ffffed, .b = 25 },
[208] = { .c = 0x0007fff2, .b = 19 },
[209] = { .c = 0x001fffe3, .b = 21 },
[210] = { .c = 0x03ffffe6, .b = 26 },
[211] = { .c = 0x07ffffe0, .b = 27 },
[212] = { .c = 0x07ffffe1, .b = 27 },
[213] = { .c = 0x03ffffe7, .b = 26 },
[214] = { .c = 0x07ffffe2, .b = 27 },
[215] = { .c = 0x00fffff2, .b = 24 },
[216] = { .c = 0x001fffe4, .b = 21 },
[217] = { .c = 0x001fffe5, .b = 21 },
[218] = { .c = 0x03ffffe8, .b = 26 },
[219] = { .c = 0x03ffffe9, .b = 26 },
[220] = { .c = 0x0ffffffd, .b = 28 },
[221] = { .c = 0x07ffffe3, .b = 27 },
[222] = { .c = 0x07ffffe4, .b = 27 },
[223] = { .c = 0x07ffffe5, .b = 27 },
[224] = { .c = 0x000fffec, .b = 20 },
[225] = { .c = 0x00fffff3, .b = 24 },
[226] = { .c = 0x000fffed, .b = 20 },
[227] = { .c = 0x001fffe6, .b = 21 },
[228] = { .c = 0x003fffe9, .b = 22 },
[229] = { .c = 0x001fffe7, .b = 21 },
[230] = { .c = 0x001fffe8, .b = 21 },
[231] = { .c = 0x007ffff3, .b = 23 },
[232] = { .c = 0x003fffea, .b = 22 },
[233] = { .c = 0x003fffeb, .b = 22 },
[234] = { .c = 0x01ffffee, .b = 25 },
[235] = { .c = 0x01ffffef, .b = 25 },
[236] = { .c = 0x00fffff4, .b = 24 },
[237] = { .c = 0x00fffff5, .b = 24 },
[238] = { .c = 0x03ffffea, .b = 26 },
[239] = { .c = 0x007ffff4, .b = 23 },
[240] = { .c = 0x03ffffeb, .b = 26 },
[241] = { .c = 0x07ffffe6, .b = 27 },
[242] = { .c = 0x03ffffec, .b = 26 },
[243] = { .c = 0x03ffffed, .b = 26 },
[244] = { .c = 0x07ffffe7, .b = 27 },
[245] = { .c = 0x07ffffe8, .b = 27 },
[246] = { .c = 0x07ffffe9, .b = 27 },
[247] = { .c = 0x07ffffea, .b = 27 },
[248] = { .c = 0x07ffffeb, .b = 27 },
[249] = { .c = 0x0ffffffe, .b = 28 },
[250] = { .c = 0x07ffffec, .b = 27 },
[251] = { .c = 0x07ffffed, .b = 27 },
[252] = { .c = 0x07ffffee, .b = 27 },
[253] = { .c = 0x07ffffef, .b = 27 },
[254] = { .c = 0x07fffff0, .b = 27 },
[255] = { .c = 0x03ffffee, .b = 26 },
[256] = { .c = 0x3fffffff, .b = 30 }, /* EOS */
};
/* Reversed huffman codes, generated by dev/hpack/gen-rht.c from the table
* above, then simplified by hand by extracting the few different length
* values and writing code to produce them instead.
*
* The codes are aligned on the MSB since that's how they appear in the stream.
*
* Quick summary below of the way the tables work. They're based on how the
* prefixes are organized, starting from the MSB.
*
* These codes fit in a single octet (5 to 8 bits) :
* 00/5 08/5 10/5 18/5 20/5 28/5 30/5 38/5
* 40/5 48/5
*
* 50/6 54/6 58/6 5c/6 60/6 64/6 68/6 6c/6
* 70/6 74/6 78/6 7c/6 80/6 84/6 88/6 8c/6
* 90/6 94/6 98/6 9c/6 a0/6 a4/6 a8/6 ac/6
* b0/6 b4/6
*
* b8/7 ba/7 bc/7 be/7 c0/7 c2/7 c4/7 c6/7
* c8/7 ca/7 cc/7 ce/7 d0/7 d2/7 d4/7 d6/7
* d8/7 da/7 dc/7 de/7 e0/7 e2/7 e4/7 e6/7
* e8/7 ea/7 ec/7 ee/7 f0/7 f2/7 f4/7 f6/7
*
* f8/8 f9/8 fa/8 fb/8 fc/8 fd/8
*
* ==> a single 256-symbol table based on the full byte provides a direct
* access and the bit count
*
* These codes fit in two octets (10 to 15 bits, neither 9 nor 16 bits code) :
*
* fe + 2 bits:
* 00/2 40/2 80/2 c0/2
*
* ff + 2..7 bits :
* 00/2
* 40/3 60/3 80/3
* a0/4 b0/4
* c0/5 c8/5 d0/5 d8/5 e0/5 e8/5
* f0/6 f4/6
* f8/7 fa/7 fc/7
*
* ==> a single 256-symbol table made of b0.0 and b1.7-1 provides a direct
* access and the bit count after a miss on the first one above.
*
* These ones fit in three octets :
* ff fe + 3..5 bits :
* 00/3 20/3 40/3 60/4 70/4 80/4 90/4 a0/4
* b0/4 c0/4 d0/4
* e0/5 e8/5 f0/5 f8/5
*
* ff ff + 5..8 bits :
* 00/5 08/5 10/5 18/5 20/5 28/5 30/5 38/5
* 40/5
* 48/6 4c/6 50/6 54/6 58/6 5c/6 60/6 64/6
* 68/6 6c/6 70/6 74/6 78/6 7c/6 80/6 84/6
* 88/6 8c/6 90/6 94/6 98/6 9c/6 a0/6 a4/6
* a8/6 ac/6
* b0/7 b2/7 b4/7 b6/7 b8/7 ba/7 bc/7 be/7
* c0/7 c2/7 c4/7 c6/7 c8/7 ca/7 cc/7 ce/7
* d0/7 d2/7 d4/7 d6/7 d8/7 da/7 dc/7 de/7
* e0/7 e2/7 e4/7 e6/7 e8/7
* ea/8 eb/8 ec/8 ed/8 ee/8 ef/8 f0/8 f1/8
* f2/8 f3/8 f4/8 f5/8
*
* ==> a 32-symbol table has to be applied to 0xfffe
* ==> a 256-symbol table has to be applied to 0xffff
*
* The other ones fit in four octets with 1 to 6 bits in the last one :
* ff ff f6 : 00/1 80/1
* ff ff f7 : 00/1 80/1
* ff ff f8 : 00/2 40/2 80/2 c0/2
* ff ff f9 : 00/2 40/2 80/2 c0/2
* ff ff fa : 00/2 40/2 80/2 c0/2
* ff ff fb : 00/2 40/2 80/2
* ff ff fb : c0/3 e0/3
* ff ff fc : 00/3 20/3 40/3 60/3 80/3 a0/3 c0/3 e0/3
* ff ff fd : 00/3 20/3 40/3 60/3 80/3 a0/3 c0/3 e0/3
* ff ff fe : 00/3
* ff ff fe : 20/4 30/4 40/4 50/4 60/4 70/4 80/4 90/4 a0/4 b0/4 c0/4 d0/4 e0/4 f0/4
* ff ff ff : 00/4 10/4 20/4 30/4 40/4 50/4 60/4 70/4 80/4 90/4 a0/4 b0/4 c0/4 d0/4 e0/4
* ff ff ff : f0/6 f4/6 f8/6 fc/6
*
* ==> a 256-symbol table with b2.0-3,b3.7-4 gives all of them except the
* distinction between ffffff{f0,f4,f8,fc} which is rare enough
* and can be done by hand when bit count == 30.
*
*
* Code lengths (leading octets of the MSB-aligned code, ranges are inclusive) :
* 5..8 : 0x00..0xfd
* 10..15 : 0xfe
* 0xff 0x00..0xfd
* 19..20 : 0xff 0xfe 0x00..0xdf
* 21 : 0xff 0xfe 0xe0..0xff
* 21 : 0xff 0xff 0x00..0x47
* 22..24 : 0xff 0xff 0x48..0xf5
* 25..28 : 0xff 0xff 0xf6..0xff
* 30 : 0xff 0xff 0xff 0xf0..0xff
*
*
* if b0 < 0xfe ==> 5..8 bits (74 codes)
* if b0 == 0xfe or 0xff : 10..15
* => if b0 == 0xfe || b1 < 0xfe : lookup (b0:0|b1:7..1) (21 codes)
*
* -- b0 = 0xff --
* if b1 == 0xfe : 19..21 bits
* => lookup b2:7..3 (15 codes)
*
* -- b0 = 0xff, b1 = 0xff : 147 codes --
* if b2 < 0xf6 : 21..24 bits (76 codes)
* if b2 >= 0xf6 : 25..30 bits (71 codes)
*
* Algorithm:
* - if > 24 and < 32, read missing bits.
* - if less than 24 bits, read 1 byte. If past end, insert 0xff instead.
* - if b0 < 0xfe lookup b0 in table0[0..255]
* - else if b0 == 0xfe, manual lookup
* - else if b0 == 0xff, lookup b1 in table1[0..255]
* ...
*/
/* Decoding table for the codes of 5 to 8 bits. huff_dec() indexes it with the
 * most significant byte (bits 31-24) of the MSB-aligned code when that code is
 * below 0xfe000000, and gets the decoded symbol. A symbol whose code is
 * shorter than 8 bits is repeated for every value of the bits following its
 * code in that byte. Entries 0xfe and 0xff have no initializer (hence are
 * zero) and are not looked up by huff_dec().
 */
uint8_t rht_bit31_24[256] = {
/* 0x00 */ 0x30, 0x30, 0x30, 0x30, 0x30, 0x30, 0x30, 0x30,
/* 0x08 */ 0x31, 0x31, 0x31, 0x31, 0x31, 0x31, 0x31, 0x31,
/* 0x10 */ 0x32, 0x32, 0x32, 0x32, 0x32, 0x32, 0x32, 0x32,
/* 0x18 */ 0x61, 0x61, 0x61, 0x61, 0x61, 0x61, 0x61, 0x61,
/* 0x20 */ 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63, 0x63,
/* 0x28 */ 0x65, 0x65, 0x65, 0x65, 0x65, 0x65, 0x65, 0x65,
/* 0x30 */ 0x69, 0x69, 0x69, 0x69, 0x69, 0x69, 0x69, 0x69,
/* 0x38 */ 0x6f, 0x6f, 0x6f, 0x6f, 0x6f, 0x6f, 0x6f, 0x6f,
/* 0x40 */ 0x73, 0x73, 0x73, 0x73, 0x73, 0x73, 0x73, 0x73,
/* 0x48 */ 0x74, 0x74, 0x74, 0x74, 0x74, 0x74, 0x74, 0x74,
/* 0x50 */ 0x20, 0x20, 0x20, 0x20,
/* 0x54 */ 0x25, 0x25, 0x25, 0x25,
/* 0x58 */ 0x2d, 0x2d, 0x2d, 0x2d,
/* 0x5c */ 0x2e, 0x2e, 0x2e, 0x2e,
/* 0x60 */ 0x2f, 0x2f, 0x2f, 0x2f,
/* 0x64 */ 0x33, 0x33, 0x33, 0x33,
/* 0x68 */ 0x34, 0x34, 0x34, 0x34,
/* 0x6c */ 0x35, 0x35, 0x35, 0x35,
/* 0x70 */ 0x36, 0x36, 0x36, 0x36,
/* 0x74 */ 0x37, 0x37, 0x37, 0x37,
/* 0x78 */ 0x38, 0x38, 0x38, 0x38,
/* 0x7c */ 0x39, 0x39, 0x39, 0x39,
/* 0x80 */ 0x3d, 0x3d, 0x3d, 0x3d,
/* 0x84 */ 0x41, 0x41, 0x41, 0x41,
/* 0x88 */ 0x5f, 0x5f, 0x5f, 0x5f,
/* 0x8c */ 0x62, 0x62, 0x62, 0x62,
/* 0x90 */ 0x64, 0x64, 0x64, 0x64,
/* 0x94 */ 0x66, 0x66, 0x66, 0x66,
/* 0x98 */ 0x67, 0x67, 0x67, 0x67,
/* 0x9c */ 0x68, 0x68, 0x68, 0x68,
/* 0xa0 */ 0x6c, 0x6c, 0x6c, 0x6c,
/* 0xa4 */ 0x6d, 0x6d, 0x6d, 0x6d,
/* 0xa8 */ 0x6e, 0x6e, 0x6e, 0x6e,
/* 0xac */ 0x70, 0x70, 0x70, 0x70,
/* 0xb0 */ 0x72, 0x72, 0x72, 0x72,
/* 0xb4 */ 0x75, 0x75, 0x75, 0x75,
/* 0xb8 */ 0x3a, 0x3a,
/* 0xba */ 0x42, 0x42,
/* 0xbc */ 0x43, 0x43,
/* 0xbe */ 0x44, 0x44,
/* 0xc0 */ 0x45, 0x45,
/* 0xc2 */ 0x46, 0x46,
/* 0xc4 */ 0x47, 0x47,
/* 0xc6 */ 0x48, 0x48,
/* 0xc8 */ 0x49, 0x49,
/* 0xca */ 0x4a, 0x4a,
/* 0xcc */ 0x4b, 0x4b,
/* 0xce */ 0x4c, 0x4c,
/* 0xd0 */ 0x4d, 0x4d,
/* 0xd2 */ 0x4e, 0x4e,
/* 0xd4 */ 0x4f, 0x4f,
/* 0xd6 */ 0x50, 0x50,
/* 0xd8 */ 0x51, 0x51,
/* 0xda */ 0x52, 0x52,
/* 0xdc */ 0x53, 0x53,
/* 0xde */ 0x54, 0x54,
/* 0xe0 */ 0x55, 0x55,
/* 0xe2 */ 0x56, 0x56,
/* 0xe4 */ 0x57, 0x57,
/* 0xe6 */ 0x59, 0x59,
/* 0xe8 */ 0x6a, 0x6a,
/* 0xea */ 0x6b, 0x6b,
/* 0xec */ 0x71, 0x71,
/* 0xee */ 0x76, 0x76,
/* 0xf0 */ 0x77, 0x77,
/* 0xf2 */ 0x78, 0x78,
/* 0xf4 */ 0x79, 0x79,
/* 0xf6 */ 0x7a, 0x7a,
/* 0xf8 */ 0x26,
/* 0xf9 */ 0x2a,
/* 0xfa */ 0x2c,
/* 0xfb */ 0x3b,
/* 0xfc */ 0x58,
/* 0xfd */ 0x5a,
};
/* Decoding table for the codes of 10 to 15 bits, i.e. those whose first byte
 * is 0xfe or 0xff. huff_dec() indexes it with bits 24-17 of the MSB-aligned
 * code when that code is in 0xfe000000..0xfffdffff, and gets the decoded
 * symbol: indexes 0x00-0x7f are reached with a first byte of 0xfe, indexes
 * 0x80-0xfe with a first byte of 0xff. Entry 0xff has no initializer (hence is
 * zero) and is not looked up by huff_dec().
 */
uint8_t rht_bit24_17[256] = {
/* 0x00 */ 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21,
/* 0x10 */ 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21, 0x21,
/* 0x20 */ 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22,
/* 0x30 */ 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22, 0x22,
/* 0x40 */ 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28,
/* 0x50 */ 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28, 0x28,
/* 0x60 */ 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29,
/* 0x70 */ 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29, 0x29,
/* 0x80 */ 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f,
/* 0x90 */ 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f, 0x3f,
/* 0xa0 */ 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27, 0x27,
/* 0xb0 */ 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b, 0x2b,
/* 0xc0 */ 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c, 0x7c,
/* 0xd0 */ 0x23, 0x23, 0x23, 0x23, 0x23, 0x23, 0x23, 0x23,
/* 0xd8 */ 0x3e, 0x3e, 0x3e, 0x3e, 0x3e, 0x3e, 0x3e, 0x3e,
/* 0xe0 */ 0x00, 0x00, 0x00, 0x00,
/* 0xe4 */ 0x24, 0x24, 0x24, 0x24,
/* 0xe8 */ 0x40, 0x40, 0x40, 0x40,
/* 0xec */ 0x5b, 0x5b, 0x5b, 0x5b,
/* 0xf0 */ 0x5d, 0x5d, 0x5d, 0x5d,
/* 0xf4 */ 0x7e, 0x7e, 0x7e, 0x7e,
/* 0xf8 */ 0x5e, 0x5e,
/* 0xfa */ 0x7d, 0x7d,
/* 0xfc */ 0x3c,
/* 0xfd */ 0x60,
/* 0xfe */ 0x7b,
};
/* Decoding table for the codes of 21 to 24 bits starting with 0xff 0xff.
 * huff_dec() indexes it with the third byte (bits 15-8) of the MSB-aligned
 * code when that code is in 0xffff0000..0xfffff5ff, and gets the decoded
 * symbol. Entries 0xf6-0xff have no initializer (hence are zero) and are not
 * looked up by huff_dec().
 */
uint8_t rht_bit15_8[256] = {
/* 0x00 */ 0xb0, 0xb0, 0xb0, 0xb0, 0xb0, 0xb0, 0xb0, 0xb0,
/* 0x08 */ 0xb1, 0xb1, 0xb1, 0xb1, 0xb1, 0xb1, 0xb1, 0xb1,
/* 0x10 */ 0xb3, 0xb3, 0xb3, 0xb3, 0xb3, 0xb3, 0xb3, 0xb3,
/* 0x18 */ 0xd1, 0xd1, 0xd1, 0xd1, 0xd1, 0xd1, 0xd1, 0xd1,
/* 0x20 */ 0xd8, 0xd8, 0xd8, 0xd8, 0xd8, 0xd8, 0xd8, 0xd8,
/* 0x28 */ 0xd9, 0xd9, 0xd9, 0xd9, 0xd9, 0xd9, 0xd9, 0xd9,
/* 0x30 */ 0xe3, 0xe3, 0xe3, 0xe3, 0xe3, 0xe3, 0xe3, 0xe3,
/* 0x38 */ 0xe5, 0xe5, 0xe5, 0xe5, 0xe5, 0xe5, 0xe5, 0xe5,
/* 0x40 */ 0xe6, 0xe6, 0xe6, 0xe6, 0xe6, 0xe6, 0xe6, 0xe6,
/* 0x48 */ 0x81, 0x81, 0x81, 0x81,
/* 0x4c */ 0x84, 0x84, 0x84, 0x84,
/* 0x50 */ 0x85, 0x85, 0x85, 0x85,
/* 0x54 */ 0x86, 0x86, 0x86, 0x86,
/* 0x58 */ 0x88, 0x88, 0x88, 0x88,
/* 0x5c */ 0x92, 0x92, 0x92, 0x92,
/* 0x60 */ 0x9a, 0x9a, 0x9a, 0x9a,
/* 0x64 */ 0x9c, 0x9c, 0x9c, 0x9c,
/* 0x68 */ 0xa0, 0xa0, 0xa0, 0xa0,
/* 0x6c */ 0xa3, 0xa3, 0xa3, 0xa3,
/* 0x70 */ 0xa4, 0xa4, 0xa4, 0xa4,
/* 0x74 */ 0xa9, 0xa9, 0xa9, 0xa9,
/* 0x78 */ 0xaa, 0xaa, 0xaa, 0xaa,
/* 0x7c */ 0xad, 0xad, 0xad, 0xad,
/* 0x80 */ 0xb2, 0xb2, 0xb2, 0xb2,
/* 0x84 */ 0xb5, 0xb5, 0xb5, 0xb5,
/* 0x88 */ 0xb9, 0xb9, 0xb9, 0xb9,
/* 0x8c */ 0xba, 0xba, 0xba, 0xba,
/* 0x90 */ 0xbb, 0xbb, 0xbb, 0xbb,
/* 0x94 */ 0xbd, 0xbd, 0xbd, 0xbd,
/* 0x98 */ 0xbe, 0xbe, 0xbe, 0xbe,
/* 0x9c */ 0xc4, 0xc4, 0xc4, 0xc4,
/* 0xa0 */ 0xc6, 0xc6, 0xc6, 0xc6,
/* 0xa4 */ 0xe4, 0xe4, 0xe4, 0xe4,
/* 0xa8 */ 0xe8, 0xe8, 0xe8, 0xe8,
/* 0xac */ 0xe9, 0xe9, 0xe9, 0xe9,
/* 0xb0 */ 0x01, 0x01,
/* 0xb2 */ 0x87, 0x87,
/* 0xb4 */ 0x89, 0x89,
/* 0xb6 */ 0x8a, 0x8a,
/* 0xb8 */ 0x8b, 0x8b,
/* 0xba */ 0x8c, 0x8c,
/* 0xbc */ 0x8d, 0x8d,
/* 0xbe */ 0x8f, 0x8f,
/* 0xc0 */ 0x93, 0x93,
/* 0xc2 */ 0x95, 0x95,
/* 0xc4 */ 0x96, 0x96,
/* 0xc6 */ 0x97, 0x97,
/* 0xc8 */ 0x98, 0x98,
/* 0xca */ 0x9b, 0x9b,
/* 0xcc */ 0x9d, 0x9d,
/* 0xce */ 0x9e, 0x9e,
/* 0xd0 */ 0xa5, 0xa5,
/* 0xd2 */ 0xa6, 0xa6,
/* 0xd4 */ 0xa8, 0xa8,
/* 0xd6 */ 0xae, 0xae,
/* 0xd8 */ 0xaf, 0xaf,
/* 0xda */ 0xb4, 0xb4,
/* 0xdc */ 0xb6, 0xb6,
/* 0xde */ 0xb7, 0xb7,
/* 0xe0 */ 0xbc, 0xbc,
/* 0xe2 */ 0xbf, 0xbf,
/* 0xe4 */ 0xc5, 0xc5,
/* 0xe6 */ 0xe7, 0xe7,
/* 0xe8 */ 0xef, 0xef,
/* 0xea */ 0x09,
/* 0xeb */ 0x8e,
/* 0xec */ 0x90,
/* 0xed */ 0x91,
/* 0xee */ 0x94,
/* 0xef */ 0x9f,
/* 0xf0 */ 0xab,
/* 0xf1 */ 0xce,
/* 0xf2 */ 0xd7,
/* 0xf3 */ 0xe1,
/* 0xf4 */ 0xec,
/* 0xf5 */ 0xed,
};
/* below two non-overlapping tables are merged in order to save on L1D:
 *   - bits 15-11 for values 0x00-0x1f
 *   - bits 11-4 for values 0x60-0xff
 *
 * Indexes 0x20-0x5f belong to neither part and are never looked up; they are
 * left zeroed. The second part is explicitly positioned at index 0x60 using a
 * designated initializer: if it simply followed the first part, it would
 * start at index 0x20 and every lookup in 0x60-0xff would return the symbol
 * located 0x40 entries too far.
 */
uint8_t rht_bit15_11_11_4[256] = {
	/* part used for bits 15-11 (0x00-0x1f) */
	/* 0x00 */ 0x5c, 0x5c, 0x5c, 0x5c,
	/* 0x04 */ 0xc3, 0xc3, 0xc3, 0xc3,
	/* 0x08 */ 0xd0, 0xd0, 0xd0, 0xd0,
	/* 0x0c */ 0x80, 0x80,
	/* 0x0e */ 0x82, 0x82,
	/* 0x10 */ 0x83, 0x83,
	/* 0x12 */ 0xa2, 0xa2,
	/* 0x14 */ 0xb8, 0xb8,
	/* 0x16 */ 0xc2, 0xc2,
	/* 0x18 */ 0xe0, 0xe0,
	/* 0x1a */ 0xe2, 0xe2,
	/* 0x1c */ 0x99,
	/* 0x1d */ 0xa1,
	/* 0x1e */ 0xa7,
	/* 0x1f */ 0xac,

	/* 0x20..0x5f: unused hole between both parts, implicitly zero */

	/* part used for bits 11-4 for 0xf600 (0x60-0xff) */
	/* 0x60 */ [0x60] = 0xc7, 0xc7, 0xc7, 0xc7, 0xc7, 0xc7, 0xc7, 0xc7,
	/* 0x68 */ 0xcf, 0xcf, 0xcf, 0xcf, 0xcf, 0xcf, 0xcf, 0xcf,
	/* 0x70 */ 0xea, 0xea, 0xea, 0xea, 0xea, 0xea, 0xea, 0xea,
	/* 0x78 */ 0xeb, 0xeb, 0xeb, 0xeb, 0xeb, 0xeb, 0xeb, 0xeb,
	/* 0x80 */ 0xc0, 0xc0, 0xc0, 0xc0,
	/* 0x84 */ 0xc1, 0xc1, 0xc1, 0xc1,
	/* 0x88 */ 0xc8, 0xc8, 0xc8, 0xc8,
	/* 0x8c */ 0xc9, 0xc9, 0xc9, 0xc9,
	/* 0x90 */ 0xca, 0xca, 0xca, 0xca,
	/* 0x94 */ 0xcd, 0xcd, 0xcd, 0xcd,
	/* 0x98 */ 0xd2, 0xd2, 0xd2, 0xd2,
	/* 0x9c */ 0xd5, 0xd5, 0xd5, 0xd5,
	/* 0xa0 */ 0xda, 0xda, 0xda, 0xda,
	/* 0xa4 */ 0xdb, 0xdb, 0xdb, 0xdb,
	/* 0xa8 */ 0xee, 0xee, 0xee, 0xee,
	/* 0xac */ 0xf0, 0xf0, 0xf0, 0xf0,
	/* 0xb0 */ 0xf2, 0xf2, 0xf2, 0xf2,
	/* 0xb4 */ 0xf3, 0xf3, 0xf3, 0xf3,
	/* 0xb8 */ 0xff, 0xff, 0xff, 0xff,
	/* 0xbc */ 0xcb, 0xcb,
	/* 0xbe */ 0xcc, 0xcc,
	/* 0xc0 */ 0xd3, 0xd3,
	/* 0xc2 */ 0xd4, 0xd4,
	/* 0xc4 */ 0xd6, 0xd6,
	/* 0xc6 */ 0xdd, 0xdd,
	/* 0xc8 */ 0xde, 0xde,
	/* 0xca */ 0xdf, 0xdf,
	/* 0xcc */ 0xf1, 0xf1,
	/* 0xce */ 0xf4, 0xf4,
	/* 0xd0 */ 0xf5, 0xf5,
	/* 0xd2 */ 0xf6, 0xf6,
	/* 0xd4 */ 0xf7, 0xf7,
	/* 0xd6 */ 0xf8, 0xf8,
	/* 0xd8 */ 0xfa, 0xfa,
	/* 0xda */ 0xfb, 0xfb,
	/* 0xdc */ 0xfc, 0xfc,
	/* 0xde */ 0xfd, 0xfd,
	/* 0xe0 */ 0xfe, 0xfe,
	/* 0xe2 */ 0x02,
	/* 0xe3 */ 0x03,
	/* 0xe4 */ 0x04,
	/* 0xe5 */ 0x05,
	/* 0xe6 */ 0x06,
	/* 0xe7 */ 0x07,
	/* 0xe8 */ 0x08,
	/* 0xe9 */ 0x0b,
	/* 0xea */ 0x0c,
	/* 0xeb */ 0x0e,
	/* 0xec */ 0x0f,
	/* 0xed */ 0x10,
	/* 0xee */ 0x11,
	/* 0xef */ 0x12,
	/* 0xf0 */ 0x13,
	/* 0xf1 */ 0x14,
	/* 0xf2 */ 0x15,
	/* 0xf3 */ 0x17,
	/* 0xf4 */ 0x18,
	/* 0xf5 */ 0x19,
	/* 0xf6 */ 0x1a,
	/* 0xf7 */ 0x1b,
	/* 0xf8 */ 0x1c,
	/* 0xf9 */ 0x1d,
	/* 0xfa */ 0x1e,
	/* 0xfb */ 0x1f,
	/* 0xfc */ 0x7f,
	/* 0xfd */ 0xdc,
	/* 0xfe */ 0xf9,
	/* 0xff */ 0x0a,
	/* Note, for [0xff], l==30 and bits 2..3 give 00:0x0a, 01:0x0d, 10:0x16, 11:EOS */
};
/* huffman-encode string <s> into the huff_tmp buffer and returns the amount
* of output bytes. The caller must ensure the output is large enough (ie at
* least 4 times as long as s).
*
* FIXME: bits are only counted for now, no code is emitted!
*/
int huff_enc(const char *s, char *out)
{
int bits = 0;
while (*s) {
bits += ht[(uint8_t)*s].b;
s++;
}
bits += 7;
/* FIXME: huffman code is not emitted yet. */
//memset(out, 'H', bits / 8);
return bits / 8;
}
/* Decodes the <hlen> bytes of huffman-encoded string at <huff> into <out>,
 * which can hold up to <olen> bytes, and returns the number of bytes written
 * to <out>, or -1 in case of error. Errors are: an EOS code found in the
 * stream, more than 7 bits left after the last code, trailing bits not all
 * set to one (RFC7541#5.2), or <out> being too small to hold the whole
 * decoded string. A trailing zero is appended after the decoded string
 * whenever there is room left for it; it is not counted in the returned size.
 *
 * The principle of the decoder is to lookup full bytes in reverse-huffman
 * tables. Since we may need up to 30 bits and the word positions are not
 * always multiples of 8, we build the code word by shifting the "current"
 * 32-bit word and the "next" one of the appropriate amount of bits. Once
 * the shift goes beyond 32, words are swapped and the "next" one is refilled
 * with new bytes. Shift operations are cheap when done a single time like this.
 * On 64-bit platforms it is possible to further improve this by storing both
 * of them in a single word.
 */
int huff_dec(const uint8_t *huff, int hlen, char *out, int olen)
{
	char *out_start = out;
	char *out_end = out + olen;
	const uint8_t *huff_end = huff + hlen;
	uint32_t curr = 0;
	uint32_t next = 0;
	uint32_t shift;
	uint32_t code; /* The 30-bit code being looked up, MSB-aligned */
	uint32_t mask;
	uint8_t sym;
	int bleft; /* bits left */
	int l;

	code = 0;
	shift = 64; // start with an empty buffer
	bleft = hlen << 3;

	while (bleft > 0) {
		while (shift >= 32) {
			curr = next;

			/* read up to 4 bytes into next. The remaining length is
			 * compared instead of huff + 4 so that no pointer past
			 * the end of the input is ever formed.
			 */
			if (huff_end - huff >= 4) {
				next = read_n32(huff);
				huff += 4;
			}
			else {
				/* note: we append 0 and not 0xff so that we can
				 * distinguish shifted bits from a really inserted
				 * EOS.
				 */
				int pos;

				next = 0;
				for (pos = 24; huff < huff_end; pos -= 8)
					next += (uint32_t)*huff++ << pos;
			}
			shift -= 32;
		}

		/* curr:next contain 64 bit of huffman code */
		code = curr;
		if (shift)
			code = (code << shift) + (next >> (32 - shift));

		/* now we necessarily have 32 bits available */
		if (code < 0xfe000000) {
			/* single byte */
			sym = code >> 24;
			l = sym < 0xb8 ?
				sym < 0x50 ? 5 : 6 :
				sym < 0xf8 ? 7 : 8;
			sym = rht_bit31_24[code >> 24];
		}
		else if (code < 0xfffe0000) {
			/* two bytes, 0xfe + 2 bits or 0xff + 2..7 bits */
			sym = code >> 17;
			l = sym < 0xe0 ?
				sym < 0xa0 ? 10 : sym < 0xd0 ? 11 : 12 :
				sym < 0xf8 ? 13 : sym < 0xfc ? 14 : 15;
			sym = rht_bit24_17[(code >> 17) & 0xff];
		}
		else if (code < 0xffff0000) {
			/* 0xff + 0xfe + 3..5 bits */
			sym = (code >> 11) & 0x1f;
			l = sym < 0x0c ? 19 : sym < 0x1c ? 20 : 21;
			sym = rht_bit15_11_11_4[(code >> 11) & 0x1f];
		}
		else if (code < 0xfffff600) {
			/* 0xff + 0xff + 5..8 bits for values till 0xf5 */
			sym = code >> 8;
			l = sym < 0xb0 ?
				sym < 0x48 ? 21 : 22 :
				sym < 0xea ? 23 : 24;
			sym = rht_bit15_8[(code >> 8) & 0xff];
		}
		else {
			/* 0xff 0xff 0xf6..0xff */
			sym = code >> 4;
			l = sym < 0xbc ?
				sym < 0x80 ? 25 : 26 :
				sym < 0xe2 ? 27 : sym < 0xff ? 28 : 30;

			/* For 30-bit codes only bits 3..2 tell the symbols
			 * apart; bits 1..0 already belong to the next code and
			 * must be masked out of the comparison.
			 */
			if (sym < 0xff)
				sym = rht_bit15_11_11_4[(code >> 4) & 0xff];
			else if ((code & 0xfc) == 0xf0)
				sym = 10;
			else if ((code & 0xfc) == 0xf4)
				sym = 13;
			else if ((code & 0xfc) == 0xf8)
				sym = 22;
			else { // 0xfc : EOS
				break;
			}
		}

		if (!l || bleft - l < 0)
			break;

		/* Output buffer full: stop before consuming the code so that
		 * <code> remains aligned on the first unconsumed bit for the
		 * padding check below.
		 */
		if (out == out_end)
			break;

		bleft -= l;
		shift += l;
		*out++ = sym;
	}

	if (bleft > 0) {
		/* some bits were not consumed after the last code, they must
		 * match EOS (ie: all ones) and there must be 7 bits or less.
		 * (7541#5.2).
		 */
		if (bleft > 7)
			return -1;

		/* unsigned mask of the <bleft> upper bits: avoids shifting a
		 * signed 1 into the sign bit when bleft == 1.
		 */
		mask = ~(uint32_t)0 << (32 - bleft);
		if ((code & mask) != mask)
			return -1;
	}

	if (out < out_end)
		*out = 0; // end of string whenever possible

	return out - out_start;
}