blob: 44c0cc1178e6abfd77c5280d08ede637c9f68da0 [file] [log] [blame]
Willy Tarreauce040942017-05-30 18:46:58 +02001/*
2 * HPACK header table management (RFC7541) - type definitions and prototypes
3 *
4 * Copyright (C) 2014-2017 Willy Tarreau <willy@haproxy.org>
5 * Copyright (C) 2017 HAProxy Technologies
6 *
7 * Permission is hereby granted, free of charge, to any person obtaining
8 * a copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sublicense, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice shall be
16 * included in all copies or substantial portions of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
20 * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
21 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
22 * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
23 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
24 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
25 * OTHER DEALINGS IN THE SOFTWARE.
26 */
27#ifndef _COMMON_HPACK_TBL_H
28#define _COMMON_HPACK_TBL_H
29
Willy Tarreaua1bd1fa2019-03-29 17:26:33 +010030#include <inttypes.h>
Willy Tarreauce040942017-05-30 18:46:58 +020031#include <stdlib.h>
32#include <common/config.h>
33#include <common/http-hdr.h>
34#include <common/ist.h>
Willy Tarreau2bdcc702020-05-19 11:31:11 +020035#include <common/memory.h>
Willy Tarreauce040942017-05-30 18:46:58 +020036
37/* Dynamic Headers Table, usable for tables up to 4GB long and values of 64kB-1.
38 * The model can be improved by using offsets relative to the table entry's end
39 * or to the end of the area, or by moving the descriptors at the end of the
40 * table and the data at the beginning. This entry is 8 bytes long, which is 1/4
41 * of the bookkeeping planned by the HPACK spec. Thus it saves 24 bytes per
42 * header field, meaning that even with a single header, 24 extra bytes can be
43 * stored (ie one such descriptor). At 29.2 average bytes per header field as
44 * found in the hpack test case, that's slightly more than 1.5kB of space saved
45 * from a 4kB block, resulting in contiguous space almost always being
46 * available.
47 *
 * Principle: the table is stored in a contiguous array containing both the
 * descriptors and the contents. Descriptors are stored at the beginning of the
 * array while contents are stored starting from the end. Most of the time there
 * is enough room left in the table to insert a new header field, thanks to the
 * savings on the descriptor size. Thus by inserting headers from the end it's
 * possible to maximize the delay before a collision of DTEs and data. In order
 * to always insert from the right, we need to keep a reference to the latest
 * inserted element and look before it. The last inserted cell's address defines
 * the lowest known address still in use, unless the area wraps, in which case
 * the available space lies between the end of the tail and the beginning of the
 * head.
59 *
60 * In order to detect collisions between data blocks and DTEs, we also maintain
61 * an index to the lowest element facing the DTE table, called "front". This one
62 * is updated each time an element is inserted before it. Once the buffer wraps,
63 * this element doesn't have to be updated anymore until it is released, in
64 * which case the buffer doesn't wrap anymore and the front element becomes the
65 * head again.
66 *
 * Various heuristics are possible concerning the opportunity to wrap the
 * entries to limit the risk of collisions with the DTE, but experimentation
 * shows that thanks to the significant savings made on the descriptors, the
 * likelihood of finding a large amount of free space at the end of the area is
 * much higher than the risk of colliding, so in the end the most naive
 * algorithms work quite well. Typical ratios of 1 collision per 2000 requests
 * have been observed.
74 *
 * The defragmentation should be rare ; a study on live data shows on average
 * 29.2 bytes used per header field. Adding the 32 bytes of overhead that the
 * protocol accounts per entry, this gives an average of 66.9 header fields per
 * 4kB table. Since the current storage description only spends 8 bytes per
 * entry instead of 32, this brings a 1606 bytes saving (66.9 * 24), ensuring
 * that oldest headers are linearly removed by the sender before fragmentation
 * occurs. This means that for all smaller header fields there will not be any
 * requirement to defragment the area and most of the time it will even be
 * possible to copy the old values directly within the buffer after creating a
 * new entry. On average within the available space there will be enough room
 * to store 1606/(29.2+8)=43 extra header fields without switching to another
 * place.
85 *
86 * The table header fits in the table itself, it only takes 16 bytes, so in the
87 * worst case (1 single header) it's possible to store 4096 - 16 - 8 = 4072
88 * data bytes, which is larger than the 4064 the protocol requires (4096 - 32).
89 */
90
/* One dynamic table entry descriptor (8 bytes). It locates one header field
 * stored in the table area: the name comes first and is immediately followed
 * by the value.
 */
struct hpack_dte {
	uint32_t addr;  /* offset of the name, in bytes from the start of the struct hpack_dht */
	uint16_t nlen;  /* header name length */
	uint16_t vlen;  /* header value length */
};
97
98/* Note: the table's head plus a struct hpack_dte must be smaller than or equal to 32
99 * bytes so that a single large header can always fit. Here that's 16 bytes for
100 * the header, plus 8 bytes per slot.
101 * Note that when <used> == 0, front, head, and wrap are undefined.
102 */
103struct hpack_dht {
104 uint32_t size; /* allocated table size in bytes */
105 uint32_t total; /* sum of nlen + vlen in bytes */
106 uint16_t front; /* slot number of the first node after the idx table */
107 uint16_t wrap; /* number of allocated slots, wraps here */
108 uint16_t head; /* last inserted slot number */
109 uint16_t used; /* number of slots in use */
110 struct hpack_dte dte[0]; /* dynamic table entries */
111};
112
/* Supported hpack encoding/decoding errors. Values are assigned sequentially
 * starting from zero, HPACK_ERR_NONE meaning "no error".
 */
enum {
	HPACK_ERR_NONE = 0,           /* no error */
	HPACK_ERR_ALLOC_FAIL,         /* memory allocation error */
	HPACK_ERR_UNKNOWN_OPCODE,     /* invalid first byte */
	HPACK_ERR_TRUNCATED,          /* truncated stream */
	HPACK_ERR_HUFFMAN,            /* huffman decoding error */
	HPACK_ERR_INVALID_PHDR,       /* invalid pseudo header field name */
	HPACK_ERR_MISPLACED_PHDR,     /* pseudo header field after a regular header field */
	HPACK_ERR_DUPLICATE_PHDR,     /* duplicate pseudo header field */
	HPACK_ERR_DHT_INSERT_FAIL,    /* failed to insert into DHT */
	HPACK_ERR_TOO_LARGE,          /* decoded request/response is too large */
	HPACK_ERR_MISSING_METHOD,     /* :method is missing */
	HPACK_ERR_MISSING_SCHEME,     /* :scheme is missing */
	HPACK_ERR_MISSING_PATH,       /* :path is missing */
	HPACK_ERR_MISSING_AUTHORITY,  /* :authority is missing with CONNECT */
	HPACK_ERR_SCHEME_NOT_ALLOWED, /* :scheme not allowed with CONNECT */
	HPACK_ERR_PATH_NOT_ALLOWED,   /* :path not allowed with CONNECT */
	HPACK_ERR_INVALID_ARGUMENT,   /* an invalid argument was passed */
};
133
134/* static header table as in RFC7541 Appendix A. [0] unused. */
135#define HPACK_SHT_SIZE 62
136extern const struct http_hdr hpack_sht[HPACK_SHT_SIZE];
Willy Tarreau2bdcc702020-05-19 11:31:11 +0200137extern struct pool_head *pool_head_hpack_tbl;
Willy Tarreauce040942017-05-30 18:46:58 +0200138
139extern int __hpack_dht_make_room(struct hpack_dht *dht, unsigned int needed);
140extern int hpack_dht_insert(struct hpack_dht *dht, struct ist name, struct ist value);
141
142/* return a pointer to the entry designated by index <idx> (starting at 1) or
143 * NULL if this index is not there.
144 */
145static inline const struct hpack_dte *hpack_get_dte(const struct hpack_dht *dht, uint16_t idx)
146{
147 idx--;
148
149 if (idx >= dht->used)
150 return NULL;
151
152 if (idx <= dht->head)
153 idx = dht->head - idx;
154 else
155 idx = dht->head - idx + dht->wrap;
156
157 return &dht->dte[idx];
158}
159
Willy Tarreaud85ba4e2017-12-03 12:12:17 +0100160/* returns non-zero if <idx> is valid for table <dht> */
Willy Tarreau7f2a44d2018-09-17 14:07:33 +0200161static inline int hpack_valid_idx(const struct hpack_dht *dht, uint32_t idx)
Willy Tarreaud85ba4e2017-12-03 12:12:17 +0100162{
163 return idx < dht->used + HPACK_SHT_SIZE;
164}
165
Willy Tarreauce040942017-05-30 18:46:58 +0200166/* return a pointer to the header name for entry <dte>. */
167static inline struct ist hpack_get_name(const struct hpack_dht *dht, const struct hpack_dte *dte)
168{
169 struct ist ret = {
170 .ptr = (void *)dht + dte->addr,
171 .len = dte->nlen,
172 };
173 return ret;
174}
175
176/* return a pointer to the header value for entry <dte>. */
177static inline struct ist hpack_get_value(const struct hpack_dht *dht, const struct hpack_dte *dte)
178{
179 struct ist ret = {
180 .ptr = (void *)dht + dte->addr + dte->nlen,
181 .len = dte->vlen,
182 };
183 return ret;
184}
185
186/* takes an idx, returns the associated name */
Willy Tarreau7f2a44d2018-09-17 14:07:33 +0200187static inline struct ist hpack_idx_to_name(const struct hpack_dht *dht, uint32_t idx)
Willy Tarreauce040942017-05-30 18:46:58 +0200188{
189 const struct hpack_dte *dte;
190
191 if (idx < HPACK_SHT_SIZE)
192 return hpack_sht[idx].n;
193
194 dte = hpack_get_dte(dht, idx - HPACK_SHT_SIZE + 1);
195 if (!dte)
196 return ist("### ERR ###"); // error
197
198 return hpack_get_name(dht, dte);
199}
200
201/* takes an idx, returns the associated value */
Willy Tarreau7f2a44d2018-09-17 14:07:33 +0200202static inline struct ist hpack_idx_to_value(const struct hpack_dht *dht, uint32_t idx)
Willy Tarreauce040942017-05-30 18:46:58 +0200203{
204 const struct hpack_dte *dte;
205
206 if (idx < HPACK_SHT_SIZE)
207 return hpack_sht[idx].v;
208
209 dte = hpack_get_dte(dht, idx - HPACK_SHT_SIZE + 1);
210 if (!dte)
211 return ist("### ERR ###"); // error
212
213 return hpack_get_value(dht, dte);
214}
215
216/* Purges table dht until a header field of <needed> bytes fits according to
217 * the protocol (adding 32 bytes overhead). Returns non-zero on success, zero
218 * on failure (ie: table empty but still not sufficient).
219 */
220static inline int hpack_dht_make_room(struct hpack_dht *dht, unsigned int needed)
221{
Willy Tarreau6c71e462017-12-04 17:58:37 +0100222 if (dht->used * 32 + dht->total + needed + 32 <= dht->size)
Willy Tarreauce040942017-05-30 18:46:58 +0200223 return 1;
Willy Tarreau6c71e462017-12-04 17:58:37 +0100224 else if (!dht->used)
225 return 0;
Willy Tarreauce040942017-05-30 18:46:58 +0200226
227 return __hpack_dht_make_room(dht, needed);
228}
229
230/* allocate a dynamic headers table of <size> bytes and return it initialized */
231static inline void hpack_dht_init(struct hpack_dht *dht, uint32_t size)
232{
233 dht->size = size;
234 dht->total = 0;
235 dht->used = 0;
236}
237
Willy Tarreau2bdcc702020-05-19 11:31:11 +0200238/* allocate a dynamic headers table from the pool and return it initialized */
239static inline struct hpack_dht *hpack_dht_alloc()
Willy Tarreauce040942017-05-30 18:46:58 +0200240{
241 struct hpack_dht *dht;
242
Willy Tarreau2bdcc702020-05-19 11:31:11 +0200243 if (unlikely(!pool_head_hpack_tbl))
244 return NULL;
Willy Tarreauce040942017-05-30 18:46:58 +0200245
Willy Tarreau2bdcc702020-05-19 11:31:11 +0200246 dht = pool_alloc(pool_head_hpack_tbl);
247 if (dht)
248 hpack_dht_init(dht, pool_head_hpack_tbl->size);
Willy Tarreauce040942017-05-30 18:46:58 +0200249 return dht;
250}
251
252/* free a dynamic headers table */
253static inline void hpack_dht_free(struct hpack_dht *dht)
254{
Willy Tarreau2bdcc702020-05-19 11:31:11 +0200255 pool_free(pool_head_hpack_tbl, dht);
Willy Tarreauce040942017-05-30 18:46:58 +0200256}
257
258#endif /* _COMMON_HPACK_TBL_H */