blob: 4c494d565abb29e472f7b3976de86cfc97c69bec [file] [log] [blame]
Willy Tarreau62f52692017-10-08 23:01:42 +02001/*
2 * HTTP/2 mux-demux for connections
3 *
4 * Copyright 2017 Willy Tarreau <w@1wt.eu>
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
13#include <common/cfgparse.h>
14#include <common/config.h>
Willy Tarreauafba57a2018-12-11 13:44:24 +010015#include <common/h1.h>
Willy Tarreau5ab6b572017-09-22 08:05:00 +020016#include <common/h2.h>
Willy Tarreau13278b42017-10-13 19:23:14 +020017#include <common/hpack-dec.h>
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +020018#include <common/hpack-enc.h>
Willy Tarreau5ab6b572017-09-22 08:05:00 +020019#include <common/hpack-tbl.h>
Willy Tarreaub96b77e2018-12-11 10:22:41 +010020#include <common/htx.h>
Willy Tarreau0108d902018-11-25 19:14:37 +010021#include <common/initcall.h>
Willy Tarreaue4820742017-07-27 13:37:23 +020022#include <common/net_helper.h>
Willy Tarreau62f52692017-10-08 23:01:42 +020023#include <proto/connection.h>
Willy Tarreaubcd3bb32018-12-01 18:59:00 +010024#include <proto/http_htx.h>
Olivier Houchard44d59142018-12-13 18:46:22 +010025#include <proto/session.h>
Willy Tarreau62f52692017-10-08 23:01:42 +020026#include <proto/stream.h>
Olivier Houchard44d59142018-12-13 18:46:22 +010027#include <proto/stream_interface.h>
Willy Tarreauea392822017-10-31 10:02:25 +010028#include <types/session.h>
Willy Tarreau5ab6b572017-09-22 08:05:00 +020029#include <eb32tree.h>
Willy Tarreau62f52692017-10-08 23:01:42 +020030
31
/* Dummy streams returned for idle and closed states. These are only tentative
 * declarations: both pointers are given their initializers further down in the
 * file, once struct h2s has been fully declared.
 */
static const struct h2s *h2_closed_stream;
static const struct h2s *h2_idle_stream;
35
/* Connection flags (32 bit), in h2c->flags */
#define H2_CF_NONE 0x00000000

/* Flags indicating why writing to the mux is blocked. */
#define H2_CF_MUX_MALLOC 0x00000001 // mux blocked on lack of connection's mux buffer
#define H2_CF_MUX_MFULL 0x00000002 // mux blocked on connection's mux buffer full
#define H2_CF_MUX_BLOCK_ANY 0x00000003 // aggregate of the mux flags above

/* Flags indicating why writing to the demux is blocked.
 * The first two ones directly affect the ability for the mux to receive data
 * from the connection. The other ones affect the mux's ability to demux
 * received data.
 */
#define H2_CF_DEM_DALLOC 0x00000004 // demux blocked on lack of connection's demux buffer
#define H2_CF_DEM_DFULL 0x00000008 // demux blocked on connection's demux buffer full

#define H2_CF_DEM_MBUSY 0x00000010 // demux blocked on connection's mux side busy
#define H2_CF_DEM_MROOM 0x00000020 // demux blocked on lack of room in mux buffer
#define H2_CF_DEM_SALLOC 0x00000040 // demux blocked on lack of stream's request buffer
#define H2_CF_DEM_SFULL 0x00000080 // demux blocked on stream request buffer full
#define H2_CF_DEM_TOOMANY 0x00000100 // demux blocked waiting for some conn_streams to leave
#define H2_CF_DEM_BLOCK_ANY 0x000001F0 // aggregate of the demux flags above except DALLOC/DFULL

/* other flags */
#define H2_CF_GOAWAY_SENT 0x00001000 // a GOAWAY frame was successfully sent
#define H2_CF_GOAWAY_FAILED 0x00002000 // a GOAWAY frame failed to be sent
#define H2_CF_WAIT_FOR_HS 0x00004000 // we did check that at least one stream was waiting for the handshake
#define H2_CF_IS_BACK 0x00008000 // this is an outgoing connection
Willy Tarreau081d4722017-05-16 21:51:05 +020064
/* H2 connection state, in h2c->st0. The numeric order of the values is
 * meaningful: h2_recv_allowed() tests "st0 >= H2_CS_ERROR", so the error
 * states must remain the highest ones before H2_CS_ENTRIES.
 */
enum h2_cs {
	H2_CS_PREFACE, // init done, waiting for connection preface
	H2_CS_SETTINGS1, // preface OK, waiting for first settings frame
	H2_CS_FRAME_H, // first settings frame ok, waiting for frame header
	H2_CS_FRAME_P, // frame header OK, waiting for frame payload
	H2_CS_FRAME_A, // frame payload OK, trying to send ACK frame
	H2_CS_FRAME_E, // frame payload OK, trying to send RST frame
	H2_CS_ERROR, // send GOAWAY(errcode) and close the connection ASAP
	H2_CS_ERROR2, // GOAWAY(errcode) sent, close the connection ASAP
	H2_CS_ENTRIES // must be last
} __attribute__((packed));
77
/* H2 connection descriptor. One instance is allocated per connection by
 * h2_init() and released by h2_release().
 */
struct h2c {
	struct connection *conn;

	enum h2_cs st0; /* mux state */
	enum h2_err errcode; /* H2 err code (H2_ERR_*) */

	/* 16 bit hole here */
	uint32_t flags; /* connection flags: H2_CF_* */
	int32_t max_id; /* highest ID known on this connection, <0 before preface */
	uint32_t rcvd_c; /* newly received data to ACK for the connection */
	uint32_t rcvd_s; /* newly received data to ACK for the current stream (dsi) */

	/* states for the demux direction */
	struct hpack_dht *ddht; /* demux dynamic header table */
	struct buffer dbuf; /* demux buffer */

	int32_t dsi; /* demux stream ID (<0 = idle) */
	int32_t dfl; /* demux frame length (if dsi >= 0) */
	int8_t dft; /* demux frame type (if dsi >= 0) */
	int8_t dff; /* demux frame flags (if dsi >= 0) */
	uint8_t dpl; /* demux pad length (part of dfl), init to 0 */
	/* 8 bit hole here */
	int32_t last_sid; /* last processed stream ID for GOAWAY, <0 before preface */

	/* states for the mux direction.
	 * NOTE(review): the "(if dsi >= 0)" conditions on mfl/mft/mff below
	 * presumably mean "msi >= 0" (copy-paste from the demux fields) -- confirm.
	 */
	struct buffer mbuf; /* mux buffer */
	int32_t msi; /* mux stream ID (<0 = idle) */
	int32_t mfl; /* mux frame length (if dsi >= 0) */
	int8_t mft; /* mux frame type (if dsi >= 0) */
	int8_t mff; /* mux frame flags (if dsi >= 0) */
	/* 16 bit hole here */
	int32_t miw; /* mux initial window size for all new streams */
	int32_t mws; /* mux window size. Can be negative. */
	int32_t mfs; /* mux's max frame size */

	int timeout; /* idle timeout duration in ticks */
	int shut_timeout; /* idle timeout duration in ticks after GOAWAY was sent */
	unsigned int nb_streams; /* number of streams in the tree */
	unsigned int nb_cs; /* number of attached conn_streams */
	struct proxy *proxy; /* the proxy this connection was created for */
	struct task *task; /* timeout management task */
	struct eb_root streams_by_id; /* all active streams by their ID */
	struct list send_list; /* list of blocked streams requesting to send */
	struct list fctl_list; /* list of streams blocked by connection's fctl */
	struct list sending_list; /* list of h2s scheduled to send data */
	struct buffer_wait buf_wait; /* wait list for buffer allocations */
	struct wait_event wait_event; /* To be used if we're waiting for I/Os */
};
127
/* H2 stream state, in h2s->st. The numeric order is meaningful: h2s_error()
 * only switches a stream to H2_SS_ERROR when its state is strictly below
 * H2_SS_ERROR, so ERROR and CLOSED must remain the highest states.
 */
enum h2_ss {
	H2_SS_IDLE = 0, // idle
	H2_SS_RLOC, // reserved(local)
	H2_SS_RREM, // reserved(remote)
	H2_SS_OPEN, // open
	H2_SS_HREM, // half-closed(remote)
	H2_SS_HLOC, // half-closed(local)
	H2_SS_ERROR, // an error needs to be sent using RST_STREAM
	H2_SS_CLOSED, // closed
	H2_SS_ENTRIES // must be last
} __attribute__((packed));
140
/* HTTP/2 stream flags (32 bit), in h2s->flags */
#define H2_SF_NONE 0x00000000
#define H2_SF_ES_RCVD 0x00000001
#define H2_SF_ES_SENT 0x00000002

#define H2_SF_RST_RCVD 0x00000004 // received RST_STREAM
#define H2_SF_RST_SENT 0x00000008 // sent RST_STREAM

/* stream flags indicating the reason the stream is blocked */
#define H2_SF_BLK_MBUSY 0x00000010 // blocked waiting for mux access (transient)
#define H2_SF_BLK_MROOM 0x00000020 // blocked waiting for room in the mux
#define H2_SF_BLK_MFCTL 0x00000040 // blocked due to mux fctl
#define H2_SF_BLK_SFCTL 0x00000080 // blocked due to stream fctl
#define H2_SF_BLK_ANY 0x000000F0 // any of the reasons above

/* stream flags indicating how data is supposed to be sent */
#define H2_SF_DATA_CLEN 0x00000100 // data sent using content-length
#define H2_SF_DATA_CHNK 0x00000200 // data sent using chunked-encoding

/* step we're currently in when sending chunks. This is needed because we may
 * have to transfer chunks as large as a full buffer so there's no room left
 * for size nor crlf around.
 */
#define H2_SF_CHNK_SIZE 0x00000000 // trying to send chunk size
#define H2_SF_CHNK_DATA 0x00000400 // trying to send chunk data
#define H2_SF_CHNK_CRLF 0x00000800 // trying to send chunk crlf after data

#define H2_SF_CHNK_MASK 0x00000C00 // mask covering the chunk step values above

#define H2_SF_HEADERS_SENT 0x00001000 // a HEADERS frame was sent for this stream
#define H2_SF_OUTGOING_DATA 0x00002000 // set whenever we've seen outgoing data
Willy Tarreau67434202017-11-06 20:20:51 +0100172
/* H2 stream descriptor, describing the stream as it appears in the H2C, and as
 * it is being processed in the internal HTTP representation (H1 for now).
 */
struct h2s {
	struct conn_stream *cs;
	struct session *sess;
	struct h2c *h2c;
	struct h1m h1m; /* request or response parser state for H1 */
	struct eb32_node by_id; /* place in h2c's streams_by_id */
	int32_t id; /* stream ID */
	uint32_t flags; /* H2_SF_* */
	int mws; /* mux window size for this stream */
	enum h2_err errcode; /* H2 err code (H2_ERR_*) */
	enum h2_ss st;
	uint16_t status; /* HTTP response status */
	struct buffer rxbuf; /* receive buffer, always valid (buf_empty or real buffer) */
	struct wait_event wait_event; /* Wait list, when we're attempting to send a RST but we can't send */
	struct wait_event *recv_wait; /* Address of the wait_event the associated conn_stream is waiting on */
	struct wait_event *send_wait; /* The stream is waiting for flow control */
	struct list list; /* To be used when adding in h2c->send_list or h2c->fctl_list */
};
Willy Tarreau5ab6b572017-09-22 08:05:00 +0200194
/* descriptor for an h2 frame header, with the fields already converted to
 * host byte order
 */
struct h2_fh {
	uint32_t len; /* length, host order, 24 bits */
	uint32_t sid; /* stream id, host order, 31 bits */
	uint8_t ft; /* frame type */
	uint8_t ff; /* frame flags */
};
202
/* the h2c connection pool: objects of sizeof(struct h2c), registered as "h2c" */
DECLARE_STATIC_POOL(pool_head_h2c, "h2c", sizeof(struct h2c));

/* the h2s stream pool: objects of sizeof(struct h2s), registered as "h2s" */
DECLARE_STATIC_POOL(pool_head_h2s, "h2s", sizeof(struct h2s));
208
/* The default connection window size is 65535, it may only be enlarged using
 * a WINDOW_UPDATE message. Since the window must never be larger than 2G-1,
 * we'll pretend we already received the difference between the two to send
 * an equivalent window update to enlarge it to 2G-1. h2_init() preloads
 * h2c->rcvd_c with this value.
 */
#define H2_INITIAL_WINDOW_INCREMENT ((1U<<31)-1 - 65535)
215
/* a few settings from the global section */
static int h2_settings_header_table_size = 4096; /* initial value */
static int h2_settings_initial_window_size = 65535; /* initial value */
static int h2_settings_max_concurrent_streams = 100; /* initial value */
Willy Tarreaufe20e5b2017-07-27 11:42:14 +0200220
/* a dummy closed stream: no conn_stream, no connection, ID 0, already in
 * CLOSED state and flagged as having received an RST_STREAM. It is what
 * h2c_st_by_id() returns for ID 0 and for IDs not found in the tree.
 */
static const struct h2s *h2_closed_stream = &(const struct h2s){
	.cs = NULL,
	.h2c = NULL,
	.st = H2_SS_CLOSED,
	.errcode = H2_ERR_STREAM_CLOSED,
	.flags = H2_SF_RST_RCVD,
	.id = 0,
};
230
/* and a dummy idle stream for use with any unannounced stream: it is what
 * h2c_st_by_id() returns for IDs above h2c->max_id.
 */
static const struct h2s *h2_idle_stream = &(const struct h2s){
	.cs = NULL,
	.h2c = NULL,
	.st = H2_SS_IDLE,
	.errcode = H2_ERR_STREAM_CLOSED,
	.id = 0,
};
239
/* forward declarations of functions referenced before their definition */
static struct task *h2_timeout_task(struct task *t, void *context, unsigned short state);
static int h2_send(struct h2c *h2c);
static int h2_recv(struct h2c *h2c);
static int h2_process(struct h2c *h2c);
static struct task *h2_io_cb(struct task *t, void *ctx, unsigned short state);
static inline struct h2s *h2c_st_by_id(struct h2c *h2c, int id);
static int h2s_decode_headers(struct h2s *h2s);
static int h2_frt_transfer_data(struct h2s *h2s);
static struct task *h2_deferred_shut(struct task *t, void *ctx, unsigned short state);
static struct h2s *h2c_bck_stream_new(struct h2c *h2c, struct conn_stream *cs, struct session *sess);
Willy Tarreaufe20e5b2017-07-27 11:42:14 +0200250
Willy Tarreau35dbd5d2017-09-22 09:13:49 +0200251/*****************************************************/
252/* functions below are for dynamic buffer management */
253/*****************************************************/
254
Willy Tarreau315d8072017-12-10 22:17:57 +0100255/* indicates whether or not the we may call the h2_recv() function to attempt
256 * to receive data into the buffer and/or demux pending data. The condition is
257 * a bit complex due to some API limits for now. The rules are the following :
258 * - if an error or a shutdown was detected on the connection and the buffer
259 * is empty, we must not attempt to receive
260 * - if the demux buf failed to be allocated, we must not try to receive and
261 * we know there is nothing pending
Willy Tarreau6042aeb2017-12-12 11:01:44 +0100262 * - if no flag indicates a blocking condition, we may attempt to receive,
263 * regardless of whether the demux buffer is full or not, so that only
264 * de demux part decides whether or not to block. This is needed because
265 * the connection API indeed prevents us from re-enabling receipt that is
266 * already enabled in a polled state, so we must always immediately stop
267 * as soon as the demux can't proceed so as never to hit an end of read
268 * with data pending in the buffers.
Willy Tarreau315d8072017-12-10 22:17:57 +0100269 * - otherwise must may not attempt
270 */
271static inline int h2_recv_allowed(const struct h2c *h2c)
272{
Willy Tarreauc9fa0482018-07-10 17:43:27 +0200273 if (b_data(&h2c->dbuf) == 0 &&
Willy Tarreau315d8072017-12-10 22:17:57 +0100274 (h2c->st0 >= H2_CS_ERROR ||
275 h2c->conn->flags & CO_FL_ERROR ||
276 conn_xprt_read0_pending(h2c->conn)))
277 return 0;
278
279 if (!(h2c->flags & H2_CF_DEM_DALLOC) &&
Willy Tarreau6042aeb2017-12-12 11:01:44 +0100280 !(h2c->flags & H2_CF_DEM_BLOCK_ANY))
Willy Tarreau315d8072017-12-10 22:17:57 +0100281 return 1;
282
283 return 0;
284}
285
Willy Tarreauf2101912018-07-19 10:11:38 +0200286/* returns true if the connection has too many conn_streams attached */
287static inline int h2_has_too_many_cs(const struct h2c *h2c)
288{
289 return h2c->nb_cs >= h2_settings_max_concurrent_streams;
290}
291
Willy Tarreau44e973f2018-03-01 17:49:30 +0100292/* Tries to grab a buffer and to re-enable processing on mux <target>. The h2c
293 * flags are used to figure what buffer was requested. It returns 1 if the
294 * allocation succeeds, in which case the connection is woken up, or 0 if it's
295 * impossible to wake up and we prefer to be woken up later.
Willy Tarreau35dbd5d2017-09-22 09:13:49 +0200296 */
Willy Tarreau44e973f2018-03-01 17:49:30 +0100297static int h2_buf_available(void *target)
Willy Tarreau35dbd5d2017-09-22 09:13:49 +0200298{
299 struct h2c *h2c = target;
Willy Tarreau0b559072018-02-26 15:22:17 +0100300 struct h2s *h2s;
Willy Tarreau35dbd5d2017-09-22 09:13:49 +0200301
Willy Tarreau44e973f2018-03-01 17:49:30 +0100302 if ((h2c->flags & H2_CF_DEM_DALLOC) && b_alloc_margin(&h2c->dbuf, 0)) {
Willy Tarreau1b62c5c2017-09-25 11:55:01 +0200303 h2c->flags &= ~H2_CF_DEM_DALLOC;
Olivier Houchard53216e72018-10-10 15:46:36 +0200304 if (h2_recv_allowed(h2c))
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200305 tasklet_wakeup(h2c->wait_event.task);
Willy Tarreau35dbd5d2017-09-22 09:13:49 +0200306 return 1;
307 }
Willy Tarreau35dbd5d2017-09-22 09:13:49 +0200308
Willy Tarreau44e973f2018-03-01 17:49:30 +0100309 if ((h2c->flags & H2_CF_MUX_MALLOC) && b_alloc_margin(&h2c->mbuf, 0)) {
310 h2c->flags &= ~H2_CF_MUX_MALLOC;
Willy Tarreau1b62c5c2017-09-25 11:55:01 +0200311
312 if (h2c->flags & H2_CF_DEM_MROOM) {
313 h2c->flags &= ~H2_CF_DEM_MROOM;
Olivier Houchard53216e72018-10-10 15:46:36 +0200314 if (h2_recv_allowed(h2c))
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200315 tasklet_wakeup(h2c->wait_event.task);
Willy Tarreau1b62c5c2017-09-25 11:55:01 +0200316 }
Willy Tarreau14398122017-09-22 14:26:04 +0200317 return 1;
318 }
Willy Tarreau0b559072018-02-26 15:22:17 +0100319
320 if ((h2c->flags & H2_CF_DEM_SALLOC) &&
321 (h2s = h2c_st_by_id(h2c, h2c->dsi)) && h2s->cs &&
Olivier Houchard638b7992018-08-16 15:41:52 +0200322 b_alloc_margin(&h2s->rxbuf, 0)) {
Willy Tarreau0b559072018-02-26 15:22:17 +0100323 h2c->flags &= ~H2_CF_DEM_SALLOC;
Olivier Houchard53216e72018-10-10 15:46:36 +0200324 if (h2_recv_allowed(h2c))
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200325 tasklet_wakeup(h2c->wait_event.task);
Willy Tarreau0b559072018-02-26 15:22:17 +0100326 return 1;
327 }
328
Willy Tarreau14398122017-09-22 14:26:04 +0200329 return 0;
330}
331
Willy Tarreauc9fa0482018-07-10 17:43:27 +0200332static inline struct buffer *h2_get_buf(struct h2c *h2c, struct buffer *bptr)
Willy Tarreau14398122017-09-22 14:26:04 +0200333{
334 struct buffer *buf = NULL;
335
Willy Tarreau44e973f2018-03-01 17:49:30 +0100336 if (likely(LIST_ISEMPTY(&h2c->buf_wait.list)) &&
337 unlikely((buf = b_alloc_margin(bptr, 0)) == NULL)) {
338 h2c->buf_wait.target = h2c;
339 h2c->buf_wait.wakeup_cb = h2_buf_available;
Christopher Faulet2a944ee2017-11-07 10:42:54 +0100340 HA_SPIN_LOCK(BUF_WQ_LOCK, &buffer_wq_lock);
Willy Tarreau44e973f2018-03-01 17:49:30 +0100341 LIST_ADDQ(&buffer_wq, &h2c->buf_wait.list);
Christopher Faulet2a944ee2017-11-07 10:42:54 +0100342 HA_SPIN_UNLOCK(BUF_WQ_LOCK, &buffer_wq_lock);
Willy Tarreau14398122017-09-22 14:26:04 +0200343 __conn_xprt_stop_recv(h2c->conn);
344 }
345 return buf;
346}
347
Willy Tarreauc9fa0482018-07-10 17:43:27 +0200348static inline void h2_release_buf(struct h2c *h2c, struct buffer *bptr)
Willy Tarreau14398122017-09-22 14:26:04 +0200349{
Willy Tarreauc9fa0482018-07-10 17:43:27 +0200350 if (bptr->size) {
Willy Tarreau44e973f2018-03-01 17:49:30 +0100351 b_free(bptr);
Olivier Houchard673867c2018-05-25 16:58:52 +0200352 offer_buffers(h2c->buf_wait.target, tasks_run_queue);
Willy Tarreau14398122017-09-22 14:26:04 +0200353 }
354}
355
Olivier Houchardd540b362018-11-05 18:37:53 +0100356static int h2_avail_streams(struct connection *conn)
357{
358 struct h2c *h2c = conn->mux_ctx;
359
Olivier Houchard8defe4b2018-12-02 01:31:17 +0100360 /* XXX Should use the negociated max concurrent stream nb instead of the conf value */
Olivier Houchardd540b362018-11-05 18:37:53 +0100361 return (h2_settings_max_concurrent_streams - h2c->nb_streams);
362}
363
Olivier Houchard8defe4b2018-12-02 01:31:17 +0100364static int h2_max_streams(struct connection *conn)
365{
366 /* XXX Should use the negociated max concurrent stream nb instead of the conf value */
367 return h2_settings_max_concurrent_streams;
368}
369
Willy Tarreau35dbd5d2017-09-22 09:13:49 +0200370
Willy Tarreau62f52692017-10-08 23:01:42 +0200371/*****************************************************************/
372/* functions below are dedicated to the mux setup and management */
373/*****************************************************************/
374
Willy Tarreau7dc24e42018-10-03 13:52:41 +0200375/* Initialize the mux once it's attached. For outgoing connections, the context
376 * is already initialized before installing the mux, so we detect incoming
377 * connections from the fact that the context is still NULL. Returns < 0 on
378 * error.
379 */
Olivier Houchardf502aca2018-12-14 19:42:40 +0100380static int h2_init(struct connection *conn, struct proxy *prx, struct session *sess)
Willy Tarreau32218eb2017-09-22 08:07:25 +0200381{
382 struct h2c *h2c;
Willy Tarreauea392822017-10-31 10:02:25 +0100383 struct task *t = NULL;
Willy Tarreau32218eb2017-09-22 08:07:25 +0200384
Willy Tarreaubafbe012017-11-24 17:34:44 +0100385 h2c = pool_alloc(pool_head_h2c);
Willy Tarreau32218eb2017-09-22 08:07:25 +0200386 if (!h2c)
mildiscd2d7de2018-10-02 16:44:18 +0200387 goto fail_no_h2c;
Willy Tarreau32218eb2017-09-22 08:07:25 +0200388
Willy Tarreau01b44822018-10-03 14:26:37 +0200389 if (conn->mux_ctx) {
390 h2c->flags = H2_CF_IS_BACK;
391 h2c->shut_timeout = h2c->timeout = prx->timeout.server;
392 if (tick_isset(prx->timeout.serverfin))
393 h2c->shut_timeout = prx->timeout.serverfin;
394 } else {
395 h2c->flags = H2_CF_NONE;
396 h2c->shut_timeout = h2c->timeout = prx->timeout.client;
397 if (tick_isset(prx->timeout.clientfin))
398 h2c->shut_timeout = prx->timeout.clientfin;
399 }
Willy Tarreau3f133572017-10-31 19:21:06 +0100400
Willy Tarreau0b37d652018-10-03 10:33:02 +0200401 h2c->proxy = prx;
Willy Tarreau33400292017-11-05 11:23:40 +0100402 h2c->task = NULL;
Willy Tarreau3f133572017-10-31 19:21:06 +0100403 if (tick_isset(h2c->timeout)) {
404 t = task_new(tid_bit);
405 if (!t)
406 goto fail;
407
408 h2c->task = t;
409 t->process = h2_timeout_task;
410 t->context = h2c;
411 t->expire = tick_add(now_ms, h2c->timeout);
412 }
Willy Tarreauea392822017-10-31 10:02:25 +0100413
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200414 h2c->wait_event.task = tasklet_new();
415 if (!h2c->wait_event.task)
Olivier Houchard910b2bc2018-07-17 18:49:38 +0200416 goto fail;
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200417 h2c->wait_event.task->process = h2_io_cb;
418 h2c->wait_event.task->context = h2c;
419 h2c->wait_event.wait_reason = 0;
Olivier Houchard910b2bc2018-07-17 18:49:38 +0200420
Willy Tarreau32218eb2017-09-22 08:07:25 +0200421 h2c->ddht = hpack_dht_alloc(h2_settings_header_table_size);
422 if (!h2c->ddht)
423 goto fail;
424
425 /* Initialise the context. */
426 h2c->st0 = H2_CS_PREFACE;
427 h2c->conn = conn;
428 h2c->max_id = -1;
429 h2c->errcode = H2_ERR_NO_ERROR;
Willy Tarreaudc572362018-12-12 08:08:05 +0100430 h2c->rcvd_c = H2_INITIAL_WINDOW_INCREMENT;
Willy Tarreau32218eb2017-09-22 08:07:25 +0200431 h2c->rcvd_s = 0;
Willy Tarreau49745612017-12-03 18:56:02 +0100432 h2c->nb_streams = 0;
Willy Tarreau7ac60e82018-07-19 09:04:05 +0200433 h2c->nb_cs = 0;
Willy Tarreau32218eb2017-09-22 08:07:25 +0200434
Willy Tarreauc9fa0482018-07-10 17:43:27 +0200435 h2c->dbuf = BUF_NULL;
Willy Tarreau32218eb2017-09-22 08:07:25 +0200436 h2c->dsi = -1;
437 h2c->msi = -1;
438 h2c->last_sid = -1;
439
Willy Tarreauc9fa0482018-07-10 17:43:27 +0200440 h2c->mbuf = BUF_NULL;
Willy Tarreau32218eb2017-09-22 08:07:25 +0200441 h2c->miw = 65535; /* mux initial window size */
442 h2c->mws = 65535; /* mux window size */
443 h2c->mfs = 16384; /* initial max frame size */
Willy Tarreau751f2d02018-10-05 09:35:00 +0200444 h2c->streams_by_id = EB_ROOT;
Willy Tarreau32218eb2017-09-22 08:07:25 +0200445 LIST_INIT(&h2c->send_list);
446 LIST_INIT(&h2c->fctl_list);
Olivier Houchardd846c262018-10-19 17:24:29 +0200447 LIST_INIT(&h2c->sending_list);
Willy Tarreau44e973f2018-03-01 17:49:30 +0100448 LIST_INIT(&h2c->buf_wait.list);
Willy Tarreau32218eb2017-09-22 08:07:25 +0200449
Willy Tarreau3f133572017-10-31 19:21:06 +0100450 if (t)
451 task_queue(t);
Willy Tarreauea392822017-10-31 10:02:25 +0100452
Willy Tarreau01b44822018-10-03 14:26:37 +0200453 if (h2c->flags & H2_CF_IS_BACK) {
454 /* FIXME: this is temporary, for outgoing connections we need
455 * to immediately allocate a stream until the code is modified
456 * so that the caller calls ->attach(). For now the outgoing cs
457 * is stored as conn->mux_ctx by the caller.
458 */
459 struct h2s *h2s;
460
Olivier Houchardf502aca2018-12-14 19:42:40 +0100461 h2s = h2c_bck_stream_new(h2c, conn->mux_ctx, sess);
Willy Tarreau01b44822018-10-03 14:26:37 +0200462 if (!h2s)
463 goto fail_stream;
464 }
465
466 conn->mux_ctx = h2c;
467
Willy Tarreau0f383582018-10-03 14:22:21 +0200468 /* prepare to read something */
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200469 tasklet_wakeup(h2c->wait_event.task);
Willy Tarreau32218eb2017-09-22 08:07:25 +0200470 return 0;
Willy Tarreau01b44822018-10-03 14:26:37 +0200471 fail_stream:
472 hpack_dht_free(h2c->ddht);
mildiscd2d7de2018-10-02 16:44:18 +0200473 fail:
Willy Tarreauea392822017-10-31 10:02:25 +0100474 if (t)
475 task_free(t);
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200476 if (h2c->wait_event.task)
477 tasklet_free(h2c->wait_event.task);
Willy Tarreaubafbe012017-11-24 17:34:44 +0100478 pool_free(pool_head_h2c, h2c);
mildiscd2d7de2018-10-02 16:44:18 +0200479 fail_no_h2c:
Willy Tarreau32218eb2017-09-22 08:07:25 +0200480 return -1;
481}
482
Willy Tarreau751f2d02018-10-05 09:35:00 +0200483/* returns the next allocatable outgoing stream ID for the H2 connection, or
484 * -1 if no more is allocatable.
485 */
486static inline int32_t h2c_get_next_sid(const struct h2c *h2c)
487{
488 int32_t id = (h2c->max_id + 1) | 1;
489 if (id & 0x80000000U)
490 id = -1;
491 return id;
492}
493
Willy Tarreau2373acc2017-10-12 17:35:14 +0200494/* returns the stream associated with id <id> or NULL if not found */
495static inline struct h2s *h2c_st_by_id(struct h2c *h2c, int id)
496{
497 struct eb32_node *node;
498
Willy Tarreau751f2d02018-10-05 09:35:00 +0200499 if (id == 0)
500 return (struct h2s *)h2_closed_stream;
501
Willy Tarreau2a856182017-05-16 15:20:39 +0200502 if (id > h2c->max_id)
503 return (struct h2s *)h2_idle_stream;
504
Willy Tarreau2373acc2017-10-12 17:35:14 +0200505 node = eb32_lookup(&h2c->streams_by_id, id);
506 if (!node)
Willy Tarreau2a856182017-05-16 15:20:39 +0200507 return (struct h2s *)h2_closed_stream;
Willy Tarreau2373acc2017-10-12 17:35:14 +0200508
509 return container_of(node, struct h2s, by_id);
510}
511
/* release function for a connection. This one should be called to free all
 * resources allocated to the mux. It releases the h2c attached to <conn> (if
 * any) and everything it owns, then detaches the mux from the connection,
 * closes the connection and frees it. <conn> must not be used after this call.
 */
static void h2_release(struct connection *conn)
{
	struct h2c *h2c = conn->mux_ctx;

	LIST_DEL(&conn->list);

	if (h2c) {
		hpack_dht_free(h2c->ddht);

		/* leave the buffer wait queue before releasing our buffers */
		HA_SPIN_LOCK(BUF_WQ_LOCK, &buffer_wq_lock);
		LIST_DEL(&h2c->buf_wait.list);
		HA_SPIN_UNLOCK(BUF_WQ_LOCK, &buffer_wq_lock);

		h2_release_buf(h2c, &h2c->dbuf);
		h2_release_buf(h2c, &h2c->mbuf);

		if (h2c->task) {
			/* the timeout task is not freed here: its context is
			 * cleared and it is woken up, presumably so that it
			 * releases itself -- see h2_timeout_task().
			 */
			h2c->task->context = NULL;
			task_wakeup(h2c->task, TASK_WOKEN_OTHER);
			h2c->task = NULL;
		}
		if (h2c->wait_event.task)
			tasklet_free(h2c->wait_event.task);
		/* still subscribed to some I/O events: cancel the subscription */
		if (h2c->wait_event.wait_reason != 0)
			conn->xprt->unsubscribe(conn, h2c->wait_event.wait_reason,
			                        &h2c->wait_event);

		pool_free(pool_head_h2c, h2c);
	}

	conn->mux = NULL;
	conn->mux_ctx = NULL;

	conn_stop_tracking(conn);
	conn_full_close(conn);
	if (conn->destroy_cb)
		conn->destroy_cb(conn);
	conn_free(conn);
}
554
555
Willy Tarreau71681172017-10-23 14:39:06 +0200556/******************************************************/
557/* functions below are for the H2 protocol processing */
558/******************************************************/
559
560/* returns the stream if of stream <h2s> or 0 if <h2s> is NULL */
Willy Tarreau1f094672017-11-20 21:27:45 +0100561static inline __maybe_unused int h2s_id(const struct h2s *h2s)
Willy Tarreau71681172017-10-23 14:39:06 +0200562{
563 return h2s ? h2s->id : 0;
564}
565
Willy Tarreau5b5e6872017-09-25 16:17:25 +0200566/* returns true of the mux is currently busy as seen from stream <h2s> */
Willy Tarreau1f094672017-11-20 21:27:45 +0100567static inline __maybe_unused int h2c_mux_busy(const struct h2c *h2c, const struct h2s *h2s)
Willy Tarreau5b5e6872017-09-25 16:17:25 +0200568{
569 if (h2c->msi < 0)
570 return 0;
571
572 if (h2c->msi == h2s_id(h2s))
573 return 0;
574
575 return 1;
576}
577
Willy Tarreau741d6df2017-10-17 08:00:59 +0200578/* marks an error on the connection */
Willy Tarreau1f094672017-11-20 21:27:45 +0100579static inline __maybe_unused void h2c_error(struct h2c *h2c, enum h2_err err)
Willy Tarreau741d6df2017-10-17 08:00:59 +0200580{
581 h2c->errcode = err;
582 h2c->st0 = H2_CS_ERROR;
583}
584
Willy Tarreau2e43f082017-10-17 08:03:59 +0200585/* marks an error on the stream */
Willy Tarreau1f094672017-11-20 21:27:45 +0100586static inline __maybe_unused void h2s_error(struct h2s *h2s, enum h2_err err)
Willy Tarreau2e43f082017-10-17 08:03:59 +0200587{
Willy Tarreauab0e1da2018-10-05 10:16:37 +0200588 if (h2s->id && h2s->st < H2_SS_ERROR) {
Willy Tarreau2e43f082017-10-17 08:03:59 +0200589 h2s->errcode = err;
590 h2s->st = H2_SS_ERROR;
591 if (h2s->cs)
592 h2s->cs->flags |= CS_FL_ERROR;
593 }
594}
595
Willy Tarreaue4820742017-07-27 13:37:23 +0200596/* writes the 24-bit frame size <len> at address <frame> */
Willy Tarreau1f094672017-11-20 21:27:45 +0100597static inline __maybe_unused void h2_set_frame_size(void *frame, uint32_t len)
Willy Tarreaue4820742017-07-27 13:37:23 +0200598{
599 uint8_t *out = frame;
600
601 *out = len >> 16;
602 write_n16(out + 1, len);
603}
604
Willy Tarreau54c15062017-10-10 17:10:03 +0200605/* reads <bytes> bytes from buffer <b> starting at relative offset <o> from the
606 * current pointer, dealing with wrapping, and stores the result in <dst>. It's
607 * the caller's responsibility to verify that there are at least <bytes> bytes
Willy Tarreau9c7f2d12018-06-15 11:51:32 +0200608 * available in the buffer's input prior to calling this function. The buffer
609 * is assumed not to hold any output data.
Willy Tarreau54c15062017-10-10 17:10:03 +0200610 */
Willy Tarreau1f094672017-11-20 21:27:45 +0100611static inline __maybe_unused void h2_get_buf_bytes(void *dst, size_t bytes,
Willy Tarreau54c15062017-10-10 17:10:03 +0200612 const struct buffer *b, int o)
613{
Willy Tarreau591d4452018-06-15 17:21:00 +0200614 readv_bytes(dst, bytes, b_peek(b, o), b_wrap(b) - b_peek(b, o), b_orig(b));
Willy Tarreau54c15062017-10-10 17:10:03 +0200615}
616
Willy Tarreau1f094672017-11-20 21:27:45 +0100617static inline __maybe_unused uint16_t h2_get_n16(const struct buffer *b, int o)
Willy Tarreau54c15062017-10-10 17:10:03 +0200618{
Willy Tarreau591d4452018-06-15 17:21:00 +0200619 return readv_n16(b_peek(b, o), b_wrap(b) - b_peek(b, o), b_orig(b));
Willy Tarreau54c15062017-10-10 17:10:03 +0200620}
621
Willy Tarreau1f094672017-11-20 21:27:45 +0100622static inline __maybe_unused uint32_t h2_get_n32(const struct buffer *b, int o)
Willy Tarreau54c15062017-10-10 17:10:03 +0200623{
Willy Tarreau591d4452018-06-15 17:21:00 +0200624 return readv_n32(b_peek(b, o), b_wrap(b) - b_peek(b, o), b_orig(b));
Willy Tarreau54c15062017-10-10 17:10:03 +0200625}
626
Willy Tarreau1f094672017-11-20 21:27:45 +0100627static inline __maybe_unused uint64_t h2_get_n64(const struct buffer *b, int o)
Willy Tarreau54c15062017-10-10 17:10:03 +0200628{
Willy Tarreau591d4452018-06-15 17:21:00 +0200629 return readv_n64(b_peek(b, o), b_wrap(b) - b_peek(b, o), b_orig(b));
Willy Tarreau54c15062017-10-10 17:10:03 +0200630}
631
632
Willy Tarreau715d5312017-07-11 15:20:24 +0200633/* Peeks an H2 frame header from buffer <b> into descriptor <h>. The algorithm
634 * is not obvious. It turns out that H2 headers are neither aligned nor do they
635 * use regular sizes. And to add to the trouble, the buffer may wrap so each
636 * byte read must be checked. The header is formed like this :
637 *
638 * b0 b1 b2 b3 b4 b5..b8
639 * +----------+---------+--------+----+----+----------------------+
640 * |len[23:16]|len[15:8]|len[7:0]|type|flag|sid[31:0] (big endian)|
641 * +----------+---------+--------+----+----+----------------------+
642 *
643 * Here we read a big-endian 64 bit word from h[1]. This way in a single read
644 * we get the sid properly aligned and ordered, and 16 bits of len properly
645 * ordered as well. The type and flags can be extracted using bit shifts from
646 * the word, and only one extra read is needed to fetch len[16:23].
Willy Tarreau9c7f2d12018-06-15 11:51:32 +0200647 * Returns zero if some bytes are missing, otherwise non-zero on success. The
648 * buffer is assumed not to contain any output data.
Willy Tarreau715d5312017-07-11 15:20:24 +0200649 */
Willy Tarreau1f094672017-11-20 21:27:45 +0100650static __maybe_unused int h2_peek_frame_hdr(const struct buffer *b, struct h2_fh *h)
Willy Tarreau715d5312017-07-11 15:20:24 +0200651{
652 uint64_t w;
653
Willy Tarreaub7b5fe12018-06-18 13:33:09 +0200654 if (b_data(b) < 9)
Willy Tarreau715d5312017-07-11 15:20:24 +0200655 return 0;
656
Willy Tarreau9c7f2d12018-06-15 11:51:32 +0200657 w = h2_get_n64(b, 1);
Willy Tarreaub7b5fe12018-06-18 13:33:09 +0200658 h->len = *(uint8_t*)b_head(b) << 16;
Willy Tarreau715d5312017-07-11 15:20:24 +0200659 h->sid = w & 0x7FFFFFFF; /* RFC7540#4.1: R bit must be ignored */
660 h->ff = w >> 32;
661 h->ft = w >> 40;
662 h->len += w >> 48;
663 return 1;
664}
665
666/* skip the next 9 bytes corresponding to the frame header possibly parsed by
667 * h2_peek_frame_hdr() above.
668 */
Willy Tarreau1f094672017-11-20 21:27:45 +0100669static inline __maybe_unused void h2_skip_frame_hdr(struct buffer *b)
Willy Tarreau715d5312017-07-11 15:20:24 +0200670{
Willy Tarreaue5f12ce2018-06-15 10:28:05 +0200671 b_del(b, 9);
Willy Tarreau715d5312017-07-11 15:20:24 +0200672}
673
674/* same as above, automatically advances the buffer on success */
Willy Tarreau1f094672017-11-20 21:27:45 +0100675static inline __maybe_unused int h2_get_frame_hdr(struct buffer *b, struct h2_fh *h)
Willy Tarreau715d5312017-07-11 15:20:24 +0200676{
677 int ret;
678
679 ret = h2_peek_frame_hdr(b, h);
680 if (ret > 0)
681 h2_skip_frame_hdr(b);
682 return ret;
683}
684
Willy Tarreau00dd0782018-03-01 16:31:34 +0100685/* marks stream <h2s> as CLOSED and decrement the number of active streams for
686 * its connection if the stream was not yet closed. Please use this exclusively
687 * before closing a stream to ensure stream count is well maintained.
Willy Tarreau91bfdd72017-12-14 12:00:14 +0100688 */
Willy Tarreau00dd0782018-03-01 16:31:34 +0100689static inline void h2s_close(struct h2s *h2s)
Willy Tarreau91bfdd72017-12-14 12:00:14 +0100690{
691 if (h2s->st != H2_SS_CLOSED)
692 h2s->h2c->nb_streams--;
693 h2s->st = H2_SS_CLOSED;
694}
695
Willy Tarreau71049cc2018-03-28 13:56:39 +0200696/* detaches an H2 stream from its H2C and releases it to the H2S pool. */
697static void h2s_destroy(struct h2s *h2s)
Willy Tarreau0a10de62018-03-01 16:27:53 +0100698{
699 h2s_close(h2s);
700 eb32_delete(&h2s->by_id);
Olivier Houchard638b7992018-08-16 15:41:52 +0200701 if (b_size(&h2s->rxbuf)) {
702 b_free(&h2s->rxbuf);
703 offer_buffers(NULL, tasks_run_queue);
704 }
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200705 if (h2s->send_wait != NULL)
706 h2s->send_wait->wait_reason &= ~SUB_CAN_SEND;
707 if (h2s->recv_wait != NULL)
708 h2s->recv_wait->wait_reason &= ~SUB_CAN_RECV;
Joseph Herlantd77575d2018-11-25 10:54:45 -0800709 /* There's no need to explicitly call unsubscribe here, the only
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200710 * reference left would be in the h2c send_list/fctl_list, and if
711 * we're in it, we're getting out anyway
712 */
713 LIST_DEL(&h2s->list);
714 LIST_INIT(&h2s->list);
715 tasklet_free(h2s->wait_event.task);
Willy Tarreau0a10de62018-03-01 16:27:53 +0100716 pool_free(pool_head_h2s, h2s);
717}
718
Willy Tarreaua8e49542018-10-03 18:53:55 +0200719/* allocates a new stream <id> for connection <h2c> and adds it into h2c's
720 * stream tree. In case of error, nothing is added and NULL is returned. The
721 * causes of errors can be any failed memory allocation. The caller is
722 * responsible for checking if the connection may support an extra stream
723 * prior to calling this function.
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200724 */
Willy Tarreaua8e49542018-10-03 18:53:55 +0200725static struct h2s *h2s_new(struct h2c *h2c, int id)
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200726{
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200727 struct h2s *h2s;
728
Willy Tarreaubafbe012017-11-24 17:34:44 +0100729 h2s = pool_alloc(pool_head_h2s);
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200730 if (!h2s)
731 goto out;
732
Olivier Houchardfa8aa862018-10-10 18:25:41 +0200733 h2s->wait_event.task = tasklet_new();
734 if (!h2s->wait_event.task) {
735 pool_free(pool_head_h2s, h2s);
736 goto out;
737 }
738 h2s->send_wait = NULL;
739 h2s->recv_wait = NULL;
740 h2s->wait_event.task->process = h2_deferred_shut;
741 h2s->wait_event.task->context = h2s;
742 h2s->wait_event.handle = NULL;
743 h2s->wait_event.wait_reason = 0;
744 LIST_INIT(&h2s->list);
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200745 h2s->h2c = h2c;
Willy Tarreaua8e49542018-10-03 18:53:55 +0200746 h2s->cs = NULL;
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200747 h2s->mws = h2c->miw;
748 h2s->flags = H2_SF_NONE;
749 h2s->errcode = H2_ERR_NO_ERROR;
750 h2s->st = H2_SS_IDLE;
Willy Tarreau9c5e22e2018-09-11 19:22:14 +0200751 h2s->status = 0;
Olivier Houchard638b7992018-08-16 15:41:52 +0200752 h2s->rxbuf = BUF_NULL;
Willy Tarreau751f2d02018-10-05 09:35:00 +0200753
754 if (h2c->flags & H2_CF_IS_BACK) {
755 h1m_init_req(&h2s->h1m);
756 h2s->h1m.err_pos = -1; // don't care about errors on the request path
757 h2s->h1m.flags |= H1_MF_TOLOWER;
758 } else {
759 h1m_init_res(&h2s->h1m);
760 h2s->h1m.err_pos = -1; // don't care about errors on the response path
761 h2s->h1m.flags |= H1_MF_TOLOWER;
762 }
763
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200764 h2s->by_id.key = h2s->id = id;
Willy Tarreau751f2d02018-10-05 09:35:00 +0200765 if (id > 0)
766 h2c->max_id = id;
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200767
768 eb32_insert(&h2c->streams_by_id, &h2s->by_id);
Willy Tarreau49745612017-12-03 18:56:02 +0100769 h2c->nb_streams++;
Willy Tarreaua8e49542018-10-03 18:53:55 +0200770
771 return h2s;
772
773 out_free_h2s:
774 pool_free(pool_head_h2s, h2s);
775 out:
776 return NULL;
777}
778
779/* creates a new stream <id> on the h2c connection and returns it, or NULL in
780 * case of memory allocation error.
781 */
782static struct h2s *h2c_frt_stream_new(struct h2c *h2c, int id)
783{
784 struct session *sess = h2c->conn->owner;
785 struct conn_stream *cs;
786 struct h2s *h2s;
787
788 if (h2c->nb_streams >= h2_settings_max_concurrent_streams)
789 goto out;
790
791 h2s = h2s_new(h2c, id);
792 if (!h2s)
793 goto out;
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200794
795 cs = cs_new(h2c->conn);
796 if (!cs)
797 goto out_close;
798
Olivier Houchard746fb772018-12-15 19:42:00 +0100799 cs->flags |= CS_FL_NOT_FIRST;
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200800 h2s->cs = cs;
801 cs->ctx = h2s;
Willy Tarreau7ac60e82018-07-19 09:04:05 +0200802 h2c->nb_cs++;
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200803
804 if (stream_create_from_cs(cs) < 0)
805 goto out_free_cs;
806
Willy Tarreau590a0512018-09-05 11:56:48 +0200807 /* We want the accept date presented to the next stream to be the one
808 * we have now, the handshake time to be null (since the next stream
809 * is not delayed by a handshake), and the idle time to count since
810 * right now.
811 */
812 sess->accept_date = date;
813 sess->tv_accept = now;
814 sess->t_handshake = 0;
815
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200816 /* OK done, the stream lives its own life now */
Willy Tarreauf2101912018-07-19 10:11:38 +0200817 if (h2_has_too_many_cs(h2c))
818 h2c->flags |= H2_CF_DEM_TOOMANY;
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200819 return h2s;
820
821 out_free_cs:
Willy Tarreau7ac60e82018-07-19 09:04:05 +0200822 h2c->nb_cs--;
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200823 cs_free(cs);
824 out_close:
Willy Tarreau71049cc2018-03-28 13:56:39 +0200825 h2s_destroy(h2s);
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200826 out:
Willy Tarreau45efc072018-10-03 18:27:52 +0200827 sess_log(sess);
828 return NULL;
Willy Tarreau3ccf4b22017-10-13 19:07:26 +0200829}
830
Willy Tarreau751f2d02018-10-05 09:35:00 +0200831/* allocates a new stream associated to conn_stream <cs> on the h2c connection
832 * and returns it, or NULL in case of memory allocation error or if the highest
833 * possible stream ID was reached.
834 */
Olivier Houchardf502aca2018-12-14 19:42:40 +0100835static struct h2s *h2c_bck_stream_new(struct h2c *h2c, struct conn_stream *cs, struct session *sess)
Willy Tarreau751f2d02018-10-05 09:35:00 +0200836{
837 struct h2s *h2s = NULL;
838
839 if (h2c->nb_streams >= h2_settings_max_concurrent_streams)
840 goto out;
841
842 /* Defer choosing the ID until we send the first message to create the stream */
843 h2s = h2s_new(h2c, 0);
844 if (!h2s)
845 goto out;
846
847 h2s->cs = cs;
Olivier Houchardf502aca2018-12-14 19:42:40 +0100848 h2s->sess = sess;
Willy Tarreau751f2d02018-10-05 09:35:00 +0200849 cs->ctx = h2s;
850 h2c->nb_cs++;
851
Willy Tarreau751f2d02018-10-05 09:35:00 +0200852 out:
853 return h2s;
854}
855
Willy Tarreaube5b7152017-09-25 16:25:39 +0200856/* try to send a settings frame on the connection. Returns > 0 on success, 0 if
857 * it couldn't do anything. It may return an error in h2c. See RFC7540#11.3 for
858 * the various settings codes.
859 */
Willy Tarreau7f0cc492018-10-08 07:13:08 +0200860static int h2c_send_settings(struct h2c *h2c)
Willy Tarreaube5b7152017-09-25 16:25:39 +0200861{
862 struct buffer *res;
863 char buf_data[100]; // enough for 15 settings
Willy Tarreau83061a82018-07-13 11:56:34 +0200864 struct buffer buf;
Willy Tarreaube5b7152017-09-25 16:25:39 +0200865 int ret;
866
867 if (h2c_mux_busy(h2c, NULL)) {
868 h2c->flags |= H2_CF_DEM_MBUSY;
869 return 0;
870 }
871
Willy Tarreau44e973f2018-03-01 17:49:30 +0100872 res = h2_get_buf(h2c, &h2c->mbuf);
Willy Tarreaube5b7152017-09-25 16:25:39 +0200873 if (!res) {
874 h2c->flags |= H2_CF_MUX_MALLOC;
875 h2c->flags |= H2_CF_DEM_MROOM;
876 return 0;
877 }
878
879 chunk_init(&buf, buf_data, sizeof(buf_data));
880 chunk_memcpy(&buf,
881 "\x00\x00\x00" /* length : 0 for now */
882 "\x04\x00" /* type : 4 (settings), flags : 0 */
883 "\x00\x00\x00\x00", /* stream ID : 0 */
884 9);
885
886 if (h2_settings_header_table_size != 4096) {
887 char str[6] = "\x00\x01"; /* header_table_size */
888
889 write_n32(str + 2, h2_settings_header_table_size);
890 chunk_memcat(&buf, str, 6);
891 }
892
893 if (h2_settings_initial_window_size != 65535) {
894 char str[6] = "\x00\x04"; /* initial_window_size */
895
896 write_n32(str + 2, h2_settings_initial_window_size);
897 chunk_memcat(&buf, str, 6);
898 }
899
900 if (h2_settings_max_concurrent_streams != 0) {
901 char str[6] = "\x00\x03"; /* max_concurrent_streams */
902
903 /* Note: 0 means "unlimited" for haproxy's config but not for
904 * the protocol, so never send this value!
905 */
906 write_n32(str + 2, h2_settings_max_concurrent_streams);
907 chunk_memcat(&buf, str, 6);
908 }
909
910 if (global.tune.bufsize != 16384) {
911 char str[6] = "\x00\x05"; /* max_frame_size */
912
913 /* note: similarly we could also emit MAX_HEADER_LIST_SIZE to
914 * match bufsize - rewrite size, but at the moment it seems
915 * that clients don't take care of it.
916 */
917 write_n32(str + 2, global.tune.bufsize);
918 chunk_memcat(&buf, str, 6);
919 }
920
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200921 h2_set_frame_size(buf.area, buf.data - 9);
922 ret = b_istput(res, ist2(buf.area, buf.data));
Willy Tarreaube5b7152017-09-25 16:25:39 +0200923 if (unlikely(ret <= 0)) {
924 if (!ret) {
925 h2c->flags |= H2_CF_MUX_MFULL;
926 h2c->flags |= H2_CF_DEM_MROOM;
927 return 0;
928 }
929 else {
930 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
931 return 0;
932 }
933 }
934 return ret;
935}
936
Willy Tarreau52eed752017-09-22 15:05:09 +0200937/* Try to receive a connection preface, then upon success try to send our
938 * preface which is a SETTINGS frame. Returns > 0 on success or zero on
939 * missing data. It may return an error in h2c.
940 */
941static int h2c_frt_recv_preface(struct h2c *h2c)
942{
943 int ret1;
Willy Tarreaube5b7152017-09-25 16:25:39 +0200944 int ret2;
Willy Tarreau52eed752017-09-22 15:05:09 +0200945
Willy Tarreauc9fa0482018-07-10 17:43:27 +0200946 ret1 = b_isteq(&h2c->dbuf, 0, b_data(&h2c->dbuf), ist(H2_CONN_PREFACE));
Willy Tarreau52eed752017-09-22 15:05:09 +0200947
948 if (unlikely(ret1 <= 0)) {
Willy Tarreau22de8d32018-09-05 19:55:58 +0200949 if (ret1 < 0)
950 sess_log(h2c->conn->owner);
951
Willy Tarreau52eed752017-09-22 15:05:09 +0200952 if (ret1 < 0 || conn_xprt_read0_pending(h2c->conn))
953 h2c_error(h2c, H2_ERR_PROTOCOL_ERROR);
954 return 0;
955 }
956
Willy Tarreau7f0cc492018-10-08 07:13:08 +0200957 ret2 = h2c_send_settings(h2c);
Willy Tarreaube5b7152017-09-25 16:25:39 +0200958 if (ret2 > 0)
Willy Tarreauc9fa0482018-07-10 17:43:27 +0200959 b_del(&h2c->dbuf, ret1);
Willy Tarreau52eed752017-09-22 15:05:09 +0200960
Willy Tarreaube5b7152017-09-25 16:25:39 +0200961 return ret2;
Willy Tarreau52eed752017-09-22 15:05:09 +0200962}
963
Willy Tarreau01b44822018-10-03 14:26:37 +0200964/* Try to send a connection preface, then upon success try to send our
965 * preface which is a SETTINGS frame. Returns > 0 on success or zero on
966 * missing data. It may return an error in h2c.
967 */
968static int h2c_bck_send_preface(struct h2c *h2c)
969{
970 struct buffer *res;
971
972 if (h2c_mux_busy(h2c, NULL)) {
973 h2c->flags |= H2_CF_DEM_MBUSY;
974 return 0;
975 }
976
977 res = h2_get_buf(h2c, &h2c->mbuf);
978 if (!res) {
979 h2c->flags |= H2_CF_MUX_MALLOC;
980 h2c->flags |= H2_CF_DEM_MROOM;
981 return 0;
982 }
983
984 if (!b_data(res)) {
985 /* preface not yet sent */
986 b_istput(res, ist(H2_CONN_PREFACE));
987 }
988
989 return h2c_send_settings(h2c);
990}
991
Willy Tarreau081d4722017-05-16 21:51:05 +0200992/* try to send a GOAWAY frame on the connection to report an error or a graceful
993 * shutdown, with h2c->errcode as the error code. Returns > 0 on success or zero
994 * if nothing was done. It uses h2c->last_sid as the advertised ID, or copies it
995 * from h2c->max_id if it's not set yet (<0). In case of lack of room to write
996 * the message, it subscribes the requester (either <h2s> or <h2c>) to future
997 * notifications. It sets H2_CF_GOAWAY_SENT on success, and H2_CF_GOAWAY_FAILED
998 * on unrecoverable failure. It will not attempt to send one again in this last
999 * case so that it is safe to use h2c_error() to report such errors.
1000 */
1001static int h2c_send_goaway_error(struct h2c *h2c, struct h2s *h2s)
1002{
1003 struct buffer *res;
1004 char str[17];
1005 int ret;
1006
1007 if (h2c->flags & H2_CF_GOAWAY_FAILED)
1008 return 1; // claim that it worked
1009
1010 if (h2c_mux_busy(h2c, h2s)) {
1011 if (h2s)
1012 h2s->flags |= H2_SF_BLK_MBUSY;
1013 else
1014 h2c->flags |= H2_CF_DEM_MBUSY;
1015 return 0;
1016 }
1017
Willy Tarreau44e973f2018-03-01 17:49:30 +01001018 res = h2_get_buf(h2c, &h2c->mbuf);
Willy Tarreau081d4722017-05-16 21:51:05 +02001019 if (!res) {
1020 h2c->flags |= H2_CF_MUX_MALLOC;
1021 if (h2s)
1022 h2s->flags |= H2_SF_BLK_MROOM;
1023 else
1024 h2c->flags |= H2_CF_DEM_MROOM;
1025 return 0;
1026 }
1027
1028 /* len: 8, type: 7, flags: none, sid: 0 */
1029 memcpy(str, "\x00\x00\x08\x07\x00\x00\x00\x00\x00", 9);
1030
1031 if (h2c->last_sid < 0)
1032 h2c->last_sid = h2c->max_id;
1033
1034 write_n32(str + 9, h2c->last_sid);
1035 write_n32(str + 13, h2c->errcode);
Willy Tarreauea1b06d2018-07-12 09:02:47 +02001036 ret = b_istput(res, ist2(str, 17));
Willy Tarreau081d4722017-05-16 21:51:05 +02001037 if (unlikely(ret <= 0)) {
1038 if (!ret) {
1039 h2c->flags |= H2_CF_MUX_MFULL;
1040 if (h2s)
1041 h2s->flags |= H2_SF_BLK_MROOM;
1042 else
1043 h2c->flags |= H2_CF_DEM_MROOM;
1044 return 0;
1045 }
1046 else {
1047 /* we cannot report this error using GOAWAY, so we mark
1048 * it and claim a success.
1049 */
1050 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
1051 h2c->flags |= H2_CF_GOAWAY_FAILED;
1052 return 1;
1053 }
1054 }
1055 h2c->flags |= H2_CF_GOAWAY_SENT;
1056 return ret;
1057}
1058
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001059/* Try to send an RST_STREAM frame on the connection for the indicated stream
1060 * during mux operations. This stream must be valid and cannot be closed
1061 * already. h2s->id will be used for the stream ID and h2s->errcode will be
1062 * used for the error code. h2s->st will be update to H2_SS_CLOSED if it was
1063 * not yet.
1064 *
1065 * Returns > 0 on success or zero if nothing was done. In case of lack of room
1066 * to write the message, it subscribes the stream to future notifications.
1067 */
1068static int h2s_send_rst_stream(struct h2c *h2c, struct h2s *h2s)
1069{
1070 struct buffer *res;
1071 char str[13];
1072 int ret;
1073
1074 if (!h2s || h2s->st == H2_SS_CLOSED)
1075 return 1;
1076
Willy Tarreau8adae7c2018-03-22 17:37:05 +01001077 /* RFC7540#5.4.2: To avoid looping, an endpoint MUST NOT send a
1078 * RST_STREAM in response to a RST_STREAM frame.
1079 */
1080 if (h2c->dft == H2_FT_RST_STREAM) {
1081 ret = 1;
1082 goto ignore;
1083 }
1084
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001085 if (h2c_mux_busy(h2c, h2s)) {
1086 h2s->flags |= H2_SF_BLK_MBUSY;
1087 return 0;
1088 }
1089
Willy Tarreau44e973f2018-03-01 17:49:30 +01001090 res = h2_get_buf(h2c, &h2c->mbuf);
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001091 if (!res) {
1092 h2c->flags |= H2_CF_MUX_MALLOC;
1093 h2s->flags |= H2_SF_BLK_MROOM;
1094 return 0;
1095 }
1096
1097 /* len: 4, type: 3, flags: none */
1098 memcpy(str, "\x00\x00\x04\x03\x00", 5);
1099 write_n32(str + 5, h2s->id);
1100 write_n32(str + 9, h2s->errcode);
Willy Tarreauea1b06d2018-07-12 09:02:47 +02001101 ret = b_istput(res, ist2(str, 13));
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001102
1103 if (unlikely(ret <= 0)) {
1104 if (!ret) {
1105 h2c->flags |= H2_CF_MUX_MFULL;
1106 h2s->flags |= H2_SF_BLK_MROOM;
1107 return 0;
1108 }
1109 else {
1110 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
1111 return 0;
1112 }
1113 }
1114
Willy Tarreau8adae7c2018-03-22 17:37:05 +01001115 ignore:
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001116 h2s->flags |= H2_SF_RST_SENT;
Willy Tarreau00dd0782018-03-01 16:31:34 +01001117 h2s_close(h2s);
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001118 return ret;
1119}
1120
1121/* Try to send an RST_STREAM frame on the connection for the stream being
1122 * demuxed using h2c->dsi for the stream ID. It will use h2s->errcode as the
1123 * error code unless the stream's state already is IDLE or CLOSED in which
1124 * case STREAM_CLOSED will be used, and will update h2s->st to H2_SS_CLOSED if
1125 * it was not yet.
1126 *
1127 * Returns > 0 on success or zero if nothing was done. In case of lack of room
1128 * to write the message, it blocks the demuxer and subscribes it to future
Joseph Herlantd77575d2018-11-25 10:54:45 -08001129 * notifications. It's worth mentioning that an RST may even be sent for a
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001130 * closed stream.
Willy Tarreau27a84c92017-10-17 08:10:17 +02001131 */
1132static int h2c_send_rst_stream(struct h2c *h2c, struct h2s *h2s)
1133{
1134 struct buffer *res;
1135 char str[13];
1136 int ret;
1137
Willy Tarreau8adae7c2018-03-22 17:37:05 +01001138 /* RFC7540#5.4.2: To avoid looping, an endpoint MUST NOT send a
1139 * RST_STREAM in response to a RST_STREAM frame.
1140 */
1141 if (h2c->dft == H2_FT_RST_STREAM) {
1142 ret = 1;
1143 goto ignore;
1144 }
1145
Willy Tarreau27a84c92017-10-17 08:10:17 +02001146 if (h2c_mux_busy(h2c, h2s)) {
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001147 h2c->flags |= H2_CF_DEM_MBUSY;
Willy Tarreau27a84c92017-10-17 08:10:17 +02001148 return 0;
1149 }
1150
Willy Tarreau44e973f2018-03-01 17:49:30 +01001151 res = h2_get_buf(h2c, &h2c->mbuf);
Willy Tarreau27a84c92017-10-17 08:10:17 +02001152 if (!res) {
1153 h2c->flags |= H2_CF_MUX_MALLOC;
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001154 h2c->flags |= H2_CF_DEM_MROOM;
Willy Tarreau27a84c92017-10-17 08:10:17 +02001155 return 0;
1156 }
1157
1158 /* len: 4, type: 3, flags: none */
1159 memcpy(str, "\x00\x00\x04\x03\x00", 5);
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001160
Willy Tarreau27a84c92017-10-17 08:10:17 +02001161 write_n32(str + 5, h2c->dsi);
Willy Tarreauab0e1da2018-10-05 10:16:37 +02001162 write_n32(str + 9, h2s->id ? h2s->errcode : H2_ERR_STREAM_CLOSED);
Willy Tarreauea1b06d2018-07-12 09:02:47 +02001163 ret = b_istput(res, ist2(str, 13));
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001164
Willy Tarreau27a84c92017-10-17 08:10:17 +02001165 if (unlikely(ret <= 0)) {
1166 if (!ret) {
1167 h2c->flags |= H2_CF_MUX_MFULL;
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001168 h2c->flags |= H2_CF_DEM_MROOM;
Willy Tarreau27a84c92017-10-17 08:10:17 +02001169 return 0;
1170 }
1171 else {
1172 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
1173 return 0;
1174 }
1175 }
1176
Willy Tarreau8adae7c2018-03-22 17:37:05 +01001177 ignore:
Willy Tarreauab0e1da2018-10-05 10:16:37 +02001178 if (h2s->id) {
Willy Tarreau27a84c92017-10-17 08:10:17 +02001179 h2s->flags |= H2_SF_RST_SENT;
Willy Tarreau00dd0782018-03-01 16:31:34 +01001180 h2s_close(h2s);
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01001181 }
1182
Willy Tarreau27a84c92017-10-17 08:10:17 +02001183 return ret;
1184}
1185
Willy Tarreauc7576ea2017-10-29 22:00:09 +01001186/* try to send an empty DATA frame with the ES flag set to notify about the
1187 * end of stream and match a shutdown(write). If an ES was already sent as
1188 * indicated by HLOC/ERROR/RESET/CLOSED states, nothing is done. Returns > 0
1189 * on success or zero if nothing was done. In case of lack of room to write the
1190 * message, it subscribes the requesting stream to future notifications.
1191 */
1192static int h2_send_empty_data_es(struct h2s *h2s)
1193{
1194 struct h2c *h2c = h2s->h2c;
1195 struct buffer *res;
1196 char str[9];
1197 int ret;
1198
Willy Tarreau721c9742017-11-07 11:05:42 +01001199 if (h2s->st == H2_SS_HLOC || h2s->st == H2_SS_ERROR || h2s->st == H2_SS_CLOSED)
Willy Tarreauc7576ea2017-10-29 22:00:09 +01001200 return 1;
1201
1202 if (h2c_mux_busy(h2c, h2s)) {
1203 h2s->flags |= H2_SF_BLK_MBUSY;
1204 return 0;
1205 }
1206
Willy Tarreau44e973f2018-03-01 17:49:30 +01001207 res = h2_get_buf(h2c, &h2c->mbuf);
Willy Tarreauc7576ea2017-10-29 22:00:09 +01001208 if (!res) {
1209 h2c->flags |= H2_CF_MUX_MALLOC;
1210 h2s->flags |= H2_SF_BLK_MROOM;
1211 return 0;
1212 }
1213
1214 /* len: 0x000000, type: 0(DATA), flags: ES=1 */
1215 memcpy(str, "\x00\x00\x00\x00\x01", 5);
1216 write_n32(str + 5, h2s->id);
Willy Tarreauea1b06d2018-07-12 09:02:47 +02001217 ret = b_istput(res, ist2(str, 9));
Willy Tarreau6d8b6822017-11-07 14:39:09 +01001218 if (likely(ret > 0)) {
1219 h2s->flags |= H2_SF_ES_SENT;
1220 }
1221 else if (!ret) {
1222 h2c->flags |= H2_CF_MUX_MFULL;
1223 h2s->flags |= H2_SF_BLK_MROOM;
1224 return 0;
1225 }
1226 else {
1227 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
1228 return 0;
Willy Tarreauc7576ea2017-10-29 22:00:09 +01001229 }
1230 return ret;
1231}
1232
Willy Tarreau23b92aa2017-10-30 00:26:54 +01001233/* wake the streams attached to the connection, whose id is greater than <last>,
1234 * and assign their conn_stream the CS_FL_* flags <flags> in addition to
Willy Tarreau2c096c32018-09-12 09:45:54 +02001235 * CS_FL_ERROR in case of error and CS_FL_REOS in case of closed connection.
1236 * The stream's state is automatically updated accordingly.
Willy Tarreau23b92aa2017-10-30 00:26:54 +01001237 */
1238static void h2_wake_some_streams(struct h2c *h2c, int last, uint32_t flags)
1239{
1240 struct eb32_node *node;
1241 struct h2s *h2s;
1242
1243 if (h2c->st0 >= H2_CS_ERROR || h2c->conn->flags & CO_FL_ERROR)
1244 flags |= CS_FL_ERROR;
1245
1246 if (conn_xprt_read0_pending(h2c->conn))
Willy Tarreau2c096c32018-09-12 09:45:54 +02001247 flags |= CS_FL_REOS;
Willy Tarreau23b92aa2017-10-30 00:26:54 +01001248
1249 node = eb32_lookup_ge(&h2c->streams_by_id, last + 1);
1250 while (node) {
1251 h2s = container_of(node, struct h2s, by_id);
1252 if (h2s->id <= last)
1253 break;
1254 node = eb32_next(node);
Willy Tarreau22cf59b2017-11-10 11:42:33 +01001255
1256 if (!h2s->cs) {
1257 /* this stream was already orphaned */
Willy Tarreau71049cc2018-03-28 13:56:39 +02001258 h2s_destroy(h2s);
Willy Tarreau22cf59b2017-11-10 11:42:33 +01001259 continue;
Willy Tarreau23b92aa2017-10-30 00:26:54 +01001260 }
Willy Tarreau22cf59b2017-11-10 11:42:33 +01001261
1262 h2s->cs->flags |= flags;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02001263 if (h2s->recv_wait) {
1264 struct wait_event *sw = h2s->recv_wait;
Olivier Houchardc2aa7112018-09-11 18:27:21 +02001265 sw->wait_reason &= ~SUB_CAN_RECV;
1266 tasklet_wakeup(sw->task);
Olivier Houchardfa8aa862018-10-10 18:25:41 +02001267 h2s->recv_wait = NULL;
Olivier Houchard21df6cc2018-09-14 23:21:44 +02001268 } else if (h2s->cs->data_cb->wake != NULL)
1269 h2s->cs->data_cb->wake(h2s->cs);
Willy Tarreau22cf59b2017-11-10 11:42:33 +01001270
Willy Tarreau23b92aa2017-10-30 00:26:54 +01001271 if (flags & CS_FL_ERROR && h2s->st < H2_SS_ERROR)
1272 h2s->st = H2_SS_ERROR;
Willy Tarreau2c096c32018-09-12 09:45:54 +02001273 else if (flags & CS_FL_REOS && h2s->st == H2_SS_OPEN)
Willy Tarreau23b92aa2017-10-30 00:26:54 +01001274 h2s->st = H2_SS_HREM;
Willy Tarreau2c096c32018-09-12 09:45:54 +02001275 else if (flags & CS_FL_REOS && h2s->st == H2_SS_HLOC)
Willy Tarreau00dd0782018-03-01 16:31:34 +01001276 h2s_close(h2s);
Willy Tarreau23b92aa2017-10-30 00:26:54 +01001277 }
1278}
1279
Willy Tarreau3421aba2017-07-27 15:41:03 +02001280/* Increase all streams' outgoing window size by the difference passed in
1281 * argument. This is needed upon receipt of the settings frame if the initial
1282 * window size is different. The difference may be negative and the resulting
1283 * window size as well, for the time it takes to receive some window updates.
1284 */
1285static void h2c_update_all_ws(struct h2c *h2c, int diff)
1286{
1287 struct h2s *h2s;
1288 struct eb32_node *node;
1289
1290 if (!diff)
1291 return;
1292
1293 node = eb32_first(&h2c->streams_by_id);
1294 while (node) {
1295 h2s = container_of(node, struct h2s, by_id);
1296 h2s->mws += diff;
1297 node = eb32_next(node);
1298 }
1299}
1300
1301/* processes a SETTINGS frame whose payload is <payload> for <plen> bytes, and
1302 * ACKs it if needed. Returns > 0 on success or zero on missing data. It may
1303 * return an error in h2c. Described in RFC7540#6.5.
1304 */
1305static int h2c_handle_settings(struct h2c *h2c)
1306{
1307 unsigned int offset;
1308 int error;
1309
1310 if (h2c->dff & H2_F_SETTINGS_ACK) {
1311 if (h2c->dfl) {
1312 error = H2_ERR_FRAME_SIZE_ERROR;
1313 goto fail;
1314 }
1315 return 1;
1316 }
1317
1318 if (h2c->dsi != 0) {
1319 error = H2_ERR_PROTOCOL_ERROR;
1320 goto fail;
1321 }
1322
1323 if (h2c->dfl % 6) {
1324 error = H2_ERR_FRAME_SIZE_ERROR;
1325 goto fail;
1326 }
1327
1328 /* that's the limit we can process */
1329 if (h2c->dfl > global.tune.bufsize) {
1330 error = H2_ERR_FRAME_SIZE_ERROR;
1331 goto fail;
1332 }
1333
1334 /* process full frame only */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001335 if (b_data(&h2c->dbuf) < h2c->dfl)
Willy Tarreau3421aba2017-07-27 15:41:03 +02001336 return 0;
1337
1338 /* parse the frame */
1339 for (offset = 0; offset < h2c->dfl; offset += 6) {
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001340 uint16_t type = h2_get_n16(&h2c->dbuf, offset);
1341 int32_t arg = h2_get_n32(&h2c->dbuf, offset + 2);
Willy Tarreau3421aba2017-07-27 15:41:03 +02001342
1343 switch (type) {
1344 case H2_SETTINGS_INITIAL_WINDOW_SIZE:
1345 /* we need to update all existing streams with the
1346 * difference from the previous iws.
1347 */
1348 if (arg < 0) { // RFC7540#6.5.2
1349 error = H2_ERR_FLOW_CONTROL_ERROR;
1350 goto fail;
1351 }
1352 h2c_update_all_ws(h2c, arg - h2c->miw);
1353 h2c->miw = arg;
1354 break;
1355 case H2_SETTINGS_MAX_FRAME_SIZE:
1356 if (arg < 16384 || arg > 16777215) { // RFC7540#6.5.2
1357 error = H2_ERR_PROTOCOL_ERROR;
1358 goto fail;
1359 }
1360 h2c->mfs = arg;
1361 break;
Willy Tarreau1b38b462017-12-03 19:02:28 +01001362 case H2_SETTINGS_ENABLE_PUSH:
1363 if (arg < 0 || arg > 1) { // RFC7540#6.5.2
1364 error = H2_ERR_PROTOCOL_ERROR;
1365 goto fail;
1366 }
1367 break;
Willy Tarreau3421aba2017-07-27 15:41:03 +02001368 }
1369 }
1370
1371 /* need to ACK this frame now */
1372 h2c->st0 = H2_CS_FRAME_A;
1373 return 1;
1374 fail:
Willy Tarreau22de8d32018-09-05 19:55:58 +02001375 sess_log(h2c->conn->owner);
Willy Tarreau3421aba2017-07-27 15:41:03 +02001376 h2c_error(h2c, error);
1377 return 0;
1378}
1379
1380/* try to send an ACK for a settings frame on the connection. Returns > 0 on
1381 * success or one of the h2_status values.
1382 */
1383static int h2c_ack_settings(struct h2c *h2c)
1384{
1385 struct buffer *res;
1386 char str[9];
1387 int ret = -1;
1388
1389 if (h2c_mux_busy(h2c, NULL)) {
1390 h2c->flags |= H2_CF_DEM_MBUSY;
1391 return 0;
1392 }
1393
Willy Tarreau44e973f2018-03-01 17:49:30 +01001394 res = h2_get_buf(h2c, &h2c->mbuf);
Willy Tarreau3421aba2017-07-27 15:41:03 +02001395 if (!res) {
1396 h2c->flags |= H2_CF_MUX_MALLOC;
1397 h2c->flags |= H2_CF_DEM_MROOM;
1398 return 0;
1399 }
1400
1401 memcpy(str,
1402 "\x00\x00\x00" /* length : 0 (no data) */
1403 "\x04" "\x01" /* type : 4, flags : ACK */
1404 "\x00\x00\x00\x00" /* stream ID */, 9);
1405
Willy Tarreauea1b06d2018-07-12 09:02:47 +02001406 ret = b_istput(res, ist2(str, 9));
Willy Tarreau3421aba2017-07-27 15:41:03 +02001407 if (unlikely(ret <= 0)) {
1408 if (!ret) {
1409 h2c->flags |= H2_CF_MUX_MFULL;
1410 h2c->flags |= H2_CF_DEM_MROOM;
1411 return 0;
1412 }
1413 else {
1414 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
1415 return 0;
1416 }
1417 }
1418 return ret;
1419}
1420
Willy Tarreaucf68c782017-10-10 17:11:41 +02001421/* processes a PING frame and schedules an ACK if needed. The caller must pass
1422 * the pointer to the payload in <payload>. Returns > 0 on success or zero on
1423 * missing data. It may return an error in h2c.
1424 */
1425static int h2c_handle_ping(struct h2c *h2c)
1426{
1427 /* frame length must be exactly 8 */
1428 if (h2c->dfl != 8) {
1429 h2c_error(h2c, H2_ERR_FRAME_SIZE_ERROR);
1430 return 0;
1431 }
1432
1433 /* schedule a response */
Willy Tarreau68ed6412017-12-03 18:15:56 +01001434 if (!(h2c->dff & H2_F_PING_ACK))
Willy Tarreaucf68c782017-10-10 17:11:41 +02001435 h2c->st0 = H2_CS_FRAME_A;
1436 return 1;
1437}
1438
Willy Tarreaucc0b8c32017-10-26 16:55:59 +02001439/* Try to send a window update for stream id <sid> and value <increment>.
1440 * Returns > 0 on success or zero on missing room or failure. It may return an
1441 * error in h2c.
1442 */
1443static int h2c_send_window_update(struct h2c *h2c, int sid, uint32_t increment)
1444{
1445 struct buffer *res;
1446 char str[13];
1447 int ret = -1;
1448
1449 if (h2c_mux_busy(h2c, NULL)) {
1450 h2c->flags |= H2_CF_DEM_MBUSY;
1451 return 0;
1452 }
1453
Willy Tarreau44e973f2018-03-01 17:49:30 +01001454 res = h2_get_buf(h2c, &h2c->mbuf);
Willy Tarreaucc0b8c32017-10-26 16:55:59 +02001455 if (!res) {
1456 h2c->flags |= H2_CF_MUX_MALLOC;
1457 h2c->flags |= H2_CF_DEM_MROOM;
1458 return 0;
1459 }
1460
1461 /* length: 4, type: 8, flags: none */
1462 memcpy(str, "\x00\x00\x04\x08\x00", 5);
1463 write_n32(str + 5, sid);
1464 write_n32(str + 9, increment);
1465
Willy Tarreauea1b06d2018-07-12 09:02:47 +02001466 ret = b_istput(res, ist2(str, 13));
Willy Tarreaucc0b8c32017-10-26 16:55:59 +02001467
1468 if (unlikely(ret <= 0)) {
1469 if (!ret) {
1470 h2c->flags |= H2_CF_MUX_MFULL;
1471 h2c->flags |= H2_CF_DEM_MROOM;
1472 return 0;
1473 }
1474 else {
1475 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
1476 return 0;
1477 }
1478 }
1479 return ret;
1480}
1481
1482/* try to send pending window update for the connection. It's safe to call it
1483 * with no pending updates. Returns > 0 on success or zero on missing room or
1484 * failure. It may return an error in h2c.
1485 */
1486static int h2c_send_conn_wu(struct h2c *h2c)
1487{
1488 int ret = 1;
1489
1490 if (h2c->rcvd_c <= 0)
1491 return 1;
1492
1493 /* send WU for the connection */
1494 ret = h2c_send_window_update(h2c, 0, h2c->rcvd_c);
1495 if (ret > 0)
1496 h2c->rcvd_c = 0;
1497
1498 return ret;
1499}
1500
1501/* try to send pending window update for the current dmux stream. It's safe to
1502 * call it with no pending updates. Returns > 0 on success or zero on missing
1503 * room or failure. It may return an error in h2c.
1504 */
1505static int h2c_send_strm_wu(struct h2c *h2c)
1506{
1507 int ret = 1;
1508
1509 if (h2c->rcvd_s <= 0)
1510 return 1;
1511
1512 /* send WU for the stream */
1513 ret = h2c_send_window_update(h2c, h2c->dsi, h2c->rcvd_s);
1514 if (ret > 0)
1515 h2c->rcvd_s = 0;
1516
1517 return ret;
1518}
1519
Willy Tarreaucf68c782017-10-10 17:11:41 +02001520/* try to send an ACK for a ping frame on the connection. Returns > 0 on
1521 * success, 0 on missing data or one of the h2_status values.
1522 */
1523static int h2c_ack_ping(struct h2c *h2c)
1524{
1525 struct buffer *res;
1526 char str[17];
1527 int ret = -1;
1528
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001529 if (b_data(&h2c->dbuf) < 8)
Willy Tarreaucf68c782017-10-10 17:11:41 +02001530 return 0;
1531
1532 if (h2c_mux_busy(h2c, NULL)) {
1533 h2c->flags |= H2_CF_DEM_MBUSY;
1534 return 0;
1535 }
1536
Willy Tarreau44e973f2018-03-01 17:49:30 +01001537 res = h2_get_buf(h2c, &h2c->mbuf);
Willy Tarreaucf68c782017-10-10 17:11:41 +02001538 if (!res) {
1539 h2c->flags |= H2_CF_MUX_MALLOC;
1540 h2c->flags |= H2_CF_DEM_MROOM;
1541 return 0;
1542 }
1543
1544 memcpy(str,
1545 "\x00\x00\x08" /* length : 8 (same payload) */
1546 "\x06" "\x01" /* type : 6, flags : ACK */
1547 "\x00\x00\x00\x00" /* stream ID */, 9);
1548
1549 /* copy the original payload */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001550 h2_get_buf_bytes(str + 9, 8, &h2c->dbuf, 0);
Willy Tarreaucf68c782017-10-10 17:11:41 +02001551
Willy Tarreauea1b06d2018-07-12 09:02:47 +02001552 ret = b_istput(res, ist2(str, 17));
Willy Tarreaucf68c782017-10-10 17:11:41 +02001553 if (unlikely(ret <= 0)) {
1554 if (!ret) {
1555 h2c->flags |= H2_CF_MUX_MFULL;
1556 h2c->flags |= H2_CF_DEM_MROOM;
1557 return 0;
1558 }
1559 else {
1560 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
1561 return 0;
1562 }
1563 }
1564 return ret;
1565}
1566
Willy Tarreau26f95952017-07-27 17:18:30 +02001567/* processes a WINDOW_UPDATE frame whose payload is <payload> for <plen> bytes.
1568 * Returns > 0 on success or zero on missing data. It may return an error in
1569 * h2c or h2s. Described in RFC7540#6.9.
1570 */
1571static int h2c_handle_window_update(struct h2c *h2c, struct h2s *h2s)
1572{
1573 int32_t inc;
1574 int error;
1575
1576 if (h2c->dfl != 4) {
1577 error = H2_ERR_FRAME_SIZE_ERROR;
1578 goto conn_err;
1579 }
1580
1581 /* process full frame only */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001582 if (b_data(&h2c->dbuf) < h2c->dfl)
Willy Tarreau26f95952017-07-27 17:18:30 +02001583 return 0;
1584
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001585 inc = h2_get_n32(&h2c->dbuf, 0);
Willy Tarreau26f95952017-07-27 17:18:30 +02001586
1587 if (h2c->dsi != 0) {
1588 /* stream window update */
Willy Tarreau26f95952017-07-27 17:18:30 +02001589
1590 /* it's not an error to receive WU on a closed stream */
1591 if (h2s->st == H2_SS_CLOSED)
1592 return 1;
1593
1594 if (!inc) {
1595 error = H2_ERR_PROTOCOL_ERROR;
1596 goto strm_err;
1597 }
1598
1599 if (h2s->mws >= 0 && h2s->mws + inc < 0) {
1600 error = H2_ERR_FLOW_CONTROL_ERROR;
1601 goto strm_err;
1602 }
1603
1604 h2s->mws += inc;
1605 if (h2s->mws > 0 && (h2s->flags & H2_SF_BLK_SFCTL)) {
1606 h2s->flags &= ~H2_SF_BLK_SFCTL;
Olivier Houcharddddfe312018-10-10 18:51:00 +02001607 if (h2s->send_wait)
1608 LIST_ADDQ(&h2c->send_list, &h2s->list);
1609
Willy Tarreau26f95952017-07-27 17:18:30 +02001610 }
1611 }
1612 else {
1613 /* connection window update */
1614 if (!inc) {
1615 error = H2_ERR_PROTOCOL_ERROR;
1616 goto conn_err;
1617 }
1618
1619 if (h2c->mws >= 0 && h2c->mws + inc < 0) {
1620 error = H2_ERR_FLOW_CONTROL_ERROR;
1621 goto conn_err;
1622 }
1623
1624 h2c->mws += inc;
1625 }
1626
1627 return 1;
1628
1629 conn_err:
1630 h2c_error(h2c, error);
1631 return 0;
1632
1633 strm_err:
1634 if (h2s) {
1635 h2s_error(h2s, error);
Willy Tarreaua20a5192017-12-27 11:02:06 +01001636 h2c->st0 = H2_CS_FRAME_E;
Willy Tarreau26f95952017-07-27 17:18:30 +02001637 }
1638 else
1639 h2c_error(h2c, error);
1640 return 0;
1641}
1642
Willy Tarreaue96b0922017-10-30 00:28:29 +01001643/* processes a GOAWAY frame, and signals all streams whose ID is greater than
1644 * the last ID. Returns > 0 on success or zero on missing data. It may return
1645 * an error in h2c. Described in RFC7540#6.8.
1646 */
1647static int h2c_handle_goaway(struct h2c *h2c)
1648{
1649 int error;
1650 int last;
1651
1652 if (h2c->dsi != 0) {
1653 error = H2_ERR_PROTOCOL_ERROR;
1654 goto conn_err;
1655 }
1656
1657 if (h2c->dfl < 8) {
1658 error = H2_ERR_FRAME_SIZE_ERROR;
1659 goto conn_err;
1660 }
1661
1662 /* process full frame only */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001663 if (b_data(&h2c->dbuf) < h2c->dfl)
Willy Tarreaue96b0922017-10-30 00:28:29 +01001664 return 0;
1665
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001666 last = h2_get_n32(&h2c->dbuf, 0);
1667 h2c->errcode = h2_get_n32(&h2c->dbuf, 4);
Willy Tarreaue96b0922017-10-30 00:28:29 +01001668 h2_wake_some_streams(h2c, last, CS_FL_ERROR);
Willy Tarreau11cc2d62017-12-03 10:27:47 +01001669 if (h2c->last_sid < 0)
1670 h2c->last_sid = last;
Willy Tarreaue96b0922017-10-30 00:28:29 +01001671 return 1;
1672
1673 conn_err:
1674 h2c_error(h2c, error);
1675 return 0;
1676}
1677
Willy Tarreau92153fc2017-12-03 19:46:19 +01001678/* processes a PRIORITY frame, and either skips it or rejects if it is
1679 * invalid. Returns > 0 on success or zero on missing data. It may return
1680 * an error in h2c. Described in RFC7540#6.3.
1681 */
1682static int h2c_handle_priority(struct h2c *h2c)
1683{
1684 int error;
1685
1686 if (h2c->dsi == 0) {
1687 error = H2_ERR_PROTOCOL_ERROR;
1688 goto conn_err;
1689 }
1690
1691 if (h2c->dfl != 5) {
1692 error = H2_ERR_FRAME_SIZE_ERROR;
1693 goto conn_err;
1694 }
1695
1696 /* process full frame only */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001697 if (b_data(&h2c->dbuf) < h2c->dfl)
Willy Tarreau92153fc2017-12-03 19:46:19 +01001698 return 0;
1699
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001700 if (h2_get_n32(&h2c->dbuf, 0) == h2c->dsi) {
Willy Tarreau92153fc2017-12-03 19:46:19 +01001701 /* 7540#5.3 : can't depend on itself */
1702 error = H2_ERR_PROTOCOL_ERROR;
1703 goto conn_err;
1704 }
1705 return 1;
1706
1707 conn_err:
1708 h2c_error(h2c, error);
1709 return 0;
1710}
1711
Willy Tarreaucd234e92017-08-18 10:59:39 +02001712/* processes an RST_STREAM frame, and sets the 32-bit error code on the stream.
1713 * Returns > 0 on success or zero on missing data. It may return an error in
1714 * h2c. Described in RFC7540#6.4.
1715 */
1716static int h2c_handle_rst_stream(struct h2c *h2c, struct h2s *h2s)
1717{
1718 int error;
1719
1720 if (h2c->dsi == 0) {
1721 error = H2_ERR_PROTOCOL_ERROR;
1722 goto conn_err;
1723 }
1724
Willy Tarreaucd234e92017-08-18 10:59:39 +02001725 if (h2c->dfl != 4) {
1726 error = H2_ERR_FRAME_SIZE_ERROR;
1727 goto conn_err;
1728 }
1729
1730 /* process full frame only */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001731 if (b_data(&h2c->dbuf) < h2c->dfl)
Willy Tarreaucd234e92017-08-18 10:59:39 +02001732 return 0;
1733
1734 /* late RST, already handled */
1735 if (h2s->st == H2_SS_CLOSED)
1736 return 1;
1737
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001738 h2s->errcode = h2_get_n32(&h2c->dbuf, 0);
Willy Tarreau00dd0782018-03-01 16:31:34 +01001739 h2s_close(h2s);
Willy Tarreaucd234e92017-08-18 10:59:39 +02001740
1741 if (h2s->cs) {
Willy Tarreau7ecb6f12018-12-18 16:39:21 +01001742 if (h2s->cs->flags & CS_FL_EOS)
1743 h2s->cs->flags |= CS_FL_ERROR;
1744 else
1745 h2s->cs->flags |= CS_FL_REOS | CS_FL_ERR_PENDING;
1746
Olivier Houchardfa8aa862018-10-10 18:25:41 +02001747 if (h2s->recv_wait) {
1748 struct wait_event *sw = h2s->recv_wait;
Olivier Houchardc2aa7112018-09-11 18:27:21 +02001749
1750 sw->wait_reason &= ~SUB_CAN_RECV;
1751 tasklet_wakeup(sw->task);
Olivier Houchardfa8aa862018-10-10 18:25:41 +02001752 h2s->recv_wait = NULL;
Olivier Houchardc2aa7112018-09-11 18:27:21 +02001753 }
Willy Tarreaucd234e92017-08-18 10:59:39 +02001754 }
1755
1756 h2s->flags |= H2_SF_RST_RCVD;
1757 return 1;
1758
1759 conn_err:
1760 h2c_error(h2c, error);
1761 return 0;
1762}
1763
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001764/* processes a HEADERS frame. Returns h2s on success or NULL on missing data.
1765 * It may return an error in h2c or h2s. The caller must consider that the
1766 * return value is the new h2s in case one was allocated (most common case).
1767 * Described in RFC7540#6.2. Most of the
Willy Tarreau13278b42017-10-13 19:23:14 +02001768 * errors here are reported as connection errors since it's impossible to
1769 * recover from such errors after the compression context has been altered.
1770 */
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001771static struct h2s *h2c_frt_handle_headers(struct h2c *h2c, struct h2s *h2s)
Willy Tarreau13278b42017-10-13 19:23:14 +02001772{
1773 int error;
1774
1775 if (!h2c->dfl) {
1776 error = H2_ERR_PROTOCOL_ERROR; // empty headers frame!
Willy Tarreau22de8d32018-09-05 19:55:58 +02001777 sess_log(h2c->conn->owner);
Willy Tarreau13278b42017-10-13 19:23:14 +02001778 goto strm_err;
1779 }
1780
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001781 if (!b_size(&h2c->dbuf))
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001782 return NULL; // empty buffer
Willy Tarreau13278b42017-10-13 19:23:14 +02001783
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001784 if (b_data(&h2c->dbuf) < h2c->dfl && !b_full(&h2c->dbuf))
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001785 return NULL; // incomplete frame
Willy Tarreau13278b42017-10-13 19:23:14 +02001786
Willy Tarreauf2101912018-07-19 10:11:38 +02001787 if (h2c->flags & H2_CF_DEM_TOOMANY)
1788 return 0; // too many cs still present
1789
Willy Tarreau13278b42017-10-13 19:23:14 +02001790 /* now either the frame is complete or the buffer is complete */
1791 if (h2s->st != H2_SS_IDLE) {
1792 /* FIXME: stream already exists, this is only allowed for
1793 * trailers (not supported for now).
1794 */
1795 error = H2_ERR_PROTOCOL_ERROR;
Willy Tarreau22de8d32018-09-05 19:55:58 +02001796 sess_log(h2c->conn->owner);
Willy Tarreau13278b42017-10-13 19:23:14 +02001797 goto conn_err;
1798 }
1799 else if (h2c->dsi <= h2c->max_id || !(h2c->dsi & 1)) {
1800 /* RFC7540#5.1.1 stream id > prev ones, and must be odd here */
1801 error = H2_ERR_PROTOCOL_ERROR;
Willy Tarreau22de8d32018-09-05 19:55:58 +02001802 sess_log(h2c->conn->owner);
Willy Tarreau13278b42017-10-13 19:23:14 +02001803 goto conn_err;
1804 }
1805
Willy Tarreau22de8d32018-09-05 19:55:58 +02001806 /* Note: we don't emit any other logs below because ff we return
Willy Tarreaua8e49542018-10-03 18:53:55 +02001807 * positively from h2c_frt_stream_new(), the stream will report the error,
1808 * and if we return in error, h2c_frt_stream_new() will emit the error.
Willy Tarreau22de8d32018-09-05 19:55:58 +02001809 */
Willy Tarreaua8e49542018-10-03 18:53:55 +02001810 h2s = h2c_frt_stream_new(h2c, h2c->dsi);
Willy Tarreau13278b42017-10-13 19:23:14 +02001811 if (!h2s) {
1812 error = H2_ERR_INTERNAL_ERROR;
1813 goto conn_err;
1814 }
1815
1816 h2s->st = H2_SS_OPEN;
1817 if (h2c->dff & H2_F_HEADERS_END_STREAM) {
1818 h2s->st = H2_SS_HREM;
1819 h2s->flags |= H2_SF_ES_RCVD;
Willy Tarreau39d68502018-03-02 12:26:37 +01001820 /* note: cs cannot be null for now (just created above) */
1821 h2s->cs->flags |= CS_FL_REOS;
Willy Tarreau13278b42017-10-13 19:23:14 +02001822 }
1823
Willy Tarreauc3e18f32018-10-08 14:51:56 +02001824 if (!h2s_decode_headers(h2s))
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001825 return NULL;
Willy Tarreau13278b42017-10-13 19:23:14 +02001826
Willy Tarreau8f650c32017-11-21 19:36:21 +01001827 if (h2c->st0 >= H2_CS_ERROR)
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001828 return NULL;
Willy Tarreau8f650c32017-11-21 19:36:21 +01001829
Willy Tarreau721c9742017-11-07 11:05:42 +01001830 if (h2s->st >= H2_SS_ERROR) {
Willy Tarreau13278b42017-10-13 19:23:14 +02001831 /* stream error : send RST_STREAM */
Willy Tarreaua20a5192017-12-27 11:02:06 +01001832 h2c->st0 = H2_CS_FRAME_E;
Willy Tarreau13278b42017-10-13 19:23:14 +02001833 }
1834 else {
1835 /* update the max stream ID if the request is being processed */
1836 if (h2s->id > h2c->max_id)
1837 h2c->max_id = h2s->id;
1838 }
1839
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001840 return h2s;
Willy Tarreau13278b42017-10-13 19:23:14 +02001841
1842 conn_err:
1843 h2c_error(h2c, error);
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001844 return NULL;
Willy Tarreau13278b42017-10-13 19:23:14 +02001845
1846 strm_err:
1847 if (h2s) {
1848 h2s_error(h2s, error);
Willy Tarreaua20a5192017-12-27 11:02:06 +01001849 h2c->st0 = H2_CS_FRAME_E;
Willy Tarreau13278b42017-10-13 19:23:14 +02001850 }
1851 else
1852 h2c_error(h2c, error);
Willy Tarreau2a761dc2018-02-26 18:50:57 +01001853 return NULL;
Willy Tarreau13278b42017-10-13 19:23:14 +02001854}
1855
Willy Tarreauc12f38f2018-10-08 14:53:27 +02001856/* processes a HEADERS frame. Returns h2s on success or NULL on missing data.
1857 * It may return an error in h2c or h2s. Described in RFC7540#6.2. Most of the
1858 * errors here are reported as connection errors since it's impossible to
1859 * recover from such errors after the compression context has been altered.
1860 */
1861static struct h2s *h2c_bck_handle_headers(struct h2c *h2c, struct h2s *h2s)
1862{
1863 int error;
1864
1865 if (!h2c->dfl) {
1866 error = H2_ERR_PROTOCOL_ERROR; // empty headers frame!
1867 sess_log(h2c->conn->owner);
1868 goto strm_err;
1869 }
1870
1871 if (!b_size(&h2c->dbuf))
1872 return NULL; // empty buffer
1873
1874 if (b_data(&h2c->dbuf) < h2c->dfl && !b_full(&h2c->dbuf))
1875 return NULL; // incomplete frame
1876
1877 if (h2c->flags & H2_CF_DEM_TOOMANY)
1878 return 0; // too many cs still present
1879
1880 if (h2c->dff & H2_F_HEADERS_END_STREAM) {
1881 h2s->flags |= H2_SF_ES_RCVD;
1882 h2s->cs->flags |= CS_FL_REOS;
1883 }
1884
1885 if (!h2s_decode_headers(h2s))
1886 return NULL;
1887
1888 if (h2c->st0 >= H2_CS_ERROR)
1889 return NULL;
1890
1891 if (h2s->st >= H2_SS_ERROR) {
1892 /* stream error : send RST_STREAM */
1893 h2c->st0 = H2_CS_FRAME_E;
1894 }
1895
1896 if (h2s->cs->flags & CS_FL_ERROR && h2s->st < H2_SS_ERROR)
1897 h2s->st = H2_SS_ERROR;
1898 else if (h2s->cs->flags & CS_FL_REOS && h2s->st == H2_SS_OPEN)
1899 h2s->st = H2_SS_HREM;
1900 else if (h2s->cs->flags & CS_FL_REOS && h2s->st == H2_SS_HLOC)
1901 h2s_close(h2s);
1902
1903 return h2s;
1904
1905 conn_err:
1906 h2c_error(h2c, error);
1907 return NULL;
1908
1909 strm_err:
1910 if (h2s) {
1911 h2s_error(h2s, error);
1912 h2c->st0 = H2_CS_FRAME_E;
1913 }
1914 else
1915 h2c_error(h2c, error);
1916 return NULL;
1917}
1918
Willy Tarreau454f9052017-10-26 19:40:35 +02001919/* processes a DATA frame. Returns > 0 on success or zero on missing data.
1920 * It may return an error in h2c or h2s. Described in RFC7540#6.1.
1921 */
1922static int h2c_frt_handle_data(struct h2c *h2c, struct h2s *h2s)
1923{
1924 int error;
1925
1926 /* note that empty DATA frames are perfectly valid and sometimes used
1927 * to signal an end of stream (with the ES flag).
1928 */
1929
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001930 if (!b_size(&h2c->dbuf) && h2c->dfl)
Willy Tarreau454f9052017-10-26 19:40:35 +02001931 return 0; // empty buffer
1932
Willy Tarreauc9fa0482018-07-10 17:43:27 +02001933 if (b_data(&h2c->dbuf) < h2c->dfl && !b_full(&h2c->dbuf))
Willy Tarreau454f9052017-10-26 19:40:35 +02001934 return 0; // incomplete frame
1935
1936 /* now either the frame is complete or the buffer is complete */
1937
1938 if (!h2c->dsi) {
1939 /* RFC7540#6.1 */
1940 error = H2_ERR_PROTOCOL_ERROR;
1941 goto conn_err;
1942 }
1943
1944 if (h2s->st != H2_SS_OPEN && h2s->st != H2_SS_HLOC) {
1945 /* RFC7540#6.1 */
1946 error = H2_ERR_STREAM_CLOSED;
1947 goto strm_err;
1948 }
1949
Willy Tarreaua56a6de2018-02-26 15:59:07 +01001950 if (!h2_frt_transfer_data(h2s))
1951 return 0;
1952
Willy Tarreau454f9052017-10-26 19:40:35 +02001953 /* call the upper layers to process the frame, then let the upper layer
1954 * notify the stream about any change.
1955 */
1956 if (!h2s->cs) {
1957 error = H2_ERR_STREAM_CLOSED;
1958 goto strm_err;
1959 }
1960
Willy Tarreau8f650c32017-11-21 19:36:21 +01001961 if (h2c->st0 >= H2_CS_ERROR)
1962 return 0;
1963
Willy Tarreau721c9742017-11-07 11:05:42 +01001964 if (h2s->st >= H2_SS_ERROR) {
Willy Tarreau454f9052017-10-26 19:40:35 +02001965 /* stream error : send RST_STREAM */
Willy Tarreaua20a5192017-12-27 11:02:06 +01001966 h2c->st0 = H2_CS_FRAME_E;
Willy Tarreau454f9052017-10-26 19:40:35 +02001967 }
1968
1969 /* check for completion : the callee will change this to FRAME_A or
1970 * FRAME_H once done.
1971 */
1972 if (h2c->st0 == H2_CS_FRAME_P)
1973 return 0;
1974
Willy Tarreauc4134ba2017-12-11 18:45:08 +01001975
1976 /* last frame */
1977 if (h2c->dff & H2_F_DATA_END_STREAM) {
1978 h2s->st = H2_SS_HREM;
1979 h2s->flags |= H2_SF_ES_RCVD;
Willy Tarreau39d68502018-03-02 12:26:37 +01001980 h2s->cs->flags |= CS_FL_REOS;
Willy Tarreauc4134ba2017-12-11 18:45:08 +01001981 }
1982
Willy Tarreau454f9052017-10-26 19:40:35 +02001983 return 1;
1984
1985 conn_err:
1986 h2c_error(h2c, error);
1987 return 0;
1988
1989 strm_err:
1990 if (h2s) {
1991 h2s_error(h2s, error);
Willy Tarreaua20a5192017-12-27 11:02:06 +01001992 h2c->st0 = H2_CS_FRAME_E;
Willy Tarreau454f9052017-10-26 19:40:35 +02001993 }
1994 else
1995 h2c_error(h2c, error);
1996 return 0;
1997}
1998
Willy Tarreaubc933932017-10-09 16:21:43 +02001999/* process Rx frames to be demultiplexed */
2000static void h2_process_demux(struct h2c *h2c)
2001{
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002002 struct h2s *h2s = NULL, *tmp_h2s;
Willy Tarreauf3ee0692017-10-17 08:18:25 +02002003
Willy Tarreau081d4722017-05-16 21:51:05 +02002004 if (h2c->st0 >= H2_CS_ERROR)
2005 return;
Willy Tarreau52eed752017-09-22 15:05:09 +02002006
2007 if (unlikely(h2c->st0 < H2_CS_FRAME_H)) {
2008 if (h2c->st0 == H2_CS_PREFACE) {
Willy Tarreau01b44822018-10-03 14:26:37 +02002009 if (h2c->flags & H2_CF_IS_BACK)
2010 return;
Willy Tarreau52eed752017-09-22 15:05:09 +02002011 if (unlikely(h2c_frt_recv_preface(h2c) <= 0)) {
2012 /* RFC7540#3.5: a GOAWAY frame MAY be omitted */
Willy Tarreau22de8d32018-09-05 19:55:58 +02002013 if (h2c->st0 == H2_CS_ERROR) {
Willy Tarreau52eed752017-09-22 15:05:09 +02002014 h2c->st0 = H2_CS_ERROR2;
Willy Tarreau22de8d32018-09-05 19:55:58 +02002015 sess_log(h2c->conn->owner);
2016 }
Willy Tarreau52eed752017-09-22 15:05:09 +02002017 goto fail;
2018 }
2019
2020 h2c->max_id = 0;
2021 h2c->st0 = H2_CS_SETTINGS1;
2022 }
Willy Tarreau4c3690b2017-10-10 15:16:55 +02002023
2024 if (h2c->st0 == H2_CS_SETTINGS1) {
2025 struct h2_fh hdr;
2026
2027 /* ensure that what is pending is a valid SETTINGS frame
2028 * without an ACK.
2029 */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002030 if (!h2_get_frame_hdr(&h2c->dbuf, &hdr)) {
Willy Tarreau4c3690b2017-10-10 15:16:55 +02002031 /* RFC7540#3.5: a GOAWAY frame MAY be omitted */
Willy Tarreau22de8d32018-09-05 19:55:58 +02002032 if (h2c->st0 == H2_CS_ERROR) {
Willy Tarreau4c3690b2017-10-10 15:16:55 +02002033 h2c->st0 = H2_CS_ERROR2;
Willy Tarreau22de8d32018-09-05 19:55:58 +02002034 sess_log(h2c->conn->owner);
2035 }
Willy Tarreau4c3690b2017-10-10 15:16:55 +02002036 goto fail;
2037 }
2038
2039 if (hdr.sid || hdr.ft != H2_FT_SETTINGS || hdr.ff & H2_F_SETTINGS_ACK) {
2040 /* RFC7540#3.5: a GOAWAY frame MAY be omitted */
2041 h2c_error(h2c, H2_ERR_PROTOCOL_ERROR);
2042 h2c->st0 = H2_CS_ERROR2;
Willy Tarreau22de8d32018-09-05 19:55:58 +02002043 sess_log(h2c->conn->owner);
Willy Tarreau4c3690b2017-10-10 15:16:55 +02002044 goto fail;
2045 }
2046
Willy Tarreau3f0e1ec2018-04-17 10:28:27 +02002047 if ((int)hdr.len < 0 || (int)hdr.len > global.tune.bufsize) {
Willy Tarreau4c3690b2017-10-10 15:16:55 +02002048 /* RFC7540#3.5: a GOAWAY frame MAY be omitted */
2049 h2c_error(h2c, H2_ERR_FRAME_SIZE_ERROR);
2050 h2c->st0 = H2_CS_ERROR2;
Willy Tarreau22de8d32018-09-05 19:55:58 +02002051 sess_log(h2c->conn->owner);
Willy Tarreau4c3690b2017-10-10 15:16:55 +02002052 goto fail;
2053 }
2054
2055 /* that's OK, switch to FRAME_P to process it */
2056 h2c->dfl = hdr.len;
2057 h2c->dsi = hdr.sid;
2058 h2c->dft = hdr.ft;
2059 h2c->dff = hdr.ff;
Willy Tarreau05e5daf2017-12-11 15:17:36 +01002060 h2c->dpl = 0;
Willy Tarreau4c3690b2017-10-10 15:16:55 +02002061 h2c->st0 = H2_CS_FRAME_P;
2062 }
Willy Tarreau52eed752017-09-22 15:05:09 +02002063 }
Willy Tarreau7e98c052017-10-10 15:56:59 +02002064
2065 /* process as many incoming frames as possible below */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002066 while (b_data(&h2c->dbuf)) {
Willy Tarreau7e98c052017-10-10 15:56:59 +02002067 int ret = 0;
2068
2069 if (h2c->st0 >= H2_CS_ERROR)
2070 break;
2071
2072 if (h2c->st0 == H2_CS_FRAME_H) {
2073 struct h2_fh hdr;
2074
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002075 if (!h2_peek_frame_hdr(&h2c->dbuf, &hdr))
Willy Tarreau7e98c052017-10-10 15:56:59 +02002076 break;
2077
Willy Tarreau3f0e1ec2018-04-17 10:28:27 +02002078 if ((int)hdr.len < 0 || (int)hdr.len > global.tune.bufsize) {
Willy Tarreau7e98c052017-10-10 15:56:59 +02002079 h2c_error(h2c, H2_ERR_FRAME_SIZE_ERROR);
2080 h2c->st0 = H2_CS_ERROR;
Willy Tarreau22de8d32018-09-05 19:55:58 +02002081 if (!h2c->nb_streams) {
2082 /* only log if no other stream can report the error */
2083 sess_log(h2c->conn->owner);
2084 }
Willy Tarreau7e98c052017-10-10 15:56:59 +02002085 break;
2086 }
2087
2088 h2c->dfl = hdr.len;
2089 h2c->dsi = hdr.sid;
2090 h2c->dft = hdr.ft;
2091 h2c->dff = hdr.ff;
Willy Tarreau05e5daf2017-12-11 15:17:36 +01002092 h2c->dpl = 0;
Willy Tarreau7e98c052017-10-10 15:56:59 +02002093 h2c->st0 = H2_CS_FRAME_P;
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002094 h2_skip_frame_hdr(&h2c->dbuf);
Willy Tarreau7e98c052017-10-10 15:56:59 +02002095 }
2096
2097 /* Only H2_CS_FRAME_P and H2_CS_FRAME_A here */
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002098 tmp_h2s = h2c_st_by_id(h2c, h2c->dsi);
2099
Olivier Houchard638b7992018-08-16 15:41:52 +02002100 if (tmp_h2s != h2s && h2s && h2s->cs && b_data(&h2s->rxbuf)) {
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002101 /* we may have to signal the upper layers */
2102 h2s->cs->flags |= CS_FL_RCV_MORE;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002103 if (h2s->recv_wait) {
2104 h2s->recv_wait->wait_reason &= ~SUB_CAN_RECV;
2105 tasklet_wakeup(h2s->recv_wait->task);
2106 h2s->recv_wait = NULL;
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002107 }
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002108 }
2109 h2s = tmp_h2s;
Willy Tarreau7e98c052017-10-10 15:56:59 +02002110
Willy Tarreaud7901432017-12-29 11:34:40 +01002111 if (h2c->st0 == H2_CS_FRAME_E)
2112 goto strm_err;
2113
Willy Tarreauf65b80d2017-10-30 11:46:49 +01002114 if (h2s->st == H2_SS_IDLE &&
2115 h2c->dft != H2_FT_HEADERS && h2c->dft != H2_FT_PRIORITY) {
2116 /* RFC7540#5.1: any frame other than HEADERS or PRIORITY in
2117 * this state MUST be treated as a connection error
2118 */
2119 h2c_error(h2c, H2_ERR_PROTOCOL_ERROR);
2120 h2c->st0 = H2_CS_ERROR;
Willy Tarreau22de8d32018-09-05 19:55:58 +02002121 if (!h2c->nb_streams) {
2122 /* only log if no other stream can report the error */
2123 sess_log(h2c->conn->owner);
2124 }
Willy Tarreauf65b80d2017-10-30 11:46:49 +01002125 break;
2126 }
2127
Willy Tarreauf182a9a2017-10-30 12:03:50 +01002128 if (h2s->st == H2_SS_HREM && h2c->dft != H2_FT_WINDOW_UPDATE &&
2129 h2c->dft != H2_FT_RST_STREAM && h2c->dft != H2_FT_PRIORITY) {
2130 /* RFC7540#5.1: any frame other than WU/PRIO/RST in
2131 * this state MUST be treated as a stream error
2132 */
2133 h2s_error(h2s, H2_ERR_STREAM_CLOSED);
2134 goto strm_err;
2135 }
2136
Willy Tarreauab837502017-12-27 15:07:30 +01002137 /* Below the management of frames received in closed state is a
2138 * bit hackish because the spec makes strong differences between
2139 * streams closed by receiving RST, sending RST, and seeing ES
2140 * in both directions. In addition to this, the creation of a
2141 * new stream reusing the identifier of a closed one will be
2142 * detected here. Given that we cannot keep track of all closed
2143 * streams forever, we consider that unknown closed streams were
2144 * closed on RST received, which allows us to respond with an
2145 * RST without breaking the connection (eg: to abort a transfer).
2146 * Some frames have to be silently ignored as well.
2147 */
2148 if (h2s->st == H2_SS_CLOSED && h2c->dsi) {
2149 if (h2c->dft == H2_FT_HEADERS || h2c->dft == H2_FT_PUSH_PROMISE) {
2150 /* #5.1.1: The identifier of a newly
2151 * established stream MUST be numerically
2152 * greater than all streams that the initiating
2153 * endpoint has opened or reserved. This
2154 * governs streams that are opened using a
2155 * HEADERS frame and streams that are reserved
2156 * using PUSH_PROMISE. An endpoint that
2157 * receives an unexpected stream identifier
2158 * MUST respond with a connection error.
2159 */
2160 h2c_error(h2c, H2_ERR_STREAM_CLOSED);
2161 goto strm_err;
2162 }
2163
2164 if (h2s->flags & H2_SF_RST_RCVD) {
2165 /* RFC7540#5.1:closed: an endpoint that
2166 * receives any frame other than PRIORITY after
2167 * receiving a RST_STREAM MUST treat that as a
2168 * stream error of type STREAM_CLOSED.
2169 *
2170 * Note that old streams fall into this category
2171 * and will lead to an RST being sent.
2172 */
2173 h2s_error(h2s, H2_ERR_STREAM_CLOSED);
2174 h2c->st0 = H2_CS_FRAME_E;
2175 goto strm_err;
2176 }
2177
2178 /* RFC7540#5.1:closed: if this state is reached as a
2179 * result of sending a RST_STREAM frame, the peer that
2180 * receives the RST_STREAM might have already sent
2181 * frames on the stream that cannot be withdrawn. An
2182 * endpoint MUST ignore frames that it receives on
2183 * closed streams after it has sent a RST_STREAM
2184 * frame. An endpoint MAY choose to limit the period
2185 * over which it ignores frames and treat frames that
2186 * arrive after this time as being in error.
2187 */
2188 if (!(h2s->flags & H2_SF_RST_SENT)) {
2189 /* RFC7540#5.1:closed: any frame other than
2190 * PRIO/WU/RST in this state MUST be treated as
2191 * a connection error
2192 */
2193 if (h2c->dft != H2_FT_RST_STREAM &&
2194 h2c->dft != H2_FT_PRIORITY &&
2195 h2c->dft != H2_FT_WINDOW_UPDATE) {
2196 h2c_error(h2c, H2_ERR_STREAM_CLOSED);
2197 goto strm_err;
2198 }
2199 }
2200 }
2201
Willy Tarreauc0da1962017-10-30 18:38:00 +01002202#if 0
2203 // problem below: it is not possible to completely ignore such
2204 // streams as we need to maintain the compression state as well
2205 // and for this we need to completely process these frames (eg:
2206 // HEADERS frames) as well as counting DATA frames to emit
2207 // proper WINDOW UPDATES and ensure the connection doesn't stall.
2208 // This is a typical case of layer violation where the
2209 // transported contents are critical to the connection's
2210 // validity and must be ignored at the same time :-(
2211
2212 /* graceful shutdown, ignore streams whose ID is higher than
2213 * the one advertised in GOAWAY. RFC7540#6.8.
2214 */
2215 if (unlikely(h2c->last_sid >= 0) && h2c->dsi > h2c->last_sid) {
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002216 ret = MIN(b_data(&h2c->dbuf), h2c->dfl);
2217 b_del(&h2c->dbuf, ret);
Willy Tarreauc0da1962017-10-30 18:38:00 +01002218 h2c->dfl -= ret;
2219 ret = h2c->dfl == 0;
2220 goto strm_err;
2221 }
2222#endif
2223
Willy Tarreau7e98c052017-10-10 15:56:59 +02002224 switch (h2c->dft) {
Willy Tarreau3421aba2017-07-27 15:41:03 +02002225 case H2_FT_SETTINGS:
2226 if (h2c->st0 == H2_CS_FRAME_P)
2227 ret = h2c_handle_settings(h2c);
2228
2229 if (h2c->st0 == H2_CS_FRAME_A)
2230 ret = h2c_ack_settings(h2c);
2231 break;
2232
Willy Tarreaucf68c782017-10-10 17:11:41 +02002233 case H2_FT_PING:
2234 if (h2c->st0 == H2_CS_FRAME_P)
2235 ret = h2c_handle_ping(h2c);
2236
2237 if (h2c->st0 == H2_CS_FRAME_A)
2238 ret = h2c_ack_ping(h2c);
2239 break;
2240
Willy Tarreau26f95952017-07-27 17:18:30 +02002241 case H2_FT_WINDOW_UPDATE:
2242 if (h2c->st0 == H2_CS_FRAME_P)
2243 ret = h2c_handle_window_update(h2c, h2s);
2244 break;
2245
Willy Tarreau61290ec2017-10-17 08:19:21 +02002246 case H2_FT_CONTINUATION:
2247 /* we currently don't support CONTINUATION frames since
2248 * we have nowhere to store the partial HEADERS frame.
2249 * Let's abort the stream on an INTERNAL_ERROR here.
2250 */
Willy Tarreaua20a5192017-12-27 11:02:06 +01002251 if (h2c->st0 == H2_CS_FRAME_P) {
Willy Tarreau61290ec2017-10-17 08:19:21 +02002252 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
Willy Tarreaua20a5192017-12-27 11:02:06 +01002253 h2c->st0 = H2_CS_FRAME_E;
2254 }
Willy Tarreau61290ec2017-10-17 08:19:21 +02002255 break;
2256
Willy Tarreau13278b42017-10-13 19:23:14 +02002257 case H2_FT_HEADERS:
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002258 if (h2c->st0 == H2_CS_FRAME_P) {
Willy Tarreauc12f38f2018-10-08 14:53:27 +02002259 if (h2c->flags & H2_CF_IS_BACK)
2260 tmp_h2s = h2c_bck_handle_headers(h2c, h2s);
2261 else
2262 tmp_h2s = h2c_frt_handle_headers(h2c, h2s);
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002263 if (tmp_h2s) {
2264 h2s = tmp_h2s;
2265 ret = 1;
2266 }
2267 }
Willy Tarreau13278b42017-10-13 19:23:14 +02002268 break;
2269
Willy Tarreau454f9052017-10-26 19:40:35 +02002270 case H2_FT_DATA:
2271 if (h2c->st0 == H2_CS_FRAME_P)
2272 ret = h2c_frt_handle_data(h2c, h2s);
2273
2274 if (h2c->st0 == H2_CS_FRAME_A)
2275 ret = h2c_send_strm_wu(h2c);
2276 break;
Willy Tarreaucd234e92017-08-18 10:59:39 +02002277
Willy Tarreau92153fc2017-12-03 19:46:19 +01002278 case H2_FT_PRIORITY:
2279 if (h2c->st0 == H2_CS_FRAME_P)
2280 ret = h2c_handle_priority(h2c);
2281 break;
2282
Willy Tarreaucd234e92017-08-18 10:59:39 +02002283 case H2_FT_RST_STREAM:
2284 if (h2c->st0 == H2_CS_FRAME_P)
2285 ret = h2c_handle_rst_stream(h2c, h2s);
2286 break;
2287
Willy Tarreaue96b0922017-10-30 00:28:29 +01002288 case H2_FT_GOAWAY:
2289 if (h2c->st0 == H2_CS_FRAME_P)
2290 ret = h2c_handle_goaway(h2c);
2291 break;
2292
Willy Tarreau1c661982017-10-30 13:52:01 +01002293 case H2_FT_PUSH_PROMISE:
2294 /* not permitted here, RFC7540#5.1 */
2295 h2c_error(h2c, H2_ERR_PROTOCOL_ERROR);
Willy Tarreau22de8d32018-09-05 19:55:58 +02002296 if (!h2c->nb_streams) {
2297 /* only log if no other stream can report the error */
2298 sess_log(h2c->conn->owner);
2299 }
Willy Tarreau1c661982017-10-30 13:52:01 +01002300 break;
2301
2302 /* implement all extra frame types here */
Willy Tarreau7e98c052017-10-10 15:56:59 +02002303 default:
2304 /* drop frames that we ignore. They may be larger than
2305 * the buffer so we drain all of their contents until
2306 * we reach the end.
2307 */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002308 ret = MIN(b_data(&h2c->dbuf), h2c->dfl);
2309 b_del(&h2c->dbuf, ret);
Willy Tarreau7e98c052017-10-10 15:56:59 +02002310 h2c->dfl -= ret;
2311 ret = h2c->dfl == 0;
2312 }
2313
Willy Tarreauf182a9a2017-10-30 12:03:50 +01002314 strm_err:
Willy Tarreaua20a5192017-12-27 11:02:06 +01002315 /* We may have to send an RST if not done yet */
2316 if (h2s->st == H2_SS_ERROR)
2317 h2c->st0 = H2_CS_FRAME_E;
Willy Tarreau27a84c92017-10-17 08:10:17 +02002318
Willy Tarreaua20a5192017-12-27 11:02:06 +01002319 if (h2c->st0 == H2_CS_FRAME_E)
2320 ret = h2c_send_rst_stream(h2c, h2s);
Willy Tarreau27a84c92017-10-17 08:10:17 +02002321
Willy Tarreau7e98c052017-10-10 15:56:59 +02002322 /* error or missing data condition met above ? */
Willy Tarreau1ed87b72018-11-25 08:45:16 +01002323 if (ret <= 0)
Willy Tarreau7e98c052017-10-10 15:56:59 +02002324 break;
2325
2326 if (h2c->st0 != H2_CS_FRAME_H) {
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002327 b_del(&h2c->dbuf, h2c->dfl);
Willy Tarreau7e98c052017-10-10 15:56:59 +02002328 h2c->st0 = H2_CS_FRAME_H;
2329 }
2330 }
Willy Tarreau52eed752017-09-22 15:05:09 +02002331
Willy Tarreaucc0b8c32017-10-26 16:55:59 +02002332 if (h2c->rcvd_c > 0 &&
2333 !(h2c->flags & (H2_CF_MUX_MFULL | H2_CF_DEM_MBUSY | H2_CF_DEM_MROOM)))
2334 h2c_send_conn_wu(h2c);
2335
Willy Tarreau52eed752017-09-22 15:05:09 +02002336 fail:
2337 /* we can go here on missing data, blocked response or error */
Olivier Houchard638b7992018-08-16 15:41:52 +02002338 if (h2s && h2s->cs && b_data(&h2s->rxbuf)) {
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002339 /* we may have to signal the upper layers */
2340 h2s->cs->flags |= CS_FL_RCV_MORE;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002341 if (h2s->recv_wait) {
2342 h2s->recv_wait->wait_reason &= ~SUB_CAN_RECV;
2343 tasklet_wakeup(h2s->recv_wait->task);
2344 h2s->recv_wait = NULL;
Willy Tarreau2a761dc2018-02-26 18:50:57 +01002345 }
2346 }
Willy Tarreau1ed87b72018-11-25 08:45:16 +01002347
2348 if (h2_recv_allowed(h2c))
2349 tasklet_wakeup(h2c->wait_event.task);
Willy Tarreaubc933932017-10-09 16:21:43 +02002350}
2351
2352/* process Tx frames from streams to be multiplexed. Returns > 0 if it reached
2353 * the end.
2354 */
2355static int h2_process_mux(struct h2c *h2c)
2356{
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002357 struct h2s *h2s, *h2s_back;
Willy Tarreaubacdf5a2017-10-17 10:57:04 +02002358
Willy Tarreau01b44822018-10-03 14:26:37 +02002359 if (unlikely(h2c->st0 < H2_CS_FRAME_H)) {
2360 if (unlikely(h2c->st0 == H2_CS_PREFACE && (h2c->flags & H2_CF_IS_BACK))) {
2361 if (unlikely(h2c_bck_send_preface(h2c) <= 0)) {
2362 /* RFC7540#3.5: a GOAWAY frame MAY be omitted */
2363 if (h2c->st0 == H2_CS_ERROR) {
2364 h2c->st0 = H2_CS_ERROR2;
2365 sess_log(h2c->conn->owner);
2366 }
2367 goto fail;
2368 }
2369 h2c->st0 = H2_CS_SETTINGS1;
2370 }
2371 /* need to wait for the other side */
Willy Tarreau75a930a2018-12-12 08:03:58 +01002372 if (h2c->st0 < H2_CS_FRAME_H)
Willy Tarreau01b44822018-10-03 14:26:37 +02002373 return 1;
2374 }
2375
Willy Tarreaucc0b8c32017-10-26 16:55:59 +02002376 /* start by sending possibly pending window updates */
2377 if (h2c->rcvd_c > 0 &&
2378 !(h2c->flags & (H2_CF_MUX_MFULL | H2_CF_MUX_MALLOC)) &&
2379 h2c_send_conn_wu(h2c) < 0)
2380 goto fail;
2381
Willy Tarreaubacdf5a2017-10-17 10:57:04 +02002382 /* First we always process the flow control list because the streams
2383 * waiting there were already elected for immediate emission but were
2384 * blocked just on this.
2385 */
2386
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002387 list_for_each_entry_safe(h2s, h2s_back, &h2c->fctl_list, list) {
Willy Tarreaubacdf5a2017-10-17 10:57:04 +02002388 if (h2c->mws <= 0 || h2c->flags & H2_CF_MUX_BLOCK_ANY ||
2389 h2c->st0 >= H2_CS_ERROR)
2390 break;
2391
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002392 h2s->flags &= ~H2_SF_BLK_ANY;
2393 h2s->send_wait->wait_reason &= ~SUB_CAN_SEND;
Olivier Houchardd846c262018-10-19 17:24:29 +02002394 h2s->send_wait->wait_reason |= SUB_CALL_UNSUBSCRIBE;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002395 tasklet_wakeup(h2s->send_wait->task);
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002396 LIST_DEL(&h2s->list);
2397 LIST_INIT(&h2s->list);
Olivier Houchardd846c262018-10-19 17:24:29 +02002398 LIST_ADDQ(&h2c->sending_list, &h2s->list);
Willy Tarreaubacdf5a2017-10-17 10:57:04 +02002399 }
2400
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002401 list_for_each_entry_safe(h2s, h2s_back, &h2c->send_list, list) {
Willy Tarreaubacdf5a2017-10-17 10:57:04 +02002402 if (h2c->st0 >= H2_CS_ERROR || h2c->flags & H2_CF_MUX_BLOCK_ANY)
2403 break;
2404
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002405 h2s->flags &= ~H2_SF_BLK_ANY;
2406 h2s->send_wait->wait_reason &= ~SUB_CAN_SEND;
Olivier Houchardd846c262018-10-19 17:24:29 +02002407 h2s->send_wait->wait_reason |= SUB_CALL_UNSUBSCRIBE;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002408 tasklet_wakeup(h2s->send_wait->task);
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002409 LIST_DEL(&h2s->list);
2410 LIST_INIT(&h2s->list);
Olivier Houchardd846c262018-10-19 17:24:29 +02002411 LIST_ADDQ(&h2c->sending_list, &h2s->list);
Willy Tarreaubacdf5a2017-10-17 10:57:04 +02002412 }
2413
Willy Tarreaucc0b8c32017-10-26 16:55:59 +02002414 fail:
Willy Tarreau3eabe9b2017-11-07 11:03:01 +01002415 if (unlikely(h2c->st0 >= H2_CS_ERROR)) {
Willy Tarreau081d4722017-05-16 21:51:05 +02002416 if (h2c->st0 == H2_CS_ERROR) {
2417 if (h2c->max_id >= 0) {
2418 h2c_send_goaway_error(h2c, NULL);
2419 if (h2c->flags & H2_CF_MUX_BLOCK_ANY)
2420 return 0;
2421 }
2422
2423 h2c->st0 = H2_CS_ERROR2; // sent (or failed hard) !
2424 }
2425 return 1;
2426 }
Willy Tarreaubacdf5a2017-10-17 10:57:04 +02002427 return (h2c->mws <= 0 || LIST_ISEMPTY(&h2c->fctl_list)) && LIST_ISEMPTY(&h2c->send_list);
Willy Tarreaubc933932017-10-09 16:21:43 +02002428}
2429
Willy Tarreau62f52692017-10-08 23:01:42 +02002430
Willy Tarreau479998a2018-11-18 06:30:59 +01002431/* Attempt to read data, and subscribe if none available.
2432 * The function returns 1 if data has been received, otherwise zero.
2433 */
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002434static int h2_recv(struct h2c *h2c)
Willy Tarreau62f52692017-10-08 23:01:42 +02002435{
Olivier Houchardaf4021e2018-08-09 13:06:55 +02002436 struct connection *conn = h2c->conn;
Willy Tarreau35dbd5d2017-09-22 09:13:49 +02002437 struct buffer *buf;
Willy Tarreaua2af5122017-10-09 11:56:46 +02002438 int max;
Olivier Houchard7505f942018-08-21 18:10:44 +02002439 size_t ret;
Willy Tarreaua2af5122017-10-09 11:56:46 +02002440
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002441 if (h2c->wait_event.wait_reason & SUB_CAN_RECV)
Olivier Houchard81a15af2018-10-19 17:26:49 +02002442 return (b_data(&h2c->dbuf));
Olivier Houchardaf4021e2018-08-09 13:06:55 +02002443
Willy Tarreau315d8072017-12-10 22:17:57 +01002444 if (!h2_recv_allowed(h2c))
Olivier Houchard81a15af2018-10-19 17:26:49 +02002445 return 1;
Willy Tarreaua2af5122017-10-09 11:56:46 +02002446
Willy Tarreau44e973f2018-03-01 17:49:30 +01002447 buf = h2_get_buf(h2c, &h2c->dbuf);
Willy Tarreau1b62c5c2017-09-25 11:55:01 +02002448 if (!buf) {
2449 h2c->flags |= H2_CF_DEM_DALLOC;
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002450 return 0;
Willy Tarreau1b62c5c2017-09-25 11:55:01 +02002451 }
Willy Tarreau35dbd5d2017-09-22 09:13:49 +02002452
Olivier Houchard7505f942018-08-21 18:10:44 +02002453 do {
Willy Tarreaue0f24ee2018-12-14 10:51:23 +01002454 b_realign_if_empty(buf);
Willy Tarreau2a59e872018-12-12 08:23:47 +01002455 if (!b_data(buf) && (h2c->proxy->options2 & PR_O2_USE_HTX)) {
2456 /* HTX in use : try to pre-align the buffer like the
2457 * rxbufs will be to optimize memory copies. We'll make
2458 * sure that the frame header lands at the end of the
2459 * HTX block to alias it upon recv. We cannot use the
2460 * head because rcv_buf() will realign the buffer if
2461 * it's empty. Thus we cheat and pretend we already
2462 * have a few bytes there.
2463 */
2464 max = buf_room_for_htx_data(buf) + 9;
Willy Tarreauc0960d12018-12-14 10:59:15 +01002465 buf->head = sizeof(struct htx) - 9;
Willy Tarreau2a59e872018-12-12 08:23:47 +01002466 }
2467 else
2468 max = b_room(buf);
2469
Olivier Houchard7505f942018-08-21 18:10:44 +02002470 if (max)
2471 ret = conn->xprt->rcv_buf(conn, buf, max, 0);
2472 else
2473 ret = 0;
2474 } while (ret > 0);
Willy Tarreaua2af5122017-10-09 11:56:46 +02002475
Olivier Houchard53216e72018-10-10 15:46:36 +02002476 if (h2_recv_allowed(h2c) && (b_data(buf) < buf->size))
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002477 conn->xprt->subscribe(conn, SUB_CAN_RECV, &h2c->wait_event);
Olivier Houchard81a15af2018-10-19 17:26:49 +02002478
Olivier Houcharda1411e62018-08-17 18:42:48 +02002479 if (!b_data(buf)) {
Willy Tarreau44e973f2018-03-01 17:49:30 +01002480 h2_release_buf(h2c, &h2c->dbuf);
Olivier Houchard46677732018-11-29 17:06:17 +01002481 return (conn->flags & CO_FL_ERROR || conn_xprt_read0_pending(conn));
Willy Tarreaua2af5122017-10-09 11:56:46 +02002482 }
2483
Willy Tarreaub7b5fe12018-06-18 13:33:09 +02002484 if (b_data(buf) == buf->size)
Willy Tarreaufbe3b4f2017-10-09 15:14:19 +02002485 h2c->flags |= H2_CF_DEM_DFULL;
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002486 return 1;
Willy Tarreau62f52692017-10-08 23:01:42 +02002487}
2488
Willy Tarreau479998a2018-11-18 06:30:59 +01002489/* Try to send data if possible.
2490 * The function returns 1 if data have been sent, otherwise zero.
2491 */
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002492static int h2_send(struct h2c *h2c)
Willy Tarreau62f52692017-10-08 23:01:42 +02002493{
Olivier Houchard29fb89d2018-08-02 18:56:36 +02002494 struct connection *conn = h2c->conn;
Willy Tarreaubc933932017-10-09 16:21:43 +02002495 int done;
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002496 int sent = 0;
Willy Tarreaua2af5122017-10-09 11:56:46 +02002497
2498 if (conn->flags & CO_FL_ERROR)
Olivier Houchard7c6f8b12018-11-13 16:48:36 +01002499 return 1;
Willy Tarreaua2af5122017-10-09 11:56:46 +02002500
Olivier Houchard7505f942018-08-21 18:10:44 +02002501
Willy Tarreaua2af5122017-10-09 11:56:46 +02002502 if (conn->flags & (CO_FL_HANDSHAKE|CO_FL_WAIT_L4_CONN|CO_FL_WAIT_L6_CONN)) {
2503 /* a handshake was requested */
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002504 goto schedule;
Willy Tarreaua2af5122017-10-09 11:56:46 +02002505 }
2506
Willy Tarreaubc933932017-10-09 16:21:43 +02002507 /* This loop is quite simple : it tries to fill as much as it can from
2508 * pending streams into the existing buffer until it's reportedly full
2509 * or the end of send requests is reached. Then it tries to send this
2510 * buffer's contents out, marks it not full if at least one byte could
2511 * be sent, and tries again.
2512 *
2513 * The snd_buf() function normally takes a "flags" argument which may
2514 * be made of a combination of CO_SFL_MSG_MORE to indicate that more
2515 * data immediately comes and CO_SFL_STREAMER to indicate that the
2516 * connection is streaming lots of data (used to increase TLS record
2517 * size at the expense of latency). The former can be sent any time
2518 * there's a buffer full flag, as it indicates at least one stream
2519 * attempted to send and failed so there are pending data. An
2520 * alternative would be to set it as long as there's an active stream
2521 * but that would be problematic for ACKs until we have an absolute
2522 * guarantee that all waiters have at least one byte to send. The
2523 * latter should possibly not be set for now.
2524 */
2525
2526 done = 0;
2527 while (!done) {
2528 unsigned int flags = 0;
2529
2530 /* fill as much as we can into the current buffer */
2531 while (((h2c->flags & (H2_CF_MUX_MFULL|H2_CF_MUX_MALLOC)) == 0) && !done)
2532 done = h2_process_mux(h2c);
2533
2534 if (conn->flags & CO_FL_ERROR)
2535 break;
2536
2537 if (h2c->flags & (H2_CF_MUX_MFULL | H2_CF_DEM_MBUSY | H2_CF_DEM_MROOM))
2538 flags |= CO_SFL_MSG_MORE;
2539
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002540 if (b_data(&h2c->mbuf)) {
2541 int ret = conn->xprt->snd_buf(conn, &h2c->mbuf, b_data(&h2c->mbuf), flags);
Willy Tarreau787db9a2018-06-14 18:31:46 +02002542 if (!ret)
2543 break;
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002544 sent = 1;
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002545 b_del(&h2c->mbuf, ret);
2546 b_realign_if_empty(&h2c->mbuf);
Willy Tarreau787db9a2018-06-14 18:31:46 +02002547 }
Willy Tarreaubc933932017-10-09 16:21:43 +02002548
2549 /* wrote at least one byte, the buffer is not full anymore */
2550 h2c->flags &= ~(H2_CF_MUX_MFULL | H2_CF_DEM_MROOM);
2551 }
2552
Willy Tarreaua2af5122017-10-09 11:56:46 +02002553 if (conn->flags & CO_FL_SOCK_WR_SH) {
2554 /* output closed, nothing to send, clear the buffer to release it */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002555 b_reset(&h2c->mbuf);
Willy Tarreaua2af5122017-10-09 11:56:46 +02002556 }
Olivier Houchard6ff20392018-07-17 18:46:31 +02002557 /* We're not full anymore, so we can wake any task that are waiting
2558 * for us.
2559 */
2560 if (!(h2c->flags & (H2_CF_MUX_MFULL | H2_CF_DEM_MROOM))) {
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002561 while (!LIST_ISEMPTY(&h2c->send_list)) {
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002562 struct h2s *h2s = LIST_ELEM(h2c->send_list.n,
2563 struct h2s *, list);
2564 LIST_DEL(&h2s->list);
2565 LIST_INIT(&h2s->list);
Olivier Houchardd846c262018-10-19 17:24:29 +02002566 LIST_ADDQ(&h2c->sending_list, &h2s->list);
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002567 h2s->send_wait->wait_reason &= ~SUB_CAN_SEND;
Olivier Houchardd846c262018-10-19 17:24:29 +02002568 h2s->send_wait->wait_reason |= SUB_CALL_UNSUBSCRIBE;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002569 tasklet_wakeup(h2s->send_wait->task);
Olivier Houchard4cf7fb12018-08-02 19:23:05 +02002570 }
Olivier Houchard6ff20392018-07-17 18:46:31 +02002571 }
Olivier Houchard910b2bc2018-07-17 18:49:38 +02002572 /* We're done, no more to send */
2573 if (!b_data(&h2c->mbuf))
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002574 return sent;
Olivier Houchard910b2bc2018-07-17 18:49:38 +02002575schedule:
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002576 if (!(h2c->wait_event.wait_reason & SUB_CAN_SEND))
2577 conn->xprt->subscribe(conn, SUB_CAN_SEND, &h2c->wait_event);
Olivier Houchardd4dd22d2018-08-17 18:39:46 +02002578 return sent;
Olivier Houchard29fb89d2018-08-02 18:56:36 +02002579}
2580
2581static struct task *h2_io_cb(struct task *t, void *ctx, unsigned short status)
2582{
2583 struct h2c *h2c = ctx;
Olivier Houchard7505f942018-08-21 18:10:44 +02002584 int ret = 0;
Olivier Houchard29fb89d2018-08-02 18:56:36 +02002585
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002586 if (!(h2c->wait_event.wait_reason & SUB_CAN_SEND))
Olivier Houchard7505f942018-08-21 18:10:44 +02002587 ret = h2_send(h2c);
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002588 if (!(h2c->wait_event.wait_reason & SUB_CAN_RECV))
Olivier Houchard7505f942018-08-21 18:10:44 +02002589 ret |= h2_recv(h2c);
Willy Tarreaucef5c8e2018-12-18 10:29:54 +01002590 if (ret || b_data(&h2c->dbuf))
Olivier Houchard7505f942018-08-21 18:10:44 +02002591 h2_process(h2c);
Olivier Houchard910b2bc2018-07-17 18:49:38 +02002592 return NULL;
Willy Tarreaufbe3b4f2017-10-09 15:14:19 +02002593}
Willy Tarreaua2af5122017-10-09 11:56:46 +02002594
Willy Tarreau62f52692017-10-08 23:01:42 +02002595/* callback called on any event by the connection handler.
2596 * It applies changes and returns zero, or < 0 if it wants immediate
2597 * destruction of the connection (which normally doesn not happen in h2).
2598 */
Olivier Houchard7505f942018-08-21 18:10:44 +02002599static int h2_process(struct h2c *h2c)
Willy Tarreau62f52692017-10-08 23:01:42 +02002600{
Olivier Houchard7505f942018-08-21 18:10:44 +02002601 struct connection *conn = h2c->conn;
Willy Tarreaua2af5122017-10-09 11:56:46 +02002602
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002603 if (b_data(&h2c->dbuf) && !(h2c->flags & H2_CF_DEM_BLOCK_ANY)) {
Willy Tarreaud13bf272017-12-14 10:34:52 +01002604 h2_process_demux(h2c);
2605
2606 if (h2c->st0 >= H2_CS_ERROR || conn->flags & CO_FL_ERROR)
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002607 b_reset(&h2c->dbuf);
Willy Tarreaud13bf272017-12-14 10:34:52 +01002608
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002609 if (!b_full(&h2c->dbuf))
Willy Tarreaud13bf272017-12-14 10:34:52 +01002610 h2c->flags &= ~H2_CF_DEM_DFULL;
2611 }
Olivier Houchard7505f942018-08-21 18:10:44 +02002612 h2_send(h2c);
Willy Tarreaud13bf272017-12-14 10:34:52 +01002613
Willy Tarreau0b37d652018-10-03 10:33:02 +02002614 if (unlikely(h2c->proxy->state == PR_STSTOPPED)) {
Willy Tarreau8ec14062017-12-30 18:08:13 +01002615 /* frontend is stopping, reload likely in progress, let's try
2616 * to announce a graceful shutdown if not yet done. We don't
2617 * care if it fails, it will be tried again later.
2618 */
2619 if (!(h2c->flags & (H2_CF_GOAWAY_SENT|H2_CF_GOAWAY_FAILED))) {
2620 if (h2c->last_sid < 0)
2621 h2c->last_sid = (1U << 31) - 1;
2622 h2c_send_goaway_error(h2c, NULL);
2623 }
2624 }
2625
Olivier Houchard7fc96d52017-11-23 18:25:47 +01002626 /*
Olivier Houchard6fa63d92017-11-27 18:41:32 +01002627 * If we received early data, and the handshake is done, wake
2628 * any stream that was waiting for it.
Olivier Houchard7fc96d52017-11-23 18:25:47 +01002629 */
Olivier Houchard6fa63d92017-11-27 18:41:32 +01002630 if (!(h2c->flags & H2_CF_WAIT_FOR_HS) &&
2631 (conn->flags & (CO_FL_EARLY_SSL_HS | CO_FL_HANDSHAKE | CO_FL_EARLY_DATA)) == CO_FL_EARLY_DATA) {
2632 struct eb32_node *node;
2633 struct h2s *h2s;
2634
2635 h2c->flags |= H2_CF_WAIT_FOR_HS;
2636 node = eb32_lookup_ge(&h2c->streams_by_id, 1);
2637
2638 while (node) {
2639 h2s = container_of(node, struct h2s, by_id);
Olivier Houchardc2aa7112018-09-11 18:27:21 +02002640 if ((h2s->cs->flags & CS_FL_WAIT_FOR_HS) &&
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002641 h2s->recv_wait) {
2642 struct wait_event *sw = h2s->recv_wait;
Olivier Houchardc2aa7112018-09-11 18:27:21 +02002643 sw->wait_reason &= ~SUB_CAN_RECV;
2644 tasklet_wakeup(sw->task);
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002645 h2s->recv_wait = NULL;
Olivier Houchardc2aa7112018-09-11 18:27:21 +02002646 }
Olivier Houchard6fa63d92017-11-27 18:41:32 +01002647 node = eb32_next(node);
2648 }
Olivier Houchard7fc96d52017-11-23 18:25:47 +01002649 }
Olivier Houchard6fa63d92017-11-27 18:41:32 +01002650
Willy Tarreau26bd7612017-10-09 16:47:04 +02002651 if (conn->flags & CO_FL_ERROR || conn_xprt_read0_pending(conn) ||
Willy Tarreau29a98242017-10-31 06:59:15 +01002652 h2c->st0 == H2_CS_ERROR2 || h2c->flags & H2_CF_GOAWAY_FAILED ||
2653 (eb_is_empty(&h2c->streams_by_id) && h2c->last_sid >= 0 &&
2654 h2c->max_id >= h2c->last_sid)) {
Willy Tarreau23b92aa2017-10-30 00:26:54 +01002655 h2_wake_some_streams(h2c, 0, 0);
Willy Tarreaufbe3b4f2017-10-09 15:14:19 +02002656
2657 if (eb_is_empty(&h2c->streams_by_id)) {
2658 /* no more stream, kill the connection now */
2659 h2_release(conn);
2660 return -1;
2661 }
Willy Tarreaufbe3b4f2017-10-09 15:14:19 +02002662 }
2663
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002664 if (!b_data(&h2c->dbuf))
Willy Tarreau44e973f2018-03-01 17:49:30 +01002665 h2_release_buf(h2c, &h2c->dbuf);
Willy Tarreaufbe3b4f2017-10-09 15:14:19 +02002666
Olivier Houchard53216e72018-10-10 15:46:36 +02002667 if ((conn->flags & CO_FL_SOCK_WR_SH) ||
2668 h2c->st0 == H2_CS_ERROR2 || (h2c->flags & H2_CF_GOAWAY_FAILED) ||
2669 (h2c->st0 != H2_CS_ERROR &&
2670 !b_data(&h2c->mbuf) &&
2671 (h2c->mws <= 0 || LIST_ISEMPTY(&h2c->fctl_list)) &&
2672 ((h2c->flags & H2_CF_MUX_BLOCK_ANY) || LIST_ISEMPTY(&h2c->send_list))))
Willy Tarreau44e973f2018-03-01 17:49:30 +01002673 h2_release_buf(h2c, &h2c->mbuf);
Willy Tarreaua2af5122017-10-09 11:56:46 +02002674
Willy Tarreau3f133572017-10-31 19:21:06 +01002675 if (h2c->task) {
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002676 if (eb_is_empty(&h2c->streams_by_id) || b_data(&h2c->mbuf)) {
Willy Tarreau599391a2017-11-24 10:16:00 +01002677 h2c->task->expire = tick_add(now_ms, h2c->last_sid < 0 ? h2c->timeout : h2c->shut_timeout);
Willy Tarreau3f133572017-10-31 19:21:06 +01002678 task_queue(h2c->task);
2679 }
2680 else
2681 h2c->task->expire = TICK_ETERNITY;
Willy Tarreauea392822017-10-31 10:02:25 +01002682 }
Olivier Houchard910b2bc2018-07-17 18:49:38 +02002683
Olivier Houchard7505f942018-08-21 18:10:44 +02002684 h2_send(h2c);
Willy Tarreau62f52692017-10-08 23:01:42 +02002685 return 0;
2686}
2687
Olivier Houchard21df6cc2018-09-14 23:21:44 +02002688static int h2_wake(struct connection *conn)
2689{
2690 struct h2c *h2c = conn->mux_ctx;
2691
2692 return (h2_process(h2c));
2693}
2694
Willy Tarreauea392822017-10-31 10:02:25 +01002695/* Connection timeout management. The principle is that if there's no receipt
2696 * nor sending for a certain amount of time, the connection is closed. If the
2697 * MUX buffer still has lying data or is not allocatable, the connection is
2698 * immediately killed. If it's allocatable and empty, we attempt to send a
2699 * GOAWAY frame.
2700 */
Olivier Houchard9f6af332018-05-25 14:04:04 +02002701static struct task *h2_timeout_task(struct task *t, void *context, unsigned short state)
Willy Tarreauea392822017-10-31 10:02:25 +01002702{
Olivier Houchard9f6af332018-05-25 14:04:04 +02002703 struct h2c *h2c = context;
Willy Tarreauea392822017-10-31 10:02:25 +01002704 int expired = tick_is_expired(t->expire, now_ms);
2705
Willy Tarreau0975f112018-03-29 15:22:59 +02002706 if (!expired && h2c)
Willy Tarreauea392822017-10-31 10:02:25 +01002707 return t;
2708
Willy Tarreau0975f112018-03-29 15:22:59 +02002709 task_delete(t);
2710 task_free(t);
2711
2712 if (!h2c) {
2713 /* resources were already deleted */
2714 return NULL;
2715 }
2716
2717 h2c->task = NULL;
Willy Tarreauea392822017-10-31 10:02:25 +01002718 h2c_error(h2c, H2_ERR_NO_ERROR);
2719 h2_wake_some_streams(h2c, 0, 0);
2720
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002721 if (b_data(&h2c->mbuf)) {
Willy Tarreauea392822017-10-31 10:02:25 +01002722 /* don't even try to send a GOAWAY, the buffer is stuck */
2723 h2c->flags |= H2_CF_GOAWAY_FAILED;
2724 }
2725
2726 /* try to send but no need to insist */
Willy Tarreau599391a2017-11-24 10:16:00 +01002727 h2c->last_sid = h2c->max_id;
Willy Tarreauea392822017-10-31 10:02:25 +01002728 if (h2c_send_goaway_error(h2c, NULL) <= 0)
2729 h2c->flags |= H2_CF_GOAWAY_FAILED;
2730
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002731 if (b_data(&h2c->mbuf) && !(h2c->flags & H2_CF_GOAWAY_FAILED) && conn_xprt_ready(h2c->conn)) {
2732 int ret = h2c->conn->xprt->snd_buf(h2c->conn, &h2c->mbuf, b_data(&h2c->mbuf), 0);
Willy Tarreau787db9a2018-06-14 18:31:46 +02002733 if (ret > 0) {
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002734 b_del(&h2c->mbuf, ret);
2735 b_realign_if_empty(&h2c->mbuf);
Willy Tarreau787db9a2018-06-14 18:31:46 +02002736 }
2737 }
Willy Tarreauea392822017-10-31 10:02:25 +01002738
Willy Tarreau0975f112018-03-29 15:22:59 +02002739 /* either we can release everything now or it will be done later once
2740 * the last stream closes.
2741 */
2742 if (eb_is_empty(&h2c->streams_by_id))
2743 h2_release(h2c->conn);
Willy Tarreauea392822017-10-31 10:02:25 +01002744
Willy Tarreauea392822017-10-31 10:02:25 +01002745 return NULL;
2746}
2747
2748
Willy Tarreau62f52692017-10-08 23:01:42 +02002749/*******************************************/
2750/* functions below are used by the streams */
2751/*******************************************/
2752
2753/*
2754 * Attach a new stream to a connection
2755 * (Used for outgoing connections)
2756 */
Olivier Houchardf502aca2018-12-14 19:42:40 +01002757static struct conn_stream *h2_attach(struct connection *conn, struct session *sess)
Willy Tarreau62f52692017-10-08 23:01:42 +02002758{
Olivier Houchard7a57e8a2018-11-27 17:36:33 +01002759 struct conn_stream *cs;
2760 struct h2s *h2s;
2761 struct h2c *h2c = conn->mux_ctx;
2762
2763 cs = cs_new(conn);
2764 if (!cs)
2765 return NULL;
Olivier Houchardf502aca2018-12-14 19:42:40 +01002766 h2s = h2c_bck_stream_new(h2c, cs, sess);
Olivier Houchard7a57e8a2018-11-27 17:36:33 +01002767 if (!h2s) {
2768 cs_free(cs);
2769 return NULL;
2770 }
2771 return cs;
Willy Tarreau62f52692017-10-08 23:01:42 +02002772}
2773
Willy Tarreaufafd3982018-11-18 21:29:20 +01002774/* Retrieves the first valid conn_stream from this connection, or returns NULL.
2775 * We have to scan because we may have some orphan streams. It might be
2776 * beneficial to scan backwards from the end to reduce the likeliness to find
2777 * orphans.
2778 */
2779static const struct conn_stream *h2_get_first_cs(const struct connection *conn)
2780{
2781 struct h2c *h2c = conn->mux_ctx;
2782 struct h2s *h2s;
2783 struct eb32_node *node;
2784
2785 node = eb32_first(&h2c->streams_by_id);
2786 while (node) {
2787 h2s = container_of(node, struct h2s, by_id);
2788 if (h2s->cs)
2789 return h2s->cs;
2790 node = eb32_next(node);
2791 }
2792 return NULL;
2793}
2794
Willy Tarreau62f52692017-10-08 23:01:42 +02002795/*
Olivier Houchard060ed432018-11-06 16:32:42 +01002796 * Destroy the mux and the associated connection, if it is no longer used
2797 */
2798static void h2_destroy(struct connection *conn)
2799{
2800 struct h2c *h2c = conn->mux_ctx;
2801
2802 if (eb_is_empty(&h2c->streams_by_id))
2803 h2_release(h2c->conn);
2804}
2805
2806/*
Willy Tarreau62f52692017-10-08 23:01:42 +02002807 * Detach the stream from the connection and possibly release the connection.
2808 */
2809static void h2_detach(struct conn_stream *cs)
2810{
Willy Tarreau60935142017-10-16 18:11:19 +02002811 struct h2s *h2s = cs->ctx;
2812 struct h2c *h2c;
Olivier Houchardf502aca2018-12-14 19:42:40 +01002813 struct session *sess;
Willy Tarreau60935142017-10-16 18:11:19 +02002814
2815 cs->ctx = NULL;
2816 if (!h2s)
2817 return;
2818
Olivier Houchardf502aca2018-12-14 19:42:40 +01002819 sess = h2s->sess;
Willy Tarreau60935142017-10-16 18:11:19 +02002820 h2c = h2s->h2c;
2821 h2s->cs = NULL;
Willy Tarreau7ac60e82018-07-19 09:04:05 +02002822 h2c->nb_cs--;
Willy Tarreauf2101912018-07-19 10:11:38 +02002823 if (h2c->flags & H2_CF_DEM_TOOMANY &&
2824 !h2_has_too_many_cs(h2c)) {
2825 h2c->flags &= ~H2_CF_DEM_TOOMANY;
Olivier Houchard53216e72018-10-10 15:46:36 +02002826 if (h2_recv_allowed(h2c))
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002827 tasklet_wakeup(h2c->wait_event.task);
Willy Tarreauf2101912018-07-19 10:11:38 +02002828 }
Willy Tarreau60935142017-10-16 18:11:19 +02002829
Willy Tarreau22cf59b2017-11-10 11:42:33 +01002830 /* this stream may be blocked waiting for some data to leave (possibly
2831 * an ES or RST frame), so orphan it in this case.
2832 */
Willy Tarreau3041fcc2018-03-29 15:41:32 +02002833 if (!(cs->conn->flags & CO_FL_ERROR) &&
Willy Tarreaua2b51812018-07-27 09:55:14 +02002834 (h2c->st0 < H2_CS_ERROR) &&
Willy Tarreau3041fcc2018-03-29 15:41:32 +02002835 (h2s->flags & (H2_SF_BLK_MBUSY | H2_SF_BLK_MROOM | H2_SF_BLK_MFCTL)))
Willy Tarreau22cf59b2017-11-10 11:42:33 +01002836 return;
2837
Willy Tarreau45f752e2017-10-30 15:44:59 +01002838 if ((h2c->flags & H2_CF_DEM_BLOCK_ANY && h2s->id == h2c->dsi) ||
2839 (h2c->flags & H2_CF_MUX_BLOCK_ANY && h2s->id == h2c->msi)) {
2840 /* unblock the connection if it was blocked on this
2841 * stream.
2842 */
2843 h2c->flags &= ~H2_CF_DEM_BLOCK_ANY;
2844 h2c->flags &= ~H2_CF_MUX_BLOCK_ANY;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002845 tasklet_wakeup(h2c->wait_event.task);
Willy Tarreau45f752e2017-10-30 15:44:59 +01002846 }
2847
Willy Tarreau71049cc2018-03-28 13:56:39 +02002848 h2s_destroy(h2s);
Willy Tarreau60935142017-10-16 18:11:19 +02002849
Olivier Houchard8a786902018-12-15 16:05:40 +01002850 if (h2c->flags & H2_CF_IS_BACK &&
2851 (h2c->proxy->options2 & PR_O2_USE_HTX)) {
Olivier Houchard8a786902018-12-15 16:05:40 +01002852 if (!(h2c->conn->flags &
2853 (CO_FL_ERROR | CO_FL_SOCK_RD_SH | CO_FL_SOCK_WR_SH))) {
2854 if (!h2c->conn->owner) {
Olivier Houchardf502aca2018-12-14 19:42:40 +01002855 h2c->conn->owner = sess;
2856 session_add_conn(sess, h2c->conn, h2c->conn->target);
Olivier Houchard8a786902018-12-15 16:05:40 +01002857 }
Olivier Houcharda4d4fdf2018-12-14 19:27:06 +01002858 if (eb_is_empty(&h2c->streams_by_id)) {
2859 if (session_check_idle_conn(h2c->conn->owner, h2c->conn) != 0)
2860 /* At this point either the connection is destroyed, or it's been added to the server idle list, just stop */
2861 return;
2862 }
Olivier Houchard8a786902018-12-15 16:05:40 +01002863 /* Never ever allow to reuse a connection from a non-reuse backend */
2864 if ((h2c->proxy->options & PR_O_REUSE_MASK) == PR_O_REUSE_NEVR)
2865 h2c->conn->flags |= CO_FL_PRIVATE;
2866 if (LIST_ISEMPTY(&h2c->conn->list)) {
2867 struct server *srv = objt_server(h2c->conn->target);
2868
2869 if (srv) {
2870 if (h2c->conn->flags & CO_FL_PRIVATE)
2871 LIST_ADD(&srv->priv_conns[tid], &h2c->conn->list);
2872 else
2873 LIST_ADD(&srv->idle_conns[tid], &h2c->conn->list);
2874 }
2875
2876 }
2877 }
2878 }
2879
Willy Tarreaue323f342018-03-28 13:51:45 +02002880 /* We don't want to close right now unless we're removing the
2881 * last stream, and either the connection is in error, or it
2882 * reached the ID already specified in a GOAWAY frame received
2883 * or sent (as seen by last_sid >= 0).
2884 */
2885 if (eb_is_empty(&h2c->streams_by_id) && /* don't close if streams exist */
2886 ((h2c->conn->flags & CO_FL_ERROR) || /* errors close immediately */
Willy Tarreau42d55b92018-06-13 14:24:56 +02002887 (h2c->st0 >= H2_CS_ERROR && !h2c->task) || /* a timeout stroke earlier */
Olivier Houchard52b94662018-10-21 03:01:20 +02002888 (h2c->flags & (H2_CF_GOAWAY_FAILED | H2_CF_GOAWAY_SENT)) ||
Olivier Houchard93c88522018-11-30 15:39:16 +01002889 (!(h2c->conn->owner)) || /* Nobody's left to take care of the connection, drop it now */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002890 (!b_data(&h2c->mbuf) && /* mux buffer empty, also process clean events below */
Willy Tarreaue323f342018-03-28 13:51:45 +02002891 (conn_xprt_read0_pending(h2c->conn) ||
2892 (h2c->last_sid >= 0 && h2c->max_id >= h2c->last_sid))))) {
2893 /* no more stream will come, kill it now */
2894 h2_release(h2c->conn);
2895 }
2896 else if (h2c->task) {
Willy Tarreauc9fa0482018-07-10 17:43:27 +02002897 if (eb_is_empty(&h2c->streams_by_id) || b_data(&h2c->mbuf)) {
Willy Tarreaue323f342018-03-28 13:51:45 +02002898 h2c->task->expire = tick_add(now_ms, h2c->last_sid < 0 ? h2c->timeout : h2c->shut_timeout);
2899 task_queue(h2c->task);
Willy Tarreaue6ae77f2017-11-07 11:59:51 +01002900 }
Willy Tarreaue323f342018-03-28 13:51:45 +02002901 else
2902 h2c->task->expire = TICK_ETERNITY;
Willy Tarreau60935142017-10-16 18:11:19 +02002903 }
Willy Tarreau62f52692017-10-08 23:01:42 +02002904}
2905
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002906static void h2_do_shutr(struct h2s *h2s)
Willy Tarreau62f52692017-10-08 23:01:42 +02002907{
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002908 struct h2c *h2c = h2s->h2c;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002909 struct wait_event *sw = &h2s->wait_event;
Willy Tarreauc7576ea2017-10-29 22:00:09 +01002910
Willy Tarreau721c9742017-11-07 11:05:42 +01002911 if (h2s->st == H2_SS_HLOC || h2s->st == H2_SS_ERROR || h2s->st == H2_SS_CLOSED)
Willy Tarreauc7576ea2017-10-29 22:00:09 +01002912 return;
2913
Willy Tarreau926fa4c2017-11-07 14:42:12 +01002914 /* if no outgoing data was seen on this stream, it means it was
2915 * closed with a "tcp-request content" rule that is normally
2916 * used to kill the connection ASAP (eg: limit abuse). In this
2917 * case we send a goaway to close the connection.
2918 */
Willy Tarreau90c32322017-11-24 08:00:30 +01002919 if (!(h2s->flags & H2_SF_RST_SENT) &&
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002920 h2s_send_rst_stream(h2c, h2s) <= 0)
Willy Tarreaub2e290a2018-03-30 17:35:38 +02002921 goto add_to_list;
Willy Tarreau90c32322017-11-24 08:00:30 +01002922
Willy Tarreau926fa4c2017-11-07 14:42:12 +01002923 if (!(h2s->flags & H2_SF_OUTGOING_DATA) &&
2924 !(h2s->h2c->flags & (H2_CF_GOAWAY_SENT|H2_CF_GOAWAY_FAILED)) &&
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002925 h2c_send_goaway_error(h2c, h2s) <= 0)
2926 return;
Willy Tarreauc7576ea2017-10-29 22:00:09 +01002927
Olivier Houchard435ce2d2018-12-03 18:43:16 +01002928 if (!(h2c->wait_event.wait_reason & SUB_CAN_SEND))
2929 tasklet_wakeup(h2c->wait_event.task);
Willy Tarreau00dd0782018-03-01 16:31:34 +01002930 h2s_close(h2s);
Willy Tarreaub2e290a2018-03-30 17:35:38 +02002931
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002932 return;
2933add_to_list:
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002934 if (LIST_ISEMPTY(&h2s->list)) {
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002935 sw->wait_reason |= SUB_CAN_SEND;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002936 if (h2s->flags & H2_SF_BLK_MFCTL) {
2937 LIST_ADDQ(&h2c->fctl_list, &h2s->list);
2938 h2s->send_wait = sw;
2939 } else if (h2s->flags & (H2_SF_BLK_MBUSY|H2_SF_BLK_MROOM)) {
2940 h2s->send_wait = sw;
2941 LIST_ADDQ(&h2c->send_list, &h2s->list);
2942 }
Willy Tarreaub2e290a2018-03-30 17:35:38 +02002943 }
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002944 /* Let the handler know we want shutr */
2945 sw->handle = (void *)((long)sw->handle | 1);
2946
Willy Tarreau62f52692017-10-08 23:01:42 +02002947}
2948
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002949static void h2_do_shutw(struct h2s *h2s)
Willy Tarreau62f52692017-10-08 23:01:42 +02002950{
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002951 struct h2c *h2c = h2s->h2c;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002952 struct wait_event *sw = &h2s->wait_event;
Willy Tarreauc7576ea2017-10-29 22:00:09 +01002953
Willy Tarreau721c9742017-11-07 11:05:42 +01002954 if (h2s->st == H2_SS_HLOC || h2s->st == H2_SS_ERROR || h2s->st == H2_SS_CLOSED)
Willy Tarreauc7576ea2017-10-29 22:00:09 +01002955 return;
2956
Willy Tarreau67434202017-11-06 20:20:51 +01002957 if (h2s->flags & H2_SF_HEADERS_SENT) {
Willy Tarreau58e32082017-11-07 14:41:09 +01002958 /* we can cleanly close using an empty data frame only after headers */
2959
2960 if (!(h2s->flags & (H2_SF_ES_SENT|H2_SF_RST_SENT)) &&
2961 h2_send_empty_data_es(h2s) <= 0)
Willy Tarreaub2e290a2018-03-30 17:35:38 +02002962 goto add_to_list;
Willy Tarreau58e32082017-11-07 14:41:09 +01002963
2964 if (h2s->st == H2_SS_HREM)
Willy Tarreau00dd0782018-03-01 16:31:34 +01002965 h2s_close(h2s);
Willy Tarreau58e32082017-11-07 14:41:09 +01002966 else
2967 h2s->st = H2_SS_HLOC;
Willy Tarreauc7576ea2017-10-29 22:00:09 +01002968 } else {
Willy Tarreau926fa4c2017-11-07 14:42:12 +01002969 /* if no outgoing data was seen on this stream, it means it was
2970 * closed with a "tcp-request content" rule that is normally
2971 * used to kill the connection ASAP (eg: limit abuse). In this
2972 * case we send a goaway to close the connection.
Willy Tarreaua1349f02017-10-31 07:41:55 +01002973 */
Willy Tarreau90c32322017-11-24 08:00:30 +01002974 if (!(h2s->flags & H2_SF_RST_SENT) &&
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002975 h2s_send_rst_stream(h2c, h2s) <= 0)
Willy Tarreaub2e290a2018-03-30 17:35:38 +02002976 goto add_to_list;
Willy Tarreau90c32322017-11-24 08:00:30 +01002977
Willy Tarreau926fa4c2017-11-07 14:42:12 +01002978 if (!(h2s->flags & H2_SF_OUTGOING_DATA) &&
2979 !(h2s->h2c->flags & (H2_CF_GOAWAY_SENT|H2_CF_GOAWAY_FAILED)) &&
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002980 h2c_send_goaway_error(h2c, h2s) <= 0)
Willy Tarreaub2e290a2018-03-30 17:35:38 +02002981 goto add_to_list;
Willy Tarreaua1349f02017-10-31 07:41:55 +01002982
Willy Tarreau00dd0782018-03-01 16:31:34 +01002983 h2s_close(h2s);
Willy Tarreauc7576ea2017-10-29 22:00:09 +01002984 }
2985
Olivier Houchard435ce2d2018-12-03 18:43:16 +01002986 if (!(h2c->wait_event.wait_reason & SUB_CAN_SEND))
2987 tasklet_wakeup(h2c->wait_event.task);
2988 return;
Willy Tarreaub2e290a2018-03-30 17:35:38 +02002989
2990 add_to_list:
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002991 if (LIST_ISEMPTY(&h2s->list)) {
Olivier Houchard8ae735d2018-09-11 18:24:28 +02002992 sw->wait_reason |= SUB_CAN_SEND;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02002993 if (h2s->flags & H2_SF_BLK_MFCTL) {
2994 LIST_ADDQ(&h2c->fctl_list, &h2s->list);
2995 h2s->send_wait = sw;
2996 } else if (h2s->flags & (H2_SF_BLK_MBUSY|H2_SF_BLK_MROOM)) {
2997 h2s->send_wait = sw;
2998 LIST_ADDQ(&h2c->send_list, &h2s->list);
2999 }
Willy Tarreaub2e290a2018-03-30 17:35:38 +02003000 }
Olivier Houchardfa8aa862018-10-10 18:25:41 +02003001 /* let the handler know we want to shutw */
3002 sw->handle = (void *)((long)(sw->handle) | 2);
3003
Olivier Houchard8ae735d2018-09-11 18:24:28 +02003004}
3005
3006static struct task *h2_deferred_shut(struct task *t, void *ctx, unsigned short state)
3007{
3008 struct h2s *h2s = ctx;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02003009 long reason = (long)h2s->wait_event.handle;
Olivier Houchard8ae735d2018-09-11 18:24:28 +02003010
Olivier Houchard2c68a462018-12-15 22:42:20 +01003011 if (h2s->send_wait) {
3012 h2s->send_wait->wait_reason &= ~SUB_CALL_UNSUBSCRIBE;
3013 h2s->send_wait = NULL;
3014 LIST_DEL(&h2s->list);
3015 LIST_INIT(&h2s->list);
3016 }
Olivier Houchard8ae735d2018-09-11 18:24:28 +02003017 if (reason & 2)
3018 h2_do_shutw(h2s);
Olivier Houchard2c68a462018-12-15 22:42:20 +01003019 if (reason & 1)
3020 h2_do_shutr(h2s);
Olivier Houchard8ae735d2018-09-11 18:24:28 +02003021
Olivier Houchard2c68a462018-12-15 22:42:20 +01003022 if (h2s->st == H2_SS_CLOSED &&
Olivier Houchardffda58b2018-12-16 01:29:11 +01003023 !((h2s->flags & (H2_SF_BLK_MBUSY | H2_SF_BLK_MROOM | H2_SF_BLK_MFCTL))) && !h2s->cs)
Olivier Houchard2c68a462018-12-15 22:42:20 +01003024 h2s_destroy(h2s);
Olivier Houchard8ae735d2018-09-11 18:24:28 +02003025 return NULL;
Willy Tarreau62f52692017-10-08 23:01:42 +02003026}
3027
Olivier Houchard8ae735d2018-09-11 18:24:28 +02003028static void h2_shutr(struct conn_stream *cs, enum cs_shr_mode mode)
3029{
3030 struct h2s *h2s = cs->ctx;
3031
3032 if (!mode)
3033 return;
3034
3035 h2_do_shutr(h2s);
3036}
3037
3038static void h2_shutw(struct conn_stream *cs, enum cs_shw_mode mode)
3039{
3040 struct h2s *h2s = cs->ctx;
3041
3042 h2_do_shutw(h2s);
3043}
3044
Willy Tarreaubd4a6b62018-11-27 09:29:36 +01003045/* Decode the payload of a HEADERS frame and produce the equivalent HTTP/1 or
Willy Tarreauc3e18f32018-10-08 14:51:56 +02003046 * HTX request or response depending on the connection's side. Returns the
3047 * number of bytes emitted if > 0, or 0 if it couldn't proceed. Stream errors
3048 * are reported in h2s->errcode and connection errors in h2c->errcode.
Willy Tarreau13278b42017-10-13 19:23:14 +02003049 */
Willy Tarreauc3e18f32018-10-08 14:51:56 +02003050static int h2s_decode_headers(struct h2s *h2s)
Willy Tarreau13278b42017-10-13 19:23:14 +02003051{
3052 struct h2c *h2c = h2s->h2c;
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003053 const uint8_t *hdrs = (uint8_t *)b_head(&h2c->dbuf);
Willy Tarreau83061a82018-07-13 11:56:34 +02003054 struct buffer *tmp = get_trash_chunk();
Willy Tarreau59a10fb2017-11-21 20:03:02 +01003055 struct http_hdr list[MAX_HTTP_HDR * 2];
Willy Tarreau83061a82018-07-13 11:56:34 +02003056 struct buffer *copy = NULL;
Willy Tarreau174b06a2018-04-25 18:13:58 +02003057 unsigned int msgf;
Willy Tarreau937f7602018-02-26 15:22:17 +01003058 struct buffer *csbuf;
Willy Tarreaubd4a6b62018-11-27 09:29:36 +01003059 struct htx *htx = NULL;
Willy Tarreau13278b42017-10-13 19:23:14 +02003060 int flen = h2c->dfl;
3061 int outlen = 0;
3062 int wrap;
Willy Tarreaubd4a6b62018-11-27 09:29:36 +01003063 int try = 0;
Willy Tarreau13278b42017-10-13 19:23:14 +02003064
3065 if (!h2c->dfl) {
3066 h2s_error(h2s, H2_ERR_PROTOCOL_ERROR); // empty headers frame!
Willy Tarreaua20a5192017-12-27 11:02:06 +01003067 h2c->st0 = H2_CS_FRAME_E;
Willy Tarreau13278b42017-10-13 19:23:14 +02003068 return 0;
3069 }
3070
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003071 if (b_data(&h2c->dbuf) < h2c->dfl && !b_full(&h2c->dbuf))
Willy Tarreau68472622017-12-11 18:36:37 +01003072 return 0; // incomplete input frame
3073
Willy Tarreau13278b42017-10-13 19:23:14 +02003074 /* if the input buffer wraps, take a temporary copy of it (rare) */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003075 wrap = b_wrap(&h2c->dbuf) - b_head(&h2c->dbuf);
Willy Tarreau13278b42017-10-13 19:23:14 +02003076 if (wrap < h2c->dfl) {
Willy Tarreau68dd9852017-07-03 14:44:26 +02003077 copy = alloc_trash_chunk();
3078 if (!copy) {
3079 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
3080 goto fail;
3081 }
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003082 memcpy(copy->area, b_head(&h2c->dbuf), wrap);
3083 memcpy(copy->area + wrap, b_orig(&h2c->dbuf), h2c->dfl - wrap);
3084 hdrs = (uint8_t *) copy->area;
Willy Tarreau13278b42017-10-13 19:23:14 +02003085 }
3086
3087 /* The padlen is the first byte before data, and the padding appears
3088 * after data. padlen+data+padding are included in flen.
3089 */
3090 if (h2c->dff & H2_F_HEADERS_PADDED) {
Willy Tarreau05e5daf2017-12-11 15:17:36 +01003091 h2c->dpl = *hdrs;
3092 if (h2c->dpl >= flen) {
Willy Tarreau13278b42017-10-13 19:23:14 +02003093 /* RFC7540#6.2 : pad length = length of frame payload or greater */
3094 h2c_error(h2c, H2_ERR_PROTOCOL_ERROR);
Willy Tarreaua0d11b62018-09-05 18:30:05 +02003095 goto fail;
Willy Tarreau13278b42017-10-13 19:23:14 +02003096 }
Willy Tarreau05e5daf2017-12-11 15:17:36 +01003097 flen -= h2c->dpl + 1;
Willy Tarreau13278b42017-10-13 19:23:14 +02003098 hdrs += 1; // skip Pad Length
3099 }
3100
3101 /* Skip StreamDep and weight for now (we don't support PRIORITY) */
3102 if (h2c->dff & H2_F_HEADERS_PRIORITY) {
Willy Tarreau18b86cd2017-12-03 19:24:50 +01003103 if (read_n32(hdrs) == h2s->id) {
3104 /* RFC7540#5.3.1 : stream dep may not depend on itself */
3105 h2c_error(h2c, H2_ERR_PROTOCOL_ERROR);
Willy Tarreaua0d11b62018-09-05 18:30:05 +02003106 goto fail;
Willy Tarreau18b86cd2017-12-03 19:24:50 +01003107 }
3108
Willy Tarreau13278b42017-10-13 19:23:14 +02003109 hdrs += 5; // stream dep = 4, weight = 1
3110 flen -= 5;
3111 }
3112
3113 /* FIXME: lack of END_HEADERS means there's a continuation frame, we
3114 * don't support this for now and can't even decompress so we have to
3115 * break the connection.
3116 */
3117 if (!(h2c->dff & H2_F_HEADERS_END_HEADERS)) {
3118 h2c_error(h2c, H2_ERR_INTERNAL_ERROR);
Willy Tarreau68dd9852017-07-03 14:44:26 +02003119 goto fail;
Willy Tarreau13278b42017-10-13 19:23:14 +02003120 }
3121
Olivier Houchard638b7992018-08-16 15:41:52 +02003122 csbuf = h2_get_buf(h2c, &h2s->rxbuf);
Willy Tarreau937f7602018-02-26 15:22:17 +01003123 if (!csbuf) {
3124 h2c->flags |= H2_CF_DEM_SALLOC;
Willy Tarreau59a10fb2017-11-21 20:03:02 +01003125 goto fail;
3126 }
Willy Tarreau13278b42017-10-13 19:23:14 +02003127
Willy Tarreau937f7602018-02-26 15:22:17 +01003128 /* we can't retry a failed decompression operation so we must be very
3129 * careful not to take any risks. In practice the output buffer is
3130 * always empty except maybe for trailers, in which case we simply have
3131 * to wait for the upper layer to finish consuming what is available.
3132 */
Willy Tarreaubd4a6b62018-11-27 09:29:36 +01003133
3134 if (h2c->proxy->options2 & PR_O2_USE_HTX) {
3135 htx = htx_from_buf(&h2s->rxbuf);
3136 if (!htx_is_empty(htx))
3137 goto fail;
3138 } else {
3139 if (b_data(csbuf))
3140 goto fail;
Willy Tarreau59a10fb2017-11-21 20:03:02 +01003141
Willy Tarreaubd4a6b62018-11-27 09:29:36 +01003142 csbuf->head = 0;
3143 try = b_size(csbuf);
3144 }
Willy Tarreau59a10fb2017-11-21 20:03:02 +01003145
3146 outlen = hpack_decode_frame(h2c->ddht, hdrs, flen, list,
3147 sizeof(list)/sizeof(list[0]), tmp);
3148 if (outlen < 0) {
3149 h2c_error(h2c, H2_ERR_COMPRESSION_ERROR);
3150 goto fail;
3151 }
3152
3153 /* OK now we have our header list in <list> */
Willy Tarreau174b06a2018-04-25 18:13:58 +02003154 msgf = (h2c->dff & H2_F_DATA_END_STREAM) ? 0 : H2_MSGF_BODY;
Willy Tarreaubd4a6b62018-11-27 09:29:36 +01003155
Willy Tarreauc3e18f32018-10-08 14:51:56 +02003156 if (htx) {
3157 /* HTX mode */
3158 if (h2c->flags & H2_CF_IS_BACK)
3159 outlen = h2_make_htx_response(list, htx, &msgf);
3160 else
3161 outlen = h2_make_htx_request(list, htx, &msgf);
3162 } else {
3163 /* HTTP/1 mode */
Willy Tarreaubd4a6b62018-11-27 09:29:36 +01003164 outlen = h2_make_h1_request(list, b_tail(csbuf), try, &msgf);
Willy Tarreauc3e18f32018-10-08 14:51:56 +02003165 }
Willy Tarreau59a10fb2017-11-21 20:03:02 +01003166
3167 if (outlen < 0) {
3168 h2c_error(h2c, H2_ERR_COMPRESSION_ERROR);
3169 goto fail;
3170 }
Willy Tarreau13278b42017-10-13 19:23:14 +02003171
Willy Tarreau174b06a2018-04-25 18:13:58 +02003172 if (msgf & H2_MSGF_BODY) {
3173 /* a payload is present */
3174 if (msgf & H2_MSGF_BODY_CL)
3175 h2s->flags |= H2_SF_DATA_CLEN;
Olivier Houchard50d660c2018-12-08 00:18:31 +01003176 else if (!(msgf & H2_MSGF_BODY_TUNNEL) && !htx)
Willy Tarreau174b06a2018-04-25 18:13:58 +02003177 h2s->flags |= H2_SF_DATA_CHNK;
3178 }
3179
Willy Tarreau13278b42017-10-13 19:23:14 +02003180 /* now consume the input data */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003181 b_del(&h2c->dbuf, h2c->dfl);
Willy Tarreau13278b42017-10-13 19:23:14 +02003182 h2c->st0 = H2_CS_FRAME_H;
Willy Tarreau937f7602018-02-26 15:22:17 +01003183 b_add(csbuf, outlen);
Willy Tarreau13278b42017-10-13 19:23:14 +02003184
Willy Tarreau39d68502018-03-02 12:26:37 +01003185 if (h2c->dff & H2_F_HEADERS_END_STREAM) {
Willy Tarreau13278b42017-10-13 19:23:14 +02003186 h2s->flags |= H2_SF_ES_RCVD;
Willy Tarreau39d68502018-03-02 12:26:37 +01003187 h2s->cs->flags |= CS_FL_REOS;
Willy Tarreaubd4a6b62018-11-27 09:29:36 +01003188 if (htx)
3189 htx_add_endof(htx, HTX_BLK_EOM);
Willy Tarreau39d68502018-03-02 12:26:37 +01003190 }
Willy Tarreau937f7602018-02-26 15:22:17 +01003191
Willy Tarreau68dd9852017-07-03 14:44:26 +02003192 leave:
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003193 if (htx)
3194 htx_to_buf(htx, &h2s->rxbuf);
Willy Tarreau68dd9852017-07-03 14:44:26 +02003195 free_trash_chunk(copy);
Willy Tarreau13278b42017-10-13 19:23:14 +02003196 return outlen;
Willy Tarreau68dd9852017-07-03 14:44:26 +02003197 fail:
3198 outlen = 0;
3199 goto leave;
Willy Tarreau13278b42017-10-13 19:23:14 +02003200}
3201
Willy Tarreau454f9052017-10-26 19:40:35 +02003202/* Transfer the payload of a DATA frame to the HTTP/1 side. When content-length
3203 * or a tunnel is used, the contents are copied as-is. When chunked encoding is
3204 * in use, a new chunk is emitted for each frame. This is supposed to fit
3205 * because the smallest chunk takes 1 byte for the size, 2 for CRLF, X for the
3206 * data, 2 for the extra CRLF, so that's 5+X, while on the H2 side the smallest
3207 * frame will be 9+X bytes based on the same buffer size. The HTTP/2 frame
Willy Tarreau61ea7dc2018-12-01 23:23:04 +01003208 * parser state is automatically updated. Returns > 0 if it could completely
3209 * send the current frame, 0 if it couldn't complete, in which case
3210 * CS_FL_RCV_MORE must be checked to know if some data remain pending (an empty
3211 * DATA frame can return 0 as a valid result). Stream errors are reported in
3212 * h2s->errcode and connection errors in h2c->errcode. The caller must already
3213 * have checked the frame header and ensured that the frame was complete or the
3214 * buffer full. It changes the frame state to FRAME_A once done.
Willy Tarreau454f9052017-10-26 19:40:35 +02003215 */
Willy Tarreau454b57b2018-02-26 15:50:05 +01003216static int h2_frt_transfer_data(struct h2s *h2s)
Willy Tarreau454f9052017-10-26 19:40:35 +02003217{
3218 struct h2c *h2c = h2s->h2c;
3219 int block1, block2;
Willy Tarreaud755ea62018-02-26 15:44:54 +01003220 unsigned int flen = 0;
Willy Tarreaueba10f22018-04-25 20:44:22 +02003221 unsigned int chklen = 0;
Willy Tarreau61ea7dc2018-12-01 23:23:04 +01003222 struct htx *htx = NULL;
Willy Tarreaud755ea62018-02-26 15:44:54 +01003223 struct buffer *csbuf;
Willy Tarreau454f9052017-10-26 19:40:35 +02003224
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003225 h2c->flags &= ~H2_CF_DEM_SFULL;
Willy Tarreau454f9052017-10-26 19:40:35 +02003226
3227 /* The padlen is the first byte before data, and the padding appears
3228 * after data. padlen+data+padding are included in flen.
3229 */
Willy Tarreau79127812017-12-03 21:06:59 +01003230 if (h2c->dff & H2_F_DATA_PADDED) {
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003231 if (b_data(&h2c->dbuf) < 1)
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003232 return 0;
3233
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003234 h2c->dpl = *(uint8_t *)b_head(&h2c->dbuf);
Willy Tarreau05e5daf2017-12-11 15:17:36 +01003235 if (h2c->dpl >= h2c->dfl) {
Willy Tarreau454f9052017-10-26 19:40:35 +02003236 /* RFC7540#6.1 : pad length = length of frame payload or greater */
3237 h2c_error(h2c, H2_ERR_PROTOCOL_ERROR);
Willy Tarreau454f9052017-10-26 19:40:35 +02003238 return 0;
3239 }
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003240
3241 /* skip the padlen byte */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003242 b_del(&h2c->dbuf, 1);
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003243 h2c->dfl--;
3244 h2c->rcvd_c++; h2c->rcvd_s++;
3245 h2c->dff &= ~H2_F_DATA_PADDED;
Willy Tarreau454f9052017-10-26 19:40:35 +02003246 }
3247
Olivier Houchard638b7992018-08-16 15:41:52 +02003248 csbuf = h2_get_buf(h2c, &h2s->rxbuf);
Willy Tarreaud755ea62018-02-26 15:44:54 +01003249 if (!csbuf) {
3250 h2c->flags |= H2_CF_DEM_SALLOC;
Willy Tarreau454b57b2018-02-26 15:50:05 +01003251 goto fail;
Willy Tarreaud755ea62018-02-26 15:44:54 +01003252 }
3253
Willy Tarreau61ea7dc2018-12-01 23:23:04 +01003254try_again:
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003255 flen = h2c->dfl - h2c->dpl;
3256 if (!flen)
Willy Tarreau4a28da12018-01-04 14:41:00 +01003257 goto end_transfer;
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003258
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003259 if (flen > b_data(&h2c->dbuf)) {
3260 flen = b_data(&h2c->dbuf);
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003261 if (!flen)
Willy Tarreau454b57b2018-02-26 15:50:05 +01003262 goto fail;
Willy Tarreaud755ea62018-02-26 15:44:54 +01003263 }
3264
Willy Tarreau61ea7dc2018-12-01 23:23:04 +01003265 if (h2c->proxy->options2 & PR_O2_USE_HTX) {
3266 htx = htx_from_buf(csbuf);
3267 block1 = htx_free_data_space(htx);
3268 if (!block1) {
3269 h2c->flags |= H2_CF_DEM_SFULL;
3270 goto fail;
3271 }
3272 if (flen > block1)
3273 flen = block1;
3274
3275 /* here, flen is the max we can copy into the output buffer */
3276 block1 = b_contig_data(&h2c->dbuf, 0);
3277 if (flen > block1)
3278 flen = block1;
3279
3280 if (!htx_add_data(htx, ist2(b_head(&h2c->dbuf), flen))) {
3281 h2c->flags |= H2_CF_DEM_SFULL;
3282 goto fail;
3283 }
3284
3285 b_del(&h2c->dbuf, flen);
3286 h2c->dfl -= flen;
3287 h2c->rcvd_c += flen;
3288 h2c->rcvd_s += flen; // warning, this can also affect the closed streams!
3289 goto try_again;
3290 }
3291 else if (unlikely(b_space_wraps(csbuf))) {
Willy Tarreaud755ea62018-02-26 15:44:54 +01003292 /* it doesn't fit and the buffer is fragmented,
3293 * so let's defragment it and try again.
3294 */
3295 b_slow_realign(csbuf, trash.area, 0);
Willy Tarreau454f9052017-10-26 19:40:35 +02003296 }
3297
Willy Tarreaueba10f22018-04-25 20:44:22 +02003298 /* chunked-encoding requires more room */
3299 if (h2s->flags & H2_SF_DATA_CHNK) {
Willy Tarreaud755ea62018-02-26 15:44:54 +01003300 chklen = MIN(flen, b_room(csbuf));
Willy Tarreaueba10f22018-04-25 20:44:22 +02003301 chklen = (chklen < 16) ? 1 : (chklen < 256) ? 2 :
3302 (chklen < 4096) ? 3 : (chklen < 65536) ? 4 :
3303 (chklen < 1048576) ? 4 : 8;
3304 chklen += 4; // CRLF, CRLF
3305 }
3306
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003307 /* does it fit in output buffer or should we wait ? */
Willy Tarreaud755ea62018-02-26 15:44:54 +01003308 if (flen + chklen > b_room(csbuf)) {
3309 if (chklen >= b_room(csbuf)) {
3310 h2c->flags |= H2_CF_DEM_SFULL;
Willy Tarreau454b57b2018-02-26 15:50:05 +01003311 goto fail;
Willy Tarreaud755ea62018-02-26 15:44:54 +01003312 }
3313 flen = b_room(csbuf) - chklen;
Willy Tarreaueba10f22018-04-25 20:44:22 +02003314 }
3315
3316 if (h2s->flags & H2_SF_DATA_CHNK) {
3317 /* emit the chunk size */
3318 unsigned int chksz = flen;
3319 char str[10];
3320 char *beg;
3321
3322 beg = str + sizeof(str);
3323 *--beg = '\n';
3324 *--beg = '\r';
3325 do {
3326 *--beg = hextab[chksz & 0xF];
3327 } while (chksz >>= 4);
Willy Tarreaud755ea62018-02-26 15:44:54 +01003328 b_putblk(csbuf, beg, str + sizeof(str) - beg);
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003329 }
3330
Willy Tarreau454f9052017-10-26 19:40:35 +02003331 /* Block1 is the length of the first block before the buffer wraps,
3332 * block2 is the optional second block to reach the end of the frame.
3333 */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003334 block1 = b_contig_data(&h2c->dbuf, 0);
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003335 if (block1 > flen)
3336 block1 = flen;
Willy Tarreau454f9052017-10-26 19:40:35 +02003337 block2 = flen - block1;
3338
3339 if (block1)
Willy Tarreaud755ea62018-02-26 15:44:54 +01003340 b_putblk(csbuf, b_head(&h2c->dbuf), block1);
Willy Tarreau454f9052017-10-26 19:40:35 +02003341
3342 if (block2)
Willy Tarreaud755ea62018-02-26 15:44:54 +01003343 b_putblk(csbuf, b_peek(&h2c->dbuf, block1), block2);
Willy Tarreau454f9052017-10-26 19:40:35 +02003344
Willy Tarreaueba10f22018-04-25 20:44:22 +02003345 if (h2s->flags & H2_SF_DATA_CHNK) {
3346 /* emit the CRLF */
Willy Tarreaud755ea62018-02-26 15:44:54 +01003347 b_putblk(csbuf, "\r\n", 2);
Willy Tarreaueba10f22018-04-25 20:44:22 +02003348 }
3349
Willy Tarreau454f9052017-10-26 19:40:35 +02003350 /* now mark the input data as consumed (will be deleted from the buffer
3351 * by the caller when seeing FRAME_A after sending the window update).
3352 */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003353 b_del(&h2c->dbuf, flen);
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003354 h2c->dfl -= flen;
3355 h2c->rcvd_c += flen;
3356 h2c->rcvd_s += flen; // warning, this can also affect the closed streams!
3357
3358 if (h2c->dfl > h2c->dpl) {
3359 /* more data available, transfer stalled on stream full */
Willy Tarreaud755ea62018-02-26 15:44:54 +01003360 h2c->flags |= H2_CF_DEM_SFULL;
Willy Tarreau454b57b2018-02-26 15:50:05 +01003361 goto fail;
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003362 }
3363
Willy Tarreau4a28da12018-01-04 14:41:00 +01003364 end_transfer:
Willy Tarreau8fc016d2017-12-11 18:27:15 +01003365 /* here we're done with the frame, all the payload (except padding) was
3366 * transferred.
3367 */
Willy Tarreaueba10f22018-04-25 20:44:22 +02003368
Willy Tarreau61ea7dc2018-12-01 23:23:04 +01003369 if (h2c->dff & H2_F_DATA_END_STREAM) {
3370 if (htx) {
3371 if (!htx_add_endof(htx, HTX_BLK_EOM)) {
3372 h2c->flags |= H2_CF_DEM_SFULL;
3373 goto fail;
3374 }
Willy Tarreaud755ea62018-02-26 15:44:54 +01003375 }
Willy Tarreau61ea7dc2018-12-01 23:23:04 +01003376 else if (h2s->flags & H2_SF_DATA_CHNK) {
3377 /* emit the trailing 0 CRLF CRLF */
3378 if (b_room(csbuf) < 5) {
3379 h2c->flags |= H2_CF_DEM_SFULL;
3380 goto fail;
3381 }
3382 chklen += 5;
3383 b_putblk(csbuf, "0\r\n\r\n", 5);
3384 }
Willy Tarreaueba10f22018-04-25 20:44:22 +02003385 }
3386
Willy Tarreaud1023bb2018-03-22 16:53:12 +01003387 h2c->rcvd_c += h2c->dpl;
3388 h2c->rcvd_s += h2c->dpl;
3389 h2c->dpl = 0;
Willy Tarreau454f9052017-10-26 19:40:35 +02003390 h2c->st0 = H2_CS_FRAME_A; // send the corresponding window update
3391
Willy Tarreau39d68502018-03-02 12:26:37 +01003392 if (h2c->dff & H2_F_DATA_END_STREAM) {
Willy Tarreau454f9052017-10-26 19:40:35 +02003393 h2s->flags |= H2_SF_ES_RCVD;
Willy Tarreau39d68502018-03-02 12:26:37 +01003394 h2s->cs->flags |= CS_FL_REOS;
3395 }
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003396 if (htx)
3397 htx_to_buf(htx, csbuf);
Willy Tarreau61ea7dc2018-12-01 23:23:04 +01003398 return 1;
Willy Tarreau454b57b2018-02-26 15:50:05 +01003399 fail:
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003400 if (htx)
3401 htx_to_buf(htx, csbuf);
Willy Tarreau454b57b2018-02-26 15:50:05 +01003402 return 0;
Willy Tarreau454f9052017-10-26 19:40:35 +02003403}
3404
Willy Tarreau5dd17352018-06-14 13:33:30 +02003405/* Try to send a HEADERS frame matching HTTP/1 response present at offset <ofs>
3406 * and for <max> bytes in buffer <buf> for the H2 stream <h2s>. Returns the
3407 * number of bytes sent. The caller must check the stream's status to detect
3408 * any error which might have happened subsequently to a successful send.
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003409 */
Willy Tarreau206ba832018-06-14 15:27:31 +02003410static size_t h2s_frt_make_resp_headers(struct h2s *h2s, const struct buffer *buf, size_t ofs, size_t max)
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003411{
3412 struct http_hdr list[MAX_HTTP_HDR];
3413 struct h2c *h2c = h2s->h2c;
Willy Tarreaua40704a2018-09-11 13:52:04 +02003414 struct h1m *h1m = &h2s->h1m;
Willy Tarreau83061a82018-07-13 11:56:34 +02003415 struct buffer outbuf;
Willy Tarreau9c5e22e2018-09-11 19:22:14 +02003416 union h1_sl sl;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003417 int es_now = 0;
3418 int ret = 0;
3419 int hdr;
3420
3421 if (h2c_mux_busy(h2c, h2s)) {
3422 h2s->flags |= H2_SF_BLK_MBUSY;
3423 return 0;
3424 }
3425
Willy Tarreau44e973f2018-03-01 17:49:30 +01003426 if (!h2_get_buf(h2c, &h2c->mbuf)) {
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003427 h2c->flags |= H2_CF_MUX_MALLOC;
3428 h2s->flags |= H2_SF_BLK_MROOM;
3429 return 0;
3430 }
3431
3432 /* First, try to parse the H1 response and index it into <list>.
3433 * NOTE! Since it comes from haproxy, we *know* that a response header
3434 * block does not wrap and we can safely read it this way without
3435 * having to realign the buffer.
3436 */
Willy Tarreau5dd17352018-06-14 13:33:30 +02003437 ret = h1_headers_to_hdr_list(b_peek(buf, ofs), b_peek(buf, ofs) + max,
Willy Tarreau9c5e22e2018-09-11 19:22:14 +02003438 list, sizeof(list)/sizeof(list[0]), h1m, &sl);
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003439 if (ret <= 0) {
Willy Tarreauf13ef962017-11-02 15:14:19 +01003440 /* incomplete or invalid response, this is abnormal coming from
3441 * haproxy and may only result in a bad errorfile or bad Lua code
3442 * so that won't be fixed, raise an error now.
3443 *
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003444 * FIXME: we should instead add the ability to only return a
3445 * 502 bad gateway. But in theory this is not supposed to
3446 * happen.
3447 */
3448 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
3449 ret = 0;
3450 goto end;
3451 }
3452
Willy Tarreau9c5e22e2018-09-11 19:22:14 +02003453 h2s->status = sl.st.status;
Willy Tarreaudb72da02018-09-13 11:52:20 +02003454
3455 /* certain statuses have no body or an empty one, regardless of
3456 * what the headers say.
3457 */
3458 if (sl.st.status >= 100 && sl.st.status < 200) {
3459 h1m->flags &= ~(H1_MF_CLEN | H1_MF_CHNK);
3460 h1m->curr_len = h1m->body_len = 0;
3461 }
3462 else if (sl.st.status == 204 || sl.st.status == 304) {
3463 /* no contents, claim c-len is present and set to zero */
3464 h1m->flags &= ~H1_MF_CHNK;
3465 h1m->flags |= H1_MF_CLEN;
3466 h1m->curr_len = h1m->body_len = 0;
3467 }
3468
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003469 chunk_reset(&outbuf);
3470
3471 while (1) {
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003472 outbuf.area = b_tail(&h2c->mbuf);
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003473 outbuf.size = b_contig_space(&h2c->mbuf);
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003474 outbuf.data = 0;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003475
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003476 if (outbuf.size >= 9 || !b_space_wraps(&h2c->mbuf))
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003477 break;
3478 realign_again:
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003479 b_slow_realign(&h2c->mbuf, trash.area, b_data(&h2c->mbuf));
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003480 }
3481
Willy Tarreaub5b7d4a2018-09-12 18:51:18 +02003482 if (outbuf.size < 9)
3483 goto full;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003484
3485 /* len: 0x000000 (fill later), type: 1(HEADERS), flags: ENDH=4 */
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003486 memcpy(outbuf.area, "\x00\x00\x00\x01\x04", 5);
3487 write_n32(outbuf.area + 5, h2s->id); // 4 bytes
3488 outbuf.data = 9;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003489
3490 /* encode status, which necessarily is the first one */
Willy Tarreauaafdf582018-12-10 18:06:40 +01003491 if (unlikely(list[0].v.len != 3)) {
Willy Tarreaua87f2022017-11-09 11:23:00 +01003492 /* this is an unparsable response */
3493 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
3494 ret = 0;
3495 goto end;
3496 }
Willy Tarreauaafdf582018-12-10 18:06:40 +01003497
3498 if (!hpack_encode_str_status(&outbuf, h2s->status, list[0].v)) {
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003499 if (b_space_wraps(&h2c->mbuf))
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003500 goto realign_again;
Willy Tarreaub5b7d4a2018-09-12 18:51:18 +02003501 goto full;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003502 }
3503
3504 /* encode all headers, stop at empty name */
3505 for (hdr = 1; hdr < sizeof(list)/sizeof(list[0]); hdr++) {
Willy Tarreaua76e4c22017-11-24 08:17:28 +01003506 /* these ones do not exist in H2 and must be dropped. */
3507 if (isteq(list[hdr].n, ist("connection")) ||
3508 isteq(list[hdr].n, ist("proxy-connection")) ||
3509 isteq(list[hdr].n, ist("keep-alive")) ||
3510 isteq(list[hdr].n, ist("upgrade")) ||
3511 isteq(list[hdr].n, ist("transfer-encoding")))
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003512 continue;
3513
3514 if (isteq(list[hdr].n, ist("")))
3515 break; // end
3516
3517 if (!hpack_encode_header(&outbuf, list[hdr].n, list[hdr].v)) {
3518 /* output full */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003519 if (b_space_wraps(&h2c->mbuf))
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003520 goto realign_again;
Willy Tarreaub5b7d4a2018-09-12 18:51:18 +02003521 goto full;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003522 }
3523 }
3524
3525 /* we may need to add END_STREAM */
3526 if (((h1m->flags & H1_MF_CLEN) && !h1m->body_len) || h2s->cs->flags & CS_FL_SHW)
3527 es_now = 1;
3528
3529 /* update the frame's size */
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003530 h2_set_frame_size(outbuf.area, outbuf.data - 9);
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003531
3532 if (es_now)
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003533 outbuf.area[4] |= H2_F_HEADERS_END_STREAM;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003534
3535 /* consume incoming H1 response */
Willy Tarreau5dd17352018-06-14 13:33:30 +02003536 max -= ret;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003537
3538 /* commit the H2 response */
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003539 b_add(&h2c->mbuf, outbuf.data);
Willy Tarreau67434202017-11-06 20:20:51 +01003540 h2s->flags |= H2_SF_HEADERS_SENT;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003541
3542 /* for now we don't implemented CONTINUATION, so we wait for a
3543 * body or directly end in TRL2.
3544 */
3545 if (es_now) {
Willy Tarreau35a62702018-02-27 15:37:25 +01003546 // trim any possibly pending data (eg: inconsistent content-length)
Willy Tarreau5dd17352018-06-14 13:33:30 +02003547 ret += max;
Willy Tarreau35a62702018-02-27 15:37:25 +01003548
Willy Tarreau801250e2018-09-11 11:45:04 +02003549 h1m->state = H1_MSG_DONE;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003550 h2s->flags |= H2_SF_ES_SENT;
3551 if (h2s->st == H2_SS_OPEN)
3552 h2s->st = H2_SS_HLOC;
3553 else
Willy Tarreau00dd0782018-03-01 16:31:34 +01003554 h2s_close(h2s);
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003555 }
Willy Tarreau9c5e22e2018-09-11 19:22:14 +02003556 else if (h2s->status >= 100 && h2s->status < 200) {
Willy Tarreau87285592017-11-29 15:41:32 +01003557 /* we'll let the caller check if it has more headers to send */
Willy Tarreau7f437ff2018-09-11 13:51:19 +02003558 h1m_init_res(h1m);
Willy Tarreau9b8cd1f2018-09-12 09:24:38 +02003559 h1m->err_pos = -1; // don't care about errors on the response path
Willy Tarreaueb528db2018-09-12 09:54:00 +02003560 h2s->h1m.flags |= H1_MF_TOLOWER;
Willy Tarreau87285592017-11-29 15:41:32 +01003561 goto end;
Willy Tarreauc199faf2017-10-31 08:35:27 +01003562 }
Willy Tarreau001823c2018-09-12 17:25:32 +02003563
3564 /* now the h1m state is either H1_MSG_CHUNK_SIZE or H1_MSG_DATA */
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003565
3566 end:
Dirkjan Bussinkc26c72d2018-09-14 14:30:25 +02003567 //fprintf(stderr, "[%d] sent simple H2 response (sid=%d) = %d bytes (%d in, ep=%u, es=%s)\n", h2c->st0, h2s->id, outbuf.len, ret, h1m->err_pos, h1m_state_str(h1m->err_state));
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003568 return ret;
Willy Tarreaub5b7d4a2018-09-12 18:51:18 +02003569 full:
3570 h1m_init_res(h1m);
3571 h1m->err_pos = -1; // don't care about errors on the response path
3572 h2c->flags |= H2_CF_MUX_MFULL;
3573 h2s->flags |= H2_SF_BLK_MROOM;
3574 ret = 0;
3575 goto end;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02003576}
3577
Willy Tarreau5dd17352018-06-14 13:33:30 +02003578/* Try to send a DATA frame matching HTTP/1 response present at offset <ofs>
3579 * for up to <max> bytes in response buffer <buf>, for stream <h2s>. Returns
3580 * the number of bytes sent. The caller must check the stream's status to
3581 * detect any error which might have happened subsequently to a successful send.
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003582 */
Willy Tarreau206ba832018-06-14 15:27:31 +02003583static size_t h2s_frt_make_resp_data(struct h2s *h2s, const struct buffer *buf, size_t ofs, size_t max)
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003584{
3585 struct h2c *h2c = h2s->h2c;
Willy Tarreaua40704a2018-09-11 13:52:04 +02003586 struct h1m *h1m = &h2s->h1m;
Willy Tarreau83061a82018-07-13 11:56:34 +02003587 struct buffer outbuf;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003588 int ret = 0;
Willy Tarreau1dc41e72018-06-14 13:21:28 +02003589 size_t total = 0;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003590 int es_now = 0;
3591 int size = 0;
Willy Tarreau206ba832018-06-14 15:27:31 +02003592 const char *blk1, *blk2;
Willy Tarreau55f3ce12018-07-18 11:49:27 +02003593 size_t len1, len2;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003594
3595 if (h2c_mux_busy(h2c, h2s)) {
3596 h2s->flags |= H2_SF_BLK_MBUSY;
3597 goto end;
3598 }
3599
Willy Tarreau44e973f2018-03-01 17:49:30 +01003600 if (!h2_get_buf(h2c, &h2c->mbuf)) {
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003601 h2c->flags |= H2_CF_MUX_MALLOC;
3602 h2s->flags |= H2_SF_BLK_MROOM;
3603 goto end;
3604 }
3605
3606 new_frame:
Willy Tarreau5dd17352018-06-14 13:33:30 +02003607 if (!max)
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003608 goto end;
3609
3610 chunk_reset(&outbuf);
3611
3612 while (1) {
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003613 outbuf.area = b_tail(&h2c->mbuf);
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003614 outbuf.size = b_contig_space(&h2c->mbuf);
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003615 outbuf.data = 0;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003616
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003617 if (outbuf.size >= 9 || !b_space_wraps(&h2c->mbuf))
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003618 break;
3619 realign_again:
Willy Tarreau06ae84a2018-12-12 09:17:21 +01003620 /* If there are pending data in the output buffer, and we have
3621 * less than 1/4 of the mbuf's size and everything fits, we'll
3622 * still perform a copy anyway. Otherwise we'll pretend the mbuf
3623 * is full and wait, to save some slow realign calls.
3624 */
3625 if ((max + 9 > b_room(&h2c->mbuf) || max >= b_size(&h2c->mbuf) / 4)) {
3626 h2c->flags |= H2_CF_MUX_MFULL;
3627 h2s->flags |= H2_SF_BLK_MROOM;
3628 goto end;
3629 }
3630
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003631 b_slow_realign(&h2c->mbuf, trash.area, b_data(&h2c->mbuf));
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003632 }
3633
3634 if (outbuf.size < 9) {
3635 h2c->flags |= H2_CF_MUX_MFULL;
3636 h2s->flags |= H2_SF_BLK_MROOM;
3637 goto end;
3638 }
3639
3640 /* len: 0x000000 (fill later), type: 0(DATA), flags: none=0 */
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003641 memcpy(outbuf.area, "\x00\x00\x00\x00\x00", 5);
3642 write_n32(outbuf.area + 5, h2s->id); // 4 bytes
3643 outbuf.data = 9;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003644
3645 switch (h1m->flags & (H1_MF_CLEN|H1_MF_CHNK)) {
3646 case 0: /* no content length, read till SHUTW */
Willy Tarreau5dd17352018-06-14 13:33:30 +02003647 size = max;
Willy Tarreau13e4e942017-12-14 10:55:21 +01003648 h1m->curr_len = size;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003649 break;
3650 case H1_MF_CLEN: /* content-length: read only h2m->body_len */
Willy Tarreau5dd17352018-06-14 13:33:30 +02003651 size = max;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003652 if ((long long)size > h1m->curr_len)
3653 size = h1m->curr_len;
3654 break;
3655 default: /* te:chunked : parse chunks */
Willy Tarreau801250e2018-09-11 11:45:04 +02003656 if (h1m->state == H1_MSG_CHUNK_CRLF) {
Willy Tarreauc0973c62018-06-14 15:53:21 +02003657 ret = h1_skip_chunk_crlf(buf, ofs, ofs + max);
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003658 if (!ret)
3659 goto end;
3660
3661 if (ret < 0) {
3662 /* FIXME: bad contents. how to proceed here when we're in H2 ? */
Willy Tarreau25173a72018-09-12 09:05:16 +02003663 h1m->err_pos = ofs + max + ret;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003664 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
3665 goto end;
3666 }
Willy Tarreau5dd17352018-06-14 13:33:30 +02003667 max -= ret;
3668 ofs += ret;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003669 total += ret;
Willy Tarreau801250e2018-09-11 11:45:04 +02003670 h1m->state = H1_MSG_CHUNK_SIZE;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003671 }
3672
Willy Tarreau801250e2018-09-11 11:45:04 +02003673 if (h1m->state == H1_MSG_CHUNK_SIZE) {
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003674 unsigned int chunk;
Willy Tarreau84d6b7a2018-06-14 15:59:05 +02003675 ret = h1_parse_chunk_size(buf, ofs, ofs + max, &chunk);
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003676 if (!ret)
3677 goto end;
3678
3679 if (ret < 0) {
3680 /* FIXME: bad contents. how to proceed here when we're in H2 ? */
Willy Tarreau25173a72018-09-12 09:05:16 +02003681 h1m->err_pos = ofs + max + ret;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003682 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
3683 goto end;
3684 }
3685
3686 size = chunk;
3687 h1m->curr_len = chunk;
3688 h1m->body_len += chunk;
Willy Tarreau5dd17352018-06-14 13:33:30 +02003689 max -= ret;
3690 ofs += ret;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003691 total += ret;
Willy Tarreau801250e2018-09-11 11:45:04 +02003692 h1m->state = size ? H1_MSG_DATA : H1_MSG_TRAILERS;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003693 if (!size)
3694 goto send_empty;
3695 }
3696
3697 /* in MSG_DATA state, continue below */
3698 size = h1m->curr_len;
3699 break;
3700 }
3701
3702 /* we have in <size> the exact number of bytes we need to copy from
3703 * the H1 buffer. We need to check this against the connection's and
3704 * the stream's send windows, and to ensure that this fits in the max
3705 * frame size and in the buffer's available space minus 9 bytes (for
3706 * the frame header). The connection's flow control is applied last so
3707 * that we can use a separate list of streams which are immediately
3708 * unblocked on window opening. Note: we don't implement padding.
3709 */
3710
Willy Tarreau5dd17352018-06-14 13:33:30 +02003711 if (size > max)
3712 size = max;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003713
3714 if (size > h2s->mws)
3715 size = h2s->mws;
3716
3717 if (size <= 0) {
3718 h2s->flags |= H2_SF_BLK_SFCTL;
Olivier Houcharddddfe312018-10-10 18:51:00 +02003719 if (h2s->send_wait) {
3720 LIST_DEL(&h2s->list);
3721 LIST_INIT(&h2s->list);
3722 }
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003723 goto end;
3724 }
3725
3726 if (h2c->mfs && size > h2c->mfs)
3727 size = h2c->mfs;
3728
3729 if (size + 9 > outbuf.size) {
3730 /* we have an opportunity for enlarging the too small
3731 * available space, let's try.
3732 */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003733 if (b_space_wraps(&h2c->mbuf))
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003734 goto realign_again;
3735 size = outbuf.size - 9;
3736 }
3737
3738 if (size <= 0) {
3739 h2c->flags |= H2_CF_MUX_MFULL;
3740 h2s->flags |= H2_SF_BLK_MROOM;
3741 goto end;
3742 }
3743
3744 if (size > h2c->mws)
3745 size = h2c->mws;
3746
3747 if (size <= 0) {
3748 h2s->flags |= H2_SF_BLK_MFCTL;
3749 goto end;
3750 }
3751
3752 /* copy whatever we can */
3753 blk1 = blk2 = NULL; // silence a maybe-uninitialized warning
Willy Tarreau5dd17352018-06-14 13:33:30 +02003754 ret = b_getblk_nc(buf, &blk1, &len1, &blk2, &len2, ofs, max);
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003755 if (ret == 1)
3756 len2 = 0;
3757
3758 if (!ret || len1 + len2 < size) {
3759 /* FIXME: must normally never happen */
3760 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
3761 goto end;
3762 }
3763
3764 /* limit len1/len2 to size */
3765 if (len1 + len2 > size) {
3766 int sub = len1 + len2 - size;
3767
3768 if (len2 > sub)
3769 len2 -= sub;
3770 else {
3771 sub -= len2;
3772 len2 = 0;
3773 len1 -= sub;
3774 }
3775 }
3776
3777 /* now let's copy this this into the output buffer */
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003778 memcpy(outbuf.area + 9, blk1, len1);
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003779 if (len2)
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003780 memcpy(outbuf.area + 9 + len1, blk2, len2);
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003781
3782 send_empty:
3783 /* we may need to add END_STREAM */
3784 /* FIXME: we should also detect shutdown(w) below, but how ? Maybe we
3785 * could rely on the MSG_MORE flag as a hint for this ?
Willy Tarreau00610962018-07-19 10:58:28 +02003786 *
3787 * FIXME: what we do here is not correct because we send end_stream
3788 * before knowing if we'll have to send a HEADERS frame for the
3789 * trailers. More importantly we're not consuming the trailing CRLF
3790 * after the end of trailers, so it will be left to the caller to
3791 * eat it. The right way to do it would be to measure trailers here
3792 * and to send ES only if there are no trailers.
3793 *
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003794 */
3795 if (((h1m->flags & H1_MF_CLEN) && !(h1m->curr_len - size)) ||
Willy Tarreau801250e2018-09-11 11:45:04 +02003796 !h1m->curr_len || h1m->state >= H1_MSG_DONE)
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003797 es_now = 1;
3798
3799 /* update the frame's size */
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003800 h2_set_frame_size(outbuf.area, size);
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003801
3802 if (es_now)
Willy Tarreau843b7cb2018-07-13 10:54:26 +02003803 outbuf.area[4] |= H2_F_DATA_END_STREAM;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003804
3805 /* commit the H2 response */
Willy Tarreauc9fa0482018-07-10 17:43:27 +02003806 b_add(&h2c->mbuf, size + 9);
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003807
3808 /* consume incoming H1 response */
3809 if (size > 0) {
Willy Tarreau5dd17352018-06-14 13:33:30 +02003810 max -= size;
3811 ofs += size;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003812 total += size;
3813 h1m->curr_len -= size;
3814 h2s->mws -= size;
3815 h2c->mws -= size;
3816
3817 if (size && !h1m->curr_len && (h1m->flags & H1_MF_CHNK)) {
Willy Tarreau801250e2018-09-11 11:45:04 +02003818 h1m->state = H1_MSG_CHUNK_CRLF;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003819 goto new_frame;
3820 }
3821 }
3822
3823 if (es_now) {
3824 if (h2s->st == H2_SS_OPEN)
3825 h2s->st = H2_SS_HLOC;
3826 else
Willy Tarreau00dd0782018-03-01 16:31:34 +01003827 h2s_close(h2s);
Willy Tarreau9d89ac82017-10-31 17:15:59 +01003828
Willy Tarreau35a62702018-02-27 15:37:25 +01003829 if (!(h1m->flags & H1_MF_CHNK)) {
3830 // trim any possibly pending data (eg: inconsistent content-length)
Willy Tarreau5dd17352018-06-14 13:33:30 +02003831 total += max;
3832 ofs += max;
3833 max = 0;
Willy Tarreau35a62702018-02-27 15:37:25 +01003834
Willy Tarreau801250e2018-09-11 11:45:04 +02003835 h1m->state = H1_MSG_DONE;
Willy Tarreau35a62702018-02-27 15:37:25 +01003836 }
Willy Tarreau9d89ac82017-10-31 17:15:59 +01003837
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003838 h2s->flags |= H2_SF_ES_SENT;
3839 }
3840
3841 end:
Dirkjan Bussinkc26c72d2018-09-14 14:30:25 +02003842 trace("[%d] sent simple H2 DATA response (sid=%d) = %d bytes out (%u in, st=%s, ep=%u, es=%s, h2cws=%d h2sws=%d) data=%u", h2c->st0, h2s->id, size+9, (unsigned int)total, h1m_state_str(h1m->state), h1m->err_pos, h1m_state_str(h1m->err_state), h2c->mws, h2s->mws, (unsigned int)b_data(buf));
Willy Tarreauc652dbd2017-10-19 11:16:37 +02003843 return total;
3844}
3845
Willy Tarreau115e83b2018-12-01 19:17:53 +01003846/* Try to send a HEADERS frame matching HTX response present in HTX message
3847 * <htx> for the H2 stream <h2s>. Returns the number of bytes sent. The caller
3848 * must check the stream's status to detect any error which might have happened
3849 * subsequently to a successful send. The htx blocks are automatically removed
3850 * from the message. The htx message is assumed to be valid since produced from
3851 * the internal code, hence it contains a start line, an optional series of
3852 * header blocks and an end of header, otherwise an invalid frame could be
3853 * emitted and the resulting htx message could be left in an inconsistent state.
3854 */
3855static size_t h2s_htx_frt_make_resp_headers(struct h2s *h2s, struct htx *htx)
3856{
3857 struct http_hdr list[MAX_HTTP_HDR];
3858 struct h2c *h2c = h2s->h2c;
3859 struct htx_blk *blk;
3860 struct htx_blk *blk_end;
3861 struct buffer outbuf;
3862 struct htx_sl *sl;
3863 enum htx_blk_type type;
3864 int es_now = 0;
3865 int ret = 0;
3866 int hdr;
3867 int idx;
3868
3869 if (h2c_mux_busy(h2c, h2s)) {
3870 h2s->flags |= H2_SF_BLK_MBUSY;
3871 return 0;
3872 }
3873
3874 if (!h2_get_buf(h2c, &h2c->mbuf)) {
3875 h2c->flags |= H2_CF_MUX_MALLOC;
3876 h2s->flags |= H2_SF_BLK_MROOM;
3877 return 0;
3878 }
3879
3880 /* determine the first block which must not be deleted, blk_end may
3881 * be NULL if all blocks have to be deleted.
3882 */
3883 idx = htx_get_head(htx);
3884 blk_end = NULL;
3885 while (idx != -1) {
3886 type = htx_get_blk_type(htx_get_blk(htx, idx));
3887 idx = htx_get_next(htx, idx);
3888 if (type == HTX_BLK_EOH) {
3889 if (idx != -1)
3890 blk_end = htx_get_blk(htx, idx);
3891 break;
3892 }
3893 }
3894
3895 /* get the start line, we do have one */
Willy Tarreau8e162ee2018-12-06 14:07:27 +01003896 sl = htx_get_stline(htx);
Willy Tarreaue2778a42018-12-08 15:30:46 +01003897 ALREADY_CHECKED(sl);
Willy Tarreau115e83b2018-12-01 19:17:53 +01003898 h2s->status = sl->info.res.status;
Willy Tarreauaafdf582018-12-10 18:06:40 +01003899 if (h2s->status < 100 || h2s->status > 999)
3900 goto fail;
Willy Tarreau115e83b2018-12-01 19:17:53 +01003901
3902 /* and the rest of the headers, that we dump starting at header 0 */
3903 hdr = 0;
3904
Willy Tarreau8e162ee2018-12-06 14:07:27 +01003905 idx = htx_get_head(htx); // returns the SL that we skip
Willy Tarreau115e83b2018-12-01 19:17:53 +01003906 while ((idx = htx_get_next(htx, idx)) != -1) {
3907 blk = htx_get_blk(htx, idx);
3908 type = htx_get_blk_type(blk);
3909
3910 if (type == HTX_BLK_UNUSED)
3911 continue;
3912
3913 if (type != HTX_BLK_HDR)
3914 break;
3915
3916 if (unlikely(hdr >= sizeof(list)/sizeof(list[0]) - 1))
3917 goto fail;
3918
3919 list[hdr].n = htx_get_blk_name(htx, blk);
3920 list[hdr].v = htx_get_blk_value(htx, blk);
Willy Tarreau115e83b2018-12-01 19:17:53 +01003921 hdr++;
3922 }
3923
3924 /* marker for end of headers */
3925 list[hdr].n = ist("");
3926
3927 if (h2s->status == 204 || h2s->status == 304) {
3928 /* no contents, claim c-len is present and set to zero */
3929 es_now = 1;
3930 }
3931
3932 chunk_reset(&outbuf);
3933
3934 while (1) {
3935 outbuf.area = b_tail(&h2c->mbuf);
3936 outbuf.size = b_contig_space(&h2c->mbuf);
3937 outbuf.data = 0;
3938
3939 if (outbuf.size >= 9 || !b_space_wraps(&h2c->mbuf))
3940 break;
3941 realign_again:
3942 b_slow_realign(&h2c->mbuf, trash.area, b_data(&h2c->mbuf));
3943 }
3944
3945 if (outbuf.size < 9)
3946 goto full;
3947
3948 /* len: 0x000000 (fill later), type: 1(HEADERS), flags: ENDH=4 */
3949 memcpy(outbuf.area, "\x00\x00\x00\x01\x04", 5);
3950 write_n32(outbuf.area + 5, h2s->id); // 4 bytes
3951 outbuf.data = 9;
3952
3953 /* encode status, which necessarily is the first one */
Willy Tarreauaafdf582018-12-10 18:06:40 +01003954 if (!hpack_encode_int_status(&outbuf, h2s->status)) {
Willy Tarreau115e83b2018-12-01 19:17:53 +01003955 if (b_space_wraps(&h2c->mbuf))
3956 goto realign_again;
3957 goto full;
3958 }
3959
3960 /* encode all headers, stop at empty name */
3961 for (hdr = 0; hdr < sizeof(list)/sizeof(list[0]); hdr++) {
3962 /* these ones do not exist in H2 and must be dropped. */
3963 if (isteq(list[hdr].n, ist("connection")) ||
3964 isteq(list[hdr].n, ist("proxy-connection")) ||
3965 isteq(list[hdr].n, ist("keep-alive")) ||
3966 isteq(list[hdr].n, ist("upgrade")) ||
3967 isteq(list[hdr].n, ist("transfer-encoding")))
3968 continue;
3969
3970 if (isteq(list[hdr].n, ist("")))
3971 break; // end
3972
3973 if (!hpack_encode_header(&outbuf, list[hdr].n, list[hdr].v)) {
3974 /* output full */
3975 if (b_space_wraps(&h2c->mbuf))
3976 goto realign_again;
3977 goto full;
3978 }
3979 }
3980
3981 /* we may need to add END_STREAM.
3982 * FIXME: we should also set it when we know for sure that the
3983 * content-length is zero as well as on 204/304
3984 */
3985 if (blk_end && htx_get_blk_type(blk_end) == HTX_BLK_EOM)
3986 es_now = 1;
3987
3988 if (h2s->cs->flags & CS_FL_SHW)
3989 es_now = 1;
3990
3991 /* update the frame's size */
3992 h2_set_frame_size(outbuf.area, outbuf.data - 9);
3993
3994 if (es_now)
3995 outbuf.area[4] |= H2_F_HEADERS_END_STREAM;
3996
3997 /* commit the H2 response */
3998 b_add(&h2c->mbuf, outbuf.data);
3999 h2s->flags |= H2_SF_HEADERS_SENT;
4000
4001 /* for now we don't implemented CONTINUATION, so we wait for a
4002 * body or directly end in TRL2.
4003 */
4004 if (es_now) {
4005 h2s->flags |= H2_SF_ES_SENT;
4006 if (h2s->st == H2_SS_OPEN)
4007 h2s->st = H2_SS_HLOC;
4008 else
4009 h2s_close(h2s);
4010 }
4011
4012 /* OK we could properly deliver the response */
4013
4014 /* remove all header blocks including the EOH and compute the
4015 * corresponding size.
4016 *
4017 * FIXME: We should remove everything when es_now is set.
4018 */
4019 ret = 0;
4020 idx = htx_get_head(htx);
4021 blk = htx_get_blk(htx, idx);
4022 while (blk != blk_end) {
4023 ret += htx_get_blksz(blk);
4024 blk = htx_remove_blk(htx, blk);
4025 }
Willy Tarreauc5753ae2018-12-02 12:28:01 +01004026
4027 if (blk_end && htx_get_blk_type(blk_end) == HTX_BLK_EOM)
4028 htx_remove_blk(htx, blk_end);
Willy Tarreau115e83b2018-12-01 19:17:53 +01004029 end:
4030 return ret;
4031 full:
4032 h2c->flags |= H2_CF_MUX_MFULL;
4033 h2s->flags |= H2_SF_BLK_MROOM;
4034 ret = 0;
4035 goto end;
4036 fail:
4037 /* unparsable HTX messages, too large ones to be produced in the local
4038 * list etc go here (unrecoverable errors).
4039 */
4040 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
4041 ret = 0;
4042 goto end;
4043}
4044
Willy Tarreau80739692018-10-05 11:35:57 +02004045/* Try to send a HEADERS frame matching HTX request present in HTX message
4046 * <htx> for the H2 stream <h2s>. Returns the number of bytes sent. The caller
4047 * must check the stream's status to detect any error which might have happened
4048 * subsequently to a successful send. The htx blocks are automatically removed
4049 * from the message. The htx message is assumed to be valid since produced from
4050 * the internal code, hence it contains a start line, an optional series of
4051 * header blocks and an end of header, otherwise an invalid frame could be
4052 * emitted and the resulting htx message could be left in an inconsistent state.
4053 */
4054static size_t h2s_htx_bck_make_req_headers(struct h2s *h2s, struct htx *htx)
4055{
4056 struct http_hdr list[MAX_HTTP_HDR];
4057 struct h2c *h2c = h2s->h2c;
4058 struct htx_blk *blk;
4059 struct htx_blk *blk_end;
4060 struct buffer outbuf;
4061 struct htx_sl *sl;
4062 struct ist meth, path;
4063 enum htx_blk_type type;
4064 int es_now = 0;
4065 int ret = 0;
4066 int hdr;
4067 int idx;
4068
4069 if (h2c_mux_busy(h2c, h2s)) {
4070 h2s->flags |= H2_SF_BLK_MBUSY;
4071 return 0;
4072 }
4073
4074 if (!h2_get_buf(h2c, &h2c->mbuf)) {
4075 h2c->flags |= H2_CF_MUX_MALLOC;
4076 h2s->flags |= H2_SF_BLK_MROOM;
4077 return 0;
4078 }
4079
4080 /* determine the first block which must not be deleted, blk_end may
4081 * be NULL if all blocks have to be deleted.
4082 */
4083 idx = htx_get_head(htx);
4084 blk_end = NULL;
4085 while (idx != -1) {
4086 type = htx_get_blk_type(htx_get_blk(htx, idx));
4087 idx = htx_get_next(htx, idx);
4088 if (type == HTX_BLK_EOH) {
4089 if (idx != -1)
4090 blk_end = htx_get_blk(htx, idx);
4091 break;
4092 }
4093 }
4094
4095 /* get the start line, we do have one */
Willy Tarreau8e162ee2018-12-06 14:07:27 +01004096 sl = htx_get_stline(htx);
Willy Tarreaue2778a42018-12-08 15:30:46 +01004097 ALREADY_CHECKED(sl);
Willy Tarreau80739692018-10-05 11:35:57 +02004098 meth = htx_sl_req_meth(sl);
4099 path = htx_sl_req_uri(sl);
4100
4101 /* and the rest of the headers, that we dump starting at header 0 */
4102 hdr = 0;
4103
Willy Tarreau8e162ee2018-12-06 14:07:27 +01004104 idx = htx_get_head(htx); // returns the SL that we skip
Willy Tarreau80739692018-10-05 11:35:57 +02004105 while ((idx = htx_get_next(htx, idx)) != -1) {
4106 blk = htx_get_blk(htx, idx);
4107 type = htx_get_blk_type(blk);
4108
4109 if (type == HTX_BLK_UNUSED)
4110 continue;
4111
4112 if (type != HTX_BLK_HDR)
4113 break;
4114
4115 if (unlikely(hdr >= sizeof(list)/sizeof(list[0]) - 1))
4116 goto fail;
4117
4118 list[hdr].n = htx_get_blk_name(htx, blk);
4119 list[hdr].v = htx_get_blk_value(htx, blk);
Willy Tarreau80739692018-10-05 11:35:57 +02004120 hdr++;
4121 }
4122
4123 /* marker for end of headers */
4124 list[hdr].n = ist("");
4125
4126 chunk_reset(&outbuf);
4127
4128 while (1) {
4129 outbuf.area = b_tail(&h2c->mbuf);
4130 outbuf.size = b_contig_space(&h2c->mbuf);
4131 outbuf.data = 0;
4132
4133 if (outbuf.size >= 9 || !b_space_wraps(&h2c->mbuf))
4134 break;
4135 realign_again:
4136 b_slow_realign(&h2c->mbuf, trash.area, b_data(&h2c->mbuf));
4137 }
4138
4139 if (outbuf.size < 9)
4140 goto full;
4141
4142 /* len: 0x000000 (fill later), type: 1(HEADERS), flags: ENDH=4 */
4143 memcpy(outbuf.area, "\x00\x00\x00\x01\x04", 5);
4144 write_n32(outbuf.area + 5, h2s->id); // 4 bytes
4145 outbuf.data = 9;
4146
4147 /* encode the method, which necessarily is the first one */
Willy Tarreaubdabc3a2018-12-10 18:25:11 +01004148 if (!hpack_encode_method(&outbuf, sl->info.req.meth, meth)) {
Willy Tarreau80739692018-10-05 11:35:57 +02004149 if (b_space_wraps(&h2c->mbuf))
4150 goto realign_again;
4151 goto full;
4152 }
4153
4154 /* encode the scheme which is always "https" (or 0x86 for "http") */
Willy Tarreau7561bcb2018-12-10 19:17:06 +01004155 if (!hpack_encode_scheme(&outbuf, ist("https"))) {
4156 /* output full */
4157 if (b_space_wraps(&h2c->mbuf))
4158 goto realign_again;
4159 goto full;
4160 }
Willy Tarreau80739692018-10-05 11:35:57 +02004161
4162 /* encode the path, which necessarily is the second one */
Willy Tarreau90799812018-12-10 19:28:38 +01004163 if (!hpack_encode_path(&outbuf, path)) {
Willy Tarreau80739692018-10-05 11:35:57 +02004164 /* output full */
4165 if (b_space_wraps(&h2c->mbuf))
4166 goto realign_again;
4167 goto full;
4168 }
4169
4170 /* encode all headers, stop at empty name */
4171 for (hdr = 0; hdr < sizeof(list)/sizeof(list[0]); hdr++) {
4172 /* these ones do not exist in H2 and must be dropped. */
4173 if (isteq(list[hdr].n, ist("connection")) ||
4174 isteq(list[hdr].n, ist("proxy-connection")) ||
4175 isteq(list[hdr].n, ist("keep-alive")) ||
4176 isteq(list[hdr].n, ist("upgrade")) ||
4177 isteq(list[hdr].n, ist("transfer-encoding")))
4178 continue;
4179
4180 if (isteq(list[hdr].n, ist("")))
4181 break; // end
4182
4183 if (!hpack_encode_header(&outbuf, list[hdr].n, list[hdr].v)) {
4184 /* output full */
4185 if (b_space_wraps(&h2c->mbuf))
4186 goto realign_again;
4187 goto full;
4188 }
4189 }
4190
4191 /* we may need to add END_STREAM if we have no body :
4192 * - request already closed, or :
4193 * - no transfer-encoding, and :
4194 * - no content-length or content-length:0
4195 * Fixme: this doesn't take into account CONNECT requests.
4196 */
4197 if (blk_end && htx_get_blk_type(blk_end) == HTX_BLK_EOM)
4198 es_now = 1;
4199
4200 if (sl->flags & HTX_SL_F_BODYLESS)
4201 es_now = 1;
4202
4203 if (h2s->cs->flags & CS_FL_SHW)
4204 es_now = 1;
4205
4206 /* update the frame's size */
4207 h2_set_frame_size(outbuf.area, outbuf.data - 9);
4208
4209 if (es_now)
4210 outbuf.area[4] |= H2_F_HEADERS_END_STREAM;
4211
4212 /* commit the H2 response */
4213 b_add(&h2c->mbuf, outbuf.data);
4214 h2s->flags |= H2_SF_HEADERS_SENT;
4215 h2s->st = H2_SS_OPEN;
4216
4217 /* for now we don't implemented CONTINUATION, so we wait for a
4218 * body or directly end in TRL2.
4219 */
4220 if (es_now) {
4221 // trim any possibly pending data (eg: inconsistent content-length)
4222 h2s->flags |= H2_SF_ES_SENT;
4223 h2s->st = H2_SS_HLOC;
4224 }
4225
4226 /* remove all header blocks including the EOH and compute the
4227 * corresponding size.
4228 *
4229 * FIXME: We should remove everything when es_now is set.
4230 */
4231 ret = 0;
4232 idx = htx_get_head(htx);
4233 blk = htx_get_blk(htx, idx);
4234 while (blk != blk_end) {
4235 ret += htx_get_blksz(blk);
4236 blk = htx_remove_blk(htx, blk);
4237 }
4238
4239 if (blk_end && htx_get_blk_type(blk_end) == HTX_BLK_EOM)
4240 htx_remove_blk(htx, blk_end);
4241
4242 end:
4243 return ret;
4244 full:
4245 h2c->flags |= H2_CF_MUX_MFULL;
4246 h2s->flags |= H2_SF_BLK_MROOM;
4247 ret = 0;
4248 goto end;
4249 fail:
4250 /* unparsable HTX messages, too large ones to be produced in the local
4251 * list etc go here (unrecoverable errors).
4252 */
4253 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
4254 ret = 0;
4255 goto end;
4256}
4257
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004258/* Try to send a DATA frame matching HTTP response present in HTX structure
Willy Tarreau98de12a2018-12-12 07:03:00 +01004259 * present in <buf>, for stream <h2s>. Returns the number of bytes sent. The
4260 * caller must check the stream's status to detect any error which might have
4261 * happened subsequently to a successful send. Returns the number of data bytes
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004262 * consumed, or zero if nothing done. Note that EOD/EOM count for 1 byte.
4263 */
Willy Tarreau98de12a2018-12-12 07:03:00 +01004264static size_t h2s_htx_frt_make_resp_data(struct h2s *h2s, struct buffer *buf, size_t count)
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004265{
4266 struct h2c *h2c = h2s->h2c;
Willy Tarreau98de12a2018-12-12 07:03:00 +01004267 struct htx *htx;
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004268 struct buffer outbuf;
4269 size_t total = 0;
4270 int es_now = 0;
4271 int bsize; /* htx block size */
4272 int fsize; /* h2 frame size */
4273 struct htx_blk *blk;
4274 enum htx_blk_type type;
4275 int idx;
4276
4277 if (h2c_mux_busy(h2c, h2s)) {
4278 h2s->flags |= H2_SF_BLK_MBUSY;
4279 goto end;
4280 }
4281
4282 if (!h2_get_buf(h2c, &h2c->mbuf)) {
4283 h2c->flags |= H2_CF_MUX_MALLOC;
4284 h2s->flags |= H2_SF_BLK_MROOM;
4285 goto end;
4286 }
4287
Willy Tarreau98de12a2018-12-12 07:03:00 +01004288 htx = htx_from_buf(buf);
4289
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004290 /* We only come here with HTX_BLK_DATA or HTX_BLK_EOD blocks. However,
4291 * while looping, we can meet an HTX_BLK_EOM block that we'll leave to
4292 * the caller to handle.
4293 */
4294
4295 new_frame:
Willy Tarreauee573762018-12-04 15:25:57 +01004296 if (!count || htx_is_empty(htx))
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004297 goto end;
4298
4299 idx = htx_get_head(htx);
4300 blk = htx_get_blk(htx, idx);
4301 type = htx_get_blk_type(blk); // DATA or EOD or EOM
4302 bsize = htx_get_blksz(blk);
4303 fsize = bsize;
4304
4305 if (type == HTX_BLK_EOD) {
4306 /* if we have an EOD, we're dealing with chunked data. We may
4307 * have a set of trailers after us that the caller will want to
4308 * deal with. Let's simply remove the EOD and return.
4309 */
4310 htx_remove_blk(htx, blk);
Willy Tarreauee573762018-12-04 15:25:57 +01004311 total++; // EOD counts as one byte
4312 count--;
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004313 goto end;
4314 }
4315
Willy Tarreau2fb1d4c2018-12-04 15:28:03 +01004316 if (type != HTX_BLK_DATA && type != HTX_BLK_EOM)
4317 goto end;
Willy Tarreau98de12a2018-12-12 07:03:00 +01004318
4319 /* Perform some optimizations to reduce the number of buffer copies.
4320 * First, if the mux's buffer is empty and the htx area contains
4321 * exactly one data block of the same size as the requested count, and
4322 * this count fits within the frame size, the stream's window size, and
4323 * the connection's window size, then it's possible to simply swap the
4324 * caller's buffer with the mux's output buffer and adjust offsets and
4325 * length to match the entire DATA HTX block in the middle. In this
4326 * case we perform a true zero-copy operation from end-to-end. This is
4327 * the situation that happens all the time with large files. Second, if
4328 * this is not possible, but the mux's output buffer is empty, we still
4329 * have an opportunity to avoid the copy to the intermediary buffer, by
4330 * making the intermediary buffer's area point to the output buffer's
4331 * area. In this case we want to skip the HTX header to make sure that
4332 * copies remain aligned and that this operation remains possible all
4333 * the time. This goes for headers, data blocks and any data extracted
4334 * from the HTX blocks.
4335 */
4336 if (unlikely(fsize == count &&
4337 htx->used == 1 && type == HTX_BLK_DATA &&
4338 fsize <= h2s->mws && fsize <= h2c->mws && fsize <= h2c->mfs)) {
4339 void *old_area = h2c->mbuf.area;
4340
4341 if (b_data(&h2c->mbuf)) {
4342 /* too bad there are data left there. If we have less
4343 * than 1/4 of the mbuf's size and everything fits,
4344 * we'll perform a copy anyway. Otherwise we'll pretend
4345 * the mbuf is full and wait.
4346 */
4347 if (fsize <= b_size(&h2c->mbuf) / 4 && fsize + 9 <= b_room(&h2c->mbuf))
4348 goto copy;
4349 h2c->flags |= H2_CF_MUX_MFULL;
4350 h2s->flags |= H2_SF_BLK_MROOM;
4351 goto end;
4352 }
4353
4354 /* map an H2 frame to the HTX block so that we can put the
4355 * frame header there.
4356 */
4357 h2c->mbuf.area = buf->area;
Olivier Houchard84cca662018-12-14 16:28:08 +01004358 h2c->mbuf.head = sizeof(struct htx) + blk->addr - 9;
Willy Tarreau98de12a2018-12-12 07:03:00 +01004359 h2c->mbuf.data = fsize + 9;
4360 outbuf.area = b_head(&h2c->mbuf);
4361
4362 /* prepend an H2 DATA frame header just before the DATA block */
4363 memcpy(outbuf.area, "\x00\x00\x00\x00\x00", 5);
4364 write_n32(outbuf.area + 5, h2s->id); // 4 bytes
4365 h2_set_frame_size(outbuf.area, fsize);
4366
4367 /* update windows */
4368 h2s->mws -= fsize;
4369 h2c->mws -= fsize;
4370
4371 /* and exchange with our old area */
4372 buf->area = old_area;
4373 buf->data = buf->head = 0;
4374 total += fsize;
4375 goto end;
4376 }
Willy Tarreau2fb1d4c2018-12-04 15:28:03 +01004377
Willy Tarreau98de12a2018-12-12 07:03:00 +01004378 copy:
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004379 /* for DATA and EOM we'll have to emit a frame, even if empty */
4380
4381 while (1) {
4382 outbuf.area = b_tail(&h2c->mbuf);
4383 outbuf.size = b_contig_space(&h2c->mbuf);
4384 outbuf.data = 0;
4385
4386 if (outbuf.size >= 9 || !b_space_wraps(&h2c->mbuf))
4387 break;
4388 realign_again:
4389 b_slow_realign(&h2c->mbuf, trash.area, b_data(&h2c->mbuf));
4390 }
4391
4392 if (outbuf.size < 9) {
4393 h2c->flags |= H2_CF_MUX_MFULL;
4394 h2s->flags |= H2_SF_BLK_MROOM;
4395 goto end;
4396 }
4397
4398 /* len: 0x000000 (fill later), type: 0(DATA), flags: none=0 */
4399 memcpy(outbuf.area, "\x00\x00\x00\x00\x00", 5);
4400 write_n32(outbuf.area + 5, h2s->id); // 4 bytes
4401 outbuf.data = 9;
4402
4403 /* we have in <fsize> the exact number of bytes we need to copy from
4404 * the HTX buffer. We need to check this against the connection's and
4405 * the stream's send windows, and to ensure that this fits in the max
4406 * frame size and in the buffer's available space minus 9 bytes (for
4407 * the frame header). The connection's flow control is applied last so
4408 * that we can use a separate list of streams which are immediately
4409 * unblocked on window opening. Note: we don't implement padding.
4410 */
4411
4412 /* EOM is presented with bsize==1 but would lead to the emission of an
4413 * empty frame, thus we force it to zero here.
4414 */
4415 if (type == HTX_BLK_EOM)
4416 bsize = fsize = 0;
4417
4418 if (!fsize)
4419 goto send_empty;
4420
4421 if (h2s->mws <= 0) {
4422 h2s->flags |= H2_SF_BLK_SFCTL;
4423 if (h2s->send_wait) {
4424 LIST_DEL(&h2s->list);
4425 LIST_INIT(&h2s->list);
4426 }
4427 goto end;
4428 }
4429
Willy Tarreauee573762018-12-04 15:25:57 +01004430 if (fsize > count)
4431 fsize = count;
4432
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004433 if (fsize > h2s->mws)
4434 fsize = h2s->mws; // >0
4435
4436 if (h2c->mfs && fsize > h2c->mfs)
4437 fsize = h2c->mfs; // >0
4438
4439 if (fsize + 9 > outbuf.size) {
4440 /* we have an opportunity for enlarging the too small
4441 * available space, let's try.
4442 * FIXME: is this really interesting to do? Maybe we'll
4443 * spend lots of time realigning instead of using two
4444 * frames.
4445 */
4446 if (b_space_wraps(&h2c->mbuf))
4447 goto realign_again;
4448 fsize = outbuf.size - 9;
4449
4450 if (fsize <= 0) {
4451 /* no need to send an empty frame here */
4452 h2c->flags |= H2_CF_MUX_MFULL;
4453 h2s->flags |= H2_SF_BLK_MROOM;
4454 goto end;
4455 }
4456 }
4457
4458 if (h2c->mws <= 0) {
4459 h2s->flags |= H2_SF_BLK_MFCTL;
4460 goto end;
4461 }
4462
4463 if (fsize > h2c->mws)
4464 fsize = h2c->mws;
4465
4466 /* now let's copy this into the output buffer */
4467 memcpy(outbuf.area + 9, htx_get_blk_ptr(htx, blk), fsize);
Willy Tarreau0f799ca2018-12-04 15:20:11 +01004468 h2s->mws -= fsize;
4469 h2c->mws -= fsize;
Willy Tarreauee573762018-12-04 15:25:57 +01004470 count -= fsize;
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004471
4472 send_empty:
4473 /* update the frame's size */
4474 h2_set_frame_size(outbuf.area, fsize);
4475
4476 /* FIXME: for now we only set the ES flag on empty DATA frames, once
4477 * meeting EOM. We should optimize this later.
4478 */
4479 if (type == HTX_BLK_EOM) {
Willy Tarreauee573762018-12-04 15:25:57 +01004480 total++; // EOM counts as one byte
4481 count--;
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004482 es_now = 1;
4483 }
4484
4485 if (es_now)
4486 outbuf.area[4] |= H2_F_DATA_END_STREAM;
4487
4488 /* commit the H2 response */
4489 b_add(&h2c->mbuf, fsize + 9);
4490
4491 /* consume incoming HTX block, including EOM */
4492 total += fsize;
4493 if (fsize == bsize) {
4494 htx_remove_blk(htx, blk);
4495 if (fsize)
4496 goto new_frame;
4497 } else {
4498 /* we've truncated this block */
4499 htx_cut_data_blk(htx, blk, fsize);
4500 }
4501
4502 if (es_now) {
4503 if (h2s->st == H2_SS_OPEN)
4504 h2s->st = H2_SS_HLOC;
4505 else
4506 h2s_close(h2s);
4507
4508 h2s->flags |= H2_SF_ES_SENT;
4509 }
4510
4511 end:
4512 return total;
4513}
4514
Olivier Houchard6ff20392018-07-17 18:46:31 +02004515/* Called from the upper layer, to subscribe to events, such as being able to send */
4516static int h2_subscribe(struct conn_stream *cs, int event_type, void *param)
4517{
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004518 struct wait_event *sw;
Olivier Houchard6ff20392018-07-17 18:46:31 +02004519 struct h2s *h2s = cs->ctx;
Olivier Houchard4cf7fb12018-08-02 19:23:05 +02004520 struct h2c *h2c = h2s->h2c;
Olivier Houchard6ff20392018-07-17 18:46:31 +02004521
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004522 if (event_type & SUB_CAN_RECV) {
Olivier Houchard4cf7fb12018-08-02 19:23:05 +02004523 sw = param;
4524 if (!(sw->wait_reason & SUB_CAN_RECV)) {
4525 sw->wait_reason |= SUB_CAN_RECV;
Olivier Houchard8ae735d2018-09-11 18:24:28 +02004526 sw->handle = h2s;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004527 h2s->recv_wait = sw;
Olivier Houchard4cf7fb12018-08-02 19:23:05 +02004528 }
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004529 event_type &= ~SUB_CAN_RECV;
4530 }
4531 if (event_type & SUB_CAN_SEND) {
Olivier Houchard6ff20392018-07-17 18:46:31 +02004532 sw = param;
Olivier Houchard4cf7fb12018-08-02 19:23:05 +02004533 if (!(sw->wait_reason & SUB_CAN_SEND)) {
Olivier Houcharde1c6dbc2018-08-01 17:06:43 +02004534 sw->wait_reason |= SUB_CAN_SEND;
Olivier Houchard8ae735d2018-09-11 18:24:28 +02004535 sw->handle = h2s;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004536 h2s->send_wait = sw;
4537 if (!(h2s->flags & H2_SF_BLK_SFCTL)) {
4538 if (h2s->flags & H2_SF_BLK_MFCTL)
4539 LIST_ADDQ(&h2c->fctl_list, &h2s->list);
4540 else
4541 LIST_ADDQ(&h2c->send_list, &h2s->list);
4542 }
Olivier Houcharde1c6dbc2018-08-01 17:06:43 +02004543 }
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004544 event_type &= ~SUB_CAN_SEND;
Olivier Houchard6ff20392018-07-17 18:46:31 +02004545 }
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004546 if (event_type != 0)
4547 return -1;
4548 return 0;
Olivier Houchard6ff20392018-07-17 18:46:31 +02004549
4550
4551}
4552
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004553static int h2_unsubscribe(struct conn_stream *cs, int event_type, void *param)
4554{
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004555 struct wait_event *sw;
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004556 struct h2s *h2s = cs->ctx;
4557
4558 if (event_type & SUB_CAN_RECV) {
4559 sw = param;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004560 if (h2s->recv_wait == sw) {
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004561 sw->wait_reason &= ~SUB_CAN_RECV;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004562 h2s->recv_wait = NULL;
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004563 }
4564 }
4565 if (event_type & SUB_CAN_SEND) {
4566 sw = param;
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004567 if (h2s->send_wait == sw) {
4568 LIST_DEL(&h2s->list);
4569 LIST_INIT(&h2s->list);
4570 sw->wait_reason &= ~SUB_CAN_SEND;
4571 h2s->send_wait = NULL;
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004572 }
4573 }
Olivier Houchardd846c262018-10-19 17:24:29 +02004574 if (event_type & SUB_CALL_UNSUBSCRIBE) {
4575 sw = param;
4576 if (h2s->send_wait == sw) {
4577 sw->wait_reason &= ~SUB_CALL_UNSUBSCRIBE;
4578 h2s->send_wait = NULL;
4579 }
4580 }
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004581 return 0;
4582}
4583
4584
Olivier Houchard511efea2018-08-16 15:30:32 +02004585/* Called from the upper layer, to receive data */
4586static size_t h2_rcv_buf(struct conn_stream *cs, struct buffer *buf, size_t count, int flags)
4587{
Olivier Houchard638b7992018-08-16 15:41:52 +02004588 struct h2s *h2s = cs->ctx;
Willy Tarreau082f5592018-11-25 08:03:32 +01004589 struct h2c *h2c = h2s->h2c;
Willy Tarreau86724e22018-12-01 23:19:43 +01004590 struct htx *h2s_htx = NULL;
4591 struct htx *buf_htx = NULL;
4592 struct htx_ret htx_ret;
Olivier Houchard511efea2018-08-16 15:30:32 +02004593 size_t ret = 0;
4594
4595 /* transfer possibly pending data to the upper layer */
Willy Tarreau86724e22018-12-01 23:19:43 +01004596 if (h2c->proxy->options2 & PR_O2_USE_HTX) {
4597 /* in HTX mode we ignore the count argument */
4598 h2s_htx = htx_from_buf(&h2s->rxbuf);
Olivier Houchard56b03482018-12-10 16:09:53 +01004599 if (htx_is_empty(h2s_htx)) {
4600 if (cs->flags & CS_FL_REOS)
4601 cs->flags |= CS_FL_EOS;
Olivier Houchard71748cb2018-12-17 14:16:46 +01004602 if (cs->flags & CS_FL_ERR_PENDING)
4603 cs->flags |= CS_FL_ERROR;
Willy Tarreau86724e22018-12-01 23:19:43 +01004604 goto end;
Olivier Houchard56b03482018-12-10 16:09:53 +01004605 }
Willy Tarreau86724e22018-12-01 23:19:43 +01004606
4607 buf_htx = htx_from_buf(buf);
4608 count = htx_free_space(buf_htx);
4609
Willy Tarreau0c22fa72018-12-04 15:21:35 +01004610 htx_ret = htx_xfer_blks(buf_htx, h2s_htx, count, HTX_BLK_EOM);
Willy Tarreau86724e22018-12-01 23:19:43 +01004611
4612 buf_htx->extra = h2s_htx->extra;
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01004613 htx_to_buf(buf_htx, buf);
4614 htx_to_buf(h2s_htx, &h2s->rxbuf);
Willy Tarreau86724e22018-12-01 23:19:43 +01004615 ret = htx_ret.ret;
4616 }
4617 else {
4618 ret = b_xfer(buf, &h2s->rxbuf, count);
4619 }
Olivier Houchard511efea2018-08-16 15:30:32 +02004620
Olivier Houchard638b7992018-08-16 15:41:52 +02004621 if (b_data(&h2s->rxbuf))
Olivier Houchardd247be02018-12-06 16:22:29 +01004622 cs->flags |= (CS_FL_RCV_MORE | CS_FL_WANT_ROOM);
Olivier Houchard511efea2018-08-16 15:30:32 +02004623 else {
Olivier Houchardd247be02018-12-06 16:22:29 +01004624 cs->flags &= ~(CS_FL_RCV_MORE | CS_FL_WANT_ROOM);
Olivier Houchard511efea2018-08-16 15:30:32 +02004625 if (cs->flags & CS_FL_REOS)
4626 cs->flags |= CS_FL_EOS;
Olivier Houchard71748cb2018-12-17 14:16:46 +01004627 if (cs->flags & CS_FL_ERR_PENDING)
4628 cs->flags |= CS_FL_ERROR;
Olivier Houchard638b7992018-08-16 15:41:52 +02004629 if (b_size(&h2s->rxbuf)) {
4630 b_free(&h2s->rxbuf);
4631 offer_buffers(NULL, tasks_run_queue);
4632 }
Olivier Houchard511efea2018-08-16 15:30:32 +02004633 }
4634
Willy Tarreau082f5592018-11-25 08:03:32 +01004635 if (ret && h2c->dsi == h2s->id) {
4636 /* demux is blocking on this stream's buffer */
4637 h2c->flags &= ~H2_CF_DEM_SFULL;
Willy Tarreauc5b10042018-12-18 10:27:18 +01004638 if (b_data(&h2c->dbuf) || !(h2c->wait_event.wait_reason & SUB_CAN_RECV)) {
Willy Tarreau082f5592018-11-25 08:03:32 +01004639 if (h2_recv_allowed(h2c))
4640 tasklet_wakeup(h2c->wait_event.task);
4641 }
4642 }
Willy Tarreau86724e22018-12-01 23:19:43 +01004643end:
Olivier Houchard511efea2018-08-16 15:30:32 +02004644 return ret;
4645}
4646
Olivier Houchardd846c262018-10-19 17:24:29 +02004647static void h2_stop_senders(struct h2c *h2c)
4648{
4649 struct h2s *h2s, *h2s_back;
4650
4651 list_for_each_entry_safe(h2s, h2s_back, &h2c->sending_list, list) {
4652 /* Don't unschedule the stream if the mux is just busy waiting for more data fro mthat stream */
4653 if (h2c->msi == h2s_id(h2s))
4654 continue;
4655 LIST_DEL(&h2s->list);
4656 LIST_INIT(&h2s->list);
4657 task_remove_from_task_list((struct task *)h2s->send_wait->task);
4658 h2s->send_wait->wait_reason |= SUB_CAN_SEND;
4659 h2s->send_wait->wait_reason &= ~SUB_CALL_UNSUBSCRIBE;
4660 LIST_ADD(&h2c->send_list, &h2s->list);
4661 }
4662}
4663
Willy Tarreau62f52692017-10-08 23:01:42 +02004664/* Called from the upper layer, to send data */
Christopher Fauletd44a9b32018-07-27 11:59:41 +02004665static size_t h2_snd_buf(struct conn_stream *cs, struct buffer *buf, size_t count, int flags)
Willy Tarreau62f52692017-10-08 23:01:42 +02004666{
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02004667 struct h2s *h2s = cs->ctx;
Olivier Houchard8122a8d2018-12-03 19:13:29 +01004668 size_t orig_count = count;
Willy Tarreau1dc41e72018-06-14 13:21:28 +02004669 size_t total = 0;
Willy Tarreau5dd17352018-06-14 13:33:30 +02004670 size_t ret;
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004671 struct htx *htx;
4672 struct htx_blk *blk;
4673 enum htx_blk_type btype;
4674 uint32_t bsize;
4675 int32_t idx;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02004676
Olivier Houchardd846c262018-10-19 17:24:29 +02004677 if (h2s->send_wait) {
4678 h2s->send_wait->wait_reason &= ~SUB_CALL_UNSUBSCRIBE;
4679 h2s->send_wait = NULL;
4680 LIST_DEL(&h2s->list);
4681 LIST_INIT(&h2s->list);
4682 }
Willy Tarreau6bf641a2018-10-08 09:43:03 +02004683 if (h2s->h2c->st0 < H2_CS_FRAME_H)
4684 return 0;
4685
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004686 /* htx will be enough to decide if we're using HTX or legacy */
4687 htx = (h2s->h2c->proxy->options2 & PR_O2_USE_HTX) ? htx_from_buf(buf) : NULL;
4688
Willy Tarreau0bad0432018-06-14 16:54:01 +02004689 if (!(h2s->flags & H2_SF_OUTGOING_DATA) && count)
Willy Tarreauc4312d32017-11-07 12:01:53 +01004690 h2s->flags |= H2_SF_OUTGOING_DATA;
4691
Willy Tarreau751f2d02018-10-05 09:35:00 +02004692 if (h2s->id == 0) {
4693 int32_t id = h2c_get_next_sid(h2s->h2c);
4694
4695 if (id < 0) {
4696 cs->ctx = NULL;
4697 cs->flags |= CS_FL_ERROR;
4698 h2s_destroy(h2s);
4699 return 0;
4700 }
4701
4702 eb32_delete(&h2s->by_id);
4703 h2s->by_id.key = h2s->id = id;
4704 h2s->h2c->max_id = id;
4705 eb32_insert(&h2s->h2c->streams_by_id, &h2s->by_id);
4706 }
4707
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004708 if (htx) {
Willy Tarreauc14999b2018-12-06 14:09:09 +01004709 while (h2s->st < H2_SS_ERROR && !(h2s->flags & H2_SF_BLK_ANY) &&
4710 count && !htx_is_empty(htx)) {
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004711 idx = htx_get_head(htx);
4712 blk = htx_get_blk(htx, idx);
4713 btype = htx_get_blk_type(blk);
4714 bsize = htx_get_blksz(blk);
4715
4716 switch (btype) {
Willy Tarreau80739692018-10-05 11:35:57 +02004717 case HTX_BLK_REQ_SL:
4718 /* start-line before headers */
4719 ret = h2s_htx_bck_make_req_headers(h2s, htx);
4720 if (ret > 0) {
4721 total += ret;
4722 count -= ret;
4723 if (ret < bsize)
4724 goto done;
4725 }
4726 break;
4727
Willy Tarreau115e83b2018-12-01 19:17:53 +01004728 case HTX_BLK_RES_SL:
4729 /* start-line before headers */
4730 ret = h2s_htx_frt_make_resp_headers(h2s, htx);
4731 if (ret > 0) {
4732 total += ret;
4733 count -= ret;
4734 if (ret < bsize)
4735 goto done;
4736 }
4737 break;
4738
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004739 case HTX_BLK_DATA:
4740 case HTX_BLK_EOD:
4741 case HTX_BLK_EOM:
4742 /* all these cause the emission of a DATA frame (possibly empty) */
Willy Tarreau98de12a2018-12-12 07:03:00 +01004743 ret = h2s_htx_frt_make_resp_data(h2s, buf, count);
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004744 if (ret > 0) {
Willy Tarreau98de12a2018-12-12 07:03:00 +01004745 htx = htx_from_buf(buf);
Willy Tarreau0c535fd2018-12-01 19:25:56 +01004746 total += ret;
4747 count -= ret;
4748 if (ret < bsize)
4749 goto done;
4750 }
4751 break;
4752
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004753 default:
4754 htx_remove_blk(htx, blk);
4755 total += bsize;
4756 count -= bsize;
4757 break;
4758 }
4759 }
4760 goto done;
4761 }
4762
4763 /* legacy transfer mode */
Willy Tarreaua40704a2018-09-11 13:52:04 +02004764 while (h2s->h1m.state < H1_MSG_DONE && count) {
Willy Tarreau001823c2018-09-12 17:25:32 +02004765 if (h2s->h1m.state <= H1_MSG_LAST_LF) {
Willy Tarreau80739692018-10-05 11:35:57 +02004766 if (h2s->h2c->flags & H2_CF_IS_BACK)
4767 ret = -1;
4768 else
4769 ret = h2s_frt_make_resp_headers(h2s, buf, total, count);
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02004770 }
Willy Tarreaua40704a2018-09-11 13:52:04 +02004771 else if (h2s->h1m.state < H1_MSG_TRAILERS) {
Willy Tarreau0bad0432018-06-14 16:54:01 +02004772 ret = h2s_frt_make_resp_data(h2s, buf, total, count);
Willy Tarreau9d89ac82017-10-31 17:15:59 +01004773 }
Willy Tarreaua40704a2018-09-11 13:52:04 +02004774 else if (h2s->h1m.state == H1_MSG_TRAILERS) {
Willy Tarreau9d89ac82017-10-31 17:15:59 +01004775 /* consume the trailers if any (we don't forward them for now) */
Willy Tarreau0bad0432018-06-14 16:54:01 +02004776 ret = h1_measure_trailers(buf, total, count);
Willy Tarreau9d89ac82017-10-31 17:15:59 +01004777
Willy Tarreau5dd17352018-06-14 13:33:30 +02004778 if (unlikely((int)ret <= 0)) {
4779 if ((int)ret < 0)
Willy Tarreau9d89ac82017-10-31 17:15:59 +01004780 h2s_error(h2s, H2_ERR_INTERNAL_ERROR);
4781 break;
4782 }
Willy Tarreau35a62702018-02-27 15:37:25 +01004783 // trim any possibly pending data (eg: extra CR-LF, ...)
Willy Tarreau0bad0432018-06-14 16:54:01 +02004784 total += count;
4785 count = 0;
Willy Tarreaua40704a2018-09-11 13:52:04 +02004786 h2s->h1m.state = H1_MSG_DONE;
Willy Tarreau9d89ac82017-10-31 17:15:59 +01004787 break;
Willy Tarreauc652dbd2017-10-19 11:16:37 +02004788 }
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02004789 else {
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02004790 cs->flags |= CS_FL_ERROR;
4791 break;
4792 }
Willy Tarreau0bad0432018-06-14 16:54:01 +02004793
4794 total += ret;
4795 count -= ret;
4796
4797 if (h2s->st >= H2_SS_ERROR)
4798 break;
4799
4800 if (h2s->flags & H2_SF_BLK_ANY)
4801 break;
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02004802 }
4803
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004804 done:
Willy Tarreau00610962018-07-19 10:58:28 +02004805 if (h2s->st >= H2_SS_ERROR) {
4806 /* trim any possibly pending data after we close (extra CR-LF,
4807 * unprocessed trailers, abnormal extra data, ...)
4808 */
Willy Tarreau0bad0432018-06-14 16:54:01 +02004809 total += count;
4810 count = 0;
Willy Tarreau00610962018-07-19 10:58:28 +02004811 }
4812
Willy Tarreauc6795ca2017-11-07 09:43:06 +01004813 /* RST are sent similarly to frame acks */
Willy Tarreau02492192017-12-07 15:59:29 +01004814 if (h2s->st == H2_SS_ERROR || h2s->flags & H2_SF_RST_RCVD) {
Willy Tarreauc6795ca2017-11-07 09:43:06 +01004815 cs->flags |= CS_FL_ERROR;
Willy Tarreau8c0ea7d2017-11-10 10:05:24 +01004816 if (h2s_send_rst_stream(h2s->h2c, h2s) > 0)
Willy Tarreau00dd0782018-03-01 16:31:34 +01004817 h2s_close(h2s);
Willy Tarreauc6795ca2017-11-07 09:43:06 +01004818 }
4819
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004820 if (htx) {
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01004821 htx_to_buf(htx, buf);
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004822 } else {
4823 b_del(buf, total);
4824 }
Olivier Houchardd846c262018-10-19 17:24:29 +02004825
4826 /* The mux is full, cancel the pending tasks */
4827 if ((h2s->h2c->flags & H2_CF_MUX_BLOCK_ANY) ||
4828 (h2s->flags & H2_SF_BLK_MBUSY))
4829 h2_stop_senders(h2s->h2c);
Willy Tarreaubcd3bb32018-12-01 18:59:00 +01004830
Olivier Houchard8122a8d2018-12-03 19:13:29 +01004831 /* If we're running HTX, and we read the whole buffer, then pretend
4832 * we read exactly what the caller specified, as with HTX the caller
4833 * will always give the buffer size, instead of the amount of data
4834 * available.
4835 */
4836 if (htx && !b_data(buf))
4837 total = orig_count;
4838
Olivier Houchard7505f942018-08-21 18:10:44 +02004839 if (total > 0) {
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004840 if (!(h2s->h2c->wait_event.wait_reason & SUB_CAN_SEND))
4841 tasklet_wakeup(h2s->h2c->wait_event.task);
Olivier Houchardd846c262018-10-19 17:24:29 +02004842
Olivier Houchard7505f942018-08-21 18:10:44 +02004843 }
Willy Tarreau9e5ae1d2017-10-17 19:58:20 +02004844 return total;
Willy Tarreau62f52692017-10-08 23:01:42 +02004845}
4846
Willy Tarreaue3f36cd2018-03-30 14:43:13 +02004847/* for debugging with CLI's "show fd" command */
Willy Tarreau83061a82018-07-13 11:56:34 +02004848static void h2_show_fd(struct buffer *msg, struct connection *conn)
Willy Tarreaue3f36cd2018-03-30 14:43:13 +02004849{
4850 struct h2c *h2c = conn->mux_ctx;
Willy Tarreau987c0632018-12-18 10:32:05 +01004851 struct h2s *h2s = NULL;
Willy Tarreaue3f36cd2018-03-30 14:43:13 +02004852 struct eb32_node *node;
4853 int fctl_cnt = 0;
4854 int send_cnt = 0;
4855 int tree_cnt = 0;
4856 int orph_cnt = 0;
4857
4858 if (!h2c)
4859 return;
4860
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004861 list_for_each_entry(h2s, &h2c->fctl_list, list)
Willy Tarreaue3f36cd2018-03-30 14:43:13 +02004862 fctl_cnt++;
4863
Olivier Houchardfa8aa862018-10-10 18:25:41 +02004864 list_for_each_entry(h2s, &h2c->send_list, list)
Willy Tarreaue3f36cd2018-03-30 14:43:13 +02004865 send_cnt++;
4866
Willy Tarreau3af37712018-12-18 14:34:41 +01004867 h2s = NULL;
Willy Tarreaue3f36cd2018-03-30 14:43:13 +02004868 node = eb32_first(&h2c->streams_by_id);
4869 while (node) {
4870 h2s = container_of(node, struct h2s, by_id);
4871 tree_cnt++;
4872 if (!h2s->cs)
4873 orph_cnt++;
4874 node = eb32_next(node);
4875 }
4876
Willy Tarreau987c0632018-12-18 10:32:05 +01004877 chunk_appendf(msg, " h2c.st0=%d .err=%d .maxid=%d .lastid=%d .flg=0x%04x"
4878 " .nbst=%u .nbcs=%u .fctl_cnt=%d .send_cnt=%d .tree_cnt=%d"
4879 " .orph_cnt=%d .sub=%d .dsi=%d .dbuf=%u@%p+%u/%u .msi=%d .mbuf=%u@%p+%u/%u",
Willy Tarreau616ac812018-07-24 14:12:42 +02004880 h2c->st0, h2c->errcode, h2c->max_id, h2c->last_sid, h2c->flags,
4881 h2c->nb_streams, h2c->nb_cs, fctl_cnt, send_cnt, tree_cnt, orph_cnt,
Willy Tarreau987c0632018-12-18 10:32:05 +01004882 h2c->wait_event.wait_reason, h2c->dsi,
4883 (unsigned int)b_data(&h2c->dbuf), b_orig(&h2c->dbuf),
4884 (unsigned int)b_head_ofs(&h2c->dbuf), (unsigned int)b_size(&h2c->dbuf),
4885 h2c->msi,
4886 (unsigned int)b_data(&h2c->mbuf), b_orig(&h2c->mbuf),
4887 (unsigned int)b_head_ofs(&h2c->mbuf), (unsigned int)b_size(&h2c->mbuf));
4888
4889 if (h2s) {
4890 chunk_appendf(msg, " last_h2s=%p .id=%d .flg=0x%04x .rxbuf=%u@%p+%u/%u .cs=%p",
4891 h2s, h2s->id, h2s->flags,
4892 (unsigned int)b_data(&h2s->rxbuf), b_orig(&h2s->rxbuf),
4893 (unsigned int)b_head_ofs(&h2s->rxbuf), (unsigned int)b_size(&h2s->rxbuf),
4894 h2s->cs);
4895 if (h2s->cs)
4896 chunk_appendf(msg, " .cs.flg=0x%08x .cs.data=%p",
4897 h2s->cs->flags, h2s->cs->data);
4898 }
Willy Tarreaue3f36cd2018-03-30 14:43:13 +02004899}
Willy Tarreau62f52692017-10-08 23:01:42 +02004900
4901/*******************************************************/
4902/* functions below are dedicated to the config parsers */
4903/*******************************************************/
4904
Willy Tarreaufe20e5b2017-07-27 11:42:14 +02004905/* config parser for global "tune.h2.header-table-size" */
4906static int h2_parse_header_table_size(char **args, int section_type, struct proxy *curpx,
4907 struct proxy *defpx, const char *file, int line,
4908 char **err)
4909{
4910 if (too_many_args(1, args, err, NULL))
4911 return -1;
4912
4913 h2_settings_header_table_size = atoi(args[1]);
4914 if (h2_settings_header_table_size < 4096 || h2_settings_header_table_size > 65536) {
4915 memprintf(err, "'%s' expects a numeric value between 4096 and 65536.", args[0]);
4916 return -1;
4917 }
4918 return 0;
4919}
Willy Tarreau62f52692017-10-08 23:01:42 +02004920
Willy Tarreaue6baec02017-07-27 11:45:11 +02004921/* config parser for global "tune.h2.initial-window-size" */
4922static int h2_parse_initial_window_size(char **args, int section_type, struct proxy *curpx,
4923 struct proxy *defpx, const char *file, int line,
4924 char **err)
4925{
4926 if (too_many_args(1, args, err, NULL))
4927 return -1;
4928
4929 h2_settings_initial_window_size = atoi(args[1]);
4930 if (h2_settings_initial_window_size < 0) {
4931 memprintf(err, "'%s' expects a positive numeric value.", args[0]);
4932 return -1;
4933 }
4934 return 0;
4935}
4936
Willy Tarreau5242ef82017-07-27 11:47:28 +02004937/* config parser for global "tune.h2.max-concurrent-streams" */
4938static int h2_parse_max_concurrent_streams(char **args, int section_type, struct proxy *curpx,
4939 struct proxy *defpx, const char *file, int line,
4940 char **err)
4941{
4942 if (too_many_args(1, args, err, NULL))
4943 return -1;
4944
4945 h2_settings_max_concurrent_streams = atoi(args[1]);
4946 if (h2_settings_max_concurrent_streams < 0) {
4947 memprintf(err, "'%s' expects a positive numeric value.", args[0]);
4948 return -1;
4949 }
4950 return 0;
4951}
4952
Willy Tarreau62f52692017-10-08 23:01:42 +02004953
4954/****************************************/
4955/* MUX initialization and instantiation */
4956/***************************************/
4957
4958/* The mux operations */
Willy Tarreau680b2bd2018-11-27 07:30:17 +01004959static const struct mux_ops h2_ops = {
Willy Tarreau62f52692017-10-08 23:01:42 +02004960 .init = h2_init,
Olivier Houchard21df6cc2018-09-14 23:21:44 +02004961 .wake = h2_wake,
Willy Tarreau62f52692017-10-08 23:01:42 +02004962 .snd_buf = h2_snd_buf,
Olivier Houchard511efea2018-08-16 15:30:32 +02004963 .rcv_buf = h2_rcv_buf,
Olivier Houchard6ff20392018-07-17 18:46:31 +02004964 .subscribe = h2_subscribe,
Olivier Houchard83a0cd82018-09-28 17:57:58 +02004965 .unsubscribe = h2_unsubscribe,
Willy Tarreau62f52692017-10-08 23:01:42 +02004966 .attach = h2_attach,
Willy Tarreaufafd3982018-11-18 21:29:20 +01004967 .get_first_cs = h2_get_first_cs,
Willy Tarreau62f52692017-10-08 23:01:42 +02004968 .detach = h2_detach,
Olivier Houchard060ed432018-11-06 16:32:42 +01004969 .destroy = h2_destroy,
Olivier Houchardd540b362018-11-05 18:37:53 +01004970 .avail_streams = h2_avail_streams,
Olivier Houchard8defe4b2018-12-02 01:31:17 +01004971 .max_streams = h2_max_streams,
Willy Tarreau62f52692017-10-08 23:01:42 +02004972 .shutr = h2_shutr,
4973 .shutw = h2_shutw,
Willy Tarreaue3f36cd2018-03-30 14:43:13 +02004974 .show_fd = h2_show_fd,
Willy Tarreau28f1cb92017-12-20 16:14:44 +01004975 .flags = MX_FL_CLEAN_ABRT,
Willy Tarreau62f52692017-10-08 23:01:42 +02004976 .name = "H2",
4977};
4978
Christopher Faulet32f61c02018-04-10 14:33:41 +02004979/* PROTO selection : this mux registers PROTO token "h2" */
4980static struct mux_proto_list mux_proto_h2 =
Willy Tarreauf8957272018-10-03 10:25:20 +02004981 { .token = IST("h2"), .mode = PROTO_MODE_HTTP, .side = PROTO_SIDE_FE, .mux = &h2_ops };
Willy Tarreau62f52692017-10-08 23:01:42 +02004982
Willy Tarreau0108d902018-11-25 19:14:37 +01004983INITCALL1(STG_REGISTER, register_mux_proto, &mux_proto_h2);
4984
Willy Tarreauf8957272018-10-03 10:25:20 +02004985static struct mux_proto_list mux_proto_h2_htx =
4986 { .token = IST("h2"), .mode = PROTO_MODE_HTX, .side = PROTO_SIDE_BOTH, .mux = &h2_ops };
4987
4988INITCALL1(STG_REGISTER, register_mux_proto, &mux_proto_h2_htx);
4989
Willy Tarreau62f52692017-10-08 23:01:42 +02004990/* config keyword parsers */
4991static struct cfg_kw_list cfg_kws = {ILH, {
Willy Tarreaufe20e5b2017-07-27 11:42:14 +02004992 { CFG_GLOBAL, "tune.h2.header-table-size", h2_parse_header_table_size },
Willy Tarreaue6baec02017-07-27 11:45:11 +02004993 { CFG_GLOBAL, "tune.h2.initial-window-size", h2_parse_initial_window_size },
Willy Tarreau5242ef82017-07-27 11:47:28 +02004994 { CFG_GLOBAL, "tune.h2.max-concurrent-streams", h2_parse_max_concurrent_streams },
Willy Tarreau62f52692017-10-08 23:01:42 +02004995 { 0, NULL, NULL }
4996}};
4997
Willy Tarreau0108d902018-11-25 19:14:37 +01004998INITCALL1(STG_REGISTER, cfg_register_keywords, &cfg_kws);