/*
 * include/types/h1.h
 * This file contains HTTP/1 protocol definitions.
 *
 * Copyright (C) 2000-2017 Willy Tarreau - w@1wt.eu
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation, version 2.1
 * exclusively.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 */

#ifndef _TYPES_H1_H
#define _TYPES_H1_H

#include <stdint.h>

#include <common/http.h>
#include <common/ist.h>

/* Legacy version of the HTTP/1 message state, used by the channels, should
 * ultimately be removed.
 *
 * Values are assigned explicitly and their order is meaningful: everything
 * below HTTP_MSG_BODY is about the start line, the headers or the error
 * state, while HTTP_MSG_BODY and everything above it means that data are
 * being processed. The enum is declared packed so that the compiler picks
 * the smallest integer type able to hold all of its values.
 */
enum h1_state {
	HTTP_MSG_RQBEFORE     =  0, // request: leading LF, before start line
	HTTP_MSG_RQBEFORE_CR  =  1, // request: leading CRLF, before start line

	/* these ones define a request start line */
	HTTP_MSG_RQMETH       =  2, // parsing the Method
	HTTP_MSG_RQMETH_SP    =  3, // space(s) after the Method
	HTTP_MSG_RQURI        =  4, // parsing the Request URI
	HTTP_MSG_RQURI_SP     =  5, // space(s) after the Request URI
	HTTP_MSG_RQVER        =  6, // parsing the Request Version
	HTTP_MSG_RQLINE_END   =  7, // end of request line (CR or LF)

	HTTP_MSG_RPBEFORE     =  8, // response: leading LF, before start line
	HTTP_MSG_RPBEFORE_CR  =  9, // response: leading CRLF, before start line

	/* these ones define a response start line */
	HTTP_MSG_RPVER        = 10, // parsing the Response Version
	HTTP_MSG_RPVER_SP     = 11, // space(s) after the Response Version
	HTTP_MSG_RPCODE       = 12, // response code
	HTTP_MSG_RPCODE_SP    = 13, // space(s) after the response code
	HTTP_MSG_RPREASON     = 14, // response reason
	HTTP_MSG_RPLINE_END   = 15, // end of response line (CR or LF)

	/* common header processing */
	HTTP_MSG_HDR_FIRST    = 16, // waiting for first header or last CRLF (no LWS possible)
	HTTP_MSG_HDR_NAME     = 17, // parsing header name
	HTTP_MSG_HDR_COL      = 18, // parsing header colon
	HTTP_MSG_HDR_L1_SP    = 19, // parsing header LWS (SP|HT) before value
	HTTP_MSG_HDR_L1_LF    = 20, // parsing header LWS (LF) before value
	HTTP_MSG_HDR_L1_LWS   = 21, // checking whether it's a new header or an LWS
	HTTP_MSG_HDR_VAL      = 22, // parsing header value
	HTTP_MSG_HDR_L2_LF    = 23, // parsing header LWS (LF) inside/after value
	HTTP_MSG_HDR_L2_LWS   = 24, // checking whether it's a new header or an LWS

	HTTP_MSG_LAST_LF      = 25, // parsing last LF

	/* error state : must be before HTTP_MSG_BODY so that (>=BODY) always indicates
	 * that data are being processed.
	 */
	HTTP_MSG_ERROR        = 26, // an error occurred

	/* Body processing.
	 * The state HTTP_MSG_BODY is a delimiter to know if we're waiting for headers
	 * or body. All the sub-states below also indicate we're processing the body,
	 * with some additional information.
	 */
	HTTP_MSG_BODY         = 27, // parsing body at end of headers
	HTTP_MSG_100_SENT     = 28, // parsing body after a 100-Continue was sent
	HTTP_MSG_CHUNK_SIZE   = 29, // parsing the chunk size (RFC7230 #4.1)
	HTTP_MSG_DATA         = 30, // skipping data chunk / content-length data
	HTTP_MSG_CHUNK_CRLF   = 31, // skipping CRLF after data chunk
	HTTP_MSG_TRAILERS     = 32, // trailers (post-data entity headers)

	/* we enter this state when we've received the end of the current message */
	HTTP_MSG_ENDING       = 33, // message end received, wait that the filters end too
	HTTP_MSG_DONE         = 34, // message end received, waiting for resync or close
	HTTP_MSG_CLOSING      = 35, // shutdown_w done, not all bytes sent yet
	HTTP_MSG_CLOSED       = 36, // shutdown_w done, all bytes sent
	HTTP_MSG_TUNNEL       = 37, // tunneled data after DONE
} __attribute__((packed));


/* Possible states while parsing HTTP/1 messages (request|response).
 *
 * Values are assigned explicitly. States up to and including H1_MSG_LAST_LF
 * cover the start line and the headers; the states after it cover the body,
 * the end of the message and tunnelled data. The enum is declared packed so
 * that the compiler picks the smallest integer type able to hold all of its
 * values.
 */
enum h1m_state {
	H1_MSG_RQBEFORE     =  0, // request: leading LF, before start line
	H1_MSG_RQBEFORE_CR  =  1, // request: leading CRLF, before start line

	/* these ones define a request start line */
	H1_MSG_RQMETH       =  2, // parsing the Method
	H1_MSG_RQMETH_SP    =  3, // space(s) after the Method
	H1_MSG_RQURI        =  4, // parsing the Request URI
	H1_MSG_RQURI_SP     =  5, // space(s) after the Request URI
	H1_MSG_RQVER        =  6, // parsing the Request Version
	H1_MSG_RQLINE_END   =  7, // end of request line (CR or LF)

	H1_MSG_RPBEFORE     =  8, // response: leading LF, before start line
	H1_MSG_RPBEFORE_CR  =  9, // response: leading CRLF, before start line

	/* these ones define a response start line */
	H1_MSG_RPVER        = 10, // parsing the Response Version
	H1_MSG_RPVER_SP     = 11, // space(s) after the Response Version
	H1_MSG_RPCODE       = 12, // response code
	H1_MSG_RPCODE_SP    = 13, // space(s) after the response code
	H1_MSG_RPREASON     = 14, // response reason
	H1_MSG_RPLINE_END   = 15, // end of response line (CR or LF)

	/* common header processing */
	H1_MSG_HDR_FIRST    = 16, // waiting for first header or last CRLF (no LWS possible)
	H1_MSG_HDR_NAME     = 17, // parsing header name
	H1_MSG_HDR_COL      = 18, // parsing header colon
	H1_MSG_HDR_L1_SP    = 19, // parsing header LWS (SP|HT) before value
	H1_MSG_HDR_L1_LF    = 20, // parsing header LWS (LF) before value
	H1_MSG_HDR_L1_LWS   = 21, // checking whether it's a new header or an LWS
	H1_MSG_HDR_VAL      = 22, // parsing header value
	H1_MSG_HDR_L2_LF    = 23, // parsing header LWS (LF) inside/after value
	H1_MSG_HDR_L2_LWS   = 24, // checking whether it's a new header or an LWS

	H1_MSG_LAST_LF      = 25, // parsing last LF, last state for headers

	/* Body processing. */

	H1_MSG_CHUNK_SIZE   = 26, // parsing the chunk size (RFC7230 #4.1)
	H1_MSG_DATA         = 27, // skipping data chunk / content-length data
	H1_MSG_CHUNK_CRLF   = 28, // skipping CRLF after data chunk
	H1_MSG_TRAILERS     = 29, // trailers (post-data entity headers)

	/* we enter this state when we've received the end of the current message */
	H1_MSG_DONE         = 30, // message end received, waiting for resync or close
	H1_MSG_TUNNEL       = 31, // tunneled data after DONE
} __attribute__((packed));


/* HTTP/1 message flags (32 bit), for use in h1m->flags only. Each flag is a
 * distinct single bit so that flags can be combined with a bitwise OR.
 */
#define H1_MF_NONE      0x00000000
#define H1_MF_CLEN      0x00000001 // content-length present
#define H1_MF_CHNK      0x00000002 // chunk present, exclusive with c-l
#define H1_MF_RESP      0x00000004 // this message is the response message
#define H1_MF_TOLOWER   0x00000008 // turn the header names to lower case
#define H1_MF_VER_11    0x00000010 // message indicates version 1.1 or above
#define H1_MF_CONN_CLO  0x00000020 // message contains "connection: close"
#define H1_MF_CONN_KAL  0x00000040 // message contains "connection: keep-alive"
#define H1_MF_CONN_UPG  0x00000080 // message contains "connection: upgrade"
#define H1_MF_XFER_LEN  0x00000100 // message xfer size can be determined
#define H1_MF_XFER_ENC  0x00000200 // transfer-encoding is present
#define H1_MF_NO_PHDR   0x00000400 // don't add pseudo-headers in the header list

/* Note: for a connection to be persistent, we need this for the request :
 *   - one of CLEN or CHNK
 *   - version 1.0 and KAL and not CLO
 *   - or version 1.1 and not CLO
 * For the response it's the same except that UPG must not appear either.
 * So in short, for a request it's (CLEN|CHNK) > 0 && !CLO && (VER_11 || KAL)
 * and for a response it's (CLEN|CHNK) > 0 && !(CLO|UPG) && (VER_11 || KAL)
 */


Willy Tarreaubbf38232018-09-12 09:08:54 +0200162/* basic HTTP/1 message state for use in parsers. The err_pos field is special,
163 * it is pre-set to a negative value (-1 or -2), and once non-negative it contains
164 * the relative position in the message of the first parse error. -2 is used to tell
165 * the parser that we want to block the invalid message. -1 is used to only perform
166 * a silent capture.
167 */
Willy Tarreau4093a4d2017-09-21 11:46:43 +0200168struct h1m {
Willy Tarreau801250e2018-09-11 11:45:04 +0200169 enum h1m_state state; // H1 message state (H1_MSG_*)
Willy Tarreau11da5672018-09-11 19:23:04 +0200170 /* 24 bits available here */
Willy Tarreau4093a4d2017-09-21 11:46:43 +0200171 uint32_t flags; // H1 message flags (H1_MF_*)
172 uint64_t curr_len; // content-length or last chunk length
173 uint64_t body_len; // total known size of the body length
Willy Tarreaub3b01522018-09-11 11:51:31 +0200174 uint32_t next; // next byte to parse, relative to buffer's head
Willy Tarreau4093a4d2017-09-21 11:46:43 +0200175 int err_pos; // position in the byte stream of the first error (H1 or H2)
176 int err_state; // state where the first error was met (H1 or H2)
177};
178
Willy Tarreaua41393f2018-09-11 15:34:50 +0200179/* basic H1 start line, describes either the request and the response */
180union h1_sl { /* useful start line pointers, relative to ->sol */
181 struct {
Christopher Faulet1dc2b492018-10-08 15:34:02 +0200182 struct ist m; /* METHOD */
183 struct ist u; /* URI */
184 struct ist v; /* VERSION */
Willy Tarreaua41393f2018-09-11 15:34:50 +0200185 enum http_meth_t meth; /* method */
186 } rq; /* request line : field, length */
187 struct {
Christopher Faulet1dc2b492018-10-08 15:34:02 +0200188 struct ist v; /* VERSION */
189 struct ist c; /* CODE */
190 struct ist r; /* REASON */
Willy Tarreaua41393f2018-09-11 15:34:50 +0200191 uint16_t status; /* status code */
192 } st; /* status line : field, length */
193};
194
#endif /* _TYPES_H1_H */