/*
 * include/types/proto_http.h
 * This file contains HTTP protocol definitions.
 *
 * Copyright (C) 2000-2009 Willy Tarreau - w@1wt.eu
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation, version 2.1
 * exclusively.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 */

22#ifndef _TYPES_PROTO_HTTP_H
23#define _TYPES_PROTO_HTTP_H
24
Willy Tarreaue3ba5f02006-06-29 18:54:54 +020025#include <common/config.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020026
Willy Tarreau3bac9ff2007-03-18 17:31:28 +010027#include <types/buffers.h>
28#include <types/hdr_idx.h>
29
/*
 * FIXME: break this into HTTP state and TCP socket state.
 */

/* different possible states for the client side */
#define CL_STDATA	0
#define CL_STSHUTR	1
#define CL_STSHUTW	2
#define CL_STCLOSE	3

/* different possible states for the server side */
#define SV_STIDLE	0
#define SV_STCONN	1
#define SV_STDATA	2
#define SV_STSHUTR	3
#define SV_STSHUTW	4
#define SV_STCLOSE	5

/*
 * Transaction flags moved from session
 */


/* action flags (one bit each, 0x01 to 0x10) */
#define TX_CLDENY	0x00000001	/* a client header matches a deny regex */
#define TX_CLALLOW	0x00000002	/* a client header matches an allow regex */
#define TX_SVDENY	0x00000004	/* a server header matches a deny regex */
#define TX_SVALLOW	0x00000008	/* a server header matches an allow regex */
#define TX_CLTARPIT	0x00000010	/* the session is tarpitted (anti-dos) */
/* unused: 0x00000020 */

/* transaction flags dedicated to cookies : bits values 0x40, 0x80 (0-3 shift 6) */
#define TX_CK_NONE	0x00000000	/* this session had no cookie */
#define TX_CK_INVALID	0x00000040	/* this session had a cookie which matches no server */
#define TX_CK_DOWN	0x00000080	/* this session had cookie matching a down server */
#define TX_CK_VALID	0x000000C0	/* this session had cookie matching a valid server */
#define TX_CK_MASK	0x000000C0	/* mask to get this session's cookie flags */
#define TX_CK_SHIFT	6		/* bit shift */

/* cookie information, bits values 0x100 to 0x800 (0-8 shift 8) */
#define TX_SCK_NONE	0x00000000	/* no set-cookie seen for the server cookie */
#define TX_SCK_DELETED	0x00000100	/* existing set-cookie deleted or changed */
#define TX_SCK_INSERTED	0x00000200	/* new set-cookie inserted or changed existing one */
#define TX_SCK_SEEN	0x00000400	/* set-cookie seen for the server cookie */
#define TX_SCK_MASK	0x00000700	/* mask to get the set-cookie field */
#define TX_SCK_ANY	0x00000800	/* at least one set-cookie seen (not to be counted) */
#define TX_SCK_SHIFT	8		/* bit shift */

/* cacheability management, bits values 0x1000 to 0x3000 (0-3 shift 12) */
#define TX_CACHEABLE	0x00001000	/* at least part of the response is cacheable */
#define TX_CACHE_COOK	0x00002000	/* a cookie in the response is cacheable */
#define TX_CACHE_SHIFT	12		/* bit shift */

/* client and server keep-alive capability */
#define TX_CLI_CONN_KA	0x00004000	/* the client-side connection is still keep-alive capable */
#define TX_SRV_CONN_KA	0x00008000	/* the server-side connection is still keep-alive capable */

/* report presence of transfer-encoding:chunked and content-length headers */
#define TX_REQ_CNT_LEN	0x00010000	/* content-length present in the request */
#define TX_REQ_TE_CHNK	0x00020000	/* transfer-encoding: chunked present in the request */
#define TX_RES_CNT_LEN	0x00040000	/* content-length present in the response */
#define TX_RES_TE_CHNK	0x00080000	/* transfer-encoding: chunked present in the response */

/* The HTTP parser is more complex than it looks like, because we have to
 * support multi-line headers and any number of spaces between the colon and
 * the value.
 *
 * All those examples must work :

 Hdr1:val1\r\n
 Hdr1: val1\r\n
 Hdr1:\t val1\r\n
 Hdr1: \r\n
  val1\r\n
 Hdr1:\r\n
  val1\n
 \tval2\r\n
  val3\n

 *
 */

/* Possible states while parsing HTTP messages (request|response) */
#define HTTP_MSG_RQBEFORE      0 // request: leading LF, before start line
#define HTTP_MSG_RQBEFORE_CR   1 // request: leading CRLF, before start line

/* these ones define a request start line */
#define HTTP_MSG_RQMETH        2 // parsing the Method
#define HTTP_MSG_RQMETH_SP     3 // space(s) after the Method
#define HTTP_MSG_RQURI         4 // parsing the Request URI
#define HTTP_MSG_RQURI_SP      5 // space(s) after the Request URI
#define HTTP_MSG_RQVER         6 // parsing the Request Version
#define HTTP_MSG_RQLINE_END    7 // end of request line (CR or LF)

#define HTTP_MSG_RPBEFORE      8 // response: leading LF, before start line
#define HTTP_MSG_RPBEFORE_CR   9 // response: leading CRLF, before start line

/* these ones define a response start line */
#define HTTP_MSG_RPVER        10 // parsing the Response Version
#define HTTP_MSG_RPVER_SP     11 // space(s) after the Response Version
#define HTTP_MSG_RPCODE       12 // response code
#define HTTP_MSG_RPCODE_SP    13 // space(s) after the response code
#define HTTP_MSG_RPREASON     14 // response reason
#define HTTP_MSG_RPLINE_END   15 // end of response line (CR or LF)

/* common header processing */

#define HTTP_MSG_HDR_FIRST    16 // waiting for first header or last CRLF (no LWS possible)
#define HTTP_MSG_HDR_NAME     17 // parsing header name
#define HTTP_MSG_HDR_COL      18 // parsing header colon
#define HTTP_MSG_HDR_L1_SP    19 // parsing header LWS (SP|HT) before value
#define HTTP_MSG_HDR_L1_LF    20 // parsing header LWS (LF) before value
#define HTTP_MSG_HDR_L1_LWS   21 // checking whether it's a new header or an LWS
#define HTTP_MSG_HDR_VAL      22 // parsing header value
#define HTTP_MSG_HDR_L2_LF    23 // parsing header LWS (LF) inside/after value
#define HTTP_MSG_HDR_L2_LWS   24 // checking whether it's a new header or an LWS

#define HTTP_MSG_LAST_LF      25 // parsing last LF

/* error state : must be before HTTP_MSG_BODY so that (>=BODY) always indicates
 * that data are being processed.
 */

#define HTTP_MSG_ERROR        26 // an error occurred

/* Body processing.
 * The state HTTP_MSG_BODY is a delimiter to know if we're waiting for headers
 * or body. All the sub-states below also indicate we're processing the body,
 * with some additional information.
 */
#define HTTP_MSG_BODY         27 // parsing body at end of headers
#define HTTP_MSG_100_SENT     28 // parsing body after a 100-Continue was sent
#define HTTP_MSG_CHUNK_SIZE   29 // parsing the chunk size (RFC2616 #3.6.1)
#define HTTP_MSG_DATA         30 // skipping data chunk / content-length data
#define HTTP_MSG_DATA_CRLF    31 // skipping CRLF after data chunk
#define HTTP_MSG_TRAILERS     32 // trailers (post-data entity headers)


/* various data sources for the responses */
#define DATA_SRC_NONE	0
#define DATA_SRC_STATS	1

/* data transmission states for the stats responses (consecutive values from 0) */
enum {
	DATA_ST_INIT = 0,
	DATA_ST_HEAD,
	DATA_ST_INFO,
	DATA_ST_LIST,
	DATA_ST_END,
	DATA_ST_FIN,
};

/* data transmission states for the stats responses inside a proxy
 * (consecutive values from 0)
 */
enum {
	DATA_ST_PX_INIT = 0,
	DATA_ST_PX_TH,
	DATA_ST_PX_FE,
	DATA_ST_PX_LI,
	DATA_ST_PX_SV,
	DATA_ST_PX_BE,
	DATA_ST_PX_END,
	DATA_ST_PX_FIN,
};

/* Redirect flags */
enum {
	REDIRECT_FLAG_NONE = 0,
	REDIRECT_FLAG_DROP_QS = 1,	/* drop query string */
};

/* Redirect types (location, prefix, extended ) */
enum {
	REDIRECT_TYPE_NONE = 0,		/* no redirection */
	REDIRECT_TYPE_LOCATION,		/* location redirect */
	REDIRECT_TYPE_PREFIX,		/* prefix redirect */
};

/* Known HTTP methods. HTTP_METH_NONE is 0 and the remaining values follow
 * consecutively, ending with HTTP_METH_OTHER.
 */
typedef enum {
	HTTP_METH_NONE = 0,
	HTTP_METH_OPTIONS,
	HTTP_METH_GET,
	HTTP_METH_HEAD,
	HTTP_METH_POST,
	HTTP_METH_PUT,
	HTTP_METH_DELETE,
	HTTP_METH_TRACE,
	HTTP_METH_CONNECT,
	HTTP_METH_OTHER,
} http_meth_t;

/* This is an HTTP message, as described in RFC2616. It can be either a request
 * message or a response message.
 *
 * The values there are a little bit obscure, because their meaning can change
 * during the parsing :
 *
 *  - som (Start of Message) : relative offset in the buffer of first byte of
 *                             the request being processed or parsed. Reset to
 *                             zero during accept().
 *  - eoh (End of Headers)   : relative offset in the buffer of first byte that
 *                             is not part of a completely processed header.
 *                             During parsing, it points to last header seen
 *                             for states after START. When in HTTP_MSG_BODY,
 *                             eoh points to the first byte of the last CRLF
 *                             preceding data.
 *  - col and sov            : When in HTTP_MSG_BODY, will point to the first
 *                             byte of data.
 *  - eol (End of Line)      : relative offset in the buffer of the first byte
 *                             which marks the end of the line (LF or CRLF).
 *                             NOTE(review): <eol> is declared as a char pointer
 *                             below, not as an offset - confirm which is meant.
 *
 * The <sl> union holds the start line fields: <rq> for a request line, <st>
 * for a status line. Both members have the same layout (six ints).
 */
struct http_msg {
	unsigned int msg_state;                /* where we are in the current message parsing */
	unsigned int col, sov;                 /* current header: colon, start of value */
	unsigned int eoh;                      /* End Of Headers, relative to buffer */
	char *sol;                             /* start of line, also start of message when fully parsed */
	char *eol;                             /* end of line */
	unsigned int som;                      /* Start Of Message, relative to buffer */
	int err_pos;                           /* err handling: -2=block, -1=pass, 0+=detected */
	union {                                /* useful start line pointers, relative to buffer */
		struct {
			int l;                 /* request line length (not including CR) */
			int m_l;               /* METHOD length (method starts at ->som) */
			int u, u_l;            /* URI, length */
			int v, v_l;            /* VERSION, length */
		} rq;                          /* request line : field, length */
		struct {
			int l;                 /* status line length (not including CR) */
			int v_l;               /* VERSION length (version starts at ->som) */
			int c, c_l;            /* CODE, length */
			int r, r_l;            /* REASON, length */
		} st;                          /* status line : field, length */
	} sl;                                  /* start line */
	unsigned long long hdr_content_len;    /* cache for parsed header value or for chunk-size if present */
	char **cap;                            /* array of captured headers (may be NULL) */
};

267/* This is an HTTP transaction. It contains both a request message and a
268 * response message (which can be empty).
269 */
270struct http_txn {
271 http_meth_t meth; /* HTTP method */
272 struct hdr_idx hdr_idx; /* array of header indexes (max: MAX_HTTP_HDR) */
273 struct chunk auth_hdr; /* points to 'Authorization:' header */
274 struct http_msg req, rsp; /* HTTP request and response messages */
275
276 char *uri; /* first line if log needed, NULL otherwise */
277 char *cli_cookie; /* cookie presented by the client, in capture mode */
278 char *srv_cookie; /* cookie presented by the server, in capture mode */
279 int status; /* HTTP status from the server, negative if from proxy */
Willy Tarreau3d300592007-03-18 18:34:41 +0100280 unsigned int flags; /* transaction flags */
Willy Tarreau3bac9ff2007-03-18 17:31:28 +0100281};
282
/* This structure is used by http_find_header() to return values of headers.
 * The header starts at <line>, the value at <line>+<val> for <vlen> bytes.
 */
struct hdr_ctx {
	const char *line;
	int idx;
	int val;   /* relative to line */
	int vlen;  /* relative to line+val */
};

Willy Tarreaubaaee002006-06-26 02:48:02 +0200293#endif /* _TYPES_PROTO_HTTP_H */
294
/*
 * Local variables:
 *  c-indent-level: 8
 *  c-basic-offset: 8
 * End:
 */