blob: 6f083d43553aec0271fd801413dd43ce10be839b [file] [log] [blame]
/*
 * include/common/http.h
 *
 * Version-agnostic and implementation-agnostic HTTP protocol definitions.
 *
 * Copyright (C) 2000-2018 Willy Tarreau - w@1wt.eu
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation, version 2.1
 * exclusively.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 */
22
23#ifndef _COMMON_HTTP_H
24#define _COMMON_HTTP_H
25
26#include <common/buf.h>
27#include <common/ist.h>
28
/*
 * Character classification helpers, mainly used when parsing header fields.
 * Every octet is looked up in http_char_classes[] and the entry is masked
 * with one of the HTTP_FLG_* bits below.
 *
 * Classes, from RFC7230:
 *   CTL   = <any US-ASCII control character (octets 0 - 31) and DEL (127)>
 *   SEP   = one of the 17 defined separators or SP or HT
 *   LWS   = CR, LF, SP or HT
 *   SPHT  = SP or HT
 *   CRLF  = CR or LF
 *   token = any CHAR except CTL or SEP
 *
 * Added for ease of use:
 *   ver_token = 'H', 'P', 'T', '/', '.', and digits.
 *
 * For SPHT, CRLF and token in particular, use the macros and not a boolean
 * expression for best speed.
 *
 * Each HTTP_IS_*() macro evaluates to the masked bit itself: non-zero when
 * the flag is set for the character, zero otherwise. It is not normalized
 * to 0/1.
 */
#define HTTP_FLG_CTL   0x01
#define HTTP_FLG_SEP   0x02
#define HTTP_FLG_LWS   0x04
#define HTTP_FLG_SPHT  0x08
#define HTTP_FLG_CRLF  0x10
#define HTTP_FLG_TOK   0x20
#define HTTP_FLG_VER   0x40
#define HTTP_FLG_DIG   0x80

/* Masks the class table entry of octet <x> with <flg>. The cast to uint8_t
 * keeps the index within 0..255 even when <x> is a negative (signed) char.
 */
#define HTTP_CHAR_HAS_FLG(x, flg)  (http_char_classes[(uint8_t)(x)] & (flg))

#define HTTP_IS_CTL(x)        HTTP_CHAR_HAS_FLG(x, HTTP_FLG_CTL)
#define HTTP_IS_SEP(x)        HTTP_CHAR_HAS_FLG(x, HTTP_FLG_SEP)
#define HTTP_IS_LWS(x)        HTTP_CHAR_HAS_FLG(x, HTTP_FLG_LWS)
#define HTTP_IS_SPHT(x)       HTTP_CHAR_HAS_FLG(x, HTTP_FLG_SPHT)
#define HTTP_IS_CRLF(x)       HTTP_CHAR_HAS_FLG(x, HTTP_FLG_CRLF)
#define HTTP_IS_TOKEN(x)      HTTP_CHAR_HAS_FLG(x, HTTP_FLG_TOK)
#define HTTP_IS_VER_TOKEN(x)  HTTP_CHAR_HAS_FLG(x, HTTP_FLG_VER)
#define HTTP_IS_DIGIT(x)      HTTP_CHAR_HAS_FLG(x, HTTP_FLG_DIG)
59
/* Known HTTP methods. The enum is packed to keep its storage minimal.
 * HTTP_METH_OTHER closes the list and also serves as the number of entries
 * of http_known_methods[], so new methods must be inserted before it.
 */
enum http_meth_t {
	HTTP_METH_OPTIONS = 0,
	HTTP_METH_GET,
	HTTP_METH_HEAD,
	HTTP_METH_POST,
	HTTP_METH_PUT,
	HTTP_METH_DELETE,
	HTTP_METH_TRACE,
	HTTP_METH_CONNECT,

	/* Must be the last entry */
	HTTP_METH_OTHER,
} __attribute__((packed));
72
/* Known HTTP authentication schemes. The enum is packed; since it holds a
 * negative value, its underlying storage is signed.
 */
enum ht_auth_m {
	/* missing or unknown */
	HTTP_AUTH_WRONG   = -1,
	HTTP_AUTH_UNKNOWN = 0,
	HTTP_AUTH_BASIC,
	HTTP_AUTH_DIGEST,
} __attribute__((packed));
80
/* Indexes of all implemented HTTP status codes. These are consecutive values
 * starting at zero, not the status codes themselves (e.g. HTTP_ERR_400 is 1).
 * HTTP_ERR_SIZE is the number of entries and gives their dimension to
 * http_err_codes[] and http_err_msgs[]; it must remain last.
 */
enum {
	/* 2xx */
	HTTP_ERR_200 = 0,

	/* 4xx */
	HTTP_ERR_400,
	HTTP_ERR_403,
	HTTP_ERR_404,
	HTTP_ERR_405,
	HTTP_ERR_408,
	HTTP_ERR_410,
	HTTP_ERR_421,
	HTTP_ERR_425,
	HTTP_ERR_429,

	/* 5xx */
	HTTP_ERR_500,
	HTTP_ERR_502,
	HTTP_ERR_503,
	HTTP_ERR_504,

	HTTP_ERR_SIZE
};
99
100/* Note: the strings below make use of chunks. Chunks may carry an allocated
101 * size in addition to the length. The size counts from the beginning (str)
102 * to the end. If the size is unknown, it MUST be zero, in which case the
103 * sample will automatically be duplicated when a change larger than <len> has
104 * to be performed. Thus it is safe to always set size to zero.
105 */
106struct http_meth {
107 enum http_meth_t meth;
108 struct buffer str;
109};
110
111struct http_auth_data {
112 enum ht_auth_m method; /* one of HTTP_AUTH_* */
113 /* 7 bytes unused here */
114 struct buffer method_data; /* points to the creditial part from 'Authorization:' header */
115 char *user, *pass; /* extracted username & password */
116};
117
118struct http_method_desc {
119 enum http_meth_t meth;
120 const struct ist text;
121};
122
123extern const int http_err_codes[HTTP_ERR_SIZE];
Christopher Fauleta7b677c2018-11-29 16:48:49 +0100124extern const char *http_err_msgs[HTTP_ERR_SIZE];
Willy Tarreaue01d11a2019-03-29 17:52:50 +0100125extern const struct ist http_known_methods[HTTP_METH_OTHER];
Willy Tarreau35b51c62018-09-10 15:38:55 +0200126extern const uint8_t http_char_classes[256];
Willy Tarreau04f1e2d2018-09-10 18:04:24 +0200127
Willy Tarreaue01d11a2019-03-29 17:52:50 +0100128extern const struct ist HTTP_100;
129extern const struct ist HTTP_103;
Willy Tarreau04f1e2d2018-09-10 18:04:24 +0200130extern const char *HTTP_301;
Willy Tarreau35b51c62018-09-10 15:38:55 +0200131extern const char *HTTP_302;
132extern const char *HTTP_303;
Willy Tarreau04f1e2d2018-09-10 18:04:24 +0200133extern const char *HTTP_307;
134extern const char *HTTP_308;
135extern const char *HTTP_401_fmt;
136extern const char *HTTP_407_fmt;
Willy Tarreau35b51c62018-09-10 15:38:55 +0200137
/* Prototypes of the HTTP helpers implemented out of line; refer to their
 * definitions for their exact contracts. By-value parameters carry no
 * top-level "const" here since it has no effect on a function's type.
 */
enum http_meth_t find_http_meth(const char *str, int len);
int http_get_status_idx(unsigned int status);
const char *http_get_reason(unsigned int status);
struct ist http_get_authority(struct ist uri, int no_userinfo);
struct ist http_get_path(struct ist uri);
int http_header_match2(const char *hdr, const char *end,
                       const char *name, int len);
char *http_find_hdr_value_end(char *s, const char *e);
char *http_find_cookie_value_end(char *s, const char *e);
char *http_extract_cookie_value(char *hdr, const char *hdr_end,
                                char *cookie_name, size_t cookie_name_l,
                                int list, char **value, size_t *value_l);
int http_parse_qvalue(const char *qvalue, const char **end);
const char *http_find_url_param_pos(const char **chunks,
                                    const char *url_param_name,
                                    size_t url_param_name_l, char delim);
int http_find_next_url_param(const char **chunks,
                             const char *url_param_name, size_t url_param_name_l,
                             const char **vstart, const char **vend, char delim);

int http_parse_header(struct ist hdr, struct ist *name, struct ist *value);
int http_parse_stline(struct ist line, struct ist *p1, struct ist *p2, struct ist *p3);
int http_parse_status_val(struct ist value, struct ist *status, struct ist *reason);
Christopher Faulet8277ca72018-10-22 15:12:04 +0200161
/*
 * Looks for the first occurrence of <delim> within the first <path_l> bytes
 * of <path> and returns a pointer to the byte that immediately follows it,
 * i.e. the beginning of the parameter list (query string). Returns NULL if
 * <delim> is not found in that area. When <delim> is the last byte of the
 * area, the returned pointer equals path + path_l.
 *
 * Example: if path = "/foo/bar/fubar?yo=mama;ye=daddy", and path_l = 22:
 *
 * http_find_param_list(path, path_l, '?') points to "yo=mama;ye=daddy" string.
 */
static inline char *http_find_param_list(char *path, size_t path_l, char delim)
{
	char *hit = memchr(path, delim, path_l);

	if (!hit)
		return NULL;

	/* skip the delimiter itself */
	return hit + 1;
}
177
/* Returns 1 if <c> separates two parameters, that is if it is '&', ';' or the
 * caller-supplied <delim> character, otherwise 0.
 */
static inline int http_is_param_delimiter(char c, char delim)
{
	if (c == delim)
		return 1;

	switch (c) {
	case '&':
	case ';':
		return 1;
	default:
		return 0;
	}
}
182
/* Match language range with language tag. RFC2616 14.4:
 *
 *    A language-range matches a language-tag if it exactly equals
 *    the tag, or if it exactly equals a prefix of the tag such
 *    that the first tag character following the prefix is "-".
 *
 * As implemented, the comparison is byte-wise and case-sensitive, and the
 * function returns 1 when:
 *   - <range> (<range_len> bytes) exactly equals <tag> (<tag_len> bytes), or
 *   - <tag> is entirely matched by the beginning of <range> and the next
 *     character of <range> is '-' (e.g. range "en-US" with tag "en").
 * Otherwise it returns 0.
 *
 * NOTE(review): the prefix rule is applied in the direction opposite to the
 * RFC wording quoted above (the shorter string is <tag>); presumably callers
 * pass their arguments accordingly -- confirm before changing it.
 *
 * Neither string needs to be NUL-terminated, and no byte is read at or
 * beyond range + range_len or tag + tag_len.
 */
static inline int http_language_range_match(const char *range, int range_len,
                                            const char *tag, int tag_len)
{
	const char *end = range + range_len;
	const char *tend = tag + tag_len;

	while (range < end) {
		/* Check the bound before dereferencing <tag>: once the tag is
		 * exhausted, only a '-' continuing <range> is a match.
		 */
		if (tag == tend)
			return *range == '-';
		if (*range != *tag)
			return 0;
		range++;
		tag++;
	}
	/* Return true only if the last char of the tag is matched. */
	return tag == tend;
}
208
Willy Tarreau35b51c62018-09-10 15:38:55 +0200209
210#endif /* _COMMON_HTTP_H */
211
212/*
213 * Local variables:
214 * c-indent-level: 8
215 * c-basic-offset: 8
216 * End:
217 */