Blame - src/http.c - haproxy

blob: f55b6969359bec04a7d8277c5cd5f5b08f804008 [file] [log] [blame]

Willy Tarreau	35b51c6	2018-09-10 15:38:55 +0200	[diff] [blame]	1	/*
				2	* HTTP semantics
				3	*
				4	* Copyright 2000-2018 Willy Tarreau <w@1wt.eu>
				5	*
				6	* This program is free software; you can redistribute it and/or
				7	* modify it under the terms of the GNU General Public License
				8	* as published by the Free Software Foundation; either version
				9	* 2 of the License, or (at your option) any later version.
				10	*
				11	*/
				12
				13	#include <ctype.h>
Willy Tarreau	4c7e4b7	2020-05-27 12:58:42 +0200	[diff] [blame]	14	#include <haproxy/api.h>
Willy Tarreau	cd72d8c	2020-06-02 19:11:26 +0200	[diff] [blame]	15	#include <haproxy/http.h>
Willy Tarreau	48fbcae	2020-06-03 18:09:46 +0200	[diff] [blame]	16	#include <haproxy/tools.h>
Willy Tarreau	35b51c6	2018-09-10 15:38:55 +0200	[diff] [blame]	17
				18	/* It is about twice as fast on recent architectures to lookup a byte in a
				19	* table than to perform a boolean AND or OR between two tests. Refer to
				20	* RFC2616/RFC5234/RFC7230 for those chars. A token is any ASCII char that is
				21	* neither a separator nor a CTL char. An http ver_token is any ASCII which can
				22	* be found in an HTTP version, which includes 'H', 'T', 'P', '/', '.' and any
				23	* digit. Note: please do not overwrite values in assignment since gcc-2.95
				24	* will not handle them correctly. It's worth noting that chars 128..255 are
				25	* nothing, not even control chars.
				26	*/
				27	const unsigned char http_char_classes[256] = {
				28	[ 0] = HTTP_FLG_CTL,
				29	[ 1] = HTTP_FLG_CTL,
				30	[ 2] = HTTP_FLG_CTL,
				31	[ 3] = HTTP_FLG_CTL,
				32	[ 4] = HTTP_FLG_CTL,
				33	[ 5] = HTTP_FLG_CTL,
				34	[ 6] = HTTP_FLG_CTL,
				35	[ 7] = HTTP_FLG_CTL,
				36	[ 8] = HTTP_FLG_CTL,
				37	[ 9] = HTTP_FLG_SPHT \| HTTP_FLG_LWS \| HTTP_FLG_SEP \| HTTP_FLG_CTL,
				38	[ 10] = HTTP_FLG_CRLF \| HTTP_FLG_LWS \| HTTP_FLG_CTL,
				39	[ 11] = HTTP_FLG_CTL,
				40	[ 12] = HTTP_FLG_CTL,
				41	[ 13] = HTTP_FLG_CRLF \| HTTP_FLG_LWS \| HTTP_FLG_CTL,
				42	[ 14] = HTTP_FLG_CTL,
				43	[ 15] = HTTP_FLG_CTL,
				44	[ 16] = HTTP_FLG_CTL,
				45	[ 17] = HTTP_FLG_CTL,
				46	[ 18] = HTTP_FLG_CTL,
				47	[ 19] = HTTP_FLG_CTL,
				48	[ 20] = HTTP_FLG_CTL,
				49	[ 21] = HTTP_FLG_CTL,
				50	[ 22] = HTTP_FLG_CTL,
				51	[ 23] = HTTP_FLG_CTL,
				52	[ 24] = HTTP_FLG_CTL,
				53	[ 25] = HTTP_FLG_CTL,
				54	[ 26] = HTTP_FLG_CTL,
				55	[ 27] = HTTP_FLG_CTL,
				56	[ 28] = HTTP_FLG_CTL,
				57	[ 29] = HTTP_FLG_CTL,
				58	[ 30] = HTTP_FLG_CTL,
				59	[ 31] = HTTP_FLG_CTL,
				60	[' '] = HTTP_FLG_SPHT \| HTTP_FLG_LWS \| HTTP_FLG_SEP,
				61	['!'] = HTTP_FLG_TOK,
				62	['"'] = HTTP_FLG_SEP,
				63	['#'] = HTTP_FLG_TOK,
				64	['$'] = HTTP_FLG_TOK,
				65	['%'] = HTTP_FLG_TOK,
				66	['&'] = HTTP_FLG_TOK,
				67	[ 39] = HTTP_FLG_TOK,
				68	['('] = HTTP_FLG_SEP,
				69	[')'] = HTTP_FLG_SEP,
				70	['*'] = HTTP_FLG_TOK,
				71	['+'] = HTTP_FLG_TOK,
				72	[','] = HTTP_FLG_SEP,
				73	['-'] = HTTP_FLG_TOK,
				74	['.'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				75	['/'] = HTTP_FLG_SEP \| HTTP_FLG_VER,
				76	['0'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				77	['1'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				78	['2'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				79	['3'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				80	['4'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				81	['5'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				82	['6'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				83	['7'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				84	['8'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				85	['9'] = HTTP_FLG_TOK \| HTTP_FLG_VER \| HTTP_FLG_DIG,
				86	[':'] = HTTP_FLG_SEP,
				87	[';'] = HTTP_FLG_SEP,
				88	['<'] = HTTP_FLG_SEP,
				89	['='] = HTTP_FLG_SEP,
				90	['>'] = HTTP_FLG_SEP,
				91	['?'] = HTTP_FLG_SEP,
				92	['@'] = HTTP_FLG_SEP,
Willy Tarreau	1ba3016	2022-05-24 15:34:26 +0200	[diff] [blame]	93	['A'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				94	['B'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				95	['C'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				96	['D'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				97	['E'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				98	['F'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				99	['G'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
Willy Tarreau	35b51c6	2018-09-10 15:38:55 +0200	[diff] [blame]	100	['H'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
Willy Tarreau	1ba3016	2022-05-24 15:34:26 +0200	[diff] [blame]	101	['I'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				102	['J'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				103	['K'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				104	['L'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				105	['M'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				106	['N'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				107	['O'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
Willy Tarreau	35b51c6	2018-09-10 15:38:55 +0200	[diff] [blame]	108	['P'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
Willy Tarreau	1ba3016	2022-05-24 15:34:26 +0200	[diff] [blame]	109	['Q'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
Willy Tarreau	35b51c6	2018-09-10 15:38:55 +0200	[diff] [blame]	110	['R'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				111	['S'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				112	['T'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
Willy Tarreau	1ba3016	2022-05-24 15:34:26 +0200	[diff] [blame]	113	['U'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				114	['V'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				115	['W'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				116	['X'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				117	['Y'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
				118	['Z'] = HTTP_FLG_TOK \| HTTP_FLG_VER,
Willy Tarreau	35b51c6	2018-09-10 15:38:55 +0200	[diff] [blame]	119	['['] = HTTP_FLG_SEP,
				120	[ 92] = HTTP_FLG_SEP,
				121	[']'] = HTTP_FLG_SEP,
				122	['^'] = HTTP_FLG_TOK,
				123	['_'] = HTTP_FLG_TOK,
				124	['`'] = HTTP_FLG_TOK,
				125	['a'] = HTTP_FLG_TOK,
				126	['b'] = HTTP_FLG_TOK,
				127	['c'] = HTTP_FLG_TOK,
				128	['d'] = HTTP_FLG_TOK,
				129	['e'] = HTTP_FLG_TOK,
				130	['f'] = HTTP_FLG_TOK,
				131	['g'] = HTTP_FLG_TOK,
				132	['h'] = HTTP_FLG_TOK,
				133	['i'] = HTTP_FLG_TOK,
				134	['j'] = HTTP_FLG_TOK,
				135	['k'] = HTTP_FLG_TOK,
				136	['l'] = HTTP_FLG_TOK,
				137	['m'] = HTTP_FLG_TOK,
				138	['n'] = HTTP_FLG_TOK,
				139	['o'] = HTTP_FLG_TOK,
				140	['p'] = HTTP_FLG_TOK,
				141	['q'] = HTTP_FLG_TOK,
				142	['r'] = HTTP_FLG_TOK,
				143	['s'] = HTTP_FLG_TOK,
				144	['t'] = HTTP_FLG_TOK,
				145	['u'] = HTTP_FLG_TOK,
				146	['v'] = HTTP_FLG_TOK,
				147	['w'] = HTTP_FLG_TOK,
				148	['x'] = HTTP_FLG_TOK,
				149	['y'] = HTTP_FLG_TOK,
				150	['z'] = HTTP_FLG_TOK,
				151	['{'] = HTTP_FLG_SEP,
				152	['\|'] = HTTP_FLG_TOK,
				153	['}'] = HTTP_FLG_SEP,
				154	['~'] = HTTP_FLG_TOK,
				155	[127] = HTTP_FLG_CTL,
				156	};
				157
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	158	const int http_err_codes[HTTP_ERR_SIZE] = {
				159	[HTTP_ERR_200] = 200, /* used by "monitor-uri" */
				160	[HTTP_ERR_400] = 400,
Christopher Faulet	612f2ea	2020-05-27 09:57:28 +0200	[diff] [blame]	161	[HTTP_ERR_401] = 401,
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	162	[HTTP_ERR_403] = 403,
Florian Tham	9205fea	2020-01-08 13:35:30 +0100	[diff] [blame]	163	[HTTP_ERR_404] = 404,
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	164	[HTTP_ERR_405] = 405,
Christopher Faulet	612f2ea	2020-05-27 09:57:28 +0200	[diff] [blame]	165	[HTTP_ERR_407] = 407,
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	166	[HTTP_ERR_408] = 408,
Florian Tham	272e29b	2020-01-08 10:19:05 +0100	[diff] [blame]	167	[HTTP_ERR_410] = 410,
Anthonin Bonnefoy	85048f8	2020-06-22 09:17:01 +0200	[diff] [blame]	168	[HTTP_ERR_413] = 413,
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	169	[HTTP_ERR_421] = 421,
Christopher Faulet	92cafb3	2021-09-28 08:48:51 +0200	[diff] [blame]	170	[HTTP_ERR_422] = 422,
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	171	[HTTP_ERR_425] = 425,
				172	[HTTP_ERR_429] = 429,
				173	[HTTP_ERR_500] = 500,
Christopher Faulet	e095f31	2020-12-07 11:22:24 +0100	[diff] [blame]	174	[HTTP_ERR_501] = 501,
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	175	[HTTP_ERR_502] = 502,
				176	[HTTP_ERR_503] = 503,
				177	[HTTP_ERR_504] = 504,
				178	};
				179
Christopher Faulet	a7b677c	2018-11-29 16:48:49 +0100	[diff] [blame]	180	const char *http_err_msgs[HTTP_ERR_SIZE] = {
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	181	[HTTP_ERR_200] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	182	"HTTP/1.1 200 OK\r\n"
				183	"Content-length: 58\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	184	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	185	"Content-Type: text/html\r\n"
				186	"\r\n"
				187	"<html><body><h1>200 OK</h1>\nService ready.\n</body></html>\n",
				188
				189	[HTTP_ERR_400] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	190	"HTTP/1.1 400 Bad request\r\n"
				191	"Content-length: 90\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	192	"Cache-Control: no-cache\r\n"
				193	"Connection: close\r\n"
				194	"Content-Type: text/html\r\n"
				195	"\r\n"
				196	"<html><body><h1>400 Bad request</h1>\nYour browser sent an invalid request.\n</body></html>\n",
				197
Christopher Faulet	612f2ea	2020-05-27 09:57:28 +0200	[diff] [blame]	198	[HTTP_ERR_401] =
				199	"HTTP/1.1 401 Unauthorized\r\n"
				200	"Content-length: 112\r\n"
				201	"Cache-Control: no-cache\r\n"
Christopher Faulet	612f2ea	2020-05-27 09:57:28 +0200	[diff] [blame]	202	"Content-Type: text/html\r\n"
				203	"\r\n"
				204	"<html><body><h1>401 Unauthorized</h1>\nYou need a valid user and password to access this content.\n</body></html>\n",
				205
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	206	[HTTP_ERR_403] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	207	"HTTP/1.1 403 Forbidden\r\n"
				208	"Content-length: 93\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	209	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	210	"Content-Type: text/html\r\n"
				211	"\r\n"
				212	"<html><body><h1>403 Forbidden</h1>\nRequest forbidden by administrative rules.\n</body></html>\n",
				213
Florian Tham	9205fea	2020-01-08 13:35:30 +0100	[diff] [blame]	214	[HTTP_ERR_404] =
				215	"HTTP/1.1 404 Not Found\r\n"
				216	"Content-length: 83\r\n"
				217	"Cache-Control: no-cache\r\n"
Florian Tham	9205fea	2020-01-08 13:35:30 +0100	[diff] [blame]	218	"Content-Type: text/html\r\n"
				219	"\r\n"
				220	"<html><body><h1>404 Not Found</h1>\nThe resource could not be found.\n</body></html>\n",
				221
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	222	[HTTP_ERR_405] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	223	"HTTP/1.1 405 Method Not Allowed\r\n"
				224	"Content-length: 146\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	225	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	226	"Content-Type: text/html\r\n"
				227	"\r\n"
				228	"<html><body><h1>405 Method Not Allowed</h1>\nA request was made of a resource using a request method not supported by that resource\n</body></html>\n",
				229
Christopher Faulet	612f2ea	2020-05-27 09:57:28 +0200	[diff] [blame]	230	[HTTP_ERR_407] =
				231	"HTTP/1.1 407 Unauthorized\r\n"
				232	"Content-length: 112\r\n"
				233	"Cache-Control: no-cache\r\n"
Christopher Faulet	612f2ea	2020-05-27 09:57:28 +0200	[diff] [blame]	234	"Content-Type: text/html\r\n"
				235	"\r\n"
				236	"<html><body><h1>407 Unauthorized</h1>\nYou need a valid user and password to access this content.\n</body></html>\n",
				237
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	238	[HTTP_ERR_408] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	239	"HTTP/1.1 408 Request Time-out\r\n"
				240	"Content-length: 110\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	241	"Cache-Control: no-cache\r\n"
				242	"Connection: close\r\n"
				243	"Content-Type: text/html\r\n"
				244	"\r\n"
				245	"<html><body><h1>408 Request Time-out</h1>\nYour browser didn't send a complete request in time.\n</body></html>\n",
				246
Florian Tham	272e29b	2020-01-08 10:19:05 +0100	[diff] [blame]	247	[HTTP_ERR_410] =
				248	"HTTP/1.1 410 Gone\r\n"
				249	"Content-length: 114\r\n"
				250	"Cache-Control: no-cache\r\n"
Florian Tham	272e29b	2020-01-08 10:19:05 +0100	[diff] [blame]	251	"Content-Type: text/html\r\n"
				252	"\r\n"
				253	"<html><body><h1>410 Gone</h1>\nThe resource is no longer available and will not be available again.\n</body></html>\n",
				254
Anthonin Bonnefoy	85048f8	2020-06-22 09:17:01 +0200	[diff] [blame]	255	[HTTP_ERR_413] =
				256	"HTTP/1.1 413 Payload Too Large\r\n"
				257	"Content-length: 106\r\n"
				258	"Cache-Control: no-cache\r\n"
				259	"Content-Type: text/html\r\n"
				260	"\r\n"
				261	"<html><body><h1>413 Payload Too Large</h1>\nThe request entity exceeds the maximum allowed.\n</body></html>\n",
				262
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	263	[HTTP_ERR_421] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	264	"HTTP/1.1 421 Misdirected Request\r\n"
				265	"Content-length: 104\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	266	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	267	"Content-Type: text/html\r\n"
				268	"\r\n"
				269	"<html><body><h1>421 Misdirected Request</h1>\nRequest sent to a non-authoritative server.\n</body></html>\n",
				270
Christopher Faulet	92cafb3	2021-09-28 08:48:51 +0200	[diff] [blame]	271	[HTTP_ERR_422] =
				272	"HTTP/1.1 422 Unprocessable Content\r\n"
				273	"Content-length: 116\r\n"
				274	"Cache-Control: no-cache\r\n"
				275	"Content-Type: text/html\r\n"
				276	"\r\n"
				277	"<html><body><h1>422 Unprocessable Content</h1>\nThe server cannot process the contained instructions.\n</body></html>\n",
				278
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	279	[HTTP_ERR_425] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	280	"HTTP/1.1 425 Too Early\r\n"
				281	"Content-length: 80\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	282	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	283	"Content-Type: text/html\r\n"
				284	"\r\n"
				285	"<html><body><h1>425 Too Early</h1>\nYour browser sent early data.\n</body></html>\n",
				286
				287	[HTTP_ERR_429] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	288	"HTTP/1.1 429 Too Many Requests\r\n"
				289	"Content-length: 117\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	290	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	291	"Content-Type: text/html\r\n"
				292	"\r\n"
				293	"<html><body><h1>429 Too Many Requests</h1>\nYou have sent too many requests in a given amount of time.\n</body></html>\n",
				294
				295	[HTTP_ERR_500] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	296	"HTTP/1.1 500 Internal Server Error\r\n"
Christopher Faulet	5563392	2020-10-09 08:39:26 +0200	[diff] [blame]	297	"Content-length: 97\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	298	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	299	"Content-Type: text/html\r\n"
				300	"\r\n"
Ilya Shipitsin	46a030c	2020-07-05 16:36:08 +0500	[diff] [blame]	301	"<html><body><h1>500 Internal Server Error</h1>\nAn internal server error occurred.\n</body></html>\n",
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	302
Christopher Faulet	e095f31	2020-12-07 11:22:24 +0100	[diff] [blame]	303	[HTTP_ERR_501] =
				304	"HTTP/1.1 501 Not Implemented\r\n"
				305	"Content-length: 136\r\n"
				306	"Cache-Control: no-cache\r\n"
				307	"Content-Type: text/html\r\n"
				308	"\r\n"
				309	"<html><body><h1>501 Not Implemented</h1>\n.The server does not support the functionality required to fulfill the request.\n</body></html>\n",
				310
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	311	[HTTP_ERR_502] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	312	"HTTP/1.1 502 Bad Gateway\r\n"
				313	"Content-length: 107\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	314	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	315	"Content-Type: text/html\r\n"
				316	"\r\n"
				317	"<html><body><h1>502 Bad Gateway</h1>\nThe server returned an invalid or incomplete response.\n</body></html>\n",
				318
				319	[HTTP_ERR_503] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	320	"HTTP/1.1 503 Service Unavailable\r\n"
				321	"Content-length: 107\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	322	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	323	"Content-Type: text/html\r\n"
				324	"\r\n"
				325	"<html><body><h1>503 Service Unavailable</h1>\nNo server is available to handle this request.\n</body></html>\n",
				326
				327	[HTTP_ERR_504] =
Willy Tarreau	b5ba2b0	2019-06-11 16:08:25 +0200	[diff] [blame]	328	"HTTP/1.1 504 Gateway Time-out\r\n"
				329	"Content-length: 92\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	330	"Cache-Control: no-cache\r\n"
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	331	"Content-Type: text/html\r\n"
				332	"\r\n"
				333	"<html><body><h1>504 Gateway Time-out</h1>\nThe server didn't respond in time.\n</body></html>\n",
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	334	};
				335
Willy Tarreau	35b51c6	2018-09-10 15:38:55 +0200	[diff] [blame]	336	const struct ist http_known_methods[HTTP_METH_OTHER] = {
				337	[HTTP_METH_OPTIONS] = IST("OPTIONS"),
				338	[HTTP_METH_GET] = IST("GET"),
				339	[HTTP_METH_HEAD] = IST("HEAD"),
				340	[HTTP_METH_POST] = IST("POST"),
				341	[HTTP_METH_PUT] = IST("PUT"),
				342	[HTTP_METH_DELETE] = IST("DELETE"),
				343	[HTTP_METH_TRACE] = IST("TRACE"),
				344	[HTTP_METH_CONNECT] = IST("CONNECT"),
				345	};
				346
				347	/*
				348	* returns a known method among HTTP_METH_* or HTTP_METH_OTHER for all unknown
				349	* ones.
				350	*/
				351	enum http_meth_t find_http_meth(const char *str, const int len)
				352	{
				353	const struct ist m = ist2(str, len);
				354
				355	if (isteq(m, ist("GET"))) return HTTP_METH_GET;
				356	else if (isteq(m, ist("HEAD"))) return HTTP_METH_HEAD;
				357	else if (isteq(m, ist("POST"))) return HTTP_METH_POST;
				358	else if (isteq(m, ist("CONNECT"))) return HTTP_METH_CONNECT;
				359	else if (isteq(m, ist("PUT"))) return HTTP_METH_PUT;
				360	else if (isteq(m, ist("OPTIONS"))) return HTTP_METH_OPTIONS;
				361	else if (isteq(m, ist("DELETE"))) return HTTP_METH_DELETE;
				362	else if (isteq(m, ist("TRACE"))) return HTTP_METH_TRACE;
				363	else return HTTP_METH_OTHER;
				364	}
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	365
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	366	/* This function returns HTTP_ERR_<num> (enum) matching http status code.
				367	* Returned value should match codes from http_err_codes.
				368	*/
Willy Tarreau	8de1df9	2019-04-15 21:27:18 +0200	[diff] [blame]	369	int http_get_status_idx(unsigned int status)
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	370	{
				371	switch (status) {
				372	case 200: return HTTP_ERR_200;
				373	case 400: return HTTP_ERR_400;
Christopher Faulet	612f2ea	2020-05-27 09:57:28 +0200	[diff] [blame]	374	case 401: return HTTP_ERR_401;
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	375	case 403: return HTTP_ERR_403;
Florian Tham	9205fea	2020-01-08 13:35:30 +0100	[diff] [blame]	376	case 404: return HTTP_ERR_404;
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	377	case 405: return HTTP_ERR_405;
Christopher Faulet	612f2ea	2020-05-27 09:57:28 +0200	[diff] [blame]	378	case 407: return HTTP_ERR_407;
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	379	case 408: return HTTP_ERR_408;
Florian Tham	272e29b	2020-01-08 10:19:05 +0100	[diff] [blame]	380	case 410: return HTTP_ERR_410;
Anthonin Bonnefoy	85048f8	2020-06-22 09:17:01 +0200	[diff] [blame]	381	case 413: return HTTP_ERR_413;
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	382	case 421: return HTTP_ERR_421;
Christopher Faulet	92cafb3	2021-09-28 08:48:51 +0200	[diff] [blame]	383	case 422: return HTTP_ERR_422;
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	384	case 425: return HTTP_ERR_425;
				385	case 429: return HTTP_ERR_429;
				386	case 500: return HTTP_ERR_500;
Christopher Faulet	e095f31	2020-12-07 11:22:24 +0100	[diff] [blame]	387	case 501: return HTTP_ERR_501;
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	388	case 502: return HTTP_ERR_502;
				389	case 503: return HTTP_ERR_503;
				390	case 504: return HTTP_ERR_504;
				391	default: return HTTP_ERR_500;
				392	}
				393	}
				394
				395	/* This function returns a reason associated with the HTTP status.
				396	* This function never fails, a message is always returned.
				397	*/
				398	const char *http_get_reason(unsigned int status)
				399	{
				400	switch (status) {
				401	case 100: return "Continue";
				402	case 101: return "Switching Protocols";
				403	case 102: return "Processing";
				404	case 200: return "OK";
				405	case 201: return "Created";
				406	case 202: return "Accepted";
				407	case 203: return "Non-Authoritative Information";
				408	case 204: return "No Content";
				409	case 205: return "Reset Content";
				410	case 206: return "Partial Content";
				411	case 207: return "Multi-Status";
				412	case 210: return "Content Different";
				413	case 226: return "IM Used";
				414	case 300: return "Multiple Choices";
				415	case 301: return "Moved Permanently";
				416	case 302: return "Moved Temporarily";
				417	case 303: return "See Other";
				418	case 304: return "Not Modified";
				419	case 305: return "Use Proxy";
				420	case 307: return "Temporary Redirect";
				421	case 308: return "Permanent Redirect";
				422	case 310: return "Too many Redirects";
				423	case 400: return "Bad Request";
				424	case 401: return "Unauthorized";
				425	case 402: return "Payment Required";
				426	case 403: return "Forbidden";
				427	case 404: return "Not Found";
				428	case 405: return "Method Not Allowed";
				429	case 406: return "Not Acceptable";
				430	case 407: return "Proxy Authentication Required";
				431	case 408: return "Request Time-out";
				432	case 409: return "Conflict";
				433	case 410: return "Gone";
				434	case 411: return "Length Required";
				435	case 412: return "Precondition Failed";
				436	case 413: return "Request Entity Too Large";
				437	case 414: return "Request-URI Too Long";
				438	case 415: return "Unsupported Media Type";
				439	case 416: return "Requested range unsatisfiable";
				440	case 417: return "Expectation failed";
				441	case 418: return "I'm a teapot";
				442	case 421: return "Misdirected Request";
Christopher Faulet	92cafb3	2021-09-28 08:48:51 +0200	[diff] [blame]	443	case 422: return "Unprocessable Content";
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	444	case 423: return "Locked";
				445	case 424: return "Method failure";
				446	case 425: return "Too Early";
				447	case 426: return "Upgrade Required";
				448	case 428: return "Precondition Required";
				449	case 429: return "Too Many Requests";
				450	case 431: return "Request Header Fields Too Large";
				451	case 449: return "Retry With";
				452	case 450: return "Blocked by Windows Parental Controls";
				453	case 451: return "Unavailable For Legal Reasons";
				454	case 456: return "Unrecoverable Error";
				455	case 499: return "client has closed connection";
				456	case 500: return "Internal Server Error";
				457	case 501: return "Not Implemented";
				458	case 502: return "Bad Gateway or Proxy Error";
				459	case 503: return "Service Unavailable";
				460	case 504: return "Gateway Time-out";
				461	case 505: return "HTTP Version not supported";
Ilya Shipitsin	46a030c	2020-07-05 16:36:08 +0500	[diff] [blame]	462	case 506: return "Variant also negotiate";
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	463	case 507: return "Insufficient storage";
				464	case 508: return "Loop detected";
				465	case 509: return "Bandwidth Limit Exceeded";
				466	case 510: return "Not extended";
				467	case 511: return "Network authentication required";
				468	case 520: return "Web server is returning an unknown error";
				469	default:
				470	switch (status) {
				471	case 100 ... 199: return "Informational";
				472	case 200 ... 299: return "Success";
				473	case 300 ... 399: return "Redirection";
				474	case 400 ... 499: return "Client Error";
				475	case 500 ... 599: return "Server Error";
				476	default: return "Other";
				477	}
				478	}
				479	}
				480
Christopher Faulet	658f971	2022-07-05 09:48:39 +0200	[diff] [blame]	481	/* Returns the ist string corresponding to port part (without ':') in the host
Christopher Faulet	99ade9e	2022-11-21 18:57:49 +0100	[diff] [blame]	482	* <host>, IST_NULL if no ':' is found or an empty IST if there is no digit. In
Ilya Shipitsin	6f86eaa	2022-11-30 16:22:42 +0500	[diff] [blame]	483	* the last case, the result is the original ist trimmed to 0. So be sure to test
Christopher Faulet	99ade9e	2022-11-21 18:57:49 +0100	[diff] [blame]	484	* the result length before doing any pointer arithmetic.
Christopher Faulet	658f971	2022-07-05 09:48:39 +0200	[diff] [blame]	485	*/
				486	struct ist http_get_host_port(const struct ist host)
				487	{
				488	char start, end, *ptr;
				489
				490	start = istptr(host);
				491	end = istend(host);
				492	for (ptr = end; ptr > start && isdigit((unsigned char)*--ptr););
				493
				494	/* no port found */
Christopher Faulet	99ade9e	2022-11-21 18:57:49 +0100	[diff] [blame]	495	if (likely(*ptr != ':'))
Christopher Faulet	658f971	2022-07-05 09:48:39 +0200	[diff] [blame]	496	return IST_NULL;
Christopher Faulet	99ade9e	2022-11-21 18:57:49 +0100	[diff] [blame]	497	if (ptr+1 == end)
				498	return isttrim(host, 0);
Christopher Faulet	658f971	2022-07-05 09:48:39 +0200	[diff] [blame]	499
				500	return istnext(ist2(ptr, end - ptr));
				501	}
				502
Christopher Faulet	ca7218a	2022-07-05 09:53:37 +0200	[diff] [blame]	503
				504	/* Return non-zero if the port <port> is a default port. If the scheme <schm> is
				505	* set, it is used to detect default ports (HTTP => 80 and HTTPS => 443)
				506	* port. Otherwise, both are considered as default ports.
				507	*/
				508	int http_is_default_port(const struct ist schm, const struct ist port)
				509	{
Christopher Faulet	99ade9e	2022-11-21 18:57:49 +0100	[diff] [blame]	510	if (!istlen(port))
				511	return 1;
				512
Christopher Faulet	ca7218a	2022-07-05 09:53:37 +0200	[diff] [blame]	513	if (!isttest(schm))
				514	return (isteq(port, ist("443")) \|\| isteq(port, ist("80")));
				515	else
				516	return (isteq(port, ist("443")) && isteqi(schm, ist("https://"))) \|\|
				517	(isteq(port, ist("80")) && isteqi(schm, ist("http://")));
				518	}
				519
Willy Tarreau	d3d8d03	2021-08-10 15:35:36 +0200	[diff] [blame]	520	/* Returns non-zero if the scheme <schm> is syntactically correct according to
				521	* RFC3986#3.1, otherwise zero. It expects only the scheme and nothing else
				522	* (particularly not the following "://").
				523	* Scheme = alpha *(alpha\|digit\|'+'\|'-'\|'.')
				524	*/
				525	int http_validate_scheme(const struct ist schm)
				526	{
				527	size_t i;
				528
				529	for (i = 0; i < schm.len; i++) {
				530	if (likely((schm.ptr[i] >= 'a' && schm.ptr[i] <= 'z') \|\|
				531	(schm.ptr[i] >= 'A' && schm.ptr[i] <= 'Z')))
				532	continue;
				533	if (unlikely(!i)) // first char must be alpha
				534	return 0;
				535	if ((schm.ptr[i] >= '0' && schm.ptr[i] <= '9') \|\|
				536	schm.ptr[i] == '+' \|\| schm.ptr[i] == '-' \|\| schm.ptr[i] == '.')
				537	continue;
				538	return 0;
				539	}
				540	return !!i;
				541	}
				542
Amaury Denoyelle	ef08811	2021-07-07 10:49:25 +0200	[diff] [blame]	543	/* Parse the uri and looks for the scheme. If not found, an empty ist is
				544	* returned. Otherwise, the ist pointing to the scheme is returned.
Amaury Denoyelle	8ac8cbf	2021-07-06 10:52:58 +0200	[diff] [blame]	545	*
				546	* <parser> must have been initialized via http_uri_parser_init. See the
				547	* related http_uri_parser documentation for the specific API usage.
Amaury Denoyelle	ef08811	2021-07-07 10:49:25 +0200	[diff] [blame]	548	*/
Amaury Denoyelle	8ac8cbf	2021-07-06 10:52:58 +0200	[diff] [blame]	549	struct ist http_parse_scheme(struct http_uri_parser *parser)
Amaury Denoyelle	ef08811	2021-07-07 10:49:25 +0200	[diff] [blame]	550	{
				551	const char ptr, start, *end;
				552
Amaury Denoyelle	8ac8cbf	2021-07-06 10:52:58 +0200	[diff] [blame]	553	if (parser->state >= URI_PARSER_STATE_SCHEME_DONE)
Amaury Denoyelle	ef08811	2021-07-07 10:49:25 +0200	[diff] [blame]	554	goto not_found;
				555
Amaury Denoyelle	8ac8cbf	2021-07-06 10:52:58 +0200	[diff] [blame]	556	if (parser->format != URI_PARSER_FORMAT_ABSURI_OR_AUTHORITY)
Amaury Denoyelle	ef08811	2021-07-07 10:49:25 +0200	[diff] [blame]	557	goto not_found;
				558
Amaury Denoyelle	8ac8cbf	2021-07-06 10:52:58 +0200	[diff] [blame]	559	ptr = start = istptr(parser->uri);
				560	end = istend(parser->uri);
				561
Amaury Denoyelle	ef08811	2021-07-07 10:49:25 +0200	[diff] [blame]	562	if (isalpha((unsigned char)*ptr)) {
				563	/* this is a scheme as described by RFC3986, par. 3.1, or only
				564	* an authority (in case of a CONNECT method).
				565	*/
				566	ptr++;
				567	/* retrieve the scheme up to the suffix '://'. If the suffix is
				568	* not found, this means there is no scheme and it is an
				569	* authority-only uri.
				570	*/
				571	while (ptr < end &&
				572	(isalnum((unsigned char)ptr) \|\| ptr == '+' \|\| ptr == '-' \|\| ptr == '.'))
				573	ptr++;
				574	if (ptr == end \|\| *ptr++ != ':')
				575	goto not_found;
				576	if (ptr == end \|\| *ptr++ != '/')
				577	goto not_found;
				578	if (ptr == end \|\| *ptr++ != '/')
				579	goto not_found;
				580	}
				581	else {
				582	goto not_found;
				583	}
				584
Amaury Denoyelle	8ac8cbf	2021-07-06 10:52:58 +0200	[diff] [blame]	585	parser->uri = ist2(ptr, end - ptr);
				586	parser->state = URI_PARSER_STATE_SCHEME_DONE;
Amaury Denoyelle	ef08811	2021-07-07 10:49:25 +0200	[diff] [blame]	587	return ist2(start, ptr - start);
				588
				589	not_found:
Amaury Denoyelle	8ac8cbf	2021-07-06 10:52:58 +0200	[diff] [blame]	590	parser->state = URI_PARSER_STATE_SCHEME_DONE;
Amaury Denoyelle	ef08811	2021-07-07 10:49:25 +0200	[diff] [blame]	591	return IST_NULL;
				592	}
				593
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	594	/* Parse the uri and looks for the authority, between the scheme and the
				595	* path. if no_userinfo is not zero, the part before the '@' (including it) is
				596	* skipped. If not found, an empty ist is returned. Otherwise, the ist pointing
				597	* on the authority is returned.
Amaury Denoyelle	69294b2	2021-07-06 11:02:22 +0200	[diff] [blame]	598	*
				599	* <parser> must have been initialized via http_uri_parser_init. See the
				600	* related http_uri_parser documentation for the specific API usage.
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	601	*/
Amaury Denoyelle	69294b2	2021-07-06 11:02:22 +0200	[diff] [blame]	602	struct ist http_parse_authority(struct http_uri_parser *parser, int no_userinfo)
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	603	{
				604	const char ptr, start, *end;
				605
Amaury Denoyelle	69294b2	2021-07-06 11:02:22 +0200	[diff] [blame]	606	if (parser->state >= URI_PARSER_STATE_AUTHORITY_DONE)
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	607	goto not_found;
				608
Amaury Denoyelle	69294b2	2021-07-06 11:02:22 +0200	[diff] [blame]	609	if (parser->format != URI_PARSER_FORMAT_ABSURI_OR_AUTHORITY)
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	610	goto not_found;
				611
Amaury Denoyelle	69294b2	2021-07-06 11:02:22 +0200	[diff] [blame]	612	if (parser->state < URI_PARSER_STATE_SCHEME_DONE)
				613	http_parse_scheme(parser);
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	614
Amaury Denoyelle	69294b2	2021-07-06 11:02:22 +0200	[diff] [blame]	615	ptr = start = istptr(parser->uri);
				616	end = istend(parser->uri);
				617
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	618	while (ptr < end && *ptr != '/') {
				619	if (*ptr++ == '@' && no_userinfo)
				620	start = ptr;
				621	}
				622
				623	/* OK, ptr point on the '/' or the end */
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	624
				625	authority:
Amaury Denoyelle	69294b2	2021-07-06 11:02:22 +0200	[diff] [blame]	626	parser->uri = ist2(ptr, end - ptr);
				627	parser->state = URI_PARSER_STATE_AUTHORITY_DONE;
				628	return ist2(start, ptr - start);
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	629
				630	not_found:
Amaury Denoyelle	69294b2	2021-07-06 11:02:22 +0200	[diff] [blame]	631	parser->state = URI_PARSER_STATE_AUTHORITY_DONE;
Tim Duesterhus	241e29e	2020-03-05 17:56:30 +0100	[diff] [blame]	632	return IST_NULL;
Christopher Faulet	16fdc55	2019-10-08 14:56:58 +0200	[diff] [blame]	633	}
				634
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	635	/* Parse the URI from the given transaction (which is assumed to be in request
				636	* phase) and look for the "/" beginning the PATH. If not found, ist2(0,0) is
				637	* returned. Otherwise the pointer and length are returned.
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	638	*
				639	* <parser> must have been initialized via http_uri_parser_init. See the
				640	* related http_uri_parser documentation for the specific API usage.
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	641	*/
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	642	struct ist http_parse_path(struct http_uri_parser *parser)
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	643	{
				644	const char ptr, end;
				645
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	646	if (parser->state >= URI_PARSER_STATE_PATH_DONE)
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	647	goto not_found;
				648
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	649	if (parser->format == URI_PARSER_FORMAT_EMPTY \|\|
				650	parser->format == URI_PARSER_FORMAT_ASTERISK) {
				651	goto not_found;
				652	}
				653
				654	ptr = istptr(parser->uri);
				655	end = istend(parser->uri);
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	656
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	657	/* If the uri is in absolute-path format, first skip the scheme and
				658	* authority parts. No scheme will be found if the uri is in authority
				659	* format, which indicates that the path won't be present.
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	660	*/
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	661	if (parser->format == URI_PARSER_FORMAT_ABSURI_OR_AUTHORITY) {
				662	if (parser->state < URI_PARSER_STATE_SCHEME_DONE) {
				663	/* If no scheme found, uri is in authority format. No
				664	* path is present.
				665	*/
				666	if (!isttest(http_parse_scheme(parser)))
				667	goto not_found;
				668	}
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	669
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	670	if (parser->state < URI_PARSER_STATE_AUTHORITY_DONE)
				671	http_parse_authority(parser, 1);
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	672
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	673	ptr = istptr(parser->uri);
				674
				675	if (ptr == end)
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	676	goto not_found;
				677	}
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	678
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	679	parser->state = URI_PARSER_STATE_PATH_DONE;
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	680	return ist2(ptr, end - ptr);
				681
				682	not_found:
Amaury Denoyelle	c453f95	2021-07-06 11:40:12 +0200	[diff] [blame]	683	parser->state = URI_PARSER_STATE_PATH_DONE;
Tim Duesterhus	241e29e	2020-03-05 17:56:30 +0100	[diff] [blame]	684	return IST_NULL;
Willy Tarreau	6b952c8	2018-09-10 17:45:34 +0200	[diff] [blame]	685	}
Willy Tarreau	04f1e2d	2018-09-10 18:04:24 +0200	[diff] [blame]	686
Amaury Denoyelle	15f3cc4	2022-12-08 16:53:58 +0100	[diff] [blame]	687	/* Parse <value> Content-Length header field of an HTTP request. The function
				688	* checks all possible occurrences of a comma-delimited value, and verifies if
				689	* any of them doesn't match a previous value. <value> is sanitized on return
				690	* to contain a single value if several identical values were found.
				691	*
				692	* <body_len> must be a valid pointer and is used to return the parsed length
				693	* unless values differ. Also if <not_first> is true, <body_len> is assumed to
				694	* point to previously parsed value and which must be equal to the new length.
				695	* This is useful if an HTTP message contains several Content-Length headers.
				696	*
				697	* Returns <0 if a value differs, 0 if the whole header can be dropped (i.e.
				698	* already known), or >0 if the value can be indexed (first one). In the last
				699	* case, the value might be adjusted and the caller must only add the updated
				700	* value.
				701	*/
				702	int http_parse_cont_len_header(struct ist value, unsigned long long body_len,
				703	int not_first)
				704	{
				705	char e, n;
				706	unsigned long long cl;
				707	struct ist word;
				708	int check_prev = not_first;
				709
				710	word.ptr = value->ptr - 1; // -1 for next loop's pre-increment
				711	e = value->ptr + value->len;
				712
				713	while (++word.ptr < e) {
				714	/* skip leading delimiter and blanks */
				715	if (unlikely(HTTP_IS_LWS(*word.ptr)))
				716	continue;
				717
				718	/* digits only now */
				719	for (cl = 0, n = word.ptr; n < e; n++) {
				720	unsigned int c = *n - '0';
				721	if (unlikely(c > 9)) {
				722	/* non-digit */
				723	if (unlikely(n == word.ptr)) // spaces only
				724	goto fail;
				725	break;
				726	}
				727	if (unlikely(cl > ULLONG_MAX / 10ULL))
				728	goto fail; /* multiply overflow */
				729	cl = cl * 10ULL;
				730	if (unlikely(cl + c < cl))
				731	goto fail; /* addition overflow */
				732	cl = cl + c;
				733	}
				734
				735	/* keep a copy of the exact cleaned value */
				736	word.len = n - word.ptr;
				737
				738	/* skip trailing LWS till next comma or EOL */
				739	for (; n < e; n++) {
				740	if (!HTTP_IS_LWS(*n)) {
				741	if (unlikely(*n != ','))
				742	goto fail;
				743	break;
				744	}
				745	}
				746
				747	/* if duplicate, must be equal */
				748	if (check_prev && cl != *body_len)
				749	goto fail;
				750
				751	/* OK, store this result as the one to be indexed */
				752	*body_len = cl;
				753	*value = word;
				754	word.ptr = n;
				755	check_prev = 1;
				756	}
				757
				758	/* here we've reached the end with a single value or a series of
				759	* identical values, all matching previous series if any. The last
				760	* parsed value was sent back into <value>. We just have to decide
				761	* if this occurrence has to be indexed (it's the first one) or
				762	* silently skipped (it's not the first one)
				763	*/
				764	return !not_first;
				765	fail:
				766	return -1;
				767	}
				768
/*
 * Checks whether the header starting at <hdr> and bounded by <end> is named
 * exactly <name> (<len> chars, compared case-insensitively) and is
 * immediately followed by a colon.
 *
 * Returns 0 when the name does not match or when there is no room for the
 * colon before <end>. Otherwise returns the offset, relative to <hdr>, of the
 * first character after the colon which is neither a space nor a tab. When
 * only spaces/tabs (or nothing) follow the colon, <len>+2 is returned if that
 * offset still fits before <end>, so that a value may be written after the
 * first space; failing that, <end>-<hdr> is returned.
 */
int http_header_match2(const char *hdr, const char *end,
                       const char *name, int len)
{
	const char *val;

	/* the colon itself must lie before <end> */
	if (hdr + len >= end)
		return 0;
	if (hdr[len] != ':')
		return 0;
	if (strncasecmp(hdr, name, len) != 0)
		return 0;

	val = hdr + len + 1;
	while (val < end && HTTP_IS_SPHT(*val))
		val++;

	if ((val >= end) && (len + 2 <= end - hdr))
		return len + 2; /* we may replace starting from second space */
	return val - hdr;
}
				794
				795	/* Find the end of the header value contained between <s> and <e>. See RFC7230,
				796	* par 3.2 for more information. Note that it requires a valid header to return
				797	* a valid result. This works for headers defined as comma-separated lists.
				798	*/
				799	char http_find_hdr_value_end(char s, const char *e)
				800	{
				801	int quoted, qdpair;
				802
				803	quoted = qdpair = 0;
				804
Willy Tarreau	02ac950	2020-02-21 16:31:22 +0100	[diff] [blame]	805	#ifdef HA_UNALIGNED_LE
Willy Tarreau	ab813a4	2018-09-10 18:41:28 +0200	[diff] [blame]	806	/* speedup: skip everything not a comma nor a double quote */
				807	for (; s <= e - sizeof(int); s += sizeof(int)) {
				808	unsigned int c = (int )s; // comma
				809	unsigned int q = c; // quote
				810
				811	c ^= 0x2c2c2c2c; // contains one zero on a comma
				812	q ^= 0x22222222; // contains one zero on a quote
				813
				814	c = (c - 0x01010101) & ~c; // contains 0x80 below a comma
				815	q = (q - 0x01010101) & ~q; // contains 0x80 below a quote
				816
				817	if ((c \| q) & 0x80808080)
				818	break; // found a comma or a quote
				819	}
				820	#endif
				821	for (; s < e; s++) {
				822	if (qdpair) qdpair = 0;
				823	else if (quoted) {
				824	if (*s == '\\') qdpair = 1;
				825	else if (*s == '"') quoted = 0;
				826	}
				827	else if (*s == '"') quoted = 1;
				828	else if (*s == ',') return s;
				829	}
				830	return s;
				831	}
				832
				833	/* Find the end of a cookie value contained between <s> and <e>. It works the
				834	* same way as with headers above except that the semi-colon also ends a token.
				835	* See RFC2965 for more information. Note that it requires a valid header to
				836	* return a valid result.
				837	*/
				838	char http_find_cookie_value_end(char s, const char *e)
				839	{
				840	int quoted, qdpair;
				841
				842	quoted = qdpair = 0;
				843	for (; s < e; s++) {
				844	if (qdpair) qdpair = 0;
				845	else if (quoted) {
				846	if (*s == '\\') qdpair = 1;
				847	else if (*s == '"') quoted = 0;
				848	}
				849	else if (*s == '"') quoted = 1;
				850	else if (s == ',' \|\| s == ';') return s;
				851	}
				852	return s;
				853	}
				854
				855	/* Try to find the next occurrence of a cookie name in a cookie header value.
Maciej Zdeb	dea7c20	2020-11-13 09:38:06 +0000	[diff] [blame]	856	* To match on any cookie name, <cookie_name_l> must be set to 0.
Willy Tarreau	ab813a4	2018-09-10 18:41:28 +0200	[diff] [blame]	857	* The lookup begins at <hdr>. The pointer and size of the next occurrence of
				858	* the cookie value is returned into value and value_l, and the function
				859	* returns a pointer to the next pointer to search from if the value was found.
				860	* Otherwise if the cookie was not found, NULL is returned and neither value
				861	* nor value_l are touched. The input <hdr> string should first point to the
				862	* header's value, and the <hdr_end> pointer must point to the first character
				863	* not part of the value. <list> must be non-zero if value may represent a list
				864	* of values (cookie headers). This makes it faster to abort parsing when no
				865	* list is expected.
				866	*/
				867	char http_extract_cookie_value(char hdr, const char *hdr_end,
				868	char *cookie_name, size_t cookie_name_l,
				869	int list, char *value, size_t value_l)
				870	{
				871	char equal, att_end, att_beg, val_beg, *val_end;
				872	char *next;
				873
				874	/* we search at least a cookie name followed by an equal, and more
				875	* generally something like this :
				876	* Cookie: NAME1 = VALUE 1 ; NAME2 = VALUE2 ; NAME3 = VALUE3\r\n
				877	*/
				878	for (att_beg = hdr; att_beg + cookie_name_l + 1 < hdr_end; att_beg = next + 1) {
				879	/* Iterate through all cookies on this line */
				880
				881	while (att_beg < hdr_end && HTTP_IS_SPHT(*att_beg))
				882	att_beg++;
				883
				884	/* find att_end : this is the first character after the last non
				885	* space before the equal. It may be equal to hdr_end.
				886	*/
				887	equal = att_end = att_beg;
				888
				889	while (equal < hdr_end) {
				890	if (equal == '=' \|\| equal == ';' \|\| (list && *equal == ','))
				891	break;
				892	if (HTTP_IS_SPHT(*equal++))
				893	continue;
				894	att_end = equal;
				895	}
				896
Ilya Shipitsin	46a030c	2020-07-05 16:36:08 +0500	[diff] [blame]	897	/* here, <equal> points to '=', a delimiter or the end. <att_end>
Willy Tarreau	ab813a4	2018-09-10 18:41:28 +0200	[diff] [blame]	898	* is between <att_beg> and <equal>, both may be identical.
				899	*/
				900
				901	/* look for end of cookie if there is an equal sign */
				902	if (equal < hdr_end && *equal == '=') {
				903	/* look for the beginning of the value */
				904	val_beg = equal + 1;
				905	while (val_beg < hdr_end && HTTP_IS_SPHT(*val_beg))
				906	val_beg++;
				907
				908	/* find the end of the value, respecting quotes */
				909	next = http_find_cookie_value_end(val_beg, hdr_end);
				910
Ilya Shipitsin	46a030c	2020-07-05 16:36:08 +0500	[diff] [blame]	911	/* make val_end point to the first white space or delimiter after the value */
Willy Tarreau	ab813a4	2018-09-10 18:41:28 +0200	[diff] [blame]	912	val_end = next;
				913	while (val_end > val_beg && HTTP_IS_SPHT(*(val_end - 1)))
				914	val_end--;
				915	} else {
				916	val_beg = val_end = next = equal;
				917	}
				918
				919	/* We have nothing to do with attributes beginning with '$'. However,
				920	* they will automatically be removed if a header before them is removed,
				921	* since they're supposed to be linked together.
				922	*/
				923	if (*att_beg == '$')
				924	continue;
				925
				926	/* Ignore cookies with no equal sign */
				927	if (equal == next)
				928	continue;
				929
				930	/* Now we have the cookie name between att_beg and att_end, and
				931	* its value between val_beg and val_end.
				932	*/
				933
Maciej Zdeb	dea7c20	2020-11-13 09:38:06 +0000	[diff] [blame]	934	if (cookie_name_l == 0 \|\| (att_end - att_beg == cookie_name_l &&
				935	memcmp(att_beg, cookie_name, cookie_name_l) == 0)) {
Willy Tarreau	ab813a4	2018-09-10 18:41:28 +0200	[diff] [blame]	936	/* let's return this value and indicate where to go on from */
				937	*value = val_beg;
				938	*value_l = val_end - val_beg;
				939	return next + 1;
				940	}
				941
				942	/* Set-Cookie headers only have the name in the first attr=value part */
				943	if (!list)
				944	break;
				945	}
				946
				947	return NULL;
				948	}
				949
/* Parses a qvalue and returns it multiplied by 1000, from 0 to 1000. If the
 * value is larger than 1000, it is bound to 1000. The parser consumes up to
 * 1 digit, one dot and 3 digits and stops on the first invalid character.
 * Unparsable qvalues return 1000 as "q=1.000".
 *
 * If <end> is not NULL, it is set to point to the first character which was
 * not consumed, i.e. the invalid character itself when there is one. The
 * input is not bounded: the caller must make sure a non-digit character
 * follows the value.
 */
int http_parse_qvalue(const char *qvalue, const char **end)
{
	int q = 1000;

	if (!isdigit((unsigned char)*qvalue))
		goto out;
	q = (*qvalue++ - '0') * 1000;

	/* only step over the dot when it really is one, so that <end> never
	 * goes past the character which stopped the parsing.
	 */
	if (*qvalue != '.')
		goto out;
	qvalue++;

	if (!isdigit((unsigned char)*qvalue))
		goto out;
	q += (*qvalue++ - '0') * 100;

	if (!isdigit((unsigned char)*qvalue))
		goto out;
	q += (*qvalue++ - '0') * 10;

	if (!isdigit((unsigned char)*qvalue))
		goto out;
	q += (*qvalue++ - '0') * 1;
 out:
	if (q > 1000)
		q = 1000;
	if (end)
		*end = qvalue;
	return q;
}
				984
				985	/*
Joseph Herlant	942eea3	2018-11-15 13:57:22 -0800	[diff] [blame]	986	* Given a url parameter, find the starting position of the first occurrence,
Willy Tarreau	ab813a4	2018-09-10 18:41:28 +0200	[diff] [blame]	987	* or NULL if the parameter is not found.
				988	*
				989	* Example: if query_string is "yo=mama;ye=daddy" and url_param_name is "ye",
				990	* the function will return query_string+8.
				991	*
				992	* Warning: this function returns a pointer that can point to the first chunk
				993	* or the second chunk. The caller must be check the position before using the
				994	* result.
				995	*/
				996	const char http_find_url_param_pos(const char *chunks,
				997	const char* url_param_name, size_t url_param_name_l,
				998	char delim)
				999	{
				1000	const char pos, last, *equal;
				1001	const char **bufs = chunks;
				1002	int l1, l2;
				1003
				1004
				1005	pos = bufs[0];
				1006	last = bufs[1];
				1007	while (pos < last) {
				1008	/* Check the equal. */
				1009	equal = pos + url_param_name_l;
				1010	if (fix_pointer_if_wrap(chunks, &equal)) {
				1011	if (equal >= chunks[3])
				1012	return NULL;
				1013	} else {
				1014	if (equal >= chunks[1])
				1015	return NULL;
				1016	}
				1017	if (*equal == '=') {
				1018	if (pos + url_param_name_l > last) {
				1019	/* process wrap case, we detect a wrap. In this case, the
				1020	* comparison is performed in two parts.
				1021	*/
				1022
Thayne McCombs	8f0cc5c	2021-01-07 21:35:52 -0700	[diff] [blame]	1023	/* This is the end, we don't have any other chunk. */
Willy Tarreau	ab813a4	2018-09-10 18:41:28 +0200	[diff] [blame]	1024	if (bufs != chunks \|\| !bufs[2])
				1025	return NULL;
				1026
				1027	/* Compute the length of each part of the comparison. */
				1028	l1 = last - pos;
				1029	l2 = url_param_name_l - l1;
				1030
				1031	/* The second buffer is too short to contain the compared string. */
				1032	if (bufs[2] + l2 > bufs[3])
				1033	return NULL;
				1034
				1035	if (memcmp(pos, url_param_name, l1) == 0 &&
				1036	memcmp(bufs[2], url_param_name+l1, l2) == 0)
				1037	return pos;
				1038
				1039	/* Perform wrapping and jump the string who fail the comparison. */
				1040	bufs += 2;
				1041	pos = bufs[0] + l2;
				1042	last = bufs[1];
				1043
				1044	} else {
				1045	/* process a simple comparison. */
				1046	if (memcmp(pos, url_param_name, url_param_name_l) == 0)
				1047	return pos;
				1048	pos += url_param_name_l + 1;
				1049	if (fix_pointer_if_wrap(chunks, &pos))
				1050	last = bufs[2];
				1051	}
				1052	}
				1053
				1054	while (1) {
				1055	/* Look for the next delimiter. */
				1056	while (pos < last && !http_is_param_delimiter(*pos, delim))
				1057	pos++;
				1058	if (pos < last)
				1059	break;
				1060	/* process buffer wrapping. */
				1061	if (bufs != chunks \|\| !bufs[2])
				1062	return NULL;
				1063	bufs += 2;
				1064	pos = bufs[0];
				1065	last = bufs[1];
				1066	}
				1067	pos++;
				1068	}
				1069	return NULL;
				1070	}
				1071
				1072	/*
				1073	* Given a url parameter name and a query string, find the next value.
				1074	* An empty url_param_name matches the first available parameter.
				1075	* If the parameter is found, 1 is returned and vstart / vend are updated to
				1076	* respectively provide a pointer to the value and its end.
				1077	* Otherwise, 0 is returned and vstart/vend are not modified.
				1078	*/
				1079	int http_find_next_url_param(const char **chunks,
				1080	const char* url_param_name, size_t url_param_name_l,
				1081	const char vstart, const char vend, char delim)
				1082	{
				1083	const char arg_start, qs_end;
				1084	const char value_start, value_end;
				1085
				1086	arg_start = chunks[0];
				1087	qs_end = chunks[1];
				1088	if (url_param_name_l) {
				1089	/* Looks for an argument name. */
				1090	arg_start = http_find_url_param_pos(chunks,
				1091	url_param_name, url_param_name_l,
				1092	delim);
				1093	/* Check for wrapping. */
				1094	if (arg_start >= qs_end)
				1095	qs_end = chunks[3];
				1096	}
				1097	if (!arg_start)
				1098	return 0;
				1099
				1100	if (!url_param_name_l) {
				1101	while (1) {
				1102	/* looks for the first argument. */
				1103	value_start = memchr(arg_start, '=', qs_end - arg_start);
				1104	if (!value_start) {
				1105	/* Check for wrapping. */
				1106	if (arg_start >= chunks[0] &&
				1107	arg_start < chunks[1] &&
				1108	chunks[2]) {
				1109	arg_start = chunks[2];
				1110	qs_end = chunks[3];
				1111	continue;
				1112	}
				1113	return 0;
				1114	}
				1115	break;
				1116	}
				1117	value_start++;
				1118	}
				1119	else {
				1120	/* Jump the argument length. */
				1121	value_start = arg_start + url_param_name_l + 1;
				1122
				1123	/* Check for pointer wrapping. */
				1124	if (fix_pointer_if_wrap(chunks, &value_start)) {
				1125	/* Update the end pointer. */
				1126	qs_end = chunks[3];
				1127
				1128	/* Check for overflow. */
				1129	if (value_start >= qs_end)
				1130	return 0;
				1131	}
				1132	}
				1133
				1134	value_end = value_start;
				1135
				1136	while (1) {
				1137	while ((value_end < qs_end) && !http_is_param_delimiter(*value_end, delim))
				1138	value_end++;
				1139	if (value_end < qs_end)
				1140	break;
				1141	/* process buffer wrapping. */
				1142	if (value_end >= chunks[0] &&
				1143	value_end < chunks[1] &&
				1144	chunks[2]) {
				1145	value_end = chunks[2];
				1146	qs_end = chunks[3];
				1147	continue;
				1148	}
				1149	break;
				1150	}
				1151
				1152	*vstart = value_start;
				1153	*vend = value_end;
				1154	return 1;
				1155	}
				1156
Christopher Faulet	8277ca7	2018-10-22 15:12:04 +0200	[diff] [blame]	1157	/* Parses a single header line (without the CRLF) and splits it into its name
				1158	* and its value. The parsing is pretty naive and just skip spaces.
				1159	*/
				1160	int http_parse_header(const struct ist hdr, struct ist name, struct ist value)
				1161	{
				1162	char *p = hdr.ptr;
				1163	char *end = p + hdr.len;
				1164
				1165	name->len = value->len = 0;
				1166
				1167	/* Skip leading spaces */
				1168	for (; p < end && HTTP_IS_SPHT(*p); p++);
				1169
				1170	/* Set the header name */
				1171	name->ptr = p;
				1172	for (; p < end && HTTP_IS_TOKEN(*p); p++);
				1173	name->len = p - name->ptr;
				1174
				1175	/* Skip the ':' and spaces before and after it */
				1176	for (; p < end && HTTP_IS_SPHT(*p); p++);
				1177	if (p < end && *p == ':') p++;
				1178	for (; p < end && HTTP_IS_SPHT(*p); p++);
				1179
				1180	/* Set the header value */
				1181	value->ptr = p;
				1182	value->len = end - p;
				1183
				1184	return 1;
				1185	}
				1186
				1187	/* Parses a single start line (without the CRLF) and splits it into 3 parts. The
				1188	* parsing is pretty naive and just skip spaces.
				1189	*/
				1190	int http_parse_stline(const struct ist line, struct ist p1, struct ist p2, struct ist *p3)
				1191	{
				1192	char *p = line.ptr;
				1193	char *end = p + line.len;
				1194
				1195	p1->len = p2->len = p3->len = 0;
				1196
				1197	/* Skip leading spaces */
				1198	for (; p < end && HTTP_IS_SPHT(*p); p++);
				1199
				1200	/* Set the first part */
				1201	p1->ptr = p;
				1202	for (; p < end && HTTP_IS_TOKEN(*p); p++);
				1203	p1->len = p - p1->ptr;
				1204
				1205	/* Skip spaces between p1 and p2 */
				1206	for (; p < end && HTTP_IS_SPHT(*p); p++);
				1207
				1208	/* Set the second part */
				1209	p2->ptr = p;
				1210	for (; p < end && !HTTP_IS_SPHT(*p); p++);
				1211	p2->len = p - p2->ptr;
				1212
				1213	/* Skip spaces between p2 and p3 */
				1214	for (; p < end && HTTP_IS_SPHT(*p); p++);
				1215
Ilya Shipitsin	46a030c	2020-07-05 16:36:08 +0500	[diff] [blame]	1216	/* The remaining is the third value */
Christopher Faulet	8277ca7	2018-10-22 15:12:04 +0200	[diff] [blame]	1217	p3->ptr = p;
				1218	p3->len = end - p;
				1219
				1220	return 1;
				1221	}
Christopher Faulet	341fac1	2019-09-16 11:37:05 +0200	[diff] [blame]	1222
				1223	/* Parses value of a Status header with the following format: "Status: Code[
				1224	* Reason]". The parsing is pretty naive and just skip spaces. It return the
				1225	* numeric value of the status code.
				1226	*/
				1227	int http_parse_status_val(const struct ist value, struct ist status, struct ist reason)
				1228	{
				1229	char *p = value.ptr;
				1230	char *end = p + value.len;
				1231	uint16_t code;
				1232
				1233	status->len = reason->len = 0;
				1234
				1235	/* Skip leading spaces */
				1236	for (; p < end && HTTP_IS_SPHT(*p); p++);
				1237
				1238	/* Set the status part */
				1239	status->ptr = p;
				1240	for (; p < end && HTTP_IS_TOKEN(*p); p++);
				1241	status->len = p - status->ptr;
				1242
				1243	/* Skip spaces between status and reason */
				1244	for (; p < end && HTTP_IS_SPHT(*p); p++);
				1245
				1246	/* the remaining is the reason */
				1247	reason->ptr = p;
				1248	reason->len = end - p;
				1249
				1250	code = strl2ui(status->ptr, status->len);
				1251	return code;
				1252	}
Remi Tricot-Le Breton	bcced09	2020-10-22 10:40:03 +0200	[diff] [blame]	1253
				1254
				1255	/* Returns non-zero if the two ETags are comparable (see RFC 7232#2.3.2).
				1256	* If any of them is a weak ETag, we discard the weakness prefix and perform
				1257	* a strict string comparison.
				1258	* Returns 0 otherwise.
				1259	*/
				1260	int http_compare_etags(struct ist etag1, struct ist etag2)
				1261	{
				1262	enum http_etag_type etag_type1;
				1263	enum http_etag_type etag_type2;
				1264
				1265	etag_type1 = http_get_etag_type(etag1);
				1266	etag_type2 = http_get_etag_type(etag2);
				1267
				1268	if (etag_type1 == ETAG_INVALID \|\| etag_type2 == ETAG_INVALID)
				1269	return 0;
				1270
				1271	/* Discard the 'W/' prefix an ETag is a weak one. */
				1272	if (etag_type1 == ETAG_WEAK)
				1273	etag1 = istadv(etag1, 2);
				1274	if (etag_type2 == ETAG_WEAK)
				1275	etag2 = istadv(etag2, 2);
				1276
				1277	return isteq(etag1, etag2);
				1278	}
Remi Tricot-Le Breton	56e46cb	2020-12-23 18:13:48 +0100	[diff] [blame]	1279
				1280
				1281	/*
				1282	* Trim leading space or horizontal tab characters from <value> string.
				1283	* Returns the trimmed string.
				1284	*/
				1285	struct ist http_trim_leading_spht(struct ist value)
				1286	{
				1287	struct ist ret = value;
				1288
				1289	while (ret.len && HTTP_IS_SPHT(ret.ptr[0])) {
				1290	++ret.ptr;
				1291	--ret.len;
				1292	}
				1293
				1294	return ret;
				1295	}
				1296
				1297	/*
				1298	* Trim trailing space or horizontal tab characters from <value> string.
				1299	* Returns the trimmed string.
				1300	*/
				1301	struct ist http_trim_trailing_spht(struct ist value)
				1302	{
				1303	struct ist ret = value;
				1304
				1305	while (ret.len && HTTP_IS_SPHT(ret.ptr[-1]))
				1306	--ret.len;
				1307
				1308	return ret;
				1309	}