| /* |
| * HTTP protocol analyzer |
| * |
| * Copyright 2000-2010 Willy Tarreau <w@1wt.eu> |
| * |
| * This program is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU General Public License |
| * as published by the Free Software Foundation; either version |
| * 2 of the License, or (at your option) any later version. |
| * |
| */ |
| |
| #include <ctype.h> |
| #include <errno.h> |
| #include <fcntl.h> |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <string.h> |
| #include <syslog.h> |
| #include <time.h> |
| |
| #include <sys/socket.h> |
| #include <sys/stat.h> |
| #include <sys/types.h> |
| |
| #include <common/appsession.h> |
| #include <common/base64.h> |
| #include <common/compat.h> |
| #include <common/config.h> |
| #include <common/debug.h> |
| #include <common/memory.h> |
| #include <common/mini-clist.h> |
| #include <common/standard.h> |
| #include <common/ticks.h> |
| #include <common/time.h> |
| #include <common/uri_auth.h> |
| #include <common/version.h> |
| |
| #include <types/capture.h> |
| #include <types/global.h> |
| |
| #include <proto/acl.h> |
| #include <proto/auth.h> |
| #include <proto/backend.h> |
| #include <proto/buffers.h> |
| #include <proto/checks.h> |
| #include <proto/dumpstats.h> |
| #include <proto/fd.h> |
| #include <proto/frontend.h> |
| #include <proto/log.h> |
| #include <proto/hdr_idx.h> |
| #include <proto/pattern.h> |
| #include <proto/proto_tcp.h> |
| #include <proto/proto_http.h> |
| #include <proto/proxy.h> |
| #include <proto/queue.h> |
| #include <proto/server.h> |
| #include <proto/session.h> |
| #include <proto/stream_interface.h> |
| #include <proto/stream_sock.h> |
| #include <proto/task.h> |
| |
| const char HTTP_100[] = |
| "HTTP/1.1 100 Continue\r\n\r\n"; |
| |
| const struct chunk http_100_chunk = { |
| .str = (char *)&HTTP_100, |
| .len = sizeof(HTTP_100)-1 |
| }; |
| |
| /* This is used by remote monitoring */ |
| const char HTTP_200[] = |
| "HTTP/1.0 200 OK\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>200 OK</h1>\nHAProxy: service ready.\n</body></html>\n"; |
| |
| const struct chunk http_200_chunk = { |
| .str = (char *)&HTTP_200, |
| .len = sizeof(HTTP_200)-1 |
| }; |
| |
| /* Warning: no "connection" header is provided with the 3xx messages below */ |
| const char *HTTP_301 = |
| "HTTP/1.1 301 Moved Permanently\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Content-length: 0\r\n" |
| "Location: "; /* not terminated since it will be concatenated with the URL */ |
| |
| const char *HTTP_302 = |
| "HTTP/1.1 302 Found\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Content-length: 0\r\n" |
| "Location: "; /* not terminated since it will be concatenated with the URL */ |
| |
| /* same as 302 except that the browser MUST retry with the GET method */ |
| const char *HTTP_303 = |
| "HTTP/1.1 303 See Other\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Content-length: 0\r\n" |
| "Location: "; /* not terminated since it will be concatenated with the URL */ |
| |
| /* Warning: this one is an sprintf() fmt string, with <realm> as its only argument */ |
| const char *HTTP_401_fmt = |
| "HTTP/1.0 401 Unauthorized\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "WWW-Authenticate: Basic realm=\"%s\"\r\n" |
| "\r\n" |
| "<html><body><h1>401 Unauthorized</h1>\nYou need a valid user and password to access this content.\n</body></html>\n"; |
| |
| const char *HTTP_407_fmt = |
| "HTTP/1.0 407 Unauthorized\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "Proxy-Authenticate: Basic realm=\"%s\"\r\n" |
| "\r\n" |
| "<html><body><h1>401 Unauthorized</h1>\nYou need a valid user and password to access this content.\n</body></html>\n"; |
| |
| |
| const int http_err_codes[HTTP_ERR_SIZE] = { |
| [HTTP_ERR_400] = 400, |
| [HTTP_ERR_403] = 403, |
| [HTTP_ERR_408] = 408, |
| [HTTP_ERR_500] = 500, |
| [HTTP_ERR_502] = 502, |
| [HTTP_ERR_503] = 503, |
| [HTTP_ERR_504] = 504, |
| }; |
| |
| static const char *http_err_msgs[HTTP_ERR_SIZE] = { |
| [HTTP_ERR_400] = |
| "HTTP/1.0 400 Bad request\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>400 Bad request</h1>\nYour browser sent an invalid request.\n</body></html>\n", |
| |
| [HTTP_ERR_403] = |
| "HTTP/1.0 403 Forbidden\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>403 Forbidden</h1>\nRequest forbidden by administrative rules.\n</body></html>\n", |
| |
| [HTTP_ERR_408] = |
| "HTTP/1.0 408 Request Time-out\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>408 Request Time-out</h1>\nYour browser didn't send a complete request in time.\n</body></html>\n", |
| |
| [HTTP_ERR_500] = |
| "HTTP/1.0 500 Server Error\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>500 Server Error</h1>\nAn internal server error occured.\n</body></html>\n", |
| |
| [HTTP_ERR_502] = |
| "HTTP/1.0 502 Bad Gateway\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>502 Bad Gateway</h1>\nThe server returned an invalid or incomplete response.\n</body></html>\n", |
| |
| [HTTP_ERR_503] = |
| "HTTP/1.0 503 Service Unavailable\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>503 Service Unavailable</h1>\nNo server is available to handle this request.\n</body></html>\n", |
| |
| [HTTP_ERR_504] = |
| "HTTP/1.0 504 Gateway Time-out\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>504 Gateway Time-out</h1>\nThe server didn't respond in time.\n</body></html>\n", |
| |
| }; |
| |
| /* We must put the messages here since GCC cannot initialize consts depending |
| * on strlen(). |
| */ |
| struct chunk http_err_chunks[HTTP_ERR_SIZE]; |
| |
| #define FD_SETS_ARE_BITFIELDS |
| #ifdef FD_SETS_ARE_BITFIELDS |
| /* |
| * This map is used with all the FD_* macros to check whether a particular bit |
| * is set or not. Each bit represents an ACSII code. FD_SET() sets those bytes |
| * which should be encoded. When FD_ISSET() returns non-zero, it means that the |
| * byte should be encoded. Be careful to always pass bytes from 0 to 255 |
| * exclusively to the macros. |
| */ |
| fd_set hdr_encode_map[(sizeof(fd_set) > (256/8)) ? 1 : ((256/8) / sizeof(fd_set))]; |
| fd_set url_encode_map[(sizeof(fd_set) > (256/8)) ? 1 : ((256/8) / sizeof(fd_set))]; |
| |
| #else |
| #error "Check if your OS uses bitfields for fd_sets" |
| #endif |
| |
| void init_proto_http() |
| { |
| int i; |
| char *tmp; |
| int msg; |
| |
| for (msg = 0; msg < HTTP_ERR_SIZE; msg++) { |
| if (!http_err_msgs[msg]) { |
| Alert("Internal error: no message defined for HTTP return code %d. Aborting.\n", msg); |
| abort(); |
| } |
| |
| http_err_chunks[msg].str = (char *)http_err_msgs[msg]; |
| http_err_chunks[msg].len = strlen(http_err_msgs[msg]); |
| } |
| |
| /* initialize the log header encoding map : '{|}"#' should be encoded with |
| * '#' as prefix, as well as non-printable characters ( <32 or >= 127 ). |
| * URL encoding only requires '"', '#' to be encoded as well as non- |
| * printable characters above. |
| */ |
| memset(hdr_encode_map, 0, sizeof(hdr_encode_map)); |
| memset(url_encode_map, 0, sizeof(url_encode_map)); |
| for (i = 0; i < 32; i++) { |
| FD_SET(i, hdr_encode_map); |
| FD_SET(i, url_encode_map); |
| } |
| for (i = 127; i < 256; i++) { |
| FD_SET(i, hdr_encode_map); |
| FD_SET(i, url_encode_map); |
| } |
| |
| tmp = "\"#{|}"; |
| while (*tmp) { |
| FD_SET(*tmp, hdr_encode_map); |
| tmp++; |
| } |
| |
| tmp = "\"#"; |
| while (*tmp) { |
| FD_SET(*tmp, url_encode_map); |
| tmp++; |
| } |
| |
| /* memory allocations */ |
| pool2_requri = create_pool("requri", REQURI_LEN, MEM_F_SHARED); |
| pool2_capture = create_pool("capture", CAPTURE_LEN, MEM_F_SHARED); |
| } |
| |
| /* |
| * We have 26 list of methods (1 per first letter), each of which can have |
| * up to 3 entries (2 valid, 1 null). |
| */ |
| struct http_method_desc { |
| http_meth_t meth; |
| int len; |
| const char text[8]; |
| }; |
| |
| const struct http_method_desc http_methods[26][3] = { |
| ['C' - 'A'] = { |
| [0] = { .meth = HTTP_METH_CONNECT , .len=7, .text="CONNECT" }, |
| }, |
| ['D' - 'A'] = { |
| [0] = { .meth = HTTP_METH_DELETE , .len=6, .text="DELETE" }, |
| }, |
| ['G' - 'A'] = { |
| [0] = { .meth = HTTP_METH_GET , .len=3, .text="GET" }, |
| }, |
| ['H' - 'A'] = { |
| [0] = { .meth = HTTP_METH_HEAD , .len=4, .text="HEAD" }, |
| }, |
| ['P' - 'A'] = { |
| [0] = { .meth = HTTP_METH_POST , .len=4, .text="POST" }, |
| [1] = { .meth = HTTP_METH_PUT , .len=3, .text="PUT" }, |
| }, |
| ['T' - 'A'] = { |
| [0] = { .meth = HTTP_METH_TRACE , .len=5, .text="TRACE" }, |
| }, |
| /* rest is empty like this : |
| * [1] = { .meth = HTTP_METH_NONE , .len=0, .text="" }, |
| */ |
| }; |
| |
| /* It is about twice as fast on recent architectures to lookup a byte in a |
| * table than to perform a boolean AND or OR between two tests. Refer to |
| * RFC2616 for those chars. |
| */ |
| |
| const char http_is_spht[256] = { |
| [' '] = 1, ['\t'] = 1, |
| }; |
| |
| const char http_is_crlf[256] = { |
| ['\r'] = 1, ['\n'] = 1, |
| }; |
| |
| const char http_is_lws[256] = { |
| [' '] = 1, ['\t'] = 1, |
| ['\r'] = 1, ['\n'] = 1, |
| }; |
| |
| const char http_is_sep[256] = { |
| ['('] = 1, [')'] = 1, ['<'] = 1, ['>'] = 1, |
| ['@'] = 1, [','] = 1, [';'] = 1, [':'] = 1, |
| ['"'] = 1, ['/'] = 1, ['['] = 1, [']'] = 1, |
| ['{'] = 1, ['}'] = 1, ['?'] = 1, ['='] = 1, |
| [' '] = 1, ['\t'] = 1, ['\\'] = 1, |
| }; |
| |
| const char http_is_ctl[256] = { |
| [0 ... 31] = 1, |
| [127] = 1, |
| }; |
| |
| /* |
| * A token is any ASCII char that is neither a separator nor a CTL char. |
| * Do not overwrite values in assignment since gcc-2.95 will not handle |
| * them correctly. Instead, define every non-CTL char's status. |
| */ |
| const char http_is_token[256] = { |
| [' '] = 0, ['!'] = 1, ['"'] = 0, ['#'] = 1, |
| ['$'] = 1, ['%'] = 1, ['&'] = 1, ['\''] = 1, |
| ['('] = 0, [')'] = 0, ['*'] = 1, ['+'] = 1, |
| [','] = 0, ['-'] = 1, ['.'] = 1, ['/'] = 0, |
| ['0'] = 1, ['1'] = 1, ['2'] = 1, ['3'] = 1, |
| ['4'] = 1, ['5'] = 1, ['6'] = 1, ['7'] = 1, |
| ['8'] = 1, ['9'] = 1, [':'] = 0, [';'] = 0, |
| ['<'] = 0, ['='] = 0, ['>'] = 0, ['?'] = 0, |
| ['@'] = 0, ['A'] = 1, ['B'] = 1, ['C'] = 1, |
| ['D'] = 1, ['E'] = 1, ['F'] = 1, ['G'] = 1, |
| ['H'] = 1, ['I'] = 1, ['J'] = 1, ['K'] = 1, |
| ['L'] = 1, ['M'] = 1, ['N'] = 1, ['O'] = 1, |
| ['P'] = 1, ['Q'] = 1, ['R'] = 1, ['S'] = 1, |
| ['T'] = 1, ['U'] = 1, ['V'] = 1, ['W'] = 1, |
| ['X'] = 1, ['Y'] = 1, ['Z'] = 1, ['['] = 0, |
| ['\\'] = 0, [']'] = 0, ['^'] = 1, ['_'] = 1, |
| ['`'] = 1, ['a'] = 1, ['b'] = 1, ['c'] = 1, |
| ['d'] = 1, ['e'] = 1, ['f'] = 1, ['g'] = 1, |
| ['h'] = 1, ['i'] = 1, ['j'] = 1, ['k'] = 1, |
| ['l'] = 1, ['m'] = 1, ['n'] = 1, ['o'] = 1, |
| ['p'] = 1, ['q'] = 1, ['r'] = 1, ['s'] = 1, |
| ['t'] = 1, ['u'] = 1, ['v'] = 1, ['w'] = 1, |
| ['x'] = 1, ['y'] = 1, ['z'] = 1, ['{'] = 0, |
| ['|'] = 1, ['}'] = 0, ['~'] = 1, |
| }; |
| |
| |
| /* |
| * An http ver_token is any ASCII which can be found in an HTTP version, |
| * which includes 'H', 'T', 'P', '/', '.' and any digit. |
| */ |
| const char http_is_ver_token[256] = { |
| ['.'] = 1, ['/'] = 1, |
| ['0'] = 1, ['1'] = 1, ['2'] = 1, ['3'] = 1, ['4'] = 1, |
| ['5'] = 1, ['6'] = 1, ['7'] = 1, ['8'] = 1, ['9'] = 1, |
| ['H'] = 1, ['P'] = 1, ['T'] = 1, |
| }; |
| |
| |
| /* |
| * Silent debug that outputs only in strace, using fd #-1. Trash is modified. |
| */ |
| #if defined(DEBUG_FSM) |
| static void http_silent_debug(int line, struct session *s) |
| { |
| int size = 0; |
| size += snprintf(trash + size, sizeof(trash) - size, |
| "[%04d] req: p=%d(%d) s=%d bf=%08x an=%08x data=%p size=%d l=%d w=%p r=%p lr=%p sm=%d fw=%ld tf=%08x\n", |
| line, |
| s->si[0].state, s->si[0].fd, s->txn.req.msg_state, s->req->flags, s->req->analysers, |
| s->req->data, s->req->size, s->req->l, s->req->w, s->req->r, s->req->lr, s->req->send_max, s->req->to_forward, s->txn.flags); |
| write(-1, trash, size); |
| size = 0; |
| size += snprintf(trash + size, sizeof(trash) - size, |
| " %04d rep: p=%d(%d) s=%d bf=%08x an=%08x data=%p size=%d l=%d w=%p r=%p lr=%p sm=%d fw=%ld\n", |
| line, |
| s->si[1].state, s->si[1].fd, s->txn.rsp.msg_state, s->rep->flags, s->rep->analysers, |
| s->rep->data, s->rep->size, s->rep->l, s->rep->w, s->rep->r, s->rep->lr, s->rep->send_max, s->rep->to_forward); |
| |
| write(-1, trash, size); |
| } |
| #else |
| #define http_silent_debug(l,s) do { } while (0) |
| #endif |
| |
| /* |
| * Adds a header and its CRLF at the tail of buffer <b>, just before the last |
| * CRLF. Text length is measured first, so it cannot be NULL. |
| * The header is also automatically added to the index <hdr_idx>, and the end |
| * of headers is automatically adjusted. The number of bytes added is returned |
| * on success, otherwise <0 is returned indicating an error. |
| */ |
| int http_header_add_tail(struct buffer *b, struct http_msg *msg, |
| struct hdr_idx *hdr_idx, const char *text) |
| { |
| int bytes, len; |
| |
| len = strlen(text); |
| bytes = buffer_insert_line2(b, b->data + msg->eoh, text, len); |
| if (!bytes) |
| return -1; |
| http_msg_move_end(msg, bytes); |
| return hdr_idx_add(len, 1, hdr_idx, hdr_idx->tail); |
| } |
| |
| /* |
| * Adds a header and its CRLF at the tail of buffer <b>, just before the last |
| * CRLF. <len> bytes are copied, not counting the CRLF. If <text> is NULL, then |
| * the buffer is only opened and the space reserved, but nothing is copied. |
| * The header is also automatically added to the index <hdr_idx>, and the end |
| * of headers is automatically adjusted. The number of bytes added is returned |
| * on success, otherwise <0 is returned indicating an error. |
| */ |
| int http_header_add_tail2(struct buffer *b, struct http_msg *msg, |
| struct hdr_idx *hdr_idx, const char *text, int len) |
| { |
| int bytes; |
| |
| bytes = buffer_insert_line2(b, b->data + msg->eoh, text, len); |
| if (!bytes) |
| return -1; |
| http_msg_move_end(msg, bytes); |
| return hdr_idx_add(len, 1, hdr_idx, hdr_idx->tail); |
| } |
| |
| /* |
| * Checks if <hdr> is exactly <name> for <len> chars, and ends with a colon. |
| * If so, returns the position of the first non-space character relative to |
| * <hdr>, or <end>-<hdr> if not found before. If no value is found, it tries |
| * to return a pointer to the place after the first space. Returns 0 if the |
| * header name does not match. Checks are case-insensitive. |
| */ |
| int http_header_match2(const char *hdr, const char *end, |
| const char *name, int len) |
| { |
| const char *val; |
| |
| if (hdr + len >= end) |
| return 0; |
| if (hdr[len] != ':') |
| return 0; |
| if (strncasecmp(hdr, name, len) != 0) |
| return 0; |
| val = hdr + len + 1; |
| while (val < end && HTTP_IS_SPHT(*val)) |
| val++; |
| if ((val >= end) && (len + 2 <= end - hdr)) |
| return len + 2; /* we may replace starting from second space */ |
| return val - hdr; |
| } |
| |
| /* Find the end of the header value contained between <s> and <e>. See RFC2616, |
| * par 2.2 for more information. Note that it requires a valid header to return |
| * a valid result. This works for headers defined as comma-separated lists. |
| */ |
| char *find_hdr_value_end(char *s, const char *e) |
| { |
| int quoted, qdpair; |
| |
| quoted = qdpair = 0; |
| for (; s < e; s++) { |
| if (qdpair) qdpair = 0; |
| else if (quoted) { |
| if (*s == '\\') qdpair = 1; |
| else if (*s == '"') quoted = 0; |
| } |
| else if (*s == '"') quoted = 1; |
| else if (*s == ',') return s; |
| } |
| return s; |
| } |
| |
| /* Find the first or next occurrence of header <name> in message buffer <sol> |
| * using headers index <idx>, and return it in the <ctx> structure. This |
| * structure holds everything necessary to use the header and find next |
| * occurrence. If its <idx> member is 0, the header is searched from the |
| * beginning. Otherwise, the next occurrence is returned. The function returns |
| * 1 when it finds a value, and 0 when there is no more. It is designed to work |
| * with headers defined as comma-separated lists. As a special case, if ctx->val |
| * is NULL when searching for a new values of a header, the current header is |
| * rescanned. This allows rescanning after a header deletion. |
| */ |
| int http_find_header2(const char *name, int len, |
| char *sol, struct hdr_idx *idx, |
| struct hdr_ctx *ctx) |
| { |
| char *eol, *sov; |
| int cur_idx, old_idx; |
| |
| cur_idx = ctx->idx; |
| if (cur_idx) { |
| /* We have previously returned a value, let's search |
| * another one on the same line. |
| */ |
| sol = ctx->line; |
| ctx->del = ctx->val + ctx->vlen; |
| sov = sol + ctx->del; |
| eol = sol + idx->v[cur_idx].len; |
| |
| if (sov >= eol) |
| /* no more values in this header */ |
| goto next_hdr; |
| |
| /* values remaining for this header, skip the comma but save it |
| * for later use (eg: for header deletion). |
| */ |
| sov++; |
| while (sov < eol && http_is_lws[(unsigned char)*sov]) |
| sov++; |
| |
| goto return_hdr; |
| } |
| |
| /* first request for this header */ |
| sol += hdr_idx_first_pos(idx); |
| old_idx = 0; |
| cur_idx = hdr_idx_first_idx(idx); |
| while (cur_idx) { |
| eol = sol + idx->v[cur_idx].len; |
| |
| if (len == 0) { |
| /* No argument was passed, we want any header. |
| * To achieve this, we simply build a fake request. */ |
| while (sol + len < eol && sol[len] != ':') |
| len++; |
| name = sol; |
| } |
| |
| if ((len < eol - sol) && |
| (sol[len] == ':') && |
| (strncasecmp(sol, name, len) == 0)) { |
| ctx->del = len; |
| sov = sol + len + 1; |
| while (sov < eol && http_is_lws[(unsigned char)*sov]) |
| sov++; |
| |
| ctx->line = sol; |
| ctx->prev = old_idx; |
| return_hdr: |
| ctx->idx = cur_idx; |
| ctx->val = sov - sol; |
| |
| eol = find_hdr_value_end(sov, eol); |
| ctx->vlen = eol - sov; |
| return 1; |
| } |
| next_hdr: |
| sol = eol + idx->v[cur_idx].cr + 1; |
| old_idx = cur_idx; |
| cur_idx = idx->v[cur_idx].next; |
| } |
| return 0; |
| } |
| |
| int http_find_header(const char *name, |
| char *sol, struct hdr_idx *idx, |
| struct hdr_ctx *ctx) |
| { |
| return http_find_header2(name, strlen(name), sol, idx, ctx); |
| } |
| |
| /* Remove one value of a header. This only works on a <ctx> returned by one of |
| * the http_find_header functions. The value is removed, as well as surrounding |
| * commas if any. If the removed value was alone, the whole header is removed. |
| * The ctx is always updated accordingly, as well as buffer <buf> and HTTP |
| * message <msg>. The new index is returned. If it is zero, it means there is |
| * no more header, so any processing may stop. The ctx is always left in a form |
| * that can be handled by http_find_header2() to find next occurrence. |
| */ |
| int http_remove_header2(struct http_msg *msg, struct buffer *buf, |
| struct hdr_idx *idx, struct hdr_ctx *ctx) |
| { |
| int cur_idx = ctx->idx; |
| char *sol = ctx->line; |
| struct hdr_idx_elem *hdr; |
| int delta, skip_comma; |
| |
| if (!cur_idx) |
| return 0; |
| |
| hdr = &idx->v[cur_idx]; |
| if (sol[ctx->del] == ':' && ctx->val + ctx->vlen == hdr->len) { |
| /* This was the only value of the header, we must now remove it entirely. */ |
| delta = buffer_replace2(buf, sol, sol + hdr->len + hdr->cr + 1, NULL, 0); |
| http_msg_move_end(msg, delta); |
| idx->used--; |
| hdr->len = 0; /* unused entry */ |
| idx->v[ctx->prev].next = idx->v[ctx->idx].next; |
| ctx->idx = ctx->prev; /* walk back to the end of previous header */ |
| ctx->line -= idx->v[ctx->idx].len + idx->v[cur_idx].cr + 1; |
| ctx->val = idx->v[ctx->idx].len; /* point to end of previous header */ |
| ctx->vlen = 0; |
| return ctx->idx; |
| } |
| |
| /* This was not the only value of this header. We have to remove between |
| * ctx->del+1 and ctx->val+ctx->vlen+1 included. If it is the last entry |
| * of the list, we remove the last separator. |
| */ |
| |
| skip_comma = (ctx->val + ctx->vlen == hdr->len) ? 0 : 1; |
| delta = buffer_replace2(buf, sol + ctx->del + skip_comma, |
| sol + ctx->val + ctx->vlen + skip_comma, |
| NULL, 0); |
| hdr->len += delta; |
| http_msg_move_end(msg, delta); |
| ctx->val = ctx->del; |
| ctx->vlen = 0; |
| return ctx->idx; |
| } |
| |
| /* This function handles a server error at the stream interface level. The |
| * stream interface is assumed to be already in a closed state. An optional |
| * message is copied into the input buffer, and an HTTP status code stored. |
| * The error flags are set to the values in arguments. Any pending request |
| * in this buffer will be lost. |
| */ |
| static void http_server_error(struct session *t, struct stream_interface *si, |
| int err, int finst, int status, const struct chunk *msg) |
| { |
| buffer_auto_read(si->ob); |
| buffer_abort(si->ob); |
| buffer_auto_close(si->ob); |
| buffer_erase(si->ob); |
| buffer_auto_close(si->ib); |
| buffer_auto_read(si->ib); |
| if (status > 0 && msg) { |
| t->txn.status = status; |
| buffer_write(si->ib, msg->str, msg->len); |
| } |
| if (!(t->flags & SN_ERR_MASK)) |
| t->flags |= err; |
| if (!(t->flags & SN_FINST_MASK)) |
| t->flags |= finst; |
| } |
| |
| /* This function returns the appropriate error location for the given session |
| * and message. |
| */ |
| |
| struct chunk *error_message(struct session *s, int msgnum) |
| { |
| if (s->be->errmsg[msgnum].str) |
| return &s->be->errmsg[msgnum]; |
| else if (s->fe->errmsg[msgnum].str) |
| return &s->fe->errmsg[msgnum]; |
| else |
| return &http_err_chunks[msgnum]; |
| } |
| |
| /* |
| * returns HTTP_METH_NONE if there is nothing valid to read (empty or non-text |
| * string), HTTP_METH_OTHER for unknown methods, or the identified method. |
| */ |
| static http_meth_t find_http_meth(const char *str, const int len) |
| { |
| unsigned char m; |
| const struct http_method_desc *h; |
| |
| m = ((unsigned)*str - 'A'); |
| |
| if (m < 26) { |
| for (h = http_methods[m]; h->len > 0; h++) { |
| if (unlikely(h->len != len)) |
| continue; |
| if (likely(memcmp(str, h->text, h->len) == 0)) |
| return h->meth; |
| }; |
| return HTTP_METH_OTHER; |
| } |
| return HTTP_METH_NONE; |
| |
| } |
| |
| /* Parse the URI from the given transaction (which is assumed to be in request |
| * phase) and look for the "/" beginning the PATH. If not found, return NULL. |
| * It is returned otherwise. |
| */ |
| static char * |
| http_get_path(struct http_txn *txn) |
| { |
| char *ptr, *end; |
| |
| ptr = txn->req.sol + txn->req.sl.rq.u; |
| end = ptr + txn->req.sl.rq.u_l; |
| |
| if (ptr >= end) |
| return NULL; |
| |
| /* RFC2616, par. 5.1.2 : |
| * Request-URI = "*" | absuri | abspath | authority |
| */ |
| |
| if (*ptr == '*') |
| return NULL; |
| |
| if (isalpha((unsigned char)*ptr)) { |
| /* this is a scheme as described by RFC3986, par. 3.1 */ |
| ptr++; |
| while (ptr < end && |
| (isalnum((unsigned char)*ptr) || *ptr == '+' || *ptr == '-' || *ptr == '.')) |
| ptr++; |
| /* skip '://' */ |
| if (ptr == end || *ptr++ != ':') |
| return NULL; |
| if (ptr == end || *ptr++ != '/') |
| return NULL; |
| if (ptr == end || *ptr++ != '/') |
| return NULL; |
| } |
| /* skip [user[:passwd]@]host[:[port]] */ |
| |
| while (ptr < end && *ptr != '/') |
| ptr++; |
| |
| if (ptr == end) |
| return NULL; |
| |
| /* OK, we got the '/' ! */ |
| return ptr; |
| } |
| |
| /* Returns a 302 for a redirectable request. This may only be called just after |
| * the stream interface has moved to SI_ST_ASS. Unprocessable requests are |
| * left unchanged and will follow normal proxy processing. |
| */ |
| void perform_http_redirect(struct session *s, struct stream_interface *si) |
| { |
| struct http_txn *txn; |
| struct chunk rdr; |
| char *path; |
| int len; |
| |
| /* 1: create the response header */ |
| rdr.len = strlen(HTTP_302); |
| rdr.str = trash; |
| rdr.size = sizeof(trash); |
| memcpy(rdr.str, HTTP_302, rdr.len); |
| |
| /* 2: add the server's prefix */ |
| if (rdr.len + s->srv->rdr_len > rdr.size) |
| return; |
| |
| /* special prefix "/" means don't change URL */ |
| if (s->srv->rdr_len != 1 || *s->srv->rdr_pfx != '/') { |
| memcpy(rdr.str + rdr.len, s->srv->rdr_pfx, s->srv->rdr_len); |
| rdr.len += s->srv->rdr_len; |
| } |
| |
| /* 3: add the request URI */ |
| txn = &s->txn; |
| path = http_get_path(txn); |
| if (!path) |
| return; |
| |
| len = txn->req.sl.rq.u_l + (txn->req.sol + txn->req.sl.rq.u) - path; |
| if (rdr.len + len > rdr.size - 4) /* 4 for CRLF-CRLF */ |
| return; |
| |
| memcpy(rdr.str + rdr.len, path, len); |
| rdr.len += len; |
| |
| if (unlikely(txn->flags & TX_USE_PX_CONN)) { |
| memcpy(rdr.str + rdr.len, "\r\nProxy-Connection: close\r\n\r\n", 29); |
| rdr.len += 29; |
| } else { |
| memcpy(rdr.str + rdr.len, "\r\nConnection: close\r\n\r\n", 23); |
| rdr.len += 23; |
| } |
| |
| /* prepare to return without error. */ |
| si->shutr(si); |
| si->shutw(si); |
| si->err_type = SI_ET_NONE; |
| si->err_loc = NULL; |
| si->state = SI_ST_CLO; |
| |
| /* send the message */ |
| http_server_error(s, si, SN_ERR_PRXCOND, SN_FINST_C, 302, &rdr); |
| |
| /* FIXME: we should increase a counter of redirects per server and per backend. */ |
| if (s->srv) |
| srv_inc_sess_ctr(s->srv); |
| } |
| |
| /* Return the error message corresponding to si->err_type. It is assumed |
| * that the server side is closed. Note that err_type is actually a |
| * bitmask, where almost only aborts may be cumulated with other |
| * values. We consider that aborted operations are more important |
| * than timeouts or errors due to the fact that nobody else in the |
| * logs might explain incomplete retries. All others should avoid |
| * being cumulated. It should normally not be possible to have multiple |
| * aborts at once, but just in case, the first one in sequence is reported. |
| */ |
| void http_return_srv_error(struct session *s, struct stream_interface *si) |
| { |
| int err_type = si->err_type; |
| |
| if (err_type & SI_ET_QUEUE_ABRT) |
| http_server_error(s, si, SN_ERR_CLICL, SN_FINST_Q, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_CONN_ABRT) |
| http_server_error(s, si, SN_ERR_CLICL, SN_FINST_C, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_QUEUE_TO) |
| http_server_error(s, si, SN_ERR_SRVTO, SN_FINST_Q, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_QUEUE_ERR) |
| http_server_error(s, si, SN_ERR_SRVCL, SN_FINST_Q, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_CONN_TO) |
| http_server_error(s, si, SN_ERR_SRVTO, SN_FINST_C, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_CONN_ERR) |
| http_server_error(s, si, SN_ERR_SRVCL, SN_FINST_C, |
| 503, error_message(s, HTTP_ERR_503)); |
| else /* SI_ET_CONN_OTHER and others */ |
| http_server_error(s, si, SN_ERR_INTERNAL, SN_FINST_C, |
| 500, error_message(s, HTTP_ERR_500)); |
| } |
| |
| extern const char sess_term_cond[8]; |
| extern const char sess_fin_state[8]; |
| extern const char *monthname[12]; |
| const char sess_cookie[8] = "NIDVEO67"; /* No cookie, Invalid cookie, cookie for a Down server, Valid cookie, Expired cookie, Old cookie, unknown */ |
| const char sess_set_cookie[8] = "NPDIRU67"; /* No set-cookie, Set-cookie found and left unchanged (passive), |
| Set-cookie Deleted, Set-Cookie Inserted, Set-cookie Rewritten, |
| Set-cookie Updated, unknown, unknown */ |
| struct pool_head *pool2_requri; |
| struct pool_head *pool2_capture; |
| |
| void http_sess_clflog(struct session *s) |
| { |
| char pn[INET6_ADDRSTRLEN + strlen(":65535")]; |
| struct proxy *fe = s->fe; |
| struct proxy *be = s->be; |
| struct proxy *prx_log; |
| struct http_txn *txn = &s->txn; |
| int tolog, level, err; |
| char *uri, *h; |
| char *svid; |
| struct tm tm; |
| static char tmpline[MAX_SYSLOG_LEN]; |
| int hdr; |
| size_t w; |
| int t_request; |
| |
| prx_log = fe; |
| err = (s->flags & (SN_ERR_MASK | SN_REDISP)) || |
| (s->req->cons->conn_retries != be->conn_retries) || |
| txn->status >= 500; |
| |
| if (s->cli_addr.ss_family == AF_INET) |
| inet_ntop(AF_INET, |
| (const void *)&((struct sockaddr_in *)&s->cli_addr)->sin_addr, |
| pn, sizeof(pn)); |
| else |
| inet_ntop(AF_INET6, |
| (const void *)&((struct sockaddr_in6 *)(&s->cli_addr))->sin6_addr, |
| pn, sizeof(pn)); |
| |
| get_gmtime(s->logs.accept_date.tv_sec, &tm); |
| |
| /* FIXME: let's limit ourselves to frontend logging for now. */ |
| tolog = fe->to_log; |
| |
| h = tmpline; |
| |
| w = snprintf(h, sizeof(tmpline), |
| "%s - - [%02d/%s/%04d:%02d:%02d:%02d +0000]", |
| pn, |
| tm.tm_mday, monthname[tm.tm_mon], tm.tm_year+1900, |
| tm.tm_hour, tm.tm_min, tm.tm_sec); |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| if (h >= tmpline + sizeof(tmpline) - 4) |
| goto trunc; |
| |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| uri = txn->uri ? txn->uri : "<BADREQ>"; |
| h = encode_string(h, tmpline + sizeof(tmpline) - 1, |
| '#', url_encode_map, uri); |
| *(h++) = '\"'; |
| |
| w = snprintf(h, sizeof(tmpline) - (h - tmpline), " %d %lld", txn->status, s->logs.bytes_out); |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| if (h >= tmpline + sizeof(tmpline) - 9) |
| goto trunc; |
| memcpy(h, " \"-\" \"-\"", 8); |
| h += 8; |
| |
| w = snprintf(h, sizeof(tmpline) - (h - tmpline), |
| " %d %03d", |
| (s->cli_addr.ss_family == AF_INET) ? |
| ntohs(((struct sockaddr_in *)&s->cli_addr)->sin_port) : |
| ntohs(((struct sockaddr_in6 *)&s->cli_addr)->sin6_port), |
| (int)s->logs.accept_date.tv_usec/1000); |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| w = strlen(fe->id); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, fe->id, w); |
| h += w; |
| *(h++) = '\"'; |
| |
| w = strlen(be->id); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, be->id, w); |
| h += w; |
| *(h++) = '\"'; |
| |
| svid = (tolog & LW_SVID) ? |
| (s->data_source != DATA_SRC_STATS) ? |
| (s->srv != NULL) ? s->srv->id : "<NOSRV>" : "<STATS>" : "-"; |
| |
| w = strlen(svid); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, svid, w); |
| h += w; |
| *(h++) = '\"'; |
| |
| t_request = -1; |
| if (tv_isge(&s->logs.tv_request, &s->logs.tv_accept)) |
| t_request = tv_ms_elapsed(&s->logs.tv_accept, &s->logs.tv_request); |
| w = snprintf(h, sizeof(tmpline) - (h - tmpline), |
| " %d %ld %ld %ld %ld", |
| t_request, |
| (s->logs.t_queue >= 0) ? s->logs.t_queue - t_request : -1, |
| (s->logs.t_connect >= 0) ? s->logs.t_connect - s->logs.t_queue : -1, |
| (s->logs.t_data >= 0) ? s->logs.t_data - s->logs.t_connect : -1, |
| s->logs.t_close); |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| if (h >= tmpline + sizeof(tmpline) - 8) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| *(h++) = sess_term_cond[(s->flags & SN_ERR_MASK) >> SN_ERR_SHIFT]; |
| *(h++) = sess_fin_state[(s->flags & SN_FINST_MASK) >> SN_FINST_SHIFT]; |
| *(h++) = (be->options & PR_O_COOK_ANY) ? sess_cookie[(txn->flags & TX_CK_MASK) >> TX_CK_SHIFT] : '-', |
| *(h++) = (be->options & PR_O_COOK_ANY) ? sess_set_cookie[(txn->flags & TX_SCK_MASK) >> TX_SCK_SHIFT] : '-'; |
| *(h++) = '\"'; |
| |
| w = snprintf(h, sizeof(tmpline) - (h - tmpline), |
| " %d %d %d %d %d %ld %ld", |
| actconn, fe->feconn, be->beconn, s->srv ? s->srv->cur_sess : 0, |
| (s->req->cons->conn_retries > 0) ? (be->conn_retries - s->req->cons->conn_retries) : be->conn_retries, |
| s->logs.srv_queue_size, s->logs.prx_queue_size); |
| |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| if (txn->cli_cookie) { |
| w = strlen(txn->cli_cookie); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, txn->cli_cookie, w); |
| h += w; |
| *(h++) = '\"'; |
| } else { |
| if (h >= tmpline + sizeof(tmpline) - 5) |
| goto trunc; |
| memcpy(h, " \"-\"", 4); |
| h += 4; |
| } |
| |
| if (txn->srv_cookie) { |
| w = strlen(txn->srv_cookie); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, txn->srv_cookie, w); |
| h += w; |
| *(h++) = '\"'; |
| } else { |
| if (h >= tmpline + sizeof(tmpline) - 5) |
| goto trunc; |
| memcpy(h, " \"-\"", 4); |
| h += 4; |
| } |
| |
| if ((fe->to_log & LW_REQHDR) && txn->req.cap) { |
| for (hdr = 0; hdr < fe->nb_req_cap; hdr++) { |
| if (h >= sizeof (tmpline) + tmpline - 4) |
| goto trunc; |
| if (txn->req.cap[hdr] != NULL) { |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| h = encode_string(h, tmpline + sizeof(tmpline) - 2, |
| '#', hdr_encode_map, txn->req.cap[hdr]); |
| *(h++) = '\"'; |
| } else { |
| memcpy(h, " \"-\"", 4); |
| h += 4; |
| } |
| } |
| } |
| |
| if ((fe->to_log & LW_RSPHDR) && txn->rsp.cap) { |
| for (hdr = 0; hdr < fe->nb_rsp_cap; hdr++) { |
| if (h >= sizeof (tmpline) + tmpline - 4) |
| goto trunc; |
| if (txn->rsp.cap[hdr] != NULL) { |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| h = encode_string(h, tmpline + sizeof(tmpline) - 2, |
| '#', hdr_encode_map, txn->rsp.cap[hdr]); |
| *(h++) = '\"'; |
| } else { |
| memcpy(h, " \"-\"", 4); |
| h += 4; |
| } |
| } |
| } |
| |
| trunc: |
| *h = '\0'; |
| |
| level = LOG_INFO; |
| if (err && (fe->options2 & PR_O2_LOGERRORS)) |
| level = LOG_ERR; |
| |
| send_log(prx_log, level, "%s\n", tmpline); |
| |
| s->logs.logwait = 0; |
| } |
| |
| /* |
| * send a log for the session when we have enough info about it. |
| * Will not log if the frontend has no log defined. |
| */ |
| void http_sess_log(struct session *s) |
| { |
| char pn[INET6_ADDRSTRLEN + strlen(":65535")]; |
| struct proxy *fe = s->fe; |
| struct proxy *be = s->be; |
| struct proxy *prx_log; |
| struct http_txn *txn = &s->txn; |
| int tolog, level, err; |
| char *uri, *h; |
| char *svid; |
| struct tm tm; |
| static char tmpline[MAX_SYSLOG_LEN]; |
| int t_request; |
| int hdr; |
| |
| /* if we don't want to log normal traffic, return now */ |
| err = (s->flags & (SN_ERR_MASK | SN_REDISP)) || |
| (s->req->cons->conn_retries != be->conn_retries) || |
| txn->status >= 500; |
| if (!err && (fe->options2 & PR_O2_NOLOGNORM)) |
| return; |
| |
| if (fe->logfac1 < 0 && fe->logfac2 < 0) |
| return; |
| prx_log = fe; |
| |
| if (prx_log->options2 & PR_O2_CLFLOG) |
| return http_sess_clflog(s); |
| |
| if (s->cli_addr.ss_family == AF_INET) |
| inet_ntop(AF_INET, |
| (const void *)&((struct sockaddr_in *)&s->cli_addr)->sin_addr, |
| pn, sizeof(pn)); |
| else |
| inet_ntop(AF_INET6, |
| (const void *)&((struct sockaddr_in6 *)(&s->cli_addr))->sin6_addr, |
| pn, sizeof(pn)); |
| |
| get_localtime(s->logs.accept_date.tv_sec, &tm); |
| |
| /* FIXME: let's limit ourselves to frontend logging for now. */ |
| tolog = fe->to_log; |
| |
| h = tmpline; |
| if (fe->to_log & LW_REQHDR && |
| txn->req.cap && |
| (h < tmpline + sizeof(tmpline) - 10)) { |
| *(h++) = ' '; |
| *(h++) = '{'; |
| for (hdr = 0; hdr < fe->nb_req_cap; hdr++) { |
| if (hdr) |
| *(h++) = '|'; |
| if (txn->req.cap[hdr] != NULL) |
| h = encode_string(h, tmpline + sizeof(tmpline) - 7, |
| '#', hdr_encode_map, txn->req.cap[hdr]); |
| } |
| *(h++) = '}'; |
| } |
| |
| if (fe->to_log & LW_RSPHDR && |
| txn->rsp.cap && |
| (h < tmpline + sizeof(tmpline) - 7)) { |
| *(h++) = ' '; |
| *(h++) = '{'; |
| for (hdr = 0; hdr < fe->nb_rsp_cap; hdr++) { |
| if (hdr) |
| *(h++) = '|'; |
| if (txn->rsp.cap[hdr] != NULL) |
| h = encode_string(h, tmpline + sizeof(tmpline) - 4, |
| '#', hdr_encode_map, txn->rsp.cap[hdr]); |
| } |
| *(h++) = '}'; |
| } |
| |
| if (h < tmpline + sizeof(tmpline) - 4) { |
| *(h++) = ' '; |
| *(h++) = '"'; |
| uri = txn->uri ? txn->uri : "<BADREQ>"; |
| h = encode_string(h, tmpline + sizeof(tmpline) - 1, |
| '#', url_encode_map, uri); |
| *(h++) = '"'; |
| } |
| *h = '\0'; |
| |
| svid = (tolog & LW_SVID) ? |
| (s->data_source != DATA_SRC_STATS) ? |
| (s->srv != NULL) ? s->srv->id : "<NOSRV>" : "<STATS>" : "-"; |
| |
| t_request = -1; |
| if (tv_isge(&s->logs.tv_request, &s->logs.tv_accept)) |
| t_request = tv_ms_elapsed(&s->logs.tv_accept, &s->logs.tv_request); |
| |
| level = LOG_INFO; |
| if (err && (fe->options2 & PR_O2_LOGERRORS)) |
| level = LOG_ERR; |
| |
| send_log(prx_log, level, |
| "%s:%d [%02d/%s/%04d:%02d:%02d:%02d.%03d]" |
| " %s %s/%s %d/%ld/%ld/%ld/%s%ld %d %s%lld" |
| " %s %s %c%c%c%c %d/%d/%d/%d/%s%u %ld/%ld%s\n", |
| pn, |
| (s->cli_addr.ss_family == AF_INET) ? |
| ntohs(((struct sockaddr_in *)&s->cli_addr)->sin_port) : |
| ntohs(((struct sockaddr_in6 *)&s->cli_addr)->sin6_port), |
| tm.tm_mday, monthname[tm.tm_mon], tm.tm_year+1900, |
| tm.tm_hour, tm.tm_min, tm.tm_sec, (int)s->logs.accept_date.tv_usec/1000, |
| fe->id, be->id, svid, |
| t_request, |
| (s->logs.t_queue >= 0) ? s->logs.t_queue - t_request : -1, |
| (s->logs.t_connect >= 0) ? s->logs.t_connect - s->logs.t_queue : -1, |
| (s->logs.t_data >= 0) ? s->logs.t_data - s->logs.t_connect : -1, |
| (tolog & LW_BYTES) ? "" : "+", s->logs.t_close, |
| txn->status, |
| (tolog & LW_BYTES) ? "" : "+", s->logs.bytes_out, |
| txn->cli_cookie ? txn->cli_cookie : "-", |
| txn->srv_cookie ? txn->srv_cookie : "-", |
| sess_term_cond[(s->flags & SN_ERR_MASK) >> SN_ERR_SHIFT], |
| sess_fin_state[(s->flags & SN_FINST_MASK) >> SN_FINST_SHIFT], |
| (be->options & PR_O_COOK_ANY) ? sess_cookie[(txn->flags & TX_CK_MASK) >> TX_CK_SHIFT] : '-', |
| (be->options & PR_O_COOK_ANY) ? sess_set_cookie[(txn->flags & TX_SCK_MASK) >> TX_SCK_SHIFT] : '-', |
| actconn, fe->feconn, be->beconn, s->srv ? s->srv->cur_sess : 0, |
| (s->flags & SN_REDISP)?"+":"", |
| (s->req->cons->conn_retries>0)?(be->conn_retries - s->req->cons->conn_retries):be->conn_retries, |
| s->logs.srv_queue_size, s->logs.prx_queue_size, tmpline); |
| |
| s->logs.logwait = 0; |
| } |
| |
| |
| /* |
| * Capture headers from message starting at <som> according to header list |
| * <cap_hdr>, and fill the <idx> structure appropriately. |
| */ |
| void capture_headers(char *som, struct hdr_idx *idx, |
| char **cap, struct cap_hdr *cap_hdr) |
| { |
| char *eol, *sol, *col, *sov; |
| int cur_idx; |
| struct cap_hdr *h; |
| int len; |
| |
| sol = som + hdr_idx_first_pos(idx); |
| cur_idx = hdr_idx_first_idx(idx); |
| |
| while (cur_idx) { |
| eol = sol + idx->v[cur_idx].len; |
| |
| col = sol; |
| while (col < eol && *col != ':') |
| col++; |
| |
| sov = col + 1; |
| while (sov < eol && http_is_lws[(unsigned char)*sov]) |
| sov++; |
| |
| for (h = cap_hdr; h; h = h->next) { |
| if ((h->namelen == col - sol) && |
| (strncasecmp(sol, h->name, h->namelen) == 0)) { |
| if (cap[h->index] == NULL) |
| cap[h->index] = |
| pool_alloc2(h->pool); |
| |
| if (cap[h->index] == NULL) { |
| Alert("HTTP capture : out of memory.\n"); |
| continue; |
| } |
| |
| len = eol - sov; |
| if (len > h->len) |
| len = h->len; |
| |
| memcpy(cap[h->index], sov, len); |
| cap[h->index][len]=0; |
| } |
| } |
| sol = eol + idx->v[cur_idx].cr + 1; |
| cur_idx = idx->v[cur_idx].next; |
| } |
| } |
| |
| |
| /* either we find an LF at <ptr> or we jump to <bad>. |
| */ |
| #define EXPECT_LF_HERE(ptr, bad) do { if (unlikely(*(ptr) != '\n')) goto bad; } while (0) |
| |
| /* plays with variables <ptr>, <end> and <state>. Jumps to <good> if OK, |
| * otherwise to <http_msg_ood> with <state> set to <st>. |
| */ |
| #define EAT_AND_JUMP_OR_RETURN(good, st) do { \ |
| ptr++; \ |
| if (likely(ptr < end)) \ |
| goto good; \ |
| else { \ |
| state = (st); \ |
| goto http_msg_ood; \ |
| } \ |
| } while (0) |
| |
| |
| /* |
| * This function parses a status line between <ptr> and <end>, starting with |
| * parser state <state>. Only states HTTP_MSG_RPVER, HTTP_MSG_RPVER_SP, |
| * HTTP_MSG_RPCODE, HTTP_MSG_RPCODE_SP and HTTP_MSG_RPREASON are handled. Others |
| * will give undefined results. |
| * Note that it is upon the caller's responsibility to ensure that ptr < end, |
| * and that msg->sol points to the beginning of the response. |
| * If a complete line is found (which implies that at least one CR or LF is |
| * found before <end>, the updated <ptr> is returned, otherwise NULL is |
| * returned indicating an incomplete line (which does not mean that parts have |
| * not been updated). In the incomplete case, if <ret_ptr> or <ret_state> are |
| * non-NULL, they are fed with the new <ptr> and <state> values to be passed |
| * upon next call. |
| * |
| * This function was intentionally designed to be called from |
| * http_msg_analyzer() with the lowest overhead. It should integrate perfectly |
| * within its state machine and use the same macros, hence the need for same |
| * labels and variable names. Note that msg->sol is left unchanged. |
| */ |
| const char *http_parse_stsline(struct http_msg *msg, const char *msg_buf, |
| unsigned int state, const char *ptr, const char *end, |
| char **ret_ptr, unsigned int *ret_state) |
| { |
| switch (state) { |
| case HTTP_MSG_RPVER: |
| http_msg_rpver: |
| if (likely(HTTP_IS_VER_TOKEN(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpver, HTTP_MSG_RPVER); |
| |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| msg->sl.st.v_l = (ptr - msg_buf) - msg->som; |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpver_sp, HTTP_MSG_RPVER_SP); |
| } |
| state = HTTP_MSG_ERROR; |
| break; |
| |
| case HTTP_MSG_RPVER_SP: |
| http_msg_rpver_sp: |
| if (likely(!HTTP_IS_LWS(*ptr))) { |
| msg->sl.st.c = (ptr - msg_buf) - msg->som; |
| goto http_msg_rpcode; |
| } |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpver_sp, HTTP_MSG_RPVER_SP); |
| /* so it's a CR/LF, this is invalid */ |
| state = HTTP_MSG_ERROR; |
| break; |
| |
| case HTTP_MSG_RPCODE: |
| http_msg_rpcode: |
| if (likely(!HTTP_IS_LWS(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpcode, HTTP_MSG_RPCODE); |
| |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| msg->sl.st.c_l = (ptr - msg_buf) - msg->som - msg->sl.st.c; |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpcode_sp, HTTP_MSG_RPCODE_SP); |
| } |
| |
| /* so it's a CR/LF, so there is no reason phrase */ |
| msg->sl.st.c_l = (ptr - msg_buf) - msg->som - msg->sl.st.c; |
| http_msg_rsp_reason: |
| /* FIXME: should we support HTTP responses without any reason phrase ? */ |
| msg->sl.st.r = (ptr - msg_buf) - msg->som; |
| msg->sl.st.r_l = 0; |
| goto http_msg_rpline_eol; |
| |
| case HTTP_MSG_RPCODE_SP: |
| http_msg_rpcode_sp: |
| if (likely(!HTTP_IS_LWS(*ptr))) { |
| msg->sl.st.r = (ptr - msg_buf) - msg->som; |
| goto http_msg_rpreason; |
| } |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpcode_sp, HTTP_MSG_RPCODE_SP); |
| /* so it's a CR/LF, so there is no reason phrase */ |
| goto http_msg_rsp_reason; |
| |
| case HTTP_MSG_RPREASON: |
| http_msg_rpreason: |
| if (likely(!HTTP_IS_CRLF(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpreason, HTTP_MSG_RPREASON); |
| msg->sl.st.r_l = (ptr - msg_buf) - msg->som - msg->sl.st.r; |
| http_msg_rpline_eol: |
| /* We have seen the end of line. Note that we do not |
| * necessarily have the \n yet, but at least we know that we |
| * have EITHER \r OR \n, otherwise the response would not be |
| * complete. We can then record the response length and return |
| * to the caller which will be able to register it. |
| */ |
| msg->sl.st.l = ptr - msg->sol; |
| return ptr; |
| |
| #ifdef DEBUG_FULL |
| default: |
| fprintf(stderr, "FIXME !!!! impossible state at %s:%d = %d\n", __FILE__, __LINE__, state); |
| exit(1); |
| #endif |
| } |
| |
| http_msg_ood: |
| /* out of valid data */ |
| if (ret_state) |
| *ret_state = state; |
| if (ret_ptr) |
| *ret_ptr = (char *)ptr; |
| return NULL; |
| } |
| |
| /* |
| * This function parses a request line between <ptr> and <end>, starting with |
| * parser state <state>. Only states HTTP_MSG_RQMETH, HTTP_MSG_RQMETH_SP, |
| * HTTP_MSG_RQURI, HTTP_MSG_RQURI_SP and HTTP_MSG_RQVER are handled. Others |
| * will give undefined results. |
| * Note that it is upon the caller's responsibility to ensure that ptr < end, |
| * and that msg->sol points to the beginning of the request. |
| * If a complete line is found (which implies that at least one CR or LF is |
| * found before <end>, the updated <ptr> is returned, otherwise NULL is |
| * returned indicating an incomplete line (which does not mean that parts have |
| * not been updated). In the incomplete case, if <ret_ptr> or <ret_state> are |
| * non-NULL, they are fed with the new <ptr> and <state> values to be passed |
| * upon next call. |
| * |
| * This function was intentionally designed to be called from |
| * http_msg_analyzer() with the lowest overhead. It should integrate perfectly |
| * within its state machine and use the same macros, hence the need for same |
| * labels and variable names. Note that msg->sol is left unchanged. |
| */ |
| const char *http_parse_reqline(struct http_msg *msg, const char *msg_buf, |
| unsigned int state, const char *ptr, const char *end, |
| char **ret_ptr, unsigned int *ret_state) |
| { |
| switch (state) { |
| case HTTP_MSG_RQMETH: |
| http_msg_rqmeth: |
| if (likely(HTTP_IS_TOKEN(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqmeth, HTTP_MSG_RQMETH); |
| |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| msg->sl.rq.m_l = (ptr - msg_buf) - msg->som; |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqmeth_sp, HTTP_MSG_RQMETH_SP); |
| } |
| |
| if (likely(HTTP_IS_CRLF(*ptr))) { |
| /* HTTP 0.9 request */ |
| msg->sl.rq.m_l = (ptr - msg_buf) - msg->som; |
| http_msg_req09_uri: |
| msg->sl.rq.u = (ptr - msg_buf) - msg->som; |
| http_msg_req09_uri_e: |
| msg->sl.rq.u_l = (ptr - msg_buf) - msg->som - msg->sl.rq.u; |
| http_msg_req09_ver: |
| msg->sl.rq.v = (ptr - msg_buf) - msg->som; |
| msg->sl.rq.v_l = 0; |
| goto http_msg_rqline_eol; |
| } |
| state = HTTP_MSG_ERROR; |
| break; |
| |
| case HTTP_MSG_RQMETH_SP: |
| http_msg_rqmeth_sp: |
| if (likely(!HTTP_IS_LWS(*ptr))) { |
| msg->sl.rq.u = (ptr - msg_buf) - msg->som; |
| goto http_msg_rquri; |
| } |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqmeth_sp, HTTP_MSG_RQMETH_SP); |
| /* so it's a CR/LF, meaning an HTTP 0.9 request */ |
| goto http_msg_req09_uri; |
| |
| case HTTP_MSG_RQURI: |
| http_msg_rquri: |
| if (likely(!HTTP_IS_LWS(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rquri, HTTP_MSG_RQURI); |
| |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| msg->sl.rq.u_l = (ptr - msg_buf) - msg->som - msg->sl.rq.u; |
| EAT_AND_JUMP_OR_RETURN(http_msg_rquri_sp, HTTP_MSG_RQURI_SP); |
| } |
| |
| /* so it's a CR/LF, meaning an HTTP 0.9 request */ |
| goto http_msg_req09_uri_e; |
| |
| case HTTP_MSG_RQURI_SP: |
| http_msg_rquri_sp: |
| if (likely(!HTTP_IS_LWS(*ptr))) { |
| msg->sl.rq.v = (ptr - msg_buf) - msg->som; |
| goto http_msg_rqver; |
| } |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rquri_sp, HTTP_MSG_RQURI_SP); |
| /* so it's a CR/LF, meaning an HTTP 0.9 request */ |
| goto http_msg_req09_ver; |
| |
| case HTTP_MSG_RQVER: |
| http_msg_rqver: |
| if (likely(HTTP_IS_VER_TOKEN(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqver, HTTP_MSG_RQVER); |
| |
| if (likely(HTTP_IS_CRLF(*ptr))) { |
| msg->sl.rq.v_l = (ptr - msg_buf) - msg->som - msg->sl.rq.v; |
| http_msg_rqline_eol: |
| /* We have seen the end of line. Note that we do not |
| * necessarily have the \n yet, but at least we know that we |
| * have EITHER \r OR \n, otherwise the request would not be |
| * complete. We can then record the request length and return |
| * to the caller which will be able to register it. |
| */ |
| msg->sl.rq.l = ptr - msg->sol; |
| return ptr; |
| } |
| |
| /* neither an HTTP_VER token nor a CRLF */ |
| state = HTTP_MSG_ERROR; |
| break; |
| |
| #ifdef DEBUG_FULL |
| default: |
| fprintf(stderr, "FIXME !!!! impossible state at %s:%d = %d\n", __FILE__, __LINE__, state); |
| exit(1); |
| #endif |
| } |
| |
| http_msg_ood: |
| /* out of valid data */ |
| if (ret_state) |
| *ret_state = state; |
| if (ret_ptr) |
| *ret_ptr = (char *)ptr; |
| return NULL; |
| } |
| |
| /* |
| * Returns the data from Authorization header. Function may be called more |
| * than once so data is stored in txn->auth_data. When no header is found |
| * or auth method is unknown auth_method is set to HTTP_AUTH_WRONG to avoid |
| * searching again for something we are unable to find anyway. |
| */ |
| |
| char get_http_auth_buff[BUFSIZE]; |
| |
| int |
| get_http_auth(struct session *s) |
| { |
| |
| struct http_txn *txn = &s->txn; |
| struct chunk auth_method; |
| struct hdr_ctx ctx; |
| char *h, *p; |
| int len; |
| |
| #ifdef DEBUG_AUTH |
| printf("Auth for session %p: %d\n", s, txn->auth.method); |
| #endif |
| |
| if (txn->auth.method == HTTP_AUTH_WRONG) |
| return 0; |
| |
| if (txn->auth.method) |
| return 1; |
| |
| txn->auth.method = HTTP_AUTH_WRONG; |
| |
| ctx.idx = 0; |
| |
| if (txn->flags & TX_USE_PX_CONN) { |
| h = "Proxy-Authorization"; |
| len = strlen(h); |
| } else { |
| h = "Authorization"; |
| len = strlen(h); |
| } |
| |
| if (!http_find_header2(h, len, txn->req.sol, &txn->hdr_idx, &ctx)) |
| return 0; |
| |
| h = ctx.line + ctx.val; |
| |
| p = memchr(h, ' ', ctx.vlen); |
| if (!p || p == h) |
| return 0; |
| |
| chunk_initlen(&auth_method, h, 0, p-h); |
| chunk_initlen(&txn->auth.method_data, p+1, 0, ctx.vlen-(p-h)-1); |
| |
| if (!strncasecmp("Basic", auth_method.str, auth_method.len)) { |
| |
| len = base64dec(txn->auth.method_data.str, txn->auth.method_data.len, |
| get_http_auth_buff, BUFSIZE - 1); |
| |
| if (len < 0) |
| return 0; |
| |
| |
| get_http_auth_buff[len] = '\0'; |
| |
| p = strchr(get_http_auth_buff, ':'); |
| |
| if (!p) |
| return 0; |
| |
| txn->auth.user = get_http_auth_buff; |
| *p = '\0'; |
| txn->auth.pass = p+1; |
| |
| txn->auth.method = HTTP_AUTH_BASIC; |
| return 1; |
| } |
| |
| return 0; |
| } |
| |
| |
| /* |
| * This function parses an HTTP message, either a request or a response, |
| * depending on the initial msg->msg_state. It can be preempted everywhere |
| * when data are missing and recalled at the exact same location with no |
| * information loss. The header index is re-initialized when switching from |
| * MSG_R[PQ]BEFORE to MSG_RPVER|MSG_RQMETH. It modifies msg->sol among other |
| * fields. Note that msg->som and msg->sol will be initialized after completing |
| * the first state, so that none of the msg pointers has to be initialized |
| * prior to the first call. |
| */ |
| void http_msg_analyzer(struct buffer *buf, struct http_msg *msg, struct hdr_idx *idx) |
| { |
| unsigned int state; /* updated only when leaving the FSM */ |
| register char *ptr, *end; /* request pointers, to avoid dereferences */ |
| |
| state = msg->msg_state; |
| ptr = buf->lr; |
| end = buf->r; |
| |
| if (unlikely(ptr >= end)) |
| goto http_msg_ood; |
| |
| switch (state) { |
| /* |
| * First, states that are specific to the response only. |
| * We check them first so that request and headers are |
| * closer to each other (accessed more often). |
| */ |
| case HTTP_MSG_RPBEFORE: |
| http_msg_rpbefore: |
| if (likely(HTTP_IS_TOKEN(*ptr))) { |
| /* we have a start of message, but we have to check |
| * first if we need to remove some CRLF. We can only |
| * do this when send_max=0. |
| */ |
| char *beg = buf->w + buf->send_max; |
| if (beg >= buf->data + buf->size) |
| beg -= buf->size; |
| if (unlikely(ptr != beg)) { |
| if (buf->send_max) |
| goto http_msg_ood; |
| /* Remove empty leading lines, as recommended by RFC2616. */ |
| buffer_ignore(buf, ptr - beg); |
| } |
| msg->som = ptr - buf->data; |
| msg->sol = ptr; |
| hdr_idx_init(idx); |
| state = HTTP_MSG_RPVER; |
| goto http_msg_rpver; |
| } |
| |
| if (unlikely(!HTTP_IS_CRLF(*ptr))) |
| goto http_msg_invalid; |
| |
| if (unlikely(*ptr == '\n')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpbefore, HTTP_MSG_RPBEFORE); |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpbefore_cr, HTTP_MSG_RPBEFORE_CR); |
| /* stop here */ |
| |
| case HTTP_MSG_RPBEFORE_CR: |
| http_msg_rpbefore_cr: |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpbefore, HTTP_MSG_RPBEFORE); |
| /* stop here */ |
| |
| case HTTP_MSG_RPVER: |
| http_msg_rpver: |
| case HTTP_MSG_RPVER_SP: |
| case HTTP_MSG_RPCODE: |
| case HTTP_MSG_RPCODE_SP: |
| case HTTP_MSG_RPREASON: |
| ptr = (char *)http_parse_stsline(msg, buf->data, state, ptr, end, |
| &buf->lr, &msg->msg_state); |
| if (unlikely(!ptr)) |
| return; |
| |
| /* we have a full response and we know that we have either a CR |
| * or an LF at <ptr>. |
| */ |
| //fprintf(stderr,"som=%d rq.l=%d *ptr=0x%02x\n", msg->som, msg->sl.st.l, *ptr); |
| hdr_idx_set_start(idx, msg->sl.st.l, *ptr == '\r'); |
| |
| msg->sol = ptr; |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpline_end, HTTP_MSG_RPLINE_END); |
| goto http_msg_rpline_end; |
| |
| case HTTP_MSG_RPLINE_END: |
| http_msg_rpline_end: |
| /* msg->sol must point to the first of CR or LF. */ |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_first, HTTP_MSG_HDR_FIRST); |
| /* stop here */ |
| |
| /* |
| * Second, states that are specific to the request only |
| */ |
| case HTTP_MSG_RQBEFORE: |
| http_msg_rqbefore: |
| if (likely(HTTP_IS_TOKEN(*ptr))) { |
| /* we have a start of message, but we have to check |
| * first if we need to remove some CRLF. We can only |
| * do this when send_max=0. |
| */ |
| char *beg = buf->w + buf->send_max; |
| if (beg >= buf->data + buf->size) |
| beg -= buf->size; |
| if (likely(ptr != beg)) { |
| if (buf->send_max) |
| goto http_msg_ood; |
| /* Remove empty leading lines, as recommended by RFC2616. */ |
| buffer_ignore(buf, ptr - beg); |
| } |
| msg->som = ptr - buf->data; |
| msg->sol = ptr; |
| /* we will need this when keep-alive will be supported |
| hdr_idx_init(idx); |
| */ |
| state = HTTP_MSG_RQMETH; |
| goto http_msg_rqmeth; |
| } |
| |
| if (unlikely(!HTTP_IS_CRLF(*ptr))) |
| goto http_msg_invalid; |
| |
| if (unlikely(*ptr == '\n')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqbefore, HTTP_MSG_RQBEFORE); |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqbefore_cr, HTTP_MSG_RQBEFORE_CR); |
| /* stop here */ |
| |
| case HTTP_MSG_RQBEFORE_CR: |
| http_msg_rqbefore_cr: |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqbefore, HTTP_MSG_RQBEFORE); |
| /* stop here */ |
| |
| case HTTP_MSG_RQMETH: |
| http_msg_rqmeth: |
| case HTTP_MSG_RQMETH_SP: |
| case HTTP_MSG_RQURI: |
| case HTTP_MSG_RQURI_SP: |
| case HTTP_MSG_RQVER: |
| ptr = (char *)http_parse_reqline(msg, buf->data, state, ptr, end, |
| &buf->lr, &msg->msg_state); |
| if (unlikely(!ptr)) |
| return; |
| |
| /* we have a full request and we know that we have either a CR |
| * or an LF at <ptr>. |
| */ |
| //fprintf(stderr,"som=%d rq.l=%d *ptr=0x%02x\n", msg->som, msg->sl.rq.l, *ptr); |
| hdr_idx_set_start(idx, msg->sl.rq.l, *ptr == '\r'); |
| |
| msg->sol = ptr; |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqline_end, HTTP_MSG_RQLINE_END); |
| goto http_msg_rqline_end; |
| |
| case HTTP_MSG_RQLINE_END: |
| http_msg_rqline_end: |
| /* check for HTTP/0.9 request : no version information available. |
| * msg->sol must point to the first of CR or LF. |
| */ |
| if (unlikely(msg->sl.rq.v_l == 0)) |
| goto http_msg_last_lf; |
| |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_first, HTTP_MSG_HDR_FIRST); |
| /* stop here */ |
| |
| /* |
| * Common states below |
| */ |
| case HTTP_MSG_HDR_FIRST: |
| http_msg_hdr_first: |
| msg->sol = ptr; |
| if (likely(!HTTP_IS_CRLF(*ptr))) { |
| goto http_msg_hdr_name; |
| } |
| |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_last_lf, HTTP_MSG_LAST_LF); |
| goto http_msg_last_lf; |
| |
| case HTTP_MSG_HDR_NAME: |
| http_msg_hdr_name: |
| /* assumes msg->sol points to the first char */ |
| if (likely(HTTP_IS_TOKEN(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_name, HTTP_MSG_HDR_NAME); |
| |
| if (likely(*ptr == ':')) { |
| msg->col = ptr - buf->data; |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l1_sp, HTTP_MSG_HDR_L1_SP); |
| } |
| |
| if (likely(msg->err_pos < -1) || *ptr == '\n') |
| goto http_msg_invalid; |
| |
| if (msg->err_pos == -1) /* capture error pointer */ |
| msg->err_pos = ptr - buf->data; /* >= 0 now */ |
| |
| /* and we still accept this non-token character */ |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_name, HTTP_MSG_HDR_NAME); |
| |
| case HTTP_MSG_HDR_L1_SP: |
| http_msg_hdr_l1_sp: |
| /* assumes msg->sol points to the first char and msg->col to the colon */ |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l1_sp, HTTP_MSG_HDR_L1_SP); |
| |
| /* header value can be basically anything except CR/LF */ |
| msg->sov = ptr - buf->data; |
| |
| if (likely(!HTTP_IS_CRLF(*ptr))) { |
| goto http_msg_hdr_val; |
| } |
| |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l1_lf, HTTP_MSG_HDR_L1_LF); |
| goto http_msg_hdr_l1_lf; |
| |
| case HTTP_MSG_HDR_L1_LF: |
| http_msg_hdr_l1_lf: |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l1_lws, HTTP_MSG_HDR_L1_LWS); |
| |
| case HTTP_MSG_HDR_L1_LWS: |
| http_msg_hdr_l1_lws: |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| /* replace HT,CR,LF with spaces */ |
| for (; buf->data+msg->sov < ptr; msg->sov++) |
| buf->data[msg->sov] = ' '; |
| goto http_msg_hdr_l1_sp; |
| } |
| /* we had a header consisting only in spaces ! */ |
| msg->eol = buf->data + msg->sov; |
| goto http_msg_complete_header; |
| |
| case HTTP_MSG_HDR_VAL: |
| http_msg_hdr_val: |
| /* assumes msg->sol points to the first char, msg->col to the |
| * colon, and msg->sov points to the first character of the |
| * value. |
| */ |
| if (likely(!HTTP_IS_CRLF(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_val, HTTP_MSG_HDR_VAL); |
| |
| msg->eol = ptr; |
| /* Note: we could also copy eol into ->eoh so that we have the |
| * real header end in case it ends with lots of LWS, but is this |
| * really needed ? |
| */ |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l2_lf, HTTP_MSG_HDR_L2_LF); |
| goto http_msg_hdr_l2_lf; |
| |
| case HTTP_MSG_HDR_L2_LF: |
| http_msg_hdr_l2_lf: |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l2_lws, HTTP_MSG_HDR_L2_LWS); |
| |
| case HTTP_MSG_HDR_L2_LWS: |
| http_msg_hdr_l2_lws: |
| if (unlikely(HTTP_IS_SPHT(*ptr))) { |
| /* LWS: replace HT,CR,LF with spaces */ |
| for (; msg->eol < ptr; msg->eol++) |
| *msg->eol = ' '; |
| goto http_msg_hdr_val; |
| } |
| http_msg_complete_header: |
| /* |
| * It was a new header, so the last one is finished. |
| * Assumes msg->sol points to the first char, msg->col to the |
| * colon, msg->sov points to the first character of the value |
| * and msg->eol to the first CR or LF so we know how the line |
| * ends. We insert last header into the index. |
| */ |
| /* |
| fprintf(stderr,"registering %-2d bytes : ", msg->eol - msg->sol); |
| write(2, msg->sol, msg->eol-msg->sol); |
| fprintf(stderr,"\n"); |
| */ |
| |
| if (unlikely(hdr_idx_add(msg->eol - msg->sol, *msg->eol == '\r', |
| idx, idx->tail) < 0)) |
| goto http_msg_invalid; |
| |
| msg->sol = ptr; |
| if (likely(!HTTP_IS_CRLF(*ptr))) { |
| goto http_msg_hdr_name; |
| } |
| |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_last_lf, HTTP_MSG_LAST_LF); |
| goto http_msg_last_lf; |
| |
| case HTTP_MSG_LAST_LF: |
| http_msg_last_lf: |
| /* Assumes msg->sol points to the first of either CR or LF */ |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| ptr++; |
| buf->lr = ptr; |
| msg->col = msg->sov = buf->lr - buf->data; |
| msg->eoh = msg->sol - buf->data; |
| msg->sol = buf->data + msg->som; |
| msg->msg_state = HTTP_MSG_BODY; |
| return; |
| #ifdef DEBUG_FULL |
| default: |
| fprintf(stderr, "FIXME !!!! impossible state at %s:%d = %d\n", __FILE__, __LINE__, state); |
| exit(1); |
| #endif |
| } |
| http_msg_ood: |
| /* out of data */ |
| msg->msg_state = state; |
| buf->lr = ptr; |
| return; |
| |
| http_msg_invalid: |
| /* invalid message */ |
| msg->msg_state = HTTP_MSG_ERROR; |
| buf->lr = ptr; |
| return; |
| } |
| |
| /* convert an HTTP/0.9 request into an HTTP/1.0 request. Returns 1 if the |
| * conversion succeeded, 0 in case of error. If the request was already 1.X, |
| * nothing is done and 1 is returned. |
| */ |
| static int http_upgrade_v09_to_v10(struct buffer *req, struct http_msg *msg, struct http_txn *txn) |
| { |
| int delta; |
| char *cur_end; |
| |
| if (msg->sl.rq.v_l != 0) |
| return 1; |
| |
| cur_end = msg->sol + msg->sl.rq.l; |
| delta = 0; |
| |
| if (msg->sl.rq.u_l == 0) { |
| /* if no URI was set, add "/" */ |
| delta = buffer_replace2(req, cur_end, cur_end, " /", 2); |
| cur_end += delta; |
| http_msg_move_end(msg, delta); |
| } |
| /* add HTTP version */ |
| delta = buffer_replace2(req, cur_end, cur_end, " HTTP/1.0\r\n", 11); |
| http_msg_move_end(msg, delta); |
| cur_end += delta; |
| cur_end = (char *)http_parse_reqline(msg, req->data, |
| HTTP_MSG_RQMETH, |
| msg->sol, cur_end + 1, |
| NULL, NULL); |
| if (unlikely(!cur_end)) |
| return 0; |
| |
| /* we have a full HTTP/1.0 request now and we know that |
| * we have either a CR or an LF at <ptr>. |
| */ |
| hdr_idx_set_start(&txn->hdr_idx, msg->sl.rq.l, *cur_end == '\r'); |
| return 1; |
| } |
| |
| /* Parse the Connection: header of an HTTP request, looking for both "close" |
| * and "keep-alive" values. If a buffer is provided and we already know that |
| * some headers may safely be removed, we remove them now. The <to_del> flags |
| * are used for that : |
| * - bit 0 means remove "close" headers (in HTTP/1.0 requests/responses) |
| * - bit 1 means remove "keep-alive" headers (in HTTP/1.1 reqs/resp to 1.1). |
| * The TX_HDR_CONN_* flags are adjusted in txn->flags depending on what was |
| * found, and TX_CON_*_SET is adjusted depending on what is left so only |
| * harmless combinations may be removed. Do not call that after changes have |
| * been processed. If unused, the buffer can be NULL, and no data will be |
| * changed. |
| */ |
| void http_parse_connection_header(struct http_txn *txn, struct http_msg *msg, struct buffer *buf, int to_del) |
| { |
| struct hdr_ctx ctx; |
| const char *hdr_val = "Connection"; |
| int hdr_len = 10; |
| |
| if (txn->flags & TX_HDR_CONN_PRS) |
| return; |
| |
| if (unlikely(txn->flags & TX_USE_PX_CONN)) { |
| hdr_val = "Proxy-Connection"; |
| hdr_len = 16; |
| } |
| |
| ctx.idx = 0; |
| txn->flags &= ~(TX_CON_KAL_SET|TX_CON_CLO_SET); |
| while (http_find_header2(hdr_val, hdr_len, msg->sol, &txn->hdr_idx, &ctx)) { |
| if (ctx.vlen >= 10 && word_match(ctx.line + ctx.val, ctx.vlen, "keep-alive", 10)) { |
| txn->flags |= TX_HDR_CONN_KAL; |
| if ((to_del & 2) && buf) |
| http_remove_header2(msg, buf, &txn->hdr_idx, &ctx); |
| else |
| txn->flags |= TX_CON_KAL_SET; |
| } |
| else if (ctx.vlen >= 5 && word_match(ctx.line + ctx.val, ctx.vlen, "close", 5)) { |
| txn->flags |= TX_HDR_CONN_CLO; |
| if ((to_del & 1) && buf) |
| http_remove_header2(msg, buf, &txn->hdr_idx, &ctx); |
| else |
| txn->flags |= TX_CON_CLO_SET; |
| } |
| } |
| |
| txn->flags |= TX_HDR_CONN_PRS; |
| return; |
| } |
| |
| /* Apply desired changes on the Connection: header. Values may be removed and/or |
| * added depending on the <wanted> flags, which are exclusively composed of |
| * TX_CON_CLO_SET and TX_CON_KAL_SET, depending on what flags are desired. The |
| * TX_CON_*_SET flags are adjusted in txn->flags depending on what is left. |
| */ |
| void http_change_connection_header(struct http_txn *txn, struct http_msg *msg, struct buffer *buf, int wanted) |
| { |
| struct hdr_ctx ctx; |
| const char *hdr_val = "Connection"; |
| int hdr_len = 10; |
| |
| ctx.idx = 0; |
| |
| |
| if (unlikely(txn->flags & TX_USE_PX_CONN)) { |
| hdr_val = "Proxy-Connection"; |
| hdr_len = 16; |
| } |
| |
| txn->flags &= ~(TX_CON_CLO_SET | TX_CON_KAL_SET); |
| while (http_find_header2(hdr_val, hdr_len, msg->sol, &txn->hdr_idx, &ctx)) { |
| if (ctx.vlen >= 10 && word_match(ctx.line + ctx.val, ctx.vlen, "keep-alive", 10)) { |
| if (wanted & TX_CON_KAL_SET) |
| txn->flags |= TX_CON_KAL_SET; |
| else |
| http_remove_header2(msg, buf, &txn->hdr_idx, &ctx); |
| } |
| else if (ctx.vlen >= 5 && word_match(ctx.line + ctx.val, ctx.vlen, "close", 5)) { |
| if (wanted & TX_CON_CLO_SET) |
| txn->flags |= TX_CON_CLO_SET; |
| else |
| http_remove_header2(msg, buf, &txn->hdr_idx, &ctx); |
| } |
| } |
| |
| if (wanted == (txn->flags & (TX_CON_CLO_SET|TX_CON_KAL_SET))) |
| return; |
| |
| if ((wanted & TX_CON_CLO_SET) && !(txn->flags & TX_CON_CLO_SET)) { |
| txn->flags |= TX_CON_CLO_SET; |
| hdr_val = "Connection: close"; |
| hdr_len = 17; |
| if (unlikely(txn->flags & TX_USE_PX_CONN)) { |
| hdr_val = "Proxy-Connection: close"; |
| hdr_len = 23; |
| } |
| http_header_add_tail2(buf, msg, &txn->hdr_idx, hdr_val, hdr_len); |
| } |
| |
| if ((wanted & TX_CON_KAL_SET) && !(txn->flags & TX_CON_KAL_SET)) { |
| txn->flags |= TX_CON_KAL_SET; |
| hdr_val = "Connection: keep-alive"; |
| hdr_len = 22; |
| if (unlikely(txn->flags & TX_USE_PX_CONN)) { |
| hdr_val = "Proxy-Connection: keep-alive"; |
| hdr_len = 28; |
| } |
| http_header_add_tail2(buf, msg, &txn->hdr_idx, hdr_val, hdr_len); |
| } |
| return; |
| } |
| |
| /* Parse the chunk size at buf->lr. Once done, it adjusts ->lr to point to the |
| * first byte of body, and increments msg->sov by the number of bytes parsed, |
| * so that we know we can forward between ->som and ->sov. Note that due to |
| * possible wrapping at the end of the buffer, it is possible that msg->sov is |
| * lower than msg->som. |
| * Return >0 on success, 0 when some data is missing, <0 on error. |
| * Note: this function is designed to parse wrapped CRLF at the end of the buffer. |
| */ |
| int http_parse_chunk_size(struct buffer *buf, struct http_msg *msg) |
| { |
| char *ptr = buf->lr; |
| char *end = buf->data + buf->size; |
| unsigned int chunk = 0; |
| |
| /* The chunk size is in the following form, though we are only |
| * interested in the size and CRLF : |
| * 1*HEXDIGIT *WSP *[ ';' extensions ] CRLF |
| */ |
| while (1) { |
| int c; |
| if (ptr == buf->r) |
| return 0; |
| c = hex2i(*ptr); |
| if (c < 0) /* not a hex digit anymore */ |
| break; |
| if (++ptr >= end) |
| ptr = buf->data; |
| if (chunk & 0xF000000) /* overflow will occur */ |
| return -1; |
| chunk = (chunk << 4) + c; |
| } |
| |
| /* empty size not allowed */ |
| if (ptr == buf->lr) |
| return -1; |
| |
| while (http_is_spht[(unsigned char)*ptr]) { |
| if (++ptr >= end) |
| ptr = buf->data; |
| if (ptr == buf->r) |
| return 0; |
| } |
| |
| /* Up to there, we know that at least one byte is present at *ptr. Check |
| * for the end of chunk size. |
| */ |
| while (1) { |
| if (likely(HTTP_IS_CRLF(*ptr))) { |
| /* we now have a CR or an LF at ptr */ |
| if (likely(*ptr == '\r')) { |
| if (++ptr >= end) |
| ptr = buf->data; |
| if (ptr == buf->r) |
| return 0; |
| } |
| |
| if (*ptr != '\n') |
| return -1; |
| if (++ptr >= end) |
| ptr = buf->data; |
| /* done */ |
| break; |
| } |
| else if (*ptr == ';') { |
| /* chunk extension, ends at next CRLF */ |
| if (++ptr >= end) |
| ptr = buf->data; |
| if (ptr == buf->r) |
| return 0; |
| |
| while (!HTTP_IS_CRLF(*ptr)) { |
| if (++ptr >= end) |
| ptr = buf->data; |
| if (ptr == buf->r) |
| return 0; |
| } |
| /* we have a CRLF now, loop above */ |
| continue; |
| } |
| else |
| return -1; |
| } |
| |
| /* OK we found our CRLF and now <ptr> points to the next byte, |
| * which may or may not be present. We save that into ->lr and |
| * ->sov. |
| */ |
| msg->sov += ptr - buf->lr; |
| buf->lr = ptr; |
| msg->hdr_content_len = chunk; |
| msg->msg_state = chunk ? HTTP_MSG_DATA : HTTP_MSG_TRAILERS; |
| return 1; |
| } |
| |
| /* This function skips trailers in the buffer <buf> associated with HTTP |
| * message <msg>. The first visited position is buf->lr. If the end of |
| * the trailers is found, it is automatically scheduled to be forwarded, |
| * msg->msg_state switches to HTTP_MSG_DONE, and the function returns >0. |
| * If not enough data are available, the function does not change anything |
| * except maybe buf->lr and msg->sov if it could parse some lines, and returns |
| * zero. If a parse error is encountered, the function returns < 0 and does not |
| * change anything except maybe buf->lr and msg->sov. Note that the message |
| * must already be in HTTP_MSG_TRAILERS state before calling this function, |
| * which implies that all non-trailers data have already been scheduled for |
| * forwarding, and that the difference between msg->som and msg->sov exactly |
| * matches the length of trailers already parsed and not forwarded. It is also |
| * important to note that this function is designed to be able to parse wrapped |
| * headers at end of buffer. |
| */ |
| int http_forward_trailers(struct buffer *buf, struct http_msg *msg) |
| { |
| /* we have buf->lr which points to next line. Look for CRLF. */ |
| while (1) { |
| char *p1 = NULL, *p2 = NULL; |
| char *ptr = buf->lr; |
| int bytes; |
| |
| /* scan current line and stop at LF or CRLF */ |
| while (1) { |
| if (ptr == buf->r) |
| return 0; |
| |
| if (*ptr == '\n') { |
| if (!p1) |
| p1 = ptr; |
| p2 = ptr; |
| break; |
| } |
| |
| if (*ptr == '\r') { |
| if (p1) |
| return -1; |
| p1 = ptr; |
| } |
| |
| ptr++; |
| if (ptr >= buf->data + buf->size) |
| ptr = buf->data; |
| } |
| |
| /* after LF; point to beginning of next line */ |
| p2++; |
| if (p2 >= buf->data + buf->size) |
| p2 = buf->data; |
| |
| bytes = p2 - buf->lr; |
| if (bytes < 0) |
| bytes += buf->size; |
| |
| /* schedule this line for forwarding */ |
| msg->sov += bytes; |
| if (msg->sov >= buf->size) |
| msg->sov -= buf->size; |
| |
| if (p1 == buf->lr) { |
| /* LF/CRLF at beginning of line => end of trailers at p2. |
| * Everything was scheduled for forwarding, there's nothing |
| * left from this message. |
| */ |
| buf->lr = p2; |
| msg->msg_state = HTTP_MSG_DONE; |
| return 1; |
| } |
| /* OK, next line then */ |
| buf->lr = p2; |
| } |
| } |
| |
| /* This function may be called only in HTTP_MSG_DATA_CRLF. It reads the CRLF or |
| * a possible LF alone at the end of a chunk. It automatically adjusts msg->sov, |
| * ->som, buf->lr in order to include this part into the next forwarding phase. |
| * It also sets msg_state to HTTP_MSG_CHUNK_SIZE and returns >0 on success. If |
| * not enough data are available, the function does not change anything and |
| * returns zero. If a parse error is encountered, the function returns < 0 and |
| * does not change anything. Note: this function is designed to parse wrapped |
| * CRLF at the end of the buffer. |
| */ |
| int http_skip_chunk_crlf(struct buffer *buf, struct http_msg *msg) |
| { |
| char *ptr; |
| int bytes; |
| |
| /* NB: we'll check data availabilty at the end. It's not a |
| * problem because whatever we match first will be checked |
| * against the correct length. |
| */ |
| bytes = 1; |
| ptr = buf->lr; |
| if (*ptr == '\r') { |
| bytes++; |
| ptr++; |
| if (ptr >= buf->data + buf->size) |
| ptr = buf->data; |
| } |
| |
| if (bytes > buf->l - buf->send_max) |
| return 0; |
| |
| if (*ptr != '\n') |
| return -1; |
| |
| ptr++; |
| if (ptr >= buf->data + buf->size) |
| ptr = buf->data; |
| buf->lr = ptr; |
| /* prepare the CRLF to be forwarded. msg->som may be before data but we don't care */ |
| msg->sov = ptr - buf->data; |
| msg->som = msg->sov - bytes; |
| msg->msg_state = HTTP_MSG_CHUNK_SIZE; |
| return 1; |
| } |
| |
| void http_buffer_heavy_realign(struct buffer *buf, struct http_msg *msg) |
| { |
| char *end = buf->data + buf->size; |
| int off = buf->data + buf->size - buf->w; |
| |
| /* two possible cases : |
| * - the buffer is in one contiguous block, we move it in-place |
| * - the buffer is in two blocks, we move it via the swap_buffer |
| */ |
| if (buf->l) { |
| int block1 = buf->l; |
| int block2 = 0; |
| if (buf->r <= buf->w) { |
| /* non-contiguous block */ |
| block1 = buf->data + buf->size - buf->w; |
| block2 = buf->r - buf->data; |
| } |
| if (block2) |
| memcpy(swap_buffer, buf->data, block2); |
| memmove(buf->data, buf->w, block1); |
| if (block2) |
| memcpy(buf->data + block1, swap_buffer, block2); |
| } |
| |
| /* adjust all known pointers */ |
| buf->w = buf->data; |
| buf->lr += off; if (buf->lr >= end) buf->lr -= buf->size; |
| buf->r += off; if (buf->r >= end) buf->r -= buf->size; |
| msg->sol += off; if (msg->sol >= end) msg->sol -= buf->size; |
| msg->eol += off; if (msg->eol >= end) msg->eol -= buf->size; |
| |
| /* adjust relative pointers */ |
| msg->som = 0; |
| msg->eoh += off; if (msg->eoh >= buf->size) msg->eoh -= buf->size; |
| msg->col += off; if (msg->col >= buf->size) msg->col -= buf->size; |
| msg->sov += off; if (msg->sov >= buf->size) msg->sov -= buf->size; |
| |
| if (msg->err_pos >= 0) { |
| msg->err_pos += off; |
| if (msg->err_pos >= buf->size) |
| msg->err_pos -= buf->size; |
| } |
| |
| buf->flags &= ~BF_FULL; |
| if (buf->l >= buffer_max_len(buf)) |
| buf->flags |= BF_FULL; |
| } |
| |
| /* This stream analyser waits for a complete HTTP request. It returns 1 if the |
| * processing can continue on next analysers, or zero if it either needs more |
| * data or wants to immediately abort the request (eg: timeout, error, ...). It |
| * is tied to AN_REQ_WAIT_HTTP and may may remove itself from s->req->analysers |
| * when it has nothing left to do, and may remove any analyser when it wants to |
| * abort. |
| */ |
| int http_wait_for_request(struct session *s, struct buffer *req, int an_bit) |
| { |
| /* |
| * We will parse the partial (or complete) lines. |
| * We will check the request syntax, and also join multi-line |
| * headers. An index of all the lines will be elaborated while |
| * parsing. |
| * |
| * For the parsing, we use a 28 states FSM. |
| * |
| * Here is the information we currently have : |
| * req->data + msg->som = beginning of request |
| * req->data + msg->eoh = end of processed headers / start of current one |
| * msg->eol = end of current header or line (LF or CRLF) |
| * req->lr = first non-visited byte |
| * req->r = end of data |
| * |
| * At end of parsing, we may perform a capture of the error (if any), and |
| * we will set a few fields (msg->sol, txn->meth, sn->flags/SN_REDIRECTABLE). |
| * We also check for monitor-uri, logging, HTTP/0.9 to 1.0 conversion, and |
| * finally headers capture. |
| */ |
| |
| int cur_idx; |
| int use_close_only; |
| struct http_txn *txn = &s->txn; |
| struct http_msg *msg = &txn->req; |
| struct hdr_ctx ctx; |
| |
| DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bl=%d analysers=%02x\n", |
| now_ms, __FUNCTION__, |
| s, |
| req, |
| req->rex, req->wex, |
| req->flags, |
| req->l, |
| req->analysers); |
| |
| /* we're speaking HTTP here, so let's speak HTTP to the client */ |
| s->srv_error = http_return_srv_error; |
| |
| /* There's a protected area at the end of the buffer for rewriting |
| * purposes. We don't want to start to parse the request if the |
| * protected area is affected, because we may have to move processed |
| * data later, which is much more complicated. |
| */ |
| if (req->l && msg->msg_state < HTTP_MSG_ERROR) { |
| if ((txn->flags & TX_NOT_FIRST) && |
| unlikely((req->flags & BF_FULL) || |
| req->r < req->lr || |
| req->r > req->data + req->size - global.tune.maxrewrite)) { |
| if (req->send_max) { |
| if (req->flags & (BF_SHUTW|BF_SHUTW_NOW|BF_WRITE_ERROR|BF_WRITE_TIMEOUT)) |
| goto failed_keep_alive; |
| /* some data has still not left the buffer, wake us once that's done */ |
| buffer_dont_connect(req); |
| req->flags |= BF_READ_DONTWAIT; /* try to get back here ASAP */ |
| return 0; |
| } |
| if (req->l <= req->size - global.tune.maxrewrite) |
| http_buffer_heavy_realign(req, msg); |
| } |
| |
| /* Note that we have the same problem with the response ; we |
| * may want to send a redirect, error or anything which requires |
| * some spare space. So we'll ensure that we have at least |
| * maxrewrite bytes available in the response buffer before |
| * processing that one. This will only affect pipelined |
| * keep-alive requests. |
| */ |
| if ((txn->flags & TX_NOT_FIRST) && |
| unlikely((s->rep->flags & BF_FULL) || |
| s->rep->r < s->rep->lr || |
| s->rep->r > s->rep->data + s->rep->size - global.tune.maxrewrite)) { |
| if (s->rep->send_max) { |
| if (s->rep->flags & (BF_SHUTW|BF_SHUTW_NOW|BF_WRITE_ERROR|BF_WRITE_TIMEOUT)) |
| goto failed_keep_alive; |
| /* don't let a connection request be initiated */ |
| buffer_dont_connect(req); |
| s->rep->flags &= ~BF_EXPECT_MORE; /* speed up sending a previous response */ |
| return 0; |
| } |
| } |
| |
| if (likely(req->lr < req->r)) |
| http_msg_analyzer(req, msg, &txn->hdr_idx); |
| } |
| |
| /* 1: we might have to print this header in debug mode */ |
| if (unlikely((global.mode & MODE_DEBUG) && |
| (!(global.mode & MODE_QUIET) || (global.mode & MODE_VERBOSE)) && |
| msg->sol && |
| (msg->msg_state >= HTTP_MSG_BODY || msg->msg_state == HTTP_MSG_ERROR))) { |
| char *eol, *sol; |
| |
| sol = req->data + msg->som; |
| eol = sol + msg->sl.rq.l; |
| debug_hdr("clireq", s, sol, eol); |
| |
| sol += hdr_idx_first_pos(&txn->hdr_idx); |
| cur_idx = hdr_idx_first_idx(&txn->hdr_idx); |
| |
| while (cur_idx) { |
| eol = sol + txn->hdr_idx.v[cur_idx].len; |
| debug_hdr("clihdr", s, sol, eol); |
| sol = eol + txn->hdr_idx.v[cur_idx].cr + 1; |
| cur_idx = txn->hdr_idx.v[cur_idx].next; |
| } |
| } |
| |
| |
| /* |
| * Now we quickly check if we have found a full valid request. |
| * If not so, we check the FD and buffer states before leaving. |
| * A full request is indicated by the fact that we have seen |
| * the double LF/CRLF, so the state is >= HTTP_MSG_BODY. Invalid |
| * requests are checked first. When waiting for a second request |
| * on a keep-alive session, if we encounter and error, close, t/o, |
| * we note the error in the session flags but don't set any state. |
| * Since the error will be noted there, it will not be counted by |
| * process_session() as a frontend error. |
| * Last, we may increase some tracked counters' http request errors on |
| * the cases that are deliberately the client's fault. For instance, |
| * a timeout or connection reset is not counted as an error. However |
| * a bad request is. |
| */ |
| |
| if (unlikely(msg->msg_state < HTTP_MSG_BODY)) { |
| /* |
| * First, let's catch bad requests. |
| */ |
| if (unlikely(msg->msg_state == HTTP_MSG_ERROR)) { |
| session_inc_http_req_ctr(s); |
| session_inc_http_err_ctr(s); |
| proxy_inc_fe_req_ctr(s->fe); |
| goto return_bad_req; |
| } |
| |
| /* 1: Since we are in header mode, if there's no space |
| * left for headers, we won't be able to free more |
| * later, so the session will never terminate. We |
| * must terminate it now. |
| */ |
| if (unlikely(req->flags & BF_FULL)) { |
| /* FIXME: check if URI is set and return Status |
| * 414 Request URI too long instead. |
| */ |
| session_inc_http_req_ctr(s); |
| session_inc_http_err_ctr(s); |
| proxy_inc_fe_req_ctr(s->fe); |
| goto return_bad_req; |
| } |
| |
| /* 2: have we encountered a read error ? */ |
| else if (req->flags & BF_READ_ERROR) { |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_CLICL; |
| |
| if (txn->flags & TX_WAIT_NEXT_RQ) |
| goto failed_keep_alive; |
| |
| /* we cannot return any message on error */ |
| if (msg->err_pos >= 0) { |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| session_inc_http_err_ctr(s); |
| } |
| |
| msg->msg_state = HTTP_MSG_ERROR; |
| req->analysers = 0; |
| |
| session_inc_http_req_ctr(s); |
| proxy_inc_fe_req_ctr(s->fe); |
| s->fe->counters.failed_req++; |
| if (s->listener->counters) |
| s->listener->counters->failed_req++; |
| |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| return 0; |
| } |
| |
| /* 3: has the read timeout expired ? */ |
| else if (req->flags & BF_READ_TIMEOUT || tick_is_expired(req->analyse_exp, now_ms)) { |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_CLITO; |
| |
| if (txn->flags & TX_WAIT_NEXT_RQ) |
| goto failed_keep_alive; |
| |
| /* read timeout : give up with an error message. */ |
| if (msg->err_pos >= 0) { |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| session_inc_http_err_ctr(s); |
| } |
| txn->status = 408; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_408)); |
| msg->msg_state = HTTP_MSG_ERROR; |
| req->analysers = 0; |
| |
| session_inc_http_req_ctr(s); |
| proxy_inc_fe_req_ctr(s->fe); |
| s->fe->counters.failed_req++; |
| if (s->listener->counters) |
| s->listener->counters->failed_req++; |
| |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| return 0; |
| } |
| |
| /* 4: have we encountered a close ? */ |
| else if (req->flags & BF_SHUTR) { |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_CLICL; |
| |
| if (txn->flags & TX_WAIT_NEXT_RQ) |
| goto failed_keep_alive; |
| |
| if (msg->err_pos >= 0) |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| txn->status = 400; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_400)); |
| msg->msg_state = HTTP_MSG_ERROR; |
| req->analysers = 0; |
| |
| session_inc_http_err_ctr(s); |
| session_inc_http_req_ctr(s); |
| proxy_inc_fe_req_ctr(s->fe); |
| s->fe->counters.failed_req++; |
| if (s->listener->counters) |
| s->listener->counters->failed_req++; |
| |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| return 0; |
| } |
| |
| buffer_dont_connect(req); |
| req->flags |= BF_READ_DONTWAIT; /* try to get back here ASAP */ |
| s->rep->flags &= ~BF_EXPECT_MORE; /* speed up sending a previous response */ |
| |
| if ((msg->msg_state != HTTP_MSG_RQBEFORE) && (txn->flags & TX_WAIT_NEXT_RQ)) { |
| /* If the client starts to talk, let's fall back to |
| * request timeout processing. |
| */ |
| txn->flags &= ~TX_WAIT_NEXT_RQ; |
| req->analyse_exp = TICK_ETERNITY; |
| } |
| |
| /* just set the request timeout once at the beginning of the request */ |
| if (!tick_isset(req->analyse_exp)) { |
| if ((msg->msg_state == HTTP_MSG_RQBEFORE) && |
| (txn->flags & TX_WAIT_NEXT_RQ) && |
| tick_isset(s->be->timeout.httpka)) |
| req->analyse_exp = tick_add(now_ms, s->be->timeout.httpka); |
| else |
| req->analyse_exp = tick_add_ifset(now_ms, s->be->timeout.httpreq); |
| } |
| |
| /* we're not ready yet */ |
| return 0; |
| |
| failed_keep_alive: |
| /* Here we process low-level errors for keep-alive requests. In |
| * short, if the request is not the first one and it experiences |
| * a timeout, read error or shutdown, we just silently close so |
| * that the client can try again. |
| */ |
| txn->status = 0; |
| msg->msg_state = HTTP_MSG_RQBEFORE; |
| req->analysers = 0; |
| s->logs.logwait = 0; |
| s->rep->flags &= ~BF_EXPECT_MORE; /* speed up sending a previous response */ |
| stream_int_retnclose(req->prod, NULL); |
| return 0; |
| } |
| |
| /* OK now we have a complete HTTP request with indexed headers. Let's |
| * complete the request parsing by setting a few fields we will need |
| * later. At this point, we have the last CRLF at req->data + msg->eoh. |
| * If the request is in HTTP/0.9 form, the rule is still true, and eoh |
| * points to the CRLF of the request line. req->lr points to the first |
| * byte after the last LF. msg->col and msg->sov point to the first |
| * byte of data. msg->eol cannot be trusted because it may have been |
| * left uninitialized (for instance in the absence of headers). |
| */ |
| |
| session_inc_http_req_ctr(s); |
| proxy_inc_fe_req_ctr(s->fe); /* one more valid request for this FE */ |
| |
| if (txn->flags & TX_WAIT_NEXT_RQ) { |
| /* kill the pending keep-alive timeout */ |
| txn->flags &= ~TX_WAIT_NEXT_RQ; |
| req->analyse_exp = TICK_ETERNITY; |
| } |
| |
| |
| /* Maybe we found in invalid header name while we were configured not |
| * to block on that, so we have to capture it now. |
| */ |
| if (unlikely(msg->err_pos >= 0)) |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| |
| /* |
| * 1: identify the method |
| */ |
| txn->meth = find_http_meth(msg->sol, msg->sl.rq.m_l); |
| |
| /* we can make use of server redirect on GET and HEAD */ |
| if (txn->meth == HTTP_METH_GET || txn->meth == HTTP_METH_HEAD) |
| s->flags |= SN_REDIRECTABLE; |
| |
| /* |
| * 2: check if the URI matches the monitor_uri. |
| * We have to do this for every request which gets in, because |
| * the monitor-uri is defined by the frontend. |
| */ |
| if (unlikely((s->fe->monitor_uri_len != 0) && |
| (s->fe->monitor_uri_len == msg->sl.rq.u_l) && |
| !memcmp(msg->sol + msg->sl.rq.u, |
| s->fe->monitor_uri, |
| s->fe->monitor_uri_len))) { |
| /* |
| * We have found the monitor URI |
| */ |
| struct acl_cond *cond; |
| |
| s->flags |= SN_MONITOR; |
| |
| /* Check if we want to fail this monitor request or not */ |
| list_for_each_entry(cond, &s->fe->mon_fail_cond, list) { |
| int ret = acl_exec_cond(cond, s->fe, s, txn, ACL_DIR_REQ); |
| |
| ret = acl_pass(ret); |
| if (cond->pol == ACL_COND_UNLESS) |
| ret = !ret; |
| |
| if (ret) { |
| /* we fail this request, let's return 503 service unavail */ |
| txn->status = 503; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_503)); |
| goto return_prx_cond; |
| } |
| } |
| |
| /* nothing to fail, let's reply normaly */ |
| txn->status = 200; |
| stream_int_retnclose(req->prod, &http_200_chunk); |
| goto return_prx_cond; |
| } |
| |
| /* |
| * 3: Maybe we have to copy the original REQURI for the logs ? |
| * Note: we cannot log anymore if the request has been |
| * classified as invalid. |
| */ |
| if (unlikely(s->logs.logwait & LW_REQ)) { |
| /* we have a complete HTTP request that we must log */ |
| if ((txn->uri = pool_alloc2(pool2_requri)) != NULL) { |
| int urilen = msg->sl.rq.l; |
| |
| if (urilen >= REQURI_LEN) |
| urilen = REQURI_LEN - 1; |
| memcpy(txn->uri, &req->data[msg->som], urilen); |
| txn->uri[urilen] = 0; |
| |
| if (!(s->logs.logwait &= ~LW_REQ)) |
| s->do_log(s); |
| } else { |
| Alert("HTTP logging : out of memory.\n"); |
| } |
| } |
| |
| /* 4. We may have to convert HTTP/0.9 requests to HTTP/1.0 */ |
| if (unlikely(msg->sl.rq.v_l == 0) && !http_upgrade_v09_to_v10(req, msg, txn)) |
| goto return_bad_req; |
| |
| /* ... and check if the request is HTTP/1.1 or above */ |
| if ((msg->sl.rq.v_l == 8) && |
| ((msg->sol[msg->sl.rq.v + 5] > '1') || |
| ((msg->sol[msg->sl.rq.v + 5] == '1') && |
| (msg->sol[msg->sl.rq.v + 7] >= '1')))) |
| txn->flags |= TX_REQ_VER_11; |
| |
| /* "connection" has not been parsed yet */ |
| txn->flags &= ~(TX_HDR_CONN_PRS | TX_HDR_CONN_CLO | TX_HDR_CONN_KAL); |
| |
| /* if the frontend has "option http-use-proxy-header", we'll check if |
| * we have what looks like a proxied connection instead of a connection, |
| * and in this case set the TX_USE_PX_CONN flag to use Proxy-connection. |
| * Note that this is *not* RFC-compliant, however browsers and proxies |
| * happen to do that despite being non-standard :-( |
| * We consider that a request not beginning with either '/' or '*' is |
| * a proxied connection, which covers both "scheme://location" and |
| * CONNECT ip:port. |
| */ |
| if ((s->fe->options2 & PR_O2_USE_PXHDR) && |
| msg->sol[msg->sl.rq.u] != '/' && msg->sol[msg->sl.rq.u] != '*') |
| txn->flags |= TX_USE_PX_CONN; |
| |
| /* transfer length unknown*/ |
| txn->flags &= ~TX_REQ_XFER_LEN; |
| |
| /* 5: we may need to capture headers */ |
| if (unlikely((s->logs.logwait & LW_REQHDR) && s->fe->req_cap)) |
| capture_headers(msg->sol, &txn->hdr_idx, |
| txn->req.cap, s->fe->req_cap); |
| |
| /* 6: determine the transfer-length. |
| * According to RFC2616 #4.4, amended by the HTTPbis working group, |
| * the presence of a message-body in a REQUEST and its transfer length |
| * must be determined that way (in order of precedence) : |
| * 1. The presence of a message-body in a request is signaled by the |
| * inclusion of a Content-Length or Transfer-Encoding header field |
| * in the request's header fields. When a request message contains |
| * both a message-body of non-zero length and a method that does |
| * not define any semantics for that request message-body, then an |
| * origin server SHOULD either ignore the message-body or respond |
| * with an appropriate error message (e.g., 413). A proxy or |
| * gateway, when presented the same request, SHOULD either forward |
| * the request inbound with the message- body or ignore the |
| * message-body when determining a response. |
| * |
| * 2. If a Transfer-Encoding header field (Section 9.7) is present |
| * and the "chunked" transfer-coding (Section 6.2) is used, the |
| * transfer-length is defined by the use of this transfer-coding. |
| * If a Transfer-Encoding header field is present and the "chunked" |
| * transfer-coding is not present, the transfer-length is defined |
| * by the sender closing the connection. |
| * |
| * 3. If a Content-Length header field is present, its decimal value in |
| * OCTETs represents both the entity-length and the transfer-length. |
| * If a message is received with both a Transfer-Encoding header |
| * field and a Content-Length header field, the latter MUST be ignored. |
| * |
| * 4. By the server closing the connection. (Closing the connection |
| * cannot be used to indicate the end of a request body, since that |
| * would leave no possibility for the server to send back a response.) |
| * |
| * Whenever a transfer-coding is applied to a message-body, the set of |
| * transfer-codings MUST include "chunked", unless the message indicates |
| * it is terminated by closing the connection. When the "chunked" |
| * transfer-coding is used, it MUST be the last transfer-coding applied |
| * to the message-body. |
| */ |
| |
| use_close_only = 0; |
| ctx.idx = 0; |
| /* set TE_CHNK and XFER_LEN only if "chunked" is seen last */ |
| while ((txn->flags & TX_REQ_VER_11) && |
| http_find_header2("Transfer-Encoding", 17, msg->sol, &txn->hdr_idx, &ctx)) { |
| if (ctx.vlen == 7 && strncasecmp(ctx.line + ctx.val, "chunked", 7) == 0) |
| txn->flags |= (TX_REQ_TE_CHNK | TX_REQ_XFER_LEN); |
| else if (txn->flags & TX_REQ_TE_CHNK) { |
| /* bad transfer-encoding (chunked followed by something else) */ |
| use_close_only = 1; |
| txn->flags &= ~(TX_REQ_TE_CHNK | TX_REQ_XFER_LEN); |
| break; |
| } |
| } |
| |
| ctx.idx = 0; |
| while (!(txn->flags & TX_REQ_TE_CHNK) && !use_close_only && |
| http_find_header2("Content-Length", 14, msg->sol, &txn->hdr_idx, &ctx)) { |
| signed long long cl; |
| |
| if (!ctx.vlen) |
| goto return_bad_req; |
| |
| if (strl2llrc(ctx.line + ctx.val, ctx.vlen, &cl)) |
| goto return_bad_req; /* parse failure */ |
| |
| if (cl < 0) |
| goto return_bad_req; |
| |
| if ((txn->flags & TX_REQ_CNT_LEN) && (msg->hdr_content_len != cl)) |
| goto return_bad_req; /* already specified, was different */ |
| |
| txn->flags |= TX_REQ_CNT_LEN | TX_REQ_XFER_LEN; |
| msg->hdr_content_len |