| /* |
| * HTTP protocol analyzer |
| * |
| * Copyright 2000-2008 Willy Tarreau <w@1wt.eu> |
| * |
| * This program is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU General Public License |
| * as published by the Free Software Foundation; either version |
| * 2 of the License, or (at your option) any later version. |
| * |
| */ |
| |
| #include <ctype.h> |
| #include <errno.h> |
| #include <fcntl.h> |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <string.h> |
| #include <syslog.h> |
| #include <time.h> |
| |
| #include <sys/socket.h> |
| #include <sys/stat.h> |
| #include <sys/types.h> |
| |
| #include <common/appsession.h> |
| #include <common/compat.h> |
| #include <common/config.h> |
| #include <common/debug.h> |
| #include <common/memory.h> |
| #include <common/mini-clist.h> |
| #include <common/standard.h> |
| #include <common/ticks.h> |
| #include <common/time.h> |
| #include <common/uri_auth.h> |
| #include <common/version.h> |
| |
| #include <types/capture.h> |
| #include <types/global.h> |
| |
| #include <proto/acl.h> |
| #include <proto/backend.h> |
| #include <proto/buffers.h> |
| #include <proto/client.h> |
| #include <proto/dumpstats.h> |
| #include <proto/fd.h> |
| #include <proto/log.h> |
| #include <proto/hdr_idx.h> |
| #include <proto/proto_tcp.h> |
| #include <proto/proto_http.h> |
| #include <proto/proxy.h> |
| #include <proto/queue.h> |
| #include <proto/server.h> |
| #include <proto/session.h> |
| #include <proto/stream_interface.h> |
| #include <proto/stream_sock.h> |
| #include <proto/task.h> |
| |
| /* This is used by remote monitoring */ |
| const char HTTP_200[] = |
| "HTTP/1.0 200 OK\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>200 OK</h1>\nHAProxy: service ready.\n</body></html>\n"; |
| |
| const struct chunk http_200_chunk = { |
| .str = (char *)&HTTP_200, |
| .len = sizeof(HTTP_200)-1 |
| }; |
| |
| const char *HTTP_301 = |
| "HTTP/1.0 301 Moved Permantenly\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Location: "; /* not terminated since it will be concatenated with the URL */ |
| |
| const char *HTTP_302 = |
| "HTTP/1.0 302 Found\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Location: "; /* not terminated since it will be concatenated with the URL */ |
| |
| /* same as 302 except that the browser MUST retry with the GET method */ |
| const char *HTTP_303 = |
| "HTTP/1.0 303 See Other\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Location: "; /* not terminated since it will be concatenated with the URL */ |
| |
| /* Warning: this one is an sprintf() fmt string, with <realm> as its only argument */ |
| const char *HTTP_401_fmt = |
| "HTTP/1.0 401 Unauthorized\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "WWW-Authenticate: Basic realm=\"%s\"\r\n" |
| "\r\n" |
| "<html><body><h1>401 Unauthorized</h1>\nYou need a valid user and password to access this content.\n</body></html>\n"; |
| |
| |
| const int http_err_codes[HTTP_ERR_SIZE] = { |
| [HTTP_ERR_400] = 400, |
| [HTTP_ERR_403] = 403, |
| [HTTP_ERR_408] = 408, |
| [HTTP_ERR_500] = 500, |
| [HTTP_ERR_502] = 502, |
| [HTTP_ERR_503] = 503, |
| [HTTP_ERR_504] = 504, |
| }; |
| |
| static const char *http_err_msgs[HTTP_ERR_SIZE] = { |
| [HTTP_ERR_400] = |
| "HTTP/1.0 400 Bad request\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>400 Bad request</h1>\nYour browser sent an invalid request.\n</body></html>\n", |
| |
| [HTTP_ERR_403] = |
| "HTTP/1.0 403 Forbidden\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>403 Forbidden</h1>\nRequest forbidden by administrative rules.\n</body></html>\n", |
| |
| [HTTP_ERR_408] = |
| "HTTP/1.0 408 Request Time-out\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>408 Request Time-out</h1>\nYour browser didn't send a complete request in time.\n</body></html>\n", |
| |
| [HTTP_ERR_500] = |
| "HTTP/1.0 500 Server Error\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>500 Server Error</h1>\nAn internal server error occured.\n</body></html>\n", |
| |
| [HTTP_ERR_502] = |
| "HTTP/1.0 502 Bad Gateway\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>502 Bad Gateway</h1>\nThe server returned an invalid or incomplete response.\n</body></html>\n", |
| |
| [HTTP_ERR_503] = |
| "HTTP/1.0 503 Service Unavailable\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>503 Service Unavailable</h1>\nNo server is available to handle this request.\n</body></html>\n", |
| |
| [HTTP_ERR_504] = |
| "HTTP/1.0 504 Gateway Time-out\r\n" |
| "Cache-Control: no-cache\r\n" |
| "Connection: close\r\n" |
| "Content-Type: text/html\r\n" |
| "\r\n" |
| "<html><body><h1>504 Gateway Time-out</h1>\nThe server didn't respond in time.\n</body></html>\n", |
| |
| }; |
| |
| /* We must put the messages here since GCC cannot initialize consts depending |
| * on strlen(). |
| */ |
| struct chunk http_err_chunks[HTTP_ERR_SIZE]; |
| |
| #define FD_SETS_ARE_BITFIELDS |
| #ifdef FD_SETS_ARE_BITFIELDS |
| /* |
| * This map is used with all the FD_* macros to check whether a particular bit |
| * is set or not. Each bit represents an ACSII code. FD_SET() sets those bytes |
| * which should be encoded. When FD_ISSET() returns non-zero, it means that the |
| * byte should be encoded. Be careful to always pass bytes from 0 to 255 |
| * exclusively to the macros. |
| */ |
| fd_set hdr_encode_map[(sizeof(fd_set) > (256/8)) ? 1 : ((256/8) / sizeof(fd_set))]; |
| fd_set url_encode_map[(sizeof(fd_set) > (256/8)) ? 1 : ((256/8) / sizeof(fd_set))]; |
| |
| #else |
| #error "Check if your OS uses bitfields for fd_sets" |
| #endif |
| |
| void init_proto_http() |
| { |
| int i; |
| char *tmp; |
| int msg; |
| |
| for (msg = 0; msg < HTTP_ERR_SIZE; msg++) { |
| if (!http_err_msgs[msg]) { |
| Alert("Internal error: no message defined for HTTP return code %d. Aborting.\n", msg); |
| abort(); |
| } |
| |
| http_err_chunks[msg].str = (char *)http_err_msgs[msg]; |
| http_err_chunks[msg].len = strlen(http_err_msgs[msg]); |
| } |
| |
| /* initialize the log header encoding map : '{|}"#' should be encoded with |
| * '#' as prefix, as well as non-printable characters ( <32 or >= 127 ). |
| * URL encoding only requires '"', '#' to be encoded as well as non- |
| * printable characters above. |
| */ |
| memset(hdr_encode_map, 0, sizeof(hdr_encode_map)); |
| memset(url_encode_map, 0, sizeof(url_encode_map)); |
| for (i = 0; i < 32; i++) { |
| FD_SET(i, hdr_encode_map); |
| FD_SET(i, url_encode_map); |
| } |
| for (i = 127; i < 256; i++) { |
| FD_SET(i, hdr_encode_map); |
| FD_SET(i, url_encode_map); |
| } |
| |
| tmp = "\"#{|}"; |
| while (*tmp) { |
| FD_SET(*tmp, hdr_encode_map); |
| tmp++; |
| } |
| |
| tmp = "\"#"; |
| while (*tmp) { |
| FD_SET(*tmp, url_encode_map); |
| tmp++; |
| } |
| |
| /* memory allocations */ |
| pool2_requri = create_pool("requri", REQURI_LEN, MEM_F_SHARED); |
| pool2_capture = create_pool("capture", CAPTURE_LEN, MEM_F_SHARED); |
| } |
| |
| /* |
| * We have 26 list of methods (1 per first letter), each of which can have |
| * up to 3 entries (2 valid, 1 null). |
| */ |
| struct http_method_desc { |
| http_meth_t meth; |
| int len; |
| const char text[8]; |
| }; |
| |
| const struct http_method_desc http_methods[26][3] = { |
| ['C' - 'A'] = { |
| [0] = { .meth = HTTP_METH_CONNECT , .len=7, .text="CONNECT" }, |
| }, |
| ['D' - 'A'] = { |
| [0] = { .meth = HTTP_METH_DELETE , .len=6, .text="DELETE" }, |
| }, |
| ['G' - 'A'] = { |
| [0] = { .meth = HTTP_METH_GET , .len=3, .text="GET" }, |
| }, |
| ['H' - 'A'] = { |
| [0] = { .meth = HTTP_METH_HEAD , .len=4, .text="HEAD" }, |
| }, |
| ['P' - 'A'] = { |
| [0] = { .meth = HTTP_METH_POST , .len=4, .text="POST" }, |
| [1] = { .meth = HTTP_METH_PUT , .len=3, .text="PUT" }, |
| }, |
| ['T' - 'A'] = { |
| [0] = { .meth = HTTP_METH_TRACE , .len=5, .text="TRACE" }, |
| }, |
| /* rest is empty like this : |
| * [1] = { .meth = HTTP_METH_NONE , .len=0, .text="" }, |
| */ |
| }; |
| |
| /* It is about twice as fast on recent architectures to lookup a byte in a |
| * table than to perform a boolean AND or OR between two tests. Refer to |
| * RFC2616 for those chars. |
| */ |
| |
| const char http_is_spht[256] = { |
| [' '] = 1, ['\t'] = 1, |
| }; |
| |
| const char http_is_crlf[256] = { |
| ['\r'] = 1, ['\n'] = 1, |
| }; |
| |
| const char http_is_lws[256] = { |
| [' '] = 1, ['\t'] = 1, |
| ['\r'] = 1, ['\n'] = 1, |
| }; |
| |
| const char http_is_sep[256] = { |
| ['('] = 1, [')'] = 1, ['<'] = 1, ['>'] = 1, |
| ['@'] = 1, [','] = 1, [';'] = 1, [':'] = 1, |
| ['"'] = 1, ['/'] = 1, ['['] = 1, [']'] = 1, |
| ['{'] = 1, ['}'] = 1, ['?'] = 1, ['='] = 1, |
| [' '] = 1, ['\t'] = 1, ['\\'] = 1, |
| }; |
| |
| const char http_is_ctl[256] = { |
| [0 ... 31] = 1, |
| [127] = 1, |
| }; |
| |
| /* |
| * A token is any ASCII char that is neither a separator nor a CTL char. |
| * Do not overwrite values in assignment since gcc-2.95 will not handle |
| * them correctly. Instead, define every non-CTL char's status. |
| */ |
| const char http_is_token[256] = { |
| [' '] = 0, ['!'] = 1, ['"'] = 0, ['#'] = 1, |
| ['$'] = 1, ['%'] = 1, ['&'] = 1, ['\''] = 1, |
| ['('] = 0, [')'] = 0, ['*'] = 1, ['+'] = 1, |
| [','] = 0, ['-'] = 1, ['.'] = 1, ['/'] = 0, |
| ['0'] = 1, ['1'] = 1, ['2'] = 1, ['3'] = 1, |
| ['4'] = 1, ['5'] = 1, ['6'] = 1, ['7'] = 1, |
| ['8'] = 1, ['9'] = 1, [':'] = 0, [';'] = 0, |
| ['<'] = 0, ['='] = 0, ['>'] = 0, ['?'] = 0, |
| ['@'] = 0, ['A'] = 1, ['B'] = 1, ['C'] = 1, |
| ['D'] = 1, ['E'] = 1, ['F'] = 1, ['G'] = 1, |
| ['H'] = 1, ['I'] = 1, ['J'] = 1, ['K'] = 1, |
| ['L'] = 1, ['M'] = 1, ['N'] = 1, ['O'] = 1, |
| ['P'] = 1, ['Q'] = 1, ['R'] = 1, ['S'] = 1, |
| ['T'] = 1, ['U'] = 1, ['V'] = 1, ['W'] = 1, |
| ['X'] = 1, ['Y'] = 1, ['Z'] = 1, ['['] = 0, |
| ['\\'] = 0, [']'] = 0, ['^'] = 1, ['_'] = 1, |
| ['`'] = 1, ['a'] = 1, ['b'] = 1, ['c'] = 1, |
| ['d'] = 1, ['e'] = 1, ['f'] = 1, ['g'] = 1, |
| ['h'] = 1, ['i'] = 1, ['j'] = 1, ['k'] = 1, |
| ['l'] = 1, ['m'] = 1, ['n'] = 1, ['o'] = 1, |
| ['p'] = 1, ['q'] = 1, ['r'] = 1, ['s'] = 1, |
| ['t'] = 1, ['u'] = 1, ['v'] = 1, ['w'] = 1, |
| ['x'] = 1, ['y'] = 1, ['z'] = 1, ['{'] = 0, |
| ['|'] = 1, ['}'] = 0, ['~'] = 1, |
| }; |
| |
| |
| /* |
| * An http ver_token is any ASCII which can be found in an HTTP version, |
| * which includes 'H', 'T', 'P', '/', '.' and any digit. |
| */ |
| const char http_is_ver_token[256] = { |
| ['.'] = 1, ['/'] = 1, |
| ['0'] = 1, ['1'] = 1, ['2'] = 1, ['3'] = 1, ['4'] = 1, |
| ['5'] = 1, ['6'] = 1, ['7'] = 1, ['8'] = 1, ['9'] = 1, |
| ['H'] = 1, ['P'] = 1, ['T'] = 1, |
| }; |
| |
| |
| /* |
| * Adds a header and its CRLF at the tail of buffer <b>, just before the last |
| * CRLF. Text length is measured first, so it cannot be NULL. |
| * The header is also automatically added to the index <hdr_idx>, and the end |
| * of headers is automatically adjusted. The number of bytes added is returned |
| * on success, otherwise <0 is returned indicating an error. |
| */ |
| int http_header_add_tail(struct buffer *b, struct http_msg *msg, |
| struct hdr_idx *hdr_idx, const char *text) |
| { |
| int bytes, len; |
| |
| len = strlen(text); |
| bytes = buffer_insert_line2(b, b->data + msg->eoh, text, len); |
| if (!bytes) |
| return -1; |
| msg->eoh += bytes; |
| return hdr_idx_add(len, 1, hdr_idx, hdr_idx->tail); |
| } |
| |
| /* |
| * Adds a header and its CRLF at the tail of buffer <b>, just before the last |
| * CRLF. <len> bytes are copied, not counting the CRLF. If <text> is NULL, then |
| * the buffer is only opened and the space reserved, but nothing is copied. |
| * The header is also automatically added to the index <hdr_idx>, and the end |
| * of headers is automatically adjusted. The number of bytes added is returned |
| * on success, otherwise <0 is returned indicating an error. |
| */ |
| int http_header_add_tail2(struct buffer *b, struct http_msg *msg, |
| struct hdr_idx *hdr_idx, const char *text, int len) |
| { |
| int bytes; |
| |
| bytes = buffer_insert_line2(b, b->data + msg->eoh, text, len); |
| if (!bytes) |
| return -1; |
| msg->eoh += bytes; |
| return hdr_idx_add(len, 1, hdr_idx, hdr_idx->tail); |
| } |
| |
| /* |
| * Checks if <hdr> is exactly <name> for <len> chars, and ends with a colon. |
| * If so, returns the position of the first non-space character relative to |
| * <hdr>, or <end>-<hdr> if not found before. If no value is found, it tries |
| * to return a pointer to the place after the first space. Returns 0 if the |
| * header name does not match. Checks are case-insensitive. |
| */ |
| int http_header_match2(const char *hdr, const char *end, |
| const char *name, int len) |
| { |
| const char *val; |
| |
| if (hdr + len >= end) |
| return 0; |
| if (hdr[len] != ':') |
| return 0; |
| if (strncasecmp(hdr, name, len) != 0) |
| return 0; |
| val = hdr + len + 1; |
| while (val < end && HTTP_IS_SPHT(*val)) |
| val++; |
| if ((val >= end) && (len + 2 <= end - hdr)) |
| return len + 2; /* we may replace starting from second space */ |
| return val - hdr; |
| } |
| |
| /* Find the end of the header value contained between <s> and <e>. |
| * See RFC2616, par 2.2 for more information. Note that it requires |
| * a valid header to return a valid result. |
| */ |
| const char *find_hdr_value_end(const char *s, const char *e) |
| { |
| int quoted, qdpair; |
| |
| quoted = qdpair = 0; |
| for (; s < e; s++) { |
| if (qdpair) qdpair = 0; |
| else if (quoted && *s == '\\') qdpair = 1; |
| else if (quoted && *s == '"') quoted = 0; |
| else if (*s == '"') quoted = 1; |
| else if (*s == ',') return s; |
| } |
| return s; |
| } |
| |
| /* Find the first or next occurrence of header <name> in message buffer <sol> |
| * using headers index <idx>, and return it in the <ctx> structure. This |
| * structure holds everything necessary to use the header and find next |
| * occurrence. If its <idx> member is 0, the header is searched from the |
| * beginning. Otherwise, the next occurrence is returned. The function returns |
| * 1 when it finds a value, and 0 when there is no more. |
| */ |
| int http_find_header2(const char *name, int len, |
| const char *sol, struct hdr_idx *idx, |
| struct hdr_ctx *ctx) |
| { |
| const char *eol, *sov; |
| int cur_idx; |
| |
| if (ctx->idx) { |
| /* We have previously returned a value, let's search |
| * another one on the same line. |
| */ |
| cur_idx = ctx->idx; |
| sol = ctx->line; |
| sov = sol + ctx->val + ctx->vlen; |
| eol = sol + idx->v[cur_idx].len; |
| |
| if (sov >= eol) |
| /* no more values in this header */ |
| goto next_hdr; |
| |
| /* values remaining for this header, skip the comma */ |
| sov++; |
| while (sov < eol && http_is_lws[(unsigned char)*sov]) |
| sov++; |
| |
| goto return_hdr; |
| } |
| |
| /* first request for this header */ |
| sol += hdr_idx_first_pos(idx); |
| cur_idx = hdr_idx_first_idx(idx); |
| |
| while (cur_idx) { |
| eol = sol + idx->v[cur_idx].len; |
| |
| if (len == 0) { |
| /* No argument was passed, we want any header. |
| * To achieve this, we simply build a fake request. */ |
| while (sol + len < eol && sol[len] != ':') |
| len++; |
| name = sol; |
| } |
| |
| if ((len < eol - sol) && |
| (sol[len] == ':') && |
| (strncasecmp(sol, name, len) == 0)) { |
| |
| sov = sol + len + 1; |
| while (sov < eol && http_is_lws[(unsigned char)*sov]) |
| sov++; |
| return_hdr: |
| ctx->line = sol; |
| ctx->idx = cur_idx; |
| ctx->val = sov - sol; |
| |
| eol = find_hdr_value_end(sov, eol); |
| ctx->vlen = eol - sov; |
| return 1; |
| } |
| next_hdr: |
| sol = eol + idx->v[cur_idx].cr + 1; |
| cur_idx = idx->v[cur_idx].next; |
| } |
| return 0; |
| } |
| |
| int http_find_header(const char *name, |
| const char *sol, struct hdr_idx *idx, |
| struct hdr_ctx *ctx) |
| { |
| return http_find_header2(name, strlen(name), sol, idx, ctx); |
| } |
| |
| /* This function handles a server error at the stream interface level. The |
| * stream interface is assumed to be already in a closed state. An optional |
| * message is copied into the input buffer, and an HTTP status code stored. |
| * The error flags are set to the values in arguments. Any pending request |
| * in this buffer will be lost. |
| */ |
| static void http_server_error(struct session *t, struct stream_interface *si, |
| int err, int finst, int status, const struct chunk *msg) |
| { |
| buffer_erase(si->ob); |
| buffer_erase(si->ib); |
| buffer_write_ena(si->ib); |
| if (status > 0 && msg) { |
| t->txn.status = status; |
| buffer_write(si->ib, msg->str, msg->len); |
| } |
| if (!(t->flags & SN_ERR_MASK)) |
| t->flags |= err; |
| if (!(t->flags & SN_FINST_MASK)) |
| t->flags |= finst; |
| } |
| |
| /* This function returns the appropriate error location for the given session |
| * and message. |
| */ |
| |
| struct chunk *error_message(struct session *s, int msgnum) |
| { |
| if (s->be->errmsg[msgnum].str) |
| return &s->be->errmsg[msgnum]; |
| else if (s->fe->errmsg[msgnum].str) |
| return &s->fe->errmsg[msgnum]; |
| else |
| return &http_err_chunks[msgnum]; |
| } |
| |
| /* |
| * returns HTTP_METH_NONE if there is nothing valid to read (empty or non-text |
| * string), HTTP_METH_OTHER for unknown methods, or the identified method. |
| */ |
| static http_meth_t find_http_meth(const char *str, const int len) |
| { |
| unsigned char m; |
| const struct http_method_desc *h; |
| |
| m = ((unsigned)*str - 'A'); |
| |
| if (m < 26) { |
| for (h = http_methods[m]; h->len > 0; h++) { |
| if (unlikely(h->len != len)) |
| continue; |
| if (likely(memcmp(str, h->text, h->len) == 0)) |
| return h->meth; |
| }; |
| return HTTP_METH_OTHER; |
| } |
| return HTTP_METH_NONE; |
| |
| } |
| |
| /* Parse the URI from the given transaction (which is assumed to be in request |
| * phase) and look for the "/" beginning the PATH. If not found, return NULL. |
| * It is returned otherwise. |
| */ |
| static char * |
| http_get_path(struct http_txn *txn) |
| { |
| char *ptr, *end; |
| |
| ptr = txn->req.sol + txn->req.sl.rq.u; |
| end = ptr + txn->req.sl.rq.u_l; |
| |
| if (ptr >= end) |
| return NULL; |
| |
| /* RFC2616, par. 5.1.2 : |
| * Request-URI = "*" | absuri | abspath | authority |
| */ |
| |
| if (*ptr == '*') |
| return NULL; |
| |
| if (isalpha((unsigned char)*ptr)) { |
| /* this is a scheme as described by RFC3986, par. 3.1 */ |
| ptr++; |
| while (ptr < end && |
| (isalnum((unsigned char)*ptr) || *ptr == '+' || *ptr == '-' || *ptr == '.')) |
| ptr++; |
| /* skip '://' */ |
| if (ptr == end || *ptr++ != ':') |
| return NULL; |
| if (ptr == end || *ptr++ != '/') |
| return NULL; |
| if (ptr == end || *ptr++ != '/') |
| return NULL; |
| } |
| /* skip [user[:passwd]@]host[:[port]] */ |
| |
| while (ptr < end && *ptr != '/') |
| ptr++; |
| |
| if (ptr == end) |
| return NULL; |
| |
| /* OK, we got the '/' ! */ |
| return ptr; |
| } |
| |
| /* Returns a 302 for a redirectable request. This may only be called just after |
| * the stream interface has moved to SI_ST_ASS. Unprocessable requests are |
| * left unchanged and will follow normal proxy processing. |
| */ |
| void perform_http_redirect(struct session *s, struct stream_interface *si) |
| { |
| struct http_txn *txn; |
| struct chunk rdr; |
| char *path; |
| int len; |
| |
| /* 1: create the response header */ |
| rdr.len = strlen(HTTP_302); |
| rdr.str = trash; |
| memcpy(rdr.str, HTTP_302, rdr.len); |
| |
| /* 2: add the server's prefix */ |
| if (rdr.len + s->srv->rdr_len > sizeof(trash)) |
| return; |
| |
| memcpy(rdr.str + rdr.len, s->srv->rdr_pfx, s->srv->rdr_len); |
| rdr.len += s->srv->rdr_len; |
| |
| /* 3: add the request URI */ |
| txn = &s->txn; |
| path = http_get_path(txn); |
| if (!path) |
| return; |
| |
| len = txn->req.sl.rq.u_l + (txn->req.sol+txn->req.sl.rq.u) - path; |
| if (rdr.len + len > sizeof(trash) - 4) /* 4 for CRLF-CRLF */ |
| return; |
| |
| memcpy(rdr.str + rdr.len, path, len); |
| rdr.len += len; |
| memcpy(rdr.str + rdr.len, "\r\n\r\n", 4); |
| rdr.len += 4; |
| |
| /* prepare to return without error. */ |
| si->shutr(si); |
| si->shutw(si); |
| si->err_type = SI_ET_NONE; |
| si->err_loc = NULL; |
| si->state = SI_ST_CLO; |
| |
| /* send the message */ |
| http_server_error(s, si, SN_ERR_PRXCOND, SN_FINST_C, 302, &rdr); |
| |
| /* FIXME: we should increase a counter of redirects per server and per backend. */ |
| if (s->srv) |
| srv_inc_sess_ctr(s->srv); |
| } |
| |
| /* Return the error message corresponding to si->err_type. It is assumed |
| * that the server side is closed. Note that err_type is actually a |
| * bitmask, where almost only aborts may be cumulated with other |
| * values. We consider that aborted operations are more important |
| * than timeouts or errors due to the fact that nobody else in the |
| * logs might explain incomplete retries. All others should avoid |
| * being cumulated. It should normally not be possible to have multiple |
| * aborts at once, but just in case, the first one in sequence is reported. |
| */ |
| void http_return_srv_error(struct session *s, struct stream_interface *si) |
| { |
| int err_type = si->err_type; |
| |
| if (err_type & SI_ET_QUEUE_ABRT) |
| http_server_error(s, si, SN_ERR_CLICL, SN_FINST_Q, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_CONN_ABRT) |
| http_server_error(s, si, SN_ERR_CLICL, SN_FINST_C, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_QUEUE_TO) |
| http_server_error(s, si, SN_ERR_SRVTO, SN_FINST_Q, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_QUEUE_ERR) |
| http_server_error(s, si, SN_ERR_SRVCL, SN_FINST_Q, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_CONN_TO) |
| http_server_error(s, si, SN_ERR_SRVTO, SN_FINST_C, |
| 503, error_message(s, HTTP_ERR_503)); |
| else if (err_type & SI_ET_CONN_ERR) |
| http_server_error(s, si, SN_ERR_SRVCL, SN_FINST_C, |
| 503, error_message(s, HTTP_ERR_503)); |
| else /* SI_ET_CONN_OTHER and others */ |
| http_server_error(s, si, SN_ERR_INTERNAL, SN_FINST_C, |
| 500, error_message(s, HTTP_ERR_500)); |
| } |
| |
| extern const char sess_term_cond[8]; |
| extern const char sess_fin_state[8]; |
| extern const char *monthname[12]; |
| const char sess_cookie[4] = "NIDV"; /* No cookie, Invalid cookie, cookie for a Down server, Valid cookie */ |
| const char sess_set_cookie[8] = "N1I3PD5R"; /* No set-cookie, unknown, Set-Cookie Inserted, unknown, |
| Set-cookie seen and left unchanged (passive), Set-cookie Deleted, |
| unknown, Set-cookie Rewritten */ |
| struct pool_head *pool2_requri; |
| struct pool_head *pool2_capture; |
| |
| void http_sess_clflog(struct session *s) |
| { |
| char pn[INET6_ADDRSTRLEN + strlen(":65535")]; |
| struct proxy *fe = s->fe; |
| struct proxy *be = s->be; |
| struct proxy *prx_log; |
| struct http_txn *txn = &s->txn; |
| int tolog, level, err; |
| char *uri, *h; |
| char *svid; |
| struct tm tm; |
| static char tmpline[MAX_SYSLOG_LEN]; |
| int hdr; |
| size_t w; |
| int t_request; |
| |
| prx_log = fe; |
| err = (s->flags & (SN_ERR_MASK | SN_REDISP)) || |
| (s->conn_retries != be->conn_retries) || |
| txn->status >= 500; |
| |
| if (s->cli_addr.ss_family == AF_INET) |
| inet_ntop(AF_INET, |
| (const void *)&((struct sockaddr_in *)&s->cli_addr)->sin_addr, |
| pn, sizeof(pn)); |
| else |
| inet_ntop(AF_INET6, |
| (const void *)&((struct sockaddr_in6 *)(&s->cli_addr))->sin6_addr, |
| pn, sizeof(pn)); |
| |
| get_gmtime(s->logs.accept_date.tv_sec, &tm); |
| |
| /* FIXME: let's limit ourselves to frontend logging for now. */ |
| tolog = fe->to_log; |
| |
| h = tmpline; |
| |
| w = snprintf(h, sizeof(tmpline), |
| "%s - - [%02d/%s/%04d:%02d:%02d:%02d +0000]", |
| pn, |
| tm.tm_mday, monthname[tm.tm_mon], tm.tm_year+1900, |
| tm.tm_hour, tm.tm_min, tm.tm_sec); |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| if (h >= tmpline + sizeof(tmpline) - 4) |
| goto trunc; |
| |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| uri = txn->uri ? txn->uri : "<BADREQ>"; |
| h = encode_string(h, tmpline + sizeof(tmpline) - 1, |
| '#', url_encode_map, uri); |
| *(h++) = '\"'; |
| |
| w = snprintf(h, sizeof(tmpline) - (h - tmpline), " %d %lld", txn->status, s->logs.bytes_out); |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| if (h >= tmpline + sizeof(tmpline) - 9) |
| goto trunc; |
| memcpy(h, " \"-\" \"-\"", 8); |
| h += 8; |
| |
| w = snprintf(h, sizeof(tmpline) - (h - tmpline), |
| " %d %03d", |
| (s->cli_addr.ss_family == AF_INET) ? |
| ntohs(((struct sockaddr_in *)&s->cli_addr)->sin_port) : |
| ntohs(((struct sockaddr_in6 *)&s->cli_addr)->sin6_port), |
| (int)s->logs.accept_date.tv_usec/1000); |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| w = strlen(fe->id); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, fe->id, w); |
| h += w; |
| *(h++) = '\"'; |
| |
| w = strlen(be->id); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, be->id, w); |
| h += w; |
| *(h++) = '\"'; |
| |
| svid = (tolog & LW_SVID) ? |
| (s->data_source != DATA_SRC_STATS) ? |
| (s->srv != NULL) ? s->srv->id : "<NOSRV>" : "<STATS>" : "-"; |
| |
| w = strlen(svid); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, svid, w); |
| h += w; |
| *(h++) = '\"'; |
| |
| t_request = -1; |
| if (tv_isge(&s->logs.tv_request, &s->logs.tv_accept)) |
| t_request = tv_ms_elapsed(&s->logs.tv_accept, &s->logs.tv_request); |
| w = snprintf(h, sizeof(tmpline) - (h - tmpline), |
| " %d %ld %ld %ld %ld", |
| t_request, |
| (s->logs.t_queue >= 0) ? s->logs.t_queue - t_request : -1, |
| (s->logs.t_connect >= 0) ? s->logs.t_connect - s->logs.t_queue : -1, |
| (s->logs.t_data >= 0) ? s->logs.t_data - s->logs.t_connect : -1, |
| s->logs.t_close); |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| if (h >= tmpline + sizeof(tmpline) - 8) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| *(h++) = sess_term_cond[(s->flags & SN_ERR_MASK) >> SN_ERR_SHIFT]; |
| *(h++) = sess_fin_state[(s->flags & SN_FINST_MASK) >> SN_FINST_SHIFT]; |
| *(h++) = (be->options & PR_O_COOK_ANY) ? sess_cookie[(txn->flags & TX_CK_MASK) >> TX_CK_SHIFT] : '-', |
| *(h++) = (be->options & PR_O_COOK_ANY) ? sess_set_cookie[(txn->flags & TX_SCK_MASK) >> TX_SCK_SHIFT] : '-'; |
| *(h++) = '\"'; |
| |
| w = snprintf(h, sizeof(tmpline) - (h - tmpline), |
| " %d %d %d %d %d %ld %ld", |
| actconn, fe->feconn, be->beconn, s->srv ? s->srv->cur_sess : 0, |
| (s->conn_retries > 0) ? (be->conn_retries - s->conn_retries) : be->conn_retries, |
| s->logs.srv_queue_size, s->logs.prx_queue_size); |
| |
| if (w < 0 || w >= sizeof(tmpline) - (h - tmpline)) |
| goto trunc; |
| h += w; |
| |
| if (txn->cli_cookie) { |
| w = strlen(txn->cli_cookie); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, txn->cli_cookie, w); |
| h += w; |
| *(h++) = '\"'; |
| } else { |
| if (h >= tmpline + sizeof(tmpline) - 5) |
| goto trunc; |
| memcpy(h, " \"-\"", 4); |
| h += 4; |
| } |
| |
| if (txn->srv_cookie) { |
| w = strlen(txn->srv_cookie); |
| if (h >= tmpline + sizeof(tmpline) - 4 - w) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| memcpy(h, txn->srv_cookie, w); |
| h += w; |
| *(h++) = '\"'; |
| } else { |
| if (h >= tmpline + sizeof(tmpline) - 5) |
| goto trunc; |
| memcpy(h, " \"-\"", 4); |
| h += 4; |
| } |
| |
| if ((fe->to_log & LW_REQHDR) && txn->req.cap) { |
| for (hdr = 0; hdr < fe->nb_req_cap; hdr++) { |
| if (h >= sizeof (tmpline) + tmpline - 4) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| h = encode_string(h, tmpline + sizeof(tmpline) - 2, |
| '#', hdr_encode_map, txn->req.cap[hdr]); |
| *(h++) = '\"'; |
| } |
| } |
| |
| if ((fe->to_log & LW_RSPHDR) && txn->rsp.cap) { |
| for (hdr = 0; hdr < fe->nb_rsp_cap; hdr++) { |
| if (h >= sizeof (tmpline) + tmpline - 4) |
| goto trunc; |
| *(h++) = ' '; |
| *(h++) = '\"'; |
| h = encode_string(h, tmpline + sizeof(tmpline) - 2, |
| '#', hdr_encode_map, txn->rsp.cap[hdr]); |
| *(h++) = '\"'; |
| } |
| } |
| |
| trunc: |
| *h = '\0'; |
| |
| level = LOG_INFO; |
| if (err && (fe->options2 & PR_O2_LOGERRORS)) |
| level = LOG_ERR; |
| |
| send_log(prx_log, level, "%s\n", tmpline); |
| |
| s->logs.logwait = 0; |
| } |
| |
| /* |
| * send a log for the session when we have enough info about it. |
| * Will not log if the frontend has no log defined. |
| */ |
| void http_sess_log(struct session *s) |
| { |
| char pn[INET6_ADDRSTRLEN + strlen(":65535")]; |
| struct proxy *fe = s->fe; |
| struct proxy *be = s->be; |
| struct proxy *prx_log; |
| struct http_txn *txn = &s->txn; |
| int tolog, level, err; |
| char *uri, *h; |
| char *svid; |
| struct tm tm; |
| static char tmpline[MAX_SYSLOG_LEN]; |
| int t_request; |
| int hdr; |
| |
| /* if we don't want to log normal traffic, return now */ |
| err = (s->flags & (SN_ERR_MASK | SN_REDISP)) || |
| (s->conn_retries != be->conn_retries) || |
| txn->status >= 500; |
| if (!err && (fe->options2 & PR_O2_NOLOGNORM)) |
| return; |
| |
| if (fe->logfac1 < 0 && fe->logfac2 < 0) |
| return; |
| prx_log = fe; |
| |
| if (prx_log->options2 & PR_O2_CLFLOG) |
| return http_sess_clflog(s); |
| |
| if (s->cli_addr.ss_family == AF_INET) |
| inet_ntop(AF_INET, |
| (const void *)&((struct sockaddr_in *)&s->cli_addr)->sin_addr, |
| pn, sizeof(pn)); |
| else |
| inet_ntop(AF_INET6, |
| (const void *)&((struct sockaddr_in6 *)(&s->cli_addr))->sin6_addr, |
| pn, sizeof(pn)); |
| |
| get_localtime(s->logs.accept_date.tv_sec, &tm); |
| |
| /* FIXME: let's limit ourselves to frontend logging for now. */ |
| tolog = fe->to_log; |
| |
| h = tmpline; |
| if (fe->to_log & LW_REQHDR && |
| txn->req.cap && |
| (h < tmpline + sizeof(tmpline) - 10)) { |
| *(h++) = ' '; |
| *(h++) = '{'; |
| for (hdr = 0; hdr < fe->nb_req_cap; hdr++) { |
| if (hdr) |
| *(h++) = '|'; |
| if (txn->req.cap[hdr] != NULL) |
| h = encode_string(h, tmpline + sizeof(tmpline) - 7, |
| '#', hdr_encode_map, txn->req.cap[hdr]); |
| } |
| *(h++) = '}'; |
| } |
| |
| if (fe->to_log & LW_RSPHDR && |
| txn->rsp.cap && |
| (h < tmpline + sizeof(tmpline) - 7)) { |
| *(h++) = ' '; |
| *(h++) = '{'; |
| for (hdr = 0; hdr < fe->nb_rsp_cap; hdr++) { |
| if (hdr) |
| *(h++) = '|'; |
| if (txn->rsp.cap[hdr] != NULL) |
| h = encode_string(h, tmpline + sizeof(tmpline) - 4, |
| '#', hdr_encode_map, txn->rsp.cap[hdr]); |
| } |
| *(h++) = '}'; |
| } |
| |
| if (h < tmpline + sizeof(tmpline) - 4) { |
| *(h++) = ' '; |
| *(h++) = '"'; |
| uri = txn->uri ? txn->uri : "<BADREQ>"; |
| h = encode_string(h, tmpline + sizeof(tmpline) - 1, |
| '#', url_encode_map, uri); |
| *(h++) = '"'; |
| } |
| *h = '\0'; |
| |
| svid = (tolog & LW_SVID) ? |
| (s->data_source != DATA_SRC_STATS) ? |
| (s->srv != NULL) ? s->srv->id : "<NOSRV>" : "<STATS>" : "-"; |
| |
| t_request = -1; |
| if (tv_isge(&s->logs.tv_request, &s->logs.tv_accept)) |
| t_request = tv_ms_elapsed(&s->logs.tv_accept, &s->logs.tv_request); |
| |
| level = LOG_INFO; |
| if (err && (fe->options2 & PR_O2_LOGERRORS)) |
| level = LOG_ERR; |
| |
| send_log(prx_log, level, |
| "%s:%d [%02d/%s/%04d:%02d:%02d:%02d.%03d]" |
| " %s %s/%s %d/%ld/%ld/%ld/%s%ld %d %s%lld" |
| " %s %s %c%c%c%c %d/%d/%d/%d/%s%u %ld/%ld%s\n", |
| pn, |
| (s->cli_addr.ss_family == AF_INET) ? |
| ntohs(((struct sockaddr_in *)&s->cli_addr)->sin_port) : |
| ntohs(((struct sockaddr_in6 *)&s->cli_addr)->sin6_port), |
| tm.tm_mday, monthname[tm.tm_mon], tm.tm_year+1900, |
| tm.tm_hour, tm.tm_min, tm.tm_sec, (int)s->logs.accept_date.tv_usec/1000, |
| fe->id, be->id, svid, |
| t_request, |
| (s->logs.t_queue >= 0) ? s->logs.t_queue - t_request : -1, |
| (s->logs.t_connect >= 0) ? s->logs.t_connect - s->logs.t_queue : -1, |
| (s->logs.t_data >= 0) ? s->logs.t_data - s->logs.t_connect : -1, |
| (tolog & LW_BYTES) ? "" : "+", s->logs.t_close, |
| txn->status, |
| (tolog & LW_BYTES) ? "" : "+", s->logs.bytes_out, |
| txn->cli_cookie ? txn->cli_cookie : "-", |
| txn->srv_cookie ? txn->srv_cookie : "-", |
| sess_term_cond[(s->flags & SN_ERR_MASK) >> SN_ERR_SHIFT], |
| sess_fin_state[(s->flags & SN_FINST_MASK) >> SN_FINST_SHIFT], |
| (be->options & PR_O_COOK_ANY) ? sess_cookie[(txn->flags & TX_CK_MASK) >> TX_CK_SHIFT] : '-', |
| (be->options & PR_O_COOK_ANY) ? sess_set_cookie[(txn->flags & TX_SCK_MASK) >> TX_SCK_SHIFT] : '-', |
| actconn, fe->feconn, be->beconn, s->srv ? s->srv->cur_sess : 0, |
| (s->flags & SN_REDISP)?"+":"", |
| (s->conn_retries>0)?(be->conn_retries - s->conn_retries):be->conn_retries, |
| s->logs.srv_queue_size, s->logs.prx_queue_size, tmpline); |
| |
| s->logs.logwait = 0; |
| } |
| |
| |
| /* |
| * Capture headers from message starting at <som> according to header list |
| * <cap_hdr>, and fill the <idx> structure appropriately. |
| */ |
| void capture_headers(char *som, struct hdr_idx *idx, |
| char **cap, struct cap_hdr *cap_hdr) |
| { |
| char *eol, *sol, *col, *sov; |
| int cur_idx; |
| struct cap_hdr *h; |
| int len; |
| |
| sol = som + hdr_idx_first_pos(idx); |
| cur_idx = hdr_idx_first_idx(idx); |
| |
| while (cur_idx) { |
| eol = sol + idx->v[cur_idx].len; |
| |
| col = sol; |
| while (col < eol && *col != ':') |
| col++; |
| |
| sov = col + 1; |
| while (sov < eol && http_is_lws[(unsigned char)*sov]) |
| sov++; |
| |
| for (h = cap_hdr; h; h = h->next) { |
| if ((h->namelen == col - sol) && |
| (strncasecmp(sol, h->name, h->namelen) == 0)) { |
| if (cap[h->index] == NULL) |
| cap[h->index] = |
| pool_alloc2(h->pool); |
| |
| if (cap[h->index] == NULL) { |
| Alert("HTTP capture : out of memory.\n"); |
| continue; |
| } |
| |
| len = eol - sov; |
| if (len > h->len) |
| len = h->len; |
| |
| memcpy(cap[h->index], sov, len); |
| cap[h->index][len]=0; |
| } |
| } |
| sol = eol + idx->v[cur_idx].cr + 1; |
| cur_idx = idx->v[cur_idx].next; |
| } |
| } |
| |
| |
| /* either we find an LF at <ptr> or we jump to <bad>. |
| */ |
| #define EXPECT_LF_HERE(ptr, bad) do { if (unlikely(*(ptr) != '\n')) goto bad; } while (0) |
| |
| /* plays with variables <ptr>, <end> and <state>. Jumps to <good> if OK, |
| * otherwise to <http_msg_ood> with <state> set to <st>. |
| */ |
| #define EAT_AND_JUMP_OR_RETURN(good, st) do { \ |
| ptr++; \ |
| if (likely(ptr < end)) \ |
| goto good; \ |
| else { \ |
| state = (st); \ |
| goto http_msg_ood; \ |
| } \ |
| } while (0) |
| |
| |
| /* |
| * This function parses a status line between <ptr> and <end>, starting with |
| * parser state <state>. Only states HTTP_MSG_RPVER, HTTP_MSG_RPVER_SP, |
| * HTTP_MSG_RPCODE, HTTP_MSG_RPCODE_SP and HTTP_MSG_RPREASON are handled. Others |
| * will give undefined results. |
| * Note that it is upon the caller's responsibility to ensure that ptr < end, |
| * and that msg->sol points to the beginning of the response. |
| * If a complete line is found (which implies that at least one CR or LF is |
| * found before <end>, the updated <ptr> is returned, otherwise NULL is |
| * returned indicating an incomplete line (which does not mean that parts have |
| * not been updated). In the incomplete case, if <ret_ptr> or <ret_state> are |
| * non-NULL, they are fed with the new <ptr> and <state> values to be passed |
| * upon next call. |
| * |
| * This function was intentionally designed to be called from |
| * http_msg_analyzer() with the lowest overhead. It should integrate perfectly |
| * within its state machine and use the same macros, hence the need for same |
| * labels and variable names. Note that msg->sol is left unchanged. |
| */ |
| const char *http_parse_stsline(struct http_msg *msg, const char *msg_buf, |
| unsigned int state, const char *ptr, const char *end, |
| char **ret_ptr, unsigned int *ret_state) |
| { |
| switch (state) { |
| http_msg_rpver: |
| case HTTP_MSG_RPVER: |
| if (likely(HTTP_IS_VER_TOKEN(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpver, HTTP_MSG_RPVER); |
| |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| msg->sl.st.v_l = (ptr - msg_buf) - msg->som; |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpver_sp, HTTP_MSG_RPVER_SP); |
| } |
| state = HTTP_MSG_ERROR; |
| break; |
| |
| http_msg_rpver_sp: |
| case HTTP_MSG_RPVER_SP: |
| if (likely(!HTTP_IS_LWS(*ptr))) { |
| msg->sl.st.c = ptr - msg_buf; |
| goto http_msg_rpcode; |
| } |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpver_sp, HTTP_MSG_RPVER_SP); |
| /* so it's a CR/LF, this is invalid */ |
| state = HTTP_MSG_ERROR; |
| break; |
| |
| http_msg_rpcode: |
| case HTTP_MSG_RPCODE: |
| if (likely(!HTTP_IS_LWS(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpcode, HTTP_MSG_RPCODE); |
| |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| msg->sl.st.c_l = (ptr - msg_buf) - msg->sl.st.c; |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpcode_sp, HTTP_MSG_RPCODE_SP); |
| } |
| |
| /* so it's a CR/LF, so there is no reason phrase */ |
| msg->sl.st.c_l = (ptr - msg_buf) - msg->sl.st.c; |
| http_msg_rsp_reason: |
| /* FIXME: should we support HTTP responses without any reason phrase ? */ |
| msg->sl.st.r = ptr - msg_buf; |
| msg->sl.st.r_l = 0; |
| goto http_msg_rpline_eol; |
| |
| http_msg_rpcode_sp: |
| case HTTP_MSG_RPCODE_SP: |
| if (likely(!HTTP_IS_LWS(*ptr))) { |
| msg->sl.st.r = ptr - msg_buf; |
| goto http_msg_rpreason; |
| } |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpcode_sp, HTTP_MSG_RPCODE_SP); |
| /* so it's a CR/LF, so there is no reason phrase */ |
| goto http_msg_rsp_reason; |
| |
| http_msg_rpreason: |
| case HTTP_MSG_RPREASON: |
| if (likely(!HTTP_IS_CRLF(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpreason, HTTP_MSG_RPREASON); |
| msg->sl.st.r_l = (ptr - msg_buf) - msg->sl.st.r; |
| http_msg_rpline_eol: |
| /* We have seen the end of line. Note that we do not |
| * necessarily have the \n yet, but at least we know that we |
| * have EITHER \r OR \n, otherwise the response would not be |
| * complete. We can then record the response length and return |
| * to the caller which will be able to register it. |
| */ |
| msg->sl.st.l = ptr - msg->sol; |
| return ptr; |
| |
| #ifdef DEBUG_FULL |
| default: |
| fprintf(stderr, "FIXME !!!! impossible state at %s:%d = %d\n", __FILE__, __LINE__, state); |
| exit(1); |
| #endif |
| } |
| |
| http_msg_ood: |
| /* out of valid data */ |
| if (ret_state) |
| *ret_state = state; |
| if (ret_ptr) |
| *ret_ptr = (char *)ptr; |
| return NULL; |
| } |
| |
| |
| /* |
| * This function parses a request line between <ptr> and <end>, starting with |
| * parser state <state>. Only states HTTP_MSG_RQMETH, HTTP_MSG_RQMETH_SP, |
| * HTTP_MSG_RQURI, HTTP_MSG_RQURI_SP and HTTP_MSG_RQVER are handled. Others |
| * will give undefined results. |
| * Note that it is upon the caller's responsibility to ensure that ptr < end, |
| * and that msg->sol points to the beginning of the request. |
| * If a complete line is found (which implies that at least one CR or LF is |
| * found before <end>, the updated <ptr> is returned, otherwise NULL is |
| * returned indicating an incomplete line (which does not mean that parts have |
| * not been updated). In the incomplete case, if <ret_ptr> or <ret_state> are |
| * non-NULL, they are fed with the new <ptr> and <state> values to be passed |
| * upon next call. |
| * |
| * This function was intentionally designed to be called from |
| * http_msg_analyzer() with the lowest overhead. It should integrate perfectly |
| * within its state machine and use the same macros, hence the need for same |
| * labels and variable names. Note that msg->sol is left unchanged. |
| */ |
| const char *http_parse_reqline(struct http_msg *msg, const char *msg_buf, |
| unsigned int state, const char *ptr, const char *end, |
| char **ret_ptr, unsigned int *ret_state) |
| { |
| switch (state) { |
| http_msg_rqmeth: |
| case HTTP_MSG_RQMETH: |
| if (likely(HTTP_IS_TOKEN(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqmeth, HTTP_MSG_RQMETH); |
| |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| msg->sl.rq.m_l = (ptr - msg_buf) - msg->som; |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqmeth_sp, HTTP_MSG_RQMETH_SP); |
| } |
| |
| if (likely(HTTP_IS_CRLF(*ptr))) { |
| /* HTTP 0.9 request */ |
| msg->sl.rq.m_l = (ptr - msg_buf) - msg->som; |
| http_msg_req09_uri: |
| msg->sl.rq.u = ptr - msg_buf; |
| http_msg_req09_uri_e: |
| msg->sl.rq.u_l = (ptr - msg_buf) - msg->sl.rq.u; |
| http_msg_req09_ver: |
| msg->sl.rq.v = ptr - msg_buf; |
| msg->sl.rq.v_l = 0; |
| goto http_msg_rqline_eol; |
| } |
| state = HTTP_MSG_ERROR; |
| break; |
| |
| http_msg_rqmeth_sp: |
| case HTTP_MSG_RQMETH_SP: |
| if (likely(!HTTP_IS_LWS(*ptr))) { |
| msg->sl.rq.u = ptr - msg_buf; |
| goto http_msg_rquri; |
| } |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqmeth_sp, HTTP_MSG_RQMETH_SP); |
| /* so it's a CR/LF, meaning an HTTP 0.9 request */ |
| goto http_msg_req09_uri; |
| |
| http_msg_rquri: |
| case HTTP_MSG_RQURI: |
| if (likely(!HTTP_IS_LWS(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rquri, HTTP_MSG_RQURI); |
| |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| msg->sl.rq.u_l = (ptr - msg_buf) - msg->sl.rq.u; |
| EAT_AND_JUMP_OR_RETURN(http_msg_rquri_sp, HTTP_MSG_RQURI_SP); |
| } |
| |
| /* so it's a CR/LF, meaning an HTTP 0.9 request */ |
| goto http_msg_req09_uri_e; |
| |
| http_msg_rquri_sp: |
| case HTTP_MSG_RQURI_SP: |
| if (likely(!HTTP_IS_LWS(*ptr))) { |
| msg->sl.rq.v = ptr - msg_buf; |
| goto http_msg_rqver; |
| } |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rquri_sp, HTTP_MSG_RQURI_SP); |
| /* so it's a CR/LF, meaning an HTTP 0.9 request */ |
| goto http_msg_req09_ver; |
| |
| http_msg_rqver: |
| case HTTP_MSG_RQVER: |
| if (likely(HTTP_IS_VER_TOKEN(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqver, HTTP_MSG_RQVER); |
| |
| if (likely(HTTP_IS_CRLF(*ptr))) { |
| msg->sl.rq.v_l = (ptr - msg_buf) - msg->sl.rq.v; |
| http_msg_rqline_eol: |
| /* We have seen the end of line. Note that we do not |
| * necessarily have the \n yet, but at least we know that we |
| * have EITHER \r OR \n, otherwise the request would not be |
| * complete. We can then record the request length and return |
| * to the caller which will be able to register it. |
| */ |
| msg->sl.rq.l = ptr - msg->sol; |
| return ptr; |
| } |
| |
| /* neither an HTTP_VER token nor a CRLF */ |
| state = HTTP_MSG_ERROR; |
| break; |
| |
| #ifdef DEBUG_FULL |
| default: |
| fprintf(stderr, "FIXME !!!! impossible state at %s:%d = %d\n", __FILE__, __LINE__, state); |
| exit(1); |
| #endif |
| } |
| |
| http_msg_ood: |
| /* out of valid data */ |
| if (ret_state) |
| *ret_state = state; |
| if (ret_ptr) |
| *ret_ptr = (char *)ptr; |
| return NULL; |
| } |
| |
| |
| /* |
| * This function parses an HTTP message, either a request or a response, |
| * depending on the initial msg->msg_state. It can be preempted everywhere |
| * when data are missing and recalled at the exact same location with no |
| * information loss. The header index is re-initialized when switching from |
| * MSG_R[PQ]BEFORE to MSG_RPVER|MSG_RQMETH. It modifies msg->sol among other |
| * fields. |
| */ |
| void http_msg_analyzer(struct buffer *buf, struct http_msg *msg, struct hdr_idx *idx) |
| { |
| unsigned int state; /* updated only when leaving the FSM */ |
| register char *ptr, *end; /* request pointers, to avoid dereferences */ |
| |
| state = msg->msg_state; |
| ptr = buf->lr; |
| end = buf->r; |
| |
| if (unlikely(ptr >= end)) |
| goto http_msg_ood; |
| |
| switch (state) { |
| /* |
| * First, states that are specific to the response only. |
| * We check them first so that request and headers are |
| * closer to each other (accessed more often). |
| */ |
| http_msg_rpbefore: |
| case HTTP_MSG_RPBEFORE: |
| if (likely(HTTP_IS_TOKEN(*ptr))) { |
| if (likely(ptr == buf->data)) { |
| msg->sol = ptr; |
| msg->som = 0; |
| } else { |
| #if PARSE_PRESERVE_EMPTY_LINES |
| /* only skip empty leading lines, don't remove them */ |
| msg->sol = ptr; |
| msg->som = ptr - buf->data; |
| #else |
| /* Remove empty leading lines, as recommended by |
| * RFC2616. This takes a lot of time because we |
| * must move all the buffer backwards, but this |
| * is rarely needed. The method above will be |
| * cleaner when we'll be able to start sending |
| * the request from any place in the buffer. |
| */ |
| buf->lr = ptr; |
| buffer_replace2(buf, buf->data, buf->lr, NULL, 0); |
| msg->som = 0; |
| msg->sol = buf->data; |
| ptr = buf->data; |
| end = buf->r; |
| #endif |
| } |
| hdr_idx_init(idx); |
| state = HTTP_MSG_RPVER; |
| goto http_msg_rpver; |
| } |
| |
| if (unlikely(!HTTP_IS_CRLF(*ptr))) |
| goto http_msg_invalid; |
| |
| if (unlikely(*ptr == '\n')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpbefore, HTTP_MSG_RPBEFORE); |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpbefore_cr, HTTP_MSG_RPBEFORE_CR); |
| /* stop here */ |
| |
| http_msg_rpbefore_cr: |
| case HTTP_MSG_RPBEFORE_CR: |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpbefore, HTTP_MSG_RPBEFORE); |
| /* stop here */ |
| |
| http_msg_rpver: |
| case HTTP_MSG_RPVER: |
| case HTTP_MSG_RPVER_SP: |
| case HTTP_MSG_RPCODE: |
| case HTTP_MSG_RPCODE_SP: |
| case HTTP_MSG_RPREASON: |
| ptr = (char *)http_parse_stsline(msg, buf->data, state, ptr, end, |
| &buf->lr, &msg->msg_state); |
| if (unlikely(!ptr)) |
| return; |
| |
| /* we have a full response and we know that we have either a CR |
| * or an LF at <ptr>. |
| */ |
| //fprintf(stderr,"som=%d rq.l=%d *ptr=0x%02x\n", msg->som, msg->sl.st.l, *ptr); |
| hdr_idx_set_start(idx, msg->sl.st.l, *ptr == '\r'); |
| |
| msg->sol = ptr; |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rpline_end, HTTP_MSG_RPLINE_END); |
| goto http_msg_rpline_end; |
| |
| http_msg_rpline_end: |
| case HTTP_MSG_RPLINE_END: |
| /* msg->sol must point to the first of CR or LF. */ |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_first, HTTP_MSG_HDR_FIRST); |
| /* stop here */ |
| |
| /* |
| * Second, states that are specific to the request only |
| */ |
| http_msg_rqbefore: |
| case HTTP_MSG_RQBEFORE: |
| if (likely(HTTP_IS_TOKEN(*ptr))) { |
| if (likely(ptr == buf->data)) { |
| msg->sol = ptr; |
| msg->som = 0; |
| } else { |
| #if PARSE_PRESERVE_EMPTY_LINES |
| /* only skip empty leading lines, don't remove them */ |
| msg->sol = ptr; |
| msg->som = ptr - buf->data; |
| #else |
| /* Remove empty leading lines, as recommended by |
| * RFC2616. This takes a lot of time because we |
| * must move all the buffer backwards, but this |
| * is rarely needed. The method above will be |
| * cleaner when we'll be able to start sending |
| * the request from any place in the buffer. |
| */ |
| buf->lr = ptr; |
| buffer_replace2(buf, buf->data, buf->lr, NULL, 0); |
| msg->som = 0; |
| msg->sol = buf->data; |
| ptr = buf->data; |
| end = buf->r; |
| #endif |
| } |
| /* we will need this when keep-alive will be supported |
| hdr_idx_init(idx); |
| */ |
| state = HTTP_MSG_RQMETH; |
| goto http_msg_rqmeth; |
| } |
| |
| if (unlikely(!HTTP_IS_CRLF(*ptr))) |
| goto http_msg_invalid; |
| |
| if (unlikely(*ptr == '\n')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqbefore, HTTP_MSG_RQBEFORE); |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqbefore_cr, HTTP_MSG_RQBEFORE_CR); |
| /* stop here */ |
| |
| http_msg_rqbefore_cr: |
| case HTTP_MSG_RQBEFORE_CR: |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqbefore, HTTP_MSG_RQBEFORE); |
| /* stop here */ |
| |
| http_msg_rqmeth: |
| case HTTP_MSG_RQMETH: |
| case HTTP_MSG_RQMETH_SP: |
| case HTTP_MSG_RQURI: |
| case HTTP_MSG_RQURI_SP: |
| case HTTP_MSG_RQVER: |
| ptr = (char *)http_parse_reqline(msg, buf->data, state, ptr, end, |
| &buf->lr, &msg->msg_state); |
| if (unlikely(!ptr)) |
| return; |
| |
| /* we have a full request and we know that we have either a CR |
| * or an LF at <ptr>. |
| */ |
| //fprintf(stderr,"som=%d rq.l=%d *ptr=0x%02x\n", msg->som, msg->sl.rq.l, *ptr); |
| hdr_idx_set_start(idx, msg->sl.rq.l, *ptr == '\r'); |
| |
| msg->sol = ptr; |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_rqline_end, HTTP_MSG_RQLINE_END); |
| goto http_msg_rqline_end; |
| |
| http_msg_rqline_end: |
| case HTTP_MSG_RQLINE_END: |
| /* check for HTTP/0.9 request : no version information available. |
| * msg->sol must point to the first of CR or LF. |
| */ |
| if (unlikely(msg->sl.rq.v_l == 0)) |
| goto http_msg_last_lf; |
| |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_first, HTTP_MSG_HDR_FIRST); |
| /* stop here */ |
| |
| /* |
| * Common states below |
| */ |
| http_msg_hdr_first: |
| case HTTP_MSG_HDR_FIRST: |
| msg->sol = ptr; |
| if (likely(!HTTP_IS_CRLF(*ptr))) { |
| goto http_msg_hdr_name; |
| } |
| |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_last_lf, HTTP_MSG_LAST_LF); |
| goto http_msg_last_lf; |
| |
| http_msg_hdr_name: |
| case HTTP_MSG_HDR_NAME: |
| /* assumes msg->sol points to the first char */ |
| if (likely(HTTP_IS_TOKEN(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_name, HTTP_MSG_HDR_NAME); |
| |
| if (likely(*ptr == ':')) { |
| msg->col = ptr - buf->data; |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l1_sp, HTTP_MSG_HDR_L1_SP); |
| } |
| |
| if (likely(msg->err_pos < -1) || *ptr == '\n') |
| goto http_msg_invalid; |
| |
| if (msg->err_pos == -1) /* capture error pointer */ |
| msg->err_pos = ptr - buf->data; /* >= 0 now */ |
| |
| /* and we still accept this non-token character */ |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_name, HTTP_MSG_HDR_NAME); |
| |
| http_msg_hdr_l1_sp: |
| case HTTP_MSG_HDR_L1_SP: |
| /* assumes msg->sol points to the first char and msg->col to the colon */ |
| if (likely(HTTP_IS_SPHT(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l1_sp, HTTP_MSG_HDR_L1_SP); |
| |
| /* header value can be basically anything except CR/LF */ |
| msg->sov = ptr - buf->data; |
| |
| if (likely(!HTTP_IS_CRLF(*ptr))) { |
| goto http_msg_hdr_val; |
| } |
| |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l1_lf, HTTP_MSG_HDR_L1_LF); |
| goto http_msg_hdr_l1_lf; |
| |
| http_msg_hdr_l1_lf: |
| case HTTP_MSG_HDR_L1_LF: |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l1_lws, HTTP_MSG_HDR_L1_LWS); |
| |
| http_msg_hdr_l1_lws: |
| case HTTP_MSG_HDR_L1_LWS: |
| if (likely(HTTP_IS_SPHT(*ptr))) { |
| /* replace HT,CR,LF with spaces */ |
| for (; buf->data+msg->sov < ptr; msg->sov++) |
| buf->data[msg->sov] = ' '; |
| goto http_msg_hdr_l1_sp; |
| } |
| /* we had a header consisting only in spaces ! */ |
| msg->eol = buf->data + msg->sov; |
| goto http_msg_complete_header; |
| |
| http_msg_hdr_val: |
| case HTTP_MSG_HDR_VAL: |
| /* assumes msg->sol points to the first char, msg->col to the |
| * colon, and msg->sov points to the first character of the |
| * value. |
| */ |
| if (likely(!HTTP_IS_CRLF(*ptr))) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_val, HTTP_MSG_HDR_VAL); |
| |
| msg->eol = ptr; |
| /* Note: we could also copy eol into ->eoh so that we have the |
| * real header end in case it ends with lots of LWS, but is this |
| * really needed ? |
| */ |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l2_lf, HTTP_MSG_HDR_L2_LF); |
| goto http_msg_hdr_l2_lf; |
| |
| http_msg_hdr_l2_lf: |
| case HTTP_MSG_HDR_L2_LF: |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| EAT_AND_JUMP_OR_RETURN(http_msg_hdr_l2_lws, HTTP_MSG_HDR_L2_LWS); |
| |
| http_msg_hdr_l2_lws: |
| case HTTP_MSG_HDR_L2_LWS: |
| if (unlikely(HTTP_IS_SPHT(*ptr))) { |
| /* LWS: replace HT,CR,LF with spaces */ |
| for (; msg->eol < ptr; msg->eol++) |
| *msg->eol = ' '; |
| goto http_msg_hdr_val; |
| } |
| http_msg_complete_header: |
| /* |
| * It was a new header, so the last one is finished. |
| * Assumes msg->sol points to the first char, msg->col to the |
| * colon, msg->sov points to the first character of the value |
| * and msg->eol to the first CR or LF so we know how the line |
| * ends. We insert last header into the index. |
| */ |
| /* |
| fprintf(stderr,"registering %-2d bytes : ", msg->eol - msg->sol); |
| write(2, msg->sol, msg->eol-msg->sol); |
| fprintf(stderr,"\n"); |
| */ |
| |
| if (unlikely(hdr_idx_add(msg->eol - msg->sol, *msg->eol == '\r', |
| idx, idx->tail) < 0)) |
| goto http_msg_invalid; |
| |
| msg->sol = ptr; |
| if (likely(!HTTP_IS_CRLF(*ptr))) { |
| goto http_msg_hdr_name; |
| } |
| |
| if (likely(*ptr == '\r')) |
| EAT_AND_JUMP_OR_RETURN(http_msg_last_lf, HTTP_MSG_LAST_LF); |
| goto http_msg_last_lf; |
| |
| http_msg_last_lf: |
| case HTTP_MSG_LAST_LF: |
| /* Assumes msg->sol points to the first of either CR or LF */ |
| EXPECT_LF_HERE(ptr, http_msg_invalid); |
| ptr++; |
| buf->lr = ptr; |
| msg->eoh = msg->sol - buf->data; |
| msg->msg_state = HTTP_MSG_BODY; |
| return; |
| #ifdef DEBUG_FULL |
| default: |
| fprintf(stderr, "FIXME !!!! impossible state at %s:%d = %d\n", __FILE__, __LINE__, state); |
| exit(1); |
| #endif |
| } |
| http_msg_ood: |
| /* out of data */ |
| msg->msg_state = state; |
| buf->lr = ptr; |
| return; |
| |
| http_msg_invalid: |
| /* invalid message */ |
| msg->msg_state = HTTP_MSG_ERROR; |
| buf->lr = ptr; |
| return; |
| } |
| |
| /* convert an HTTP/0.9 request into an HTTP/1.0 request. Returns 1 if the |
| * conversion succeeded, 0 in case of error. If the request was already 1.X, |
| * nothing is done and 1 is returned. |
| */ |
| static int http_upgrade_v09_to_v10(struct buffer *req, struct http_msg *msg, struct http_txn *txn) |
| { |
| int delta; |
| char *cur_end; |
| |
| if (msg->sl.rq.v_l != 0) |
| return 1; |
| |
| msg->sol = req->data + msg->som; |
| cur_end = msg->sol + msg->sl.rq.l; |
| delta = 0; |
| |
| if (msg->sl.rq.u_l == 0) { |
| /* if no URI was set, add "/" */ |
| delta = buffer_replace2(req, cur_end, cur_end, " /", 2); |
| cur_end += delta; |
| msg->eoh += delta; |
| } |
| /* add HTTP version */ |
| delta = buffer_replace2(req, cur_end, cur_end, " HTTP/1.0\r\n", 11); |
| msg->eoh += delta; |
| cur_end += delta; |
| cur_end = (char *)http_parse_reqline(msg, req->data, |
| HTTP_MSG_RQMETH, |
| msg->sol, cur_end + 1, |
| NULL, NULL); |
| if (unlikely(!cur_end)) |
| return 0; |
| |
| /* we have a full HTTP/1.0 request now and we know that |
| * we have either a CR or an LF at <ptr>. |
| */ |
| hdr_idx_set_start(&txn->hdr_idx, msg->sl.rq.l, *cur_end == '\r'); |
| return 1; |
| } |
| |
| /* This stream analyser waits for a complete HTTP request. It returns 1 if the |
| * processing can continue on next analysers, or zero if it either needs more |
| * data or wants to immediately abort the request (eg: timeout, error, ...). It |
| * is tied to AN_REQ_WAIT_HTTP and may may remove itself from s->req->analysers |
| * when it has nothing left to do, and may remove any analyser when it wants to |
| * abort. |
| */ |
| int http_wait_for_request(struct session *s, struct buffer *req, int an_bit) |
| { |
| /* |
| * We will parse the partial (or complete) lines. |
| * We will check the request syntax, and also join multi-line |
| * headers. An index of all the lines will be elaborated while |
| * parsing. |
| * |
| * For the parsing, we use a 28 states FSM. |
| * |
| * Here is the information we currently have : |
| * req->data + msg->som = beginning of request |
| * req->data + req->eoh = end of processed headers / start of current one |
| * req->data + req->eol = end of current header or line (LF or CRLF) |
| * req->lr = first non-visited byte |
| * req->r = end of data |
| * |
| * At end of parsing, we may perform a capture of the error (if any), and |
| * we will set a few fields (msg->sol, txn->meth, sn->flags/SN_REDIRECTABLE). |
| * We also check for monitor-uri, logging, HTTP/0.9 to 1.0 conversion, and |
| * finally headers capture. |
| */ |
| |
| int cur_idx; |
| struct http_txn *txn = &s->txn; |
| struct http_msg *msg = &txn->req; |
| |
| DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bl=%d analysers=%02x\n", |
| now_ms, __FUNCTION__, |
| s, |
| req, |
| req->rex, req->wex, |
| req->flags, |
| req->l, |
| req->analysers); |
| |
| if (likely(req->lr < req->r)) |
| http_msg_analyzer(req, msg, &txn->hdr_idx); |
| |
| /* 1: we might have to print this header in debug mode */ |
| if (unlikely((global.mode & MODE_DEBUG) && |
| (!(global.mode & MODE_QUIET) || (global.mode & MODE_VERBOSE)) && |
| (msg->msg_state == HTTP_MSG_BODY || msg->msg_state == HTTP_MSG_ERROR))) { |
| char *eol, *sol; |
| |
| sol = req->data + msg->som; |
| eol = sol + msg->sl.rq.l; |
| debug_hdr("clireq", s, sol, eol); |
| |
| sol += hdr_idx_first_pos(&txn->hdr_idx); |
| cur_idx = hdr_idx_first_idx(&txn->hdr_idx); |
| |
| while (cur_idx) { |
| eol = sol + txn->hdr_idx.v[cur_idx].len; |
| debug_hdr("clihdr", s, sol, eol); |
| sol = eol + txn->hdr_idx.v[cur_idx].cr + 1; |
| cur_idx = txn->hdr_idx.v[cur_idx].next; |
| } |
| } |
| |
| |
| /* |
| * Now we quickly check if we have found a full valid request. |
| * If not so, we check the FD and buffer states before leaving. |
| * A full request is indicated by the fact that we have seen |
| * the double LF/CRLF, so the state is HTTP_MSG_BODY. Invalid |
| * requests are checked first. |
| * |
| */ |
| |
| if (unlikely(msg->msg_state != HTTP_MSG_BODY)) { |
| /* |
| * First, let's catch bad requests. |
| */ |
| if (unlikely(msg->msg_state == HTTP_MSG_ERROR)) |
| goto return_bad_req; |
| |
| /* 1: Since we are in header mode, if there's no space |
| * left for headers, we won't be able to free more |
| * later, so the session will never terminate. We |
| * must terminate it now. |
| */ |
| if (unlikely(req->flags & BF_FULL)) { |
| /* FIXME: check if URI is set and return Status |
| * 414 Request URI too long instead. |
| */ |
| goto return_bad_req; |
| } |
| |
| /* 2: have we encountered a read error ? */ |
| else if (req->flags & BF_READ_ERROR) { |
| /* we cannot return any message on error */ |
| if (msg->err_pos >= 0) |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| msg->msg_state = HTTP_MSG_ERROR; |
| req->analysers = 0; |
| s->fe->failed_req++; |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_CLICL; |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| return 0; |
| } |
| |
| /* 3: has the read timeout expired ? */ |
| else if (req->flags & BF_READ_TIMEOUT || tick_is_expired(req->analyse_exp, now_ms)) { |
| /* read timeout : give up with an error message. */ |
| if (msg->err_pos >= 0) |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| txn->status = 408; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_408)); |
| msg->msg_state = HTTP_MSG_ERROR; |
| req->analysers = 0; |
| s->fe->failed_req++; |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_CLITO; |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| return 0; |
| } |
| |
| /* 4: have we encountered a close ? */ |
| else if (req->flags & BF_SHUTR) { |
| if (msg->err_pos >= 0) |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| txn->status = 400; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_400)); |
| msg->msg_state = HTTP_MSG_ERROR; |
| req->analysers = 0; |
| s->fe->failed_req++; |
| |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_CLICL; |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| return 0; |
| } |
| |
| buffer_write_dis(req); |
| req->flags |= BF_READ_DONTWAIT; /* try to get back here ASAP */ |
| |
| /* just set the request timeout once at the beginning of the request */ |
| if (!tick_isset(req->analyse_exp)) |
| req->analyse_exp = tick_add_ifset(now_ms, s->be->timeout.httpreq); |
| |
| /* we're not ready yet */ |
| return 0; |
| } |
| |
| /* OK now we have a complete HTTP request with indexed headers. Let's |
| * complete the request parsing by setting a few fields we will need |
| * later. |
| */ |
| |
| /* Maybe we found in invalid header name while we were configured not |
| * to block on that, so we have to capture it now. |
| */ |
| if (unlikely(msg->err_pos >= 0)) |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| |
| /* ensure we keep this pointer to the beginning of the message */ |
| msg->sol = req->data + msg->som; |
| |
| /* |
| * 1: identify the method |
| */ |
| txn->meth = find_http_meth(&req->data[msg->som], msg->sl.rq.m_l); |
| |
| /* we can make use of server redirect on GET and HEAD */ |
| if (txn->meth == HTTP_METH_GET || txn->meth == HTTP_METH_HEAD) |
| s->flags |= SN_REDIRECTABLE; |
| |
| /* |
| * 2: check if the URI matches the monitor_uri. |
| * We have to do this for every request which gets in, because |
| * the monitor-uri is defined by the frontend. |
| */ |
| if (unlikely((s->fe->monitor_uri_len != 0) && |
| (s->fe->monitor_uri_len == msg->sl.rq.u_l) && |
| !memcmp(&req->data[msg->sl.rq.u], |
| s->fe->monitor_uri, |
| s->fe->monitor_uri_len))) { |
| /* |
| * We have found the monitor URI |
| */ |
| struct acl_cond *cond; |
| |
| s->flags |= SN_MONITOR; |
| |
| /* Check if we want to fail this monitor request or not */ |
| list_for_each_entry(cond, &s->fe->mon_fail_cond, list) { |
| int ret = acl_exec_cond(cond, s->fe, s, txn, ACL_DIR_REQ); |
| |
| ret = acl_pass(ret); |
| if (cond->pol == ACL_COND_UNLESS) |
| ret = !ret; |
| |
| if (ret) { |
| /* we fail this request, let's return 503 service unavail */ |
| txn->status = 503; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_503)); |
| goto return_prx_cond; |
| } |
| } |
| |
| /* nothing to fail, let's reply normaly */ |
| txn->status = 200; |
| stream_int_retnclose(req->prod, &http_200_chunk); |
| goto return_prx_cond; |
| } |
| |
| /* |
| * 3: Maybe we have to copy the original REQURI for the logs ? |
| * Note: we cannot log anymore if the request has been |
| * classified as invalid. |
| */ |
| if (unlikely(s->logs.logwait & LW_REQ)) { |
| /* we have a complete HTTP request that we must log */ |
| if ((txn->uri = pool_alloc2(pool2_requri)) != NULL) { |
| int urilen = msg->sl.rq.l; |
| |
| if (urilen >= REQURI_LEN) |
| urilen = REQURI_LEN - 1; |
| memcpy(txn->uri, &req->data[msg->som], urilen); |
| txn->uri[urilen] = 0; |
| |
| if (!(s->logs.logwait &= ~LW_REQ)) |
| s->do_log(s); |
| } else { |
| Alert("HTTP logging : out of memory.\n"); |
| } |
| } |
| |
| /* 4. We may have to convert HTTP/0.9 requests to HTTP/1.0 */ |
| if (unlikely(msg->sl.rq.v_l == 0) && !http_upgrade_v09_to_v10(req, msg, txn)) |
| goto return_bad_req; |
| |
| /* 5: we may need to capture headers */ |
| if (unlikely((s->logs.logwait & LW_REQHDR) && s->fe->req_cap)) |
| capture_headers(req->data + msg->som, &txn->hdr_idx, |
| txn->req.cap, s->fe->req_cap); |
| |
| /* end of job, return OK */ |
| req->analysers &= ~an_bit; |
| req->analyse_exp = TICK_ETERNITY; |
| return 1; |
| |
| return_bad_req: |
| /* We centralize bad requests processing here */ |
| if (unlikely(msg->msg_state == HTTP_MSG_ERROR) || msg->err_pos >= 0) { |
| /* we detected a parsing error. We want to archive this request |
| * in the dedicated proxy area for later troubleshooting. |
| */ |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| } |
| |
| txn->req.msg_state = HTTP_MSG_ERROR; |
| txn->status = 400; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_400)); |
| s->fe->failed_req++; |
| |
| return_prx_cond: |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_PRXCOND; |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| |
| req->analysers = 0; |
| req->analyse_exp = TICK_ETERNITY; |
| return 0; |
| } |
| |
| /* This stream analyser runs all HTTP request processing which is common to |
| * frontends and backends, which means blocking ACLs, filters, connection-close, |
| * reqadd, stats and redirects. This is performed for the designated proxy. |
| * It returns 1 if the processing can continue on next analysers, or zero if it |
| * either needs more data or wants to immediately abort the request (eg: deny, |
| * error, ...). |
| */ |
| int http_process_req_common(struct session *s, struct buffer *req, int an_bit, struct proxy *px) |
| { |
| struct http_txn *txn = &s->txn; |
| struct http_msg *msg = &txn->req; |
| struct acl_cond *cond; |
| struct redirect_rule *rule; |
| int cur_idx; |
| |
| if (unlikely(msg->msg_state != HTTP_MSG_BODY)) { |
| /* we need more data */ |
| buffer_write_dis(req); |
| return 0; |
| } |
| |
| req->analysers &= ~an_bit; |
| req->analyse_exp = TICK_ETERNITY; |
| |
| DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bl=%d analysers=%02x\n", |
| now_ms, __FUNCTION__, |
| s, |
| req, |
| req->rex, req->wex, |
| req->flags, |
| req->l, |
| req->analysers); |
| |
| /* first check whether we have some ACLs set to block this request */ |
| list_for_each_entry(cond, &px->block_cond, list) { |
| int ret = acl_exec_cond(cond, px, s, txn, ACL_DIR_REQ); |
| |
| ret = acl_pass(ret); |
| if (cond->pol == ACL_COND_UNLESS) |
| ret = !ret; |
| |
| if (ret) { |
| txn->status = 403; |
| /* let's log the request time */ |
| s->logs.tv_request = now; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_403)); |
| goto return_prx_cond; |
| } |
| } |
| |
| /* try headers filters */ |
| if (px->req_exp != NULL) { |
| if (apply_filters_to_request(s, req, px->req_exp) < 0) |
| goto return_bad_req; |
| |
| /* has the request been denied ? */ |
| if (txn->flags & TX_CLDENY) { |
| /* no need to go further */ |
| txn->status = 403; |
| /* let's log the request time */ |
| s->logs.tv_request = now; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_403)); |
| goto return_prx_cond; |
| } |
| } |
| |
| /* We might have to check for "Connection:" */ |
| if (((s->fe->options | s->be->options) & (PR_O_HTTP_CLOSE|PR_O_FORCE_CLO)) && |
| !(s->flags & SN_CONN_CLOSED)) { |
| char *cur_ptr, *cur_end, *cur_next; |
| int old_idx, delta, val; |
| struct hdr_idx_elem *cur_hdr; |
| |
| cur_next = req->data + txn->req.som + hdr_idx_first_pos(&txn->hdr_idx); |
| old_idx = 0; |
| |
| while ((cur_idx = txn->hdr_idx.v[old_idx].next)) { |
| cur_hdr = &txn->hdr_idx.v[cur_idx]; |
| cur_ptr = cur_next; |
| cur_end = cur_ptr + cur_hdr->len; |
| cur_next = cur_end + cur_hdr->cr + 1; |
| |
| val = http_header_match2(cur_ptr, cur_end, "Connection", 10); |
| if (val) { |
| /* 3 possibilities : |
| * - we have already set Connection: close, |
| * so we remove this line. |
| * - we have not yet set Connection: close, |
| * but this line indicates close. We leave |
| * it untouched and set the flag. |
| * - we have not yet set Connection: close, |
| * and this line indicates non-close. We |
| * replace it. |
| */ |
| if (s->flags & SN_CONN_CLOSED) { |
| delta = buffer_replace2(req, cur_ptr, cur_next, NULL, 0); |
| txn->req.eoh += delta; |
| cur_next += delta; |
| txn->hdr_idx.v[old_idx].next = cur_hdr->next; |
| txn->hdr_idx.used--; |
| cur_hdr->len = 0; |
| } else { |
| if (strncasecmp(cur_ptr + val, "close", 5) != 0) { |
| delta = buffer_replace2(req, cur_ptr + val, cur_end, |
| "close", 5); |
| cur_next += delta; |
| cur_hdr->len += delta; |
| txn->req.eoh += delta; |
| } |
| s->flags |= SN_CONN_CLOSED; |
| } |
| } |
| old_idx = cur_idx; |
| } |
| } |
| /* add request headers from the rule sets in the same order */ |
| for (cur_idx = 0; cur_idx < px->nb_reqadd; cur_idx++) { |
| if (unlikely(http_header_add_tail(req, |
| &txn->req, |
| &txn->hdr_idx, |
| px->req_add[cur_idx])) < 0) |
| goto return_bad_req; |
| } |
| |
| /* check if stats URI was requested, and if an auth is needed */ |
| if (px->uri_auth != NULL && |
| (txn->meth == HTTP_METH_GET || txn->meth == HTTP_METH_HEAD)) { |
| /* we have to check the URI and auth for this request. |
| * FIXME!!! that one is rather dangerous, we want to |
| * make it follow standard rules (eg: clear req->analysers). |
| */ |
| if (stats_check_uri_auth(s, px)) { |
| req->analysers = 0; |
| return 0; |
| } |
| } |
| |
| /* check whether we have some ACLs set to redirect this request */ |
| list_for_each_entry(rule, &px->redirect_rules, list) { |
| int ret = acl_exec_cond(rule->cond, px, s, txn, ACL_DIR_REQ); |
| |
| ret = acl_pass(ret); |
| if (rule->cond->pol == ACL_COND_UNLESS) |
| ret = !ret; |
| |
| if (ret) { |
| struct chunk rdr = { trash, 0 }; |
| const char *msg_fmt; |
| |
| /* build redirect message */ |
| switch(rule->code) { |
| case 303: |
| rdr.len = strlen(HTTP_303); |
| msg_fmt = HTTP_303; |
| break; |
| case 301: |
| rdr.len = strlen(HTTP_301); |
| msg_fmt = HTTP_301; |
| break; |
| case 302: |
| default: |
| rdr.len = strlen(HTTP_302); |
| msg_fmt = HTTP_302; |
| break; |
| } |
| |
| if (unlikely(rdr.len > sizeof(trash))) |
| goto return_bad_req; |
| memcpy(rdr.str, msg_fmt, rdr.len); |
| |
| switch(rule->type) { |
| case REDIRECT_TYPE_PREFIX: { |
| const char *path; |
| int pathlen; |
| |
| path = http_get_path(txn); |
| /* build message using path */ |
| if (path) { |
| pathlen = txn->req.sl.rq.u_l + (txn->req.sol+txn->req.sl.rq.u) - path; |
| if (rule->flags & REDIRECT_FLAG_DROP_QS) { |
| int qs = 0; |
| while (qs < pathlen) { |
| if (path[qs] == '?') { |
| pathlen = qs; |
| break; |
| } |
| qs++; |
| } |
| } |
| } else { |
| path = "/"; |
| pathlen = 1; |
| } |
| |
| if (rdr.len + rule->rdr_len + pathlen > sizeof(trash) - 4) |
| goto return_bad_req; |
| |
| /* add prefix. Note that if prefix == "/", we don't want to |
| * add anything, otherwise it makes it hard for the user to |
| * configure a self-redirection. |
| */ |
| if (rule->rdr_len != 1 || *rule->rdr_str != '/') { |
| memcpy(rdr.str + rdr.len, rule->rdr_str, rule->rdr_len); |
| rdr.len += rule->rdr_len; |
| } |
| |
| /* add path */ |
| memcpy(rdr.str + rdr.len, path, pathlen); |
| rdr.len += pathlen; |
| break; |
| } |
| case REDIRECT_TYPE_LOCATION: |
| default: |
| if (rdr.len + rule->rdr_len > sizeof(trash) - 4) |
| goto return_bad_req; |
| |
| /* add location */ |
| memcpy(rdr.str + rdr.len, rule->rdr_str, rule->rdr_len); |
| rdr.len += rule->rdr_len; |
| break; |
| } |
| |
| if (rule->cookie_len) { |
| memcpy(rdr.str + rdr.len, "\r\nSet-Cookie: ", 14); |
| rdr.len += 14; |
| memcpy(rdr.str + rdr.len, rule->cookie_str, rule->cookie_len); |
| rdr.len += rule->cookie_len; |
| memcpy(rdr.str + rdr.len, "\r\n", 2); |
| rdr.len += 2; |
| } |
| |
| /* add end of headers */ |
| memcpy(rdr.str + rdr.len, "\r\n\r\n", 4); |
| rdr.len += 4; |
| |
| txn->status = rule->code; |
| /* let's log the request time */ |
| s->logs.tv_request = now; |
| stream_int_retnclose(req->prod, &rdr); |
| goto return_prx_cond; |
| } |
| } |
| |
| /* that's OK for us now, let's move on to next analysers */ |
| return 1; |
| |
| return_bad_req: |
| /* We centralize bad requests processing here */ |
| if (unlikely(msg->msg_state == HTTP_MSG_ERROR) || msg->err_pos >= 0) { |
| /* we detected a parsing error. We want to archive this request |
| * in the dedicated proxy area for later troubleshooting. |
| */ |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| } |
| |
| txn->req.msg_state = HTTP_MSG_ERROR; |
| txn->status = 400; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_400)); |
| s->fe->failed_req++; |
| |
| return_prx_cond: |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_PRXCOND; |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| |
| req->analysers = 0; |
| req->analyse_exp = TICK_ETERNITY; |
| return 0; |
| } |
| |
| /* This function performs all the processing enabled for the current request. |
| * It returns 1 if the processing can continue on next analysers, or zero if it |
| * needs more data, encounters an error, or wants to immediately abort the |
| * request. It relies on buffers flags, and updates s->req->analysers. |
| */ |
| int http_process_request(struct session *s, struct buffer *req, int an_bit) |
| { |
| struct http_txn *txn = &s->txn; |
| struct http_msg *msg = &txn->req; |
| |
| if (unlikely(msg->msg_state != HTTP_MSG_BODY)) { |
| /* we need more data */ |
| buffer_write_dis(req); |
| return 0; |
| } |
| |
| req->analysers &= ~an_bit; |
| req->analyse_exp = TICK_ETERNITY; |
| |
| DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bl=%d analysers=%02x\n", |
| now_ms, __FUNCTION__, |
| s, |
| req, |
| req->rex, req->wex, |
| req->flags, |
| req->l, |
| req->analysers); |
| |
| /* |
| * Right now, we know that we have processed the entire headers |
| * and that unwanted requests have been filtered out. We can do |
| * whatever we want with the remaining request. Also, now we |
| * may have separate values for ->fe, ->be. |
| */ |
| |
| /* |
| * If HTTP PROXY is set we simply get remote server address |
| * parsing incoming request. |
| */ |
| if ((s->be->options & PR_O_HTTP_PROXY) && !(s->flags & SN_ADDR_SET)) { |
| url2sa(req->data + msg->sl.rq.u, msg->sl.rq.u_l, &s->srv_addr); |
| } |
| |
| /* |
| * 7: the appsession cookie was looked up very early in 1.2, |
| * so let's do the same now. |
| */ |
| |
| /* It needs to look into the URI */ |
| if (s->be->appsession_name) { |
| get_srv_from_appsession(s, &req->data[msg->som], msg->sl.rq.l); |
| } |
| |
| /* |
| * 8: Now we can work with the cookies. |
| * Note that doing so might move headers in the request, but |
| * the fields will stay coherent and the URI will not move. |
| * This should only be performed in the backend. |
| */ |
| if ((s->be->cookie_name || s->be->appsession_name || s->fe->capture_name) |
| && !(txn->flags & (TX_CLDENY|TX_CLTARPIT))) |
| manage_client_side_cookies(s, req); |
| |
| /* |
| * 9: add X-Forwarded-For if either the frontend or the backend |
| * asks for it. |
| */ |
| if ((s->fe->options | s->be->options) & PR_O_FWDFOR) { |
| if (s->cli_addr.ss_family == AF_INET) { |
| /* Add an X-Forwarded-For header unless the source IP is |
| * in the 'except' network range. |
| */ |
| if ((!s->fe->except_mask.s_addr || |
| (((struct sockaddr_in *)&s->cli_addr)->sin_addr.s_addr & s->fe->except_mask.s_addr) |
| != s->fe->except_net.s_addr) && |
| (!s->be->except_mask.s_addr || |
| (((struct sockaddr_in *)&s->cli_addr)->sin_addr.s_addr & s->be->except_mask.s_addr) |
| != s->be->except_net.s_addr)) { |
| int len; |
| unsigned char *pn; |
| pn = (unsigned char *)&((struct sockaddr_in *)&s->cli_addr)->sin_addr; |
| |
| /* Note: we rely on the backend to get the header name to be used for |
| * x-forwarded-for, because the header is really meant for the backends. |
| * However, if the backend did not specify any option, we have to rely |
| * on the frontend's header name. |
| */ |
| if (s->be->fwdfor_hdr_len) { |
| len = s->be->fwdfor_hdr_len; |
| memcpy(trash, s->be->fwdfor_hdr_name, len); |
| } else { |
| len = s->fe->fwdfor_hdr_len; |
| memcpy(trash, s->fe->fwdfor_hdr_name, len); |
| } |
| len += sprintf(trash + len, ": %d.%d.%d.%d", pn[0], pn[1], pn[2], pn[3]); |
| |
| if (unlikely(http_header_add_tail2(req, &txn->req, |
| &txn->hdr_idx, trash, len)) < 0) |
| goto return_bad_req; |
| } |
| } |
| else if (s->cli_addr.ss_family == AF_INET6) { |
| /* FIXME: for the sake of completeness, we should also support |
| * 'except' here, although it is mostly useless in this case. |
| */ |
| int len; |
| char pn[INET6_ADDRSTRLEN]; |
| inet_ntop(AF_INET6, |
| (const void *)&((struct sockaddr_in6 *)(&s->cli_addr))->sin6_addr, |
| pn, sizeof(pn)); |
| |
| /* Note: we rely on the backend to get the header name to be used for |
| * x-forwarded-for, because the header is really meant for the backends. |
| * However, if the backend did not specify any option, we have to rely |
| * on the frontend's header name. |
| */ |
| if (s->be->fwdfor_hdr_len) { |
| len = s->be->fwdfor_hdr_len; |
| memcpy(trash, s->be->fwdfor_hdr_name, len); |
| } else { |
| len = s->fe->fwdfor_hdr_len; |
| memcpy(trash, s->fe->fwdfor_hdr_name, len); |
| } |
| len += sprintf(trash + len, ": %s", pn); |
| |
| if (unlikely(http_header_add_tail2(req, &txn->req, |
| &txn->hdr_idx, trash, len)) < 0) |
| goto return_bad_req; |
| } |
| } |
| |
| /* |
| * 10: add X-Original-To if either the frontend or the backend |
| * asks for it. |
| */ |
| if ((s->fe->options | s->be->options) & PR_O_ORGTO) { |
| |
| /* FIXME: don't know if IPv6 can handle that case too. */ |
| if (s->cli_addr.ss_family == AF_INET) { |
| /* Add an X-Original-To header unless the destination IP is |
| * in the 'except' network range. |
| */ |
| if (!(s->flags & SN_FRT_ADDR_SET)) |
| get_frt_addr(s); |
| |
| if ((!s->fe->except_mask_to.s_addr || |
| (((struct sockaddr_in *)&s->frt_addr)->sin_addr.s_addr & s->fe->except_mask_to.s_addr) |
| != s->fe->except_to.s_addr) && |
| (!s->be->except_mask_to.s_addr || |
| (((struct sockaddr_in *)&s->frt_addr)->sin_addr.s_addr & s->be->except_mask_to.s_addr) |
| != s->be->except_to.s_addr)) { |
| int len; |
| unsigned char *pn; |
| pn = (unsigned char *)&((struct sockaddr_in *)&s->frt_addr)->sin_addr; |
| |
| /* Note: we rely on the backend to get the header name to be used for |
| * x-original-to, because the header is really meant for the backends. |
| * However, if the backend did not specify any option, we have to rely |
| * on the frontend's header name. |
| */ |
| if (s->be->orgto_hdr_len) { |
| len = s->be->orgto_hdr_len; |
| memcpy(trash, s->be->orgto_hdr_name, len); |
| } else { |
| len = s->fe->orgto_hdr_len; |
| memcpy(trash, s->fe->orgto_hdr_name, len); |
| } |
| len += sprintf(trash + len, ": %d.%d.%d.%d", pn[0], pn[1], pn[2], pn[3]); |
| |
| if (unlikely(http_header_add_tail2(req, &txn->req, |
| &txn->hdr_idx, trash, len)) < 0) |
| goto return_bad_req; |
| } |
| } |
| } |
| |
| /* |
| * 11: add "Connection: close" if needed and not yet set. |
| * Note that we do not need to add it in case of HTTP/1.0. |
| */ |
| if (!(s->flags & SN_CONN_CLOSED) && |
| ((s->fe->options | s->be->options) & (PR_O_HTTP_CLOSE|PR_O_FORCE_CLO))) { |
| if ((unlikely(msg->sl.rq.v_l != 8) || |
| unlikely(req->data[msg->som + msg->sl.rq.v + 7] != '0')) && |
| unlikely(http_header_add_tail2(req, &txn->req, &txn->hdr_idx, |
| "Connection: close", 17)) < 0) |
| goto return_bad_req; |
| s->flags |= SN_CONN_CLOSED; |
| } |
| /* Before we switch to data, was assignment set in manage_client_side_cookie? |
| * If not assigned, perhaps we are balancing on url_param, but this is a |
| * POST; and the parameters are in the body, maybe scan there to find our server. |
| * (unless headers overflowed the buffer?) |
| */ |
| if (!(s->flags & (SN_ASSIGNED|SN_DIRECT)) && |
| s->txn.meth == HTTP_METH_POST && s->be->url_param_name != NULL && |
| s->be->url_param_post_limit != 0 && !(req->flags & BF_FULL) && |
| memchr(msg->sol + msg->sl.rq.u, '?', msg->sl.rq.u_l) == NULL) { |
| /* are there enough bytes here? total == l || r || rlim ? |
| * len is unsigned, but eoh is int, |
| * how many bytes of body have we received? |
| * eoh is the first empty line of the header |
| */ |
| /* already established CRLF or LF at eoh, move to start of message, find message length in buffer */ |
| unsigned long len = req->l - (msg->sol[msg->eoh] == '\r' ? msg->eoh + 2 : msg->eoh + 1); |
| |
| /* If we have HTTP/1.1 and Expect: 100-continue, then abort. |
| * We can't assume responsibility for the server's decision, |
| * on this URI and header set. See rfc2616: 14.20, 8.2.3, |
| * We also can't change our mind later, about which server to choose, so round robin. |
| */ |
| if ((likely(msg->sl.rq.v_l == 8) && req->data[msg->som + msg->sl.rq.v + 7] == '1')) { |
| struct hdr_ctx ctx; |
| ctx.idx = 0; |
| /* Expect is allowed in 1.1, look for it */ |
| http_find_header2("Expect", 6, msg->sol, &txn->hdr_idx, &ctx); |
| if (ctx.idx != 0 && |
| unlikely(ctx.vlen == 12 && strncasecmp(ctx.line+ctx.val, "100-continue", 12) == 0)) |
| /* We can't reliablly stall and wait for data, because of |
| * .NET clients that don't conform to rfc2616; so, no need for |
| * the next block to check length expectations. |
| * We could send 100 status back to the client, but then we need to |
| * re-write headers, and send the message. And this isn't the right |
| * place for that action. |
| * TODO: support Expect elsewhere and delete this block. |
| */ |
| goto end_check_maybe_wait_for_body; |
| } |
| |
| if (likely(len > s->be->url_param_post_limit)) { |
| /* nothing to do, we got enough */ |
| } else { |
| /* limit implies we are supposed to need this many bytes |
| * to find the parameter. Let's see how many bytes we can wait for. |
| */ |
| long long hint = len; |
| struct hdr_ctx ctx; |
| ctx.idx = 0; |
| http_find_header2("Transfer-Encoding", 17, msg->sol, &txn->hdr_idx, &ctx); |
| if (ctx.idx && ctx.vlen >= 7 && strncasecmp(ctx.line+ctx.val, "chunked", 7) == 0) { |
| buffer_write_dis(req); |
| req->analysers |= AN_REQ_HTTP_BODY; |
| } |
| else { |
| ctx.idx = 0; |
| http_find_header2("Content-Length", 14, msg->sol, &txn->hdr_idx, &ctx); |
| /* now if we have a length, we'll take the hint */ |
| if (ctx.idx) { |
| /* We have Content-Length */ |
| if (strl2llrc(ctx.line+ctx.val,ctx.vlen, &hint)) |
| hint = 0; /* parse failure, untrusted client */ |
| else { |
| if (hint > 0) |
| msg->hdr_content_len = hint; |
| else |
| hint = 0; /* bad client, sent negative length */ |
| } |
| } |
| /* but limited to what we care about, maybe we don't expect any entity data (hint == 0) */ |
| if (s->be->url_param_post_limit < hint) |
| hint = s->be->url_param_post_limit; |
| /* now do we really need to buffer more data? */ |
| if (len < hint) { |
| buffer_write_dis(req); |
| req->analysers |= AN_REQ_HTTP_BODY; |
| } |
| /* else... There are no body bytes to wait for */ |
| } |
| } |
| } |
| end_check_maybe_wait_for_body: |
| |
| /************************************************************* |
| * OK, that's finished for the headers. We have done what we * |
| * could. Let's switch to the DATA state. * |
| ************************************************************/ |
| |
| buffer_set_rlim(req, BUFSIZE); /* no more rewrite needed */ |
| s->logs.tv_request = now; |
| |
| /* When a connection is tarpitted, we use the tarpit timeout, |
| * which may be the same as the connect timeout if unspecified. |
| * If unset, then set it to zero because we really want it to |
| * eventually expire. We build the tarpit as an analyser. |
| */ |
| if (txn->flags & TX_CLTARPIT) { |
| buffer_erase(s->req); |
| /* wipe the request out so that we can drop the connection early |
| * if the client closes first. |
| */ |
| buffer_write_dis(req); |
| req->analysers |= AN_REQ_HTTP_TARPIT; |
| req->analyse_exp = tick_add_ifset(now_ms, s->be->timeout.tarpit); |
| if (!req->analyse_exp) |
| req->analyse_exp = tick_add(now_ms, 0); |
| } |
| |
| /* OK let's go on with the BODY now */ |
| return 1; |
| |
| return_bad_req: /* let's centralize all bad requests */ |
| if (unlikely(msg->msg_state == HTTP_MSG_ERROR) || msg->err_pos >= 0) { |
| /* we detected a parsing error. We want to archive this request |
| * in the dedicated proxy area for later troubleshooting. |
| */ |
| http_capture_bad_message(&s->fe->invalid_req, s, req, msg, s->fe); |
| } |
| |
| txn->req.msg_state = HTTP_MSG_ERROR; |
| txn->status = 400; |
| req->analysers = 0; |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_400)); |
| s->fe->failed_req++; |
| |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_PRXCOND; |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_R; |
| return 0; |
| } |
| |
| /* This function is an analyser which processes the HTTP tarpit. It always |
| * returns zero, at the beginning because it prevents any other processing |
| * from occurring, and at the end because it terminates the request. |
| */ |
| int http_process_tarpit(struct session *s, struct buffer *req, int an_bit) |
| { |
| struct http_txn *txn = &s->txn; |
| |
| /* This connection is being tarpitted. The CLIENT side has |
| * already set the connect expiration date to the right |
| * timeout. We just have to check that the client is still |
| * there and that the timeout has not expired. |
| */ |
| if ((req->flags & (BF_SHUTR|BF_READ_ERROR)) == 0 && |
| !tick_is_expired(req->analyse_exp, now_ms)) |
| return 0; |
| |
| /* We will set the queue timer to the time spent, just for |
| * logging purposes. We fake a 500 server error, so that the |
| * attacker will not suspect his connection has been tarpitted. |
| * It will not cause trouble to the logs because we can exclude |
| * the tarpitted connections by filtering on the 'PT' status flags. |
| */ |
| s->logs.t_queue = tv_ms_elapsed(&s->logs.tv_accept, &now); |
| |
| txn->status = 500; |
| if (req->flags != BF_READ_ERROR) |
| stream_int_retnclose(req->prod, error_message(s, HTTP_ERR_500)); |
| |
| req->analysers = 0; |
| req->analyse_exp = TICK_ETERNITY; |
| |
| s->fe->failed_req++; |
| if (!(s->flags & SN_ERR_MASK)) |
| s->flags |= SN_ERR_PRXCOND; |
| if (!(s->flags & SN_FINST_MASK)) |
| s->flags |= SN_FINST_T; |
| return 0; |
| } |
| |
| /* This function is an analyser which processes the HTTP request body. It looks |
| * for parameters to be used for the load balancing algorithm (url_param). It |
| * must only be called after the standard HTTP request processing has occurred, |
| * because it expects the request to be parsed. It returns zero if it needs to |
| * read more data, or 1 once it has completed its analysis. |
| */ |
| int http_process_request_body(struct session *s, struct buffer *req, int an_bit) |
| { |
| struct http_msg *msg = &s->txn.req; |
| unsigned long body = msg->sol[msg->eoh] == '\r' ? msg->eoh + 2 : msg->eoh + 1; |
| long long limit = s->be->url_param_post_limit; |
| struct hdr_ctx ctx; |
| |
| if (unlikely(msg->msg_state != HTTP_MSG_BODY)) { |
| /* we need more data */ |
| buffer_write_dis(req); |
| return 0; |
| } |
| |
| /* We have to parse the HTTP request body to find any required data. |
| * "balance url_param check_post" should have been the only way to get |
| * into this. We were brought here after HTTP header analysis, so all |
| * related structures are ready. |
| */ |
| |
| ctx.idx = 0; |
| |
| /* now if we have a length, we'll take the hint */ |
| http_find_header2("Transfer-Encoding", 17, msg->sol, &s->txn.hdr_idx, &ctx); |
| if (ctx.idx && ctx.vlen >= 7 && strncasecmp(ctx.line+ctx.val, "chunked", 7) == 0) { |
| unsigned int chunk = 0; |
| while (body < req->l && !HTTP_IS_CRLF(msg->sol[body])) { |
| char c = msg->sol[body]; |
| if (ishex(c)) { |
| unsigned int hex = toupper(c) - '0'; |
| if (hex > 9) |
| hex -= 'A' - '9' - 1; |
| chunk = (chunk << 4) | hex; |
| } else |
| break; |
| body++; |
| } |
| if (body + 2 >= req->l) /* we want CRLF too */ |
| goto http_body_end; /* end of buffer? data missing! */ |
| |
| if (memcmp(msg->sol+body, "\r\n", 2) != 0) |
| goto http_body_end; /* chunked encoding len ends with CRLF, and we don't have it yet */ |
| |
| body += 2; // skip CRLF |
| |
| /* if we support more then one chunk here, we have to do it again when assigning server |
| * 1. how much entity data do we have? new var |
| * 2. should save entity_start, entity_cursor, elen & rlen in req; so we don't repeat scanning here |
| * 3. test if elen > limit, or set new limit to elen if 0 (end of entity found) |
| */ |
| |
| if (chunk < limit) |
| limit = chunk; /* only reading one chunk */ |
| } else { |
| if (msg->hdr_content_len < limit) |
| limit = msg->hdr_content_len; |
| } |
| |
| http_body_end: |
| /* we leave once we know we have nothing left to do. This means that we have |
| * enough bytes, or that we know we'll not get any more (buffer full, read |
| * buffer closed). |
| */ |
| if (req->l - body >= limit || /* enough bytes! */ |
| req->flags & (BF_FULL | BF_READ_ERROR | BF_SHUTR | BF_READ_TIMEOUT) || |
| tick_is_expired(req->analyse_exp, now_ms)) { |
| /* The situation will not evolve, so let's give up on the analysis. */ |
| s->logs.tv_request = now; /* update the request timer to reflect full request */ |
| req->analysers &= ~an_bit; |
| req->analyse_exp = TICK_ETERNITY; |
| return 1; |
| } |
| else { |
| /* Not enough data. We'll re-use the http-request |
| * timeout here. Ideally, we should set the timeout |
| * relative to the accept() date. We just set the |
| * request timeout once at the beginning of the |
| * request. |
| */ |
| buffer_write_dis(req); |
| if (!tick_isset(req->analyse_exp)) |
| req->analyse_exp = tick_add_ifset(now_ms, s->be->timeout.httpreq); |
| return 0; |
| } |
| } |
| |
| /* This function performs all the processing enabled for the current response. |
| * It normally returns zero, but may return 1 if it absolutely needs to be |
| * called again after other functions. It relies on buffers flags, and updates |
| * t->rep->analysers. It might make sense to explode it into several other |
| * functions. It works like process_request (see indications above). |
| */ |
| int process_response(struct session *t) |
| { |
| struct http_txn *txn = &t->txn; |
| struct buffer *req = t->req; |
| struct buffer *rep = t->rep; |
| |
| DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bl=%d analysers=%02x\n", |
| now_ms, __FUNCTION__, |
| t, |
| rep, |
| rep->rex, rep->wex, |
| rep->flags, |
| rep->l, |
| rep->analysers); |
| |
| if (rep->analysers & AN_RTR_HTTP_HDR) { /* receiving server headers */ |
| /* |
| * Now parse the partial (or complete) lines. |
| * We will check the response syntax, and also join multi-line |
| * headers. An index of all the lines will be elaborated while |
| * parsing. |
| * |
| * For the parsing, we use a 28 states FSM. |
| * |
| * Here is the information we currently have : |
| * rep->data + rep->som = beginning of response |
| * rep->data + rep->eoh = end of processed headers / start of current one |
| * rep->data + rep->eol = end of current header or line (LF or CRLF) |
| * rep->lr = first non-visited byte |
| * rep->r = end of data |
| */ |
| |
| int cur_idx; |
| struct http_msg *msg = &txn->rsp; |
| struct proxy *cur_proxy; |
| |
| if (likely(rep->lr < rep->r)) |
| http_msg_analyzer(rep, msg, &txn->hdr_idx); |
| |
| /* 1: we might have to print this header in debug mode */ |
| if (unlikely((global.mode & MODE_DEBUG) && |
| (!(global.mode & MODE_QUIET) || (global.mode & MODE_VERBOSE)) && |
| (msg->msg_state == HTTP_MSG_BODY || msg->msg_state == HTTP_MSG_ERROR))) { |
| char *eol, *sol; |
| |
| sol = rep->data + msg->som; |
| eol = sol + msg->sl.rq.l; |
| debug_hdr("srvrep"
|