blob: 12228b1fe542d40441941de8cd0f15edeebafdeb [file] [log] [blame]
Christopher Fauletf4eb75d2018-10-11 15:55:07 +02001/*
2 * HTTP protocol analyzer
3 *
4 * Copyright (C) 2018 HAProxy Technologies, Christopher Faulet <cfaulet@haproxy.com>
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
Willy Tarreaudcc048a2020-06-04 19:11:43 +020013#include <haproxy/acl.h>
Willy Tarreau122eba92020-06-04 10:15:32 +020014#include <haproxy/action-t.h>
Willy Tarreau4c7e4b72020-05-27 12:58:42 +020015#include <haproxy/api.h>
Willy Tarreau91cefca2022-05-03 17:08:29 +020016#include <haproxy/applet.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020017#include <haproxy/backend.h>
Willy Tarreau8d366972020-05-27 16:10:29 +020018#include <haproxy/base64.h>
Willy Tarreaudfd3de82020-06-04 23:46:14 +020019#include <haproxy/capture-t.h>
Amaury Denoyelle03517732021-05-07 14:25:01 +020020#include <haproxy/cfgparse.h>
Willy Tarreauf1d32c42020-06-04 21:07:02 +020021#include <haproxy/channel.h>
Willy Tarreau4aa573d2020-06-04 18:21:56 +020022#include <haproxy/check.h>
Willy Tarreau7ea393d2020-06-04 18:02:10 +020023#include <haproxy/connection.h>
Willy Tarreau36979d92020-06-05 17:27:29 +020024#include <haproxy/errors.h>
Willy Tarreauc7babd82020-06-04 21:29:29 +020025#include <haproxy/filters.h>
Willy Tarreaucd72d8c2020-06-02 19:11:26 +020026#include <haproxy/http.h>
Willy Tarreauc2b1ff02020-06-04 21:21:03 +020027#include <haproxy/http_ana.h>
Willy Tarreau87735332020-06-04 09:08:41 +020028#include <haproxy/http_htx.h>
Aurelien DARRAGONb2bb9252022-12-28 15:37:57 +010029#include <haproxy/http_ext.h>
Willy Tarreau16f958c2020-06-03 08:44:35 +020030#include <haproxy/htx.h>
Willy Tarreauaeed4a82020-06-04 22:01:04 +020031#include <haproxy/log.h>
Willy Tarreau6131d6a2020-06-02 16:48:09 +020032#include <haproxy/net_helper.h>
Willy Tarreaua264d962020-06-04 22:29:18 +020033#include <haproxy/proxy.h>
Willy Tarreau7cd8b6e2020-06-02 17:32:26 +020034#include <haproxy/regex.h>
Willy Tarreau5edca2f2022-05-27 09:25:10 +020035#include <haproxy/sc_strm.h>
Willy Tarreau1e56f922020-06-04 23:20:13 +020036#include <haproxy/server-t.h>
Willy Tarreau2eec9b52020-06-04 19:58:55 +020037#include <haproxy/stats.h>
Willy Tarreaucb086c62022-05-27 09:47:12 +020038#include <haproxy/stconn.h>
Willy Tarreaudfd3de82020-06-04 23:46:14 +020039#include <haproxy/stream.h>
Willy Tarreaudfd3de82020-06-04 23:46:14 +020040#include <haproxy/trace.h>
Willy Tarreau8c42b8a2020-06-04 19:27:34 +020041#include <haproxy/uri_auth-t.h>
Willy Tarreaua1718922020-06-04 16:25:31 +020042#include <haproxy/vars.h>
Christopher Faulete0768eb2018-10-03 16:38:02 +020043
Christopher Faulete0768eb2018-10-03 16:38:02 +020044
/* Trace source used by the DBG_TRACE_* calls in this file. */
Christopher Fauleteea8fc72019-11-05 16:18:10 +010045#define TRACE_SOURCE &trace_strm
46
Christopher Faulet377c5a52018-10-24 21:21:30 +020047extern const char *stat_status_codes[];
Christopher Fauletf2824e62018-10-01 12:12:37 +020048
/* Memory pools. pool_head_requri backs the txn->uri buffer allocated in
 * http_wait_for_request(). Both pointers start as NULL here; where they are
 * created is not visible in this part of the file.
 */
Willy Tarreauff882702021-04-10 17:23:00 +020049struct pool_head *pool_head_requri __read_mostly = NULL;
50struct pool_head *pool_head_capture __read_mostly = NULL;
Christopher Fauleta8a46e22019-07-16 14:53:09 +020051
52
/* Prototypes of the file-local (static) helpers. */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +020053static void http_end_request(struct stream *s);
54static void http_end_response(struct stream *s);
Christopher Fauletf2824e62018-10-01 12:12:37 +020055
Christopher Fauletfc9cfe42019-07-16 14:54:53 +020056static void http_capture_headers(struct htx *htx, char **cap, struct cap_hdr *cap_hdr);
57static int http_del_hdr_value(char *start, char *end, char **from, char *next);
58static size_t http_fmt_req_line(const struct htx_sl *sl, char *str, size_t len);
Christopher Fauletfc9cfe42019-07-16 14:54:53 +020059static void http_debug_stline(const char *dir, struct stream *s, const struct htx_sl *sl);
60static void http_debug_hdr(const char *dir, struct stream *s, const struct ist n, const struct ist v);
Christopher Faulet0f226952018-10-22 09:29:56 +020061
/* HTTP rule evaluation helpers; each returns an enum rule_result verdict. */
Christopher Fauletd4150ad2021-10-13 15:35:55 +020062static enum rule_result http_req_get_intercept_rule(struct proxy *px, struct list *def_rules, struct list *rules, struct stream *s);
63static enum rule_result http_res_get_intercept_rule(struct proxy *px, struct list *def_rules, struct list *rules, struct stream *s);
Christopher Faulet18c13d32022-05-16 11:43:10 +020064static enum rule_result http_req_restrict_header_names(struct stream *s, struct htx *htx, struct proxy *px);
Christopher Faulet3e964192018-10-24 11:39:23 +020065
Christopher Fauletfc9cfe42019-07-16 14:54:53 +020066static void http_manage_client_side_cookies(struct stream *s, struct channel *req);
67static void http_manage_server_side_cookies(struct stream *s, struct channel *res);
Christopher Fauletfcda7c62018-10-24 11:56:22 +020068
Aurelien DARRAGONf6286142023-12-05 17:54:20 +010069static int http_stats_check_uri(struct stream *s, struct http_txn *txn, struct proxy *px);
70static int http_handle_stats(struct stream *s, struct channel *req, struct proxy *px);
Christopher Faulet377c5a52018-10-24 21:21:30 +020071
Christopher Fauletfc9cfe42019-07-16 14:54:53 +020072static int http_handle_expect_hdr(struct stream *s, struct htx *htx, struct http_msg *msg);
73static int http_reply_100_continue(struct stream *s);
Christopher Faulet23a3c792018-11-28 10:01:23 +010074
Christopher Faulet23a3c792018-11-28 10:01:23 +010074
Christopher Faulete0768eb2018-10-03 16:38:02 +020075/* This stream analyser waits for a complete HTTP request. It returns 1 if the
76 * processing can continue on next analysers, or zero if it either needs more
77 * data or wants to immediately abort the request (eg: timeout, error, ...). It
78 * is tied to AN_REQ_WAIT_HTTP and may remove itself from s->req.analysers
79 * when it has nothing left to do, and may remove any analyser when it wants to
80 * abort.
 *
 * Error paths set txn->status (400 on a bad request, 500 on an internal
 * error, 200 or 503 for a request matching the frontend monitor-uri), emit
 * the reply with http_reply_and_close() and return 0.
81 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +020082int http_wait_for_request(struct stream *s, struct channel *req, int an_bit)
Christopher Faulete0768eb2018-10-03 16:38:02 +020083{
Christopher Faulet9768c262018-10-22 09:34:31 +020084
Christopher Faulete0768eb2018-10-03 16:38:02 +020085 /*
Christopher Faulet9768c262018-10-22 09:34:31 +020086 * We will analyze a complete HTTP request to check its syntax.
Christopher Faulete0768eb2018-10-03 16:38:02 +020087 *
Christopher Faulet9768c262018-10-22 09:34:31 +020088 * Once the start line and all headers are received, we may perform a
89 * capture of the error (if any), and we will set a few fields. We also
90 * check for monitor-uri, logging and finally headers capture.
Christopher Faulete0768eb2018-10-03 16:38:02 +020091 */
Christopher Faulete0768eb2018-10-03 16:38:02 +020092 struct session *sess = s->sess;
93 struct http_txn *txn = s->txn;
94 struct http_msg *msg = &txn->req;
Christopher Faulet9768c262018-10-22 09:34:31 +020095 struct htx *htx;
Christopher Fauletf1ba18d2018-11-26 21:37:08 +010096 struct htx_sl *sl;
Frédéric Lécaille9969adb2023-01-18 11:52:21 +010097 char http_ver;
98 int len;
Christopher Faulete0768eb2018-10-03 16:38:02 +020099
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100100 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn, msg);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200101
Christopher Fauletda46a0d2021-01-21 17:32:58 +0100102 if (unlikely(!IS_HTX_STRM(s))) {
103 /* It is only possible when a TCP stream is upgraded to HTTP.
104 * There is a transition period during which there is no
105 * data. The stream is still in raw mode and SF_IGNORE flag is
106 * still set. When this happens, the new mux is responsible to
Ilya Shipitsinacf84592021-02-06 22:29:08 +0500107 * handle all errors. Thus we may leave immediately.
Christopher Fauletda46a0d2021-01-21 17:32:58 +0100108 */
109 BUG_ON(!(s->flags & SF_IGNORE) || !c_empty(&s->req));
Christopher Faulet9768c262018-10-22 09:34:31 +0200110
Christopher Faulet97b3a612021-03-15 17:10:12 +0100111 /* Don't connect for now */
112 channel_dont_connect(req);
113
Christopher Faulet0c370ee2023-04-13 16:05:13 +0200114 /* An abort at this stage means we are performing a "destructive"
Christopher Faulet97b3a612021-03-15 17:10:12 +0100115 * HTTP upgrade (TCP>H2). In this case, we can leave.
116 */
Christopher Fauletca5309a2023-04-17 16:17:32 +0200117 if (s->scf->flags & (SC_FL_ABRT_DONE|SC_FL_EOS)) {
 /* Disable logging for this stream, abort it, and keep only
  * the AN_REQ_FLT_END analyser bit (if it was set).
  */
Christopher Faulet97b3a612021-03-15 17:10:12 +0100118 s->logs.logwait = 0;
119 s->logs.level = 0;
Christopher Faulet7eb837d2023-04-13 15:22:29 +0200120 stream_abort(s);
Christopher Faulet97b3a612021-03-15 17:10:12 +0100121 req->analysers &= AN_REQ_FLT_END;
122 req->analyse_exp = TICK_ETERNITY;
123 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA, s);
124 return 1;
125 }
Christopher Fauletda46a0d2021-01-21 17:32:58 +0100126 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA, s);
127 return 0;
128 }
129
 /* Derive the HTTP major version digit from the 6th character of the
  * request version string (e.g. HTTP/1.1 gives 1); 0 is used when the
  * string is shorter than 6 characters. The value is only passed to
  * proxy_inc_fe_req_ctr() below.
  */
130 htx = htxbuf(&req->buf);
Frédéric Lécaille9969adb2023-01-18 11:52:21 +0100131 sl = http_get_stline(htx);
132 len = HTX_SL_REQ_VLEN(sl);
133 if (len < 6) {
134 http_ver = 0;
135 }
136 else {
137 char *ptr;
138
139 ptr = HTX_SL_REQ_VPTR(sl);
140 http_ver = ptr[5] - '0';
141 }
Christopher Faulet8bebd2f2020-10-06 17:54:56 +0200142
Willy Tarreau4236f032019-03-05 10:43:32 +0100143 /* Parsing errors are caught here */
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200144 if (htx->flags & (HTX_FL_PARSING_ERROR|HTX_FL_PROCESSING_ERROR)) {
 /* The request counters are bumped on this path too; only a
  * parsing error additionally counts as an HTTP error.
  */
Willy Tarreau4236f032019-03-05 10:43:32 +0100145 stream_inc_http_req_ctr(s);
Frédéric Lécaille9969adb2023-01-18 11:52:21 +0100146 proxy_inc_fe_req_ctr(sess->listener, sess->fe, http_ver);
Christopher Fauletbf7175f2021-02-10 14:58:01 +0100147 if (htx->flags & HTX_FL_PARSING_ERROR) {
148 stream_inc_http_err_ctr(s);
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200149 goto return_bad_req;
Christopher Fauletbf7175f2021-02-10 14:58:01 +0100150 }
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200151 else
152 goto return_int_err;
Willy Tarreau4236f032019-03-05 10:43:32 +0100153 }
154
Christopher Faulete0768eb2018-10-03 16:38:02 +0200155 /* we're speaking HTTP here, so let's speak HTTP to the client */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200156 s->srv_error = http_return_srv_error;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200157
Christopher Faulet9768c262018-10-22 09:34:31 +0200158 msg->msg_state = HTTP_MSG_BODY;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200159 stream_inc_http_req_ctr(s);
Frédéric Lécaille9969adb2023-01-18 11:52:21 +0100160 proxy_inc_fe_req_ctr(sess->listener, sess->fe, http_ver); /* one more valid request for this FE */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200161
Christopher Faulet9768c262018-10-22 09:34:31 +0200162 /* kill the pending keep-alive timeout */
Christopher Faulet9768c262018-10-22 09:34:31 +0200163 req->analyse_exp = TICK_ETERNITY;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200164
Christopher Faulet29f17582019-05-23 11:03:26 +0200165 BUG_ON(htx_get_first_type(htx) != HTX_BLK_REQ_SL);
Christopher Faulet03599112018-11-27 11:21:21 +0100166
Christopher Faulet9768c262018-10-22 09:34:31 +0200167 /* 0: we might have to print this header in debug mode */
168 if (unlikely((global.mode & MODE_DEBUG) &&
169 (!(global.mode & MODE_QUIET) || (global.mode & MODE_VERBOSE)))) {
170 int32_t pos;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200171
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200172 http_debug_stline("clireq", s, sl);
Christopher Faulet9768c262018-10-22 09:34:31 +0200173
 /* Dump every header block, stopping at the end-of-headers block */
Christopher Fauleta3f15502019-05-13 15:27:23 +0200174 for (pos = htx_get_first(htx); pos != -1; pos = htx_get_next(htx, pos)) {
Christopher Faulet9768c262018-10-22 09:34:31 +0200175 struct htx_blk *blk = htx_get_blk(htx, pos);
176 enum htx_blk_type type = htx_get_blk_type(blk);
177
178 if (type == HTX_BLK_EOH)
179 break;
180 if (type != HTX_BLK_HDR)
181 continue;
182
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200183 http_debug_hdr("clihdr", s,
184 htx_get_blk_name(htx, blk),
185 htx_get_blk_value(htx, blk));
Christopher Faulet9768c262018-10-22 09:34:31 +0200186 }
187 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200188
189 /*
Christopher Faulet03599112018-11-27 11:21:21 +0100190 * 1: identify the method and the version. Also set HTTP flags
Christopher Faulete0768eb2018-10-03 16:38:02 +0200191 */
Christopher Fauletf1ba18d2018-11-26 21:37:08 +0100192 txn->meth = sl->info.req.meth;
Christopher Faulet03599112018-11-27 11:21:21 +0100193 if (sl->flags & HTX_SL_F_VER_11)
Christopher Faulet9768c262018-10-22 09:34:31 +0200194 msg->flags |= HTTP_MSGF_VER_11;
Christopher Faulet03599112018-11-27 11:21:21 +0100195 msg->flags |= HTTP_MSGF_XFER_LEN;
Christopher Faulet2a408542020-11-20 14:22:37 +0100196 if (sl->flags & HTX_SL_F_CLEN)
197 msg->flags |= HTTP_MSGF_CNT_LEN;
198 else if (sl->flags & HTX_SL_F_CHNK)
199 msg->flags |= HTTP_MSGF_TE_CHNK;
Christopher Fauletb2db4fa2018-11-27 16:51:09 +0100200 if (sl->flags & HTX_SL_F_BODYLESS)
201 msg->flags |= HTTP_MSGF_BODYLESS;
Christopher Faulet576c3582021-01-08 15:53:01 +0100202 if (sl->flags & HTX_SL_F_CONN_UPG)
203 msg->flags |= HTTP_MSGF_CONN_UPG;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200204
205 /* we can make use of server redirect on GET and HEAD */
206 if (txn->meth == HTTP_METH_GET || txn->meth == HTTP_METH_HEAD)
207 s->flags |= SF_REDIRECTABLE;
Christopher Fauletf1ba18d2018-11-26 21:37:08 +0100208 else if (txn->meth == HTTP_METH_OTHER && isteqi(htx_sl_req_meth(sl), ist("PRI"))) {
Christopher Faulete0768eb2018-10-03 16:38:02 +0200209 /* PRI is reserved for the HTTP/2 preface */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200210 goto return_bad_req;
211 }
212
213 /*
Christopher Faulet6072beb2020-02-18 15:34:58 +0100214 * 2: check if the URI matches the monitor_uri. We have to do this for
215 * every request which gets in, because the monitor-uri is defined by
216 * the frontend. If the monitor-uri starts with a '/', the matching is
217 * done against the request's path. Otherwise, the request's uri is
218 * used. It is a workaround to let HTTP/2 health-checks work as
219 * expected.
Christopher Faulete0768eb2018-10-03 16:38:02 +0200220 */
Tim Duesterhus4b1fcaa2022-03-05 00:52:40 +0100221 if (unlikely(isttest(sess->fe->monitor_uri))) {
222 const struct ist monitor_uri = sess->fe->monitor_uri;
Amaury Denoyellec453f952021-07-06 11:40:12 +0200223 struct http_uri_parser parser = http_uri_parser_init(htx_sl_req_uri(sl));
Christopher Faulete0768eb2018-10-03 16:38:02 +0200224
Amaury Denoyelle5a9bd372021-07-06 11:23:10 +0200225 if ((istptr(monitor_uri)[0] == '/' &&
Amaury Denoyellec453f952021-07-06 11:40:12 +0200226 isteq(http_parse_path(&parser), monitor_uri)) ||
Amaury Denoyelle5a9bd372021-07-06 11:23:10 +0200227 isteq(htx_sl_req_uri(sl), monitor_uri)) {
228 /*
229 * We have found the monitor URI
230 */
231 struct acl_cond *cond;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200232
Amaury Denoyelle5a9bd372021-07-06 11:23:10 +0200233 s->flags |= SF_MONITOR;
234 _HA_ATOMIC_INC(&sess->fe->fe_counters.intercepted_req);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200235
Amaury Denoyelle5a9bd372021-07-06 11:23:10 +0200236 /* Check if we want to fail this monitor request or not */
237 list_for_each_entry(cond, &sess->fe->mon_fail_cond, list) {
238 int ret = acl_exec_cond(cond, sess->fe, sess, s, SMP_OPT_DIR_REQ|SMP_OPT_FINAL);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200239
Amaury Denoyelle5a9bd372021-07-06 11:23:10 +0200240 ret = acl_pass(ret);
241 if (cond->pol == ACL_COND_UNLESS)
242 ret = !ret;
243
244 if (ret) {
245 /* we fail this request, let's return 503 service unavail */
246 txn->status = 503;
247 if (!(s->flags & SF_ERR_MASK))
248 s->flags |= SF_ERR_LOCAL; /* we don't want a real error here */
249 goto return_prx_cond;
250 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200251 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200252
Amaury Denoyelle5a9bd372021-07-06 11:23:10 +0200253 /* nothing to fail, let's reply normally */
254 txn->status = 200;
255 if (!(s->flags & SF_ERR_MASK))
256 s->flags |= SF_ERR_LOCAL; /* we don't want a real error here */
257 goto return_prx_cond;
258 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200259 }
260
261 /*
262 * 3: Maybe we have to copy the original REQURI for the logs ?
263 * Note: we cannot log anymore if the request has been
264 * classified as invalid.
265 */
266 if (unlikely(s->logs.logwait & LW_REQ)) {
267 /* we have a complete HTTP request that we must log */
268 if ((txn->uri = pool_alloc(pool_head_requri)) != NULL) {
Christopher Faulet9768c262018-10-22 09:34:31 +0200269 size_t len; /* NOTE: shadows the function-scope int len declared above */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200270
 /* Format at most requri_len - 1 bytes so that the terminating
  * zero written just below fits (assumes pool_head_requri
  * entries are global.tune.requri_len bytes; TODO confirm
  * where the pool is created).
  */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200271 len = http_fmt_req_line(sl, txn->uri, global.tune.requri_len - 1);
Christopher Faulet9768c262018-10-22 09:34:31 +0200272 txn->uri[len] = 0;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200273
 /* Clear LW_REQ and LW_INIT from logwait; if no other log
  * condition remains pending, emit the log right now.
  */
274 if (!(s->logs.logwait &= ~(LW_REQ|LW_INIT)))
275 s->do_log(s);
276 } else {
277 ha_alert("HTTP logging : out of memory.\n");
278 }
279 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200280
Christopher Faulete0768eb2018-10-03 16:38:02 +0200281 /* if the frontend has "option http-use-proxy-header", we'll check if
282 * we have what looks like a proxied connection instead of a connection,
283 * and in this case set the TX_USE_PX_CONN flag to use Proxy-connection.
284 * Note that this is *not* RFC-compliant, however browsers and proxies
285 * happen to do that despite being non-standard :-(
286 * We consider that a request not beginning with either '/' or '*' is
287 * a proxied connection, which covers both "scheme://location" and
288 * CONNECT ip:port.
289 */
290 if ((sess->fe->options2 & PR_O2_USE_PXHDR) &&
Christopher Fauletf1ba18d2018-11-26 21:37:08 +0100291 *HTX_SL_REQ_UPTR(sl) != '/' && *HTX_SL_REQ_UPTR(sl) != '*')
Christopher Faulete0768eb2018-10-03 16:38:02 +0200292 txn->flags |= TX_USE_PX_CONN;
293
Christopher Faulete0768eb2018-10-03 16:38:02 +0200294 /* 5: we may need to capture headers */
295 if (unlikely((s->logs.logwait & LW_REQHDR) && s->req_cap))
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200296 http_capture_headers(htx, s->req_cap, sess->fe->req_cap);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200297
Christopher Faulete0768eb2018-10-03 16:38:02 +0200298 /* we may have to wait for the request's body */
Christopher Faulet9768c262018-10-22 09:34:31 +0200299 if (s->be->options & PR_O_WREQ_BODY)
Christopher Faulete0768eb2018-10-03 16:38:02 +0200300 req->analysers |= AN_REQ_HTTP_BODY;
301
302 /*
303 * RFC7234#4:
304 * A cache MUST write through requests with methods
305 * that are unsafe (Section 4.2.1 of [RFC7231]) to
306 * the origin server; i.e., a cache is not allowed
307 * to generate a reply to such a request before
308 * having forwarded the request and having received
309 * a corresponding response.
310 *
311 * RFC7231#4.2.1:
312 * Of the request methods defined by this
313 * specification, the GET, HEAD, OPTIONS, and TRACE
314 * methods are defined to be safe.
315 */
316 if (likely(txn->meth == HTTP_METH_GET ||
317 txn->meth == HTTP_METH_HEAD ||
318 txn->meth == HTTP_METH_OPTIONS ||
319 txn->meth == HTTP_METH_TRACE))
320 txn->flags |= TX_CACHEABLE | TX_CACHE_COOK;
321
322 /* end of job, return OK */
323 req->analysers &= ~an_bit;
324 req->analyse_exp = TICK_ETERNITY;
Christopher Faulet9768c262018-10-22 09:34:31 +0200325
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100326 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200327 return 1;
328
 /* Internal error: status 500, flag SF_ERR_INTERNAL unless an error flag
  * is already set, and bump the frontend/listener internal_errors counters.
  */
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200329 return_int_err:
330 txn->status = 500;
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200331 if (!(s->flags & SF_ERR_MASK))
332 s->flags |= SF_ERR_INTERNAL;
Willy Tarreau4781b152021-04-06 13:53:36 +0200333 _HA_ATOMIC_INC(&sess->fe->fe_counters.internal_errors);
William Lallemand36119de2021-03-08 15:26:48 +0100334 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200335 _HA_ATOMIC_INC(&sess->listener->counters->internal_errors);
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200336 goto return_prx_cond;
337
 /* Bad request: status 400 and bump the frontend/listener failed_req counters. */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200338 return_bad_req:
Christopher Faulet9768c262018-10-22 09:34:31 +0200339 txn->status = 400;
Willy Tarreau4781b152021-04-06 13:53:36 +0200340 _HA_ATOMIC_INC(&sess->fe->fe_counters.failed_req);
William Lallemand36119de2021-03-08 15:26:48 +0100341 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200342 _HA_ATOMIC_INC(&sess->listener->counters->failed_req);
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200343 /* fall through */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200344
 /* Common exit for every reply generated here: send the message matching
  * txn->status, set the termination flags and stop the analysis.
  */
345 return_prx_cond:
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200346 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulet4a66c942023-01-13 09:43:21 +0100347 http_set_term_flags(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200348
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100349 DBG_TRACE_DEVEL("leaving on error",
350 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200351 return 0;
352}
353
354
355/* This stream analyser runs all HTTP request processing which is common to
356 * frontends and backends, which means blocking ACLs, filters, connection-close,
357 * reqadd, stats and redirects. This is performed for the designated proxy.
358 * It returns 1 if the processing can continue on next analysers, or zero if it
359 * either needs more data or wants to immediately abort the request (eg: deny,
360 * error, ...).
361 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200362int http_process_req_common(struct stream *s, struct channel *req, int an_bit, struct proxy *px)
Christopher Faulete0768eb2018-10-03 16:38:02 +0200363{
Christopher Fauletd4150ad2021-10-13 15:35:55 +0200364 struct list *def_rules, *rules;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200365 struct session *sess = s->sess;
366 struct http_txn *txn = s->txn;
367 struct http_msg *msg = &txn->req;
Christopher Fauletff2759f2018-10-24 11:13:16 +0200368 struct htx *htx;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200369 struct redirect_rule *rule;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200370 enum rule_result verdict;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200371 struct connection *conn = objt_conn(sess->origin);
372
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100373 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn, msg);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200374
Christopher Faulet27ba2dc2018-12-05 11:53:24 +0100375 htx = htxbuf(&req->buf);
Christopher Fauletff2759f2018-10-24 11:13:16 +0200376
Christopher Faulet1907ccc2019-04-29 13:12:02 +0200377 /* just in case we have some per-backend tracking. Only called the first
378 * execution of the analyser. */
Christopher Fauletd4150ad2021-10-13 15:35:55 +0200379 if (!s->current_rule && !s->current_rule_list)
Christopher Faulet1907ccc2019-04-29 13:12:02 +0200380 stream_inc_be_http_req_ctr(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200381
Christopher Fauletd4150ad2021-10-13 15:35:55 +0200382 def_rules = ((px->defpx && (an_bit == AN_REQ_HTTP_PROCESS_FE || px != sess->fe)) ? &px->defpx->http_req_rules : NULL);
383 rules = &px->http_req_rules;
384
Christopher Faulete0768eb2018-10-03 16:38:02 +0200385 /* evaluate http-request rules */
Christopher Fauletd4150ad2021-10-13 15:35:55 +0200386 if ((def_rules && !LIST_ISEMPTY(def_rules)) || !LIST_ISEMPTY(rules)) {
387 verdict = http_req_get_intercept_rule(px, def_rules, rules, s);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200388
389 switch (verdict) {
390 case HTTP_RULE_RES_YIELD: /* some data miss, call the function later. */
391 goto return_prx_yield;
392
393 case HTTP_RULE_RES_CONT:
394 case HTTP_RULE_RES_STOP: /* nothing to do */
395 break;
396
397 case HTTP_RULE_RES_DENY: /* deny or tarpit */
398 if (txn->flags & TX_CLTARPIT)
399 goto tarpit;
400 goto deny;
401
402 case HTTP_RULE_RES_ABRT: /* abort request, response already sent. Eg: auth */
403 goto return_prx_cond;
404
405 case HTTP_RULE_RES_DONE: /* OK, but terminate request processing (eg: redirect) */
406 goto done;
407
408 case HTTP_RULE_RES_BADREQ: /* failed with a bad request */
409 goto return_bad_req;
Christopher Faulet3a26bee2019-12-16 12:47:40 +0100410
411 case HTTP_RULE_RES_ERROR: /* failed with an internal error */
412 goto return_int_err;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200413 }
414 }
415
Christopher Faulet18c13d32022-05-16 11:43:10 +0200416 if (px->options2 & (PR_O2_RSTRICT_REQ_HDR_NAMES_BLK|PR_O2_RSTRICT_REQ_HDR_NAMES_DEL)) {
417 verdict = http_req_restrict_header_names(s, htx, px);
418 if (verdict == HTTP_RULE_RES_DENY)
419 goto deny;
420 }
421
Christopher Faulete0768eb2018-10-03 16:38:02 +0200422 if (conn && (conn->flags & CO_FL_EARLY_DATA) &&
Olivier Houchard220a26c2020-01-23 14:57:36 +0100423 (conn->flags & (CO_FL_EARLY_SSL_HS | CO_FL_SSL_WAIT_HS))) {
Christopher Fauletff2759f2018-10-24 11:13:16 +0200424 struct http_hdr_ctx ctx;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200425
Christopher Fauletff2759f2018-10-24 11:13:16 +0200426 ctx.blk = NULL;
427 if (!http_find_header(htx, ist("Early-Data"), &ctx, 0)) {
428 if (unlikely(!http_add_header(htx, ist("Early-Data"), ist("1"))))
Christopher Fauletd649b572022-06-01 17:42:35 +0200429 goto return_fail_rewrite;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200430 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200431 }
432
433 /* OK at this stage, we know that the request was accepted according to
434 * the http-request rules, we can check for the stats. Note that the
435 * URI is detected *before* the req* rules in order not to be affected
436 * by a possible reqrep, while they are processed *after* so that a
437 * reqdeny can still block them. This clearly needs to change in 1.6!
438 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200439 if (!s->target && http_stats_check_uri(s, txn, px)) {
Christopher Faulete0768eb2018-10-03 16:38:02 +0200440 s->target = &http_stats_applet.obj_type;
Willy Tarreaua0b58b52022-05-27 08:33:53 +0200441 if (unlikely(!sc_applet_create(s->scb, objt_applet(s->target)))) {
Willy Tarreau69530f52023-04-28 09:16:15 +0200442 s->logs.request_ts = now_ns;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200443 if (!(s->flags & SF_ERR_MASK))
444 s->flags |= SF_ERR_RESOURCE;
Christopher Fauletb8a53712019-12-16 11:29:38 +0100445 goto return_int_err;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200446 }
447
448 /* parse the whole stats request and extract the relevant information */
Aurelien DARRAGONf6286142023-12-05 17:54:20 +0100449 http_handle_stats(s, req, px);
Christopher Fauletd4150ad2021-10-13 15:35:55 +0200450 verdict = http_req_get_intercept_rule(px, NULL, &px->uri_auth->http_req_rules, s);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200451 /* not all actions implemented: deny, allow, auth */
452
453 if (verdict == HTTP_RULE_RES_DENY) /* stats http-request deny */
454 goto deny;
455
456 if (verdict == HTTP_RULE_RES_ABRT) /* stats auth / stats http-request auth */
457 goto return_prx_cond;
Christopher Faulet3a26bee2019-12-16 12:47:40 +0100458
459 if (verdict == HTTP_RULE_RES_BADREQ) /* failed with a bad request */
460 goto return_bad_req;
461
462 if (verdict == HTTP_RULE_RES_ERROR) /* failed with an internal error */
463 goto return_int_err;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200464 }
465
Christopher Faulet2571bc62019-03-01 11:44:26 +0100466 /* Proceed with the applets now. */
467 if (unlikely(objt_applet(s->target))) {
Christopher Faulete0768eb2018-10-03 16:38:02 +0200468 if (sess->fe == s->be) /* report it if the request was intercepted by the frontend */
Willy Tarreau4781b152021-04-06 13:53:36 +0200469 _HA_ATOMIC_INC(&sess->fe->fe_counters.intercepted_req);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200470
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200471 if (http_handle_expect_hdr(s, htx, msg) == -1)
Christopher Fauletb8a53712019-12-16 11:29:38 +0100472 goto return_int_err;
Christopher Fauletbcf242a2019-03-01 11:36:26 +0100473
Christopher Faulete0768eb2018-10-03 16:38:02 +0200474 if (!(s->flags & SF_ERR_MASK)) // this is not really an error but it is
475 s->flags |= SF_ERR_LOCAL; // to mark that it comes from the proxy
Christopher Faulet4a66c942023-01-13 09:43:21 +0100476 http_set_term_flags(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200477
Christopher Fauletc2ac5e42021-03-08 18:20:09 +0100478 if (HAS_FILTERS(s))
479 req->analysers |= AN_REQ_FLT_HTTP_HDRS;
480
Christopher Faulete0768eb2018-10-03 16:38:02 +0200481 /* enable the minimally required analyzers to handle keep-alive and compression on the HTTP response */
482 req->analysers &= (AN_REQ_HTTP_BODY | AN_REQ_FLT_HTTP_HDRS | AN_REQ_FLT_END);
483 req->analysers &= ~AN_REQ_FLT_XFER_DATA;
484 req->analysers |= AN_REQ_HTTP_XFER_BODY;
Christopher Fauletbcf242a2019-03-01 11:36:26 +0100485
Christopher Faulet5c281d52023-03-16 15:53:28 +0100486 s->scb->flags |= SC_FL_SND_ASAP;
Christopher Fauletbcf242a2019-03-01 11:36:26 +0100487 s->flags |= SF_ASSIGNED;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200488 goto done;
489 }
490
491 /* check whether we have some ACLs set to redirect this request */
492 list_for_each_entry(rule, &px->redirect_rules, list) {
493 if (rule->cond) {
494 int ret;
495
496 ret = acl_exec_cond(rule->cond, px, sess, s, SMP_OPT_DIR_REQ|SMP_OPT_FINAL);
497 ret = acl_pass(ret);
498 if (rule->cond->pol == ACL_COND_UNLESS)
499 ret = !ret;
500 if (!ret)
501 continue;
502 }
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200503 if (!http_apply_redirect_rule(rule, s, txn))
Christopher Fauletb8a53712019-12-16 11:29:38 +0100504 goto return_int_err;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200505 goto done;
506 }
507
508 /* POST requests may be accompanied with an "Expect: 100-Continue" header.
509 * If this happens, then the data will not come immediately, so we must
510 * send all what we have without waiting. Note that due to the small gain
511 * in waiting for the body of the request, it's easier to simply put the
Christopher Faulet5c281d52023-03-16 15:53:28 +0100512 * SC_FL_SND_ASAP flag on the back SC any time. It's a one-shot flag so it
513 * will remove itself once used.
Christopher Faulete0768eb2018-10-03 16:38:02 +0200514 */
Christopher Faulet5c281d52023-03-16 15:53:28 +0100515 s->scb->flags |= SC_FL_SND_ASAP;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200516
517 done: /* done with this analyser, continue with next ones that the calling
518 * points will have set, if any.
519 */
520 req->analyse_exp = TICK_ETERNITY;
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +0500521 done_without_exp: /* done with this analyser, but don't reset the analyse_exp. */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200522 req->analysers &= ~an_bit;
Christopher Fauletd4150ad2021-10-13 15:35:55 +0200523 s->current_rule = s->current_rule_list = NULL;
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100524 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200525 return 1;
526
527 tarpit:
528 /* Allow cookie logging
529 */
530 if (s->be->cookie_name || sess->fe->capture_name)
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200531 http_manage_client_side_cookies(s, req);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200532
533 /* When a connection is tarpitted, we use the tarpit timeout,
534 * which may be the same as the connect timeout if unspecified.
535 * If unset, then set it to zero because we really want it to
536 * eventually expire. We build the tarpit as an analyser.
537 */
Christopher Faulet202c6ce2019-01-07 14:57:35 +0100538 channel_htx_erase(&s->req, htx);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200539
540 /* wipe the request out so that we can drop the connection early
541 * if the client closes first.
542 */
543 channel_dont_connect(req);
544
Christopher Faulete0768eb2018-10-03 16:38:02 +0200545 req->analysers &= AN_REQ_FLT_END; /* remove switching rules etc... */
546 req->analysers |= AN_REQ_HTTP_TARPIT;
547 req->analyse_exp = tick_add_ifset(now_ms, s->be->timeout.tarpit);
548 if (!req->analyse_exp)
549 req->analyse_exp = tick_add(now_ms, 0);
550 stream_inc_http_err_ctr(s);
Willy Tarreau4781b152021-04-06 13:53:36 +0200551 _HA_ATOMIC_INC(&sess->fe->fe_counters.denied_req);
Christopher Fauletcff0f732019-12-16 16:13:44 +0100552 if (s->flags & SF_BE_ASSIGNED)
Willy Tarreau4781b152021-04-06 13:53:36 +0200553 _HA_ATOMIC_INC(&s->be->be_counters.denied_req);
William Lallemand36119de2021-03-08 15:26:48 +0100554 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200555 _HA_ATOMIC_INC(&sess->listener->counters->denied_req);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200556 goto done_without_exp;
557
558 deny: /* this request was blocked (denied) */
559
560 /* Allow cookie logging
561 */
562 if (s->be->cookie_name || sess->fe->capture_name)
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200563 http_manage_client_side_cookies(s, req);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200564
Willy Tarreau69530f52023-04-28 09:16:15 +0200565 s->logs.request_ts = now_ns;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200566 stream_inc_http_err_ctr(s);
Willy Tarreau4781b152021-04-06 13:53:36 +0200567 _HA_ATOMIC_INC(&sess->fe->fe_counters.denied_req);
Christopher Fauletcff0f732019-12-16 16:13:44 +0100568 if (s->flags & SF_BE_ASSIGNED)
Willy Tarreau4781b152021-04-06 13:53:36 +0200569 _HA_ATOMIC_INC(&s->be->be_counters.denied_req);
William Lallemand36119de2021-03-08 15:26:48 +0100570 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200571 _HA_ATOMIC_INC(&sess->listener->counters->denied_req);
Christopher Fauletb8a53712019-12-16 11:29:38 +0100572 goto return_prx_err;
573
Christopher Fauletd649b572022-06-01 17:42:35 +0200574 return_fail_rewrite:
575 if (!(s->flags & SF_ERR_MASK))
576 s->flags |= SF_ERR_PRXCOND;
577 _HA_ATOMIC_INC(&sess->fe->fe_counters.failed_rewrites);
578 if (s->flags & SF_BE_ASSIGNED)
579 _HA_ATOMIC_INC(&s->be->be_counters.failed_rewrites);
580 if (sess->listener && sess->listener->counters)
581 _HA_ATOMIC_INC(&sess->listener->counters->failed_rewrites);
582 if (objt_server(s->target))
583 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_rewrites);
584 /* fall through */
585
Christopher Fauletb8a53712019-12-16 11:29:38 +0100586 return_int_err:
587 txn->status = 500;
588 if (!(s->flags & SF_ERR_MASK))
589 s->flags |= SF_ERR_INTERNAL;
Willy Tarreau4781b152021-04-06 13:53:36 +0200590 _HA_ATOMIC_INC(&sess->fe->fe_counters.internal_errors);
Christopher Fauletcff0f732019-12-16 16:13:44 +0100591 if (s->flags & SF_BE_ASSIGNED)
Willy Tarreau4781b152021-04-06 13:53:36 +0200592 _HA_ATOMIC_INC(&s->be->be_counters.internal_errors);
William Lallemand36119de2021-03-08 15:26:48 +0100593 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200594 _HA_ATOMIC_INC(&sess->listener->counters->internal_errors);
Christopher Fauletb8a53712019-12-16 11:29:38 +0100595 goto return_prx_err;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200596
597 return_bad_req:
Christopher Faulete0768eb2018-10-03 16:38:02 +0200598 txn->status = 400;
Willy Tarreau4781b152021-04-06 13:53:36 +0200599 _HA_ATOMIC_INC(&sess->fe->fe_counters.failed_req);
William Lallemand36119de2021-03-08 15:26:48 +0100600 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200601 _HA_ATOMIC_INC(&sess->listener->counters->failed_req);
Christopher Fauletb8a53712019-12-16 11:29:38 +0100602 /* fall through */
603
604 return_prx_err:
605 http_reply_and_close(s, txn->status, http_error_message(s));
606 /* fall through */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200607
608 return_prx_cond:
Christopher Faulet4a66c942023-01-13 09:43:21 +0100609 http_set_term_flags(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200610
611 req->analysers &= AN_REQ_FLT_END;
612 req->analyse_exp = TICK_ETERNITY;
Christopher Fauletd4150ad2021-10-13 15:35:55 +0200613 s->current_rule = s->current_rule_list = NULL;
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100614 DBG_TRACE_DEVEL("leaving on error",
615 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200616 return 0;
617
618 return_prx_yield:
619 channel_dont_connect(req);
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100620 DBG_TRACE_DEVEL("waiting for more data",
621 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200622 return 0;
623}
624
625/* This function performs all the processing enabled for the current request.
626 * It returns 1 if the processing can continue on next analysers, or zero if it
627 * needs more data, encounters an error, or wants to immediately abort the
628 * request. It relies on buffers flags, and updates s->req.analysers.
629 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200630int http_process_request(struct stream *s, struct channel *req, int an_bit)
Christopher Faulete0768eb2018-10-03 16:38:02 +0200631{
632 struct session *sess = s->sess;
633 struct http_txn *txn = s->txn;
Christopher Fauletd7bdfb12018-10-24 11:14:34 +0200634 struct htx *htx;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200635 struct connection *cli_conn = objt_conn(strm_sess(s)->origin);
636
Christopher Faulet8bebd2f2020-10-06 17:54:56 +0200637 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200638
639 /*
640 * Right now, we know that we have processed the entire headers
641 * and that unwanted requests have been filtered out. We can do
642 * whatever we want with the remaining request. Also, now we
643 * may have separate values for ->fe, ->be.
644 */
Christopher Faulet27ba2dc2018-12-05 11:53:24 +0100645 htx = htxbuf(&req->buf);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200646
647 /*
Christopher Faulete0768eb2018-10-03 16:38:02 +0200648 * 7: Now we can work with the cookies.
649 * Note that doing so might move headers in the request, but
650 * the fields will stay coherent and the URI will not move.
651 * This should only be performed in the backend.
652 */
653 if (s->be->cookie_name || sess->fe->capture_name)
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200654 http_manage_client_side_cookies(s, req);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200655
Tim Duesterhus2825b4b2020-02-28 15:13:34 +0100656 /* 8: Generate unique ID if a "unique-id-format" is defined.
657 *
658 * A unique ID is generated even when it is not sent to ensure that the ID can make use of
659 * fetches only available in the HTTP request processing stage.
660 */
661 if (!LIST_ISEMPTY(&sess->fe->format_unique_id)) {
Tim Duesterhusa17e6622020-03-05 20:19:02 +0100662 struct ist unique_id = stream_generate_unique_id(s, &sess->fe->format_unique_id);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200663
Tim Duesterhusa17e6622020-03-05 20:19:02 +0100664 if (!isttest(unique_id)) {
Christopher Fauletb8a53712019-12-16 11:29:38 +0100665 if (!(s->flags & SF_ERR_MASK))
666 s->flags |= SF_ERR_RESOURCE;
667 goto return_int_err;
668 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200669
Tim Duesterhus2825b4b2020-02-28 15:13:34 +0100670 /* send unique ID if a "unique-id-header" is defined */
Tim Duesterhus0643b0e2020-03-05 17:56:35 +0100671 if (isttest(sess->fe->header_unique_id) &&
Tim Duesterhus7ad27d42022-05-18 00:22:15 +0200672 unlikely(!http_add_header(htx, sess->fe->header_unique_id, unique_id)))
Christopher Fauletd649b572022-06-01 17:42:35 +0200673 goto return_fail_rewrite;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200674 }
675
Aurelien DARRAGONb2e2ec52023-01-09 11:09:03 +0100676 /* handle http extensions (if configured) */
677 if (unlikely(!http_handle_7239_header(s, req)))
678 goto return_fail_rewrite;
679 if (unlikely(!http_handle_xff_header(s, req)))
680 goto return_fail_rewrite;
681 if (unlikely(!http_handle_xot_header(s, req)))
682 goto return_fail_rewrite;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200683
Christopher Fauletc2ac5e42021-03-08 18:20:09 +0100684 /* Filter the request headers if there are filters attached to the
685 * stream.
686 */
687 if (HAS_FILTERS(s))
688 req->analysers |= AN_REQ_FLT_HTTP_HDRS;
689
Christopher Faulete0768eb2018-10-03 16:38:02 +0200690 /* If we have no server assigned yet and we're balancing on url_param
691 * with a POST request, we may be interested in checking the body for
692 * that parameter. This will be done in another analyser.
693 */
694 if (!(s->flags & (SF_ASSIGNED|SF_DIRECT)) &&
Willy Tarreau089eaa02019-01-14 15:17:46 +0100695 s->txn->meth == HTTP_METH_POST &&
696 (s->be->lbprm.algo & BE_LB_ALGO) == BE_LB_ALGO_PH) {
Christopher Faulete0768eb2018-10-03 16:38:02 +0200697 channel_dont_connect(req);
698 req->analysers |= AN_REQ_HTTP_BODY;
699 }
700
701 req->analysers &= ~AN_REQ_FLT_XFER_DATA;
702 req->analysers |= AN_REQ_HTTP_XFER_BODY;
Willy Tarreau1a18b542018-12-11 16:37:42 +0100703
Christopher Faulete0768eb2018-10-03 16:38:02 +0200704 /* We expect some data from the client. Unless we know for sure
705 * we already have a full request, we have to re-enable quick-ack
706 * in case we previously disabled it, otherwise we might cause
707 * the client to delay further data.
708 */
Willy Tarreau9bdcf422023-01-12 19:40:42 +0100709 if ((sess->listener && (sess->listener->bind_conf->options & BC_O_NOQUICKACK)) && !(htx->flags & HTX_FL_EOM))
Willy Tarreau1a18b542018-12-11 16:37:42 +0100710 conn_set_quickack(cli_conn, 1);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200711
712 /*************************************************************
713 * OK, that's finished for the headers. We have done what we *
714 * could. Let's switch to the DATA state. *
715 ************************************************************/
716 req->analyse_exp = TICK_ETERNITY;
717 req->analysers &= ~an_bit;
718
Willy Tarreau69530f52023-04-28 09:16:15 +0200719 s->logs.request_ts = now_ns;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200720 /* OK let's go on with the BODY now */
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100721 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200722 return 1;
723
Christopher Fauletd649b572022-06-01 17:42:35 +0200724 return_fail_rewrite:
725 if (!(s->flags & SF_ERR_MASK))
726 s->flags |= SF_ERR_PRXCOND;
727 _HA_ATOMIC_INC(&sess->fe->fe_counters.failed_rewrites);
728 if (s->flags & SF_BE_ASSIGNED)
729 _HA_ATOMIC_INC(&s->be->be_counters.failed_rewrites);
730 if (sess->listener && sess->listener->counters)
731 _HA_ATOMIC_INC(&sess->listener->counters->failed_rewrites);
732 if (objt_server(s->target))
733 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_rewrites);
734 /* fall through */
735
Christopher Fauletb8a53712019-12-16 11:29:38 +0100736 return_int_err:
737 txn->status = 500;
738 if (!(s->flags & SF_ERR_MASK))
739 s->flags |= SF_ERR_INTERNAL;
Willy Tarreau4781b152021-04-06 13:53:36 +0200740 _HA_ATOMIC_INC(&sess->fe->fe_counters.internal_errors);
Christopher Fauletcff0f732019-12-16 16:13:44 +0100741 if (s->flags & SF_BE_ASSIGNED)
Willy Tarreau4781b152021-04-06 13:53:36 +0200742 _HA_ATOMIC_INC(&s->be->be_counters.internal_errors);
William Lallemand36119de2021-03-08 15:26:48 +0100743 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200744 _HA_ATOMIC_INC(&sess->listener->counters->internal_errors);
Christopher Fauletb8a53712019-12-16 11:29:38 +0100745
Christopher Fauletb8a53712019-12-16 11:29:38 +0100746 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulet4a66c942023-01-13 09:43:21 +0100747 http_set_term_flags(s);
Christopher Fauletb8a53712019-12-16 11:29:38 +0100748
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100749 DBG_TRACE_DEVEL("leaving on error",
750 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200751 return 0;
752}
753
754/* This function is an analyser which processes the HTTP tarpit. It always
755 * returns zero, at the beginning because it prevents any other processing
756 * from occurring, and at the end because it terminates the request.
757 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200758int http_process_tarpit(struct stream *s, struct channel *req, int an_bit)
Christopher Faulete0768eb2018-10-03 16:38:02 +0200759{
760 struct http_txn *txn = s->txn;
761
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100762 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn, &txn->req);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200763 /* This connection is being tarpitted. The CLIENT side has
764 * already set the connect expiration date to the right
765 * timeout. We just have to check that the client is still
766 * there and that the timeout has not expired.
767 */
768 channel_dont_connect(req);
Christopher Fauletca5309a2023-04-17 16:17:32 +0200769 if (!(s->scf->flags & (SC_FL_ABRT_DONE|SC_FL_EOS)) &&
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100770 !tick_is_expired(req->analyse_exp, now_ms)) {
Christopher Fauletb0c87f12021-10-29 14:37:07 +0200771 /* Be sure to drain all data from the request channel */
772 channel_htx_erase(req, htxbuf(&req->buf));
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100773 DBG_TRACE_DEVEL("waiting for tarpit timeout expiry",
774 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200775 return 0;
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100776 }
777
Christopher Faulete0768eb2018-10-03 16:38:02 +0200778
779 /* We will set the queue timer to the time spent, just for
780 * logging purposes. We fake a 500 server error, so that the
781 * attacker will not suspect his connection has been tarpitted.
782 * It will not cause trouble to the logs because we can exclude
783 * the tarpitted connections by filtering on the 'PT' status flags.
784 */
Willy Tarreau69530f52023-04-28 09:16:15 +0200785 s->logs.t_queue = ns_to_ms(now_ns - s->logs.accept_ts);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200786
Christopher Fauletd7bac882023-04-14 12:05:55 +0200787 http_reply_and_close(s, txn->status, (!(s->scf->flags & SC_FL_ERROR) ? http_error_message(s) : NULL));
Christopher Faulet4a66c942023-01-13 09:43:21 +0100788 http_set_term_flags(s);
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100789
790 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200791 return 0;
792}
793
794/* This function is an analyser which waits for the HTTP request body. It waits
795 * for either the buffer to be full, or the full advertised contents to have
796 * reached the buffer. It must only be called after the standard HTTP request
797 * processing has occurred, because it expects the request to be parsed and will
798 * look for the Expect header. It may send a 100-Continue interim response. It
Christopher Faulet2954bcc2023-04-05 10:42:03 +0200799 * returns zero if it needs to read more data, or 1 once it has completed its
800 * analysis.
Christopher Faulete0768eb2018-10-03 16:38:02 +0200801 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200802int http_wait_for_request_body(struct stream *s, struct channel *req, int an_bit)
Christopher Faulete0768eb2018-10-03 16:38:02 +0200803{
804 struct session *sess = s->sess;
805 struct http_txn *txn = s->txn;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200806
Christopher Fauletf4569bb2023-01-13 10:49:31 +0100807 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn, &s->txn->req);
Christopher Fauletf76ebe82018-10-24 11:16:22 +0200808
Christopher Fauletf76ebe82018-10-24 11:16:22 +0200809
Christopher Faulet021a8e42021-03-29 10:46:38 +0200810 switch (http_wait_for_msg_body(s, req, s->be->timeout.httpreq, 0)) {
811 case HTTP_RULE_RES_CONT:
812 goto http_end;
813 case HTTP_RULE_RES_YIELD:
814 goto missing_data_or_waiting;
815 case HTTP_RULE_RES_BADREQ:
Willy Tarreau4236f032019-03-05 10:43:32 +0100816 goto return_bad_req;
Christopher Faulet021a8e42021-03-29 10:46:38 +0200817 case HTTP_RULE_RES_ERROR:
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200818 goto return_int_err;
Christopher Faulet021a8e42021-03-29 10:46:38 +0200819 case HTTP_RULE_RES_ABRT:
Christopher Fauletb8a53712019-12-16 11:29:38 +0100820 goto return_prx_cond;
Christopher Faulet021a8e42021-03-29 10:46:38 +0200821 default:
822 goto return_int_err;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200823 }
824
825 http_end:
826 /* The situation will not evolve, so let's give up on the analysis. */
Willy Tarreau69530f52023-04-28 09:16:15 +0200827 s->logs.request_ts = now_ns; /* update the request timer to reflect full request */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200828 req->analysers &= ~an_bit;
829 req->analyse_exp = TICK_ETERNITY;
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100830 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200831 return 1;
832
Christopher Faulet021a8e42021-03-29 10:46:38 +0200833 missing_data_or_waiting:
834 channel_dont_connect(req);
835 DBG_TRACE_DEVEL("waiting for more data",
836 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
837 return 0;
838
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200839 return_int_err:
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200840 txn->status = 500;
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200841 if (!(s->flags & SF_ERR_MASK))
842 s->flags |= SF_ERR_INTERNAL;
Willy Tarreau4781b152021-04-06 13:53:36 +0200843 _HA_ATOMIC_INC(&sess->fe->fe_counters.internal_errors);
Christopher Fauletcff0f732019-12-16 16:13:44 +0100844 if (s->flags & SF_BE_ASSIGNED)
Willy Tarreau4781b152021-04-06 13:53:36 +0200845 _HA_ATOMIC_INC(&s->be->be_counters.internal_errors);
William Lallemand36119de2021-03-08 15:26:48 +0100846 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200847 _HA_ATOMIC_INC(&sess->listener->counters->internal_errors);
Christopher Faulet021a8e42021-03-29 10:46:38 +0200848 goto return_prx_err;
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200849
Christopher Faulete0768eb2018-10-03 16:38:02 +0200850 return_bad_req: /* let's centralize all bad requests */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200851 txn->status = 400;
Willy Tarreau4781b152021-04-06 13:53:36 +0200852 _HA_ATOMIC_INC(&sess->fe->fe_counters.failed_req);
William Lallemand36119de2021-03-08 15:26:48 +0100853 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +0200854 _HA_ATOMIC_INC(&sess->listener->counters->failed_req);
Christopher Fauletb8a53712019-12-16 11:29:38 +0100855 /* fall through */
856
Christopher Faulet021a8e42021-03-29 10:46:38 +0200857 return_prx_err:
Christopher Fauletb8a53712019-12-16 11:29:38 +0100858 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulet021a8e42021-03-29 10:46:38 +0200859 /* fall through */
Christopher Faulete0768eb2018-10-03 16:38:02 +0200860
Christopher Faulet021a8e42021-03-29 10:46:38 +0200861 return_prx_cond:
Christopher Fauletf0d80df2023-01-13 10:20:20 +0100862 http_set_term_flags(s);
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200863
Christopher Faulete0768eb2018-10-03 16:38:02 +0200864 req->analysers &= AN_REQ_FLT_END;
Christopher Fauletb8a53712019-12-16 11:29:38 +0100865 req->analyse_exp = TICK_ETERNITY;
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100866 DBG_TRACE_DEVEL("leaving on error",
867 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200868 return 0;
869}
870
871/* This function is an analyser which forwards request body (including chunk
872 * sizes if any). It is called as soon as we must forward, even if we forward
873 * zero byte. The only situation where it must not be called is when we're in
874 * tunnel mode and we want to forward till the close. It's used both to forward
875 * remaining data and to resync after end of body. It expects the msg_state to
876 * be between MSG_BODY and MSG_DONE (inclusive). It returns zero if it needs to
877 * read more data, or 1 once we can go on with next request or end the stream.
878 * When in MSG_DATA or MSG_TRAILERS, it will automatically forward chunk_len
879 * bytes of pending data + the headers if not already done.
880 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200881int http_request_forward_body(struct stream *s, struct channel *req, int an_bit)
Christopher Faulete0768eb2018-10-03 16:38:02 +0200882{
883 struct session *sess = s->sess;
884 struct http_txn *txn = s->txn;
Christopher Faulet9768c262018-10-22 09:34:31 +0200885 struct http_msg *msg = &txn->req;
886 struct htx *htx;
Christopher Faulet93e02d82019-03-08 14:18:50 +0100887 short status = 0;
Christopher Fauletaed82cf2018-11-30 22:22:32 +0100888 int ret;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200889
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100890 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn, msg);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200891
Christopher Faulet27ba2dc2018-12-05 11:53:24 +0100892 htx = htxbuf(&req->buf);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200893
Christopher Fauletb9a92f32019-09-09 10:15:21 +0200894 if (htx->flags & HTX_FL_PARSING_ERROR)
895 goto return_bad_req;
896 if (htx->flags & HTX_FL_PROCESSING_ERROR)
897 goto return_int_err;
898
Christopher Faulete0768eb2018-10-03 16:38:02 +0200899 /* Note that we don't have to send 100-continue back because we don't
900 * need the data to complete our job, and it's up to the server to
901 * decide whether to return 100, 417 or anything else in return of
902 * an "Expect: 100-continue" header.
903 */
Christopher Faulet9768c262018-10-22 09:34:31 +0200904 if (msg->msg_state == HTTP_MSG_BODY)
905 msg->msg_state = HTTP_MSG_DATA;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200906
Christopher Faulete0768eb2018-10-03 16:38:02 +0200907 /* in most states, we should abort in case of early close */
908 channel_auto_close(req);
909
910 if (req->to_forward) {
Christopher Faulet66af0b22019-03-22 14:54:52 +0100911 if (req->to_forward == CHN_INFINITE_FORWARD) {
Christopher Faulet904763f2023-03-22 14:53:11 +0100912 if (s->scf->flags & SC_FL_EOI)
Christopher Faulet1a3e0272019-11-15 16:31:46 +0100913 msg->msg_state = HTTP_MSG_ENDING;
Christopher Faulet66af0b22019-03-22 14:54:52 +0100914 }
915 else {
916 /* We can't process the buffer's contents yet */
917 req->flags |= CF_WAKE_WRITE;
918 goto missing_data_or_waiting;
919 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200920 }
921
Christopher Faulet1a3e0272019-11-15 16:31:46 +0100922 if (msg->msg_state >= HTTP_MSG_ENDING)
923 goto ending;
924
925 if (txn->meth == HTTP_METH_CONNECT) {
926 msg->msg_state = HTTP_MSG_ENDING;
927 goto ending;
928 }
929
Christopher Fauletaed82cf2018-11-30 22:22:32 +0100930 /* Forward input data. We get it by removing all outgoing data not
931 * forwarded yet from HTX data size. If there are some data filters, we
932 * let them decide the amount of data to forward.
Christopher Faulet9768c262018-10-22 09:34:31 +0200933 */
Christopher Fauletaed82cf2018-11-30 22:22:32 +0100934 if (HAS_REQ_DATA_FILTERS(s)) {
935 ret = flt_http_payload(s, msg, htx->data);
936 if (ret < 0)
937 goto return_bad_req;
Christopher Faulet421e7692019-06-13 11:16:45 +0200938 c_adv(req, ret);
Christopher Fauletaed82cf2018-11-30 22:22:32 +0100939 }
940 else {
Christopher Faulet421e7692019-06-13 11:16:45 +0200941 c_adv(req, htx->data - co_data(req));
Christopher Faulet2f7c82b2023-02-20 14:06:52 +0100942 if ((global.tune.options & GTUNE_USE_FAST_FWD) && (msg->flags & HTTP_MSGF_XFER_LEN))
Christopher Faulet66af0b22019-03-22 14:54:52 +0100943 channel_htx_forward_forever(req, htx);
Christopher Fauletaed82cf2018-11-30 22:22:32 +0100944 }
Christopher Faulete0768eb2018-10-03 16:38:02 +0200945
Christopher Faulet1a3e0272019-11-15 16:31:46 +0100946 if (htx->data != co_data(req))
947 goto missing_data_or_waiting;
Christopher Fauletd20fdb02019-06-13 16:43:22 +0200948
Christopher Faulet9768c262018-10-22 09:34:31 +0200949 /* Check if the end-of-message is reached and if so, switch the message
Christopher Fauletd20fdb02019-06-13 16:43:22 +0200950 * in HTTP_MSG_ENDING state. Then if all data was marked to be
951 * forwarded, set the state to HTTP_MSG_DONE.
Christopher Faulet9768c262018-10-22 09:34:31 +0200952 */
Christopher Fauletd1ac2b92020-12-02 19:12:22 +0100953 if (!(htx->flags & HTX_FL_EOM))
Christopher Faulet9768c262018-10-22 09:34:31 +0200954 goto missing_data_or_waiting;
955
Christopher Fauletd20fdb02019-06-13 16:43:22 +0200956 msg->msg_state = HTTP_MSG_ENDING;
Christopher Faulet9768c262018-10-22 09:34:31 +0200957
Christopher Faulet1a3e0272019-11-15 16:31:46 +0100958 ending:
Christopher Faulet84d3ef92023-03-17 15:45:58 +0100959 s->scb->flags &= ~SC_FL_SND_EXP_MORE; /* no more data are expected to be send */
Christopher Faulet2151cdd2020-07-22 16:34:59 +0200960
Christopher Faulet1a3e0272019-11-15 16:31:46 +0100961 /* other states, ENDING...TUNNEL */
962 if (msg->msg_state >= HTTP_MSG_DONE)
963 goto done;
Christopher Faulete0768eb2018-10-03 16:38:02 +0200964
Christopher Fauletaed82cf2018-11-30 22:22:32 +0100965 if (HAS_REQ_DATA_FILTERS(s)) {
966 ret = flt_http_end(s, msg);
967 if (ret <= 0) {
968 if (!ret)
969 goto missing_data_or_waiting;
970 goto return_bad_req;
971 }
972 }
973
Christopher Faulet1a3e0272019-11-15 16:31:46 +0100974 if (txn->meth == HTTP_METH_CONNECT)
975 msg->msg_state = HTTP_MSG_TUNNEL;
976 else {
977 msg->msg_state = HTTP_MSG_DONE;
978 req->to_forward = 0;
979 }
980
981 done:
982 /* we don't want to forward closes on DONE except in tunnel mode. */
983 if (!(txn->flags & TX_CON_WANT_TUN))
984 channel_dont_close(req);
985
Christopher Faulet64350bb2023-04-13 16:37:37 +0200986 if ((s->scb->flags & SC_FL_SHUT_DONE) && co_data(req)) {
Christopher Fauletf2b02cf2023-01-13 11:02:28 +0100987 /* request errors are most likely due to the server aborting the
Christopher Fauletbea90bb2023-09-14 11:12:32 +0200988 * transfer. But handle server aborts only if there is no
989 * response. Otherwise, leave a chance to forward the response
990 * first.
991 */
992 if (htx_is_empty(htxbuf(&s->res.buf)))
993 goto return_srv_abort;
Christopher Fauletf2b02cf2023-01-13 11:02:28 +0100994 }
995
Christopher Fauletfc9cfe42019-07-16 14:54:53 +0200996 http_end_request(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200997 if (!(req->analysers & an_bit)) {
Christopher Fauleteea8fc72019-11-05 16:18:10 +0100998 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +0200999 return 1;
1000 }
1001
1002 /* If "option abortonclose" is set on the backend, we want to monitor
1003 * the client's connection and forward any shutdown notification to the
1004 * server, which will decide whether to close or to go on processing the
1005 * request. We only do that in tunnel mode, and not in other modes since
1006 * it can be abused to exhaust source ports. */
Christopher Faulet769d0e92019-03-22 14:23:18 +01001007 if (s->be->options & PR_O_ABRT_CLOSE) {
Christopher Faulete0768eb2018-10-03 16:38:02 +02001008 channel_auto_read(req);
Christopher Fauletca5309a2023-04-17 16:17:32 +02001009 if ((s->scf->flags & (SC_FL_ABRT_DONE|SC_FL_EOS)) && !(txn->flags & TX_CON_WANT_TUN))
Willy Tarreaucb041662022-05-17 19:44:42 +02001010 s->scb->flags |= SC_FL_NOLINGER;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001011 channel_auto_close(req);
1012 }
1013 else if (s->txn->meth == HTTP_METH_POST) {
1014 /* POST requests may require to read extra CRLF sent by broken
1015 * browsers and which could cause an RST to be sent upon close
1016 * on some systems (eg: Linux). */
1017 channel_auto_read(req);
1018 }
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001019 DBG_TRACE_DEVEL("waiting for the end of the HTTP txn",
1020 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001021 return 0;
1022
1023 missing_data_or_waiting:
1024 /* stop waiting for data if the input is closed before the end */
Christopher Fauletca5309a2023-04-17 16:17:32 +02001025 if (msg->msg_state < HTTP_MSG_ENDING && (s->scf->flags & (SC_FL_ABRT_DONE|SC_FL_EOS)))
Christopher Faulet93e02d82019-03-08 14:18:50 +01001026 goto return_cli_abort;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001027
1028 waiting:
1029 /* waiting for the last bits to leave the buffer */
Christopher Fauletbea90bb2023-09-14 11:12:32 +02001030 if (s->scb->flags & SC_FL_SHUT_DONE) {
1031 /* Handle server aborts only if there is no response. Otherwise,
1032 * leave a chance to forward the response first.
1033 */
1034 if (htx_is_empty(htxbuf(&s->res.buf)))
1035 goto return_srv_abort;
1036 }
Christopher Faulete0768eb2018-10-03 16:38:02 +02001037
1038 /* When TE: chunked is used, we need to get there again to parse remaining
1039 * chunks even if the client has closed, so we don't want to set CF_DONTCLOSE.
1040 * And when content-length is used, we never want to let the possible
1041 * shutdown be forwarded to the other side, as the state machine will
1042 * take care of it once the client responds. It's also important to
1043 * prevent TIME_WAITs from accumulating on the backend side, and for
1044 * HTTP/2 where the last frame comes with a shutdown.
1045 */
Christopher Faulet9768c262018-10-22 09:34:31 +02001046 if (msg->flags & HTTP_MSGF_XFER_LEN)
Christopher Faulete0768eb2018-10-03 16:38:02 +02001047 channel_dont_close(req);
1048
1049 /* We know that more data are expected, but we couldn't send more than
Christopher Faulet84d3ef92023-03-17 15:45:58 +01001050 * what we did. So we always set the SC_FL_SND_EXP_MORE flag so that the
Christopher Faulete0768eb2018-10-03 16:38:02 +02001051 * system knows it must not set a PUSH on this first part. Interactive
1052 * modes are already handled by the stream sock layer. We must not do
1053 * this in content-length mode because it could present the MSG_MORE
1054 * flag with the last block of forwarded data, which would cause an
1055 * additional delay to be observed by the receiver.
1056 */
Christopher Faulet2151cdd2020-07-22 16:34:59 +02001057 if (HAS_REQ_DATA_FILTERS(s))
Christopher Faulet84d3ef92023-03-17 15:45:58 +01001058 s->scb->flags |= SC_FL_SND_EXP_MORE;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001059
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001060 DBG_TRACE_DEVEL("waiting for more data to forward",
1061 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001062 return 0;
1063
Christopher Faulet93e02d82019-03-08 14:18:50 +01001064 return_cli_abort:
Willy Tarreau4781b152021-04-06 13:53:36 +02001065 _HA_ATOMIC_INC(&sess->fe->fe_counters.cli_aborts);
1066 _HA_ATOMIC_INC(&s->be->be_counters.cli_aborts);
William Lallemand36119de2021-03-08 15:26:48 +01001067 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02001068 _HA_ATOMIC_INC(&sess->listener->counters->cli_aborts);
Christopher Faulet93e02d82019-03-08 14:18:50 +01001069 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02001070 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.cli_aborts);
Christopher Faulet93e02d82019-03-08 14:18:50 +01001071 if (!(s->flags & SF_ERR_MASK))
Christopher Fauletf2b02cf2023-01-13 11:02:28 +01001072 s->flags |= ((req->flags & CF_READ_TIMEOUT) ? SF_ERR_CLITO : SF_ERR_CLICL);
Christopher Faulet93e02d82019-03-08 14:18:50 +01001073 status = 400;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001074 goto return_prx_cond;
Christopher Faulet93e02d82019-03-08 14:18:50 +01001075
1076 return_srv_abort:
Willy Tarreau4781b152021-04-06 13:53:36 +02001077 _HA_ATOMIC_INC(&sess->fe->fe_counters.srv_aborts);
1078 _HA_ATOMIC_INC(&s->be->be_counters.srv_aborts);
William Lallemand36119de2021-03-08 15:26:48 +01001079 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02001080 _HA_ATOMIC_INC(&sess->listener->counters->srv_aborts);
Christopher Faulet93e02d82019-03-08 14:18:50 +01001081 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02001082 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.srv_aborts);
Christopher Faulet93e02d82019-03-08 14:18:50 +01001083 if (!(s->flags & SF_ERR_MASK))
Christopher Fauletf2b02cf2023-01-13 11:02:28 +01001084 s->flags |= ((req->flags & CF_WRITE_TIMEOUT) ? SF_ERR_SRVTO : SF_ERR_SRVCL);
Christopher Faulet93e02d82019-03-08 14:18:50 +01001085 status = 502;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001086 goto return_prx_cond;
Christopher Faulet93e02d82019-03-08 14:18:50 +01001087
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001088 return_int_err:
1089 if (!(s->flags & SF_ERR_MASK))
1090 s->flags |= SF_ERR_INTERNAL;
Willy Tarreau4781b152021-04-06 13:53:36 +02001091 _HA_ATOMIC_INC(&sess->fe->fe_counters.internal_errors);
1092 _HA_ATOMIC_INC(&s->be->be_counters.internal_errors);
William Lallemand36119de2021-03-08 15:26:48 +01001093 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02001094 _HA_ATOMIC_INC(&sess->listener->counters->internal_errors);
Christopher Fauletcff0f732019-12-16 16:13:44 +01001095 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02001096 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.internal_errors);
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001097 status = 500;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001098 goto return_prx_cond;
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001099
Christopher Faulet93e02d82019-03-08 14:18:50 +01001100 return_bad_req:
Willy Tarreau4781b152021-04-06 13:53:36 +02001101 _HA_ATOMIC_INC(&sess->fe->fe_counters.failed_req);
William Lallemand36119de2021-03-08 15:26:48 +01001102 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02001103 _HA_ATOMIC_INC(&sess->listener->counters->failed_req);
Christopher Faulet93e02d82019-03-08 14:18:50 +01001104 status = 400;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001105 /* fall through */
Christopher Faulete0768eb2018-10-03 16:38:02 +02001106
Christopher Fauletb8a53712019-12-16 11:29:38 +01001107 return_prx_cond:
Christopher Faulet9768c262018-10-22 09:34:31 +02001108 if (txn->status > 0) {
Christopher Faulete0768eb2018-10-03 16:38:02 +02001109 /* Note: we don't send any error if some data were already sent */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001110 http_reply_and_close(s, txn->status, NULL);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001111 } else {
Christopher Faulet93e02d82019-03-08 14:18:50 +01001112 txn->status = status;
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001113 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulete0768eb2018-10-03 16:38:02 +02001114 }
Christopher Fauletf2b02cf2023-01-13 11:02:28 +01001115 http_set_term_flags(s);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001116 DBG_TRACE_DEVEL("leaving on error ",
1117 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001118 return 0;
1119}
1120
Willy Tarreau4596fe22022-05-17 19:07:51 +02001121/* Reset the stream and the backend stream connector to a situation suitable for attemption connection */
Olivier Houcharda254a372019-04-05 15:30:12 +02001122/* Returns 0 if we can attempt to retry, -1 otherwise */
Willy Tarreaub49672d2022-05-27 10:13:37 +02001123static __inline int do_l7_retry(struct stream *s, struct stconn *sc)
Olivier Houcharda254a372019-04-05 15:30:12 +02001124{
Christopher Faulet9f5382e2021-05-21 13:46:14 +02001125 struct channel *req, *res;
1126 int co_data;
Olivier Houcharda254a372019-04-05 15:30:12 +02001127
Christopher Faulet731c8e62022-03-29 16:08:44 +02001128 if (s->conn_retries >= s->be->conn_retries)
Christopher Faulet552601d2021-05-26 10:31:06 +02001129 return -1;
Christopher Faulet41ade742023-03-01 15:45:39 +01001130 s->conn_retries++;
Christopher Faulete763c8c2021-05-05 18:23:59 +02001131 if (objt_server(s->target)) {
1132 if (s->flags & SF_CURR_SESS) {
1133 s->flags &= ~SF_CURR_SESS;
1134 _HA_ATOMIC_DEC(&__objt_server(s->target)->cur_sess);
1135 }
Willy Tarreau4781b152021-04-06 13:53:36 +02001136 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.retries);
Christopher Faulete763c8c2021-05-05 18:23:59 +02001137 }
Willy Tarreau4781b152021-04-06 13:53:36 +02001138 _HA_ATOMIC_INC(&s->be->be_counters.retries);
Willy Tarreau223995e2019-05-04 10:38:31 +02001139
Christopher Faulet9f5382e2021-05-21 13:46:14 +02001140 req = &s->req;
1141 res = &s->res;
Christopher Faulet87633c32023-04-03 18:32:50 +02001142
Olivier Houcharda254a372019-04-05 15:30:12 +02001143 /* Remove any write error from the request, and read error from the response */
Christopher Fauletca5309a2023-04-17 16:17:32 +02001144 s->scf->flags &= ~(SC_FL_EOS|SC_FL_ABRT_DONE|SC_FL_ABRT_WANTED);
Christopher Faulet87633c32023-04-03 18:32:50 +02001145 req->flags &= ~CF_WRITE_TIMEOUT;
1146 res->flags &= ~(CF_READ_TIMEOUT | CF_READ_EVENT);
Christopher Faulet7bf46bb2022-01-04 10:56:03 +01001147 res->analysers &= AN_RES_FLT_END;
Christopher Faulet50264b42022-03-30 19:39:30 +02001148 s->conn_err_type = STRM_ET_NONE;
Christopher Fauletae024ce2022-03-29 19:02:31 +02001149 s->flags &= ~(SF_CONN_EXP | SF_ERR_MASK | SF_FINST_MASK);
1150 s->conn_exp = TICK_ETERNITY;
Olivier Houchard4bd58672019-07-12 16:16:59 +02001151 stream_choose_redispatch(s);
Olivier Houcharda254a372019-04-05 15:30:12 +02001152 res->to_forward = 0;
1153 res->analyse_exp = TICK_ETERNITY;
1154 res->total = 0;
Christopher Faulet9ec2f4d2022-03-23 15:15:29 +01001155
Christopher Fauleta1d14a72023-04-14 10:42:08 +02001156 s->scb->flags &= ~(SC_FL_ERROR|SC_FL_SHUT_DONE|SC_FL_SHUT_WANTED);
Willy Tarreau19c65a92022-05-27 08:49:24 +02001157 if (sc_reset_endp(s->scb) < 0) {
Christopher Faulet9ec2f4d2022-03-23 15:15:29 +01001158 if (!(s->flags & SF_ERR_MASK))
1159 s->flags |= SF_ERR_INTERNAL;
1160 return -1;
1161 }
Olivier Houcharda254a372019-04-05 15:30:12 +02001162
Christopher Faulet9f5382e2021-05-21 13:46:14 +02001163 b_free(&req->buf);
1164 /* Swap the L7 buffer with the channel buffer */
1165 /* We know we stored the co_data as b_data, so get it there */
Christopher Faulete05bf9e2022-03-29 15:23:40 +02001166 co_data = b_data(&s->txn->l7_buffer);
1167 b_set_data(&s->txn->l7_buffer, b_size(&s->txn->l7_buffer));
1168 b_xfer(&req->buf, &s->txn->l7_buffer, b_data(&s->txn->l7_buffer));
Christopher Faulet9f5382e2021-05-21 13:46:14 +02001169 co_set_data(req, co_data);
Christopher Faulet5b82cc52020-10-12 15:18:50 +02001170
Ilya Shipitsinacf84592021-02-06 22:29:08 +05001171 DBG_TRACE_DEVEL("perform a L7 retry", STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, s->txn);
Christopher Faulet9f5382e2021-05-21 13:46:14 +02001172
Olivier Houcharda254a372019-04-05 15:30:12 +02001173 b_reset(&res->buf);
1174 co_set_data(res, 0);
1175 return 0;
1176}
1177
/* This stream analyser waits for a complete HTTP response. It returns 1 if the
 * processing can continue on next analysers, or zero if it either needs more
 * data or wants to immediately abort the response (eg: timeout, error, ...). It
 * is tied to AN_RES_WAIT_HTTP and may remove itself from s->res.analysers
 * when it has nothing left to do, and may remove any analyser when it wants to
 * abort.
 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001185int http_wait_for_response(struct stream *s, struct channel *rep, int an_bit)
Christopher Faulete0768eb2018-10-03 16:38:02 +02001186{
Christopher Faulet9768c262018-10-22 09:34:31 +02001187 /*
1188 * We will analyze a complete HTTP response to check the its syntax.
1189 *
1190 * Once the start line and all headers are received, we may perform a
1191 * capture of the error (if any), and we will set a few fields. We also
1192 * logging and finally headers capture.
1193 */
Christopher Faulete0768eb2018-10-03 16:38:02 +02001194 struct session *sess = s->sess;
1195 struct http_txn *txn = s->txn;
1196 struct http_msg *msg = &txn->rsp;
Christopher Faulet9768c262018-10-22 09:34:31 +02001197 struct htx *htx;
Christopher Faulet61608322018-11-23 16:23:45 +01001198 struct connection *srv_conn;
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01001199 struct htx_sl *sl;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001200 int n;
1201
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001202 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn, msg);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001203
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01001204 htx = htxbuf(&rep->buf);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001205
Willy Tarreau4236f032019-03-05 10:43:32 +01001206 /* Parsing errors are caught here */
1207 if (htx->flags & HTX_FL_PARSING_ERROR)
1208 goto return_bad_res;
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001209 if (htx->flags & HTX_FL_PROCESSING_ERROR)
1210 goto return_int_err;
Willy Tarreau4236f032019-03-05 10:43:32 +01001211
Christopher Faulete0768eb2018-10-03 16:38:02 +02001212 /*
1213 * Now we quickly check if we have found a full valid response.
1214 * If not so, we check the FD and buffer states before leaving.
1215 * A full response is indicated by the fact that we have seen
1216 * the double LF/CRLF, so the state is >= HTTP_MSG_BODY. Invalid
1217 * responses are checked first.
1218 *
1219 * Depending on whether the client is still there or not, we
1220 * may send an error response back or not. Note that normally
1221 * we should only check for HTTP status there, and check I/O
1222 * errors somewhere else.
1223 */
Christopher Fauletb75b5ea2019-05-17 08:37:28 +02001224 next_one:
Christopher Faulet29f17582019-05-23 11:03:26 +02001225 if (unlikely(htx_is_empty(htx) || htx->first == -1)) {
Christopher Faulet9768c262018-10-22 09:34:31 +02001226 /* 1: have we encountered a read error ? */
Christopher Fauletd7bac882023-04-14 12:05:55 +02001227 if (s->scb->flags & SC_FL_ERROR) {
Willy Tarreaufd9417b2022-05-18 16:23:22 +02001228 struct connection *conn = sc_conn(s->scb);
Olivier Houchard865d8392019-05-03 22:46:27 +02001229
Christopher Faulet6f78ac52023-03-01 15:47:18 +01001230
1231 if ((txn->flags & TX_L7_RETRY) &&
1232 (s->be->retry_type & PR_RE_DISCONNECTED) &&
1233 (!conn || conn->err_code != CO_ER_SSL_EARLY_FAILED)) {
1234 if (co_data(rep) || do_l7_retry(s, s->scb) == 0)
1235 return 0;
1236 }
1237
1238 /* Perform a L7 retry on empty response or because server refuses the early data. */
Christopher Faulete05bf9e2022-03-29 15:23:40 +02001239 if ((txn->flags & TX_L7_RETRY) &&
Christopher Fauletd9769232021-05-26 12:15:37 +02001240 (s->be->retry_type & PR_RE_EARLY_ERROR) &&
1241 conn && conn->err_code == CO_ER_SSL_EARLY_FAILED &&
Willy Tarreau7cb9e6c2022-05-17 19:40:40 +02001242 do_l7_retry(s, s->scb) == 0) {
Christopher Fauletd9769232021-05-26 12:15:37 +02001243 DBG_TRACE_DEVEL("leaving on L7 retry",
1244 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
1245 return 0;
1246 }
1247
Christopher Fauletca023882024-04-09 08:19:01 +02001248 if (s->flags & SF_SRV_REUSED)
Olivier Houchard6db16992019-05-17 15:40:49 +02001249 goto abort_keep_alive;
1250
Willy Tarreau4781b152021-04-06 13:53:36 +02001251 _HA_ATOMIC_INC(&s->be->be_counters.failed_resp);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001252 if (objt_server(s->target)) {
Willy Tarreau4781b152021-04-06 13:53:36 +02001253 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_resp);
Willy Tarreaub54c40a2018-12-02 19:28:41 +01001254 health_adjust(__objt_server(s->target), HANA_STATUS_HTTP_READ_ERROR);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001255 }
1256
Christopher Fauletd9769232021-05-26 12:15:37 +02001257 /* if the server refused the early data, just send a 425 */
1258 if (conn && conn->err_code == CO_ER_SSL_EARLY_FAILED)
Olivier Houchard865d8392019-05-03 22:46:27 +02001259 txn->status = 425;
Christopher Fauletd9769232021-05-26 12:15:37 +02001260 else {
1261 txn->status = 502;
Willy Tarreau826f3ab2021-02-10 12:07:15 +01001262 stream_inc_http_fail_ctr(s);
Christopher Fauletd9769232021-05-26 12:15:37 +02001263 }
Christopher Faulete0768eb2018-10-03 16:38:02 +02001264
Willy Tarreaucb041662022-05-17 19:44:42 +02001265 s->scb->flags |= SC_FL_NOLINGER;
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001266 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulete0768eb2018-10-03 16:38:02 +02001267
1268 if (!(s->flags & SF_ERR_MASK))
1269 s->flags |= SF_ERR_SRVCL;
Christopher Faulet4a66c942023-01-13 09:43:21 +01001270 http_set_term_flags(s);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001271 DBG_TRACE_DEVEL("leaving on error",
1272 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001273 return 0;
1274 }
1275
Christopher Faulet9768c262018-10-22 09:34:31 +02001276 /* 2: read timeout : return a 504 to the client. */
Christopher Faulete0768eb2018-10-03 16:38:02 +02001277 else if (rep->flags & CF_READ_TIMEOUT) {
Christopher Faulete05bf9e2022-03-29 15:23:40 +02001278 if ((txn->flags & TX_L7_RETRY) &&
Olivier Houcharda254a372019-04-05 15:30:12 +02001279 (s->be->retry_type & PR_RE_TIMEOUT)) {
Willy Tarreau7cb9e6c2022-05-17 19:40:40 +02001280 if (co_data(rep) || do_l7_retry(s, s->scb) == 0) {
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001281 DBG_TRACE_DEVEL("leaving on L7 retry",
1282 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Olivier Houcharda254a372019-04-05 15:30:12 +02001283 return 0;
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001284 }
Olivier Houcharda254a372019-04-05 15:30:12 +02001285 }
Willy Tarreau4781b152021-04-06 13:53:36 +02001286 _HA_ATOMIC_INC(&s->be->be_counters.failed_resp);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001287 if (objt_server(s->target)) {
Willy Tarreau4781b152021-04-06 13:53:36 +02001288 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_resp);
Willy Tarreaub54c40a2018-12-02 19:28:41 +01001289 health_adjust(__objt_server(s->target), HANA_STATUS_HTTP_READ_TIMEOUT);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001290 }
1291
Christopher Faulete0768eb2018-10-03 16:38:02 +02001292 txn->status = 504;
Willy Tarreau826f3ab2021-02-10 12:07:15 +01001293 stream_inc_http_fail_ctr(s);
Willy Tarreaucb041662022-05-17 19:44:42 +02001294 s->scb->flags |= SC_FL_NOLINGER;
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001295 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulete0768eb2018-10-03 16:38:02 +02001296
1297 if (!(s->flags & SF_ERR_MASK))
1298 s->flags |= SF_ERR_SRVTO;
Christopher Faulet4a66c942023-01-13 09:43:21 +01001299 http_set_term_flags(s);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001300 DBG_TRACE_DEVEL("leaving on error",
1301 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001302 return 0;
1303 }
1304
Christopher Faulet9768c262018-10-22 09:34:31 +02001305 /* 3: client abort with an abortonclose */
Christopher Fauletca5309a2023-04-17 16:17:32 +02001306 else if ((s->scb->flags & (SC_FL_EOS|SC_FL_ABRT_DONE)) && (s->scb->flags & SC_FL_SHUT_DONE) &&
1307 (s->scf->flags & (SC_FL_EOS|SC_FL_ABRT_DONE))) {
Willy Tarreau4781b152021-04-06 13:53:36 +02001308 _HA_ATOMIC_INC(&sess->fe->fe_counters.cli_aborts);
1309 _HA_ATOMIC_INC(&s->be->be_counters.cli_aborts);
William Lallemand36119de2021-03-08 15:26:48 +01001310 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02001311 _HA_ATOMIC_INC(&sess->listener->counters->cli_aborts);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001312 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02001313 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.cli_aborts);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001314
Christopher Faulete0768eb2018-10-03 16:38:02 +02001315 txn->status = 400;
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001316 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulete0768eb2018-10-03 16:38:02 +02001317
1318 if (!(s->flags & SF_ERR_MASK))
1319 s->flags |= SF_ERR_CLICL;
Christopher Faulet4a66c942023-01-13 09:43:21 +01001320 http_set_term_flags(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001321
1322 /* process_stream() will take care of the error */
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001323 DBG_TRACE_DEVEL("leaving on error",
1324 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001325 return 0;
1326 }
1327
Christopher Faulet9768c262018-10-22 09:34:31 +02001328 /* 4: close from server, capture the response if the server has started to respond */
Christopher Fauletca5309a2023-04-17 16:17:32 +02001329 else if (s->scb->flags & (SC_FL_EOS|SC_FL_ABRT_DONE)) {
Christopher Faulete05bf9e2022-03-29 15:23:40 +02001330 if ((txn->flags & TX_L7_RETRY) &&
Olivier Houcharda254a372019-04-05 15:30:12 +02001331 (s->be->retry_type & PR_RE_DISCONNECTED)) {
Willy Tarreau7cb9e6c2022-05-17 19:40:40 +02001332 if (co_data(rep) || do_l7_retry(s, s->scb) == 0) {
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001333 DBG_TRACE_DEVEL("leaving on L7 retry",
1334 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Olivier Houcharda254a372019-04-05 15:30:12 +02001335 return 0;
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001336 }
Olivier Houcharda254a372019-04-05 15:30:12 +02001337 }
1338
Christopher Fauletca023882024-04-09 08:19:01 +02001339 if (s->flags & SF_SRV_REUSED)
Olivier Houchard6db16992019-05-17 15:40:49 +02001340 goto abort_keep_alive;
1341
Willy Tarreau4781b152021-04-06 13:53:36 +02001342 _HA_ATOMIC_INC(&s->be->be_counters.failed_resp);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001343 if (objt_server(s->target)) {
Willy Tarreau4781b152021-04-06 13:53:36 +02001344 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_resp);
Willy Tarreaub54c40a2018-12-02 19:28:41 +01001345 health_adjust(__objt_server(s->target), HANA_STATUS_HTTP_BROKEN_PIPE);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001346 }
1347
Christopher Faulete0768eb2018-10-03 16:38:02 +02001348 txn->status = 502;
Willy Tarreau826f3ab2021-02-10 12:07:15 +01001349 stream_inc_http_fail_ctr(s);
Willy Tarreaucb041662022-05-17 19:44:42 +02001350 s->scb->flags |= SC_FL_NOLINGER;
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001351 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulete0768eb2018-10-03 16:38:02 +02001352
1353 if (!(s->flags & SF_ERR_MASK))
1354 s->flags |= SF_ERR_SRVCL;
Christopher Faulet4a66c942023-01-13 09:43:21 +01001355 http_set_term_flags(s);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001356 DBG_TRACE_DEVEL("leaving on error",
1357 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001358 return 0;
1359 }
1360
Christopher Faulet9768c262018-10-22 09:34:31 +02001361 /* 5: write error to client (we don't send any message then) */
Christopher Faulet2e56a732023-01-26 16:18:09 +01001362 else if (sc_ep_test(s->scf, SE_FL_ERR_PENDING)) {
Christopher Fauletca023882024-04-09 08:19:01 +02001363 if (s->flags & SF_SRV_REUSED)
Christopher Faulete0768eb2018-10-03 16:38:02 +02001364 goto abort_keep_alive;
1365
Willy Tarreau4781b152021-04-06 13:53:36 +02001366 _HA_ATOMIC_INC(&s->be->be_counters.failed_resp);
Christopher Fauletcff0f732019-12-16 16:13:44 +01001367 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02001368 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_resp);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001369 rep->analysers &= AN_RES_FLT_END;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001370
1371 if (!(s->flags & SF_ERR_MASK))
1372 s->flags |= SF_ERR_CLICL;
Christopher Faulet4a66c942023-01-13 09:43:21 +01001373 http_set_term_flags(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001374
1375 /* process_stream() will take care of the error */
Christopher Faulet740420d2024-08-01 15:42:09 +02001376 http_reply_and_close(s, txn->status, NULL);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001377 DBG_TRACE_DEVEL("leaving on error",
1378 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001379 return 0;
1380 }
1381
1382 channel_dont_close(rep);
Christopher Faulet9a790f62023-03-16 14:40:03 +01001383 s->scb->flags |= SC_FL_RCV_ONCE; /* try to get back here ASAP */
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001384 DBG_TRACE_DEVEL("waiting for more data",
1385 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001386 return 0;
1387 }
1388
1389 /* More interesting part now : we know that we have a complete
1390 * response which at least looks like HTTP. We have an indicator
1391 * of each header's length, so we can parse them quickly.
1392 */
Christopher Faulet29f17582019-05-23 11:03:26 +02001393 BUG_ON(htx_get_first_type(htx) != HTX_BLK_RES_SL);
Christopher Faulet297fbb42019-05-13 14:41:27 +02001394 sl = http_get_stline(htx);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001395
Christopher Faulet1f08bff2021-05-26 13:14:39 +02001396 /* Perform a L7 retry because of the status code */
Christopher Faulete05bf9e2022-03-29 15:23:40 +02001397 if ((txn->flags & TX_L7_RETRY) &&
Christopher Faulet1f08bff2021-05-26 13:14:39 +02001398 l7_status_match(s->be, sl->info.res.status) &&
Willy Tarreau7cb9e6c2022-05-17 19:40:40 +02001399 do_l7_retry(s, s->scb) == 0) {
Christopher Faulet1f08bff2021-05-26 13:14:39 +02001400 DBG_TRACE_DEVEL("leaving on L7 retry", STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
1401 return 0;
1402 }
1403
1404 /* Now, L7 buffer is useless, it can be released */
Christopher Faulete05bf9e2022-03-29 15:23:40 +02001405 b_free(&txn->l7_buffer);
Christopher Faulet1f08bff2021-05-26 13:14:39 +02001406
1407 msg->msg_state = HTTP_MSG_BODY;
1408
1409
Christopher Faulet9768c262018-10-22 09:34:31 +02001410 /* 0: we might have to print this header in debug mode */
1411 if (unlikely((global.mode & MODE_DEBUG) &&
1412 (!(global.mode & MODE_QUIET) || (global.mode & MODE_VERBOSE)))) {
1413 int32_t pos;
1414
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001415 http_debug_stline("srvrep", s, sl);
Christopher Faulet9768c262018-10-22 09:34:31 +02001416
Christopher Fauleta3f15502019-05-13 15:27:23 +02001417 for (pos = htx_get_first(htx); pos != -1; pos = htx_get_next(htx, pos)) {
Christopher Faulet9768c262018-10-22 09:34:31 +02001418 struct htx_blk *blk = htx_get_blk(htx, pos);
1419 enum htx_blk_type type = htx_get_blk_type(blk);
1420
1421 if (type == HTX_BLK_EOH)
1422 break;
1423 if (type != HTX_BLK_HDR)
1424 continue;
1425
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001426 http_debug_hdr("srvhdr", s,
1427 htx_get_blk_name(htx, blk),
1428 htx_get_blk_value(htx, blk));
Christopher Faulet9768c262018-10-22 09:34:31 +02001429 }
1430 }
1431
Christopher Faulet03599112018-11-27 11:21:21 +01001432 /* 1: get the status code and the version. Also set HTTP flags */
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01001433 txn->status = sl->info.res.status;
Christopher Faulet03599112018-11-27 11:21:21 +01001434 if (sl->flags & HTX_SL_F_VER_11)
Christopher Faulet9768c262018-10-22 09:34:31 +02001435 msg->flags |= HTTP_MSGF_VER_11;
Christopher Faulet03599112018-11-27 11:21:21 +01001436 if (sl->flags & HTX_SL_F_XFER_LEN) {
1437 msg->flags |= HTTP_MSGF_XFER_LEN;
Christopher Faulet2a408542020-11-20 14:22:37 +01001438 if (sl->flags & HTX_SL_F_CLEN)
1439 msg->flags |= HTTP_MSGF_CNT_LEN;
1440 else if (sl->flags & HTX_SL_F_CHNK)
1441 msg->flags |= HTTP_MSGF_TE_CHNK;
Christopher Faulet03599112018-11-27 11:21:21 +01001442 }
Christopher Faulet2a408542020-11-20 14:22:37 +01001443 if (sl->flags & HTX_SL_F_BODYLESS)
1444 msg->flags |= HTTP_MSGF_BODYLESS;
Christopher Faulet576c3582021-01-08 15:53:01 +01001445 if (sl->flags & HTX_SL_F_CONN_UPG)
1446 msg->flags |= HTTP_MSGF_CONN_UPG;
Christopher Faulet9768c262018-10-22 09:34:31 +02001447
1448 n = txn->status / 100;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001449 if (n < 1 || n > 5)
1450 n = 0;
Christopher Faulet9768c262018-10-22 09:34:31 +02001451
Christopher Faulete0768eb2018-10-03 16:38:02 +02001452 /* when the client triggers a 4xx from the server, it's most often due
1453 * to a missing object or permission. These events should be tracked
1454 * because if they happen often, it may indicate a brute force or a
1455 * vulnerability scan.
1456 */
1457 if (n == 4)
1458 stream_inc_http_err_ctr(s);
1459
Willy Tarreau826f3ab2021-02-10 12:07:15 +01001460 if (n == 5 && txn->status != 501 && txn->status != 505)
1461 stream_inc_http_fail_ctr(s);
1462
Marcin Deranek3c27dda2020-05-15 18:32:51 +02001463 if (objt_server(s->target)) {
Willy Tarreau4781b152021-04-06 13:53:36 +02001464 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.p.http.rsp[n]);
1465 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.p.http.cum_req);
Marcin Deranek3c27dda2020-05-15 18:32:51 +02001466 }
Christopher Faulete0768eb2018-10-03 16:38:02 +02001467
Christopher Faulete0768eb2018-10-03 16:38:02 +02001468 /* Adjust server's health based on status code. Note: status codes 501
1469 * and 505 are triggered on demand by client request, so we must not
1470 * count them as server failures.
1471 */
1472 if (objt_server(s->target)) {
1473 if (txn->status >= 100 && (txn->status < 500 || txn->status == 501 || txn->status == 505))
Willy Tarreaub54c40a2018-12-02 19:28:41 +01001474 health_adjust(__objt_server(s->target), HANA_STATUS_HTTP_OK);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001475 else
Willy Tarreaub54c40a2018-12-02 19:28:41 +01001476 health_adjust(__objt_server(s->target), HANA_STATUS_HTTP_STS);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001477 }
1478
1479 /*
1480 * We may be facing a 100-continue response, or any other informational
1481 * 1xx response which is non-final, in which case this is not the right
1482 * response, and we're waiting for the next one. Let's allow this response
1483 * to go to the client and wait for the next one. There's an exception for
1484 * 101 which is used later in the code to switch protocols.
1485 */
1486 if (txn->status < 200 &&
1487 (txn->status == 100 || txn->status >= 102)) {
Christopher Fauletaed82cf2018-11-30 22:22:32 +01001488 FLT_STRM_CB(s, flt_http_reset(s, msg));
Christopher Faulet421e7692019-06-13 11:16:45 +02001489 htx->first = channel_htx_fwd_headers(rep, htx);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001490 msg->msg_state = HTTP_MSG_RPBEFORE;
Christopher Faulet3499f622019-09-03 15:23:54 +02001491 msg->flags = 0;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001492 txn->status = 0;
1493 s->logs.t_data = -1; /* was not a response yet */
Christopher Faulet5c281d52023-03-16 15:53:28 +01001494 s->scf->flags |= SC_FL_SND_ASAP; /* Send ASAP informational messages */
Christopher Fauletb75b5ea2019-05-17 08:37:28 +02001495 goto next_one;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001496 }
1497
Christopher Faulet6e6c7b12021-01-08 16:02:05 +01001498 /* A 101-switching-protocols must contains a Connection header with the
1499 * "upgrade" option and the request too. It means both are agree to
1500 * upgrade. It is not so strict because there is no test on the Upgrade
1501 * header content. But it is probably stronger enough for now.
1502 */
1503 if (txn->status == 101 &&
1504 (!(txn->req.flags & HTTP_MSGF_CONN_UPG) || !(txn->rsp.flags & HTTP_MSGF_CONN_UPG)))
1505 goto return_bad_res;
1506
Christopher Faulete0768eb2018-10-03 16:38:02 +02001507 /*
1508 * 2: check for cacheability.
1509 */
1510
1511 switch (txn->status) {
1512 case 200:
1513 case 203:
1514 case 204:
1515 case 206:
1516 case 300:
1517 case 301:
1518 case 404:
1519 case 405:
1520 case 410:
1521 case 414:
1522 case 501:
1523 break;
1524 default:
1525 /* RFC7231#6.1:
1526 * Responses with status codes that are defined as
1527 * cacheable by default (e.g., 200, 203, 204, 206,
1528 * 300, 301, 404, 405, 410, 414, and 501 in this
1529 * specification) can be reused by a cache with
1530 * heuristic expiration unless otherwise indicated
1531 * by the method definition or explicit cache
1532 * controls [RFC7234]; all other status codes are
1533 * not cacheable by default.
1534 */
1535 txn->flags &= ~(TX_CACHEABLE | TX_CACHE_COOK);
1536 break;
1537 }
1538
1539 /*
1540 * 3: we may need to capture headers
1541 */
1542 s->logs.logwait &= ~LW_RESP;
1543 if (unlikely((s->logs.logwait & LW_RSPHDR) && s->res_cap))
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001544 http_capture_headers(htx, s->res_cap, sess->fe->rsp_cap);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001545
Christopher Faulet9768c262018-10-22 09:34:31 +02001546 /* Skip parsing if no content length is possible. */
Christopher Fauletc75668e2020-12-07 18:10:32 +01001547 if (unlikely((txn->meth == HTTP_METH_CONNECT && txn->status >= 200 && txn->status < 300) ||
Christopher Faulete0768eb2018-10-03 16:38:02 +02001548 txn->status == 101)) {
1549 /* Either we've established an explicit tunnel, or we're
1550 * switching the protocol. In both cases, we're very unlikely
1551 * to understand the next protocols. We have to switch to tunnel
1552 * mode, so that we transfer the request and responses then let
1553 * this protocol pass unmodified. When we later implement specific
1554 * parsers for such protocols, we'll want to check the Upgrade
1555 * header which contains information about that protocol for
1556 * responses with status 101 (eg: see RFC2817 about TLS).
1557 */
Christopher Fauletc41547b2019-07-16 14:32:23 +02001558 txn->flags |= TX_CON_WANT_TUN;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001559 }
1560
Amaury Denoyelleab6b0742024-03-20 09:25:03 +01001561 /* Check for NTML authentication headers in 401 (WWW-Authenticate) and
1562 * 407 (Proxy-Authenticate) responses and set the connection to
1563 * private.
1564 *
1565 * Note that this is not performed when using a true multiplexer unless
1566 * connection is already attached to the session as nothing prevents it
1567 * from being shared already by several sessions here.
Christopher Faulet61608322018-11-23 16:23:45 +01001568 */
Willy Tarreaufd9417b2022-05-18 16:23:22 +02001569 srv_conn = sc_conn(s->scb);
Amaury Denoyelleab6b0742024-03-20 09:25:03 +01001570 if (srv_conn &&
1571 (LIST_INLIST(&srv_conn->sess_el) || strcmp(srv_conn->mux->name, "H1") == 0)) {
Christopher Faulet61608322018-11-23 16:23:45 +01001572 struct ist hdr;
1573 struct http_hdr_ctx ctx;
1574
1575 if (txn->status == 401)
1576 hdr = ist("WWW-Authenticate");
1577 else if (txn->status == 407)
1578 hdr = ist("Proxy-Authenticate");
1579 else
1580 goto end;
1581
1582 ctx.blk = NULL;
1583 while (http_find_header(htx, hdr, &ctx, 0)) {
Willy Tarreauf1dcced2020-05-07 19:27:02 +02001584 /* If www-authenticate contains "Negotiate", "Nego2", or "NTLM",
1585 * possibly followed by blanks and a base64 string, the connection
1586 * is private. Since it's a mess to deal with, we only check for
1587 * values starting with "NTLM" or "Nego". Note that often multiple
1588 * headers are sent by the server there.
1589 */
1590 if ((ctx.value.len >= 4 && strncasecmp(ctx.value.ptr, "Nego", 4) == 0) ||
Willy Tarreau49a1d282020-05-07 19:10:15 +02001591 (ctx.value.len >= 4 && strncasecmp(ctx.value.ptr, "NTLM", 4) == 0)) {
Olivier Houchard250031e2019-05-29 15:01:50 +02001592 sess->flags |= SESS_FL_PREFER_LAST;
Christopher Faulet08016ab2020-07-01 16:10:06 +02001593 conn_set_owner(srv_conn, sess, NULL);
Christopher Faulet21ddc742020-07-01 15:26:14 +02001594 conn_set_private(srv_conn);
Ilya Shipitsin6b79f382020-07-23 00:32:55 +05001595 /* If it fail now, the same will be done in mux->detach() callback */
Christopher Faulet08016ab2020-07-01 16:10:06 +02001596 session_add_conn(srv_conn->owner, srv_conn, srv_conn->target);
Willy Tarreauf1dcced2020-05-07 19:27:02 +02001597 break;
Olivier Houchard250031e2019-05-29 15:01:50 +02001598 }
Christopher Faulet61608322018-11-23 16:23:45 +01001599 }
1600 }
1601
1602 end:
Christopher Faulete0768eb2018-10-03 16:38:02 +02001603 /* we want to have the response time before we start processing it */
Willy Tarreau69530f52023-04-28 09:16:15 +02001604 s->logs.t_data = ns_to_ms(now_ns - s->logs.accept_ts);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001605
1606 /* end of job, return OK */
1607 rep->analysers &= ~an_bit;
1608 rep->analyse_exp = TICK_ETERNITY;
1609 channel_auto_close(rep);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001610 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001611 return 1;
1612
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001613 return_int_err:
Willy Tarreau4781b152021-04-06 13:53:36 +02001614 _HA_ATOMIC_INC(&sess->fe->fe_counters.internal_errors);
1615 _HA_ATOMIC_INC(&s->be->be_counters.internal_errors);
William Lallemand36119de2021-03-08 15:26:48 +01001616 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02001617 _HA_ATOMIC_INC(&sess->listener->counters->internal_errors);
Christopher Fauletb8a53712019-12-16 11:29:38 +01001618 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02001619 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.internal_errors);
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001620 txn->status = 500;
1621 if (!(s->flags & SF_ERR_MASK))
1622 s->flags |= SF_ERR_INTERNAL;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001623 goto return_prx_cond;
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001624
1625 return_bad_res:
Willy Tarreau4781b152021-04-06 13:53:36 +02001626 _HA_ATOMIC_INC(&s->be->be_counters.failed_resp);
Christopher Faulet47365272018-10-31 17:40:50 +01001627 if (objt_server(s->target)) {
Willy Tarreau4781b152021-04-06 13:53:36 +02001628 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_resp);
Willy Tarreaub54c40a2018-12-02 19:28:41 +01001629 health_adjust(__objt_server(s->target), HANA_STATUS_HTTP_HDRRSP);
Christopher Faulet47365272018-10-31 17:40:50 +01001630 }
Olivier Houcharde3249a92019-05-03 23:01:47 +02001631 if ((s->be->retry_type & PR_RE_JUNK_REQUEST) &&
Christopher Faulete05bf9e2022-03-29 15:23:40 +02001632 (txn->flags & TX_L7_RETRY) &&
Willy Tarreau7cb9e6c2022-05-17 19:40:40 +02001633 do_l7_retry(s, s->scb) == 0) {
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001634 DBG_TRACE_DEVEL("leaving on L7 retry",
1635 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Olivier Houcharde3249a92019-05-03 23:01:47 +02001636 return 0;
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001637 }
Christopher Faulet47365272018-10-31 17:40:50 +01001638 txn->status = 502;
Willy Tarreau826f3ab2021-02-10 12:07:15 +01001639 stream_inc_http_fail_ctr(s);
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001640 /* fall through */
1641
Christopher Fauletb8a53712019-12-16 11:29:38 +01001642 return_prx_cond:
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001643 http_reply_and_close(s, txn->status, http_error_message(s));
Christopher Faulet4a66c942023-01-13 09:43:21 +01001644 http_set_term_flags(s);
Christopher Fauletb9a92f32019-09-09 10:15:21 +02001645
Willy Tarreaucb041662022-05-17 19:44:42 +02001646 s->scb->flags |= SC_FL_NOLINGER;
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001647 DBG_TRACE_DEVEL("leaving on error",
1648 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulet47365272018-10-31 17:40:50 +01001649 return 0;
1650
Christopher Faulete0768eb2018-10-03 16:38:02 +02001651 abort_keep_alive:
1652 /* A keep-alive request to the server failed on a network error.
1653 * The client is required to retry. We need to close without returning
1654 * any other information so that the client retries.
1655 */
1656 txn->status = 0;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001657 s->logs.logwait = 0;
1658 s->logs.level = 0;
Christopher Faulet84d3ef92023-03-17 15:45:58 +01001659 s->scf->flags &= ~SC_FL_SND_EXP_MORE; /* speed up sending a previous response */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001660 http_reply_and_close(s, txn->status, NULL);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001661 DBG_TRACE_DEVEL("leaving by closing K/A connection",
1662 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001663 return 0;
1664}
1665
1666/* This function performs all the processing enabled for the current response.
1667 * It normally returns 1 unless it wants to break. It relies on buffers flags,
1668 * and updates s->res.analysers. It might make sense to explode it into several
1669 * other functions. It works like process_request (see indications above).
 *
 * Arguments, as used by the body below:
 *   - <s>      : the stream; its session, HTTP transaction, backend and target
 *                are all read from it.
 *   - <rep>    : the response channel; its buffer is accessed as an HTX message.
 *   - <an_bit> : the analyser bit removed from rep->analysers once the job is done.
 *   - <px>     : not referenced by the body.
 *
 * It returns 1 when leaving through the "done" label (response processed, or
 * a rule asked to terminate the processing). It returns 0 when the message
 * has not reached the BODY state yet, when a rule asks to yield, and on every
 * deny/abort/error path (all of which end in "return_prx_cond").
1670 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001671int http_process_res_common(struct stream *s, struct channel *rep, int an_bit, struct proxy *px)
Christopher Faulete0768eb2018-10-03 16:38:02 +02001672{
1673 struct session *sess = s->sess;
1674 struct http_txn *txn = s->txn;
1675 struct http_msg *msg = &txn->rsp;
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001676 struct htx *htx;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001677 struct proxy *cur_proxy;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001678 enum rule_result ret = HTTP_RULE_RES_CONT;
1679
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001680 if (unlikely(msg->msg_state < HTTP_MSG_BODY)) /* we need more data */
1681 return 0;
Christopher Faulet9768c262018-10-22 09:34:31 +02001682
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001683 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn, msg);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001684
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01001685 htx = htxbuf(&rep->buf);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001686
1687 /* The stats applet needs to adjust the Connection header but we don't
1688 * apply any filter there. The rules, the cookie handling and the
 * cacheability checks below are all skipped by jumping straight to "end".
1689 */
1690 if (unlikely(objt_applet(s->target) == &http_stats_applet)) {
1691 rep->analysers &= ~an_bit;
1692 rep->analyse_exp = TICK_ETERNITY;
Christopher Fauletf2824e62018-10-01 12:12:37 +02001693 goto end;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001694 }
1695
1696 /*
1697 * We will have to evaluate the filters.
1698 * As opposed to version 1.2, now they will be evaluated in the
1699 * filters order and not in the header order. This means that
1700 * each filter has to be validated among all headers.
1701 *
1702 * Filters are tried with ->be first, then with ->fe if it is
1703 * different from ->be.
1704 *
1705 * Maybe we are in resume condition. In this case I choose the
1706 * "struct proxy" which contains the rule list matching the resume
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05001707 * pointer. If none of these "struct proxy" match, I initialise
Christopher Faulete0768eb2018-10-03 16:38:02 +02001708 * the process with the first one.
1709 *
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05001710 * In fact, I check only correspondence between the current list
Christopher Faulete0768eb2018-10-03 16:38:02 +02001711 * pointer and the ->fe rule list. If it doesn't match, I initialize
1712 * the loop with the ->be.
1713 */
Christopher Fauletd4150ad2021-10-13 15:35:55 +02001714 if (s->current_rule_list == &sess->fe->http_res_rules ||
1715 (sess->fe->defpx && s->current_rule_list == &sess->fe->defpx->http_res_rules))
Christopher Faulete0768eb2018-10-03 16:38:02 +02001716 cur_proxy = sess->fe;
1717 else
1718 cur_proxy = s->be;
Christopher Fauletd4150ad2021-10-13 15:35:55 +02001719
/* At most two passes: one for the proxy selected above, then one for the
 * frontend when it differs (see the check at the bottom of the loop).
 */
Christopher Faulete0768eb2018-10-03 16:38:02 +02001720 while (1) {
Christopher Faulete0768eb2018-10-03 16:38:02 +02001721 /* evaluate http-response rules */
Christopher Faulet46f46df2021-11-09 16:33:25 +01001722 if (ret == HTTP_RULE_RES_CONT || ret == HTTP_RULE_RES_STOP) {
Christopher Fauletd4150ad2021-10-13 15:35:55 +02001723 struct list *def_rules, *rules;
1724
/* The rules of the defaults proxy are passed only when <cur_proxy>
 * has one and either <cur_proxy> is the backend or its defaults
 * proxy is not the backend's one. NOTE(review): presumably this
 * avoids evaluating the same defaults rules twice - confirm.
 */
1725 def_rules = ((cur_proxy->defpx && (cur_proxy == s->be || cur_proxy->defpx != s->be->defpx)) ? &cur_proxy->defpx->http_res_rules : NULL);
1726 rules = &cur_proxy->http_res_rules;
1727
1728 ret = http_res_get_intercept_rule(cur_proxy, def_rules, rules, s);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001729
Christopher Faulet3a26bee2019-12-16 12:47:40 +01001730 switch (ret) {
1731 case HTTP_RULE_RES_YIELD: /* some data miss, call the function later. */
1732 goto return_prx_yield;
1733
1734 case HTTP_RULE_RES_CONT:
1735 case HTTP_RULE_RES_STOP: /* nothing to do */
1736 break;
1737
1738 case HTTP_RULE_RES_DENY: /* deny or tarpit */
1739 goto deny;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001740
Christopher Faulet3a26bee2019-12-16 12:47:40 +01001741 case HTTP_RULE_RES_ABRT: /* abort request, response already sent */
1742 goto return_prx_cond;
1743
1744 case HTTP_RULE_RES_DONE: /* OK, but terminate request processing (eg: redirect) */
Christopher Fauletb8a53712019-12-16 11:29:38 +01001745 goto done;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001746
Christopher Faulet3a26bee2019-12-16 12:47:40 +01001747 case HTTP_RULE_RES_BADREQ: /* invalid message, reported as a bad response (502) */
1748 goto return_bad_res;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001749
Christopher Faulet3a26bee2019-12-16 12:47:40 +01001750 case HTTP_RULE_RES_ERROR: /* rule evaluation failed, reported as an internal error (500) */
1751 goto return_int_err;
1752 }
1753
1754 }
Christopher Faulete0768eb2018-10-03 16:38:02 +02001755
Christopher Faulete0768eb2018-10-03 16:38:02 +02001756 /* check whether we're already working on the frontend */
1757 if (cur_proxy == sess->fe)
1758 break;
1759 cur_proxy = sess->fe;
1760 }
1761
Christopher Faulete0768eb2018-10-03 16:38:02 +02001762 /* OK that's all we can do for 1xx responses (101 excepted, which goes
 * through the cookie and cacheability processing like final responses)
 */
1763 if (unlikely(txn->status < 200 && txn->status != 101))
Christopher Fauletf2824e62018-10-01 12:12:37 +02001764 goto end;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001765
1766 /*
1767 * Now check for a server cookie.
1768 */
1769 if (s->be->cookie_name || sess->fe->capture_name || (s->be->options & PR_O_CHK_CACHE))
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001770 http_manage_server_side_cookies(s, rep);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001771
1772 /*
1773 * Check for cache-control or pragma headers if required.
1774 */
1775 if ((s->be->options & PR_O_CHK_CACHE) || (s->be->ck_opts & PR_CK_NOC))
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02001776 http_check_response_for_cacheability(s, rep);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001777
1778 /*
1779 * Add server cookie in the response if needed
1780 */
1781 if (objt_server(s->target) && (s->be->ck_opts & PR_CK_INS) &&
1782 !((txn->flags & TX_SCK_FOUND) && (s->be->ck_opts & PR_CK_PSV)) &&
1783 (!(s->flags & SF_DIRECT) ||
1784 ((s->be->cookie_maxidle || txn->cookie_last_date) &&
1785 (!txn->cookie_last_date || (txn->cookie_last_date - date.tv_sec) < 0)) ||
1786 (s->be->cookie_maxlife && !txn->cookie_first_date) || // set the first_date
1787 (!s->be->cookie_maxlife && txn->cookie_first_date)) && // remove the first_date
1788 (!(s->be->ck_opts & PR_CK_POST) || (txn->meth == HTTP_METH_POST)) &&
1789 !(s->flags & SF_IGNORE_PRST)) {
1790 /* the server is known, it's not the one the client requested, or the
1791 * cookie's last seen date needs to be refreshed. We have to
1792 * insert a set-cookie here, except if we want to insert only on POST
1793 * requests and this one isn't. Note that servers which don't have cookies
1794 * (eg: some backup servers) will return a full cookie removal request.
1795 */
Willy Tarreau88bc8002021-12-06 07:01:02 +00001796 if (!__objt_server(s->target)->cookie) {
Christopher Faulete0768eb2018-10-03 16:38:02 +02001797 chunk_printf(&trash,
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001798 "%s=; Expires=Thu, 01-Jan-1970 00:00:01 GMT; path=/",
Christopher Faulete0768eb2018-10-03 16:38:02 +02001799 s->be->cookie_name);
1800 }
1801 else {
Willy Tarreau88bc8002021-12-06 07:01:02 +00001802 chunk_printf(&trash, "%s=%s", s->be->cookie_name, __objt_server(s->target)->cookie);
Christopher Faulete0768eb2018-10-03 16:38:02 +02001803
1804 if (s->be->cookie_maxidle || s->be->cookie_maxlife) {
1805 /* emit last_date, which is mandatory. The current date is
 * rounded up to a multiple of 4 seconds and divided by 4
 * before being encoded; the encoded value is accounted
 * for as 5 bytes in the trash chunk.
 */
1806 trash.area[trash.data++] = COOKIE_DELIM_DATE;
1807 s30tob64((date.tv_sec+3) >> 2,
1808 trash.area + trash.data);
1809 trash.data += 5;
1810
1811 if (s->be->cookie_maxlife) {
1812 /* emit first_date, which is either the original one or
1813 * the current date.
1814 */
1815 trash.area[trash.data++] = COOKIE_DELIM_DATE;
1816 s30tob64(txn->cookie_first_date ?
1817 txn->cookie_first_date >> 2 :
1818 (date.tv_sec+3) >> 2,
1819 trash.area + trash.data);
1820 trash.data += 5;
1821 }
1822 }
1823 chunk_appendf(&trash, "; path=/");
1824 }
1825
1826 if (s->be->cookie_domain)
1827 chunk_appendf(&trash, "; domain=%s", s->be->cookie_domain);
1828
1829 if (s->be->ck_opts & PR_CK_HTTPONLY)
1830 chunk_appendf(&trash, "; HttpOnly");
1831
1832 if (s->be->ck_opts & PR_CK_SECURE)
1833 chunk_appendf(&trash, "; Secure");
1834
Christopher Faulet2f533902020-01-21 11:06:48 +01001835 if (s->be->cookie_attrs)
1836 chunk_appendf(&trash, "; %s", s->be->cookie_attrs);
1837
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001838 if (unlikely(!http_add_header(htx, ist("Set-Cookie"), ist2(trash.area, trash.data))))
Christopher Fauletd649b572022-06-01 17:42:35 +02001839 goto return_fail_rewrite;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001840
1841 txn->flags &= ~TX_SCK_MASK;
1842 if (__objt_server(s->target)->cookie && (s->flags & SF_DIRECT))
1843 /* the server did not change, only the date was updated */
1844 txn->flags |= TX_SCK_UPDATED;
1845 else
1846 txn->flags |= TX_SCK_INSERTED;
1847
1848 /* Here, we will tell an eventual cache on the client side that we don't
1849 * want it to cache this reply because HTTP/1.0 caches also cache cookies !
1850 * Some caches understand the correct form: 'no-cache="set-cookie"', but
1851 * others don't (eg: apache <= 1.3.26). So we use 'private' instead.
1852 */
1853 if ((s->be->ck_opts & PR_CK_NOC) && (txn->flags & TX_CACHEABLE)) {
1854
1855 txn->flags &= ~TX_CACHEABLE & ~TX_CACHE_COOK;
1856
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001857 if (unlikely(!http_add_header(htx, ist("Cache-control"), ist("private"))))
Christopher Fauletd649b572022-06-01 17:42:35 +02001858 goto return_fail_rewrite;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001859 }
1860 }
1861
1862 /*
1863 * Check if result will be cacheable with a cookie.
1864 * We'll block the response if security checks have caught
1865 * nasty things such as a cacheable cookie.
1866 */
1867 if (((txn->flags & (TX_CACHEABLE | TX_CACHE_COOK | TX_SCK_PRESENT)) ==
1868 (TX_CACHEABLE | TX_CACHE_COOK | TX_SCK_PRESENT)) &&
1869 (s->be->options & PR_O_CHK_CACHE)) {
1870 /* we're in presence of a cacheable response containing
1871 * a set-cookie header. We'll block it as requested by
1872 * the 'checkcache' option, and send an alert.
1873 */
Christopher Faulete0768eb2018-10-03 16:38:02 +02001874 ha_alert("Blocking cacheable cookie in response from instance %s, server %s.\n",
Willy Tarreau88bc8002021-12-06 07:01:02 +00001875 s->be->id, objt_server(s->target) ? __objt_server(s->target)->id : "<dispatch>");
Christopher Faulete0768eb2018-10-03 16:38:02 +02001876 send_log(s->be, LOG_ALERT,
1877 "Blocking cacheable cookie in response from instance %s, server %s.\n",
Willy Tarreau88bc8002021-12-06 07:01:02 +00001878 s->be->id, objt_server(s->target) ? __objt_server(s->target)->id : "<dispatch>");
Christopher Fauletb8a53712019-12-16 11:29:38 +01001879 goto deny;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001880 }
1881
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001882 end:
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01001883 /*
1884 * Evaluate after-response rules before forwarding the response. rules
1885 * from the backend are evaluated first, then one from the frontend if
1886 * it differs. A failure there is handled as an internal error.
1887 */
1888 if (!http_eval_after_res_rules(s))
1889 goto return_int_err;
1890
Christopher Fauletc2ac5e42021-03-08 18:20:09 +01001891 /* Filter the response headers if there are filters attached to the
1892 * stream.
1893 */
1894 if (HAS_FILTERS(s))
1895 rep->analysers |= AN_RES_FLT_HTTP_HDRS;
1896
Christopher Faulete0768eb2018-10-03 16:38:02 +02001897 /* Always enter in the body analyzer */
1898 rep->analysers &= ~AN_RES_FLT_XFER_DATA;
1899 rep->analysers |= AN_RES_HTTP_XFER_BODY;
1900
1901 /* if the user wants to log as soon as possible, without counting
1902 * bytes from the server, then this is the right moment. We have
1903 * to temporarily assign bytes_out to log what we currently have.
1904 */
1905 if (!LIST_ISEMPTY(&sess->fe->logformat) && !(s->logs.logwait & LW_BYTES)) {
1906 s->logs.t_close = s->logs.t_data; /* to get a valid end date */
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001907 s->logs.bytes_out = htx->data;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001908 s->do_log(s);
1909 s->logs.bytes_out = 0;
1910 }
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001911
/* Normal exit: remove this analyser from the channel and reset the rule
 * evaluation context of the stream. Also reached directly when a rule
 * returned HTTP_RULE_RES_DONE, in which case everything after the rules
 * loop (including the "end" processing above) is skipped.
 */
Christopher Fauletb8a53712019-12-16 11:29:38 +01001912 done:
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01001913 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletb8a53712019-12-16 11:29:38 +01001914 rep->analysers &= ~an_bit;
1915 rep->analyse_exp = TICK_ETERNITY;
Christopher Fauletd4150ad2021-10-13 15:35:55 +02001916 s->current_rule = s->current_rule_list = NULL;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001917 return 1;
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001918
/* Response denied: account it on the frontend, the backend, the listener
 * and the server when they exist, then reply using the current value of
 * txn->status, which is left untouched here.
 */
Christopher Fauletb8a53712019-12-16 11:29:38 +01001919 deny:
Willy Tarreau4781b152021-04-06 13:53:36 +02001920 _HA_ATOMIC_INC(&sess->fe->fe_counters.denied_resp);
1921 _HA_ATOMIC_INC(&s->be->be_counters.denied_resp);
William Lallemand36119de2021-03-08 15:26:48 +01001922 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02001923 _HA_ATOMIC_INC(&sess->listener->counters->denied_resp);
Christopher Fauleta08546b2019-12-16 16:07:34 +01001924 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02001925 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.denied_resp);
Christopher Fauletb8a53712019-12-16 11:29:38 +01001926 goto return_prx_err;
1927
/* A header could not be added to the response. The failed_rewrites
 * counters are incremented, then the code falls through to the internal
 * error handling, so the internal_errors counters are incremented as well
 * and the status becomes 500. SF_ERR_PRXCOND is set first when no error
 * was recorded yet. NOTE(review): presumably SF_ERR_PRXCOND is part of
 * SF_ERR_MASK, so SF_ERR_INTERNAL is then not applied below - confirm.
 */
Christopher Fauletd649b572022-06-01 17:42:35 +02001928 return_fail_rewrite:
1929 if (!(s->flags & SF_ERR_MASK))
1930 s->flags |= SF_ERR_PRXCOND;
1931 _HA_ATOMIC_INC(&sess->fe->fe_counters.failed_rewrites);
1932 _HA_ATOMIC_INC(&s->be->be_counters.failed_rewrites);
1933 if (sess->listener && sess->listener->counters)
1934 _HA_ATOMIC_INC(&sess->listener->counters->failed_rewrites);
1935 if (objt_server(s->target))
1936 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_rewrites);
1937 /* fall through */
1938
/* Internal error: force a 500 status and account the error everywhere */
Christopher Fauletb8a53712019-12-16 11:29:38 +01001939 return_int_err:
1940 txn->status = 500;
1941 if (!(s->flags & SF_ERR_MASK))
1942 s->flags |= SF_ERR_INTERNAL;
Willy Tarreau4781b152021-04-06 13:53:36 +02001943 _HA_ATOMIC_INC(&sess->fe->fe_counters.internal_errors);
1944 _HA_ATOMIC_INC(&s->be->be_counters.internal_errors);
Dragan Dosen9a006f92021-09-21 13:02:09 +02001945 if (sess->listener && sess->listener->counters)
1946 _HA_ATOMIC_INC(&sess->listener->counters->internal_errors);
Christopher Fauletcff0f732019-12-16 16:13:44 +01001947 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02001948 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.internal_errors);
Christopher Fauletb8a53712019-12-16 11:29:38 +01001949 goto return_prx_err;
1950
/* Bad response: force a 502 status, account the failure on the backend
 * and on the server, and report it to the server's health adjustment.
 * Unlike the other error paths, no frontend or listener counter is
 * updated here.
 */
1951 return_bad_res:
1952 txn->status = 502;
Willy Tarreau826f3ab2021-02-10 12:07:15 +01001953 stream_inc_http_fail_ctr(s);
Willy Tarreau4781b152021-04-06 13:53:36 +02001954 _HA_ATOMIC_INC(&s->be->be_counters.failed_resp);
Christopher Fauleta20a6532020-02-05 10:16:41 +01001955 if (objt_server(s->target)) {
Willy Tarreau4781b152021-04-06 13:53:36 +02001956 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_resp);
Christopher Fauleta20a6532020-02-05 10:16:41 +01001957 health_adjust(__objt_server(s->target), HANA_STATUS_HTTP_RSP);
1958 }
Christopher Fauletb8a53712019-12-16 11:29:38 +01001959 /* fall through */
1960
/* Send the error message matching txn->status and close */
1961 return_prx_err:
1962 http_reply_and_close(s, txn->status, http_error_message(s));
1963 /* fall through */
1964
/* Common tail of all abort/error paths. It is also the direct target of
 * HTTP_RULE_RES_ABRT, in which case no reply is emitted from here. Only
 * the AN_RES_FLT_END / AN_REQ_FLT_END analysers are kept (when set) on the
 * response and request channels; all the other ones are removed.
 */
1965 return_prx_cond:
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001966 s->logs.t_data = -1; /* was not a valid response */
Willy Tarreaucb041662022-05-17 19:44:42 +02001967 s->scb->flags |= SC_FL_NOLINGER;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001968
Christopher Faulet4a66c942023-01-13 09:43:21 +01001969 http_set_term_flags(s);
Christopher Fauletb8a53712019-12-16 11:29:38 +01001970
Christopher Faulete58c0002020-03-02 16:21:01 +01001971 rep->analysers &= AN_RES_FLT_END;
1972 s->req.analysers &= AN_REQ_FLT_END;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001973 rep->analyse_exp = TICK_ETERNITY;
Christopher Fauletd4150ad2021-10-13 15:35:55 +02001974 s->current_rule = s->current_rule_list = NULL;
Christopher Fauleteea8fc72019-11-05 16:18:10 +01001975 DBG_TRACE_DEVEL("leaving on error",
1976 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Fauletfec7bd12018-10-24 11:17:50 +02001977 return 0;
Christopher Fauletb8a53712019-12-16 11:29:38 +01001978
/* A rule needs more data: the analyser bit and the current rule context
 * are left untouched so that the evaluation can be resumed on the next
 * call, and the channel is asked not to close in the meantime.
 */
1979 return_prx_yield:
1980 channel_dont_close(rep);
1981 DBG_TRACE_DEVEL("waiting for more data",
1982 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
1983 return 0;
Christopher Faulete0768eb2018-10-03 16:38:02 +02001984}
1985
1986/* This function is an analyser which forwards response body (including chunk
1987 * sizes if any). It is called as soon as we must forward, even if we forward
1988 * zero byte. The only situation where it must not be called is when we're in
1989 * tunnel mode and we want to forward till the close. It's used both to forward
1990 * remaining data and to resync after end of body. It expects the msg_state to
1991 * be between MSG_BODY and MSG_DONE (inclusive). It returns zero if it needs to
1992 * read more data, or 1 once we can go on with next request or end the stream.
1993 *
1994 * It is capable of compressing response data both in content-length mode and
1995 * in chunked mode. The state machines follows different flows depending on
1996 * whether content-length and chunked modes are used, since there are no
1997 * trailers in content-length :
1998 *
1999 *  chk-mode                   cl-mode
2000 *          ,----- BODY -----.
2001 *         /                  \
2002 *        V     size > 0       V    chk-mode
2003 *  .--> SIZE -------------> DATA -------------> CRLF
2004 *  |     | size == 0          | last byte         |
2005 *  |     v      final crlf    v inspected         |
2006 *  |  TRAILERS -----------> DONE                  |
2007 *  |                                              |
2008 *  `----------------------------------------------'
2009 *
2010 * Compression only happens in the DATA state, and must be flushed in final
2011 * states (TRAILERS/DONE) or when leaving on missing data. Normal forwarding
2012 * is performed at once on final states for all bytes parsed, or when leaving
2013 * on missing data.
2014 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02002015int http_response_forward_body(struct stream *s, struct channel *res, int an_bit)
Christopher Faulete0768eb2018-10-03 16:38:02 +02002016{
2017 struct session *sess = s->sess;
2018 struct http_txn *txn = s->txn;
2019 struct http_msg *msg = &s->txn->rsp;
Christopher Faulet9768c262018-10-22 09:34:31 +02002020 struct htx *htx;
Christopher Fauletaed82cf2018-11-30 22:22:32 +01002021 int ret;
Christopher Faulete0768eb2018-10-03 16:38:02 +02002022
Christopher Fauleteea8fc72019-11-05 16:18:10 +01002023 DBG_TRACE_ENTER(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn, msg);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002024
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01002025 htx = htxbuf(&res->buf);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002026
Christopher Fauletb9a92f32019-09-09 10:15:21 +02002027 if (htx->flags & HTX_FL_PARSING_ERROR)
2028 goto return_bad_res;
2029 if (htx->flags & HTX_FL_PROCESSING_ERROR)
2030 goto return_int_err;
2031
Christopher Faulet9768c262018-10-22 09:34:31 +02002032 if (msg->msg_state == HTTP_MSG_BODY)
2033 msg->msg_state = HTTP_MSG_DATA;
2034
Christopher Faulete0768eb2018-10-03 16:38:02 +02002035 /* in most states, we should abort in case of early close */
2036 channel_auto_close(res);
2037
Christopher Faulete0768eb2018-10-03 16:38:02 +02002038 if (res->to_forward) {
Christopher Faulet66af0b22019-03-22 14:54:52 +01002039 if (res->to_forward == CHN_INFINITE_FORWARD) {
Christopher Faulet904763f2023-03-22 14:53:11 +01002040 if (s->scb->flags & SC_FL_EOI)
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002041 msg->msg_state = HTTP_MSG_ENDING;
Christopher Faulet66af0b22019-03-22 14:54:52 +01002042 }
2043 else {
2044 /* We can't process the buffer's contents yet */
2045 res->flags |= CF_WAKE_WRITE;
2046 goto missing_data_or_waiting;
2047 }
Christopher Faulete0768eb2018-10-03 16:38:02 +02002048 }
2049
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002050 if (msg->msg_state >= HTTP_MSG_ENDING)
2051 goto ending;
2052
Christopher Fauletc75668e2020-12-07 18:10:32 +01002053 if ((txn->meth == HTTP_METH_CONNECT && txn->status >= 200 && txn->status < 300) || txn->status == 101 ||
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002054 (!(msg->flags & HTTP_MSGF_XFER_LEN) && !HAS_RSP_DATA_FILTERS(s))) {
2055 msg->msg_state = HTTP_MSG_ENDING;
2056 goto ending;
2057 }
Christopher Faulet9768c262018-10-22 09:34:31 +02002058
Christopher Fauletaed82cf2018-11-30 22:22:32 +01002059 /* Forward input data. We get it by removing all outgoing data not
2060 * forwarded yet from HTX data size. If there are some data filters, we
2061 * let them decide the amount of data to forward.
Christopher Faulet9768c262018-10-22 09:34:31 +02002062 */
Christopher Fauletaed82cf2018-11-30 22:22:32 +01002063 if (HAS_RSP_DATA_FILTERS(s)) {
2064 ret = flt_http_payload(s, msg, htx->data);
2065 if (ret < 0)
2066 goto return_bad_res;
Christopher Faulet421e7692019-06-13 11:16:45 +02002067 c_adv(res, ret);
Christopher Fauletaed82cf2018-11-30 22:22:32 +01002068 }
2069 else {
Christopher Faulet421e7692019-06-13 11:16:45 +02002070 c_adv(res, htx->data - co_data(res));
Christopher Faulet2f7c82b2023-02-20 14:06:52 +01002071 if ((global.tune.options & GTUNE_USE_FAST_FWD) && (msg->flags & HTTP_MSGF_XFER_LEN))
Christopher Faulet66af0b22019-03-22 14:54:52 +01002072 channel_htx_forward_forever(res, htx);
Christopher Fauletaed82cf2018-11-30 22:22:32 +01002073 }
Christopher Faulet9768c262018-10-22 09:34:31 +02002074
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002075 if (htx->data != co_data(res))
2076 goto missing_data_or_waiting;
2077
Christopher Fauletca5309a2023-04-17 16:17:32 +02002078 if (!(msg->flags & HTTP_MSGF_XFER_LEN) && (s->scb->flags & (SC_FL_EOS|SC_FL_ABRT_DONE))) {
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002079 msg->msg_state = HTTP_MSG_ENDING;
2080 goto ending;
Christopher Faulete0768eb2018-10-03 16:38:02 +02002081 }
2082
Christopher Faulet9768c262018-10-22 09:34:31 +02002083 /* Check if the end-of-message is reached and if so, switch the message
Christopher Fauletd20fdb02019-06-13 16:43:22 +02002084 * in HTTP_MSG_ENDING state. Then if all data was marked to be
2085 * forwarded, set the state to HTTP_MSG_DONE.
Christopher Faulet9768c262018-10-22 09:34:31 +02002086 */
Christopher Fauletd1ac2b92020-12-02 19:12:22 +01002087 if (!(htx->flags & HTX_FL_EOM))
Christopher Faulet9768c262018-10-22 09:34:31 +02002088 goto missing_data_or_waiting;
2089
Christopher Fauletd20fdb02019-06-13 16:43:22 +02002090 msg->msg_state = HTTP_MSG_ENDING;
Christopher Faulet9768c262018-10-22 09:34:31 +02002091
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002092 ending:
Christopher Faulet84d3ef92023-03-17 15:45:58 +01002093 s->scf->flags &= ~SC_FL_SND_EXP_MORE; /* no more data are expected to be sent */
Christopher Faulet2151cdd2020-07-22 16:34:59 +02002094
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002095 /* other states, ENDING...TUNNEL */
2096 if (msg->msg_state >= HTTP_MSG_DONE)
2097 goto done;
Christopher Faulet9768c262018-10-22 09:34:31 +02002098
Christopher Fauletaed82cf2018-11-30 22:22:32 +01002099 if (HAS_RSP_DATA_FILTERS(s)) {
2100 ret = flt_http_end(s, msg);
2101 if (ret <= 0) {
2102 if (!ret)
2103 goto missing_data_or_waiting;
2104 goto return_bad_res;
2105 }
2106 }
2107
Christopher Faulet97047972023-04-17 08:52:10 +02002108 if (!(txn->flags & TX_CON_WANT_TUN) && !(msg->flags & HTTP_MSGF_XFER_LEN)) {
2109 /* One-side tunnel */
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002110 msg->msg_state = HTTP_MSG_TUNNEL;
Christopher Faulet1a3e0272019-11-15 16:31:46 +01002111 }
2112 else {
2113 msg->msg_state = HTTP_MSG_DONE;
2114 res->to_forward = 0;
2115 }
2116
2117 done:
2118
2119 channel_dont_close(res);
2120
Christopher Faulet64350bb2023-04-13 16:37:37 +02002121 if ((s->scf->flags & SC_FL_SHUT_DONE) && co_data(res)) {
Christopher Fauletf2b02cf2023-01-13 11:02:28 +01002122 /* response errors are most likely due to the client aborting
2123 * the transfer. */
2124 goto return_cli_abort;
2125 }
2126
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02002127 http_end_response(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002128 if (!(res->analysers & an_bit)) {
Christopher Fauleteea8fc72019-11-05 16:18:10 +01002129 DBG_TRACE_LEAVE(STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002130 return 1;
2131 }
Christopher Fauleteea8fc72019-11-05 16:18:10 +01002132 DBG_TRACE_DEVEL("waiting for the end of the HTTP txn",
2133 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002134 return 0;
2135
2136 missing_data_or_waiting:
Christopher Faulet64350bb2023-04-13 16:37:37 +02002137 if (s->scf->flags & SC_FL_SHUT_DONE)
Christopher Faulet93e02d82019-03-08 14:18:50 +01002138 goto return_cli_abort;
Christopher Faulete0768eb2018-10-03 16:38:02 +02002139
2140 /* stop waiting for data if the input is closed before the end. If the
2141 * client side was already closed, it means that the client has aborted,
2142 * so we don't want to count this as a server abort. Otherwise it's a
2143 * server abort.
2144 */
Christopher Fauletca5309a2023-04-17 16:17:32 +02002145 if (msg->msg_state < HTTP_MSG_ENDING && (s->scb->flags & (SC_FL_EOS|SC_FL_ABRT_DONE))) {
2146 if ((s->scf->flags & (SC_FL_EOS|SC_FL_ABRT_DONE)) &&
Christopher Faulet64350bb2023-04-13 16:37:37 +02002147 (s->scb->flags & SC_FL_SHUT_DONE))
Christopher Faulet93e02d82019-03-08 14:18:50 +01002148 goto return_cli_abort;
Christopher Faulete0768eb2018-10-03 16:38:02 +02002149 /* If we have some pending data, we continue the processing */
Christopher Faulet93e02d82019-03-08 14:18:50 +01002150 if (htx_is_empty(htx))
2151 goto return_srv_abort;
Christopher Faulete0768eb2018-10-03 16:38:02 +02002152 }
2153
Christopher Faulete0768eb2018-10-03 16:38:02 +02002154 /* When TE: chunked is used, we need to get there again to parse
2155 * remaining chunks even if the server has closed, so we don't want to
Christopher Faulet9768c262018-10-22 09:34:31 +02002156 * set CF_DONTCLOSE. Similarly when there is a content-leng or if there
2157 * are filters registered on the stream, we don't want to forward a
2158 * close
Christopher Faulete0768eb2018-10-03 16:38:02 +02002159 */
Christopher Fauletaed82cf2018-11-30 22:22:32 +01002160 if ((msg->flags & HTTP_MSGF_XFER_LEN) || HAS_RSP_DATA_FILTERS(s))
Christopher Faulete0768eb2018-10-03 16:38:02 +02002161 channel_dont_close(res);
2162
2163 /* We know that more data are expected, but we couldn't send more that
Christopher Faulet84d3ef92023-03-17 15:45:58 +01002164 * what we did. So we always set the SC_FL_SND_EXP_MORE flag so that the
Christopher Faulete0768eb2018-10-03 16:38:02 +02002165 * system knows it must not set a PUSH on this first part. Interactive
2166 * modes are already handled by the stream sock layer. We must not do
2167 * this in content-length mode because it could present the MSG_MORE
2168 * flag with the last block of forwarded data, which would cause an
2169 * additional delay to be observed by the receiver.
2170 */
Christopher Faulet2151cdd2020-07-22 16:34:59 +02002171 if (HAS_RSP_DATA_FILTERS(s))
Christopher Faulet84d3ef92023-03-17 15:45:58 +01002172 s->scf->flags |= SC_FL_SND_EXP_MORE;
Christopher Faulete0768eb2018-10-03 16:38:02 +02002173
2174 /* the stream handler will take care of timeouts and errors */
Christopher Fauleteea8fc72019-11-05 16:18:10 +01002175 DBG_TRACE_DEVEL("waiting for more data to forward",
2176 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002177 return 0;
2178
Christopher Faulet93e02d82019-03-08 14:18:50 +01002179 return_srv_abort:
Willy Tarreau4781b152021-04-06 13:53:36 +02002180 _HA_ATOMIC_INC(&sess->fe->fe_counters.srv_aborts);
2181 _HA_ATOMIC_INC(&s->be->be_counters.srv_aborts);
William Lallemand36119de2021-03-08 15:26:48 +01002182 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02002183 _HA_ATOMIC_INC(&sess->listener->counters->srv_aborts);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002184 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02002185 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.srv_aborts);
Willy Tarreau826f3ab2021-02-10 12:07:15 +01002186 stream_inc_http_fail_ctr(s);
Christopher Faulet93e02d82019-03-08 14:18:50 +01002187 if (!(s->flags & SF_ERR_MASK))
Christopher Fauletf2b02cf2023-01-13 11:02:28 +01002188 s->flags |= ((res->flags & CF_READ_TIMEOUT) ? SF_ERR_SRVTO : SF_ERR_SRVCL);
Christopher Faulet93e02d82019-03-08 14:18:50 +01002189 goto return_error;
Christopher Faulete0768eb2018-10-03 16:38:02 +02002190
Christopher Faulet93e02d82019-03-08 14:18:50 +01002191 return_cli_abort:
Willy Tarreau4781b152021-04-06 13:53:36 +02002192 _HA_ATOMIC_INC(&sess->fe->fe_counters.cli_aborts);
2193 _HA_ATOMIC_INC(&s->be->be_counters.cli_aborts);
William Lallemand36119de2021-03-08 15:26:48 +01002194 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02002195 _HA_ATOMIC_INC(&sess->listener->counters->cli_aborts);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002196 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02002197 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.cli_aborts);
Christopher Faulet93e02d82019-03-08 14:18:50 +01002198 if (!(s->flags & SF_ERR_MASK))
Christopher Fauletf2b02cf2023-01-13 11:02:28 +01002199 s->flags |= ((res->flags & CF_WRITE_TIMEOUT) ? SF_ERR_CLITO : SF_ERR_CLICL);
Christopher Faulet93e02d82019-03-08 14:18:50 +01002200 goto return_error;
Christopher Faulete0768eb2018-10-03 16:38:02 +02002201
Christopher Fauletb9a92f32019-09-09 10:15:21 +02002202 return_int_err:
Willy Tarreau4781b152021-04-06 13:53:36 +02002203 _HA_ATOMIC_INC(&sess->fe->fe_counters.internal_errors);
2204 _HA_ATOMIC_INC(&s->be->be_counters.internal_errors);
William Lallemand36119de2021-03-08 15:26:48 +01002205 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02002206 _HA_ATOMIC_INC(&sess->listener->counters->internal_errors);
Christopher Fauletb8a53712019-12-16 11:29:38 +01002207 if (objt_server(s->target))
Willy Tarreau4781b152021-04-06 13:53:36 +02002208 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.internal_errors);
Christopher Fauletb9a92f32019-09-09 10:15:21 +02002209 if (!(s->flags & SF_ERR_MASK))
2210 s->flags |= SF_ERR_INTERNAL;
2211 goto return_error;
2212
Christopher Faulet93e02d82019-03-08 14:18:50 +01002213 return_bad_res:
Willy Tarreau4781b152021-04-06 13:53:36 +02002214 _HA_ATOMIC_INC(&s->be->be_counters.failed_resp);
Christopher Faulet93e02d82019-03-08 14:18:50 +01002215 if (objt_server(s->target)) {
Willy Tarreau4781b152021-04-06 13:53:36 +02002216 _HA_ATOMIC_INC(&__objt_server(s->target)->counters.failed_resp);
Christopher Faulet93e02d82019-03-08 14:18:50 +01002217 health_adjust(__objt_server(s->target), HANA_STATUS_HTTP_RSP);
2218 }
Willy Tarreau826f3ab2021-02-10 12:07:15 +01002219 stream_inc_http_fail_ctr(s);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002220 if (!(s->flags & SF_ERR_MASK))
Christopher Faulet93e02d82019-03-08 14:18:50 +01002221 s->flags |= SF_ERR_SRVCL;
Christopher Fauletb8a53712019-12-16 11:29:38 +01002222 /* fall through */
Christopher Faulete0768eb2018-10-03 16:38:02 +02002223
Christopher Faulet93e02d82019-03-08 14:18:50 +01002224 return_error:
Christopher Faulete0768eb2018-10-03 16:38:02 +02002225 /* don't send any error message as we're in the body */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02002226 http_reply_and_close(s, txn->status, NULL);
Christopher Fauletf2b02cf2023-01-13 11:02:28 +01002227 http_set_term_flags(s);
2228 stream_inc_http_fail_ctr(s);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01002229 DBG_TRACE_DEVEL("leaving on error",
2230 STRM_EV_STRM_ANA|STRM_EV_HTTP_ANA|STRM_EV_HTTP_ERR, s, txn);
Christopher Faulete0768eb2018-10-03 16:38:02 +02002231 return 0;
2232}
2233
Christopher Fauletf2824e62018-10-01 12:12:37 +02002234/* Perform an HTTP redirect based on the information in <rule>. The function
Willy Tarreaubc1223b2021-09-02 16:54:33 +02002235 * returns zero in case of an irrecoverable error such as too large a request
2236 * to build a valid response, 1 in case of successful redirect (hence the rule
2237 * is final), or 2 if the rule has to be silently skipped.
Christopher Fauletf2824e62018-10-01 12:12:37 +02002238 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02002239int http_apply_redirect_rule(struct redirect_rule *rule, struct stream *s, struct http_txn *txn)
Christopher Fauletf2824e62018-10-01 12:12:37 +02002240{
Christopher Faulet99daf282018-11-28 22:58:13 +01002241 struct channel *req = &s->req;
2242 struct channel *res = &s->res;
2243 struct htx *htx;
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01002244 struct htx_sl *sl;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002245 struct buffer *chunk;
Christopher Faulet99daf282018-11-28 22:58:13 +01002246 struct ist status, reason, location;
2247 unsigned int flags;
Christopher Fauleteab17572022-04-26 20:34:38 +02002248 int ret = 1, close = 0; /* Try to keep the connection alive byt default */
Christopher Fauletf2824e62018-10-01 12:12:37 +02002249
2250 chunk = alloc_trash_chunk();
Christopher Fauletb8a53712019-12-16 11:29:38 +01002251 if (!chunk) {
2252 if (!(s->flags & SF_ERR_MASK))
2253 s->flags |= SF_ERR_RESOURCE;
Christopher Faulet99daf282018-11-28 22:58:13 +01002254 goto fail;
Christopher Fauletb8a53712019-12-16 11:29:38 +01002255 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02002256
Christopher Faulet99daf282018-11-28 22:58:13 +01002257 /*
2258 * Create the location
2259 */
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01002260 htx = htxbuf(&req->buf);
Christopher Fauletf2824e62018-10-01 12:12:37 +02002261 switch(rule->type) {
Christopher Faulet99daf282018-11-28 22:58:13 +01002262 case REDIRECT_TYPE_SCHEME: {
2263 struct http_hdr_ctx ctx;
2264 struct ist path, host;
Amaury Denoyellec453f952021-07-06 11:40:12 +02002265 struct http_uri_parser parser;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002266
Christopher Faulet99daf282018-11-28 22:58:13 +01002267 host = ist("");
2268 ctx.blk = NULL;
2269 if (http_find_header(htx, ist("Host"), &ctx, 0))
2270 host = ctx.value;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002271
Christopher Faulet297fbb42019-05-13 14:41:27 +02002272 sl = http_get_stline(htx);
Amaury Denoyellec453f952021-07-06 11:40:12 +02002273 parser = http_uri_parser_init(htx_sl_req_uri(sl));
2274 path = http_parse_path(&parser);
Christopher Faulet99daf282018-11-28 22:58:13 +01002275 /* build message using path */
Tim Duesterhused526372020-03-05 17:56:33 +01002276 if (isttest(path)) {
Christopher Faulet99daf282018-11-28 22:58:13 +01002277 if (rule->flags & REDIRECT_FLAG_DROP_QS) {
2278 int qs = 0;
2279 while (qs < path.len) {
2280 if (*(path.ptr + qs) == '?') {
2281 path.len = qs;
2282 break;
2283 }
2284 qs++;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002285 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02002286 }
2287 }
Christopher Faulet99daf282018-11-28 22:58:13 +01002288 else
2289 path = ist("/");
Christopher Fauletf2824e62018-10-01 12:12:37 +02002290
Christopher Faulet99daf282018-11-28 22:58:13 +01002291 if (rule->rdr_str) { /* this is an old "redirect" rule */
2292 /* add scheme */
2293 if (!chunk_memcat(chunk, rule->rdr_str, rule->rdr_len))
2294 goto fail;
2295 }
2296 else {
2297 /* add scheme with executing log format */
2298 chunk->data += build_logline(s, chunk->area + chunk->data,
2299 chunk->size - chunk->data,
2300 &rule->rdr_fmt);
2301 }
2302 /* add "://" + host + path */
2303 if (!chunk_memcat(chunk, "://", 3) ||
2304 !chunk_memcat(chunk, host.ptr, host.len) ||
2305 !chunk_memcat(chunk, path.ptr, path.len))
2306 goto fail;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002307
Christopher Faulet99daf282018-11-28 22:58:13 +01002308 /* append a slash at the end of the location if needed and missing */
2309 if (chunk->data && chunk->area[chunk->data - 1] != '/' &&
2310 (rule->flags & REDIRECT_FLAG_APPEND_SLASH)) {
2311 if (chunk->data + 1 >= chunk->size)
2312 goto fail;
2313 chunk->area[chunk->data++] = '/';
2314 }
2315 break;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002316 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02002317
Christopher Faulet99daf282018-11-28 22:58:13 +01002318 case REDIRECT_TYPE_PREFIX: {
2319 struct ist path;
Amaury Denoyellec453f952021-07-06 11:40:12 +02002320 struct http_uri_parser parser;
Christopher Faulet99daf282018-11-28 22:58:13 +01002321
Christopher Faulet297fbb42019-05-13 14:41:27 +02002322 sl = http_get_stline(htx);
Amaury Denoyellec453f952021-07-06 11:40:12 +02002323 parser = http_uri_parser_init(htx_sl_req_uri(sl));
2324 path = http_parse_path(&parser);
Christopher Faulet99daf282018-11-28 22:58:13 +01002325 /* build message using path */
Tim Duesterhused526372020-03-05 17:56:33 +01002326 if (isttest(path)) {
Christopher Faulet99daf282018-11-28 22:58:13 +01002327 if (rule->flags & REDIRECT_FLAG_DROP_QS) {
2328 int qs = 0;
2329 while (qs < path.len) {
2330 if (*(path.ptr + qs) == '?') {
2331 path.len = qs;
2332 break;
2333 }
2334 qs++;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002335 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02002336 }
2337 }
Christopher Faulet99daf282018-11-28 22:58:13 +01002338 else
2339 path = ist("/");
Christopher Fauletf2824e62018-10-01 12:12:37 +02002340
Christopher Faulet99daf282018-11-28 22:58:13 +01002341 if (rule->rdr_str) { /* this is an old "redirect" rule */
2342 /* add prefix. Note that if prefix == "/", we don't want to
2343 * add anything, otherwise it makes it hard for the user to
2344 * configure a self-redirection.
2345 */
2346 if (rule->rdr_len != 1 || *rule->rdr_str != '/') {
2347 if (!chunk_memcat(chunk, rule->rdr_str, rule->rdr_len))
2348 goto fail;
2349 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02002350 }
Christopher Faulet99daf282018-11-28 22:58:13 +01002351 else {
2352 /* add prefix with executing log format */
2353 chunk->data += build_logline(s, chunk->area + chunk->data,
2354 chunk->size - chunk->data,
2355 &rule->rdr_fmt);
2356 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02002357
Christopher Faulet99daf282018-11-28 22:58:13 +01002358 /* add path */
2359 if (!chunk_memcat(chunk, path.ptr, path.len))
2360 goto fail;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002361
Christopher Faulet99daf282018-11-28 22:58:13 +01002362 /* append a slash at the end of the location if needed and missing */
2363 if (chunk->data && chunk->area[chunk->data - 1] != '/' &&
2364 (rule->flags & REDIRECT_FLAG_APPEND_SLASH)) {
2365 if (chunk->data + 1 >= chunk->size)
2366 goto fail;
2367 chunk->area[chunk->data++] = '/';
2368 }
2369 break;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002370 }
Christopher Faulet99daf282018-11-28 22:58:13 +01002371 case REDIRECT_TYPE_LOCATION:
2372 default:
2373 if (rule->rdr_str) { /* this is an old "redirect" rule */
2374 /* add location */
2375 if (!chunk_memcat(chunk, rule->rdr_str, rule->rdr_len))
2376 goto fail;
2377 }
2378 else {
2379 /* add location with executing log format */
Willy Tarreaubc1223b2021-09-02 16:54:33 +02002380 int len = build_logline(s, chunk->area + chunk->data,
2381 chunk->size - chunk->data,
2382 &rule->rdr_fmt);
Christopher Fauleteab17572022-04-26 20:34:38 +02002383 if (!len && rule->flags & REDIRECT_FLAG_IGNORE_EMPTY) {
2384 ret = 2;
2385 goto out;
2386 }
Willy Tarreaubc1223b2021-09-02 16:54:33 +02002387
2388 chunk->data += len;
Christopher Faulet99daf282018-11-28 22:58:13 +01002389 }
2390 break;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002391 }
Christopher Faulet99daf282018-11-28 22:58:13 +01002392 location = ist2(chunk->area, chunk->data);
2393
2394 /*
2395 * Create the 30x response
2396 */
2397 switch (rule->code) {
2398 case 308:
2399 status = ist("308");
2400 reason = ist("Permanent Redirect");
2401 break;
2402 case 307:
2403 status = ist("307");
2404 reason = ist("Temporary Redirect");
2405 break;
2406 case 303:
2407 status = ist("303");
2408 reason = ist("See Other");
2409 break;
2410 case 301:
2411 status = ist("301");
2412 reason = ist("Moved Permanently");
2413 break;
2414 case 302:
2415 default:
2416 status = ist("302");
2417 reason = ist("Found");
2418 break;
2419 }
2420
Christopher Faulet08e66462019-05-23 16:44:59 +02002421 if (!(txn->req.flags & HTTP_MSGF_BODYLESS) && txn->req.msg_state != HTTP_MSG_DONE)
2422 close = 1;
2423
Christopher Faulet99daf282018-11-28 22:58:13 +01002424 htx = htx_from_buf(&res->buf);
Kevin Zhu96b36392020-01-07 09:42:55 +01002425 /* Trim any possible response */
2426 channel_htx_truncate(&s->res, htx);
Christopher Faulet617ec5c2023-10-17 11:43:43 +02002427 flags = (HTX_SL_F_IS_RESP|HTX_SL_F_VER_11|HTX_SL_F_XFER_LEN|HTX_SL_F_CLEN|HTX_SL_F_BODYLESS);
Christopher Faulet99daf282018-11-28 22:58:13 +01002428 sl = htx_add_stline(htx, HTX_BLK_RES_SL, flags, ist("HTTP/1.1"), status, reason);
2429 if (!sl)
2430 goto fail;
2431 sl->info.res.status = rule->code;
2432 s->txn->status = rule->code;
2433
Christopher Faulet08e66462019-05-23 16:44:59 +02002434 if (close && !htx_add_header(htx, ist("Connection"), ist("close")))
2435 goto fail;
2436
2437 if (!htx_add_header(htx, ist("Content-length"), ist("0")) ||
Christopher Faulet99daf282018-11-28 22:58:13 +01002438 !htx_add_header(htx, ist("Location"), location))
2439 goto fail;
2440
2441 if (rule->code == 302 || rule->code == 303 || rule->code == 307) {
2442 if (!htx_add_header(htx, ist("Cache-Control"), ist("no-cache")))
2443 goto fail;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002444 }
2445
2446 if (rule->cookie_len) {
Christopher Faulet99daf282018-11-28 22:58:13 +01002447 if (!htx_add_header(htx, ist("Set-Cookie"), ist2(rule->cookie_str, rule->cookie_len)))
2448 goto fail;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002449 }
2450
Christopher Fauletd1ac2b92020-12-02 19:12:22 +01002451 if (!htx_add_endof(htx, HTX_BLK_EOH))
Christopher Faulet99daf282018-11-28 22:58:13 +01002452 goto fail;
2453
Christopher Fauletd1ac2b92020-12-02 19:12:22 +01002454 htx->flags |= HTX_FL_EOM;
Kevin Zhu96b36392020-01-07 09:42:55 +01002455 htx_to_buf(htx, &res->buf);
Christopher Fauleta72a7e42020-01-28 09:28:11 +01002456 if (!http_forward_proxy_resp(s, 1))
2457 goto fail;
Christopher Faulet99daf282018-11-28 22:58:13 +01002458
Christopher Faulet60b33a52020-01-28 09:18:10 +01002459 if (rule->flags & REDIRECT_FLAG_FROM_REQ) {
2460 /* let's log the request time */
Willy Tarreau69530f52023-04-28 09:16:15 +02002461 s->logs.request_ts = now_ns;
Christopher Fauletd3475882021-10-04 14:16:46 +02002462 req->analysers &= AN_REQ_FLT_END;
Christopher Faulet99daf282018-11-28 22:58:13 +01002463
Christopher Faulet60b33a52020-01-28 09:18:10 +01002464 if (s->sess->fe == s->be) /* report it if the request was intercepted by the frontend */
Willy Tarreau4781b152021-04-06 13:53:36 +02002465 _HA_ATOMIC_INC(&s->sess->fe->fe_counters.intercepted_req);
Christopher Faulet60b33a52020-01-28 09:18:10 +01002466 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02002467
2468 if (!(s->flags & SF_ERR_MASK))
2469 s->flags |= SF_ERR_LOCAL;
Christopher Faulet4a66c942023-01-13 09:43:21 +01002470 http_set_term_flags(s);
Christopher Fauletf2824e62018-10-01 12:12:37 +02002471
Christopher Fauleteab17572022-04-26 20:34:38 +02002472 out:
Christopher Faulet99daf282018-11-28 22:58:13 +01002473 free_trash_chunk(chunk);
Christopher Fauleteab17572022-04-26 20:34:38 +02002474 return ret;
Christopher Faulet99daf282018-11-28 22:58:13 +01002475
2476 fail:
2477 /* If an error occurred, remove the incomplete HTTP response from the
2478 * buffer */
Christopher Faulet202c6ce2019-01-07 14:57:35 +01002479 channel_htx_truncate(res, htxbuf(&res->buf));
Christopher Fauleteab17572022-04-26 20:34:38 +02002480 ret = 0;
2481 goto out;
Christopher Fauletf2824e62018-10-01 12:12:37 +02002482}
2483
Christopher Faulet18c13d32022-05-16 11:43:10 +02002484/* This function filters the request header names to only allow [0-9a-zA-Z-]
2485 * characters. Depending on the proxy configuration, headers with a name not
2486 * matching this charset are removed or the request is rejected with a
2487 * 403-Forbidden response if such name are found. It returns HTTP_RULE_RES_CONT
2488 * to continue the request processing or HTTP_RULE_RES_DENY if the request is
2489 * rejected.
2490 */
2491static enum rule_result http_req_restrict_header_names(struct stream *s, struct htx *htx, struct proxy *px)
2492{
2493 struct htx_blk *blk;
2494 enum rule_result rule_ret = HTTP_RULE_RES_CONT;
2495
2496 blk = htx_get_first_blk(htx);
2497 while (blk) {
2498 enum htx_blk_type type = htx_get_blk_type(blk);
2499
2500 if (type == HTX_BLK_HDR) {
2501 struct ist n = htx_get_blk_name(htx, blk);
Mateusz Malek4b85a962022-08-17 14:22:09 +02002502 int i, end = istlen(n);
Christopher Faulet18c13d32022-05-16 11:43:10 +02002503
Mateusz Malek4b85a962022-08-17 14:22:09 +02002504 for (i = 0; i < end; i++) {
Christopher Faulet18c13d32022-05-16 11:43:10 +02002505 if (!isalnum((unsigned char)n.ptr[i]) && n.ptr[i] != '-') {
Mateusz Malek4b85a962022-08-17 14:22:09 +02002506 break;
Christopher Faulet18c13d32022-05-16 11:43:10 +02002507 }
2508 }
Mateusz Malek4b85a962022-08-17 14:22:09 +02002509
2510 if (i < end) {
2511 /* Disallowed character found - block the request or remove the header */
2512 if (px->options2 & PR_O2_RSTRICT_REQ_HDR_NAMES_BLK)
2513 goto block;
2514 blk = htx_remove_blk(htx, blk);
2515 continue;
2516 }
Christopher Faulet18c13d32022-05-16 11:43:10 +02002517 }
2518 if (type == HTX_BLK_EOH)
2519 break;
2520
2521 blk = htx_get_next_blk(htx, blk);
2522 }
2523 out:
2524 return rule_ret;
2525 block:
2526 /* Block the request returning a 403-Forbidden response */
2527 s->txn->status = 403;
2528 rule_ret = HTTP_RULE_RES_DENY;
2529 goto out;
2530}
2531
Christopher Faulet92d34fe2019-12-17 09:20:34 +01002532/* Replace all headers matching the name <name>. The header value is replaced if
2533 * it matches the regex <re>. <str> is used for the replacement. If <full> is
2534 * set to 1, the full-line is matched and replaced. Otherwise, comma-separated
2535 * values are evaluated one by one. It returns 0 on success and -1 on error.
2536 */
2537int http_replace_hdrs(struct stream* s, struct htx *htx, struct ist name,
2538 const char *str, struct my_regex *re, int full)
Christopher Faulet72333522018-10-24 11:25:02 +02002539{
2540 struct http_hdr_ctx ctx;
Christopher Faulet72333522018-10-24 11:25:02 +02002541
Christopher Faulet72333522018-10-24 11:25:02 +02002542 ctx.blk = NULL;
Christopher Faulet92d34fe2019-12-17 09:20:34 +01002543 while (http_find_header(htx, name, &ctx, full)) {
Christopher Faulet80707f72023-08-04 16:51:11 +02002544 struct buffer *output = get_trash_chunk();
2545
Christopher Faulet72333522018-10-24 11:25:02 +02002546 if (!regex_exec_match2(re, ctx.value.ptr, ctx.value.len, MAX_MATCH, pmatch, 0))
2547 continue;
2548
2549 output->data = exp_replace(output->area, output->size, ctx.value.ptr, str, pmatch);
2550 if (output->data == -1)
2551 return -1;
2552 if (!http_replace_header_value(htx, &ctx, ist2(output->area, output->data)))
2553 return -1;
2554 }
2555 return 0;
2556}
2557
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002558/* This function executes one of the set-{method,path,query,uri} actions. It
2559 * takes the string from the variable 'replace' with length 'len', then modifies
2560 * the relevant part of the request line accordingly. Then it updates various
2561 * pointers to the next elements which were moved, and the total buffer length.
2562 * It finds the action to be performed in p[2], previously filled by function
2563 * parse_set_req_line(). It returns 0 in case of success, -1 in case of internal
2564 * error, though this can be revisited when this code is finally exploited.
2565 *
2566 * 'action' can be '0' to replace method, '1' to replace path, '2' to replace
Christopher Faulet312294f2020-09-02 17:17:44 +02002567 * query string, 3 to replace uri or 4 to replace the path+query.
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002568 *
2569 * In query string case, the mark question '?' must be set at the start of the
2570 * string by the caller, event if the replacement query string is empty.
2571 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02002572int http_req_replace_stline(int action, const char *replace, int len,
2573 struct proxy *px, struct stream *s)
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002574{
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01002575 struct htx *htx = htxbuf(&s->req.buf);
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002576
2577 switch (action) {
2578 case 0: // method
2579 if (!http_replace_req_meth(htx, ist2(replace, len)))
2580 return -1;
2581 break;
2582
2583 case 1: // path
Christopher Fauletb8ce5052020-08-31 16:11:57 +02002584 if (!http_replace_req_path(htx, ist2(replace, len), 0))
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002585 return -1;
2586 break;
2587
2588 case 2: // query
2589 if (!http_replace_req_query(htx, ist2(replace, len)))
2590 return -1;
2591 break;
2592
2593 case 3: // uri
2594 if (!http_replace_req_uri(htx, ist2(replace, len)))
2595 return -1;
2596 break;
2597
Christopher Faulet312294f2020-09-02 17:17:44 +02002598 case 4: // path + query
2599 if (!http_replace_req_path(htx, ist2(replace, len), 1))
2600 return -1;
2601 break;
2602
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002603 default:
2604 return -1;
2605 }
2606 return 0;
2607}
2608
2609/* This function replace the HTTP status code and the associated message. The
Christopher Faulete00d06c2019-12-16 17:18:42 +01002610 * variable <status> contains the new status code. This function never fails. It
2611 * returns 0 in case of success, -1 in case of internal error.
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002612 */
Christopher Faulet96bff762019-12-17 13:46:18 +01002613int http_res_set_status(unsigned int status, struct ist reason, struct stream *s)
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002614{
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01002615 struct htx *htx = htxbuf(&s->res.buf);
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002616 char *res;
2617
2618 chunk_reset(&trash);
2619 res = ultoa_o(status, trash.area, trash.size);
2620 trash.data = res - trash.area;
2621
2622 /* Do we have a custom reason format string? */
Tim Duesterhuse296d3e2020-03-05 17:56:31 +01002623 if (!isttest(reason)) {
Christopher Faulet96bff762019-12-17 13:46:18 +01002624 const char *str = http_get_reason(status);
Tim Duesterhusdcf753a2021-03-04 17:31:47 +01002625 reason = ist(str);
Christopher Faulet96bff762019-12-17 13:46:18 +01002626 }
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002627
Christopher Fauletbde2c4c2020-08-31 16:43:34 +02002628 if (!http_replace_res_status(htx, ist2(trash.area, trash.data), reason))
Christopher Faulete00d06c2019-12-16 17:18:42 +01002629 return -1;
Willy Tarreau640e2532023-01-10 14:50:44 +01002630 s->txn->status = status;
Christopher Faulete00d06c2019-12-16 17:18:42 +01002631 return 0;
Christopher Faulet8d8ac192018-10-24 11:27:39 +02002632}
2633
Christopher Faulet3e964192018-10-24 11:39:23 +02002634/* Executes the http-request rules <rules> for stream <s>, proxy <px> and
2635 * transaction <txn>. Returns the verdict of the first rule that prevents
2636 * further processing of the request (auth, deny, ...), and defaults to
2637 * HTTP_RULE_RES_STOP if it executed all rules or stopped on an allow, or
2638 * HTTP_RULE_RES_CONT if the last rule was reached. It may set the TX_CLTARPIT
2639 * on txn->flags if it encounters a tarpit rule. If <deny_status> is not NULL
2640 * and a deny/tarpit rule is matched, it will be filled with this rule's deny
2641 * status.
2642 */
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002643static enum rule_result http_req_get_intercept_rule(struct proxy *px, struct list *def_rules,
2644 struct list *rules, struct stream *s)
Christopher Faulet3e964192018-10-24 11:39:23 +02002645{
2646 struct session *sess = strm_sess(s);
2647 struct http_txn *txn = s->txn;
Christopher Faulet3e964192018-10-24 11:39:23 +02002648 struct act_rule *rule;
Christopher Faulet3e964192018-10-24 11:39:23 +02002649 enum rule_result rule_ret = HTTP_RULE_RES_CONT;
Christopher Faulet105ba6c2019-12-18 14:41:51 +01002650 int act_opts = 0;
Christopher Faulet3e964192018-10-24 11:39:23 +02002651
Christopher Faulet3e964192018-10-24 11:39:23 +02002652 /* If "the current_rule_list" match the executed rule list, we are in
2653 * resume condition. If a resume is needed it is always in the action
2654 * and never in the ACL or converters. In this case, we initialise the
2655 * current rule, and go to the action execution point.
2656 */
2657 if (s->current_rule) {
2658 rule = s->current_rule;
2659 s->current_rule = NULL;
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002660 if (s->current_rule_list == rules || (def_rules && s->current_rule_list == def_rules))
Christopher Faulet3e964192018-10-24 11:39:23 +02002661 goto resume_execution;
2662 }
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002663 s->current_rule_list = ((!def_rules || s->current_rule_list == def_rules) ? rules : def_rules);
Christopher Faulet3e964192018-10-24 11:39:23 +02002664
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002665 restart:
Christopher Faulet1aea50e2020-01-17 16:03:53 +01002666 /* start the ruleset evaluation in strict mode */
2667 txn->req.flags &= ~HTTP_MSGF_SOFT_RW;
Christopher Faulet46f95542019-12-20 10:07:22 +01002668
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002669 list_for_each_entry(rule, s->current_rule_list, list) {
Christopher Faulet3e964192018-10-24 11:39:23 +02002670 /* check optional condition */
2671 if (rule->cond) {
2672 int ret;
2673
2674 ret = acl_exec_cond(rule->cond, px, sess, s, SMP_OPT_DIR_REQ|SMP_OPT_FINAL);
2675 ret = acl_pass(ret);
2676
2677 if (rule->cond->pol == ACL_COND_UNLESS)
2678 ret = !ret;
2679
2680 if (!ret) /* condition not matched */
2681 continue;
2682 }
2683
Christopher Faulet105ba6c2019-12-18 14:41:51 +01002684 act_opts |= ACT_OPT_FIRST;
Christopher Faulet3e964192018-10-24 11:39:23 +02002685 resume_execution:
Amaury Denoyelle03517732021-05-07 14:25:01 +02002686 if (rule->kw->flags & KWF_EXPERIMENTAL)
2687 mark_tainted(TAINTED_ACTION_EXP_EXECUTED);
2688
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002689 /* Always call the action function if defined */
2690 if (rule->action_ptr) {
Christopher Fauletd7bac882023-04-14 12:05:55 +02002691 if ((s->scf->flags & SC_FL_ERROR) ||
Christopher Fauletca5309a2023-04-17 16:17:32 +02002692 ((s->scf->flags & (SC_FL_EOS|SC_FL_ABRT_DONE)) &&
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002693 (px->options & PR_O_ABRT_CLOSE)))
Christopher Faulet105ba6c2019-12-18 14:41:51 +01002694 act_opts |= ACT_OPT_FINAL;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002695
Christopher Faulet105ba6c2019-12-18 14:41:51 +01002696 switch (rule->action_ptr(rule, px, sess, s, act_opts)) {
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002697 case ACT_RET_CONT:
2698 break;
2699 case ACT_RET_STOP:
2700 rule_ret = HTTP_RULE_RES_STOP;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002701 s->last_rule_file = rule->conf.file;
2702 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002703 goto end;
2704 case ACT_RET_YIELD:
2705 s->current_rule = rule;
2706 rule_ret = HTTP_RULE_RES_YIELD;
2707 goto end;
2708 case ACT_RET_ERR:
2709 rule_ret = HTTP_RULE_RES_ERROR;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002710 s->last_rule_file = rule->conf.file;
2711 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002712 goto end;
2713 case ACT_RET_DONE:
2714 rule_ret = HTTP_RULE_RES_DONE;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002715 s->last_rule_file = rule->conf.file;
2716 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002717 goto end;
2718 case ACT_RET_DENY:
Christopher Fauletb58f62b2020-01-13 16:40:13 +01002719 if (txn->status == -1)
2720 txn->status = 403;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002721 rule_ret = HTTP_RULE_RES_DENY;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002722 s->last_rule_file = rule->conf.file;
2723 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002724 goto end;
2725 case ACT_RET_ABRT:
2726 rule_ret = HTTP_RULE_RES_ABRT;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002727 s->last_rule_file = rule->conf.file;
2728 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002729 goto end;
2730 case ACT_RET_INV:
2731 rule_ret = HTTP_RULE_RES_BADREQ;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002732 s->last_rule_file = rule->conf.file;
2733 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002734 goto end;
2735 }
2736 continue; /* eval the next rule */
2737 }
2738
2739 /* If not action function defined, check for known actions */
Christopher Faulet3e964192018-10-24 11:39:23 +02002740 switch (rule->action) {
2741 case ACT_ACTION_ALLOW:
2742 rule_ret = HTTP_RULE_RES_STOP;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002743 s->last_rule_file = rule->conf.file;
2744 s->last_rule_line = rule->conf.line;
Christopher Faulet3e964192018-10-24 11:39:23 +02002745 goto end;
2746
2747 case ACT_ACTION_DENY:
Christopher Faulet5cb513a2020-05-13 17:56:56 +02002748 txn->status = rule->arg.http_reply->status;
2749 txn->http_reply = rule->arg.http_reply;
Christopher Faulet3e964192018-10-24 11:39:23 +02002750 rule_ret = HTTP_RULE_RES_DENY;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002751 s->last_rule_file = rule->conf.file;
2752 s->last_rule_line = rule->conf.line;
Christopher Faulet3e964192018-10-24 11:39:23 +02002753 goto end;
2754
2755 case ACT_HTTP_REQ_TARPIT:
2756 txn->flags |= TX_CLTARPIT;
Christopher Faulet5cb513a2020-05-13 17:56:56 +02002757 txn->status = rule->arg.http_reply->status;
2758 txn->http_reply = rule->arg.http_reply;
Christopher Faulet3e964192018-10-24 11:39:23 +02002759 rule_ret = HTTP_RULE_RES_DENY;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002760 s->last_rule_file = rule->conf.file;
2761 s->last_rule_line = rule->conf.line;
Christopher Faulet3e964192018-10-24 11:39:23 +02002762 goto end;
2763
Willy Tarreaubc1223b2021-09-02 16:54:33 +02002764 case ACT_HTTP_REDIR: {
2765 int ret = http_apply_redirect_rule(rule->arg.redir, s, txn);
2766
2767 if (ret == 2) // 2 == skip
2768 break;
2769
2770 rule_ret = ret ? HTTP_RULE_RES_ABRT : HTTP_RULE_RES_ERROR;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002771 s->last_rule_file = rule->conf.file;
2772 s->last_rule_line = rule->conf.line;
Christopher Faulet3e964192018-10-24 11:39:23 +02002773 goto end;
Willy Tarreaubc1223b2021-09-02 16:54:33 +02002774 }
Christopher Faulet3e964192018-10-24 11:39:23 +02002775
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002776 /* other flags exists, but normally, they never be matched. */
Christopher Faulet3e964192018-10-24 11:39:23 +02002777 default:
2778 break;
2779 }
2780 }
2781
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002782 if (def_rules && s->current_rule_list == def_rules) {
2783 s->current_rule_list = rules;
2784 goto restart;
2785 }
2786
Christopher Faulet3e964192018-10-24 11:39:23 +02002787 end:
Christopher Faulet1aea50e2020-01-17 16:03:53 +01002788 /* if the ruleset evaluation is finished reset the strict mode */
Christopher Faulet46f95542019-12-20 10:07:22 +01002789 if (rule_ret != HTTP_RULE_RES_YIELD)
Christopher Faulet1aea50e2020-01-17 16:03:53 +01002790 txn->req.flags &= ~HTTP_MSGF_SOFT_RW;
Christopher Faulet46f95542019-12-20 10:07:22 +01002791
Christopher Faulet3e964192018-10-24 11:39:23 +02002792 /* we reached the end of the rules, nothing to report */
2793 return rule_ret;
2794}
2795
2796/* Executes the http-response rules <rules> for stream <s> and proxy <px>. It
2797 * returns one of 5 possible statuses: HTTP_RULE_RES_CONT, HTTP_RULE_RES_STOP,
2798 * HTTP_RULE_RES_DONE, HTTP_RULE_RES_YIELD, or HTTP_RULE_RES_BADREQ. If *CONT
2799 * is returned, the process can continue the evaluation of next rule list. If
2800 * *STOP or *DONE is returned, the process must stop the evaluation. If *BADREQ
2801 * is returned, it means the operation could not be processed and a server error
Christopher Fauleta53abad2020-05-13 08:12:22 +02002802 * must be returned. If *YIELD is returned, the caller must call again the
2803 * function with the same context.
Christopher Faulet3e964192018-10-24 11:39:23 +02002804 */
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002805static enum rule_result http_res_get_intercept_rule(struct proxy *px, struct list *def_rules,
2806 struct list *rules, struct stream *s)
Christopher Faulet3e964192018-10-24 11:39:23 +02002807{
2808 struct session *sess = strm_sess(s);
2809 struct http_txn *txn = s->txn;
Christopher Faulet3e964192018-10-24 11:39:23 +02002810 struct act_rule *rule;
Christopher Faulet3e964192018-10-24 11:39:23 +02002811 enum rule_result rule_ret = HTTP_RULE_RES_CONT;
Christopher Faulet105ba6c2019-12-18 14:41:51 +01002812 int act_opts = 0;
Christopher Faulet3e964192018-10-24 11:39:23 +02002813
Christopher Faulet3e964192018-10-24 11:39:23 +02002814 /* If "the current_rule_list" match the executed rule list, we are in
2815 * resume condition. If a resume is needed it is always in the action
2816 * and never in the ACL or converters. In this case, we initialise the
2817 * current rule, and go to the action execution point.
2818 */
2819 if (s->current_rule) {
2820 rule = s->current_rule;
2821 s->current_rule = NULL;
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002822 if (s->current_rule_list == rules || (def_rules && s->current_rule_list == def_rules))
Christopher Faulet3e964192018-10-24 11:39:23 +02002823 goto resume_execution;
2824 }
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002825 s->current_rule_list = ((!def_rules || s->current_rule_list == def_rules) ? rules : def_rules);
2826
2827 restart:
Christopher Faulet3e964192018-10-24 11:39:23 +02002828
Christopher Faulet1aea50e2020-01-17 16:03:53 +01002829 /* start the ruleset evaluation in strict mode */
2830 txn->rsp.flags &= ~HTTP_MSGF_SOFT_RW;
Christopher Faulet46f95542019-12-20 10:07:22 +01002831
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002832 list_for_each_entry(rule, s->current_rule_list, list) {
Christopher Faulet3e964192018-10-24 11:39:23 +02002833 /* check optional condition */
2834 if (rule->cond) {
2835 int ret;
2836
2837 ret = acl_exec_cond(rule->cond, px, sess, s, SMP_OPT_DIR_RES|SMP_OPT_FINAL);
2838 ret = acl_pass(ret);
2839
2840 if (rule->cond->pol == ACL_COND_UNLESS)
2841 ret = !ret;
2842
2843 if (!ret) /* condition not matched */
2844 continue;
2845 }
2846
Christopher Faulet105ba6c2019-12-18 14:41:51 +01002847 act_opts |= ACT_OPT_FIRST;
Christopher Faulet3e964192018-10-24 11:39:23 +02002848resume_execution:
Amaury Denoyelle03517732021-05-07 14:25:01 +02002849 if (rule->kw->flags & KWF_EXPERIMENTAL)
2850 mark_tainted(TAINTED_ACTION_EXP_EXECUTED);
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002851
2852 /* Always call the action function if defined */
2853 if (rule->action_ptr) {
Christopher Fauletd7bac882023-04-14 12:05:55 +02002854 if ((s->scf->flags & SC_FL_ERROR) ||
Christopher Fauletca5309a2023-04-17 16:17:32 +02002855 ((s->scf->flags & (SC_FL_EOS|SC_FL_ABRT_DONE)) &&
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002856 (px->options & PR_O_ABRT_CLOSE)))
Christopher Faulet105ba6c2019-12-18 14:41:51 +01002857 act_opts |= ACT_OPT_FINAL;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002858
Christopher Faulet105ba6c2019-12-18 14:41:51 +01002859 switch (rule->action_ptr(rule, px, sess, s, act_opts)) {
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002860 case ACT_RET_CONT:
2861 break;
2862 case ACT_RET_STOP:
2863 rule_ret = HTTP_RULE_RES_STOP;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002864 s->last_rule_file = rule->conf.file;
2865 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002866 goto end;
2867 case ACT_RET_YIELD:
2868 s->current_rule = rule;
2869 rule_ret = HTTP_RULE_RES_YIELD;
2870 goto end;
2871 case ACT_RET_ERR:
2872 rule_ret = HTTP_RULE_RES_ERROR;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002873 s->last_rule_file = rule->conf.file;
2874 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002875 goto end;
2876 case ACT_RET_DONE:
2877 rule_ret = HTTP_RULE_RES_DONE;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002878 s->last_rule_file = rule->conf.file;
2879 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002880 goto end;
2881 case ACT_RET_DENY:
Christopher Fauletb58f62b2020-01-13 16:40:13 +01002882 if (txn->status == -1)
2883 txn->status = 502;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002884 rule_ret = HTTP_RULE_RES_DENY;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002885 s->last_rule_file = rule->conf.file;
2886 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002887 goto end;
2888 case ACT_RET_ABRT:
2889 rule_ret = HTTP_RULE_RES_ABRT;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002890 s->last_rule_file = rule->conf.file;
2891 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002892 goto end;
2893 case ACT_RET_INV:
2894 rule_ret = HTTP_RULE_RES_BADREQ;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002895 s->last_rule_file = rule->conf.file;
2896 s->last_rule_line = rule->conf.line;
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002897 goto end;
2898 }
2899 continue; /* eval the next rule */
2900 }
2901
2902 /* If not action function defined, check for known actions */
Christopher Faulet3e964192018-10-24 11:39:23 +02002903 switch (rule->action) {
2904 case ACT_ACTION_ALLOW:
2905 rule_ret = HTTP_RULE_RES_STOP; /* "allow" rules are OK */
Willy Tarreauc6dae862022-03-09 17:23:10 +01002906 s->last_rule_file = rule->conf.file;
2907 s->last_rule_line = rule->conf.line;
Christopher Faulet3e964192018-10-24 11:39:23 +02002908 goto end;
2909
2910 case ACT_ACTION_DENY:
Christopher Faulet5cb513a2020-05-13 17:56:56 +02002911 txn->status = rule->arg.http_reply->status;
2912 txn->http_reply = rule->arg.http_reply;
Christopher Faulet3a26bee2019-12-16 12:47:40 +01002913 rule_ret = HTTP_RULE_RES_DENY;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002914 s->last_rule_file = rule->conf.file;
2915 s->last_rule_line = rule->conf.line;
Christopher Faulet3e964192018-10-24 11:39:23 +02002916 goto end;
2917
Willy Tarreaubc1223b2021-09-02 16:54:33 +02002918 case ACT_HTTP_REDIR: {
2919 int ret = http_apply_redirect_rule(rule->arg.redir, s, txn);
Christopher Faulet3e964192018-10-24 11:39:23 +02002920
Willy Tarreaubc1223b2021-09-02 16:54:33 +02002921 if (ret == 2) // 2 == skip
2922 break;
2923
2924 rule_ret = ret ? HTTP_RULE_RES_ABRT : HTTP_RULE_RES_ERROR;
Willy Tarreauc6dae862022-03-09 17:23:10 +01002925 s->last_rule_file = rule->conf.file;
2926 s->last_rule_line = rule->conf.line;
Willy Tarreaubc1223b2021-09-02 16:54:33 +02002927 goto end;
2928 }
Christopher Fauletcd26e8a2019-12-18 11:13:39 +01002929 /* other flags exists, but normally, they never be matched. */
Christopher Faulet3e964192018-10-24 11:39:23 +02002930 default:
2931 break;
2932 }
2933 }
2934
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002935 if (def_rules && s->current_rule_list == def_rules) {
2936 s->current_rule_list = rules;
2937 goto restart;
2938 }
2939
Christopher Faulet3e964192018-10-24 11:39:23 +02002940 end:
Christopher Faulet1aea50e2020-01-17 16:03:53 +01002941 /* if the ruleset evaluation is finished reset the strict mode */
Christopher Faulet46f95542019-12-20 10:07:22 +01002942 if (rule_ret != HTTP_RULE_RES_YIELD)
Christopher Faulet1aea50e2020-01-17 16:03:53 +01002943 txn->rsp.flags &= ~HTTP_MSGF_SOFT_RW;
Christopher Faulet46f95542019-12-20 10:07:22 +01002944
Christopher Faulet3e964192018-10-24 11:39:23 +02002945 /* we reached the end of the rules, nothing to report */
2946 return rule_ret;
2947}
2948
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01002949/* Executes backend and frontend http-after-response rules for the stream <s>,
2950 * in that order. it return 1 on success and 0 on error. It is the caller
2951 * responsibility to catch error or ignore it. If it catches it, this function
2952 * may be called a second time, for the internal error.
2953 */
2954int http_eval_after_res_rules(struct stream *s)
2955{
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002956 struct list *def_rules, *rules;
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01002957 struct session *sess = s->sess;
2958 enum rule_result ret = HTTP_RULE_RES_CONT;
2959
Christopher Faulet507479b2020-05-15 12:29:46 +02002960 /* Eval after-response ruleset only if the reply is not const */
2961 if (s->txn->flags & TX_CONST_REPLY)
2962 goto end;
2963
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01002964 /* prune the request variables if not already done and swap to the response variables. */
2965 if (s->vars_reqres.scope != SCOPE_RES) {
2966 if (!LIST_ISEMPTY(&s->vars_reqres.head))
2967 vars_prune(&s->vars_reqres, s->sess, s);
Willy Tarreaub7bfcb32021-08-31 08:13:25 +02002968 vars_init_head(&s->vars_reqres, SCOPE_RES);
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01002969 }
2970
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002971 def_rules = (s->be->defpx ? &s->be->defpx->http_after_res_rules : NULL);
2972 rules = &s->be->http_after_res_rules;
2973
2974 ret = http_res_get_intercept_rule(s->be, def_rules, rules, s);
Christopher Faulet4c5a5912021-11-09 17:48:39 +01002975 if ((ret == HTTP_RULE_RES_CONT || ret == HTTP_RULE_RES_STOP) && sess->fe != s->be) {
Christopher Fauletd4150ad2021-10-13 15:35:55 +02002976 def_rules = ((sess->fe->defpx && sess->fe->defpx != s->be->defpx) ? &sess->fe->defpx->http_after_res_rules : NULL);
2977 rules = &sess->fe->http_after_res_rules;
2978 ret = http_res_get_intercept_rule(sess->fe, def_rules, rules, s);
2979 }
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01002980
Christopher Faulet507479b2020-05-15 12:29:46 +02002981 end:
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01002982 /* All other codes than CONTINUE, STOP or DONE are forbidden */
2983 return (ret == HTTP_RULE_RES_CONT || ret == HTTP_RULE_RES_STOP || ret == HTTP_RULE_RES_DONE);
2984}
2985
Christopher Fauletfcda7c62018-10-24 11:56:22 +02002986/*
2987 * Manage client-side cookie. It can impact performance by about 2% so it is
2988 * desirable to call it only when needed. This code is quite complex because
2989 * of the multiple very crappy and ambiguous syntaxes we have to support. it
2990 * highly recommended not to touch this part without a good reason !
2991 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02002992static void http_manage_client_side_cookies(struct stream *s, struct channel *req)
Christopher Fauletfcda7c62018-10-24 11:56:22 +02002993{
2994 struct session *sess = s->sess;
2995 struct http_txn *txn = s->txn;
2996 struct htx *htx;
2997 struct http_hdr_ctx ctx;
2998 char *hdr_beg, *hdr_end, *del_from;
2999 char *prev, *att_beg, *att_end, *equal, *val_beg, *val_end, *next;
3000 int preserve_hdr;
3001
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003002 htx = htxbuf(&req->buf);
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003003 ctx.blk = NULL;
3004 while (http_find_header(htx, ist("Cookie"), &ctx, 1)) {
Olivier Houchardf0f42382019-07-22 17:43:46 +02003005 int is_first = 1;
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003006 del_from = NULL; /* nothing to be deleted */
3007 preserve_hdr = 0; /* assume we may kill the whole header */
3008
3009 /* Now look for cookies. Conforming to RFC2109, we have to support
3010 * attributes whose name begin with a '$', and associate them with
3011 * the right cookie, if we want to delete this cookie.
3012 * So there are 3 cases for each cookie read :
3013 * 1) it's a special attribute, beginning with a '$' : ignore it.
3014 * 2) it's a server id cookie that we *MAY* want to delete : save
3015 * some pointers on it (last semi-colon, beginning of cookie...)
3016 * 3) it's an application cookie : we *MAY* have to delete a previous
3017 * "special" cookie.
3018 * At the end of loop, if a "special" cookie remains, we may have to
3019 * remove it. If no application cookie persists in the header, we
3020 * *MUST* delete it.
3021 *
3022 * Note: RFC2965 is unclear about the processing of spaces around
3023 * the equal sign in the ATTR=VALUE form. A careful inspection of
3024 * the RFC explicitly allows spaces before it, and not within the
3025 * tokens (attrs or values). An inspection of RFC2109 allows that
3026 * too but section 10.1.3 lets one think that spaces may be allowed
3027 * after the equal sign too, resulting in some (rare) buggy
3028 * implementations trying to do that. So let's do what servers do.
3029 * Latest ietf draft forbids spaces all around. Also, earlier RFCs
3030 * allowed quoted strings in values, with any possible character
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05003031 * after a backslash, including control chars and delimiters, which
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003032 * causes parsing to become ambiguous. Browsers also allow spaces
3033 * within values even without quotes.
3034 *
3035 * We have to keep multiple pointers in order to support cookie
3036 * removal at the beginning, middle or end of header without
3037 * corrupting the header. All of these headers are valid :
3038 *
3039 * hdr_beg hdr_end
3040 * | |
3041 * v |
3042 * NAME1=VALUE1;NAME2=VALUE2;NAME3=VALUE3 |
3043 * NAME1=VALUE1;NAME2_ONLY ;NAME3=VALUE3 v
3044 * NAME1 = VALUE 1 ; NAME2 = VALUE2 ; NAME3 = VALUE3
3045 * | | | | | | |
3046 * | | | | | | |
3047 * | | | | | | +--> next
3048 * | | | | | +----> val_end
3049 * | | | | +-----------> val_beg
3050 * | | | +--------------> equal
3051 * | | +----------------> att_end
3052 * | +---------------------> att_beg
3053 * +--------------------------> prev
3054 *
3055 */
3056 hdr_beg = ctx.value.ptr;
3057 hdr_end = hdr_beg + ctx.value.len;
3058 for (prev = hdr_beg; prev < hdr_end; prev = next) {
3059 /* Iterate through all cookies on this line */
3060
3061 /* find att_beg */
3062 att_beg = prev;
Olivier Houchardf0f42382019-07-22 17:43:46 +02003063 if (!is_first)
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003064 att_beg++;
Olivier Houchardf0f42382019-07-22 17:43:46 +02003065 is_first = 0;
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003066
3067 while (att_beg < hdr_end && HTTP_IS_SPHT(*att_beg))
3068 att_beg++;
3069
3070 /* find att_end : this is the first character after the last non
3071 * space before the equal. It may be equal to hdr_end.
3072 */
3073 equal = att_end = att_beg;
3074 while (equal < hdr_end) {
3075 if (*equal == '=' || *equal == ',' || *equal == ';')
3076 break;
3077 if (HTTP_IS_SPHT(*equal++))
3078 continue;
3079 att_end = equal;
3080 }
3081
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05003082 /* here, <equal> points to '=', a delimiter or the end. <att_end>
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003083 * is between <att_beg> and <equal>, both may be identical.
3084 */
3085 /* look for end of cookie if there is an equal sign */
3086 if (equal < hdr_end && *equal == '=') {
3087 /* look for the beginning of the value */
3088 val_beg = equal + 1;
3089 while (val_beg < hdr_end && HTTP_IS_SPHT(*val_beg))
3090 val_beg++;
3091
3092 /* find the end of the value, respecting quotes */
3093 next = http_find_cookie_value_end(val_beg, hdr_end);
3094
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05003095 /* make val_end point to the first white space or delimiter after the value */
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003096 val_end = next;
3097 while (val_end > val_beg && HTTP_IS_SPHT(*(val_end - 1)))
3098 val_end--;
3099 }
3100 else
3101 val_beg = val_end = next = equal;
3102
3103 /* We have nothing to do with attributes beginning with
3104 * '$'. However, they will automatically be removed if a
3105 * header before them is removed, since they're supposed
3106 * to be linked together.
3107 */
3108 if (*att_beg == '$')
3109 continue;
3110
3111 /* Ignore cookies with no equal sign */
3112 if (equal == next) {
3113 /* This is not our cookie, so we must preserve it. But if we already
3114 * scheduled another cookie for removal, we cannot remove the
3115 * complete header, but we can remove the previous block itself.
3116 */
3117 preserve_hdr = 1;
3118 if (del_from != NULL) {
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02003119 int delta = http_del_hdr_value(hdr_beg, hdr_end, &del_from, prev);
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003120 val_end += delta;
3121 next += delta;
3122 hdr_end += delta;
3123 prev = del_from;
3124 del_from = NULL;
3125 }
3126 continue;
3127 }
3128
3129 /* if there are spaces around the equal sign, we need to
3130 * strip them otherwise we'll get trouble for cookie captures,
3131 * or even for rewrites. Since this happens extremely rarely,
3132 * it does not hurt performance.
3133 */
3134 if (unlikely(att_end != equal || val_beg > equal + 1)) {
3135 int stripped_before = 0;
3136 int stripped_after = 0;
3137
3138 if (att_end != equal) {
3139 memmove(att_end, equal, hdr_end - equal);
3140 stripped_before = (att_end - equal);
3141 equal += stripped_before;
3142 val_beg += stripped_before;
3143 }
3144
3145 if (val_beg > equal + 1) {
3146 memmove(equal + 1, val_beg, hdr_end + stripped_before - val_beg);
3147 stripped_after = (equal + 1) - val_beg;
3148 val_beg += stripped_after;
3149 stripped_before += stripped_after;
3150 }
3151
3152 val_end += stripped_before;
3153 next += stripped_before;
3154 hdr_end += stripped_before;
3155 }
3156 /* now everything is as on the diagram above */
3157
3158 /* First, let's see if we want to capture this cookie. We check
3159 * that we don't already have a client side cookie, because we
3160 * can only capture one. Also as an optimisation, we ignore
3161 * cookies shorter than the declared name.
3162 */
3163 if (sess->fe->capture_name != NULL && txn->cli_cookie == NULL &&
3164 (val_end - att_beg >= sess->fe->capture_namelen) &&
3165 memcmp(att_beg, sess->fe->capture_name, sess->fe->capture_namelen) == 0) {
3166 int log_len = val_end - att_beg;
3167
3168 if ((txn->cli_cookie = pool_alloc(pool_head_capture)) == NULL) {
3169 ha_alert("HTTP logging : out of memory.\n");
3170 } else {
3171 if (log_len > sess->fe->capture_len)
3172 log_len = sess->fe->capture_len;
3173 memcpy(txn->cli_cookie, att_beg, log_len);
3174 txn->cli_cookie[log_len] = 0;
3175 }
3176 }
3177
3178 /* Persistence cookies in passive, rewrite or insert mode have the
3179 * following form :
3180 *
3181 * Cookie: NAME=SRV[|<lastseen>[|<firstseen>]]
3182 *
3183 * For cookies in prefix mode, the form is :
3184 *
3185 * Cookie: NAME=SRV~VALUE
3186 */
3187 if ((att_end - att_beg == s->be->cookie_len) && (s->be->cookie_name != NULL) &&
3188 (memcmp(att_beg, s->be->cookie_name, att_end - att_beg) == 0)) {
3189 struct server *srv = s->be->srv;
3190 char *delim;
3191
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05003192 /* if we're in cookie prefix mode, we'll search the delimiter so that we
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003193 * have the server ID between val_beg and delim, and the original cookie between
3194 * delim+1 and val_end. Otherwise, delim==val_end :
3195 *
3196 * hdr_beg
3197 * |
3198 * v
3199 * NAME=SRV; # in all but prefix modes
3200 * NAME=SRV~OPAQUE ; # in prefix mode
3201 * || || | |+-> next
3202 * || || | +--> val_end
3203 * || || +---------> delim
3204 * || |+------------> val_beg
3205 * || +-------------> att_end = equal
3206 * |+-----------------> att_beg
3207 * +------------------> prev
3208 *
3209 */
3210 if (s->be->ck_opts & PR_CK_PFX) {
3211 for (delim = val_beg; delim < val_end; delim++)
3212 if (*delim == COOKIE_DELIM)
3213 break;
3214 }
3215 else {
3216 char *vbar1;
3217 delim = val_end;
3218 /* Now check if the cookie contains a date field, which would
3219 * appear after a vertical bar ('|') just after the server name
3220 * and before the delimiter.
3221 */
3222 vbar1 = memchr(val_beg, COOKIE_DELIM_DATE, val_end - val_beg);
3223 if (vbar1) {
3224 /* OK, so left of the bar is the server's cookie and
3225 * right is the last seen date. It is a base64 encoded
3226 * 30-bit value representing the UNIX date since the
3227 * epoch in 4-second quantities.
3228 */
3229 int val;
3230 delim = vbar1++;
3231 if (val_end - vbar1 >= 5) {
3232 val = b64tos30(vbar1);
3233 if (val > 0)
3234 txn->cookie_last_date = val << 2;
3235 }
3236 /* look for a second vertical bar */
3237 vbar1 = memchr(vbar1, COOKIE_DELIM_DATE, val_end - vbar1);
3238 if (vbar1 && (val_end - vbar1 > 5)) {
3239 val = b64tos30(vbar1 + 1);
3240 if (val > 0)
3241 txn->cookie_first_date = val << 2;
3242 }
3243 }
3244 }
3245
3246 /* if the cookie has an expiration date and the proxy wants to check
3247 * it, then we do that now. We first check if the cookie is too old,
3248 * then only if it has expired. We detect strict overflow because the
3249 * time resolution here is not great (4 seconds). Cookies with dates
3250 * in the future are ignored if their offset is beyond one day. This
3251 * allows an admin to fix timezone issues without expiring everyone
3252 * and at the same time avoids keeping unwanted side effects for too
3253 * long.
3254 */
3255 if (txn->cookie_first_date && s->be->cookie_maxlife &&
3256 (((signed)(date.tv_sec - txn->cookie_first_date) > (signed)s->be->cookie_maxlife) ||
3257 ((signed)(txn->cookie_first_date - date.tv_sec) > 86400))) {
3258 txn->flags &= ~TX_CK_MASK;
3259 txn->flags |= TX_CK_OLD;
3260 delim = val_beg; // let's pretend we have not found the cookie
3261 txn->cookie_first_date = 0;
3262 txn->cookie_last_date = 0;
3263 }
3264 else if (txn->cookie_last_date && s->be->cookie_maxidle &&
3265 (((signed)(date.tv_sec - txn->cookie_last_date) > (signed)s->be->cookie_maxidle) ||
3266 ((signed)(txn->cookie_last_date - date.tv_sec) > 86400))) {
3267 txn->flags &= ~TX_CK_MASK;
3268 txn->flags |= TX_CK_EXPIRED;
3269 delim = val_beg; // let's pretend we have not found the cookie
3270 txn->cookie_first_date = 0;
3271 txn->cookie_last_date = 0;
3272 }
3273
3274 /* Here, we'll look for the first running server which supports the cookie.
3275 * This allows to share a same cookie between several servers, for example
3276 * to dedicate backup servers to specific servers only.
3277 * However, to prevent clients from sticking to cookie-less backup server
3278 * when they have incidentely learned an empty cookie, we simply ignore
3279 * empty cookies and mark them as invalid.
3280 * The same behaviour is applied when persistence must be ignored.
3281 */
3282 if ((delim == val_beg) || (s->flags & (SF_IGNORE_PRST | SF_ASSIGNED)))
3283 srv = NULL;
3284
3285 while (srv) {
3286 if (srv->cookie && (srv->cklen == delim - val_beg) &&
3287 !memcmp(val_beg, srv->cookie, delim - val_beg)) {
3288 if ((srv->cur_state != SRV_ST_STOPPED) ||
3289 (s->be->options & PR_O_PERSIST) ||
3290 (s->flags & SF_FORCE_PRST)) {
3291 /* we found the server and we can use it */
3292 txn->flags &= ~TX_CK_MASK;
3293 txn->flags |= (srv->cur_state != SRV_ST_STOPPED) ? TX_CK_VALID : TX_CK_DOWN;
3294 s->flags |= SF_DIRECT | SF_ASSIGNED;
3295 s->target = &srv->obj_type;
3296 break;
3297 } else {
3298 /* we found a server, but it's down,
3299 * mark it as such and go on in case
3300 * another one is available.
3301 */
3302 txn->flags &= ~TX_CK_MASK;
3303 txn->flags |= TX_CK_DOWN;
3304 }
3305 }
3306 srv = srv->next;
3307 }
3308
3309 if (!srv && !(txn->flags & (TX_CK_DOWN|TX_CK_EXPIRED|TX_CK_OLD))) {
3310 /* no server matched this cookie or we deliberately skipped it */
3311 txn->flags &= ~TX_CK_MASK;
3312 if ((s->flags & (SF_IGNORE_PRST | SF_ASSIGNED)))
3313 txn->flags |= TX_CK_UNUSED;
3314 else
3315 txn->flags |= TX_CK_INVALID;
3316 }
3317
3318 /* depending on the cookie mode, we may have to either :
3319 * - delete the complete cookie if we're in insert+indirect mode, so that
3320 * the server never sees it ;
3321 * - remove the server id from the cookie value, and tag the cookie as an
Joseph Herlante9d5c722018-11-25 11:00:25 -08003322 * application cookie so that it does not get accidentally removed later,
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003323 * if we're in cookie prefix mode
3324 */
3325 if ((s->be->ck_opts & PR_CK_PFX) && (delim != val_end)) {
3326 int delta; /* negative */
3327
3328 memmove(val_beg, delim + 1, hdr_end - (delim + 1));
3329 delta = val_beg - (delim + 1);
3330 val_end += delta;
3331 next += delta;
3332 hdr_end += delta;
3333 del_from = NULL;
3334 preserve_hdr = 1; /* we want to keep this cookie */
3335 }
3336 else if (del_from == NULL &&
3337 (s->be->ck_opts & (PR_CK_INS | PR_CK_IND)) == (PR_CK_INS | PR_CK_IND)) {
3338 del_from = prev;
3339 }
3340 }
3341 else {
3342 /* This is not our cookie, so we must preserve it. But if we already
3343 * scheduled another cookie for removal, we cannot remove the
3344 * complete header, but we can remove the previous block itself.
3345 */
3346 preserve_hdr = 1;
3347
3348 if (del_from != NULL) {
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02003349 int delta = http_del_hdr_value(hdr_beg, hdr_end, &del_from, prev);
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003350 if (att_beg >= del_from)
3351 att_beg += delta;
3352 if (att_end >= del_from)
3353 att_end += delta;
3354 val_beg += delta;
3355 val_end += delta;
3356 next += delta;
3357 hdr_end += delta;
3358 prev = del_from;
3359 del_from = NULL;
3360 }
3361 }
3362
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003363 } /* for each cookie */
3364
3365
3366 /* There are no more cookies on this line.
3367 * We may still have one (or several) marked for deletion at the
3368 * end of the line. We must do this now in two ways :
3369 * - if some cookies must be preserved, we only delete from the
3370 * mark to the end of line ;
3371 * - if nothing needs to be preserved, simply delete the whole header
3372 */
3373 if (del_from) {
3374 hdr_end = (preserve_hdr ? del_from : hdr_beg);
3375 }
3376 if ((hdr_end - hdr_beg) != ctx.value.len) {
Christopher Faulet3e2638e2019-06-18 09:49:16 +02003377 if (hdr_beg != hdr_end)
3378 htx_change_blk_value_len(htx, ctx.blk, hdr_end - hdr_beg);
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003379 else
3380 http_remove_header(htx, &ctx);
3381 }
3382 } /* for each "Cookie header */
3383}
3384
3385/*
3386 * Manage server-side cookies. It can impact performance by about 2% so it is
3387 * desirable to call it only when needed. This function is also used when we
3388 * just need to know if there is a cookie (eg: for check-cache).
3389 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02003390static void http_manage_server_side_cookies(struct stream *s, struct channel *res)
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003391{
3392 struct session *sess = s->sess;
3393 struct http_txn *txn = s->txn;
3394 struct htx *htx;
3395 struct http_hdr_ctx ctx;
3396 struct server *srv;
3397 char *hdr_beg, *hdr_end;
3398 char *prev, *att_beg, *att_end, *equal, *val_beg, *val_end, *next;
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003399
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003400 htx = htxbuf(&res->buf);
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003401
3402 ctx.blk = NULL;
Willy Tarreauaa1909e2022-11-14 18:58:35 +01003403 while (http_find_header(htx, ist("Set-Cookie"), &ctx, 1)) {
Olivier Houchardf0f42382019-07-22 17:43:46 +02003404 int is_first = 1;
3405
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003406 /* OK, right now we know we have a Set-Cookie* at hdr_beg, and
3407 * <prev> points to the colon.
3408 */
3409 txn->flags |= TX_SCK_PRESENT;
3410
3411 /* Maybe we only wanted to see if there was a Set-Cookie (eg:
3412 * check-cache is enabled) and we are not interested in checking
3413 * them. Warning, the cookie capture is declared in the frontend.
3414 */
3415 if (s->be->cookie_name == NULL && sess->fe->capture_name == NULL)
3416 break;
3417
3418 /* OK so now we know we have to process this response cookie.
3419 * The format of the Set-Cookie header is slightly different
3420 * from the format of the Cookie header in that it does not
3421 * support the comma as a cookie delimiter (thus the header
3422 * cannot be folded) because the Expires attribute described in
3423 * the original Netscape's spec may contain an unquoted date
3424 * with a comma inside. We have to live with this because
3425 * many browsers don't support Max-Age and some browsers don't
3426 * support quoted strings. However the Set-Cookie2 header is
Willy Tarreauaa1909e2022-11-14 18:58:35 +01003427 * clean but basically nobody supports it.
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003428 *
3429 * We have to keep multiple pointers in order to support cookie
3430 * removal at the beginning, middle or end of header without
3431 * corrupting the header (in case of set-cookie2). A special
3432 * pointer, <scav> points to the beginning of the set-cookie-av
3433 * fields after the first semi-colon. The <next> pointer points
3434 * either to the end of line (set-cookie) or next unquoted comma
3435 * (set-cookie2). All of these headers are valid :
3436 *
3437 * hdr_beg hdr_end
3438 * | |
3439 * v |
3440 * NAME1 = VALUE 1 ; Secure; Path="/" |
3441 * NAME=VALUE; Secure; Expires=Thu, 01-Jan-1970 00:00:01 GMT v
3442 * NAME = VALUE ; Secure; Expires=Thu, 01-Jan-1970 00:00:01 GMT
3443 * NAME1 = VALUE 1 ; Max-Age=0, NAME2=VALUE2; Discard
3444 * | | | | | | | |
3445 * | | | | | | | +-> next
3446 * | | | | | | +------------> scav
3447 * | | | | | +--------------> val_end
3448 * | | | | +--------------------> val_beg
3449 * | | | +----------------------> equal
3450 * | | +------------------------> att_end
3451 * | +----------------------------> att_beg
3452 * +------------------------------> prev
3453 * -------------------------------> hdr_beg
3454 */
3455 hdr_beg = ctx.value.ptr;
3456 hdr_end = hdr_beg + ctx.value.len;
3457 for (prev = hdr_beg; prev < hdr_end; prev = next) {
3458
3459 /* Iterate through all cookies on this line */
3460
3461 /* find att_beg */
3462 att_beg = prev;
Olivier Houchardf0f42382019-07-22 17:43:46 +02003463 if (!is_first)
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003464 att_beg++;
Olivier Houchardf0f42382019-07-22 17:43:46 +02003465 is_first = 0;
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003466
3467 while (att_beg < hdr_end && HTTP_IS_SPHT(*att_beg))
3468 att_beg++;
3469
3470 /* find att_end : this is the first character after the last non
3471 * space before the equal. It may be equal to hdr_end.
3472 */
3473 equal = att_end = att_beg;
3474
3475 while (equal < hdr_end) {
Willy Tarreauaa1909e2022-11-14 18:58:35 +01003476 if (*equal == '=' || *equal == ';')
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003477 break;
3478 if (HTTP_IS_SPHT(*equal++))
3479 continue;
3480 att_end = equal;
3481 }
3482
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05003483 /* here, <equal> points to '=', a delimiter or the end. <att_end>
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003484 * is between <att_beg> and <equal>, both may be identical.
3485 */
3486
3487 /* look for end of cookie if there is an equal sign */
3488 if (equal < hdr_end && *equal == '=') {
3489 /* look for the beginning of the value */
3490 val_beg = equal + 1;
3491 while (val_beg < hdr_end && HTTP_IS_SPHT(*val_beg))
3492 val_beg++;
3493
3494 /* find the end of the value, respecting quotes */
3495 next = http_find_cookie_value_end(val_beg, hdr_end);
3496
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05003497 /* make val_end point to the first white space or delimiter after the value */
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003498 val_end = next;
3499 while (val_end > val_beg && HTTP_IS_SPHT(*(val_end - 1)))
3500 val_end--;
3501 }
3502 else {
3503 /* <equal> points to next comma, semi-colon or EOL */
3504 val_beg = val_end = next = equal;
3505 }
3506
3507 if (next < hdr_end) {
Willy Tarreauaa1909e2022-11-14 18:58:35 +01003508 /* For Set-Cookie, since commas are permitted
3509 * in values, skip to the end.
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003510 */
Willy Tarreauaa1909e2022-11-14 18:58:35 +01003511 next = hdr_end;
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003512 }
3513
3514 /* Now everything is as on the diagram above */
3515
3516 /* Ignore cookies with no equal sign */
3517 if (equal == val_end)
3518 continue;
3519
3520 /* If there are spaces around the equal sign, we need to
3521 * strip them otherwise we'll get trouble for cookie captures,
3522 * or even for rewrites. Since this happens extremely rarely,
3523 * it does not hurt performance.
3524 */
3525 if (unlikely(att_end != equal || val_beg > equal + 1)) {
3526 int stripped_before = 0;
3527 int stripped_after = 0;
3528
3529 if (att_end != equal) {
3530 memmove(att_end, equal, hdr_end - equal);
3531 stripped_before = (att_end - equal);
3532 equal += stripped_before;
3533 val_beg += stripped_before;
3534 }
3535
3536 if (val_beg > equal + 1) {
3537 memmove(equal + 1, val_beg, hdr_end + stripped_before - val_beg);
3538 stripped_after = (equal + 1) - val_beg;
3539 val_beg += stripped_after;
3540 stripped_before += stripped_after;
3541 }
3542
3543 val_end += stripped_before;
3544 next += stripped_before;
3545 hdr_end += stripped_before;
3546
Christopher Faulet3e2638e2019-06-18 09:49:16 +02003547 htx_change_blk_value_len(htx, ctx.blk, hdr_end - hdr_beg);
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003548 ctx.value.len = hdr_end - hdr_beg;
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003549 }
3550
3551 /* First, let's see if we want to capture this cookie. We check
3552 * that we don't already have a server side cookie, because we
3553 * can only capture one. Also as an optimisation, we ignore
3554 * cookies shorter than the declared name.
3555 */
3556 if (sess->fe->capture_name != NULL &&
3557 txn->srv_cookie == NULL &&
3558 (val_end - att_beg >= sess->fe->capture_namelen) &&
3559 memcmp(att_beg, sess->fe->capture_name, sess->fe->capture_namelen) == 0) {
3560 int log_len = val_end - att_beg;
3561 if ((txn->srv_cookie = pool_alloc(pool_head_capture)) == NULL) {
3562 ha_alert("HTTP logging : out of memory.\n");
3563 }
3564 else {
3565 if (log_len > sess->fe->capture_len)
3566 log_len = sess->fe->capture_len;
3567 memcpy(txn->srv_cookie, att_beg, log_len);
3568 txn->srv_cookie[log_len] = 0;
3569 }
3570 }
3571
3572 srv = objt_server(s->target);
3573 /* now check if we need to process it for persistence */
3574 if (!(s->flags & SF_IGNORE_PRST) &&
3575 (att_end - att_beg == s->be->cookie_len) && (s->be->cookie_name != NULL) &&
3576 (memcmp(att_beg, s->be->cookie_name, att_end - att_beg) == 0)) {
3577 /* assume passive cookie by default */
3578 txn->flags &= ~TX_SCK_MASK;
3579 txn->flags |= TX_SCK_FOUND;
3580
3581 /* If the cookie is in insert mode on a known server, we'll delete
3582 * this occurrence because we'll insert another one later.
3583 * We'll delete it too if the "indirect" option is set and we're in
3584 * a direct access.
3585 */
3586 if (s->be->ck_opts & PR_CK_PSV) {
3587 /* The "preserve" flag was set, we don't want to touch the
3588 * server's cookie.
3589 */
3590 }
3591 else if ((srv && (s->be->ck_opts & PR_CK_INS)) ||
3592 ((s->flags & SF_DIRECT) && (s->be->ck_opts & PR_CK_IND))) {
3593 /* this cookie must be deleted */
3594 if (prev == hdr_beg && next == hdr_end) {
3595 /* whole header */
3596 http_remove_header(htx, &ctx);
3597 /* note: while both invalid now, <next> and <hdr_end>
3598 * are still equal, so the for() will stop as expected.
3599 */
3600 } else {
3601 /* just remove the value */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02003602 int delta = http_del_hdr_value(hdr_beg, hdr_end, &prev, next);
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003603 next = prev;
3604 hdr_end += delta;
3605 }
3606 txn->flags &= ~TX_SCK_MASK;
3607 txn->flags |= TX_SCK_DELETED;
3608 /* and go on with next cookie */
3609 }
3610 else if (srv && srv->cookie && (s->be->ck_opts & PR_CK_RW)) {
3611 /* replace bytes val_beg->val_end with the cookie name associated
3612 * with this server since we know it.
3613 */
3614 int sliding, delta;
3615
3616 ctx.value = ist2(val_beg, val_end - val_beg);
3617 ctx.lws_before = ctx.lws_after = 0;
3618 http_replace_header_value(htx, &ctx, ist2(srv->cookie, srv->cklen));
3619 delta = srv->cklen - (val_end - val_beg);
3620 sliding = (ctx.value.ptr - val_beg);
3621 hdr_beg += sliding;
3622 val_beg += sliding;
3623 next += sliding + delta;
3624 hdr_end += sliding + delta;
3625
3626 txn->flags &= ~TX_SCK_MASK;
3627 txn->flags |= TX_SCK_REPLACED;
3628 }
3629 else if (srv && srv->cookie && (s->be->ck_opts & PR_CK_PFX)) {
3630 /* insert the cookie name associated with this server
3631 * before existing cookie, and insert a delimiter between them..
3632 */
3633 int sliding, delta;
3634 ctx.value = ist2(val_beg, 0);
3635 ctx.lws_before = ctx.lws_after = 0;
3636 http_replace_header_value(htx, &ctx, ist2(srv->cookie, srv->cklen + 1));
3637 delta = srv->cklen + 1;
3638 sliding = (ctx.value.ptr - val_beg);
3639 hdr_beg += sliding;
3640 val_beg += sliding;
3641 next += sliding + delta;
3642 hdr_end += sliding + delta;
3643
3644 val_beg[srv->cklen] = COOKIE_DELIM;
3645 txn->flags &= ~TX_SCK_MASK;
3646 txn->flags |= TX_SCK_REPLACED;
3647 }
3648 }
3649 /* that's done for this cookie, check the next one on the same
Willy Tarreauaa1909e2022-11-14 18:58:35 +01003650 * line when next != hdr_end (which should normally not happen
3651 * with set-cookie2 support removed).
Christopher Fauletfcda7c62018-10-24 11:56:22 +02003652 */
3653 }
3654 }
3655}
3656
Christopher Faulet25a02f62018-10-24 12:00:25 +02003657/*
3658 * Parses the Cache-Control and Pragma request header fields to determine if
3659 * the request may be served from the cache and/or if it is cacheable. Updates
3660 * s->txn->flags.
3661 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02003662void http_check_request_for_cacheability(struct stream *s, struct channel *req)
Christopher Faulet25a02f62018-10-24 12:00:25 +02003663{
3664 struct http_txn *txn = s->txn;
3665 struct htx *htx;
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003666 struct http_hdr_ctx ctx = { .blk = NULL };
3667 int pragma_found, cc_found;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003668
3669 if ((txn->flags & (TX_CACHEABLE|TX_CACHE_IGNORE)) == TX_CACHE_IGNORE)
3670 return; /* nothing more to do here */
3671
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003672 htx = htxbuf(&req->buf);
Christopher Faulet25a02f62018-10-24 12:00:25 +02003673 pragma_found = cc_found = 0;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003674
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003675 /* Check "pragma" header for HTTP/1.0 compatibility. */
3676 if (http_find_header(htx, ist("pragma"), &ctx, 1)) {
3677 if (isteqi(ctx.value, ist("no-cache"))) {
3678 pragma_found = 1;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003679 }
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003680 }
Christopher Faulet25a02f62018-10-24 12:00:25 +02003681
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003682 ctx.blk = NULL;
3683 /* Don't use the cache and don't try to store if we found the
3684 * Authorization header */
3685 if (http_find_header(htx, ist("authorization"), &ctx, 1)) {
3686 txn->flags &= ~TX_CACHEABLE & ~TX_CACHE_COOK;
3687 txn->flags |= TX_CACHE_IGNORE;
3688 }
Christopher Faulet25a02f62018-10-24 12:00:25 +02003689
Christopher Faulet25a02f62018-10-24 12:00:25 +02003690
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003691 /* Look for "cache-control" header and iterate over all the values
3692 * until we find one that specifies that caching is possible or not. */
3693 ctx.blk = NULL;
3694 while (http_find_header(htx, ist("cache-control"), &ctx, 0)) {
Christopher Faulet25a02f62018-10-24 12:00:25 +02003695 cc_found = 1;
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003696 /* We don't check the values after max-age, max-stale nor min-fresh,
3697 * we simply don't use the cache when they're specified. */
3698 if (istmatchi(ctx.value, ist("max-age")) ||
3699 istmatchi(ctx.value, ist("no-cache")) ||
3700 istmatchi(ctx.value, ist("max-stale")) ||
3701 istmatchi(ctx.value, ist("min-fresh"))) {
Christopher Faulet25a02f62018-10-24 12:00:25 +02003702 txn->flags |= TX_CACHE_IGNORE;
3703 continue;
3704 }
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003705 if (istmatchi(ctx.value, ist("no-store"))) {
Christopher Faulet25a02f62018-10-24 12:00:25 +02003706 txn->flags &= ~TX_CACHEABLE & ~TX_CACHE_COOK;
3707 continue;
3708 }
3709 }
3710
3711 /* RFC7234#5.4:
3712 * When the Cache-Control header field is also present and
3713 * understood in a request, Pragma is ignored.
3714 * When the Cache-Control header field is not present in a
3715 * request, caches MUST consider the no-cache request
3716 * pragma-directive as having the same effect as if
3717 * "Cache-Control: no-cache" were present.
3718 */
3719 if (!cc_found && pragma_found)
3720 txn->flags |= TX_CACHE_IGNORE;
3721}
3722
3723/*
3724 * Check if response is cacheable or not. Updates s->txn->flags.
3725 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02003726void http_check_response_for_cacheability(struct stream *s, struct channel *res)
Christopher Faulet25a02f62018-10-24 12:00:25 +02003727{
3728 struct http_txn *txn = s->txn;
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003729 struct http_hdr_ctx ctx = { .blk = NULL };
Christopher Faulet25a02f62018-10-24 12:00:25 +02003730 struct htx *htx;
Remi Tricot-Le Bretoncc9bf2e2020-11-12 11:14:41 +01003731 int has_freshness_info = 0;
3732 int has_validator = 0;
Remi Tricot-Le Breton02f47242023-07-04 17:13:28 +02003733 int has_null_maxage = 0;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003734
3735 if (txn->status < 200) {
3736 /* do not try to cache interim responses! */
3737 txn->flags &= ~TX_CACHEABLE & ~TX_CACHE_COOK;
3738 return;
3739 }
3740
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003741 htx = htxbuf(&res->buf);
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003742 /* Check "pragma" header for HTTP/1.0 compatibility. */
3743 if (http_find_header(htx, ist("pragma"), &ctx, 1)) {
3744 if (isteqi(ctx.value, ist("no-cache"))) {
3745 txn->flags &= ~TX_CACHEABLE & ~TX_CACHE_COOK;
3746 return;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003747 }
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003748 }
Christopher Faulet25a02f62018-10-24 12:00:25 +02003749
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003750 /* Look for "cache-control" header and iterate over all the values
3751 * until we find one that specifies that caching is possible or not. */
3752 ctx.blk = NULL;
3753 while (http_find_header(htx, ist("cache-control"), &ctx, 0)) {
3754 if (isteqi(ctx.value, ist("public"))) {
3755 txn->flags |= TX_CACHEABLE | TX_CACHE_COOK;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003756 continue;
3757 }
Remi Tricot-Le Breton02f47242023-07-04 17:13:28 +02003758 /* This max-age might be overridden by a s-maxage directive, do
3759 * not unset the TX_CACHEABLE yet. */
3760 if (isteqi(ctx.value, ist("max-age=0"))) {
3761 has_null_maxage = 1;
3762 continue;
3763 }
3764
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003765 if (isteqi(ctx.value, ist("private")) ||
3766 isteqi(ctx.value, ist("no-cache")) ||
3767 isteqi(ctx.value, ist("no-store")) ||
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003768 isteqi(ctx.value, ist("s-maxage=0"))) {
Christopher Faulet25a02f62018-10-24 12:00:25 +02003769 txn->flags &= ~TX_CACHEABLE & ~TX_CACHE_COOK;
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003770 continue;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003771 }
Remi Tricot-Le Breton40ed97b2020-10-28 11:35:15 +01003772 /* We might have a no-cache="set-cookie" form. */
3773 if (istmatchi(ctx.value, ist("no-cache=\"set-cookie"))) {
3774 txn->flags &= ~TX_CACHE_COOK;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003775 continue;
3776 }
Remi Tricot-Le Bretoncc9bf2e2020-11-12 11:14:41 +01003777
Remi Tricot-Le Breton02f47242023-07-04 17:13:28 +02003778 if (istmatchi(ctx.value, ist("s-maxage"))) {
Remi Tricot-Le Bretoncc9bf2e2020-11-12 11:14:41 +01003779 has_freshness_info = 1;
Remi Tricot-Le Breton02f47242023-07-04 17:13:28 +02003780 has_null_maxage = 0; /* The null max-age is overridden, ignore it */
Remi Tricot-Le Bretoncc9bf2e2020-11-12 11:14:41 +01003781 continue;
3782 }
Remi Tricot-Le Breton02f47242023-07-04 17:13:28 +02003783 if (istmatchi(ctx.value, ist("max-age"))) {
3784 has_freshness_info = 1;
3785 continue;
3786 }
3787 }
3788
3789 /* We had a 'max-age=0' directive but no extra s-maxage, do not cache
3790 * the response. */
3791 if (has_null_maxage) {
3792 txn->flags &= ~TX_CACHEABLE & ~TX_CACHE_COOK;
Remi Tricot-Le Bretoncc9bf2e2020-11-12 11:14:41 +01003793 }
3794
3795 /* If no freshness information could be found in Cache-Control values,
3796 * look for an Expires header. */
3797 if (!has_freshness_info) {
3798 ctx.blk = NULL;
3799 has_freshness_info = http_find_header(htx, ist("expires"), &ctx, 0);
Christopher Faulet25a02f62018-10-24 12:00:25 +02003800 }
Remi Tricot-Le Bretoncc9bf2e2020-11-12 11:14:41 +01003801
3802 /* If no freshness information could be found in Cache-Control or Expires
3803 * values, look for an explicit validator. */
3804 if (!has_freshness_info) {
3805 ctx.blk = NULL;
3806 has_validator = 1;
3807 if (!http_find_header(htx, ist("etag"), &ctx, 0)) {
3808 ctx.blk = NULL;
3809 if (!http_find_header(htx, ist("last-modified"), &ctx, 0))
3810 has_validator = 0;
3811 }
3812 }
3813
3814 /* We won't store an entry that has neither a cache validator nor an
3815 * explicit expiration time, as suggested in RFC 7234#3. */
3816 if (!has_freshness_info && !has_validator)
Remi Tricot-Le Breton879debe2023-02-21 11:47:17 +01003817 txn->flags &= ~TX_CACHEABLE;
Christopher Faulet25a02f62018-10-24 12:00:25 +02003818}
3819
Christopher Faulet377c5a52018-10-24 21:21:30 +02003820/*
3821 * In a GET, HEAD or POST request, check if the requested URI matches the stats uri
Aurelien DARRAGONf6286142023-12-05 17:54:20 +01003822 * for the current proxy.
Christopher Faulet377c5a52018-10-24 21:21:30 +02003823 *
3824 * It is assumed that the request is either a HEAD, GET, or POST and that the
3825 * uri_auth field is valid.
3826 *
3827 * Returns 1 if stats should be provided, otherwise 0.
3828 */
Aurelien DARRAGONf6286142023-12-05 17:54:20 +01003829static int http_stats_check_uri(struct stream *s, struct http_txn *txn, struct proxy *px)
Christopher Faulet377c5a52018-10-24 21:21:30 +02003830{
Aurelien DARRAGONf6286142023-12-05 17:54:20 +01003831 struct uri_auth *uri_auth = px->uri_auth;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003832 struct htx *htx;
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01003833 struct htx_sl *sl;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003834 struct ist uri;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003835
3836 if (!uri_auth)
3837 return 0;
3838
3839 if (txn->meth != HTTP_METH_GET && txn->meth != HTTP_METH_HEAD && txn->meth != HTTP_METH_POST)
3840 return 0;
3841
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003842 htx = htxbuf(&s->req.buf);
Christopher Faulet297fbb42019-05-13 14:41:27 +02003843 sl = http_get_stline(htx);
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01003844 uri = htx_sl_req_uri(sl);
Amaury Denoyellec453f952021-07-06 11:40:12 +02003845 if (*uri_auth->uri_prefix == '/') {
3846 struct http_uri_parser parser = http_uri_parser_init(uri);
3847 uri = http_parse_path(&parser);
3848 }
Christopher Faulet377c5a52018-10-24 21:21:30 +02003849
3850 /* check URI size */
3851 if (uri_auth->uri_len > uri.len)
3852 return 0;
3853
3854 if (memcmp(uri.ptr, uri_auth->uri_prefix, uri_auth->uri_len) != 0)
3855 return 0;
3856
3857 return 1;
3858}
3859
3860/* This function prepares an applet to handle the stats. It can deal with the
3861 * "100-continue" expectation, check that admin rules are met for POST requests,
3862 * and program a response message if something was unexpected. It cannot fail
3863 * and always relies on the stats applet to complete the job. It does not touch
3864 * analysers nor counters, which are left to the caller. It does not touch
3865 * s->target which is supposed to already point to the stats applet. The caller
3866 * is expected to have already assigned an appctx to the stream.
3867 */
Aurelien DARRAGONf6286142023-12-05 17:54:20 +01003868static int http_handle_stats(struct stream *s, struct channel *req, struct proxy *px)
Christopher Faulet377c5a52018-10-24 21:21:30 +02003869{
3870 struct stats_admin_rule *stats_admin_rule;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003871 struct session *sess = s->sess;
3872 struct http_txn *txn = s->txn;
3873 struct http_msg *msg = &txn->req;
Aurelien DARRAGONf6286142023-12-05 17:54:20 +01003874 struct uri_auth *uri_auth = px->uri_auth;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003875 const char *h, *lookup, *end;
Willy Tarreau8e7c6e62022-05-18 17:58:02 +02003876 struct appctx *appctx = __sc_appctx(s->scb);
Willy Tarreau91cefca2022-05-03 17:08:29 +02003877 struct show_stat_ctx *ctx = applet_reserve_svcctx(appctx, sizeof(*ctx));
Christopher Faulet377c5a52018-10-24 21:21:30 +02003878 struct htx *htx;
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01003879 struct htx_sl *sl;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003880
Willy Tarreau41f88522022-05-03 18:39:27 +02003881 appctx->st1 = 0;
Willy Tarreau6ef16482022-05-06 18:07:53 +02003882 ctx->state = STAT_STATE_INIT;
Willy Tarreau91cefca2022-05-03 17:08:29 +02003883 ctx->st_code = STAT_STATUS_INIT;
Aurelien DARRAGONf6286142023-12-05 17:54:20 +01003884 ctx->http_px = px;
Willy Tarreau91cefca2022-05-03 17:08:29 +02003885 ctx->flags |= uri_auth->flags;
3886 ctx->flags |= STAT_FMT_HTML; /* assume HTML mode by default */
Christopher Faulet377c5a52018-10-24 21:21:30 +02003887 if ((msg->flags & HTTP_MSGF_VER_11) && (txn->meth != HTTP_METH_HEAD))
Willy Tarreau91cefca2022-05-03 17:08:29 +02003888 ctx->flags |= STAT_CHUNKED;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003889
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01003890 htx = htxbuf(&req->buf);
Christopher Faulet297fbb42019-05-13 14:41:27 +02003891 sl = http_get_stline(htx);
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01003892 lookup = HTX_SL_REQ_UPTR(sl) + uri_auth->uri_len;
3893 end = HTX_SL_REQ_UPTR(sl) + HTX_SL_REQ_ULEN(sl);
Christopher Faulet377c5a52018-10-24 21:21:30 +02003894
3895 for (h = lookup; h <= end - 3; h++) {
3896 if (memcmp(h, ";up", 3) == 0) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02003897 ctx->flags |= STAT_HIDE_DOWN;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003898 break;
3899 }
Amaury Denoyelle91e55ea2021-02-25 14:46:08 +01003900 }
3901
3902 for (h = lookup; h <= end - 9; h++) {
3903 if (memcmp(h, ";no-maint", 9) == 0) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02003904 ctx->flags |= STAT_HIDE_MAINT;
Willy Tarreau3e320362020-10-23 17:28:57 +02003905 break;
3906 }
Christopher Faulet377c5a52018-10-24 21:21:30 +02003907 }
3908
3909 if (uri_auth->refresh) {
3910 for (h = lookup; h <= end - 10; h++) {
3911 if (memcmp(h, ";norefresh", 10) == 0) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02003912 ctx->flags |= STAT_NO_REFRESH;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003913 break;
3914 }
3915 }
3916 }
3917
3918 for (h = lookup; h <= end - 4; h++) {
3919 if (memcmp(h, ";csv", 4) == 0) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02003920 ctx->flags &= ~(STAT_FMT_MASK|STAT_JSON_SCHM);
Christopher Faulet377c5a52018-10-24 21:21:30 +02003921 break;
3922 }
3923 }
3924
3925 for (h = lookup; h <= end - 6; h++) {
3926 if (memcmp(h, ";typed", 6) == 0) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02003927 ctx->flags &= ~(STAT_FMT_MASK|STAT_JSON_SCHM);
3928 ctx->flags |= STAT_FMT_TYPED;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003929 break;
3930 }
3931 }
3932
Christopher Faulet6338a082019-09-09 15:50:54 +02003933 for (h = lookup; h <= end - 5; h++) {
3934 if (memcmp(h, ";json", 5) == 0) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02003935 ctx->flags &= ~(STAT_FMT_MASK|STAT_JSON_SCHM);
3936 ctx->flags |= STAT_FMT_JSON;
Christopher Faulet6338a082019-09-09 15:50:54 +02003937 break;
3938 }
3939 }
3940
3941 for (h = lookup; h <= end - 12; h++) {
3942 if (memcmp(h, ";json-schema", 12) == 0) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02003943 ctx->flags &= ~STAT_FMT_MASK;
3944 ctx->flags |= STAT_JSON_SCHM;
Christopher Faulet6338a082019-09-09 15:50:54 +02003945 break;
3946 }
3947 }
3948
Christopher Faulet377c5a52018-10-24 21:21:30 +02003949 for (h = lookup; h <= end - 8; h++) {
3950 if (memcmp(h, ";st=", 4) == 0) {
3951 int i;
3952 h += 4;
Willy Tarreau91cefca2022-05-03 17:08:29 +02003953 ctx->st_code = STAT_STATUS_UNKN;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003954 for (i = STAT_STATUS_INIT + 1; i < STAT_STATUS_SIZE; i++) {
3955 if (strncmp(stat_status_codes[i], h, 4) == 0) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02003956 ctx->st_code = i;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003957 break;
3958 }
3959 }
3960 break;
3961 }
3962 }
3963
Willy Tarreau91cefca2022-05-03 17:08:29 +02003964 ctx->scope_str = 0;
3965 ctx->scope_len = 0;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003966 for (h = lookup; h <= end - 8; h++) {
3967 if (memcmp(h, STAT_SCOPE_INPUT_NAME "=", strlen(STAT_SCOPE_INPUT_NAME) + 1) == 0) {
3968 int itx = 0;
3969 const char *h2;
3970 char scope_txt[STAT_SCOPE_TXT_MAXLEN + 1];
3971 const char *err;
3972
3973 h += strlen(STAT_SCOPE_INPUT_NAME) + 1;
3974 h2 = h;
Willy Tarreau91cefca2022-05-03 17:08:29 +02003975 ctx->scope_str = h2 - HTX_SL_REQ_UPTR(sl);
Christopher Fauleted7a0662019-01-14 11:07:34 +01003976 while (h < end) {
Christopher Faulet377c5a52018-10-24 21:21:30 +02003977 if (*h == ';' || *h == '&' || *h == ' ')
3978 break;
3979 itx++;
3980 h++;
3981 }
3982
3983 if (itx > STAT_SCOPE_TXT_MAXLEN)
3984 itx = STAT_SCOPE_TXT_MAXLEN;
Willy Tarreau91cefca2022-05-03 17:08:29 +02003985 ctx->scope_len = itx;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003986
Willy Tarreau91cefca2022-05-03 17:08:29 +02003987 /* scope_txt = search query, ctx->scope_len is always <= STAT_SCOPE_TXT_MAXLEN */
Christopher Faulet377c5a52018-10-24 21:21:30 +02003988 memcpy(scope_txt, h2, itx);
3989 scope_txt[itx] = '\0';
3990 err = invalid_char(scope_txt);
3991 if (err) {
3992 /* bad char in search text => clear scope */
Willy Tarreau91cefca2022-05-03 17:08:29 +02003993 ctx->scope_str = 0;
3994 ctx->scope_len = 0;
Christopher Faulet377c5a52018-10-24 21:21:30 +02003995 }
3996 break;
3997 }
3998 }
3999
4000 /* now check whether we have some admin rules for this request */
4001 list_for_each_entry(stats_admin_rule, &uri_auth->admin_rules, list) {
4002 int ret = 1;
4003
4004 if (stats_admin_rule->cond) {
4005 ret = acl_exec_cond(stats_admin_rule->cond, s->be, sess, s, SMP_OPT_DIR_REQ|SMP_OPT_FINAL);
4006 ret = acl_pass(ret);
4007 if (stats_admin_rule->cond->pol == ACL_COND_UNLESS)
4008 ret = !ret;
4009 }
4010
4011 if (ret) {
4012 /* no rule, or the rule matches */
Willy Tarreau91cefca2022-05-03 17:08:29 +02004013 ctx->flags |= STAT_ADMIN;
Christopher Faulet377c5a52018-10-24 21:21:30 +02004014 break;
4015 }
4016 }
4017
Christopher Faulet5d45e382019-02-27 15:15:23 +01004018 if (txn->meth == HTTP_METH_GET || txn->meth == HTTP_METH_HEAD)
4019 appctx->st0 = STAT_HTTP_HEAD;
4020 else if (txn->meth == HTTP_METH_POST) {
Willy Tarreau91cefca2022-05-03 17:08:29 +02004021 if (ctx->flags & STAT_ADMIN) {
Christopher Faulet377c5a52018-10-24 21:21:30 +02004022 appctx->st0 = STAT_HTTP_POST;
Christopher Fauletbd9e8422019-08-15 22:26:48 +02004023 if (msg->msg_state < HTTP_MSG_DATA)
4024 req->analysers |= AN_REQ_HTTP_BODY;
4025 }
Christopher Faulet377c5a52018-10-24 21:21:30 +02004026 else {
Christopher Faulet5d45e382019-02-27 15:15:23 +01004027 /* POST without admin level */
Willy Tarreau91cefca2022-05-03 17:08:29 +02004028 ctx->flags &= ~STAT_CHUNKED;
4029 ctx->st_code = STAT_STATUS_DENY;
Christopher Faulet377c5a52018-10-24 21:21:30 +02004030 appctx->st0 = STAT_HTTP_LAST;
4031 }
4032 }
4033 else {
Christopher Faulet5d45e382019-02-27 15:15:23 +01004034 /* Unsupported method */
Willy Tarreau91cefca2022-05-03 17:08:29 +02004035 ctx->flags &= ~STAT_CHUNKED;
4036 ctx->st_code = STAT_STATUS_IVAL;
Christopher Faulet5d45e382019-02-27 15:15:23 +01004037 appctx->st0 = STAT_HTTP_LAST;
Christopher Faulet377c5a52018-10-24 21:21:30 +02004038 }
4039
4040 s->task->nice = -32; /* small boost for HTTP statistics */
4041 return 1;
4042}
4043
Christopher Faulet021a8e42021-03-29 10:46:38 +02004044/* This function waits for the message payload at most <time> milliseconds (may
4045 * be set to TICK_ETERNITY). It stops to wait if at least <bytes> bytes of the
4046 * payload are received (0 means no limit). It returns HTTP_RULE_* depending on
4047 * the result:
4048 *
4049 * - HTTP_RULE_RES_CONT when conditions are met to stop waiting
4050 * - HTTP_RULE_RES_YIELD to wait for more data
Ilya Shipitsinb2be9a12021-04-24 13:25:42 +05004051 * - HTTP_RULE_RES_ABRT when a timeout occurred.
Christopher Faulet021a8e42021-03-29 10:46:38 +02004052 * - HTTP_RULE_RES_BADREQ if a parsing error is raised by lower level
Ilya Shipitsinb2be9a12021-04-24 13:25:42 +05004053 * - HTTP_RULE_RES_ERROR if an internal error occurred
Christopher Faulet021a8e42021-03-29 10:46:38 +02004054 *
Ilya Shipitsinb2be9a12021-04-24 13:25:42 +05004055 * If a timeout occurred, this function is responsible to emit the right response
Christopher Faulet021a8e42021-03-29 10:46:38 +02004056 * to the client, depending on the channel (408 on request side, 504 on response
4057 * side). All other errors must be handled by the caller.
4058 */
4059enum rule_result http_wait_for_msg_body(struct stream *s, struct channel *chn,
4060 unsigned int time, unsigned int bytes)
4061{
4062 struct session *sess = s->sess;
4063 struct http_txn *txn = s->txn;
4064 struct http_msg *msg = ((chn->flags & CF_ISRESP) ? &txn->rsp : &txn->req);
4065 struct htx *htx;
4066 enum rule_result ret = HTTP_RULE_RES_CONT;
4067
4068 htx = htxbuf(&chn->buf);
4069
4070 if (htx->flags & HTX_FL_PARSING_ERROR) {
4071 ret = HTTP_RULE_RES_BADREQ;
4072 goto end;
4073 }
4074 if (htx->flags & HTX_FL_PROCESSING_ERROR) {
4075 ret = HTTP_RULE_RES_ERROR;
4076 goto end;
4077 }
4078
4079 /* Do nothing for bodyless and CONNECT requests */
4080 if (txn->meth == HTTP_METH_CONNECT || (msg->flags & HTTP_MSGF_BODYLESS))
4081 goto end;
4082
Christopher Fauletffcffa82023-04-05 10:33:31 +02004083 if (!(chn->flags & CF_ISRESP)) {
Christopher Faulet021a8e42021-03-29 10:46:38 +02004084 if (http_handle_expect_hdr(s, htx, msg) == -1) {
4085 ret = HTTP_RULE_RES_ERROR;
4086 goto end;
4087 }
4088 }
4089
Christopher Faulet2954bcc2023-04-05 10:42:03 +02004090 /* Now we're are waiting for the payload. We just need to know if all
4091 * data have been received or if the buffer is full.
Christopher Faulet021a8e42021-03-29 10:46:38 +02004092 */
Christopher Faulet78335962021-09-23 14:46:32 +02004093 if ((htx->flags & HTX_FL_EOM) ||
4094 htx_get_tail_type(htx) > HTX_BLK_DATA ||
4095 channel_htx_full(chn, htx, global.tune.maxrewrite) ||
Willy Tarreau99615ed2022-05-25 07:29:36 +02004096 sc_waiting_room(chn_prod(chn)))
Christopher Faulet021a8e42021-03-29 10:46:38 +02004097 goto end;
4098
4099 if (bytes) {
4100 struct htx_blk *blk;
4101 unsigned int len = 0;
4102
4103 for (blk = htx_get_first_blk(htx); blk; blk = htx_get_next_blk(htx, blk)) {
4104 if (htx_get_blk_type(blk) != HTX_BLK_DATA)
4105 continue;
4106 len += htx_get_blksz(blk);
4107 if (len >= bytes)
4108 goto end;
4109 }
4110 }
4111
4112 if ((chn->flags & CF_READ_TIMEOUT) || tick_is_expired(chn->analyse_exp, now_ms)) {
4113 if (!(chn->flags & CF_ISRESP))
4114 goto abort_req;
4115 goto abort_res;
4116 }
4117
4118 /* we get here if we need to wait for more data */
Christopher Fauletca5309a2023-04-17 16:17:32 +02004119 if (!(chn_prod(chn)->flags & (SC_FL_EOS|SC_FL_ABRT_DONE))) {
Christopher Faulet021a8e42021-03-29 10:46:38 +02004120 if (!tick_isset(chn->analyse_exp))
4121 chn->analyse_exp = tick_add_ifset(now_ms, time);
4122 ret = HTTP_RULE_RES_YIELD;
4123 }
4124
4125 end:
4126 return ret;
4127
Christopher Fauletf0d80df2023-01-13 10:20:20 +01004128 abort:
4129 http_reply_and_close(s, txn->status, http_error_message(s));
4130 ret = HTTP_RULE_RES_ABRT;
4131 goto end;
4132
Christopher Faulet021a8e42021-03-29 10:46:38 +02004133 abort_req:
4134 txn->status = 408;
4135 if (!(s->flags & SF_ERR_MASK))
4136 s->flags |= SF_ERR_CLITO;
Willy Tarreau4781b152021-04-06 13:53:36 +02004137 _HA_ATOMIC_INC(&sess->fe->fe_counters.failed_req);
Christopher Faulet021a8e42021-03-29 10:46:38 +02004138 if (sess->listener && sess->listener->counters)
Willy Tarreau4781b152021-04-06 13:53:36 +02004139 _HA_ATOMIC_INC(&sess->listener->counters->failed_req);
Christopher Fauletf0d80df2023-01-13 10:20:20 +01004140 goto abort;
Christopher Faulet021a8e42021-03-29 10:46:38 +02004141
4142 abort_res:
4143 txn->status = 504;
4144 if (!(s->flags & SF_ERR_MASK))
4145 s->flags |= SF_ERR_SRVTO;
Christopher Faulet021a8e42021-03-29 10:46:38 +02004146 stream_inc_http_fail_ctr(s);
Christopher Fauletf0d80df2023-01-13 10:20:20 +01004147 goto abort;
Christopher Faulet021a8e42021-03-29 10:46:38 +02004148}
4149
Willy Tarreaub49672d2022-05-27 10:13:37 +02004150void http_perform_server_redirect(struct stream *s, struct stconn *sc)
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004151{
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004152 struct channel *req = &s->req;
4153 struct channel *res = &s->res;
4154 struct server *srv;
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004155 struct htx *htx;
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004156 struct htx_sl *sl;
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004157 struct ist path, location;
4158 unsigned int flags;
Amaury Denoyellec453f952021-07-06 11:40:12 +02004159 struct http_uri_parser parser;
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004160
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004161 /*
4162 * Create the location
4163 */
4164 chunk_reset(&trash);
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004165
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004166 /* 1: add the server's prefix */
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004167 /* special prefix "/" means don't change URL */
4168 srv = __objt_server(s->target);
4169 if (srv->rdr_len != 1 || *srv->rdr_pfx != '/') {
4170 if (!chunk_memcat(&trash, srv->rdr_pfx, srv->rdr_len))
4171 return;
4172 }
4173
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004174 /* 2: add the request Path */
Christopher Faulet27ba2dc2018-12-05 11:53:24 +01004175 htx = htxbuf(&req->buf);
Christopher Faulet297fbb42019-05-13 14:41:27 +02004176 sl = http_get_stline(htx);
Amaury Denoyellec453f952021-07-06 11:40:12 +02004177 parser = http_uri_parser_init(htx_sl_req_uri(sl));
4178 path = http_parse_path(&parser);
Tim Duesterhused526372020-03-05 17:56:33 +01004179 if (!isttest(path))
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004180 return;
4181
4182 if (!chunk_memcat(&trash, path.ptr, path.len))
4183 return;
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004184 location = ist2(trash.area, trash.data);
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004185
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004186 /*
Ilya Shipitsin4a689da2022-10-29 09:34:32 +05004187 * Create the 302 response
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004188 */
4189 htx = htx_from_buf(&res->buf);
Christopher Faulet617ec5c2023-10-17 11:43:43 +02004190 flags = (HTX_SL_F_IS_RESP|HTX_SL_F_VER_11|HTX_SL_F_XFER_LEN|HTX_SL_F_CLEN|HTX_SL_F_BODYLESS);
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004191 sl = htx_add_stline(htx, HTX_BLK_RES_SL, flags,
4192 ist("HTTP/1.1"), ist("302"), ist("Found"));
4193 if (!sl)
4194 goto fail;
4195 sl->info.res.status = 302;
4196 s->txn->status = 302;
4197
4198 if (!htx_add_header(htx, ist("Cache-Control"), ist("no-cache")) ||
4199 !htx_add_header(htx, ist("Connection"), ist("close")) ||
4200 !htx_add_header(htx, ist("Content-length"), ist("0")) ||
4201 !htx_add_header(htx, ist("Location"), location))
4202 goto fail;
4203
Christopher Fauletd1ac2b92020-12-02 19:12:22 +01004204 if (!htx_add_endof(htx, HTX_BLK_EOH))
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004205 goto fail;
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004206
Christopher Fauletd1ac2b92020-12-02 19:12:22 +01004207 htx->flags |= HTX_FL_EOM;
Christopher Fauletc20afb82020-01-24 19:16:26 +01004208 htx_to_buf(htx, &res->buf);
Christopher Fauleta72a7e42020-01-28 09:28:11 +01004209 if (!http_forward_proxy_resp(s, 1))
4210 goto fail;
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004211
4212 /* return without error. */
Christopher Fauletcfc11c02023-04-13 16:10:23 +02004213 sc_abort(sc);
Christopher Fauletb2b1c3a2023-04-13 16:23:48 +02004214 sc_shutdown(sc);
Christopher Faulet50264b42022-03-30 19:39:30 +02004215 s->conn_err_type = STRM_ET_NONE;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004216 sc->state = SC_ST_CLO;
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004217
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004218 if (!(s->flags & SF_ERR_MASK))
4219 s->flags |= SF_ERR_LOCAL;
4220 if (!(s->flags & SF_FINST_MASK))
4221 s->flags |= SF_FINST_C;
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004222
4223 /* FIXME: we should increase a counter of redirects per server and per backend. */
4224 srv_inc_sess_ctr(srv);
4225 srv_set_sess_last(srv);
Christopher Faulet0eaed6b2018-11-28 17:46:40 +01004226 return;
4227
4228 fail:
4229 /* If an error occurred, remove the incomplete HTTP response from the
4230 * buffer */
Christopher Faulet202c6ce2019-01-07 14:57:35 +01004231 channel_htx_truncate(res, htx);
Christopher Fauletfefc73d2018-10-24 21:18:04 +02004232}
4233
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05004234/* This function terminates the request because it was completely analyzed or
Christopher Fauletf2824e62018-10-01 12:12:37 +02004235 * because an error was triggered during the body forwarding.
4236 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004237static void http_end_request(struct stream *s)
Christopher Fauletf2824e62018-10-01 12:12:37 +02004238{
4239 struct channel *chn = &s->req;
4240 struct http_txn *txn = s->txn;
4241
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004242 DBG_TRACE_ENTER(STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004243
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004244 if (unlikely(txn->req.msg_state < HTTP_MSG_DONE)) {
4245 DBG_TRACE_DEVEL("waiting end of the request", STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004246 return;
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004247 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02004248
4249 if (txn->req.msg_state == HTTP_MSG_DONE) {
Christopher Fauletf2824e62018-10-01 12:12:37 +02004250 /* No need to read anymore, the request was completely parsed.
4251 * We can shut the read side unless we want to abort_on_close,
4252 * or we have a POST request. The issue with POST requests is
4253 * that some browsers still send a CRLF after the request, and
4254 * this CRLF must be read so that it does not remain in the kernel
4255 * buffers, otherwise a close could cause an RST on some systems
4256 * (eg: Linux).
4257 */
Christopher Faulet769d0e92019-03-22 14:23:18 +01004258 if (!(s->be->options & PR_O_ABRT_CLOSE) && txn->meth != HTTP_METH_POST)
Christopher Fauletf2824e62018-10-01 12:12:37 +02004259 channel_dont_read(chn);
4260
4261 /* if the server closes the connection, we want to immediately react
4262 * and close the socket to save packets and syscalls.
4263 */
Willy Tarreaucb041662022-05-17 19:44:42 +02004264 s->scb->flags |= SC_FL_NOHALF;
Christopher Fauletf2824e62018-10-01 12:12:37 +02004265
4266 /* In any case we've finished parsing the request so we must
4267 * disable Nagle when sending data because 1) we're not going
4268 * to shut this side, and 2) the server is waiting for us to
4269 * send pending data.
4270 */
Christopher Faulet68ef2182023-03-17 15:38:18 +01004271 s->scb->flags |= SC_FL_SND_NEVERWAIT;
Christopher Fauletf2824e62018-10-01 12:12:37 +02004272
Christopher Fauletc2fba3f2023-03-01 16:03:17 +01004273 if (txn->rsp.msg_state < HTTP_MSG_BODY ||
4274 (txn->rsp.msg_state < HTTP_MSG_DONE && s->scb->state != SC_ST_CLO)) {
Christopher Fauletaf124362023-02-14 10:48:02 +01004275 /* The server has not finished to respond and the
4276 * backend SC is not closed, so we don't want to move in
4277 * order not to upset it.
Christopher Fauletd01ce402019-01-02 17:44:13 +01004278 */
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004279 DBG_TRACE_DEVEL("waiting end of the response", STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletd01ce402019-01-02 17:44:13 +01004280 return;
4281 }
4282
Christopher Fauletf2824e62018-10-01 12:12:37 +02004283 /* When we get here, it means that both the request and the
4284 * response have finished receiving. Depending on the connection
4285 * mode, we'll have to wait for the last bytes to leave in either
4286 * direction, and sometimes for a close to be effective.
4287 */
Christopher Fauletc41547b2019-07-16 14:32:23 +02004288 if (txn->flags & TX_CON_WANT_TUN) {
Christopher Fauletf2824e62018-10-01 12:12:37 +02004289 /* Tunnel mode will not have any analyser so it needs to
4290 * poll for reads.
4291 */
Christopher Faulet97047972023-04-17 08:52:10 +02004292 channel_auto_read(&s->req);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004293 txn->req.msg_state = HTTP_MSG_TUNNEL;
Christopher Faulet27c17d12023-04-18 11:01:51 +02004294 if (txn->rsp.msg_state != HTTP_MSG_TUNNEL)
4295 s->res.flags |= CF_WAKE_ONCE;
Christopher Fauletf2824e62018-10-01 12:12:37 +02004296 }
4297 else {
4298 /* we're not expecting any new data to come for this
4299 * transaction, so we can close it.
Christopher Faulet9768c262018-10-22 09:34:31 +02004300 *
4301 * However, there is an exception if the response
4302 * length is undefined. In this case, we need to wait
4303 * the close from the server. The response will be
4304 * switched in TUNNEL mode until the end.
Christopher Fauletf2824e62018-10-01 12:12:37 +02004305 */
4306 if (!(txn->rsp.flags & HTTP_MSGF_XFER_LEN) &&
4307 txn->rsp.msg_state != HTTP_MSG_CLOSED)
Christopher Faulet9768c262018-10-22 09:34:31 +02004308 goto check_channel_flags;
Christopher Fauletf2824e62018-10-01 12:12:37 +02004309
Christopher Faulet64350bb2023-04-13 16:37:37 +02004310 if (!(s->scb->flags & (SC_FL_SHUT_DONE|SC_FL_SHUT_WANTED))) {
Christopher Faulet12762f02023-04-13 15:40:10 +02004311 sc_schedule_abort(s->scf);
Christopher Fauletdf7cd712023-04-13 15:56:26 +02004312 sc_schedule_shutdown(s->scb);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004313 }
4314 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02004315 goto check_channel_flags;
4316 }
4317
4318 if (txn->req.msg_state == HTTP_MSG_CLOSING) {
4319 http_msg_closing:
4320 /* nothing else to forward, just waiting for the output buffer
Christopher Fauletdf7cd712023-04-13 15:56:26 +02004321 * to be empty and for the shut_wanted to take effect.
Christopher Fauletf2824e62018-10-01 12:12:37 +02004322 */
4323 if (channel_is_empty(chn)) {
4324 txn->req.msg_state = HTTP_MSG_CLOSED;
4325 goto http_msg_closed;
4326 }
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004327 DBG_TRACE_LEAVE(STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004328 return;
4329 }
4330
4331 if (txn->req.msg_state == HTTP_MSG_CLOSED) {
4332 http_msg_closed:
Christopher Fauletf2824e62018-10-01 12:12:37 +02004333 /* if we don't know whether the server will close, we need to hard close */
4334 if (txn->rsp.flags & HTTP_MSGF_XFER_LEN)
Willy Tarreaucb041662022-05-17 19:44:42 +02004335 s->scb->flags |= SC_FL_NOLINGER; /* we want to close ASAP */
Christopher Fauletf2824e62018-10-01 12:12:37 +02004336 /* see above in MSG_DONE why we only do this in these states */
Christopher Faulet769d0e92019-03-22 14:23:18 +01004337 if (!(s->be->options & PR_O_ABRT_CLOSE))
Christopher Fauletf2824e62018-10-01 12:12:37 +02004338 channel_dont_read(chn);
4339 goto end;
4340 }
4341
4342 check_channel_flags:
4343 /* Here, we are in HTTP_MSG_DONE or HTTP_MSG_TUNNEL */
Christopher Faulet64350bb2023-04-13 16:37:37 +02004344 if (s->scb->flags & (SC_FL_SHUT_DONE|SC_FL_SHUT_WANTED)) {
Christopher Fauletf2824e62018-10-01 12:12:37 +02004345 /* if we've just closed an output, let's switch */
4346 txn->req.msg_state = HTTP_MSG_CLOSING;
4347 goto http_msg_closing;
4348 }
4349
4350 end:
4351 chn->analysers &= AN_REQ_FLT_END;
Christopher Faulet198ef8b2020-12-15 13:32:55 +01004352 if (txn->req.msg_state == HTTP_MSG_TUNNEL) {
Christopher Faulet68ef2182023-03-17 15:38:18 +01004353 s->scb->flags |= SC_FL_SND_NEVERWAIT;
Christopher Faulet198ef8b2020-12-15 13:32:55 +01004354 if (HAS_REQ_DATA_FILTERS(s))
Christopher Fauletf2824e62018-10-01 12:12:37 +02004355 chn->analysers |= AN_REQ_FLT_XFER_DATA;
Christopher Faulet27c17d12023-04-18 11:01:51 +02004356 else
4357 c_adv(chn, htxbuf(&chn->buf)->data - co_data(chn));
Christopher Faulet198ef8b2020-12-15 13:32:55 +01004358 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02004359 channel_auto_close(chn);
4360 channel_auto_read(chn);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004361 DBG_TRACE_LEAVE(STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004362}
4363
4364
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +05004365/* This function terminates the response because it was completely analyzed or
Christopher Fauletf2824e62018-10-01 12:12:37 +02004366 * because an error was triggered during the body forwarding.
4367 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004368static void http_end_response(struct stream *s)
Christopher Fauletf2824e62018-10-01 12:12:37 +02004369{
4370 struct channel *chn = &s->res;
4371 struct http_txn *txn = s->txn;
4372
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004373 DBG_TRACE_ENTER(STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004374
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004375 if (unlikely(txn->rsp.msg_state < HTTP_MSG_DONE)) {
4376 DBG_TRACE_DEVEL("waiting end of the response", STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004377 return;
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004378 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02004379
4380 if (txn->rsp.msg_state == HTTP_MSG_DONE) {
4381 /* In theory, we don't need to read anymore, but we must
4382 * still monitor the server connection for a possible close
4383 * while the request is being uploaded, so we don't disable
4384 * reading.
4385 */
4386 /* channel_dont_read(chn); */
4387
Christopher Fauletaf124362023-02-14 10:48:02 +01004388 if (txn->req.msg_state < HTTP_MSG_DONE && s->scf->state != SC_ST_CLO) {
Christopher Fauletf2824e62018-10-01 12:12:37 +02004389 /* The client seems to still be sending data, probably
4390 * because we got an error response during an upload.
4391 * We have the choice of either breaking the connection
4392 * or letting it pass through. Let's do the later.
4393 */
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004394 DBG_TRACE_DEVEL("waiting end of the request", STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004395 return;
4396 }
4397
4398 /* When we get here, it means that both the request and the
4399 * response have finished receiving. Depending on the connection
4400 * mode, we'll have to wait for the last bytes to leave in either
4401 * direction, and sometimes for a close to be effective.
4402 */
Christopher Fauletc41547b2019-07-16 14:32:23 +02004403 if (txn->flags & TX_CON_WANT_TUN) {
Christopher Faulet97047972023-04-17 08:52:10 +02004404 channel_auto_read(&s->res);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004405 txn->rsp.msg_state = HTTP_MSG_TUNNEL;
Christopher Faulet27c17d12023-04-18 11:01:51 +02004406 if (txn->req.msg_state != HTTP_MSG_TUNNEL)
4407 s->req.flags |= CF_WAKE_ONCE;
Christopher Fauletf2824e62018-10-01 12:12:37 +02004408 }
4409 else {
4410 /* we're not expecting any new data to come for this
4411 * transaction, so we can close it.
4412 */
Christopher Faulet64350bb2023-04-13 16:37:37 +02004413 if (!(s->scf->flags & (SC_FL_SHUT_DONE|SC_FL_SHUT_WANTED))) {
Christopher Faulet12762f02023-04-13 15:40:10 +02004414 sc_schedule_abort(s->scb);
Christopher Fauletdf7cd712023-04-13 15:56:26 +02004415 sc_schedule_shutdown(s->scf);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004416 }
4417 }
4418 goto check_channel_flags;
4419 }
4420
4421 if (txn->rsp.msg_state == HTTP_MSG_CLOSING) {
4422 http_msg_closing:
4423 /* nothing else to forward, just waiting for the output buffer
Christopher Fauletdf7cd712023-04-13 15:56:26 +02004424 * to be empty and for the shut_wanted to take effect.
Christopher Fauletf2824e62018-10-01 12:12:37 +02004425 */
4426 if (channel_is_empty(chn)) {
4427 txn->rsp.msg_state = HTTP_MSG_CLOSED;
4428 goto http_msg_closed;
4429 }
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004430 DBG_TRACE_LEAVE(STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004431 return;
4432 }
4433
4434 if (txn->rsp.msg_state == HTTP_MSG_CLOSED) {
4435 http_msg_closed:
4436 /* drop any pending data */
Christopher Faulet202c6ce2019-01-07 14:57:35 +01004437 channel_htx_truncate(&s->req, htxbuf(&s->req.buf));
Christopher Faulet9768c262018-10-22 09:34:31 +02004438 channel_abort(&s->req);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004439 goto end;
4440 }
4441
4442 check_channel_flags:
4443 /* Here, we are in HTTP_MSG_DONE or HTTP_MSG_TUNNEL */
Christopher Faulet64350bb2023-04-13 16:37:37 +02004444 if (s->scf->flags & (SC_FL_SHUT_DONE|SC_FL_SHUT_WANTED)) {
Christopher Fauletf2824e62018-10-01 12:12:37 +02004445 /* if we've just closed an output, let's switch */
4446 txn->rsp.msg_state = HTTP_MSG_CLOSING;
4447 goto http_msg_closing;
4448 }
4449
4450 end:
4451 chn->analysers &= AN_RES_FLT_END;
Christopher Faulet198ef8b2020-12-15 13:32:55 +01004452 if (txn->rsp.msg_state == HTTP_MSG_TUNNEL) {
Christopher Faulet68ef2182023-03-17 15:38:18 +01004453 s->scf->flags |= SC_FL_SND_NEVERWAIT;
Christopher Faulet198ef8b2020-12-15 13:32:55 +01004454 if (HAS_RSP_DATA_FILTERS(s))
4455 chn->analysers |= AN_RES_FLT_XFER_DATA;
Christopher Faulet27c17d12023-04-18 11:01:51 +02004456 else
4457 c_adv(chn, htxbuf(&chn->buf)->data - co_data(chn));
Christopher Faulet198ef8b2020-12-15 13:32:55 +01004458 }
Christopher Fauletf2824e62018-10-01 12:12:37 +02004459 channel_auto_close(chn);
4460 channel_auto_read(chn);
Christopher Fauleteea8fc72019-11-05 16:18:10 +01004461 DBG_TRACE_LEAVE(STRM_EV_HTTP_ANA, s, txn);
Christopher Fauletf2824e62018-10-01 12:12:37 +02004462}
4463
Christopher Fauletef70e252020-01-28 09:26:19 +01004464/* Forward a response generated by HAProxy (error/redirect/return). This
4465 * function forwards all pending incoming data. If <final> is set to 0, nothing
4466 * more is performed. It is used for 1xx informational messages. Otherwise, the
Christopher Faulet507479b2020-05-15 12:29:46 +02004467 * transaction is terminated and the request is emptied. On success 1 is
Christopher Faulet40e6b552020-06-25 16:04:50 +02004468 * returned. If an error occurred, 0 is returned. If it fails, this function
4469 * only exits. It is the caller responsibility to do the cleanup.
Christopher Fauletef70e252020-01-28 09:26:19 +01004470 */
4471int http_forward_proxy_resp(struct stream *s, int final)
4472{
4473 struct channel *req = &s->req;
4474 struct channel *res = &s->res;
4475 struct htx *htx = htxbuf(&res->buf);
4476 size_t data;
4477
4478 if (final) {
4479 htx->flags |= HTX_FL_PROXY_RESP;
Christopher Faulet507479b2020-05-15 12:29:46 +02004480
Christopher Fauletaab1b672020-11-18 16:44:02 +01004481 if (!htx_is_empty(htx) && !http_eval_after_res_rules(s))
Christopher Faulet6d0c3df2020-01-22 09:26:35 +01004482 return 0;
Christopher Fauletef70e252020-01-28 09:26:19 +01004483
Christopher Fauletd6c48362020-10-19 18:01:38 +02004484 if (s->txn->meth == HTTP_METH_HEAD)
4485 htx_skip_msg_payload(htx);
4486
Christopher Fauletef70e252020-01-28 09:26:19 +01004487 channel_auto_read(req);
4488 channel_abort(req);
Christopher Fauletef70e252020-01-28 09:26:19 +01004489 channel_htx_erase(req, htxbuf(&req->buf));
4490
Christopher Fauletef70e252020-01-28 09:26:19 +01004491 channel_auto_read(res);
4492 channel_auto_close(res);
Christopher Faulet12762f02023-04-13 15:40:10 +02004493 sc_schedule_abort(s->scb);
Christopher Faulet904763f2023-03-22 14:53:11 +01004494 s->scb->flags |= SC_FL_EOI; /* The response is terminated, add EOI */
Christopher Faulet42432f32020-11-20 17:43:16 +01004495 htxbuf(&res->buf)->flags |= HTX_FL_EOM; /* no more data are expected */
Christopher Fauletef70e252020-01-28 09:26:19 +01004496 }
Christopher Fauletcf6898c2020-06-25 15:55:11 +02004497 else {
Christopher Faulet904763f2023-03-22 14:53:11 +01004498 /* Send ASAP informational messages. Rely on SC_FL_EOI for final
Christopher Fauletcf6898c2020-06-25 15:55:11 +02004499 * response.
4500 */
Christopher Faulet5c281d52023-03-16 15:53:28 +01004501 s->scf->flags |= SC_FL_SND_ASAP;
Christopher Fauletcf6898c2020-06-25 15:55:11 +02004502 }
Christopher Fauletef70e252020-01-28 09:26:19 +01004503
4504 data = htx->data - co_data(res);
4505 c_adv(res, data);
4506 htx->first = -1;
4507 res->total += data;
4508 return 1;
4509}
4510
Willy Tarreaub49672d2022-05-27 10:13:37 +02004511void http_server_error(struct stream *s, struct stconn *sc, int err,
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004512 int finst, struct http_reply *msg)
Christopher Faulet0f226952018-10-22 09:29:56 +02004513{
Christopher Faulet72c7d8d2020-01-27 15:32:25 +01004514 http_reply_and_close(s, s->txn->status, msg);
Christopher Faulet0f226952018-10-22 09:29:56 +02004515 if (!(s->flags & SF_ERR_MASK))
4516 s->flags |= err;
4517 if (!(s->flags & SF_FINST_MASK))
4518 s->flags |= finst;
4519}
4520
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004521void http_reply_and_close(struct stream *s, short status, struct http_reply *msg)
Christopher Faulet0f226952018-10-22 09:29:56 +02004522{
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004523 if (!msg) {
4524 channel_htx_truncate(&s->res, htxbuf(&s->res.buf));
4525 goto end;
4526 }
4527
4528 if (http_reply_message(s, msg) == -1) {
4529 /* On error, return a 500 error message, but don't rewrite it if
Christopher Faulet40e6b552020-06-25 16:04:50 +02004530 * it is already an internal error. If it was already a "const"
4531 * 500 error, just fail.
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004532 */
Christopher Faulet40e6b552020-06-25 16:04:50 +02004533 if (s->txn->status == 500) {
4534 if (s->txn->flags & TX_CONST_REPLY)
4535 goto end;
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004536 s->txn->flags |= TX_CONST_REPLY;
Christopher Faulet40e6b552020-06-25 16:04:50 +02004537 }
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004538 s->txn->status = 500;
4539 s->txn->http_reply = NULL;
4540 return http_reply_and_close(s, s->txn->status, http_error_message(s));
4541 }
4542
4543end:
Christopher Faulet2d565002021-09-10 09:17:50 +02004544 /* At this staged, HTTP analysis is finished */
4545 s->req.analysers &= AN_REQ_FLT_END;
4546 s->req.analyse_exp = TICK_ETERNITY;
4547
4548 s->res.analysers &= AN_RES_FLT_END;
4549 s->res.analyse_exp = TICK_ETERNITY;
4550
Christopher Faulet0f226952018-10-22 09:29:56 +02004551 channel_auto_read(&s->req);
4552 channel_abort(&s->req);
Christopher Faulet202c6ce2019-01-07 14:57:35 +01004553 channel_htx_erase(&s->req, htxbuf(&s->req.buf));
Christopher Faulet72c7d8d2020-01-27 15:32:25 +01004554 channel_auto_read(&s->res);
4555 channel_auto_close(&s->res);
Christopher Faulet12762f02023-04-13 15:40:10 +02004556 sc_schedule_abort(s->scb);
Christopher Faulet0f226952018-10-22 09:29:56 +02004557}
4558
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004559struct http_reply *http_error_message(struct stream *s)
Christopher Fauleta7b677c2018-11-29 16:48:49 +01004560{
4561 const int msgnum = http_get_status_idx(s->txn->status);
4562
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004563 if (s->txn->http_reply)
4564 return s->txn->http_reply;
4565 else if (s->be->replies[msgnum])
4566 return s->be->replies[msgnum];
4567 else if (strm_fe(s)->replies[msgnum])
4568 return strm_fe(s)->replies[msgnum];
Christopher Fauleta7b677c2018-11-29 16:48:49 +01004569 else
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004570 return &http_err_replies[msgnum];
Christopher Fauleta7b677c2018-11-29 16:48:49 +01004571}
4572
Christopher Faulet40e6b552020-06-25 16:04:50 +02004573/* Produces an HTX message from an http reply. Depending on the http reply type,
4574 * a, errorfile, an raw file or a log-format string is used. On success, it
4575 * returns 0. If an error occurs -1 is returned. If it fails, this function only
4576 * exits. It is the caller responsibility to do the cleanup.
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004577 */
Christopher Fauletae43b6c2020-05-27 15:24:22 +02004578int http_reply_to_htx(struct stream *s, struct htx *htx, struct http_reply *reply)
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004579{
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004580 struct buffer *errmsg;
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004581 struct htx_sl *sl;
4582 struct buffer *body = NULL;
4583 const char *status, *reason, *clen, *ctype;
4584 unsigned int slflags;
4585 int ret = 0;
4586
Christopher Faulete29a97e2020-05-14 14:49:25 +02004587 /*
4588 * - HTTP_REPLY_ERRFILES unexpected here. handled as no payload if so
4589 *
4590 * - HTTP_REPLY_INDIRECT: switch on another reply if defined or handled
4591 * as no payload if NULL. the TXN status code is set with the status
4592 * of the original reply.
4593 */
4594
4595 if (reply->type == HTTP_REPLY_INDIRECT) {
4596 if (reply->body.reply)
4597 reply = reply->body.reply;
4598 }
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004599 if (reply->type == HTTP_REPLY_ERRMSG && !reply->body.errmsg) {
4600 /* get default error message */
4601 if (reply == s->txn->http_reply)
4602 s->txn->http_reply = NULL;
4603 reply = http_error_message(s);
4604 if (reply->type == HTTP_REPLY_INDIRECT) {
4605 if (reply->body.reply)
4606 reply = reply->body.reply;
4607 }
4608 }
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004609
4610 if (reply->type == HTTP_REPLY_ERRMSG) {
4611 /* implicit or explicit error message*/
4612 errmsg = reply->body.errmsg;
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004613 if (errmsg && !b_is_null(errmsg)) {
Christopher Faulet20567362020-05-15 14:52:49 +02004614 if (!htx_copy_msg(htx, errmsg))
Christopher Faulet8dfeccf2020-05-15 14:16:29 +02004615 goto fail;
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004616 }
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004617 }
4618 else {
4619 /* no payload, file or log-format string */
4620 if (reply->type == HTTP_REPLY_RAW) {
4621 /* file */
4622 body = &reply->body.obj;
4623 }
4624 else if (reply->type == HTTP_REPLY_LOGFMT) {
4625 /* log-format string */
4626 body = alloc_trash_chunk();
4627 if (!body)
4628 goto fail_alloc;
4629 body->data = build_logline(s, body->area, body->size, &reply->body.fmt);
4630 }
4631 /* else no payload */
4632
4633 status = ultoa(reply->status);
4634 reason = http_get_reason(reply->status);
4635 slflags = (HTX_SL_F_IS_RESP|HTX_SL_F_VER_11|HTX_SL_F_XFER_LEN|HTX_SL_F_CLEN);
4636 if (!body || !b_data(body))
4637 slflags |= HTX_SL_F_BODYLESS;
4638 sl = htx_add_stline(htx, HTX_BLK_RES_SL, slflags, ist("HTTP/1.1"), ist(status), ist(reason));
4639 if (!sl)
4640 goto fail;
4641 sl->info.res.status = reply->status;
4642
4643 clen = (body ? ultoa(b_data(body)) : "0");
4644 ctype = reply->ctype;
4645
4646 if (!LIST_ISEMPTY(&reply->hdrs)) {
4647 struct http_reply_hdr *hdr;
4648 struct buffer *value = alloc_trash_chunk();
4649
4650 if (!value)
4651 goto fail;
4652
4653 list_for_each_entry(hdr, &reply->hdrs, list) {
4654 chunk_reset(value);
4655 value->data = build_logline(s, value->area, value->size, &hdr->value);
4656 if (b_data(value) && !htx_add_header(htx, hdr->name, ist2(b_head(value), b_data(value)))) {
4657 free_trash_chunk(value);
4658 goto fail;
4659 }
4660 chunk_reset(value);
4661 }
4662 free_trash_chunk(value);
4663 }
4664
4665 if (!htx_add_header(htx, ist("content-length"), ist(clen)) ||
4666 (body && b_data(body) && ctype && !htx_add_header(htx, ist("content-type"), ist(ctype))) ||
4667 !htx_add_endof(htx, HTX_BLK_EOH) ||
Christopher Fauletd1ac2b92020-12-02 19:12:22 +01004668 (body && b_data(body) && !htx_add_data_atonce(htx, ist2(b_head(body), b_data(body)))))
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004669 goto fail;
Christopher Fauletd1ac2b92020-12-02 19:12:22 +01004670
4671 htx->flags |= HTX_FL_EOM;
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004672 }
4673
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004674 leave:
4675 if (reply->type == HTTP_REPLY_LOGFMT)
4676 free_trash_chunk(body);
4677 return ret;
4678
4679 fail_alloc:
4680 if (!(s->flags & SF_ERR_MASK))
4681 s->flags |= SF_ERR_RESOURCE;
Christopher Faulet97e466c2020-05-15 15:12:47 +02004682 /* fall through */
4683 fail:
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004684 ret = -1;
4685 goto leave;
Christopher Faulet97e466c2020-05-15 15:12:47 +02004686}
4687
4688/* Send an http reply to the client. On success, it returns 0. If an error
Christopher Faulet40e6b552020-06-25 16:04:50 +02004689 * occurs -1 is returned and the response channel is truncated, removing this
4690 * way the faulty reply. This function may fail when the reply is formatted
4691 * (http_reply_to_htx) or when the reply is forwarded
4692 * (http_forward_proxy_resp). On the last case, it is because a
4693 * http-after-response rule fails.
Christopher Faulet97e466c2020-05-15 15:12:47 +02004694 */
4695int http_reply_message(struct stream *s, struct http_reply *reply)
4696{
4697 struct channel *res = &s->res;
4698 struct htx *htx = htx_from_buf(&res->buf);
4699
4700 if (s->txn->status == -1)
4701 s->txn->status = reply->status;
4702 channel_htx_truncate(res, htx);
4703
4704 if (http_reply_to_htx(s, htx, reply) == -1)
4705 goto fail;
4706
4707 htx_to_buf(htx, &s->res.buf);
4708 if (!http_forward_proxy_resp(s, 1))
4709 goto fail;
4710 return 0;
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004711
4712 fail:
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004713 channel_htx_truncate(res, htx);
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004714 if (!(s->flags & SF_ERR_MASK))
4715 s->flags |= SF_ERR_PRXCOND;
Christopher Faulet97e466c2020-05-15 15:12:47 +02004716 return -1;
Christopher Faulet0e2ad612020-05-13 16:38:37 +02004717}
4718
Christopher Faulet50264b42022-03-30 19:39:30 +02004719/* Return the error message corresponding to s->conn_err_type. It is assumed
Christopher Faulet304cc402019-07-15 15:46:28 +02004720 * that the server side is closed. Note that err_type is actually a
4721 * bitmask, where almost only aborts may be cumulated with other
4722 * values. We consider that aborted operations are more important
4723 * than timeouts or errors due to the fact that nobody else in the
4724 * logs might explain incomplete retries. All others should avoid
4725 * being cumulated. It should normally not be possible to have multiple
4726 * aborts at once, but just in case, the first one in sequence is reported.
4727 * Note that connection errors appearing on the second request of a keep-alive
4728 * connection are not reported since this allows the client to retry.
4729 */
Willy Tarreaub49672d2022-05-27 10:13:37 +02004730void http_return_srv_error(struct stream *s, struct stconn *sc)
Christopher Faulet304cc402019-07-15 15:46:28 +02004731{
Christopher Faulet50264b42022-03-30 19:39:30 +02004732 int err_type = s->conn_err_type;
Christopher Faulet304cc402019-07-15 15:46:28 +02004733
4734 /* set s->txn->status for http_error_message(s) */
Christopher Faulet50264b42022-03-30 19:39:30 +02004735 if (err_type & STRM_ET_QUEUE_ABRT) {
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004736 s->txn->status = -1;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004737 http_server_error(s, sc, SF_ERR_CLICL, SF_FINST_Q, NULL);
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004738 }
Christopher Faulet50264b42022-03-30 19:39:30 +02004739 else if (err_type & STRM_ET_CONN_ABRT) {
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004740 s->txn->status = -1;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004741 http_server_error(s, sc, SF_ERR_CLICL, SF_FINST_C, NULL);
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004742 }
Christopher Faulet50264b42022-03-30 19:39:30 +02004743 else if (err_type & STRM_ET_QUEUE_TO) {
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004744 s->txn->status = 503;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004745 http_server_error(s, sc, SF_ERR_SRVTO, SF_FINST_Q,
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004746 http_error_message(s));
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004747 }
Christopher Faulet50264b42022-03-30 19:39:30 +02004748 else if (err_type & STRM_ET_QUEUE_ERR) {
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004749 s->txn->status = 503;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004750 http_server_error(s, sc, SF_ERR_SRVCL, SF_FINST_Q,
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004751 http_error_message(s));
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004752 }
Christopher Faulet50264b42022-03-30 19:39:30 +02004753 else if (err_type & STRM_ET_CONN_TO) {
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004754 s->txn->status = 503;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004755 http_server_error(s, sc, SF_ERR_SRVTO, SF_FINST_C,
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004756 (s->txn->flags & TX_NOT_FIRST) ? NULL :
4757 http_error_message(s));
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004758 }
Christopher Faulet50264b42022-03-30 19:39:30 +02004759 else if (err_type & STRM_ET_CONN_ERR) {
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004760 s->txn->status = 503;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004761 http_server_error(s, sc, SF_ERR_SRVCL, SF_FINST_C,
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004762 (s->flags & SF_SRV_REUSED) ? NULL :
4763 http_error_message(s));
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004764 }
Christopher Faulet50264b42022-03-30 19:39:30 +02004765 else if (err_type & STRM_ET_CONN_RES) {
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004766 s->txn->status = 503;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004767 http_server_error(s, sc, SF_ERR_RESOURCE, SF_FINST_C,
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004768 (s->txn->flags & TX_NOT_FIRST) ? NULL :
4769 http_error_message(s));
Christopher Faulet5e702fc2021-06-02 14:07:24 +02004770 }
Christopher Faulet50264b42022-03-30 19:39:30 +02004771 else { /* STRM_ET_CONN_OTHER and others */
Christopher Faulet304cc402019-07-15 15:46:28 +02004772 s->txn->status = 500;
Willy Tarreaub49672d2022-05-27 10:13:37 +02004773 http_server_error(s, sc, SF_ERR_INTERNAL, SF_FINST_C,
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004774 http_error_message(s));
Christopher Faulet304cc402019-07-15 15:46:28 +02004775 }
4776}
4777
Christopher Fauleta7b677c2018-11-29 16:48:49 +01004778
Christopher Faulet4a28a532019-03-01 11:19:40 +01004779/* Handle Expect: 100-continue for HTTP/1.1 messages if necessary. It returns 0
4780 * on success and -1 on error.
4781 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004782static int http_handle_expect_hdr(struct stream *s, struct htx *htx, struct http_msg *msg)
Christopher Faulet4a28a532019-03-01 11:19:40 +01004783{
4784 /* If we have HTTP/1.1 message with a body and Expect: 100-continue,
4785 * then we must send an HTTP/1.1 100 Continue intermediate response.
4786 */
Christopher Fauletffcffa82023-04-05 10:33:31 +02004787 if (!(msg->flags & HTTP_MSGF_EXPECT_CHECKED) &&
4788 (msg->flags & HTTP_MSGF_VER_11) &&
Christopher Faulet4a28a532019-03-01 11:19:40 +01004789 (msg->flags & (HTTP_MSGF_CNT_LEN|HTTP_MSGF_TE_CHNK))) {
4790 struct ist hdr = { .ptr = "Expect", .len = 6 };
4791 struct http_hdr_ctx ctx;
4792
4793 ctx.blk = NULL;
4794 /* Expect is allowed in 1.1, look for it */
4795 if (http_find_header(htx, hdr, &ctx, 0) &&
4796 unlikely(isteqi(ctx.value, ist2("100-continue", 12)))) {
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004797 if (http_reply_100_continue(s) == -1)
Christopher Faulet4a28a532019-03-01 11:19:40 +01004798 return -1;
4799 http_remove_header(htx, &ctx);
4800 }
4801 }
Christopher Fauletffcffa82023-04-05 10:33:31 +02004802 msg->flags |= HTTP_MSGF_EXPECT_CHECKED;
Christopher Faulet4a28a532019-03-01 11:19:40 +01004803 return 0;
4804}
4805
Christopher Faulet23a3c792018-11-28 10:01:23 +01004806/* Send a 100-Continue response to the client. It returns 0 on success and -1
4807 * on error. The response channel is updated accordingly.
4808 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004809static int http_reply_100_continue(struct stream *s)
Christopher Faulet23a3c792018-11-28 10:01:23 +01004810{
4811 struct channel *res = &s->res;
4812 struct htx *htx = htx_from_buf(&res->buf);
4813 struct htx_sl *sl;
4814 unsigned int flags = (HTX_SL_F_IS_RESP|HTX_SL_F_VER_11|
4815 HTX_SL_F_XFER_LEN|HTX_SL_F_BODYLESS);
Christopher Faulet23a3c792018-11-28 10:01:23 +01004816
4817 sl = htx_add_stline(htx, HTX_BLK_RES_SL, flags,
4818 ist("HTTP/1.1"), ist("100"), ist("Continue"));
4819 if (!sl)
4820 goto fail;
4821 sl->info.res.status = 100;
4822
Christopher Faulet1d5ec092019-06-26 14:23:54 +02004823 if (!htx_add_endof(htx, HTX_BLK_EOH))
Christopher Faulet23a3c792018-11-28 10:01:23 +01004824 goto fail;
4825
Christopher Fauleta72a7e42020-01-28 09:28:11 +01004826 if (!http_forward_proxy_resp(s, 0))
4827 goto fail;
Christopher Faulet23a3c792018-11-28 10:01:23 +01004828 return 0;
4829
4830 fail:
4831 /* If an error occurred, remove the incomplete HTTP response from the
4832 * buffer */
Christopher Faulet202c6ce2019-01-07 14:57:35 +01004833 channel_htx_truncate(res, htx);
Christopher Faulet23a3c792018-11-28 10:01:23 +01004834 return -1;
4835}
4836
Christopher Faulet12c51e22018-11-28 15:59:42 +01004837
Christopher Faulet0f226952018-10-22 09:29:56 +02004838/*
4839 * Capture headers from message <htx> according to header list <cap_hdr>, and
4840 * fill the <cap> pointers appropriately.
4841 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004842static void http_capture_headers(struct htx *htx, char **cap, struct cap_hdr *cap_hdr)
Christopher Faulet0f226952018-10-22 09:29:56 +02004843{
4844 struct cap_hdr *h;
4845 int32_t pos;
4846
Christopher Fauleta3f15502019-05-13 15:27:23 +02004847 for (pos = htx_get_first(htx); pos != -1; pos = htx_get_next(htx, pos)) {
Christopher Faulet0f226952018-10-22 09:29:56 +02004848 struct htx_blk *blk = htx_get_blk(htx, pos);
4849 enum htx_blk_type type = htx_get_blk_type(blk);
4850 struct ist n, v;
4851
4852 if (type == HTX_BLK_EOH)
4853 break;
4854 if (type != HTX_BLK_HDR)
4855 continue;
4856
4857 n = htx_get_blk_name(htx, blk);
4858
4859 for (h = cap_hdr; h; h = h->next) {
4860 if (h->namelen && (h->namelen == n.len) &&
4861 (strncasecmp(n.ptr, h->name, h->namelen) == 0)) {
4862 if (cap[h->index] == NULL)
4863 cap[h->index] =
4864 pool_alloc(h->pool);
4865
4866 if (cap[h->index] == NULL) {
4867 ha_alert("HTTP capture : out of memory.\n");
4868 break;
4869 }
4870
4871 v = htx_get_blk_value(htx, blk);
Tim Duesterhus2471f5c2021-11-08 09:05:01 +01004872 v = isttrim(v, h->len);
Christopher Faulet0f226952018-10-22 09:29:56 +02004873
4874 memcpy(cap[h->index], v.ptr, v.len);
4875 cap[h->index][v.len]=0;
4876 }
4877 }
4878 }
4879}
4880
/* Removes from a header the value located between the delimiters <*from> and
 * <next>. The header itself spans from <start> to <end>. The bytes following
 * the removed value are moved down with memmove(), and the function returns
 * the difference between the destination and the source of that move, i.e.
 * the signed displacement applied to the tail of the header. <*from> is
 * updated when blanks preceding it were swallowed. The following rules are
 * applied as far as possible :
 *   - when <*from> equals <start> (first value removed), the <next> delimiter
 *     is dropped together with the blanks following it ;
 *   - otherwise blanks located before <*from> are removed, the <next>
 *     delimiter takes the place of the old one, and it is followed by exactly
 *     one space provided there is enough room in the area being rewritten ;
 *     blanks following <next> are dropped.
 *
 * The caller must guarantee that :
 *   - <*from> points to a valid delimiter or to <start> ;
 *   - <next> points to a valid delimiter or to <end> ;
 *   - at least one non-blank character exists before <*from>, otherwise the
 *     backward scan would run past the beginning of the header.
 */
static int http_del_hdr_value(char *start, char *end, char **from, char *next)
{
	char *dst = *from;

	if (dst != start) {
		/* drop the blanks which preceded the old delimiter */
		while (HTTP_IS_SPHT(dst[-1]))
			dst--;
		*from = dst;

		/* unless the removed value was the last one, carry the next
		 * delimiter over and, if there is room, a single space.
		 */
		if (next < end) {
			*dst++ = *next++;
			if (dst + 1 < next)
				*dst++ = ' ';
		}
	}
	else if (next < end) {
		/* first value removed: simply swallow the delimiter */
		next++;
	}

	/* in both cases, blanks before the next value are useless */
	while (next < end && HTTP_IS_SPHT(*next))
		next++;

	memmove(dst, next, end - next);
	return (dst - next);
}
4931
Christopher Faulet0f226952018-10-22 09:29:56 +02004932
4933/* Formats the start line of the request (without CRLF) and puts it in <str> and
Joseph Herlantc42c0e92018-11-25 10:43:27 -08004934 * return the written length. The line can be truncated if it exceeds <len>.
Christopher Faulet0f226952018-10-22 09:29:56 +02004935 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004936static size_t http_fmt_req_line(const struct htx_sl *sl, char *str, size_t len)
Christopher Faulet0f226952018-10-22 09:29:56 +02004937{
4938 struct ist dst = ist2(str, 0);
4939
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004940 if (istcat(&dst, htx_sl_req_meth(sl), len) == -1)
Christopher Faulet0f226952018-10-22 09:29:56 +02004941 goto end;
4942 if (dst.len + 1 > len)
4943 goto end;
4944 dst.ptr[dst.len++] = ' ';
4945
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004946 if (istcat(&dst, htx_sl_req_uri(sl), len) == -1)
Christopher Faulet0f226952018-10-22 09:29:56 +02004947 goto end;
4948 if (dst.len + 1 > len)
4949 goto end;
4950 dst.ptr[dst.len++] = ' ';
4951
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004952 istcat(&dst, htx_sl_req_vsn(sl), len);
Christopher Faulet0f226952018-10-22 09:29:56 +02004953 end:
4954 return dst.len;
4955}
4956
4957/*
4958 * Print a debug line with a start line.
4959 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004960static void http_debug_stline(const char *dir, struct stream *s, const struct htx_sl *sl)
Christopher Faulet0f226952018-10-22 09:29:56 +02004961{
4962 struct session *sess = strm_sess(s);
4963 int max;
4964
4965 chunk_printf(&trash, "%08x:%s.%s[%04x:%04x]: ", s->uniq_id, s->be->id,
4966 dir,
Willy Tarreau88bc8002021-12-06 07:01:02 +00004967 objt_conn(sess->origin) ? (unsigned short)__objt_conn(sess->origin)->handle.fd : -1,
Willy Tarreaufd9417b2022-05-18 16:23:22 +02004968 sc_conn(s->scb) ? (unsigned short)(__sc_conn(s->scb))->handle.fd : -1);
Christopher Faulet0f226952018-10-22 09:29:56 +02004969
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004970 max = HTX_SL_P1_LEN(sl);
Christopher Faulet0f226952018-10-22 09:29:56 +02004971 UBOUND(max, trash.size - trash.data - 3);
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004972 chunk_memcat(&trash, HTX_SL_P1_PTR(sl), max);
Christopher Faulet0f226952018-10-22 09:29:56 +02004973 trash.area[trash.data++] = ' ';
4974
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004975 max = HTX_SL_P2_LEN(sl);
Christopher Faulet0f226952018-10-22 09:29:56 +02004976 UBOUND(max, trash.size - trash.data - 2);
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004977 chunk_memcat(&trash, HTX_SL_P2_PTR(sl), max);
Christopher Faulet0f226952018-10-22 09:29:56 +02004978 trash.area[trash.data++] = ' ';
4979
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004980 max = HTX_SL_P3_LEN(sl);
Christopher Faulet0f226952018-10-22 09:29:56 +02004981 UBOUND(max, trash.size - trash.data - 1);
Christopher Fauletf1ba18d2018-11-26 21:37:08 +01004982 chunk_memcat(&trash, HTX_SL_P3_PTR(sl), max);
Christopher Faulet0f226952018-10-22 09:29:56 +02004983 trash.area[trash.data++] = '\n';
4984
Willy Tarreau2e8ab6b2020-03-14 11:03:20 +01004985 DISGUISE(write(1, trash.area, trash.data));
Christopher Faulet0f226952018-10-22 09:29:56 +02004986}
4987
4988/*
4989 * Print a debug line with a header.
4990 */
Christopher Fauletfc9cfe42019-07-16 14:54:53 +02004991static void http_debug_hdr(const char *dir, struct stream *s, const struct ist n, const struct ist v)
Christopher Faulet0f226952018-10-22 09:29:56 +02004992{
4993 struct session *sess = strm_sess(s);
4994 int max;
4995
4996 chunk_printf(&trash, "%08x:%s.%s[%04x:%04x]: ", s->uniq_id, s->be->id,
4997 dir,
Willy Tarreau88bc8002021-12-06 07:01:02 +00004998 objt_conn(sess->origin) ? (unsigned short)__objt_conn(sess->origin)->handle.fd : -1,
Willy Tarreaufd9417b2022-05-18 16:23:22 +02004999 sc_conn(s->scb) ? (unsigned short)(__sc_conn(s->scb))->handle.fd : -1);
Christopher Faulet0f226952018-10-22 09:29:56 +02005000
5001 max = n.len;
5002 UBOUND(max, trash.size - trash.data - 3);
5003 chunk_memcat(&trash, n.ptr, max);
5004 trash.area[trash.data++] = ':';
5005 trash.area[trash.data++] = ' ';
5006
5007 max = v.len;
5008 UBOUND(max, trash.size - trash.data - 1);
5009 chunk_memcat(&trash, v.ptr, max);
5010 trash.area[trash.data++] = '\n';
5011
Willy Tarreau2e8ab6b2020-03-14 11:03:20 +01005012 DISGUISE(write(1, trash.area, trash.data));
Christopher Faulet0f226952018-10-22 09:29:56 +02005013}
5014
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005015void http_txn_reset_req(struct http_txn *txn)
5016{
Christopher Faulet1aea50e2020-01-17 16:03:53 +01005017 txn->req.flags = 0;
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005018 txn->req.msg_state = HTTP_MSG_RQBEFORE; /* at the very beginning of the request */
5019}
5020
5021void http_txn_reset_res(struct http_txn *txn)
5022{
Christopher Faulet1aea50e2020-01-17 16:03:53 +01005023 txn->rsp.flags = 0;
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005024 txn->rsp.msg_state = HTTP_MSG_RPBEFORE; /* at the very beginning of the response */
5025}
5026
5027/*
Christopher Faulet75f619a2021-03-08 19:12:58 +01005028 * Create and initialize a new HTTP transaction for stream <s>. This should be
5029 * used before processing any new request. It returns the transaction or NLULL
5030 * on error.
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005031 */
Christopher Faulet75f619a2021-03-08 19:12:58 +01005032struct http_txn *http_create_txn(struct stream *s)
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005033{
Christopher Faulet75f619a2021-03-08 19:12:58 +01005034 struct http_txn *txn;
Willy Tarreaub49672d2022-05-27 10:13:37 +02005035 struct stconn *sc = s->scf;
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005036
Christopher Faulet75f619a2021-03-08 19:12:58 +01005037 txn = pool_alloc(pool_head_http_txn);
5038 if (!txn)
5039 return NULL;
5040 s->txn = txn;
5041
Christopher Faulet5eb67f52022-06-22 17:12:05 +02005042 txn->meth = HTTP_METH_OTHER;
Willy Tarreaub49672d2022-05-27 10:13:37 +02005043 txn->flags = ((sc && sc_ep_test(sc, SE_FL_NOT_FIRST)) ? TX_NOT_FIRST : 0);
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005044 txn->status = -1;
Christopher Faulet5cb513a2020-05-13 17:56:56 +02005045 txn->http_reply = NULL;
Christopher Faulete05bf9e2022-03-29 15:23:40 +02005046 txn->l7_buffer = BUF_NULL;
Willy Tarreau8b507582020-02-25 09:35:07 +01005047 write_u32(txn->cache_hash, 0);
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005048
5049 txn->cookie_first_date = 0;
5050 txn->cookie_last_date = 0;
5051
5052 txn->srv_cookie = NULL;
5053 txn->cli_cookie = NULL;
5054 txn->uri = NULL;
5055
5056 http_txn_reset_req(txn);
5057 http_txn_reset_res(txn);
5058
5059 txn->req.chn = &s->req;
5060 txn->rsp.chn = &s->res;
5061
5062 txn->auth.method = HTTP_AUTH_UNKNOWN;
5063
Aurelien DARRAGON5ad2b642022-11-18 09:17:29 +01005064 /* here we don't want to re-initialize s->vars_txn and s->vars_reqres
5065 * variable lists, because they were already initialized upon stream
5066 * creation in stream_new(), and thus may already contain some variables
5067 */
Christopher Faulet75f619a2021-03-08 19:12:58 +01005068
5069 return txn;
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005070}
5071
5072/* to be used at the end of a transaction */
Christopher Faulet75f619a2021-03-08 19:12:58 +01005073void http_destroy_txn(struct stream *s)
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005074{
5075 struct http_txn *txn = s->txn;
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005076
5077 /* these ones will have been dynamically allocated */
5078 pool_free(pool_head_requri, txn->uri);
5079 pool_free(pool_head_capture, txn->cli_cookie);
5080 pool_free(pool_head_capture, txn->srv_cookie);
Tim Duesterhusa17e6622020-03-05 20:19:02 +01005081 pool_free(pool_head_uniqueid, s->unique_id.ptr);
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005082
Tim Duesterhusa17e6622020-03-05 20:19:02 +01005083 s->unique_id = IST_NULL;
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005084 txn->uri = NULL;
5085 txn->srv_cookie = NULL;
5086 txn->cli_cookie = NULL;
5087
Christopher Faulet59399252019-11-07 14:27:52 +01005088 if (!LIST_ISEMPTY(&s->vars_txn.head))
5089 vars_prune(&s->vars_txn, s->sess, s);
5090 if (!LIST_ISEMPTY(&s->vars_reqres.head))
5091 vars_prune(&s->vars_reqres, s->sess, s);
Christopher Faulet75f619a2021-03-08 19:12:58 +01005092
Christopher Faulete05bf9e2022-03-29 15:23:40 +02005093 b_free(&txn->l7_buffer);
5094
Christopher Faulet75f619a2021-03-08 19:12:58 +01005095 pool_free(pool_head_http_txn, txn);
5096 s->txn = NULL;
Christopher Faulet59399252019-11-07 14:27:52 +01005097}
5098
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005099
Christopher Faulet71236de2023-01-13 09:06:38 +01005100void http_set_term_flags(struct stream *s)
5101{
5102 if (!(s->flags & SF_ERR_MASK))
5103 s->flags |= SF_ERR_PRXCOND;
5104
5105 if (!(s->flags & SF_FINST_MASK)) {
5106 if (s->scb->state == SC_ST_INI) {
5107 /* Before any connection attempt on the server side, we
5108 * are still in the request analysis. Just take case to
5109 * detect tarpit error
5110 */
5111 if (s->req.analysers & AN_REQ_HTTP_TARPIT)
5112 s->flags |= SF_FINST_T;
5113 else
5114 s->flags |= SF_FINST_R;
5115 }
5116 else if (s->scb->state == SC_ST_QUE)
5117 s->flags |= SF_FINST_Q;
5118 else if (sc_state_in(s->scb->state, SC_SB_REQ|SC_SB_TAR|SC_SB_ASS|SC_SB_CON|SC_SB_CER|SC_SB_RDY)) {
5119 if (unlikely(objt_applet(s->target))) {
5120 s->flags |= SF_FINST_R;
5121 }
5122 else
5123 s->flags |= SF_FINST_C;
5124 }
5125 else {
5126 if (s->txn->rsp.msg_state < HTTP_MSG_DATA) {
5127 /* We are still processing the response headers */
5128 s->flags |= SF_FINST_H;
5129 }
Christopher Faulet5b74f992023-01-26 19:02:07 +01005130 // (res == (done|closing|closed)) & (res->flags & shutw)
5131 else if (s->txn->rsp.msg_state >= HTTP_MSG_DONE && s->txn->rsp.msg_state < HTTP_MSG_TUNNEL &&
Christopher Faulet71236de2023-01-13 09:06:38 +01005132 (s->flags & (SF_ERR_CLITO|SF_ERR_CLICL))) {
5133 /* A client error was reported and we are
5134 * transmitting the last block of data
5135 */
5136 s->flags |= SF_FINST_L;
5137 }
5138 else {
5139 /* Otherwise we are in DATA phase on both sides */
5140 s->flags |= SF_FINST_D;
5141 }
5142 }
5143 }
5144}
5145
5146
/* Memory pool named "http_txn", sized for one struct http_txn per entry. It is
 * the pool http_create_txn() allocates from and http_destroy_txn() frees to.
 */
Christopher Fauleta8a46e22019-07-16 14:53:09 +02005147DECLARE_POOL(pool_head_http_txn, "http_txn", sizeof(struct http_txn));
Christopher Faulet0f226952018-10-22 09:29:56 +02005148
Christopher Fauletf4eb75d2018-10-11 15:55:07 +02005149/*
5150 * Local variables:
5151 * c-indent-level: 8
5152 * c-basic-offset: 8
5153 * End:
5154 */