blob: 1edc7256180ee96f7a937e73d9def55b45692aa3 [file] [log] [blame]
Willy Tarreaubaaee002006-06-26 02:48:02 +02001/*
Willy Tarreau81f9aa32010-06-01 17:45:26 +02002 * Session management functions.
Willy Tarreaubaaee002006-06-26 02:48:02 +02003 *
Willy Tarreau81f9aa32010-06-01 17:45:26 +02004 * Copyright 2000-2010 Willy Tarreau <w@1wt.eu>
Willy Tarreaubaaee002006-06-26 02:48:02 +02005 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
13#include <stdlib.h>
Willy Tarreau81f9aa32010-06-01 17:45:26 +020014#include <unistd.h>
15#include <fcntl.h>
Willy Tarreaue3ba5f02006-06-29 18:54:54 +020016
17#include <common/config.h>
Willy Tarreau7c669d72008-06-20 15:04:11 +020018#include <common/debug.h>
Willy Tarreau2dd0d472006-06-29 17:53:05 +020019#include <common/memory.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020020
Willy Tarreaubaaee002006-06-26 02:48:02 +020021#include <types/capture.h>
Willy Tarreau55a8d0e2008-11-30 18:47:21 +010022#include <types/global.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020023
Willy Tarreau1d0dfb12009-07-07 15:10:31 +020024#include <proto/acl.h>
Willy Tarreau55a8d0e2008-11-30 18:47:21 +010025#include <proto/backend.h>
Willy Tarreau7341d942007-05-13 19:56:02 +020026#include <proto/buffers.h>
Krzysztof Piotr Oledzki97f07b82009-12-15 22:31:24 +010027#include <proto/checks.h>
Willy Tarreau5ca791d2009-08-16 19:06:42 +020028#include <proto/dumpstats.h>
Willy Tarreau8d5d7f22007-01-21 19:16:41 +010029#include <proto/hdr_idx.h>
Willy Tarreau332f8bf2007-05-13 21:36:56 +020030#include <proto/log.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020031#include <proto/session.h>
Willy Tarreau3eba98a2009-01-25 13:56:13 +010032#include <proto/pipe.h>
Willy Tarreau55a8d0e2008-11-30 18:47:21 +010033#include <proto/proto_http.h>
34#include <proto/proto_tcp.h>
Willy Tarreau1d0dfb12009-07-07 15:10:31 +020035#include <proto/proxy.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020036#include <proto/queue.h>
Willy Tarreau7f062c42009-03-05 18:43:00 +010037#include <proto/server.h>
Emeric Brun1d33b292010-01-04 15:47:17 +010038#include <proto/stick_table.h>
Willy Tarreau55a8d0e2008-11-30 18:47:21 +010039#include <proto/stream_interface.h>
40#include <proto/stream_sock.h>
41#include <proto/task.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020042
/* Memory pool from which every struct session is allocated; it is created
 * by init_session() and used by session_accept() / session_free().
 */
struct pool_head *pool2_session;
/* List of all sessions currently allocated: session_accept() appends each
 * new session to it and session_free() unlinks it.
 */
struct list sessions;
Willy Tarreaubaaee002006-06-26 02:48:02 +020045
Willy Tarreau81f9aa32010-06-01 17:45:26 +020046/* This function is called from the protocol layer accept() in order to instanciate
47 * a new session on behalf of a given listener and frontend. It returns a positive
48 * value upon success, 0 if the connection needs to be closed and ignored, or a
49 * negative value upon critical failure.
50 */
51int session_accept(struct listener *l, int cfd, struct sockaddr_storage *addr)
52{
53 struct proxy *p = l->frontend;
54 struct session *s;
55 struct http_txn *txn;
56 struct task *t;
57
58 if (unlikely((s = pool_alloc2(pool2_session)) == NULL)) {
59 Alert("out of memory in event_accept().\n");
60 goto out_close;
61 }
62
63 /* minimum session initialization required for monitor mode below */
64 s->flags = 0;
65 s->logs.logwait = p->to_log;
66
67 /* if this session comes from a known monitoring system, we want to ignore
68 * it as soon as possible, which means closing it immediately for TCP, but
69 * cleanly.
70 */
71 if (unlikely((l->options & LI_O_CHK_MONNET) &&
72 addr->ss_family == AF_INET &&
73 (((struct sockaddr_in *)addr)->sin_addr.s_addr & p->mon_mask.s_addr) == p->mon_net.s_addr)) {
74 if (p->mode == PR_MODE_TCP) {
75 pool_free2(pool2_session, s);
76 return 0;
77 }
78 s->flags |= SN_MONITOR;
79 s->logs.logwait = 0;
80 }
81
82 /* OK, we're keeping the session, so let's properly initialize the session */
83 LIST_ADDQ(&sessions, &s->list);
84 LIST_INIT(&s->back_refs);
85
86 if (unlikely((t = task_new()) == NULL)) { /* disable this proxy for a while */
87 Alert("out of memory in event_accept().\n");
88 goto out_free_session;
89 }
90
91 s->term_trace = 0;
92 s->cli_addr = *addr;
93 s->logs.accept_date = date; /* user-visible date for logging */
94 s->logs.tv_accept = now; /* corrected date for internal use */
95 s->uniq_id = totalconn;
Willy Tarreau24dcaf32010-06-05 10:49:41 +020096 p->feconn++; /* beconn will be increased once assigned */
97
Willy Tarreaub36b4242010-06-04 20:59:39 +020098 proxy_inc_fe_conn_ctr(l, p); /* note: cum_beconn will be increased once assigned */
Willy Tarreau81f9aa32010-06-01 17:45:26 +020099
100 t->process = l->handler;
101 t->context = s;
102 t->nice = l->nice;
103 t->expire = TICK_ETERNITY;
104
105 s->task = t;
106 s->listener = l;
107
108 /* Note: initially, the session's backend points to the frontend.
109 * This changes later when switching rules are executed or
110 * when the default backend is assigned.
111 */
112 s->be = s->fe = p;
113 s->req = s->rep = NULL; /* will be allocated later */
114
115 /* now evaluate the tcp-request layer4 rules. Since we expect to be able
116 * to abort right here as soon as possible, we check the rules before
117 * even initializing the stream interfaces.
118 */
119 if ((l->options & LI_O_TCP_RULES) && !tcp_exec_req_rules(s)) {
120 task_free(t);
121 LIST_DEL(&s->list);
122 pool_free2(pool2_session, s);
123 /* let's do a no-linger now to close with a single RST. */
124 setsockopt(cfd, SOL_SOCKET, SO_LINGER, (struct linger *) &nolinger, sizeof(struct linger));
Willy Tarreau24dcaf32010-06-05 10:49:41 +0200125 p->feconn--;
Willy Tarreau81f9aa32010-06-01 17:45:26 +0200126 return 0;
127 }
128
Willy Tarreaub36b4242010-06-04 20:59:39 +0200129 /* This session was accepted, count it now */
Willy Tarreau24dcaf32010-06-05 10:49:41 +0200130 if (p->feconn > p->counters.feconn_max)
131 p->counters.feconn_max = p->feconn;
Willy Tarreaub36b4242010-06-04 20:59:39 +0200132 proxy_inc_fe_sess_ctr(l, p);
133
Willy Tarreau81f9aa32010-06-01 17:45:26 +0200134 /* this part should be common with other protocols */
135 s->si[0].fd = cfd;
136 s->si[0].owner = t;
137 s->si[0].state = s->si[0].prev_state = SI_ST_EST;
138 s->si[0].err_type = SI_ET_NONE;
139 s->si[0].err_loc = NULL;
140 s->si[0].connect = NULL;
141 s->si[0].iohandler = NULL;
142 s->si[0].exp = TICK_ETERNITY;
143 s->si[0].flags = SI_FL_NONE;
144
145 if (likely(s->fe->options2 & PR_O2_INDEPSTR))
146 s->si[0].flags |= SI_FL_INDEP_STR;
147
148 if (addr->ss_family == AF_INET || addr->ss_family == AF_INET6)
149 s->si[0].flags = SI_FL_CAP_SPLTCP; /* TCP/TCPv6 splicing possible */
150
151 /* add the various callbacks */
152 stream_sock_prepare_interface(&s->si[0]);
153
154 /* pre-initialize the other side's stream interface to an INIT state. The
155 * callbacks will be initialized before attempting to connect.
156 */
157 s->si[1].fd = -1; /* just to help with debugging */
158 s->si[1].owner = t;
159 s->si[1].state = s->si[1].prev_state = SI_ST_INI;
160 s->si[1].err_type = SI_ET_NONE;
161 s->si[1].err_loc = NULL;
162 s->si[1].connect = NULL;
163 s->si[1].iohandler = NULL;
164 s->si[1].shutr = stream_int_shutr;
165 s->si[1].shutw = stream_int_shutw;
166 s->si[1].exp = TICK_ETERNITY;
167 s->si[1].flags = SI_FL_NONE;
168
169 if (likely(s->fe->options2 & PR_O2_INDEPSTR))
170 s->si[1].flags |= SI_FL_INDEP_STR;
171
172 s->srv = s->prev_srv = s->srv_conn = NULL;
173 s->pend_pos = NULL;
174
175 /* init store persistence */
176 s->store_count = 0;
177
178 /* Adjust some socket options */
179 if (unlikely(fcntl(cfd, F_SETFL, O_NONBLOCK) == -1)) {
180 Alert("accept(): cannot set the socket in non blocking mode. Giving up\n");
181 goto out_free_task;
182 }
183
184 txn = &s->txn;
185 /* Those variables will be checked and freed if non-NULL in
186 * session.c:session_free(). It is important that they are
187 * properly initialized.
188 */
189 txn->sessid = NULL;
190 txn->srv_cookie = NULL;
191 txn->cli_cookie = NULL;
192 txn->uri = NULL;
193 txn->req.cap = NULL;
194 txn->rsp.cap = NULL;
195 txn->hdr_idx.v = NULL;
196 txn->hdr_idx.size = txn->hdr_idx.used = 0;
197
198 if (unlikely((s->req = pool_alloc2(pool2_buffer)) == NULL))
199 goto out_free_task; /* no memory */
200
201 if (unlikely((s->rep = pool_alloc2(pool2_buffer)) == NULL))
202 goto out_free_req; /* no memory */
203
204 /* initialize the request buffer */
205 s->req->size = global.tune.bufsize;
206 buffer_init(s->req);
207 s->req->prod = &s->si[0];
208 s->req->cons = &s->si[1];
209 s->si[0].ib = s->si[1].ob = s->req;
210 s->req->flags |= BF_READ_ATTACHED; /* the producer is already connected */
211
212 /* activate default analysers enabled for this listener */
213 s->req->analysers = l->analysers;
214
215 s->req->wto = TICK_ETERNITY;
216 s->req->rto = TICK_ETERNITY;
217 s->req->rex = TICK_ETERNITY;
218 s->req->wex = TICK_ETERNITY;
219 s->req->analyse_exp = TICK_ETERNITY;
220
221 /* initialize response buffer */
222 s->rep->size = global.tune.bufsize;
223 buffer_init(s->rep);
224 s->rep->prod = &s->si[1];
225 s->rep->cons = &s->si[0];
226 s->si[0].ob = s->si[1].ib = s->rep;
227 s->rep->analysers = 0;
228
229 s->rep->rto = TICK_ETERNITY;
230 s->rep->wto = TICK_ETERNITY;
231 s->rep->rex = TICK_ETERNITY;
232 s->rep->wex = TICK_ETERNITY;
233 s->rep->analyse_exp = TICK_ETERNITY;
234
235 /* finish initialization of the accepted file descriptor */
236 fd_insert(cfd);
237 fdtab[cfd].owner = &s->si[0];
238 fdtab[cfd].state = FD_STREADY;
239 fdtab[cfd].flags = 0;
240 fdtab[cfd].cb[DIR_RD].f = l->proto->read;
241 fdtab[cfd].cb[DIR_RD].b = s->req;
242 fdtab[cfd].cb[DIR_WR].f = l->proto->write;
243 fdtab[cfd].cb[DIR_WR].b = s->rep;
244 fdinfo[cfd].peeraddr = (struct sockaddr *)&s->cli_addr;
245 fdinfo[cfd].peerlen = sizeof(s->cli_addr);
246 EV_FD_SET(cfd, DIR_RD);
247
248 if (p->accept) {
249 int ret = p->accept(s);
250 if (unlikely(ret < 0))
251 goto out_free_rep;
252
253 if (unlikely(ret == 0)) {
254 /* work is finished, we can release everything (eg: monitoring) */
255 pool_free2(pool2_buffer, s->rep);
256 pool_free2(pool2_buffer, s->req);
257 task_free(t);
258 LIST_DEL(&s->list);
259 pool_free2(pool2_session, s);
Willy Tarreau24dcaf32010-06-05 10:49:41 +0200260 p->feconn--;
Willy Tarreau81f9aa32010-06-01 17:45:26 +0200261 return 0;
262 }
263 }
264
265 /* it is important not to call the wakeup function directly but to
266 * pass through task_wakeup(), because this one knows how to apply
267 * priorities to tasks.
268 */
269 task_wakeup(t, TASK_WOKEN_INIT);
270 return 1;
271
272 /* Error unrolling */
273 out_free_rep:
274 pool_free2(pool2_buffer, s->rep);
275 out_free_req:
276 pool_free2(pool2_buffer, s->req);
277 out_free_task:
Willy Tarreau24dcaf32010-06-05 10:49:41 +0200278 p->feconn--;
Willy Tarreau81f9aa32010-06-01 17:45:26 +0200279 task_free(t);
280 out_free_session:
281 LIST_DEL(&s->list);
282 pool_free2(pool2_session, s);
283 out_close:
284 return -1;
285}
286
Willy Tarreaubaaee002006-06-26 02:48:02 +0200287/*
288 * frees the context associated to a session. It must have been removed first.
289 */
290void session_free(struct session *s)
291{
Willy Tarreau4dbc4a22007-03-03 16:23:22 +0100292 struct http_txn *txn = &s->txn;
Willy Tarreau632f5a72007-07-11 10:42:35 +0200293 struct proxy *fe = s->fe;
Willy Tarreau62e4f1d2008-12-07 20:16:23 +0100294 struct bref *bref, *back;
Willy Tarreaua4cda672010-06-06 18:28:49 +0200295 int i;
Willy Tarreau0f7562b2007-01-07 15:46:13 +0100296
Willy Tarreaubaaee002006-06-26 02:48:02 +0200297 if (s->pend_pos)
298 pendconn_free(s->pend_pos);
Willy Tarreau922a8062008-12-04 09:33:58 +0100299
Willy Tarreau1e62de62008-11-11 20:20:02 +0100300 if (s->srv) { /* there may be requests left pending in queue */
301 if (s->flags & SN_CURR_SESS) {
302 s->flags &= ~SN_CURR_SESS;
303 s->srv->cur_sess--;
304 }
Willy Tarreau922a8062008-12-04 09:33:58 +0100305 if (may_dequeue_tasks(s->srv, s->be))
306 process_srv_queue(s->srv);
Willy Tarreau1e62de62008-11-11 20:20:02 +0100307 }
Willy Tarreau922a8062008-12-04 09:33:58 +0100308
Willy Tarreau7c669d72008-06-20 15:04:11 +0200309 if (unlikely(s->srv_conn)) {
310 /* the session still has a reserved slot on a server, but
311 * it should normally be only the same as the one above,
312 * so this should not happen in fact.
313 */
314 sess_change_server(s, NULL);
315 }
316
Willy Tarreau3eba98a2009-01-25 13:56:13 +0100317 if (s->req->pipe)
318 put_pipe(s->req->pipe);
Willy Tarreau259de1b2009-01-18 21:56:21 +0100319
Willy Tarreau3eba98a2009-01-25 13:56:13 +0100320 if (s->rep->pipe)
321 put_pipe(s->rep->pipe);
Willy Tarreau259de1b2009-01-18 21:56:21 +0100322
Willy Tarreau48d63db2008-08-03 17:41:33 +0200323 pool_free2(pool2_buffer, s->req);
324 pool_free2(pool2_buffer, s->rep);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200325
Willy Tarreau46023632010-01-07 22:51:47 +0100326 http_end_txn(s);
327
Willy Tarreaua4cda672010-06-06 18:28:49 +0200328 for (i = 0; i < s->store_count; i++) {
329 if (!s->store[i].ts)
330 continue;
331 stksess_free(s->store[i].table, s->store[i].ts);
332 s->store[i].ts = NULL;
333 }
334
Willy Tarreau92fb9832007-10-16 17:34:28 +0200335 if (fe) {
Willy Tarreau48d63db2008-08-03 17:41:33 +0200336 pool_free2(fe->hdr_idx_pool, txn->hdr_idx.v);
Willy Tarreau46023632010-01-07 22:51:47 +0100337 pool_free2(fe->rsp_cap_pool, txn->rsp.cap);
338 pool_free2(fe->req_cap_pool, txn->req.cap);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200339 }
Willy Tarreau0937bc42009-12-22 15:03:09 +0100340
Willy Tarreau62e4f1d2008-12-07 20:16:23 +0100341 list_for_each_entry_safe(bref, back, &s->back_refs, users) {
Willy Tarreaufd3828e2009-02-22 15:17:24 +0100342 /* we have to unlink all watchers. We must not relink them if
343 * this session was the last one in the list.
344 */
Willy Tarreau62e4f1d2008-12-07 20:16:23 +0100345 LIST_DEL(&bref->users);
Willy Tarreaufd3828e2009-02-22 15:17:24 +0100346 LIST_INIT(&bref->users);
347 if (s->list.n != &sessions)
348 LIST_ADDQ(&LIST_ELEM(s->list.n, struct session *, list)->back_refs, &bref->users);
Willy Tarreau62e4f1d2008-12-07 20:16:23 +0100349 bref->ref = s->list.n;
350 }
Willy Tarreauf54f8bd2008-11-23 19:53:55 +0100351 LIST_DEL(&s->list);
Willy Tarreauc6ca1a02007-05-13 19:43:47 +0200352 pool_free2(pool2_session, s);
Willy Tarreau632f5a72007-07-11 10:42:35 +0200353
354 /* We may want to free the maximum amount of pools if the proxy is stopping */
Willy Tarreau92fb9832007-10-16 17:34:28 +0200355 if (fe && unlikely(fe->state == PR_STSTOPPED)) {
Willy Tarreau48d63db2008-08-03 17:41:33 +0200356 pool_flush2(pool2_buffer);
357 pool_flush2(fe->hdr_idx_pool);
358 pool_flush2(pool2_requri);
359 pool_flush2(pool2_capture);
360 pool_flush2(pool2_session);
361 pool_flush2(fe->req_cap_pool);
362 pool_flush2(fe->rsp_cap_pool);
Willy Tarreau632f5a72007-07-11 10:42:35 +0200363 }
Willy Tarreauc6ca1a02007-05-13 19:43:47 +0200364}
365
366
367/* perform minimal intializations, report 0 in case of error, 1 if OK. */
368int init_session()
369{
Willy Tarreauf54f8bd2008-11-23 19:53:55 +0100370 LIST_INIT(&sessions);
Willy Tarreauc6ca1a02007-05-13 19:43:47 +0200371 pool2_session = create_pool("session", sizeof(struct session), MEM_F_SHARED);
372 return pool2_session != NULL;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200373}
374
Willy Tarreau30e71012007-11-26 20:15:35 +0100375void session_process_counters(struct session *s)
376{
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100377 unsigned long long bytes;
378
Willy Tarreau30e71012007-11-26 20:15:35 +0100379 if (s->req) {
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100380 bytes = s->req->total - s->logs.bytes_in;
Willy Tarreau30e71012007-11-26 20:15:35 +0100381 s->logs.bytes_in = s->req->total;
382 if (bytes) {
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200383 s->fe->counters.bytes_in += bytes;
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100384
Willy Tarreau30e71012007-11-26 20:15:35 +0100385 if (s->be != s->fe)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200386 s->be->counters.bytes_in += bytes;
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100387
Willy Tarreau30e71012007-11-26 20:15:35 +0100388 if (s->srv)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200389 s->srv->counters.bytes_in += bytes;
Krzysztof Piotr Oledzkiaeebf9b2009-10-04 15:43:17 +0200390
391 if (s->listener->counters)
392 s->listener->counters->bytes_in += bytes;
Willy Tarreau30e71012007-11-26 20:15:35 +0100393 }
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100394 }
395
Willy Tarreau30e71012007-11-26 20:15:35 +0100396 if (s->rep) {
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100397 bytes = s->rep->total - s->logs.bytes_out;
Willy Tarreau30e71012007-11-26 20:15:35 +0100398 s->logs.bytes_out = s->rep->total;
399 if (bytes) {
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200400 s->fe->counters.bytes_out += bytes;
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100401
Willy Tarreau30e71012007-11-26 20:15:35 +0100402 if (s->be != s->fe)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200403 s->be->counters.bytes_out += bytes;
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100404
Willy Tarreau30e71012007-11-26 20:15:35 +0100405 if (s->srv)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200406 s->srv->counters.bytes_out += bytes;
Krzysztof Piotr Oledzkiaeebf9b2009-10-04 15:43:17 +0200407
408 if (s->listener->counters)
409 s->listener->counters->bytes_out += bytes;
Willy Tarreau30e71012007-11-26 20:15:35 +0100410 }
Krzysztof Piotr Oledzki583bc962007-11-24 22:12:47 +0100411 }
412}
Willy Tarreaubaaee002006-06-26 02:48:02 +0200413
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100414/* This function is called with (si->state == SI_ST_CON) meaning that a
415 * connection was attempted and that the file descriptor is already allocated.
416 * We must check for establishment, error and abort. Possible output states
417 * are SI_ST_EST (established), SI_ST_CER (error), SI_ST_DIS (abort), and
418 * SI_ST_CON (no change). The function returns 0 if it switches to SI_ST_CER,
419 * otherwise 1.
420 */
421int sess_update_st_con_tcp(struct session *s, struct stream_interface *si)
422{
423 struct buffer *req = si->ob;
424 struct buffer *rep = si->ib;
425
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100426 /* If we got an error, or if nothing happened and the connection timed
427 * out, we must give up. The CER state handler will take care of retry
428 * attempts and error reports.
429 */
430 if (unlikely(si->flags & (SI_FL_EXP|SI_FL_ERR))) {
Willy Tarreau127334e2009-03-28 10:47:26 +0100431 si->exp = TICK_ETERNITY;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100432 si->state = SI_ST_CER;
Willy Tarreaudc340a92009-06-28 23:10:19 +0200433 si->flags &= ~SI_FL_CAP_SPLICE;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100434 fd_delete(si->fd);
435
436 if (si->err_type)
437 return 0;
438
439 si->err_loc = s->srv;
440 if (si->flags & SI_FL_ERR)
441 si->err_type = SI_ET_CONN_ERR;
442 else
443 si->err_type = SI_ET_CONN_TO;
444 return 0;
445 }
446
447 /* OK, maybe we want to abort */
Willy Tarreau418fd472009-09-06 21:37:23 +0200448 if (unlikely((rep->flags & BF_SHUTW) ||
449 ((req->flags & BF_SHUTW_NOW) && /* FIXME: this should not prevent a connection from establishing */
Willy Tarreauba0b63d2009-09-20 08:09:44 +0200450 (((req->flags & (BF_OUT_EMPTY|BF_WRITE_ACTIVITY)) == BF_OUT_EMPTY) ||
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100451 s->be->options & PR_O_ABRT_CLOSE)))) {
452 /* give up */
453 si->shutw(si);
454 si->err_type |= SI_ET_CONN_ABRT;
455 si->err_loc = s->srv;
Willy Tarreaudc340a92009-06-28 23:10:19 +0200456 si->flags &= ~SI_FL_CAP_SPLICE;
Willy Tarreau84455332009-03-15 22:34:05 +0100457 if (s->srv_error)
458 s->srv_error(s, si);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100459 return 1;
460 }
461
462 /* we need to wait a bit more if there was no activity either */
463 if (!(req->flags & BF_WRITE_ACTIVITY))
464 return 1;
465
466 /* OK, this means that a connection succeeded. The caller will be
467 * responsible for handling the transition from CON to EST.
468 */
469 s->logs.t_connect = tv_ms_elapsed(&s->logs.tv_accept, &now);
Willy Tarreau127334e2009-03-28 10:47:26 +0100470 si->exp = TICK_ETERNITY;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100471 si->state = SI_ST_EST;
472 si->err_type = SI_ET_NONE;
473 si->err_loc = NULL;
474 return 1;
475}
476
477/* This function is called with (si->state == SI_ST_CER) meaning that a
478 * previous connection attempt has failed and that the file descriptor
479 * has already been released. Possible causes include asynchronous error
480 * notification and time out. Possible output states are SI_ST_CLO when
481 * retries are exhausted, SI_ST_TAR when a delay is wanted before a new
482 * connection attempt, SI_ST_ASS when it's wise to retry on the same server,
483 * and SI_ST_REQ when an immediate redispatch is wanted. The buffers are
484 * marked as in error state. It returns 0.
485 */
486int sess_update_st_cer(struct session *s, struct stream_interface *si)
487{
488 /* we probably have to release last session from the server */
489 if (s->srv) {
Krzysztof Piotr Oledzki97f07b82009-12-15 22:31:24 +0100490 health_adjust(s->srv, HANA_STATUS_L4_ERR);
491
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100492 if (s->flags & SN_CURR_SESS) {
493 s->flags &= ~SN_CURR_SESS;
494 s->srv->cur_sess--;
495 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100496 }
497
498 /* ensure that we have enough retries left */
Willy Tarreauee28de02010-06-01 09:51:00 +0200499 si->conn_retries--;
500 if (si->conn_retries < 0) {
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100501 if (!si->err_type) {
502 si->err_type = SI_ET_CONN_ERR;
503 si->err_loc = s->srv;
504 }
505
506 if (s->srv)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200507 s->srv->counters.failed_conns++;
508 s->be->counters.failed_conns++;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100509 if (may_dequeue_tasks(s->srv, s->be))
510 process_srv_queue(s->srv);
511
512 /* shutw is enough so stop a connecting socket */
513 si->shutw(si);
514 si->ob->flags |= BF_WRITE_ERROR;
515 si->ib->flags |= BF_READ_ERROR;
516
517 si->state = SI_ST_CLO;
Willy Tarreau0cac36f2008-11-30 20:44:17 +0100518 if (s->srv_error)
519 s->srv_error(s, si);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100520 return 0;
521 }
522
523 /* If the "redispatch" option is set on the backend, we are allowed to
524 * retry on another server for the last retry. In order to achieve this,
525 * we must mark the session unassigned, and eventually clear the DIRECT
526 * bit to ignore any persistence cookie. We won't count a retry nor a
527 * redispatch yet, because this will depend on what server is selected.
528 */
Willy Tarreauee28de02010-06-01 09:51:00 +0200529 if (s->srv && si->conn_retries == 0 &&
Willy Tarreau4de91492010-01-22 19:10:05 +0100530 s->be->options & PR_O_REDISP && !(s->flags & SN_FORCE_PRST)) {
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100531 if (may_dequeue_tasks(s->srv, s->be))
532 process_srv_queue(s->srv);
533
534 s->flags &= ~(SN_DIRECT | SN_ASSIGNED | SN_ADDR_SET);
535 s->prev_srv = s->srv;
536 si->state = SI_ST_REQ;
537 } else {
538 if (s->srv)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200539 s->srv->counters.retries++;
540 s->be->counters.retries++;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100541 si->state = SI_ST_ASS;
542 }
543
544 if (si->flags & SI_FL_ERR) {
545 /* The error was an asynchronous connection error, and we will
546 * likely have to retry connecting to the same server, most
547 * likely leading to the same result. To avoid this, we wait
548 * one second before retrying.
549 */
550
551 if (!si->err_type)
552 si->err_type = SI_ET_CONN_ERR;
553
554 si->state = SI_ST_TAR;
555 si->exp = tick_add(now_ms, MS_TO_TICKS(1000));
556 return 0;
557 }
558 return 0;
559}
560
561/*
562 * This function handles the transition between the SI_ST_CON state and the
Willy Tarreau85e7d002010-05-31 11:57:51 +0200563 * SI_ST_EST state. It must only be called after switching from SI_ST_CON (or
564 * SI_ST_INI) to SI_ST_EST, but only when a ->connect function is defined.
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100565 */
566void sess_establish(struct session *s, struct stream_interface *si)
567{
568 struct buffer *req = si->ob;
569 struct buffer *rep = si->ib;
570
Krzysztof Piotr Oledzki97f07b82009-12-15 22:31:24 +0100571 if (s->srv)
572 health_adjust(s->srv, HANA_STATUS_L4_OK);
573
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100574 if (s->be->mode == PR_MODE_TCP) { /* let's allow immediate data connection in this case */
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100575 /* if the user wants to log as soon as possible, without counting
576 * bytes from the server, then this is the right moment. */
577 if (s->fe->to_log && !(s->logs.logwait & LW_BYTES)) {
578 s->logs.t_close = s->logs.t_connect; /* to get a valid end date */
Willy Tarreaua5555ec2008-11-30 19:02:32 +0100579 s->do_log(s);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100580 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100581 }
582 else {
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100583 s->txn.rsp.msg_state = HTTP_MSG_RPBEFORE;
584 /* reset hdr_idx which was already initialized by the request.
585 * right now, the http parser does it.
586 * hdr_idx_init(&s->txn.hdr_idx);
587 */
588 }
589
Willy Tarreau4e5b8282009-08-16 22:57:50 +0200590 rep->analysers |= s->fe->fe_rsp_ana | s->be->be_rsp_ana;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100591 rep->flags |= BF_READ_ATTACHED; /* producer is now attached */
Willy Tarreaud04e8582010-05-31 12:31:35 +0200592 if (si->connect) {
593 /* real connections have timeouts */
594 req->wto = s->be->timeout.server;
595 rep->rto = s->be->timeout.server;
596 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100597 req->wex = TICK_ETERNITY;
598}
599
600/* Update stream interface status for input states SI_ST_ASS, SI_ST_QUE, SI_ST_TAR.
601 * Other input states are simply ignored.
602 * Possible output states are SI_ST_CLO, SI_ST_TAR, SI_ST_ASS, SI_ST_REQ, SI_ST_CON.
603 * Flags must have previously been updated for timeouts and other conditions.
604 */
605void sess_update_stream_int(struct session *s, struct stream_interface *si)
606{
607 DPRINTF(stderr,"[%u] %s: sess=%p rq=%p, rp=%p, exp(r,w)=%u,%u rqf=%08x rpf=%08x rql=%d rpl=%d cs=%d ss=%d\n",
608 now_ms, __FUNCTION__,
609 s,
610 s->req, s->rep,
611 s->req->rex, s->rep->wex,
612 s->req->flags, s->rep->flags,
613 s->req->l, s->rep->l, s->rep->cons->state, s->req->cons->state);
614
615 if (si->state == SI_ST_ASS) {
616 /* Server assigned to connection request, we have to try to connect now */
617 int conn_err;
618
619 conn_err = connect_server(s);
620 if (conn_err == SN_ERR_NONE) {
621 /* state = SI_ST_CON now */
Willy Tarreau8f6457c2008-12-01 00:08:28 +0100622 if (s->srv)
Willy Tarreau7f062c42009-03-05 18:43:00 +0100623 srv_inc_sess_ctr(s->srv);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100624 return;
625 }
626
627 /* We have received a synchronous error. We might have to
628 * abort, retry immediately or redispatch.
629 */
630 if (conn_err == SN_ERR_INTERNAL) {
631 if (!si->err_type) {
632 si->err_type = SI_ET_CONN_OTHER;
633 si->err_loc = s->srv;
634 }
635
636 if (s->srv)
Willy Tarreau7f062c42009-03-05 18:43:00 +0100637 srv_inc_sess_ctr(s->srv);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100638 if (s->srv)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200639 s->srv->counters.failed_conns++;
640 s->be->counters.failed_conns++;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100641
642 /* release other sessions waiting for this server */
643 if (may_dequeue_tasks(s->srv, s->be))
644 process_srv_queue(s->srv);
645
646 /* Failed and not retryable. */
647 si->shutr(si);
648 si->shutw(si);
649 si->ob->flags |= BF_WRITE_ERROR;
650
651 s->logs.t_queue = tv_ms_elapsed(&s->logs.tv_accept, &now);
652
653 /* no session was ever accounted for this server */
654 si->state = SI_ST_CLO;
Willy Tarreau0cac36f2008-11-30 20:44:17 +0100655 if (s->srv_error)
656 s->srv_error(s, si);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100657 return;
658 }
659
660 /* We are facing a retryable error, but we don't want to run a
661 * turn-around now, as the problem is likely a source port
662 * allocation problem, so we want to retry now.
663 */
664 si->state = SI_ST_CER;
665 si->flags &= ~SI_FL_ERR;
666 sess_update_st_cer(s, si);
667 /* now si->state is one of SI_ST_CLO, SI_ST_TAR, SI_ST_ASS, SI_ST_REQ */
668 return;
669 }
670 else if (si->state == SI_ST_QUE) {
671 /* connection request was queued, check for any update */
672 if (!s->pend_pos) {
673 /* The connection is not in the queue anymore. Either
674 * we have a server connection slot available and we
675 * go directly to the assigned state, or we need to
676 * load-balance first and go to the INI state.
677 */
678 si->exp = TICK_ETERNITY;
679 if (unlikely(!(s->flags & SN_ASSIGNED)))
680 si->state = SI_ST_REQ;
681 else {
682 s->logs.t_queue = tv_ms_elapsed(&s->logs.tv_accept, &now);
683 si->state = SI_ST_ASS;
684 }
685 return;
686 }
687
688 /* Connection request still in queue... */
689 if (si->flags & SI_FL_EXP) {
690 /* ... and timeout expired */
691 si->exp = TICK_ETERNITY;
692 s->logs.t_queue = tv_ms_elapsed(&s->logs.tv_accept, &now);
693 if (s->srv)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +0200694 s->srv->counters.failed_conns++;
695 s->be->counters.failed_conns++;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100696 si->shutr(si);
697 si->shutw(si);
698 si->ob->flags |= BF_WRITE_TIMEOUT;
699 if (!si->err_type)
700 si->err_type = SI_ET_QUEUE_TO;
701 si->state = SI_ST_CLO;
Willy Tarreau0cac36f2008-11-30 20:44:17 +0100702 if (s->srv_error)
703 s->srv_error(s, si);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100704 return;
705 }
706
707 /* Connection remains in queue, check if we have to abort it */
Willy Tarreau418fd472009-09-06 21:37:23 +0200708 if ((si->ob->flags & (BF_READ_ERROR)) ||
709 ((si->ob->flags & BF_SHUTW_NOW) && /* empty and client aborted */
Willy Tarreauba0b63d2009-09-20 08:09:44 +0200710 (si->ob->flags & BF_OUT_EMPTY || s->be->options & PR_O_ABRT_CLOSE))) {
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100711 /* give up */
712 si->exp = TICK_ETERNITY;
713 s->logs.t_queue = tv_ms_elapsed(&s->logs.tv_accept, &now);
714 si->shutr(si);
715 si->shutw(si);
716 si->err_type |= SI_ET_QUEUE_ABRT;
717 si->state = SI_ST_CLO;
Willy Tarreau0cac36f2008-11-30 20:44:17 +0100718 if (s->srv_error)
719 s->srv_error(s, si);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100720 return;
721 }
722
723 /* Nothing changed */
724 return;
725 }
726 else if (si->state == SI_ST_TAR) {
727 /* Connection request might be aborted */
Willy Tarreau418fd472009-09-06 21:37:23 +0200728 if ((si->ob->flags & (BF_READ_ERROR)) ||
729 ((si->ob->flags & BF_SHUTW_NOW) && /* empty and client aborted */
Willy Tarreauba0b63d2009-09-20 08:09:44 +0200730 (si->ob->flags & BF_OUT_EMPTY || s->be->options & PR_O_ABRT_CLOSE))) {
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100731 /* give up */
732 si->exp = TICK_ETERNITY;
733 si->shutr(si);
734 si->shutw(si);
735 si->err_type |= SI_ET_CONN_ABRT;
736 si->state = SI_ST_CLO;
Willy Tarreau0cac36f2008-11-30 20:44:17 +0100737 if (s->srv_error)
738 s->srv_error(s, si);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100739 return;
740 }
741
742 if (!(si->flags & SI_FL_EXP))
743 return; /* still in turn-around */
744
745 si->exp = TICK_ETERNITY;
746
747 /* we keep trying on the same server as long as the session is
748 * marked "assigned".
749 * FIXME: Should we force a redispatch attempt when the server is down ?
750 */
751 if (s->flags & SN_ASSIGNED)
752 si->state = SI_ST_ASS;
753 else
754 si->state = SI_ST_REQ;
755 return;
756 }
757}
758
759/* This function initiates a server connection request on a stream interface
760 * already in SI_ST_REQ state. Upon success, the state goes to SI_ST_ASS,
761 * indicating that a server has been assigned. It may also return SI_ST_QUE,
762 * or SI_ST_CLO upon error.
763 */
764static void sess_prepare_conn_req(struct session *s, struct stream_interface *si) {
765 DPRINTF(stderr,"[%u] %s: sess=%p rq=%p, rp=%p, exp(r,w)=%u,%u rqf=%08x rpf=%08x rql=%d rpl=%d cs=%d ss=%d\n",
766 now_ms, __FUNCTION__,
767 s,
768 s->req, s->rep,
769 s->req->rex, s->rep->wex,
770 s->req->flags, s->rep->flags,
771 s->req->l, s->rep->l, s->rep->cons->state, s->req->cons->state);
772
773 if (si->state != SI_ST_REQ)
774 return;
775
776 /* Try to assign a server */
777 if (srv_redispatch_connect(s) != 0) {
778 /* We did not get a server. Either we queued the
779 * connection request, or we encountered an error.
780 */
781 if (si->state == SI_ST_QUE)
782 return;
783
784 /* we did not get any server, let's check the cause */
785 si->shutr(si);
786 si->shutw(si);
787 si->ob->flags |= BF_WRITE_ERROR;
788 if (!si->err_type)
789 si->err_type = SI_ET_CONN_OTHER;
790 si->state = SI_ST_CLO;
Willy Tarreau0cac36f2008-11-30 20:44:17 +0100791 if (s->srv_error)
792 s->srv_error(s, si);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +0100793 return;
794 }
795
796 /* The server is assigned */
797 s->logs.t_queue = tv_ms_elapsed(&s->logs.tv_accept, &now);
798 si->state = SI_ST_ASS;
799}
800
Willy Tarreau1d0dfb12009-07-07 15:10:31 +0200801/* This stream analyser checks the switching rules and changes the backend
Willy Tarreau4de91492010-01-22 19:10:05 +0100802 * if appropriate. The default_backend rule is also considered, then the
803 * target backend's forced persistence rules are also evaluated last if any.
Willy Tarreau1d0dfb12009-07-07 15:10:31 +0200804 * It returns 1 if the processing can continue on next analysers, or zero if it
805 * either needs more data or wants to immediately abort the request.
806 */
807int process_switching_rules(struct session *s, struct buffer *req, int an_bit)
808{
Cyril Bonté47fdd8e2010-04-25 00:00:51 +0200809 struct persist_rule *prst_rule;
Willy Tarreau4de91492010-01-22 19:10:05 +0100810
Willy Tarreau1d0dfb12009-07-07 15:10:31 +0200811 req->analysers &= ~an_bit;
812 req->analyse_exp = TICK_ETERNITY;
813
814 DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bl=%d analysers=%02x\n",
815 now_ms, __FUNCTION__,
816 s,
817 req,
818 req->rex, req->wex,
819 req->flags,
820 req->l,
821 req->analysers);
822
823 /* now check whether we have some switching rules for this request */
824 if (!(s->flags & SN_BE_ASSIGNED)) {
825 struct switching_rule *rule;
826
827 list_for_each_entry(rule, &s->fe->switching_rules, list) {
828 int ret;
829
830 ret = acl_exec_cond(rule->cond, s->fe, s, &s->txn, ACL_DIR_REQ);
831 ret = acl_pass(ret);
832 if (rule->cond->pol == ACL_COND_UNLESS)
833 ret = !ret;
834
835 if (ret) {
Willy Tarreaubedb9ba2009-07-12 08:27:39 +0200836 if (!session_set_backend(s, rule->be.backend))
837 goto sw_failed;
Willy Tarreau1d0dfb12009-07-07 15:10:31 +0200838 break;
839 }
840 }
841
842 /* To ensure correct connection accounting on the backend, we
843 * have to assign one if it was not set (eg: a listen). This
844 * measure also takes care of correctly setting the default
845 * backend if any.
846 */
847 if (!(s->flags & SN_BE_ASSIGNED))
Willy Tarreaubedb9ba2009-07-12 08:27:39 +0200848 if (!session_set_backend(s, s->fe->defbe.be ? s->fe->defbe.be : s->be))
849 goto sw_failed;
Willy Tarreau1d0dfb12009-07-07 15:10:31 +0200850 }
851
852 /* we don't want to run the HTTP filters again if the backend has not changed */
853 if (s->fe == s->be)
854 s->req->analysers &= ~AN_REQ_HTTP_PROCESS_BE;
855
Cyril Bonté47fdd8e2010-04-25 00:00:51 +0200856 /* as soon as we know the backend, we must check if we have a matching forced or ignored
Willy Tarreau4de91492010-01-22 19:10:05 +0100857 * persistence rule, and report that in the session.
858 */
Cyril Bonté47fdd8e2010-04-25 00:00:51 +0200859 list_for_each_entry(prst_rule, &s->be->persist_rules, list) {
Willy Tarreau4de91492010-01-22 19:10:05 +0100860 int ret = 1;
861
862 if (prst_rule->cond) {
863 ret = acl_exec_cond(prst_rule->cond, s->be, s, &s->txn, ACL_DIR_REQ);
864 ret = acl_pass(ret);
865 if (prst_rule->cond->pol == ACL_COND_UNLESS)
866 ret = !ret;
867 }
868
869 if (ret) {
870 /* no rule, or the rule matches */
Cyril Bonté47fdd8e2010-04-25 00:00:51 +0200871 if (prst_rule->type == PERSIST_TYPE_FORCE) {
872 s->flags |= SN_FORCE_PRST;
873 } else {
874 s->flags |= SN_IGNORE_PRST;
875 }
Willy Tarreau4de91492010-01-22 19:10:05 +0100876 break;
877 }
878 }
879
Willy Tarreau1d0dfb12009-07-07 15:10:31 +0200880 return 1;
Willy Tarreaubedb9ba2009-07-12 08:27:39 +0200881
882 sw_failed:
883 /* immediately abort this request in case of allocation failure */
884 buffer_abort(s->req);
885 buffer_abort(s->rep);
886
887 if (!(s->flags & SN_ERR_MASK))
888 s->flags |= SN_ERR_RESOURCE;
889 if (!(s->flags & SN_FINST_MASK))
890 s->flags |= SN_FINST_R;
891
892 s->txn.status = 500;
893 s->req->analysers = 0;
894 s->req->analyse_exp = TICK_ETERNITY;
895 return 0;
Willy Tarreau1d0dfb12009-07-07 15:10:31 +0200896}
897
Emeric Brun1d33b292010-01-04 15:47:17 +0100898/* This stream analyser works on a request. It applies all sticking rules on
899 * it then returns 1. The data must already be present in the buffer otherwise
900 * they won't match. It always returns 1.
901 */
902int process_sticking_rules(struct session *s, struct buffer *req, int an_bit)
903{
904 struct proxy *px = s->be;
905 struct sticking_rule *rule;
906
907 DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bl=%d analysers=%02x\n",
908 now_ms, __FUNCTION__,
909 s,
910 req,
911 req->rex, req->wex,
912 req->flags,
913 req->l,
914 req->analysers);
915
916 list_for_each_entry(rule, &px->sticking_rules, list) {
917 int ret = 1 ;
918 int i;
919
920 for (i = 0; i < s->store_count; i++) {
921 if (rule->table.t == s->store[i].table)
922 break;
923 }
924
925 if (i != s->store_count)
926 continue;
927
928 if (rule->cond) {
929 ret = acl_exec_cond(rule->cond, px, s, &s->txn, ACL_DIR_REQ);
930 ret = acl_pass(ret);
931 if (rule->cond->pol == ACL_COND_UNLESS)
932 ret = !ret;
933 }
934
935 if (ret) {
936 struct stktable_key *key;
937
Willy Tarreauf0b38bf2010-06-06 13:22:23 +0200938 key = stktable_fetch_key(px, s, &s->txn, PATTERN_FETCH_REQ, rule->expr, rule->table.t->type);
Emeric Brun1d33b292010-01-04 15:47:17 +0100939 if (!key)
940 continue;
941
942 if (rule->flags & STK_IS_MATCH) {
943 struct stksess *ts;
944
Willy Tarreauf16d2b82010-06-06 15:38:59 +0200945 if ((ts = stktable_lookup_key(rule->table.t, key)) != NULL) {
Emeric Brun1d33b292010-01-04 15:47:17 +0100946 if (!(s->flags & SN_ASSIGNED)) {
947 struct eb32_node *node;
Willy Tarreau13c29de2010-06-06 16:40:39 +0200948 void *ptr;
Emeric Brun1d33b292010-01-04 15:47:17 +0100949
950 /* srv found in table */
Willy Tarreau13c29de2010-06-06 16:40:39 +0200951 ptr = stktable_data_ptr(rule->table.t, ts, STKTABLE_DT_SERVER_ID);
952 node = eb32_lookup(&px->conf.used_server_id, stktable_data_cast(ptr, server_id));
Emeric Brun1d33b292010-01-04 15:47:17 +0100953 if (node) {
954 struct server *srv;
955
956 srv = container_of(node, struct server, conf.id);
Willy Tarreau4de91492010-01-22 19:10:05 +0100957 if ((srv->state & SRV_RUNNING) ||
958 (px->options & PR_O_PERSIST) ||
959 (s->flags & SN_FORCE_PRST)) {
Emeric Brun1d33b292010-01-04 15:47:17 +0100960 s->flags |= SN_DIRECT | SN_ASSIGNED;
961 s->srv = srv;
962 }
963 }
964 }
965 ts->expire = tick_add(now_ms, MS_TO_TICKS(rule->table.t->expire));
966 }
967 }
968 if (rule->flags & STK_IS_STORE) {
969 if (s->store_count < (sizeof(s->store) / sizeof(s->store[0]))) {
970 struct stksess *ts;
971
972 ts = stksess_new(rule->table.t, key);
973 if (ts) {
974 s->store[s->store_count].table = rule->table.t;
975 s->store[s->store_count++].ts = ts;
976 }
977 }
978 }
979 }
980 }
981
982 req->analysers &= ~an_bit;
983 req->analyse_exp = TICK_ETERNITY;
984 return 1;
985}
986
987/* This stream analyser works on a response. It applies all store rules on it
988 * then returns 1. The data must already be present in the buffer otherwise
989 * they won't match. It always returns 1.
990 */
991int process_store_rules(struct session *s, struct buffer *rep, int an_bit)
992{
993 struct proxy *px = s->be;
994 struct sticking_rule *rule;
995 int i;
996
997 DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bl=%d analysers=%02x\n",
998 now_ms, __FUNCTION__,
999 s,
Willy Tarreau2e2b3eb2010-02-09 20:55:44 +01001000 rep,
1001 rep->rex, rep->wex,
1002 rep->flags,
1003 rep->l,
1004 rep->analysers);
Emeric Brun1d33b292010-01-04 15:47:17 +01001005
1006 list_for_each_entry(rule, &px->storersp_rules, list) {
1007 int ret = 1 ;
1008 int storereqidx = -1;
1009
1010 for (i = 0; i < s->store_count; i++) {
1011 if (rule->table.t == s->store[i].table) {
1012 if (!(s->store[i].flags))
1013 storereqidx = i;
1014 break;
1015 }
1016 }
1017
1018 if ((i != s->store_count) && (storereqidx == -1))
1019 continue;
1020
1021 if (rule->cond) {
1022 ret = acl_exec_cond(rule->cond, px, s, &s->txn, ACL_DIR_RTR);
1023 ret = acl_pass(ret);
1024 if (rule->cond->pol == ACL_COND_UNLESS)
1025 ret = !ret;
1026 }
1027
1028 if (ret) {
1029 struct stktable_key *key;
1030
Willy Tarreauf0b38bf2010-06-06 13:22:23 +02001031 key = stktable_fetch_key(px, s, &s->txn, PATTERN_FETCH_RTR, rule->expr, rule->table.t->type);
Emeric Brun1d33b292010-01-04 15:47:17 +01001032 if (!key)
1033 continue;
1034
1035 if (storereqidx != -1) {
Willy Tarreau393379c2010-06-06 12:11:37 +02001036 stksess_setkey(s->store[storereqidx].table, s->store[storereqidx].ts, key);
Emeric Brun1d33b292010-01-04 15:47:17 +01001037 s->store[storereqidx].flags = 1;
1038 }
1039 else if (s->store_count < (sizeof(s->store) / sizeof(s->store[0]))) {
1040 struct stksess *ts;
1041
1042 ts = stksess_new(rule->table.t, key);
1043 if (ts) {
1044 s->store[s->store_count].table = rule->table.t;
1045 s->store[s->store_count].flags = 1;
1046 s->store[s->store_count++].ts = ts;
1047 }
1048 }
1049 }
1050 }
1051
1052 /* process store request and store response */
1053 for (i = 0; i < s->store_count; i++) {
Willy Tarreauf16d2b82010-06-06 15:38:59 +02001054 struct stksess *ts;
Willy Tarreau13c29de2010-06-06 16:40:39 +02001055 void *ptr;
Willy Tarreauf16d2b82010-06-06 15:38:59 +02001056
1057 ts = stktable_lookup(s->store[i].table, s->store[i].ts);
1058 if (ts) {
1059 /* the entry already existed, we can free ours */
Willy Tarreaucb183642010-06-06 17:58:34 +02001060 stktable_touch(s->store[i].table, s->store[i].ts);
Emeric Brun1d33b292010-01-04 15:47:17 +01001061 stksess_free(s->store[i].table, s->store[i].ts);
Emeric Brun1d33b292010-01-04 15:47:17 +01001062 }
Willy Tarreauf16d2b82010-06-06 15:38:59 +02001063 else
1064 ts = stktable_store(s->store[i].table, s->store[i].ts);
1065
1066 s->store[i].ts = NULL;
Willy Tarreau13c29de2010-06-06 16:40:39 +02001067 ptr = stktable_data_ptr(s->store[i].table, ts, STKTABLE_DT_SERVER_ID);
1068 stktable_data_cast(ptr, server_id) = s->srv->puid;
Emeric Brun1d33b292010-01-04 15:47:17 +01001069 }
1070
1071 rep->analysers &= ~an_bit;
1072 rep->analyse_exp = TICK_ETERNITY;
1073 return 1;
1074}
1075
/* This macro is very specific to the function below. See the comments in
 * process_session() below to understand the logic and the tests.
 *
 * It must be expanded directly inside the loop which runs the analysers,
 * because it uses "break" and "continue" on that loop. After the analyser
 * designated by <flag> has been called, it :
 *   - rebuilds the work list <list> : the bit <flag> is removed, the bits
 *     which were not set in the previous copy <back> are added, and the
 *     result is restricted to the bits currently set in <real> ;
 *   - saves <real> into <back> for the next comparison ;
 *   - leaves the loop if the work list is empty ;
 *   - restarts the loop if the lowest bit set in the work list is lower than
 *     <flag>, which means that an earlier analyser has to be run.
 * <list> and <back> must be lvalues ; both are modified.
 */
#define UPDATE_ANALYSERS(real, list, back, flag) {			\
		list = (real) & (~(back) | ((list) & ~(flag)));		\
		back = (real);						\
		if (!(list))						\
			break;						\
		if (((list) & ~((list) - 1)) < (flag))			\
			continue;					\
}
1087
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001088/* Processes the client, server, request and response jobs of a session task,
1089 * then puts it back to the wait queue in a clean state, or cleans up its
1090 * resources if it must be deleted. Returns in <next> the date the task wants
1091 * to be woken up, or TICK_ETERNITY. In order not to call all functions for
1092 * nothing too many times, the request and response buffers flags are monitored
1093 * and each function is called only if at least another function has changed at
1094 * least one flag it is interested in.
1095 */
Willy Tarreau26c25062009-03-08 09:38:41 +01001096struct task *process_session(struct task *t)
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001097{
1098 struct session *s = t->context;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001099 unsigned int rqf_last, rpf_last;
Willy Tarreau576507f2010-01-07 00:09:04 +01001100 unsigned int req_ana_back;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001101
1102 //DPRINTF(stderr, "%s:%d: cs=%d ss=%d(%d) rqf=0x%08x rpf=0x%08x\n", __FUNCTION__, __LINE__,
1103 // s->si[0].state, s->si[1].state, s->si[1].err_type, s->req->flags, s->rep->flags);
1104
Krzysztof Piotr Oledzkif9423ae2010-01-29 19:26:18 +01001105 /* this data may be no longer valid, clear it */
1106 memset(&s->txn.auth, 0, sizeof(s->txn.auth));
1107
Willy Tarreaub67a9b82009-06-21 22:03:51 +02001108 /* This flag must explicitly be set every time */
1109 s->req->flags &= ~BF_READ_NOEXP;
1110
1111 /* Keep a copy of req/rep flags so that we can detect shutdowns */
1112 rqf_last = s->req->flags;
1113 rpf_last = s->rep->flags;
1114
Willy Tarreau89f7ef22009-09-05 20:57:35 +02001115 /* we don't want the stream interface functions to recursively wake us up */
1116 if (s->req->prod->owner == t)
1117 s->req->prod->flags |= SI_FL_DONT_WAKE;
1118 if (s->req->cons->owner == t)
1119 s->req->cons->flags |= SI_FL_DONT_WAKE;
1120
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001121 /* 1a: Check for low level timeouts if needed. We just set a flag on
1122 * stream interfaces when their timeouts have expired.
1123 */
1124 if (unlikely(t->state & TASK_WOKEN_TIMER)) {
1125 stream_int_check_timeouts(&s->si[0]);
1126 stream_int_check_timeouts(&s->si[1]);
Willy Tarreaub67a9b82009-06-21 22:03:51 +02001127
1128 /* check buffer timeouts, and close the corresponding stream interfaces
1129 * for future reads or writes. Note: this will also concern upper layers
1130 * but we do not touch any other flag. We must be careful and correctly
1131 * detect state changes when calling them.
1132 */
1133
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001134 buffer_check_timeouts(s->req);
Willy Tarreaub67a9b82009-06-21 22:03:51 +02001135
Willy Tarreau14641402009-12-29 14:49:56 +01001136 if (unlikely((s->req->flags & (BF_SHUTW|BF_WRITE_TIMEOUT)) == BF_WRITE_TIMEOUT)) {
1137 s->req->cons->flags |= SI_FL_NOLINGER;
1138 s->req->cons->shutw(s->req->cons);
1139 }
1140
Willy Tarreaub67a9b82009-06-21 22:03:51 +02001141 if (unlikely((s->req->flags & (BF_SHUTR|BF_READ_TIMEOUT)) == BF_READ_TIMEOUT))
1142 s->req->prod->shutr(s->req->prod);
1143
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001144 buffer_check_timeouts(s->rep);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001145
Willy Tarreau14641402009-12-29 14:49:56 +01001146 if (unlikely((s->rep->flags & (BF_SHUTW|BF_WRITE_TIMEOUT)) == BF_WRITE_TIMEOUT)) {
1147 s->rep->cons->flags |= SI_FL_NOLINGER;
1148 s->rep->cons->shutw(s->rep->cons);
1149 }
1150
Willy Tarreaub67a9b82009-06-21 22:03:51 +02001151 if (unlikely((s->rep->flags & (BF_SHUTR|BF_READ_TIMEOUT)) == BF_READ_TIMEOUT))
1152 s->rep->prod->shutr(s->rep->prod);
Willy Tarreaub67a9b82009-06-21 22:03:51 +02001153 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001154
1155 /* 1b: check for low-level errors reported at the stream interface.
1156 * First we check if it's a retryable error (in which case we don't
1157 * want to tell the buffer). Otherwise we report the error one level
1158 * upper by setting flags into the buffers. Note that the side towards
1159 * the client cannot have connect (hence retryable) errors. Also, the
1160 * connection setup code must be able to deal with any type of abort.
1161 */
1162 if (unlikely(s->si[0].flags & SI_FL_ERR)) {
1163 if (s->si[0].state == SI_ST_EST || s->si[0].state == SI_ST_DIS) {
1164 s->si[0].shutr(&s->si[0]);
1165 s->si[0].shutw(&s->si[0]);
1166 stream_int_report_error(&s->si[0]);
Willy Tarreau05cb29b2008-12-14 11:44:04 +01001167 if (!(s->req->analysers) && !(s->rep->analysers)) {
Willy Tarreauae526782010-03-04 20:34:23 +01001168 s->be->counters.cli_aborts++;
1169 if (s->srv)
1170 s->srv->counters.cli_aborts++;
Willy Tarreau05cb29b2008-12-14 11:44:04 +01001171 if (!(s->flags & SN_ERR_MASK))
1172 s->flags |= SN_ERR_CLICL;
1173 if (!(s->flags & SN_FINST_MASK))
1174 s->flags |= SN_FINST_D;
1175 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001176 }
1177 }
1178
1179 if (unlikely(s->si[1].flags & SI_FL_ERR)) {
1180 if (s->si[1].state == SI_ST_EST || s->si[1].state == SI_ST_DIS) {
1181 s->si[1].shutr(&s->si[1]);
1182 s->si[1].shutw(&s->si[1]);
1183 stream_int_report_error(&s->si[1]);
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +02001184 s->be->counters.failed_resp++;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001185 if (s->srv)
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +02001186 s->srv->counters.failed_resp++;
Willy Tarreau05cb29b2008-12-14 11:44:04 +01001187 if (!(s->req->analysers) && !(s->rep->analysers)) {
Willy Tarreauae526782010-03-04 20:34:23 +01001188 s->be->counters.srv_aborts++;
1189 if (s->srv)
1190 s->srv->counters.srv_aborts++;
Willy Tarreau05cb29b2008-12-14 11:44:04 +01001191 if (!(s->flags & SN_ERR_MASK))
1192 s->flags |= SN_ERR_SRVCL;
1193 if (!(s->flags & SN_FINST_MASK))
1194 s->flags |= SN_FINST_D;
1195 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001196 }
1197 /* note: maybe we should process connection errors here ? */
1198 }
1199
1200 if (s->si[1].state == SI_ST_CON) {
1201 /* we were trying to establish a connection on the server side,
1202 * maybe it succeeded, maybe it failed, maybe we timed out, ...
1203 */
1204 if (unlikely(!sess_update_st_con_tcp(s, &s->si[1])))
1205 sess_update_st_cer(s, &s->si[1]);
1206 else if (s->si[1].state == SI_ST_EST)
1207 sess_establish(s, &s->si[1]);
1208
1209 /* state is now one of SI_ST_CON (still in progress), SI_ST_EST
1210 * (established), SI_ST_DIS (abort), SI_ST_CLO (last error),
1211 * SI_ST_ASS/SI_ST_TAR/SI_ST_REQ for retryable errors.
1212 */
1213 }
1214
Willy Tarreaub67a9b82009-06-21 22:03:51 +02001215resync_stream_interface:
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001216 /* Check for connection closure */
1217
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001218 DPRINTF(stderr,
1219 "[%u] %s:%d: task=%p s=%p, sfl=0x%08x, rq=%p, rp=%p, exp(r,w)=%u,%u rqf=%08x rpf=%08x rql=%d rpl=%d cs=%d ss=%d, cet=0x%x set=0x%x retr=%d\n",
1220 now_ms, __FUNCTION__, __LINE__,
1221 t,
1222 s, s->flags,
1223 s->req, s->rep,
1224 s->req->rex, s->rep->wex,
1225 s->req->flags, s->rep->flags,
1226 s->req->l, s->rep->l, s->rep->cons->state, s->req->cons->state,
1227 s->rep->cons->err_type, s->req->cons->err_type,
Willy Tarreauee28de02010-06-01 09:51:00 +02001228 s->req->cons->conn_retries);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001229
1230 /* nothing special to be done on client side */
1231 if (unlikely(s->req->prod->state == SI_ST_DIS))
1232 s->req->prod->state = SI_ST_CLO;
1233
1234 /* When a server-side connection is released, we have to count it and
1235 * check for pending connections on this server.
1236 */
1237 if (unlikely(s->req->cons->state == SI_ST_DIS)) {
1238 s->req->cons->state = SI_ST_CLO;
1239 if (s->srv) {
1240 if (s->flags & SN_CURR_SESS) {
1241 s->flags &= ~SN_CURR_SESS;
1242 s->srv->cur_sess--;
1243 }
1244 sess_change_server(s, NULL);
1245 if (may_dequeue_tasks(s->srv, s->be))
1246 process_srv_queue(s->srv);
1247 }
1248 }
1249
1250 /*
1251 * Note: of the transient states (REQ, CER, DIS), only REQ may remain
1252 * at this point.
1253 */
1254
Willy Tarreau0be0ef92009-03-08 19:20:25 +01001255 resync_request:
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001256 /* Analyse request */
1257 if ((s->req->flags & BF_MASK_ANALYSER) ||
1258 (s->req->flags ^ rqf_last) & BF_MASK_STATIC) {
1259 unsigned int flags = s->req->flags;
1260
1261 if (s->req->prod->state >= SI_ST_EST) {
Willy Tarreaue34070e2010-01-08 00:32:27 +01001262 int max_loops = global.tune.maxpollevents;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001263 unsigned int ana_list;
1264 unsigned int ana_back;
Willy Tarreau1a52dbd2009-06-28 19:37:53 +02001265
Willy Tarreau90deb182010-01-07 00:20:41 +01001266 /* it's up to the analysers to stop new connections,
1267 * disable reading or closing. Note: if an analyser
1268 * disables any of these bits, it is responsible for
1269 * enabling them again when it disables itself, so
1270 * that other analysers are called in similar conditions.
1271 */
1272 buffer_auto_read(s->req);
Willy Tarreau520d95e2009-09-19 21:04:57 +02001273 buffer_auto_connect(s->req);
1274 buffer_auto_close(s->req);
Willy Tarreauedcf6682008-11-30 23:15:34 +01001275
1276 /* We will call all analysers for which a bit is set in
1277 * s->req->analysers, following the bit order from LSB
1278 * to MSB. The analysers must remove themselves from
Willy Tarreau1a52dbd2009-06-28 19:37:53 +02001279 * the list when not needed. Any analyser may return 0
1280 * to break out of the loop, either because of missing
1281 * data to take a decision, or because it decides to
1282 * kill the session. We loop at least once through each
1283 * analyser, and we may loop again if other analysers
1284 * are added in the middle.
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001285 *
1286 * We build a list of analysers to run. We evaluate all
1287 * of these analysers in the order of the lower bit to
1288 * the higher bit. This ordering is very important.
1289 * An analyser will often add/remove other analysers,
1290 * including itself. Any changes to itself have no effect
1291 * on the loop. If it removes any other analysers, we
1292 * want those analysers not to be called anymore during
1293 * this loop. If it adds an analyser that is located
1294 * after itself, we want it to be scheduled for being
1295 * processed during the loop. If it adds an analyser
1296 * which is located before it, we want it to switch to
1297 * it immediately, even if it has already been called
1298 * once but removed since.
1299 *
1300 * In order to achieve this, we compare the analyser
1301 * list after the call with a copy of it before the
1302 * call. The work list is fed with analyser bits that
1303 * appeared during the call. Then we compare previous
1304 * work list with the new one, and check the bits that
1305 * appeared. If the lowest of these bits is lower than
1306 * the current bit, it means we have enabled a previous
1307 * analyser and must immediately loop again.
Willy Tarreauedcf6682008-11-30 23:15:34 +01001308 */
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001309
1310 ana_list = ana_back = s->req->analysers;
Willy Tarreaue34070e2010-01-08 00:32:27 +01001311 while (ana_list && max_loops--) {
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001312 /* Warning! ensure that analysers are always placed in ascending order! */
Willy Tarreau1a52dbd2009-06-28 19:37:53 +02001313
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001314 if (ana_list & AN_REQ_INSPECT) {
Willy Tarreau3a816292009-07-07 10:55:49 +02001315 if (!tcp_inspect_request(s, s->req, AN_REQ_INSPECT))
Willy Tarreauedcf6682008-11-30 23:15:34 +01001316 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001317 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_INSPECT);
Willy Tarreau1a52dbd2009-06-28 19:37:53 +02001318 }
Willy Tarreauedcf6682008-11-30 23:15:34 +01001319
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001320 if (ana_list & AN_REQ_WAIT_HTTP) {
Willy Tarreau3a816292009-07-07 10:55:49 +02001321 if (!http_wait_for_request(s, s->req, AN_REQ_WAIT_HTTP))
Willy Tarreaud787e662009-07-07 10:14:51 +02001322 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001323 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_WAIT_HTTP);
Willy Tarreaud787e662009-07-07 10:14:51 +02001324 }
1325
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001326 if (ana_list & AN_REQ_HTTP_PROCESS_FE) {
Willy Tarreau1d0dfb12009-07-07 15:10:31 +02001327 if (!http_process_req_common(s, s->req, AN_REQ_HTTP_PROCESS_FE, s->fe))
1328 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001329 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_HTTP_PROCESS_FE);
Willy Tarreau1d0dfb12009-07-07 15:10:31 +02001330 }
1331
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001332 if (ana_list & AN_REQ_SWITCHING_RULES) {
Willy Tarreau1d0dfb12009-07-07 15:10:31 +02001333 if (!process_switching_rules(s, s->req, AN_REQ_SWITCHING_RULES))
1334 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001335 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_SWITCHING_RULES);
Willy Tarreau1d0dfb12009-07-07 15:10:31 +02001336 }
1337
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001338 if (ana_list & AN_REQ_HTTP_PROCESS_BE) {
Willy Tarreau1d0dfb12009-07-07 15:10:31 +02001339 if (!http_process_req_common(s, s->req, AN_REQ_HTTP_PROCESS_BE, s->be))
1340 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001341 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_HTTP_PROCESS_BE);
Willy Tarreau1d0dfb12009-07-07 15:10:31 +02001342 }
1343
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001344 if (ana_list & AN_REQ_HTTP_TARPIT) {
Willy Tarreau3a816292009-07-07 10:55:49 +02001345 if (!http_process_tarpit(s, s->req, AN_REQ_HTTP_TARPIT))
Willy Tarreau60b85b02008-11-30 23:28:40 +01001346 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001347 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_HTTP_TARPIT);
Willy Tarreau1a52dbd2009-06-28 19:37:53 +02001348 }
Willy Tarreau60b85b02008-11-30 23:28:40 +01001349
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001350 if (ana_list & AN_REQ_HTTP_INNER) {
Willy Tarreauc465fd72009-08-31 00:17:18 +02001351 if (!http_process_request(s, s->req, AN_REQ_HTTP_INNER))
1352 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001353 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_HTTP_INNER);
Willy Tarreauc465fd72009-08-31 00:17:18 +02001354 }
1355
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001356 if (ana_list & AN_REQ_HTTP_BODY) {
Willy Tarreau3a816292009-07-07 10:55:49 +02001357 if (!http_process_request_body(s, s->req, AN_REQ_HTTP_BODY))
Willy Tarreaud34af782008-11-30 23:36:37 +01001358 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001359 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_HTTP_BODY);
Willy Tarreau1a52dbd2009-06-28 19:37:53 +02001360 }
Emeric Brun647caf12009-06-30 17:57:00 +02001361
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001362 if (ana_list & AN_REQ_PRST_RDP_COOKIE) {
Emeric Brun647caf12009-06-30 17:57:00 +02001363 if (!tcp_persist_rdp_cookie(s, s->req, AN_REQ_PRST_RDP_COOKIE))
1364 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001365 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_PRST_RDP_COOKIE);
Emeric Brun647caf12009-06-30 17:57:00 +02001366 }
Willy Tarreaud98cf932009-12-27 22:54:55 +01001367
Emeric Brun1d33b292010-01-04 15:47:17 +01001368 if (ana_list & AN_REQ_STICKING_RULES) {
1369 if (!process_sticking_rules(s, s->req, AN_REQ_STICKING_RULES))
1370 break;
1371 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_STICKING_RULES);
1372 }
1373
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001374 if (ana_list & AN_REQ_HTTP_XFER_BODY) {
Willy Tarreaud98cf932009-12-27 22:54:55 +01001375 if (!http_request_forward_body(s, s->req, AN_REQ_HTTP_XFER_BODY))
1376 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001377 UPDATE_ANALYSERS(s->req->analysers, ana_list, ana_back, AN_REQ_HTTP_XFER_BODY);
Willy Tarreaud98cf932009-12-27 22:54:55 +01001378 }
Willy Tarreaue34070e2010-01-08 00:32:27 +01001379 break;
1380 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001381 }
Willy Tarreau84455332009-03-15 22:34:05 +01001382
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001383 if ((s->req->flags ^ flags) & BF_MASK_STATIC) {
1384 rqf_last = s->req->flags;
1385 goto resync_request;
1386 }
1387 }
1388
Willy Tarreau576507f2010-01-07 00:09:04 +01001389 /* we'll monitor the request analysers while parsing the response,
1390 * because some response analysers may indirectly enable new request
1391 * analysers (eg: HTTP keep-alive).
1392 */
1393 req_ana_back = s->req->analysers;
1394
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001395 resync_response:
1396 /* Analyse response */
1397
1398 if (unlikely(s->rep->flags & BF_HIJACK)) {
1399 /* In inject mode, we wake up everytime something has
1400 * happened on the write side of the buffer.
1401 */
1402 unsigned int flags = s->rep->flags;
1403
1404 if ((s->rep->flags & (BF_WRITE_PARTIAL|BF_WRITE_ERROR|BF_SHUTW)) &&
1405 !(s->rep->flags & BF_FULL)) {
1406 s->rep->hijacker(s, s->rep);
1407 }
1408
1409 if ((s->rep->flags ^ flags) & BF_MASK_STATIC) {
1410 rpf_last = s->rep->flags;
1411 goto resync_response;
1412 }
1413 }
1414 else if ((s->rep->flags & BF_MASK_ANALYSER) ||
1415 (s->rep->flags ^ rpf_last) & BF_MASK_STATIC) {
1416 unsigned int flags = s->rep->flags;
1417
1418 if (s->rep->prod->state >= SI_ST_EST) {
Willy Tarreaue34070e2010-01-08 00:32:27 +01001419 int max_loops = global.tune.maxpollevents;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001420 unsigned int ana_list;
1421 unsigned int ana_back;
Willy Tarreaub37c27e2009-10-18 22:53:08 +02001422
Willy Tarreau90deb182010-01-07 00:20:41 +01001423 /* it's up to the analysers to stop disable reading or
1424 * closing. Note: if an analyser disables any of these
1425 * bits, it is responsible for enabling them again when
1426 * it disables itself, so that other analysers are called
1427 * in similar conditions.
1428 */
1429 buffer_auto_read(s->rep);
Willy Tarreau520d95e2009-09-19 21:04:57 +02001430 buffer_auto_close(s->rep);
Willy Tarreaub37c27e2009-10-18 22:53:08 +02001431
1432 /* We will call all analysers for which a bit is set in
1433 * s->rep->analysers, following the bit order from LSB
1434 * to MSB. The analysers must remove themselves from
1435 * the list when not needed. Any analyser may return 0
1436 * to break out of the loop, either because of missing
1437 * data to take a decision, or because it decides to
1438 * kill the session. We loop at least once through each
1439 * analyser, and we may loop again if other analysers
1440 * are added in the middle.
1441 */
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001442
1443 ana_list = ana_back = s->rep->analysers;
Willy Tarreaue34070e2010-01-08 00:32:27 +01001444 while (ana_list && max_loops--) {
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001445 /* Warning! ensure that analysers are always placed in ascending order! */
1446
1447 if (ana_list & AN_RES_WAIT_HTTP) {
Willy Tarreaub37c27e2009-10-18 22:53:08 +02001448 if (!http_wait_for_response(s, s->rep, AN_RES_WAIT_HTTP))
1449 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001450 UPDATE_ANALYSERS(s->rep->analysers, ana_list, ana_back, AN_RES_WAIT_HTTP);
Willy Tarreaub37c27e2009-10-18 22:53:08 +02001451 }
1452
Emeric Brun1d33b292010-01-04 15:47:17 +01001453 if (ana_list & AN_RES_STORE_RULES) {
1454 if (!process_store_rules(s, s->rep, AN_RES_STORE_RULES))
1455 break;
1456 UPDATE_ANALYSERS(s->rep->analysers, ana_list, ana_back, AN_RES_STORE_RULES);
1457 }
1458
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001459 if (ana_list & AN_RES_HTTP_PROCESS_BE) {
Willy Tarreaub37c27e2009-10-18 22:53:08 +02001460 if (!http_process_res_common(s, s->rep, AN_RES_HTTP_PROCESS_BE, s->be))
1461 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001462 UPDATE_ANALYSERS(s->rep->analysers, ana_list, ana_back, AN_RES_HTTP_PROCESS_BE);
Willy Tarreaub37c27e2009-10-18 22:53:08 +02001463 }
Willy Tarreaud98cf932009-12-27 22:54:55 +01001464
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001465 if (ana_list & AN_RES_HTTP_XFER_BODY) {
Willy Tarreaud98cf932009-12-27 22:54:55 +01001466 if (!http_response_forward_body(s, s->rep, AN_RES_HTTP_XFER_BODY))
1467 break;
Willy Tarreau1e0bbaf2010-01-06 23:53:24 +01001468 UPDATE_ANALYSERS(s->rep->analysers, ana_list, ana_back, AN_RES_HTTP_XFER_BODY);
Willy Tarreaud98cf932009-12-27 22:54:55 +01001469 }
Willy Tarreaue34070e2010-01-08 00:32:27 +01001470 break;
1471 }
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001472 }
1473
1474 if ((s->rep->flags ^ flags) & BF_MASK_STATIC) {
1475 rpf_last = s->rep->flags;
1476 goto resync_response;
1477 }
1478 }
1479
Willy Tarreau576507f2010-01-07 00:09:04 +01001480 /* maybe someone has added some request analysers, so we must check and loop */
1481 if (s->req->analysers & ~req_ana_back)
1482 goto resync_request;
1483
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001484 /* FIXME: here we should call protocol handlers which rely on
1485 * both buffers.
1486 */
1487
1488
1489 /*
Willy Tarreauae526782010-03-04 20:34:23 +01001490 * Now we propagate unhandled errors to the session. Normally
1491 * we're just in a data phase here since it means we have not
1492 * seen any analyser who could set an error status.
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001493 */
1494 if (!(s->flags & SN_ERR_MASK)) {
1495 if (s->req->flags & (BF_READ_ERROR|BF_READ_TIMEOUT|BF_WRITE_ERROR|BF_WRITE_TIMEOUT)) {
1496 /* Report it if the client got an error or a read timeout expired */
Willy Tarreau84455332009-03-15 22:34:05 +01001497 s->req->analysers = 0;
Willy Tarreauae526782010-03-04 20:34:23 +01001498 if (s->req->flags & BF_READ_ERROR) {
1499 s->be->counters.cli_aborts++;
1500 if (s->srv)
1501 s->srv->counters.cli_aborts++;
Willy Tarreau84455332009-03-15 22:34:05 +01001502 s->flags |= SN_ERR_CLICL;
Willy Tarreauae526782010-03-04 20:34:23 +01001503 }
1504 else if (s->req->flags & BF_READ_TIMEOUT) {
1505 s->be->counters.cli_aborts++;
1506 if (s->srv)
1507 s->srv->counters.cli_aborts++;
Willy Tarreau84455332009-03-15 22:34:05 +01001508 s->flags |= SN_ERR_CLITO;
Willy Tarreauae526782010-03-04 20:34:23 +01001509 }
1510 else if (s->req->flags & BF_WRITE_ERROR) {
1511 s->be->counters.srv_aborts++;
1512 if (s->srv)
1513 s->srv->counters.srv_aborts++;
Willy Tarreau84455332009-03-15 22:34:05 +01001514 s->flags |= SN_ERR_SRVCL;
Willy Tarreauae526782010-03-04 20:34:23 +01001515 }
1516 else {
1517 s->be->counters.srv_aborts++;
1518 if (s->srv)
1519 s->srv->counters.srv_aborts++;
Willy Tarreau84455332009-03-15 22:34:05 +01001520 s->flags |= SN_ERR_SRVTO;
Willy Tarreauae526782010-03-04 20:34:23 +01001521 }
Willy Tarreau84455332009-03-15 22:34:05 +01001522 sess_set_term_flags(s);
1523 }
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001524 else if (s->rep->flags & (BF_READ_ERROR|BF_READ_TIMEOUT|BF_WRITE_ERROR|BF_WRITE_TIMEOUT)) {
1525 /* Report it if the server got an error or a read timeout expired */
1526 s->rep->analysers = 0;
Willy Tarreauae526782010-03-04 20:34:23 +01001527 if (s->rep->flags & BF_READ_ERROR) {
1528 s->be->counters.srv_aborts++;
1529 if (s->srv)
1530 s->srv->counters.srv_aborts++;
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001531 s->flags |= SN_ERR_SRVCL;
Willy Tarreauae526782010-03-04 20:34:23 +01001532 }
1533 else if (s->rep->flags & BF_READ_TIMEOUT) {
1534 s->be->counters.srv_aborts++;
1535 if (s->srv)
1536 s->srv->counters.srv_aborts++;
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001537 s->flags |= SN_ERR_SRVTO;
Willy Tarreauae526782010-03-04 20:34:23 +01001538 }
1539 else if (s->rep->flags & BF_WRITE_ERROR) {
1540 s->be->counters.cli_aborts++;
1541 if (s->srv)
1542 s->srv->counters.cli_aborts++;
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001543 s->flags |= SN_ERR_CLICL;
Willy Tarreauae526782010-03-04 20:34:23 +01001544 }
1545 else {
1546 s->be->counters.cli_aborts++;
1547 if (s->srv)
1548 s->srv->counters.cli_aborts++;
1549 s->flags |= SN_ERR_CLITO;
1550 }
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001551 sess_set_term_flags(s);
1552 }
Willy Tarreau84455332009-03-15 22:34:05 +01001553 }
1554
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001555 /*
1556 * Here we take care of forwarding unhandled data. This also includes
1557 * connection establishments and shutdown requests.
1558 */
1559
1560
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001561 /* If no one is interested in analysing data, it's time to forward
Willy Tarreau31971e52009-09-20 12:07:52 +02001562 * everything. We configure the buffer to forward indefinitely.
Willy Tarreau6b66f3e2008-12-14 17:31:54 +01001563 */
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001564 if (!s->req->analysers &&
Willy Tarreau82eeaf22009-12-29 12:09:05 +01001565 !(s->req->flags & (BF_HIJACK|BF_SHUTW|BF_SHUTW_NOW)) &&
Willy Tarreau31971e52009-09-20 12:07:52 +02001566 (s->req->prod->state >= SI_ST_EST) &&
1567 (s->req->to_forward != BUF_INFINITE_FORWARD)) {
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001568 /* This buffer is freewheeling, there's no analyser nor hijacker
1569 * attached to it. If any data are left in, we'll permit them to
1570 * move.
1571 */
Willy Tarreau90deb182010-01-07 00:20:41 +01001572 buffer_auto_read(s->req);
Willy Tarreau520d95e2009-09-19 21:04:57 +02001573 buffer_auto_connect(s->req);
1574 buffer_auto_close(s->req);
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001575 buffer_flush(s->req);
Willy Tarreau5bd8c372009-01-19 00:32:22 +01001576
Willy Tarreau31971e52009-09-20 12:07:52 +02001577 /* If the producer is still connected, we'll enable data to flow
1578 * from the producer to the consumer (which might possibly not be
1579 * connected yet).
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001580 */
Willy Tarreau31971e52009-09-20 12:07:52 +02001581 if (!(s->req->flags & (BF_SHUTR|BF_SHUTW|BF_SHUTW_NOW)))
1582 buffer_forward(s->req, BUF_INFINITE_FORWARD);
Willy Tarreau6b66f3e2008-12-14 17:31:54 +01001583 }
Willy Tarreauf890dc92008-12-13 21:12:26 +01001584
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001585 /* check if it is wise to enable kernel splicing to forward request data */
1586 if (!(s->req->flags & (BF_KERN_SPLICING|BF_SHUTR)) &&
1587 s->req->to_forward &&
1588 (global.tune.options & GTUNE_USE_SPLICE) &&
Willy Tarreaudc340a92009-06-28 23:10:19 +02001589 (s->si[0].flags & s->si[1].flags & SI_FL_CAP_SPLICE) &&
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001590 (pipes_used < global.maxpipes) &&
1591 (((s->fe->options2|s->be->options2) & PR_O2_SPLIC_REQ) ||
1592 (((s->fe->options2|s->be->options2) & PR_O2_SPLIC_AUT) &&
1593 (s->req->flags & BF_STREAMER_FAST)))) {
1594 s->req->flags |= BF_KERN_SPLICING;
1595 }
1596
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001597 /* reflect what the L7 analysers have seen last */
1598 rqf_last = s->req->flags;
1599
1600 /*
1601 * Now forward all shutdown requests between both sides of the buffer
1602 */
1603
Willy Tarreau520d95e2009-09-19 21:04:57 +02001604 /* first, let's check if the request buffer needs to shutdown(write), which may
1605 * happen either because the input is closed or because we want to force a close
Willy Tarreaue4599762010-03-21 23:25:09 +01001606 * once the server has begun to respond.
Willy Tarreau520d95e2009-09-19 21:04:57 +02001607 */
Willy Tarreau82eeaf22009-12-29 12:09:05 +01001608 if (unlikely((s->req->flags & (BF_SHUTW|BF_SHUTW_NOW|BF_HIJACK|BF_AUTO_CLOSE|BF_SHUTR)) ==
Willy Tarreaue4599762010-03-21 23:25:09 +01001609 (BF_AUTO_CLOSE|BF_SHUTR)))
Willy Tarreauba0b63d2009-09-20 08:09:44 +02001610 buffer_shutw_now(s->req);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001611
1612 /* shutdown(write) pending */
Willy Tarreauba0b63d2009-09-20 08:09:44 +02001613 if (unlikely((s->req->flags & (BF_SHUTW|BF_SHUTW_NOW|BF_OUT_EMPTY)) == (BF_SHUTW_NOW|BF_OUT_EMPTY)))
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001614 s->req->cons->shutw(s->req->cons);
1615
1616 /* shutdown(write) done on server side, we must stop the client too */
Willy Tarreau3dbc6942008-12-07 13:05:04 +01001617 if (unlikely((s->req->flags & (BF_SHUTW|BF_SHUTR|BF_SHUTR_NOW)) == BF_SHUTW &&
1618 !s->req->analysers))
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001619 buffer_shutr_now(s->req);
1620
1621 /* shutdown(read) pending */
1622 if (unlikely((s->req->flags & (BF_SHUTR|BF_SHUTR_NOW)) == BF_SHUTR_NOW))
1623 s->req->prod->shutr(s->req->prod);
1624
Willy Tarreau520d95e2009-09-19 21:04:57 +02001625 /* it's possible that an upper layer has requested a connection setup or abort.
1626 * There are 2 situations where we decide to establish a new connection :
1627 * - there are data scheduled for emission in the buffer
1628 * - the BF_AUTO_CONNECT flag is set (active connection)
1629 */
1630 if (s->req->cons->state == SI_ST_INI) {
Willy Tarreaue4599762010-03-21 23:25:09 +01001631 if (!(s->req->flags & BF_SHUTW)) {
Willy Tarreauba0b63d2009-09-20 08:09:44 +02001632 if ((s->req->flags & (BF_AUTO_CONNECT|BF_OUT_EMPTY)) != BF_OUT_EMPTY) {
Willy Tarreau85e7d002010-05-31 11:57:51 +02001633 /* If we have an iohandler without a connect method, we immediately
1634 * switch to the connected state, otherwise we perform a connection
1635 * request.
Willy Tarreau520d95e2009-09-19 21:04:57 +02001636 */
Willy Tarreau85e7d002010-05-31 11:57:51 +02001637 s->req->cons->state = SI_ST_REQ; /* new connection requested */
Willy Tarreau070ceb62010-06-01 10:36:43 +02001638 s->req->cons->conn_retries = s->be->conn_retries;
Willy Tarreau85e7d002010-05-31 11:57:51 +02001639 if (unlikely(s->req->cons->iohandler && !s->req->cons->connect)) {
Willy Tarreau520d95e2009-09-19 21:04:57 +02001640 s->req->cons->state = SI_ST_EST; /* connection established */
Willy Tarreau85e7d002010-05-31 11:57:51 +02001641 s->rep->flags |= BF_READ_ATTACHED; /* producer is now attached */
1642 s->req->wex = TICK_ETERNITY;
1643 }
Willy Tarreau520d95e2009-09-19 21:04:57 +02001644 }
Willy Tarreau73201222009-08-16 18:27:24 +02001645 }
Willy Tarreauf41ffdc2009-09-20 08:19:25 +02001646 else {
Willy Tarreau92795622009-03-06 12:51:23 +01001647 s->req->cons->state = SI_ST_CLO; /* shutw+ini = abort */
Willy Tarreauf41ffdc2009-09-20 08:19:25 +02001648 buffer_shutw_now(s->req); /* fix buffer flags upon abort */
1649 buffer_shutr_now(s->rep);
1650 }
Willy Tarreau92795622009-03-06 12:51:23 +01001651 }
1652
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001653
1654 /* we may have a pending connection request, or a connection waiting
1655 * for completion.
1656 */
1657 if (s->si[1].state >= SI_ST_REQ && s->si[1].state < SI_ST_CON) {
1658 do {
1659 /* nb: step 1 might switch from QUE to ASS, but we first want
1660 * to give a chance to step 2 to perform a redirect if needed.
1661 */
1662 if (s->si[1].state != SI_ST_REQ)
1663 sess_update_stream_int(s, &s->si[1]);
1664 if (s->si[1].state == SI_ST_REQ)
1665 sess_prepare_conn_req(s, &s->si[1]);
1666
1667 if (s->si[1].state == SI_ST_ASS && s->srv &&
1668 s->srv->rdr_len && (s->flags & SN_REDIRECTABLE))
1669 perform_http_redirect(s, &s->si[1]);
1670 } while (s->si[1].state == SI_ST_ASS);
1671 }
1672
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001673 /* Benchmarks have shown that it's optimal to do a full resync now */
Willy Tarreau0be0ef92009-03-08 19:20:25 +01001674 if (s->req->prod->state == SI_ST_DIS || s->req->cons->state == SI_ST_DIS)
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001675 goto resync_stream_interface;
1676
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001677 /* otherwise we want to check if we need to resync the req buffer or not */
1678 if ((s->req->flags ^ rqf_last) & BF_MASK_STATIC)
Willy Tarreau0be0ef92009-03-08 19:20:25 +01001679 goto resync_request;
1680
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001681 /* perform output updates to the response buffer */
Willy Tarreau84455332009-03-15 22:34:05 +01001682
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001683 /* If no one is interested in analysing data, it's time to forward
Willy Tarreau31971e52009-09-20 12:07:52 +02001684 * everything. We configure the buffer to forward indefinitely.
Willy Tarreau6b66f3e2008-12-14 17:31:54 +01001685 */
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001686 if (!s->rep->analysers &&
Willy Tarreau82eeaf22009-12-29 12:09:05 +01001687 !(s->rep->flags & (BF_HIJACK|BF_SHUTW|BF_SHUTW_NOW)) &&
Willy Tarreau31971e52009-09-20 12:07:52 +02001688 (s->rep->prod->state >= SI_ST_EST) &&
1689 (s->rep->to_forward != BUF_INFINITE_FORWARD)) {
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001690 /* This buffer is freewheeling, there's no analyser nor hijacker
1691 * attached to it. If any data are left in, we'll permit them to
1692 * move.
1693 */
Willy Tarreau90deb182010-01-07 00:20:41 +01001694 buffer_auto_read(s->rep);
Willy Tarreau520d95e2009-09-19 21:04:57 +02001695 buffer_auto_close(s->rep);
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001696 buffer_flush(s->rep);
Willy Tarreau31971e52009-09-20 12:07:52 +02001697 if (!(s->rep->flags & (BF_SHUTR|BF_SHUTW|BF_SHUTW_NOW)))
1698 buffer_forward(s->rep, BUF_INFINITE_FORWARD);
Willy Tarreau6b66f3e2008-12-14 17:31:54 +01001699 }
Willy Tarreauf890dc92008-12-13 21:12:26 +01001700
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001701 /* check if it is wise to enable kernel splicing to forward response data */
1702 if (!(s->rep->flags & (BF_KERN_SPLICING|BF_SHUTR)) &&
1703 s->rep->to_forward &&
1704 (global.tune.options & GTUNE_USE_SPLICE) &&
Willy Tarreaudc340a92009-06-28 23:10:19 +02001705 (s->si[0].flags & s->si[1].flags & SI_FL_CAP_SPLICE) &&
Willy Tarreau7c84bab2009-03-08 21:38:23 +01001706 (pipes_used < global.maxpipes) &&
1707 (((s->fe->options2|s->be->options2) & PR_O2_SPLIC_RTR) ||
1708 (((s->fe->options2|s->be->options2) & PR_O2_SPLIC_AUT) &&
1709 (s->rep->flags & BF_STREAMER_FAST)))) {
1710 s->rep->flags |= BF_KERN_SPLICING;
1711 }
1712
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001713 /* reflect what the L7 analysers have seen last */
1714 rpf_last = s->rep->flags;
1715
1716 /*
1717 * Now forward all shutdown requests between both sides of the buffer
1718 */
1719
1720 /*
1721 * FIXME: this is probably where we should produce error responses.
1722 */
1723
Willy Tarreau6b66f3e2008-12-14 17:31:54 +01001724 /* first, let's check if the response buffer needs to shutdown(write) */
Willy Tarreau520d95e2009-09-19 21:04:57 +02001725 if (unlikely((s->rep->flags & (BF_SHUTW|BF_SHUTW_NOW|BF_HIJACK|BF_AUTO_CLOSE|BF_SHUTR)) ==
1726 (BF_AUTO_CLOSE|BF_SHUTR)))
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001727 buffer_shutw_now(s->rep);
1728
1729 /* shutdown(write) pending */
Willy Tarreauba0b63d2009-09-20 08:09:44 +02001730 if (unlikely((s->rep->flags & (BF_SHUTW|BF_OUT_EMPTY|BF_SHUTW_NOW)) == (BF_OUT_EMPTY|BF_SHUTW_NOW)))
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001731 s->rep->cons->shutw(s->rep->cons);
1732
1733 /* shutdown(write) done on the client side, we must stop the server too */
Willy Tarreau3dbc6942008-12-07 13:05:04 +01001734 if (unlikely((s->rep->flags & (BF_SHUTW|BF_SHUTR|BF_SHUTR_NOW)) == BF_SHUTW) &&
1735 !s->rep->analysers)
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001736 buffer_shutr_now(s->rep);
1737
1738 /* shutdown(read) pending */
1739 if (unlikely((s->rep->flags & (BF_SHUTR|BF_SHUTR_NOW)) == BF_SHUTR_NOW))
1740 s->rep->prod->shutr(s->rep->prod);
1741
Willy Tarreau0be0ef92009-03-08 19:20:25 +01001742 if (s->req->prod->state == SI_ST_DIS || s->req->cons->state == SI_ST_DIS)
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001743 goto resync_stream_interface;
1744
Willy Tarreau0be0ef92009-03-08 19:20:25 +01001745 if (s->req->flags != rqf_last)
1746 goto resync_request;
1747
Willy Tarreau3deb3d02009-06-21 22:43:05 +02001748 if ((s->rep->flags ^ rpf_last) & BF_MASK_STATIC)
Willy Tarreau0be0ef92009-03-08 19:20:25 +01001749 goto resync_response;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001750
Willy Tarreau89f7ef22009-09-05 20:57:35 +02001751 /* we're interested in getting wakeups again */
1752 s->req->prod->flags &= ~SI_FL_DONT_WAKE;
1753 s->req->cons->flags &= ~SI_FL_DONT_WAKE;
1754
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001755 /* This is needed only when debugging is enabled, to indicate
1756 * client-side or server-side close. Please note that in the unlikely
1757 * event where both sides would close at once, the sequence is reported
1758 * on the server side first.
1759 */
1760 if (unlikely((global.mode & MODE_DEBUG) &&
1761 (!(global.mode & MODE_QUIET) ||
1762 (global.mode & MODE_VERBOSE)))) {
1763 int len;
1764
1765 if (s->si[1].state == SI_ST_CLO &&
1766 s->si[1].prev_state == SI_ST_EST) {
1767 len = sprintf(trash, "%08x:%s.srvcls[%04x:%04x]\n",
1768 s->uniq_id, s->be->id,
1769 (unsigned short)s->si[0].fd,
1770 (unsigned short)s->si[1].fd);
1771 write(1, trash, len);
1772 }
1773
1774 if (s->si[0].state == SI_ST_CLO &&
1775 s->si[0].prev_state == SI_ST_EST) {
1776 len = sprintf(trash, "%08x:%s.clicls[%04x:%04x]\n",
1777 s->uniq_id, s->be->id,
1778 (unsigned short)s->si[0].fd,
1779 (unsigned short)s->si[1].fd);
1780 write(1, trash, len);
1781 }
1782 }
1783
1784 if (likely((s->rep->cons->state != SI_ST_CLO) ||
1785 (s->req->cons->state > SI_ST_INI && s->req->cons->state < SI_ST_CLO))) {
1786
1787 if ((s->fe->options & PR_O_CONTSTATS) && (s->flags & SN_BE_ASSIGNED))
1788 session_process_counters(s);
1789
Willy Tarreau1accfc02009-09-05 20:57:35 +02001790 if (s->rep->cons->state == SI_ST_EST && !s->rep->cons->iohandler)
Willy Tarreaudc85b392009-08-18 07:38:19 +02001791 s->rep->cons->update(s->rep->cons);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001792
Willy Tarreau1accfc02009-09-05 20:57:35 +02001793 if (s->req->cons->state == SI_ST_EST && !s->req->cons->iohandler)
Willy Tarreaudc85b392009-08-18 07:38:19 +02001794 s->req->cons->update(s->req->cons);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001795
Willy Tarreaua6eebb32010-06-04 11:40:20 +02001796 s->req->flags &= ~(BF_READ_NULL|BF_READ_PARTIAL|BF_WRITE_NULL|BF_WRITE_PARTIAL|BF_READ_ATTACHED);
1797 s->rep->flags &= ~(BF_READ_NULL|BF_READ_PARTIAL|BF_WRITE_NULL|BF_WRITE_PARTIAL|BF_READ_ATTACHED);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001798 s->si[0].prev_state = s->si[0].state;
1799 s->si[1].prev_state = s->si[1].state;
Willy Tarreaub0ef7352008-12-14 13:26:20 +01001800 s->si[0].flags &= ~(SI_FL_ERR|SI_FL_EXP);
1801 s->si[1].flags &= ~(SI_FL_ERR|SI_FL_EXP);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001802
1803 /* Trick: if a request is being waiting for the server to respond,
1804 * and if we know the server can timeout, we don't want the timeout
1805 * to expire on the client side first, but we're still interested
1806 * in passing data from the client to the server (eg: POST). Thus,
1807 * we can cancel the client's request timeout if the server's
1808 * request timeout is set and the server has not yet sent a response.
1809 */
1810
Willy Tarreau520d95e2009-09-19 21:04:57 +02001811 if ((s->rep->flags & (BF_AUTO_CLOSE|BF_SHUTR)) == 0 &&
Willy Tarreau86491c32008-12-14 09:04:47 +01001812 (tick_isset(s->req->wex) || tick_isset(s->rep->rex))) {
1813 s->req->flags |= BF_READ_NOEXP;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001814 s->req->rex = TICK_ETERNITY;
Willy Tarreau86491c32008-12-14 09:04:47 +01001815 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001816
Willy Tarreau1accfc02009-09-05 20:57:35 +02001817 /* Call the second stream interface's I/O handler if it's embedded.
1818 * Note that this one may wake the task up again.
1819 */
1820 if (s->req->cons->iohandler) {
1821 s->req->cons->iohandler(s->req->cons);
1822 if (task_in_rq(t)) {
1823 /* If we woke up, we don't want to requeue the
1824 * task to the wait queue, but rather requeue
1825 * it into the runqueue ASAP.
1826 */
1827 t->expire = TICK_ETERNITY;
1828 return t;
1829 }
1830 }
1831
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001832 t->expire = tick_first(tick_first(s->req->rex, s->req->wex),
1833 tick_first(s->rep->rex, s->rep->wex));
1834 if (s->req->analysers)
1835 t->expire = tick_first(t->expire, s->req->analyse_exp);
1836
1837 if (s->si[0].exp)
1838 t->expire = tick_first(t->expire, s->si[0].exp);
1839
1840 if (s->si[1].exp)
1841 t->expire = tick_first(t->expire, s->si[1].exp);
1842
1843#ifdef DEBUG_FULL
Willy Tarreau127334e2009-03-28 10:47:26 +01001844 fprintf(stderr,
1845 "[%u] queuing with exp=%u req->rex=%u req->wex=%u req->ana_exp=%u"
1846 " rep->rex=%u rep->wex=%u, si[0].exp=%u, si[1].exp=%u, cs=%d, ss=%d\n",
1847 now_ms, t->expire, s->req->rex, s->req->wex, s->req->analyse_exp,
1848 s->rep->rex, s->rep->wex, s->si[0].exp, s->si[1].exp, s->si[0].state, s->si[1].state);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001849#endif
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001850
1851#ifdef DEBUG_DEV
1852 /* this may only happen when no timeout is set or in case of an FSM bug */
Willy Tarreaud0a201b2009-03-08 15:53:06 +01001853 if (!tick_isset(t->expire))
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001854 ABORT_NOW();
1855#endif
Willy Tarreau26c25062009-03-08 09:38:41 +01001856 return t; /* nothing more to do */
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001857 }
1858
1859 s->fe->feconn--;
1860 if (s->flags & SN_BE_ASSIGNED)
1861 s->be->beconn--;
1862 actconn--;
Willy Tarreau6e6fb2b2009-08-16 18:20:44 +02001863 s->listener->nbconn--;
1864 if (s->listener->state == LI_FULL &&
1865 s->listener->nbconn < s->listener->maxconn) {
1866 /* we should reactivate the listener */
1867 EV_FD_SET(s->listener->fd, DIR_RD);
1868 s->listener->state = LI_READY;
1869 }
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001870
1871 if (unlikely((global.mode & MODE_DEBUG) &&
1872 (!(global.mode & MODE_QUIET) || (global.mode & MODE_VERBOSE)))) {
1873 int len;
Willy Tarreauec22b2c2009-03-06 13:07:40 +01001874 len = sprintf(trash, "%08x:%s.closed[%04x:%04x]\n",
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001875 s->uniq_id, s->be->id,
Willy Tarreauec22b2c2009-03-06 13:07:40 +01001876 (unsigned short)s->req->prod->fd, (unsigned short)s->req->cons->fd);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001877 write(1, trash, len);
1878 }
1879
1880 s->logs.t_close = tv_ms_elapsed(&s->logs.tv_accept, &now);
1881 session_process_counters(s);
1882
Krzysztof Piotr Oledzkide71d162009-10-24 15:36:15 +02001883 if (s->txn.status) {
1884 int n;
1885
1886 n = s->txn.status / 100;
1887 if (n < 1 || n > 5)
1888 n = 0;
1889
1890 if (s->fe->mode == PR_MODE_HTTP)
Willy Tarreau24657792010-02-26 10:30:28 +01001891 s->fe->counters.fe.http.rsp[n]++;
Krzysztof Piotr Oledzkide71d162009-10-24 15:36:15 +02001892
Willy Tarreau24657792010-02-26 10:30:28 +01001893 if ((s->flags & SN_BE_ASSIGNED) &&
Krzysztof Piotr Oledzkide71d162009-10-24 15:36:15 +02001894 (s->be->mode == PR_MODE_HTTP))
Willy Tarreau24657792010-02-26 10:30:28 +01001895 s->be->counters.be.http.rsp[n]++;
Krzysztof Piotr Oledzkide71d162009-10-24 15:36:15 +02001896 }
1897
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001898 /* let's do a final log if we need it */
1899 if (s->logs.logwait &&
1900 !(s->flags & SN_MONITOR) &&
1901 (!(s->fe->options & PR_O_NULLNOLOG) || s->req->total)) {
Willy Tarreaua5555ec2008-11-30 19:02:32 +01001902 s->do_log(s);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001903 }
1904
1905 /* the task MUST not be in the run queue anymore */
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001906 session_free(s);
Willy Tarreau26c25062009-03-08 09:38:41 +01001907 task_delete(t);
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001908 task_free(t);
Willy Tarreau26c25062009-03-08 09:38:41 +01001909 return NULL;
Willy Tarreau55a8d0e2008-11-30 18:47:21 +01001910}
1911
Willy Tarreau7c669d72008-06-20 15:04:11 +02001912/*
1913 * This function adjusts sess->srv_conn and maintains the previous and new
1914 * server's served session counts. Setting newsrv to NULL is enough to release
1915 * current connection slot. This function also notifies any LB algo which might
1916 * expect to be informed about any change in the number of active sessions on a
1917 * server.
1918 */
1919void sess_change_server(struct session *sess, struct server *newsrv)
1920{
1921 if (sess->srv_conn == newsrv)
1922 return;
1923
1924 if (sess->srv_conn) {
1925 sess->srv_conn->served--;
1926 if (sess->srv_conn->proxy->lbprm.server_drop_conn)
1927 sess->srv_conn->proxy->lbprm.server_drop_conn(sess->srv_conn);
1928 sess->srv_conn = NULL;
1929 }
1930
1931 if (newsrv) {
1932 newsrv->served++;
1933 if (newsrv->proxy->lbprm.server_take_conn)
1934 newsrv->proxy->lbprm.server_take_conn(newsrv);
1935 sess->srv_conn = newsrv;
1936 }
1937}
1938
Willy Tarreau84455332009-03-15 22:34:05 +01001939/* Set correct session termination flags in case no analyser has done it. It
1940 * also counts a failed request if the server state has not reached the request
1941 * stage.
1942 */
1943void sess_set_term_flags(struct session *s)
1944{
1945 if (!(s->flags & SN_FINST_MASK)) {
1946 if (s->si[1].state < SI_ST_REQ) {
Krzysztof Piotr Oledzkiaeebf9b2009-10-04 15:43:17 +02001947
Krzysztof Piotr Oledzki052d4fd2009-10-04 14:52:57 +02001948 s->fe->counters.failed_req++;
Krzysztof Piotr Oledzkiaeebf9b2009-10-04 15:43:17 +02001949 if (s->listener->counters)
1950 s->listener->counters->failed_req++;
1951
Willy Tarreau84455332009-03-15 22:34:05 +01001952 s->flags |= SN_FINST_R;
1953 }
1954 else if (s->si[1].state == SI_ST_QUE)
1955 s->flags |= SN_FINST_Q;
1956 else if (s->si[1].state < SI_ST_EST)
1957 s->flags |= SN_FINST_C;
Willy Tarreau033b2db2010-03-04 17:54:21 +01001958 else if (s->si[1].state == SI_ST_EST || s->si[1].prev_state == SI_ST_EST)
Willy Tarreau84455332009-03-15 22:34:05 +01001959 s->flags |= SN_FINST_D;
1960 else
1961 s->flags |= SN_FINST_L;
1962 }
1963}
1964
1965/* Handle server-side errors for default protocols. It is called whenever a a
1966 * connection setup is aborted or a request is aborted in queue. It sets the
1967 * session termination flags so that the caller does not have to worry about
1968 * them. It's installed as ->srv_error for the server-side stream_interface.
1969 */
1970void default_srv_error(struct session *s, struct stream_interface *si)
1971{
1972 int err_type = si->err_type;
1973 int err = 0, fin = 0;
1974
1975 if (err_type & SI_ET_QUEUE_ABRT) {
1976 err = SN_ERR_CLICL;
1977 fin = SN_FINST_Q;
1978 }
1979 else if (err_type & SI_ET_CONN_ABRT) {
1980 err = SN_ERR_CLICL;
1981 fin = SN_FINST_C;
1982 }
1983 else if (err_type & SI_ET_QUEUE_TO) {
1984 err = SN_ERR_SRVTO;
1985 fin = SN_FINST_Q;
1986 }
1987 else if (err_type & SI_ET_QUEUE_ERR) {
1988 err = SN_ERR_SRVCL;
1989 fin = SN_FINST_Q;
1990 }
1991 else if (err_type & SI_ET_CONN_TO) {
1992 err = SN_ERR_SRVTO;
1993 fin = SN_FINST_C;
1994 }
1995 else if (err_type & SI_ET_CONN_ERR) {
1996 err = SN_ERR_SRVCL;
1997 fin = SN_FINST_C;
1998 }
1999 else /* SI_ET_CONN_OTHER and others */ {
2000 err = SN_ERR_INTERNAL;
2001 fin = SN_FINST_C;
2002 }
2003
2004 if (!(s->flags & SN_ERR_MASK))
2005 s->flags |= err;
2006 if (!(s->flags & SN_FINST_MASK))
2007 s->flags |= fin;
2008}
Willy Tarreau7c669d72008-06-20 15:04:11 +02002009
Willy Tarreaubaaee002006-06-26 02:48:02 +02002010/*
2011 * Local variables:
2012 * c-indent-level: 8
2013 * c-basic-offset: 8
2014 * End:
2015 */