blob: 758b42967c5e51c581cfaca7f6d4c8c686166eb7 [file] [log] [blame]
Willy Tarreaubaaee002006-06-26 02:48:02 +02001/*
2 * Backend variables and functions.
3 *
Willy Tarreaud825eef2007-05-12 22:35:00 +02004 * Copyright 2000-2007 Willy Tarreau <w@1wt.eu>
Willy Tarreaubaaee002006-06-26 02:48:02 +02005 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
13#include <errno.h>
14#include <fcntl.h>
15#include <stdio.h>
16#include <stdlib.h>
17#include <syslog.h>
Willy Tarreauf19cf372006-11-14 15:40:51 +010018#include <string.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020019
Willy Tarreau2dd0d472006-06-29 17:53:05 +020020#include <common/compat.h>
Willy Tarreaue3ba5f02006-06-29 18:54:54 +020021#include <common/config.h>
Willy Tarreau2dd0d472006-06-29 17:53:05 +020022#include <common/time.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020023
24#include <types/buffers.h>
25#include <types/global.h>
26#include <types/polling.h>
27#include <types/proxy.h>
28#include <types/server.h>
29#include <types/session.h>
30
31#include <proto/backend.h>
Willy Tarreau14c8aac2007-05-08 19:46:30 +020032#include <proto/client.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020033#include <proto/fd.h>
Willy Tarreau80587432006-12-24 17:47:20 +010034#include <proto/httperr.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020035#include <proto/log.h>
36#include <proto/proto_http.h>
37#include <proto/queue.h>
38#include <proto/stream_sock.h>
39#include <proto/task.h>
40
Willy Tarreau77074d52006-11-12 23:57:19 +010041#ifdef CONFIG_HAP_CTTPROXY
42#include <import/ip_tproxy.h>
43#endif
Willy Tarreaubaaee002006-06-26 02:48:02 +020044
Willy Tarreau6d1a9882007-01-07 02:03:04 +010045#ifdef CONFIG_HAP_TCPSPLICE
46#include <libtcpsplice.h>
47#endif
48
Willy Tarreaubaaee002006-06-26 02:48:02 +020049/*
50 * This function recounts the number of usable active and backup servers for
51 * proxy <p>. These numbers are returned into the p->srv_act and p->srv_bck.
52 * This function also recomputes the total active and backup weights.
53 */
54void recount_servers(struct proxy *px)
55{
56 struct server *srv;
57
58 px->srv_act = 0; px->srv_bck = px->tot_wact = px->tot_wbck = 0;
59 for (srv = px->srv; srv != NULL; srv = srv->next) {
60 if (srv->state & SRV_RUNNING) {
61 if (srv->state & SRV_BACKUP) {
62 px->srv_bck++;
Willy Tarreau417fae02007-03-25 21:16:40 +020063 px->tot_wbck += srv->eweight;
Willy Tarreaubaaee002006-06-26 02:48:02 +020064 } else {
65 px->srv_act++;
Willy Tarreau417fae02007-03-25 21:16:40 +020066 px->tot_wact += srv->eweight;
Willy Tarreaubaaee002006-06-26 02:48:02 +020067 }
68 }
69 }
70}
71
72/* This function recomputes the server map for proxy px. It
73 * relies on px->tot_wact and px->tot_wbck, so it must be
74 * called after recount_servers(). It also expects px->srv_map
75 * to be initialized to the largest value needed.
76 */
77void recalc_server_map(struct proxy *px)
78{
79 int o, tot, flag;
80 struct server *cur, *best;
81
82 if (px->srv_act) {
83 flag = SRV_RUNNING;
84 tot = px->tot_wact;
85 } else if (px->srv_bck) {
86 flag = SRV_RUNNING | SRV_BACKUP;
87 if (px->options & PR_O_USE_ALL_BK)
88 tot = px->tot_wbck;
89 else
90 tot = 1; /* the first server is enough */
91 } else {
92 px->srv_map_sz = 0;
Willy Tarreau5af3a692007-07-24 23:32:33 +020093 px->map_state &= ~PR_MAP_RECALC;
Willy Tarreaubaaee002006-06-26 02:48:02 +020094 return;
95 }
96
97 /* this algorithm gives priority to the first server, which means that
98 * it will respect the declaration order for equivalent weights, and
99 * that whatever the weights, the first server called will always be
100 * the first declard. This is an important asumption for the backup
101 * case, where we want the first server only.
102 */
103 for (cur = px->srv; cur; cur = cur->next)
104 cur->wscore = 0;
105
106 for (o = 0; o < tot; o++) {
107 int max = 0;
108 best = NULL;
109 for (cur = px->srv; cur; cur = cur->next) {
110 if ((cur->state & (SRV_RUNNING | SRV_BACKUP)) == flag) {
111 int v;
112
113 /* If we are forced to return only one server, we don't want to
114 * go further, because we would return the wrong one due to
115 * divide overflow.
116 */
117 if (tot == 1) {
118 best = cur;
119 break;
120 }
121
Willy Tarreau417fae02007-03-25 21:16:40 +0200122 cur->wscore += cur->eweight;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200123 v = (cur->wscore + tot) / tot; /* result between 0 and 3 */
124 if (best == NULL || v > max) {
125 max = v;
126 best = cur;
127 }
128 }
129 }
130 px->srv_map[o] = best;
131 best->wscore -= tot;
132 }
133 px->srv_map_sz = tot;
Willy Tarreau5af3a692007-07-24 23:32:33 +0200134 px->map_state &= ~PR_MAP_RECALC;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200135}
136
137
138/*
139 * This function marks the session as 'assigned' in direct or dispatch modes,
140 * or tries to assign one in balance mode, according to the algorithm. It does
141 * nothing if the session had already been assigned a server.
142 *
143 * It may return :
144 * SRV_STATUS_OK if everything is OK. s->srv will be valid.
145 * SRV_STATUS_NOSRV if no server is available. s->srv = NULL.
146 * SRV_STATUS_FULL if all servers are saturated. s->srv = NULL.
147 * SRV_STATUS_INTERNAL for other unrecoverable errors.
148 *
149 * Upon successful return, the session flag SN_ASSIGNED to indicate that it does
150 * not need to be called anymore. This usually means that s->srv can be trusted
151 * in balance and direct modes. This flag is not cleared, so it's to the caller
152 * to clear it if required (eg: redispatch).
153 *
154 */
155
156int assign_server(struct session *s)
157{
158#ifdef DEBUG_FULL
159 fprintf(stderr,"assign_server : s=%p\n",s);
160#endif
161
162 if (s->pend_pos)
163 return SRV_STATUS_INTERNAL;
164
165 if (!(s->flags & SN_ASSIGNED)) {
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200166 if (s->be->options & PR_O_BALANCE) {
Willy Tarreau1a20a5d2007-11-01 21:08:19 +0100167 int len;
168
Willy Tarreau5d65bbb2007-01-21 12:47:26 +0100169 if (s->flags & SN_DIRECT) {
170 s->flags |= SN_ASSIGNED;
171 return SRV_STATUS_OK;
172 }
Willy Tarreau1a20a5d2007-11-01 21:08:19 +0100173
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200174 if (!s->be->srv_act && !s->be->srv_bck)
Willy Tarreaubaaee002006-06-26 02:48:02 +0200175 return SRV_STATUS_NOSRV;
176
Willy Tarreau1a20a5d2007-11-01 21:08:19 +0100177 switch (s->be->options & PR_O_BALANCE) {
178 case PR_O_BALANCE_RR:
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200179 s->srv = get_server_rr_with_conns(s->be);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200180 if (!s->srv)
181 return SRV_STATUS_FULL;
Willy Tarreau1a20a5d2007-11-01 21:08:19 +0100182 break;
183 case PR_O_BALANCE_SH:
Willy Tarreaubaaee002006-06-26 02:48:02 +0200184 if (s->cli_addr.ss_family == AF_INET)
185 len = 4;
186 else if (s->cli_addr.ss_family == AF_INET6)
187 len = 16;
188 else /* unknown IP family */
189 return SRV_STATUS_INTERNAL;
190
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200191 s->srv = get_server_sh(s->be,
Willy Tarreaubaaee002006-06-26 02:48:02 +0200192 (void *)&((struct sockaddr_in *)&s->cli_addr)->sin_addr,
193 len);
Willy Tarreau1a20a5d2007-11-01 21:08:19 +0100194 break;
195 case PR_O_BALANCE_UH:
Willy Tarreau2fcb5002007-05-08 13:35:26 +0200196 /* URI hashing */
197 s->srv = get_server_uh(s->be,
198 s->txn.req.sol + s->txn.req.sl.rq.u,
199 s->txn.req.sl.rq.u_l);
Willy Tarreau1a20a5d2007-11-01 21:08:19 +0100200 break;
201 default:
202 /* unknown balancing algorithm */
Willy Tarreaubaaee002006-06-26 02:48:02 +0200203 return SRV_STATUS_INTERNAL;
Willy Tarreau1a20a5d2007-11-01 21:08:19 +0100204 }
Willy Tarreaubaaee002006-06-26 02:48:02 +0200205 }
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200206 else if (!*(int *)&s->be->dispatch_addr.sin_addr &&
Willy Tarreau5d65bbb2007-01-21 12:47:26 +0100207 !(s->fe->options & PR_O_TRANSP)) {
Willy Tarreau1a1158b2007-01-20 11:07:46 +0100208 return SRV_STATUS_NOSRV;
Willy Tarreau5d65bbb2007-01-21 12:47:26 +0100209 }
210 s->flags |= SN_ASSIGNED;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200211 }
212 return SRV_STATUS_OK;
213}
214
215
216/*
217 * This function assigns a server address to a session, and sets SN_ADDR_SET.
218 * The address is taken from the currently assigned server, or from the
219 * dispatch or transparent address.
220 *
221 * It may return :
222 * SRV_STATUS_OK if everything is OK.
223 * SRV_STATUS_INTERNAL for other unrecoverable errors.
224 *
225 * Upon successful return, the session flag SN_ADDR_SET is set. This flag is
226 * not cleared, so it's to the caller to clear it if required.
227 *
228 */
229int assign_server_address(struct session *s)
230{
231#ifdef DEBUG_FULL
232 fprintf(stderr,"assign_server_address : s=%p\n",s);
233#endif
234
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200235 if ((s->flags & SN_DIRECT) || (s->be->options & PR_O_BALANCE)) {
Willy Tarreaubaaee002006-06-26 02:48:02 +0200236 /* A server is necessarily known for this session */
237 if (!(s->flags & SN_ASSIGNED))
238 return SRV_STATUS_INTERNAL;
239
240 s->srv_addr = s->srv->addr;
241
242 /* if this server remaps proxied ports, we'll use
243 * the port the client connected to with an offset. */
244 if (s->srv->state & SRV_MAPPORTS) {
Willy Tarreau14c8aac2007-05-08 19:46:30 +0200245 if (!(s->fe->options & PR_O_TRANSP) && !(s->flags & SN_FRT_ADDR_SET))
246 get_frt_addr(s);
247 if (s->frt_addr.ss_family == AF_INET) {
248 s->srv_addr.sin_port = htons(ntohs(s->srv_addr.sin_port) +
249 ntohs(((struct sockaddr_in *)&s->frt_addr)->sin_port));
250 } else {
251 s->srv_addr.sin_port = htons(ntohs(s->srv_addr.sin_port) +
252 ntohs(((struct sockaddr_in6 *)&s->frt_addr)->sin6_port));
253 }
Willy Tarreaubaaee002006-06-26 02:48:02 +0200254 }
255 }
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200256 else if (*(int *)&s->be->dispatch_addr.sin_addr) {
Willy Tarreaubaaee002006-06-26 02:48:02 +0200257 /* connect to the defined dispatch addr */
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200258 s->srv_addr = s->be->dispatch_addr;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200259 }
Willy Tarreau73de9892006-11-30 11:40:23 +0100260 else if (s->fe->options & PR_O_TRANSP) {
Willy Tarreaubaaee002006-06-26 02:48:02 +0200261 /* in transparent mode, use the original dest addr if no dispatch specified */
262 socklen_t salen = sizeof(s->srv_addr);
263
264 if (get_original_dst(s->cli_fd, &s->srv_addr, &salen) == -1) {
265 qfprintf(stderr, "Cannot get original server address.\n");
266 return SRV_STATUS_INTERNAL;
267 }
268 }
Willy Tarreau1a1158b2007-01-20 11:07:46 +0100269 else {
270 /* no server and no LB algorithm ! */
271 return SRV_STATUS_INTERNAL;
272 }
Willy Tarreaubaaee002006-06-26 02:48:02 +0200273
274 s->flags |= SN_ADDR_SET;
275 return SRV_STATUS_OK;
276}
277
278
279/* This function assigns a server to session <s> if required, and can add the
280 * connection to either the assigned server's queue or to the proxy's queue.
281 *
282 * Returns :
283 *
284 * SRV_STATUS_OK if everything is OK.
285 * SRV_STATUS_NOSRV if no server is available. s->srv = NULL.
286 * SRV_STATUS_QUEUED if the connection has been queued.
287 * SRV_STATUS_FULL if the server(s) is/are saturated and the
288 * connection could not be queued.
289 * SRV_STATUS_INTERNAL for other unrecoverable errors.
290 *
291 */
292int assign_server_and_queue(struct session *s)
293{
294 struct pendconn *p;
295 int err;
296
297 if (s->pend_pos)
298 return SRV_STATUS_INTERNAL;
299
300 if (s->flags & SN_ASSIGNED) {
Elijah Epifanovacafc5f2007-10-25 20:15:38 +0200301 if (s->srv && s->srv->maxqueue > 0 && s->srv->nbpend >= s->srv->maxqueue) {
302 s->flags &= ~(SN_DIRECT | SN_ASSIGNED | SN_ADDR_SET);
303 s->srv = NULL;
304 http_flush_cookie_flags(&s->txn);
305 } else {
306 /* a server does not need to be assigned, perhaps because we're in
307 * direct mode, or in dispatch or transparent modes where the server
308 * is not needed.
309 */
310 if (s->srv &&
311 s->srv->maxconn && s->srv->cur_sess >= srv_dynamic_maxconn(s->srv)) {
312 p = pendconn_add(s);
313 if (p)
314 return SRV_STATUS_QUEUED;
315 else
316 return SRV_STATUS_FULL;
317 }
318 return SRV_STATUS_OK;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200319 }
Willy Tarreaubaaee002006-06-26 02:48:02 +0200320 }
321
322 /* a server needs to be assigned */
323 err = assign_server(s);
324 switch (err) {
325 case SRV_STATUS_OK:
326 /* in balance mode, we might have servers with connection limits */
327 if (s->srv &&
328 s->srv->maxconn && s->srv->cur_sess >= srv_dynamic_maxconn(s->srv)) {
329 p = pendconn_add(s);
330 if (p)
331 return SRV_STATUS_QUEUED;
332 else
333 return SRV_STATUS_FULL;
334 }
335 return SRV_STATUS_OK;
336
337 case SRV_STATUS_FULL:
338 /* queue this session into the proxy's queue */
339 p = pendconn_add(s);
340 if (p)
341 return SRV_STATUS_QUEUED;
342 else
343 return SRV_STATUS_FULL;
344
345 case SRV_STATUS_NOSRV:
346 case SRV_STATUS_INTERNAL:
347 return err;
348 default:
349 return SRV_STATUS_INTERNAL;
350 }
351}
352
353
354/*
355 * This function initiates a connection to the server assigned to this session
356 * (s->srv, s->srv_addr). It will assign a server if none is assigned yet.
357 * It can return one of :
358 * - SN_ERR_NONE if everything's OK
359 * - SN_ERR_SRVTO if there are no more servers
360 * - SN_ERR_SRVCL if the connection was refused by the server
361 * - SN_ERR_PRXCOND if the connection has been limited by the proxy (maxconn)
362 * - SN_ERR_RESOURCE if a system resource is lacking (eg: fd limits, ports, ...)
363 * - SN_ERR_INTERNAL for any other purely internal errors
364 * Additionnally, in the case of SN_ERR_RESOURCE, an emergency log will be emitted.
365 */
366int connect_server(struct session *s)
367{
368 int fd, err;
369
370 if (!(s->flags & SN_ADDR_SET)) {
371 err = assign_server_address(s);
372 if (err != SRV_STATUS_OK)
373 return SN_ERR_INTERNAL;
374 }
375
376 if ((fd = s->srv_fd = socket(AF_INET, SOCK_STREAM, IPPROTO_TCP)) == -1) {
377 qfprintf(stderr, "Cannot get a server socket.\n");
378
379 if (errno == ENFILE)
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200380 send_log(s->be, LOG_EMERG,
Willy Tarreaubaaee002006-06-26 02:48:02 +0200381 "Proxy %s reached system FD limit at %d. Please check system tunables.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200382 s->be->id, maxfd);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200383 else if (errno == EMFILE)
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200384 send_log(s->be, LOG_EMERG,
Willy Tarreaubaaee002006-06-26 02:48:02 +0200385 "Proxy %s reached process FD limit at %d. Please check 'ulimit-n' and restart.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200386 s->be->id, maxfd);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200387 else if (errno == ENOBUFS || errno == ENOMEM)
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200388 send_log(s->be, LOG_EMERG,
Willy Tarreaubaaee002006-06-26 02:48:02 +0200389 "Proxy %s reached system memory limit at %d sockets. Please check system tunables.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200390 s->be->id, maxfd);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200391 /* this is a resource error */
392 return SN_ERR_RESOURCE;
393 }
394
395 if (fd >= global.maxsock) {
396 /* do not log anything there, it's a normal condition when this option
397 * is used to serialize connections to a server !
398 */
399 Alert("socket(): not enough free sockets. Raise -n argument. Giving up.\n");
400 close(fd);
401 return SN_ERR_PRXCOND; /* it is a configuration limit */
402 }
403
Willy Tarreau6d1a9882007-01-07 02:03:04 +0100404#ifdef CONFIG_HAP_TCPSPLICE
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200405 if ((s->fe->options & s->be->options) & PR_O_TCPSPLICE) {
Willy Tarreau6d1a9882007-01-07 02:03:04 +0100406 /* TCP splicing supported by both FE and BE */
407 tcp_splice_initfd(s->cli_fd, fd);
408 }
409#endif
410
Willy Tarreaubaaee002006-06-26 02:48:02 +0200411 if ((fcntl(fd, F_SETFL, O_NONBLOCK)==-1) ||
412 (setsockopt(fd, IPPROTO_TCP, TCP_NODELAY, (char *) &one, sizeof(one)) == -1)) {
413 qfprintf(stderr,"Cannot set client socket to non blocking mode.\n");
414 close(fd);
415 return SN_ERR_INTERNAL;
416 }
417
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200418 if (s->be->options & PR_O_TCP_SRV_KA)
Willy Tarreaubaaee002006-06-26 02:48:02 +0200419 setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, (char *) &one, sizeof(one));
420
Alexandre Cassen87ea5482007-10-11 20:48:58 +0200421 if (s->be->options & PR_O_TCP_NOLING)
422 setsockopt(fd, SOL_SOCKET, SO_LINGER, (struct linger *) &nolinger, sizeof(struct linger));
423
Willy Tarreaubaaee002006-06-26 02:48:02 +0200424 /* allow specific binding :
425 * - server-specific at first
426 * - proxy-specific next
427 */
428 if (s->srv != NULL && s->srv->state & SRV_BIND_SRC) {
429 setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, (char *) &one, sizeof(one));
430 if (bind(fd, (struct sockaddr *)&s->srv->source_addr, sizeof(s->srv->source_addr)) == -1) {
431 Alert("Cannot bind to source address before connect() for server %s/%s. Aborting.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200432 s->be->id, s->srv->id);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200433 close(fd);
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200434 send_log(s->be, LOG_EMERG,
Willy Tarreaubaaee002006-06-26 02:48:02 +0200435 "Cannot bind to source address before connect() for server %s/%s.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200436 s->be->id, s->srv->id);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200437 return SN_ERR_RESOURCE;
438 }
Willy Tarreau77074d52006-11-12 23:57:19 +0100439#ifdef CONFIG_HAP_CTTPROXY
440 if (s->srv->state & SRV_TPROXY_MASK) {
441 struct in_tproxy itp1, itp2;
442 memset(&itp1, 0, sizeof(itp1));
443
444 itp1.op = TPROXY_ASSIGN;
445 switch (s->srv->state & SRV_TPROXY_MASK) {
446 case SRV_TPROXY_ADDR:
447 itp1.v.addr.faddr = s->srv->tproxy_addr.sin_addr;
448 itp1.v.addr.fport = s->srv->tproxy_addr.sin_port;
449 break;
450 case SRV_TPROXY_CLI:
451 itp1.v.addr.fport = ((struct sockaddr_in *)&s->cli_addr)->sin_port;
452 /* fall through */
453 case SRV_TPROXY_CIP:
454 /* FIXME: what can we do if the client connects in IPv6 ? */
455 itp1.v.addr.faddr = ((struct sockaddr_in *)&s->cli_addr)->sin_addr;
456 break;
457 }
458
459 /* set connect flag on socket */
460 itp2.op = TPROXY_FLAGS;
461 itp2.v.flags = ITP_CONNECT | ITP_ONCE;
462
463 if (setsockopt(fd, SOL_IP, IP_TPROXY, &itp1, sizeof(itp1)) == -1 ||
464 setsockopt(fd, SOL_IP, IP_TPROXY, &itp2, sizeof(itp2)) == -1) {
465 Alert("Cannot bind to tproxy source address before connect() for server %s/%s. Aborting.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200466 s->be->id, s->srv->id);
Willy Tarreau77074d52006-11-12 23:57:19 +0100467 close(fd);
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200468 send_log(s->be, LOG_EMERG,
Willy Tarreau77074d52006-11-12 23:57:19 +0100469 "Cannot bind to tproxy source address before connect() for server %s/%s.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200470 s->be->id, s->srv->id);
Willy Tarreau77074d52006-11-12 23:57:19 +0100471 return SN_ERR_RESOURCE;
472 }
473 }
474#endif
Willy Tarreaubaaee002006-06-26 02:48:02 +0200475 }
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200476 else if (s->be->options & PR_O_BIND_SRC) {
Willy Tarreaubaaee002006-06-26 02:48:02 +0200477 setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, (char *) &one, sizeof(one));
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200478 if (bind(fd, (struct sockaddr *)&s->be->source_addr, sizeof(s->be->source_addr)) == -1) {
479 Alert("Cannot bind to source address before connect() for proxy %s. Aborting.\n", s->be->id);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200480 close(fd);
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200481 send_log(s->be, LOG_EMERG,
Willy Tarreaubaaee002006-06-26 02:48:02 +0200482 "Cannot bind to source address before connect() for server %s/%s.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200483 s->be->id, s->srv->id);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200484 return SN_ERR_RESOURCE;
485 }
Willy Tarreau77074d52006-11-12 23:57:19 +0100486#ifdef CONFIG_HAP_CTTPROXY
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200487 if (s->be->options & PR_O_TPXY_MASK) {
Willy Tarreau77074d52006-11-12 23:57:19 +0100488 struct in_tproxy itp1, itp2;
489 memset(&itp1, 0, sizeof(itp1));
490
491 itp1.op = TPROXY_ASSIGN;
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200492 switch (s->be->options & PR_O_TPXY_MASK) {
Willy Tarreau77074d52006-11-12 23:57:19 +0100493 case PR_O_TPXY_ADDR:
494 itp1.v.addr.faddr = s->srv->tproxy_addr.sin_addr;
495 itp1.v.addr.fport = s->srv->tproxy_addr.sin_port;
496 break;
497 case PR_O_TPXY_CLI:
498 itp1.v.addr.fport = ((struct sockaddr_in *)&s->cli_addr)->sin_port;
499 /* fall through */
500 case PR_O_TPXY_CIP:
501 /* FIXME: what can we do if the client connects in IPv6 ? */
502 itp1.v.addr.faddr = ((struct sockaddr_in *)&s->cli_addr)->sin_addr;
503 break;
504 }
505
506 /* set connect flag on socket */
507 itp2.op = TPROXY_FLAGS;
508 itp2.v.flags = ITP_CONNECT | ITP_ONCE;
509
510 if (setsockopt(fd, SOL_IP, IP_TPROXY, &itp1, sizeof(itp1)) == -1 ||
511 setsockopt(fd, SOL_IP, IP_TPROXY, &itp2, sizeof(itp2)) == -1) {
512 Alert("Cannot bind to tproxy source address before connect() for proxy %s. Aborting.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200513 s->be->id);
Willy Tarreau77074d52006-11-12 23:57:19 +0100514 close(fd);
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200515 send_log(s->be, LOG_EMERG,
Willy Tarreau77074d52006-11-12 23:57:19 +0100516 "Cannot bind to tproxy source address before connect() for server %s/%s.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200517 s->be->id, s->srv->id);
Willy Tarreau77074d52006-11-12 23:57:19 +0100518 return SN_ERR_RESOURCE;
519 }
520 }
521#endif
Willy Tarreaubaaee002006-06-26 02:48:02 +0200522 }
523
524 if ((connect(fd, (struct sockaddr *)&s->srv_addr, sizeof(s->srv_addr)) == -1) &&
525 (errno != EINPROGRESS) && (errno != EALREADY) && (errno != EISCONN)) {
526
527 if (errno == EAGAIN || errno == EADDRINUSE) {
528 char *msg;
529 if (errno == EAGAIN) /* no free ports left, try again later */
530 msg = "no free ports";
531 else
532 msg = "local address already in use";
533
534 qfprintf(stderr,"Cannot connect: %s.\n",msg);
535 close(fd);
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200536 send_log(s->be, LOG_EMERG,
Willy Tarreaubaaee002006-06-26 02:48:02 +0200537 "Connect() failed for server %s/%s: %s.\n",
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200538 s->be->id, s->srv->id, msg);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200539 return SN_ERR_RESOURCE;
540 } else if (errno == ETIMEDOUT) {
541 //qfprintf(stderr,"Connect(): ETIMEDOUT");
542 close(fd);
543 return SN_ERR_SRVTO;
544 } else {
545 // (errno == ECONNREFUSED || errno == ENETUNREACH || errno == EACCES || errno == EPERM)
546 //qfprintf(stderr,"Connect(): %d", errno);
547 close(fd);
548 return SN_ERR_SRVCL;
549 }
550 }
551
552 fdtab[fd].owner = s->task;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200553 fdtab[fd].state = FD_STCONN; /* connection in progress */
Willy Tarreaud7971282006-07-29 18:36:34 +0200554 fdtab[fd].cb[DIR_RD].f = &stream_sock_read;
Willy Tarreau54469402006-07-29 16:59:06 +0200555 fdtab[fd].cb[DIR_RD].b = s->rep;
Willy Tarreauf8306d52006-07-29 19:01:31 +0200556 fdtab[fd].cb[DIR_WR].f = &stream_sock_write;
Willy Tarreau54469402006-07-29 16:59:06 +0200557 fdtab[fd].cb[DIR_WR].b = s->req;
Willy Tarreaue94ebd02007-10-09 17:14:37 +0200558
559 fdtab[fd].peeraddr = (struct sockaddr *)&s->srv_addr;
560 fdtab[fd].peerlen = sizeof(s->srv_addr);
561
Willy Tarreauf161a342007-04-08 16:59:42 +0200562 EV_FD_SET(fd, DIR_WR); /* for connect status */
Willy Tarreaubaaee002006-06-26 02:48:02 +0200563
564 fd_insert(fd);
565 if (s->srv) {
566 s->srv->cur_sess++;
567 if (s->srv->cur_sess > s->srv->cur_sess_max)
568 s->srv->cur_sess_max = s->srv->cur_sess;
569 }
570
Willy Tarreaua8b55e32007-05-13 16:08:19 +0200571 if (!tv_add_ifset(&s->req->cex, &now, &s->be->contimeout))
Willy Tarreaud7971282006-07-29 18:36:34 +0200572 tv_eternity(&s->req->cex);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200573 return SN_ERR_NONE; /* connection is OK */
574}
575
576
577/*
578 * This function checks the retry count during the connect() job.
579 * It updates the session's srv_state and retries, so that the caller knows
580 * what it has to do. It uses the last connection error to set the log when
581 * it expires. It returns 1 when it has expired, and 0 otherwise.
582 */
583int srv_count_retry_down(struct session *t, int conn_err)
584{
585 /* we are in front of a retryable error */
586 t->conn_retries--;
Krzysztof Oledzki1cf36ba2007-10-18 19:12:30 +0200587 if (t->srv)
588 t->srv->retries++;
589 t->be->retries++;
590
Willy Tarreaubaaee002006-06-26 02:48:02 +0200591 if (t->conn_retries < 0) {
592 /* if not retryable anymore, let's abort */
Willy Tarreaud7971282006-07-29 18:36:34 +0200593 tv_eternity(&t->req->cex);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200594 srv_close_with_err(t, conn_err, SN_FINST_C,
Willy Tarreau80587432006-12-24 17:47:20 +0100595 503, error_message(t, HTTP_ERR_503));
Willy Tarreaubaaee002006-06-26 02:48:02 +0200596 if (t->srv)
597 t->srv->failed_conns++;
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200598 t->be->failed_conns++;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200599
600 /* We used to have a free connection slot. Since we'll never use it,
601 * we have to inform the server that it may be used by another session.
602 */
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200603 if (may_dequeue_tasks(t->srv, t->be))
Willy Tarreau96bcfd72007-04-29 10:41:56 +0200604 task_wakeup(t->srv->queue_mgt);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200605 return 1;
606 }
607 return 0;
608}
609
610
611/*
612 * This function performs the retryable part of the connect() job.
613 * It updates the session's srv_state and retries, so that the caller knows
614 * what it has to do. It returns 1 when it breaks out of the loop, or 0 if
615 * it needs to redispatch.
616 */
617int srv_retryable_connect(struct session *t)
618{
619 int conn_err;
620
621 /* This loop ensures that we stop before the last retry in case of a
622 * redispatchable server.
623 */
624 do {
625 /* initiate a connection to the server */
626 conn_err = connect_server(t);
627 switch (conn_err) {
628
629 case SN_ERR_NONE:
630 //fprintf(stderr,"0: c=%d, s=%d\n", c, s);
631 t->srv_state = SV_STCONN;
632 return 1;
633
634 case SN_ERR_INTERNAL:
Willy Tarreaud7971282006-07-29 18:36:34 +0200635 tv_eternity(&t->req->cex);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200636 srv_close_with_err(t, SN_ERR_INTERNAL, SN_FINST_C,
Willy Tarreau80587432006-12-24 17:47:20 +0100637 500, error_message(t, HTTP_ERR_500));
Willy Tarreaubaaee002006-06-26 02:48:02 +0200638 if (t->srv)
639 t->srv->failed_conns++;
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200640 t->be->failed_conns++;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200641 /* release other sessions waiting for this server */
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200642 if (may_dequeue_tasks(t->srv, t->be))
Willy Tarreau96bcfd72007-04-29 10:41:56 +0200643 task_wakeup(t->srv->queue_mgt);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200644 return 1;
645 }
646 /* ensure that we have enough retries left */
647 if (srv_count_retry_down(t, conn_err)) {
Willy Tarreaubaaee002006-06-26 02:48:02 +0200648 return 1;
649 }
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200650 } while (t->srv == NULL || t->conn_retries > 0 || !(t->be->options & PR_O_REDISP));
Willy Tarreaubaaee002006-06-26 02:48:02 +0200651
652 /* We're on our last chance, and the REDISP option was specified.
653 * We will ignore cookie and force to balance or use the dispatcher.
654 */
655 /* let's try to offer this slot to anybody */
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200656 if (may_dequeue_tasks(t->srv, t->be))
Willy Tarreau96bcfd72007-04-29 10:41:56 +0200657 task_wakeup(t->srv->queue_mgt);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200658
659 if (t->srv)
660 t->srv->failed_conns++;
Krzysztof Oledzki1cf36ba2007-10-18 19:12:30 +0200661 t->be->redispatches++;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200662
663 t->flags &= ~(SN_DIRECT | SN_ASSIGNED | SN_ADDR_SET);
664 t->srv = NULL; /* it's left to the dispatcher to choose a server */
Willy Tarreau3d300592007-03-18 18:34:41 +0100665 http_flush_cookie_flags(&t->txn);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200666 return 0;
667}
668
669
670/* This function performs the "redispatch" part of a connection attempt. It
671 * will assign a server if required, queue the connection if required, and
672 * handle errors that might arise at this level. It can change the server
673 * state. It will return 1 if it encounters an error, switches the server
674 * state, or has to queue a connection. Otherwise, it will return 0 indicating
675 * that the connection is ready to use.
676 */
677
678int srv_redispatch_connect(struct session *t)
679{
680 int conn_err;
681
682 /* We know that we don't have any connection pending, so we will
683 * try to get a new one, and wait in this state if it's queued
684 */
685 conn_err = assign_server_and_queue(t);
686 switch (conn_err) {
687 case SRV_STATUS_OK:
688 break;
689
690 case SRV_STATUS_NOSRV:
691 /* note: it is guaranteed that t->srv == NULL here */
Willy Tarreaud7971282006-07-29 18:36:34 +0200692 tv_eternity(&t->req->cex);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200693 srv_close_with_err(t, SN_ERR_SRVTO, SN_FINST_C,
Willy Tarreau80587432006-12-24 17:47:20 +0100694 503, error_message(t, HTTP_ERR_503));
Willy Tarreaubaaee002006-06-26 02:48:02 +0200695 if (t->srv)
696 t->srv->failed_conns++;
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200697 t->be->failed_conns++;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200698
699 return 1;
700
701 case SRV_STATUS_QUEUED:
702 /* FIXME-20060503 : we should use the queue timeout instead */
Willy Tarreaua8b55e32007-05-13 16:08:19 +0200703 if (!tv_add_ifset(&t->req->cex, &now, &t->be->contimeout))
Willy Tarreaud7971282006-07-29 18:36:34 +0200704 tv_eternity(&t->req->cex);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200705 t->srv_state = SV_STIDLE;
706 /* do nothing else and do not wake any other session up */
707 return 1;
708
709 case SRV_STATUS_FULL:
710 case SRV_STATUS_INTERNAL:
711 default:
Willy Tarreaud7971282006-07-29 18:36:34 +0200712 tv_eternity(&t->req->cex);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200713 srv_close_with_err(t, SN_ERR_INTERNAL, SN_FINST_C,
Willy Tarreau80587432006-12-24 17:47:20 +0100714 500, error_message(t, HTTP_ERR_500));
Willy Tarreaubaaee002006-06-26 02:48:02 +0200715 if (t->srv)
716 t->srv->failed_conns++;
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200717 t->be->failed_conns++;
Willy Tarreaubaaee002006-06-26 02:48:02 +0200718
719 /* release other sessions waiting for this server */
Willy Tarreaue2e27a52007-04-01 00:01:37 +0200720 if (may_dequeue_tasks(t->srv, t->be))
Willy Tarreau96bcfd72007-04-29 10:41:56 +0200721 task_wakeup(t->srv->queue_mgt);
Willy Tarreaubaaee002006-06-26 02:48:02 +0200722 return 1;
723 }
724 /* if we get here, it's because we got SRV_STATUS_OK, which also
725 * means that the connection has not been queued.
726 */
727 return 0;
728}
729
Krzysztof Oledzki85130942007-10-22 16:21:10 +0200730int be_downtime(struct proxy *px) {
731
732 if ((px->srv_act || px->srv_bck) && px->last_change < now.tv_sec) // ignore negative time
733 return px->down_time;
734
735 return now.tv_sec - px->last_change + px->down_time;
736}
Willy Tarreaubaaee002006-06-26 02:48:02 +0200737
738/*
739 * Local variables:
740 * c-indent-level: 8
741 * c-basic-offset: 8
742 * End:
743 */