blob: c94702a04a7e94a882fe3fbcf4388da5164c6ce5 [file] [log] [blame]
Willy Tarreaudd815982007-10-16 12:25:14 +02001/*
Willy Tarreaud1d54542012-09-12 22:58:11 +02002 * Listener management functions.
Willy Tarreaudd815982007-10-16 12:25:14 +02003 *
Willy Tarreau0ccb7442013-01-07 22:54:17 +01004 * Copyright 2000-2013 Willy Tarreau <w@1wt.eu>
Willy Tarreaudd815982007-10-16 12:25:14 +02005 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
Willy Tarreau6ae1ba62014-05-07 19:01:58 +020013#include <ctype.h>
Willy Tarreaubbebbbf2012-05-07 21:22:09 +020014#include <errno.h>
Willy Tarreaudd815982007-10-16 12:25:14 +020015#include <stdio.h>
16#include <string.h>
Willy Tarreau95ccdde2014-02-01 09:28:36 +010017#include <unistd.h>
Willy Tarreaudd815982007-10-16 12:25:14 +020018
Willy Tarreaudcc048a2020-06-04 19:11:43 +020019#include <haproxy/acl.h>
Willy Tarreau4c7e4b72020-05-27 12:58:42 +020020#include <haproxy/api.h>
Willy Tarreau5d9ddc52021-10-06 19:54:09 +020021#include <haproxy/activity.h>
Willy Tarreau6be78492020-06-05 00:00:29 +020022#include <haproxy/cfgparse.h>
Willy Tarreaudbf78022021-10-06 09:05:08 +020023#include <haproxy/cli-t.h>
Willy Tarreau7ea393d2020-06-04 18:02:10 +020024#include <haproxy/connection.h>
Willy Tarreau8d366972020-05-27 16:10:29 +020025#include <haproxy/errors.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020026#include <haproxy/fd.h>
27#include <haproxy/freq_ctr.h>
Willy Tarreauf268ee82020-06-04 17:05:57 +020028#include <haproxy/global.h>
Willy Tarreau853b2972020-05-27 18:01:47 +020029#include <haproxy/list.h>
Willy Tarreau213e9902020-06-04 14:58:24 +020030#include <haproxy/listener.h>
Willy Tarreauaeed4a82020-06-04 22:01:04 +020031#include <haproxy/log.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020032#include <haproxy/protocol.h>
Willy Tarreau5958c432021-05-08 20:30:37 +020033#include <haproxy/proxy.h>
Frédéric Lécaille748ece62022-05-21 23:58:40 +020034#include <haproxy/quic_tp.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020035#include <haproxy/sample.h>
Willy Tarreaudfd3de82020-06-04 23:46:14 +020036#include <haproxy/stream.h>
Willy Tarreaucea0e1b2020-06-04 17:25:40 +020037#include <haproxy/task.h>
Willy Tarreau9310f482021-10-06 16:18:40 +020038#include <haproxy/ticks.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020039#include <haproxy/tools.h>
Willy Tarreaudd815982007-10-16 12:25:14 +020040
Willy Tarreaub648d632007-10-28 22:13:50 +010041
Willy Tarreau26982662012-09-12 23:17:10 +020042/* List head of all known bind keywords */
Willy Tarreauca1acd62022-03-29 15:02:44 +020043struct bind_kw_list bind_keywords = {
Willy Tarreau26982662012-09-12 23:17:10 +020044 .list = LIST_HEAD_INIT(bind_keywords.list)
45};
46
Willy Tarreaua1d97f82019-12-10 11:18:41 +010047/* list of the temporarily limited listeners because of lack of resource */
48static struct mt_list global_listener_queue = MT_LIST_HEAD_INIT(global_listener_queue);
49static struct task *global_listener_queue_task;
Willy Tarreau469fa472022-11-22 09:08:23 +010050__decl_thread(static HA_RWLOCK_T global_listener_rwlock);
Willy Tarreaua1d97f82019-12-10 11:18:41 +010051
William Dauchy3679d0c2021-02-14 23:22:55 +010052/* listener status for stats */
53const char* li_status_st[LI_STATE_COUNT] = {
54 [LI_STATUS_WAITING] = "WAITING",
55 [LI_STATUS_OPEN] = "OPEN",
56 [LI_STATUS_FULL] = "FULL",
57};
Willy Tarreaua1d97f82019-12-10 11:18:41 +010058
Willy Tarreau1efafce2019-01-27 15:37:19 +010059#if defined(USE_THREAD)
60
61struct accept_queue_ring accept_queue_rings[MAX_THREADS] __attribute__((aligned(64))) = { };
62
63/* dequeue and process a pending connection from the local accept queue (single
Willy Tarreau83efc322020-10-14 17:37:17 +020064 * consumer). Returns the accepted connection or NULL if none was found.
Willy Tarreau1efafce2019-01-27 15:37:19 +010065 */
Willy Tarreau83efc322020-10-14 17:37:17 +020066struct connection *accept_queue_pop_sc(struct accept_queue_ring *ring)
Willy Tarreau1efafce2019-01-27 15:37:19 +010067{
Willy Tarreau1efafce2019-01-27 15:37:19 +010068 unsigned int pos, next;
Willy Tarreau83efc322020-10-14 17:37:17 +020069 struct connection *ptr;
70 struct connection **e;
Willy Tarreau1efafce2019-01-27 15:37:19 +010071
72 pos = ring->head;
73
74 if (pos == ring->tail)
Willy Tarreau83efc322020-10-14 17:37:17 +020075 return NULL;
Willy Tarreau1efafce2019-01-27 15:37:19 +010076
77 next = pos + 1;
78 if (next >= ACCEPT_QUEUE_SIZE)
79 next = 0;
80
81 e = &ring->entry[pos];
82
83 /* wait for the producer to update the listener's pointer */
84 while (1) {
Willy Tarreau83efc322020-10-14 17:37:17 +020085 ptr = *e;
Willy Tarreau1efafce2019-01-27 15:37:19 +010086 __ha_barrier_load();
87 if (ptr)
88 break;
89 pl_cpu_relax();
90 }
91
Willy Tarreau1efafce2019-01-27 15:37:19 +010092 /* release the entry */
Willy Tarreau83efc322020-10-14 17:37:17 +020093 *e = NULL;
Willy Tarreau1efafce2019-01-27 15:37:19 +010094
95 __ha_barrier_store();
96 ring->head = next;
Willy Tarreau83efc322020-10-14 17:37:17 +020097 return ptr;
Willy Tarreau1efafce2019-01-27 15:37:19 +010098}
99
100
Willy Tarreau83efc322020-10-14 17:37:17 +0200101/* tries to push a new accepted connection <conn> into ring <ring>. Returns
102 * non-zero if it succeeds, or zero if the ring is full. Supports multiple
103 * producers.
Willy Tarreau1efafce2019-01-27 15:37:19 +0100104 */
Willy Tarreau83efc322020-10-14 17:37:17 +0200105int accept_queue_push_mp(struct accept_queue_ring *ring, struct connection *conn)
Willy Tarreau1efafce2019-01-27 15:37:19 +0100106{
Willy Tarreau1efafce2019-01-27 15:37:19 +0100107 unsigned int pos, next;
108
109 pos = ring->tail;
110 do {
111 next = pos + 1;
112 if (next >= ACCEPT_QUEUE_SIZE)
113 next = 0;
114 if (next == ring->head)
115 return 0; // ring full
Olivier Houchard64213e92019-03-08 18:52:57 +0100116 } while (unlikely(!_HA_ATOMIC_CAS(&ring->tail, &pos, next)));
Willy Tarreau1efafce2019-01-27 15:37:19 +0100117
Willy Tarreau83efc322020-10-14 17:37:17 +0200118 ring->entry[pos] = conn;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100119 __ha_barrier_store();
Willy Tarreau1efafce2019-01-27 15:37:19 +0100120 return 1;
121}
122
Willy Tarreaufb5401f2021-01-29 12:25:23 +0100123/* proceed with accepting new connections. Don't mark it static so that it appears
124 * in task dumps.
125 */
Willy Tarreau144f84a2021-03-02 16:09:26 +0100126struct task *accept_queue_process(struct task *t, void *context, unsigned int state)
Willy Tarreau1efafce2019-01-27 15:37:19 +0100127{
128 struct accept_queue_ring *ring = context;
Willy Tarreau83efc322020-10-14 17:37:17 +0200129 struct connection *conn;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100130 struct listener *li;
Christopher Faulet102854c2019-04-30 12:17:13 +0200131 unsigned int max_accept;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100132 int ret;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100133
Christopher Faulet102854c2019-04-30 12:17:13 +0200134 /* if global.tune.maxaccept is -1, then max_accept is UINT_MAX. It
135 * is not really illimited, but it is probably enough.
136 */
Willy Tarreau66161322021-02-19 15:50:27 +0100137 max_accept = global.tune.maxaccept ? global.tune.maxaccept : MAX_ACCEPT;
Christopher Faulet102854c2019-04-30 12:17:13 +0200138 for (; max_accept; max_accept--) {
Willy Tarreau83efc322020-10-14 17:37:17 +0200139 conn = accept_queue_pop_sc(ring);
140 if (!conn)
Willy Tarreau1efafce2019-01-27 15:37:19 +0100141 break;
142
Willy Tarreau83efc322020-10-14 17:37:17 +0200143 li = __objt_listener(conn->target);
Willy Tarreau4781b152021-04-06 13:53:36 +0200144 _HA_ATOMIC_INC(&li->thr_conn[tid]);
Willy Tarreau83efc322020-10-14 17:37:17 +0200145 ret = li->accept(conn);
Willy Tarreau1efafce2019-01-27 15:37:19 +0100146 if (ret <= 0) {
147 /* connection was terminated by the application */
148 continue;
149 }
150
151 /* increase the per-process number of cumulated sessions, this
152 * may only be done once l->accept() has accepted the connection.
153 */
154 if (!(li->options & LI_O_UNLIMITED)) {
155 HA_ATOMIC_UPDATE_MAX(&global.sps_max,
156 update_freq_ctr(&global.sess_per_sec, 1));
Willy Tarreau11ba4042022-05-20 15:56:32 +0200157 if (li->bind_conf && li->bind_conf->options & BC_O_USE_SSL) {
Willy Tarreau1efafce2019-01-27 15:37:19 +0100158 HA_ATOMIC_UPDATE_MAX(&global.ssl_max,
159 update_freq_ctr(&global.ssl_per_sec, 1));
160 }
161 }
162 }
163
164 /* ran out of budget ? Let's come here ASAP */
Christopher Faulet102854c2019-04-30 12:17:13 +0200165 if (!max_accept)
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200166 tasklet_wakeup(ring->tasklet);
Willy Tarreau1efafce2019-01-27 15:37:19 +0100167
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200168 return NULL;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100169}
170
171/* Initializes the accept-queues. Returns 0 on success, otherwise ERR_* flags */
172static int accept_queue_init()
173{
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200174 struct tasklet *t;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100175 int i;
176
177 for (i = 0; i < global.nbthread; i++) {
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200178 t = tasklet_new();
Willy Tarreau1efafce2019-01-27 15:37:19 +0100179 if (!t) {
180 ha_alert("Out of memory while initializing accept queue for thread %d\n", i);
181 return ERR_FATAL|ERR_ABORT;
182 }
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200183 t->tid = i;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100184 t->process = accept_queue_process;
185 t->context = &accept_queue_rings[i];
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200186 accept_queue_rings[i].tasklet = t;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100187 }
188 return 0;
189}
190
191REGISTER_CONFIG_POSTPARSER("multi-threaded accept queue", accept_queue_init);
192
Willy Tarreaue01b08d2022-04-27 18:42:47 +0200193static void accept_queue_deinit()
194{
195 int i;
196
197 for (i = 0; i < global.nbthread; i++) {
198 if (accept_queue_rings[i].tasklet)
199 tasklet_free(accept_queue_rings[i].tasklet);
200 }
201}
202
203REGISTER_POST_DEINIT(accept_queue_deinit);
204
Willy Tarreau1efafce2019-01-27 15:37:19 +0100205#endif // USE_THREAD
206
Amaury Denoyellef68b2cb2022-01-25 16:21:47 +0100207/* Memory allocation and initialization of the per_thr field.
208 * Returns 0 if the field has been successfully initialized, -1 on failure.
209 */
210int li_init_per_thr(struct listener *li)
211{
212 int i;
213
214 /* allocate per-thread elements for listener */
215 li->per_thr = calloc(global.nbthread, sizeof(*li->per_thr));
216 if (!li->per_thr)
217 return -1;
218
219 for (i = 0; i < global.nbthread; ++i) {
220 MT_LIST_INIT(&li->per_thr[i].quic_accept.list);
221 MT_LIST_INIT(&li->per_thr[i].quic_accept.conns);
222
223 li->per_thr[i].li = li;
224 }
225
226 return 0;
227}
228
William Dauchy3679d0c2021-02-14 23:22:55 +0100229/* helper to get listener status for stats */
230enum li_status get_li_status(struct listener *l)
231{
232 if (!l->maxconn || l->nbconn < l->maxconn) {
233 if (l->state == LI_LIMITED)
234 return LI_STATUS_WAITING;
235 else
236 return LI_STATUS_OPEN;
237 }
238 return LI_STATUS_FULL;
239}
240
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200241/* adjust the listener's state and its proxy's listener counters if needed.
242 * It must be called under the listener's lock, but uses atomic ops to change
243 * the proxy's counters so that the proxy lock is not needed.
244 */
Willy Tarreaua37b2442020-09-24 07:23:45 +0200245void listener_set_state(struct listener *l, enum li_state st)
246{
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200247 struct proxy *px = l->bind_conf->frontend;
248
249 if (px) {
250 /* from state */
251 switch (l->state) {
252 case LI_NEW: /* first call */
Willy Tarreau4781b152021-04-06 13:53:36 +0200253 _HA_ATOMIC_INC(&px->li_all);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200254 break;
255 case LI_INIT:
256 case LI_ASSIGNED:
257 break;
258 case LI_PAUSED:
Willy Tarreau4781b152021-04-06 13:53:36 +0200259 _HA_ATOMIC_DEC(&px->li_paused);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200260 break;
261 case LI_LISTEN:
Willy Tarreau4781b152021-04-06 13:53:36 +0200262 _HA_ATOMIC_DEC(&px->li_bound);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200263 break;
264 case LI_READY:
265 case LI_FULL:
266 case LI_LIMITED:
Willy Tarreau4781b152021-04-06 13:53:36 +0200267 _HA_ATOMIC_DEC(&px->li_ready);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200268 break;
269 }
270
271 /* to state */
272 switch (st) {
273 case LI_NEW:
274 case LI_INIT:
275 case LI_ASSIGNED:
276 break;
277 case LI_PAUSED:
Willy Tarreau95a34602020-10-08 15:32:21 +0200278 BUG_ON(l->rx.fd == -1);
Willy Tarreau4781b152021-04-06 13:53:36 +0200279 _HA_ATOMIC_INC(&px->li_paused);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200280 break;
281 case LI_LISTEN:
Willy Tarreau95a34602020-10-08 15:32:21 +0200282 BUG_ON(l->rx.fd == -1);
Willy Tarreau4781b152021-04-06 13:53:36 +0200283 _HA_ATOMIC_INC(&px->li_bound);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200284 break;
285 case LI_READY:
286 case LI_FULL:
287 case LI_LIMITED:
Willy Tarreau95a34602020-10-08 15:32:21 +0200288 BUG_ON(l->rx.fd == -1);
Willy Tarreau4781b152021-04-06 13:53:36 +0200289 _HA_ATOMIC_INC(&px->li_ready);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200290 break;
291 }
292 }
Willy Tarreaua37b2442020-09-24 07:23:45 +0200293 l->state = st;
294}
295
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100296/* This function adds the specified listener's file descriptor to the polling
297 * lists if it is in the LI_LISTEN state. The listener enters LI_READY or
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +0500298 * LI_FULL state depending on its number of connections. In daemon mode, we
Willy Tarreauae302532014-05-07 19:22:24 +0200299 * also support binding only the relevant processes to their respective
300 * listeners. We don't do that in debug mode however.
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100301 */
Willy Tarreau7834a3f2020-09-25 16:40:18 +0200302void enable_listener(struct listener *listener)
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100303{
Willy Tarreau08b6f962022-02-01 16:23:00 +0100304 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &listener->lock);
Willy Tarreaud6afb532020-10-09 10:35:40 +0200305
306 /* If this listener is supposed to be only in the master, close it in
307 * the workers. Conversely, if it's supposed to be only in the workers
308 * close it in the master.
309 */
Willy Tarreau18c20d22020-10-09 16:11:46 +0200310 if (!!master != !!(listener->rx.flags & RX_F_MWORKER))
Willy Tarreau75c98d12020-10-09 15:55:23 +0200311 do_unbind_listener(listener);
Willy Tarreaud6afb532020-10-09 10:35:40 +0200312
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100313 if (listener->state == LI_LISTEN) {
Willy Tarreau95a34602020-10-08 15:32:21 +0200314 BUG_ON(listener->rx.fd == -1);
William Lallemand095ba4c2017-06-01 17:38:50 +0200315 if ((global.mode & (MODE_DAEMON | MODE_MWORKER)) &&
Willy Tarreau72faef32021-06-15 08:36:30 +0200316 (!!master != !!(listener->rx.flags & RX_F_MWORKER))) {
Willy Tarreauae302532014-05-07 19:22:24 +0200317 /* we don't want to enable this listener and don't
318 * want any fd event to reach it.
319 */
Willy Tarreau75c98d12020-10-09 15:55:23 +0200320 do_unbind_listener(listener);
Willy Tarreauae302532014-05-07 19:22:24 +0200321 }
Willy Tarreaua8cf66b2019-02-27 16:49:00 +0100322 else if (!listener->maxconn || listener->nbconn < listener->maxconn) {
Willy Tarreau4b51f422020-09-25 20:32:28 +0200323 listener->rx.proto->enable(listener);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200324 listener_set_state(listener, LI_READY);
Willy Tarreauae302532014-05-07 19:22:24 +0200325 }
326 else {
Willy Tarreaua37b2442020-09-24 07:23:45 +0200327 listener_set_state(listener, LI_FULL);
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100328 }
329 }
Willy Tarreaud6afb532020-10-09 10:35:40 +0200330
Willy Tarreau08b6f962022-02-01 16:23:00 +0100331 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &listener->lock);
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100332}
333
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200334/*
Aurelien DARRAGON187396e2022-09-11 16:19:49 +0200335 * This function completely stops a listener.
336 * The proxy's listeners count is updated and the proxy is
337 * disabled and woken up after the last one is gone.
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200338 * It will need to operate under the proxy's lock and the protocol's lock.
339 * The caller is responsible for indicating in lpx, lpr whether the
340 * respective locks are already held (non-zero) or not (zero) so that the
341 * function picks the missing ones, in this order.
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200342 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200343void stop_listener(struct listener *l, int lpx, int lpr)
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200344{
345 struct proxy *px = l->bind_conf->frontend;
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200346
347 if (l->options & LI_O_NOSTOP) {
348 /* master-worker sockpairs are never closed but don't count as a
349 * job.
350 */
351 return;
352 }
353
Aurelien DARRAGONa57786e2022-09-12 09:26:21 +0200354 if (!lpx && px)
Willy Tarreauac66d6b2020-10-20 17:24:27 +0200355 HA_RWLOCK_WRLOCK(PROXY_LOCK, &px->lock);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200356
357 if (!lpr)
358 HA_SPIN_LOCK(PROTO_LOCK, &proto_lock);
359
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200360 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200361
362 if (l->state > LI_INIT) {
Willy Tarreau75c98d12020-10-09 15:55:23 +0200363 do_unbind_listener(l);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200364
365 if (l->state >= LI_ASSIGNED)
366 __delete_listener(l);
367
Aurelien DARRAGONa57786e2022-09-12 09:26:21 +0200368 if (px)
369 proxy_cond_disable(px);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200370 }
371
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200372 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200373
374 if (!lpr)
375 HA_SPIN_UNLOCK(PROTO_LOCK, &proto_lock);
376
Aurelien DARRAGONa57786e2022-09-12 09:26:21 +0200377 if (!lpx && px)
Willy Tarreauac66d6b2020-10-20 17:24:27 +0200378 HA_RWLOCK_WRUNLOCK(PROXY_LOCK, &px->lock);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200379}
380
Willy Tarreaud1f250f2020-12-04 15:03:36 +0100381/* This function adds the specified <listener> to the protocol <proto>. It
382 * does nothing if the protocol was already added. The listener's state is
383 * automatically updated from LI_INIT to LI_ASSIGNED. The number of listeners
384 * for the protocol is updated. This must be called with the proto lock held.
385 */
386void default_add_listener(struct protocol *proto, struct listener *listener)
387{
388 if (listener->state != LI_INIT)
389 return;
390 listener_set_state(listener, LI_ASSIGNED);
391 listener->rx.proto = proto;
Willy Tarreau2b718102021-04-21 07:32:39 +0200392 LIST_APPEND(&proto->receivers, &listener->rx.proto_list);
Willy Tarreaud1f250f2020-12-04 15:03:36 +0100393 proto->nb_receivers++;
394}
395
Willy Tarreaue03204c2020-10-09 17:02:21 +0200396/* default function called to suspend a listener: it simply passes the call to
397 * the underlying receiver. This is find for most socket-based protocols. This
398 * must be called under the listener's lock. It will return non-zero on success,
399 * 0 on failure. If no receiver-level suspend is provided, the operation is
400 * assumed to succeed.
401 */
402int default_suspend_listener(struct listener *l)
403{
404 int ret = 1;
405
406 if (!l->rx.proto->rx_suspend)
407 return 1;
408
409 ret = l->rx.proto->rx_suspend(&l->rx);
410 return ret > 0 ? ret : 0;
411}
412
413
414/* Tries to resume a suspended listener, and returns non-zero on success or
415 * zero on failure. On certain errors, an alert or a warning might be displayed.
416 * It must be called with the listener's lock held. Depending on the listener's
417 * state and protocol, a listen() call might be used to resume operations, or a
418 * call to the receiver's resume() function might be used as well. This is
419 * suitable as a default function for TCP and UDP. This must be called with the
420 * listener's lock held.
421 */
422int default_resume_listener(struct listener *l)
423{
424 int ret = 1;
425
426 if (l->state == LI_ASSIGNED) {
427 char msg[100];
428 int err;
429
430 err = l->rx.proto->listen(l, msg, sizeof(msg));
431 if (err & ERR_ALERT)
432 ha_alert("Resuming listener: %s\n", msg);
433 else if (err & ERR_WARN)
434 ha_warning("Resuming listener: %s\n", msg);
435
436 if (err & (ERR_FATAL | ERR_ABORT)) {
437 ret = 0;
438 goto end;
439 }
440 }
441
442 if (l->state < LI_PAUSED) {
443 ret = 0;
444 goto end;
445 }
446
447 if (l->state == LI_PAUSED && l->rx.proto->rx_resume &&
448 l->rx.proto->rx_resume(&l->rx) <= 0)
449 ret = 0;
450 end:
451 return ret;
452}
453
454
Willy Tarreaube58c382011-07-24 18:28:10 +0200455/* This function tries to temporarily disable a listener, depending on the OS
456 * capabilities. Linux unbinds the listen socket after a SHUT_RD, and ignores
457 * SHUT_WR. Solaris refuses either shutdown(). OpenBSD ignores SHUT_RD but
458 * closes upon SHUT_WR and refuses to rebind. So a common validation path
459 * involves SHUT_WR && listen && SHUT_RD. In case of success, the FD's polling
460 * is disabled. It normally returns non-zero, unless an error is reported.
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200461 * It will need to operate under the proxy's lock. The caller is
462 * responsible for indicating in lpx whether the proxy locks is
463 * already held (non-zero) or not (zero) so that the function picks it.
Willy Tarreaube58c382011-07-24 18:28:10 +0200464 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200465int pause_listener(struct listener *l, int lpx)
Willy Tarreaube58c382011-07-24 18:28:10 +0200466{
Willy Tarreau58651b42020-09-24 16:03:29 +0200467 struct proxy *px = l->bind_conf->frontend;
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200468 int ret = 1;
469
Aurelien DARRAGONa57786e2022-09-12 09:26:21 +0200470 if (!lpx && px)
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200471 HA_RWLOCK_WRLOCK(PROXY_LOCK, &px->lock);
472
Willy Tarreau08b6f962022-02-01 16:23:00 +0100473 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200474
Willy Tarreau9b3a9322020-09-24 14:46:34 +0200475 if (l->state <= LI_PAUSED)
476 goto end;
477
Willy Tarreaue03204c2020-10-09 17:02:21 +0200478 if (l->rx.proto->suspend)
479 ret = l->rx.proto->suspend(l);
Willy Tarreaube58c382011-07-24 18:28:10 +0200480
Willy Tarreau2b718102021-04-21 07:32:39 +0200481 MT_LIST_DELETE(&l->wait_queue);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200482
Willy Tarreaua37b2442020-09-24 07:23:45 +0200483 listener_set_state(l, LI_PAUSED);
Willy Tarreau58651b42020-09-24 16:03:29 +0200484
485 if (px && !px->li_ready) {
Aurelien DARRAGONd46f4372022-09-09 15:51:37 +0200486 /* PROXY_LOCK is required */
487 proxy_cond_pause(px);
Willy Tarreau58651b42020-09-24 16:03:29 +0200488 ha_warning("Paused %s %s.\n", proxy_cap_str(px->cap), px->id);
489 send_log(px, LOG_WARNING, "Paused %s %s.\n", proxy_cap_str(px->cap), px->id);
490 }
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200491 end:
Willy Tarreau08b6f962022-02-01 16:23:00 +0100492 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200493
Aurelien DARRAGONa57786e2022-09-12 09:26:21 +0200494 if (!lpx && px)
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200495 HA_RWLOCK_WRUNLOCK(PROXY_LOCK, &px->lock);
496
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200497 return ret;
Willy Tarreaube58c382011-07-24 18:28:10 +0200498}
499
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200500/* This function tries to resume a temporarily disabled listener. Paused, full,
501 * limited and disabled listeners are handled, which means that this function
502 * may replace enable_listener(). The resulting state will either be LI_READY
503 * or LI_FULL. 0 is returned in case of failure to resume (eg: dead socket).
Willy Tarreauae302532014-05-07 19:22:24 +0200504 * Listeners bound to a different process are not woken up unless we're in
Willy Tarreauaf2fd582015-04-14 12:07:16 +0200505 * foreground mode, and are ignored. If the listener was only in the assigned
506 * state, it's totally rebound. This can happen if a pause() has completely
507 * stopped it. If the resume fails, 0 is returned and an error might be
508 * displayed.
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200509 * It will need to operate under the proxy's lock. The caller is
510 * responsible for indicating in lpx whether the proxy locks is
511 * already held (non-zero) or not (zero) so that the function picks it.
Willy Tarreaube58c382011-07-24 18:28:10 +0200512 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200513int resume_listener(struct listener *l, int lpx)
Willy Tarreaube58c382011-07-24 18:28:10 +0200514{
Willy Tarreau58651b42020-09-24 16:03:29 +0200515 struct proxy *px = l->bind_conf->frontend;
516 int was_paused = px && px->li_paused;
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200517 int ret = 1;
518
Aurelien DARRAGONa57786e2022-09-12 09:26:21 +0200519 if (!lpx && px)
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200520 HA_RWLOCK_WRLOCK(PROXY_LOCK, &px->lock);
521
Willy Tarreau08b6f962022-02-01 16:23:00 +0100522 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200523
Willy Tarreauf2cb1692019-07-11 10:08:31 +0200524 /* check that another thread didn't to the job in parallel (e.g. at the
525 * end of listen_accept() while we'd come from dequeue_all_listeners().
526 */
Willy Tarreau2b718102021-04-21 07:32:39 +0200527 if (MT_LIST_INLIST(&l->wait_queue))
Willy Tarreauf2cb1692019-07-11 10:08:31 +0200528 goto end;
529
Willy Tarreau5d7f9ce2020-09-24 18:54:11 +0200530 if (l->state == LI_READY)
531 goto end;
Willy Tarreaube58c382011-07-24 18:28:10 +0200532
Willy Tarreaue03204c2020-10-09 17:02:21 +0200533 if (l->rx.proto->resume)
534 ret = l->rx.proto->resume(l);
Willy Tarreaube58c382011-07-24 18:28:10 +0200535
Willy Tarreaua8cf66b2019-02-27 16:49:00 +0100536 if (l->maxconn && l->nbconn >= l->maxconn) {
Willy Tarreau4b51f422020-09-25 20:32:28 +0200537 l->rx.proto->disable(l);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200538 listener_set_state(l, LI_FULL);
Willy Tarreau58651b42020-09-24 16:03:29 +0200539 goto done;
Willy Tarreaube58c382011-07-24 18:28:10 +0200540 }
541
Willy Tarreau4b51f422020-09-25 20:32:28 +0200542 l->rx.proto->enable(l);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200543 listener_set_state(l, LI_READY);
Willy Tarreau58651b42020-09-24 16:03:29 +0200544
545 done:
546 if (was_paused && !px->li_paused) {
Aurelien DARRAGONd46f4372022-09-09 15:51:37 +0200547 /* PROXY_LOCK is required */
548 proxy_cond_resume(px);
Willy Tarreau58651b42020-09-24 16:03:29 +0200549 ha_warning("Resumed %s %s.\n", proxy_cap_str(px->cap), px->id);
550 send_log(px, LOG_WARNING, "Resumed %s %s.\n", proxy_cap_str(px->cap), px->id);
551 }
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200552 end:
Willy Tarreau08b6f962022-02-01 16:23:00 +0100553 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200554
Aurelien DARRAGONa57786e2022-09-12 09:26:21 +0200555 if (!lpx && px)
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200556 HA_RWLOCK_WRUNLOCK(PROXY_LOCK, &px->lock);
557
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200558 return ret;
559}
560
Willy Tarreau87b09662015-04-03 00:22:06 +0200561/* Marks a ready listener as full so that the stream code tries to re-enable
Willy Tarreau62793712011-07-24 19:23:38 +0200562 * it upon next close() using resume_listener().
563 */
Christopher Faulet5580ba22017-08-28 15:29:20 +0200564static void listener_full(struct listener *l)
Willy Tarreau62793712011-07-24 19:23:38 +0200565{
Willy Tarreau08b6f962022-02-01 16:23:00 +0100566 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreau62793712011-07-24 19:23:38 +0200567 if (l->state >= LI_READY) {
Willy Tarreau2b718102021-04-21 07:32:39 +0200568 MT_LIST_DELETE(&l->wait_queue);
Willy Tarreau3f0d02b2019-02-25 19:23:37 +0100569 if (l->state != LI_FULL) {
Willy Tarreau4b51f422020-09-25 20:32:28 +0200570 l->rx.proto->disable(l);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200571 listener_set_state(l, LI_FULL);
Willy Tarreau3f0d02b2019-02-25 19:23:37 +0100572 }
Willy Tarreau62793712011-07-24 19:23:38 +0200573 }
Willy Tarreau08b6f962022-02-01 16:23:00 +0100574 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreau62793712011-07-24 19:23:38 +0200575}
576
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200577/* Marks a ready listener as limited so that we only try to re-enable it when
578 * resources are free again. It will be queued into the specified queue.
579 */
Olivier Houchard859dc802019-08-08 15:47:21 +0200580static void limit_listener(struct listener *l, struct mt_list *list)
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200581{
Willy Tarreau08b6f962022-02-01 16:23:00 +0100582 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200583 if (l->state == LI_READY) {
Willy Tarreau2b718102021-04-21 07:32:39 +0200584 MT_LIST_TRY_APPEND(list, &l->wait_queue);
Willy Tarreau4b51f422020-09-25 20:32:28 +0200585 l->rx.proto->disable(l);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200586 listener_set_state(l, LI_LIMITED);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200587 }
Willy Tarreau08b6f962022-02-01 16:23:00 +0100588 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200589}
590
Willy Tarreau241797a2019-12-10 14:10:52 +0100591/* Dequeues all listeners waiting for a resource the global wait queue */
592void dequeue_all_listeners()
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200593{
Willy Tarreau01abd022019-02-28 10:27:18 +0100594 struct listener *listener;
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200595
Willy Tarreau241797a2019-12-10 14:10:52 +0100596 while ((listener = MT_LIST_POP(&global_listener_queue, struct listener *, wait_queue))) {
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200597 /* This cannot fail because the listeners are by definition in
Willy Tarreau01abd022019-02-28 10:27:18 +0100598 * the LI_LIMITED state.
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200599 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200600 resume_listener(listener, 0);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200601 }
602}
603
Willy Tarreau241797a2019-12-10 14:10:52 +0100604/* Dequeues all listeners waiting for a resource in proxy <px>'s queue */
605void dequeue_proxy_listeners(struct proxy *px)
606{
607 struct listener *listener;
608
609 while ((listener = MT_LIST_POP(&px->listener_queue, struct listener *, wait_queue))) {
610 /* This cannot fail because the listeners are by definition in
611 * the LI_LIMITED state.
612 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200613 resume_listener(listener, 0);
Willy Tarreau241797a2019-12-10 14:10:52 +0100614 }
615}
616
Willy Tarreau7b2febd2020-10-09 17:18:29 +0200617
618/* default function used to unbind a listener. This is for use by standard
619 * protocols working on top of accepted sockets. The receiver's rx_unbind()
620 * will automatically be used after the listener is disabled if the socket is
621 * still bound. This must be used under the listener's lock.
Christopher Faulet510c0d62018-03-16 10:04:47 +0100622 */
Willy Tarreau7b2febd2020-10-09 17:18:29 +0200623void default_unbind_listener(struct listener *listener)
Willy Tarreaub648d632007-10-28 22:13:50 +0100624{
Willy Tarreau87acd4e2020-10-08 15:36:46 +0200625 if (listener->state <= LI_ASSIGNED)
626 goto out_close;
627
628 if (listener->rx.fd == -1) {
Willy Tarreaua37b2442020-09-24 07:23:45 +0200629 listener_set_state(listener, LI_ASSIGNED);
Willy Tarreau87acd4e2020-10-08 15:36:46 +0200630 goto out_close;
631 }
632
Willy Tarreauf58b8db2020-10-09 16:32:08 +0200633 if (listener->state >= LI_READY) {
634 listener->rx.proto->disable(listener);
635 if (listener->rx.flags & RX_F_BOUND)
Willy Tarreau87acd4e2020-10-08 15:36:46 +0200636 listener_set_state(listener, LI_LISTEN);
Willy Tarreaub6607bf2020-09-23 16:24:23 +0200637 }
638
Willy Tarreau87acd4e2020-10-08 15:36:46 +0200639 out_close:
Willy Tarreauf58b8db2020-10-09 16:32:08 +0200640 if (listener->rx.flags & RX_F_BOUND)
641 listener->rx.proto->rx_unbind(&listener->rx);
Willy Tarreau7b2febd2020-10-09 17:18:29 +0200642}
643
644/* This function closes the listening socket for the specified listener,
645 * provided that it's already in a listening state. The protocol's unbind()
646 * is called to put the listener into LI_ASSIGNED or LI_LISTEN and handle
647 * the unbinding tasks. The listener enters then the LI_ASSIGNED state if
648 * the receiver is unbound. Must be called with the lock held.
649 */
650void do_unbind_listener(struct listener *listener)
651{
Willy Tarreau2b718102021-04-21 07:32:39 +0200652 MT_LIST_DELETE(&listener->wait_queue);
Willy Tarreau7b2febd2020-10-09 17:18:29 +0200653
654 if (listener->rx.proto->unbind)
655 listener->rx.proto->unbind(listener);
Willy Tarreau374e9af2020-10-09 15:47:17 +0200656
Willy Tarreauf58b8db2020-10-09 16:32:08 +0200657 /* we may have to downgrade the listener if the rx was closed */
658 if (!(listener->rx.flags & RX_F_BOUND) && listener->state > LI_ASSIGNED)
Willy Tarreau374e9af2020-10-09 15:47:17 +0200659 listener_set_state(listener, LI_ASSIGNED);
Willy Tarreaubbd09b92017-11-05 11:38:44 +0100660}
661
Olivier Houchard1fc05162017-04-06 01:05:05 +0200662/* This function closes the listening socket for the specified listener,
663 * provided that it's already in a listening state. The listener enters the
Willy Tarreau75c98d12020-10-09 15:55:23 +0200664 * LI_ASSIGNED state, except if the FD is not closed, in which case it may
665 * remain in LI_LISTEN. This function is intended to be used as a generic
Willy Tarreaubbd09b92017-11-05 11:38:44 +0100666 * function for standard protocols.
Olivier Houchard1fc05162017-04-06 01:05:05 +0200667 */
Willy Tarreaubbd09b92017-11-05 11:38:44 +0100668void unbind_listener(struct listener *listener)
Olivier Houchard1fc05162017-04-06 01:05:05 +0200669{
Willy Tarreau08b6f962022-02-01 16:23:00 +0100670 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &listener->lock);
Willy Tarreau75c98d12020-10-09 15:55:23 +0200671 do_unbind_listener(listener);
Willy Tarreau08b6f962022-02-01 16:23:00 +0100672 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &listener->lock);
Olivier Houchard1fc05162017-04-06 01:05:05 +0200673}
674
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200675/* creates one or multiple listeners for bind_conf <bc> on sockaddr <ss> on port
676 * range <portl> to <porth>, and possibly attached to fd <fd> (or -1 for auto
Willy Tarreau9b3178d2020-09-16 17:58:55 +0200677 * allocation). The address family is taken from ss->ss_family, and the protocol
Willy Tarreaud2fb99f2020-10-15 21:22:29 +0200678 * passed in <proto> must be usable on this family. The protocol's default iocb
679 * is automatically preset as the receivers' iocb. The number of jobs and
Willy Tarreau9b3178d2020-09-16 17:58:55 +0200680 * listeners is automatically increased by the number of listeners created. It
681 * returns non-zero on success, zero on error with the error message set in <err>.
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200682 */
683int create_listeners(struct bind_conf *bc, const struct sockaddr_storage *ss,
Willy Tarreau9b3178d2020-09-16 17:58:55 +0200684 int portl, int porth, int fd, struct protocol *proto, char **err)
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200685{
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200686 struct listener *l;
687 int port;
688
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200689 for (port = portl; port <= porth; port++) {
690 l = calloc(1, sizeof(*l));
691 if (!l) {
692 memprintf(err, "out of memory");
693 return 0;
694 }
695 l->obj_type = OBJ_TYPE_LISTENER;
Willy Tarreau2b718102021-04-21 07:32:39 +0200696 LIST_APPEND(&bc->frontend->conf.listeners, &l->by_fe);
697 LIST_APPEND(&bc->listeners, &l->by_bind);
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200698 l->bind_conf = bc;
Willy Tarreau0fce6bc2020-09-03 07:46:06 +0200699 l->rx.settings = &bc->settings;
Willy Tarreaueef45422020-09-03 10:05:03 +0200700 l->rx.owner = l;
Willy Tarreaud2fb99f2020-10-15 21:22:29 +0200701 l->rx.iocb = proto->default_iocb;
Willy Tarreau38ba6472020-08-27 08:16:52 +0200702 l->rx.fd = fd;
Willy Tarreau07400c52020-12-04 14:49:11 +0100703
Willy Tarreau37159062020-08-27 07:48:42 +0200704 memcpy(&l->rx.addr, ss, sizeof(*ss));
Willy Tarreaud1f250f2020-12-04 15:03:36 +0100705 if (proto->fam->set_port)
706 proto->fam->set_port(&l->rx.addr, port);
Willy Tarreau07400c52020-12-04 14:49:11 +0100707
Olivier Houchard859dc802019-08-08 15:47:21 +0200708 MT_LIST_INIT(&l->wait_queue);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200709 listener_set_state(l, LI_INIT);
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200710
Willy Tarreaud1f250f2020-12-04 15:03:36 +0100711 proto->add(proto, l);
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200712
Willy Tarreau909c23b2020-09-15 13:50:58 +0200713 if (fd != -1)
Willy Tarreau43046fa2020-09-01 15:41:59 +0200714 l->rx.flags |= RX_F_INHERITED;
William Lallemand75ea0a02017-11-15 19:02:58 +0100715
Amaury Denoyelle7f8f6cb2020-11-10 14:24:31 +0100716 l->extra_counters = NULL;
717
Willy Tarreau08b6f962022-02-01 16:23:00 +0100718 HA_RWLOCK_INIT(&l->lock);
Willy Tarreau4781b152021-04-06 13:53:36 +0200719 _HA_ATOMIC_INC(&jobs);
720 _HA_ATOMIC_INC(&listeners);
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200721 }
722 return 1;
723}
724
Willy Tarreau59a877d2021-10-12 09:36:10 +0200725/* clones listener <src> and returns the new one. All dynamically allocated
726 * fields are reallocated (name for now). The new listener is inserted before
727 * the original one in the bind_conf and frontend lists. This allows it to be
728 * duplicated while iterating over the current list. The original listener must
729 * only be in the INIT or ASSIGNED states, and the new listener will only be
730 * placed into the INIT state. The counters are always set to NULL. Maxsock is
731 * updated. Returns NULL on allocation error.
732 */
733struct listener *clone_listener(struct listener *src)
734{
735 struct listener *l;
736
737 l = calloc(1, sizeof(*l));
738 if (!l)
739 goto oom1;
740 memcpy(l, src, sizeof(*l));
741
742 if (l->name) {
743 l->name = strdup(l->name);
744 if (!l->name)
745 goto oom2;
746 }
747
748 l->rx.owner = l;
749 l->state = LI_INIT;
750 l->counters = NULL;
751 l->extra_counters = NULL;
752
753 LIST_APPEND(&src->by_fe, &l->by_fe);
754 LIST_APPEND(&src->by_bind, &l->by_bind);
755
756 MT_LIST_INIT(&l->wait_queue);
757
758 l->rx.proto->add(l->rx.proto, l);
759
Willy Tarreau08b6f962022-02-01 16:23:00 +0100760 HA_RWLOCK_INIT(&l->lock);
Willy Tarreau59a877d2021-10-12 09:36:10 +0200761 _HA_ATOMIC_INC(&jobs);
762 _HA_ATOMIC_INC(&listeners);
763 global.maxsock++;
764 return l;
765
Willy Tarreau59a877d2021-10-12 09:36:10 +0200766 oom2:
767 free(l);
768 oom1:
Willy Tarreaua1462892021-10-16 14:45:29 +0200769 return NULL;
Willy Tarreau59a877d2021-10-12 09:36:10 +0200770}
771
Willy Tarreau1a64d162007-10-28 22:26:05 +0100772/* Delete a listener from its protocol's list of listeners. The listener's
773 * state is automatically updated from LI_ASSIGNED to LI_INIT. The protocol's
Willy Tarreau2cc5bae2017-09-15 08:18:11 +0200774 * number of listeners is updated, as well as the global number of listeners
775 * and jobs. Note that the listener must have previously been unbound. This
Willy Tarreaub4c083f2020-10-07 15:36:16 +0200776 * is a low-level function expected to be called with the proto_lock and the
777 * listener's lock held.
Willy Tarreau1a64d162007-10-28 22:26:05 +0100778 */
Willy Tarreaub4c083f2020-10-07 15:36:16 +0200779void __delete_listener(struct listener *listener)
Willy Tarreau1a64d162007-10-28 22:26:05 +0100780{
Willy Tarreau3f0d02b2019-02-25 19:23:37 +0100781 if (listener->state == LI_ASSIGNED) {
Willy Tarreaua37b2442020-09-24 07:23:45 +0200782 listener_set_state(listener, LI_INIT);
Willy Tarreau2b718102021-04-21 07:32:39 +0200783 LIST_DELETE(&listener->rx.proto_list);
Willy Tarreaud7f331c2020-09-25 17:01:43 +0200784 listener->rx.proto->nb_receivers--;
Willy Tarreau4781b152021-04-06 13:53:36 +0200785 _HA_ATOMIC_DEC(&jobs);
786 _HA_ATOMIC_DEC(&listeners);
Willy Tarreau3f0d02b2019-02-25 19:23:37 +0100787 }
Willy Tarreaub4c083f2020-10-07 15:36:16 +0200788}
789
790/* Delete a listener from its protocol's list of listeners (please check
791 * __delete_listener() above). The proto_lock and the listener's lock will
792 * be grabbed in this order.
793 */
794void delete_listener(struct listener *listener)
795{
796 HA_SPIN_LOCK(PROTO_LOCK, &proto_lock);
Willy Tarreau08b6f962022-02-01 16:23:00 +0100797 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &listener->lock);
Willy Tarreaub4c083f2020-10-07 15:36:16 +0200798 __delete_listener(listener);
Willy Tarreau08b6f962022-02-01 16:23:00 +0100799 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &listener->lock);
Willy Tarreau6ee9f8d2019-08-26 10:55:52 +0200800 HA_SPIN_UNLOCK(PROTO_LOCK, &proto_lock);
Willy Tarreau1a64d162007-10-28 22:26:05 +0100801}
802
Willy Tarreaue2711c72019-02-27 15:39:41 +0100803/* Returns a suitable value for a listener's backlog. It uses the listener's,
804 * otherwise the frontend's backlog, otherwise the listener's maxconn,
805 * otherwise the frontend's maxconn, otherwise 1024.
806 */
807int listener_backlog(const struct listener *l)
808{
809 if (l->backlog)
810 return l->backlog;
811
812 if (l->bind_conf->frontend->backlog)
813 return l->bind_conf->frontend->backlog;
814
815 if (l->maxconn)
816 return l->maxconn;
817
818 if (l->bind_conf->frontend->maxconn)
819 return l->bind_conf->frontend->maxconn;
820
821 return 1024;
822}
823
/* This function is called on a read event from a listening socket, corresponding
 * to an accept. It tries to accept as many connections as possible, and for each
 * calls the listener's accept handler (generally the frontend's accept handler).
 *
 * The number of connections accepted per call is bounded by l->maxaccept and
 * by the remaining budget of each applicable rate limit (global sessions,
 * global connections, global SSL, frontend sessions). For each connection, the
 * listener's, the frontend's and the process' connection counters are
 * pre-incremented before calling the protocol's accept_conn(); <next_conn>,
 * <next_feconn> and <next_actconn> remember which of them still have to be
 * rolled back at the <end> label if the connection is finally not handed over
 * to l->accept().
 *
 * When a limit is hit, the listener is queued either in the global queue
 * (<limit_global>) or in the frontend's queue (<limit_proxy>) and the matching
 * task is scheduled at <expire>.
 */
void listener_accept(struct listener *l)
{
	struct connection *cli_conn;
	struct proxy *p;
	unsigned int max_accept;
	int next_conn = 0;
	int next_feconn = 0;
	int next_actconn = 0;
	int expire;
	int ret;

	p = l->bind_conf->frontend;

	/* if l->maxaccept is -1, then max_accept is UINT_MAX. It is not really
	 * unlimited, but it is probably enough.
	 */
	max_accept = l->maxaccept ? l->maxaccept : 1;

	if (!(l->options & LI_O_UNLIMITED) && global.sps_lim) {
		int max = freq_ctr_remain(&global.sess_per_sec, global.sps_lim, 0);

		if (unlikely(!max)) {
			/* global session rate limit was reached */
			expire = tick_add(now_ms, next_event_delay(&global.sess_per_sec, global.sps_lim, 0));
			goto limit_global;
		}

		if (max_accept > max)
			max_accept = max;
	}

	if (!(l->options & LI_O_UNLIMITED) && global.cps_lim) {
		int max = freq_ctr_remain(&global.conn_per_sec, global.cps_lim, 0);

		if (unlikely(!max)) {
			/* global connection rate limit was reached */
			expire = tick_add(now_ms, next_event_delay(&global.conn_per_sec, global.cps_lim, 0));
			goto limit_global;
		}

		if (max_accept > max)
			max_accept = max;
	}
#ifdef USE_OPENSSL
	if (!(l->options & LI_O_UNLIMITED) && global.ssl_lim &&
	    l->bind_conf && l->bind_conf->options & BC_O_USE_SSL) {
		int max = freq_ctr_remain(&global.ssl_per_sec, global.ssl_lim, 0);

		if (unlikely(!max)) {
			/* global SSL rate limit was reached */
			expire = tick_add(now_ms, next_event_delay(&global.ssl_per_sec, global.ssl_lim, 0));
			goto limit_global;
		}

		if (max_accept > max)
			max_accept = max;
	}
#endif
	if (p && p->fe_sps_lim) {
		int max = freq_ctr_remain(&p->fe_sess_per_sec, p->fe_sps_lim, 0);

		if (unlikely(!max)) {
			/* frontend accept rate limit was reached */
			expire = tick_add(now_ms, next_event_delay(&p->fe_sess_per_sec, p->fe_sps_lim, 0));
			goto limit_proxy;
		}

		if (max_accept > max)
			max_accept = max;
	}

	/* Note: if we fail to allocate a connection because of configured
	 * limits, we'll schedule a new attempt at worst 1 second later. If we
	 * fail due to system limits or temporary resource shortage, we try
	 * again 100ms later in the worst case.
	 *
	 * The next_*conn variables are reset on each new iteration so that
	 * they only ever describe the connection currently being processed.
	 */
	for (; max_accept; next_conn = next_feconn = next_actconn = 0, max_accept--) {
		unsigned int count;
		int status;
		__decl_thread(unsigned long mask);

		/* pre-increase the number of connections without going too far.
		 * We process the listener, then the proxy, then the process.
		 * We know which ones to unroll based on the next_xxx value.
		 */
		do {
			count = l->nbconn;
			if (unlikely(l->maxconn && count >= l->maxconn)) {
				/* the listener was marked full or another
				 * thread is going to do it.
				 */
				next_conn = 0;
				listener_full(l);
				goto end;
			}
			next_conn = count + 1;
		} while (!_HA_ATOMIC_CAS(&l->nbconn, (int *)(&count), next_conn));

		if (p) {
			do {
				count = p->feconn;
				if (unlikely(count >= p->maxconn)) {
					/* the frontend was marked full or another
					 * thread is going to do it.
					 */
					next_feconn = 0;
					expire = TICK_ETERNITY;
					goto limit_proxy;
				}
				next_feconn = count + 1;
			} while (!_HA_ATOMIC_CAS(&p->feconn, &count, next_feconn));
		}

		if (!(l->options & LI_O_UNLIMITED)) {
			do {
				count = actconn;
				if (unlikely(count >= global.maxconn)) {
					/* the process was marked full or another
					 * thread is going to do it.
					 */
					next_actconn = 0;
					expire = tick_add(now_ms, 1000); /* try again in 1 second */
					goto limit_global;
				}
				next_actconn = count + 1;
			} while (!_HA_ATOMIC_CAS(&actconn, (int *)(&count), next_actconn));
		}

		/* be careful below, the listener might be shutting down in
		 * another thread on error and we must not dereference its
		 * FD without a bit of protection. If the receiver is not
		 * bound anymore, accept_conn() is not called and the default
		 * CO_AC_PERMERR status leads to the transient error path.
		 */
		cli_conn = NULL;
		status = CO_AC_PERMERR;

		HA_RWLOCK_RDLOCK(LISTENER_LOCK, &l->lock);
		if (l->rx.flags & RX_F_BOUND)
			cli_conn = l->rx.proto->accept_conn(l, &status);
		HA_RWLOCK_RDUNLOCK(LISTENER_LOCK, &l->lock);

		if (!cli_conn) {
			switch (status) {
			case CO_AC_DONE:
				/* the reserved slots are released at <end> */
				goto end;

			case CO_AC_RETRY: /* likely a signal */
				/* release the reserved slots right now since the
				 * next_*conn values are reset by the loop.
				 */
				_HA_ATOMIC_DEC(&l->nbconn);
				if (p)
					_HA_ATOMIC_DEC(&p->feconn);
				if (!(l->options & LI_O_UNLIMITED))
					_HA_ATOMIC_DEC(&actconn);
				continue;

			case CO_AC_YIELD:
				max_accept = 0;
				goto end;

			default:
				goto transient_error;
			}
		}

		/* The connection was accepted, it must be counted as such */
		if (l->counters)
			HA_ATOMIC_UPDATE_MAX(&l->counters->conn_max, next_conn);

		if (p) {
			HA_ATOMIC_UPDATE_MAX(&p->fe_counters.conn_max, next_feconn);
			proxy_inc_fe_conn_ctr(l, p);
		}

		if (!(l->options & LI_O_UNLIMITED)) {
			count = update_freq_ctr(&global.conn_per_sec, 1);
			HA_ATOMIC_UPDATE_MAX(&global.cps_max, count);
		}

		_HA_ATOMIC_INC(&activity[tid].accepted);

		/* past this point, l->accept() will automatically decrement
		 * l->nbconn, feconn and actconn once done. Setting next_*conn=0
		 * allows the error path not to rollback on nbconn. It's more
		 * convenient than duplicating all exit labels.
		 */
		next_conn = 0;
		next_feconn = 0;
		next_actconn = 0;


#if defined(USE_THREAD)
		if (l->rx.flags & RX_F_LOCAL_ACCEPT)
			goto local_accept;

		mask = l->rx.bind_thread & tg->threads_enabled;
		if (atleast2(mask) && (global.tune.options & GTUNE_LISTENER_MQ) && !stopping) {
			struct accept_queue_ring *ring;
			unsigned int t, t0, t1, t2;
			int base = tg->base;

			/* The principle is that we have two running indexes,
			 * each visiting in turn all threads bound to this
			 * listener. The connection will be assigned to the one
			 * with the least connections, and the other one will
			 * be updated. This provides a good fairness on short
			 * connections (round robin) and on long ones (conn
			 * count), without ever missing any idle thread.
			 */

			/* keep a copy for the final update. thr_idx is composite
			 * and made of (t2<<16) + t1.
			 */
			t0 = l->thr_idx;
			do {
				unsigned long m1, m2;
				int q1, q2;

				t2 = t1 = t0;
				t2 >>= 16;
				t1 &= 0xFFFF;

				/* t1 walks low to high bits ;
				 * t2 walks high to low.
				 */
				m1 = mask >> t1;
				m2 = mask & (t2 ? nbits(t2 + 1) : ~0UL);

				if (unlikely(!(m1 & 1))) {
					/* t1 does not designate a thread of the
					 * mask, move it to the next one, wrapping
					 * to the lowest one if needed.
					 */
					m1 &= ~1UL;
					if (!m1) {
						m1 = mask;
						t1 = 0;
					}
					t1 += my_ffsl(m1) - 1;
				}

				if (unlikely(!(m2 & (1UL << t2)) || t1 == t2)) {
					/* highest bit not set */
					if (!m2)
						m2 = mask;

					t2 = my_flsl(m2) - 1;
				}

				/* now we have two distinct thread IDs belonging to the mask */
				q1 = accept_queue_rings[base + t1].tail - accept_queue_rings[base + t1].head + ACCEPT_QUEUE_SIZE;
				if (q1 >= ACCEPT_QUEUE_SIZE)
					q1 -= ACCEPT_QUEUE_SIZE;

				q2 = accept_queue_rings[base + t2].tail - accept_queue_rings[base + t2].head + ACCEPT_QUEUE_SIZE;
				if (q2 >= ACCEPT_QUEUE_SIZE)
					q2 -= ACCEPT_QUEUE_SIZE;

				/* we have 3 possibilities now :
				 *   q1 < q2 : t1 is less loaded than t2, so we pick it
				 *             and update t2 (since t1 might still be
				 *             lower than another thread)
				 *   q1 > q2 : t2 is less loaded than t1, so we pick it
				 *             and update t1 (since t2 might still be
				 *             lower than another thread)
				 *   q1 = q2 : both are equally loaded, thus we pick t1
				 *             and update t1 as it will become more loaded
				 *             than t2.
				 */

				q1 += l->thr_conn[base + t1];
				q2 += l->thr_conn[base + t2];

				if (q1 - q2 < 0) {
					t = t1;
					t2 = t2 ? t2 - 1 : LONGBITS - 1;
				}
				else if (q1 - q2 > 0) {
					t = t2;
					t1++;
					if (t1 >= LONGBITS)
						t1 = 0;
				}
				else {
					t = t1;
					t1++;
					if (t1 >= LONGBITS)
						t1 = 0;
				}

				/* new value for thr_idx */
				t1 += (t2 << 16);
			} while (unlikely(!_HA_ATOMIC_CAS(&l->thr_idx, &t0, t1)));

			/* We successfully selected the best thread "t" for this
			 * connection. We use deferred accepts even if it's the
			 * local thread because tests show that it's the best
			 * performing model, likely due to better cache locality
			 * when processing this loop.
			 */
			ring = &accept_queue_rings[base + t];
			if (accept_queue_push_mp(ring, cli_conn)) {
				_HA_ATOMIC_INC(&activity[base + t].accq_pushed);
				tasklet_wakeup(ring->tasklet);
				continue;
			}
			/* If the ring is full we do a synchronous accept on
			 * the local thread here.
			 */
			_HA_ATOMIC_INC(&activity[base + t].accq_full);
		}
#endif // USE_THREAD

 local_accept:
		_HA_ATOMIC_INC(&l->thr_conn[tid]);
		ret = l->accept(cli_conn);
		if (unlikely(ret <= 0)) {
			/* The connection was closed by l->accept(). Either
			 * we just have to ignore it (ret == 0) or it's a critical
			 * error due to a resource shortage, and we must stop the
			 * listener (ret < 0).
			 */
			if (ret == 0) /* successful termination */
				continue;

			goto transient_error;
		}

		/* increase the per-process number of cumulated sessions, this
		 * may only be done once l->accept() has accepted the connection.
		 */
		if (!(l->options & LI_O_UNLIMITED)) {
			count = update_freq_ctr(&global.sess_per_sec, 1);
			HA_ATOMIC_UPDATE_MAX(&global.sps_max, count);
		}
#ifdef USE_OPENSSL
		if (!(l->options & LI_O_UNLIMITED) &&
		    l->bind_conf && l->bind_conf->options & BC_O_USE_SSL) {
			count = update_freq_ctr(&global.ssl_per_sec, 1);
			HA_ATOMIC_UPDATE_MAX(&global.ssl_max, count);
		}
#endif

		_HA_ATOMIC_AND(&th_ctx->flags, ~TH_FL_STUCK); // this thread is still running
	} /* end of for (max_accept--) */

 end:
	/* roll back the pre-increments which were not consumed by a connection
	 * handed over to l->accept() (see the next_*conn resets above).
	 */
	if (next_conn)
		_HA_ATOMIC_DEC(&l->nbconn);

	if (p && next_feconn)
		_HA_ATOMIC_DEC(&p->feconn);

	if (next_actconn)
		_HA_ATOMIC_DEC(&actconn);

	if ((l->state == LI_FULL && (!l->maxconn || l->nbconn < l->maxconn)) ||
	    (l->state == LI_LIMITED &&
	     ((!p || p->feconn < p->maxconn) && (actconn < global.maxconn) &&
	      (!tick_isset(global_listener_queue_task->expire) ||
	       tick_is_expired(global_listener_queue_task->expire, now_ms))))) {
		/* at least one thread has to do this when quitting */
		resume_listener(l, 0);

		/* Dequeues all of the listeners waiting for a resource */
		dequeue_all_listeners();

		if (p && !MT_LIST_ISEMPTY(&p->listener_queue) &&
		    (!p->fe_sps_lim || freq_ctr_remain(&p->fe_sess_per_sec, p->fe_sps_lim, 0) > 0))
			dequeue_proxy_listeners(p);
	}
	return;

 transient_error:
	/* pause the listener for up to 100 ms */
	expire = tick_add(now_ms, 100);

	/* This may be a shared socket that was paused by another process.
	 * Let's put it to pause in this case.
	 */
	if (l->rx.proto && l->rx.proto->rx_listening(&l->rx) == 0) {
		pause_listener(l, 0);
		goto end;
	}

	/* otherwise fall through to the global limitation below */

 limit_global:
	/* (re-)queue the listener to the global queue and set it to expire no
	 * later than <expire> ahead. The listener turns to LI_LIMITED.
	 */
	limit_listener(l, &global_listener_queue);
	HA_RWLOCK_RDLOCK(LISTENER_LOCK, &global_listener_rwlock);
	task_schedule(global_listener_queue_task, expire);
	HA_RWLOCK_RDUNLOCK(LISTENER_LOCK, &global_listener_rwlock);
	goto end;

 limit_proxy:
	/* (re-)queue the listener to the proxy's queue and set it to expire no
	 * later than <expire> ahead. The listener turns to LI_LIMITED. This
	 * label is only jumped to from places where <p> was checked non-NULL.
	 * No wakeup is scheduled when <expire> is not set (TICK_ETERNITY).
	 */
	limit_listener(l, &p->listener_queue);
	if (p->task && tick_isset(expire))
		task_schedule(p->task, expire);
	goto end;
}
1225
Willy Tarreau05f50472017-09-15 09:19:58 +02001226/* Notify the listener that a connection initiated from it was released. This
1227 * is used to keep the connection count consistent and to possibly re-open
1228 * listening when it was limited.
1229 */
1230void listener_release(struct listener *l)
1231{
1232 struct proxy *fe = l->bind_conf->frontend;
1233
1234 if (!(l->options & LI_O_UNLIMITED))
Willy Tarreau4781b152021-04-06 13:53:36 +02001235 _HA_ATOMIC_DEC(&actconn);
Willy Tarreau82c97892019-02-27 19:32:32 +01001236 if (fe)
Willy Tarreau4781b152021-04-06 13:53:36 +02001237 _HA_ATOMIC_DEC(&fe->feconn);
1238 _HA_ATOMIC_DEC(&l->nbconn);
1239 _HA_ATOMIC_DEC(&l->thr_conn[tid]);
Willy Tarreau82c97892019-02-27 19:32:32 +01001240
1241 if (l->state == LI_FULL || l->state == LI_LIMITED)
Aurelien DARRAGON00132882022-09-09 15:32:57 +02001242 resume_listener(l, 0);
Willy Tarreau05f50472017-09-15 09:19:58 +02001243
Willy Tarreau02757d02021-01-28 18:07:24 +01001244 /* Dequeues all of the listeners waiting for a resource */
1245 dequeue_all_listeners();
1246
Aurelien DARRAGONa57786e2022-09-12 09:26:21 +02001247 if (fe && !MT_LIST_ISEMPTY(&fe->listener_queue) &&
Willy Tarreau05f50472017-09-15 09:19:58 +02001248 (!fe->fe_sps_lim || freq_ctr_remain(&fe->fe_sess_per_sec, fe->fe_sps_lim, 0) > 0))
Willy Tarreau241797a2019-12-10 14:10:52 +01001249 dequeue_proxy_listeners(fe);
Willy Tarreau05f50472017-09-15 09:19:58 +02001250}
1251
Willy Tarreauf2cb1692019-07-11 10:08:31 +02001252/* Initializes the listener queues. Returns 0 on success, otherwise ERR_* flags */
1253static int listener_queue_init()
1254{
Willy Tarreaubeeabf52021-10-01 18:23:30 +02001255 global_listener_queue_task = task_new_anywhere();
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001256 if (!global_listener_queue_task) {
1257 ha_alert("Out of memory when initializing global listener queue\n");
1258 return ERR_FATAL|ERR_ABORT;
1259 }
1260 /* very simple initialization, users will queue the task if needed */
1261 global_listener_queue_task->context = NULL; /* not even a context! */
1262 global_listener_queue_task->process = manage_global_listener_queue;
Christopher Faulet13e86d92022-11-17 14:40:20 +01001263 HA_RWLOCK_INIT(&global_listener_rwlock);
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001264
Willy Tarreauf2cb1692019-07-11 10:08:31 +02001265 return 0;
1266}
1267
1268static void listener_queue_deinit()
1269{
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001270 task_destroy(global_listener_queue_task);
1271 global_listener_queue_task = NULL;
Willy Tarreauf2cb1692019-07-11 10:08:31 +02001272}
1273
1274REGISTER_CONFIG_POSTPARSER("multi-threaded listener queue", listener_queue_init);
1275REGISTER_POST_DEINIT(listener_queue_deinit);
1276
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001277
1278/* This is the global management task for listeners. It enables listeners waiting
1279 * for global resources when there are enough free resource, or at least once in
Willy Tarreaud597ec22021-01-29 14:29:06 +01001280 * a while. It is designed to be called as a task. It's exported so that it's easy
1281 * to spot in "show tasks" or "show profiling".
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001282 */
Willy Tarreau144f84a2021-03-02 16:09:26 +01001283struct task *manage_global_listener_queue(struct task *t, void *context, unsigned int state)
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001284{
1285 /* If there are still too many concurrent connections, let's wait for
1286 * some of them to go away. We don't need to re-arm the timer because
1287 * each of them will scan the queue anyway.
1288 */
1289 if (unlikely(actconn >= global.maxconn))
1290 goto out;
1291
1292 /* We should periodically try to enable listeners waiting for a global
1293 * resource here, because it is possible, though very unlikely, that
1294 * they have been blocked by a temporary lack of global resource such
1295 * as a file descriptor or memory and that the temporary condition has
1296 * disappeared.
1297 */
1298 dequeue_all_listeners();
1299
1300 out:
Christopher Faulet13e86d92022-11-17 14:40:20 +01001301 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &global_listener_rwlock);
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001302 t->expire = TICK_ETERNITY;
Christopher Faulet13e86d92022-11-17 14:40:20 +01001303 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &global_listener_rwlock);
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001304 return t;
1305}
1306
/*
 * Registers the bind keyword list <kwl> as a list of valid keywords for next
 * parsing sessions. The list is appended at the tail of the global
 * <bind_keywords> list, which is the one walked by bind_find_kw(),
 * bind_dump_kws() and bind_find_best_kw().
 */
void bind_register_keywords(struct bind_kw_list *kwl)
{
	LIST_APPEND(&bind_keywords.list, &kwl->list);
}
1315
1316/* Return a pointer to the bind keyword <kw>, or NULL if not found. If the
1317 * keyword is found with a NULL ->parse() function, then an attempt is made to
1318 * find one with a valid ->parse() function. This way it is possible to declare
1319 * platform-dependant, known keywords as NULL, then only declare them as valid
1320 * if some options are met. Note that if the requested keyword contains an
1321 * opening parenthesis, everything from this point is ignored.
1322 */
1323struct bind_kw *bind_find_kw(const char *kw)
1324{
1325 int index;
1326 const char *kwend;
1327 struct bind_kw_list *kwl;
1328 struct bind_kw *ret = NULL;
1329
1330 kwend = strchr(kw, '(');
1331 if (!kwend)
1332 kwend = kw + strlen(kw);
1333
1334 list_for_each_entry(kwl, &bind_keywords.list, list) {
1335 for (index = 0; kwl->kw[index].kw != NULL; index++) {
1336 if ((strncmp(kwl->kw[index].kw, kw, kwend - kw) == 0) &&
1337 kwl->kw[index].kw[kwend-kw] == 0) {
1338 if (kwl->kw[index].parse)
1339 return &kwl->kw[index]; /* found it !*/
1340 else
1341 ret = &kwl->kw[index]; /* may be OK */
1342 }
1343 }
1344 }
1345 return ret;
1346}
1347
Willy Tarreau8638f482012-09-18 18:01:17 +02001348/* Dumps all registered "bind" keywords to the <out> string pointer. The
1349 * unsupported keywords are only dumped if their supported form was not
1350 * found.
1351 */
1352void bind_dump_kws(char **out)
1353{
1354 struct bind_kw_list *kwl;
1355 int index;
1356
Christopher Faulet784063e2020-05-18 12:14:18 +02001357 if (!out)
1358 return;
1359
Willy Tarreau8638f482012-09-18 18:01:17 +02001360 *out = NULL;
1361 list_for_each_entry(kwl, &bind_keywords.list, list) {
1362 for (index = 0; kwl->kw[index].kw != NULL; index++) {
1363 if (kwl->kw[index].parse ||
1364 bind_find_kw(kwl->kw[index].kw) == &kwl->kw[index]) {
Willy Tarreau51fb7652012-09-18 18:24:39 +02001365 memprintf(out, "%s[%4s] %s%s%s\n", *out ? *out : "",
1366 kwl->scope,
Willy Tarreau8638f482012-09-18 18:01:17 +02001367 kwl->kw[index].kw,
Willy Tarreau51fb7652012-09-18 18:24:39 +02001368 kwl->kw[index].skip ? " <arg>" : "",
1369 kwl->kw[index].parse ? "" : " (not supported)");
Willy Tarreau8638f482012-09-18 18:01:17 +02001370 }
1371 }
1372 }
1373}
1374
Willy Tarreau433b05f2021-03-12 10:14:07 +01001375/* Try to find in srv_keyword the word that looks closest to <word> by counting
1376 * transitions between letters, digits and other characters. Will return the
1377 * best matching word if found, otherwise NULL.
1378 */
1379const char *bind_find_best_kw(const char *word)
1380{
1381 uint8_t word_sig[1024];
1382 uint8_t list_sig[1024];
1383 const struct bind_kw_list *kwl;
1384 const char *best_ptr = NULL;
1385 int dist, best_dist = INT_MAX;
1386 int index;
1387
1388 make_word_fingerprint(word_sig, word);
1389 list_for_each_entry(kwl, &bind_keywords.list, list) {
1390 for (index = 0; kwl->kw[index].kw != NULL; index++) {
1391 make_word_fingerprint(list_sig, kwl->kw[index].kw);
1392 dist = word_fingerprint_distance(word_sig, list_sig);
1393 if (dist < best_dist) {
1394 best_dist = dist;
1395 best_ptr = kwl->kw[index].kw;
1396 }
1397 }
1398 }
1399
1400 if (best_dist > 2 * strlen(word) || (best_ptr && best_dist > 2 * strlen(best_ptr)))
1401 best_ptr = NULL;
1402
1403 return best_ptr;
1404}
1405
Willy Tarreaudbf78022021-10-06 09:05:08 +02001406/* allocate an bind_conf struct for a bind line, and chain it to the frontend <fe>.
1407 * If <arg> is not NULL, it is duplicated into ->arg to store useful config
1408 * information for error reporting. NULL is returned on error.
1409 */
1410struct bind_conf *bind_conf_alloc(struct proxy *fe, const char *file,
1411 int line, const char *arg, struct xprt_ops *xprt)
1412{
1413 struct bind_conf *bind_conf = calloc(1, sizeof(*bind_conf));
1414
1415 if (!bind_conf)
1416 goto err;
1417
1418 bind_conf->file = strdup(file);
1419 if (!bind_conf->file)
1420 goto err;
1421 bind_conf->line = line;
1422 if (arg) {
1423 bind_conf->arg = strdup(arg);
1424 if (!bind_conf->arg)
1425 goto err;
1426 }
1427
1428 LIST_APPEND(&fe->conf.bind, &bind_conf->by_fe);
1429 bind_conf->settings.ux.uid = -1;
1430 bind_conf->settings.ux.gid = -1;
1431 bind_conf->settings.ux.mode = 0;
Willy Tarreau6dfbef42021-10-12 15:23:03 +02001432 bind_conf->settings.shards = 1;
Willy Tarreaudbf78022021-10-06 09:05:08 +02001433 bind_conf->xprt = xprt;
1434 bind_conf->frontend = fe;
1435 bind_conf->severity_output = CLI_SEVERITY_NONE;
1436#ifdef USE_OPENSSL
1437 HA_RWLOCK_INIT(&bind_conf->sni_lock);
1438 bind_conf->sni_ctx = EB_ROOT;
1439 bind_conf->sni_w_ctx = EB_ROOT;
1440#endif
1441 LIST_INIT(&bind_conf->listeners);
1442 return bind_conf;
1443
1444 err:
1445 if (bind_conf) {
1446 ha_free(&bind_conf->file);
1447 ha_free(&bind_conf->arg);
1448 }
1449 ha_free(&bind_conf);
1450 return NULL;
1451}
1452
1453const char *listener_state_str(const struct listener *l)
1454{
1455 static const char *states[8] = {
1456 "NEW", "INI", "ASS", "PAU", "LIS", "RDY", "FUL", "LIM",
1457 };
1458 unsigned int st = l->state;
1459
1460 if (st >= sizeof(states) / sizeof(*states))
1461 return "INVALID";
1462 return states[st];
1463}
1464
Willy Tarreau645513a2010-05-24 20:55:15 +02001465/************************************************************************/
Willy Tarreau0ccb7442013-01-07 22:54:17 +01001466/* All supported sample and ACL keywords must be declared here. */
Willy Tarreau645513a2010-05-24 20:55:15 +02001467/************************************************************************/
1468
Willy Tarreaua5e37562011-12-16 17:06:15 +01001469/* set temp integer to the number of connexions to the same listening socket */
Willy Tarreau645513a2010-05-24 20:55:15 +02001470static int
Thierry FOURNIER0786d052015-05-11 15:42:45 +02001471smp_fetch_dconn(const struct arg *args, struct sample *smp, const char *kw, void *private)
Willy Tarreau645513a2010-05-24 20:55:15 +02001472{
Thierry FOURNIER8c542ca2015-08-19 09:00:18 +02001473 smp->data.type = SMP_T_SINT;
Thierry FOURNIER136f9d32015-08-19 09:07:19 +02001474 smp->data.u.sint = smp->sess->listener->nbconn;
Willy Tarreau645513a2010-05-24 20:55:15 +02001475 return 1;
1476}
1477
Willy Tarreaua5e37562011-12-16 17:06:15 +01001478/* set temp integer to the id of the socket (listener) */
Willy Tarreau645513a2010-05-24 20:55:15 +02001479static int
Thierry FOURNIER0786d052015-05-11 15:42:45 +02001480smp_fetch_so_id(const struct arg *args, struct sample *smp, const char *kw, void *private)
Willy Tarreau37406352012-04-23 16:16:37 +02001481{
Thierry FOURNIER8c542ca2015-08-19 09:00:18 +02001482 smp->data.type = SMP_T_SINT;
Thierry FOURNIER136f9d32015-08-19 09:07:19 +02001483 smp->data.u.sint = smp->sess->listener->luid;
Willy Tarreau645513a2010-05-24 20:55:15 +02001484 return 1;
1485}
Jerome Magnineb421b22020-03-27 22:08:40 +01001486static int
1487smp_fetch_so_name(const struct arg *args, struct sample *smp, const char *kw, void *private)
1488{
1489 smp->data.u.str.area = smp->sess->listener->name;
1490 if (!smp->data.u.str.area)
1491 return 0;
1492
1493 smp->data.type = SMP_T_STR;
1494 smp->flags = SMP_F_CONST;
1495 smp->data.u.str.data = strlen(smp->data.u.str.area);
1496 return 1;
1497}
Willy Tarreau645513a2010-05-24 20:55:15 +02001498
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001499/* parse the "accept-proxy" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001500static int bind_parse_accept_proxy(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001501{
1502 struct listener *l;
1503
Willy Tarreau4348fad2012-09-20 16:48:07 +02001504 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001505 l->options |= LI_O_ACC_PROXY;
1506
1507 return 0;
1508}
1509
Bertrand Jacquin93b227d2016-06-04 15:11:10 +01001510/* parse the "accept-netscaler-cip" bind keyword */
1511static int bind_parse_accept_netscaler_cip(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1512{
1513 struct listener *l;
1514 uint32_t val;
1515
1516 if (!*args[cur_arg + 1]) {
1517 memprintf(err, "'%s' : missing value", args[cur_arg]);
1518 return ERR_ALERT | ERR_FATAL;
1519 }
1520
1521 val = atol(args[cur_arg + 1]);
1522 if (val <= 0) {
Willy Tarreaue2711c72019-02-27 15:39:41 +01001523 memprintf(err, "'%s' : invalid value %d, must be >= 0", args[cur_arg], val);
Bertrand Jacquin93b227d2016-06-04 15:11:10 +01001524 return ERR_ALERT | ERR_FATAL;
1525 }
1526
1527 list_for_each_entry(l, &conf->listeners, by_bind) {
1528 l->options |= LI_O_ACC_CIP;
1529 conf->ns_cip_magic = val;
1530 }
1531
1532 return 0;
1533}
1534
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001535/* parse the "backlog" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001536static int bind_parse_backlog(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001537{
1538 struct listener *l;
1539 int val;
1540
1541 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001542 memprintf(err, "'%s' : missing value", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001543 return ERR_ALERT | ERR_FATAL;
1544 }
1545
1546 val = atol(args[cur_arg + 1]);
Willy Tarreaue2711c72019-02-27 15:39:41 +01001547 if (val < 0) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001548 memprintf(err, "'%s' : invalid value %d, must be > 0", args[cur_arg], val);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001549 return ERR_ALERT | ERR_FATAL;
1550 }
1551
Willy Tarreau4348fad2012-09-20 16:48:07 +02001552 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001553 l->backlog = val;
1554
1555 return 0;
1556}
1557
1558/* parse the "id" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001559static int bind_parse_id(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001560{
1561 struct eb32_node *node;
Willy Tarreau4348fad2012-09-20 16:48:07 +02001562 struct listener *l, *new;
Thierry Fourniere7fe8eb2016-02-26 08:45:58 +01001563 char *error;
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001564
Willy Tarreau4348fad2012-09-20 16:48:07 +02001565 if (conf->listeners.n != conf->listeners.p) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001566 memprintf(err, "'%s' can only be used with a single socket", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001567 return ERR_ALERT | ERR_FATAL;
1568 }
1569
1570 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001571 memprintf(err, "'%s' : expects an integer argument", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001572 return ERR_ALERT | ERR_FATAL;
1573 }
1574
Willy Tarreau4348fad2012-09-20 16:48:07 +02001575 new = LIST_NEXT(&conf->listeners, struct listener *, by_bind);
Thierry Fourniere7fe8eb2016-02-26 08:45:58 +01001576 new->luid = strtol(args[cur_arg + 1], &error, 10);
1577 if (*error != '\0') {
1578 memprintf(err, "'%s' : expects an integer argument, found '%s'", args[cur_arg], args[cur_arg + 1]);
1579 return ERR_ALERT | ERR_FATAL;
1580 }
Willy Tarreau4348fad2012-09-20 16:48:07 +02001581 new->conf.id.key = new->luid;
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001582
Willy Tarreau4348fad2012-09-20 16:48:07 +02001583 if (new->luid <= 0) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001584 memprintf(err, "'%s' : custom id has to be > 0", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001585 return ERR_ALERT | ERR_FATAL;
1586 }
1587
Willy Tarreau4348fad2012-09-20 16:48:07 +02001588 node = eb32_lookup(&px->conf.used_listener_id, new->luid);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001589 if (node) {
1590 l = container_of(node, struct listener, conf.id);
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001591 memprintf(err, "'%s' : custom id %d already used at %s:%d ('bind %s')",
1592 args[cur_arg], l->luid, l->bind_conf->file, l->bind_conf->line,
1593 l->bind_conf->arg);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001594 return ERR_ALERT | ERR_FATAL;
1595 }
1596
Willy Tarreau4348fad2012-09-20 16:48:07 +02001597 eb32_insert(&px->conf.used_listener_id, &new->conf.id);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001598 return 0;
1599}
1600
Willy Tarreau3882d2a2022-05-20 15:41:45 +02001601/* Complete a bind_conf by parsing the args after the address. <args> is the
1602 * arguments array, <cur_arg> is the first one to be considered. <section> is
1603 * the section name to report in error messages, and <file> and <linenum> are
1604 * the file name and line number respectively. Note that args[0..1] are used
1605 * in error messages to provide some context. The return value is an error
1606 * code, zero on success or an OR of ERR_{FATAL,ABORT,ALERT,WARN}.
1607 */
1608int bind_parse_args_list(struct bind_conf *bind_conf, char **args, int cur_arg, const char *section, const char *file, int linenum)
1609{
1610 int err_code = 0;
1611
1612 while (*(args[cur_arg])) {
1613 struct bind_kw *kw;
1614 const char *best;
1615
1616 kw = bind_find_kw(args[cur_arg]);
1617 if (kw) {
1618 char *err = NULL;
1619 int code;
1620
1621 if (!kw->parse) {
1622 ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : '%s' option is not implemented in this version (check build options).\n",
1623 file, linenum, args[0], args[1], section, args[cur_arg]);
1624 cur_arg += 1 + kw->skip ;
1625 err_code |= ERR_ALERT | ERR_FATAL;
1626 goto out;
1627 }
1628
1629 code = kw->parse(args, cur_arg, bind_conf->frontend, bind_conf, &err);
1630 err_code |= code;
1631
1632 if (code) {
1633 if (err && *err) {
1634 indent_msg(&err, 2);
1635 if (((code & (ERR_WARN|ERR_ALERT)) == ERR_WARN))
1636 ha_warning("parsing [%s:%d] : '%s %s' in section '%s' : %s\n", file, linenum, args[0], args[1], section, err);
1637 else
1638 ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : %s\n", file, linenum, args[0], args[1], section, err);
1639 }
1640 else
1641 ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : error encountered while processing '%s'.\n",
1642 file, linenum, args[0], args[1], section, args[cur_arg]);
1643 if (code & ERR_FATAL) {
1644 free(err);
1645 cur_arg += 1 + kw->skip;
1646 goto out;
1647 }
1648 }
1649 free(err);
1650 cur_arg += 1 + kw->skip;
1651 continue;
1652 }
1653
1654 best = bind_find_best_kw(args[cur_arg]);
1655 if (best)
1656 ha_alert("parsing [%s:%d] : '%s %s' in section '%s': unknown keyword '%s'; did you mean '%s' maybe ?\n",
1657 file, linenum, args[0], args[1], section, args[cur_arg], best);
1658 else
1659 ha_alert("parsing [%s:%d] : '%s %s' in section '%s': unknown keyword '%s'.\n",
1660 file, linenum, args[0], args[1], section, args[cur_arg]);
1661
1662 err_code |= ERR_ALERT | ERR_FATAL;
1663 goto out;
1664 }
Willy Tarreau64306cc2022-05-20 16:20:52 +02001665
1666 if ((bind_conf->options & (BC_O_USE_SOCK_DGRAM|BC_O_USE_SOCK_STREAM)) == (BC_O_USE_SOCK_DGRAM|BC_O_USE_SOCK_STREAM) ||
1667 (bind_conf->options & (BC_O_USE_XPRT_DGRAM|BC_O_USE_XPRT_STREAM)) == (BC_O_USE_XPRT_DGRAM|BC_O_USE_XPRT_STREAM)) {
1668 ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : cannot mix datagram and stream protocols.\n",
1669 file, linenum, args[0], args[1], section);
1670 err_code |= ERR_ALERT | ERR_FATAL;
1671 goto out;
1672 }
1673
Willy Tarreau78d0dcd2022-05-20 17:10:00 +02001674 /* The transport layer automatically switches to QUIC when QUIC is
1675 * selected, regardless of bind_conf settings. We then need to
1676 * initialize QUIC params.
1677 */
1678 if ((bind_conf->options & (BC_O_USE_SOCK_DGRAM|BC_O_USE_XPRT_STREAM)) == (BC_O_USE_SOCK_DGRAM|BC_O_USE_XPRT_STREAM)) {
1679#ifdef USE_QUIC
1680 bind_conf->xprt = xprt_get(XPRT_QUIC);
Willy Tarreau287f32f2022-05-20 18:16:52 +02001681 if (!(bind_conf->options & BC_O_USE_SSL)) {
1682 bind_conf->options |= BC_O_USE_SSL;
1683 ha_warning("parsing [%s:%d] : '%s %s' in section '%s' : QUIC protocol detected, enabling ssl. Use 'ssl' to shut this warning.\n",
1684 file, linenum, args[0], args[1], section);
1685 }
Willy Tarreau78d0dcd2022-05-20 17:10:00 +02001686 quic_transport_params_init(&bind_conf->quic_params, 1);
1687#else
1688 ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : QUIC protocol selected but support not compiled in (check build options).\n",
1689 file, linenum, args[0], args[1], section);
1690 err_code |= ERR_ALERT | ERR_FATAL;
1691 goto out;
1692#endif
1693 }
Willy Tarreau2071a992022-05-20 17:14:31 +02001694 else if (bind_conf->options & BC_O_USE_SSL) {
1695 bind_conf->xprt = xprt_get(XPRT_SSL);
1696 }
Willy Tarreau78d0dcd2022-05-20 17:10:00 +02001697
Willy Tarreau3882d2a2022-05-20 15:41:45 +02001698 out:
1699 return err_code;
1700}
1701
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001702/* parse the "maxconn" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001703static int bind_parse_maxconn(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001704{
1705 struct listener *l;
1706 int val;
1707
1708 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001709 memprintf(err, "'%s' : missing value", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001710 return ERR_ALERT | ERR_FATAL;
1711 }
1712
1713 val = atol(args[cur_arg + 1]);
Willy Tarreaua8cf66b2019-02-27 16:49:00 +01001714 if (val < 0) {
1715 memprintf(err, "'%s' : invalid value %d, must be >= 0", args[cur_arg], val);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001716 return ERR_ALERT | ERR_FATAL;
1717 }
1718
Willy Tarreau4348fad2012-09-20 16:48:07 +02001719 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001720 l->maxconn = val;
1721
1722 return 0;
1723}
1724
1725/* parse the "name" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001726static int bind_parse_name(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001727{
1728 struct listener *l;
1729
1730 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001731 memprintf(err, "'%s' : missing name", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001732 return ERR_ALERT | ERR_FATAL;
1733 }
1734
Willy Tarreau4348fad2012-09-20 16:48:07 +02001735 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001736 l->name = strdup(args[cur_arg + 1]);
1737
1738 return 0;
1739}
1740
1741/* parse the "nice" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001742static int bind_parse_nice(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001743{
1744 struct listener *l;
1745 int val;
1746
1747 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001748 memprintf(err, "'%s' : missing value", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001749 return ERR_ALERT | ERR_FATAL;
1750 }
1751
1752 val = atol(args[cur_arg + 1]);
1753 if (val < -1024 || val > 1024) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001754 memprintf(err, "'%s' : invalid value %d, allowed range is -1024..1024", args[cur_arg], val);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001755 return ERR_ALERT | ERR_FATAL;
1756 }
1757
Willy Tarreau4348fad2012-09-20 16:48:07 +02001758 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001759 l->nice = val;
1760
1761 return 0;
1762}
1763
/* Parses the "process" bind keyword. The keyword is no longer supported: the
 * function unconditionally stores into <err> a message inviting to use
 * "thread" instead, and returns ERR_ALERT|ERR_FATAL. The keyword's argument is
 * only used to build the error message.
 */
static int bind_parse_process(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
{
	memprintf(err, "'process %s' on 'bind' lines is not supported anymore, please use 'thread' instead.", args[cur_arg+1]);
	return ERR_ALERT | ERR_FATAL;
}
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001770
Christopher Fauleta717b992018-04-10 14:43:00 +02001771/* parse the "proto" bind keyword */
1772static int bind_parse_proto(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1773{
1774 struct ist proto;
1775
1776 if (!*args[cur_arg + 1]) {
1777 memprintf(err, "'%s' : missing value", args[cur_arg]);
1778 return ERR_ALERT | ERR_FATAL;
1779 }
1780
Tim Duesterhusdcf753a2021-03-04 17:31:47 +01001781 proto = ist(args[cur_arg + 1]);
Christopher Fauleta717b992018-04-10 14:43:00 +02001782 conf->mux_proto = get_mux_proto(proto);
1783 if (!conf->mux_proto) {
1784 memprintf(err, "'%s' : unknown MUX protocol '%s'", args[cur_arg], args[cur_arg+1]);
1785 return ERR_ALERT | ERR_FATAL;
1786 }
Willy Tarreauc8cac042021-09-21 14:31:29 +02001787 return 0;
1788}
1789
Willy Tarreau6dfbef42021-10-12 15:23:03 +02001790/* parse the "shards" bind keyword. Takes an integer or "by-thread" */
1791static int bind_parse_shards(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1792{
1793 int val;
1794
1795 if (!*args[cur_arg + 1]) {
1796 memprintf(err, "'%s' : missing value", args[cur_arg]);
1797 return ERR_ALERT | ERR_FATAL;
1798 }
1799
1800 if (strcmp(args[cur_arg + 1], "by-thread") == 0) {
1801 val = MAX_THREADS; /* will be trimmed later anyway */
1802 } else {
1803 val = atol(args[cur_arg + 1]);
1804 if (val < 1 || val > MAX_THREADS) {
1805 memprintf(err, "'%s' : invalid value %d, allowed range is %d..%d or 'by-thread'", args[cur_arg], val, 1, MAX_THREADS);
1806 return ERR_ALERT | ERR_FATAL;
1807 }
1808 }
1809
1810 conf->settings.shards = val;
1811 return 0;
1812}
1813
Willy Tarreauc8cac042021-09-21 14:31:29 +02001814/* parse the "thread" bind keyword */
1815static int bind_parse_thread(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1816{
Willy Tarreaud57b9ff2021-09-29 18:50:31 +02001817 char *sep = NULL;
1818 ulong thread = 0;
1819 long tgroup = 0;
Willy Tarreauc8cac042021-09-21 14:31:29 +02001820
Willy Tarreaud57b9ff2021-09-29 18:50:31 +02001821 tgroup = strtol(args[cur_arg + 1], &sep, 10);
1822 if (*sep == '/') {
1823 /* a thread group was present */
1824 if (tgroup < 1 || tgroup > MAX_TGROUPS) {
1825 memprintf(err, "'%s' thread-group number must be between 1 and %d (was %ld)", args[cur_arg + 1], MAX_TGROUPS, tgroup);
1826 return ERR_ALERT | ERR_FATAL;
1827 }
1828 sep++;
1829 }
1830 else {
1831 /* no thread group */
1832 tgroup = 0;
1833 sep = args[cur_arg + 1];
1834 }
Willy Tarreauc8cac042021-09-21 14:31:29 +02001835
Willy Tarreau01cac3f2021-10-12 08:47:54 +02001836 if ((conf->bind_tgroup || conf->bind_thread) &&
1837 conf->bind_tgroup != tgroup) {
Willy Tarreaud57b9ff2021-09-29 18:50:31 +02001838 memprintf(err, "'%s' multiple thread-groups are not supported", args[cur_arg + 1]);
Willy Tarreauc8cac042021-09-21 14:31:29 +02001839 return ERR_ALERT | ERR_FATAL;
1840 }
Willy Tarreau740038c2022-07-15 17:18:23 +02001841
1842 if (parse_process_number(sep, &thread, LONGBITS, NULL, err)) {
Willy Tarreaud57b9ff2021-09-29 18:50:31 +02001843 memprintf(err, "'%s' : %s", sep, *err);
Willy Tarreauc8cac042021-09-21 14:31:29 +02001844 return ERR_ALERT | ERR_FATAL;
1845 }
1846
Willy Tarreau01cac3f2021-10-12 08:47:54 +02001847 conf->bind_thread |= thread;
1848 conf->bind_tgroup = tgroup;
Christopher Fauleta717b992018-04-10 14:43:00 +02001849 return 0;
1850}
1851
Willy Tarreau7ac908b2019-02-27 12:02:18 +01001852/* config parser for global "tune.listener.multi-queue", accepts "on" or "off" */
1853static int cfg_parse_tune_listener_mq(char **args, int section_type, struct proxy *curpx,
Willy Tarreau01825162021-03-09 09:53:46 +01001854 const struct proxy *defpx, const char *file, int line,
Willy Tarreau7ac908b2019-02-27 12:02:18 +01001855 char **err)
1856{
1857 if (too_many_args(1, args, err, NULL))
1858 return -1;
1859
1860 if (strcmp(args[1], "on") == 0)
1861 global.tune.options |= GTUNE_LISTENER_MQ;
1862 else if (strcmp(args[1], "off") == 0)
1863 global.tune.options &= ~GTUNE_LISTENER_MQ;
1864 else {
1865 memprintf(err, "'%s' expects either 'on' or 'off' but got '%s'.", args[0], args[1]);
1866 return -1;
1867 }
1868 return 0;
1869}
1870
/* Sample fetch keywords provided by this file; each entry maps a keyword to
 * its fetch function defined above, and the list ends with an empty entry.
 * Note: must not be declared <const> as its list will be overwritten.
 * Please take care of keeping this list alphabetically sorted.
 */
static struct sample_fetch_kw_list smp_kws = {ILH, {
	{ "dst_conn", smp_fetch_dconn,   0, NULL, SMP_T_SINT, SMP_USE_FTEND, },
	{ "so_id",    smp_fetch_so_id,   0, NULL, SMP_T_SINT, SMP_USE_FTEND, },
	{ "so_name",  smp_fetch_so_name, 0, NULL, SMP_T_STR,  SMP_USE_FTEND, },
	{ /* END */ },
}};

/* register the sample fetch keywords at the STG_REGISTER init stage */
INITCALL1(STG_REGISTER, sample_register_fetches, &smp_kws);
1882
/* ACL keywords provided by this file: the list currently only holds its end
 * marker.
 * Note: must not be declared <const> as its list will be overwritten.
 * Please take care of keeping this list alphabetically sorted.
 */
static struct acl_kw_list acl_kws = {ILH, {
	{ /* END */ },
}};

/* register the ACL keywords at the STG_REGISTER init stage */
INITCALL1(STG_REGISTER, acl_register_keywords, &acl_kws);
1891
/* "bind" keywords provided by this file, registered under the "ALL" scope.
 * Each entry holds the keyword, its parsing function, and the number of
 * arguments to skip after the keyword (see bind_parse_args_list()).
 * Note: must not be declared <const> as its list will be overwritten.
 * Please take care of keeping this list alphabetically sorted, doing so helps
 * all code contributors.
 * Optional keywords are also declared with a NULL ->parse() function so that
 * the config parser can report an appropriate error when a known keyword was
 * not enabled.
 */
static struct bind_kw_list bind_kws = { "ALL", { }, {
	{ "accept-netscaler-cip", bind_parse_accept_netscaler_cip, 1 }, /* enable NetScaler Client IP insertion protocol */
	{ "accept-proxy", bind_parse_accept_proxy, 0 }, /* enable PROXY protocol */
	{ "backlog", bind_parse_backlog, 1 }, /* set backlog of listening socket */
	{ "id", bind_parse_id, 1 }, /* set id of listening socket */
	{ "maxconn", bind_parse_maxconn, 1 }, /* set maxconn of listening socket */
	{ "name", bind_parse_name, 1 }, /* set name of listening socket */
	{ "nice", bind_parse_nice, 1 }, /* set nice of listening socket */
	{ "process", bind_parse_process, 1 }, /* no longer supported: always fails and points to "thread" */
	{ "proto", bind_parse_proto, 1 }, /* set the proto to use for all incoming connections */
	{ "shards", bind_parse_shards, 1 }, /* set number of shards */
	{ "thread", bind_parse_thread, 1 }, /* set list of allowed threads for this socket */
	{ /* END */ },
}};

/* register the bind keywords at the STG_REGISTER init stage */
INITCALL1(STG_REGISTER, bind_register_keywords, &bind_kws);
1915
/* config keyword parsers: global section keywords handled by this file. The
 * list ends with an entry whose keyword is NULL.
 */
static struct cfg_kw_list cfg_kws = {ILH, {
	{ CFG_GLOBAL, "tune.listener.multi-queue", cfg_parse_tune_listener_mq },
	{ 0, NULL, NULL }
}};

/* register the config keywords at the STG_REGISTER init stage */
INITCALL1(STG_REGISTER, cfg_register_keywords, &cfg_kws);
1923
Willy Tarreau645513a2010-05-24 20:55:15 +02001924/*
1925 * Local variables:
1926 * c-indent-level: 8
1927 * c-basic-offset: 8
1928 * End:
1929 */