blob: bddc29f40d018ee3356fedce7e39132cc92dc37b [file] [log] [blame]
/*
 * Listener management functions.
 *
 * Copyright 2000-2013 Willy Tarreau <w@1wt.eu>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 *
 */
12
Willy Tarreau6ae1ba62014-05-07 19:01:58 +020013#include <ctype.h>
Willy Tarreaubbebbbf2012-05-07 21:22:09 +020014#include <errno.h>
Willy Tarreaudd815982007-10-16 12:25:14 +020015#include <stdio.h>
16#include <string.h>
Willy Tarreau95ccdde2014-02-01 09:28:36 +010017#include <unistd.h>
Willy Tarreaudd815982007-10-16 12:25:14 +020018
Willy Tarreaudcc048a2020-06-04 19:11:43 +020019#include <haproxy/acl.h>
Willy Tarreau4c7e4b72020-05-27 12:58:42 +020020#include <haproxy/api.h>
Willy Tarreau5d9ddc52021-10-06 19:54:09 +020021#include <haproxy/activity.h>
Willy Tarreau6be78492020-06-05 00:00:29 +020022#include <haproxy/cfgparse.h>
Willy Tarreaudbf78022021-10-06 09:05:08 +020023#include <haproxy/cli-t.h>
Willy Tarreau7ea393d2020-06-04 18:02:10 +020024#include <haproxy/connection.h>
Willy Tarreau8d366972020-05-27 16:10:29 +020025#include <haproxy/errors.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020026#include <haproxy/fd.h>
27#include <haproxy/freq_ctr.h>
Willy Tarreauf268ee82020-06-04 17:05:57 +020028#include <haproxy/global.h>
Willy Tarreau853b2972020-05-27 18:01:47 +020029#include <haproxy/list.h>
Willy Tarreau213e9902020-06-04 14:58:24 +020030#include <haproxy/listener.h>
Willy Tarreauaeed4a82020-06-04 22:01:04 +020031#include <haproxy/log.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020032#include <haproxy/protocol.h>
Willy Tarreau5958c432021-05-08 20:30:37 +020033#include <haproxy/proxy.h>
Frédéric Lécaille748ece62022-05-21 23:58:40 +020034#include <haproxy/quic_tp.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020035#include <haproxy/sample.h>
Willy Tarreaudfd3de82020-06-04 23:46:14 +020036#include <haproxy/stream.h>
Willy Tarreaucea0e1b2020-06-04 17:25:40 +020037#include <haproxy/task.h>
Willy Tarreau9310f482021-10-06 16:18:40 +020038#include <haproxy/ticks.h>
Willy Tarreaub2551052020-06-09 09:07:15 +020039#include <haproxy/tools.h>
Willy Tarreaudd815982007-10-16 12:25:14 +020040
Willy Tarreaub648d632007-10-28 22:13:50 +010041
Willy Tarreau26982662012-09-12 23:17:10 +020042/* List head of all known bind keywords */
Willy Tarreauca1acd62022-03-29 15:02:44 +020043struct bind_kw_list bind_keywords = {
Willy Tarreau26982662012-09-12 23:17:10 +020044 .list = LIST_HEAD_INIT(bind_keywords.list)
45};
46
Willy Tarreaua1d97f82019-12-10 11:18:41 +010047/* list of the temporarily limited listeners because of lack of resource */
48static struct mt_list global_listener_queue = MT_LIST_HEAD_INIT(global_listener_queue);
49static struct task *global_listener_queue_task;
Willy Tarreaua1d97f82019-12-10 11:18:41 +010050
William Dauchy3679d0c2021-02-14 23:22:55 +010051/* listener status for stats */
52const char* li_status_st[LI_STATE_COUNT] = {
53 [LI_STATUS_WAITING] = "WAITING",
54 [LI_STATUS_OPEN] = "OPEN",
55 [LI_STATUS_FULL] = "FULL",
56};
Willy Tarreaua1d97f82019-12-10 11:18:41 +010057
Willy Tarreau1efafce2019-01-27 15:37:19 +010058#if defined(USE_THREAD)
59
60struct accept_queue_ring accept_queue_rings[MAX_THREADS] __attribute__((aligned(64))) = { };
61
62/* dequeue and process a pending connection from the local accept queue (single
Willy Tarreau83efc322020-10-14 17:37:17 +020063 * consumer). Returns the accepted connection or NULL if none was found.
Willy Tarreau1efafce2019-01-27 15:37:19 +010064 */
Willy Tarreau83efc322020-10-14 17:37:17 +020065struct connection *accept_queue_pop_sc(struct accept_queue_ring *ring)
Willy Tarreau1efafce2019-01-27 15:37:19 +010066{
Willy Tarreau1efafce2019-01-27 15:37:19 +010067 unsigned int pos, next;
Willy Tarreau83efc322020-10-14 17:37:17 +020068 struct connection *ptr;
69 struct connection **e;
Willy Tarreau1efafce2019-01-27 15:37:19 +010070
71 pos = ring->head;
72
73 if (pos == ring->tail)
Willy Tarreau83efc322020-10-14 17:37:17 +020074 return NULL;
Willy Tarreau1efafce2019-01-27 15:37:19 +010075
76 next = pos + 1;
77 if (next >= ACCEPT_QUEUE_SIZE)
78 next = 0;
79
80 e = &ring->entry[pos];
81
82 /* wait for the producer to update the listener's pointer */
83 while (1) {
Willy Tarreau83efc322020-10-14 17:37:17 +020084 ptr = *e;
Willy Tarreau1efafce2019-01-27 15:37:19 +010085 __ha_barrier_load();
86 if (ptr)
87 break;
88 pl_cpu_relax();
89 }
90
Willy Tarreau1efafce2019-01-27 15:37:19 +010091 /* release the entry */
Willy Tarreau83efc322020-10-14 17:37:17 +020092 *e = NULL;
Willy Tarreau1efafce2019-01-27 15:37:19 +010093
94 __ha_barrier_store();
95 ring->head = next;
Willy Tarreau83efc322020-10-14 17:37:17 +020096 return ptr;
Willy Tarreau1efafce2019-01-27 15:37:19 +010097}
98
99
Willy Tarreau83efc322020-10-14 17:37:17 +0200100/* tries to push a new accepted connection <conn> into ring <ring>. Returns
101 * non-zero if it succeeds, or zero if the ring is full. Supports multiple
102 * producers.
Willy Tarreau1efafce2019-01-27 15:37:19 +0100103 */
Willy Tarreau83efc322020-10-14 17:37:17 +0200104int accept_queue_push_mp(struct accept_queue_ring *ring, struct connection *conn)
Willy Tarreau1efafce2019-01-27 15:37:19 +0100105{
Willy Tarreau1efafce2019-01-27 15:37:19 +0100106 unsigned int pos, next;
107
108 pos = ring->tail;
109 do {
110 next = pos + 1;
111 if (next >= ACCEPT_QUEUE_SIZE)
112 next = 0;
113 if (next == ring->head)
114 return 0; // ring full
Olivier Houchard64213e92019-03-08 18:52:57 +0100115 } while (unlikely(!_HA_ATOMIC_CAS(&ring->tail, &pos, next)));
Willy Tarreau1efafce2019-01-27 15:37:19 +0100116
Willy Tarreau83efc322020-10-14 17:37:17 +0200117 ring->entry[pos] = conn;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100118 __ha_barrier_store();
Willy Tarreau1efafce2019-01-27 15:37:19 +0100119 return 1;
120}
121
Willy Tarreaufb5401f2021-01-29 12:25:23 +0100122/* proceed with accepting new connections. Don't mark it static so that it appears
123 * in task dumps.
124 */
Willy Tarreau144f84a2021-03-02 16:09:26 +0100125struct task *accept_queue_process(struct task *t, void *context, unsigned int state)
Willy Tarreau1efafce2019-01-27 15:37:19 +0100126{
127 struct accept_queue_ring *ring = context;
Willy Tarreau83efc322020-10-14 17:37:17 +0200128 struct connection *conn;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100129 struct listener *li;
Christopher Faulet102854c2019-04-30 12:17:13 +0200130 unsigned int max_accept;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100131 int ret;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100132
Christopher Faulet102854c2019-04-30 12:17:13 +0200133 /* if global.tune.maxaccept is -1, then max_accept is UINT_MAX. It
134 * is not really illimited, but it is probably enough.
135 */
Willy Tarreau66161322021-02-19 15:50:27 +0100136 max_accept = global.tune.maxaccept ? global.tune.maxaccept : MAX_ACCEPT;
Christopher Faulet102854c2019-04-30 12:17:13 +0200137 for (; max_accept; max_accept--) {
Willy Tarreau83efc322020-10-14 17:37:17 +0200138 conn = accept_queue_pop_sc(ring);
139 if (!conn)
Willy Tarreau1efafce2019-01-27 15:37:19 +0100140 break;
141
Willy Tarreau83efc322020-10-14 17:37:17 +0200142 li = __objt_listener(conn->target);
Willy Tarreau4781b152021-04-06 13:53:36 +0200143 _HA_ATOMIC_INC(&li->thr_conn[tid]);
Willy Tarreau83efc322020-10-14 17:37:17 +0200144 ret = li->accept(conn);
Willy Tarreau1efafce2019-01-27 15:37:19 +0100145 if (ret <= 0) {
146 /* connection was terminated by the application */
147 continue;
148 }
149
150 /* increase the per-process number of cumulated sessions, this
151 * may only be done once l->accept() has accepted the connection.
152 */
153 if (!(li->options & LI_O_UNLIMITED)) {
154 HA_ATOMIC_UPDATE_MAX(&global.sps_max,
155 update_freq_ctr(&global.sess_per_sec, 1));
Willy Tarreau11ba4042022-05-20 15:56:32 +0200156 if (li->bind_conf && li->bind_conf->options & BC_O_USE_SSL) {
Willy Tarreau1efafce2019-01-27 15:37:19 +0100157 HA_ATOMIC_UPDATE_MAX(&global.ssl_max,
158 update_freq_ctr(&global.ssl_per_sec, 1));
159 }
160 }
161 }
162
163 /* ran out of budget ? Let's come here ASAP */
Christopher Faulet102854c2019-04-30 12:17:13 +0200164 if (!max_accept)
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200165 tasklet_wakeup(ring->tasklet);
Willy Tarreau1efafce2019-01-27 15:37:19 +0100166
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200167 return NULL;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100168}
169
170/* Initializes the accept-queues. Returns 0 on success, otherwise ERR_* flags */
171static int accept_queue_init()
172{
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200173 struct tasklet *t;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100174 int i;
175
176 for (i = 0; i < global.nbthread; i++) {
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200177 t = tasklet_new();
Willy Tarreau1efafce2019-01-27 15:37:19 +0100178 if (!t) {
179 ha_alert("Out of memory while initializing accept queue for thread %d\n", i);
180 return ERR_FATAL|ERR_ABORT;
181 }
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200182 t->tid = i;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100183 t->process = accept_queue_process;
184 t->context = &accept_queue_rings[i];
Willy Tarreau2bd65a72019-09-24 06:55:18 +0200185 accept_queue_rings[i].tasklet = t;
Willy Tarreau1efafce2019-01-27 15:37:19 +0100186 }
187 return 0;
188}
189
190REGISTER_CONFIG_POSTPARSER("multi-threaded accept queue", accept_queue_init);
191
Willy Tarreaue01b08d2022-04-27 18:42:47 +0200192static void accept_queue_deinit()
193{
194 int i;
195
196 for (i = 0; i < global.nbthread; i++) {
197 if (accept_queue_rings[i].tasklet)
198 tasklet_free(accept_queue_rings[i].tasklet);
199 }
200}
201
202REGISTER_POST_DEINIT(accept_queue_deinit);
203
Willy Tarreau1efafce2019-01-27 15:37:19 +0100204#endif // USE_THREAD
205
Amaury Denoyellef68b2cb2022-01-25 16:21:47 +0100206/* Memory allocation and initialization of the per_thr field.
207 * Returns 0 if the field has been successfully initialized, -1 on failure.
208 */
209int li_init_per_thr(struct listener *li)
210{
211 int i;
212
213 /* allocate per-thread elements for listener */
214 li->per_thr = calloc(global.nbthread, sizeof(*li->per_thr));
215 if (!li->per_thr)
216 return -1;
217
218 for (i = 0; i < global.nbthread; ++i) {
219 MT_LIST_INIT(&li->per_thr[i].quic_accept.list);
220 MT_LIST_INIT(&li->per_thr[i].quic_accept.conns);
221
222 li->per_thr[i].li = li;
223 }
224
225 return 0;
226}
227
William Dauchy3679d0c2021-02-14 23:22:55 +0100228/* helper to get listener status for stats */
229enum li_status get_li_status(struct listener *l)
230{
231 if (!l->maxconn || l->nbconn < l->maxconn) {
232 if (l->state == LI_LIMITED)
233 return LI_STATUS_WAITING;
234 else
235 return LI_STATUS_OPEN;
236 }
237 return LI_STATUS_FULL;
238}
239
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200240/* adjust the listener's state and its proxy's listener counters if needed.
241 * It must be called under the listener's lock, but uses atomic ops to change
242 * the proxy's counters so that the proxy lock is not needed.
243 */
Willy Tarreaua37b2442020-09-24 07:23:45 +0200244void listener_set_state(struct listener *l, enum li_state st)
245{
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200246 struct proxy *px = l->bind_conf->frontend;
247
248 if (px) {
249 /* from state */
250 switch (l->state) {
251 case LI_NEW: /* first call */
Willy Tarreau4781b152021-04-06 13:53:36 +0200252 _HA_ATOMIC_INC(&px->li_all);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200253 break;
254 case LI_INIT:
255 case LI_ASSIGNED:
256 break;
257 case LI_PAUSED:
Willy Tarreau4781b152021-04-06 13:53:36 +0200258 _HA_ATOMIC_DEC(&px->li_paused);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200259 break;
260 case LI_LISTEN:
Willy Tarreau4781b152021-04-06 13:53:36 +0200261 _HA_ATOMIC_DEC(&px->li_bound);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200262 break;
263 case LI_READY:
264 case LI_FULL:
265 case LI_LIMITED:
Willy Tarreau4781b152021-04-06 13:53:36 +0200266 _HA_ATOMIC_DEC(&px->li_ready);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200267 break;
268 }
269
270 /* to state */
271 switch (st) {
272 case LI_NEW:
273 case LI_INIT:
274 case LI_ASSIGNED:
275 break;
276 case LI_PAUSED:
Willy Tarreau95a34602020-10-08 15:32:21 +0200277 BUG_ON(l->rx.fd == -1);
Willy Tarreau4781b152021-04-06 13:53:36 +0200278 _HA_ATOMIC_INC(&px->li_paused);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200279 break;
280 case LI_LISTEN:
Willy Tarreau95a34602020-10-08 15:32:21 +0200281 BUG_ON(l->rx.fd == -1);
Willy Tarreau4781b152021-04-06 13:53:36 +0200282 _HA_ATOMIC_INC(&px->li_bound);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200283 break;
284 case LI_READY:
285 case LI_FULL:
286 case LI_LIMITED:
Willy Tarreau95a34602020-10-08 15:32:21 +0200287 BUG_ON(l->rx.fd == -1);
Willy Tarreau4781b152021-04-06 13:53:36 +0200288 _HA_ATOMIC_INC(&px->li_ready);
Willy Tarreauefc0eec2020-09-24 07:27:06 +0200289 break;
290 }
291 }
Willy Tarreaua37b2442020-09-24 07:23:45 +0200292 l->state = st;
293}
294
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100295/* This function adds the specified listener's file descriptor to the polling
296 * lists if it is in the LI_LISTEN state. The listener enters LI_READY or
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +0500297 * LI_FULL state depending on its number of connections. In daemon mode, we
Willy Tarreauae302532014-05-07 19:22:24 +0200298 * also support binding only the relevant processes to their respective
299 * listeners. We don't do that in debug mode however.
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100300 */
Willy Tarreau7834a3f2020-09-25 16:40:18 +0200301void enable_listener(struct listener *listener)
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100302{
Willy Tarreau08b6f962022-02-01 16:23:00 +0100303 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &listener->lock);
Willy Tarreaud6afb532020-10-09 10:35:40 +0200304
305 /* If this listener is supposed to be only in the master, close it in
306 * the workers. Conversely, if it's supposed to be only in the workers
307 * close it in the master.
308 */
Willy Tarreau18c20d22020-10-09 16:11:46 +0200309 if (!!master != !!(listener->rx.flags & RX_F_MWORKER))
Willy Tarreau75c98d12020-10-09 15:55:23 +0200310 do_unbind_listener(listener);
Willy Tarreaud6afb532020-10-09 10:35:40 +0200311
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100312 if (listener->state == LI_LISTEN) {
Willy Tarreau95a34602020-10-08 15:32:21 +0200313 BUG_ON(listener->rx.fd == -1);
William Lallemand095ba4c2017-06-01 17:38:50 +0200314 if ((global.mode & (MODE_DAEMON | MODE_MWORKER)) &&
Willy Tarreau72faef32021-06-15 08:36:30 +0200315 (!!master != !!(listener->rx.flags & RX_F_MWORKER))) {
Willy Tarreauae302532014-05-07 19:22:24 +0200316 /* we don't want to enable this listener and don't
317 * want any fd event to reach it.
318 */
Willy Tarreau75c98d12020-10-09 15:55:23 +0200319 do_unbind_listener(listener);
Willy Tarreauae302532014-05-07 19:22:24 +0200320 }
Willy Tarreaua8cf66b2019-02-27 16:49:00 +0100321 else if (!listener->maxconn || listener->nbconn < listener->maxconn) {
Willy Tarreau4b51f422020-09-25 20:32:28 +0200322 listener->rx.proto->enable(listener);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200323 listener_set_state(listener, LI_READY);
Willy Tarreauae302532014-05-07 19:22:24 +0200324 }
325 else {
Willy Tarreaua37b2442020-09-24 07:23:45 +0200326 listener_set_state(listener, LI_FULL);
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100327 }
328 }
Willy Tarreaud6afb532020-10-09 10:35:40 +0200329
Willy Tarreau08b6f962022-02-01 16:23:00 +0100330 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &listener->lock);
Willy Tarreaudabf2e22007-10-28 21:59:24 +0100331}
332
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200333/*
334 * This function completely stops a listener. It will need to operate under the
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200335 * It will need to operate under the proxy's lock and the protocol's lock.
336 * The caller is responsible for indicating in lpx, lpr whether the
337 * respective locks are already held (non-zero) or not (zero) so that the
338 * function picks the missing ones, in this order.
339 * The proxy's listeners count is updated and the proxy is
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200340 * disabled and woken up after the last one is gone.
341 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200342void stop_listener(struct listener *l, int lpx, int lpr)
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200343{
344 struct proxy *px = l->bind_conf->frontend;
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200345
346 if (l->options & LI_O_NOSTOP) {
347 /* master-worker sockpairs are never closed but don't count as a
348 * job.
349 */
350 return;
351 }
352
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200353 if (!lpx)
Willy Tarreauac66d6b2020-10-20 17:24:27 +0200354 HA_RWLOCK_WRLOCK(PROXY_LOCK, &px->lock);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200355
356 if (!lpr)
357 HA_SPIN_LOCK(PROTO_LOCK, &proto_lock);
358
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200359 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200360
361 if (l->state > LI_INIT) {
Willy Tarreau75c98d12020-10-09 15:55:23 +0200362 do_unbind_listener(l);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200363
364 if (l->state >= LI_ASSIGNED)
365 __delete_listener(l);
366
Willy Tarreauacde1522020-10-07 16:31:39 +0200367 proxy_cond_disable(px);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200368 }
369
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200370 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200371
372 if (!lpr)
373 HA_SPIN_UNLOCK(PROTO_LOCK, &proto_lock);
374
375 if (!lpx)
Willy Tarreauac66d6b2020-10-20 17:24:27 +0200376 HA_RWLOCK_WRUNLOCK(PROXY_LOCK, &px->lock);
Willy Tarreaucaa7df12020-10-07 15:58:50 +0200377}
378
Willy Tarreaud1f250f2020-12-04 15:03:36 +0100379/* This function adds the specified <listener> to the protocol <proto>. It
380 * does nothing if the protocol was already added. The listener's state is
381 * automatically updated from LI_INIT to LI_ASSIGNED. The number of listeners
382 * for the protocol is updated. This must be called with the proto lock held.
383 */
384void default_add_listener(struct protocol *proto, struct listener *listener)
385{
386 if (listener->state != LI_INIT)
387 return;
388 listener_set_state(listener, LI_ASSIGNED);
389 listener->rx.proto = proto;
Willy Tarreau2b718102021-04-21 07:32:39 +0200390 LIST_APPEND(&proto->receivers, &listener->rx.proto_list);
Willy Tarreaud1f250f2020-12-04 15:03:36 +0100391 proto->nb_receivers++;
392}
393
Willy Tarreaue03204c2020-10-09 17:02:21 +0200394/* default function called to suspend a listener: it simply passes the call to
395 * the underlying receiver. This is find for most socket-based protocols. This
396 * must be called under the listener's lock. It will return non-zero on success,
397 * 0 on failure. If no receiver-level suspend is provided, the operation is
398 * assumed to succeed.
399 */
400int default_suspend_listener(struct listener *l)
401{
402 int ret = 1;
403
404 if (!l->rx.proto->rx_suspend)
405 return 1;
406
407 ret = l->rx.proto->rx_suspend(&l->rx);
408 return ret > 0 ? ret : 0;
409}
410
411
412/* Tries to resume a suspended listener, and returns non-zero on success or
413 * zero on failure. On certain errors, an alert or a warning might be displayed.
414 * It must be called with the listener's lock held. Depending on the listener's
415 * state and protocol, a listen() call might be used to resume operations, or a
416 * call to the receiver's resume() function might be used as well. This is
417 * suitable as a default function for TCP and UDP. This must be called with the
418 * listener's lock held.
419 */
420int default_resume_listener(struct listener *l)
421{
422 int ret = 1;
423
424 if (l->state == LI_ASSIGNED) {
425 char msg[100];
426 int err;
427
428 err = l->rx.proto->listen(l, msg, sizeof(msg));
429 if (err & ERR_ALERT)
430 ha_alert("Resuming listener: %s\n", msg);
431 else if (err & ERR_WARN)
432 ha_warning("Resuming listener: %s\n", msg);
433
434 if (err & (ERR_FATAL | ERR_ABORT)) {
435 ret = 0;
436 goto end;
437 }
438 }
439
440 if (l->state < LI_PAUSED) {
441 ret = 0;
442 goto end;
443 }
444
445 if (l->state == LI_PAUSED && l->rx.proto->rx_resume &&
446 l->rx.proto->rx_resume(&l->rx) <= 0)
447 ret = 0;
448 end:
449 return ret;
450}
451
452
Willy Tarreaube58c382011-07-24 18:28:10 +0200453/* This function tries to temporarily disable a listener, depending on the OS
454 * capabilities. Linux unbinds the listen socket after a SHUT_RD, and ignores
455 * SHUT_WR. Solaris refuses either shutdown(). OpenBSD ignores SHUT_RD but
456 * closes upon SHUT_WR and refuses to rebind. So a common validation path
457 * involves SHUT_WR && listen && SHUT_RD. In case of success, the FD's polling
458 * is disabled. It normally returns non-zero, unless an error is reported.
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200459 * It will need to operate under the proxy's lock. The caller is
460 * responsible for indicating in lpx whether the proxy locks is
461 * already held (non-zero) or not (zero) so that the function picks it.
Willy Tarreaube58c382011-07-24 18:28:10 +0200462 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200463int pause_listener(struct listener *l, int lpx)
Willy Tarreaube58c382011-07-24 18:28:10 +0200464{
Willy Tarreau58651b42020-09-24 16:03:29 +0200465 struct proxy *px = l->bind_conf->frontend;
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200466 int ret = 1;
467
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200468 if (!lpx)
469 HA_RWLOCK_WRLOCK(PROXY_LOCK, &px->lock);
470
Willy Tarreau08b6f962022-02-01 16:23:00 +0100471 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200472
Willy Tarreau9b3a9322020-09-24 14:46:34 +0200473 if (l->state <= LI_PAUSED)
474 goto end;
475
Willy Tarreaue03204c2020-10-09 17:02:21 +0200476 if (l->rx.proto->suspend)
477 ret = l->rx.proto->suspend(l);
Willy Tarreaube58c382011-07-24 18:28:10 +0200478
Willy Tarreau2b718102021-04-21 07:32:39 +0200479 MT_LIST_DELETE(&l->wait_queue);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200480
Willy Tarreaua37b2442020-09-24 07:23:45 +0200481 listener_set_state(l, LI_PAUSED);
Willy Tarreau58651b42020-09-24 16:03:29 +0200482
483 if (px && !px->li_ready) {
Aurelien DARRAGONd46f4372022-09-09 15:51:37 +0200484 /* PROXY_LOCK is required */
485 proxy_cond_pause(px);
Willy Tarreau58651b42020-09-24 16:03:29 +0200486 ha_warning("Paused %s %s.\n", proxy_cap_str(px->cap), px->id);
487 send_log(px, LOG_WARNING, "Paused %s %s.\n", proxy_cap_str(px->cap), px->id);
488 }
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200489 end:
Willy Tarreau08b6f962022-02-01 16:23:00 +0100490 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200491
492 if (!lpx)
493 HA_RWLOCK_WRUNLOCK(PROXY_LOCK, &px->lock);
494
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200495 return ret;
Willy Tarreaube58c382011-07-24 18:28:10 +0200496}
497
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200498/* This function tries to resume a temporarily disabled listener. Paused, full,
499 * limited and disabled listeners are handled, which means that this function
500 * may replace enable_listener(). The resulting state will either be LI_READY
501 * or LI_FULL. 0 is returned in case of failure to resume (eg: dead socket).
Willy Tarreauae302532014-05-07 19:22:24 +0200502 * Listeners bound to a different process are not woken up unless we're in
Willy Tarreauaf2fd582015-04-14 12:07:16 +0200503 * foreground mode, and are ignored. If the listener was only in the assigned
504 * state, it's totally rebound. This can happen if a pause() has completely
505 * stopped it. If the resume fails, 0 is returned and an error might be
506 * displayed.
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200507 * It will need to operate under the proxy's lock. The caller is
508 * responsible for indicating in lpx whether the proxy locks is
509 * already held (non-zero) or not (zero) so that the function picks it.
Willy Tarreaube58c382011-07-24 18:28:10 +0200510 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200511int resume_listener(struct listener *l, int lpx)
Willy Tarreaube58c382011-07-24 18:28:10 +0200512{
Willy Tarreau58651b42020-09-24 16:03:29 +0200513 struct proxy *px = l->bind_conf->frontend;
514 int was_paused = px && px->li_paused;
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200515 int ret = 1;
516
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200517 if (!lpx)
518 HA_RWLOCK_WRLOCK(PROXY_LOCK, &px->lock);
519
Willy Tarreau08b6f962022-02-01 16:23:00 +0100520 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200521
Willy Tarreauf2cb1692019-07-11 10:08:31 +0200522 /* check that another thread didn't to the job in parallel (e.g. at the
523 * end of listen_accept() while we'd come from dequeue_all_listeners().
524 */
Willy Tarreau2b718102021-04-21 07:32:39 +0200525 if (MT_LIST_INLIST(&l->wait_queue))
Willy Tarreauf2cb1692019-07-11 10:08:31 +0200526 goto end;
527
Willy Tarreau5d7f9ce2020-09-24 18:54:11 +0200528 if (l->state == LI_READY)
529 goto end;
Willy Tarreaube58c382011-07-24 18:28:10 +0200530
Willy Tarreaue03204c2020-10-09 17:02:21 +0200531 if (l->rx.proto->resume)
532 ret = l->rx.proto->resume(l);
Willy Tarreaube58c382011-07-24 18:28:10 +0200533
Willy Tarreaua8cf66b2019-02-27 16:49:00 +0100534 if (l->maxconn && l->nbconn >= l->maxconn) {
Willy Tarreau4b51f422020-09-25 20:32:28 +0200535 l->rx.proto->disable(l);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200536 listener_set_state(l, LI_FULL);
Willy Tarreau58651b42020-09-24 16:03:29 +0200537 goto done;
Willy Tarreaube58c382011-07-24 18:28:10 +0200538 }
539
Willy Tarreau4b51f422020-09-25 20:32:28 +0200540 l->rx.proto->enable(l);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200541 listener_set_state(l, LI_READY);
Willy Tarreau58651b42020-09-24 16:03:29 +0200542
543 done:
544 if (was_paused && !px->li_paused) {
Aurelien DARRAGONd46f4372022-09-09 15:51:37 +0200545 /* PROXY_LOCK is required */
546 proxy_cond_resume(px);
Willy Tarreau58651b42020-09-24 16:03:29 +0200547 ha_warning("Resumed %s %s.\n", proxy_cap_str(px->cap), px->id);
548 send_log(px, LOG_WARNING, "Resumed %s %s.\n", proxy_cap_str(px->cap), px->id);
549 }
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200550 end:
Willy Tarreau08b6f962022-02-01 16:23:00 +0100551 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200552
553 if (!lpx)
554 HA_RWLOCK_WRUNLOCK(PROXY_LOCK, &px->lock);
555
Christopher Faulet8d8aa0d2017-05-30 15:36:50 +0200556 return ret;
557}
558
Willy Tarreau87b09662015-04-03 00:22:06 +0200559/* Marks a ready listener as full so that the stream code tries to re-enable
Willy Tarreau62793712011-07-24 19:23:38 +0200560 * it upon next close() using resume_listener().
561 */
Christopher Faulet5580ba22017-08-28 15:29:20 +0200562static void listener_full(struct listener *l)
Willy Tarreau62793712011-07-24 19:23:38 +0200563{
Willy Tarreau08b6f962022-02-01 16:23:00 +0100564 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreau62793712011-07-24 19:23:38 +0200565 if (l->state >= LI_READY) {
Willy Tarreau2b718102021-04-21 07:32:39 +0200566 MT_LIST_DELETE(&l->wait_queue);
Willy Tarreau3f0d02b2019-02-25 19:23:37 +0100567 if (l->state != LI_FULL) {
Willy Tarreau4b51f422020-09-25 20:32:28 +0200568 l->rx.proto->disable(l);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200569 listener_set_state(l, LI_FULL);
Willy Tarreau3f0d02b2019-02-25 19:23:37 +0100570 }
Willy Tarreau62793712011-07-24 19:23:38 +0200571 }
Willy Tarreau08b6f962022-02-01 16:23:00 +0100572 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreau62793712011-07-24 19:23:38 +0200573}
574
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200575/* Marks a ready listener as limited so that we only try to re-enable it when
576 * resources are free again. It will be queued into the specified queue.
577 */
Olivier Houchard859dc802019-08-08 15:47:21 +0200578static void limit_listener(struct listener *l, struct mt_list *list)
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200579{
Willy Tarreau08b6f962022-02-01 16:23:00 +0100580 HA_RWLOCK_WRLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200581 if (l->state == LI_READY) {
Willy Tarreau2b718102021-04-21 07:32:39 +0200582 MT_LIST_TRY_APPEND(list, &l->wait_queue);
Willy Tarreau4b51f422020-09-25 20:32:28 +0200583 l->rx.proto->disable(l);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200584 listener_set_state(l, LI_LIMITED);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200585 }
Willy Tarreau08b6f962022-02-01 16:23:00 +0100586 HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &l->lock);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200587}
588
Willy Tarreau241797a2019-12-10 14:10:52 +0100589/* Dequeues all listeners waiting for a resource the global wait queue */
590void dequeue_all_listeners()
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200591{
Willy Tarreau01abd022019-02-28 10:27:18 +0100592 struct listener *listener;
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200593
Willy Tarreau241797a2019-12-10 14:10:52 +0100594 while ((listener = MT_LIST_POP(&global_listener_queue, struct listener *, wait_queue))) {
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200595 /* This cannot fail because the listeners are by definition in
Willy Tarreau01abd022019-02-28 10:27:18 +0100596 * the LI_LIMITED state.
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200597 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200598 resume_listener(listener, 0);
Willy Tarreaue6ca1fc2011-07-24 22:03:52 +0200599 }
600}
601
Willy Tarreau241797a2019-12-10 14:10:52 +0100602/* Dequeues all listeners waiting for a resource in proxy <px>'s queue */
603void dequeue_proxy_listeners(struct proxy *px)
604{
605 struct listener *listener;
606
607 while ((listener = MT_LIST_POP(&px->listener_queue, struct listener *, wait_queue))) {
608 /* This cannot fail because the listeners are by definition in
609 * the LI_LIMITED state.
610 */
Aurelien DARRAGON00132882022-09-09 15:32:57 +0200611 resume_listener(listener, 0);
Willy Tarreau241797a2019-12-10 14:10:52 +0100612 }
613}
614
Willy Tarreau7b2febd2020-10-09 17:18:29 +0200615
616/* default function used to unbind a listener. This is for use by standard
617 * protocols working on top of accepted sockets. The receiver's rx_unbind()
618 * will automatically be used after the listener is disabled if the socket is
619 * still bound. This must be used under the listener's lock.
Christopher Faulet510c0d62018-03-16 10:04:47 +0100620 */
Willy Tarreau7b2febd2020-10-09 17:18:29 +0200621void default_unbind_listener(struct listener *listener)
Willy Tarreaub648d632007-10-28 22:13:50 +0100622{
Willy Tarreau87acd4e2020-10-08 15:36:46 +0200623 if (listener->state <= LI_ASSIGNED)
624 goto out_close;
625
626 if (listener->rx.fd == -1) {
Willy Tarreaua37b2442020-09-24 07:23:45 +0200627 listener_set_state(listener, LI_ASSIGNED);
Willy Tarreau87acd4e2020-10-08 15:36:46 +0200628 goto out_close;
629 }
630
Willy Tarreauf58b8db2020-10-09 16:32:08 +0200631 if (listener->state >= LI_READY) {
632 listener->rx.proto->disable(listener);
633 if (listener->rx.flags & RX_F_BOUND)
Willy Tarreau87acd4e2020-10-08 15:36:46 +0200634 listener_set_state(listener, LI_LISTEN);
Willy Tarreaub6607bf2020-09-23 16:24:23 +0200635 }
636
Willy Tarreau87acd4e2020-10-08 15:36:46 +0200637 out_close:
Willy Tarreauf58b8db2020-10-09 16:32:08 +0200638 if (listener->rx.flags & RX_F_BOUND)
639 listener->rx.proto->rx_unbind(&listener->rx);
Willy Tarreau7b2febd2020-10-09 17:18:29 +0200640}
641
642/* This function closes the listening socket for the specified listener,
643 * provided that it's already in a listening state. The protocol's unbind()
644 * is called to put the listener into LI_ASSIGNED or LI_LISTEN and handle
645 * the unbinding tasks. The listener enters then the LI_ASSIGNED state if
646 * the receiver is unbound. Must be called with the lock held.
647 */
648void do_unbind_listener(struct listener *listener)
649{
Willy Tarreau2b718102021-04-21 07:32:39 +0200650 MT_LIST_DELETE(&listener->wait_queue);
Willy Tarreau7b2febd2020-10-09 17:18:29 +0200651
652 if (listener->rx.proto->unbind)
653 listener->rx.proto->unbind(listener);
Willy Tarreau374e9af2020-10-09 15:47:17 +0200654
Willy Tarreauf58b8db2020-10-09 16:32:08 +0200655 /* we may have to downgrade the listener if the rx was closed */
656 if (!(listener->rx.flags & RX_F_BOUND) && listener->state > LI_ASSIGNED)
Willy Tarreau374e9af2020-10-09 15:47:17 +0200657 listener_set_state(listener, LI_ASSIGNED);
Willy Tarreaubbd09b92017-11-05 11:38:44 +0100658}
659
/* Locked wrapper around do_unbind_listener(): takes the listener's lock for
 * writing, unbinds the listener, then releases the lock. The listener enters
 * the LI_ASSIGNED state, except if the FD is not closed, in which case it may
 * remain in LI_LISTEN. This function is intended to be used as a generic
 * function for standard protocols.
 */
void unbind_listener(struct listener *listener)
{
	/* do_unbind_listener() must be called with the lock held */
	HA_RWLOCK_WRLOCK(LISTENER_LOCK, &listener->lock);
	do_unbind_listener(listener);
	HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &listener->lock);
}
672
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200673/* creates one or multiple listeners for bind_conf <bc> on sockaddr <ss> on port
674 * range <portl> to <porth>, and possibly attached to fd <fd> (or -1 for auto
Willy Tarreau9b3178d2020-09-16 17:58:55 +0200675 * allocation). The address family is taken from ss->ss_family, and the protocol
Willy Tarreaud2fb99f2020-10-15 21:22:29 +0200676 * passed in <proto> must be usable on this family. The protocol's default iocb
677 * is automatically preset as the receivers' iocb. The number of jobs and
Willy Tarreau9b3178d2020-09-16 17:58:55 +0200678 * listeners is automatically increased by the number of listeners created. It
679 * returns non-zero on success, zero on error with the error message set in <err>.
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200680 */
681int create_listeners(struct bind_conf *bc, const struct sockaddr_storage *ss,
Willy Tarreau9b3178d2020-09-16 17:58:55 +0200682 int portl, int porth, int fd, struct protocol *proto, char **err)
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200683{
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200684 struct listener *l;
685 int port;
686
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200687 for (port = portl; port <= porth; port++) {
688 l = calloc(1, sizeof(*l));
689 if (!l) {
690 memprintf(err, "out of memory");
691 return 0;
692 }
693 l->obj_type = OBJ_TYPE_LISTENER;
Willy Tarreau2b718102021-04-21 07:32:39 +0200694 LIST_APPEND(&bc->frontend->conf.listeners, &l->by_fe);
695 LIST_APPEND(&bc->listeners, &l->by_bind);
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200696 l->bind_conf = bc;
Willy Tarreau0fce6bc2020-09-03 07:46:06 +0200697 l->rx.settings = &bc->settings;
Willy Tarreaueef45422020-09-03 10:05:03 +0200698 l->rx.owner = l;
Willy Tarreaud2fb99f2020-10-15 21:22:29 +0200699 l->rx.iocb = proto->default_iocb;
Willy Tarreau38ba6472020-08-27 08:16:52 +0200700 l->rx.fd = fd;
Willy Tarreau07400c52020-12-04 14:49:11 +0100701
Willy Tarreau37159062020-08-27 07:48:42 +0200702 memcpy(&l->rx.addr, ss, sizeof(*ss));
Willy Tarreaud1f250f2020-12-04 15:03:36 +0100703 if (proto->fam->set_port)
704 proto->fam->set_port(&l->rx.addr, port);
Willy Tarreau07400c52020-12-04 14:49:11 +0100705
Olivier Houchard859dc802019-08-08 15:47:21 +0200706 MT_LIST_INIT(&l->wait_queue);
Willy Tarreaua37b2442020-09-24 07:23:45 +0200707 listener_set_state(l, LI_INIT);
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200708
Willy Tarreaud1f250f2020-12-04 15:03:36 +0100709 proto->add(proto, l);
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200710
Willy Tarreau909c23b2020-09-15 13:50:58 +0200711 if (fd != -1)
Willy Tarreau43046fa2020-09-01 15:41:59 +0200712 l->rx.flags |= RX_F_INHERITED;
William Lallemand75ea0a02017-11-15 19:02:58 +0100713
Amaury Denoyelle7f8f6cb2020-11-10 14:24:31 +0100714 l->extra_counters = NULL;
715
Willy Tarreau08b6f962022-02-01 16:23:00 +0100716 HA_RWLOCK_INIT(&l->lock);
Willy Tarreau4781b152021-04-06 13:53:36 +0200717 _HA_ATOMIC_INC(&jobs);
718 _HA_ATOMIC_INC(&listeners);
Willy Tarreau0de59fd2017-09-15 08:10:44 +0200719 }
720 return 1;
721}
722
Willy Tarreau59a877d2021-10-12 09:36:10 +0200723/* clones listener <src> and returns the new one. All dynamically allocated
724 * fields are reallocated (name for now). The new listener is inserted before
725 * the original one in the bind_conf and frontend lists. This allows it to be
726 * duplicated while iterating over the current list. The original listener must
727 * only be in the INIT or ASSIGNED states, and the new listener will only be
728 * placed into the INIT state. The counters are always set to NULL. Maxsock is
729 * updated. Returns NULL on allocation error.
730 */
731struct listener *clone_listener(struct listener *src)
732{
733 struct listener *l;
734
735 l = calloc(1, sizeof(*l));
736 if (!l)
737 goto oom1;
738 memcpy(l, src, sizeof(*l));
739
740 if (l->name) {
741 l->name = strdup(l->name);
742 if (!l->name)
743 goto oom2;
744 }
745
746 l->rx.owner = l;
747 l->state = LI_INIT;
748 l->counters = NULL;
749 l->extra_counters = NULL;
750
751 LIST_APPEND(&src->by_fe, &l->by_fe);
752 LIST_APPEND(&src->by_bind, &l->by_bind);
753
754 MT_LIST_INIT(&l->wait_queue);
755
756 l->rx.proto->add(l->rx.proto, l);
757
Willy Tarreau08b6f962022-02-01 16:23:00 +0100758 HA_RWLOCK_INIT(&l->lock);
Willy Tarreau59a877d2021-10-12 09:36:10 +0200759 _HA_ATOMIC_INC(&jobs);
760 _HA_ATOMIC_INC(&listeners);
761 global.maxsock++;
762 return l;
763
Willy Tarreau59a877d2021-10-12 09:36:10 +0200764 oom2:
765 free(l);
766 oom1:
Willy Tarreaua1462892021-10-16 14:45:29 +0200767 return NULL;
Willy Tarreau59a877d2021-10-12 09:36:10 +0200768}
769
Willy Tarreau1a64d162007-10-28 22:26:05 +0100770/* Delete a listener from its protocol's list of listeners. The listener's
771 * state is automatically updated from LI_ASSIGNED to LI_INIT. The protocol's
Willy Tarreau2cc5bae2017-09-15 08:18:11 +0200772 * number of listeners is updated, as well as the global number of listeners
773 * and jobs. Note that the listener must have previously been unbound. This
Willy Tarreaub4c083f2020-10-07 15:36:16 +0200774 * is a low-level function expected to be called with the proto_lock and the
775 * listener's lock held.
Willy Tarreau1a64d162007-10-28 22:26:05 +0100776 */
Willy Tarreaub4c083f2020-10-07 15:36:16 +0200777void __delete_listener(struct listener *listener)
Willy Tarreau1a64d162007-10-28 22:26:05 +0100778{
Willy Tarreau3f0d02b2019-02-25 19:23:37 +0100779 if (listener->state == LI_ASSIGNED) {
Willy Tarreaua37b2442020-09-24 07:23:45 +0200780 listener_set_state(listener, LI_INIT);
Willy Tarreau2b718102021-04-21 07:32:39 +0200781 LIST_DELETE(&listener->rx.proto_list);
Willy Tarreaud7f331c2020-09-25 17:01:43 +0200782 listener->rx.proto->nb_receivers--;
Willy Tarreau4781b152021-04-06 13:53:36 +0200783 _HA_ATOMIC_DEC(&jobs);
784 _HA_ATOMIC_DEC(&listeners);
Willy Tarreau3f0d02b2019-02-25 19:23:37 +0100785 }
Willy Tarreaub4c083f2020-10-07 15:36:16 +0200786}
787
/* Delete a listener from its protocol's list of listeners (please check
 * __delete_listener() above). This is the locked variant: the proto_lock is
 * grabbed first, then the listener's lock (for writing), and both are released
 * in the reverse order once the listener has been deleted.
 */
void delete_listener(struct listener *listener)
{
	/* lock order: proto_lock first, then the listener's lock */
	HA_SPIN_LOCK(PROTO_LOCK, &proto_lock);
	HA_RWLOCK_WRLOCK(LISTENER_LOCK, &listener->lock);
	__delete_listener(listener);
	HA_RWLOCK_WRUNLOCK(LISTENER_LOCK, &listener->lock);
	HA_SPIN_UNLOCK(PROTO_LOCK, &proto_lock);
}
800
Willy Tarreaue2711c72019-02-27 15:39:41 +0100801/* Returns a suitable value for a listener's backlog. It uses the listener's,
802 * otherwise the frontend's backlog, otherwise the listener's maxconn,
803 * otherwise the frontend's maxconn, otherwise 1024.
804 */
805int listener_backlog(const struct listener *l)
806{
807 if (l->backlog)
808 return l->backlog;
809
810 if (l->bind_conf->frontend->backlog)
811 return l->bind_conf->frontend->backlog;
812
813 if (l->maxconn)
814 return l->maxconn;
815
816 if (l->bind_conf->frontend->maxconn)
817 return l->bind_conf->frontend->maxconn;
818
819 return 1024;
820}
821
/* This function is called on a read event from a listening socket, corresponding
 * to an accept. It tries to accept as many connections as possible, and for each
 * calls the listener's accept handler (generally the frontend's accept handler).
 *
 * The number of connections accepted per call is bounded by l->maxaccept and
 * by what remains of the global and frontend rate limits. For each connection,
 * the listener's, frontend's and process' connection counts are reserved first
 * using CAS loops; the next_conn, next_feconn and next_actconn variables hold
 * the reserved values and are non-zero only while the reservation still has to
 * be rolled back on exit, which is done under the "end" label.
 *
 * Exit labels:
 *   - end             : rolls back pending reservations and possibly resumes
 *                       this listener and the queued ones ;
 *   - transient_error : pauses the listener if its receiver is not listening
 *                       anymore, otherwise falls through to limit_global with
 *                       a 100 ms delay ;
 *   - limit_global    : queues the listener into the global queue ;
 *   - limit_proxy     : queues the listener into the frontend's queue (only
 *                       reached from places where <p> is known to be set).
 */
void listener_accept(struct listener *l)
{
	struct connection *cli_conn;
	struct proxy *p;
	unsigned int max_accept;
	int next_conn = 0;
	int next_feconn = 0;
	int next_actconn = 0;
	int expire;
	int ret;

	p = l->bind_conf->frontend;

	/* if l->maxaccept is -1, then max_accept is UINT_MAX. It is not really
	 * unlimited, but it is probably enough.
	 */
	max_accept = l->maxaccept ? l->maxaccept : 1;

	if (!(l->options & LI_O_UNLIMITED) && global.sps_lim) {
		int max = freq_ctr_remain(&global.sess_per_sec, global.sps_lim, 0);

		if (unlikely(!max)) {
			/* global session rate limit was reached */
			expire = tick_add(now_ms, next_event_delay(&global.sess_per_sec, global.sps_lim, 0));
			goto limit_global;
		}

		if (max_accept > max)
			max_accept = max;
	}

	if (!(l->options & LI_O_UNLIMITED) && global.cps_lim) {
		int max = freq_ctr_remain(&global.conn_per_sec, global.cps_lim, 0);

		if (unlikely(!max)) {
			/* global connection rate limit was reached */
			expire = tick_add(now_ms, next_event_delay(&global.conn_per_sec, global.cps_lim, 0));
			goto limit_global;
		}

		if (max_accept > max)
			max_accept = max;
	}
#ifdef USE_OPENSSL
	if (!(l->options & LI_O_UNLIMITED) && global.ssl_lim &&
	    l->bind_conf && l->bind_conf->options & BC_O_USE_SSL) {
		int max = freq_ctr_remain(&global.ssl_per_sec, global.ssl_lim, 0);

		if (unlikely(!max)) {
			/* global SSL rate limit was reached */
			expire = tick_add(now_ms, next_event_delay(&global.ssl_per_sec, global.ssl_lim, 0));
			goto limit_global;
		}

		if (max_accept > max)
			max_accept = max;
	}
#endif
	if (p && p->fe_sps_lim) {
		int max = freq_ctr_remain(&p->fe_sess_per_sec, p->fe_sps_lim, 0);

		if (unlikely(!max)) {
			/* frontend accept rate limit was reached */
			expire = tick_add(now_ms, next_event_delay(&p->fe_sess_per_sec, p->fe_sps_lim, 0));
			goto limit_proxy;
		}

		if (max_accept > max)
			max_accept = max;
	}

	/* Note: if we fail to allocate a connection because of configured
	 * limits, we'll schedule a new attempt at worst 1 second later. If we
	 * fail due to system limits or temporary resource shortage, we try
	 * again 100ms later in the worst case.
	 */
	for (; max_accept; next_conn = next_feconn = next_actconn = 0, max_accept--) {
		unsigned int count;
		int status;
		__decl_thread(unsigned long mask);

		/* pre-increase the number of connections without going too far.
		 * We process the listener, then the proxy, then the process.
		 * We know which ones to unroll based on the next_xxx value.
		 */
		do {
			count = l->nbconn;
			if (unlikely(l->maxconn && count >= l->maxconn)) {
				/* the listener was marked full or another
				 * thread is going to do it.
				 */
				next_conn = 0;
				listener_full(l);
				goto end;
			}
			next_conn = count + 1;
		} while (!_HA_ATOMIC_CAS(&l->nbconn, (int *)(&count), next_conn));

		if (p) {
			do {
				count = p->feconn;
				if (unlikely(count >= p->maxconn)) {
					/* the frontend was marked full or another
					 * thread is going to do it.
					 */
					next_feconn = 0;
					expire = TICK_ETERNITY;
					goto limit_proxy;
				}
				next_feconn = count + 1;
			} while (!_HA_ATOMIC_CAS(&p->feconn, &count, next_feconn));
		}

		if (!(l->options & LI_O_UNLIMITED)) {
			do {
				count = actconn;
				if (unlikely(count >= global.maxconn)) {
					/* the process was marked full or another
					 * thread is going to do it.
					 */
					next_actconn = 0;
					expire = tick_add(now_ms, 1000); /* try again in 1 second */
					goto limit_global;
				}
				next_actconn = count + 1;
			} while (!_HA_ATOMIC_CAS(&actconn, (int *)(&count), next_actconn));
		}

		/* be careful below, the listener might be shutting down in
		 * another thread on error and we must not dereference its
		 * FD without a bit of protection.
		 */
		cli_conn = NULL;
		status = CO_AC_PERMERR;

		/* if the receiver is not bound anymore, nothing is accepted and
		 * the preset CO_AC_PERMERR status sends us to the default case
		 * of the switch below.
		 */
		HA_RWLOCK_RDLOCK(LISTENER_LOCK, &l->lock);
		if (l->rx.flags & RX_F_BOUND)
			cli_conn = l->rx.proto->accept_conn(l, &status);
		HA_RWLOCK_RDUNLOCK(LISTENER_LOCK, &l->lock);

		if (!cli_conn) {
			switch (status) {
			case CO_AC_DONE:
				goto end;

			case CO_AC_RETRY: /* likely a signal */
				/* release the reservations by hand since the
				 * loop's iteration step resets next_*conn.
				 */
				_HA_ATOMIC_DEC(&l->nbconn);
				if (p)
					_HA_ATOMIC_DEC(&p->feconn);
				if (!(l->options & LI_O_UNLIMITED))
					_HA_ATOMIC_DEC(&actconn);
				continue;

			case CO_AC_YIELD:
				max_accept = 0;
				goto end;

			default:
				goto transient_error;
			}
		}

		/* The connection was accepted, it must be counted as such */
		if (l->counters)
			HA_ATOMIC_UPDATE_MAX(&l->counters->conn_max, next_conn);

		if (p) {
			HA_ATOMIC_UPDATE_MAX(&p->fe_counters.conn_max, next_feconn);
			proxy_inc_fe_conn_ctr(l, p);
		}

		if (!(l->options & LI_O_UNLIMITED)) {
			count = update_freq_ctr(&global.conn_per_sec, 1);
			HA_ATOMIC_UPDATE_MAX(&global.cps_max, count);
		}

		_HA_ATOMIC_INC(&activity[tid].accepted);

		/* past this point, l->accept() will automatically decrement
		 * l->nbconn, feconn and actconn once done. Setting next_*conn=0
		 * allows the error path not to rollback on nbconn. It's more
		 * convenient than duplicating all exit labels.
		 */
		next_conn = 0;
		next_feconn = 0;
		next_actconn = 0;


#if defined(USE_THREAD)
		if (l->rx.flags & RX_F_LOCAL_ACCEPT)
			goto local_accept;

		mask = l->rx.bind_thread & tg->threads_enabled;
		if (atleast2(mask) && (global.tune.options & GTUNE_LISTENER_MQ) && !stopping) {
			struct accept_queue_ring *ring;
			unsigned int t, t0, t1, t2;
			int base = tg->base;

			/* The principle is that we have two running indexes,
			 * each visiting in turn all threads bound to this
			 * listener. The connection will be assigned to the one
			 * with the least connections, and the other one will
			 * be updated. This provides a good fairness on short
			 * connections (round robin) and on long ones (conn
			 * count), without ever missing any idle thread.
			 */

			/* keep a copy for the final update. thr_idx is composite
			 * and made of (t2<<16) + t1.
			 */
			t0 = l->thr_idx;
			do {
				unsigned long m1, m2;
				int q1, q2;

				t2 = t1 = t0;
				t2 >>= 16;
				t1 &= 0xFFFF;

				/* t1 walks low to high bits ;
				 * t2 walks high to low.
				 */
				m1 = mask >> t1;
				m2 = mask & (t2 ? nbits(t2 + 1) : ~0UL);

				if (unlikely(!(m1 & 1))) {
					m1 &= ~1UL;
					if (!m1) {
						m1 = mask;
						t1 = 0;
					}
					t1 += my_ffsl(m1) - 1;
				}

				if (unlikely(!(m2 & (1UL << t2)) || t1 == t2)) {
					/* highest bit not set */
					if (!m2)
						m2 = mask;

					t2 = my_flsl(m2) - 1;
				}

				/* now we have two distinct thread IDs belonging to the mask */
				q1 = accept_queue_rings[base + t1].tail - accept_queue_rings[base + t1].head + ACCEPT_QUEUE_SIZE;
				if (q1 >= ACCEPT_QUEUE_SIZE)
					q1 -= ACCEPT_QUEUE_SIZE;

				q2 = accept_queue_rings[base + t2].tail - accept_queue_rings[base + t2].head + ACCEPT_QUEUE_SIZE;
				if (q2 >= ACCEPT_QUEUE_SIZE)
					q2 -= ACCEPT_QUEUE_SIZE;

				/* we have 3 possibilities now :
				 *   q1 < q2 : t1 is less loaded than t2, so we pick it
				 *             and update t2 (since t1 might still be
				 *             lower than another thread)
				 *   q1 > q2 : t2 is less loaded than t1, so we pick it
				 *             and update t1 (since t2 might still be
				 *             lower than another thread)
				 *   q1 = q2 : both are equally loaded, thus we pick t1
				 *             and update t1 as it will become more loaded
				 *             than t2.
				 */

				q1 += l->thr_conn[base + t1];
				q2 += l->thr_conn[base + t2];

				if (q1 - q2 < 0) {
					t = t1;
					t2 = t2 ? t2 - 1 : LONGBITS - 1;
				}
				else if (q1 - q2 > 0) {
					t = t2;
					t1++;
					if (t1 >= LONGBITS)
						t1 = 0;
				}
				else {
					t = t1;
					t1++;
					if (t1 >= LONGBITS)
						t1 = 0;
				}

				/* new value for thr_idx */
				t1 += (t2 << 16);
			} while (unlikely(!_HA_ATOMIC_CAS(&l->thr_idx, &t0, t1)));

			/* We successfully selected the best thread "t" for this
			 * connection. We use deferred accepts even if it's the
			 * local thread because tests show that it's the best
			 * performing model, likely due to better cache locality
			 * when processing this loop.
			 */
			ring = &accept_queue_rings[base + t];
			if (accept_queue_push_mp(ring, cli_conn)) {
				_HA_ATOMIC_INC(&activity[base + t].accq_pushed);
				tasklet_wakeup(ring->tasklet);
				continue;
			}
			/* If the ring is full we do a synchronous accept on
			 * the local thread here.
			 */
			_HA_ATOMIC_INC(&activity[base + t].accq_full);
		}
#endif // USE_THREAD

 local_accept:
		_HA_ATOMIC_INC(&l->thr_conn[tid]);
		ret = l->accept(cli_conn);
		if (unlikely(ret <= 0)) {
			/* The connection was closed by stream_accept(). Either
			 * we just have to ignore it (ret == 0) or it's a critical
			 * error due to a resource shortage, and we must stop the
			 * listener (ret < 0).
			 */
			if (ret == 0) /* successful termination */
				continue;

			goto transient_error;
		}

		/* increase the per-process number of cumulated sessions, this
		 * may only be done once l->accept() has accepted the connection.
		 */
		if (!(l->options & LI_O_UNLIMITED)) {
			count = update_freq_ctr(&global.sess_per_sec, 1);
			HA_ATOMIC_UPDATE_MAX(&global.sps_max, count);
		}
#ifdef USE_OPENSSL
		if (!(l->options & LI_O_UNLIMITED) &&
		    l->bind_conf && l->bind_conf->options & BC_O_USE_SSL) {
			count = update_freq_ctr(&global.ssl_per_sec, 1);
			HA_ATOMIC_UPDATE_MAX(&global.ssl_max, count);
		}
#endif

		_HA_ATOMIC_AND(&th_ctx->flags, ~TH_FL_STUCK); // this thread is still running
	} /* end of for (max_accept--) */

 end:
	/* roll back the reservations which were not consumed by a connection */
	if (next_conn)
		_HA_ATOMIC_DEC(&l->nbconn);

	if (p && next_feconn)
		_HA_ATOMIC_DEC(&p->feconn);

	if (next_actconn)
		_HA_ATOMIC_DEC(&actconn);

	/* the listener is resumed if it is full but has room again, or if it
	 * is limited while neither the frontend nor the process is saturated
	 * and the global queue's task has no pending (unexpired) timer.
	 */
	if ((l->state == LI_FULL && (!l->maxconn || l->nbconn < l->maxconn)) ||
	    (l->state == LI_LIMITED &&
	     ((!p || p->feconn < p->maxconn) && (actconn < global.maxconn) &&
	      (!tick_isset(global_listener_queue_task->expire) ||
	       tick_is_expired(global_listener_queue_task->expire, now_ms))))) {
		/* at least one thread has to do this when quitting */
		resume_listener(l, 0);

		/* Dequeues all of the listeners waiting for a resource */
		dequeue_all_listeners();

		if (p && !MT_LIST_ISEMPTY(&p->listener_queue) &&
		    (!p->fe_sps_lim || freq_ctr_remain(&p->fe_sess_per_sec, p->fe_sps_lim, 0) > 0))
			dequeue_proxy_listeners(p);
	}
	return;

 transient_error:
	/* pause the listener for up to 100 ms */
	expire = tick_add(now_ms, 100);

	/* This may be a shared socket that was paused by another process.
	 * Let's put it to pause in this case.
	 */
	if (l->rx.proto && l->rx.proto->rx_listening(&l->rx) == 0) {
		pause_listener(l, 0);
		goto end;
	}

 limit_global:
	/* (re-)queue the listener to the global queue and set it to expire no
	 * later than <expire> ahead. The listener turns to LI_LIMITED.
	 */
	limit_listener(l, &global_listener_queue);
	task_schedule(global_listener_queue_task, expire);
	goto end;

 limit_proxy:
	/* (re-)queue the listener to the proxy's queue and set it to expire no
	 * later than <expire> ahead. The listener turns to LI_LIMITED.
	 */
	limit_listener(l, &p->listener_queue);
	if (p->task && tick_isset(expire))
		task_schedule(p->task, expire);
	goto end;
}
1221
Willy Tarreau05f50472017-09-15 09:19:58 +02001222/* Notify the listener that a connection initiated from it was released. This
1223 * is used to keep the connection count consistent and to possibly re-open
1224 * listening when it was limited.
1225 */
1226void listener_release(struct listener *l)
1227{
1228 struct proxy *fe = l->bind_conf->frontend;
1229
1230 if (!(l->options & LI_O_UNLIMITED))
Willy Tarreau4781b152021-04-06 13:53:36 +02001231 _HA_ATOMIC_DEC(&actconn);
Willy Tarreau82c97892019-02-27 19:32:32 +01001232 if (fe)
Willy Tarreau4781b152021-04-06 13:53:36 +02001233 _HA_ATOMIC_DEC(&fe->feconn);
1234 _HA_ATOMIC_DEC(&l->nbconn);
1235 _HA_ATOMIC_DEC(&l->thr_conn[tid]);
Willy Tarreau82c97892019-02-27 19:32:32 +01001236
1237 if (l->state == LI_FULL || l->state == LI_LIMITED)
Aurelien DARRAGON00132882022-09-09 15:32:57 +02001238 resume_listener(l, 0);
Willy Tarreau05f50472017-09-15 09:19:58 +02001239
Willy Tarreau02757d02021-01-28 18:07:24 +01001240 /* Dequeues all of the listeners waiting for a resource */
1241 dequeue_all_listeners();
1242
Olivier Houchard859dc802019-08-08 15:47:21 +02001243 if (!MT_LIST_ISEMPTY(&fe->listener_queue) &&
Willy Tarreau05f50472017-09-15 09:19:58 +02001244 (!fe->fe_sps_lim || freq_ctr_remain(&fe->fe_sess_per_sec, fe->fe_sps_lim, 0) > 0))
Willy Tarreau241797a2019-12-10 14:10:52 +01001245 dequeue_proxy_listeners(fe);
Willy Tarreau05f50472017-09-15 09:19:58 +02001246}
1247
Willy Tarreauf2cb1692019-07-11 10:08:31 +02001248/* Initializes the listener queues. Returns 0 on success, otherwise ERR_* flags */
1249static int listener_queue_init()
1250{
Willy Tarreaubeeabf52021-10-01 18:23:30 +02001251 global_listener_queue_task = task_new_anywhere();
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001252 if (!global_listener_queue_task) {
1253 ha_alert("Out of memory when initializing global listener queue\n");
1254 return ERR_FATAL|ERR_ABORT;
1255 }
1256 /* very simple initialization, users will queue the task if needed */
1257 global_listener_queue_task->context = NULL; /* not even a context! */
1258 global_listener_queue_task->process = manage_global_listener_queue;
1259
Willy Tarreauf2cb1692019-07-11 10:08:31 +02001260 return 0;
1261}
1262
1263static void listener_queue_deinit()
1264{
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001265 task_destroy(global_listener_queue_task);
1266 global_listener_queue_task = NULL;
Willy Tarreauf2cb1692019-07-11 10:08:31 +02001267}
1268
1269REGISTER_CONFIG_POSTPARSER("multi-threaded listener queue", listener_queue_init);
1270REGISTER_POST_DEINIT(listener_queue_deinit);
1271
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001272
1273/* This is the global management task for listeners. It enables listeners waiting
1274 * for global resources when there are enough free resource, or at least once in
Willy Tarreaud597ec22021-01-29 14:29:06 +01001275 * a while. It is designed to be called as a task. It's exported so that it's easy
1276 * to spot in "show tasks" or "show profiling".
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001277 */
Willy Tarreau144f84a2021-03-02 16:09:26 +01001278struct task *manage_global_listener_queue(struct task *t, void *context, unsigned int state)
Willy Tarreaua1d97f82019-12-10 11:18:41 +01001279{
1280 /* If there are still too many concurrent connections, let's wait for
1281 * some of them to go away. We don't need to re-arm the timer because
1282 * each of them will scan the queue anyway.
1283 */
1284 if (unlikely(actconn >= global.maxconn))
1285 goto out;
1286
1287 /* We should periodically try to enable listeners waiting for a global
1288 * resource here, because it is possible, though very unlikely, that
1289 * they have been blocked by a temporary lack of global resource such
1290 * as a file descriptor or memory and that the temporary condition has
1291 * disappeared.
1292 */
1293 dequeue_all_listeners();
1294
1295 out:
1296 t->expire = TICK_ETERNITY;
1297 task_queue(t);
1298 return t;
1299}
1300
Willy Tarreau26982662012-09-12 23:17:10 +02001301/*
1302 * Registers the bind keyword list <kwl> as a list of valid keywords for next
1303 * parsing sessions.
1304 */
1305void bind_register_keywords(struct bind_kw_list *kwl)
1306{
Willy Tarreau2b718102021-04-21 07:32:39 +02001307 LIST_APPEND(&bind_keywords.list, &kwl->list);
Willy Tarreau26982662012-09-12 23:17:10 +02001308}
1309
1310/* Return a pointer to the bind keyword <kw>, or NULL if not found. If the
1311 * keyword is found with a NULL ->parse() function, then an attempt is made to
1312 * find one with a valid ->parse() function. This way it is possible to declare
1313 * platform-dependant, known keywords as NULL, then only declare them as valid
1314 * if some options are met. Note that if the requested keyword contains an
1315 * opening parenthesis, everything from this point is ignored.
1316 */
1317struct bind_kw *bind_find_kw(const char *kw)
1318{
1319 int index;
1320 const char *kwend;
1321 struct bind_kw_list *kwl;
1322 struct bind_kw *ret = NULL;
1323
1324 kwend = strchr(kw, '(');
1325 if (!kwend)
1326 kwend = kw + strlen(kw);
1327
1328 list_for_each_entry(kwl, &bind_keywords.list, list) {
1329 for (index = 0; kwl->kw[index].kw != NULL; index++) {
1330 if ((strncmp(kwl->kw[index].kw, kw, kwend - kw) == 0) &&
1331 kwl->kw[index].kw[kwend-kw] == 0) {
1332 if (kwl->kw[index].parse)
1333 return &kwl->kw[index]; /* found it !*/
1334 else
1335 ret = &kwl->kw[index]; /* may be OK */
1336 }
1337 }
1338 }
1339 return ret;
1340}
1341
Willy Tarreau8638f482012-09-18 18:01:17 +02001342/* Dumps all registered "bind" keywords to the <out> string pointer. The
1343 * unsupported keywords are only dumped if their supported form was not
1344 * found.
1345 */
1346void bind_dump_kws(char **out)
1347{
1348 struct bind_kw_list *kwl;
1349 int index;
1350
Christopher Faulet784063e2020-05-18 12:14:18 +02001351 if (!out)
1352 return;
1353
Willy Tarreau8638f482012-09-18 18:01:17 +02001354 *out = NULL;
1355 list_for_each_entry(kwl, &bind_keywords.list, list) {
1356 for (index = 0; kwl->kw[index].kw != NULL; index++) {
1357 if (kwl->kw[index].parse ||
1358 bind_find_kw(kwl->kw[index].kw) == &kwl->kw[index]) {
Willy Tarreau51fb7652012-09-18 18:24:39 +02001359 memprintf(out, "%s[%4s] %s%s%s\n", *out ? *out : "",
1360 kwl->scope,
Willy Tarreau8638f482012-09-18 18:01:17 +02001361 kwl->kw[index].kw,
Willy Tarreau51fb7652012-09-18 18:24:39 +02001362 kwl->kw[index].skip ? " <arg>" : "",
1363 kwl->kw[index].parse ? "" : " (not supported)");
Willy Tarreau8638f482012-09-18 18:01:17 +02001364 }
1365 }
1366 }
1367}
1368
Willy Tarreau433b05f2021-03-12 10:14:07 +01001369/* Try to find in srv_keyword the word that looks closest to <word> by counting
1370 * transitions between letters, digits and other characters. Will return the
1371 * best matching word if found, otherwise NULL.
1372 */
1373const char *bind_find_best_kw(const char *word)
1374{
1375 uint8_t word_sig[1024];
1376 uint8_t list_sig[1024];
1377 const struct bind_kw_list *kwl;
1378 const char *best_ptr = NULL;
1379 int dist, best_dist = INT_MAX;
1380 int index;
1381
1382 make_word_fingerprint(word_sig, word);
1383 list_for_each_entry(kwl, &bind_keywords.list, list) {
1384 for (index = 0; kwl->kw[index].kw != NULL; index++) {
1385 make_word_fingerprint(list_sig, kwl->kw[index].kw);
1386 dist = word_fingerprint_distance(word_sig, list_sig);
1387 if (dist < best_dist) {
1388 best_dist = dist;
1389 best_ptr = kwl->kw[index].kw;
1390 }
1391 }
1392 }
1393
1394 if (best_dist > 2 * strlen(word) || (best_ptr && best_dist > 2 * strlen(best_ptr)))
1395 best_ptr = NULL;
1396
1397 return best_ptr;
1398}
1399
Willy Tarreaudbf78022021-10-06 09:05:08 +02001400/* allocate an bind_conf struct for a bind line, and chain it to the frontend <fe>.
1401 * If <arg> is not NULL, it is duplicated into ->arg to store useful config
1402 * information for error reporting. NULL is returned on error.
1403 */
1404struct bind_conf *bind_conf_alloc(struct proxy *fe, const char *file,
1405 int line, const char *arg, struct xprt_ops *xprt)
1406{
1407 struct bind_conf *bind_conf = calloc(1, sizeof(*bind_conf));
1408
1409 if (!bind_conf)
1410 goto err;
1411
1412 bind_conf->file = strdup(file);
1413 if (!bind_conf->file)
1414 goto err;
1415 bind_conf->line = line;
1416 if (arg) {
1417 bind_conf->arg = strdup(arg);
1418 if (!bind_conf->arg)
1419 goto err;
1420 }
1421
1422 LIST_APPEND(&fe->conf.bind, &bind_conf->by_fe);
1423 bind_conf->settings.ux.uid = -1;
1424 bind_conf->settings.ux.gid = -1;
1425 bind_conf->settings.ux.mode = 0;
Willy Tarreau6dfbef42021-10-12 15:23:03 +02001426 bind_conf->settings.shards = 1;
Willy Tarreaudbf78022021-10-06 09:05:08 +02001427 bind_conf->xprt = xprt;
1428 bind_conf->frontend = fe;
1429 bind_conf->severity_output = CLI_SEVERITY_NONE;
1430#ifdef USE_OPENSSL
1431 HA_RWLOCK_INIT(&bind_conf->sni_lock);
1432 bind_conf->sni_ctx = EB_ROOT;
1433 bind_conf->sni_w_ctx = EB_ROOT;
1434#endif
1435 LIST_INIT(&bind_conf->listeners);
1436 return bind_conf;
1437
1438 err:
1439 if (bind_conf) {
1440 ha_free(&bind_conf->file);
1441 ha_free(&bind_conf->arg);
1442 }
1443 ha_free(&bind_conf);
1444 return NULL;
1445}
1446
1447const char *listener_state_str(const struct listener *l)
1448{
1449 static const char *states[8] = {
1450 "NEW", "INI", "ASS", "PAU", "LIS", "RDY", "FUL", "LIM",
1451 };
1452 unsigned int st = l->state;
1453
1454 if (st >= sizeof(states) / sizeof(*states))
1455 return "INVALID";
1456 return states[st];
1457}
1458
Willy Tarreau645513a2010-05-24 20:55:15 +02001459/************************************************************************/
Willy Tarreau0ccb7442013-01-07 22:54:17 +01001460/* All supported sample and ACL keywords must be declared here. */
Willy Tarreau645513a2010-05-24 20:55:15 +02001461/************************************************************************/
1462
Willy Tarreaua5e37562011-12-16 17:06:15 +01001463/* set temp integer to the number of connexions to the same listening socket */
Willy Tarreau645513a2010-05-24 20:55:15 +02001464static int
Thierry FOURNIER0786d052015-05-11 15:42:45 +02001465smp_fetch_dconn(const struct arg *args, struct sample *smp, const char *kw, void *private)
Willy Tarreau645513a2010-05-24 20:55:15 +02001466{
Thierry FOURNIER8c542ca2015-08-19 09:00:18 +02001467 smp->data.type = SMP_T_SINT;
Thierry FOURNIER136f9d32015-08-19 09:07:19 +02001468 smp->data.u.sint = smp->sess->listener->nbconn;
Willy Tarreau645513a2010-05-24 20:55:15 +02001469 return 1;
1470}
1471
Willy Tarreaua5e37562011-12-16 17:06:15 +01001472/* set temp integer to the id of the socket (listener) */
Willy Tarreau645513a2010-05-24 20:55:15 +02001473static int
Thierry FOURNIER0786d052015-05-11 15:42:45 +02001474smp_fetch_so_id(const struct arg *args, struct sample *smp, const char *kw, void *private)
Willy Tarreau37406352012-04-23 16:16:37 +02001475{
Thierry FOURNIER8c542ca2015-08-19 09:00:18 +02001476 smp->data.type = SMP_T_SINT;
Thierry FOURNIER136f9d32015-08-19 09:07:19 +02001477 smp->data.u.sint = smp->sess->listener->luid;
Willy Tarreau645513a2010-05-24 20:55:15 +02001478 return 1;
1479}
Jerome Magnineb421b22020-03-27 22:08:40 +01001480static int
1481smp_fetch_so_name(const struct arg *args, struct sample *smp, const char *kw, void *private)
1482{
1483 smp->data.u.str.area = smp->sess->listener->name;
1484 if (!smp->data.u.str.area)
1485 return 0;
1486
1487 smp->data.type = SMP_T_STR;
1488 smp->flags = SMP_F_CONST;
1489 smp->data.u.str.data = strlen(smp->data.u.str.area);
1490 return 1;
1491}
Willy Tarreau645513a2010-05-24 20:55:15 +02001492
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001493/* parse the "accept-proxy" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001494static int bind_parse_accept_proxy(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001495{
1496 struct listener *l;
1497
Willy Tarreau4348fad2012-09-20 16:48:07 +02001498 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001499 l->options |= LI_O_ACC_PROXY;
1500
1501 return 0;
1502}
1503
Bertrand Jacquin93b227d2016-06-04 15:11:10 +01001504/* parse the "accept-netscaler-cip" bind keyword */
1505static int bind_parse_accept_netscaler_cip(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1506{
1507 struct listener *l;
1508 uint32_t val;
1509
1510 if (!*args[cur_arg + 1]) {
1511 memprintf(err, "'%s' : missing value", args[cur_arg]);
1512 return ERR_ALERT | ERR_FATAL;
1513 }
1514
1515 val = atol(args[cur_arg + 1]);
1516 if (val <= 0) {
Willy Tarreaue2711c72019-02-27 15:39:41 +01001517 memprintf(err, "'%s' : invalid value %d, must be >= 0", args[cur_arg], val);
Bertrand Jacquin93b227d2016-06-04 15:11:10 +01001518 return ERR_ALERT | ERR_FATAL;
1519 }
1520
1521 list_for_each_entry(l, &conf->listeners, by_bind) {
1522 l->options |= LI_O_ACC_CIP;
1523 conf->ns_cip_magic = val;
1524 }
1525
1526 return 0;
1527}
1528
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001529/* parse the "backlog" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001530static int bind_parse_backlog(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001531{
1532 struct listener *l;
1533 int val;
1534
1535 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001536 memprintf(err, "'%s' : missing value", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001537 return ERR_ALERT | ERR_FATAL;
1538 }
1539
1540 val = atol(args[cur_arg + 1]);
Willy Tarreaue2711c72019-02-27 15:39:41 +01001541 if (val < 0) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001542 memprintf(err, "'%s' : invalid value %d, must be > 0", args[cur_arg], val);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001543 return ERR_ALERT | ERR_FATAL;
1544 }
1545
Willy Tarreau4348fad2012-09-20 16:48:07 +02001546 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001547 l->backlog = val;
1548
1549 return 0;
1550}
1551
1552/* parse the "id" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001553static int bind_parse_id(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001554{
1555 struct eb32_node *node;
Willy Tarreau4348fad2012-09-20 16:48:07 +02001556 struct listener *l, *new;
Thierry Fourniere7fe8eb2016-02-26 08:45:58 +01001557 char *error;
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001558
Willy Tarreau4348fad2012-09-20 16:48:07 +02001559 if (conf->listeners.n != conf->listeners.p) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001560 memprintf(err, "'%s' can only be used with a single socket", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001561 return ERR_ALERT | ERR_FATAL;
1562 }
1563
1564 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001565 memprintf(err, "'%s' : expects an integer argument", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001566 return ERR_ALERT | ERR_FATAL;
1567 }
1568
Willy Tarreau4348fad2012-09-20 16:48:07 +02001569 new = LIST_NEXT(&conf->listeners, struct listener *, by_bind);
Thierry Fourniere7fe8eb2016-02-26 08:45:58 +01001570 new->luid = strtol(args[cur_arg + 1], &error, 10);
1571 if (*error != '\0') {
1572 memprintf(err, "'%s' : expects an integer argument, found '%s'", args[cur_arg], args[cur_arg + 1]);
1573 return ERR_ALERT | ERR_FATAL;
1574 }
Willy Tarreau4348fad2012-09-20 16:48:07 +02001575 new->conf.id.key = new->luid;
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001576
Willy Tarreau4348fad2012-09-20 16:48:07 +02001577 if (new->luid <= 0) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001578 memprintf(err, "'%s' : custom id has to be > 0", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001579 return ERR_ALERT | ERR_FATAL;
1580 }
1581
Willy Tarreau4348fad2012-09-20 16:48:07 +02001582 node = eb32_lookup(&px->conf.used_listener_id, new->luid);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001583 if (node) {
1584 l = container_of(node, struct listener, conf.id);
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001585 memprintf(err, "'%s' : custom id %d already used at %s:%d ('bind %s')",
1586 args[cur_arg], l->luid, l->bind_conf->file, l->bind_conf->line,
1587 l->bind_conf->arg);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001588 return ERR_ALERT | ERR_FATAL;
1589 }
1590
Willy Tarreau4348fad2012-09-20 16:48:07 +02001591 eb32_insert(&px->conf.used_listener_id, &new->conf.id);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001592 return 0;
1593}
1594
/* Complete a bind_conf by parsing the args after the address. <args> is the
 * arguments array, <cur_arg> is the first one to be considered. <section> is
 * the section name to report in error messages, and <file> and <linenum> are
 * the file name and line number respectively. Note that args[0..1] are used
 * in error messages to provide some context. The return value is an error
 * code, zero on success or an OR of ERR_{FATAL,ABORT,ALERT,WARN}.
 *
 * Parsing stops at the first unknown keyword, at the first known keyword which
 * has no parser, or at the first parser reporting ERR_FATAL. Once all keywords
 * were processed, the datagram/stream options are checked for consistency and
 * the transport layer is switched to QUIC or SSL when the options require it.
 */
int bind_parse_args_list(struct bind_conf *bind_conf, char **args, int cur_arg, const char *section, const char *file, int linenum)
{
	int err_code = 0;

	/* the arguments list ends with an empty string */
	while (*(args[cur_arg])) {
		struct bind_kw *kw;
		const char *best;

		kw = bind_find_kw(args[cur_arg]);
		if (kw) {
			char *err = NULL;
			int code;

			/* known keyword registered without a parser */
			if (!kw->parse) {
				ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : '%s' option is not implemented in this version (check build options).\n",
					 file, linenum, args[0], args[1], section, args[cur_arg]);
				cur_arg += 1 + kw->skip ;
				err_code |= ERR_ALERT | ERR_FATAL;
				goto out;
			}

			/* the codes returned by all parsers are accumulated */
			code = kw->parse(args, cur_arg, bind_conf->frontend, bind_conf, &err);
			err_code |= code;

			if (code) {
				if (err && *err) {
					indent_msg(&err, 2);
					/* only a pure warning (ERR_WARN without
					 * ERR_ALERT) is emitted as a warning.
					 */
					if (((code & (ERR_WARN|ERR_ALERT)) == ERR_WARN))
						ha_warning("parsing [%s:%d] : '%s %s' in section '%s' : %s\n", file, linenum, args[0], args[1], section, err);
					else
						ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : %s\n", file, linenum, args[0], args[1], section, err);
				}
				else
					ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : error encountered while processing '%s'.\n",
						 file, linenum, args[0], args[1], section, args[cur_arg]);
				if (code & ERR_FATAL) {
					free(err);
					cur_arg += 1 + kw->skip;
					goto out;
				}
			}
			free(err);
			/* skip the keyword itself and the arguments it consumed */
			cur_arg += 1 + kw->skip;
			continue;
		}

		/* unknown keyword: try to suggest the closest known one */
		best = bind_find_best_kw(args[cur_arg]);
		if (best)
			ha_alert("parsing [%s:%d] : '%s %s' in section '%s': unknown keyword '%s'; did you mean '%s' maybe ?\n",
				 file, linenum, args[0], args[1], section, args[cur_arg], best);
		else
			ha_alert("parsing [%s:%d] : '%s %s' in section '%s': unknown keyword '%s'.\n",
				 file, linenum, args[0], args[1], section, args[cur_arg]);

		err_code |= ERR_ALERT | ERR_FATAL;
		goto out;
	}

	/* both the DGRAM and STREAM flags set at the socket level, or both set
	 * at the transport level, is a configuration error.
	 */
	if ((bind_conf->options & (BC_O_USE_SOCK_DGRAM|BC_O_USE_SOCK_STREAM)) == (BC_O_USE_SOCK_DGRAM|BC_O_USE_SOCK_STREAM) ||
	    (bind_conf->options & (BC_O_USE_XPRT_DGRAM|BC_O_USE_XPRT_STREAM)) == (BC_O_USE_XPRT_DGRAM|BC_O_USE_XPRT_STREAM)) {
		ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : cannot mix datagram and stream protocols.\n",
			 file, linenum, args[0], args[1], section);
		err_code |= ERR_ALERT | ERR_FATAL;
		goto out;
	}

	/* The transport layer automatically switches to QUIC when QUIC is
	 * selected, regardless of bind_conf settings. We then need to
	 * initialize QUIC params.
	 */
	if ((bind_conf->options & (BC_O_USE_SOCK_DGRAM|BC_O_USE_XPRT_STREAM)) == (BC_O_USE_SOCK_DGRAM|BC_O_USE_XPRT_STREAM)) {
#ifdef USE_QUIC
		bind_conf->xprt = xprt_get(XPRT_QUIC);
		/* SSL is forced on when it was not explicitly requested */
		if (!(bind_conf->options & BC_O_USE_SSL)) {
			bind_conf->options |= BC_O_USE_SSL;
			ha_warning("parsing [%s:%d] : '%s %s' in section '%s' : QUIC protocol detected, enabling ssl. Use 'ssl' to shut this warning.\n",
				   file, linenum, args[0], args[1], section);
		}
		quic_transport_params_init(&bind_conf->quic_params, 1);
#else
		ha_alert("parsing [%s:%d] : '%s %s' in section '%s' : QUIC protocol selected but support not compiled in (check build options).\n",
			 file, linenum, args[0], args[1], section);
		err_code |= ERR_ALERT | ERR_FATAL;
		goto out;
#endif
	}
	else if (bind_conf->options & BC_O_USE_SSL) {
		bind_conf->xprt = xprt_get(XPRT_SSL);
	}

 out:
	return err_code;
}
1695
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001696/* parse the "maxconn" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001697static int bind_parse_maxconn(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001698{
1699 struct listener *l;
1700 int val;
1701
1702 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001703 memprintf(err, "'%s' : missing value", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001704 return ERR_ALERT | ERR_FATAL;
1705 }
1706
1707 val = atol(args[cur_arg + 1]);
Willy Tarreaua8cf66b2019-02-27 16:49:00 +01001708 if (val < 0) {
1709 memprintf(err, "'%s' : invalid value %d, must be >= 0", args[cur_arg], val);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001710 return ERR_ALERT | ERR_FATAL;
1711 }
1712
Willy Tarreau4348fad2012-09-20 16:48:07 +02001713 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001714 l->maxconn = val;
1715
1716 return 0;
1717}
1718
1719/* parse the "name" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001720static int bind_parse_name(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001721{
1722 struct listener *l;
1723
1724 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001725 memprintf(err, "'%s' : missing name", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001726 return ERR_ALERT | ERR_FATAL;
1727 }
1728
Willy Tarreau4348fad2012-09-20 16:48:07 +02001729 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001730 l->name = strdup(args[cur_arg + 1]);
1731
1732 return 0;
1733}
1734
1735/* parse the "nice" bind keyword */
Willy Tarreau4348fad2012-09-20 16:48:07 +02001736static int bind_parse_nice(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001737{
1738 struct listener *l;
1739 int val;
1740
1741 if (!*args[cur_arg + 1]) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001742 memprintf(err, "'%s' : missing value", args[cur_arg]);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001743 return ERR_ALERT | ERR_FATAL;
1744 }
1745
1746 val = atol(args[cur_arg + 1]);
1747 if (val < -1024 || val > 1024) {
Willy Tarreaueb6cead2012-09-20 19:43:14 +02001748 memprintf(err, "'%s' : invalid value %d, allowed range is -1024..1024", args[cur_arg], val);
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001749 return ERR_ALERT | ERR_FATAL;
1750 }
1751
Willy Tarreau4348fad2012-09-20 16:48:07 +02001752 list_for_each_entry(l, &conf->listeners, by_bind)
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001753 l->nice = val;
1754
1755 return 0;
1756}
1757
Willy Tarreau6ae1ba62014-05-07 19:01:58 +02001758/* parse the "process" bind keyword */
1759static int bind_parse_process(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1760{
Willy Tarreauacd64412022-07-15 17:16:01 +02001761 memprintf(err, "'process %s' on 'bind' lines is not supported anymore, please use 'thread' instead.", args[cur_arg+1]);
1762 return ERR_ALERT | ERR_FATAL;
Willy Tarreau6ae1ba62014-05-07 19:01:58 +02001763}
Willy Tarreau3dcc3412012-09-18 17:17:28 +02001764
Christopher Fauleta717b992018-04-10 14:43:00 +02001765/* parse the "proto" bind keyword */
1766static int bind_parse_proto(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1767{
1768 struct ist proto;
1769
1770 if (!*args[cur_arg + 1]) {
1771 memprintf(err, "'%s' : missing value", args[cur_arg]);
1772 return ERR_ALERT | ERR_FATAL;
1773 }
1774
Tim Duesterhusdcf753a2021-03-04 17:31:47 +01001775 proto = ist(args[cur_arg + 1]);
Christopher Fauleta717b992018-04-10 14:43:00 +02001776 conf->mux_proto = get_mux_proto(proto);
1777 if (!conf->mux_proto) {
1778 memprintf(err, "'%s' : unknown MUX protocol '%s'", args[cur_arg], args[cur_arg+1]);
1779 return ERR_ALERT | ERR_FATAL;
1780 }
Willy Tarreauc8cac042021-09-21 14:31:29 +02001781 return 0;
1782}
1783
Willy Tarreau6dfbef42021-10-12 15:23:03 +02001784/* parse the "shards" bind keyword. Takes an integer or "by-thread" */
1785static int bind_parse_shards(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1786{
1787 int val;
1788
1789 if (!*args[cur_arg + 1]) {
1790 memprintf(err, "'%s' : missing value", args[cur_arg]);
1791 return ERR_ALERT | ERR_FATAL;
1792 }
1793
1794 if (strcmp(args[cur_arg + 1], "by-thread") == 0) {
1795 val = MAX_THREADS; /* will be trimmed later anyway */
1796 } else {
1797 val = atol(args[cur_arg + 1]);
1798 if (val < 1 || val > MAX_THREADS) {
1799 memprintf(err, "'%s' : invalid value %d, allowed range is %d..%d or 'by-thread'", args[cur_arg], val, 1, MAX_THREADS);
1800 return ERR_ALERT | ERR_FATAL;
1801 }
1802 }
1803
1804 conf->settings.shards = val;
1805 return 0;
1806}
1807
Willy Tarreauc8cac042021-09-21 14:31:29 +02001808/* parse the "thread" bind keyword */
1809static int bind_parse_thread(char **args, int cur_arg, struct proxy *px, struct bind_conf *conf, char **err)
1810{
Willy Tarreaud57b9ff2021-09-29 18:50:31 +02001811 char *sep = NULL;
1812 ulong thread = 0;
1813 long tgroup = 0;
Willy Tarreauc8cac042021-09-21 14:31:29 +02001814
Willy Tarreaud57b9ff2021-09-29 18:50:31 +02001815 tgroup = strtol(args[cur_arg + 1], &sep, 10);
1816 if (*sep == '/') {
1817 /* a thread group was present */
1818 if (tgroup < 1 || tgroup > MAX_TGROUPS) {
1819 memprintf(err, "'%s' thread-group number must be between 1 and %d (was %ld)", args[cur_arg + 1], MAX_TGROUPS, tgroup);
1820 return ERR_ALERT | ERR_FATAL;
1821 }
1822 sep++;
1823 }
1824 else {
1825 /* no thread group */
1826 tgroup = 0;
1827 sep = args[cur_arg + 1];
1828 }
Willy Tarreauc8cac042021-09-21 14:31:29 +02001829
Willy Tarreau01cac3f2021-10-12 08:47:54 +02001830 if ((conf->bind_tgroup || conf->bind_thread) &&
1831 conf->bind_tgroup != tgroup) {
Willy Tarreaud57b9ff2021-09-29 18:50:31 +02001832 memprintf(err, "'%s' multiple thread-groups are not supported", args[cur_arg + 1]);
Willy Tarreauc8cac042021-09-21 14:31:29 +02001833 return ERR_ALERT | ERR_FATAL;
1834 }
Willy Tarreau740038c2022-07-15 17:18:23 +02001835
1836 if (parse_process_number(sep, &thread, LONGBITS, NULL, err)) {
Willy Tarreaud57b9ff2021-09-29 18:50:31 +02001837 memprintf(err, "'%s' : %s", sep, *err);
Willy Tarreauc8cac042021-09-21 14:31:29 +02001838 return ERR_ALERT | ERR_FATAL;
1839 }
1840
Willy Tarreau01cac3f2021-10-12 08:47:54 +02001841 conf->bind_thread |= thread;
1842 conf->bind_tgroup = tgroup;
Christopher Fauleta717b992018-04-10 14:43:00 +02001843 return 0;
1844}
1845
Willy Tarreau7ac908b2019-02-27 12:02:18 +01001846/* config parser for global "tune.listener.multi-queue", accepts "on" or "off" */
1847static int cfg_parse_tune_listener_mq(char **args, int section_type, struct proxy *curpx,
Willy Tarreau01825162021-03-09 09:53:46 +01001848 const struct proxy *defpx, const char *file, int line,
Willy Tarreau7ac908b2019-02-27 12:02:18 +01001849 char **err)
1850{
1851 if (too_many_args(1, args, err, NULL))
1852 return -1;
1853
1854 if (strcmp(args[1], "on") == 0)
1855 global.tune.options |= GTUNE_LISTENER_MQ;
1856 else if (strcmp(args[1], "off") == 0)
1857 global.tune.options &= ~GTUNE_LISTENER_MQ;
1858 else {
1859 memprintf(err, "'%s' expects either 'on' or 'off' but got '%s'.", args[0], args[1]);
1860 return -1;
1861 }
1862 return 0;
1863}
1864
/* Sample fetch keywords provided by this file, each associated with the
 * function implementing it above. The list is handed over to
 * sample_register_fetches() by the INITCALL below.
 * Note: must not be declared <const> as its list will be overwritten.
 * Please take care of keeping this list alphabetically sorted.
 */
static struct sample_fetch_kw_list smp_kws = {ILH, {
	{ "dst_conn", smp_fetch_dconn, 0, NULL, SMP_T_SINT, SMP_USE_FTEND, },
	{ "so_id", smp_fetch_so_id, 0, NULL, SMP_T_SINT, SMP_USE_FTEND, },
	{ "so_name", smp_fetch_so_name, 0, NULL, SMP_T_STR, SMP_USE_FTEND, },
	{ /* END */ },
}};

INITCALL1(STG_REGISTER, sample_register_fetches, &smp_kws);
1876
/* ACL keywords provided by this file: the list is currently empty and only
 * holds its end marker. It is handed over to acl_register_keywords() by the
 * INITCALL below.
 * Note: must not be declared <const> as its list will be overwritten.
 * Please take care of keeping this list alphabetically sorted.
 */
static struct acl_kw_list acl_kws = {ILH, {
	{ /* END */ },
}};

INITCALL1(STG_REGISTER, acl_register_keywords, &acl_kws);
1885
/* "bind" keywords provided by this file. Each entry holds the keyword, its
 * parsing function and the number of arguments to skip after the keyword. The
 * list is handed over to bind_register_keywords() by the INITCALL below.
 * Note: must not be declared <const> as its list will be overwritten.
 * Please take care of keeping this list alphabetically sorted, doing so helps
 * all code contributors.
 * Optional keywords are also declared with a NULL ->parse() function so that
 * the config parser can report an appropriate error when a known keyword was
 * not enabled.
 */
static struct bind_kw_list bind_kws = { "ALL", { }, {
	{ "accept-netscaler-cip", bind_parse_accept_netscaler_cip, 1 }, /* enable NetScaler Client IP insertion protocol */
	{ "accept-proxy", bind_parse_accept_proxy, 0 }, /* enable PROXY protocol */
	{ "backlog", bind_parse_backlog, 1 }, /* set backlog of listening socket */
	{ "id", bind_parse_id, 1 }, /* set id of listening socket */
	{ "maxconn", bind_parse_maxconn, 1 }, /* set maxconn of listening socket */
	{ "name", bind_parse_name, 1 }, /* set name of listening socket */
	{ "nice", bind_parse_nice, 1 }, /* set nice of listening socket */
	{ "process", bind_parse_process, 1 }, /* no longer supported: always rejected with an error pointing to "thread" */
	{ "proto", bind_parse_proto, 1 }, /* set the proto to use for all incoming connections */
	{ "shards", bind_parse_shards, 1 }, /* set number of shards */
	{ "thread", bind_parse_thread, 1 }, /* set list of allowed threads for this socket */
	{ /* END */ },
}};

INITCALL1(STG_REGISTER, bind_register_keywords, &bind_kws);
1909
/* config keyword parsers: global section keywords provided by this file. The
 * list is handed over to cfg_register_keywords() by the INITCALL below.
 */
static struct cfg_kw_list cfg_kws = {ILH, {
	{ CFG_GLOBAL, "tune.listener.multi-queue", cfg_parse_tune_listener_mq },
	{ 0, NULL, NULL }
}};

INITCALL1(STG_REGISTER, cfg_register_keywords, &cfg_kws);
1917
Willy Tarreau645513a2010-05-24 20:55:15 +02001918/*
1919 * Local variables:
1920 * c-indent-level: 8
1921 * c-basic-offset: 8
1922 * End:
1923 */