blob: 505291f9a259775eccf797d9f19306013230c236 [file] [log] [blame]
/*
 * include/types/fd.h
 * File descriptors states - check src/fd.c for explanations.
 *
 * Copyright (C) 2000-2014 Willy Tarreau - w@1wt.eu
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation, version 2.1
 * exclusively.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 */
Willy Tarreaubaaee002006-06-26 02:48:02 +020021
22#ifndef _TYPES_FD_H
23#define _TYPES_FD_H
24
Willy Tarreau4c7e4b72020-05-27 12:58:42 +020025#include <haproxy/api-t.h>
Willy Tarreaueb6f7012020-05-27 16:21:26 +020026#include <import/ist.h>
Willy Tarreaudd2f85e2012-09-02 22:34:23 +020027#include <types/port_range.h>
Willy Tarreaubaaee002006-06-26 02:48:02 +020028
/* Direction for each FD event update. The two enumerators have the explicit
 * values 0 and 1.
 */
enum {
	DIR_RD = 0,
	DIR_WR = 1,
};
Willy Tarreaubaaee002006-06-26 02:48:02 +020034
/* Polling status flags returned in fdtab[].ev :
 * FD_POLL_IN remains set as long as some data is pending for read.
 * FD_POLL_OUT remains set as long as the fd accepts to write data.
 * FD_POLL_ERR and FD_POLL_HUP remain set forever (until processed).
 */
#define FD_POLL_IN      0x01
#define FD_POLL_PRI     0x02
#define FD_POLL_OUT     0x04
#define FD_POLL_ERR     0x08
#define FD_POLL_HUP     0x10

/* FD_POLL_DATA groups the two data-related flags (IN and OUT), while
 * FD_POLL_STICKY groups the two flags which remain set until processed
 * (ERR and HUP).
 */
#define FD_POLL_DATA    (FD_POLL_IN  | FD_POLL_OUT)
#define FD_POLL_STICKY  (FD_POLL_ERR | FD_POLL_HUP)
Willy Tarreau3d32d3a2007-04-15 11:31:05 +020048
/* FD_EV_* are the values used in fdtab[].state to define the polling states in
 * each direction. Most of them are manipulated using test-and-set operations
 * which require the bit position in the mask, which is given in the _BIT
 * variant.
 */

/* bits positions for a few flags: the read side uses bits 0..2 and the write
 * side uses bits 4..6, bit 7 being the error flag shared by both directions.
 */
#define FD_EV_ACTIVE_R_BIT 0
#define FD_EV_READY_R_BIT  1
#define FD_EV_SHUT_R_BIT   2
/* unused: 3 */

#define FD_EV_ACTIVE_W_BIT 4
#define FD_EV_READY_W_BIT  5
#define FD_EV_SHUT_W_BIT   6
#define FD_EV_ERR_RW_BIT   7

/* and flag values */
#define FD_EV_ACTIVE_R  (1U << FD_EV_ACTIVE_R_BIT)
#define FD_EV_ACTIVE_W  (1U << FD_EV_ACTIVE_W_BIT)
#define FD_EV_ACTIVE_RW (FD_EV_ACTIVE_R | FD_EV_ACTIVE_W)

#define FD_EV_READY_R   (1U << FD_EV_READY_R_BIT)
#define FD_EV_READY_W   (1U << FD_EV_READY_W_BIT)
#define FD_EV_READY_RW  (FD_EV_READY_R | FD_EV_READY_W)

/* note that when FD_EV_SHUT is set, ACTIVE and READY are cleared */
#define FD_EV_SHUT_R    (1U << FD_EV_SHUT_R_BIT)
#define FD_EV_SHUT_W    (1U << FD_EV_SHUT_W_BIT)
#define FD_EV_SHUT_RW   (FD_EV_SHUT_R | FD_EV_SHUT_W)

/* note that when FD_EV_ERR is set, SHUT is also set. Also, ERR is for both
 * directions at once (write error, socket dead, etc).
 */
#define FD_EV_ERR_RW    (1U << FD_EV_ERR_RW_BIT)
Willy Tarreau77abb432019-09-06 18:27:02 +020084
Willy Tarreau733b1322016-11-17 14:22:52 +010085
/* This is the value used to mark a file descriptor as dead. This value is
 * negative, this is important so that tests on fd < 0 properly match. It
 * also has the nice property of being highly negative but neither overflowing
 * nor changing sign on 32-bit machines when multiplied by sizeof(fdtab).
 * This ensures that any unexpected dereference of such an uninitialized
 * file descriptor will lead to so large a dereference that it will crash
 * the process at the exact location of the bug with a clean stack trace
 * instead of causing silent manipulation of other FDs. And it's readable
 * when found in a dump.
 *
 * NOTE(review): where int is 32 bits wide, the hexadecimal constant below
 * does not fit in an int and thus has an unsigned type; it only becomes
 * negative once converted to int (e.g. stored into an int fd). Comparing the
 * macro itself against 0 would therefore not match - confirm that all users
 * test the int variable and not the macro.
 */
#define DEAD_FD_MAGIC 0xFDDEADFD
97
/* fdlist_entry: entry used by the fd cache.
 *    >= 0 means we're in the cache and gives the FD of the next in the cache,
 *      -1 means we're in the cache and the last element,
 *      -2 means the entry is locked,
 *   <= -3 means not in the cache, and next element is -4-fd
 *
 * It must remain 8-aligned so that aligned CAS operations may be done on both
 * entries at once.
 */
struct fdlist_entry {
	int next;
	int prev;
} __attribute__ ((aligned(8)));
111
/* head of the fd cache. It holds two int fields (first and last) and is
 * 8-aligned, like struct fdlist_entry.
 */
struct fdlist {
	int first;
	int last;
} __attribute__ ((aligned(8)));
117
Willy Tarreaubaaee002006-06-26 02:48:02 +0200118/* info about one given fd */
119struct fdtab {
Ilya Shipitsin856aabc2020-04-16 23:51:34 +0500120 unsigned long running_mask; /* mask of thread IDs currently using the fd */
Olivier Houcharda7bf5732020-02-27 17:26:13 +0100121 unsigned long thread_mask; /* mask of thread IDs authorized to process the fd */
Willy Tarreauebc78d72018-01-20 23:53:50 +0100122 unsigned long update_mask; /* mask of thread IDs having an update for fd */
Olivier Houchard6b96f722018-04-25 16:58:25 +0200123 struct fdlist_entry update; /* Entry in the global update list */
Willy Tarreau7a798e52016-04-14 11:13:20 +0200124 void (*iocb)(int fd); /* I/O handler */
Willy Tarreau80184712012-07-06 14:54:49 +0200125 void *owner; /* the connection or listener associated with this fd, NULL if closed */
Willy Tarreaua135ea62020-02-21 16:26:19 +0100126 unsigned char state; /* FD state for read and write directions (FD_EV_*) */
Willy Tarreau3d32d3a2007-04-15 11:31:05 +0200127 unsigned char ev; /* event seen in return of poll() : FD_POLL_* */
Willy Tarreauad38ace2013-12-15 14:19:38 +0100128 unsigned char linger_risk:1; /* 1 if we must kill lingering before closing */
Conrad Hoffmann041751c2014-05-20 14:28:24 +0200129 unsigned char cloned:1; /* 1 if a cloned socket, requires EPOLL_CTL_DEL on close */
Willy Tarreaud6609902019-08-30 14:36:10 +0200130 unsigned char initialized:1; /* 1 if init phase was done on this fd (e.g. set non-blocking) */
Willy Tarreau76913d32019-08-30 14:33:11 +0200131}
132#ifdef USE_THREAD
133/* only align on cache lines when using threads; 32-bit small archs
134 * can put everything in 32-bytes when threads are disabled.
135 */
136__attribute__((aligned(64)))
137#endif
138;
Willy Tarreau8d5d77e2009-10-18 07:25:52 +0200139
/* less often used information */
struct fdinfo {
	struct port_range *port_range;       /* optional port range to bind to */
	int local_port;                      /* optional local port */
};
145
/*
 * Poller descriptors.
 *  - <name> is initialized by the poller's register() function, and should not
 *    be allocated, just linked to.
 *  - <pref> is initialized by the poller's register() function. It is set to 0
 *    by default, meaning the poller is disabled. init() should set it to 0 in
 *    case of failure. term() must set it to 0. A generic unoptimized select()
 *    poller should set it to 100.
 *  - <private> is initialized by the poller's init() function, and cleaned by
 *    the term() function.
 *  - clo() should be used to indicate to the poller that fd will be closed.
 *  - poll() calls the poller, expiring at <exp>, or immediately if <wake> is set
 *  - flags indicate what the poller supports (HAP_POLL_F_*)
 */

#define HAP_POLL_F_RDHUP  0x00000001                         /* the poller notifies of HUP with reads */
#define HAP_POLL_F_ERRHUP 0x00000002                         /* the poller reports ERR and HUP */

struct poller {
	void   *private;                                     /* any private data for the poller */
	void (*clo)(const int fd);                           /* mark <fd> as closed */
	void (*poll)(struct poller *p, int exp, int wake);   /* the poller itself */
	int  (*init)(struct poller *p);                      /* poller initialization */
	void (*term)(struct poller *p);                      /* termination of this poller */
	int  (*test)(struct poller *p);                      /* pre-init check of the poller */
	int  (*fork)(struct poller *p);                      /* post-fork re-opening */
	const char   *name;                                  /* poller name */
	unsigned int flags;                                  /* HAP_POLL_F_* */
	int    pref;                                         /* try pollers with higher preference first */
};
176
177extern struct poller cur_poller; /* the current poller */
178extern int nbpollers;
179#define MAX_POLLERS 10
180extern struct poller pollers[MAX_POLLERS]; /* all registered pollers */
181
extern struct fdtab *fdtab;             /* array of all the file descriptors */
extern struct fdinfo *fdinfo;           /* less-often used infos for file descriptors */
extern int totalconn;                   /* total # of terminated sessions */
extern int actconn;                     /* # of active sessions */
186
187#endif /* _TYPES_FD_H */
188
/*
 * Local variables:
 *  c-indent-level: 8
 *  c-basic-offset: 8
 * End:
 */