Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 1 | /* |
| 2 | * QUIC socket management. |
| 3 | * |
Willy Tarreau | 3dfb7da | 2022-03-02 22:33:39 +0100 | [diff] [blame] | 4 | * Copyright 2020 HAProxy Technologies, Frederic Lecaille <flecaille@haproxy.com> |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 5 | * |
| 6 | * This program is free software; you can redistribute it and/or |
| 7 | * modify it under the terms of the GNU General Public License |
| 8 | * as published by the Free Software Foundation; either version |
| 9 | * 2 of the License, or (at your option) any later version. |
| 10 | * |
| 11 | */ |
| 12 | |
| 13 | #include <errno.h> |
| 14 | |
| 15 | #include <sys/socket.h> |
| 16 | #include <sys/types.h> |
| 17 | |
| 18 | #include <haproxy/connection.h> |
| 19 | #include <haproxy/listener.h> |
Frédéric Lécaille | 6492e66 | 2022-05-17 17:23:16 +0200 | [diff] [blame] | 20 | #include <haproxy/proto_quic.h> |
Amaury Denoyelle | 4d29504 | 2022-01-19 16:18:44 +0100 | [diff] [blame] | 21 | #include <haproxy/quic_sock.h> |
Amaury Denoyelle | eb01f59 | 2021-10-07 16:44:05 +0200 | [diff] [blame] | 22 | #include <haproxy/session.h> |
Amaury Denoyelle | 777969c | 2022-03-24 16:06:26 +0100 | [diff] [blame] | 23 | #include <haproxy/tools.h> |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 24 | #include <haproxy/xprt_quic.h> |
| 25 | |
| 26 | /* This function is called from the protocol layer accept() in order to |
| 27 | * instantiate a new session on behalf of a given listener and frontend. It |
| 28 | * returns a positive value upon success, 0 if the connection can be ignored, |
| 29 | * or a negative value upon critical failure. The accepted connection is |
| 30 | * closed if we return <= 0. If no handshake is needed, it immediately tries |
| 31 | * to instantiate a new stream. The connection must already have been filled |
| 32 | * with the incoming connection handle (a fd), a target (the listener) and a |
| 33 | * source address. |
| 34 | */ |
| 35 | int quic_session_accept(struct connection *cli_conn) |
| 36 | { |
| 37 | struct listener *l = __objt_listener(cli_conn->target); |
| 38 | struct proxy *p = l->bind_conf->frontend; |
| 39 | struct session *sess; |
| 40 | |
| 41 | cli_conn->proxy_netns = l->rx.settings->netns; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 42 | /* This flag is ordinarily set by conn_ctrl_init() which cannot |
| 43 | * be called for now. |
| 44 | */ |
| 45 | cli_conn->flags |= CO_FL_CTRL_READY; |
| 46 | |
| 47 | /* wait for a PROXY protocol header */ |
| 48 | if (l->options & LI_O_ACC_PROXY) |
| 49 | cli_conn->flags |= CO_FL_ACCEPT_PROXY; |
| 50 | |
| 51 | /* wait for a NetScaler client IP insertion protocol header */ |
| 52 | if (l->options & LI_O_ACC_CIP) |
| 53 | cli_conn->flags |= CO_FL_ACCEPT_CIP; |
| 54 | |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 55 | /* Add the handshake pseudo-XPRT */ |
| 56 | if (cli_conn->flags & (CO_FL_ACCEPT_PROXY | CO_FL_ACCEPT_CIP)) { |
| 57 | if (xprt_add_hs(cli_conn) != 0) |
| 58 | goto out_free_conn; |
| 59 | } |
Olivier Houchard | 1b3c931 | 2021-03-05 23:37:48 +0100 | [diff] [blame] | 60 | |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 61 | sess = session_new(p, l, &cli_conn->obj_type); |
| 62 | if (!sess) |
| 63 | goto out_free_conn; |
| 64 | |
| 65 | conn_set_owner(cli_conn, sess, NULL); |
| 66 | |
Frédéric Lécaille | ecb5872 | 2021-05-27 17:12:36 +0200 | [diff] [blame] | 67 | if (conn_complete_session(cli_conn) < 0) |
| 68 | goto out_free_sess; |
| 69 | |
Amaury Denoyelle | 622ec41 | 2022-04-13 16:58:26 +0200 | [diff] [blame] | 70 | if (conn_xprt_start(cli_conn) < 0) { |
| 71 | /* conn_complete_session has succeeded : conn is the owner of |
| 72 | * the session and the MUX is initialized. |
| 73 | * Let the MUX free all resources on error. |
| 74 | */ |
| 75 | cli_conn->mux->destroy(cli_conn->ctx); |
| 76 | return -1; |
| 77 | } |
| 78 | |
| 79 | return 1; |
Frédéric Lécaille | 27faba7 | 2021-03-03 16:21:00 +0100 | [diff] [blame] | 80 | |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 81 | out_free_sess: |
| 82 | /* prevent call to listener_release during session_free. It will be |
| 83 | * done below, for all errors. */ |
| 84 | sess->listener = NULL; |
| 85 | session_free(sess); |
| 86 | out_free_conn: |
Willy Tarreau | 784b868 | 2022-04-11 14:18:10 +0200 | [diff] [blame] | 87 | cli_conn->handle.qc->conn = NULL; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 88 | conn_stop_tracking(cli_conn); |
| 89 | conn_xprt_close(cli_conn); |
| 90 | conn_free(cli_conn); |
| 91 | out: |
| 92 | |
Frédéric Lécaille | e8139f3 | 2021-03-11 17:06:30 +0100 | [diff] [blame] | 93 | return -1; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 94 | } |
| 95 | |
Willy Tarreau | cdf7c8e | 2022-04-11 16:20:00 +0200 | [diff] [blame] | 96 | /* Retrieve a connection's source address. Returns -1 on failure. */ |
| 97 | int quic_sock_get_src(struct connection *conn, struct sockaddr *addr, socklen_t len) |
| 98 | { |
| 99 | struct quic_conn *qc; |
| 100 | |
Willy Tarreau | 784b868 | 2022-04-11 14:18:10 +0200 | [diff] [blame] | 101 | if (!conn || !conn->handle.qc) |
Willy Tarreau | cdf7c8e | 2022-04-11 16:20:00 +0200 | [diff] [blame] | 102 | return -1; |
| 103 | |
Willy Tarreau | 784b868 | 2022-04-11 14:18:10 +0200 | [diff] [blame] | 104 | qc = conn->handle.qc; |
Willy Tarreau | cdf7c8e | 2022-04-11 16:20:00 +0200 | [diff] [blame] | 105 | if (conn_is_back(conn)) { |
| 106 | /* no source address defined for outgoing connections for now */ |
| 107 | return -1; |
| 108 | } else { |
| 109 | /* front connection, return the peer's address */ |
| 110 | if (len > sizeof(qc->peer_addr)) |
| 111 | len = sizeof(qc->peer_addr); |
| 112 | memcpy(addr, &qc->peer_addr, len); |
| 113 | return 0; |
| 114 | } |
| 115 | } |
| 116 | |
| 117 | /* Retrieve a connection's destination address. Returns -1 on failure. */ |
| 118 | int quic_sock_get_dst(struct connection *conn, struct sockaddr *addr, socklen_t len) |
| 119 | { |
| 120 | struct quic_conn *qc; |
| 121 | |
Willy Tarreau | 784b868 | 2022-04-11 14:18:10 +0200 | [diff] [blame] | 122 | if (!conn || !conn->handle.qc) |
Willy Tarreau | cdf7c8e | 2022-04-11 16:20:00 +0200 | [diff] [blame] | 123 | return -1; |
| 124 | |
Willy Tarreau | 784b868 | 2022-04-11 14:18:10 +0200 | [diff] [blame] | 125 | qc = conn->handle.qc; |
Willy Tarreau | cdf7c8e | 2022-04-11 16:20:00 +0200 | [diff] [blame] | 126 | if (conn_is_back(conn)) { |
| 127 | /* back connection, return the peer's address */ |
| 128 | if (len > sizeof(qc->peer_addr)) |
| 129 | len = sizeof(qc->peer_addr); |
| 130 | memcpy(addr, &qc->peer_addr, len); |
| 131 | } else { |
| 132 | /* FIXME: front connection, no local address for now, we'll |
| 133 | * return the listener's address instead. |
| 134 | */ |
| 135 | BUG_ON(!qc->li); |
| 136 | |
| 137 | if (len > sizeof(qc->li->rx.addr)) |
| 138 | len = sizeof(qc->li->rx.addr); |
| 139 | memcpy(addr, &qc->li->rx.addr, len); |
| 140 | } |
| 141 | return 0; |
| 142 | } |
| 143 | |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 144 | /* |
| 145 | * Inspired from session_accept_fd(). |
| 146 | * Instantiate a new connection (connection struct) to be attached to <qc> |
| 147 | * QUIC connection of <l> listener. |
| 148 | * Returns 1 if succeeded, 0 if not. |
| 149 | */ |
| 150 | static int new_quic_cli_conn(struct quic_conn *qc, struct listener *l, |
| 151 | struct sockaddr_storage *saddr) |
| 152 | { |
| 153 | struct connection *cli_conn; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 154 | |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 155 | if (unlikely((cli_conn = conn_new(&l->obj_type)) == NULL)) |
| 156 | goto out; |
| 157 | |
Willy Tarreau | 9cc88c3 | 2022-04-08 14:34:31 +0200 | [diff] [blame] | 158 | if (!sockaddr_alloc(&cli_conn->src, saddr, sizeof *saddr)) |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 159 | goto out_free_conn; |
| 160 | |
Willy Tarreau | 030b3e6 | 2022-05-02 17:47:46 +0200 | [diff] [blame] | 161 | cli_conn->flags |= CO_FL_FDLESS; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 162 | qc->conn = cli_conn; |
Willy Tarreau | 784b868 | 2022-04-11 14:18:10 +0200 | [diff] [blame] | 163 | cli_conn->handle.qc = qc; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 164 | |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 165 | cli_conn->target = &l->obj_type; |
| 166 | |
Frédéric Lécaille | 01ab661 | 2021-06-14 10:31:43 +0200 | [diff] [blame] | 167 | /* We need the xprt context before accepting (->accept()) the connection: |
| 168 | * we may receive packet before this connection acception. |
| 169 | */ |
| 170 | if (conn_prepare(cli_conn, l->rx.proto, l->bind_conf->xprt) < 0) |
| 171 | goto out_free_conn; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 172 | |
| 173 | return 1; |
| 174 | |
| 175 | out_free_conn: |
Frédéric Lécaille | 01ab661 | 2021-06-14 10:31:43 +0200 | [diff] [blame] | 176 | qc->conn = NULL; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 177 | conn_stop_tracking(cli_conn); |
| 178 | conn_xprt_close(cli_conn); |
| 179 | conn_free(cli_conn); |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 180 | out: |
| 181 | |
| 182 | return 0; |
| 183 | } |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 184 | |
/* Tells whether receiver <rx> supports accepting connections. The receiver is
 * not inspected: the answer is always positive (1).
 */
int quic_sock_accepting_conn(const struct receiver *rx)
{
	(void)rx;

	return 1;
}
| 192 | |
| 193 | /* Accept an incoming connection from listener <l>, and return it, as well as |
| 194 | * a CO_AC_* status code into <status> if not null. Null is returned on error. |
| 195 | * <l> must be a valid listener with a valid frontend. |
| 196 | */ |
| 197 | struct connection *quic_sock_accept_conn(struct listener *l, int *status) |
| 198 | { |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 199 | struct quic_conn *qc; |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 200 | struct li_per_thread *lthr = &l->per_thr[tid]; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 201 | |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 202 | qc = MT_LIST_POP(<hr->quic_accept.conns, struct quic_conn *, accept_list); |
| 203 | if (!qc) |
| 204 | goto done; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 205 | |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 206 | if (!new_quic_cli_conn(qc, l, &qc->peer_addr)) |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 207 | goto err; |
| 208 | |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 209 | done: |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 210 | *status = CO_AC_DONE; |
Frédéric Lécaille | 026a792 | 2020-11-23 15:46:36 +0100 | [diff] [blame] | 211 | return qc ? qc->conn : NULL; |
| 212 | |
| 213 | err: |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 214 | /* in case of error reinsert the element to process it later. */ |
| 215 | MT_LIST_INSERT(<hr->quic_accept.conns, &qc->accept_list); |
| 216 | |
| 217 | *status = CO_AC_PAUSE; |
| 218 | return NULL; |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 219 | } |
| 220 | |
Frédéric Lécaille | 6492e66 | 2022-05-17 17:23:16 +0200 | [diff] [blame] | 221 | /* Retrieve the DCID from the datagram found in <buf> and deliver it to the |
| 222 | * correct datagram handler. |
| 223 | * Return 1 if a correct datagram could be found, 0 if not. |
| 224 | */ |
| 225 | static int quic_lstnr_dgram_dispatch(unsigned char *buf, size_t len, void *owner, |
| 226 | struct sockaddr_storage *saddr, |
| 227 | struct quic_dgram *new_dgram, struct list *dgrams) |
| 228 | { |
| 229 | struct quic_dgram *dgram; |
| 230 | unsigned char *dcid; |
| 231 | size_t dcid_len; |
| 232 | int cid_tid; |
| 233 | |
| 234 | if (!len || !quic_get_dgram_dcid(buf, buf + len, &dcid, &dcid_len)) |
| 235 | goto err; |
| 236 | |
| 237 | dgram = new_dgram ? new_dgram : pool_alloc(pool_head_quic_dgram); |
| 238 | if (!dgram) |
| 239 | goto err; |
| 240 | |
| 241 | cid_tid = quic_get_cid_tid(dcid); |
| 242 | |
| 243 | /* All the members must be initialized! */ |
| 244 | dgram->owner = owner; |
| 245 | dgram->buf = buf; |
| 246 | dgram->len = len; |
| 247 | dgram->dcid = dcid; |
| 248 | dgram->dcid_len = dcid_len; |
| 249 | dgram->saddr = *saddr; |
| 250 | dgram->qc = NULL; |
| 251 | LIST_APPEND(dgrams, &dgram->list); |
| 252 | MT_LIST_APPEND(&quic_dghdlrs[cid_tid].dgrams, &dgram->mt_list); |
| 253 | |
| 254 | tasklet_wakeup(quic_dghdlrs[cid_tid].task); |
| 255 | |
| 256 | return 1; |
| 257 | |
| 258 | err: |
| 259 | return 0; |
| 260 | } |
| 261 | |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 262 | /* Function called on a read event from a listening socket. It tries |
| 263 | * to handle as many connections as possible. |
| 264 | */ |
| 265 | void quic_sock_fd_iocb(int fd) |
| 266 | { |
| 267 | ssize_t ret; |
Frédéric Lécaille | 324ecda | 2021-11-02 10:14:44 +0100 | [diff] [blame] | 268 | struct rxbuf *rxbuf; |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 269 | struct buffer *buf; |
| 270 | struct listener *l = objt_listener(fdtab[fd].owner); |
Frédéric Lécaille | c4becf5 | 2021-11-08 11:23:17 +0100 | [diff] [blame] | 271 | struct quic_transport_params *params; |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 272 | /* Source address */ |
| 273 | struct sockaddr_storage saddr = {0}; |
Frédéric Lécaille | 320744b | 2022-01-27 12:19:28 +0100 | [diff] [blame] | 274 | size_t max_sz, cspace; |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 275 | socklen_t saddrlen; |
Frédéric Lécaille | 2bed1f1 | 2022-06-23 21:05:05 +0200 | [diff] [blame] | 276 | struct quic_dgram *new_dgram; |
Frédéric Lécaille | f6f7520 | 2022-02-02 09:44:22 +0100 | [diff] [blame] | 277 | unsigned char *dgram_buf; |
Frédéric Lécaille | 1b0707f | 2022-06-30 11:28:56 +0200 | [diff] [blame] | 278 | int max_dgrams; |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 279 | |
Tim Duesterhus | 1655424 | 2021-09-15 13:58:49 +0200 | [diff] [blame] | 280 | BUG_ON(!l); |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 281 | |
Frédéric Lécaille | 19ef636 | 2022-06-23 18:00:37 +0200 | [diff] [blame] | 282 | new_dgram = NULL; |
Frédéric Lécaille | c4becf5 | 2021-11-08 11:23:17 +0100 | [diff] [blame] | 283 | if (!l) |
| 284 | return; |
| 285 | |
Willy Tarreau | f509065 | 2021-04-06 17:23:40 +0200 | [diff] [blame] | 286 | if (!(fdtab[fd].state & FD_POLL_IN) || !fd_recv_ready(fd)) |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 287 | return; |
| 288 | |
Frédéric Lécaille | 324ecda | 2021-11-02 10:14:44 +0100 | [diff] [blame] | 289 | rxbuf = MT_LIST_POP(&l->rx.rxbuf_list, typeof(rxbuf), mt_list); |
Amaury Denoyelle | ee72a43 | 2021-11-19 15:49:29 +0100 | [diff] [blame] | 290 | if (!rxbuf) |
Frédéric Lécaille | c4becf5 | 2021-11-08 11:23:17 +0100 | [diff] [blame] | 291 | goto out; |
Frédéric Lécaille | 37ae505 | 2022-01-27 11:31:50 +0100 | [diff] [blame] | 292 | |
Amaury Denoyelle | ee72a43 | 2021-11-19 15:49:29 +0100 | [diff] [blame] | 293 | buf = &rxbuf->buf; |
Frédéric Lécaille | c4becf5 | 2021-11-08 11:23:17 +0100 | [diff] [blame] | 294 | |
Frédéric Lécaille | 1b0707f | 2022-06-30 11:28:56 +0200 | [diff] [blame] | 295 | max_dgrams = global.tune.maxpollevents; |
| 296 | start: |
Frédéric Lécaille | 2bed1f1 | 2022-06-23 21:05:05 +0200 | [diff] [blame] | 297 | /* Try to reuse an existing dgram. Note that there is alway at |
| 298 | * least one datagram to pick, except the first time we enter |
| 299 | * this function for this <rxbuf> buffer. |
| 300 | */ |
| 301 | if (!LIST_ISEMPTY(&rxbuf->dgrams)) { |
| 302 | struct quic_dgram *dg = |
| 303 | LIST_ELEM(rxbuf->dgrams.n, struct quic_dgram *, list); |
Frédéric Lécaille | 37ae505 | 2022-01-27 11:31:50 +0100 | [diff] [blame] | 304 | |
Frédéric Lécaille | 2bed1f1 | 2022-06-23 21:05:05 +0200 | [diff] [blame] | 305 | if (!dg->buf) { |
| 306 | LIST_DELETE(&dg->list); |
| 307 | b_del(buf, dg->len); |
| 308 | new_dgram = dg; |
| 309 | } |
Frédéric Lécaille | 37ae505 | 2022-01-27 11:31:50 +0100 | [diff] [blame] | 310 | } |
| 311 | |
Frédéric Lécaille | c4becf5 | 2021-11-08 11:23:17 +0100 | [diff] [blame] | 312 | params = &l->bind_conf->quic_params; |
Frédéric Lécaille | 324ecda | 2021-11-02 10:14:44 +0100 | [diff] [blame] | 313 | max_sz = params->max_udp_payload_size; |
Frédéric Lécaille | 320744b | 2022-01-27 12:19:28 +0100 | [diff] [blame] | 314 | cspace = b_contig_space(buf); |
| 315 | if (cspace < max_sz) { |
Frédéric Lécaille | 1712b1d | 2022-01-28 13:10:24 +0100 | [diff] [blame] | 316 | struct quic_dgram *dgram; |
| 317 | |
Frédéric Lécaille | 0c53568 | 2022-06-23 17:47:10 +0200 | [diff] [blame] | 318 | /* Do no mark <buf> as full, and do not try to consume it |
| 319 | * if the contiguous remmaining space is not at the end |
| 320 | */ |
| 321 | if (b_tail(buf) + cspace < b_wrap(buf)) |
| 322 | goto out; |
| 323 | |
Frédéric Lécaille | 1712b1d | 2022-01-28 13:10:24 +0100 | [diff] [blame] | 324 | /* Allocate a fake datagram, without data to locate |
| 325 | * the end of the RX buffer (required during purging). |
| 326 | */ |
| 327 | dgram = pool_zalloc(pool_head_quic_dgram); |
| 328 | if (!dgram) |
| 329 | goto out; |
| 330 | |
| 331 | dgram->len = cspace; |
| 332 | LIST_APPEND(&rxbuf->dgrams, &dgram->list); |
Frédéric Lécaille | 0c53568 | 2022-06-23 17:47:10 +0200 | [diff] [blame] | 333 | |
Frédéric Lécaille | 320744b | 2022-01-27 12:19:28 +0100 | [diff] [blame] | 334 | /* Consume the remaining space */ |
| 335 | b_add(buf, cspace); |
Frédéric Lécaille | 324ecda | 2021-11-02 10:14:44 +0100 | [diff] [blame] | 336 | if (b_contig_space(buf) < max_sz) |
| 337 | goto out; |
| 338 | } |
| 339 | |
Frédéric Lécaille | f6f7520 | 2022-02-02 09:44:22 +0100 | [diff] [blame] | 340 | dgram_buf = (unsigned char *)b_tail(buf); |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 341 | saddrlen = sizeof saddr; |
| 342 | do { |
Frédéric Lécaille | f6f7520 | 2022-02-02 09:44:22 +0100 | [diff] [blame] | 343 | ret = recvfrom(fd, dgram_buf, max_sz, 0, |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 344 | (struct sockaddr *)&saddr, &saddrlen); |
Willy Tarreau | acef5e2 | 2022-04-25 20:32:15 +0200 | [diff] [blame] | 345 | if (ret < 0 && (errno == EAGAIN || errno == EWOULDBLOCK)) { |
Frédéric Lécaille | 439c464 | 2022-02-02 14:33:10 +0100 | [diff] [blame] | 346 | fd_cant_recv(fd); |
Frédéric Lécaille | 324ecda | 2021-11-02 10:14:44 +0100 | [diff] [blame] | 347 | goto out; |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 348 | } |
Frédéric Lécaille | 439c464 | 2022-02-02 14:33:10 +0100 | [diff] [blame] | 349 | } while (ret < 0 && errno == EINTR); |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 350 | |
Frédéric Lécaille | 324ecda | 2021-11-02 10:14:44 +0100 | [diff] [blame] | 351 | b_add(buf, ret); |
Frédéric Lécaille | f6f7520 | 2022-02-02 09:44:22 +0100 | [diff] [blame] | 352 | if (!quic_lstnr_dgram_dispatch(dgram_buf, ret, l, &saddr, |
| 353 | new_dgram, &rxbuf->dgrams)) { |
Frédéric Lécaille | 37ae505 | 2022-01-27 11:31:50 +0100 | [diff] [blame] | 354 | /* If wrong, consume this datagram */ |
| 355 | b_del(buf, ret); |
| 356 | } |
Frédéric Lécaille | 19ef636 | 2022-06-23 18:00:37 +0200 | [diff] [blame] | 357 | new_dgram = NULL; |
Frédéric Lécaille | 1b0707f | 2022-06-30 11:28:56 +0200 | [diff] [blame] | 358 | if (--max_dgrams > 0) |
| 359 | goto start; |
Frédéric Lécaille | 324ecda | 2021-11-02 10:14:44 +0100 | [diff] [blame] | 360 | out: |
Frédéric Lécaille | 19ef636 | 2022-06-23 18:00:37 +0200 | [diff] [blame] | 361 | pool_free(pool_head_quic_dgram, new_dgram); |
Frédéric Lécaille | 324ecda | 2021-11-02 10:14:44 +0100 | [diff] [blame] | 362 | MT_LIST_APPEND(&l->rx.rxbuf_list, &rxbuf->mt_list); |
Frédéric Lécaille | 70da889 | 2020-11-06 15:49:49 +0100 | [diff] [blame] | 363 | } |
Amaury Denoyelle | 2ce99fe | 2022-01-19 15:46:11 +0100 | [diff] [blame] | 364 | |
Amaury Denoyelle | 58a7704 | 2022-02-09 15:43:07 +0100 | [diff] [blame] | 365 | /* TODO standardize this function for a generic UDP sendto wrapper. This can be |
| 366 | * done by removing the <qc> arg and replace it with address/port. |
| 367 | */ |
| 368 | size_t qc_snd_buf(struct quic_conn *qc, const struct buffer *buf, size_t count, |
| 369 | int flags) |
| 370 | { |
| 371 | ssize_t ret; |
| 372 | size_t try, done; |
| 373 | int send_flag; |
| 374 | |
| 375 | done = 0; |
| 376 | /* send the largest possible block. For this we perform only one call |
| 377 | * to send() unless the buffer wraps and we exactly fill the first hunk, |
| 378 | * in which case we accept to do it once again. |
| 379 | */ |
| 380 | while (count) { |
| 381 | try = b_contig_data(buf, done); |
| 382 | if (try > count) |
| 383 | try = count; |
| 384 | |
| 385 | send_flag = MSG_DONTWAIT | MSG_NOSIGNAL; |
| 386 | if (try < count || flags & CO_SFL_MSG_MORE) |
| 387 | send_flag |= MSG_MORE; |
| 388 | |
| 389 | ret = sendto(qc->li->rx.fd, b_peek(buf, done), try, send_flag, |
| 390 | (struct sockaddr *)&qc->peer_addr, get_addr_len(&qc->peer_addr)); |
| 391 | if (ret > 0) { |
| 392 | /* TODO remove partial sending support for UDP */ |
| 393 | count -= ret; |
| 394 | done += ret; |
| 395 | |
| 396 | if (ret < try) |
| 397 | break; |
| 398 | } |
Amaury Denoyelle | ad5df38 | 2022-05-18 18:26:13 +0200 | [diff] [blame] | 399 | else if (errno == EINTR) { |
| 400 | /* try again */ |
| 401 | continue; |
| 402 | } |
Amaury Denoyelle | 3dde0d8 | 2022-05-19 11:53:56 +0200 | [diff] [blame] | 403 | else if (ret == 0 || errno == EAGAIN || errno == EWOULDBLOCK || errno == ENOTCONN || errno == EINPROGRESS || errno == EBADF) { |
Amaury Denoyelle | 58a7704 | 2022-02-09 15:43:07 +0100 | [diff] [blame] | 404 | /* TODO must be handle properly. It is justified for UDP ? */ |
Frédéric Lécaille | 8726d63 | 2022-05-03 10:32:21 +0200 | [diff] [blame] | 405 | qc->sendto_err++; |
Amaury Denoyelle | 8fa6666 | 2022-05-18 18:14:12 +0200 | [diff] [blame] | 406 | break; |
Amaury Denoyelle | 58a7704 | 2022-02-09 15:43:07 +0100 | [diff] [blame] | 407 | } |
Amaury Denoyelle | ad5df38 | 2022-05-18 18:26:13 +0200 | [diff] [blame] | 408 | else if (errno) { |
| 409 | /* TODO unlisted errno : handle it explicitely. */ |
| 410 | ABORT_NOW(); |
Amaury Denoyelle | 58a7704 | 2022-02-09 15:43:07 +0100 | [diff] [blame] | 411 | } |
| 412 | } |
| 413 | |
| 414 | if (done > 0) { |
| 415 | /* we count the total bytes sent, and the send rate for 32-byte |
| 416 | * blocks. The reason for the latter is that freq_ctr are |
| 417 | * limited to 4GB and that it's not enough per second. |
| 418 | */ |
| 419 | _HA_ATOMIC_ADD(&global.out_bytes, done); |
| 420 | update_freq_ctr(&global.out_32bps, (done + 16) / 32); |
| 421 | } |
| 422 | return done; |
| 423 | } |
| 424 | |
Amaury Denoyelle | 2ce99fe | 2022-01-19 15:46:11 +0100 | [diff] [blame] | 425 | |
| 426 | /*********************** QUIC accept queue management ***********************/ |
| 427 | /* per-thread accept queues */ |
| 428 | struct quic_accept_queue *quic_accept_queues; |
| 429 | |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 430 | /* Install <qc> on the queue ready to be accepted. The queue task is then woken |
Frédéric Lécaille | 91f083a | 2022-01-28 21:43:48 +0100 | [diff] [blame] | 431 | * up. If <qc> accept is already scheduled or done, nothing is done. |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 432 | */ |
| 433 | void quic_accept_push_qc(struct quic_conn *qc) |
| 434 | { |
| 435 | struct quic_accept_queue *queue = &quic_accept_queues[qc->tid]; |
| 436 | struct li_per_thread *lthr = &qc->li->per_thr[qc->tid]; |
| 437 | |
Frédéric Lécaille | 91f083a | 2022-01-28 21:43:48 +0100 | [diff] [blame] | 438 | /* early return if accept is already in progress/done for this |
| 439 | * connection |
| 440 | */ |
Frédéric Lécaille | fc79006 | 2022-03-28 17:10:31 +0200 | [diff] [blame] | 441 | if (qc->flags & QUIC_FL_CONN_ACCEPT_REGISTERED) |
Frédéric Lécaille | 91f083a | 2022-01-28 21:43:48 +0100 | [diff] [blame] | 442 | return; |
| 443 | |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 444 | BUG_ON(MT_LIST_INLIST(&qc->accept_list)); |
| 445 | |
Frédéric Lécaille | fc79006 | 2022-03-28 17:10:31 +0200 | [diff] [blame] | 446 | qc->flags |= QUIC_FL_CONN_ACCEPT_REGISTERED; |
Amaury Denoyelle | cfa2d56 | 2022-01-19 16:01:05 +0100 | [diff] [blame] | 447 | /* 1. insert the listener in the accept queue |
| 448 | * |
| 449 | * Use TRY_APPEND as there is a possible race even with INLIST if |
| 450 | * multiple threads try to add the same listener instance from several |
| 451 | * quic_conn. |
| 452 | */ |
| 453 | if (!MT_LIST_INLIST(&(lthr->quic_accept.list))) |
| 454 | MT_LIST_TRY_APPEND(&queue->listeners, &(lthr->quic_accept.list)); |
| 455 | |
| 456 | /* 2. insert the quic_conn in the listener per-thread queue. */ |
| 457 | MT_LIST_APPEND(<hr->quic_accept.conns, &qc->accept_list); |
| 458 | |
| 459 | /* 3. wake up the queue tasklet */ |
| 460 | tasklet_wakeup(quic_accept_queues[qc->tid].tasklet); |
| 461 | } |
| 462 | |
Amaury Denoyelle | 2ce99fe | 2022-01-19 15:46:11 +0100 | [diff] [blame] | 463 | /* Tasklet handler to accept QUIC connections. Call listener_accept on every |
| 464 | * listener instances registered in the accept queue. |
| 465 | */ |
| 466 | static struct task *quic_accept_run(struct task *t, void *ctx, unsigned int i) |
| 467 | { |
| 468 | struct li_per_thread *lthr; |
| 469 | struct mt_list *elt1, elt2; |
| 470 | struct quic_accept_queue *queue = &quic_accept_queues[tid]; |
| 471 | |
| 472 | mt_list_for_each_entry_safe(lthr, &queue->listeners, quic_accept.list, elt1, elt2) { |
| 473 | listener_accept(lthr->li); |
| 474 | MT_LIST_DELETE_SAFE(elt1); |
| 475 | } |
| 476 | |
| 477 | return NULL; |
| 478 | } |
| 479 | |
| 480 | static int quic_alloc_accept_queues(void) |
| 481 | { |
| 482 | int i; |
| 483 | |
Tim Duesterhus | 9fb57e8 | 2022-06-01 21:58:37 +0200 | [diff] [blame] | 484 | quic_accept_queues = calloc(global.nbthread, |
| 485 | sizeof(*quic_accept_queues)); |
Amaury Denoyelle | 2ce99fe | 2022-01-19 15:46:11 +0100 | [diff] [blame] | 486 | if (!quic_accept_queues) { |
| 487 | ha_alert("Failed to allocate the quic accept queues.\n"); |
| 488 | return 0; |
| 489 | } |
| 490 | |
| 491 | for (i = 0; i < global.nbthread; ++i) { |
| 492 | struct tasklet *task; |
| 493 | if (!(task = tasklet_new())) { |
| 494 | ha_alert("Failed to allocate the quic accept queue on thread %d.\n", i); |
| 495 | return 0; |
| 496 | } |
| 497 | |
| 498 | tasklet_set_tid(task, i); |
| 499 | task->process = quic_accept_run; |
| 500 | quic_accept_queues[i].tasklet = task; |
| 501 | |
| 502 | MT_LIST_INIT(&quic_accept_queues[i].listeners); |
| 503 | } |
| 504 | |
| 505 | return 1; |
| 506 | } |
| 507 | REGISTER_POST_CHECK(quic_alloc_accept_queues); |
| 508 | |
| 509 | static int quic_deallocate_accept_queues(void) |
| 510 | { |
| 511 | int i; |
| 512 | |
| 513 | if (quic_accept_queues) { |
| 514 | for (i = 0; i < global.nbthread; ++i) |
| 515 | tasklet_free(quic_accept_queues[i].tasklet); |
| 516 | free(quic_accept_queues); |
| 517 | } |
| 518 | |
| 519 | return 1; |
| 520 | } |
| 521 | REGISTER_POST_DEINIT(quic_deallocate_accept_queues); |