Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 1 | /* |
| 2 | * AF_INET/AF_INET6 SOCK_STREAM protocol layer (tcp) |
| 3 | * |
Willy Tarreau | 1a68794 | 2010-05-23 22:40:30 +0200 | [diff] [blame] | 4 | * Copyright 2000-2010 Willy Tarreau <w@1wt.eu> |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 5 | * |
| 6 | * This program is free software; you can redistribute it and/or |
| 7 | * modify it under the terms of the GNU General Public License |
| 8 | * as published by the Free Software Foundation; either version |
| 9 | * 2 of the License, or (at your option) any later version. |
| 10 | * |
| 11 | */ |
| 12 | |
| 13 | #include <ctype.h> |
| 14 | #include <errno.h> |
| 15 | #include <fcntl.h> |
| 16 | #include <stdio.h> |
| 17 | #include <stdlib.h> |
| 18 | #include <string.h> |
| 19 | #include <time.h> |
| 20 | |
| 21 | #include <sys/param.h> |
| 22 | #include <sys/socket.h> |
| 23 | #include <sys/stat.h> |
| 24 | #include <sys/types.h> |
| 25 | #include <sys/un.h> |
| 26 | |
Dmitry Sivachenko | caf5898 | 2009-08-24 15:11:06 +0400 | [diff] [blame] | 27 | #include <netinet/tcp.h> |
| 28 | |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 29 | #include <common/cfgparse.h> |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 30 | #include <common/compat.h> |
| 31 | #include <common/config.h> |
| 32 | #include <common/debug.h> |
| 33 | #include <common/errors.h> |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 34 | #include <common/mini-clist.h> |
| 35 | #include <common/standard.h> |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 36 | |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 37 | #include <types/global.h> |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 38 | #include <types/server.h> |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 39 | |
| 40 | #include <proto/acl.h> |
Willy Tarreau | 9fcb984 | 2012-04-20 14:45:49 +0200 | [diff] [blame] | 41 | #include <proto/arg.h> |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 42 | #include <proto/buffers.h> |
Willy Tarreau | 03fa5df | 2010-05-24 21:02:37 +0200 | [diff] [blame] | 43 | #include <proto/frontend.h> |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 44 | #include <proto/log.h> |
| 45 | #include <proto/port_range.h> |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 46 | #include <proto/protocols.h> |
| 47 | #include <proto/proto_tcp.h> |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 48 | #include <proto/proxy.h> |
Willy Tarreau | cd3b094 | 2012-04-27 21:52:18 +0200 | [diff] [blame] | 49 | #include <proto/sample.h> |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 50 | #include <proto/session.h> |
Willy Tarreau | c63190d | 2012-05-11 14:23:52 +0200 | [diff] [blame] | 51 | #include <proto/sock_raw.h> |
Willy Tarreau | a975b8f | 2010-06-05 19:13:27 +0200 | [diff] [blame] | 52 | #include <proto/stick_table.h> |
Willy Tarreau | 59b9479 | 2012-05-11 16:16:40 +0200 | [diff] [blame] | 53 | #include <proto/stream_interface.h> |
Willy Tarreau | a975b8f | 2010-06-05 19:13:27 +0200 | [diff] [blame] | 54 | #include <proto/task.h> |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 55 | #include <proto/buffers.h> |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 56 | |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 57 | #ifdef CONFIG_HAP_CTTPROXY |
| 58 | #include <import/ip_tproxy.h> |
| 59 | #endif |
| 60 | |
Emeric Brun | cf20bf1 | 2010-10-22 16:06:11 +0200 | [diff] [blame] | 61 | static int tcp_bind_listeners(struct protocol *proto, char *errmsg, int errlen); |
| 62 | static int tcp_bind_listener(struct listener *listener, char *errmsg, int errlen); |
Willy Tarreau | eeda90e | 2012-05-11 19:53:32 +0200 | [diff] [blame] | 63 | static int tcp_connect_write(int fd); |
| 64 | static int tcp_connect_read(int fd); |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 65 | |
| 66 | /* Note: must not be declared <const> as its list will be overwritten */ |
| 67 | static struct protocol proto_tcpv4 = { |
| 68 | .name = "tcpv4", |
| 69 | .sock_domain = AF_INET, |
| 70 | .sock_type = SOCK_STREAM, |
| 71 | .sock_prot = IPPROTO_TCP, |
| 72 | .sock_family = AF_INET, |
| 73 | .sock_addrlen = sizeof(struct sockaddr_in), |
| 74 | .l3_addrlen = 32/8, |
Willy Tarreau | bbebbbf | 2012-05-07 21:22:09 +0200 | [diff] [blame] | 75 | .accept = &listener_accept, |
Willy Tarreau | 26d8c59 | 2012-05-07 18:12:14 +0200 | [diff] [blame] | 76 | .connect = tcp_connect_server, |
Emeric Brun | cf20bf1 | 2010-10-22 16:06:11 +0200 | [diff] [blame] | 77 | .bind = tcp_bind_listener, |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 78 | .bind_all = tcp_bind_listeners, |
| 79 | .unbind_all = unbind_all_listeners, |
| 80 | .enable_all = enable_all_listeners, |
Willy Tarreau | 59b9479 | 2012-05-11 16:16:40 +0200 | [diff] [blame] | 81 | .get_src = tcp_get_src, |
| 82 | .get_dst = tcp_get_dst, |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 83 | .listeners = LIST_HEAD_INIT(proto_tcpv4.listeners), |
| 84 | .nb_listeners = 0, |
| 85 | }; |
| 86 | |
| 87 | /* Note: must not be declared <const> as its list will be overwritten */ |
| 88 | static struct protocol proto_tcpv6 = { |
| 89 | .name = "tcpv6", |
| 90 | .sock_domain = AF_INET6, |
| 91 | .sock_type = SOCK_STREAM, |
| 92 | .sock_prot = IPPROTO_TCP, |
| 93 | .sock_family = AF_INET6, |
| 94 | .sock_addrlen = sizeof(struct sockaddr_in6), |
| 95 | .l3_addrlen = 128/8, |
Willy Tarreau | bbebbbf | 2012-05-07 21:22:09 +0200 | [diff] [blame] | 96 | .accept = &listener_accept, |
Willy Tarreau | 26d8c59 | 2012-05-07 18:12:14 +0200 | [diff] [blame] | 97 | .connect = tcp_connect_server, |
Emeric Brun | cf20bf1 | 2010-10-22 16:06:11 +0200 | [diff] [blame] | 98 | .bind = tcp_bind_listener, |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 99 | .bind_all = tcp_bind_listeners, |
| 100 | .unbind_all = unbind_all_listeners, |
| 101 | .enable_all = enable_all_listeners, |
Willy Tarreau | 59b9479 | 2012-05-11 16:16:40 +0200 | [diff] [blame] | 102 | .get_src = tcp_get_src, |
| 103 | .get_dst = tcp_get_dst, |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 104 | .listeners = LIST_HEAD_INIT(proto_tcpv6.listeners), |
| 105 | .nb_listeners = 0, |
| 106 | }; |
| 107 | |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 108 | |
David du Colombier | 6f5ccb1 | 2011-03-10 22:26:24 +0100 | [diff] [blame] | 109 | /* Binds ipv4/ipv6 address <local> to socket <fd>, unless <flags> is set, in which |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 110 | * case we try to bind <remote>. <flags> is a 2-bit field consisting of : |
| 111 | * - 0 : ignore remote address (may even be a NULL pointer) |
| 112 | * - 1 : use provided address |
| 113 | * - 2 : use provided port |
| 114 | * - 3 : use both |
| 115 | * |
| 116 | * The function supports multiple foreign binding methods : |
| 117 | * - linux_tproxy: we directly bind to the foreign address |
| 118 | * - cttproxy: we bind to a local address then nat. |
| 119 | * The second one can be used as a fallback for the first one. |
| 120 | * This function returns 0 when everything's OK, 1 if it could not bind, to the |
| 121 | * local address, 2 if it could not bind to the foreign address. |
| 122 | */ |
David du Colombier | 6f5ccb1 | 2011-03-10 22:26:24 +0100 | [diff] [blame] | 123 | int tcp_bind_socket(int fd, int flags, struct sockaddr_storage *local, struct sockaddr_storage *remote) |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 124 | { |
David du Colombier | 6f5ccb1 | 2011-03-10 22:26:24 +0100 | [diff] [blame] | 125 | struct sockaddr_storage bind_addr; |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 126 | int foreign_ok = 0; |
| 127 | int ret; |
| 128 | |
| 129 | #ifdef CONFIG_HAP_LINUX_TPROXY |
| 130 | static int ip_transp_working = 1; |
| 131 | if (flags && ip_transp_working) { |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 132 | if (setsockopt(fd, SOL_IP, IP_TRANSPARENT, &one, sizeof(one)) == 0 |
| 133 | || setsockopt(fd, SOL_IP, IP_FREEBIND, &one, sizeof(one)) == 0) |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 134 | foreign_ok = 1; |
| 135 | else |
| 136 | ip_transp_working = 0; |
| 137 | } |
| 138 | #endif |
| 139 | if (flags) { |
| 140 | memset(&bind_addr, 0, sizeof(bind_addr)); |
Willy Tarreau | 96dd079 | 2011-04-19 07:20:57 +0200 | [diff] [blame] | 141 | bind_addr.ss_family = remote->ss_family; |
David du Colombier | 6f5ccb1 | 2011-03-10 22:26:24 +0100 | [diff] [blame] | 142 | switch (remote->ss_family) { |
| 143 | case AF_INET: |
| 144 | if (flags & 1) |
| 145 | ((struct sockaddr_in *)&bind_addr)->sin_addr = ((struct sockaddr_in *)remote)->sin_addr; |
| 146 | if (flags & 2) |
| 147 | ((struct sockaddr_in *)&bind_addr)->sin_port = ((struct sockaddr_in *)remote)->sin_port; |
| 148 | break; |
| 149 | case AF_INET6: |
| 150 | if (flags & 1) |
| 151 | ((struct sockaddr_in6 *)&bind_addr)->sin6_addr = ((struct sockaddr_in6 *)remote)->sin6_addr; |
| 152 | if (flags & 2) |
| 153 | ((struct sockaddr_in6 *)&bind_addr)->sin6_port = ((struct sockaddr_in6 *)remote)->sin6_port; |
| 154 | break; |
Willy Tarreau | 5dc1e98 | 2011-12-16 21:25:11 +0100 | [diff] [blame] | 155 | default: |
| 156 | /* we don't want to try to bind to an unknown address family */ |
| 157 | foreign_ok = 0; |
David du Colombier | 6f5ccb1 | 2011-03-10 22:26:24 +0100 | [diff] [blame] | 158 | } |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 159 | } |
| 160 | |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 161 | setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &one, sizeof(one)); |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 162 | if (foreign_ok) { |
Willy Tarreau | 1b4b7ce | 2011-04-05 16:56:50 +0200 | [diff] [blame] | 163 | ret = bind(fd, (struct sockaddr *)&bind_addr, get_addr_len(&bind_addr)); |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 164 | if (ret < 0) |
| 165 | return 2; |
| 166 | } |
| 167 | else { |
Willy Tarreau | 1b4b7ce | 2011-04-05 16:56:50 +0200 | [diff] [blame] | 168 | ret = bind(fd, (struct sockaddr *)local, get_addr_len(local)); |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 169 | if (ret < 0) |
| 170 | return 1; |
| 171 | } |
| 172 | |
| 173 | if (!flags) |
| 174 | return 0; |
| 175 | |
| 176 | #ifdef CONFIG_HAP_CTTPROXY |
Willy Tarreau | 6f831b4 | 2011-03-20 14:03:54 +0100 | [diff] [blame] | 177 | if (!foreign_ok && remote->ss_family == AF_INET) { |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 178 | struct in_tproxy itp1, itp2; |
| 179 | memset(&itp1, 0, sizeof(itp1)); |
| 180 | |
| 181 | itp1.op = TPROXY_ASSIGN; |
Willy Tarreau | 6f831b4 | 2011-03-20 14:03:54 +0100 | [diff] [blame] | 182 | itp1.v.addr.faddr = ((struct sockaddr_in *)&bind_addr)->sin_addr; |
| 183 | itp1.v.addr.fport = ((struct sockaddr_in *)&bind_addr)->sin_port; |
Willy Tarreau | e8c66af | 2008-01-13 18:40:14 +0100 | [diff] [blame] | 184 | |
| 185 | /* set connect flag on socket */ |
| 186 | itp2.op = TPROXY_FLAGS; |
| 187 | itp2.v.flags = ITP_CONNECT | ITP_ONCE; |
| 188 | |
| 189 | if (setsockopt(fd, SOL_IP, IP_TPROXY, &itp1, sizeof(itp1)) != -1 && |
| 190 | setsockopt(fd, SOL_IP, IP_TPROXY, &itp2, sizeof(itp2)) != -1) { |
| 191 | foreign_ok = 1; |
| 192 | } |
| 193 | } |
| 194 | #endif |
| 195 | if (!foreign_ok) |
| 196 | /* we could not bind to a foreign address */ |
| 197 | return 2; |
| 198 | |
| 199 | return 0; |
| 200 | } |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 201 | |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 202 | |
| 203 | /* |
Willy Tarreau | ac82540 | 2011-03-04 22:04:29 +0100 | [diff] [blame] | 204 | * This function initiates a connection to the target assigned to this session |
Willy Tarreau | 6471afb | 2011-09-23 10:54:59 +0200 | [diff] [blame] | 205 | * (si->{target,addr.to}). A source address may be pointed to by si->addr.from |
Willy Tarreau | ac82540 | 2011-03-04 22:04:29 +0100 | [diff] [blame] | 206 | * in case of transparent proxying. Normal source bind addresses are still |
| 207 | * determined locally (due to the possible need of a source port). |
| 208 | * si->target may point either to a valid server or to a backend, depending |
| 209 | * on si->target.type. Only TARG_TYPE_PROXY and TARG_TYPE_SERVER are supported. |
Willy Tarreau | b1d6774 | 2010-03-29 19:36:59 +0200 | [diff] [blame] | 210 | * |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 211 | * It can return one of : |
| 212 | * - SN_ERR_NONE if everything's OK |
| 213 | * - SN_ERR_SRVTO if there are no more servers |
| 214 | * - SN_ERR_SRVCL if the connection was refused by the server |
| 215 | * - SN_ERR_PRXCOND if the connection has been limited by the proxy (maxconn) |
| 216 | * - SN_ERR_RESOURCE if a system resource is lacking (eg: fd limits, ports, ...) |
| 217 | * - SN_ERR_INTERNAL for any other purely internal errors |
| 218 | * Additionnally, in the case of SN_ERR_RESOURCE, an emergency log will be emitted. |
| 219 | */ |
Willy Tarreau | f153686 | 2011-03-03 18:27:32 +0100 | [diff] [blame] | 220 | |
David du Colombier | 6f5ccb1 | 2011-03-10 22:26:24 +0100 | [diff] [blame] | 221 | int tcp_connect_server(struct stream_interface *si) |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 222 | { |
| 223 | int fd; |
Willy Tarreau | ac82540 | 2011-03-04 22:04:29 +0100 | [diff] [blame] | 224 | struct server *srv; |
| 225 | struct proxy *be; |
| 226 | |
| 227 | switch (si->target.type) { |
| 228 | case TARG_TYPE_PROXY: |
| 229 | be = si->target.ptr.p; |
| 230 | srv = NULL; |
| 231 | break; |
| 232 | case TARG_TYPE_SERVER: |
| 233 | srv = si->target.ptr.s; |
| 234 | be = srv->proxy; |
| 235 | break; |
| 236 | default: |
| 237 | return SN_ERR_INTERNAL; |
| 238 | } |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 239 | |
Willy Tarreau | 6471afb | 2011-09-23 10:54:59 +0200 | [diff] [blame] | 240 | if ((fd = si->fd = socket(si->addr.to.ss_family, SOCK_STREAM, IPPROTO_TCP)) == -1) { |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 241 | qfprintf(stderr, "Cannot get a server socket.\n"); |
| 242 | |
| 243 | if (errno == ENFILE) |
| 244 | send_log(be, LOG_EMERG, |
| 245 | "Proxy %s reached system FD limit at %d. Please check system tunables.\n", |
| 246 | be->id, maxfd); |
| 247 | else if (errno == EMFILE) |
| 248 | send_log(be, LOG_EMERG, |
| 249 | "Proxy %s reached process FD limit at %d. Please check 'ulimit-n' and restart.\n", |
| 250 | be->id, maxfd); |
| 251 | else if (errno == ENOBUFS || errno == ENOMEM) |
| 252 | send_log(be, LOG_EMERG, |
| 253 | "Proxy %s reached system memory limit at %d sockets. Please check system tunables.\n", |
| 254 | be->id, maxfd); |
| 255 | /* this is a resource error */ |
| 256 | return SN_ERR_RESOURCE; |
| 257 | } |
| 258 | |
| 259 | if (fd >= global.maxsock) { |
| 260 | /* do not log anything there, it's a normal condition when this option |
| 261 | * is used to serialize connections to a server ! |
| 262 | */ |
| 263 | Alert("socket(): not enough free sockets. Raise -n argument. Giving up.\n"); |
| 264 | close(fd); |
| 265 | return SN_ERR_PRXCOND; /* it is a configuration limit */ |
| 266 | } |
| 267 | |
| 268 | if ((fcntl(fd, F_SETFL, O_NONBLOCK)==-1) || |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 269 | (setsockopt(fd, IPPROTO_TCP, TCP_NODELAY, &one, sizeof(one)) == -1)) { |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 270 | qfprintf(stderr,"Cannot set client socket to non blocking mode.\n"); |
| 271 | close(fd); |
| 272 | return SN_ERR_INTERNAL; |
| 273 | } |
| 274 | |
| 275 | if (be->options & PR_O_TCP_SRV_KA) |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 276 | setsockopt(fd, SOL_SOCKET, SO_KEEPALIVE, &one, sizeof(one)); |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 277 | |
| 278 | if (be->options & PR_O_TCP_NOLING) |
Willy Tarreau | f6f8225 | 2011-11-30 18:02:24 +0100 | [diff] [blame] | 279 | si->flags |= SI_FL_NOLINGER; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 280 | |
| 281 | /* allow specific binding : |
| 282 | * - server-specific at first |
| 283 | * - proxy-specific next |
| 284 | */ |
| 285 | if (srv != NULL && srv->state & SRV_BIND_SRC) { |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 286 | int ret, flags = 0; |
| 287 | |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 288 | switch (srv->state & SRV_TPROXY_MASK) { |
| 289 | case SRV_TPROXY_ADDR: |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 290 | case SRV_TPROXY_CLI: |
Willy Tarreau | b1d6774 | 2010-03-29 19:36:59 +0200 | [diff] [blame] | 291 | flags = 3; |
| 292 | break; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 293 | case SRV_TPROXY_CIP: |
Willy Tarreau | 090466c | 2009-09-07 11:51:47 +0200 | [diff] [blame] | 294 | case SRV_TPROXY_DYN: |
Willy Tarreau | b1d6774 | 2010-03-29 19:36:59 +0200 | [diff] [blame] | 295 | flags = 1; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 296 | break; |
| 297 | } |
Willy Tarreau | b1d6774 | 2010-03-29 19:36:59 +0200 | [diff] [blame] | 298 | |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 299 | #ifdef SO_BINDTODEVICE |
| 300 | /* Note: this might fail if not CAP_NET_RAW */ |
| 301 | if (srv->iface_name) |
| 302 | setsockopt(fd, SOL_SOCKET, SO_BINDTODEVICE, srv->iface_name, srv->iface_len + 1); |
| 303 | #endif |
| 304 | |
| 305 | if (srv->sport_range) { |
| 306 | int attempts = 10; /* should be more than enough to find a spare port */ |
David du Colombier | 6f5ccb1 | 2011-03-10 22:26:24 +0100 | [diff] [blame] | 307 | struct sockaddr_storage src; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 308 | |
| 309 | ret = 1; |
| 310 | src = srv->source_addr; |
| 311 | |
| 312 | do { |
| 313 | /* note: in case of retry, we may have to release a previously |
| 314 | * allocated port, hence this loop's construct. |
| 315 | */ |
Willy Tarreau | 8d5d77e | 2009-10-18 07:25:52 +0200 | [diff] [blame] | 316 | port_range_release_port(fdinfo[fd].port_range, fdinfo[fd].local_port); |
| 317 | fdinfo[fd].port_range = NULL; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 318 | |
| 319 | if (!attempts) |
| 320 | break; |
| 321 | attempts--; |
| 322 | |
Willy Tarreau | 8d5d77e | 2009-10-18 07:25:52 +0200 | [diff] [blame] | 323 | fdinfo[fd].local_port = port_range_alloc_port(srv->sport_range); |
| 324 | if (!fdinfo[fd].local_port) |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 325 | break; |
| 326 | |
Willy Tarreau | 8d5d77e | 2009-10-18 07:25:52 +0200 | [diff] [blame] | 327 | fdinfo[fd].port_range = srv->sport_range; |
Willy Tarreau | 86ad42c | 2011-08-27 12:29:07 +0200 | [diff] [blame] | 328 | set_host_port(&src, fdinfo[fd].local_port); |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 329 | |
Willy Tarreau | 6471afb | 2011-09-23 10:54:59 +0200 | [diff] [blame] | 330 | ret = tcp_bind_socket(fd, flags, &src, &si->addr.from); |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 331 | } while (ret != 0); /* binding NOK */ |
| 332 | } |
| 333 | else { |
Willy Tarreau | 6471afb | 2011-09-23 10:54:59 +0200 | [diff] [blame] | 334 | ret = tcp_bind_socket(fd, flags, &srv->source_addr, &si->addr.from); |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 335 | } |
| 336 | |
| 337 | if (ret) { |
Willy Tarreau | 8d5d77e | 2009-10-18 07:25:52 +0200 | [diff] [blame] | 338 | port_range_release_port(fdinfo[fd].port_range, fdinfo[fd].local_port); |
| 339 | fdinfo[fd].port_range = NULL; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 340 | close(fd); |
| 341 | |
| 342 | if (ret == 1) { |
| 343 | Alert("Cannot bind to source address before connect() for server %s/%s. Aborting.\n", |
| 344 | be->id, srv->id); |
| 345 | send_log(be, LOG_EMERG, |
| 346 | "Cannot bind to source address before connect() for server %s/%s.\n", |
| 347 | be->id, srv->id); |
| 348 | } else { |
| 349 | Alert("Cannot bind to tproxy source address before connect() for server %s/%s. Aborting.\n", |
| 350 | be->id, srv->id); |
| 351 | send_log(be, LOG_EMERG, |
| 352 | "Cannot bind to tproxy source address before connect() for server %s/%s.\n", |
| 353 | be->id, srv->id); |
| 354 | } |
| 355 | return SN_ERR_RESOURCE; |
| 356 | } |
| 357 | } |
| 358 | else if (be->options & PR_O_BIND_SRC) { |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 359 | int ret, flags = 0; |
| 360 | |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 361 | switch (be->options & PR_O_TPXY_MASK) { |
| 362 | case PR_O_TPXY_ADDR: |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 363 | case PR_O_TPXY_CLI: |
Willy Tarreau | b1d6774 | 2010-03-29 19:36:59 +0200 | [diff] [blame] | 364 | flags = 3; |
| 365 | break; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 366 | case PR_O_TPXY_CIP: |
Willy Tarreau | 090466c | 2009-09-07 11:51:47 +0200 | [diff] [blame] | 367 | case PR_O_TPXY_DYN: |
Willy Tarreau | b1d6774 | 2010-03-29 19:36:59 +0200 | [diff] [blame] | 368 | flags = 1; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 369 | break; |
| 370 | } |
Willy Tarreau | b1d6774 | 2010-03-29 19:36:59 +0200 | [diff] [blame] | 371 | |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 372 | #ifdef SO_BINDTODEVICE |
| 373 | /* Note: this might fail if not CAP_NET_RAW */ |
| 374 | if (be->iface_name) |
| 375 | setsockopt(fd, SOL_SOCKET, SO_BINDTODEVICE, be->iface_name, be->iface_len + 1); |
| 376 | #endif |
Willy Tarreau | 6471afb | 2011-09-23 10:54:59 +0200 | [diff] [blame] | 377 | ret = tcp_bind_socket(fd, flags, &be->source_addr, &si->addr.from); |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 378 | if (ret) { |
| 379 | close(fd); |
| 380 | if (ret == 1) { |
| 381 | Alert("Cannot bind to source address before connect() for proxy %s. Aborting.\n", |
| 382 | be->id); |
| 383 | send_log(be, LOG_EMERG, |
| 384 | "Cannot bind to source address before connect() for proxy %s.\n", |
| 385 | be->id); |
| 386 | } else { |
| 387 | Alert("Cannot bind to tproxy source address before connect() for proxy %s. Aborting.\n", |
| 388 | be->id); |
| 389 | send_log(be, LOG_EMERG, |
| 390 | "Cannot bind to tproxy source address before connect() for proxy %s.\n", |
| 391 | be->id); |
| 392 | } |
| 393 | return SN_ERR_RESOURCE; |
| 394 | } |
| 395 | } |
| 396 | |
Dmitry Sivachenko | caf5898 | 2009-08-24 15:11:06 +0400 | [diff] [blame] | 397 | #if defined(TCP_QUICKACK) |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 398 | /* disabling tcp quick ack now allows the first request to leave the |
| 399 | * machine with the first ACK. We only do this if there are pending |
| 400 | * data in the buffer. |
| 401 | */ |
Willy Tarreau | 2e046c6 | 2012-03-01 16:08:30 +0100 | [diff] [blame] | 402 | if ((be->options2 & PR_O2_SMARTCON) && si->ob->o) |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 403 | setsockopt(fd, IPPROTO_TCP, TCP_QUICKACK, &zero, sizeof(zero)); |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 404 | #endif |
| 405 | |
Willy Tarreau | e803de2 | 2010-01-21 17:43:04 +0100 | [diff] [blame] | 406 | if (global.tune.server_sndbuf) |
| 407 | setsockopt(fd, SOL_SOCKET, SO_SNDBUF, &global.tune.server_sndbuf, sizeof(global.tune.server_sndbuf)); |
| 408 | |
| 409 | if (global.tune.server_rcvbuf) |
| 410 | setsockopt(fd, SOL_SOCKET, SO_RCVBUF, &global.tune.server_rcvbuf, sizeof(global.tune.server_rcvbuf)); |
| 411 | |
Willy Tarreau | 9b061e3 | 2012-04-07 18:03:52 +0200 | [diff] [blame] | 412 | si->flags &= ~SI_FL_FROM_SET; |
Willy Tarreau | 6471afb | 2011-09-23 10:54:59 +0200 | [diff] [blame] | 413 | if ((connect(fd, (struct sockaddr *)&si->addr.to, get_addr_len(&si->addr.to)) == -1) && |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 414 | (errno != EINPROGRESS) && (errno != EALREADY) && (errno != EISCONN)) { |
| 415 | |
| 416 | if (errno == EAGAIN || errno == EADDRINUSE) { |
| 417 | char *msg; |
| 418 | if (errno == EAGAIN) /* no free ports left, try again later */ |
| 419 | msg = "no free ports"; |
| 420 | else |
| 421 | msg = "local address already in use"; |
| 422 | |
| 423 | qfprintf(stderr,"Cannot connect: %s.\n",msg); |
Willy Tarreau | 8d5d77e | 2009-10-18 07:25:52 +0200 | [diff] [blame] | 424 | port_range_release_port(fdinfo[fd].port_range, fdinfo[fd].local_port); |
| 425 | fdinfo[fd].port_range = NULL; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 426 | close(fd); |
| 427 | send_log(be, LOG_EMERG, |
| 428 | "Connect() failed for server %s/%s: %s.\n", |
| 429 | be->id, srv->id, msg); |
| 430 | return SN_ERR_RESOURCE; |
| 431 | } else if (errno == ETIMEDOUT) { |
| 432 | //qfprintf(stderr,"Connect(): ETIMEDOUT"); |
Willy Tarreau | 8d5d77e | 2009-10-18 07:25:52 +0200 | [diff] [blame] | 433 | port_range_release_port(fdinfo[fd].port_range, fdinfo[fd].local_port); |
| 434 | fdinfo[fd].port_range = NULL; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 435 | close(fd); |
| 436 | return SN_ERR_SRVTO; |
| 437 | } else { |
| 438 | // (errno == ECONNREFUSED || errno == ENETUNREACH || errno == EACCES || errno == EPERM) |
| 439 | //qfprintf(stderr,"Connect(): %d", errno); |
Willy Tarreau | 8d5d77e | 2009-10-18 07:25:52 +0200 | [diff] [blame] | 440 | port_range_release_port(fdinfo[fd].port_range, fdinfo[fd].local_port); |
| 441 | fdinfo[fd].port_range = NULL; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 442 | close(fd); |
| 443 | return SN_ERR_SRVCL; |
| 444 | } |
| 445 | } |
| 446 | |
William Lallemand | b7ff6a3 | 2012-03-02 14:35:21 +0100 | [diff] [blame] | 447 | /* needs src ip/port for logging */ |
Willy Tarreau | 9b061e3 | 2012-04-07 18:03:52 +0200 | [diff] [blame] | 448 | if (si->flags & SI_FL_SRC_ADDR) |
Willy Tarreau | 59b9479 | 2012-05-11 16:16:40 +0200 | [diff] [blame] | 449 | si_get_from_addr(si); |
William Lallemand | b7ff6a3 | 2012-03-02 14:35:21 +0100 | [diff] [blame] | 450 | |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 451 | fdtab[fd].owner = si; |
| 452 | fdtab[fd].state = FD_STCONN; /* connection in progress */ |
| 453 | fdtab[fd].flags = FD_FL_TCP | FD_FL_TCP_NODELAY; |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 454 | |
Willy Tarreau | be0688c | 2012-05-18 15:15:26 +0200 | [diff] [blame] | 455 | /* If we have nothing to send, we want to confirm that the TCP |
| 456 | * connection is established before doing so, so we use our own write |
| 457 | * callback then switch to the sock layer. |
Willy Tarreau | eeda90e | 2012-05-11 19:53:32 +0200 | [diff] [blame] | 458 | */ |
Willy Tarreau | be0688c | 2012-05-18 15:15:26 +0200 | [diff] [blame] | 459 | if ((si->ob->flags & BF_OUT_EMPTY) && !si->send_proxy_ofs) { |
Willy Tarreau | eeda90e | 2012-05-11 19:53:32 +0200 | [diff] [blame] | 460 | fdtab[fd].cb[DIR_RD].f = tcp_connect_read; |
| 461 | fdtab[fd].cb[DIR_WR].f = tcp_connect_write; |
| 462 | } |
| 463 | else { |
| 464 | fdtab[fd].cb[DIR_RD].f = si->sock.read; |
| 465 | fdtab[fd].cb[DIR_WR].f = si->sock.write; |
| 466 | } |
| 467 | |
Willy Tarreau | 6471afb | 2011-09-23 10:54:59 +0200 | [diff] [blame] | 468 | fdinfo[fd].peeraddr = (struct sockaddr *)&si->addr.to; |
| 469 | fdinfo[fd].peerlen = get_addr_len(&si->addr.to); |
Willy Tarreau | 9650f37 | 2009-08-16 14:02:45 +0200 | [diff] [blame] | 470 | |
| 471 | fd_insert(fd); |
| 472 | EV_FD_SET(fd, DIR_WR); /* for connect status */ |
| 473 | |
| 474 | si->state = SI_ST_CON; |
| 475 | si->flags |= SI_FL_CAP_SPLTCP; /* TCP supports splicing */ |
| 476 | si->exp = tick_add_ifset(now_ms, be->timeout.connect); |
| 477 | |
| 478 | return SN_ERR_NONE; /* connection is OK */ |
| 479 | } |
| 480 | |
| 481 | |
/*
 * Stores the source address of the connection on socket <fd> into <sa>, which
 * is <salen> bytes large. <dir> tells which side we are : 0 for a listener,
 * non-zero for an initiator. For an initiator the source is our own end of
 * the socket, for a listener it is the peer. Returns 0 on success, -1 on error.
 */
int tcp_get_src(int fd, struct sockaddr *sa, socklen_t salen, int dir)
{
	return dir ? getsockname(fd, sa, &salen)
	           : getpeername(fd, sa, &salen);
}
| 495 | |
| 496 | |
/*
 * Stores the destination address of the connection on socket <fd> into <sa>,
 * which is <salen> bytes large. <dir> tells which side we are : 0 for a
 * listener, non-zero for an initiator. For an initiator the destination is
 * the peer. For a listener it is our own end of the socket, except that when
 * built with TPROXY and SO_ORIGINAL_DST, the original (pre-translation)
 * destination is tried first. Returns 0 on success, -1 on error.
 */
int tcp_get_dst(int fd, struct sockaddr *sa, socklen_t salen, int dir)
{
	if (dir != 0)
		return getpeername(fd, sa, &salen);

#if defined(TPROXY) && defined(SO_ORIGINAL_DST)
	/* prefer the original destination when it can be retrieved */
	if (getsockopt(fd, SOL_IP, SO_ORIGINAL_DST, sa, &salen) == 0)
		return 0;
#endif

	return getsockname(fd, sa, &salen);
}
| 515 | |
Willy Tarreau | eeda90e | 2012-05-11 19:53:32 +0200 | [diff] [blame] | 516 | /* This is the callback which is set when a connection establishment is pending |
| 517 | * and we have nothing to send, or if we have an init function we want to call |
| 518 | * once the connection is established. |
| 519 | */ |
| 520 | static int tcp_connect_write(int fd) |
| 521 | { |
| 522 | struct stream_interface *si = fdtab[fd].owner; |
| 523 | struct buffer *b = si->ob; |
| 524 | int retval = 1; |
| 525 | |
| 526 | if (fdtab[fd].state == FD_STERROR) |
| 527 | goto out_error; |
| 528 | |
| 529 | if (fdtab[fd].state != FD_STCONN) { |
| 530 | retval = 0; |
| 531 | goto out_ignore; /* strange we were called while ready */ |
| 532 | } |
| 533 | |
| 534 | /* we might have been called just after an asynchronous shutw */ |
| 535 | if (b->flags & BF_SHUTW) |
| 536 | goto out_wakeup; |
| 537 | |
| 538 | /* We have no data to send to check the connection, and |
| 539 | * getsockopt() will not inform us whether the connection |
| 540 | * is still pending. So we'll reuse connect() to check the |
| 541 | * state of the socket. This has the advantage of giving us |
| 542 | * the following info : |
| 543 | * - error |
| 544 | * - connecting (EALREADY, EINPROGRESS) |
| 545 | * - connected (EISCONN, 0) |
| 546 | */ |
| 547 | if ((connect(fd, fdinfo[fd].peeraddr, fdinfo[fd].peerlen) == 0)) |
| 548 | errno = 0; |
| 549 | |
| 550 | if (errno == EALREADY || errno == EINPROGRESS) { |
| 551 | retval = 0; |
| 552 | goto out_ignore; |
| 553 | } |
| 554 | |
| 555 | if (errno && errno != EISCONN) |
| 556 | goto out_error; |
| 557 | |
| 558 | /* OK we just need to indicate that we got a connection |
| 559 | * and that we wrote nothing. |
| 560 | */ |
| 561 | b->flags |= BF_WRITE_NULL; |
| 562 | |
| 563 | /* The FD is ready now, we can hand the handlers to the socket layer */ |
| 564 | fdtab[fd].cb[DIR_RD].f = si->sock.read; |
| 565 | fdtab[fd].cb[DIR_WR].f = si->sock.write; |
| 566 | fdtab[fd].state = FD_STREADY; |
| 567 | |
| 568 | out_wakeup: |
| 569 | task_wakeup(si->owner, TASK_WOKEN_IO); |
| 570 | |
| 571 | out_ignore: |
| 572 | fdtab[fd].ev &= ~FD_POLL_OUT; |
| 573 | return retval; |
| 574 | |
| 575 | out_error: |
| 576 | /* Write error on the file descriptor. We mark the FD as STERROR so |
| 577 | * that we don't use it anymore. The error is reported to the stream |
| 578 | * interface which will take proper action. We must not perturbate the |
| 579 | * buffer because the stream interface wants to ensure transparent |
| 580 | * connection retries. |
| 581 | */ |
| 582 | |
| 583 | fdtab[fd].state = FD_STERROR; |
| 584 | fdtab[fd].ev &= ~FD_POLL_STICKY; |
| 585 | EV_FD_REM(fd); |
| 586 | si->flags |= SI_FL_ERR; |
| 587 | goto out_wakeup; |
| 588 | } |
| 589 | |
| 590 | |
| 591 | /* might be used on connect error */ |
| 592 | static int tcp_connect_read(int fd) |
| 593 | { |
| 594 | struct stream_interface *si = fdtab[fd].owner; |
| 595 | int retval; |
| 596 | |
| 597 | retval = 1; |
| 598 | |
| 599 | if (fdtab[fd].state == FD_STERROR) |
| 600 | goto out_error; |
| 601 | |
| 602 | if (fdtab[fd].state != FD_STCONN) { |
| 603 | retval = 0; |
| 604 | goto out_ignore; /* strange we were called while ready */ |
| 605 | } |
| 606 | |
| 607 | /* stop here if we reached the end of data */ |
| 608 | if ((fdtab[fd].ev & (FD_POLL_IN|FD_POLL_HUP)) == FD_POLL_HUP) |
| 609 | goto out_error; |
| 610 | |
| 611 | out_wakeup: |
| 612 | task_wakeup(si->owner, TASK_WOKEN_IO); |
| 613 | out_ignore: |
| 614 | fdtab[fd].ev &= ~FD_POLL_IN; |
| 615 | return retval; |
| 616 | |
| 617 | out_error: |
| 618 | /* Read error on the file descriptor. We mark the FD as STERROR so |
| 619 | * that we don't use it anymore. The error is reported to the stream |
| 620 | * interface which will take proper action. We must not perturbate the |
| 621 | * buffer because the stream interface wants to ensure transparent |
| 622 | * connection retries. |
| 623 | */ |
| 624 | |
| 625 | fdtab[fd].state = FD_STERROR; |
| 626 | fdtab[fd].ev &= ~FD_POLL_STICKY; |
| 627 | EV_FD_REM(fd); |
| 628 | si->flags |= SI_FL_ERR; |
| 629 | goto out_wakeup; |
| 630 | } |
| 631 | |
Willy Tarreau | 59b9479 | 2012-05-11 16:16:40 +0200 | [diff] [blame] | 632 | |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 633 | /* This function tries to bind a TCPv4/v6 listener. It may return a warning or |
| 634 | * an error message in <err> if the message is at most <errlen> bytes long |
| 635 | * (including '\0'). The return value is composed from ERR_ABORT, ERR_WARN, |
| 636 | * ERR_ALERT, ERR_RETRYABLE and ERR_FATAL. ERR_NONE indicates that everything |
| 637 | * was alright and that no message was returned. ERR_RETRYABLE means that an |
| 638 | * error occurred but that it may vanish after a retry (eg: port in use), and |
Aman Gupta | d94991d | 2012-04-06 17:39:26 -0700 | [diff] [blame] | 639 | * ERR_FATAL indicates a non-fixable error. ERR_WARN and ERR_ALERT do not alter |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 640 | * the meaning of the error, but just indicate that a message is present which |
| 641 | * should be displayed with the respective level. Last, ERR_ABORT indicates |
| 642 | * that it's pointless to try to start other listeners. No error message is |
| 643 | * returned if errlen is NULL. |
| 644 | */ |
| 645 | int tcp_bind_listener(struct listener *listener, char *errmsg, int errlen) |
| 646 | { |
| 647 | __label__ tcp_return, tcp_close_return; |
| 648 | int fd, err; |
| 649 | const char *msg = NULL; |
| 650 | |
| 651 | /* ensure we never return garbage */ |
| 652 | if (errmsg && errlen) |
| 653 | *errmsg = 0; |
| 654 | |
| 655 | if (listener->state != LI_ASSIGNED) |
| 656 | return ERR_NONE; /* already bound */ |
| 657 | |
| 658 | err = ERR_NONE; |
| 659 | |
| 660 | if ((fd = socket(listener->addr.ss_family, SOCK_STREAM, IPPROTO_TCP)) == -1) { |
| 661 | err |= ERR_RETRYABLE | ERR_ALERT; |
| 662 | msg = "cannot create listening socket"; |
| 663 | goto tcp_return; |
| 664 | } |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 665 | |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 666 | if (fd >= global.maxsock) { |
| 667 | err |= ERR_FATAL | ERR_ABORT | ERR_ALERT; |
| 668 | msg = "not enough free sockets (raise '-n' parameter)"; |
| 669 | goto tcp_close_return; |
| 670 | } |
| 671 | |
Willy Tarreau | fb14edc | 2009-06-14 15:24:37 +0200 | [diff] [blame] | 672 | if (fcntl(fd, F_SETFL, O_NONBLOCK) == -1) { |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 673 | err |= ERR_FATAL | ERR_ALERT; |
| 674 | msg = "cannot make socket non-blocking"; |
| 675 | goto tcp_close_return; |
| 676 | } |
| 677 | |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 678 | if (setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &one, sizeof(one)) == -1) { |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 679 | /* not fatal but should be reported */ |
| 680 | msg = "cannot do so_reuseaddr"; |
| 681 | err |= ERR_ALERT; |
| 682 | } |
| 683 | |
| 684 | if (listener->options & LI_O_NOLINGER) |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 685 | setsockopt(fd, SOL_SOCKET, SO_LINGER, &nolinger, sizeof(struct linger)); |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 686 | |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 687 | #ifdef SO_REUSEPORT |
| 688 | /* OpenBSD supports this. As it's present in old libc versions of Linux, |
| 689 | * it might return an error that we will silently ignore. |
| 690 | */ |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 691 | setsockopt(fd, SOL_SOCKET, SO_REUSEPORT, &one, sizeof(one)); |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 692 | #endif |
Willy Tarreau | b1e52e8 | 2008-01-13 14:49:51 +0100 | [diff] [blame] | 693 | #ifdef CONFIG_HAP_LINUX_TPROXY |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 694 | if ((listener->options & LI_O_FOREIGN) |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 695 | && (setsockopt(fd, SOL_IP, IP_TRANSPARENT, &one, sizeof(one)) == -1) |
| 696 | && (setsockopt(fd, SOL_IP, IP_FREEBIND, &one, sizeof(one)) == -1)) { |
Willy Tarreau | b1e52e8 | 2008-01-13 14:49:51 +0100 | [diff] [blame] | 697 | msg = "cannot make listening socket transparent"; |
| 698 | err |= ERR_ALERT; |
| 699 | } |
| 700 | #endif |
Willy Tarreau | 5e6e204 | 2009-02-04 17:19:29 +0100 | [diff] [blame] | 701 | #ifdef SO_BINDTODEVICE |
| 702 | /* Note: this might fail if not CAP_NET_RAW */ |
| 703 | if (listener->interface) { |
| 704 | if (setsockopt(fd, SOL_SOCKET, SO_BINDTODEVICE, |
Willy Tarreau | 604e830 | 2009-03-06 00:48:23 +0100 | [diff] [blame] | 705 | listener->interface, strlen(listener->interface) + 1) == -1) { |
Willy Tarreau | 5e6e204 | 2009-02-04 17:19:29 +0100 | [diff] [blame] | 706 | msg = "cannot bind listener to device"; |
| 707 | err |= ERR_WARN; |
| 708 | } |
| 709 | } |
| 710 | #endif |
Dmitry Sivachenko | caf5898 | 2009-08-24 15:11:06 +0400 | [diff] [blame] | 711 | #if defined(TCP_MAXSEG) |
Willy Tarreau | 48a7e72 | 2010-12-24 15:26:39 +0100 | [diff] [blame] | 712 | if (listener->maxseg > 0) { |
Dmitry Sivachenko | caf5898 | 2009-08-24 15:11:06 +0400 | [diff] [blame] | 713 | if (setsockopt(fd, IPPROTO_TCP, TCP_MAXSEG, |
Willy Tarreau | be1b918 | 2009-06-14 18:48:19 +0200 | [diff] [blame] | 714 | &listener->maxseg, sizeof(listener->maxseg)) == -1) { |
| 715 | msg = "cannot set MSS"; |
| 716 | err |= ERR_WARN; |
| 717 | } |
| 718 | } |
| 719 | #endif |
Willy Tarreau | cb6cd43 | 2009-10-13 07:34:14 +0200 | [diff] [blame] | 720 | #if defined(TCP_DEFER_ACCEPT) |
| 721 | if (listener->options & LI_O_DEF_ACCEPT) { |
| 722 | /* defer accept by up to one second */ |
| 723 | int accept_delay = 1; |
| 724 | if (setsockopt(fd, IPPROTO_TCP, TCP_DEFER_ACCEPT, &accept_delay, sizeof(accept_delay)) == -1) { |
| 725 | msg = "cannot enable DEFER_ACCEPT"; |
| 726 | err |= ERR_WARN; |
| 727 | } |
| 728 | } |
| 729 | #endif |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 730 | if (bind(fd, (struct sockaddr *)&listener->addr, listener->proto->sock_addrlen) == -1) { |
| 731 | err |= ERR_RETRYABLE | ERR_ALERT; |
| 732 | msg = "cannot bind socket"; |
| 733 | goto tcp_close_return; |
| 734 | } |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 735 | |
Willy Tarreau | c73ce2b | 2008-01-06 10:55:10 +0100 | [diff] [blame] | 736 | if (listen(fd, listener->backlog ? listener->backlog : listener->maxconn) == -1) { |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 737 | err |= ERR_RETRYABLE | ERR_ALERT; |
| 738 | msg = "cannot listen to socket"; |
| 739 | goto tcp_close_return; |
| 740 | } |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 741 | |
Dmitry Sivachenko | caf5898 | 2009-08-24 15:11:06 +0400 | [diff] [blame] | 742 | #if defined(TCP_QUICKACK) |
Willy Tarreau | 9ea05a7 | 2009-06-14 12:07:01 +0200 | [diff] [blame] | 743 | if (listener->options & LI_O_NOQUICKACK) |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 744 | setsockopt(fd, IPPROTO_TCP, TCP_QUICKACK, &zero, sizeof(zero)); |
Willy Tarreau | 9ea05a7 | 2009-06-14 12:07:01 +0200 | [diff] [blame] | 745 | #endif |
| 746 | |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 747 | /* the socket is ready */ |
| 748 | listener->fd = fd; |
| 749 | listener->state = LI_LISTEN; |
| 750 | |
Willy Tarreau | eabf313 | 2008-08-29 23:36:51 +0200 | [diff] [blame] | 751 | fdtab[fd].owner = listener; /* reference the listener instead of a task */ |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 752 | fdtab[fd].state = FD_STLISTEN; |
Willy Tarreau | eb47268 | 2010-05-28 18:46:57 +0200 | [diff] [blame] | 753 | fdtab[fd].flags = FD_FL_TCP | ((listener->options & LI_O_NOLINGER) ? FD_FL_TCP_NOLING : 0); |
| 754 | fdtab[fd].cb[DIR_RD].f = listener->proto->accept; |
| 755 | fdtab[fd].cb[DIR_WR].f = NULL; /* never called */ |
Willy Tarreau | 5d707e1 | 2009-06-28 11:09:07 +0200 | [diff] [blame] | 756 | |
Willy Tarreau | 8d5d77e | 2009-10-18 07:25:52 +0200 | [diff] [blame] | 757 | fdinfo[fd].peeraddr = NULL; |
| 758 | fdinfo[fd].peerlen = 0; |
Willy Tarreau | eb47268 | 2010-05-28 18:46:57 +0200 | [diff] [blame] | 759 | fd_insert(fd); |
| 760 | |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 761 | tcp_return: |
Cyril Bonté | 43ba1b3 | 2010-11-01 19:26:01 +0100 | [diff] [blame] | 762 | if (msg && errlen) { |
| 763 | char pn[INET6_ADDRSTRLEN]; |
| 764 | |
Willy Tarreau | 631f01c | 2011-09-05 00:36:48 +0200 | [diff] [blame] | 765 | addr_to_str(&listener->addr, pn, sizeof(pn)); |
| 766 | snprintf(errmsg, errlen, "%s [%s:%d]", msg, pn, get_host_port(&listener->addr)); |
Cyril Bonté | 43ba1b3 | 2010-11-01 19:26:01 +0100 | [diff] [blame] | 767 | } |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 768 | return err; |
| 769 | |
| 770 | tcp_close_return: |
| 771 | close(fd); |
| 772 | goto tcp_return; |
| 773 | } |
| 774 | |
| 775 | /* This function creates all TCP sockets bound to the protocol entry <proto>. |
| 776 | * It is intended to be used as the protocol's bind_all() function. |
| 777 | * The sockets will be registered but not added to any fd_set, in order not to |
| 778 | * loose them across the fork(). A call to enable_all_listeners() is needed |
| 779 | * to complete initialization. The return value is composed from ERR_*. |
| 780 | */ |
Emeric Brun | cf20bf1 | 2010-10-22 16:06:11 +0200 | [diff] [blame] | 781 | static int tcp_bind_listeners(struct protocol *proto, char *errmsg, int errlen) |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 782 | { |
| 783 | struct listener *listener; |
| 784 | int err = ERR_NONE; |
| 785 | |
| 786 | list_for_each_entry(listener, &proto->listeners, proto_list) { |
Emeric Brun | cf20bf1 | 2010-10-22 16:06:11 +0200 | [diff] [blame] | 787 | err |= tcp_bind_listener(listener, errmsg, errlen); |
| 788 | if (err & ERR_ABORT) |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 789 | break; |
| 790 | } |
| 791 | |
| 792 | return err; |
| 793 | } |
| 794 | |
| 795 | /* Add listener to the list of tcpv4 listeners. The listener's state |
| 796 | * is automatically updated from LI_INIT to LI_ASSIGNED. The number of |
| 797 | * listeners is updated. This is the function to use to add a new listener. |
| 798 | */ |
| 799 | void tcpv4_add_listener(struct listener *listener) |
| 800 | { |
| 801 | if (listener->state != LI_INIT) |
| 802 | return; |
| 803 | listener->state = LI_ASSIGNED; |
| 804 | listener->proto = &proto_tcpv4; |
| 805 | LIST_ADDQ(&proto_tcpv4.listeners, &listener->proto_list); |
| 806 | proto_tcpv4.nb_listeners++; |
| 807 | } |
| 808 | |
| 809 | /* Add listener to the list of tcpv4 listeners. The listener's state |
| 810 | * is automatically updated from LI_INIT to LI_ASSIGNED. The number of |
| 811 | * listeners is updated. This is the function to use to add a new listener. |
| 812 | */ |
| 813 | void tcpv6_add_listener(struct listener *listener) |
| 814 | { |
| 815 | if (listener->state != LI_INIT) |
| 816 | return; |
| 817 | listener->state = LI_ASSIGNED; |
| 818 | listener->proto = &proto_tcpv6; |
| 819 | LIST_ADDQ(&proto_tcpv6.listeners, &listener->proto_list); |
| 820 | proto_tcpv6.nb_listeners++; |
| 821 | } |
| 822 | |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 823 | /* This function performs the TCP request analysis on the current request. It |
| 824 | * returns 1 if the processing can continue on next analysers, or zero if it |
| 825 | * needs more data, encounters an error, or wants to immediately abort the |
Willy Tarreau | fb35620 | 2010-08-03 14:02:05 +0200 | [diff] [blame] | 826 | * request. It relies on buffers flags, and updates s->req->analysers. The |
| 827 | * function may be called for frontend rules and backend rules. It only relies |
| 828 | * on the backend pointer so this works for both cases. |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 829 | */ |
Willy Tarreau | 3a81629 | 2009-07-07 10:55:49 +0200 | [diff] [blame] | 830 | int tcp_inspect_request(struct session *s, struct buffer *req, int an_bit) |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 831 | { |
| 832 | struct tcp_rule *rule; |
Willy Tarreau | d1f9652 | 2010-08-03 19:34:32 +0200 | [diff] [blame] | 833 | struct stksess *ts; |
| 834 | struct stktable *t; |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 835 | int partial; |
| 836 | |
Willy Tarreau | 02d6cfc | 2012-03-01 18:19:58 +0100 | [diff] [blame] | 837 | DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bh=%d analysers=%02x\n", |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 838 | now_ms, __FUNCTION__, |
| 839 | s, |
| 840 | req, |
| 841 | req->rex, req->wex, |
| 842 | req->flags, |
Willy Tarreau | 02d6cfc | 2012-03-01 18:19:58 +0100 | [diff] [blame] | 843 | req->i, |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 844 | req->analysers); |
| 845 | |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 846 | /* We don't know whether we have enough data, so must proceed |
| 847 | * this way : |
| 848 | * - iterate through all rules in their declaration order |
| 849 | * - if one rule returns MISS, it means the inspect delay is |
| 850 | * not over yet, then return immediately, otherwise consider |
| 851 | * it as a non-match. |
| 852 | * - if one rule returns OK, then return OK |
| 853 | * - if one rule returns KO, then return KO |
| 854 | */ |
| 855 | |
Willy Tarreau | b824b00 | 2010-09-29 16:36:16 +0200 | [diff] [blame] | 856 | if (req->flags & (BF_SHUTR|BF_FULL) || !s->be->tcp_req.inspect_delay || tick_is_expired(req->analyse_exp, now_ms)) |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 857 | partial = SMP_OPT_FINAL; |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 858 | else |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 859 | partial = 0; |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 860 | |
Willy Tarreau | fb35620 | 2010-08-03 14:02:05 +0200 | [diff] [blame] | 861 | list_for_each_entry(rule, &s->be->tcp_req.inspect_rules, list) { |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 862 | int ret = ACL_PAT_PASS; |
| 863 | |
| 864 | if (rule->cond) { |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 865 | ret = acl_exec_cond(rule->cond, s->be, s, &s->txn, SMP_OPT_DIR_REQ | partial); |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 866 | if (ret == ACL_PAT_MISS) { |
Willy Tarreau | 520d95e | 2009-09-19 21:04:57 +0200 | [diff] [blame] | 867 | buffer_dont_connect(req); |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 868 | /* just set the request timeout once at the beginning of the request */ |
Willy Tarreau | fb35620 | 2010-08-03 14:02:05 +0200 | [diff] [blame] | 869 | if (!tick_isset(req->analyse_exp) && s->be->tcp_req.inspect_delay) |
| 870 | req->analyse_exp = tick_add_ifset(now_ms, s->be->tcp_req.inspect_delay); |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 871 | return 0; |
| 872 | } |
| 873 | |
| 874 | ret = acl_pass(ret); |
| 875 | if (rule->cond->pol == ACL_COND_UNLESS) |
| 876 | ret = !ret; |
| 877 | } |
| 878 | |
| 879 | if (ret) { |
| 880 | /* we have a matching rule. */ |
| 881 | if (rule->action == TCP_ACT_REJECT) { |
| 882 | buffer_abort(req); |
| 883 | buffer_abort(s->rep); |
| 884 | req->analysers = 0; |
Krzysztof Piotr Oledzki | aeebf9b | 2009-10-04 15:43:17 +0200 | [diff] [blame] | 885 | |
Willy Tarreau | 7d0aaf3 | 2011-03-10 23:25:56 +0100 | [diff] [blame] | 886 | s->be->be_counters.denied_req++; |
| 887 | s->fe->fe_counters.denied_req++; |
Krzysztof Piotr Oledzki | aeebf9b | 2009-10-04 15:43:17 +0200 | [diff] [blame] | 888 | if (s->listener->counters) |
Willy Tarreau | 23968d8 | 2010-05-23 23:50:44 +0200 | [diff] [blame] | 889 | s->listener->counters->denied_req++; |
Krzysztof Piotr Oledzki | aeebf9b | 2009-10-04 15:43:17 +0200 | [diff] [blame] | 890 | |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 891 | if (!(s->flags & SN_ERR_MASK)) |
| 892 | s->flags |= SN_ERR_PRXCOND; |
| 893 | if (!(s->flags & SN_FINST_MASK)) |
| 894 | s->flags |= SN_FINST_R; |
| 895 | return 0; |
| 896 | } |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 897 | else if (rule->action == TCP_ACT_TRK_SC1) { |
| 898 | if (!s->stkctr1_entry) { |
| 899 | /* only the first valid track-sc1 directive applies. |
Willy Tarreau | d1f9652 | 2010-08-03 19:34:32 +0200 | [diff] [blame] | 900 | * Also, note that right now we can only track SRC so we |
| 901 | * don't check how to get the key, but later we may need |
| 902 | * to consider rule->act_prm->trk_ctr.type. |
| 903 | */ |
| 904 | t = rule->act_prm.trk_ctr.table.t; |
David du Colombier | 4f92d32 | 2011-03-24 11:09:31 +0100 | [diff] [blame] | 905 | ts = stktable_get_entry(t, tcp_src_to_stktable_key(s)); |
Willy Tarreau | 0a4838c | 2010-08-06 20:11:05 +0200 | [diff] [blame] | 906 | if (ts) { |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 907 | session_track_stkctr1(s, t, ts); |
Willy Tarreau | 0a4838c | 2010-08-06 20:11:05 +0200 | [diff] [blame] | 908 | if (s->fe != s->be) |
| 909 | s->flags |= SN_BE_TRACK_SC1; |
| 910 | } |
Willy Tarreau | d1f9652 | 2010-08-03 19:34:32 +0200 | [diff] [blame] | 911 | } |
| 912 | } |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 913 | else if (rule->action == TCP_ACT_TRK_SC2) { |
| 914 | if (!s->stkctr2_entry) { |
| 915 | /* only the first valid track-sc2 directive applies. |
Willy Tarreau | d1f9652 | 2010-08-03 19:34:32 +0200 | [diff] [blame] | 916 | * Also, note that right now we can only track SRC so we |
| 917 | * don't check how to get the key, but later we may need |
| 918 | * to consider rule->act_prm->trk_ctr.type. |
| 919 | */ |
| 920 | t = rule->act_prm.trk_ctr.table.t; |
David du Colombier | 4f92d32 | 2011-03-24 11:09:31 +0100 | [diff] [blame] | 921 | ts = stktable_get_entry(t, tcp_src_to_stktable_key(s)); |
Willy Tarreau | 0a4838c | 2010-08-06 20:11:05 +0200 | [diff] [blame] | 922 | if (ts) { |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 923 | session_track_stkctr2(s, t, ts); |
Willy Tarreau | 0a4838c | 2010-08-06 20:11:05 +0200 | [diff] [blame] | 924 | if (s->fe != s->be) |
| 925 | s->flags |= SN_BE_TRACK_SC2; |
| 926 | } |
Willy Tarreau | d1f9652 | 2010-08-03 19:34:32 +0200 | [diff] [blame] | 927 | } |
| 928 | } |
| 929 | else { |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 930 | /* otherwise accept */ |
Willy Tarreau | d1f9652 | 2010-08-03 19:34:32 +0200 | [diff] [blame] | 931 | break; |
| 932 | } |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 933 | } |
| 934 | } |
| 935 | |
| 936 | /* if we get there, it means we have no rule which matches, or |
| 937 | * we have an explicit accept, so we apply the default accept. |
| 938 | */ |
Willy Tarreau | 3a81629 | 2009-07-07 10:55:49 +0200 | [diff] [blame] | 939 | req->analysers &= ~an_bit; |
Willy Tarreau | edcf668 | 2008-11-30 23:15:34 +0100 | [diff] [blame] | 940 | req->analyse_exp = TICK_ETERNITY; |
| 941 | return 1; |
| 942 | } |
| 943 | |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 944 | /* This function performs the TCP response analysis on the current response. It |
| 945 | * returns 1 if the processing can continue on next analysers, or zero if it |
| 946 | * needs more data, encounters an error, or wants to immediately abort the |
| 947 | * response. It relies on buffers flags, and updates s->rep->analysers. The |
| 948 | * function may be called for backend rules. |
| 949 | */ |
| 950 | int tcp_inspect_response(struct session *s, struct buffer *rep, int an_bit) |
| 951 | { |
| 952 | struct tcp_rule *rule; |
| 953 | int partial; |
| 954 | |
Willy Tarreau | 02d6cfc | 2012-03-01 18:19:58 +0100 | [diff] [blame] | 955 | DPRINTF(stderr,"[%u] %s: session=%p b=%p, exp(r,w)=%u,%u bf=%08x bh=%d analysers=%02x\n", |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 956 | now_ms, __FUNCTION__, |
| 957 | s, |
| 958 | rep, |
| 959 | rep->rex, rep->wex, |
| 960 | rep->flags, |
Willy Tarreau | 02d6cfc | 2012-03-01 18:19:58 +0100 | [diff] [blame] | 961 | rep->i, |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 962 | rep->analysers); |
| 963 | |
| 964 | /* We don't know whether we have enough data, so must proceed |
| 965 | * this way : |
| 966 | * - iterate through all rules in their declaration order |
| 967 | * - if one rule returns MISS, it means the inspect delay is |
| 968 | * not over yet, then return immediately, otherwise consider |
| 969 | * it as a non-match. |
| 970 | * - if one rule returns OK, then return OK |
| 971 | * - if one rule returns KO, then return KO |
| 972 | */ |
| 973 | |
| 974 | if (rep->flags & BF_SHUTR || tick_is_expired(rep->analyse_exp, now_ms)) |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 975 | partial = SMP_OPT_FINAL; |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 976 | else |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 977 | partial = 0; |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 978 | |
| 979 | list_for_each_entry(rule, &s->be->tcp_rep.inspect_rules, list) { |
| 980 | int ret = ACL_PAT_PASS; |
| 981 | |
| 982 | if (rule->cond) { |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 983 | ret = acl_exec_cond(rule->cond, s->be, s, &s->txn, SMP_OPT_DIR_RES | partial); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 984 | if (ret == ACL_PAT_MISS) { |
| 985 | /* just set the analyser timeout once at the beginning of the response */ |
| 986 | if (!tick_isset(rep->analyse_exp) && s->be->tcp_rep.inspect_delay) |
| 987 | rep->analyse_exp = tick_add_ifset(now_ms, s->be->tcp_rep.inspect_delay); |
| 988 | return 0; |
| 989 | } |
| 990 | |
| 991 | ret = acl_pass(ret); |
| 992 | if (rule->cond->pol == ACL_COND_UNLESS) |
| 993 | ret = !ret; |
| 994 | } |
| 995 | |
| 996 | if (ret) { |
| 997 | /* we have a matching rule. */ |
| 998 | if (rule->action == TCP_ACT_REJECT) { |
| 999 | buffer_abort(rep); |
| 1000 | buffer_abort(s->req); |
| 1001 | rep->analysers = 0; |
| 1002 | |
Willy Tarreau | 7d0aaf3 | 2011-03-10 23:25:56 +0100 | [diff] [blame] | 1003 | s->be->be_counters.denied_resp++; |
| 1004 | s->fe->fe_counters.denied_resp++; |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1005 | if (s->listener->counters) |
| 1006 | s->listener->counters->denied_resp++; |
| 1007 | |
| 1008 | if (!(s->flags & SN_ERR_MASK)) |
| 1009 | s->flags |= SN_ERR_PRXCOND; |
| 1010 | if (!(s->flags & SN_FINST_MASK)) |
| 1011 | s->flags |= SN_FINST_D; |
| 1012 | return 0; |
| 1013 | } |
| 1014 | else { |
| 1015 | /* otherwise accept */ |
| 1016 | break; |
| 1017 | } |
| 1018 | } |
| 1019 | } |
| 1020 | |
| 1021 | /* if we get there, it means we have no rule which matches, or |
| 1022 | * we have an explicit accept, so we apply the default accept. |
| 1023 | */ |
| 1024 | rep->analysers &= ~an_bit; |
| 1025 | rep->analyse_exp = TICK_ETERNITY; |
| 1026 | return 1; |
| 1027 | } |
| 1028 | |
| 1029 | |
Willy Tarreau | a5c0ab2 | 2010-05-31 10:30:33 +0200 | [diff] [blame] | 1030 | /* This function performs the TCP layer4 analysis on the current request. It |
| 1031 | * returns 0 if a reject rule matches, otherwise 1 if either an accept rule |
| 1032 | * matches or if no more rule matches. It can only use rules which don't need |
| 1033 | * any data. |
| 1034 | */ |
| 1035 | int tcp_exec_req_rules(struct session *s) |
| 1036 | { |
| 1037 | struct tcp_rule *rule; |
Willy Tarreau | f059a0f | 2010-08-03 16:29:52 +0200 | [diff] [blame] | 1038 | struct stksess *ts; |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1039 | struct stktable *t = NULL; |
| 1040 | int result = 1; |
Willy Tarreau | a5c0ab2 | 2010-05-31 10:30:33 +0200 | [diff] [blame] | 1041 | int ret; |
| 1042 | |
| 1043 | list_for_each_entry(rule, &s->fe->tcp_req.l4_rules, list) { |
| 1044 | ret = ACL_PAT_PASS; |
| 1045 | |
| 1046 | if (rule->cond) { |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 1047 | ret = acl_exec_cond(rule->cond, s->fe, s, NULL, SMP_OPT_DIR_REQ|SMP_OPT_FINAL); |
Willy Tarreau | a5c0ab2 | 2010-05-31 10:30:33 +0200 | [diff] [blame] | 1048 | ret = acl_pass(ret); |
| 1049 | if (rule->cond->pol == ACL_COND_UNLESS) |
| 1050 | ret = !ret; |
| 1051 | } |
| 1052 | |
| 1053 | if (ret) { |
| 1054 | /* we have a matching rule. */ |
| 1055 | if (rule->action == TCP_ACT_REJECT) { |
Willy Tarreau | 7d0aaf3 | 2011-03-10 23:25:56 +0100 | [diff] [blame] | 1056 | s->fe->fe_counters.denied_conn++; |
Willy Tarreau | a5c0ab2 | 2010-05-31 10:30:33 +0200 | [diff] [blame] | 1057 | if (s->listener->counters) |
Willy Tarreau | 2799e98 | 2010-06-05 15:43:21 +0200 | [diff] [blame] | 1058 | s->listener->counters->denied_conn++; |
Willy Tarreau | a5c0ab2 | 2010-05-31 10:30:33 +0200 | [diff] [blame] | 1059 | |
| 1060 | if (!(s->flags & SN_ERR_MASK)) |
| 1061 | s->flags |= SN_ERR_PRXCOND; |
| 1062 | if (!(s->flags & SN_FINST_MASK)) |
| 1063 | s->flags |= SN_FINST_R; |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1064 | result = 0; |
| 1065 | break; |
Willy Tarreau | a5c0ab2 | 2010-05-31 10:30:33 +0200 | [diff] [blame] | 1066 | } |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 1067 | else if (rule->action == TCP_ACT_TRK_SC1) { |
| 1068 | if (!s->stkctr1_entry) { |
| 1069 | /* only the first valid track-sc1 directive applies. |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1070 | * Also, note that right now we can only track SRC so we |
| 1071 | * don't check how to get the key, but later we may need |
| 1072 | * to consider rule->act_prm->trk_ctr.type. |
| 1073 | */ |
| 1074 | t = rule->act_prm.trk_ctr.table.t; |
David du Colombier | 4f92d32 | 2011-03-24 11:09:31 +0100 | [diff] [blame] | 1075 | ts = stktable_get_entry(t, tcp_src_to_stktable_key(s)); |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1076 | if (ts) |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 1077 | session_track_stkctr1(s, t, ts); |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1078 | } |
| 1079 | } |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 1080 | else if (rule->action == TCP_ACT_TRK_SC2) { |
| 1081 | if (!s->stkctr2_entry) { |
| 1082 | /* only the first valid track-sc2 directive applies. |
Willy Tarreau | f059a0f | 2010-08-03 16:29:52 +0200 | [diff] [blame] | 1083 | * Also, note that right now we can only track SRC so we |
| 1084 | * don't check how to get the key, but later we may need |
| 1085 | * to consider rule->act_prm->trk_ctr.type. |
| 1086 | */ |
| 1087 | t = rule->act_prm.trk_ctr.table.t; |
David du Colombier | 4f92d32 | 2011-03-24 11:09:31 +0100 | [diff] [blame] | 1088 | ts = stktable_get_entry(t, tcp_src_to_stktable_key(s)); |
Willy Tarreau | f059a0f | 2010-08-03 16:29:52 +0200 | [diff] [blame] | 1089 | if (ts) |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 1090 | session_track_stkctr2(s, t, ts); |
Willy Tarreau | f059a0f | 2010-08-03 16:29:52 +0200 | [diff] [blame] | 1091 | } |
| 1092 | } |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1093 | else { |
| 1094 | /* otherwise it's an accept */ |
| 1095 | break; |
| 1096 | } |
Willy Tarreau | a5c0ab2 | 2010-05-31 10:30:33 +0200 | [diff] [blame] | 1097 | } |
| 1098 | } |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1099 | return result; |
Willy Tarreau | a5c0ab2 | 2010-05-31 10:30:33 +0200 | [diff] [blame] | 1100 | } |
| 1101 | |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1102 | /* Parse a tcp-response rule. Return a negative value in case of failure */ |
| 1103 | static int tcp_parse_response_rule(char **args, int arg, int section_type, |
| 1104 | struct proxy *curpx, struct proxy *defpx, |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1105 | struct tcp_rule *rule, char **err) |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1106 | { |
| 1107 | if (curpx == defpx || !(curpx->cap & PR_CAP_BE)) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1108 | memprintf(err, "%s %s is only allowed in 'backend' sections", |
| 1109 | args[0], args[1]); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1110 | return -1; |
| 1111 | } |
| 1112 | |
| 1113 | if (strcmp(args[arg], "accept") == 0) { |
| 1114 | arg++; |
| 1115 | rule->action = TCP_ACT_ACCEPT; |
| 1116 | } |
| 1117 | else if (strcmp(args[arg], "reject") == 0) { |
| 1118 | arg++; |
| 1119 | rule->action = TCP_ACT_REJECT; |
| 1120 | } |
| 1121 | else { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1122 | memprintf(err, |
| 1123 | "'%s %s' expects 'accept' or 'reject' in %s '%s' (got '%s')", |
| 1124 | args[0], args[1], proxy_type_str(curpx), curpx->id, args[arg]); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1125 | return -1; |
| 1126 | } |
| 1127 | |
| 1128 | if (strcmp(args[arg], "if") == 0 || strcmp(args[arg], "unless") == 0) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1129 | if ((rule->cond = build_acl_cond(NULL, 0, curpx, (const char **)args+arg, err)) == NULL) { |
| 1130 | memprintf(err, |
| 1131 | "'%s %s %s' : error detected in %s '%s' while parsing '%s' condition : %s", |
| 1132 | args[0], args[1], args[2], proxy_type_str(curpx), curpx->id, args[arg], *err); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1133 | return -1; |
| 1134 | } |
| 1135 | } |
| 1136 | else if (*args[arg]) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1137 | memprintf(err, |
| 1138 | "'%s %s %s' only accepts 'if' or 'unless', in %s '%s' (got '%s')", |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1139 | args[0], args[1], args[2], proxy_type_str(curpx), curpx->id, args[arg]); |
| 1140 | return -1; |
| 1141 | } |
| 1142 | return 0; |
| 1143 | } |
| 1144 | |
| 1145 | |
| 1146 | |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1147 | /* Parse a tcp-request rule. Return a negative value in case of failure */ |
| 1148 | static int tcp_parse_request_rule(char **args, int arg, int section_type, |
| 1149 | struct proxy *curpx, struct proxy *defpx, |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1150 | struct tcp_rule *rule, char **err) |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1151 | { |
| 1152 | if (curpx == defpx) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1153 | memprintf(err, "%s %s is not allowed in 'defaults' sections", |
| 1154 | args[0], args[1]); |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1155 | return -1; |
| 1156 | } |
| 1157 | |
| 1158 | if (!strcmp(args[arg], "accept")) { |
| 1159 | arg++; |
| 1160 | rule->action = TCP_ACT_ACCEPT; |
| 1161 | } |
| 1162 | else if (!strcmp(args[arg], "reject")) { |
| 1163 | arg++; |
| 1164 | rule->action = TCP_ACT_REJECT; |
| 1165 | } |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 1166 | else if (strcmp(args[arg], "track-sc1") == 0) { |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1167 | int ret; |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1168 | int kw = arg; |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1169 | |
| 1170 | arg++; |
| 1171 | ret = parse_track_counters(args, &arg, section_type, curpx, |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1172 | &rule->act_prm.trk_ctr, defpx, err); |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1173 | |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1174 | if (ret < 0) { /* nb: warnings are not handled yet */ |
| 1175 | memprintf(err, |
| 1176 | "'%s %s %s' : %s in %s '%s'", |
| 1177 | args[0], args[1], args[kw], *err, proxy_type_str(curpx), curpx->id); |
| 1178 | return ret; |
| 1179 | } |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 1180 | rule->action = TCP_ACT_TRK_SC1; |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1181 | } |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 1182 | else if (strcmp(args[arg], "track-sc2") == 0) { |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1183 | int ret; |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1184 | int kw = arg; |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1185 | |
| 1186 | arg++; |
| 1187 | ret = parse_track_counters(args, &arg, section_type, curpx, |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1188 | &rule->act_prm.trk_ctr, defpx, err); |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1189 | |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1190 | if (ret < 0) { /* nb: warnings are not handled yet */ |
| 1191 | memprintf(err, |
| 1192 | "'%s %s %s' : %s in %s '%s'", |
| 1193 | args[0], args[1], args[kw], *err, proxy_type_str(curpx), curpx->id); |
| 1194 | return ret; |
| 1195 | } |
Willy Tarreau | 5612328 | 2010-08-06 19:06:56 +0200 | [diff] [blame] | 1196 | rule->action = TCP_ACT_TRK_SC2; |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1197 | } |
| 1198 | else { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1199 | memprintf(err, |
| 1200 | "'%s %s' expects 'accept', 'reject', 'track-sc1' " |
| 1201 | "or 'track-sc2' in %s '%s' (got '%s')", |
| 1202 | args[0], args[1], proxy_type_str(curpx), curpx->id, args[arg]); |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1203 | return -1; |
| 1204 | } |
| 1205 | |
| 1206 | if (strcmp(args[arg], "if") == 0 || strcmp(args[arg], "unless") == 0) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1207 | if ((rule->cond = build_acl_cond(NULL, 0, curpx, (const char **)args+arg, err)) == NULL) { |
| 1208 | memprintf(err, |
| 1209 | "'%s %s %s' : error detected in %s '%s' while parsing '%s' condition : %s", |
| 1210 | args[0], args[1], args[2], proxy_type_str(curpx), curpx->id, args[arg], *err); |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1211 | return -1; |
| 1212 | } |
| 1213 | } |
| 1214 | else if (*args[arg]) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1215 | memprintf(err, |
| 1216 | "'%s %s %s' only accepts 'if' or 'unless', in %s '%s' (got '%s')", |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1217 | args[0], args[1], args[2], proxy_type_str(curpx), curpx->id, args[arg]); |
| 1218 | return -1; |
| 1219 | } |
| 1220 | return 0; |
| 1221 | } |
| 1222 | |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1223 | /* This function should be called to parse a line starting with the "tcp-response" |
| 1224 | * keyword. |
| 1225 | */ |
| 1226 | static int tcp_parse_tcp_rep(char **args, int section_type, struct proxy *curpx, |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1227 | struct proxy *defpx, char **err) |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1228 | { |
| 1229 | const char *ptr = NULL; |
| 1230 | unsigned int val; |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1231 | int warn = 0; |
| 1232 | int arg; |
| 1233 | struct tcp_rule *rule; |
| 1234 | |
| 1235 | if (!*args[1]) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1236 | memprintf(err, "missing argument for '%s' in %s '%s'", |
| 1237 | args[0], proxy_type_str(curpx), curpx->id); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1238 | return -1; |
| 1239 | } |
| 1240 | |
| 1241 | if (strcmp(args[1], "inspect-delay") == 0) { |
| 1242 | if (curpx == defpx || !(curpx->cap & PR_CAP_BE)) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1243 | memprintf(err, "%s %s is only allowed in 'backend' sections", |
| 1244 | args[0], args[1]); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1245 | return -1; |
| 1246 | } |
| 1247 | |
| 1248 | if (!*args[2] || (ptr = parse_time_err(args[2], &val, TIME_UNIT_MS))) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1249 | memprintf(err, |
| 1250 | "'%s %s' expects a positive delay in milliseconds, in %s '%s'", |
| 1251 | args[0], args[1], proxy_type_str(curpx), curpx->id); |
| 1252 | if (ptr) |
| 1253 | memprintf(err, "%s (unexpected character '%c')", *err, *ptr); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1254 | return -1; |
| 1255 | } |
| 1256 | |
| 1257 | if (curpx->tcp_rep.inspect_delay) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1258 | memprintf(err, "ignoring %s %s (was already defined) in %s '%s'", |
| 1259 | args[0], args[1], proxy_type_str(curpx), curpx->id); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1260 | return 1; |
| 1261 | } |
| 1262 | curpx->tcp_rep.inspect_delay = val; |
| 1263 | return 0; |
| 1264 | } |
| 1265 | |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 1266 | rule = calloc(1, sizeof(*rule)); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1267 | LIST_INIT(&rule->list); |
| 1268 | arg = 1; |
| 1269 | |
| 1270 | if (strcmp(args[1], "content") == 0) { |
| 1271 | arg++; |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1272 | if (tcp_parse_response_rule(args, arg, section_type, curpx, defpx, rule, err) < 0) |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1273 | goto error; |
| 1274 | |
| 1275 | if (rule->cond && (rule->cond->requires & ACL_USE_L6REQ_VOLATILE)) { |
| 1276 | struct acl *acl; |
| 1277 | const char *name; |
| 1278 | |
| 1279 | acl = cond_find_require(rule->cond, ACL_USE_L6REQ_VOLATILE); |
| 1280 | name = acl ? acl->name : "(unknown)"; |
| 1281 | |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1282 | memprintf(err, |
| 1283 | "acl '%s' involves some request-only criteria which will be ignored in '%s %s'", |
| 1284 | name, args[0], args[1]); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1285 | warn++; |
| 1286 | } |
| 1287 | |
| 1288 | LIST_ADDQ(&curpx->tcp_rep.inspect_rules, &rule->list); |
| 1289 | } |
| 1290 | else { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1291 | memprintf(err, |
| 1292 | "'%s' expects 'inspect-delay' or 'content' in %s '%s' (got '%s')", |
| 1293 | args[0], proxy_type_str(curpx), curpx->id, args[1]); |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1294 | goto error; |
| 1295 | } |
| 1296 | |
| 1297 | return warn; |
| 1298 | error: |
| 1299 | free(rule); |
| 1300 | return -1; |
| 1301 | } |
| 1302 | |
| 1303 | |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1304 | /* This function should be called to parse a line starting with the "tcp-request" |
| 1305 | * keyword. |
| 1306 | */ |
| 1307 | static int tcp_parse_tcp_req(char **args, int section_type, struct proxy *curpx, |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1308 | struct proxy *defpx, char **err) |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1309 | { |
| 1310 | const char *ptr = NULL; |
Willy Tarreau | c7e961e | 2008-08-17 17:13:47 +0200 | [diff] [blame] | 1311 | unsigned int val; |
Willy Tarreau | 1a68794 | 2010-05-23 22:40:30 +0200 | [diff] [blame] | 1312 | int warn = 0; |
Willy Tarreau | 6a984fa | 2010-06-14 16:44:27 +0200 | [diff] [blame] | 1313 | int arg; |
Willy Tarreau | 1a68794 | 2010-05-23 22:40:30 +0200 | [diff] [blame] | 1314 | struct tcp_rule *rule; |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1315 | |
| 1316 | if (!*args[1]) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1317 | if (curpx == defpx) |
| 1318 | memprintf(err, "missing argument for '%s' in defaults section", args[0]); |
| 1319 | else |
| 1320 | memprintf(err, "missing argument for '%s' in %s '%s'", |
| 1321 | args[0], proxy_type_str(curpx), curpx->id); |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1322 | return -1; |
| 1323 | } |
| 1324 | |
| 1325 | if (!strcmp(args[1], "inspect-delay")) { |
| 1326 | if (curpx == defpx) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1327 | memprintf(err, "%s %s is not allowed in 'defaults' sections", |
| 1328 | args[0], args[1]); |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1329 | return -1; |
| 1330 | } |
| 1331 | |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1332 | if (!*args[2] || (ptr = parse_time_err(args[2], &val, TIME_UNIT_MS))) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1333 | memprintf(err, |
| 1334 | "'%s %s' expects a positive delay in milliseconds, in %s '%s'", |
| 1335 | args[0], args[1], proxy_type_str(curpx), curpx->id); |
| 1336 | if (ptr) |
| 1337 | memprintf(err, "%s (unexpected character '%c')", *err, *ptr); |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1338 | return -1; |
| 1339 | } |
| 1340 | |
| 1341 | if (curpx->tcp_req.inspect_delay) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1342 | memprintf(err, "ignoring %s %s (was already defined) in %s '%s'", |
| 1343 | args[0], args[1], proxy_type_str(curpx), curpx->id); |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1344 | return 1; |
| 1345 | } |
| 1346 | curpx->tcp_req.inspect_delay = val; |
| 1347 | return 0; |
| 1348 | } |
| 1349 | |
Simon Horman | de072bd | 2011-06-24 15:11:37 +0900 | [diff] [blame] | 1350 | rule = calloc(1, sizeof(*rule)); |
Willy Tarreau | fb024dc | 2010-08-20 13:35:41 +0200 | [diff] [blame] | 1351 | LIST_INIT(&rule->list); |
Willy Tarreau | 6a984fa | 2010-06-14 16:44:27 +0200 | [diff] [blame] | 1352 | arg = 1; |
| 1353 | |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1354 | if (strcmp(args[1], "content") == 0) { |
Willy Tarreau | d1f9652 | 2010-08-03 19:34:32 +0200 | [diff] [blame] | 1355 | arg++; |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1356 | if (tcp_parse_request_rule(args, arg, section_type, curpx, defpx, rule, err) < 0) |
Willy Tarreau | 6a984fa | 2010-06-14 16:44:27 +0200 | [diff] [blame] | 1357 | goto error; |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1358 | |
Willy Tarreau | 6a984fa | 2010-06-14 16:44:27 +0200 | [diff] [blame] | 1359 | if (rule->cond && (rule->cond->requires & ACL_USE_RTR_ANY)) { |
Willy Tarreau | dd64f8d | 2008-07-27 22:02:32 +0200 | [diff] [blame] | 1360 | struct acl *acl; |
| 1361 | const char *name; |
| 1362 | |
Willy Tarreau | 6a984fa | 2010-06-14 16:44:27 +0200 | [diff] [blame] | 1363 | acl = cond_find_require(rule->cond, ACL_USE_RTR_ANY); |
Willy Tarreau | dd64f8d | 2008-07-27 22:02:32 +0200 | [diff] [blame] | 1364 | name = acl ? acl->name : "(unknown)"; |
| 1365 | |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1366 | memprintf(err, |
| 1367 | "acl '%s' involves some response-only criteria which will be ignored in '%s %s'", |
| 1368 | name, args[0], args[1]); |
Willy Tarreau | dd64f8d | 2008-07-27 22:02:32 +0200 | [diff] [blame] | 1369 | warn++; |
| 1370 | } |
Willy Tarreau | fb024dc | 2010-08-20 13:35:41 +0200 | [diff] [blame] | 1371 | LIST_ADDQ(&curpx->tcp_req.inspect_rules, &rule->list); |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1372 | } |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1373 | else if (strcmp(args[1], "connection") == 0) { |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1374 | arg++; |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1375 | |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1376 | if (!(curpx->cap & PR_CAP_FE)) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1377 | memprintf(err, "%s %s is not allowed because %s %s is not a frontend", |
| 1378 | args[0], args[1], proxy_type_str(curpx), curpx->id); |
Simon Horman | 6c54d8b | 2011-07-15 13:14:06 +0900 | [diff] [blame] | 1379 | goto error; |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1380 | } |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1381 | |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1382 | if (tcp_parse_request_rule(args, arg, section_type, curpx, defpx, rule, err) < 0) |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1383 | goto error; |
| 1384 | |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1385 | if (rule->cond && (rule->cond->requires & (ACL_USE_RTR_ANY|ACL_USE_L6_ANY|ACL_USE_L7_ANY))) { |
| 1386 | struct acl *acl; |
| 1387 | const char *name; |
Willy Tarreau | f059a0f | 2010-08-03 16:29:52 +0200 | [diff] [blame] | 1388 | |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1389 | acl = cond_find_require(rule->cond, ACL_USE_RTR_ANY|ACL_USE_L6_ANY|ACL_USE_L7_ANY); |
| 1390 | name = acl ? acl->name : "(unknown)"; |
Willy Tarreau | f059a0f | 2010-08-03 16:29:52 +0200 | [diff] [blame] | 1391 | |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1392 | if (acl->requires & (ACL_USE_L6_ANY|ACL_USE_L7_ANY)) { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1393 | memprintf(err, |
| 1394 | "'%s %s' may not reference acl '%s' which makes use of " |
| 1395 | "payload in %s '%s'. Please use '%s content' for this.", |
| 1396 | args[0], args[1], name, proxy_type_str(curpx), curpx->id, args[0]); |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1397 | goto error; |
| 1398 | } |
| 1399 | if (acl->requires & ACL_USE_RTR_ANY) |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1400 | memprintf(err, |
| 1401 | "acl '%s' involves some response-only criteria which will be ignored in '%s %s'", |
| 1402 | name, args[0], args[1]); |
Willy Tarreau | 68c03ab | 2010-08-06 15:08:45 +0200 | [diff] [blame] | 1403 | warn++; |
| 1404 | } |
Willy Tarreau | fb024dc | 2010-08-20 13:35:41 +0200 | [diff] [blame] | 1405 | LIST_ADDQ(&curpx->tcp_req.l4_rules, &rule->list); |
Willy Tarreau | 9ba2dcc | 2010-06-14 21:04:55 +0200 | [diff] [blame] | 1406 | } |
Willy Tarreau | 1a68794 | 2010-05-23 22:40:30 +0200 | [diff] [blame] | 1407 | else { |
Willy Tarreau | 0a3dd74 | 2012-05-08 19:47:01 +0200 | [diff] [blame] | 1408 | if (curpx == defpx) |
| 1409 | memprintf(err, |
| 1410 | "'%s' expects 'inspect-delay', 'connection', or 'content' in defaults section (got '%s')", |
| 1411 | args[0], args[1]); |
| 1412 | else |
| 1413 | memprintf(err, |
| 1414 | "'%s' expects 'inspect-delay', 'connection', or 'content' in %s '%s' (got '%s')", |
| 1415 | args[0], args[1], proxy_type_str(curpx), curpx->id); |
Willy Tarreau | 6a984fa | 2010-06-14 16:44:27 +0200 | [diff] [blame] | 1416 | goto error; |
Willy Tarreau | 1a68794 | 2010-05-23 22:40:30 +0200 | [diff] [blame] | 1417 | } |
| 1418 | |
Willy Tarreau | 1a68794 | 2010-05-23 22:40:30 +0200 | [diff] [blame] | 1419 | return warn; |
Willy Tarreau | 6a984fa | 2010-06-14 16:44:27 +0200 | [diff] [blame] | 1420 | error: |
| 1421 | free(rule); |
| 1422 | return -1; |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1423 | } |
| 1424 | |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1425 | |
| 1426 | /************************************************************************/ |
Willy Tarreau | 32389b7 | 2012-04-23 23:13:20 +0200 | [diff] [blame] | 1427 | /* All supported sample fetch functions must be declared here */ |
| 1428 | /************************************************************************/ |
| 1429 | |
| 1430 | /* Fetch the request RDP cookie identified in the args, or any cookie if no arg |
Willy Tarreau | 1278578 | 2012-04-27 21:37:17 +0200 | [diff] [blame] | 1431 | * is passed. It is usable both for ACL and for samples. Note: this decoder |
Willy Tarreau | 32389b7 | 2012-04-23 23:13:20 +0200 | [diff] [blame] | 1432 | * only works with non-wrapping data. Accepts either 0 or 1 argument. Argument |
| 1433 | * is a string (cookie name), other types will lead to undefined behaviour. |
| 1434 | */ |
| 1435 | int |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 1436 | smp_fetch_rdp_cookie(struct proxy *px, struct session *l4, void *l7, unsigned int opt, |
Willy Tarreau | 32389b7 | 2012-04-23 23:13:20 +0200 | [diff] [blame] | 1437 | const struct arg *args, struct sample *smp) |
| 1438 | { |
| 1439 | int bleft; |
| 1440 | const unsigned char *data; |
| 1441 | |
| 1442 | if (!l4 || !l4->req) |
| 1443 | return 0; |
| 1444 | |
| 1445 | smp->flags = 0; |
| 1446 | smp->type = SMP_T_CSTR; |
| 1447 | |
| 1448 | bleft = l4->req->i; |
| 1449 | if (bleft <= 11) |
| 1450 | goto too_short; |
| 1451 | |
| 1452 | data = (const unsigned char *)l4->req->p + 11; |
| 1453 | bleft -= 11; |
| 1454 | |
| 1455 | if (bleft <= 7) |
| 1456 | goto too_short; |
| 1457 | |
| 1458 | if (strncasecmp((const char *)data, "Cookie:", 7) != 0) |
| 1459 | goto not_cookie; |
| 1460 | |
| 1461 | data += 7; |
| 1462 | bleft -= 7; |
| 1463 | |
| 1464 | while (bleft > 0 && *data == ' ') { |
| 1465 | data++; |
| 1466 | bleft--; |
| 1467 | } |
| 1468 | |
| 1469 | if (args) { |
| 1470 | |
| 1471 | if (bleft <= args->data.str.len) |
| 1472 | goto too_short; |
| 1473 | |
| 1474 | if ((data[args->data.str.len] != '=') || |
| 1475 | strncasecmp(args->data.str.str, (const char *)data, args->data.str.len) != 0) |
| 1476 | goto not_cookie; |
| 1477 | |
| 1478 | data += args->data.str.len + 1; |
| 1479 | bleft -= args->data.str.len + 1; |
| 1480 | } else { |
| 1481 | while (bleft > 0 && *data != '=') { |
| 1482 | if (*data == '\r' || *data == '\n') |
| 1483 | goto not_cookie; |
| 1484 | data++; |
| 1485 | bleft--; |
| 1486 | } |
| 1487 | |
| 1488 | if (bleft < 1) |
| 1489 | goto too_short; |
| 1490 | |
| 1491 | if (*data != '=') |
| 1492 | goto not_cookie; |
| 1493 | |
| 1494 | data++; |
| 1495 | bleft--; |
| 1496 | } |
| 1497 | |
| 1498 | /* data points to cookie value */ |
| 1499 | smp->data.str.str = (char *)data; |
| 1500 | smp->data.str.len = 0; |
| 1501 | |
| 1502 | while (bleft > 0 && *data != '\r') { |
| 1503 | data++; |
| 1504 | bleft--; |
| 1505 | } |
| 1506 | |
| 1507 | if (bleft < 2) |
| 1508 | goto too_short; |
| 1509 | |
| 1510 | if (data[0] != '\r' || data[1] != '\n') |
| 1511 | goto not_cookie; |
| 1512 | |
| 1513 | smp->data.str.len = (char *)data - smp->data.str.str; |
| 1514 | smp->flags = SMP_F_VOLATILE; |
| 1515 | return 1; |
| 1516 | |
| 1517 | too_short: |
| 1518 | smp->flags = SMP_F_MAY_CHANGE; |
| 1519 | not_cookie: |
| 1520 | return 0; |
| 1521 | } |
| 1522 | |
Willy Tarreau | 32389b7 | 2012-04-23 23:13:20 +0200 | [diff] [blame] | 1523 | /************************************************************************/ |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1524 | /* All supported ACL keywords must be declared here. */ |
| 1525 | /************************************************************************/ |
| 1526 | |
Willy Tarreau | 32389b7 | 2012-04-23 23:13:20 +0200 | [diff] [blame] | 1527 | /* returns either 1 or 0 depending on whether an RDP cookie is found or not */ |
| 1528 | static int |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 1529 | acl_fetch_rdp_cookie_cnt(struct proxy *px, struct session *l4, void *l7, unsigned int opt, |
Willy Tarreau | 24e32d8 | 2012-04-23 23:55:44 +0200 | [diff] [blame] | 1530 | const struct arg *args, struct sample *smp) |
Willy Tarreau | 32389b7 | 2012-04-23 23:13:20 +0200 | [diff] [blame] | 1531 | { |
| 1532 | int ret; |
| 1533 | |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 1534 | ret = smp_fetch_rdp_cookie(px, l4, l7, opt, args, smp); |
Willy Tarreau | 32389b7 | 2012-04-23 23:13:20 +0200 | [diff] [blame] | 1535 | |
| 1536 | if (smp->flags & SMP_F_MAY_CHANGE) |
| 1537 | return 0; |
| 1538 | |
| 1539 | smp->flags = SMP_F_VOLATILE; |
| 1540 | smp->type = SMP_T_UINT; |
| 1541 | smp->data.uint = ret; |
| 1542 | return 1; |
| 1543 | } |
| 1544 | |
| 1545 | |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1546 | /* fetch the connection's source IPv4/IPv6 address */ |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1547 | static int |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1548 | smp_fetch_src(struct proxy *px, struct session *l4, void *l7, unsigned int opt, |
Willy Tarreau | 24e32d8 | 2012-04-23 23:55:44 +0200 | [diff] [blame] | 1549 | const struct arg *args, struct sample *smp) |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1550 | { |
Willy Tarreau | f4362b3 | 2011-12-16 17:49:52 +0100 | [diff] [blame] | 1551 | switch (l4->si[0].addr.from.ss_family) { |
| 1552 | case AF_INET: |
Willy Tarreau | f853c46 | 2012-04-23 18:53:56 +0200 | [diff] [blame] | 1553 | smp->data.ipv4 = ((struct sockaddr_in *)&l4->si[0].addr.from)->sin_addr; |
| 1554 | smp->type = SMP_T_IPV4; |
Willy Tarreau | f4362b3 | 2011-12-16 17:49:52 +0100 | [diff] [blame] | 1555 | break; |
| 1556 | case AF_INET6: |
Willy Tarreau | f853c46 | 2012-04-23 18:53:56 +0200 | [diff] [blame] | 1557 | smp->data.ipv6 = ((struct sockaddr_in6 *)(&l4->si[0].addr.from))->sin6_addr; |
| 1558 | smp->type = SMP_T_IPV6; |
Willy Tarreau | f4362b3 | 2011-12-16 17:49:52 +0100 | [diff] [blame] | 1559 | break; |
| 1560 | default: |
Emeric Brun | f769f51 | 2010-10-22 17:14:01 +0200 | [diff] [blame] | 1561 | return 0; |
Willy Tarreau | f4362b3 | 2011-12-16 17:49:52 +0100 | [diff] [blame] | 1562 | } |
Emeric Brun | f769f51 | 2010-10-22 17:14:01 +0200 | [diff] [blame] | 1563 | |
Willy Tarreau | 3740635 | 2012-04-23 16:16:37 +0200 | [diff] [blame] | 1564 | smp->flags = 0; |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1565 | return 1; |
| 1566 | } |
| 1567 | |
Willy Tarreau | a5e3756 | 2011-12-16 17:06:15 +0100 | [diff] [blame] | 1568 | /* set temp integer to the connection's source port */ |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1569 | static int |
Willy Tarreau | 25c1ebc | 2012-04-25 16:21:44 +0200 | [diff] [blame] | 1570 | smp_fetch_sport(struct proxy *px, struct session *l4, void *l7, unsigned int opt, |
Willy Tarreau | 24e32d8 | 2012-04-23 23:55:44 +0200 | [diff] [blame] | 1571 | const struct arg *args, struct sample *smp) |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1572 | { |
Willy Tarreau | f853c46 | 2012-04-23 18:53:56 +0200 | [diff] [blame] | 1573 | smp->type = SMP_T_UINT; |
| 1574 | if (!(smp->data.uint = get_host_port(&l4->si[0].addr.from))) |
Emeric Brun | f769f51 | 2010-10-22 17:14:01 +0200 | [diff] [blame] | 1575 | return 0; |
| 1576 | |
Willy Tarreau | 3740635 | 2012-04-23 16:16:37 +0200 | [diff] [blame] | 1577 | smp->flags = 0; |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1578 | return 1; |
| 1579 | } |
| 1580 | |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1581 | /* fetch the connection's destination IPv4/IPv6 address */ |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1582 | static int |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1583 | smp_fetch_dst(struct proxy *px, struct session *l4, void *l7, unsigned int opt, |
Willy Tarreau | 24e32d8 | 2012-04-23 23:55:44 +0200 | [diff] [blame] | 1584 | const struct arg *args, struct sample *smp) |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1585 | { |
Willy Tarreau | 59b9479 | 2012-05-11 16:16:40 +0200 | [diff] [blame] | 1586 | si_get_to_addr(&l4->si[0]); |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1587 | |
Willy Tarreau | f4362b3 | 2011-12-16 17:49:52 +0100 | [diff] [blame] | 1588 | switch (l4->si[0].addr.to.ss_family) { |
| 1589 | case AF_INET: |
Willy Tarreau | f853c46 | 2012-04-23 18:53:56 +0200 | [diff] [blame] | 1590 | smp->data.ipv4 = ((struct sockaddr_in *)&l4->si[0].addr.to)->sin_addr; |
| 1591 | smp->type = SMP_T_IPV4; |
Willy Tarreau | f4362b3 | 2011-12-16 17:49:52 +0100 | [diff] [blame] | 1592 | break; |
| 1593 | case AF_INET6: |
Willy Tarreau | f853c46 | 2012-04-23 18:53:56 +0200 | [diff] [blame] | 1594 | smp->data.ipv6 = ((struct sockaddr_in6 *)(&l4->si[0].addr.to))->sin6_addr; |
| 1595 | smp->type = SMP_T_IPV6; |
Willy Tarreau | f4362b3 | 2011-12-16 17:49:52 +0100 | [diff] [blame] | 1596 | break; |
| 1597 | default: |
Emeric Brun | f769f51 | 2010-10-22 17:14:01 +0200 | [diff] [blame] | 1598 | return 0; |
Willy Tarreau | f4362b3 | 2011-12-16 17:49:52 +0100 | [diff] [blame] | 1599 | } |
Emeric Brun | f769f51 | 2010-10-22 17:14:01 +0200 | [diff] [blame] | 1600 | |
Willy Tarreau | 3740635 | 2012-04-23 16:16:37 +0200 | [diff] [blame] | 1601 | smp->flags = 0; |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1602 | return 1; |
| 1603 | } |
| 1604 | |
Willy Tarreau | a5e3756 | 2011-12-16 17:06:15 +0100 | [diff] [blame] | 1605 | /* set temp integer to the frontend connexion's destination port */ |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1606 | static int |
Willy Tarreau | 25c1ebc | 2012-04-25 16:21:44 +0200 | [diff] [blame] | 1607 | smp_fetch_dport(struct proxy *px, struct session *l4, void *l7, unsigned int opt, |
Willy Tarreau | 24e32d8 | 2012-04-23 23:55:44 +0200 | [diff] [blame] | 1608 | const struct arg *args, struct sample *smp) |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1609 | { |
Willy Tarreau | 59b9479 | 2012-05-11 16:16:40 +0200 | [diff] [blame] | 1610 | si_get_to_addr(&l4->si[0]); |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1611 | |
Willy Tarreau | f853c46 | 2012-04-23 18:53:56 +0200 | [diff] [blame] | 1612 | smp->type = SMP_T_UINT; |
| 1613 | if (!(smp->data.uint = get_host_port(&l4->si[0].addr.to))) |
Emeric Brun | f769f51 | 2010-10-22 17:14:01 +0200 | [diff] [blame] | 1614 | return 0; |
| 1615 | |
Willy Tarreau | 3740635 | 2012-04-23 16:16:37 +0200 | [diff] [blame] | 1616 | smp->flags = 0; |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1617 | return 1; |
| 1618 | } |
| 1619 | |
| 1620 | static int |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1621 | smp_fetch_payload_lv(struct proxy *px, struct session *l4, void *l7, unsigned int opt, |
| 1622 | const struct arg *arg_p, struct sample *smp) |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1623 | { |
Willy Tarreau | 82ea800 | 2012-04-25 19:19:43 +0200 | [diff] [blame] | 1624 | unsigned int len_offset = arg_p[0].data.uint; |
| 1625 | unsigned int len_size = arg_p[1].data.uint; |
| 1626 | unsigned int buf_offset; |
| 1627 | unsigned int buf_size = 0; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1628 | struct buffer *b; |
| 1629 | int i; |
| 1630 | |
| 1631 | /* Format is (len offset, len size, buf offset) or (len offset, len size) */ |
| 1632 | /* by default buf offset == len offset + len size */ |
| 1633 | /* buf offset could be absolute or relative to len offset + len size if prefixed by + or - */ |
| 1634 | |
| 1635 | if (!l4) |
| 1636 | return 0; |
| 1637 | |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 1638 | b = ((opt & SMP_OPT_DIR) == SMP_OPT_DIR_RES) ? l4->rep : l4->req; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1639 | |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1640 | if (!b) |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1641 | return 0; |
| 1642 | |
Willy Tarreau | 02d6cfc | 2012-03-01 18:19:58 +0100 | [diff] [blame] | 1643 | if (len_offset + len_size > b->i) |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1644 | goto too_short; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1645 | |
| 1646 | for (i = 0; i < len_size; i++) { |
Willy Tarreau | 89fa706 | 2012-03-02 16:13:16 +0100 | [diff] [blame] | 1647 | buf_size = (buf_size << 8) + ((unsigned char *)b->p)[i + len_offset]; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1648 | } |
| 1649 | |
Willy Tarreau | 9fcb984 | 2012-04-20 14:45:49 +0200 | [diff] [blame] | 1650 | /* buf offset may be implicit, absolute or relative */ |
| 1651 | buf_offset = len_offset + len_size; |
| 1652 | if (arg_p[2].type == ARGT_UINT) |
| 1653 | buf_offset = arg_p[2].data.uint; |
| 1654 | else if (arg_p[2].type == ARGT_SINT) |
| 1655 | buf_offset += arg_p[2].data.sint; |
| 1656 | |
Willy Tarreau | 82ea800 | 2012-04-25 19:19:43 +0200 | [diff] [blame] | 1657 | if (!buf_size || buf_size > b->size || buf_offset + buf_size > b->size) { |
| 1658 | /* will never match */ |
| 1659 | smp->flags = 0; |
| 1660 | return 0; |
| 1661 | } |
| 1662 | |
Willy Tarreau | 02d6cfc | 2012-03-01 18:19:58 +0100 | [diff] [blame] | 1663 | if (buf_offset + buf_size > b->i) |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1664 | goto too_short; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1665 | |
| 1666 | /* init chunk as read only */ |
Willy Tarreau | b8c8f1f | 2012-04-23 22:38:26 +0200 | [diff] [blame] | 1667 | smp->type = SMP_T_CBIN; |
Willy Tarreau | 342acb4 | 2012-04-23 22:03:39 +0200 | [diff] [blame] | 1668 | chunk_initlen(&smp->data.str, b->p + buf_offset, 0, buf_size); |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1669 | smp->flags = SMP_F_VOLATILE; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1670 | return 1; |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1671 | |
| 1672 | too_short: |
| 1673 | smp->flags = SMP_F_MAY_CHANGE; |
| 1674 | return 0; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1675 | } |
| 1676 | |
| 1677 | static int |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1678 | smp_fetch_payload(struct proxy *px, struct session *l4, void *l7, unsigned int opt, |
| 1679 | const struct arg *arg_p, struct sample *smp) |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1680 | { |
Willy Tarreau | 82ea800 | 2012-04-25 19:19:43 +0200 | [diff] [blame] | 1681 | unsigned int buf_offset = arg_p[0].data.uint; |
| 1682 | unsigned int buf_size = arg_p[1].data.uint; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1683 | struct buffer *b; |
| 1684 | |
| 1685 | if (!l4) |
| 1686 | return 0; |
| 1687 | |
Willy Tarreau | 32a6f2e | 2012-04-25 10:13:36 +0200 | [diff] [blame] | 1688 | b = ((opt & SMP_OPT_DIR) == SMP_OPT_DIR_RES) ? l4->rep : l4->req; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1689 | |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1690 | if (!b) |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1691 | return 0; |
Willy Tarreau | 82ea800 | 2012-04-25 19:19:43 +0200 | [diff] [blame] | 1692 | |
| 1693 | if (!buf_size || buf_size > b->size || buf_offset + buf_size > b->size) { |
| 1694 | /* will never match */ |
| 1695 | smp->flags = 0; |
| 1696 | return 0; |
| 1697 | } |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1698 | |
Willy Tarreau | 02d6cfc | 2012-03-01 18:19:58 +0100 | [diff] [blame] | 1699 | if (buf_offset + buf_size > b->i) |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1700 | goto too_short; |
Emeric | f2d7cae | 2010-11-05 18:13:50 +0100 | [diff] [blame] | 1701 | |
| 1702 | /* init chunk as read only */ |
Willy Tarreau | b8c8f1f | 2012-04-23 22:38:26 +0200 | [diff] [blame] | 1703 | smp->type = SMP_T_CBIN; |
Willy Tarreau | 342acb4 | 2012-04-23 22:03:39 +0200 | [diff] [blame] | 1704 | chunk_initlen(&smp->data.str, b->p + buf_offset, 0, buf_size); |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1705 | smp->flags = SMP_F_VOLATILE; |
Simon Horman | ab814e0 | 2011-06-24 14:50:20 +0900 | [diff] [blame] | 1706 | return 1; |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1707 | |
| 1708 | too_short: |
| 1709 | smp->flags = SMP_F_MAY_CHANGE; |
| 1710 | return 0; |
Simon Horman | ab814e0 | 2011-06-24 14:50:20 +0900 | [diff] [blame] | 1711 | } |
| 1712 | |
Willy Tarreau | 21d68a6 | 2012-04-20 15:52:36 +0200 | [diff] [blame] | 1713 | /* This function is used to validate the arguments passed to a "payload" fetch |
| 1714 | * keyword. This keyword expects two positive integers, with the second one |
| 1715 | * being strictly positive. It is assumed that the types are already the correct |
| 1716 | * ones. Returns 0 on error, non-zero if OK. If <err_msg> is not NULL, it will be |
| 1717 | * filled with a pointer to an error message in case of error, that the caller |
| 1718 | * is responsible for freeing. The initial location must either be freeable or |
| 1719 | * NULL. |
| 1720 | */ |
| 1721 | static int val_payload(struct arg *arg, char **err_msg) |
| 1722 | { |
| 1723 | if (!arg[1].data.uint) { |
| 1724 | if (err_msg) |
| 1725 | memprintf(err_msg, "payload length must be > 0"); |
| 1726 | return 0; |
| 1727 | } |
| 1728 | return 1; |
| 1729 | } |
| 1730 | |
| 1731 | /* This function is used to validate the arguments passed to a "payload_lv" fetch |
| 1732 | * keyword. This keyword allows two positive integers and an optional signed one, |
| 1733 | * with the second one being strictly positive and the third one being greater than |
| 1734 | * the opposite of the two others if negative. It is assumed that the types are |
| 1735 | * already the correct ones. Returns 0 on error, non-zero if OK. If <err_msg> is |
| 1736 | * not NULL, it will be filled with a pointer to an error message in case of |
| 1737 | * error, that the caller is responsible for freeing. The initial location must |
| 1738 | * either be freeable or NULL. |
| 1739 | */ |
| 1740 | static int val_payload_lv(struct arg *arg, char **err_msg) |
| 1741 | { |
| 1742 | if (!arg[1].data.uint) { |
| 1743 | if (err_msg) |
| 1744 | memprintf(err_msg, "payload length must be > 0"); |
| 1745 | return 0; |
| 1746 | } |
| 1747 | |
| 1748 | if (arg[2].type == ARGT_SINT && |
| 1749 | (int)(arg[0].data.uint + arg[1].data.uint + arg[2].data.sint) < 0) { |
| 1750 | if (err_msg) |
| 1751 | memprintf(err_msg, "payload offset too negative"); |
| 1752 | return 0; |
| 1753 | } |
| 1754 | return 1; |
| 1755 | } |
| 1756 | |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1757 | static struct cfg_kw_list cfg_kws = {{ },{ |
| 1758 | { CFG_LISTEN, "tcp-request", tcp_parse_tcp_req }, |
Emeric Brun | 97679e7 | 2010-09-23 17:56:44 +0200 | [diff] [blame] | 1759 | { CFG_LISTEN, "tcp-response", tcp_parse_tcp_rep }, |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1760 | { 0, NULL, NULL }, |
| 1761 | }}; |
| 1762 | |
Willy Tarreau | 61612d4 | 2012-04-19 18:42:05 +0200 | [diff] [blame] | 1763 | /* Note: must not be declared <const> as its list will be overwritten. |
| 1764 | * Please take care of keeping this list alphabetically sorted. |
| 1765 | */ |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1766 | static struct acl_kw_list acl_kws = {{ },{ |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1767 | { "dst", acl_parse_ip, smp_fetch_dst, acl_match_ip, ACL_USE_TCP4_PERMANENT|ACL_MAY_LOOKUP, 0 }, |
Willy Tarreau | 25c1ebc | 2012-04-25 16:21:44 +0200 | [diff] [blame] | 1768 | { "dst_port", acl_parse_int, smp_fetch_dport, acl_match_int, ACL_USE_TCP_PERMANENT, 0 }, |
Willy Tarreau | 0d5fe14 | 2012-04-26 12:24:45 +0200 | [diff] [blame] | 1769 | { "payload", acl_parse_str, smp_fetch_payload, acl_match_str, ACL_USE_L6REQ_VOLATILE|ACL_MAY_LOOKUP, ARG2(2,UINT,UINT), val_payload }, |
| 1770 | { "payload_lv", acl_parse_str, smp_fetch_payload_lv, acl_match_str, ACL_USE_L6REQ_VOLATILE|ACL_MAY_LOOKUP, ARG3(2,UINT,UINT,SINT), val_payload_lv }, |
Willy Tarreau | 9fb4bc7 | 2012-04-24 00:09:26 +0200 | [diff] [blame] | 1771 | { "req_rdp_cookie", acl_parse_str, smp_fetch_rdp_cookie, acl_match_str, ACL_USE_L6REQ_VOLATILE|ACL_MAY_LOOKUP, ARG1(0,STR) }, |
Willy Tarreau | 32389b7 | 2012-04-23 23:13:20 +0200 | [diff] [blame] | 1772 | { "req_rdp_cookie_cnt", acl_parse_int, acl_fetch_rdp_cookie_cnt, acl_match_int, ACL_USE_L6REQ_VOLATILE, ARG1(0,STR) }, |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1773 | { "src", acl_parse_ip, smp_fetch_src, acl_match_ip, ACL_USE_TCP4_PERMANENT|ACL_MAY_LOOKUP, 0 }, |
Willy Tarreau | 25c1ebc | 2012-04-25 16:21:44 +0200 | [diff] [blame] | 1774 | { "src_port", acl_parse_int, smp_fetch_sport, acl_match_int, ACL_USE_TCP_PERMANENT, 0 }, |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1775 | { NULL, NULL, NULL, NULL }, |
| 1776 | }}; |
| 1777 | |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1778 | /* Note: must not be declared <const> as its list will be overwritten. |
| 1779 | * Note: fetches that may return multiple types must be declared as the lowest |
| 1780 | * common denominator, the type that can be casted into all other ones. For |
| 1781 | * instance v4/v6 must be declared v4. |
| 1782 | */ |
Willy Tarreau | 1278578 | 2012-04-27 21:37:17 +0200 | [diff] [blame] | 1783 | static struct sample_fetch_kw_list sample_fetch_keywords = {{ },{ |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1784 | { "src", smp_fetch_src, 0, NULL, SMP_T_IPV4, SMP_CAP_REQ|SMP_CAP_RES }, |
Willy Tarreau | 4a12981 | 2012-04-25 17:31:42 +0200 | [diff] [blame] | 1785 | { "dst", smp_fetch_dst, 0, NULL, SMP_T_IPV4, SMP_CAP_REQ|SMP_CAP_RES }, |
Willy Tarreau | 25c1ebc | 2012-04-25 16:21:44 +0200 | [diff] [blame] | 1786 | { "dst_port", smp_fetch_dport, 0, NULL, SMP_T_UINT, SMP_CAP_REQ|SMP_CAP_RES }, |
Willy Tarreau | 0ce3aa0 | 2012-04-25 18:46:33 +0200 | [diff] [blame] | 1787 | { "payload", smp_fetch_payload, ARG2(2,UINT,UINT), val_payload, SMP_T_CBIN, SMP_CAP_REQ|SMP_CAP_RES }, |
| 1788 | { "payload_lv", smp_fetch_payload_lv, ARG3(2,UINT,UINT,SINT), val_payload_lv, SMP_T_CBIN, SMP_CAP_REQ|SMP_CAP_RES }, |
Willy Tarreau | d6281ae | 2012-04-26 11:23:39 +0200 | [diff] [blame] | 1789 | { "rdp_cookie", smp_fetch_rdp_cookie, ARG1(1,STR), NULL, SMP_T_CSTR, SMP_CAP_REQ|SMP_CAP_RES }, |
Willy Tarreau | 25c1ebc | 2012-04-25 16:21:44 +0200 | [diff] [blame] | 1790 | { "src_port", smp_fetch_sport, 0, NULL, SMP_T_UINT, SMP_CAP_REQ|SMP_CAP_RES }, |
Willy Tarreau | 9fcb984 | 2012-04-20 14:45:49 +0200 | [diff] [blame] | 1791 | { NULL, NULL, 0, 0, 0 }, |
Willy Tarreau | 645513a | 2010-05-24 20:55:15 +0200 | [diff] [blame] | 1792 | }}; |
| 1793 | |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 1794 | __attribute__((constructor)) |
| 1795 | static void __tcp_protocol_init(void) |
| 1796 | { |
| 1797 | protocol_register(&proto_tcpv4); |
| 1798 | protocol_register(&proto_tcpv6); |
Willy Tarreau | 1278578 | 2012-04-27 21:37:17 +0200 | [diff] [blame] | 1799 | sample_register_fetches(&sample_fetch_keywords); |
Willy Tarreau | b686644 | 2008-07-14 23:54:42 +0200 | [diff] [blame] | 1800 | cfg_register_keywords(&cfg_kws); |
| 1801 | acl_register_keywords(&acl_kws); |
Willy Tarreau | e6b9894 | 2007-10-29 01:09:36 +0100 | [diff] [blame] | 1802 | } |
| 1803 | |
| 1804 | |
| 1805 | /* |
| 1806 | * Local variables: |
| 1807 | * c-indent-level: 8 |
| 1808 | * c-basic-offset: 8 |
| 1809 | * End: |
| 1810 | */ |