Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1 | /* |
| 2 | * Pattern management functions. |
| 3 | * |
| 4 | * Copyright 2000-2013 Willy Tarreau <w@1wt.eu> |
| 5 | * |
| 6 | * This program is free software; you can redistribute it and/or |
| 7 | * modify it under the terms of the GNU General Public License |
| 8 | * as published by the Free Software Foundation; either version |
| 9 | * 2 of the License, or (at your option) any later version. |
| 10 | * |
| 11 | */ |
| 12 | |
| 13 | #include <ctype.h> |
| 14 | #include <stdio.h> |
Jerome Magnin | b8bd6d7 | 2020-01-17 18:01:20 +0100 | [diff] [blame] | 15 | #include <errno.h> |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 16 | |
Willy Tarreau | b255105 | 2020-06-09 09:07:15 +0200 | [diff] [blame] | 17 | #include <import/ebsttree.h> |
| 18 | #include <import/lru.h> |
Willy Tarreau | b255105 | 2020-06-09 09:07:15 +0200 | [diff] [blame] | 19 | |
Willy Tarreau | 4c7e4b7 | 2020-05-27 12:58:42 +0200 | [diff] [blame] | 20 | #include <haproxy/api.h> |
Willy Tarreau | f268ee8 | 2020-06-04 17:05:57 +0200 | [diff] [blame] | 21 | #include <haproxy/global.h> |
Willy Tarreau | aeed4a8 | 2020-06-04 22:01:04 +0200 | [diff] [blame] | 22 | #include <haproxy/log.h> |
Willy Tarreau | 6131d6a | 2020-06-02 16:48:09 +0200 | [diff] [blame] | 23 | #include <haproxy/net_helper.h> |
Willy Tarreau | 225a90a | 2020-06-04 15:06:28 +0200 | [diff] [blame] | 24 | #include <haproxy/pattern.h> |
Willy Tarreau | 7cd8b6e | 2020-06-02 17:32:26 +0200 | [diff] [blame] | 25 | #include <haproxy/regex.h> |
Willy Tarreau | e6ce10b | 2020-06-04 15:33:47 +0200 | [diff] [blame] | 26 | #include <haproxy/sample.h> |
Willy Tarreau | b255105 | 2020-06-09 09:07:15 +0200 | [diff] [blame] | 27 | #include <haproxy/tools.h> |
Tim Duesterhus | d5fc8fc | 2021-09-11 17:51:13 +0200 | [diff] [blame] | 28 | #include <haproxy/xxhash.h> |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 29 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 30 | |
Willy Tarreau | 9057a00 | 2021-04-10 17:44:27 +0200 | [diff] [blame] | 31 | const char *const pat_match_names[PAT_MATCH_NUM] = { |
Thierry FOURNIER | a65b343 | 2013-11-28 18:22:00 +0100 | [diff] [blame] | 32 | [PAT_MATCH_FOUND] = "found", |
| 33 | [PAT_MATCH_BOOL] = "bool", |
| 34 | [PAT_MATCH_INT] = "int", |
| 35 | [PAT_MATCH_IP] = "ip", |
| 36 | [PAT_MATCH_BIN] = "bin", |
| 37 | [PAT_MATCH_LEN] = "len", |
| 38 | [PAT_MATCH_STR] = "str", |
| 39 | [PAT_MATCH_BEG] = "beg", |
| 40 | [PAT_MATCH_SUB] = "sub", |
| 41 | [PAT_MATCH_DIR] = "dir", |
| 42 | [PAT_MATCH_DOM] = "dom", |
| 43 | [PAT_MATCH_END] = "end", |
| 44 | [PAT_MATCH_REG] = "reg", |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 45 | [PAT_MATCH_REGM] = "regm", |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 46 | }; |
| 47 | |
Willy Tarreau | 9057a00 | 2021-04-10 17:44:27 +0200 | [diff] [blame] | 48 | int (*const pat_parse_fcts[PAT_MATCH_NUM])(const char *, struct pattern *, int, char **) = { |
Thierry FOURNIER | a65b343 | 2013-11-28 18:22:00 +0100 | [diff] [blame] | 49 | [PAT_MATCH_FOUND] = pat_parse_nothing, |
| 50 | [PAT_MATCH_BOOL] = pat_parse_nothing, |
| 51 | [PAT_MATCH_INT] = pat_parse_int, |
| 52 | [PAT_MATCH_IP] = pat_parse_ip, |
| 53 | [PAT_MATCH_BIN] = pat_parse_bin, |
Thierry FOURNIER | 5d34408 | 2014-01-27 14:19:53 +0100 | [diff] [blame] | 54 | [PAT_MATCH_LEN] = pat_parse_int, |
Thierry FOURNIER | a65b343 | 2013-11-28 18:22:00 +0100 | [diff] [blame] | 55 | [PAT_MATCH_STR] = pat_parse_str, |
| 56 | [PAT_MATCH_BEG] = pat_parse_str, |
| 57 | [PAT_MATCH_SUB] = pat_parse_str, |
| 58 | [PAT_MATCH_DIR] = pat_parse_str, |
| 59 | [PAT_MATCH_DOM] = pat_parse_str, |
| 60 | [PAT_MATCH_END] = pat_parse_str, |
| 61 | [PAT_MATCH_REG] = pat_parse_reg, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 62 | [PAT_MATCH_REGM] = pat_parse_reg, |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 63 | }; |
| 64 | |
Willy Tarreau | 9057a00 | 2021-04-10 17:44:27 +0200 | [diff] [blame] | 65 | int (*const pat_index_fcts[PAT_MATCH_NUM])(struct pattern_expr *, struct pattern *, char **) = { |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 66 | [PAT_MATCH_FOUND] = pat_idx_list_val, |
| 67 | [PAT_MATCH_BOOL] = pat_idx_list_val, |
| 68 | [PAT_MATCH_INT] = pat_idx_list_val, |
| 69 | [PAT_MATCH_IP] = pat_idx_tree_ip, |
| 70 | [PAT_MATCH_BIN] = pat_idx_list_ptr, |
| 71 | [PAT_MATCH_LEN] = pat_idx_list_val, |
| 72 | [PAT_MATCH_STR] = pat_idx_tree_str, |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 73 | [PAT_MATCH_BEG] = pat_idx_tree_pfx, |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 74 | [PAT_MATCH_SUB] = pat_idx_list_str, |
| 75 | [PAT_MATCH_DIR] = pat_idx_list_str, |
| 76 | [PAT_MATCH_DOM] = pat_idx_list_str, |
| 77 | [PAT_MATCH_END] = pat_idx_list_str, |
| 78 | [PAT_MATCH_REG] = pat_idx_list_reg, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 79 | [PAT_MATCH_REGM] = pat_idx_list_regm, |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 80 | }; |
| 81 | |
Willy Tarreau | 9057a00 | 2021-04-10 17:44:27 +0200 | [diff] [blame] | 82 | void (*const pat_prune_fcts[PAT_MATCH_NUM])(struct pattern_expr *) = { |
Willy Tarreau | 6d8a689 | 2020-11-02 19:26:02 +0100 | [diff] [blame] | 83 | [PAT_MATCH_FOUND] = pat_prune_gen, |
| 84 | [PAT_MATCH_BOOL] = pat_prune_gen, |
| 85 | [PAT_MATCH_INT] = pat_prune_gen, |
| 86 | [PAT_MATCH_IP] = pat_prune_gen, |
| 87 | [PAT_MATCH_BIN] = pat_prune_gen, |
| 88 | [PAT_MATCH_LEN] = pat_prune_gen, |
| 89 | [PAT_MATCH_STR] = pat_prune_gen, |
| 90 | [PAT_MATCH_BEG] = pat_prune_gen, |
| 91 | [PAT_MATCH_SUB] = pat_prune_gen, |
| 92 | [PAT_MATCH_DIR] = pat_prune_gen, |
| 93 | [PAT_MATCH_DOM] = pat_prune_gen, |
| 94 | [PAT_MATCH_END] = pat_prune_gen, |
| 95 | [PAT_MATCH_REG] = pat_prune_gen, |
| 96 | [PAT_MATCH_REGM] = pat_prune_gen, |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 97 | }; |
| 98 | |
Willy Tarreau | 9057a00 | 2021-04-10 17:44:27 +0200 | [diff] [blame] | 99 | struct pattern *(*const pat_match_fcts[PAT_MATCH_NUM])(struct sample *, struct pattern_expr *, int) = { |
Thierry FOURNIER | a65b343 | 2013-11-28 18:22:00 +0100 | [diff] [blame] | 100 | [PAT_MATCH_FOUND] = NULL, |
| 101 | [PAT_MATCH_BOOL] = pat_match_nothing, |
| 102 | [PAT_MATCH_INT] = pat_match_int, |
| 103 | [PAT_MATCH_IP] = pat_match_ip, |
| 104 | [PAT_MATCH_BIN] = pat_match_bin, |
| 105 | [PAT_MATCH_LEN] = pat_match_len, |
| 106 | [PAT_MATCH_STR] = pat_match_str, |
| 107 | [PAT_MATCH_BEG] = pat_match_beg, |
| 108 | [PAT_MATCH_SUB] = pat_match_sub, |
| 109 | [PAT_MATCH_DIR] = pat_match_dir, |
| 110 | [PAT_MATCH_DOM] = pat_match_dom, |
| 111 | [PAT_MATCH_END] = pat_match_end, |
| 112 | [PAT_MATCH_REG] = pat_match_reg, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 113 | [PAT_MATCH_REGM] = pat_match_regm, |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 114 | }; |
| 115 | |
Thierry FOURNIER | e3ded59 | 2013-12-06 15:36:54 +0100 | [diff] [blame] | 116 | /* Just used for checking configuration compatibility */ |
Willy Tarreau | 9057a00 | 2021-04-10 17:44:27 +0200 | [diff] [blame] | 117 | int const pat_match_types[PAT_MATCH_NUM] = { |
Thierry FOURNIER | 07ee64e | 2015-07-06 23:43:03 +0200 | [diff] [blame] | 118 | [PAT_MATCH_FOUND] = SMP_T_SINT, |
| 119 | [PAT_MATCH_BOOL] = SMP_T_SINT, |
| 120 | [PAT_MATCH_INT] = SMP_T_SINT, |
Thierry FOURNIER | e3ded59 | 2013-12-06 15:36:54 +0100 | [diff] [blame] | 121 | [PAT_MATCH_IP] = SMP_T_ADDR, |
Thierry FOURNIER | 7654c9f | 2013-12-17 00:20:33 +0100 | [diff] [blame] | 122 | [PAT_MATCH_BIN] = SMP_T_BIN, |
| 123 | [PAT_MATCH_LEN] = SMP_T_STR, |
| 124 | [PAT_MATCH_STR] = SMP_T_STR, |
| 125 | [PAT_MATCH_BEG] = SMP_T_STR, |
| 126 | [PAT_MATCH_SUB] = SMP_T_STR, |
| 127 | [PAT_MATCH_DIR] = SMP_T_STR, |
| 128 | [PAT_MATCH_DOM] = SMP_T_STR, |
| 129 | [PAT_MATCH_END] = SMP_T_STR, |
| 130 | [PAT_MATCH_REG] = SMP_T_STR, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 131 | [PAT_MATCH_REGM] = SMP_T_STR, |
Thierry FOURNIER | e3ded59 | 2013-12-06 15:36:54 +0100 | [diff] [blame] | 132 | }; |
| 133 | |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 134 | /* this struct is used to return information */ |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 135 | static THREAD_LOCAL struct pattern static_pattern; |
| 136 | static THREAD_LOCAL struct sample_data static_sample_data; |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 137 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 138 | /* This is the root of the list of all pattern_ref avalaibles. */ |
| 139 | struct list pattern_reference = LIST_HEAD_INIT(pattern_reference); |
| 140 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 141 | static THREAD_LOCAL struct lru64_head *pat_lru_tree; |
Willy Tarreau | 295a89c | 2021-04-10 17:42:04 +0200 | [diff] [blame] | 142 | static unsigned long long pat_lru_seed __read_mostly; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 143 | |
/*
 *
 * The following functions are not exported; they are used internally by the
 * pattern matching code.
 *
 */
| 150 | |
/* Background: fast way to find a zero byte in a word
 * http://graphics.stanford.edu/~seander/bithacks.html#ZeroInWord
 *   hasZeroByte = (v - 0x01010101UL) & ~v & 0x80808080UL;
 *
 * To look for 4 different byte values at once, xor the word with those bytes
 * and then check for zero bytes:
 *
 *   v = (((unsigned char)c * 0x01010101U) ^ delimiter)
 *
 * where <delimiter> holds the 4 byte values to look for (as an unsigned int)
 * and <c> is the character being tested.
 *
 * Returns non-zero if <c> is equal to one of the 4 bytes packed in <mask>,
 * otherwise zero.
 */
static inline unsigned int is_delimiter(unsigned char c, unsigned int mask)
{
	/* Propagate the char to all 4 bytes. The product is computed on
	 * unsigned operands: with a plain int constant, <c> would be promoted
	 * to int and the multiplication would overflow for c >= 0x80.
	 */
	mask ^= (unsigned int)c * 0x01010101U;
	return (mask - 0x01010101U) & ~mask & 0x80808080U;
}
| 167 | |
/* Packs the four delimiter bytes <d1>..<d4> into a single word, <d1> being
 * the most significant byte and <d4> the least significant one. Each byte is
 * converted to unsigned int before being shifted so that values >= 0x80 in
 * <d1> do not overflow a signed int.
 */
static inline unsigned int make_4delim(unsigned char d1, unsigned char d2, unsigned char d3, unsigned char d4)
{
	return ((unsigned int)d1 << 24) |
	       ((unsigned int)d2 << 16) |
	       ((unsigned int)d3 << 8) |
	       (unsigned int)d4;
}
| 172 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 173 | |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 174 | /* |
| 175 | * |
| 176 | * These functions are exported and may be used by any other component. |
| 177 | * |
Willy Tarreau | 5def8ef | 2014-08-29 15:19:33 +0200 | [diff] [blame] | 178 | * The following functions are used for parsing pattern matching input value. |
| 179 | * The <text> contain the string to be parsed. <pattern> must be a preallocated |
| 180 | * pattern. The pat_parse_* functions fill this structure with the parsed value. |
| 181 | * <err> is filled with an error message built with memprintf() function. It is |
| 182 | * allowed to use a trash as a temporary storage for the returned pattern, as |
| 183 | * the next call after these functions will be pat_idx_*. |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 184 | * |
Willy Tarreau | 5def8ef | 2014-08-29 15:19:33 +0200 | [diff] [blame] | 185 | * In success case, the pat_parse_* function returns 1. If the function |
| 186 | * fails, it returns 0 and <err> is filled. |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 187 | */ |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 188 | |
/* Parser for matching methods which take no pattern value: <text> is ignored
 * and <pattern> is left untouched. Always returns 1 (success).
 */
int pat_parse_nothing(const char *text, struct pattern *pattern, int mflags, char **err)
{
	const int success = 1;

	return success;
}
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 194 | |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 195 | /* Parse a string. It is allocated and duplicated. */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 196 | int pat_parse_str(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 197 | { |
Thierry FOURNIER | 7654c9f | 2013-12-17 00:20:33 +0100 | [diff] [blame] | 198 | pattern->type = SMP_T_STR; |
Thierry FOURNIER | edc15c3 | 2013-12-13 15:36:59 +0100 | [diff] [blame] | 199 | pattern->ptr.str = (char *)text; |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 200 | pattern->len = strlen(text); |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 201 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 202 | } |
| 203 | |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 204 | /* Parse a binary written in hexa. It is allocated. */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 205 | int pat_parse_bin(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 206 | { |
Willy Tarreau | 83061a8 | 2018-07-13 11:56:34 +0200 | [diff] [blame] | 207 | struct buffer *trash; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 208 | |
Thierry FOURNIER | 7654c9f | 2013-12-17 00:20:33 +0100 | [diff] [blame] | 209 | pattern->type = SMP_T_BIN; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 210 | trash = get_trash_chunk(); |
| 211 | pattern->len = trash->size; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 212 | pattern->ptr.str = trash->area; |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 213 | return !!parse_binary(text, &pattern->ptr.str, &pattern->len, err); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 214 | } |
| 215 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 216 | /* Parse a regex. It is allocated. */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 217 | int pat_parse_reg(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 218 | { |
Thierry FOURNIER | 0b6d15f | 2014-01-29 19:35:16 +0100 | [diff] [blame] | 219 | pattern->ptr.str = (char *)text; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 220 | return 1; |
| 221 | } |
| 222 | |
| 223 | /* Parse a range of positive integers delimited by either ':' or '-'. If only |
| 224 | * one integer is read, it is set as both min and max. An operator may be |
| 225 | * specified as the prefix, among this list of 5 : |
| 226 | * |
| 227 | * 0:eq, 1:gt, 2:ge, 3:lt, 4:le |
| 228 | * |
| 229 | * The default operator is "eq". It supports range matching. Ranges are |
| 230 | * rejected for other operators. The operator may be changed at any time. |
| 231 | * The operator is stored in the 'opaque' argument. |
| 232 | * |
| 233 | * If err is non-NULL, an error message will be returned there on errors and |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 234 | * the caller will have to free it. The function returns zero on error, and |
| 235 | * non-zero on success. |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 236 | * |
| 237 | */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 238 | int pat_parse_int(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 239 | { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 240 | const char *ptr = text; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 241 | |
Thierry FOURNIER | 07ee64e | 2015-07-06 23:43:03 +0200 | [diff] [blame] | 242 | pattern->type = SMP_T_SINT; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 243 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 244 | /* Empty string is not valid */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 245 | if (!*text) |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 246 | goto not_valid_range; |
| 247 | |
| 248 | /* Search ':' or '-' separator. */ |
| 249 | while (*ptr != '\0' && *ptr != ':' && *ptr != '-') |
| 250 | ptr++; |
| 251 | |
| 252 | /* If separator not found. */ |
| 253 | if (!*ptr) { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 254 | if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0) { |
| 255 | memprintf(err, "'%s' is not a number", text); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 256 | return 0; |
| 257 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 258 | pattern->val.range.max = pattern->val.range.min; |
| 259 | pattern->val.range.min_set = 1; |
| 260 | pattern->val.range.max_set = 1; |
| 261 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 262 | } |
| 263 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 264 | /* If the separator is the first character. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 265 | if (ptr == text && *(ptr + 1) != '\0') { |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 266 | if (strl2llrc(ptr + 1, strlen(ptr + 1), &pattern->val.range.max) != 0) |
| 267 | goto not_valid_range; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 268 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 269 | pattern->val.range.min_set = 0; |
| 270 | pattern->val.range.max_set = 1; |
| 271 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 272 | } |
| 273 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 274 | /* If separator is the last character. */ |
| 275 | if (*(ptr + 1) == '\0') { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 276 | if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0) |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 277 | goto not_valid_range; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 278 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 279 | pattern->val.range.min_set = 1; |
| 280 | pattern->val.range.max_set = 0; |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 281 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 282 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 283 | |
| 284 | /* Else, parse two numbers. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 285 | if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0) |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 286 | goto not_valid_range; |
| 287 | |
| 288 | if (strl2llrc(ptr + 1, strlen(ptr + 1), &pattern->val.range.max) != 0) |
| 289 | goto not_valid_range; |
| 290 | |
| 291 | if (pattern->val.range.min > pattern->val.range.max) |
| 292 | goto not_valid_range; |
| 293 | |
| 294 | pattern->val.range.min_set = 1; |
| 295 | pattern->val.range.max_set = 1; |
| 296 | return 1; |
| 297 | |
| 298 | not_valid_range: |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 299 | memprintf(err, "'%s' is not a valid number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 300 | return 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 301 | } |
| 302 | |
| 303 | /* Parse a range of positive 2-component versions delimited by either ':' or |
| 304 | * '-'. The version consists in a major and a minor, both of which must be |
| 305 | * smaller than 65536, because internally they will be represented as a 32-bit |
| 306 | * integer. |
| 307 | * If only one version is read, it is set as both min and max. Just like for |
| 308 | * pure integers, an operator may be specified as the prefix, among this list |
| 309 | * of 5 : |
| 310 | * |
| 311 | * 0:eq, 1:gt, 2:ge, 3:lt, 4:le |
| 312 | * |
| 313 | * The default operator is "eq". It supports range matching. Ranges are |
| 314 | * rejected for other operators. The operator may be changed at any time. |
| 315 | * The operator is stored in the 'opaque' argument. This allows constructs |
| 316 | * such as the following one : |
| 317 | * |
| 318 | * acl obsolete_ssl ssl_req_proto lt 3 |
| 319 | * acl unsupported_ssl ssl_req_proto gt 3.1 |
| 320 | * acl valid_ssl ssl_req_proto 3.0-3.1 |
| 321 | * |
| 322 | */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 323 | int pat_parse_dotted_ver(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 324 | { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 325 | const char *ptr = text; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 326 | |
Thierry FOURNIER | 07ee64e | 2015-07-06 23:43:03 +0200 | [diff] [blame] | 327 | pattern->type = SMP_T_SINT; |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 328 | |
| 329 | /* Search ':' or '-' separator. */ |
| 330 | while (*ptr != '\0' && *ptr != ':' && *ptr != '-') |
| 331 | ptr++; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 332 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 333 | /* If separator not found. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 334 | if (*ptr == '\0' && ptr > text) { |
| 335 | if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) { |
| 336 | memprintf(err, "'%s' is not a dotted number", text); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 337 | return 0; |
| 338 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 339 | pattern->val.range.max = pattern->val.range.min; |
| 340 | pattern->val.range.min_set = 1; |
| 341 | pattern->val.range.max_set = 1; |
| 342 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 343 | } |
| 344 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 345 | /* If the separator is the first character. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 346 | if (ptr == text && *(ptr+1) != '\0') { |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 347 | if (strl2llrc_dotted(ptr+1, strlen(ptr+1), &pattern->val.range.max) != 0) { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 348 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 349 | return 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 350 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 351 | pattern->val.range.min_set = 0; |
| 352 | pattern->val.range.max_set = 1; |
| 353 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 354 | } |
| 355 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 356 | /* If separator is the last character. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 357 | if (ptr == &text[strlen(text)-1]) { |
| 358 | if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) { |
| 359 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 360 | return 0; |
| 361 | } |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 362 | pattern->val.range.min_set = 1; |
| 363 | pattern->val.range.max_set = 0; |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 364 | return 1; |
| 365 | } |
| 366 | |
| 367 | /* Else, parse two numbers. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 368 | if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) { |
| 369 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 370 | return 0; |
| 371 | } |
| 372 | if (strl2llrc_dotted(ptr+1, strlen(ptr+1), &pattern->val.range.max) != 0) { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 373 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 374 | return 0; |
| 375 | } |
| 376 | if (pattern->val.range.min > pattern->val.range.max) { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 377 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 378 | return 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 379 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 380 | pattern->val.range.min_set = 1; |
| 381 | pattern->val.range.max_set = 1; |
| 382 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 383 | } |
| 384 | |
| 385 | /* Parse an IP address and an optional mask in the form addr[/mask]. |
| 386 | * The addr may either be an IPv4 address or a hostname. The mask |
| 387 | * may either be a dotted mask or a number of bits. Returns 1 if OK, |
| 388 | * otherwise 0. NOTE: IP address patterns are typed (IPV4/IPV6). |
| 389 | */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 390 | int pat_parse_ip(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 391 | { |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 392 | if (str2net(text, !(mflags & PAT_MF_NO_DNS) && (global.mode & MODE_STARTING), |
Thierry FOURNIER | fc7ac7b | 2014-02-11 15:23:04 +0100 | [diff] [blame] | 393 | &pattern->val.ipv4.addr, &pattern->val.ipv4.mask)) { |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 394 | pattern->type = SMP_T_IPV4; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 395 | return 1; |
| 396 | } |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 397 | else if (str62net(text, &pattern->val.ipv6.addr, &pattern->val.ipv6.mask)) { |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 398 | pattern->type = SMP_T_IPV6; |
| 399 | return 1; |
| 400 | } |
| 401 | else { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 402 | memprintf(err, "'%s' is not a valid IPv4 or IPv6 address", text); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 403 | return 0; |
| 404 | } |
| 405 | } |
| 406 | |
/*
 *
 * These functions are exported and may be used by any other component.
 *
 * Each of these functions takes a sample <smp> and checks whether it matches
 * the pattern expression <expr>. It returns a pointer to a pattern on match,
 * or NULL when nothing matches. When <fill> is set, the returned pattern is
 * filled with information about the match.
 *
 */
| 416 | |
| 417 | /* always return false */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 418 | struct pattern *pat_match_nothing(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 419 | { |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 420 | if (smp->data.u.sint) { |
Thierry FOURNIER | e5978bf | 2014-03-17 19:53:10 +0100 | [diff] [blame] | 421 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 422 | static_pattern.data = NULL; |
Thierry FOURNIER | e5978bf | 2014-03-17 19:53:10 +0100 | [diff] [blame] | 423 | static_pattern.ref = NULL; |
Thierry FOURNIER | e5978bf | 2014-03-17 19:53:10 +0100 | [diff] [blame] | 424 | static_pattern.type = 0; |
| 425 | static_pattern.ptr.str = NULL; |
| 426 | } |
| 427 | return &static_pattern; |
| 428 | } |
| 429 | else |
| 430 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 431 | } |
| 432 | |
| 433 | |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 434 | /* NB: For two strings to be identical, it is required that their length match */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 435 | struct pattern *pat_match_str(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 436 | { |
| 437 | int icase; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 438 | struct ebmb_node *node; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 439 | struct pattern_tree *elt; |
| 440 | struct pattern_list *lst; |
| 441 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 442 | struct pattern *ret = NULL; |
| 443 | struct lru64 *lru = NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 444 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 445 | /* Lookup a string in the expression's pattern tree. */ |
| 446 | if (!eb_is_empty(&expr->pattern_tree)) { |
Christopher Faulet | b4cf7ab | 2020-06-30 18:52:32 +0200 | [diff] [blame] | 447 | char prev = 0; |
| 448 | |
| 449 | if (smp->data.u.str.data < smp->data.u.str.size) { |
| 450 | /* we may have to force a trailing zero on the test pattern and |
Thierry Fournier | a68affe | 2020-11-10 20:51:36 +0100 | [diff] [blame] | 451 | * the buffer is large enough to accommodate it. If the flag |
| 452 | * CONST is set, duplicate the string |
Christopher Faulet | b4cf7ab | 2020-06-30 18:52:32 +0200 | [diff] [blame] | 453 | */ |
| 454 | prev = smp->data.u.str.area[smp->data.u.str.data]; |
Thierry Fournier | a68affe | 2020-11-10 20:51:36 +0100 | [diff] [blame] | 455 | if (prev) { |
| 456 | if (smp->flags & SMP_F_CONST) { |
| 457 | if (!smp_dup(smp)) |
| 458 | return NULL; |
| 459 | } else { |
| 460 | smp->data.u.str.area[smp->data.u.str.data] = '\0'; |
| 461 | } |
| 462 | } |
Christopher Faulet | b4cf7ab | 2020-06-30 18:52:32 +0200 | [diff] [blame] | 463 | } |
| 464 | else { |
| 465 | /* Otherwise, the sample is duplicated. A trailing zero |
| 466 | * is automatically added to the string. |
| 467 | */ |
| 468 | if (!smp_dup(smp)) |
| 469 | return NULL; |
| 470 | } |
| 471 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 472 | node = ebst_lookup(&expr->pattern_tree, smp->data.u.str.area); |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 473 | if (prev) |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 474 | smp->data.u.str.area[smp->data.u.str.data] = prev; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 475 | |
| 476 | while (node) { |
| 477 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 478 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
Willy Tarreau | 51d38a2 | 2022-08-01 11:46:27 +0200 | [diff] [blame] | 479 | node = ebmb_next_dup(node); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 480 | continue; |
| 481 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 482 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 483 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 484 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 485 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 486 | static_pattern.type = SMP_T_STR; |
| 487 | static_pattern.ptr.str = (char *)elt->node.key; |
| 488 | } |
| 489 | return &static_pattern; |
| 490 | } |
| 491 | } |
| 492 | |
| 493 | /* look in the list */ |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 494 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 495 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 496 | |
Dragan Dosen | 967e7e7 | 2020-12-22 13:22:34 +0100 | [diff] [blame] | 497 | lru = lru64_get(XXH3(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 498 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 499 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 500 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 501 | return ret; |
| 502 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 503 | } |
| 504 | |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 505 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 506 | list_for_each_entry(lst, &expr->patterns, list) { |
| 507 | pattern = &lst->pat; |
| 508 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 509 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 510 | continue; |
| 511 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 512 | if (pattern->len != smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 513 | continue; |
| 514 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 515 | icase = expr->mflags & PAT_MF_IGNORE_CASE; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 516 | if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0) || |
| 517 | (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0)) { |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 518 | ret = pattern; |
| 519 | break; |
| 520 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 521 | } |
| 522 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 523 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 524 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 525 | |
| 526 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 527 | } |
| 528 | |
| 529 | /* NB: For two binaries buf to be identical, it is required that their lengths match */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 530 | struct pattern *pat_match_bin(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 531 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 532 | struct pattern_list *lst; |
| 533 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 534 | struct pattern *ret = NULL; |
| 535 | struct lru64 *lru = NULL; |
| 536 | |
| 537 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 538 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 539 | |
Dragan Dosen | 967e7e7 | 2020-12-22 13:22:34 +0100 | [diff] [blame] | 540 | lru = lru64_get(XXH3(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 541 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 542 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 543 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 544 | return ret; |
| 545 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 546 | } |
| 547 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 548 | list_for_each_entry(lst, &expr->patterns, list) { |
| 549 | pattern = &lst->pat; |
| 550 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 551 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 552 | continue; |
| 553 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 554 | if (pattern->len != smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 555 | continue; |
| 556 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 557 | if (memcmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0) { |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 558 | ret = pattern; |
| 559 | break; |
| 560 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 561 | } |
| 562 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 563 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 564 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 565 | |
| 566 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 567 | } |
| 568 | |
| 569 | /* Executes a regex. It temporarily changes the data to add a trailing zero, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 570 | * and restores the previous character when leaving. This function fills |
| 571 | * a matching array. |
| 572 | */ |
| 573 | struct pattern *pat_match_regm(struct sample *smp, struct pattern_expr *expr, int fill) |
| 574 | { |
| 575 | struct pattern_list *lst; |
| 576 | struct pattern *pattern; |
| 577 | struct pattern *ret = NULL; |
| 578 | |
| 579 | list_for_each_entry(lst, &expr->patterns, list) { |
| 580 | pattern = &lst->pat; |
| 581 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 582 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 583 | continue; |
| 584 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 585 | if (regex_exec_match2(pattern->ptr.reg, smp->data.u.str.area, smp->data.u.str.data, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 586 | MAX_MATCH, pmatch, 0)) { |
| 587 | ret = pattern; |
| 588 | smp->ctx.a[0] = pmatch; |
| 589 | break; |
| 590 | } |
| 591 | } |
| 592 | |
| 593 | return ret; |
| 594 | } |
| 595 | |
| 596 | /* Executes a regex. It temporarily changes the data to add a trailing zero, |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 597 | * and restores the previous character when leaving. |
| 598 | */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 599 | struct pattern *pat_match_reg(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 600 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 601 | struct pattern_list *lst; |
| 602 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 603 | struct pattern *ret = NULL; |
| 604 | struct lru64 *lru = NULL; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 605 | |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 606 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 607 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 608 | |
Dragan Dosen | 967e7e7 | 2020-12-22 13:22:34 +0100 | [diff] [blame] | 609 | lru = lru64_get(XXH3(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 610 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 611 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 612 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 613 | return ret; |
| 614 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 615 | } |
| 616 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 617 | list_for_each_entry(lst, &expr->patterns, list) { |
| 618 | pattern = &lst->pat; |
| 619 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 620 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 621 | continue; |
| 622 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 623 | if (regex_exec2(pattern->ptr.reg, smp->data.u.str.area, smp->data.u.str.data)) { |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 624 | ret = pattern; |
| 625 | break; |
| 626 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 627 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 628 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 629 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 630 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 631 | |
| 632 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 633 | } |
| 634 | |
| 635 | /* Checks that the pattern matches the beginning of the tested string. */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 636 | struct pattern *pat_match_beg(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 637 | { |
| 638 | int icase; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 639 | struct ebmb_node *node; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 640 | struct pattern_tree *elt; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 641 | struct pattern_list *lst; |
| 642 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 643 | struct pattern *ret = NULL; |
| 644 | struct lru64 *lru = NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 645 | |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 646 | /* Lookup a string in the expression's pattern tree. */ |
| 647 | if (!eb_is_empty(&expr->pattern_tree)) { |
Christopher Faulet | b4cf7ab | 2020-06-30 18:52:32 +0200 | [diff] [blame] | 648 | char prev = 0; |
| 649 | |
| 650 | if (smp->data.u.str.data < smp->data.u.str.size) { |
| 651 | /* we may have to force a trailing zero on the test pattern and |
| 652 | * the buffer is large enough to accommodate it. |
| 653 | */ |
| 654 | prev = smp->data.u.str.area[smp->data.u.str.data]; |
| 655 | if (prev) |
| 656 | smp->data.u.str.area[smp->data.u.str.data] = '\0'; |
| 657 | } |
| 658 | else { |
| 659 | /* Otherwise, the sample is duplicated. A trailing zero |
| 660 | * is automatically added to the string. |
| 661 | */ |
| 662 | if (!smp_dup(smp)) |
| 663 | return NULL; |
| 664 | } |
| 665 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 666 | node = ebmb_lookup_longest(&expr->pattern_tree, |
| 667 | smp->data.u.str.area); |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 668 | if (prev) |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 669 | smp->data.u.str.area[smp->data.u.str.data] = prev; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 670 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 671 | while (node) { |
| 672 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 673 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
Willy Tarreau | 51d38a2 | 2022-08-01 11:46:27 +0200 | [diff] [blame] | 674 | node = ebmb_lookup_shorter(node); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 675 | continue; |
| 676 | } |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 677 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 678 | static_pattern.data = elt->data; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 679 | static_pattern.ref = elt->ref; |
| 680 | static_pattern.sflags = PAT_SF_TREE; |
| 681 | static_pattern.type = SMP_T_STR; |
| 682 | static_pattern.ptr.str = (char *)elt->node.key; |
| 683 | } |
| 684 | return &static_pattern; |
| 685 | } |
| 686 | } |
| 687 | |
| 688 | /* look in the list */ |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 689 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 690 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 691 | |
Dragan Dosen | 967e7e7 | 2020-12-22 13:22:34 +0100 | [diff] [blame] | 692 | lru = lru64_get(XXH3(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 693 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 694 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 695 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 696 | return ret; |
| 697 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 698 | } |
| 699 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 700 | list_for_each_entry(lst, &expr->patterns, list) { |
| 701 | pattern = &lst->pat; |
| 702 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 703 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 704 | continue; |
| 705 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 706 | if (pattern->len > smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 707 | continue; |
| 708 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 709 | icase = expr->mflags & PAT_MF_IGNORE_CASE; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 710 | if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area, pattern->len) != 0) || |
| 711 | (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area, pattern->len) != 0)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 712 | continue; |
| 713 | |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 714 | ret = pattern; |
| 715 | break; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 716 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 717 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 718 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 719 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 720 | |
| 721 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 722 | } |
| 723 | |
| 724 | /* Checks that the pattern matches the end of the tested string. */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 725 | struct pattern *pat_match_end(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 726 | { |
| 727 | int icase; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 728 | struct pattern_list *lst; |
| 729 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 730 | struct pattern *ret = NULL; |
| 731 | struct lru64 *lru = NULL; |
| 732 | |
| 733 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 734 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 735 | |
Dragan Dosen | 967e7e7 | 2020-12-22 13:22:34 +0100 | [diff] [blame] | 736 | lru = lru64_get(XXH3(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 737 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 738 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 739 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 740 | return ret; |
| 741 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 742 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 743 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 744 | list_for_each_entry(lst, &expr->patterns, list) { |
| 745 | pattern = &lst->pat; |
| 746 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 747 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 748 | continue; |
| 749 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 750 | if (pattern->len > smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 751 | continue; |
| 752 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 753 | icase = expr->mflags & PAT_MF_IGNORE_CASE; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 754 | if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area + smp->data.u.str.data - pattern->len, pattern->len) != 0) || |
| 755 | (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area + smp->data.u.str.data - pattern->len, pattern->len) != 0)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 756 | continue; |
| 757 | |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 758 | ret = pattern; |
| 759 | break; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 760 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 761 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 762 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 763 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 764 | |
| 765 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 766 | } |
| 767 | |
| 768 | /* Checks that the pattern is included inside the tested string. |
| 769 | * NB: Suboptimal, should be rewritten using a Boyer-Moore method. |
| 770 | */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 771 | struct pattern *pat_match_sub(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 772 | { |
| 773 | int icase; |
| 774 | char *end; |
| 775 | char *c; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 776 | struct pattern_list *lst; |
| 777 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 778 | struct pattern *ret = NULL; |
| 779 | struct lru64 *lru = NULL; |
| 780 | |
| 781 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 782 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 783 | |
Dragan Dosen | 967e7e7 | 2020-12-22 13:22:34 +0100 | [diff] [blame] | 784 | lru = lru64_get(XXH3(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 785 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 786 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 787 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 788 | return ret; |
| 789 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 790 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 791 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 792 | list_for_each_entry(lst, &expr->patterns, list) { |
| 793 | pattern = &lst->pat; |
| 794 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 795 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 796 | continue; |
| 797 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 798 | if (pattern->len > smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 799 | continue; |
| 800 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 801 | end = smp->data.u.str.area + smp->data.u.str.data - pattern->len; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 802 | icase = expr->mflags & PAT_MF_IGNORE_CASE; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 803 | if (icase) { |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 804 | for (c = smp->data.u.str.area; c <= end; c++) { |
Willy Tarreau | f278eec | 2020-07-05 21:46:32 +0200 | [diff] [blame] | 805 | if (tolower((unsigned char)*c) != tolower((unsigned char)*pattern->ptr.str)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 806 | continue; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 807 | if (strncasecmp(pattern->ptr.str, c, pattern->len) == 0) { |
| 808 | ret = pattern; |
| 809 | goto leave; |
| 810 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 811 | } |
| 812 | } else { |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 813 | for (c = smp->data.u.str.area; c <= end; c++) { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 814 | if (*c != *pattern->ptr.str) |
| 815 | continue; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 816 | if (strncmp(pattern->ptr.str, c, pattern->len) == 0) { |
| 817 | ret = pattern; |
| 818 | goto leave; |
| 819 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 820 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 821 | } |
| 822 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 823 | leave: |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 824 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 825 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 826 | |
| 827 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 828 | } |
| 829 | |
| 830 | /* This one is used by other real functions. It checks that the pattern is |
| 831 | * included inside the tested string, but enclosed between the specified |
| 832 | * delimiters or at the beginning or end of the string. The delimiters are |
| 833 | * provided as an unsigned int made by make_4delim() and match up to 4 different |
| 834 | * delimiters. Delimiters are stripped at the beginning and end of the pattern. |
| 835 | */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 836 | static int match_word(struct sample *smp, struct pattern *pattern, int mflags, unsigned int delimiters) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 837 | { |
| 838 | int may_match, icase; |
| 839 | char *c, *end; |
| 840 | char *ps; |
| 841 | int pl; |
| 842 | |
| 843 | pl = pattern->len; |
| 844 | ps = pattern->ptr.str; |
| 845 | |
| 846 | while (pl > 0 && is_delimiter(*ps, delimiters)) { |
| 847 | pl--; |
| 848 | ps++; |
| 849 | } |
| 850 | |
| 851 | while (pl > 0 && is_delimiter(ps[pl - 1], delimiters)) |
| 852 | pl--; |
| 853 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 854 | if (pl > smp->data.u.str.data) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 855 | return PAT_NOMATCH; |
| 856 | |
| 857 | may_match = 1; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 858 | icase = mflags & PAT_MF_IGNORE_CASE; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 859 | end = smp->data.u.str.area + smp->data.u.str.data - pl; |
| 860 | for (c = smp->data.u.str.area; c <= end; c++) { |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 861 | if (is_delimiter(*c, delimiters)) { |
| 862 | may_match = 1; |
| 863 | continue; |
| 864 | } |
| 865 | |
| 866 | if (!may_match) |
| 867 | continue; |
| 868 | |
| 869 | if (icase) { |
Willy Tarreau | f278eec | 2020-07-05 21:46:32 +0200 | [diff] [blame] | 870 | if ((tolower((unsigned char)*c) == tolower((unsigned char)*ps)) && |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 871 | (strncasecmp(ps, c, pl) == 0) && |
| 872 | (c == end || is_delimiter(c[pl], delimiters))) |
| 873 | return PAT_MATCH; |
| 874 | } else { |
| 875 | if ((*c == *ps) && |
| 876 | (strncmp(ps, c, pl) == 0) && |
| 877 | (c == end || is_delimiter(c[pl], delimiters))) |
| 878 | return PAT_MATCH; |
| 879 | } |
| 880 | may_match = 0; |
| 881 | } |
| 882 | return PAT_NOMATCH; |
| 883 | } |
| 884 | |
| 885 | /* Checks that the pattern is included inside the tested string, but enclosed |
| 886 | * between the delimiters '?' or '/' or at the beginning or end of the string. |
| 887 | * Delimiters at the beginning or end of the pattern are ignored. |
| 888 | */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 889 | struct pattern *pat_match_dir(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 890 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 891 | struct pattern_list *lst; |
| 892 | struct pattern *pattern; |
| 893 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 894 | list_for_each_entry(lst, &expr->patterns, list) { |
| 895 | pattern = &lst->pat; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 896 | |
| 897 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 898 | continue; |
| 899 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 900 | if (match_word(smp, pattern, expr->mflags, make_4delim('/', '?', '?', '?'))) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 901 | return pattern; |
| 902 | } |
| 903 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 904 | } |
| 905 | |
| 906 | /* Checks that the pattern is included inside the tested string, but enclosed |
| 907 | * between the delmiters '/', '?', '.' or ":" or at the beginning or end of |
| 908 | * the string. Delimiters at the beginning or end of the pattern are ignored. |
| 909 | */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 910 | struct pattern *pat_match_dom(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 911 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 912 | struct pattern_list *lst; |
| 913 | struct pattern *pattern; |
| 914 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 915 | list_for_each_entry(lst, &expr->patterns, list) { |
| 916 | pattern = &lst->pat; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 917 | |
| 918 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 919 | continue; |
| 920 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 921 | if (match_word(smp, pattern, expr->mflags, make_4delim('/', '?', '.', ':'))) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 922 | return pattern; |
| 923 | } |
| 924 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 925 | } |
| 926 | |
| 927 | /* Checks that the integer in <test> is included between min and max */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 928 | struct pattern *pat_match_int(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 929 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 930 | struct pattern_list *lst; |
| 931 | struct pattern *pattern; |
| 932 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 933 | list_for_each_entry(lst, &expr->patterns, list) { |
| 934 | pattern = &lst->pat; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 935 | |
| 936 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 937 | continue; |
| 938 | |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 939 | if ((!pattern->val.range.min_set || pattern->val.range.min <= smp->data.u.sint) && |
| 940 | (!pattern->val.range.max_set || smp->data.u.sint <= pattern->val.range.max)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 941 | return pattern; |
| 942 | } |
| 943 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 944 | } |
| 945 | |
| 946 | /* Checks that the length of the pattern in <test> is included between min and max */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 947 | struct pattern *pat_match_len(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 948 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 949 | struct pattern_list *lst; |
| 950 | struct pattern *pattern; |
| 951 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 952 | list_for_each_entry(lst, &expr->patterns, list) { |
| 953 | pattern = &lst->pat; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 954 | |
| 955 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 956 | continue; |
| 957 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 958 | if ((!pattern->val.range.min_set || pattern->val.range.min <= smp->data.u.str.data) && |
| 959 | (!pattern->val.range.max_set || smp->data.u.str.data <= pattern->val.range.max)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 960 | return pattern; |
| 961 | } |
| 962 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 963 | } |
| 964 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 965 | struct pattern *pat_match_ip(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 966 | { |
| 967 | unsigned int v4; /* in network byte order */ |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 968 | struct in6_addr tmp6; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 969 | struct in_addr *s; |
| 970 | struct ebmb_node *node; |
| 971 | struct pattern_tree *elt; |
| 972 | struct pattern_list *lst; |
| 973 | struct pattern *pattern; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 974 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 975 | /* The input sample is IPv4. Try to match in the trees. */ |
Thierry FOURNIER | 8c542ca | 2015-08-19 09:00:18 +0200 | [diff] [blame] | 976 | if (smp->data.type == SMP_T_IPV4) { |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 977 | /* Lookup an IPv4 address in the expression's pattern tree using |
| 978 | * the longest match method. |
| 979 | */ |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 980 | s = &smp->data.u.ipv4; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 981 | node = ebmb_lookup_longest(&expr->pattern_tree, &s->s_addr); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 982 | while (node) { |
| 983 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 984 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
Willy Tarreau | 51d38a2 | 2022-08-01 11:46:27 +0200 | [diff] [blame] | 985 | node = ebmb_lookup_shorter(node); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 986 | continue; |
| 987 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 988 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 989 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 990 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 991 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 992 | static_pattern.type = SMP_T_IPV4; |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 993 | static_pattern.val.ipv4.addr.s_addr = read_u32(elt->node.key); |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 994 | if (!cidr2dotted(elt->node.node.pfx, &static_pattern.val.ipv4.mask)) |
| 995 | return NULL; |
| 996 | } |
| 997 | return &static_pattern; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 998 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 999 | |
Thayne McCombs | 8f0cc5c | 2021-01-07 21:35:52 -0700 | [diff] [blame] | 1000 | /* The IPv4 sample don't match the IPv4 tree. Convert the IPv4 |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1001 | * sample address to IPv6 with the mapping method using the ::ffff: |
| 1002 | * prefix, and try to lookup in the IPv6 tree. |
| 1003 | */ |
| 1004 | memset(&tmp6, 0, 10); |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1005 | write_u16(&tmp6.s6_addr[10], htons(0xffff)); |
| 1006 | write_u32(&tmp6.s6_addr[12], smp->data.u.ipv4.s_addr); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1007 | node = ebmb_lookup_longest(&expr->pattern_tree_2, &tmp6); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1008 | while (node) { |
| 1009 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 1010 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
Willy Tarreau | 51d38a2 | 2022-08-01 11:46:27 +0200 | [diff] [blame] | 1011 | node = ebmb_lookup_shorter(node); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1012 | continue; |
| 1013 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1014 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1015 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1016 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1017 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1018 | static_pattern.type = SMP_T_IPV6; |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1019 | memcpy(&static_pattern.val.ipv6.addr, elt->node.key, 16); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1020 | static_pattern.val.ipv6.mask = elt->node.node.pfx; |
| 1021 | } |
| 1022 | return &static_pattern; |
| 1023 | } |
| 1024 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1025 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1026 | /* The input sample is IPv6. Try to match in the trees. */ |
Thierry FOURNIER | 8c542ca | 2015-08-19 09:00:18 +0200 | [diff] [blame] | 1027 | if (smp->data.type == SMP_T_IPV6) { |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1028 | /* Lookup an IPv6 address in the expression's pattern tree using |
| 1029 | * the longest match method. |
| 1030 | */ |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 1031 | node = ebmb_lookup_longest(&expr->pattern_tree_2, &smp->data.u.ipv6); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1032 | while (node) { |
| 1033 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 1034 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
Willy Tarreau | 51d38a2 | 2022-08-01 11:46:27 +0200 | [diff] [blame] | 1035 | node = ebmb_lookup_shorter(node); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1036 | continue; |
| 1037 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1038 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1039 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1040 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1041 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1042 | static_pattern.type = SMP_T_IPV6; |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1043 | memcpy(&static_pattern.val.ipv6.addr, elt->node.key, 16); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1044 | static_pattern.val.ipv6.mask = elt->node.node.pfx; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1045 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1046 | return &static_pattern; |
| 1047 | } |
| 1048 | |
| 1049 | /* Try to convert 6 to 4 when the start of the ipv6 address match the |
| 1050 | * following forms : |
| 1051 | * - ::ffff:ip:v4 (ipv4 mapped) |
| 1052 | * - ::0000:ip:v4 (old ipv4 mapped) |
| 1053 | * - 2002:ip:v4:: (6to4) |
| 1054 | */ |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1055 | if ((read_u64(&smp->data.u.ipv6.s6_addr[0]) == 0 && |
| 1056 | (read_u32(&smp->data.u.ipv6.s6_addr[8]) == 0 || |
| 1057 | read_u32(&smp->data.u.ipv6.s6_addr[8]) == htonl(0xFFFF))) || |
| 1058 | read_u16(&smp->data.u.ipv6.s6_addr[0]) == htons(0x2002)) { |
| 1059 | if (read_u32(&smp->data.u.ipv6.s6_addr[0]) == 0) |
| 1060 | v4 = read_u32(&smp->data.u.ipv6.s6_addr[12]); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1061 | else |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1062 | v4 = htonl((ntohs(read_u16(&smp->data.u.ipv6.s6_addr[2])) << 16) + |
| 1063 | ntohs(read_u16(&smp->data.u.ipv6.s6_addr[4]))); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1064 | |
| 1065 | /* Lookup an IPv4 address in the expression's pattern tree using the longest |
| 1066 | * match method. |
| 1067 | */ |
| 1068 | node = ebmb_lookup_longest(&expr->pattern_tree, &v4); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1069 | while (node) { |
| 1070 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 1071 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
Willy Tarreau | 51d38a2 | 2022-08-01 11:46:27 +0200 | [diff] [blame] | 1072 | node = ebmb_lookup_shorter(node); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1073 | continue; |
| 1074 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1075 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1076 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1077 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1078 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1079 | static_pattern.type = SMP_T_IPV4; |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1080 | static_pattern.val.ipv4.addr.s_addr = read_u32(elt->node.key); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1081 | if (!cidr2dotted(elt->node.node.pfx, &static_pattern.val.ipv4.mask)) |
| 1082 | return NULL; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1083 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1084 | return &static_pattern; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1085 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1086 | } |
| 1087 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1088 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1089 | /* Lookup in the list. the list contain only IPv4 patterns */ |
| 1090 | list_for_each_entry(lst, &expr->patterns, list) { |
| 1091 | pattern = &lst->pat; |
| 1092 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1093 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 1094 | continue; |
| 1095 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1096 | /* The input sample is IPv4, use it as is. */ |
Thierry FOURNIER | 8c542ca | 2015-08-19 09:00:18 +0200 | [diff] [blame] | 1097 | if (smp->data.type == SMP_T_IPV4) { |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 1098 | v4 = smp->data.u.ipv4.s_addr; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1099 | } |
Thierry FOURNIER | 8c542ca | 2015-08-19 09:00:18 +0200 | [diff] [blame] | 1100 | else if (smp->data.type == SMP_T_IPV6) { |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1101 | /* v4 match on a V6 sample. We want to check at least for |
| 1102 | * the following forms : |
| 1103 | * - ::ffff:ip:v4 (ipv4 mapped) |
| 1104 | * - ::0000:ip:v4 (old ipv4 mapped) |
| 1105 | * - 2002:ip:v4:: (6to4) |
| 1106 | */ |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1107 | if (read_u64(&smp->data.u.ipv6.s6_addr[0]) == 0 && |
| 1108 | (read_u32(&smp->data.u.ipv6.s6_addr[8]) == 0 || |
| 1109 | read_u32(&smp->data.u.ipv6.s6_addr[8]) == htonl(0xFFFF))) { |
| 1110 | v4 = read_u32(&smp->data.u.ipv6.s6_addr[12]); |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1111 | } |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1112 | else if (read_u16(&smp->data.u.ipv6.s6_addr[0]) == htons(0x2002)) { |
| 1113 | v4 = htonl((ntohs(read_u16(&smp->data.u.ipv6.s6_addr[2])) << 16) + |
| 1114 | ntohs(read_u16(&smp->data.u.ipv6.s6_addr[4]))); |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1115 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1116 | else |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1117 | continue; |
Andreas Seltenreich | f065319 | 2016-03-03 20:08:35 +0100 | [diff] [blame] | 1118 | } else { |
| 1119 | /* impossible */ |
| 1120 | continue; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1121 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1122 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1123 | /* Check if the input sample match the current pattern. */ |
| 1124 | if (((v4 ^ pattern->val.ipv4.addr.s_addr) & pattern->val.ipv4.mask.s_addr) == 0) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1125 | return pattern; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1126 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1127 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1128 | } |
| 1129 | |
/* Walks the chain of links starting at <head> and, when a link is found
 * pointing to <list>, makes it point to what <list> itself points to, which
 * removes <list> from the chain. Nothing is done if <list> is not found.
 * This is made for use for pattern removal within an expression.
 */
static void pat_unlink_from_head(void **head, void **list)
{
	void **link;

	for (link = head; *link; link = *link) {
		if (*link != list)
			continue;

		/* bypass <list> and stop at the first occurrence */
		*link = *list;
		return;
	}
}
| 1143 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1144 | void free_pattern_tree(struct eb_root *root) |
| 1145 | { |
| 1146 | struct eb_node *node, *next; |
Thierry FOURNIER | e1bcac5 | 2013-12-13 16:09:50 +0100 | [diff] [blame] | 1147 | struct pattern_tree *elt; |
Thierry FOURNIER | 3ce88c7 | 2013-12-09 11:29:46 +0100 | [diff] [blame] | 1148 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1149 | node = eb_first(root); |
| 1150 | while (node) { |
| 1151 | next = eb_next(node); |
| 1152 | eb_delete(node); |
Thierry FOURNIER | e1bcac5 | 2013-12-13 16:09:50 +0100 | [diff] [blame] | 1153 | elt = container_of(node, struct pattern_tree, node); |
Willy Tarreau | 867a8a5 | 2020-11-03 11:22:04 +0100 | [diff] [blame] | 1154 | pat_unlink_from_head(&elt->ref->tree_head, &elt->from_ref); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1155 | free(elt->data); |
Thierry FOURNIER | 3ce88c7 | 2013-12-09 11:29:46 +0100 | [diff] [blame] | 1156 | free(elt); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1157 | node = next; |
| 1158 | } |
| 1159 | } |
| 1160 | |
Willy Tarreau | 6d8a689 | 2020-11-02 19:26:02 +0100 | [diff] [blame] | 1161 | void pat_prune_gen(struct pattern_expr *expr) |
Thierry FOURNIER | d163e1c | 2013-11-28 11:41:23 +0100 | [diff] [blame] | 1162 | { |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 1163 | struct pattern_list *pat, *tmp; |
| 1164 | |
| 1165 | list_for_each_entry_safe(pat, tmp, &expr->patterns, list) { |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1166 | LIST_DELETE(&pat->list); |
Willy Tarreau | 867a8a5 | 2020-11-03 11:22:04 +0100 | [diff] [blame] | 1167 | pat_unlink_from_head(&pat->pat.ref->list_head, &pat->from_ref); |
Willy Tarreau | 6d8a689 | 2020-11-02 19:26:02 +0100 | [diff] [blame] | 1168 | if (pat->pat.sflags & PAT_SF_REGFREE) |
| 1169 | regex_free(pat->pat.ptr.ptr); |
| 1170 | else |
| 1171 | free(pat->pat.ptr.ptr); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1172 | free(pat->pat.data); |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 1173 | free(pat); |
| 1174 | } |
| 1175 | |
Thierry FOURNIER | d163e1c | 2013-11-28 11:41:23 +0100 | [diff] [blame] | 1176 | free_pattern_tree(&expr->pattern_tree); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1177 | free_pattern_tree(&expr->pattern_tree_2); |
Thierry FOURNIER | d163e1c | 2013-11-28 11:41:23 +0100 | [diff] [blame] | 1178 | LIST_INIT(&expr->patterns); |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1179 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1180 | expr->ref->entry_cnt = 0; |
Thierry FOURNIER | d163e1c | 2013-11-28 11:41:23 +0100 | [diff] [blame] | 1181 | } |
| 1182 | |
/*
 *
 * The following functions are used for pattern indexing
 *
 */
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1188 | |
| 1189 | int pat_idx_list_val(struct pattern_expr *expr, struct pattern *pat, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1190 | { |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1191 | struct pattern_list *patl; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1192 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1193 | /* allocate pattern */ |
| 1194 | patl = calloc(1, sizeof(*patl)); |
| 1195 | if (!patl) { |
| 1196 | memprintf(err, "out of memory while indexing pattern"); |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1197 | return 0; |
| 1198 | } |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1199 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1200 | /* duplicate pattern */ |
| 1201 | memcpy(&patl->pat, pat, sizeof(*pat)); |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1202 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1203 | /* chain pattern in the expression */ |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1204 | LIST_APPEND(&expr->patterns, &patl->list); |
Willy Tarreau | 4bdd0a1 | 2020-11-02 12:10:48 +0100 | [diff] [blame] | 1205 | /* and from the reference */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1206 | patl->from_ref = pat->ref->list_head; |
| 1207 | pat->ref->list_head = &patl->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1208 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1209 | expr->ref->entry_cnt++; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1210 | |
| 1211 | /* that's ok */ |
| 1212 | return 1; |
| 1213 | } |
| 1214 | |
| 1215 | int pat_idx_list_ptr(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1216 | { |
| 1217 | struct pattern_list *patl; |
| 1218 | |
| 1219 | /* allocate pattern */ |
| 1220 | patl = calloc(1, sizeof(*patl)); |
Thierry FOURNIER | 8aa8384 | 2015-02-06 17:50:55 +0100 | [diff] [blame] | 1221 | if (!patl) { |
| 1222 | memprintf(err, "out of memory while indexing pattern"); |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1223 | return 0; |
Thierry FOURNIER | 8aa8384 | 2015-02-06 17:50:55 +0100 | [diff] [blame] | 1224 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1225 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1226 | /* duplicate pattern */ |
| 1227 | memcpy(&patl->pat, pat, sizeof(*pat)); |
| 1228 | patl->pat.ptr.ptr = malloc(patl->pat.len); |
| 1229 | if (!patl->pat.ptr.ptr) { |
| 1230 | free(patl); |
| 1231 | memprintf(err, "out of memory while indexing pattern"); |
| 1232 | return 0; |
| 1233 | } |
| 1234 | memcpy(patl->pat.ptr.ptr, pat->ptr.ptr, pat->len); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1235 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1236 | /* chain pattern in the expression */ |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1237 | LIST_APPEND(&expr->patterns, &patl->list); |
Willy Tarreau | 4bdd0a1 | 2020-11-02 12:10:48 +0100 | [diff] [blame] | 1238 | /* and from the reference */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1239 | patl->from_ref = pat->ref->list_head; |
| 1240 | pat->ref->list_head = &patl->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1241 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1242 | expr->ref->entry_cnt++; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1243 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1244 | /* that's ok */ |
| 1245 | return 1; |
| 1246 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1247 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1248 | int pat_idx_list_str(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1249 | { |
| 1250 | struct pattern_list *patl; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1251 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1252 | /* allocate pattern */ |
| 1253 | patl = calloc(1, sizeof(*patl)); |
| 1254 | if (!patl) { |
| 1255 | memprintf(err, "out of memory while indexing pattern"); |
| 1256 | return 0; |
| 1257 | } |
| 1258 | |
| 1259 | /* duplicate pattern */ |
| 1260 | memcpy(&patl->pat, pat, sizeof(*pat)); |
| 1261 | patl->pat.ptr.str = malloc(patl->pat.len + 1); |
| 1262 | if (!patl->pat.ptr.str) { |
| 1263 | free(patl); |
| 1264 | memprintf(err, "out of memory while indexing pattern"); |
| 1265 | return 0; |
| 1266 | } |
| 1267 | memcpy(patl->pat.ptr.ptr, pat->ptr.ptr, pat->len); |
| 1268 | patl->pat.ptr.str[patl->pat.len] = '\0'; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1269 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1270 | /* chain pattern in the expression */ |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1271 | LIST_APPEND(&expr->patterns, &patl->list); |
Willy Tarreau | 4bdd0a1 | 2020-11-02 12:10:48 +0100 | [diff] [blame] | 1272 | /* and from the reference */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1273 | patl->from_ref = pat->ref->list_head; |
| 1274 | pat->ref->list_head = &patl->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1275 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1276 | expr->ref->entry_cnt++; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1277 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1278 | /* that's ok */ |
| 1279 | return 1; |
| 1280 | } |
| 1281 | |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 1282 | int pat_idx_list_reg_cap(struct pattern_expr *expr, struct pattern *pat, int cap, char **err) |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1283 | { |
| 1284 | struct pattern_list *patl; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1285 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1286 | /* allocate pattern */ |
| 1287 | patl = calloc(1, sizeof(*patl)); |
| 1288 | if (!patl) { |
| 1289 | memprintf(err, "out of memory while indexing pattern"); |
| 1290 | return 0; |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1291 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1292 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1293 | /* duplicate pattern */ |
| 1294 | memcpy(&patl->pat, pat, sizeof(*pat)); |
| 1295 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1296 | /* compile regex */ |
Willy Tarreau | 9b5c8bb | 2020-11-02 19:16:23 +0100 | [diff] [blame] | 1297 | patl->pat.sflags |= PAT_SF_REGFREE; |
Dragan Dosen | 2674303 | 2019-04-30 15:54:36 +0200 | [diff] [blame] | 1298 | if (!(patl->pat.ptr.reg = regex_comp(pat->ptr.str, !(expr->mflags & PAT_MF_IGNORE_CASE), |
| 1299 | cap, err))) { |
Dirkjan Bussink | 07fcaaa | 2014-04-28 22:57:16 +0000 | [diff] [blame] | 1300 | free(patl); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1301 | return 0; |
| 1302 | } |
| 1303 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1304 | /* chain pattern in the expression */ |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1305 | LIST_APPEND(&expr->patterns, &patl->list); |
Willy Tarreau | 4bdd0a1 | 2020-11-02 12:10:48 +0100 | [diff] [blame] | 1306 | /* and from the reference */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1307 | patl->from_ref = pat->ref->list_head; |
| 1308 | pat->ref->list_head = &patl->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1309 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1310 | expr->ref->entry_cnt++; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1311 | |
| 1312 | /* that's ok */ |
| 1313 | return 1; |
| 1314 | } |
| 1315 | |
/* Indexes the regex pattern <pat> in <expr> by calling pat_idx_list_reg_cap()
 * with <cap> set to 0. Returns what that function returns.
 */
int pat_idx_list_reg(struct pattern_expr *expr, struct pattern *pat, char **err)
{
	const int cap = 0;

	return pat_idx_list_reg_cap(expr, pat, cap, err);
}
| 1320 | |
/* Indexes the regex pattern <pat> in <expr> by calling pat_idx_list_reg_cap()
 * with <cap> set to 1. Returns what that function returns.
 */
int pat_idx_list_regm(struct pattern_expr *expr, struct pattern *pat, char **err)
{
	const int cap = 1;

	return pat_idx_list_reg_cap(expr, pat, cap, err);
}
| 1325 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1326 | int pat_idx_tree_ip(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1327 | { |
| 1328 | unsigned int mask; |
Thierry FOURNIER | e1bcac5 | 2013-12-13 16:09:50 +0100 | [diff] [blame] | 1329 | struct pattern_tree *node; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1330 | |
| 1331 | /* Only IPv4 can be indexed */ |
| 1332 | if (pat->type == SMP_T_IPV4) { |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1333 | /* in IPv4 case, check if the mask is contiguous so that we can |
| 1334 | * insert the network into the tree. A continuous mask has only |
| 1335 | * ones on the left. This means that this mask + its lower bit |
| 1336 | * added once again is null. |
| 1337 | */ |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1338 | mask = ntohl(pat->val.ipv4.mask.s_addr); |
| 1339 | if (mask + (mask & -mask) == 0) { |
| 1340 | mask = mask ? 33 - flsnz(mask & -mask) : 0; /* equals cidr value */ |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1341 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1342 | /* node memory allocation */ |
| 1343 | node = calloc(1, sizeof(*node) + 4); |
| 1344 | if (!node) { |
| 1345 | memprintf(err, "out of memory while loading pattern"); |
| 1346 | return 0; |
| 1347 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1348 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1349 | /* copy the pointer to sample associated to this node */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1350 | node->data = pat->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1351 | node->ref = pat->ref; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1352 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1353 | /* FIXME: insert <addr>/<mask> into the tree here */ |
| 1354 | memcpy(node->node.key, &pat->val.ipv4.addr, 4); /* network byte order */ |
| 1355 | node->node.node.pfx = mask; |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 1356 | |
| 1357 | /* Insert the entry. */ |
| 1358 | ebmb_insert_prefix(&expr->pattern_tree, &node->node, 4); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1359 | node->from_ref = pat->ref->tree_head; |
| 1360 | pat->ref->tree_head = &node->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1361 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1362 | expr->ref->entry_cnt++; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1363 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1364 | /* that's ok */ |
| 1365 | return 1; |
| 1366 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1367 | else { |
| 1368 | /* If the mask is not contiguous, just add the pattern to the list */ |
| 1369 | return pat_idx_list_val(expr, pat, err); |
| 1370 | } |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1371 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1372 | else if (pat->type == SMP_T_IPV6) { |
| 1373 | /* IPv6 also can be indexed */ |
| 1374 | node = calloc(1, sizeof(*node) + 16); |
| 1375 | if (!node) { |
| 1376 | memprintf(err, "out of memory while loading pattern"); |
| 1377 | return 0; |
| 1378 | } |
| 1379 | |
| 1380 | /* copy the pointer to sample associated to this node */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1381 | node->data = pat->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1382 | node->ref = pat->ref; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1383 | |
| 1384 | /* FIXME: insert <addr>/<mask> into the tree here */ |
| 1385 | memcpy(node->node.key, &pat->val.ipv6.addr, 16); /* network byte order */ |
| 1386 | node->node.node.pfx = pat->val.ipv6.mask; |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 1387 | |
| 1388 | /* Insert the entry. */ |
| 1389 | ebmb_insert_prefix(&expr->pattern_tree_2, &node->node, 16); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1390 | node->from_ref = pat->ref->tree_head; |
| 1391 | pat->ref->tree_head = &node->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1392 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1393 | expr->ref->entry_cnt++; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1394 | |
| 1395 | /* that's ok */ |
| 1396 | return 1; |
| 1397 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1398 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1399 | return 0; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1400 | } |
| 1401 | |
| 1402 | int pat_idx_tree_str(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1403 | { |
| 1404 | int len; |
Thierry FOURNIER | e1bcac5 | 2013-12-13 16:09:50 +0100 | [diff] [blame] | 1405 | struct pattern_tree *node; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1406 | |
| 1407 | /* Only string can be indexed */ |
Thierry FOURNIER | 7654c9f | 2013-12-17 00:20:33 +0100 | [diff] [blame] | 1408 | if (pat->type != SMP_T_STR) { |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1409 | memprintf(err, "internal error: string expected, but the type is '%s'", |
| 1410 | smp_to_type[pat->type]); |
| 1411 | return 0; |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1412 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1413 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1414 | /* If the flag PAT_F_IGNORE_CASE is set, we cannot use trees */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1415 | if (expr->mflags & PAT_MF_IGNORE_CASE) |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1416 | return pat_idx_list_str(expr, pat, err); |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1417 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1418 | /* Process the key len */ |
| 1419 | len = strlen(pat->ptr.str) + 1; |
| 1420 | |
| 1421 | /* node memory allocation */ |
| 1422 | node = calloc(1, sizeof(*node) + len); |
| 1423 | if (!node) { |
| 1424 | memprintf(err, "out of memory while loading pattern"); |
| 1425 | return 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1426 | } |
| 1427 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1428 | /* copy the pointer to sample associated to this node */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1429 | node->data = pat->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1430 | node->ref = pat->ref; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1431 | |
| 1432 | /* copy the string */ |
| 1433 | memcpy(node->node.key, pat->ptr.str, len); |
| 1434 | |
| 1435 | /* index the new node */ |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 1436 | ebst_insert(&expr->pattern_tree, &node->node); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1437 | node->from_ref = pat->ref->tree_head; |
| 1438 | pat->ref->tree_head = &node->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1439 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1440 | expr->ref->entry_cnt++; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1441 | |
| 1442 | /* that's ok */ |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1443 | return 1; |
| 1444 | } |
| 1445 | |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 1446 | int pat_idx_tree_pfx(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1447 | { |
| 1448 | int len; |
| 1449 | struct pattern_tree *node; |
| 1450 | |
| 1451 | /* Only string can be indexed */ |
| 1452 | if (pat->type != SMP_T_STR) { |
| 1453 | memprintf(err, "internal error: string expected, but the type is '%s'", |
| 1454 | smp_to_type[pat->type]); |
| 1455 | return 0; |
| 1456 | } |
| 1457 | |
| 1458 | /* If the flag PAT_F_IGNORE_CASE is set, we cannot use trees */ |
| 1459 | if (expr->mflags & PAT_MF_IGNORE_CASE) |
| 1460 | return pat_idx_list_str(expr, pat, err); |
| 1461 | |
| 1462 | /* Process the key len */ |
| 1463 | len = strlen(pat->ptr.str); |
| 1464 | |
| 1465 | /* node memory allocation */ |
| 1466 | node = calloc(1, sizeof(*node) + len + 1); |
| 1467 | if (!node) { |
| 1468 | memprintf(err, "out of memory while loading pattern"); |
| 1469 | return 0; |
| 1470 | } |
| 1471 | |
| 1472 | /* copy the pointer to sample associated to this node */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1473 | node->data = pat->data; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 1474 | node->ref = pat->ref; |
| 1475 | |
| 1476 | /* copy the string and the trailing zero */ |
| 1477 | memcpy(node->node.key, pat->ptr.str, len + 1); |
| 1478 | node->node.node.pfx = len * 8; |
| 1479 | |
| 1480 | /* index the new node */ |
| 1481 | ebmb_insert_prefix(&expr->pattern_tree, &node->node, len); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1482 | node->from_ref = pat->ref->tree_head; |
| 1483 | pat->ref->tree_head = &node->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1484 | expr->ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1485 | expr->ref->entry_cnt++; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 1486 | |
| 1487 | /* that's ok */ |
| 1488 | return 1; |
| 1489 | } |
| 1490 | |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1491 | /* Deletes all patterns from reference <elt>. Note that all of their |
Willy Tarreau | 78777ea | 2020-11-02 13:55:22 +0100 | [diff] [blame] | 1492 | * expressions must be locked, and the pattern lock must be held as well. |
| 1493 | */ |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1494 | void pat_delete_gen(struct pat_ref *ref, struct pat_ref_elt *elt) |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1495 | { |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1496 | struct pattern_tree *tree; |
| 1497 | struct pattern_list *pat; |
| 1498 | void **node; |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1499 | |
| 1500 | /* delete all known tree nodes. They are all allocated inline */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1501 | for (node = elt->tree_head; node;) { |
| 1502 | tree = container_of(node, struct pattern_tree, from_ref); |
| 1503 | node = *node; |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1504 | BUG_ON(tree->ref != elt); |
| 1505 | |
| 1506 | ebmb_delete(&tree->node); |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1507 | free(tree->data); |
| 1508 | free(tree); |
| 1509 | } |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1510 | |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1511 | /* delete all list nodes and free their pattern entries (str/reg) */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1512 | for (node = elt->list_head; node;) { |
| 1513 | pat = container_of(node, struct pattern_list, from_ref); |
| 1514 | node = *node; |
Willy Tarreau | 78777ea | 2020-11-02 13:55:22 +0100 | [diff] [blame] | 1515 | BUG_ON(pat->pat.ref != elt); |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1516 | |
| 1517 | /* Delete and free entry. */ |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1518 | LIST_DELETE(&pat->list); |
Willy Tarreau | 6d8a689 | 2020-11-02 19:26:02 +0100 | [diff] [blame] | 1519 | if (pat->pat.sflags & PAT_SF_REGFREE) |
| 1520 | regex_free(pat->pat.ptr.reg); |
| 1521 | else |
| 1522 | free(pat->pat.ptr.ptr); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1523 | free(pat->pat.data); |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1524 | free(pat); |
| 1525 | } |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1526 | |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1527 | /* update revision number to refresh the cache */ |
| 1528 | ref->revision = rdtsc(); |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1529 | ref->entry_cnt--; |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1530 | elt->tree_head = NULL; |
| 1531 | elt->list_head = NULL; |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1532 | } |
| 1533 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1534 | void pattern_init_expr(struct pattern_expr *expr) |
| 1535 | { |
| 1536 | LIST_INIT(&expr->patterns); |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 1537 | expr->pattern_tree = EB_ROOT; |
| 1538 | expr->pattern_tree_2 = EB_ROOT; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1539 | } |
| 1540 | |
| 1541 | void pattern_init_head(struct pattern_head *head) |
| 1542 | { |
| 1543 | LIST_INIT(&head->head); |
| 1544 | } |
| 1545 | |
/* The following functions are relative to the management of the reference
 * lists. These lists are used to store the original pattern and associated
 * value in string form.
 *
 * This is used with modifiable ACLs and maps.
 *
 * The pattern references are stored with two identifiers: the unique_id and
 * the reference.
 *
 * The reference identifies a file. Each file with the same name points to the
 * same reference. The same file can be registered many times. If the file is
 * modified, all its dependencies are also modified. The reference can be used
 * with a map or an acl.
 *
 * The unique_id identifies an inline acl. The unique id is unique for each
 * acl. You cannot force the same id twice in the configuration file, because
 * this reports an error.
 *
 * A particular case appears if the filename is a number. In this case, the
 * unique_id is set with the number represented by the filename and the
 * reference is also set. This method prevents duplicate unique_ids.
 *
 */
| 1569 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1570 | /* This function looks up a reference by name. If the reference is found, a |
| 1571 | * pointer to the struct pat_ref is returned, otherwise NULL is returned. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1572 | */ |
| 1573 | struct pat_ref *pat_ref_lookup(const char *reference) |
| 1574 | { |
| 1575 | struct pat_ref *ref; |
| 1576 | |
| 1577 | list_for_each_entry(ref, &pattern_reference, list) |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1578 | if (ref->reference && strcmp(reference, ref->reference) == 0) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1579 | return ref; |
| 1580 | return NULL; |
| 1581 | } |
| 1582 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1583 | /* This function looks up a reference's unique id. If the reference is found, a |
| 1584 | * pointer to the struct pat_ref is returned, otherwise NULL is returned. |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1585 | */ |
| 1586 | struct pat_ref *pat_ref_lookupid(int unique_id) |
| 1587 | { |
| 1588 | struct pat_ref *ref; |
| 1589 | |
| 1590 | list_for_each_entry(ref, &pattern_reference, list) |
| 1591 | if (ref->unique_id == unique_id) |
| 1592 | return ref; |
| 1593 | return NULL; |
| 1594 | } |
| 1595 | |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1596 | /* This function removes from the pattern reference <ref> all the patterns |
| 1597 | * attached to the reference element <elt>, and the element itself. The |
| 1598 | * reference must be locked. |
| 1599 | */ |
| 1600 | void pat_ref_delete_by_ptr(struct pat_ref *ref, struct pat_ref_elt *elt) |
| 1601 | { |
| 1602 | struct pattern_expr *expr; |
| 1603 | struct bref *bref, *back; |
| 1604 | |
| 1605 | /* |
| 1606 | * we have to unlink all watchers from this reference pattern. We must |
| 1607 | * not relink them if this elt was the last one in the list. |
| 1608 | */ |
| 1609 | list_for_each_entry_safe(bref, back, &elt->back_refs, users) { |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1610 | LIST_DELETE(&bref->users); |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1611 | LIST_INIT(&bref->users); |
| 1612 | if (elt->list.n != &ref->head) |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1613 | LIST_APPEND(&LIST_ELEM(elt->list.n, typeof(elt), list)->back_refs, &bref->users); |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1614 | bref->ref = elt->list.n; |
| 1615 | } |
| 1616 | |
| 1617 | /* delete all entries from all expressions for this pattern */ |
| 1618 | list_for_each_entry(expr, &ref->pat, list) |
| 1619 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
| 1620 | |
| 1621 | pat_delete_gen(ref, elt); |
| 1622 | |
| 1623 | list_for_each_entry(expr, &ref->pat, list) |
| 1624 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
| 1625 | |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1626 | LIST_DELETE(&elt->list); |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1627 | free(elt->sample); |
| 1628 | free(elt->pattern); |
| 1629 | free(elt); |
| 1630 | } |
| 1631 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1632 | /* This function removes all the patterns matching the pointer <refelt> from |
| 1633 | * the reference and from each expr member of this reference. This function |
| 1634 | * returns 1 if the entry was found and deleted, otherwise zero. |
Thierry FOURNIER | 7acca4b | 2014-01-28 16:43:36 +0100 | [diff] [blame] | 1635 | */ |
| 1636 | int pat_ref_delete_by_id(struct pat_ref *ref, struct pat_ref_elt *refelt) |
| 1637 | { |
Thierry FOURNIER | 7acca4b | 2014-01-28 16:43:36 +0100 | [diff] [blame] | 1638 | struct pat_ref_elt *elt, *safe; |
| 1639 | |
| 1640 | /* delete pattern from reference */ |
| 1641 | list_for_each_entry_safe(elt, safe, &ref->head, list) { |
| 1642 | if (elt == refelt) { |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1643 | pat_ref_delete_by_ptr(ref, elt); |
Thierry FOURNIER | 7acca4b | 2014-01-28 16:43:36 +0100 | [diff] [blame] | 1644 | return 1; |
| 1645 | } |
| 1646 | } |
| 1647 | return 0; |
| 1648 | } |
| 1649 | |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1650 | /* This function removes all patterns matching <key> from the reference |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 1651 | * and from each expr member of the reference. This function returns 1 |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1652 | * if the deletion is done and returns 0 is the entry is not found. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1653 | */ |
| 1654 | int pat_ref_delete(struct pat_ref *ref, const char *key) |
| 1655 | { |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1656 | struct pat_ref_elt *elt, *safe; |
| 1657 | int found = 0; |
| 1658 | |
| 1659 | /* delete pattern from reference */ |
| 1660 | list_for_each_entry_safe(elt, safe, &ref->head, list) { |
| 1661 | if (strcmp(key, elt->pattern) == 0) { |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1662 | pat_ref_delete_by_ptr(ref, elt); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1663 | found = 1; |
| 1664 | } |
| 1665 | } |
| 1666 | |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1667 | return found; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1668 | } |
| 1669 | |
Baptiste Assmann | 953f74d | 2014-04-25 16:57:03 +0200 | [diff] [blame] | 1670 | /* |
| 1671 | * find and return an element <elt> matching <key> in a reference <ref> |
| 1672 | * return NULL if not found |
| 1673 | */ |
| 1674 | struct pat_ref_elt *pat_ref_find_elt(struct pat_ref *ref, const char *key) |
| 1675 | { |
| 1676 | struct pat_ref_elt *elt; |
| 1677 | |
| 1678 | list_for_each_entry(elt, &ref->head, list) { |
| 1679 | if (strcmp(key, elt->pattern) == 0) |
| 1680 | return elt; |
| 1681 | } |
| 1682 | |
| 1683 | return NULL; |
| 1684 | } |
| 1685 | |
| 1686 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1687 | /* This function modifies the sample of pat_ref_elt <elt> in all expressions |
| 1688 | * found under <ref> to become <value>. It is assumed that the caller has |
| 1689 | * already verified that <elt> belongs to <ref>. |
| 1690 | */ |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1691 | static inline int pat_ref_set_elt(struct pat_ref *ref, struct pat_ref_elt *elt, |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1692 | const char *value, char **err) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1693 | { |
| 1694 | struct pattern_expr *expr; |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1695 | struct sample_data **data; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1696 | char *sample; |
Thierry FOURNIER | 12ba0c2 | 2015-08-14 00:02:11 +0200 | [diff] [blame] | 1697 | struct sample_data test; |
Thierry FOURNIER | 149e0fe | 2014-01-29 19:35:06 +0100 | [diff] [blame] | 1698 | |
| 1699 | /* Try all needed converters. */ |
| 1700 | list_for_each_entry(expr, &ref->pat, list) { |
| 1701 | if (!expr->pat_head->parse_smp) |
| 1702 | continue; |
| 1703 | |
| 1704 | if (!expr->pat_head->parse_smp(value, &test)) { |
| 1705 | memprintf(err, "unable to parse '%s'", value); |
| 1706 | return 0; |
| 1707 | } |
| 1708 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1709 | |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1710 | /* Modify pattern from reference. */ |
| 1711 | sample = strdup(value); |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1712 | if (!sample) { |
| 1713 | memprintf(err, "out of memory error"); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1714 | return 0; |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1715 | } |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1716 | /* Load sample in each reference. All the conversions are tested |
| 1717 | * below, normally these calls don't fail. |
Thierry FOURNIER | 149e0fe | 2014-01-29 19:35:06 +0100 | [diff] [blame] | 1718 | */ |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 1719 | list_for_each_entry(expr, &ref->pat, list) { |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1720 | if (!expr->pat_head->parse_smp) |
| 1721 | continue; |
| 1722 | |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1723 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1724 | data = pattern_find_smp(expr, elt); |
| 1725 | if (data && *data && !expr->pat_head->parse_smp(sample, *data)) |
| 1726 | *data = NULL; |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1727 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1728 | } |
| 1729 | |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 1730 | /* free old sample only when all exprs are updated */ |
| 1731 | free(elt->sample); |
| 1732 | elt->sample = sample; |
| 1733 | |
| 1734 | |
Thierry FOURNIER | 149e0fe | 2014-01-29 19:35:06 +0100 | [diff] [blame] | 1735 | return 1; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1736 | } |
| 1737 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1738 | /* This function modifies the sample of pat_ref_elt <refelt> in all expressions |
| 1739 | * found under <ref> to become <value>, after checking that <refelt> really |
| 1740 | * belongs to <ref>. |
| 1741 | */ |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1742 | int pat_ref_set_by_id(struct pat_ref *ref, struct pat_ref_elt *refelt, const char *value, char **err) |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1743 | { |
| 1744 | struct pat_ref_elt *elt; |
| 1745 | |
| 1746 | /* Look for pattern in the reference. */ |
| 1747 | list_for_each_entry(elt, &ref->head, list) { |
| 1748 | if (elt == refelt) { |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1749 | if (!pat_ref_set_elt(ref, elt, value, err)) |
| 1750 | return 0; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1751 | return 1; |
| 1752 | } |
| 1753 | } |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1754 | |
| 1755 | memprintf(err, "key or pattern not found"); |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1756 | return 0; |
| 1757 | } |
| 1758 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1759 | /* This function modifies to <value> the sample of all patterns matching <key> |
| 1760 | * under <ref>. |
| 1761 | */ |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1762 | int pat_ref_set(struct pat_ref *ref, const char *key, const char *value, char **err) |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1763 | { |
| 1764 | struct pat_ref_elt *elt; |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1765 | int found = 0; |
| 1766 | char *_merr; |
| 1767 | char **merr; |
| 1768 | |
| 1769 | if (err) { |
| 1770 | merr = &_merr; |
| 1771 | *merr = NULL; |
| 1772 | } |
| 1773 | else |
| 1774 | merr = NULL; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1775 | |
| 1776 | /* Look for pattern in the reference. */ |
| 1777 | list_for_each_entry(elt, &ref->head, list) { |
| 1778 | if (strcmp(key, elt->pattern) == 0) { |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1779 | if (!pat_ref_set_elt(ref, elt, value, merr)) { |
William Lallemand | 579fb25 | 2018-06-11 10:53:46 +0200 | [diff] [blame] | 1780 | if (err && merr) { |
| 1781 | if (!found) { |
| 1782 | *err = *merr; |
| 1783 | } else { |
| 1784 | memprintf(err, "%s, %s", *err, *merr); |
Willy Tarreau | 61cfdf4 | 2021-02-20 10:46:51 +0100 | [diff] [blame] | 1785 | ha_free(merr); |
William Lallemand | 579fb25 | 2018-06-11 10:53:46 +0200 | [diff] [blame] | 1786 | } |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1787 | } |
| 1788 | } |
| 1789 | found = 1; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1790 | } |
| 1791 | } |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1792 | |
| 1793 | if (!found) { |
| 1794 | memprintf(err, "entry not found"); |
| 1795 | return 0; |
| 1796 | } |
| 1797 | return 1; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1798 | } |
| 1799 | |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 1800 | /* This function creates a new reference. <ref> is the reference name. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1801 | * <flags> are PAT_REF_*. /!\ The reference is not checked, and must |
| 1802 | * be unique. The user must check the reference with "pat_ref_lookup()" |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1803 | * before calling this function. If the function fails, it returns NULL, |
| 1804 | * otherwise it returns the new struct pat_ref. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1805 | */ |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1806 | struct pat_ref *pat_ref_new(const char *reference, const char *display, unsigned int flags) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1807 | { |
| 1808 | struct pat_ref *ref; |
| 1809 | |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 1810 | ref = calloc(1, sizeof(*ref)); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1811 | if (!ref) |
| 1812 | return NULL; |
| 1813 | |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1814 | if (display) { |
| 1815 | ref->display = strdup(display); |
| 1816 | if (!ref->display) { |
| 1817 | free(ref); |
| 1818 | return NULL; |
| 1819 | } |
| 1820 | } |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1821 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1822 | ref->reference = strdup(reference); |
| 1823 | if (!ref->reference) { |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1824 | free(ref->display); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1825 | free(ref); |
| 1826 | return NULL; |
| 1827 | } |
| 1828 | |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1829 | ref->flags = flags; |
| 1830 | ref->unique_id = -1; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1831 | ref->revision = 0; |
Dragan Dosen | a75eea7 | 2021-05-21 16:59:15 +0200 | [diff] [blame] | 1832 | ref->entry_cnt = 0; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1833 | |
| 1834 | LIST_INIT(&ref->head); |
| 1835 | LIST_INIT(&ref->pat); |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1836 | HA_SPIN_INIT(&ref->lock); |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1837 | LIST_APPEND(&pattern_reference, &ref->list); |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1838 | |
| 1839 | return ref; |
| 1840 | } |
| 1841 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1842 | /* This function creates a new reference. <unique_id> is the unique id. If |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1843 | * the value of <unique_id> is -1, the unique id is calculated later. |
| 1844 | * <flags> are PAT_REF_*. /!\ The reference is not checked, and must |
| 1845 | * be unique. The user must check the reference with "pat_ref_lookup()" |
| 1846 | * or pat_ref_lookupid before calling this function. If the function |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1847 | * fails, it returns NULL, otherwise it returns the new struct pat_ref. |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1848 | */ |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1849 | struct pat_ref *pat_ref_newid(int unique_id, const char *display, unsigned int flags) |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1850 | { |
| 1851 | struct pat_ref *ref; |
| 1852 | |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 1853 | ref = calloc(1, sizeof(*ref)); |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1854 | if (!ref) |
| 1855 | return NULL; |
| 1856 | |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1857 | if (display) { |
| 1858 | ref->display = strdup(display); |
| 1859 | if (!ref->display) { |
| 1860 | free(ref); |
| 1861 | return NULL; |
| 1862 | } |
| 1863 | } |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1864 | |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1865 | ref->reference = NULL; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1866 | ref->flags = flags; |
Willy Tarreau | 2994774 | 2020-10-28 11:43:49 +0100 | [diff] [blame] | 1867 | ref->curr_gen = 0; |
| 1868 | ref->next_gen = 0; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1869 | ref->unique_id = unique_id; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1870 | LIST_INIT(&ref->head); |
| 1871 | LIST_INIT(&ref->pat); |
Aurélien Nephtali | 564d15a | 2018-04-19 16:56:07 +0200 | [diff] [blame] | 1872 | HA_SPIN_INIT(&ref->lock); |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1873 | LIST_APPEND(&pattern_reference, &ref->list); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1874 | |
| 1875 | return ref; |
| 1876 | } |
| 1877 | |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1878 | /* This function adds entry to <ref>. It can fail on memory error. It returns |
| 1879 | * the newly added element on success, or NULL on failure. The PATREF_LOCK on |
Willy Tarreau | 2994774 | 2020-10-28 11:43:49 +0100 | [diff] [blame] | 1880 | * <ref> must be held. It sets the newly created pattern's generation number |
| 1881 | * to the same value as the reference's. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1882 | */ |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1883 | struct pat_ref_elt *pat_ref_append(struct pat_ref *ref, const char *pattern, const char *sample, int line) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1884 | { |
| 1885 | struct pat_ref_elt *elt; |
| 1886 | |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 1887 | elt = calloc(1, sizeof(*elt)); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1888 | if (!elt) |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1889 | goto fail; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1890 | |
Willy Tarreau | 2994774 | 2020-10-28 11:43:49 +0100 | [diff] [blame] | 1891 | elt->gen_id = ref->curr_gen; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1892 | elt->line = line; |
| 1893 | |
| 1894 | elt->pattern = strdup(pattern); |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1895 | if (!elt->pattern) |
| 1896 | goto fail; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1897 | |
| 1898 | if (sample) { |
| 1899 | elt->sample = strdup(sample); |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1900 | if (!elt->sample) |
| 1901 | goto fail; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1902 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1903 | |
Emeric Brun | 8d85aa4 | 2017-06-29 15:40:33 +0200 | [diff] [blame] | 1904 | LIST_INIT(&elt->back_refs); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1905 | elt->list_head = NULL; |
| 1906 | elt->tree_head = NULL; |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 1907 | LIST_APPEND(&ref->head, &elt->list); |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1908 | return elt; |
| 1909 | fail: |
| 1910 | if (elt) |
| 1911 | free(elt->pattern); |
| 1912 | free(elt); |
| 1913 | return NULL; |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1914 | } |
| 1915 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1916 | /* This function creates sample found in <elt>, parses the pattern also |
| 1917 | * found in <elt> and inserts it in <expr>. The function copies <patflags> |
| 1918 | * into <expr>. If the function fails, it returns 0 and <err> is filled. |
Ilya Shipitsin | 47d1718 | 2020-06-21 21:42:57 +0500 | [diff] [blame] | 1919 | * In success case, the function returns 1. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1920 | */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1921 | int pat_ref_push(struct pat_ref_elt *elt, struct pattern_expr *expr, |
| 1922 | int patflags, char **err) |
| 1923 | { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1924 | struct sample_data *data; |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1925 | struct pattern pattern; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1926 | |
| 1927 | /* Create sample */ |
| 1928 | if (elt->sample && expr->pat_head->parse_smp) { |
| 1929 | /* New sample. */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1930 | data = malloc(sizeof(*data)); |
| 1931 | if (!data) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1932 | return 0; |
| 1933 | |
| 1934 | /* Parse value. */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1935 | if (!expr->pat_head->parse_smp(elt->sample, data)) { |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1936 | memprintf(err, "unable to parse '%s'", elt->sample); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1937 | free(data); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1938 | return 0; |
| 1939 | } |
| 1940 | |
| 1941 | } |
| 1942 | else |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1943 | data = NULL; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1944 | |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1945 | /* initialise pattern */ |
| 1946 | memset(&pattern, 0, sizeof(pattern)); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1947 | pattern.data = data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1948 | pattern.ref = elt; |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1949 | |
| 1950 | /* parse pattern */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1951 | if (!expr->pat_head->parse(elt->pattern, &pattern, expr->mflags, err)) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1952 | free(data); |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1953 | return 0; |
| 1954 | } |
| 1955 | |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1956 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1957 | /* index pattern */ |
| 1958 | if (!expr->pat_head->index(expr, &pattern, err)) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1959 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1960 | free(data); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1961 | return 0; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1962 | } |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1963 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1964 | |
| 1965 | return 1; |
| 1966 | } |
| 1967 | |
Willy Tarreau | 0439e5e | 2020-10-28 18:45:45 +0100 | [diff] [blame] | 1968 | /* This function tries to commit entry <elt> into <ref>. The new entry must |
| 1969 | * have already been inserted using pat_ref_append(), and its generation number |
| 1970 | * may have been adjusted as it will not be changed. <err> must point to a NULL |
| 1971 | * pointer. The PATREF lock on <ref> must be held. All the pattern_expr for |
| 1972 | * this reference will be updated (parsing, indexing). On success, non-zero is |
| 1973 | * returned. On failure, all the operation is rolled back (the element is |
| 1974 | * deleted from all expressions and is freed), zero is returned and the error |
| 1975 | * pointer <err> may have been updated (and the caller must free it). Failure |
| 1976 | * causes include memory allocation, parsing error or indexing error. |
| 1977 | */ |
Willy Tarreau | dc2410d | 2021-01-15 14:11:59 +0100 | [diff] [blame] | 1978 | int pat_ref_commit_elt(struct pat_ref *ref, struct pat_ref_elt *elt, char **err) |
Willy Tarreau | 0439e5e | 2020-10-28 18:45:45 +0100 | [diff] [blame] | 1979 | { |
| 1980 | struct pattern_expr *expr; |
| 1981 | |
| 1982 | list_for_each_entry(expr, &ref->pat, list) { |
| 1983 | if (!pat_ref_push(elt, expr, 0, err)) { |
| 1984 | pat_ref_delete_by_ptr(ref, elt); |
| 1985 | return 0; |
| 1986 | } |
| 1987 | } |
| 1988 | return 1; |
| 1989 | } |
| 1990 | |
Willy Tarreau | 1a6857b | 2020-10-29 09:21:43 +0100 | [diff] [blame] | 1991 | /* Loads <pattern>:<sample> into <ref> for generation <gen>. <sample> may be |
| 1992 | * NULL if none exists (e.g. ACL). If not needed, the generation number should |
| 1993 | * be set to ref->curr_gen. The error pointer must initially point to NULL. The |
| 1994 | * new entry will be propagated to all use places, involving allocation, parsing |
| 1995 | * and indexing. On error (parsing, allocation), the operation will be rolled |
| 1996 | * back, an error may be reported, and NULL will be reported. On success, the |
| 1997 | * freshly allocated element will be returned. The PATREF lock on <ref> must be |
| 1998 | * held during the operation. |
| 1999 | */ |
| 2000 | struct pat_ref_elt *pat_ref_load(struct pat_ref *ref, unsigned int gen, |
| 2001 | const char *pattern, const char *sample, |
| 2002 | int line, char **err) |
| 2003 | { |
| 2004 | struct pat_ref_elt *elt; |
| 2005 | |
| 2006 | elt = pat_ref_append(ref, pattern, sample, line); |
| 2007 | if (elt) { |
| 2008 | elt->gen_id = gen; |
Willy Tarreau | dc2410d | 2021-01-15 14:11:59 +0100 | [diff] [blame] | 2009 | if (!pat_ref_commit_elt(ref, elt, err)) |
Willy Tarreau | 1a6857b | 2020-10-29 09:21:43 +0100 | [diff] [blame] | 2010 | elt = NULL; |
| 2011 | } else |
| 2012 | memprintf(err, "out of memory error"); |
| 2013 | |
| 2014 | return elt; |
| 2015 | } |
| 2016 | |
Willy Tarreau | 6a17407 | 2020-10-28 10:58:05 +0100 | [diff] [blame] | 2017 | /* This function adds entry to <ref>. It can fail on memory error. The new |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 2018 | * entry is added at all the pattern_expr registered in this reference. The |
Willy Tarreau | 6a17407 | 2020-10-28 10:58:05 +0100 | [diff] [blame] | 2019 | * function stops on the first error encountered. It returns 0 and <err> is |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 2020 | * filled. If an error is encountered, the complete add operation is cancelled. |
| 2021 | * If the insertion is a success the function returns 1. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2022 | */ |
| 2023 | int pat_ref_add(struct pat_ref *ref, |
| 2024 | const char *pattern, const char *sample, |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 2025 | char **err) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2026 | { |
Willy Tarreau | 1a6857b | 2020-10-29 09:21:43 +0100 | [diff] [blame] | 2027 | return !!pat_ref_load(ref, ref->curr_gen, pattern, sample, -1, err); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2028 | } |
| 2029 | |
Willy Tarreau | a13afe6 | 2021-04-30 13:19:37 +0200 | [diff] [blame] | 2030 | /* This function purges all elements from <ref> whose generation is included in |
| 2031 | * the range of <from> to <to> (inclusive), taking wrapping into consideration. |
| 2032 | * It will not purge more than <budget> entries at once, in order to remain |
| 2033 | * responsive. If budget is negative, no limit is applied. |
Willy Tarreau | 94b9abe | 2020-10-28 18:23:49 +0100 | [diff] [blame] | 2034 | * The caller must already hold the PATREF_LOCK on <ref>. The function will |
| 2035 | * take the PATEXP_LOCK on all expressions of the pattern as needed. It returns |
| 2036 | * non-zero on completion, or zero if it had to stop before the end after |
| 2037 | * <budget> was depleted. |
| 2038 | */ |
Willy Tarreau | a13afe6 | 2021-04-30 13:19:37 +0200 | [diff] [blame] | 2039 | int pat_ref_purge_range(struct pat_ref *ref, uint from, uint to, int budget) |
Willy Tarreau | 94b9abe | 2020-10-28 18:23:49 +0100 | [diff] [blame] | 2040 | { |
| 2041 | struct pat_ref_elt *elt, *elt_bck; |
| 2042 | struct bref *bref, *bref_bck; |
| 2043 | struct pattern_expr *expr; |
| 2044 | int done; |
| 2045 | |
| 2046 | list_for_each_entry(expr, &ref->pat, list) |
| 2047 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
| 2048 | |
| 2049 | /* all expr are locked, we can safely remove all pat_ref */ |
| 2050 | |
| 2051 | /* assume completion for e.g. empty lists */ |
| 2052 | done = 1; |
| 2053 | list_for_each_entry_safe(elt, elt_bck, &ref->head, list) { |
Willy Tarreau | a13afe6 | 2021-04-30 13:19:37 +0200 | [diff] [blame] | 2054 | if (elt->gen_id - from > to - from) |
Willy Tarreau | 94b9abe | 2020-10-28 18:23:49 +0100 | [diff] [blame] | 2055 | continue; |
| 2056 | |
| 2057 | if (budget >= 0 && !budget--) { |
| 2058 | done = 0; |
| 2059 | break; |
| 2060 | } |
| 2061 | |
| 2062 | /* |
| 2063 | * we have to unlink all watchers from this reference pattern. We must |
| 2064 | * not relink them if this elt was the last one in the list. |
| 2065 | */ |
| 2066 | list_for_each_entry_safe(bref, bref_bck, &elt->back_refs, users) { |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2067 | LIST_DELETE(&bref->users); |
Willy Tarreau | 94b9abe | 2020-10-28 18:23:49 +0100 | [diff] [blame] | 2068 | LIST_INIT(&bref->users); |
| 2069 | if (elt->list.n != &ref->head) |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2070 | LIST_APPEND(&LIST_ELEM(elt->list.n, typeof(elt), list)->back_refs, &bref->users); |
Willy Tarreau | 94b9abe | 2020-10-28 18:23:49 +0100 | [diff] [blame] | 2071 | bref->ref = elt->list.n; |
| 2072 | } |
| 2073 | |
| 2074 | /* delete the storage for all representations of this pattern. */ |
| 2075 | pat_delete_gen(ref, elt); |
| 2076 | |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2077 | LIST_DELETE(&elt->list); |
Willy Tarreau | 94b9abe | 2020-10-28 18:23:49 +0100 | [diff] [blame] | 2078 | free(elt->pattern); |
| 2079 | free(elt->sample); |
| 2080 | free(elt); |
| 2081 | } |
| 2082 | |
| 2083 | list_for_each_entry(expr, &ref->pat, list) |
| 2084 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
| 2085 | |
Willy Tarreau | 9b060f1 | 2023-03-22 15:38:13 +0100 | [diff] [blame] | 2086 | if (done) |
| 2087 | trim_all_pools(); |
Willy Tarreau | 94b9abe | 2020-10-28 18:23:49 +0100 | [diff] [blame] | 2088 | |
| 2089 | return done; |
| 2090 | } |
| 2091 | |
/* Prunes all the entries of <ref> and all their associated pattern_expr,
 * whatever their generation (current, future or incomplete ones). The work is
 * done by batches of 100 entries: the function may return 0 before the end of
 * the list is reached in order to yield, in which case the caller must call
 * it again until it returns non-zero. This is used by "clear map" or
 * "clear acl".
 */
int pat_ref_prune(struct pat_ref *ref)
{
	const int max_per_call = 100;
	int finished;

	/* 0..~0 covers the whole generation space */
	finished = pat_ref_purge_range(ref, 0, ~0, max_per_call);
	return finished;
}
| 2102 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2103 | /* This function looks up any existing reference <ref> in pattern_head <head>, and |
| 2104 | * returns the associated pattern_expr pointer if found, otherwise NULL. |
| 2105 | */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2106 | struct pattern_expr *pattern_lookup_expr(struct pattern_head *head, struct pat_ref *ref) |
| 2107 | { |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2108 | struct pattern_expr_list *expr; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2109 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2110 | list_for_each_entry(expr, &head->head, list) |
| 2111 | if (expr->expr->ref == ref) |
| 2112 | return expr->expr; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2113 | return NULL; |
| 2114 | } |
| 2115 | |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 2116 | /* This function creates new pattern_expr associated to the reference <ref>. |
| 2117 | * <ref> can be NULL. If an error occurs, the function returns NULL and |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2118 | * <err> is filled. Otherwise, the function returns new pattern_expr linked |
| 2119 | * with <head> and <ref>. |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2120 | * |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 2121 | * The returned value can be an already filled pattern list, in this case the |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2122 | * flag <reuse> is set. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2123 | */ |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2124 | struct pattern_expr *pattern_new_expr(struct pattern_head *head, struct pat_ref *ref, |
Emeric Brun | 7d27f3c | 2017-07-03 17:54:23 +0200 | [diff] [blame] | 2125 | int patflags, char **err, int *reuse) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2126 | { |
| 2127 | struct pattern_expr *expr; |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2128 | struct pattern_expr_list *list; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2129 | |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2130 | if (reuse) |
| 2131 | *reuse = 0; |
| 2132 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2133 | /* Memory and initialization of the chain element. */ |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 2134 | list = calloc(1, sizeof(*list)); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2135 | if (!list) { |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2136 | memprintf(err, "out of memory"); |
| 2137 | return NULL; |
| 2138 | } |
| 2139 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2140 | /* Look for existing similar expr. No that only the index, parse and |
| 2141 | * parse_smp function must be identical for having similar pattern. |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 2142 | * The other function depends of these first. |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2143 | */ |
| 2144 | if (ref) { |
| 2145 | list_for_each_entry(expr, &ref->pat, list) |
| 2146 | if (expr->pat_head->index == head->index && |
| 2147 | expr->pat_head->parse == head->parse && |
Emeric Brun | 7d27f3c | 2017-07-03 17:54:23 +0200 | [diff] [blame] | 2148 | expr->pat_head->parse_smp == head->parse_smp && |
| 2149 | expr->mflags == patflags) |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2150 | break; |
| 2151 | if (&expr->list == &ref->pat) |
| 2152 | expr = NULL; |
| 2153 | } |
| 2154 | else |
| 2155 | expr = NULL; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2156 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2157 | /* If no similar expr was found, we create new expr. */ |
| 2158 | if (!expr) { |
| 2159 | /* Get a lot of memory for the expr struct. */ |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 2160 | expr = calloc(1, sizeof(*expr)); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2161 | if (!expr) { |
Andreas Seltenreich | e6e22e8 | 2016-03-03 20:20:23 +0100 | [diff] [blame] | 2162 | free(list); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2163 | memprintf(err, "out of memory"); |
| 2164 | return NULL; |
| 2165 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2166 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2167 | /* Initialize this new expr. */ |
| 2168 | pattern_init_expr(expr); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2169 | |
Emeric Brun | 7d27f3c | 2017-07-03 17:54:23 +0200 | [diff] [blame] | 2170 | /* Copy the pattern matching and indexing flags. */ |
| 2171 | expr->mflags = patflags; |
| 2172 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2173 | /* This new pattern expression reference one of his heads. */ |
| 2174 | expr->pat_head = head; |
| 2175 | |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2176 | /* Link with ref, or to self to facilitate LIST_DELETE() */ |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2177 | if (ref) |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2178 | LIST_APPEND(&ref->pat, &expr->list); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2179 | else |
| 2180 | LIST_INIT(&expr->list); |
| 2181 | |
| 2182 | expr->ref = ref; |
| 2183 | |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2184 | HA_RWLOCK_INIT(&expr->lock); |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2185 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2186 | /* We must free this pattern if it is no more used. */ |
| 2187 | list->do_free = 1; |
| 2188 | } |
| 2189 | else { |
| 2190 | /* If the pattern used already exists, it is already linked |
| 2191 | * with ref and we must not free it. |
| 2192 | */ |
| 2193 | list->do_free = 0; |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2194 | if (reuse) |
| 2195 | *reuse = 1; |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2196 | } |
| 2197 | |
| 2198 | /* The new list element reference the pattern_expr. */ |
| 2199 | list->expr = expr; |
| 2200 | |
| 2201 | /* Link the list element with the pattern_head. */ |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2202 | LIST_APPEND(&head->head, &list->list); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2203 | return expr; |
| 2204 | } |
| 2205 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2206 | /* Reads patterns from a file. If <err_msg> is non-NULL, an error message will |
| 2207 | * be returned there on errors and the caller will have to free it. |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2208 | * |
| 2209 | * The file contains one key + value per line. Lines which start with '#' are |
| 2210 | * ignored, just like empty lines. Leading tabs/spaces are stripped. The key is |
| 2211 | * then the first "word" (series of non-space/tabs characters), and the value is |
| 2212 | * what follows this series of space/tab till the end of the line excluding |
| 2213 | * trailing spaces/tabs. |
| 2214 | * |
| 2215 | * Example : |
| 2216 | * |
| 2217 | * # this is a comment and is ignored |
| 2218 | * 62.212.114.60 1wt.eu \n |
| 2219 | * <-><-----------><---><----><----> |
| 2220 | * | | | | `--- trailing spaces ignored |
| 2221 | * | | | `-------- value |
| 2222 | * | | `--------------- middle spaces ignored |
| 2223 | * | `------------------------ key |
| 2224 | * `-------------------------------- leading spaces ignored |
| 2225 | * |
Ilya Shipitsin | 47d1718 | 2020-06-21 21:42:57 +0500 | [diff] [blame] | 2226 | * Return non-zero in case of success, otherwise 0. |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2227 | */ |
| 2228 | int pat_ref_read_from_file_smp(struct pat_ref *ref, const char *filename, char **err) |
| 2229 | { |
| 2230 | FILE *file; |
| 2231 | char *c; |
| 2232 | int ret = 0; |
| 2233 | int line = 0; |
| 2234 | char *key_beg; |
| 2235 | char *key_end; |
| 2236 | char *value_beg; |
| 2237 | char *value_end; |
| 2238 | |
| 2239 | file = fopen(filename, "r"); |
| 2240 | if (!file) { |
| 2241 | memprintf(err, "failed to open pattern file <%s>", filename); |
| 2242 | return 0; |
| 2243 | } |
| 2244 | |
| 2245 | /* now parse all patterns. The file may contain only one pattern |
| 2246 | * followed by one value per line. The start spaces, separator spaces |
| 2247 | * and and spaces are stripped. Each can contain comment started by '#' |
| 2248 | */ |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2249 | while (fgets(trash.area, trash.size, file) != NULL) { |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2250 | line++; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2251 | c = trash.area; |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2252 | |
| 2253 | /* ignore lines beginning with a dash */ |
| 2254 | if (*c == '#') |
| 2255 | continue; |
| 2256 | |
| 2257 | /* strip leading spaces and tabs */ |
| 2258 | while (*c == ' ' || *c == '\t') |
| 2259 | c++; |
| 2260 | |
| 2261 | /* empty lines are ignored too */ |
| 2262 | if (*c == '\0' || *c == '\r' || *c == '\n') |
| 2263 | continue; |
| 2264 | |
| 2265 | /* look for the end of the key */ |
| 2266 | key_beg = c; |
| 2267 | while (*c && *c != ' ' && *c != '\t' && *c != '\n' && *c != '\r') |
| 2268 | c++; |
| 2269 | |
| 2270 | key_end = c; |
| 2271 | |
| 2272 | /* strip middle spaces and tabs */ |
| 2273 | while (*c == ' ' || *c == '\t') |
| 2274 | c++; |
| 2275 | |
| 2276 | /* look for the end of the value, it is the end of the line */ |
| 2277 | value_beg = c; |
| 2278 | while (*c && *c != '\n' && *c != '\r') |
| 2279 | c++; |
| 2280 | value_end = c; |
| 2281 | |
| 2282 | /* trim possibly trailing spaces and tabs */ |
| 2283 | while (value_end > value_beg && (value_end[-1] == ' ' || value_end[-1] == '\t')) |
| 2284 | value_end--; |
| 2285 | |
| 2286 | /* set final \0 and check entries */ |
| 2287 | *key_end = '\0'; |
| 2288 | *value_end = '\0'; |
| 2289 | |
| 2290 | /* insert values */ |
| 2291 | if (!pat_ref_append(ref, key_beg, value_beg, line)) { |
| 2292 | memprintf(err, "out of memory"); |
| 2293 | goto out_close; |
| 2294 | } |
| 2295 | } |
| 2296 | |
Jerome Magnin | 3c79d4b | 2020-01-17 16:09:33 +0100 | [diff] [blame] | 2297 | if (ferror(file)) { |
| 2298 | memprintf(err, "error encountered while reading <%s> : %s", |
| 2299 | filename, strerror(errno)); |
| 2300 | goto out_close; |
| 2301 | } |
Ilya Shipitsin | 47d1718 | 2020-06-21 21:42:57 +0500 | [diff] [blame] | 2302 | /* success */ |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2303 | ret = 1; |
| 2304 | |
| 2305 | out_close: |
| 2306 | fclose(file); |
| 2307 | return ret; |
| 2308 | } |
| 2309 | |
| 2310 | /* Reads patterns from a file. If <err_msg> is non-NULL, an error message will |
| 2311 | * be returned there on errors and the caller will have to free it. |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2312 | */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2313 | int pat_ref_read_from_file(struct pat_ref *ref, const char *filename, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2314 | { |
| 2315 | FILE *file; |
| 2316 | char *c; |
| 2317 | char *arg; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2318 | int ret = 0; |
| 2319 | int line = 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2320 | |
| 2321 | file = fopen(filename, "r"); |
| 2322 | if (!file) { |
| 2323 | memprintf(err, "failed to open pattern file <%s>", filename); |
| 2324 | return 0; |
| 2325 | } |
| 2326 | |
| 2327 | /* now parse all patterns. The file may contain only one pattern per |
| 2328 | * line. If the line contains spaces, they will be part of the pattern. |
| 2329 | * The pattern stops at the first CR, LF or EOF encountered. |
| 2330 | */ |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2331 | while (fgets(trash.area, trash.size, file) != NULL) { |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2332 | line++; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2333 | c = trash.area; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2334 | |
| 2335 | /* ignore lines beginning with a dash */ |
| 2336 | if (*c == '#') |
| 2337 | continue; |
| 2338 | |
| 2339 | /* strip leading spaces and tabs */ |
| 2340 | while (*c == ' ' || *c == '\t') |
| 2341 | c++; |
| 2342 | |
| 2343 | |
| 2344 | arg = c; |
| 2345 | while (*c && *c != '\n' && *c != '\r') |
| 2346 | c++; |
| 2347 | *c = 0; |
| 2348 | |
| 2349 | /* empty lines are ignored too */ |
| 2350 | if (c == arg) |
| 2351 | continue; |
| 2352 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2353 | if (!pat_ref_append(ref, arg, NULL, line)) { |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2354 | memprintf(err, "out of memory when loading patterns from file <%s>", filename); |
| 2355 | goto out_close; |
| 2356 | } |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2357 | } |
| 2358 | |
Jerome Magnin | 3c79d4b | 2020-01-17 16:09:33 +0100 | [diff] [blame] | 2359 | if (ferror(file)) { |
| 2360 | memprintf(err, "error encountered while reading <%s> : %s", |
| 2361 | filename, strerror(errno)); |
| 2362 | goto out_close; |
| 2363 | } |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2364 | ret = 1; /* success */ |
| 2365 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2366 | out_close: |
| 2367 | fclose(file); |
| 2368 | return ret; |
| 2369 | } |
| 2370 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2371 | int pattern_read_from_file(struct pattern_head *head, unsigned int refflags, |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2372 | const char *filename, int patflags, int load_smp, |
Thierry FOURNIER | 94580c9 | 2014-02-11 14:36:45 +0100 | [diff] [blame] | 2373 | char **err, const char *file, int line) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2374 | { |
| 2375 | struct pat_ref *ref; |
| 2376 | struct pattern_expr *expr; |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2377 | struct pat_ref_elt *elt; |
Willy Tarreau | 4deaf39 | 2014-11-26 13:17:03 +0100 | [diff] [blame] | 2378 | int reuse = 0; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2379 | |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2380 | /* Lookup for the existing reference. */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2381 | ref = pat_ref_lookup(filename); |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2382 | |
| 2383 | /* If the reference doesn't exists, create it and load associated file. */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2384 | if (!ref) { |
Thierry FOURNIER | 94580c9 | 2014-02-11 14:36:45 +0100 | [diff] [blame] | 2385 | chunk_printf(&trash, |
| 2386 | "pattern loaded from file '%s' used by %s at file '%s' line %d", |
| 2387 | filename, refflags & PAT_REF_MAP ? "map" : "acl", file, line); |
| 2388 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2389 | ref = pat_ref_new(filename, trash.area, refflags); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2390 | if (!ref) { |
| 2391 | memprintf(err, "out of memory"); |
| 2392 | return 0; |
| 2393 | } |
| 2394 | |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2395 | if (load_smp) { |
Thierry FOURNIER | c0bd910 | 2014-01-29 12:32:58 +0100 | [diff] [blame] | 2396 | ref->flags |= PAT_REF_SMP; |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2397 | if (!pat_ref_read_from_file_smp(ref, filename, err)) |
| 2398 | return 0; |
| 2399 | } |
| 2400 | else { |
| 2401 | if (!pat_ref_read_from_file(ref, filename, err)) |
| 2402 | return 0; |
| 2403 | } |
| 2404 | } |
| 2405 | else { |
Thierry FOURNIER | c0bd910 | 2014-01-29 12:32:58 +0100 | [diff] [blame] | 2406 | /* The reference already exists, check the map compatibility. */ |
| 2407 | |
| 2408 | /* If the load require samples and the flag PAT_REF_SMP is not set, |
| 2409 | * the reference doesn't contain sample, and cannot be used. |
| 2410 | */ |
| 2411 | if (load_smp) { |
| 2412 | if (!(ref->flags & PAT_REF_SMP)) { |
| 2413 | memprintf(err, "The file \"%s\" is already used as one column file " |
| 2414 | "and cannot be used by as two column file.", |
| 2415 | filename); |
| 2416 | return 0; |
| 2417 | } |
| 2418 | } |
| 2419 | else { |
| 2420 | /* The load doesn't require samples. If the flag PAT_REF_SMP is |
| 2421 | * set, the reference contains a sample, and cannot be used. |
| 2422 | */ |
| 2423 | if (ref->flags & PAT_REF_SMP) { |
| 2424 | memprintf(err, "The file \"%s\" is already used as two column file " |
| 2425 | "and cannot be used by as one column file.", |
| 2426 | filename); |
| 2427 | return 0; |
| 2428 | } |
| 2429 | } |
| 2430 | |
Thierry FOURNIER | 94580c9 | 2014-02-11 14:36:45 +0100 | [diff] [blame] | 2431 | /* Extends display */ |
| 2432 | chunk_printf(&trash, "%s", ref->display); |
| 2433 | chunk_appendf(&trash, ", by %s at file '%s' line %d", |
| 2434 | refflags & PAT_REF_MAP ? "map" : "acl", file, line); |
| 2435 | free(ref->display); |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2436 | ref->display = strdup(trash.area); |
Thierry FOURNIER | 94580c9 | 2014-02-11 14:36:45 +0100 | [diff] [blame] | 2437 | if (!ref->display) { |
| 2438 | memprintf(err, "out of memory"); |
| 2439 | return 0; |
| 2440 | } |
| 2441 | |
Thierry FOURNIER | c0bd910 | 2014-01-29 12:32:58 +0100 | [diff] [blame] | 2442 | /* Merge flags. */ |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2443 | ref->flags |= refflags; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2444 | } |
| 2445 | |
| 2446 | /* Now, we can loading patterns from the reference. */ |
| 2447 | |
| 2448 | /* Lookup for existing reference in the head. If the reference |
| 2449 | * doesn't exists, create it. |
| 2450 | */ |
| 2451 | expr = pattern_lookup_expr(head, ref); |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 2452 | if (!expr || (expr->mflags != patflags)) { |
Emeric Brun | 7d27f3c | 2017-07-03 17:54:23 +0200 | [diff] [blame] | 2453 | expr = pattern_new_expr(head, ref, patflags, err, &reuse); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2454 | if (!expr) |
| 2455 | return 0; |
| 2456 | } |
| 2457 | |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2458 | /* The returned expression may be not empty, because the function |
| 2459 | * "pattern_new_expr" lookup for similar pattern list and can |
| 2460 | * reuse a already filled pattern list. In this case, we can not |
| 2461 | * reload the patterns. |
| 2462 | */ |
| 2463 | if (reuse) |
| 2464 | return 1; |
| 2465 | |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2466 | /* Load reference content in the pattern expression. */ |
| 2467 | list_for_each_entry(elt, &ref->head, list) { |
| 2468 | if (!pat_ref_push(elt, expr, patflags, err)) { |
| 2469 | if (elt->line > 0) |
| 2470 | memprintf(err, "%s at line %d of file '%s'", |
| 2471 | *err, elt->line, filename); |
| 2472 | return 0; |
| 2473 | } |
| 2474 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2475 | |
| 2476 | return 1; |
| 2477 | } |
| 2478 | |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2479 | /* This function executes a pattern match on a sample. It applies pattern <expr> |
Thayne McCombs | 8f0cc5c | 2021-01-07 21:35:52 -0700 | [diff] [blame] | 2480 | * to sample <smp>. The function returns NULL if the sample don't match. It returns |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2481 | * non-null if the sample match. If <fill> is true and the sample match, the |
| 2482 | * function returns the matched pattern. In many cases, this pattern can be a |
| 2483 | * static buffer. |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2484 | */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2485 | struct pattern *pattern_exec_match(struct pattern_head *head, struct sample *smp, int fill) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2486 | { |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2487 | struct pattern_expr_list *list; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2488 | struct pattern *pat; |
| 2489 | |
| 2490 | if (!head->match) { |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2491 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 2492 | static_pattern.data = NULL; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 2493 | static_pattern.ref = NULL; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 2494 | static_pattern.sflags = 0; |
Thierry FOURNIER | 07ee64e | 2015-07-06 23:43:03 +0200 | [diff] [blame] | 2495 | static_pattern.type = SMP_T_SINT; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 2496 | static_pattern.val.i = 1; |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2497 | } |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2498 | return &static_pattern; |
| 2499 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2500 | |
Thierry FOURNIER | 5d34408 | 2014-01-27 14:19:53 +0100 | [diff] [blame] | 2501 | /* convert input to string */ |
| 2502 | if (!sample_convert(smp, head->expect_type)) |
| 2503 | return NULL; |
| 2504 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2505 | list_for_each_entry(list, &head->head, list) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2506 | HA_RWLOCK_RDLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2507 | pat = head->match(smp, list->expr, fill); |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2508 | if (pat) { |
| 2509 | /* We duplicate the pattern cause it could be modified |
| 2510 | by another thread */ |
| 2511 | if (pat != &static_pattern) { |
| 2512 | memcpy(&static_pattern, pat, sizeof(struct pattern)); |
| 2513 | pat = &static_pattern; |
| 2514 | } |
| 2515 | |
| 2516 | /* We also duplicate the sample data for |
| 2517 | same reason */ |
| 2518 | if (pat->data && (pat->data != &static_sample_data)) { |
Christopher Faulet | 09fdf4b | 2017-11-09 16:14:16 +0100 | [diff] [blame] | 2519 | switch(pat->data->type) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2520 | case SMP_T_STR: |
| 2521 | static_sample_data.type = SMP_T_STR; |
| 2522 | static_sample_data.u.str = *get_trash_chunk(); |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2523 | static_sample_data.u.str.data = pat->data->u.str.data; |
| 2524 | if (static_sample_data.u.str.data >= static_sample_data.u.str.size) |
| 2525 | static_sample_data.u.str.data = static_sample_data.u.str.size - 1; |
| 2526 | memcpy(static_sample_data.u.str.area, |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2527 | pat->data->u.str.area, static_sample_data.u.str.data); |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2528 | static_sample_data.u.str.area[static_sample_data.u.str.data] = 0; |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2529 | pat->data = &static_sample_data; |
| 2530 | break; |
| 2531 | |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2532 | case SMP_T_IPV4: |
| 2533 | case SMP_T_IPV6: |
| 2534 | case SMP_T_SINT: |
| 2535 | memcpy(&static_sample_data, pat->data, sizeof(struct sample_data)); |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2536 | pat->data = &static_sample_data; |
| 2537 | break; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2538 | default: |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2539 | /* unimplemented pattern type */ |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2540 | pat->data = NULL; |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2541 | break; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2542 | } |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2543 | } |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2544 | HA_RWLOCK_RDUNLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2545 | return pat; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2546 | } |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2547 | HA_RWLOCK_RDUNLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2548 | } |
| 2549 | return NULL; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2550 | } |
| 2551 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2552 | /* This function prunes the pattern expressions starting at pattern_head <head>. */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2553 | void pattern_prune(struct pattern_head *head) |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 2554 | { |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2555 | struct pattern_expr_list *list, *safe; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2556 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2557 | list_for_each_entry_safe(list, safe, &head->head, list) { |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2558 | LIST_DELETE(&list->list); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2559 | if (list->do_free) { |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2560 | LIST_DELETE(&list->expr->list); |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2561 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2562 | head->prune(list->expr); |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2563 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2564 | free(list->expr); |
| 2565 | } |
| 2566 | free(list); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2567 | } |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 2568 | } |
| 2569 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2570 | /* This function searches occurrences of pattern reference element <ref> in |
| 2571 | * expression <expr> and returns a pointer to a pointer of the sample storage. |
| 2572 | * If <ref> is not found, NULL is returned. |
Thierry FOURNIER | 55d0b10 | 2014-01-15 11:25:26 +0100 | [diff] [blame] | 2573 | */ |
Thierry FOURNIER | 12ba0c2 | 2015-08-14 00:02:11 +0200 | [diff] [blame] | 2574 | struct sample_data **pattern_find_smp(struct pattern_expr *expr, struct pat_ref_elt *ref) |
Thierry FOURNIER | 55d0b10 | 2014-01-15 11:25:26 +0100 | [diff] [blame] | 2575 | { |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2576 | struct ebmb_node *node; |
| 2577 | struct pattern_tree *elt; |
| 2578 | struct pattern_list *pat; |
Thierry FOURNIER | 55d0b10 | 2014-01-15 11:25:26 +0100 | [diff] [blame] | 2579 | |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2580 | for (node = ebmb_first(&expr->pattern_tree); |
| 2581 | node; |
| 2582 | node = ebmb_next(node)) { |
| 2583 | elt = container_of(node, struct pattern_tree, node); |
| 2584 | if (elt->ref == ref) |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 2585 | return &elt->data; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2586 | } |
| 2587 | |
| 2588 | for (node = ebmb_first(&expr->pattern_tree_2); |
| 2589 | node; |
| 2590 | node = ebmb_next(node)) { |
| 2591 | elt = container_of(node, struct pattern_tree, node); |
| 2592 | if (elt->ref == ref) |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 2593 | return &elt->data; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2594 | } |
| 2595 | |
| 2596 | list_for_each_entry(pat, &expr->patterns, list) |
| 2597 | if (pat->pat.ref == ref) |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 2598 | return &pat->pat.data; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2599 | |
| 2600 | return NULL; |
Thierry FOURNIER | 55d0b10 | 2014-01-15 11:25:26 +0100 | [diff] [blame] | 2601 | } |
| 2602 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2603 | /* This function compares two pat_ref** on their unique_id, and returns -1/0/1 |
| 2604 | * depending on their order (suitable for sorting). |
| 2605 | */ |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2606 | static int cmp_pat_ref(const void *_a, const void *_b) |
| 2607 | { |
| 2608 | struct pat_ref * const *a = _a; |
| 2609 | struct pat_ref * const *b = _b; |
| 2610 | |
| 2611 | if ((*a)->unique_id < (*b)->unique_id) |
| 2612 | return -1; |
| 2613 | else if ((*a)->unique_id > (*b)->unique_id) |
| 2614 | return 1; |
| 2615 | return 0; |
| 2616 | } |
| 2617 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2618 | /* This function finalizes the configuration parsing. It sets all the |
| 2619 | * automatic ids. |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2620 | */ |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2621 | int pattern_finalize_config(void) |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2622 | { |
Tim Duesterhus | b584b44 | 2020-03-17 21:08:24 +0100 | [diff] [blame] | 2623 | size_t len = 0; |
| 2624 | size_t unassigned_pos = 0; |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2625 | int next_unique_id = 0; |
Tim Duesterhus | b584b44 | 2020-03-17 21:08:24 +0100 | [diff] [blame] | 2626 | size_t i, j; |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2627 | struct pat_ref *ref, **arr; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2628 | struct list pr = LIST_HEAD_INIT(pr); |
| 2629 | |
Willy Tarreau | 52bf839 | 2020-03-08 00:42:37 +0100 | [diff] [blame] | 2630 | pat_lru_seed = ha_random(); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 2631 | |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2632 | /* Count pat_refs with user defined unique_id and totalt count */ |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2633 | list_for_each_entry(ref, &pattern_reference, list) { |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2634 | len++; |
| 2635 | if (ref->unique_id != -1) |
| 2636 | unassigned_pos++; |
| 2637 | } |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2638 | |
Tim Duesterhus | b584b44 | 2020-03-17 21:08:24 +0100 | [diff] [blame] | 2639 | if (len == 0) { |
| 2640 | return 0; |
| 2641 | } |
| 2642 | |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2643 | arr = calloc(len, sizeof(*arr)); |
| 2644 | if (arr == NULL) { |
| 2645 | ha_alert("Out of memory error.\n"); |
| 2646 | return ERR_ALERT | ERR_FATAL; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2647 | } |
| 2648 | |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2649 | i = 0; |
| 2650 | j = unassigned_pos; |
| 2651 | list_for_each_entry(ref, &pattern_reference, list) { |
| 2652 | if (ref->unique_id != -1) |
| 2653 | arr[i++] = ref; |
| 2654 | else |
| 2655 | arr[j++] = ref; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2656 | } |
| 2657 | |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2658 | /* Sort first segment of array with user-defined unique ids for |
| 2659 | * fast lookup when generating unique ids |
| 2660 | */ |
| 2661 | qsort(arr, unassigned_pos, sizeof(*arr), cmp_pat_ref); |
| 2662 | |
| 2663 | /* Assign unique ids to the rest of the elements */ |
| 2664 | for (i = unassigned_pos; i < len; i++) { |
| 2665 | do { |
| 2666 | arr[i]->unique_id = next_unique_id++; |
| 2667 | } while (bsearch(&arr[i], arr, unassigned_pos, sizeof(*arr), cmp_pat_ref)); |
| 2668 | } |
| 2669 | |
| 2670 | /* Sort complete array */ |
| 2671 | qsort(arr, len, sizeof(*arr), cmp_pat_ref); |
| 2672 | |
| 2673 | /* Convert back to linked list */ |
| 2674 | for (i = 0; i < len; i++) |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2675 | LIST_APPEND(&pr, &arr[i]->list); |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2676 | |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2677 | /* swap root */ |
Willy Tarreau | 2b71810 | 2021-04-21 07:32:39 +0200 | [diff] [blame] | 2678 | LIST_INSERT(&pr, &pattern_reference); |
| 2679 | LIST_DELETE(&pr); |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2680 | |
| 2681 | free(arr); |
| 2682 | return 0; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2683 | } |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 2684 | |
| 2685 | static int pattern_per_thread_lru_alloc() |
| 2686 | { |
| 2687 | if (!global.tune.pattern_cache) |
| 2688 | return 1; |
| 2689 | pat_lru_tree = lru64_new(global.tune.pattern_cache); |
| 2690 | return !!pat_lru_tree; |
| 2691 | } |
| 2692 | |
| 2693 | static void pattern_per_thread_lru_free() |
| 2694 | { |
| 2695 | lru64_destroy(pat_lru_tree); |
| 2696 | } |
| 2697 | |
| 2698 | REGISTER_PER_THREAD_ALLOC(pattern_per_thread_lru_alloc); |
| 2699 | REGISTER_PER_THREAD_FREE(pattern_per_thread_lru_free); |