Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1 | /* |
| 2 | * Pattern management functions. |
| 3 | * |
| 4 | * Copyright 2000-2013 Willy Tarreau <w@1wt.eu> |
| 5 | * |
| 6 | * This program is free software; you can redistribute it and/or |
| 7 | * modify it under the terms of the GNU General Public License |
| 8 | * as published by the Free Software Foundation; either version |
| 9 | * 2 of the License, or (at your option) any later version. |
| 10 | * |
| 11 | */ |
| 12 | |
| 13 | #include <ctype.h> |
| 14 | #include <stdio.h> |
Jerome Magnin | b8bd6d7 | 2020-01-17 18:01:20 +0100 | [diff] [blame] | 15 | #include <errno.h> |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 16 | |
Willy Tarreau | b255105 | 2020-06-09 09:07:15 +0200 | [diff] [blame] | 17 | #include <import/ebsttree.h> |
| 18 | #include <import/lru.h> |
| 19 | #include <import/xxhash.h> |
| 20 | |
Willy Tarreau | 4c7e4b7 | 2020-05-27 12:58:42 +0200 | [diff] [blame] | 21 | #include <haproxy/api.h> |
Willy Tarreau | f268ee8 | 2020-06-04 17:05:57 +0200 | [diff] [blame] | 22 | #include <haproxy/global.h> |
Willy Tarreau | aeed4a8 | 2020-06-04 22:01:04 +0200 | [diff] [blame] | 23 | #include <haproxy/log.h> |
Willy Tarreau | 6131d6a | 2020-06-02 16:48:09 +0200 | [diff] [blame] | 24 | #include <haproxy/net_helper.h> |
Willy Tarreau | 225a90a | 2020-06-04 15:06:28 +0200 | [diff] [blame] | 25 | #include <haproxy/pattern.h> |
Willy Tarreau | 7cd8b6e | 2020-06-02 17:32:26 +0200 | [diff] [blame] | 26 | #include <haproxy/regex.h> |
Willy Tarreau | e6ce10b | 2020-06-04 15:33:47 +0200 | [diff] [blame] | 27 | #include <haproxy/sample.h> |
Willy Tarreau | b255105 | 2020-06-09 09:07:15 +0200 | [diff] [blame] | 28 | #include <haproxy/tools.h> |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 29 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 30 | |
Thierry FOURNIER | a65b343 | 2013-11-28 18:22:00 +0100 | [diff] [blame] | 31 | char *pat_match_names[PAT_MATCH_NUM] = { |
| 32 | [PAT_MATCH_FOUND] = "found", |
| 33 | [PAT_MATCH_BOOL] = "bool", |
| 34 | [PAT_MATCH_INT] = "int", |
| 35 | [PAT_MATCH_IP] = "ip", |
| 36 | [PAT_MATCH_BIN] = "bin", |
| 37 | [PAT_MATCH_LEN] = "len", |
| 38 | [PAT_MATCH_STR] = "str", |
| 39 | [PAT_MATCH_BEG] = "beg", |
| 40 | [PAT_MATCH_SUB] = "sub", |
| 41 | [PAT_MATCH_DIR] = "dir", |
| 42 | [PAT_MATCH_DOM] = "dom", |
| 43 | [PAT_MATCH_END] = "end", |
| 44 | [PAT_MATCH_REG] = "reg", |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 45 | [PAT_MATCH_REGM] = "regm", |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 46 | }; |
| 47 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 48 | int (*pat_parse_fcts[PAT_MATCH_NUM])(const char *, struct pattern *, int, char **) = { |
Thierry FOURNIER | a65b343 | 2013-11-28 18:22:00 +0100 | [diff] [blame] | 49 | [PAT_MATCH_FOUND] = pat_parse_nothing, |
| 50 | [PAT_MATCH_BOOL] = pat_parse_nothing, |
| 51 | [PAT_MATCH_INT] = pat_parse_int, |
| 52 | [PAT_MATCH_IP] = pat_parse_ip, |
| 53 | [PAT_MATCH_BIN] = pat_parse_bin, |
Thierry FOURNIER | 5d34408 | 2014-01-27 14:19:53 +0100 | [diff] [blame] | 54 | [PAT_MATCH_LEN] = pat_parse_int, |
Thierry FOURNIER | a65b343 | 2013-11-28 18:22:00 +0100 | [diff] [blame] | 55 | [PAT_MATCH_STR] = pat_parse_str, |
| 56 | [PAT_MATCH_BEG] = pat_parse_str, |
| 57 | [PAT_MATCH_SUB] = pat_parse_str, |
| 58 | [PAT_MATCH_DIR] = pat_parse_str, |
| 59 | [PAT_MATCH_DOM] = pat_parse_str, |
| 60 | [PAT_MATCH_END] = pat_parse_str, |
| 61 | [PAT_MATCH_REG] = pat_parse_reg, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 62 | [PAT_MATCH_REGM] = pat_parse_reg, |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 63 | }; |
| 64 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 65 | int (*pat_index_fcts[PAT_MATCH_NUM])(struct pattern_expr *, struct pattern *, char **) = { |
| 66 | [PAT_MATCH_FOUND] = pat_idx_list_val, |
| 67 | [PAT_MATCH_BOOL] = pat_idx_list_val, |
| 68 | [PAT_MATCH_INT] = pat_idx_list_val, |
| 69 | [PAT_MATCH_IP] = pat_idx_tree_ip, |
| 70 | [PAT_MATCH_BIN] = pat_idx_list_ptr, |
| 71 | [PAT_MATCH_LEN] = pat_idx_list_val, |
| 72 | [PAT_MATCH_STR] = pat_idx_tree_str, |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 73 | [PAT_MATCH_BEG] = pat_idx_tree_pfx, |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 74 | [PAT_MATCH_SUB] = pat_idx_list_str, |
| 75 | [PAT_MATCH_DIR] = pat_idx_list_str, |
| 76 | [PAT_MATCH_DOM] = pat_idx_list_str, |
| 77 | [PAT_MATCH_END] = pat_idx_list_str, |
| 78 | [PAT_MATCH_REG] = pat_idx_list_reg, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 79 | [PAT_MATCH_REGM] = pat_idx_list_regm, |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 80 | }; |
| 81 | |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 82 | void (*pat_prune_fcts[PAT_MATCH_NUM])(struct pattern_expr *) = { |
Willy Tarreau | 6d8a689 | 2020-11-02 19:26:02 +0100 | [diff] [blame] | 83 | [PAT_MATCH_FOUND] = pat_prune_gen, |
| 84 | [PAT_MATCH_BOOL] = pat_prune_gen, |
| 85 | [PAT_MATCH_INT] = pat_prune_gen, |
| 86 | [PAT_MATCH_IP] = pat_prune_gen, |
| 87 | [PAT_MATCH_BIN] = pat_prune_gen, |
| 88 | [PAT_MATCH_LEN] = pat_prune_gen, |
| 89 | [PAT_MATCH_STR] = pat_prune_gen, |
| 90 | [PAT_MATCH_BEG] = pat_prune_gen, |
| 91 | [PAT_MATCH_SUB] = pat_prune_gen, |
| 92 | [PAT_MATCH_DIR] = pat_prune_gen, |
| 93 | [PAT_MATCH_DOM] = pat_prune_gen, |
| 94 | [PAT_MATCH_END] = pat_prune_gen, |
| 95 | [PAT_MATCH_REG] = pat_prune_gen, |
| 96 | [PAT_MATCH_REGM] = pat_prune_gen, |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 97 | }; |
| 98 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 99 | struct pattern *(*pat_match_fcts[PAT_MATCH_NUM])(struct sample *, struct pattern_expr *, int) = { |
Thierry FOURNIER | a65b343 | 2013-11-28 18:22:00 +0100 | [diff] [blame] | 100 | [PAT_MATCH_FOUND] = NULL, |
| 101 | [PAT_MATCH_BOOL] = pat_match_nothing, |
| 102 | [PAT_MATCH_INT] = pat_match_int, |
| 103 | [PAT_MATCH_IP] = pat_match_ip, |
| 104 | [PAT_MATCH_BIN] = pat_match_bin, |
| 105 | [PAT_MATCH_LEN] = pat_match_len, |
| 106 | [PAT_MATCH_STR] = pat_match_str, |
| 107 | [PAT_MATCH_BEG] = pat_match_beg, |
| 108 | [PAT_MATCH_SUB] = pat_match_sub, |
| 109 | [PAT_MATCH_DIR] = pat_match_dir, |
| 110 | [PAT_MATCH_DOM] = pat_match_dom, |
| 111 | [PAT_MATCH_END] = pat_match_end, |
| 112 | [PAT_MATCH_REG] = pat_match_reg, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 113 | [PAT_MATCH_REGM] = pat_match_regm, |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 114 | }; |
| 115 | |
Thierry FOURNIER | e3ded59 | 2013-12-06 15:36:54 +0100 | [diff] [blame] | 116 | /* Just used for checking configuration compatibility */ |
| 117 | int pat_match_types[PAT_MATCH_NUM] = { |
Thierry FOURNIER | 07ee64e | 2015-07-06 23:43:03 +0200 | [diff] [blame] | 118 | [PAT_MATCH_FOUND] = SMP_T_SINT, |
| 119 | [PAT_MATCH_BOOL] = SMP_T_SINT, |
| 120 | [PAT_MATCH_INT] = SMP_T_SINT, |
Thierry FOURNIER | e3ded59 | 2013-12-06 15:36:54 +0100 | [diff] [blame] | 121 | [PAT_MATCH_IP] = SMP_T_ADDR, |
Thierry FOURNIER | 7654c9f | 2013-12-17 00:20:33 +0100 | [diff] [blame] | 122 | [PAT_MATCH_BIN] = SMP_T_BIN, |
| 123 | [PAT_MATCH_LEN] = SMP_T_STR, |
| 124 | [PAT_MATCH_STR] = SMP_T_STR, |
| 125 | [PAT_MATCH_BEG] = SMP_T_STR, |
| 126 | [PAT_MATCH_SUB] = SMP_T_STR, |
| 127 | [PAT_MATCH_DIR] = SMP_T_STR, |
| 128 | [PAT_MATCH_DOM] = SMP_T_STR, |
| 129 | [PAT_MATCH_END] = SMP_T_STR, |
| 130 | [PAT_MATCH_REG] = SMP_T_STR, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 131 | [PAT_MATCH_REGM] = SMP_T_STR, |
Thierry FOURNIER | e3ded59 | 2013-12-06 15:36:54 +0100 | [diff] [blame] | 132 | }; |
| 133 | |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 134 | /* this struct is used to return information */ |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 135 | static THREAD_LOCAL struct pattern static_pattern; |
| 136 | static THREAD_LOCAL struct sample_data static_sample_data; |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 137 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 138 | /* This is the root of the list of all pattern_ref avalaibles. */ |
| 139 | struct list pattern_reference = LIST_HEAD_INIT(pattern_reference); |
| 140 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 141 | static THREAD_LOCAL struct lru64_head *pat_lru_tree; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 142 | static unsigned long long pat_lru_seed; |
| 143 | |
/*
 *
 * The following functions are not exported and are used internally by the
 * pattern matching code.
 *
 */
| 150 | |
/* Background: Fast way to find a zero byte in a word
 * http://graphics.stanford.edu/~seander/bithacks.html#ZeroInWord
 * hasZeroByte = (v - 0x01010101UL) & ~v & 0x80808080UL;
 *
 * To look for 4 different byte values, xor the word with those bytes and
 * then check for zero bytes:
 *
 * v = (((unsigned char)c * 0x1010101U) ^ delimiter)
 * where <delimiter> is the 4 byte values to look for (as an uint)
 * and <c> is the character that is being tested
 *
 * Returns non-zero if <c> equals one of the 4 bytes packed in <mask>, and
 * zero otherwise.
 */
static inline unsigned int is_delimiter(unsigned char c, unsigned int mask)
{
	/* Propagate the char to all 4 bytes. The constant is unsigned so that
	 * the multiplication is not performed on a signed int, which would
	 * overflow for c >= 0x80.
	 */
	mask ^= (c * 0x01010101U);
	return (mask - 0x01010101U) & ~mask & 0x80808080U;
}
| 167 | |
/* Packs the four delimiter bytes <d1>..<d4> into a single word suitable for
 * is_delimiter(), with <d1> in the most significant byte and <d4> in the
 * least significant one.
 */
static inline unsigned int make_4delim(unsigned char d1, unsigned char d2, unsigned char d3, unsigned char d4)
{
	/* Convert to unsigned before shifting: an unsigned char is promoted to
	 * a signed int, and shifting a value >= 0x80 left by 24 bits would
	 * overflow it.
	 */
	return ((unsigned int)d1 << 24) |
	       ((unsigned int)d2 << 16) |
	       ((unsigned int)d3 << 8) |
	        (unsigned int)d4;
}
| 172 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 173 | |
/*
 *
 * These functions are exported and may be used by any other component.
 *
 * The following functions are used for parsing pattern matching input values.
 * <text> contains the string to be parsed. <pattern> must be a preallocated
 * pattern. The pat_parse_* functions fill this structure with the parsed value.
 * <err> is filled with an error message built with the memprintf() function.
 * It is allowed to use a trash as temporary storage for the returned pattern,
 * as the next call after these functions will be pat_idx_*.
 *
 * On success, the pat_parse_* functions return 1. On failure, they return 0
 * and <err> is filled.
 */
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 188 | |
/* Parser for matching methods which take no pattern value: every argument is
 * ignored, <pattern> is left untouched and 1 (success) is always returned.
 */
int pat_parse_nothing(const char *text, struct pattern *pattern, int mflags, char **err)
{
	(void)text;
	(void)pattern;
	(void)mflags;
	(void)err;

	return 1;
}
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 194 | |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 195 | /* Parse a string. It is allocated and duplicated. */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 196 | int pat_parse_str(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 197 | { |
Thierry FOURNIER | 7654c9f | 2013-12-17 00:20:33 +0100 | [diff] [blame] | 198 | pattern->type = SMP_T_STR; |
Thierry FOURNIER | edc15c3 | 2013-12-13 15:36:59 +0100 | [diff] [blame] | 199 | pattern->ptr.str = (char *)text; |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 200 | pattern->len = strlen(text); |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 201 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 202 | } |
| 203 | |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 204 | /* Parse a binary written in hexa. It is allocated. */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 205 | int pat_parse_bin(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 206 | { |
Willy Tarreau | 83061a8 | 2018-07-13 11:56:34 +0200 | [diff] [blame] | 207 | struct buffer *trash; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 208 | |
Thierry FOURNIER | 7654c9f | 2013-12-17 00:20:33 +0100 | [diff] [blame] | 209 | pattern->type = SMP_T_BIN; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 210 | trash = get_trash_chunk(); |
| 211 | pattern->len = trash->size; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 212 | pattern->ptr.str = trash->area; |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 213 | return !!parse_binary(text, &pattern->ptr.str, &pattern->len, err); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 214 | } |
| 215 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 216 | /* Parse a regex. It is allocated. */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 217 | int pat_parse_reg(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 218 | { |
Thierry FOURNIER | 0b6d15f | 2014-01-29 19:35:16 +0100 | [diff] [blame] | 219 | pattern->ptr.str = (char *)text; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 220 | return 1; |
| 221 | } |
| 222 | |
| 223 | /* Parse a range of positive integers delimited by either ':' or '-'. If only |
| 224 | * one integer is read, it is set as both min and max. An operator may be |
| 225 | * specified as the prefix, among this list of 5 : |
| 226 | * |
| 227 | * 0:eq, 1:gt, 2:ge, 3:lt, 4:le |
| 228 | * |
| 229 | * The default operator is "eq". It supports range matching. Ranges are |
| 230 | * rejected for other operators. The operator may be changed at any time. |
| 231 | * The operator is stored in the 'opaque' argument. |
| 232 | * |
| 233 | * If err is non-NULL, an error message will be returned there on errors and |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 234 | * the caller will have to free it. The function returns zero on error, and |
| 235 | * non-zero on success. |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 236 | * |
| 237 | */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 238 | int pat_parse_int(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 239 | { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 240 | const char *ptr = text; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 241 | |
Thierry FOURNIER | 07ee64e | 2015-07-06 23:43:03 +0200 | [diff] [blame] | 242 | pattern->type = SMP_T_SINT; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 243 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 244 | /* Empty string is not valid */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 245 | if (!*text) |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 246 | goto not_valid_range; |
| 247 | |
| 248 | /* Search ':' or '-' separator. */ |
| 249 | while (*ptr != '\0' && *ptr != ':' && *ptr != '-') |
| 250 | ptr++; |
| 251 | |
| 252 | /* If separator not found. */ |
| 253 | if (!*ptr) { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 254 | if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0) { |
| 255 | memprintf(err, "'%s' is not a number", text); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 256 | return 0; |
| 257 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 258 | pattern->val.range.max = pattern->val.range.min; |
| 259 | pattern->val.range.min_set = 1; |
| 260 | pattern->val.range.max_set = 1; |
| 261 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 262 | } |
| 263 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 264 | /* If the separator is the first character. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 265 | if (ptr == text && *(ptr + 1) != '\0') { |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 266 | if (strl2llrc(ptr + 1, strlen(ptr + 1), &pattern->val.range.max) != 0) |
| 267 | goto not_valid_range; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 268 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 269 | pattern->val.range.min_set = 0; |
| 270 | pattern->val.range.max_set = 1; |
| 271 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 272 | } |
| 273 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 274 | /* If separator is the last character. */ |
| 275 | if (*(ptr + 1) == '\0') { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 276 | if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0) |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 277 | goto not_valid_range; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 278 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 279 | pattern->val.range.min_set = 1; |
| 280 | pattern->val.range.max_set = 0; |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 281 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 282 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 283 | |
| 284 | /* Else, parse two numbers. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 285 | if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0) |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 286 | goto not_valid_range; |
| 287 | |
| 288 | if (strl2llrc(ptr + 1, strlen(ptr + 1), &pattern->val.range.max) != 0) |
| 289 | goto not_valid_range; |
| 290 | |
| 291 | if (pattern->val.range.min > pattern->val.range.max) |
| 292 | goto not_valid_range; |
| 293 | |
| 294 | pattern->val.range.min_set = 1; |
| 295 | pattern->val.range.max_set = 1; |
| 296 | return 1; |
| 297 | |
| 298 | not_valid_range: |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 299 | memprintf(err, "'%s' is not a valid number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 300 | return 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 301 | } |
| 302 | |
| 303 | /* Parse a range of positive 2-component versions delimited by either ':' or |
| 304 | * '-'. The version consists in a major and a minor, both of which must be |
| 305 | * smaller than 65536, because internally they will be represented as a 32-bit |
| 306 | * integer. |
| 307 | * If only one version is read, it is set as both min and max. Just like for |
| 308 | * pure integers, an operator may be specified as the prefix, among this list |
| 309 | * of 5 : |
| 310 | * |
| 311 | * 0:eq, 1:gt, 2:ge, 3:lt, 4:le |
| 312 | * |
| 313 | * The default operator is "eq". It supports range matching. Ranges are |
| 314 | * rejected for other operators. The operator may be changed at any time. |
| 315 | * The operator is stored in the 'opaque' argument. This allows constructs |
| 316 | * such as the following one : |
| 317 | * |
| 318 | * acl obsolete_ssl ssl_req_proto lt 3 |
| 319 | * acl unsupported_ssl ssl_req_proto gt 3.1 |
| 320 | * acl valid_ssl ssl_req_proto 3.0-3.1 |
| 321 | * |
| 322 | */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 323 | int pat_parse_dotted_ver(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 324 | { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 325 | const char *ptr = text; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 326 | |
Thierry FOURNIER | 07ee64e | 2015-07-06 23:43:03 +0200 | [diff] [blame] | 327 | pattern->type = SMP_T_SINT; |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 328 | |
| 329 | /* Search ':' or '-' separator. */ |
| 330 | while (*ptr != '\0' && *ptr != ':' && *ptr != '-') |
| 331 | ptr++; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 332 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 333 | /* If separator not found. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 334 | if (*ptr == '\0' && ptr > text) { |
| 335 | if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) { |
| 336 | memprintf(err, "'%s' is not a dotted number", text); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 337 | return 0; |
| 338 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 339 | pattern->val.range.max = pattern->val.range.min; |
| 340 | pattern->val.range.min_set = 1; |
| 341 | pattern->val.range.max_set = 1; |
| 342 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 343 | } |
| 344 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 345 | /* If the separator is the first character. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 346 | if (ptr == text && *(ptr+1) != '\0') { |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 347 | if (strl2llrc_dotted(ptr+1, strlen(ptr+1), &pattern->val.range.max) != 0) { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 348 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 349 | return 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 350 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 351 | pattern->val.range.min_set = 0; |
| 352 | pattern->val.range.max_set = 1; |
| 353 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 354 | } |
| 355 | |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 356 | /* If separator is the last character. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 357 | if (ptr == &text[strlen(text)-1]) { |
| 358 | if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) { |
| 359 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 360 | return 0; |
| 361 | } |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 362 | pattern->val.range.min_set = 1; |
| 363 | pattern->val.range.max_set = 0; |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 364 | return 1; |
| 365 | } |
| 366 | |
| 367 | /* Else, parse two numbers. */ |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 368 | if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) { |
| 369 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 370 | return 0; |
| 371 | } |
| 372 | if (strl2llrc_dotted(ptr+1, strlen(ptr+1), &pattern->val.range.max) != 0) { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 373 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 374 | return 0; |
| 375 | } |
| 376 | if (pattern->val.range.min > pattern->val.range.max) { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 377 | memprintf(err, "'%s' is not a valid dotted number range", text); |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 378 | return 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 379 | } |
Thierry FOURNIER | 511e947 | 2014-01-23 17:40:34 +0100 | [diff] [blame] | 380 | pattern->val.range.min_set = 1; |
| 381 | pattern->val.range.max_set = 1; |
| 382 | return 1; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 383 | } |
| 384 | |
| 385 | /* Parse an IP address and an optional mask in the form addr[/mask]. |
| 386 | * The addr may either be an IPv4 address or a hostname. The mask |
| 387 | * may either be a dotted mask or a number of bits. Returns 1 if OK, |
| 388 | * otherwise 0. NOTE: IP address patterns are typed (IPV4/IPV6). |
| 389 | */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 390 | int pat_parse_ip(const char *text, struct pattern *pattern, int mflags, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 391 | { |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 392 | if (str2net(text, !(mflags & PAT_MF_NO_DNS) && (global.mode & MODE_STARTING), |
Thierry FOURNIER | fc7ac7b | 2014-02-11 15:23:04 +0100 | [diff] [blame] | 393 | &pattern->val.ipv4.addr, &pattern->val.ipv4.mask)) { |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 394 | pattern->type = SMP_T_IPV4; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 395 | return 1; |
| 396 | } |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 397 | else if (str62net(text, &pattern->val.ipv6.addr, &pattern->val.ipv6.mask)) { |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 398 | pattern->type = SMP_T_IPV6; |
| 399 | return 1; |
| 400 | } |
| 401 | else { |
Thierry FOURNIER | 580c32c | 2014-01-24 10:58:12 +0100 | [diff] [blame] | 402 | memprintf(err, "'%s' is not a valid IPv4 or IPv6 address", text); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 403 | return 0; |
| 404 | } |
| 405 | } |
| 406 | |
/*
 *
 * These functions are exported and may be used by any other component.
 *
 * Each of the following functions takes a sample <smp> and checks whether it
 * matches the pattern expression <expr>. On a match, a pointer to a pattern
 * is returned; otherwise NULL is returned.
 *
 */
| 416 | |
| 417 | /* always return false */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 418 | struct pattern *pat_match_nothing(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 419 | { |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 420 | if (smp->data.u.sint) { |
Thierry FOURNIER | e5978bf | 2014-03-17 19:53:10 +0100 | [diff] [blame] | 421 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 422 | static_pattern.data = NULL; |
Thierry FOURNIER | e5978bf | 2014-03-17 19:53:10 +0100 | [diff] [blame] | 423 | static_pattern.ref = NULL; |
Thierry FOURNIER | e5978bf | 2014-03-17 19:53:10 +0100 | [diff] [blame] | 424 | static_pattern.type = 0; |
| 425 | static_pattern.ptr.str = NULL; |
| 426 | } |
| 427 | return &static_pattern; |
| 428 | } |
| 429 | else |
| 430 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 431 | } |
| 432 | |
| 433 | |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 434 | /* NB: For two strings to be identical, it is required that their length match */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 435 | struct pattern *pat_match_str(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 436 | { |
| 437 | int icase; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 438 | struct ebmb_node *node; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 439 | struct pattern_tree *elt; |
| 440 | struct pattern_list *lst; |
| 441 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 442 | struct pattern *ret = NULL; |
| 443 | struct lru64 *lru = NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 444 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 445 | /* Lookup a string in the expression's pattern tree. */ |
| 446 | if (!eb_is_empty(&expr->pattern_tree)) { |
Christopher Faulet | b4cf7ab | 2020-06-30 18:52:32 +0200 | [diff] [blame] | 447 | char prev = 0; |
| 448 | |
| 449 | if (smp->data.u.str.data < smp->data.u.str.size) { |
| 450 | /* we may have to force a trailing zero on the test pattern and |
| 451 | * the buffer is large enough to accommodate it. |
| 452 | */ |
| 453 | prev = smp->data.u.str.area[smp->data.u.str.data]; |
| 454 | if (prev) |
| 455 | smp->data.u.str.area[smp->data.u.str.data] = '\0'; |
| 456 | } |
| 457 | else { |
| 458 | /* Otherwise, the sample is duplicated. A trailing zero |
| 459 | * is automatically added to the string. |
| 460 | */ |
| 461 | if (!smp_dup(smp)) |
| 462 | return NULL; |
| 463 | } |
| 464 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 465 | node = ebst_lookup(&expr->pattern_tree, smp->data.u.str.area); |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 466 | if (prev) |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 467 | smp->data.u.str.area[smp->data.u.str.data] = prev; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 468 | |
| 469 | while (node) { |
| 470 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 471 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
| 472 | node = ebmb_next(node); |
| 473 | continue; |
| 474 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 475 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 476 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 477 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 478 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 479 | static_pattern.type = SMP_T_STR; |
| 480 | static_pattern.ptr.str = (char *)elt->node.key; |
| 481 | } |
| 482 | return &static_pattern; |
| 483 | } |
| 484 | } |
| 485 | |
| 486 | /* look in the list */ |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 487 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 488 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 489 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 490 | lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 491 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 492 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 493 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 494 | return ret; |
| 495 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 496 | } |
| 497 | |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 498 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 499 | list_for_each_entry(lst, &expr->patterns, list) { |
| 500 | pattern = &lst->pat; |
| 501 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 502 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 503 | continue; |
| 504 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 505 | if (pattern->len != smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 506 | continue; |
| 507 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 508 | icase = expr->mflags & PAT_MF_IGNORE_CASE; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 509 | if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0) || |
| 510 | (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0)) { |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 511 | ret = pattern; |
| 512 | break; |
| 513 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 514 | } |
| 515 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 516 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 517 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 518 | |
| 519 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 520 | } |
| 521 | |
| 522 | /* NB: For two binaries buf to be identical, it is required that their lengths match */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 523 | struct pattern *pat_match_bin(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 524 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 525 | struct pattern_list *lst; |
| 526 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 527 | struct pattern *ret = NULL; |
| 528 | struct lru64 *lru = NULL; |
| 529 | |
| 530 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 531 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 532 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 533 | lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 534 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 535 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 536 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 537 | return ret; |
| 538 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 539 | } |
| 540 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 541 | list_for_each_entry(lst, &expr->patterns, list) { |
| 542 | pattern = &lst->pat; |
| 543 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 544 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 545 | continue; |
| 546 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 547 | if (pattern->len != smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 548 | continue; |
| 549 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 550 | if (memcmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0) { |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 551 | ret = pattern; |
| 552 | break; |
| 553 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 554 | } |
| 555 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 556 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 557 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 558 | |
| 559 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 560 | } |
| 561 | |
| 562 | /* Executes a regex. It temporarily changes the data to add a trailing zero, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 563 | * and restores the previous character when leaving. This function fills |
| 564 | * a matching array. |
| 565 | */ |
| 566 | struct pattern *pat_match_regm(struct sample *smp, struct pattern_expr *expr, int fill) |
| 567 | { |
| 568 | struct pattern_list *lst; |
| 569 | struct pattern *pattern; |
| 570 | struct pattern *ret = NULL; |
| 571 | |
| 572 | list_for_each_entry(lst, &expr->patterns, list) { |
| 573 | pattern = &lst->pat; |
| 574 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 575 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 576 | continue; |
| 577 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 578 | if (regex_exec_match2(pattern->ptr.reg, smp->data.u.str.area, smp->data.u.str.data, |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 579 | MAX_MATCH, pmatch, 0)) { |
| 580 | ret = pattern; |
| 581 | smp->ctx.a[0] = pmatch; |
| 582 | break; |
| 583 | } |
| 584 | } |
| 585 | |
| 586 | return ret; |
| 587 | } |
| 588 | |
| 589 | /* Executes a regex. It temporarily changes the data to add a trailing zero, |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 590 | * and restores the previous character when leaving. |
| 591 | */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 592 | struct pattern *pat_match_reg(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 593 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 594 | struct pattern_list *lst; |
| 595 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 596 | struct pattern *ret = NULL; |
| 597 | struct lru64 *lru = NULL; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 598 | |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 599 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 600 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 601 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 602 | lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 603 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 604 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 605 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 606 | return ret; |
| 607 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 608 | } |
| 609 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 610 | list_for_each_entry(lst, &expr->patterns, list) { |
| 611 | pattern = &lst->pat; |
| 612 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 613 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 614 | continue; |
| 615 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 616 | if (regex_exec2(pattern->ptr.reg, smp->data.u.str.area, smp->data.u.str.data)) { |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 617 | ret = pattern; |
| 618 | break; |
| 619 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 620 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 621 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 622 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 623 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 624 | |
| 625 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 626 | } |
| 627 | |
| 628 | /* Checks that the pattern matches the beginning of the tested string. */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 629 | struct pattern *pat_match_beg(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 630 | { |
| 631 | int icase; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 632 | struct ebmb_node *node; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 633 | struct pattern_tree *elt; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 634 | struct pattern_list *lst; |
| 635 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 636 | struct pattern *ret = NULL; |
| 637 | struct lru64 *lru = NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 638 | |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 639 | /* Lookup a string in the expression's pattern tree. */ |
| 640 | if (!eb_is_empty(&expr->pattern_tree)) { |
Christopher Faulet | b4cf7ab | 2020-06-30 18:52:32 +0200 | [diff] [blame] | 641 | char prev = 0; |
| 642 | |
| 643 | if (smp->data.u.str.data < smp->data.u.str.size) { |
| 644 | /* we may have to force a trailing zero on the test pattern and |
| 645 | * the buffer is large enough to accommodate it. |
| 646 | */ |
| 647 | prev = smp->data.u.str.area[smp->data.u.str.data]; |
| 648 | if (prev) |
| 649 | smp->data.u.str.area[smp->data.u.str.data] = '\0'; |
| 650 | } |
| 651 | else { |
| 652 | /* Otherwise, the sample is duplicated. A trailing zero |
| 653 | * is automatically added to the string. |
| 654 | */ |
| 655 | if (!smp_dup(smp)) |
| 656 | return NULL; |
| 657 | } |
| 658 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 659 | node = ebmb_lookup_longest(&expr->pattern_tree, |
| 660 | smp->data.u.str.area); |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 661 | if (prev) |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 662 | smp->data.u.str.area[smp->data.u.str.data] = prev; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 663 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 664 | while (node) { |
| 665 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 666 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
| 667 | node = ebmb_next(node); |
| 668 | continue; |
| 669 | } |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 670 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 671 | static_pattern.data = elt->data; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 672 | static_pattern.ref = elt->ref; |
| 673 | static_pattern.sflags = PAT_SF_TREE; |
| 674 | static_pattern.type = SMP_T_STR; |
| 675 | static_pattern.ptr.str = (char *)elt->node.key; |
| 676 | } |
| 677 | return &static_pattern; |
| 678 | } |
| 679 | } |
| 680 | |
| 681 | /* look in the list */ |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 682 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 683 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 684 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 685 | lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 686 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 687 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 688 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 689 | return ret; |
| 690 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 691 | } |
| 692 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 693 | list_for_each_entry(lst, &expr->patterns, list) { |
| 694 | pattern = &lst->pat; |
| 695 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 696 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 697 | continue; |
| 698 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 699 | if (pattern->len > smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 700 | continue; |
| 701 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 702 | icase = expr->mflags & PAT_MF_IGNORE_CASE; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 703 | if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area, pattern->len) != 0) || |
| 704 | (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area, pattern->len) != 0)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 705 | continue; |
| 706 | |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 707 | ret = pattern; |
| 708 | break; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 709 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 710 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 711 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 712 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 713 | |
| 714 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 715 | } |
| 716 | |
| 717 | /* Checks that the pattern matches the end of the tested string. */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 718 | struct pattern *pat_match_end(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 719 | { |
| 720 | int icase; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 721 | struct pattern_list *lst; |
| 722 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 723 | struct pattern *ret = NULL; |
| 724 | struct lru64 *lru = NULL; |
| 725 | |
| 726 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 727 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 728 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 729 | lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 730 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 731 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 732 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 733 | return ret; |
| 734 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 735 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 736 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 737 | list_for_each_entry(lst, &expr->patterns, list) { |
| 738 | pattern = &lst->pat; |
| 739 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 740 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 741 | continue; |
| 742 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 743 | if (pattern->len > smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 744 | continue; |
| 745 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 746 | icase = expr->mflags & PAT_MF_IGNORE_CASE; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 747 | if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area + smp->data.u.str.data - pattern->len, pattern->len) != 0) || |
| 748 | (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area + smp->data.u.str.data - pattern->len, pattern->len) != 0)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 749 | continue; |
| 750 | |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 751 | ret = pattern; |
| 752 | break; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 753 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 754 | |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 755 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 756 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 757 | |
| 758 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 759 | } |
| 760 | |
| 761 | /* Checks that the pattern is included inside the tested string. |
| 762 | * NB: Suboptimal, should be rewritten using a Boyer-Moore method. |
| 763 | */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 764 | struct pattern *pat_match_sub(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 765 | { |
| 766 | int icase; |
| 767 | char *end; |
| 768 | char *c; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 769 | struct pattern_list *lst; |
| 770 | struct pattern *pattern; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 771 | struct pattern *ret = NULL; |
| 772 | struct lru64 *lru = NULL; |
| 773 | |
| 774 | if (pat_lru_tree) { |
Willy Tarreau | aee9314 | 2015-05-04 17:18:42 +0200 | [diff] [blame] | 775 | unsigned long long seed = pat_lru_seed ^ (long)expr; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 776 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 777 | lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed), |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 778 | pat_lru_tree, expr, expr->ref->revision); |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 779 | if (lru && lru->domain) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 780 | ret = lru->data; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 781 | return ret; |
| 782 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 783 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 784 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 785 | list_for_each_entry(lst, &expr->patterns, list) { |
| 786 | pattern = &lst->pat; |
| 787 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 788 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 789 | continue; |
| 790 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 791 | if (pattern->len > smp->data.u.str.data) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 792 | continue; |
| 793 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 794 | end = smp->data.u.str.area + smp->data.u.str.data - pattern->len; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 795 | icase = expr->mflags & PAT_MF_IGNORE_CASE; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 796 | if (icase) { |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 797 | for (c = smp->data.u.str.area; c <= end; c++) { |
Willy Tarreau | f278eec | 2020-07-05 21:46:32 +0200 | [diff] [blame] | 798 | if (tolower((unsigned char)*c) != tolower((unsigned char)*pattern->ptr.str)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 799 | continue; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 800 | if (strncasecmp(pattern->ptr.str, c, pattern->len) == 0) { |
| 801 | ret = pattern; |
| 802 | goto leave; |
| 803 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 804 | } |
| 805 | } else { |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 806 | for (c = smp->data.u.str.area; c <= end; c++) { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 807 | if (*c != *pattern->ptr.str) |
| 808 | continue; |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 809 | if (strncmp(pattern->ptr.str, c, pattern->len) == 0) { |
| 810 | ret = pattern; |
| 811 | goto leave; |
| 812 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 813 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 814 | } |
| 815 | } |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 816 | leave: |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 817 | if (lru) |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 818 | lru64_commit(lru, ret, expr, expr->ref->revision, NULL); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 819 | |
| 820 | return ret; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 821 | } |
| 822 | |
| 823 | /* This one is used by other real functions. It checks that the pattern is |
| 824 | * included inside the tested string, but enclosed between the specified |
| 825 | * delimiters or at the beginning or end of the string. The delimiters are |
| 826 | * provided as an unsigned int made by make_4delim() and match up to 4 different |
| 827 | * delimiters. Delimiters are stripped at the beginning and end of the pattern. |
| 828 | */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 829 | static int match_word(struct sample *smp, struct pattern *pattern, int mflags, unsigned int delimiters) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 830 | { |
| 831 | int may_match, icase; |
| 832 | char *c, *end; |
| 833 | char *ps; |
| 834 | int pl; |
| 835 | |
| 836 | pl = pattern->len; |
| 837 | ps = pattern->ptr.str; |
| 838 | |
| 839 | while (pl > 0 && is_delimiter(*ps, delimiters)) { |
| 840 | pl--; |
| 841 | ps++; |
| 842 | } |
| 843 | |
| 844 | while (pl > 0 && is_delimiter(ps[pl - 1], delimiters)) |
| 845 | pl--; |
| 846 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 847 | if (pl > smp->data.u.str.data) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 848 | return PAT_NOMATCH; |
| 849 | |
| 850 | may_match = 1; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 851 | icase = mflags & PAT_MF_IGNORE_CASE; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 852 | end = smp->data.u.str.area + smp->data.u.str.data - pl; |
| 853 | for (c = smp->data.u.str.area; c <= end; c++) { |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 854 | if (is_delimiter(*c, delimiters)) { |
| 855 | may_match = 1; |
| 856 | continue; |
| 857 | } |
| 858 | |
| 859 | if (!may_match) |
| 860 | continue; |
| 861 | |
| 862 | if (icase) { |
Willy Tarreau | f278eec | 2020-07-05 21:46:32 +0200 | [diff] [blame] | 863 | if ((tolower((unsigned char)*c) == tolower((unsigned char)*ps)) && |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 864 | (strncasecmp(ps, c, pl) == 0) && |
| 865 | (c == end || is_delimiter(c[pl], delimiters))) |
| 866 | return PAT_MATCH; |
| 867 | } else { |
| 868 | if ((*c == *ps) && |
| 869 | (strncmp(ps, c, pl) == 0) && |
| 870 | (c == end || is_delimiter(c[pl], delimiters))) |
| 871 | return PAT_MATCH; |
| 872 | } |
| 873 | may_match = 0; |
| 874 | } |
| 875 | return PAT_NOMATCH; |
| 876 | } |
| 877 | |
| 878 | /* Checks that the pattern is included inside the tested string, but enclosed |
| 879 | * between the delimiters '?' or '/' or at the beginning or end of the string. |
| 880 | * Delimiters at the beginning or end of the pattern are ignored. |
| 881 | */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 882 | struct pattern *pat_match_dir(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 883 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 884 | struct pattern_list *lst; |
| 885 | struct pattern *pattern; |
| 886 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 887 | list_for_each_entry(lst, &expr->patterns, list) { |
| 888 | pattern = &lst->pat; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 889 | |
| 890 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 891 | continue; |
| 892 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 893 | if (match_word(smp, pattern, expr->mflags, make_4delim('/', '?', '?', '?'))) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 894 | return pattern; |
| 895 | } |
| 896 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 897 | } |
| 898 | |
| 899 | /* Checks that the pattern is included inside the tested string, but enclosed |
| 900 | * between the delmiters '/', '?', '.' or ":" or at the beginning or end of |
| 901 | * the string. Delimiters at the beginning or end of the pattern are ignored. |
| 902 | */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 903 | struct pattern *pat_match_dom(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 904 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 905 | struct pattern_list *lst; |
| 906 | struct pattern *pattern; |
| 907 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 908 | list_for_each_entry(lst, &expr->patterns, list) { |
| 909 | pattern = &lst->pat; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 910 | |
| 911 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 912 | continue; |
| 913 | |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 914 | if (match_word(smp, pattern, expr->mflags, make_4delim('/', '?', '.', ':'))) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 915 | return pattern; |
| 916 | } |
| 917 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 918 | } |
| 919 | |
| 920 | /* Checks that the integer in <test> is included between min and max */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 921 | struct pattern *pat_match_int(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 922 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 923 | struct pattern_list *lst; |
| 924 | struct pattern *pattern; |
| 925 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 926 | list_for_each_entry(lst, &expr->patterns, list) { |
| 927 | pattern = &lst->pat; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 928 | |
| 929 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 930 | continue; |
| 931 | |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 932 | if ((!pattern->val.range.min_set || pattern->val.range.min <= smp->data.u.sint) && |
| 933 | (!pattern->val.range.max_set || smp->data.u.sint <= pattern->val.range.max)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 934 | return pattern; |
| 935 | } |
| 936 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 937 | } |
| 938 | |
| 939 | /* Checks that the length of the pattern in <test> is included between min and max */ |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 940 | struct pattern *pat_match_len(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 941 | { |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 942 | struct pattern_list *lst; |
| 943 | struct pattern *pattern; |
| 944 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 945 | list_for_each_entry(lst, &expr->patterns, list) { |
| 946 | pattern = &lst->pat; |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 947 | |
| 948 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 949 | continue; |
| 950 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 951 | if ((!pattern->val.range.min_set || pattern->val.range.min <= smp->data.u.str.data) && |
| 952 | (!pattern->val.range.max_set || smp->data.u.str.data <= pattern->val.range.max)) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 953 | return pattern; |
| 954 | } |
| 955 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 956 | } |
| 957 | |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 958 | struct pattern *pat_match_ip(struct sample *smp, struct pattern_expr *expr, int fill) |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 959 | { |
| 960 | unsigned int v4; /* in network byte order */ |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 961 | struct in6_addr tmp6; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 962 | struct in_addr *s; |
| 963 | struct ebmb_node *node; |
| 964 | struct pattern_tree *elt; |
| 965 | struct pattern_list *lst; |
| 966 | struct pattern *pattern; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 967 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 968 | /* The input sample is IPv4. Try to match in the trees. */ |
Thierry FOURNIER | 8c542ca | 2015-08-19 09:00:18 +0200 | [diff] [blame] | 969 | if (smp->data.type == SMP_T_IPV4) { |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 970 | /* Lookup an IPv4 address in the expression's pattern tree using |
| 971 | * the longest match method. |
| 972 | */ |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 973 | s = &smp->data.u.ipv4; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 974 | node = ebmb_lookup_longest(&expr->pattern_tree, &s->s_addr); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 975 | while (node) { |
| 976 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 977 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
| 978 | node = ebmb_next(node); |
| 979 | continue; |
| 980 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 981 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 982 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 983 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 984 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 985 | static_pattern.type = SMP_T_IPV4; |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 986 | static_pattern.val.ipv4.addr.s_addr = read_u32(elt->node.key); |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 987 | if (!cidr2dotted(elt->node.node.pfx, &static_pattern.val.ipv4.mask)) |
| 988 | return NULL; |
| 989 | } |
| 990 | return &static_pattern; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 991 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 992 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 993 | /* The IPv4 sample dont match the IPv4 tree. Convert the IPv4 |
| 994 | * sample address to IPv6 with the mapping method using the ::ffff: |
| 995 | * prefix, and try to lookup in the IPv6 tree. |
| 996 | */ |
| 997 | memset(&tmp6, 0, 10); |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 998 | write_u16(&tmp6.s6_addr[10], htons(0xffff)); |
| 999 | write_u32(&tmp6.s6_addr[12], smp->data.u.ipv4.s_addr); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1000 | node = ebmb_lookup_longest(&expr->pattern_tree_2, &tmp6); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1001 | while (node) { |
| 1002 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 1003 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
| 1004 | node = ebmb_next(node); |
| 1005 | continue; |
| 1006 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1007 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1008 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1009 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1010 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1011 | static_pattern.type = SMP_T_IPV6; |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1012 | memcpy(&static_pattern.val.ipv6.addr, elt->node.key, 16); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1013 | static_pattern.val.ipv6.mask = elt->node.node.pfx; |
| 1014 | } |
| 1015 | return &static_pattern; |
| 1016 | } |
| 1017 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1018 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1019 | /* The input sample is IPv6. Try to match in the trees. */ |
Thierry FOURNIER | 8c542ca | 2015-08-19 09:00:18 +0200 | [diff] [blame] | 1020 | if (smp->data.type == SMP_T_IPV6) { |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1021 | /* Lookup an IPv6 address in the expression's pattern tree using |
| 1022 | * the longest match method. |
| 1023 | */ |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 1024 | node = ebmb_lookup_longest(&expr->pattern_tree_2, &smp->data.u.ipv6); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1025 | while (node) { |
| 1026 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 1027 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
| 1028 | node = ebmb_next(node); |
| 1029 | continue; |
| 1030 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1031 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1032 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1033 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1034 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1035 | static_pattern.type = SMP_T_IPV6; |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1036 | memcpy(&static_pattern.val.ipv6.addr, elt->node.key, 16); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1037 | static_pattern.val.ipv6.mask = elt->node.node.pfx; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1038 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1039 | return &static_pattern; |
| 1040 | } |
| 1041 | |
| 1042 | /* Try to convert 6 to 4 when the start of the ipv6 address match the |
| 1043 | * following forms : |
| 1044 | * - ::ffff:ip:v4 (ipv4 mapped) |
| 1045 | * - ::0000:ip:v4 (old ipv4 mapped) |
| 1046 | * - 2002:ip:v4:: (6to4) |
| 1047 | */ |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1048 | if ((read_u64(&smp->data.u.ipv6.s6_addr[0]) == 0 && |
| 1049 | (read_u32(&smp->data.u.ipv6.s6_addr[8]) == 0 || |
| 1050 | read_u32(&smp->data.u.ipv6.s6_addr[8]) == htonl(0xFFFF))) || |
| 1051 | read_u16(&smp->data.u.ipv6.s6_addr[0]) == htons(0x2002)) { |
| 1052 | if (read_u32(&smp->data.u.ipv6.s6_addr[0]) == 0) |
| 1053 | v4 = read_u32(&smp->data.u.ipv6.s6_addr[12]); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1054 | else |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1055 | v4 = htonl((ntohs(read_u16(&smp->data.u.ipv6.s6_addr[2])) << 16) + |
| 1056 | ntohs(read_u16(&smp->data.u.ipv6.s6_addr[4]))); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1057 | |
| 1058 | /* Lookup an IPv4 address in the expression's pattern tree using the longest |
| 1059 | * match method. |
| 1060 | */ |
| 1061 | node = ebmb_lookup_longest(&expr->pattern_tree, &v4); |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1062 | while (node) { |
| 1063 | elt = ebmb_entry(node, struct pattern_tree, node); |
| 1064 | if (elt->ref->gen_id != expr->ref->curr_gen) { |
| 1065 | node = ebmb_next(node); |
| 1066 | continue; |
| 1067 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1068 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1069 | static_pattern.data = elt->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1070 | static_pattern.ref = elt->ref; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1071 | static_pattern.sflags = PAT_SF_TREE; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1072 | static_pattern.type = SMP_T_IPV4; |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1073 | static_pattern.val.ipv4.addr.s_addr = read_u32(elt->node.key); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1074 | if (!cidr2dotted(elt->node.node.pfx, &static_pattern.val.ipv4.mask)) |
| 1075 | return NULL; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1076 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1077 | return &static_pattern; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1078 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1079 | } |
| 1080 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1081 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1082 | /* Lookup in the list. the list contain only IPv4 patterns */ |
| 1083 | list_for_each_entry(lst, &expr->patterns, list) { |
| 1084 | pattern = &lst->pat; |
| 1085 | |
Willy Tarreau | c93da69 | 2020-10-29 09:41:34 +0100 | [diff] [blame] | 1086 | if (pattern->ref->gen_id != expr->ref->curr_gen) |
| 1087 | continue; |
| 1088 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1089 | /* The input sample is IPv4, use it as is. */ |
Thierry FOURNIER | 8c542ca | 2015-08-19 09:00:18 +0200 | [diff] [blame] | 1090 | if (smp->data.type == SMP_T_IPV4) { |
Thierry FOURNIER | 136f9d3 | 2015-08-19 09:07:19 +0200 | [diff] [blame] | 1091 | v4 = smp->data.u.ipv4.s_addr; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1092 | } |
Thierry FOURNIER | 8c542ca | 2015-08-19 09:00:18 +0200 | [diff] [blame] | 1093 | else if (smp->data.type == SMP_T_IPV6) { |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1094 | /* v4 match on a V6 sample. We want to check at least for |
| 1095 | * the following forms : |
| 1096 | * - ::ffff:ip:v4 (ipv4 mapped) |
| 1097 | * - ::0000:ip:v4 (old ipv4 mapped) |
| 1098 | * - 2002:ip:v4:: (6to4) |
| 1099 | */ |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1100 | if (read_u64(&smp->data.u.ipv6.s6_addr[0]) == 0 && |
| 1101 | (read_u32(&smp->data.u.ipv6.s6_addr[8]) == 0 || |
| 1102 | read_u32(&smp->data.u.ipv6.s6_addr[8]) == htonl(0xFFFF))) { |
| 1103 | v4 = read_u32(&smp->data.u.ipv6.s6_addr[12]); |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1104 | } |
Willy Tarreau | 296cfd1 | 2020-02-25 09:58:41 +0100 | [diff] [blame] | 1105 | else if (read_u16(&smp->data.u.ipv6.s6_addr[0]) == htons(0x2002)) { |
| 1106 | v4 = htonl((ntohs(read_u16(&smp->data.u.ipv6.s6_addr[2])) << 16) + |
| 1107 | ntohs(read_u16(&smp->data.u.ipv6.s6_addr[4]))); |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1108 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1109 | else |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1110 | continue; |
Andreas Seltenreich | f065319 | 2016-03-03 20:08:35 +0100 | [diff] [blame] | 1111 | } else { |
| 1112 | /* impossible */ |
| 1113 | continue; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1114 | } |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1115 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1116 | /* Check if the input sample match the current pattern. */ |
| 1117 | if (((v4 ^ pattern->val.ipv4.addr.s_addr) & pattern->val.ipv4.mask.s_addr) == 0) |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1118 | return pattern; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1119 | } |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 1120 | return NULL; |
Thierry FOURNIER | e7ba236 | 2014-01-21 11:25:41 +0100 | [diff] [blame] | 1121 | } |
| 1122 | |
/* Removes link <list> from the singly-linked chain starting at <head>.
 * Each link of the chain is a pointer holding the address of the next link,
 * and a NULL pointer ends the chain. The link which currently points to
 * <list> is made to point to whatever <list> was pointing to. Nothing is
 * released, and the chain is left unchanged if <list> is not part of it.
 * This is made for use for pattern removal within an expression.
 */
static void pat_unlink_from_head(void **head, void **list)
{
	void **link;

	for (link = head; *link; link = *link) {
		if (*link != list)
			continue;

		/* <link> is the predecessor: bypass <list> */
		*link = *list;
		return;
	}
}
| 1136 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1137 | void free_pattern_tree(struct eb_root *root) |
| 1138 | { |
| 1139 | struct eb_node *node, *next; |
Thierry FOURNIER | e1bcac5 | 2013-12-13 16:09:50 +0100 | [diff] [blame] | 1140 | struct pattern_tree *elt; |
Thierry FOURNIER | 3ce88c7 | 2013-12-09 11:29:46 +0100 | [diff] [blame] | 1141 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1142 | node = eb_first(root); |
| 1143 | while (node) { |
| 1144 | next = eb_next(node); |
| 1145 | eb_delete(node); |
Thierry FOURNIER | e1bcac5 | 2013-12-13 16:09:50 +0100 | [diff] [blame] | 1146 | elt = container_of(node, struct pattern_tree, node); |
Willy Tarreau | 867a8a5 | 2020-11-03 11:22:04 +0100 | [diff] [blame] | 1147 | pat_unlink_from_head(&elt->ref->tree_head, &elt->from_ref); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1148 | free(elt->data); |
Thierry FOURNIER | 3ce88c7 | 2013-12-09 11:29:46 +0100 | [diff] [blame] | 1149 | free(elt); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1150 | node = next; |
| 1151 | } |
| 1152 | } |
| 1153 | |
Willy Tarreau | 6d8a689 | 2020-11-02 19:26:02 +0100 | [diff] [blame] | 1154 | void pat_prune_gen(struct pattern_expr *expr) |
Thierry FOURNIER | d163e1c | 2013-11-28 11:41:23 +0100 | [diff] [blame] | 1155 | { |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 1156 | struct pattern_list *pat, *tmp; |
| 1157 | |
| 1158 | list_for_each_entry_safe(pat, tmp, &expr->patterns, list) { |
Christopher Faulet | 6cfc851 | 2020-09-09 16:09:44 +0200 | [diff] [blame] | 1159 | LIST_DEL(&pat->list); |
Willy Tarreau | 867a8a5 | 2020-11-03 11:22:04 +0100 | [diff] [blame] | 1160 | pat_unlink_from_head(&pat->pat.ref->list_head, &pat->from_ref); |
Willy Tarreau | 6d8a689 | 2020-11-02 19:26:02 +0100 | [diff] [blame] | 1161 | if (pat->pat.sflags & PAT_SF_REGFREE) |
| 1162 | regex_free(pat->pat.ptr.ptr); |
| 1163 | else |
| 1164 | free(pat->pat.ptr.ptr); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1165 | free(pat->pat.data); |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 1166 | free(pat); |
| 1167 | } |
| 1168 | |
Thierry FOURNIER | d163e1c | 2013-11-28 11:41:23 +0100 | [diff] [blame] | 1169 | free_pattern_tree(&expr->pattern_tree); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1170 | free_pattern_tree(&expr->pattern_tree_2); |
Thierry FOURNIER | d163e1c | 2013-11-28 11:41:23 +0100 | [diff] [blame] | 1171 | LIST_INIT(&expr->patterns); |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1172 | expr->ref->revision = rdtsc(); |
Thierry FOURNIER | d163e1c | 2013-11-28 11:41:23 +0100 | [diff] [blame] | 1173 | } |
| 1174 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1175 | /* |
| 1176 | * |
| 1177 | * The following functions are used for the pattern indexation |
| 1178 | * |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1179 | */ |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1180 | |
| 1181 | int pat_idx_list_val(struct pattern_expr *expr, struct pattern *pat, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1182 | { |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1183 | struct pattern_list *patl; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1184 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1185 | /* allocate pattern */ |
| 1186 | patl = calloc(1, sizeof(*patl)); |
| 1187 | if (!patl) { |
| 1188 | memprintf(err, "out of memory while indexing pattern"); |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1189 | return 0; |
| 1190 | } |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1191 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1192 | /* duplicate pattern */ |
| 1193 | memcpy(&patl->pat, pat, sizeof(*pat)); |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1194 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1195 | /* chain pattern in the expression */ |
| 1196 | LIST_ADDQ(&expr->patterns, &patl->list); |
Willy Tarreau | 4bdd0a1 | 2020-11-02 12:10:48 +0100 | [diff] [blame] | 1197 | /* and from the reference */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1198 | patl->from_ref = pat->ref->list_head; |
| 1199 | pat->ref->list_head = &patl->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1200 | expr->ref->revision = rdtsc(); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1201 | |
| 1202 | /* that's ok */ |
| 1203 | return 1; |
| 1204 | } |
| 1205 | |
| 1206 | int pat_idx_list_ptr(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1207 | { |
| 1208 | struct pattern_list *patl; |
| 1209 | |
| 1210 | /* allocate pattern */ |
| 1211 | patl = calloc(1, sizeof(*patl)); |
Thierry FOURNIER | 8aa8384 | 2015-02-06 17:50:55 +0100 | [diff] [blame] | 1212 | if (!patl) { |
| 1213 | memprintf(err, "out of memory while indexing pattern"); |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1214 | return 0; |
Thierry FOURNIER | 8aa8384 | 2015-02-06 17:50:55 +0100 | [diff] [blame] | 1215 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1216 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1217 | /* duplicate pattern */ |
| 1218 | memcpy(&patl->pat, pat, sizeof(*pat)); |
| 1219 | patl->pat.ptr.ptr = malloc(patl->pat.len); |
| 1220 | if (!patl->pat.ptr.ptr) { |
| 1221 | free(patl); |
| 1222 | memprintf(err, "out of memory while indexing pattern"); |
| 1223 | return 0; |
| 1224 | } |
| 1225 | memcpy(patl->pat.ptr.ptr, pat->ptr.ptr, pat->len); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1226 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1227 | /* chain pattern in the expression */ |
| 1228 | LIST_ADDQ(&expr->patterns, &patl->list); |
Willy Tarreau | 4bdd0a1 | 2020-11-02 12:10:48 +0100 | [diff] [blame] | 1229 | /* and from the reference */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1230 | patl->from_ref = pat->ref->list_head; |
| 1231 | pat->ref->list_head = &patl->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1232 | expr->ref->revision = rdtsc(); |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1233 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1234 | /* that's ok */ |
| 1235 | return 1; |
| 1236 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1237 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1238 | int pat_idx_list_str(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1239 | { |
| 1240 | struct pattern_list *patl; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1241 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1242 | /* allocate pattern */ |
| 1243 | patl = calloc(1, sizeof(*patl)); |
| 1244 | if (!patl) { |
| 1245 | memprintf(err, "out of memory while indexing pattern"); |
| 1246 | return 0; |
| 1247 | } |
| 1248 | |
| 1249 | /* duplicate pattern */ |
| 1250 | memcpy(&patl->pat, pat, sizeof(*pat)); |
| 1251 | patl->pat.ptr.str = malloc(patl->pat.len + 1); |
| 1252 | if (!patl->pat.ptr.str) { |
| 1253 | free(patl); |
| 1254 | memprintf(err, "out of memory while indexing pattern"); |
| 1255 | return 0; |
| 1256 | } |
| 1257 | memcpy(patl->pat.ptr.ptr, pat->ptr.ptr, pat->len); |
| 1258 | patl->pat.ptr.str[patl->pat.len] = '\0'; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1259 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1260 | /* chain pattern in the expression */ |
| 1261 | LIST_ADDQ(&expr->patterns, &patl->list); |
Willy Tarreau | 4bdd0a1 | 2020-11-02 12:10:48 +0100 | [diff] [blame] | 1262 | /* and from the reference */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1263 | patl->from_ref = pat->ref->list_head; |
| 1264 | pat->ref->list_head = &patl->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1265 | expr->ref->revision = rdtsc(); |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1266 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1267 | /* that's ok */ |
| 1268 | return 1; |
| 1269 | } |
| 1270 | |
Thierry Fournier | 8feaa66 | 2016-02-10 22:55:20 +0100 | [diff] [blame] | 1271 | int pat_idx_list_reg_cap(struct pattern_expr *expr, struct pattern *pat, int cap, char **err) |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1272 | { |
| 1273 | struct pattern_list *patl; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1274 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1275 | /* allocate pattern */ |
| 1276 | patl = calloc(1, sizeof(*patl)); |
| 1277 | if (!patl) { |
| 1278 | memprintf(err, "out of memory while indexing pattern"); |
| 1279 | return 0; |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1280 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1281 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1282 | /* duplicate pattern */ |
| 1283 | memcpy(&patl->pat, pat, sizeof(*pat)); |
| 1284 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1285 | /* compile regex */ |
Willy Tarreau | 9b5c8bb | 2020-11-02 19:16:23 +0100 | [diff] [blame] | 1286 | patl->pat.sflags |= PAT_SF_REGFREE; |
Dragan Dosen | 2674303 | 2019-04-30 15:54:36 +0200 | [diff] [blame] | 1287 | if (!(patl->pat.ptr.reg = regex_comp(pat->ptr.str, !(expr->mflags & PAT_MF_IGNORE_CASE), |
| 1288 | cap, err))) { |
Dirkjan Bussink | 07fcaaa | 2014-04-28 22:57:16 +0000 | [diff] [blame] | 1289 | free(patl); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1290 | return 0; |
| 1291 | } |
| 1292 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1293 | /* chain pattern in the expression */ |
| 1294 | LIST_ADDQ(&expr->patterns, &patl->list); |
Willy Tarreau | 4bdd0a1 | 2020-11-02 12:10:48 +0100 | [diff] [blame] | 1295 | /* and from the reference */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1296 | patl->from_ref = pat->ref->list_head; |
| 1297 | pat->ref->list_head = &patl->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1298 | expr->ref->revision = rdtsc(); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1299 | |
| 1300 | /* that's ok */ |
| 1301 | return 1; |
| 1302 | } |
| 1303 | |
/* Indexes regex pattern <pat> in the list of <expr> by delegating to
 * pat_idx_list_reg_cap() with its <cap> argument set to 0. Returns what
 * that function returns.
 */
int pat_idx_list_reg(struct pattern_expr *expr, struct pattern *pat, char **err)
{
	const int cap = 0;

	return pat_idx_list_reg_cap(expr, pat, cap, err);
}
| 1308 | |
/* Indexes regex pattern <pat> in the list of <expr> by delegating to
 * pat_idx_list_reg_cap() with its <cap> argument set to 1. Returns what
 * that function returns.
 */
int pat_idx_list_regm(struct pattern_expr *expr, struct pattern *pat, char **err)
{
	const int cap = 1;

	return pat_idx_list_reg_cap(expr, pat, cap, err);
}
| 1313 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1314 | int pat_idx_tree_ip(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1315 | { |
| 1316 | unsigned int mask; |
Thierry FOURNIER | e1bcac5 | 2013-12-13 16:09:50 +0100 | [diff] [blame] | 1317 | struct pattern_tree *node; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1318 | |
| 1319 | /* Only IPv4 can be indexed */ |
| 1320 | if (pat->type == SMP_T_IPV4) { |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1321 | /* in IPv4 case, check if the mask is contiguous so that we can |
| 1322 | * insert the network into the tree. A continuous mask has only |
| 1323 | * ones on the left. This means that this mask + its lower bit |
| 1324 | * added once again is null. |
| 1325 | */ |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1326 | mask = ntohl(pat->val.ipv4.mask.s_addr); |
| 1327 | if (mask + (mask & -mask) == 0) { |
| 1328 | mask = mask ? 33 - flsnz(mask & -mask) : 0; /* equals cidr value */ |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1329 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1330 | /* node memory allocation */ |
| 1331 | node = calloc(1, sizeof(*node) + 4); |
| 1332 | if (!node) { |
| 1333 | memprintf(err, "out of memory while loading pattern"); |
| 1334 | return 0; |
| 1335 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1336 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1337 | /* copy the pointer to sample associated to this node */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1338 | node->data = pat->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1339 | node->ref = pat->ref; |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1340 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1341 | /* FIXME: insert <addr>/<mask> into the tree here */ |
| 1342 | memcpy(node->node.key, &pat->val.ipv4.addr, 4); /* network byte order */ |
| 1343 | node->node.node.pfx = mask; |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 1344 | |
| 1345 | /* Insert the entry. */ |
| 1346 | ebmb_insert_prefix(&expr->pattern_tree, &node->node, 4); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1347 | node->from_ref = pat->ref->tree_head; |
| 1348 | pat->ref->tree_head = &node->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1349 | expr->ref->revision = rdtsc(); |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1350 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1351 | /* that's ok */ |
| 1352 | return 1; |
| 1353 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1354 | else { |
| 1355 | /* If the mask is not contiguous, just add the pattern to the list */ |
| 1356 | return pat_idx_list_val(expr, pat, err); |
| 1357 | } |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1358 | } |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1359 | else if (pat->type == SMP_T_IPV6) { |
| 1360 | /* IPv6 also can be indexed */ |
| 1361 | node = calloc(1, sizeof(*node) + 16); |
| 1362 | if (!node) { |
| 1363 | memprintf(err, "out of memory while loading pattern"); |
| 1364 | return 0; |
| 1365 | } |
| 1366 | |
| 1367 | /* copy the pointer to sample associated to this node */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1368 | node->data = pat->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1369 | node->ref = pat->ref; |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1370 | |
| 1371 | /* FIXME: insert <addr>/<mask> into the tree here */ |
| 1372 | memcpy(node->node.key, &pat->val.ipv6.addr, 16); /* network byte order */ |
| 1373 | node->node.node.pfx = pat->val.ipv6.mask; |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 1374 | |
| 1375 | /* Insert the entry. */ |
| 1376 | ebmb_insert_prefix(&expr->pattern_tree_2, &node->node, 16); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1377 | node->from_ref = pat->ref->tree_head; |
| 1378 | pat->ref->tree_head = &node->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1379 | expr->ref->revision = rdtsc(); |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1380 | |
| 1381 | /* that's ok */ |
| 1382 | return 1; |
| 1383 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1384 | |
Thierry FOURNIER | 33a7433 | 2013-12-19 23:54:54 +0100 | [diff] [blame] | 1385 | return 0; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1386 | } |
| 1387 | |
| 1388 | int pat_idx_tree_str(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1389 | { |
| 1390 | int len; |
Thierry FOURNIER | e1bcac5 | 2013-12-13 16:09:50 +0100 | [diff] [blame] | 1391 | struct pattern_tree *node; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1392 | |
| 1393 | /* Only string can be indexed */ |
Thierry FOURNIER | 7654c9f | 2013-12-17 00:20:33 +0100 | [diff] [blame] | 1394 | if (pat->type != SMP_T_STR) { |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1395 | memprintf(err, "internal error: string expected, but the type is '%s'", |
| 1396 | smp_to_type[pat->type]); |
| 1397 | return 0; |
Thierry FOURNIER | 972028f | 2014-01-23 17:53:31 +0100 | [diff] [blame] | 1398 | } |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1399 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1400 | /* If the flag PAT_F_IGNORE_CASE is set, we cannot use trees */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1401 | if (expr->mflags & PAT_MF_IGNORE_CASE) |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1402 | return pat_idx_list_str(expr, pat, err); |
Thierry FOURNIER | 7148ce6 | 2013-12-06 19:06:43 +0100 | [diff] [blame] | 1403 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1404 | /* Process the key len */ |
| 1405 | len = strlen(pat->ptr.str) + 1; |
| 1406 | |
| 1407 | /* node memory allocation */ |
| 1408 | node = calloc(1, sizeof(*node) + len); |
| 1409 | if (!node) { |
| 1410 | memprintf(err, "out of memory while loading pattern"); |
| 1411 | return 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1412 | } |
| 1413 | |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1414 | /* copy the pointer to sample associated to this node */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1415 | node->data = pat->data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1416 | node->ref = pat->ref; |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1417 | |
| 1418 | /* copy the string */ |
| 1419 | memcpy(node->node.key, pat->ptr.str, len); |
| 1420 | |
| 1421 | /* index the new node */ |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 1422 | ebst_insert(&expr->pattern_tree, &node->node); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1423 | node->from_ref = pat->ref->tree_head; |
| 1424 | pat->ref->tree_head = &node->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1425 | expr->ref->revision = rdtsc(); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1426 | |
| 1427 | /* that's ok */ |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 1428 | return 1; |
| 1429 | } |
| 1430 | |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 1431 | int pat_idx_tree_pfx(struct pattern_expr *expr, struct pattern *pat, char **err) |
| 1432 | { |
| 1433 | int len; |
| 1434 | struct pattern_tree *node; |
| 1435 | |
| 1436 | /* Only string can be indexed */ |
| 1437 | if (pat->type != SMP_T_STR) { |
| 1438 | memprintf(err, "internal error: string expected, but the type is '%s'", |
| 1439 | smp_to_type[pat->type]); |
| 1440 | return 0; |
| 1441 | } |
| 1442 | |
| 1443 | /* If the flag PAT_F_IGNORE_CASE is set, we cannot use trees */ |
| 1444 | if (expr->mflags & PAT_MF_IGNORE_CASE) |
| 1445 | return pat_idx_list_str(expr, pat, err); |
| 1446 | |
| 1447 | /* Process the key len */ |
| 1448 | len = strlen(pat->ptr.str); |
| 1449 | |
| 1450 | /* node memory allocation */ |
| 1451 | node = calloc(1, sizeof(*node) + len + 1); |
| 1452 | if (!node) { |
| 1453 | memprintf(err, "out of memory while loading pattern"); |
| 1454 | return 0; |
| 1455 | } |
| 1456 | |
| 1457 | /* copy the pointer to sample associated to this node */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1458 | node->data = pat->data; |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 1459 | node->ref = pat->ref; |
| 1460 | |
| 1461 | /* copy the string and the trailing zero */ |
| 1462 | memcpy(node->node.key, pat->ptr.str, len + 1); |
| 1463 | node->node.node.pfx = len * 8; |
| 1464 | |
| 1465 | /* index the new node */ |
| 1466 | ebmb_insert_prefix(&expr->pattern_tree, &node->node, len); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1467 | node->from_ref = pat->ref->tree_head; |
| 1468 | pat->ref->tree_head = &node->from_ref; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1469 | expr->ref->revision = rdtsc(); |
Willy Tarreau | b1dd9bf | 2014-05-10 08:53:48 +0200 | [diff] [blame] | 1470 | |
| 1471 | /* that's ok */ |
| 1472 | return 1; |
| 1473 | } |
| 1474 | |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1475 | /* Deletes all patterns from reference <elt>. Note that all of their |
Willy Tarreau | 78777ea | 2020-11-02 13:55:22 +0100 | [diff] [blame] | 1476 | * expressions must be locked, and the pattern lock must be held as well. |
| 1477 | */ |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1478 | void pat_delete_gen(struct pat_ref *ref, struct pat_ref_elt *elt) |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1479 | { |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1480 | struct pattern_tree *tree; |
| 1481 | struct pattern_list *pat; |
| 1482 | void **node; |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1483 | |
| 1484 | /* delete all known tree nodes. They are all allocated inline */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1485 | for (node = elt->tree_head; node;) { |
| 1486 | tree = container_of(node, struct pattern_tree, from_ref); |
| 1487 | node = *node; |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1488 | BUG_ON(tree->ref != elt); |
| 1489 | |
| 1490 | ebmb_delete(&tree->node); |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1491 | free(tree->data); |
| 1492 | free(tree); |
| 1493 | } |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1494 | |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1495 | /* delete all list nodes and free their pattern entries (str/reg) */ |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1496 | for (node = elt->list_head; node;) { |
| 1497 | pat = container_of(node, struct pattern_list, from_ref); |
| 1498 | node = *node; |
Willy Tarreau | 78777ea | 2020-11-02 13:55:22 +0100 | [diff] [blame] | 1499 | BUG_ON(pat->pat.ref != elt); |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1500 | |
| 1501 | /* Delete and free entry. */ |
| 1502 | LIST_DEL(&pat->list); |
Willy Tarreau | 6d8a689 | 2020-11-02 19:26:02 +0100 | [diff] [blame] | 1503 | if (pat->pat.sflags & PAT_SF_REGFREE) |
| 1504 | regex_free(pat->pat.ptr.reg); |
| 1505 | else |
| 1506 | free(pat->pat.ptr.ptr); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1507 | free(pat->pat.data); |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1508 | free(pat); |
| 1509 | } |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1510 | |
Willy Tarreau | f1c0892 | 2020-11-02 19:53:16 +0100 | [diff] [blame] | 1511 | /* update revision number to refresh the cache */ |
| 1512 | ref->revision = rdtsc(); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1513 | elt->tree_head = NULL; |
| 1514 | elt->list_head = NULL; |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1515 | } |
| 1516 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1517 | void pattern_init_expr(struct pattern_expr *expr) |
| 1518 | { |
| 1519 | LIST_INIT(&expr->patterns); |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 1520 | expr->pattern_tree = EB_ROOT; |
| 1521 | expr->pattern_tree_2 = EB_ROOT; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1522 | } |
| 1523 | |
| 1524 | void pattern_init_head(struct pattern_head *head) |
| 1525 | { |
| 1526 | LIST_INIT(&head->head); |
| 1527 | } |
| 1528 | |
| 1529 | /* The following functions are relative to the management of the reference |
| 1530 | * lists. These lists are used to store the original pattern and associated |
| 1531 | * value as string form. |
| 1532 | * |
| 1533 | * This is used with modifiable ACL and MAPS |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1534 | * |
| 1535 | * The pattern references are stored with two identifiers: the unique_id and |
| 1536 | * the reference. |
| 1537 | * |
| 1538 | * The reference identifies a file. Each file with the same name points to the |
| 1539 | * same reference. The same file can be registered many times. If the file is |
| 1540 | * modified, all its dependencies are also modified. The reference can be used |
| 1541 | * with map or acl. |
| 1542 | * |
| 1543 | * The unique_id identifies an inline acl. The unique id is unique for each acl. |
| 1544 | * You cannot force the same id twice in the configuration file, because this |
| 1545 | * reports an error. |
| 1546 | * |
| 1547 | * A particular case appears if the filename is a number. In this case, the |
| 1548 | * unique_id is set with the number represented by the filename and the |
| 1549 | * reference is also set. This method prevents duplicate unique_ids. |
| 1550 | * |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1551 | */ |
| 1552 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1553 | /* This function looks up a reference by name. If the reference is found, a |
| 1554 | * pointer to the struct pat_ref is returned, otherwise NULL is returned. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1555 | */ |
| 1556 | struct pat_ref *pat_ref_lookup(const char *reference) |
| 1557 | { |
| 1558 | struct pat_ref *ref; |
| 1559 | |
| 1560 | list_for_each_entry(ref, &pattern_reference, list) |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1561 | if (ref->reference && strcmp(reference, ref->reference) == 0) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1562 | return ref; |
| 1563 | return NULL; |
| 1564 | } |
| 1565 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1566 | /* This function looks up a reference's unique id. If the reference is found, a |
| 1567 | * pointer to the struct pat_ref is returned, otherwise NULL is returned. |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1568 | */ |
| 1569 | struct pat_ref *pat_ref_lookupid(int unique_id) |
| 1570 | { |
| 1571 | struct pat_ref *ref; |
| 1572 | |
| 1573 | list_for_each_entry(ref, &pattern_reference, list) |
| 1574 | if (ref->unique_id == unique_id) |
| 1575 | return ref; |
| 1576 | return NULL; |
| 1577 | } |
| 1578 | |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1579 | /* This function removes from the pattern reference <ref> all the patterns |
| 1580 | * attached to the reference element <elt>, and the element itself. The |
| 1581 | * reference must be locked. |
| 1582 | */ |
| 1583 | void pat_ref_delete_by_ptr(struct pat_ref *ref, struct pat_ref_elt *elt) |
| 1584 | { |
| 1585 | struct pattern_expr *expr; |
| 1586 | struct bref *bref, *back; |
| 1587 | |
| 1588 | /* |
| 1589 | * we have to unlink all watchers from this reference pattern. We must |
| 1590 | * not relink them if this elt was the last one in the list. |
| 1591 | */ |
| 1592 | list_for_each_entry_safe(bref, back, &elt->back_refs, users) { |
| 1593 | LIST_DEL(&bref->users); |
| 1594 | LIST_INIT(&bref->users); |
| 1595 | if (elt->list.n != &ref->head) |
| 1596 | LIST_ADDQ(&LIST_ELEM(elt->list.n, typeof(elt), list)->back_refs, &bref->users); |
| 1597 | bref->ref = elt->list.n; |
| 1598 | } |
| 1599 | |
| 1600 | /* delete all entries from all expressions for this pattern */ |
| 1601 | list_for_each_entry(expr, &ref->pat, list) |
| 1602 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
| 1603 | |
| 1604 | pat_delete_gen(ref, elt); |
| 1605 | |
| 1606 | list_for_each_entry(expr, &ref->pat, list) |
| 1607 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
| 1608 | |
| 1609 | LIST_DEL(&elt->list); |
| 1610 | free(elt->sample); |
| 1611 | free(elt->pattern); |
| 1612 | free(elt); |
| 1613 | } |
| 1614 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1615 | /* This function removes all the patterns matching the pointer <refelt> from |
| 1616 | * the reference and from each expr member of this reference. This function |
| 1617 | * returns 1 if the entry was found and deleted, otherwise zero. |
Thierry FOURNIER | 7acca4b | 2014-01-28 16:43:36 +0100 | [diff] [blame] | 1618 | */ |
| 1619 | int pat_ref_delete_by_id(struct pat_ref *ref, struct pat_ref_elt *refelt) |
| 1620 | { |
Thierry FOURNIER | 7acca4b | 2014-01-28 16:43:36 +0100 | [diff] [blame] | 1621 | struct pat_ref_elt *elt, *safe; |
| 1622 | |
| 1623 | /* delete pattern from reference */ |
| 1624 | list_for_each_entry_safe(elt, safe, &ref->head, list) { |
| 1625 | if (elt == refelt) { |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1626 | pat_ref_delete_by_ptr(ref, elt); |
Thierry FOURNIER | 7acca4b | 2014-01-28 16:43:36 +0100 | [diff] [blame] | 1627 | return 1; |
| 1628 | } |
| 1629 | } |
| 1630 | return 0; |
| 1631 | } |
| 1632 | |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1633 | /* This function removes all patterns matching <key> from the reference |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 1634 | * and from each expr member of the reference. This function returns 1 |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1635 | * if the deletion is done and returns 0 is the entry is not found. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1636 | */ |
| 1637 | int pat_ref_delete(struct pat_ref *ref, const char *key) |
| 1638 | { |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1639 | struct pat_ref_elt *elt, *safe; |
| 1640 | int found = 0; |
| 1641 | |
| 1642 | /* delete pattern from reference */ |
| 1643 | list_for_each_entry_safe(elt, safe, &ref->head, list) { |
| 1644 | if (strcmp(key, elt->pattern) == 0) { |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1645 | pat_ref_delete_by_ptr(ref, elt); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1646 | found = 1; |
| 1647 | } |
| 1648 | } |
| 1649 | |
Willy Tarreau | 1fd52f7 | 2020-11-02 17:30:17 +0100 | [diff] [blame] | 1650 | return found; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1651 | } |
| 1652 | |
Baptiste Assmann | 953f74d | 2014-04-25 16:57:03 +0200 | [diff] [blame] | 1653 | /* |
| 1654 | * find and return an element <elt> matching <key> in a reference <ref> |
| 1655 | * return NULL if not found |
| 1656 | */ |
| 1657 | struct pat_ref_elt *pat_ref_find_elt(struct pat_ref *ref, const char *key) |
| 1658 | { |
| 1659 | struct pat_ref_elt *elt; |
| 1660 | |
| 1661 | list_for_each_entry(elt, &ref->head, list) { |
| 1662 | if (strcmp(key, elt->pattern) == 0) |
| 1663 | return elt; |
| 1664 | } |
| 1665 | |
| 1666 | return NULL; |
| 1667 | } |
| 1668 | |
| 1669 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1670 | /* This function modifies the sample of pat_ref_elt <elt> in all expressions |
| 1671 | * found under <ref> to become <value>. It is assumed that the caller has |
| 1672 | * already verified that <elt> belongs to <ref>. |
| 1673 | */ |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1674 | static inline int pat_ref_set_elt(struct pat_ref *ref, struct pat_ref_elt *elt, |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1675 | const char *value, char **err) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1676 | { |
| 1677 | struct pattern_expr *expr; |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1678 | struct sample_data **data; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1679 | char *sample; |
Thierry FOURNIER | 12ba0c2 | 2015-08-14 00:02:11 +0200 | [diff] [blame] | 1680 | struct sample_data test; |
Thierry FOURNIER | 149e0fe | 2014-01-29 19:35:06 +0100 | [diff] [blame] | 1681 | |
| 1682 | /* Try all needed converters. */ |
| 1683 | list_for_each_entry(expr, &ref->pat, list) { |
| 1684 | if (!expr->pat_head->parse_smp) |
| 1685 | continue; |
| 1686 | |
| 1687 | if (!expr->pat_head->parse_smp(value, &test)) { |
| 1688 | memprintf(err, "unable to parse '%s'", value); |
| 1689 | return 0; |
| 1690 | } |
| 1691 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1692 | |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1693 | /* Modify pattern from reference. */ |
| 1694 | sample = strdup(value); |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1695 | if (!sample) { |
| 1696 | memprintf(err, "out of memory error"); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1697 | return 0; |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1698 | } |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1699 | /* Load sample in each reference. All the conversions are tested |
| 1700 | * below, normally these calls don't fail. |
Thierry FOURNIER | 149e0fe | 2014-01-29 19:35:06 +0100 | [diff] [blame] | 1701 | */ |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 1702 | list_for_each_entry(expr, &ref->pat, list) { |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1703 | if (!expr->pat_head->parse_smp) |
| 1704 | continue; |
| 1705 | |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1706 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1707 | data = pattern_find_smp(expr, elt); |
| 1708 | if (data && *data && !expr->pat_head->parse_smp(sample, *data)) |
| 1709 | *data = NULL; |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1710 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1711 | } |
| 1712 | |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 1713 | /* free old sample only when all exprs are updated */ |
| 1714 | free(elt->sample); |
| 1715 | elt->sample = sample; |
| 1716 | |
| 1717 | |
Thierry FOURNIER | 149e0fe | 2014-01-29 19:35:06 +0100 | [diff] [blame] | 1718 | return 1; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1719 | } |
| 1720 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1721 | /* This function modifies the sample of pat_ref_elt <refelt> in all expressions |
| 1722 | * found under <ref> to become <value>, after checking that <refelt> really |
| 1723 | * belongs to <ref>. |
| 1724 | */ |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1725 | int pat_ref_set_by_id(struct pat_ref *ref, struct pat_ref_elt *refelt, const char *value, char **err) |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1726 | { |
| 1727 | struct pat_ref_elt *elt; |
| 1728 | |
| 1729 | /* Look for pattern in the reference. */ |
| 1730 | list_for_each_entry(elt, &ref->head, list) { |
| 1731 | if (elt == refelt) { |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1732 | if (!pat_ref_set_elt(ref, elt, value, err)) |
| 1733 | return 0; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1734 | return 1; |
| 1735 | } |
| 1736 | } |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1737 | |
| 1738 | memprintf(err, "key or pattern not found"); |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1739 | return 0; |
| 1740 | } |
| 1741 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1742 | /* This function modifies to <value> the sample of all patterns matching <key> |
| 1743 | * under <ref>. |
| 1744 | */ |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1745 | int pat_ref_set(struct pat_ref *ref, const char *key, const char *value, char **err) |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1746 | { |
| 1747 | struct pat_ref_elt *elt; |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1748 | int found = 0; |
| 1749 | char *_merr; |
| 1750 | char **merr; |
| 1751 | |
| 1752 | if (err) { |
| 1753 | merr = &_merr; |
| 1754 | *merr = NULL; |
| 1755 | } |
| 1756 | else |
| 1757 | merr = NULL; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1758 | |
| 1759 | /* Look for pattern in the reference. */ |
| 1760 | list_for_each_entry(elt, &ref->head, list) { |
| 1761 | if (strcmp(key, elt->pattern) == 0) { |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1762 | if (!pat_ref_set_elt(ref, elt, value, merr)) { |
William Lallemand | 579fb25 | 2018-06-11 10:53:46 +0200 | [diff] [blame] | 1763 | if (err && merr) { |
| 1764 | if (!found) { |
| 1765 | *err = *merr; |
| 1766 | } else { |
| 1767 | memprintf(err, "%s, %s", *err, *merr); |
| 1768 | free(*merr); |
| 1769 | *merr = NULL; |
| 1770 | } |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1771 | } |
| 1772 | } |
| 1773 | found = 1; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1774 | } |
| 1775 | } |
Thierry FOURNIER | 364cfdf | 2014-01-29 19:08:49 +0100 | [diff] [blame] | 1776 | |
| 1777 | if (!found) { |
| 1778 | memprintf(err, "entry not found"); |
| 1779 | return 0; |
| 1780 | } |
| 1781 | return 1; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 1782 | } |
| 1783 | |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 1784 | /* This function creates a new reference. <ref> is the reference name. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1785 | * <flags> are PAT_REF_*. /!\ The reference is not checked, and must |
| 1786 | * be unique. The user must check the reference with "pat_ref_lookup()" |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1787 | * before calling this function. If the function fails, it returns NULL, |
| 1788 | * otherwise it returns the new struct pat_ref. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1789 | */ |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1790 | struct pat_ref *pat_ref_new(const char *reference, const char *display, unsigned int flags) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1791 | { |
| 1792 | struct pat_ref *ref; |
| 1793 | |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 1794 | ref = calloc(1, sizeof(*ref)); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1795 | if (!ref) |
| 1796 | return NULL; |
| 1797 | |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1798 | if (display) { |
| 1799 | ref->display = strdup(display); |
| 1800 | if (!ref->display) { |
| 1801 | free(ref); |
| 1802 | return NULL; |
| 1803 | } |
| 1804 | } |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1805 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1806 | ref->reference = strdup(reference); |
| 1807 | if (!ref->reference) { |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1808 | free(ref->display); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1809 | free(ref); |
| 1810 | return NULL; |
| 1811 | } |
| 1812 | |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1813 | ref->flags = flags; |
| 1814 | ref->unique_id = -1; |
Willy Tarreau | 3ee0de1 | 2020-11-02 15:26:51 +0100 | [diff] [blame] | 1815 | ref->revision = 0; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1816 | |
| 1817 | LIST_INIT(&ref->head); |
| 1818 | LIST_INIT(&ref->pat); |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1819 | HA_SPIN_INIT(&ref->lock); |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1820 | LIST_ADDQ(&pattern_reference, &ref->list); |
| 1821 | |
| 1822 | return ref; |
| 1823 | } |
| 1824 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1825 | /* This function creates a new reference. <unique_id> is the unique id. If |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1826 | * the value of <unique_id> is -1, the unique id is calculated later. |
| 1827 | * <flags> are PAT_REF_*. /!\ The reference is not checked, and must |
| 1828 | * be unique. The user must check the reference with "pat_ref_lookup()" |
| 1829 | * or pat_ref_lookupid before calling this function. If the function |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1830 | * fails, it returns NULL, otherwise it returns the new struct pat_ref. |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1831 | */ |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1832 | struct pat_ref *pat_ref_newid(int unique_id, const char *display, unsigned int flags) |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1833 | { |
| 1834 | struct pat_ref *ref; |
| 1835 | |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 1836 | ref = calloc(1, sizeof(*ref)); |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1837 | if (!ref) |
| 1838 | return NULL; |
| 1839 | |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1840 | if (display) { |
| 1841 | ref->display = strdup(display); |
| 1842 | if (!ref->display) { |
| 1843 | free(ref); |
| 1844 | return NULL; |
| 1845 | } |
| 1846 | } |
Thierry FOURNIER | 0d6ba51 | 2014-02-11 03:31:34 +0100 | [diff] [blame] | 1847 | |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1848 | ref->reference = NULL; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1849 | ref->flags = flags; |
Willy Tarreau | 2994774 | 2020-10-28 11:43:49 +0100 | [diff] [blame] | 1850 | ref->curr_gen = 0; |
| 1851 | ref->next_gen = 0; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 1852 | ref->unique_id = unique_id; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1853 | LIST_INIT(&ref->head); |
| 1854 | LIST_INIT(&ref->pat); |
Aurélien Nephtali | 564d15a | 2018-04-19 16:56:07 +0200 | [diff] [blame] | 1855 | HA_SPIN_INIT(&ref->lock); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1856 | LIST_ADDQ(&pattern_reference, &ref->list); |
| 1857 | |
| 1858 | return ref; |
| 1859 | } |
| 1860 | |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1861 | /* This function adds entry to <ref>. It can fail on memory error. It returns |
| 1862 | * the newly added element on success, or NULL on failure. The PATREF_LOCK on |
Willy Tarreau | 2994774 | 2020-10-28 11:43:49 +0100 | [diff] [blame] | 1863 | * <ref> must be held. It sets the newly created pattern's generation number |
| 1864 | * to the same value as the reference's. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1865 | */ |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1866 | struct pat_ref_elt *pat_ref_append(struct pat_ref *ref, const char *pattern, const char *sample, int line) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1867 | { |
| 1868 | struct pat_ref_elt *elt; |
| 1869 | |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 1870 | elt = calloc(1, sizeof(*elt)); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1871 | if (!elt) |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1872 | goto fail; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1873 | |
Willy Tarreau | 2994774 | 2020-10-28 11:43:49 +0100 | [diff] [blame] | 1874 | elt->gen_id = ref->curr_gen; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1875 | elt->line = line; |
| 1876 | |
| 1877 | elt->pattern = strdup(pattern); |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1878 | if (!elt->pattern) |
| 1879 | goto fail; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1880 | |
| 1881 | if (sample) { |
| 1882 | elt->sample = strdup(sample); |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1883 | if (!elt->sample) |
| 1884 | goto fail; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1885 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1886 | |
Emeric Brun | 8d85aa4 | 2017-06-29 15:40:33 +0200 | [diff] [blame] | 1887 | LIST_INIT(&elt->back_refs); |
Willy Tarreau | 38d4199 | 2020-11-03 14:50:29 +0100 | [diff] [blame] | 1888 | elt->list_head = NULL; |
| 1889 | elt->tree_head = NULL; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1890 | LIST_ADDQ(&ref->head, &elt->list); |
Willy Tarreau | f4edb72 | 2020-10-28 10:52:46 +0100 | [diff] [blame] | 1891 | return elt; |
| 1892 | fail: |
| 1893 | if (elt) |
| 1894 | free(elt->pattern); |
| 1895 | free(elt); |
| 1896 | return NULL; |
Thierry FOURNIER | b113650 | 2014-01-15 11:38:49 +0100 | [diff] [blame] | 1897 | } |
| 1898 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 1899 | /* This function creates sample found in <elt>, parses the pattern also |
| 1900 | * found in <elt> and inserts it in <expr>. The function copies <patflags> |
| 1901 | * into <expr>. If the function fails, it returns 0 and <err> is filled. |
Ilya Shipitsin | 47d1718 | 2020-06-21 21:42:57 +0500 | [diff] [blame] | 1902 | * In success case, the function returns 1. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1903 | */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1904 | int pat_ref_push(struct pat_ref_elt *elt, struct pattern_expr *expr, |
| 1905 | int patflags, char **err) |
| 1906 | { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1907 | struct sample_data *data; |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1908 | struct pattern pattern; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1909 | |
| 1910 | /* Create sample */ |
| 1911 | if (elt->sample && expr->pat_head->parse_smp) { |
| 1912 | /* New sample. */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1913 | data = malloc(sizeof(*data)); |
| 1914 | if (!data) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1915 | return 0; |
| 1916 | |
| 1917 | /* Parse value. */ |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1918 | if (!expr->pat_head->parse_smp(elt->sample, data)) { |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1919 | memprintf(err, "unable to parse '%s'", elt->sample); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1920 | free(data); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1921 | return 0; |
| 1922 | } |
| 1923 | |
| 1924 | } |
| 1925 | else |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1926 | data = NULL; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1927 | |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1928 | /* initialise pattern */ |
| 1929 | memset(&pattern, 0, sizeof(pattern)); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1930 | pattern.data = data; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 1931 | pattern.ref = elt; |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1932 | |
| 1933 | /* parse pattern */ |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 1934 | if (!expr->pat_head->parse(elt->pattern, &pattern, expr->mflags, err)) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1935 | free(data); |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1936 | return 0; |
| 1937 | } |
| 1938 | |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1939 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | d25c842 | 2014-01-28 15:34:35 +0100 | [diff] [blame] | 1940 | /* index pattern */ |
| 1941 | if (!expr->pat_head->index(expr, &pattern, err)) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1942 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 1943 | free(data); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1944 | return 0; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 1945 | } |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 1946 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | b9b0846 | 2013-12-13 15:12:32 +0100 | [diff] [blame] | 1947 | |
| 1948 | return 1; |
| 1949 | } |
| 1950 | |
Willy Tarreau | 0439e5e | 2020-10-28 18:45:45 +0100 | [diff] [blame] | 1951 | /* This function tries to commit entry <elt> into <ref>. The new entry must |
| 1952 | * have already been inserted using pat_ref_append(), and its generation number |
| 1953 | * may have been adjusted as it will not be changed. <err> must point to a NULL |
| 1954 | * pointer. The PATREF lock on <ref> must be held. All the pattern_expr for |
| 1955 | * this reference will be updated (parsing, indexing). On success, non-zero is |
| 1956 | * returned. On failure, all the operation is rolled back (the element is |
| 1957 | * deleted from all expressions and is freed), zero is returned and the error |
| 1958 | * pointer <err> may have been updated (and the caller must free it). Failure |
| 1959 | * causes include memory allocation, parsing error or indexing error. |
| 1960 | */ |
| 1961 | int pat_ref_commit(struct pat_ref *ref, struct pat_ref_elt *elt, char **err) |
| 1962 | { |
| 1963 | struct pattern_expr *expr; |
| 1964 | |
| 1965 | list_for_each_entry(expr, &ref->pat, list) { |
| 1966 | if (!pat_ref_push(elt, expr, 0, err)) { |
| 1967 | pat_ref_delete_by_ptr(ref, elt); |
| 1968 | return 0; |
| 1969 | } |
| 1970 | } |
| 1971 | return 1; |
| 1972 | } |
| 1973 | |
Willy Tarreau | 1a6857b | 2020-10-29 09:21:43 +0100 | [diff] [blame] | 1974 | /* Loads <pattern>:<sample> into <ref> for generation <gen>. <sample> may be |
| 1975 | * NULL if none exists (e.g. ACL). If not needed, the generation number should |
| 1976 | * be set to ref->curr_gen. The error pointer must initially point to NULL. The |
| 1977 | * new entry will be propagated to all use places, involving allocation, parsing |
| 1978 | * and indexing. On error (parsing, allocation), the operation will be rolled |
| 1979 | * back, an error may be reported, and NULL will be reported. On success, the |
| 1980 | * freshly allocated element will be returned. The PATREF lock on <ref> must be |
| 1981 | * held during the operation. |
| 1982 | */ |
| 1983 | struct pat_ref_elt *pat_ref_load(struct pat_ref *ref, unsigned int gen, |
| 1984 | const char *pattern, const char *sample, |
| 1985 | int line, char **err) |
| 1986 | { |
| 1987 | struct pat_ref_elt *elt; |
| 1988 | |
| 1989 | elt = pat_ref_append(ref, pattern, sample, line); |
| 1990 | if (elt) { |
| 1991 | elt->gen_id = gen; |
| 1992 | if (!pat_ref_commit(ref, elt, err)) |
| 1993 | elt = NULL; |
| 1994 | } else |
| 1995 | memprintf(err, "out of memory error"); |
| 1996 | |
| 1997 | return elt; |
| 1998 | } |
| 1999 | |
Willy Tarreau | 6a17407 | 2020-10-28 10:58:05 +0100 | [diff] [blame] | 2000 | /* This function adds entry to <ref>. It can fail on memory error. The new |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 2001 | * entry is added at all the pattern_expr registered in this reference. The |
Willy Tarreau | 6a17407 | 2020-10-28 10:58:05 +0100 | [diff] [blame] | 2002 | * function stops on the first error encountered. It returns 0 and <err> is |
Thierry FOURNIER | 31db4ae | 2014-01-30 00:27:15 +0100 | [diff] [blame] | 2003 | * filled. If an error is encountered, the complete add operation is cancelled. |
| 2004 | * If the insertion is a success the function returns 1. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2005 | */ |
| 2006 | int pat_ref_add(struct pat_ref *ref, |
| 2007 | const char *pattern, const char *sample, |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 2008 | char **err) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2009 | { |
Willy Tarreau | 1a6857b | 2020-10-29 09:21:43 +0100 | [diff] [blame] | 2010 | return !!pat_ref_load(ref, ref->curr_gen, pattern, sample, -1, err); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2011 | } |
| 2012 | |
Willy Tarreau | 94b9abe | 2020-10-28 18:23:49 +0100 | [diff] [blame] | 2013 | /* This function purges all elements from <ref> that are older than generation |
| 2014 | * <oldest>. It will not purge more than <budget> entries at once, in order to |
| 2015 | * remain responsive. If budget is negative, no limit is applied. |
| 2016 | * The caller must already hold the PATREF_LOCK on <ref>. The function will |
| 2017 | * take the PATEXP_LOCK on all expressions of the pattern as needed. It returns |
| 2018 | * non-zero on completion, or zero if it had to stop before the end after |
| 2019 | * <budget> was depleted. |
| 2020 | */ |
| 2021 | int pat_ref_purge_older(struct pat_ref *ref, unsigned int oldest, int budget) |
| 2022 | { |
| 2023 | struct pat_ref_elt *elt, *elt_bck; |
| 2024 | struct bref *bref, *bref_bck; |
| 2025 | struct pattern_expr *expr; |
| 2026 | int done; |
| 2027 | |
| 2028 | list_for_each_entry(expr, &ref->pat, list) |
| 2029 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
| 2030 | |
| 2031 | /* all expr are locked, we can safely remove all pat_ref */ |
| 2032 | |
| 2033 | /* assume completion for e.g. empty lists */ |
| 2034 | done = 1; |
| 2035 | list_for_each_entry_safe(elt, elt_bck, &ref->head, list) { |
| 2036 | if ((int)(elt->gen_id - oldest) >= 0) |
| 2037 | continue; |
| 2038 | |
| 2039 | if (budget >= 0 && !budget--) { |
| 2040 | done = 0; |
| 2041 | break; |
| 2042 | } |
| 2043 | |
| 2044 | /* |
| 2045 | * we have to unlink all watchers from this reference pattern. We must |
| 2046 | * not relink them if this elt was the last one in the list. |
| 2047 | */ |
| 2048 | list_for_each_entry_safe(bref, bref_bck, &elt->back_refs, users) { |
| 2049 | LIST_DEL(&bref->users); |
| 2050 | LIST_INIT(&bref->users); |
| 2051 | if (elt->list.n != &ref->head) |
| 2052 | LIST_ADDQ(&LIST_ELEM(elt->list.n, typeof(elt), list)->back_refs, &bref->users); |
| 2053 | bref->ref = elt->list.n; |
| 2054 | } |
| 2055 | |
| 2056 | /* delete the storage for all representations of this pattern. */ |
| 2057 | pat_delete_gen(ref, elt); |
| 2058 | |
| 2059 | LIST_DEL(&elt->list); |
| 2060 | free(elt->pattern); |
| 2061 | free(elt->sample); |
| 2062 | free(elt); |
| 2063 | } |
| 2064 | |
| 2065 | list_for_each_entry(expr, &ref->pat, list) |
| 2066 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
| 2067 | |
| 2068 | #if defined(HA_HAVE_MALLOC_TRIM) |
| 2069 | if (done) { |
| 2070 | malloc_trim(0); |
| 2071 | } |
| 2072 | #endif |
| 2073 | |
| 2074 | return done; |
| 2075 | } |
| 2076 | |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 2077 | /* This function prunes <ref>, replaces all references by the references |
| 2078 | * of <replace>, and reindexes all the news values. |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2079 | * |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 2080 | * The patterns are loaded in best effort and the errors are ignored, |
| 2081 | * but written in the logs. |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2082 | */ |
| 2083 | void pat_ref_reload(struct pat_ref *ref, struct pat_ref *replace) |
| 2084 | { |
| 2085 | struct pattern_expr *expr; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2086 | struct pat_ref_elt *elt, *safe; |
| 2087 | struct bref *bref, *back; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2088 | struct pattern pattern; |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2089 | |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2090 | |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2091 | HA_SPIN_LOCK(PATREF_LOCK, &ref->lock); |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2092 | list_for_each_entry(expr, &ref->pat, list) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2093 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock); |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2094 | } |
| 2095 | |
| 2096 | /* all expr are locked, we can safely remove all pat_ref */ |
| 2097 | list_for_each_entry_safe(elt, safe, &ref->head, list) { |
| 2098 | list_for_each_entry_safe(bref, back, &elt->back_refs, users) { |
Willy Tarreau | d4164dc | 2020-10-27 18:55:20 +0100 | [diff] [blame] | 2099 | /* we have to unlink all watchers. */ |
| 2100 | LIST_DEL_INIT(&bref->users); |
| 2101 | bref->ref = NULL; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2102 | } |
Willy Tarreau | 2817472 | 2020-11-03 13:36:58 +0100 | [diff] [blame] | 2103 | pat_delete_gen(ref, elt); |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2104 | LIST_DEL(&elt->list); |
| 2105 | free(elt->pattern); |
| 2106 | free(elt->sample); |
| 2107 | free(elt); |
| 2108 | } |
| 2109 | |
| 2110 | /* switch pat_ret_elt lists */ |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2111 | LIST_ADD(&replace->head, &ref->head); |
| 2112 | LIST_DEL(&replace->head); |
| 2113 | |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2114 | list_for_each_entry(expr, &ref->pat, list) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2115 | list_for_each_entry(elt, &ref->head, list) { |
Dragan Dosen | f147479 | 2018-09-18 20:18:09 +0200 | [diff] [blame] | 2116 | char *err = NULL; |
| 2117 | struct sample_data *data = NULL; |
| 2118 | |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2119 | /* Create sample */ |
| 2120 | if (elt->sample && expr->pat_head->parse_smp) { |
| 2121 | /* New sample. */ |
| 2122 | data = malloc(sizeof(*data)); |
| 2123 | if (!data) |
| 2124 | continue; |
| 2125 | |
| 2126 | /* Parse value. */ |
| 2127 | if (!expr->pat_head->parse_smp(elt->sample, data)) { |
| 2128 | memprintf(&err, "unable to parse '%s'", elt->sample); |
| 2129 | send_log(NULL, LOG_NOTICE, "%s", err); |
| 2130 | free(err); |
| 2131 | free(data); |
| 2132 | continue; |
| 2133 | } |
| 2134 | |
| 2135 | } |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2136 | |
| 2137 | /* initialise pattern */ |
| 2138 | memset(&pattern, 0, sizeof(pattern)); |
| 2139 | pattern.data = data; |
| 2140 | pattern.ref = elt; |
| 2141 | |
| 2142 | /* parse pattern */ |
| 2143 | if (!expr->pat_head->parse(elt->pattern, &pattern, expr->mflags, &err)) { |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2144 | send_log(NULL, LOG_NOTICE, "%s", err); |
| 2145 | free(err); |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2146 | free(data); |
| 2147 | continue; |
| 2148 | } |
| 2149 | |
| 2150 | /* index pattern */ |
| 2151 | if (!expr->pat_head->index(expr, &pattern, &err)) { |
| 2152 | send_log(NULL, LOG_NOTICE, "%s", err); |
| 2153 | free(err); |
| 2154 | free(data); |
| 2155 | continue; |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2156 | } |
| 2157 | } |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2158 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock); |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2159 | } |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2160 | HA_SPIN_UNLOCK(PATREF_LOCK, &ref->lock); |
Willy Tarreau | 114d698 | 2020-11-03 15:55:35 +0100 | [diff] [blame] | 2161 | |
| 2162 | #if defined(HA_HAVE_MALLOC_TRIM) |
| 2163 | malloc_trim(0); |
| 2164 | #endif |
Thierry FOURNIER | 46006bd | 2014-03-21 21:45:15 +0100 | [diff] [blame] | 2165 | } |
| 2166 | |
Willy Tarreau | ae83e63 | 2020-11-03 10:37:31 +0100 | [diff] [blame] | 2167 | /* This function prunes all entries of <ref> and all their associated |
| 2168 | * pattern_expr. It may return before the end of the list is reached, |
| 2169 | * returning 0, to yield, indicating to the caller that it must call it again. |
| 2170 | * until it returns non-zero. All patterns are purged, both current ones and |
| 2171 | * future or incomplete ones. This is used by "clear map" or "clear acl". |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2172 | */ |
Willy Tarreau | d1d005d | 2019-12-20 18:22:02 +0100 | [diff] [blame] | 2173 | int pat_ref_prune(struct pat_ref *ref) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2174 | { |
Willy Tarreau | ae83e63 | 2020-11-03 10:37:31 +0100 | [diff] [blame] | 2175 | return pat_ref_purge_older(ref, ref->curr_gen + 1, 100) && |
| 2176 | pat_ref_purge_older(ref, ref->next_gen + 1, 100); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2177 | } |
| 2178 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2179 | /* This function looks up any existing reference <ref> in pattern_head <head>, and |
| 2180 | * returns the associated pattern_expr pointer if found, otherwise NULL. |
| 2181 | */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2182 | struct pattern_expr *pattern_lookup_expr(struct pattern_head *head, struct pat_ref *ref) |
| 2183 | { |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2184 | struct pattern_expr_list *expr; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2185 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2186 | list_for_each_entry(expr, &head->head, list) |
| 2187 | if (expr->expr->ref == ref) |
| 2188 | return expr->expr; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2189 | return NULL; |
| 2190 | } |
| 2191 | |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 2192 | /* This function creates new pattern_expr associated to the reference <ref>. |
| 2193 | * <ref> can be NULL. If an error occurs, the function returns NULL and |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2194 | * <err> is filled. Otherwise, the function returns new pattern_expr linked |
| 2195 | * with <head> and <ref>. |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2196 | * |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 2197 | * The returned value can be an already filled pattern list, in this case the |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2198 | * flag <reuse> is set. |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2199 | */ |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2200 | struct pattern_expr *pattern_new_expr(struct pattern_head *head, struct pat_ref *ref, |
Emeric Brun | 7d27f3c | 2017-07-03 17:54:23 +0200 | [diff] [blame] | 2201 | int patflags, char **err, int *reuse) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2202 | { |
| 2203 | struct pattern_expr *expr; |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2204 | struct pattern_expr_list *list; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2205 | |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2206 | if (reuse) |
| 2207 | *reuse = 0; |
| 2208 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2209 | /* Memory and initialization of the chain element. */ |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 2210 | list = calloc(1, sizeof(*list)); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2211 | if (!list) { |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2212 | memprintf(err, "out of memory"); |
| 2213 | return NULL; |
| 2214 | } |
| 2215 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2216 | /* Look for existing similar expr. No that only the index, parse and |
| 2217 | * parse_smp function must be identical for having similar pattern. |
Joseph Herlant | 4189d67 | 2018-11-15 10:22:31 -0800 | [diff] [blame] | 2218 | * The other function depends of these first. |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2219 | */ |
| 2220 | if (ref) { |
| 2221 | list_for_each_entry(expr, &ref->pat, list) |
| 2222 | if (expr->pat_head->index == head->index && |
| 2223 | expr->pat_head->parse == head->parse && |
Emeric Brun | 7d27f3c | 2017-07-03 17:54:23 +0200 | [diff] [blame] | 2224 | expr->pat_head->parse_smp == head->parse_smp && |
| 2225 | expr->mflags == patflags) |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2226 | break; |
| 2227 | if (&expr->list == &ref->pat) |
| 2228 | expr = NULL; |
| 2229 | } |
| 2230 | else |
| 2231 | expr = NULL; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2232 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2233 | /* If no similar expr was found, we create new expr. */ |
| 2234 | if (!expr) { |
| 2235 | /* Get a lot of memory for the expr struct. */ |
Willy Tarreau | 8135d9b | 2020-10-30 15:35:11 +0100 | [diff] [blame] | 2236 | expr = calloc(1, sizeof(*expr)); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2237 | if (!expr) { |
Andreas Seltenreich | e6e22e8 | 2016-03-03 20:20:23 +0100 | [diff] [blame] | 2238 | free(list); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2239 | memprintf(err, "out of memory"); |
| 2240 | return NULL; |
| 2241 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2242 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2243 | /* Initialize this new expr. */ |
| 2244 | pattern_init_expr(expr); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2245 | |
Emeric Brun | 7d27f3c | 2017-07-03 17:54:23 +0200 | [diff] [blame] | 2246 | /* Copy the pattern matching and indexing flags. */ |
| 2247 | expr->mflags = patflags; |
| 2248 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2249 | /* This new pattern expression reference one of his heads. */ |
| 2250 | expr->pat_head = head; |
| 2251 | |
| 2252 | /* Link with ref, or to self to facilitate LIST_DEL() */ |
| 2253 | if (ref) |
| 2254 | LIST_ADDQ(&ref->pat, &expr->list); |
| 2255 | else |
| 2256 | LIST_INIT(&expr->list); |
| 2257 | |
| 2258 | expr->ref = ref; |
| 2259 | |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2260 | HA_RWLOCK_INIT(&expr->lock); |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2261 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2262 | /* We must free this pattern if it is no more used. */ |
| 2263 | list->do_free = 1; |
| 2264 | } |
| 2265 | else { |
| 2266 | /* If the pattern used already exists, it is already linked |
| 2267 | * with ref and we must not free it. |
| 2268 | */ |
| 2269 | list->do_free = 0; |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2270 | if (reuse) |
| 2271 | *reuse = 1; |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2272 | } |
| 2273 | |
| 2274 | /* The new list element reference the pattern_expr. */ |
| 2275 | list->expr = expr; |
| 2276 | |
| 2277 | /* Link the list element with the pattern_head. */ |
| 2278 | LIST_ADDQ(&head->head, &list->list); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2279 | return expr; |
| 2280 | } |
| 2281 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2282 | /* Reads patterns from a file. If <err_msg> is non-NULL, an error message will |
| 2283 | * be returned there on errors and the caller will have to free it. |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2284 | * |
| 2285 | * The file contains one key + value per line. Lines which start with '#' are |
| 2286 | * ignored, just like empty lines. Leading tabs/spaces are stripped. The key is |
| 2287 | * then the first "word" (series of non-space/tabs characters), and the value is |
| 2288 | * what follows this series of space/tab till the end of the line excluding |
| 2289 | * trailing spaces/tabs. |
| 2290 | * |
| 2291 | * Example : |
| 2292 | * |
| 2293 | * # this is a comment and is ignored |
| 2294 | * 62.212.114.60 1wt.eu \n |
| 2295 | * <-><-----------><---><----><----> |
| 2296 | * | | | | `--- trailing spaces ignored |
| 2297 | * | | | `-------- value |
| 2298 | * | | `--------------- middle spaces ignored |
| 2299 | * | `------------------------ key |
| 2300 | * `-------------------------------- leading spaces ignored |
| 2301 | * |
Ilya Shipitsin | 47d1718 | 2020-06-21 21:42:57 +0500 | [diff] [blame] | 2302 | * Return non-zero in case of success, otherwise 0. |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2303 | */ |
| 2304 | int pat_ref_read_from_file_smp(struct pat_ref *ref, const char *filename, char **err) |
| 2305 | { |
| 2306 | FILE *file; |
| 2307 | char *c; |
| 2308 | int ret = 0; |
| 2309 | int line = 0; |
| 2310 | char *key_beg; |
| 2311 | char *key_end; |
| 2312 | char *value_beg; |
| 2313 | char *value_end; |
| 2314 | |
| 2315 | file = fopen(filename, "r"); |
| 2316 | if (!file) { |
| 2317 | memprintf(err, "failed to open pattern file <%s>", filename); |
| 2318 | return 0; |
| 2319 | } |
| 2320 | |
| 2321 | /* now parse all patterns. The file may contain only one pattern |
| 2322 | * followed by one value per line. The start spaces, separator spaces |
| 2323 | * and and spaces are stripped. Each can contain comment started by '#' |
| 2324 | */ |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2325 | while (fgets(trash.area, trash.size, file) != NULL) { |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2326 | line++; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2327 | c = trash.area; |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2328 | |
| 2329 | /* ignore lines beginning with a dash */ |
| 2330 | if (*c == '#') |
| 2331 | continue; |
| 2332 | |
| 2333 | /* strip leading spaces and tabs */ |
| 2334 | while (*c == ' ' || *c == '\t') |
| 2335 | c++; |
| 2336 | |
| 2337 | /* empty lines are ignored too */ |
| 2338 | if (*c == '\0' || *c == '\r' || *c == '\n') |
| 2339 | continue; |
| 2340 | |
| 2341 | /* look for the end of the key */ |
| 2342 | key_beg = c; |
| 2343 | while (*c && *c != ' ' && *c != '\t' && *c != '\n' && *c != '\r') |
| 2344 | c++; |
| 2345 | |
| 2346 | key_end = c; |
| 2347 | |
| 2348 | /* strip middle spaces and tabs */ |
| 2349 | while (*c == ' ' || *c == '\t') |
| 2350 | c++; |
| 2351 | |
| 2352 | /* look for the end of the value, it is the end of the line */ |
| 2353 | value_beg = c; |
| 2354 | while (*c && *c != '\n' && *c != '\r') |
| 2355 | c++; |
| 2356 | value_end = c; |
| 2357 | |
| 2358 | /* trim possibly trailing spaces and tabs */ |
| 2359 | while (value_end > value_beg && (value_end[-1] == ' ' || value_end[-1] == '\t')) |
| 2360 | value_end--; |
| 2361 | |
| 2362 | /* set final \0 and check entries */ |
| 2363 | *key_end = '\0'; |
| 2364 | *value_end = '\0'; |
| 2365 | |
| 2366 | /* insert values */ |
| 2367 | if (!pat_ref_append(ref, key_beg, value_beg, line)) { |
| 2368 | memprintf(err, "out of memory"); |
| 2369 | goto out_close; |
| 2370 | } |
| 2371 | } |
| 2372 | |
Jerome Magnin | 3c79d4b | 2020-01-17 16:09:33 +0100 | [diff] [blame] | 2373 | if (ferror(file)) { |
| 2374 | memprintf(err, "error encountered while reading <%s> : %s", |
| 2375 | filename, strerror(errno)); |
| 2376 | goto out_close; |
| 2377 | } |
Ilya Shipitsin | 47d1718 | 2020-06-21 21:42:57 +0500 | [diff] [blame] | 2378 | /* success */ |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2379 | ret = 1; |
| 2380 | |
| 2381 | out_close: |
| 2382 | fclose(file); |
| 2383 | return ret; |
| 2384 | } |
| 2385 | |
| 2386 | /* Reads patterns from a file. If <err_msg> is non-NULL, an error message will |
| 2387 | * be returned there on errors and the caller will have to free it. |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2388 | */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2389 | int pat_ref_read_from_file(struct pat_ref *ref, const char *filename, char **err) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2390 | { |
| 2391 | FILE *file; |
| 2392 | char *c; |
| 2393 | char *arg; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2394 | int ret = 0; |
| 2395 | int line = 0; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2396 | |
| 2397 | file = fopen(filename, "r"); |
| 2398 | if (!file) { |
| 2399 | memprintf(err, "failed to open pattern file <%s>", filename); |
| 2400 | return 0; |
| 2401 | } |
| 2402 | |
| 2403 | /* now parse all patterns. The file may contain only one pattern per |
| 2404 | * line. If the line contains spaces, they will be part of the pattern. |
| 2405 | * The pattern stops at the first CR, LF or EOF encountered. |
| 2406 | */ |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2407 | while (fgets(trash.area, trash.size, file) != NULL) { |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2408 | line++; |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2409 | c = trash.area; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2410 | |
| 2411 | /* ignore lines beginning with a dash */ |
| 2412 | if (*c == '#') |
| 2413 | continue; |
| 2414 | |
| 2415 | /* strip leading spaces and tabs */ |
| 2416 | while (*c == ' ' || *c == '\t') |
| 2417 | c++; |
| 2418 | |
| 2419 | |
| 2420 | arg = c; |
| 2421 | while (*c && *c != '\n' && *c != '\r') |
| 2422 | c++; |
| 2423 | *c = 0; |
| 2424 | |
| 2425 | /* empty lines are ignored too */ |
| 2426 | if (c == arg) |
| 2427 | continue; |
| 2428 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2429 | if (!pat_ref_append(ref, arg, NULL, line)) { |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2430 | memprintf(err, "out of memory when loading patterns from file <%s>", filename); |
| 2431 | goto out_close; |
| 2432 | } |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2433 | } |
| 2434 | |
Jerome Magnin | 3c79d4b | 2020-01-17 16:09:33 +0100 | [diff] [blame] | 2435 | if (ferror(file)) { |
| 2436 | memprintf(err, "error encountered while reading <%s> : %s", |
| 2437 | filename, strerror(errno)); |
| 2438 | goto out_close; |
| 2439 | } |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2440 | ret = 1; /* success */ |
| 2441 | |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2442 | out_close: |
| 2443 | fclose(file); |
| 2444 | return ret; |
| 2445 | } |
| 2446 | |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2447 | int pattern_read_from_file(struct pattern_head *head, unsigned int refflags, |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2448 | const char *filename, int patflags, int load_smp, |
Thierry FOURNIER | 94580c9 | 2014-02-11 14:36:45 +0100 | [diff] [blame] | 2449 | char **err, const char *file, int line) |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2450 | { |
| 2451 | struct pat_ref *ref; |
| 2452 | struct pattern_expr *expr; |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2453 | struct pat_ref_elt *elt; |
Willy Tarreau | 4deaf39 | 2014-11-26 13:17:03 +0100 | [diff] [blame] | 2454 | int reuse = 0; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2455 | |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2456 | /* Lookup for the existing reference. */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2457 | ref = pat_ref_lookup(filename); |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2458 | |
| 2459 | /* If the reference doesn't exists, create it and load associated file. */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2460 | if (!ref) { |
Thierry FOURNIER | 94580c9 | 2014-02-11 14:36:45 +0100 | [diff] [blame] | 2461 | chunk_printf(&trash, |
| 2462 | "pattern loaded from file '%s' used by %s at file '%s' line %d", |
| 2463 | filename, refflags & PAT_REF_MAP ? "map" : "acl", file, line); |
| 2464 | |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2465 | ref = pat_ref_new(filename, trash.area, refflags); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2466 | if (!ref) { |
| 2467 | memprintf(err, "out of memory"); |
| 2468 | return 0; |
| 2469 | } |
| 2470 | |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2471 | if (load_smp) { |
Thierry FOURNIER | c0bd910 | 2014-01-29 12:32:58 +0100 | [diff] [blame] | 2472 | ref->flags |= PAT_REF_SMP; |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2473 | if (!pat_ref_read_from_file_smp(ref, filename, err)) |
| 2474 | return 0; |
| 2475 | } |
| 2476 | else { |
| 2477 | if (!pat_ref_read_from_file(ref, filename, err)) |
| 2478 | return 0; |
| 2479 | } |
| 2480 | } |
| 2481 | else { |
Thierry FOURNIER | c0bd910 | 2014-01-29 12:32:58 +0100 | [diff] [blame] | 2482 | /* The reference already exists, check the map compatibility. */ |
| 2483 | |
| 2484 | /* If the load require samples and the flag PAT_REF_SMP is not set, |
| 2485 | * the reference doesn't contain sample, and cannot be used. |
| 2486 | */ |
| 2487 | if (load_smp) { |
| 2488 | if (!(ref->flags & PAT_REF_SMP)) { |
| 2489 | memprintf(err, "The file \"%s\" is already used as one column file " |
| 2490 | "and cannot be used by as two column file.", |
| 2491 | filename); |
| 2492 | return 0; |
| 2493 | } |
| 2494 | } |
| 2495 | else { |
| 2496 | /* The load doesn't require samples. If the flag PAT_REF_SMP is |
| 2497 | * set, the reference contains a sample, and cannot be used. |
| 2498 | */ |
| 2499 | if (ref->flags & PAT_REF_SMP) { |
| 2500 | memprintf(err, "The file \"%s\" is already used as two column file " |
| 2501 | "and cannot be used by as one column file.", |
| 2502 | filename); |
| 2503 | return 0; |
| 2504 | } |
| 2505 | } |
| 2506 | |
Thierry FOURNIER | 94580c9 | 2014-02-11 14:36:45 +0100 | [diff] [blame] | 2507 | /* Extends display */ |
| 2508 | chunk_printf(&trash, "%s", ref->display); |
| 2509 | chunk_appendf(&trash, ", by %s at file '%s' line %d", |
| 2510 | refflags & PAT_REF_MAP ? "map" : "acl", file, line); |
| 2511 | free(ref->display); |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2512 | ref->display = strdup(trash.area); |
Thierry FOURNIER | 94580c9 | 2014-02-11 14:36:45 +0100 | [diff] [blame] | 2513 | if (!ref->display) { |
| 2514 | memprintf(err, "out of memory"); |
| 2515 | return 0; |
| 2516 | } |
| 2517 | |
Thierry FOURNIER | c0bd910 | 2014-01-29 12:32:58 +0100 | [diff] [blame] | 2518 | /* Merge flags. */ |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2519 | ref->flags |= refflags; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2520 | } |
| 2521 | |
| 2522 | /* Now, we can loading patterns from the reference. */ |
| 2523 | |
| 2524 | /* Lookup for existing reference in the head. If the reference |
| 2525 | * doesn't exists, create it. |
| 2526 | */ |
| 2527 | expr = pattern_lookup_expr(head, ref); |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 2528 | if (!expr || (expr->mflags != patflags)) { |
Emeric Brun | 7d27f3c | 2017-07-03 17:54:23 +0200 | [diff] [blame] | 2529 | expr = pattern_new_expr(head, ref, patflags, err, &reuse); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2530 | if (!expr) |
| 2531 | return 0; |
| 2532 | } |
| 2533 | |
Thierry FOURNIER | 315ec42 | 2014-11-24 11:14:42 +0100 | [diff] [blame] | 2534 | /* The returned expression may be not empty, because the function |
| 2535 | * "pattern_new_expr" lookup for similar pattern list and can |
| 2536 | * reuse a already filled pattern list. In this case, we can not |
| 2537 | * reload the patterns. |
| 2538 | */ |
| 2539 | if (reuse) |
| 2540 | return 1; |
| 2541 | |
Thierry FOURNIER | 39bef45 | 2014-01-29 13:29:45 +0100 | [diff] [blame] | 2542 | /* Load reference content in the pattern expression. */ |
| 2543 | list_for_each_entry(elt, &ref->head, list) { |
| 2544 | if (!pat_ref_push(elt, expr, patflags, err)) { |
| 2545 | if (elt->line > 0) |
| 2546 | memprintf(err, "%s at line %d of file '%s'", |
| 2547 | *err, elt->line, filename); |
| 2548 | return 0; |
| 2549 | } |
| 2550 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2551 | |
| 2552 | return 1; |
| 2553 | } |
| 2554 | |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2555 | /* This function executes a pattern match on a sample. It applies pattern <expr> |
| 2556 | * to sample <smp>. The function returns NULL if the sample dont match. It returns |
| 2557 | * non-null if the sample match. If <fill> is true and the sample match, the |
| 2558 | * function returns the matched pattern. In many cases, this pattern can be a |
| 2559 | * static buffer. |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2560 | */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2561 | struct pattern *pattern_exec_match(struct pattern_head *head, struct sample *smp, int fill) |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2562 | { |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2563 | struct pattern_expr_list *list; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2564 | struct pattern *pat; |
| 2565 | |
| 2566 | if (!head->match) { |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2567 | if (fill) { |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 2568 | static_pattern.data = NULL; |
Thierry FOURNIER | 6bb53ff | 2014-01-28 15:54:36 +0100 | [diff] [blame] | 2569 | static_pattern.ref = NULL; |
Thierry FOURNIER | e47e4e2 | 2014-04-28 11:18:57 +0200 | [diff] [blame] | 2570 | static_pattern.sflags = 0; |
Thierry FOURNIER | 07ee64e | 2015-07-06 23:43:03 +0200 | [diff] [blame] | 2571 | static_pattern.type = SMP_T_SINT; |
Thierry FOURNIER | 5338eea | 2013-12-16 14:22:13 +0100 | [diff] [blame] | 2572 | static_pattern.val.i = 1; |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2573 | } |
Thierry FOURNIER | 1794fdf | 2014-01-17 15:25:13 +0100 | [diff] [blame] | 2574 | return &static_pattern; |
| 2575 | } |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2576 | |
Thierry FOURNIER | 5d34408 | 2014-01-27 14:19:53 +0100 | [diff] [blame] | 2577 | /* convert input to string */ |
| 2578 | if (!sample_convert(smp, head->expect_type)) |
| 2579 | return NULL; |
| 2580 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2581 | list_for_each_entry(list, &head->head, list) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2582 | HA_RWLOCK_RDLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2583 | pat = head->match(smp, list->expr, fill); |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2584 | if (pat) { |
| 2585 | /* We duplicate the pattern cause it could be modified |
| 2586 | by another thread */ |
| 2587 | if (pat != &static_pattern) { |
| 2588 | memcpy(&static_pattern, pat, sizeof(struct pattern)); |
| 2589 | pat = &static_pattern; |
| 2590 | } |
| 2591 | |
| 2592 | /* We also duplicate the sample data for |
| 2593 | same reason */ |
| 2594 | if (pat->data && (pat->data != &static_sample_data)) { |
Christopher Faulet | 09fdf4b | 2017-11-09 16:14:16 +0100 | [diff] [blame] | 2595 | switch(pat->data->type) { |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2596 | case SMP_T_STR: |
| 2597 | static_sample_data.type = SMP_T_STR; |
| 2598 | static_sample_data.u.str = *get_trash_chunk(); |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2599 | static_sample_data.u.str.data = pat->data->u.str.data; |
| 2600 | if (static_sample_data.u.str.data >= static_sample_data.u.str.size) |
| 2601 | static_sample_data.u.str.data = static_sample_data.u.str.size - 1; |
| 2602 | memcpy(static_sample_data.u.str.area, |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2603 | pat->data->u.str.area, static_sample_data.u.str.data); |
Willy Tarreau | 843b7cb | 2018-07-13 10:54:26 +0200 | [diff] [blame] | 2604 | static_sample_data.u.str.area[static_sample_data.u.str.data] = 0; |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2605 | pat->data = &static_sample_data; |
| 2606 | break; |
| 2607 | |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2608 | case SMP_T_IPV4: |
| 2609 | case SMP_T_IPV6: |
| 2610 | case SMP_T_SINT: |
| 2611 | memcpy(&static_sample_data, pat->data, sizeof(struct sample_data)); |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2612 | pat->data = &static_sample_data; |
| 2613 | break; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2614 | default: |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2615 | /* unimplemented pattern type */ |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2616 | pat->data = NULL; |
Willy Tarreau | 2fc761e | 2020-06-11 16:37:35 +0200 | [diff] [blame] | 2617 | break; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2618 | } |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2619 | } |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2620 | HA_RWLOCK_RDUNLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2621 | return pat; |
Emeric Brun | b5997f7 | 2017-07-03 11:34:05 +0200 | [diff] [blame] | 2622 | } |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2623 | HA_RWLOCK_RDUNLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2624 | } |
| 2625 | return NULL; |
Thierry FOURNIER | ed66c29 | 2013-11-28 11:05:19 +0100 | [diff] [blame] | 2626 | } |
| 2627 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2628 | /* This function prunes the pattern expressions starting at pattern_head <head>. */ |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2629 | void pattern_prune(struct pattern_head *head) |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 2630 | { |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2631 | struct pattern_expr_list *list, *safe; |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2632 | |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2633 | list_for_each_entry_safe(list, safe, &head->head, list) { |
| 2634 | LIST_DEL(&list->list); |
| 2635 | if (list->do_free) { |
| 2636 | LIST_DEL(&list->expr->list); |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2637 | HA_RWLOCK_WRLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2638 | head->prune(list->expr); |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 2639 | HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &list->expr->lock); |
Thierry FOURNIER | c5959fd | 2014-01-20 14:29:33 +0100 | [diff] [blame] | 2640 | free(list->expr); |
| 2641 | } |
| 2642 | free(list); |
Thierry FOURNIER | 1e00d38 | 2014-02-11 11:31:40 +0100 | [diff] [blame] | 2643 | } |
Thierry FOURNIER | 6f7203d | 2014-01-14 16:24:51 +0100 | [diff] [blame] | 2644 | } |
| 2645 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2646 | /* This function searches occurrences of pattern reference element <ref> in |
| 2647 | * expression <expr> and returns a pointer to a pointer of the sample storage. |
| 2648 | * If <ref> is not found, NULL is returned. |
Thierry FOURNIER | 55d0b10 | 2014-01-15 11:25:26 +0100 | [diff] [blame] | 2649 | */ |
Thierry FOURNIER | 12ba0c2 | 2015-08-14 00:02:11 +0200 | [diff] [blame] | 2650 | struct sample_data **pattern_find_smp(struct pattern_expr *expr, struct pat_ref_elt *ref) |
Thierry FOURNIER | 55d0b10 | 2014-01-15 11:25:26 +0100 | [diff] [blame] | 2651 | { |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2652 | struct ebmb_node *node; |
| 2653 | struct pattern_tree *elt; |
| 2654 | struct pattern_list *pat; |
Thierry FOURNIER | 55d0b10 | 2014-01-15 11:25:26 +0100 | [diff] [blame] | 2655 | |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2656 | for (node = ebmb_first(&expr->pattern_tree); |
| 2657 | node; |
| 2658 | node = ebmb_next(node)) { |
| 2659 | elt = container_of(node, struct pattern_tree, node); |
| 2660 | if (elt->ref == ref) |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 2661 | return &elt->data; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2662 | } |
| 2663 | |
| 2664 | for (node = ebmb_first(&expr->pattern_tree_2); |
| 2665 | node; |
| 2666 | node = ebmb_next(node)) { |
| 2667 | elt = container_of(node, struct pattern_tree, node); |
| 2668 | if (elt->ref == ref) |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 2669 | return &elt->data; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2670 | } |
| 2671 | |
| 2672 | list_for_each_entry(pat, &expr->patterns, list) |
| 2673 | if (pat->pat.ref == ref) |
Thierry FOURNIER | 503bb09 | 2015-08-19 08:35:43 +0200 | [diff] [blame] | 2674 | return &pat->pat.data; |
Thierry FOURNIER | e369ca2 | 2014-01-29 16:24:55 +0100 | [diff] [blame] | 2675 | |
| 2676 | return NULL; |
Thierry FOURNIER | 55d0b10 | 2014-01-15 11:25:26 +0100 | [diff] [blame] | 2677 | } |
| 2678 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2679 | /* This function compares two pat_ref** on their unique_id, and returns -1/0/1 |
| 2680 | * depending on their order (suitable for sorting). |
| 2681 | */ |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2682 | static int cmp_pat_ref(const void *_a, const void *_b) |
| 2683 | { |
| 2684 | struct pat_ref * const *a = _a; |
| 2685 | struct pat_ref * const *b = _b; |
| 2686 | |
| 2687 | if ((*a)->unique_id < (*b)->unique_id) |
| 2688 | return -1; |
| 2689 | else if ((*a)->unique_id > (*b)->unique_id) |
| 2690 | return 1; |
| 2691 | return 0; |
| 2692 | } |
| 2693 | |
Willy Tarreau | a5bbaaf | 2020-10-30 16:03:50 +0100 | [diff] [blame] | 2694 | /* This function finalizes the configuration parsing. It sets all the |
| 2695 | * automatic ids. |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2696 | */ |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2697 | int pattern_finalize_config(void) |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2698 | { |
Tim Duesterhus | b584b44 | 2020-03-17 21:08:24 +0100 | [diff] [blame] | 2699 | size_t len = 0; |
| 2700 | size_t unassigned_pos = 0; |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2701 | int next_unique_id = 0; |
Tim Duesterhus | b584b44 | 2020-03-17 21:08:24 +0100 | [diff] [blame] | 2702 | size_t i, j; |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2703 | struct pat_ref *ref, **arr; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2704 | struct list pr = LIST_HEAD_INIT(pr); |
| 2705 | |
Willy Tarreau | 52bf839 | 2020-03-08 00:42:37 +0100 | [diff] [blame] | 2706 | pat_lru_seed = ha_random(); |
Willy Tarreau | f3045d2 | 2015-04-29 16:24:50 +0200 | [diff] [blame] | 2707 | |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2708 | /* Count pat_refs with user defined unique_id and totalt count */ |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2709 | list_for_each_entry(ref, &pattern_reference, list) { |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2710 | len++; |
| 2711 | if (ref->unique_id != -1) |
| 2712 | unassigned_pos++; |
| 2713 | } |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2714 | |
Tim Duesterhus | b584b44 | 2020-03-17 21:08:24 +0100 | [diff] [blame] | 2715 | if (len == 0) { |
| 2716 | return 0; |
| 2717 | } |
| 2718 | |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2719 | arr = calloc(len, sizeof(*arr)); |
| 2720 | if (arr == NULL) { |
| 2721 | ha_alert("Out of memory error.\n"); |
| 2722 | return ERR_ALERT | ERR_FATAL; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2723 | } |
| 2724 | |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2725 | i = 0; |
| 2726 | j = unassigned_pos; |
| 2727 | list_for_each_entry(ref, &pattern_reference, list) { |
| 2728 | if (ref->unique_id != -1) |
| 2729 | arr[i++] = ref; |
| 2730 | else |
| 2731 | arr[j++] = ref; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2732 | } |
| 2733 | |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2734 | /* Sort first segment of array with user-defined unique ids for |
| 2735 | * fast lookup when generating unique ids |
| 2736 | */ |
| 2737 | qsort(arr, unassigned_pos, sizeof(*arr), cmp_pat_ref); |
| 2738 | |
| 2739 | /* Assign unique ids to the rest of the elements */ |
| 2740 | for (i = unassigned_pos; i < len; i++) { |
| 2741 | do { |
| 2742 | arr[i]->unique_id = next_unique_id++; |
| 2743 | } while (bsearch(&arr[i], arr, unassigned_pos, sizeof(*arr), cmp_pat_ref)); |
| 2744 | } |
| 2745 | |
| 2746 | /* Sort complete array */ |
| 2747 | qsort(arr, len, sizeof(*arr), cmp_pat_ref); |
| 2748 | |
| 2749 | /* Convert back to linked list */ |
| 2750 | for (i = 0; i < len; i++) |
| 2751 | LIST_ADDQ(&pr, &arr[i]->list); |
| 2752 | |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2753 | /* swap root */ |
| 2754 | LIST_ADD(&pr, &pattern_reference); |
| 2755 | LIST_DEL(&pr); |
Carl Henrik Lunde | f91ac19 | 2020-02-27 16:45:50 +0100 | [diff] [blame] | 2756 | |
| 2757 | free(arr); |
| 2758 | return 0; |
Thierry FOURNIER | af5a29d | 2014-03-11 14:29:22 +0100 | [diff] [blame] | 2759 | } |
Willy Tarreau | 403bfbb | 2019-10-23 06:59:31 +0200 | [diff] [blame] | 2760 | |
| 2761 | static int pattern_per_thread_lru_alloc() |
| 2762 | { |
| 2763 | if (!global.tune.pattern_cache) |
| 2764 | return 1; |
| 2765 | pat_lru_tree = lru64_new(global.tune.pattern_cache); |
| 2766 | return !!pat_lru_tree; |
| 2767 | } |
| 2768 | |
| 2769 | static void pattern_per_thread_lru_free() |
| 2770 | { |
| 2771 | lru64_destroy(pat_lru_tree); |
| 2772 | } |
| 2773 | |
/* Hook the two functions above into the per-thread alloc/free mechanism.
 * NOTE(review): the REGISTER_PER_THREAD_* macros are defined outside this
 * file; presumably they arrange for the callbacks to be run for each thread
 * at startup and shutdown -- confirm against their definition.
 */
REGISTER_PER_THREAD_ALLOC(pattern_per_thread_lru_alloc);
REGISTER_PER_THREAD_FREE(pattern_per_thread_lru_free);