blob: d4988b172f92b4b9f156b3285858237adfb2d627 [file] [log] [blame]
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001/*
2 * Pattern management functions.
3 *
4 * Copyright 2000-2013 Willy Tarreau <w@1wt.eu>
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
13#include <ctype.h>
14#include <stdio.h>
Jerome Magninb8bd6d72020-01-17 18:01:20 +010015#include <errno.h>
Thierry FOURNIERed66c292013-11-28 11:05:19 +010016
Willy Tarreau4c7e4b72020-05-27 12:58:42 +020017#include <haproxy/api.h>
Willy Tarreau6131d6a2020-06-02 16:48:09 +020018#include <haproxy/net_helper.h>
Willy Tarreau7cd8b6e2020-06-02 17:32:26 +020019#include <haproxy/regex.h>
Willy Tarreau48fbcae2020-06-03 18:09:46 +020020#include <haproxy/tools.h>
Thierry FOURNIERed66c292013-11-28 11:05:19 +010021
22#include <types/global.h>
23#include <types/pattern.h>
24
Thierry FOURNIER46006bd2014-03-21 21:45:15 +010025#include <proto/log.h>
Thierry FOURNIERed66c292013-11-28 11:05:19 +010026#include <proto/pattern.h>
Thierry FOURNIERe3ded592013-12-06 15:36:54 +010027#include <proto/sample.h>
Thierry FOURNIERed66c292013-11-28 11:05:19 +010028
Willy Tarreau8d2b7772020-05-27 10:58:19 +020029#include <import/ebsttree.h>
Willy Tarreauf3045d22015-04-29 16:24:50 +020030#include <import/lru.h>
31#include <import/xxhash.h>
Thierry FOURNIERed66c292013-11-28 11:05:19 +010032
Thierry FOURNIERa65b3432013-11-28 18:22:00 +010033char *pat_match_names[PAT_MATCH_NUM] = {
34 [PAT_MATCH_FOUND] = "found",
35 [PAT_MATCH_BOOL] = "bool",
36 [PAT_MATCH_INT] = "int",
37 [PAT_MATCH_IP] = "ip",
38 [PAT_MATCH_BIN] = "bin",
39 [PAT_MATCH_LEN] = "len",
40 [PAT_MATCH_STR] = "str",
41 [PAT_MATCH_BEG] = "beg",
42 [PAT_MATCH_SUB] = "sub",
43 [PAT_MATCH_DIR] = "dir",
44 [PAT_MATCH_DOM] = "dom",
45 [PAT_MATCH_END] = "end",
46 [PAT_MATCH_REG] = "reg",
Thierry Fournier8feaa662016-02-10 22:55:20 +010047 [PAT_MATCH_REGM] = "regm",
Thierry FOURNIERed66c292013-11-28 11:05:19 +010048};
49
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +020050int (*pat_parse_fcts[PAT_MATCH_NUM])(const char *, struct pattern *, int, char **) = {
Thierry FOURNIERa65b3432013-11-28 18:22:00 +010051 [PAT_MATCH_FOUND] = pat_parse_nothing,
52 [PAT_MATCH_BOOL] = pat_parse_nothing,
53 [PAT_MATCH_INT] = pat_parse_int,
54 [PAT_MATCH_IP] = pat_parse_ip,
55 [PAT_MATCH_BIN] = pat_parse_bin,
Thierry FOURNIER5d344082014-01-27 14:19:53 +010056 [PAT_MATCH_LEN] = pat_parse_int,
Thierry FOURNIERa65b3432013-11-28 18:22:00 +010057 [PAT_MATCH_STR] = pat_parse_str,
58 [PAT_MATCH_BEG] = pat_parse_str,
59 [PAT_MATCH_SUB] = pat_parse_str,
60 [PAT_MATCH_DIR] = pat_parse_str,
61 [PAT_MATCH_DOM] = pat_parse_str,
62 [PAT_MATCH_END] = pat_parse_str,
63 [PAT_MATCH_REG] = pat_parse_reg,
Thierry Fournier8feaa662016-02-10 22:55:20 +010064 [PAT_MATCH_REGM] = pat_parse_reg,
Thierry FOURNIERed66c292013-11-28 11:05:19 +010065};
66
Thierry FOURNIERb9b08462013-12-13 15:12:32 +010067int (*pat_index_fcts[PAT_MATCH_NUM])(struct pattern_expr *, struct pattern *, char **) = {
68 [PAT_MATCH_FOUND] = pat_idx_list_val,
69 [PAT_MATCH_BOOL] = pat_idx_list_val,
70 [PAT_MATCH_INT] = pat_idx_list_val,
71 [PAT_MATCH_IP] = pat_idx_tree_ip,
72 [PAT_MATCH_BIN] = pat_idx_list_ptr,
73 [PAT_MATCH_LEN] = pat_idx_list_val,
74 [PAT_MATCH_STR] = pat_idx_tree_str,
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +020075 [PAT_MATCH_BEG] = pat_idx_tree_pfx,
Thierry FOURNIERb9b08462013-12-13 15:12:32 +010076 [PAT_MATCH_SUB] = pat_idx_list_str,
77 [PAT_MATCH_DIR] = pat_idx_list_str,
78 [PAT_MATCH_DOM] = pat_idx_list_str,
79 [PAT_MATCH_END] = pat_idx_list_str,
80 [PAT_MATCH_REG] = pat_idx_list_reg,
Thierry Fournier8feaa662016-02-10 22:55:20 +010081 [PAT_MATCH_REGM] = pat_idx_list_regm,
Thierry FOURNIERb9b08462013-12-13 15:12:32 +010082};
83
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +010084void (*pat_delete_fcts[PAT_MATCH_NUM])(struct pattern_expr *, struct pat_ref_elt *) = {
Thierry FOURNIERb1136502014-01-15 11:38:49 +010085 [PAT_MATCH_FOUND] = pat_del_list_val,
86 [PAT_MATCH_BOOL] = pat_del_list_val,
87 [PAT_MATCH_INT] = pat_del_list_val,
88 [PAT_MATCH_IP] = pat_del_tree_ip,
89 [PAT_MATCH_BIN] = pat_del_list_ptr,
90 [PAT_MATCH_LEN] = pat_del_list_val,
91 [PAT_MATCH_STR] = pat_del_tree_str,
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +020092 [PAT_MATCH_BEG] = pat_del_tree_str,
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +010093 [PAT_MATCH_SUB] = pat_del_list_ptr,
94 [PAT_MATCH_DIR] = pat_del_list_ptr,
95 [PAT_MATCH_DOM] = pat_del_list_ptr,
96 [PAT_MATCH_END] = pat_del_list_ptr,
Thierry FOURNIERb1136502014-01-15 11:38:49 +010097 [PAT_MATCH_REG] = pat_del_list_reg,
Thierry Fournier8feaa662016-02-10 22:55:20 +010098 [PAT_MATCH_REGM] = pat_del_list_reg,
Thierry FOURNIERb1136502014-01-15 11:38:49 +010099};
100
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +0100101void (*pat_prune_fcts[PAT_MATCH_NUM])(struct pattern_expr *) = {
102 [PAT_MATCH_FOUND] = pat_prune_val,
103 [PAT_MATCH_BOOL] = pat_prune_val,
104 [PAT_MATCH_INT] = pat_prune_val,
105 [PAT_MATCH_IP] = pat_prune_val,
106 [PAT_MATCH_BIN] = pat_prune_ptr,
107 [PAT_MATCH_LEN] = pat_prune_val,
108 [PAT_MATCH_STR] = pat_prune_ptr,
109 [PAT_MATCH_BEG] = pat_prune_ptr,
110 [PAT_MATCH_SUB] = pat_prune_ptr,
111 [PAT_MATCH_DIR] = pat_prune_ptr,
112 [PAT_MATCH_DOM] = pat_prune_ptr,
113 [PAT_MATCH_END] = pat_prune_ptr,
114 [PAT_MATCH_REG] = pat_prune_reg,
Thierry Fournier8feaa662016-02-10 22:55:20 +0100115 [PAT_MATCH_REGM] = pat_prune_reg,
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +0100116};
117
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100118struct pattern *(*pat_match_fcts[PAT_MATCH_NUM])(struct sample *, struct pattern_expr *, int) = {
Thierry FOURNIERa65b3432013-11-28 18:22:00 +0100119 [PAT_MATCH_FOUND] = NULL,
120 [PAT_MATCH_BOOL] = pat_match_nothing,
121 [PAT_MATCH_INT] = pat_match_int,
122 [PAT_MATCH_IP] = pat_match_ip,
123 [PAT_MATCH_BIN] = pat_match_bin,
124 [PAT_MATCH_LEN] = pat_match_len,
125 [PAT_MATCH_STR] = pat_match_str,
126 [PAT_MATCH_BEG] = pat_match_beg,
127 [PAT_MATCH_SUB] = pat_match_sub,
128 [PAT_MATCH_DIR] = pat_match_dir,
129 [PAT_MATCH_DOM] = pat_match_dom,
130 [PAT_MATCH_END] = pat_match_end,
131 [PAT_MATCH_REG] = pat_match_reg,
Thierry Fournier8feaa662016-02-10 22:55:20 +0100132 [PAT_MATCH_REGM] = pat_match_regm,
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100133};
134
Thierry FOURNIERe3ded592013-12-06 15:36:54 +0100135/* Just used for checking configuration compatibility */
136int pat_match_types[PAT_MATCH_NUM] = {
Thierry FOURNIER07ee64e2015-07-06 23:43:03 +0200137 [PAT_MATCH_FOUND] = SMP_T_SINT,
138 [PAT_MATCH_BOOL] = SMP_T_SINT,
139 [PAT_MATCH_INT] = SMP_T_SINT,
Thierry FOURNIERe3ded592013-12-06 15:36:54 +0100140 [PAT_MATCH_IP] = SMP_T_ADDR,
Thierry FOURNIER7654c9f2013-12-17 00:20:33 +0100141 [PAT_MATCH_BIN] = SMP_T_BIN,
142 [PAT_MATCH_LEN] = SMP_T_STR,
143 [PAT_MATCH_STR] = SMP_T_STR,
144 [PAT_MATCH_BEG] = SMP_T_STR,
145 [PAT_MATCH_SUB] = SMP_T_STR,
146 [PAT_MATCH_DIR] = SMP_T_STR,
147 [PAT_MATCH_DOM] = SMP_T_STR,
148 [PAT_MATCH_END] = SMP_T_STR,
149 [PAT_MATCH_REG] = SMP_T_STR,
Thierry Fournier8feaa662016-02-10 22:55:20 +0100150 [PAT_MATCH_REGM] = SMP_T_STR,
Thierry FOURNIERe3ded592013-12-06 15:36:54 +0100151};
152
Thierry FOURNIER1794fdf2014-01-17 15:25:13 +0100153/* this struct is used to return information */
Emeric Brunb5997f72017-07-03 11:34:05 +0200154static THREAD_LOCAL struct pattern static_pattern;
155static THREAD_LOCAL struct sample_data static_sample_data;
Thierry FOURNIER1794fdf2014-01-17 15:25:13 +0100156
Thierry FOURNIER1e00d382014-02-11 11:31:40 +0100157/* This is the root of the list of all pattern_ref avalaibles. */
158struct list pattern_reference = LIST_HEAD_INIT(pattern_reference);
159
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200160static THREAD_LOCAL struct lru64_head *pat_lru_tree;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200161static unsigned long long pat_lru_seed;
162
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100163/*
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100164 *
165 * The following functions are not exported and are used by internals process
166 * of pattern matching
167 *
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100168 */
169
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100170/* Background: Fast way to find a zero byte in a word
171 * http://graphics.stanford.edu/~seander/bithacks.html#ZeroInWord
172 * hasZeroByte = (v - 0x01010101UL) & ~v & 0x80808080UL;
173 *
174 * To look for 4 different byte values, xor the word with those bytes and
175 * then check for zero bytes:
176 *
177 * v = (((unsigned char)c * 0x1010101U) ^ delimiter)
178 * where <delimiter> is the 4 byte values to look for (as an uint)
179 * and <c> is the character that is being tested
180 */
181static inline unsigned int is_delimiter(unsigned char c, unsigned int mask)
182{
183 mask ^= (c * 0x01010101); /* propagate the char to all 4 bytes */
184 return (mask - 0x01010101) & ~mask & 0x80808080U;
185}
186
187static inline unsigned int make_4delim(unsigned char d1, unsigned char d2, unsigned char d3, unsigned char d4)
188{
189 return d1 << 24 | d2 << 16 | d3 << 8 | d4;
190}
191
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100192
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100193/*
194 *
195 * These functions are exported and may be used by any other component.
196 *
Willy Tarreau5def8ef2014-08-29 15:19:33 +0200197 * The following functions are used for parsing pattern matching input value.
198 * The <text> contain the string to be parsed. <pattern> must be a preallocated
199 * pattern. The pat_parse_* functions fill this structure with the parsed value.
200 * <err> is filled with an error message built with memprintf() function. It is
201 * allowed to use a trash as a temporary storage for the returned pattern, as
202 * the next call after these functions will be pat_idx_*.
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100203 *
Willy Tarreau5def8ef2014-08-29 15:19:33 +0200204 * In success case, the pat_parse_* function returns 1. If the function
205 * fails, it returns 0 and <err> is filled.
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100206 */
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100207
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100208/* ignore the current line */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200209int pat_parse_nothing(const char *text, struct pattern *pattern, int mflags, char **err)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100210{
211 return 1;
212}
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100213
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100214/* Parse a string. It is allocated and duplicated. */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200215int pat_parse_str(const char *text, struct pattern *pattern, int mflags, char **err)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100216{
Thierry FOURNIER7654c9f2013-12-17 00:20:33 +0100217 pattern->type = SMP_T_STR;
Thierry FOURNIERedc15c32013-12-13 15:36:59 +0100218 pattern->ptr.str = (char *)text;
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100219 pattern->len = strlen(text);
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100220 return 1;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100221}
222
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100223/* Parse a binary written in hexa. It is allocated. */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200224int pat_parse_bin(const char *text, struct pattern *pattern, int mflags, char **err)
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100225{
Willy Tarreau83061a82018-07-13 11:56:34 +0200226 struct buffer *trash;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100227
Thierry FOURNIER7654c9f2013-12-17 00:20:33 +0100228 pattern->type = SMP_T_BIN;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100229 trash = get_trash_chunk();
230 pattern->len = trash->size;
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200231 pattern->ptr.str = trash->area;
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100232 return !!parse_binary(text, &pattern->ptr.str, &pattern->len, err);
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100233}
234
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100235/* Parse a regex. It is allocated. */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200236int pat_parse_reg(const char *text, struct pattern *pattern, int mflags, char **err)
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100237{
Thierry FOURNIER0b6d15f2014-01-29 19:35:16 +0100238 pattern->ptr.str = (char *)text;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100239 return 1;
240}
241
242/* Parse a range of positive integers delimited by either ':' or '-'. If only
243 * one integer is read, it is set as both min and max. An operator may be
244 * specified as the prefix, among this list of 5 :
245 *
246 * 0:eq, 1:gt, 2:ge, 3:lt, 4:le
247 *
248 * The default operator is "eq". It supports range matching. Ranges are
249 * rejected for other operators. The operator may be changed at any time.
250 * The operator is stored in the 'opaque' argument.
251 *
252 * If err is non-NULL, an error message will be returned there on errors and
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100253 * the caller will have to free it. The function returns zero on error, and
254 * non-zero on success.
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100255 *
256 */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200257int pat_parse_int(const char *text, struct pattern *pattern, int mflags, char **err)
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100258{
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100259 const char *ptr = text;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100260
Thierry FOURNIER07ee64e2015-07-06 23:43:03 +0200261 pattern->type = SMP_T_SINT;
Thierry FOURNIER7148ce62013-12-06 19:06:43 +0100262
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100263 /* Empty string is not valid */
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100264 if (!*text)
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100265 goto not_valid_range;
266
267 /* Search ':' or '-' separator. */
268 while (*ptr != '\0' && *ptr != ':' && *ptr != '-')
269 ptr++;
270
271 /* If separator not found. */
272 if (!*ptr) {
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100273 if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0) {
274 memprintf(err, "'%s' is not a number", text);
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100275 return 0;
276 }
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100277 pattern->val.range.max = pattern->val.range.min;
278 pattern->val.range.min_set = 1;
279 pattern->val.range.max_set = 1;
280 return 1;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100281 }
282
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100283 /* If the separator is the first character. */
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100284 if (ptr == text && *(ptr + 1) != '\0') {
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100285 if (strl2llrc(ptr + 1, strlen(ptr + 1), &pattern->val.range.max) != 0)
286 goto not_valid_range;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100287
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100288 pattern->val.range.min_set = 0;
289 pattern->val.range.max_set = 1;
290 return 1;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100291 }
292
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100293 /* If separator is the last character. */
294 if (*(ptr + 1) == '\0') {
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100295 if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0)
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100296 goto not_valid_range;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100297
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100298 pattern->val.range.min_set = 1;
299 pattern->val.range.max_set = 0;
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100300 return 1;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100301 }
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100302
303 /* Else, parse two numbers. */
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100304 if (strl2llrc(text, ptr - text, &pattern->val.range.min) != 0)
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100305 goto not_valid_range;
306
307 if (strl2llrc(ptr + 1, strlen(ptr + 1), &pattern->val.range.max) != 0)
308 goto not_valid_range;
309
310 if (pattern->val.range.min > pattern->val.range.max)
311 goto not_valid_range;
312
313 pattern->val.range.min_set = 1;
314 pattern->val.range.max_set = 1;
315 return 1;
316
317 not_valid_range:
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100318 memprintf(err, "'%s' is not a valid number range", text);
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100319 return 0;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100320}
321
322/* Parse a range of positive 2-component versions delimited by either ':' or
323 * '-'. The version consists in a major and a minor, both of which must be
324 * smaller than 65536, because internally they will be represented as a 32-bit
325 * integer.
326 * If only one version is read, it is set as both min and max. Just like for
327 * pure integers, an operator may be specified as the prefix, among this list
328 * of 5 :
329 *
330 * 0:eq, 1:gt, 2:ge, 3:lt, 4:le
331 *
332 * The default operator is "eq". It supports range matching. Ranges are
333 * rejected for other operators. The operator may be changed at any time.
334 * The operator is stored in the 'opaque' argument. This allows constructs
335 * such as the following one :
336 *
337 * acl obsolete_ssl ssl_req_proto lt 3
338 * acl unsupported_ssl ssl_req_proto gt 3.1
339 * acl valid_ssl ssl_req_proto 3.0-3.1
340 *
341 */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200342int pat_parse_dotted_ver(const char *text, struct pattern *pattern, int mflags, char **err)
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100343{
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100344 const char *ptr = text;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100345
Thierry FOURNIER07ee64e2015-07-06 23:43:03 +0200346 pattern->type = SMP_T_SINT;
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100347
348 /* Search ':' or '-' separator. */
349 while (*ptr != '\0' && *ptr != ':' && *ptr != '-')
350 ptr++;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100351
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100352 /* If separator not found. */
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100353 if (*ptr == '\0' && ptr > text) {
354 if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) {
355 memprintf(err, "'%s' is not a dotted number", text);
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100356 return 0;
357 }
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100358 pattern->val.range.max = pattern->val.range.min;
359 pattern->val.range.min_set = 1;
360 pattern->val.range.max_set = 1;
361 return 1;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100362 }
363
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100364 /* If the separator is the first character. */
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100365 if (ptr == text && *(ptr+1) != '\0') {
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100366 if (strl2llrc_dotted(ptr+1, strlen(ptr+1), &pattern->val.range.max) != 0) {
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100367 memprintf(err, "'%s' is not a valid dotted number range", text);
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100368 return 0;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100369 }
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100370 pattern->val.range.min_set = 0;
371 pattern->val.range.max_set = 1;
372 return 1;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100373 }
374
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100375 /* If separator is the last character. */
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100376 if (ptr == &text[strlen(text)-1]) {
377 if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) {
378 memprintf(err, "'%s' is not a valid dotted number range", text);
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100379 return 0;
380 }
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100381 pattern->val.range.min_set = 1;
382 pattern->val.range.max_set = 0;
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100383 return 1;
384 }
385
386 /* Else, parse two numbers. */
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100387 if (strl2llrc_dotted(text, ptr-text, &pattern->val.range.min) != 0) {
388 memprintf(err, "'%s' is not a valid dotted number range", text);
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100389 return 0;
390 }
391 if (strl2llrc_dotted(ptr+1, strlen(ptr+1), &pattern->val.range.max) != 0) {
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100392 memprintf(err, "'%s' is not a valid dotted number range", text);
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100393 return 0;
394 }
395 if (pattern->val.range.min > pattern->val.range.max) {
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100396 memprintf(err, "'%s' is not a valid dotted number range", text);
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100397 return 0;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100398 }
Thierry FOURNIER511e9472014-01-23 17:40:34 +0100399 pattern->val.range.min_set = 1;
400 pattern->val.range.max_set = 1;
401 return 1;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100402}
403
404/* Parse an IP address and an optional mask in the form addr[/mask].
405 * The addr may either be an IPv4 address or a hostname. The mask
406 * may either be a dotted mask or a number of bits. Returns 1 if OK,
407 * otherwise 0. NOTE: IP address patterns are typed (IPV4/IPV6).
408 */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200409int pat_parse_ip(const char *text, struct pattern *pattern, int mflags, char **err)
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100410{
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200411 if (str2net(text, !(mflags & PAT_MF_NO_DNS) && (global.mode & MODE_STARTING),
Thierry FOURNIERfc7ac7b2014-02-11 15:23:04 +0100412 &pattern->val.ipv4.addr, &pattern->val.ipv4.mask)) {
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100413 pattern->type = SMP_T_IPV4;
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100414 return 1;
415 }
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100416 else if (str62net(text, &pattern->val.ipv6.addr, &pattern->val.ipv6.mask)) {
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100417 pattern->type = SMP_T_IPV6;
418 return 1;
419 }
420 else {
Thierry FOURNIER580c32c2014-01-24 10:58:12 +0100421 memprintf(err, "'%s' is not a valid IPv4 or IPv6 address", text);
Thierry FOURNIERed66c292013-11-28 11:05:19 +0100422 return 0;
423 }
424}
425
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100426/*
427 *
428 * These functions are exported and may be used by any other component.
429 *
Joseph Herlant4189d672018-11-15 10:22:31 -0800430 * This function just takes a sample <smp> and checks if this sample matches
431 * with the pattern <pattern>. This function returns only PAT_MATCH or
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100432 * PAT_NOMATCH.
433 *
434 */
435
436/* always return false */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100437struct pattern *pat_match_nothing(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100438{
Thierry FOURNIER136f9d32015-08-19 09:07:19 +0200439 if (smp->data.u.sint) {
Thierry FOURNIERe5978bf2014-03-17 19:53:10 +0100440 if (fill) {
Thierry FOURNIER503bb092015-08-19 08:35:43 +0200441 static_pattern.data = NULL;
Thierry FOURNIERe5978bf2014-03-17 19:53:10 +0100442 static_pattern.ref = NULL;
Thierry FOURNIERe5978bf2014-03-17 19:53:10 +0100443 static_pattern.type = 0;
444 static_pattern.ptr.str = NULL;
445 }
446 return &static_pattern;
447 }
448 else
449 return NULL;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100450}
451
452
Joseph Herlant4189d672018-11-15 10:22:31 -0800453/* NB: For two strings to be identical, it is required that their length match */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100454struct pattern *pat_match_str(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100455{
456 int icase;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100457 struct ebmb_node *node;
458 char prev;
459 struct pattern_tree *elt;
460 struct pattern_list *lst;
461 struct pattern *pattern;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200462 struct pattern *ret = NULL;
463 struct lru64 *lru = NULL;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100464
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100465 /* Lookup a string in the expression's pattern tree. */
466 if (!eb_is_empty(&expr->pattern_tree)) {
467 /* we may have to force a trailing zero on the test pattern */
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200468 prev = smp->data.u.str.area[smp->data.u.str.data];
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100469 if (prev)
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200470 smp->data.u.str.area[smp->data.u.str.data] = '\0';
471 node = ebst_lookup(&expr->pattern_tree, smp->data.u.str.area);
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100472 if (prev)
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200473 smp->data.u.str.area[smp->data.u.str.data] = prev;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100474
475 if (node) {
476 if (fill) {
477 elt = ebmb_entry(node, struct pattern_tree, node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +0200478 static_pattern.data = elt->data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +0100479 static_pattern.ref = elt->ref;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200480 static_pattern.sflags = PAT_SF_TREE;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100481 static_pattern.type = SMP_T_STR;
482 static_pattern.ptr.str = (char *)elt->node.key;
483 }
484 return &static_pattern;
485 }
486 }
487
488 /* look in the list */
Willy Tarreauf3045d22015-04-29 16:24:50 +0200489 if (pat_lru_tree) {
Willy Tarreauaee93142015-05-04 17:18:42 +0200490 unsigned long long seed = pat_lru_seed ^ (long)expr;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200491
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200492 lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed),
Willy Tarreauf3045d22015-04-29 16:24:50 +0200493 pat_lru_tree, expr, expr->revision);
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200494 if (lru && lru->domain) {
Emeric Brunb5997f72017-07-03 11:34:05 +0200495 ret = lru->data;
Emeric Brunb5997f72017-07-03 11:34:05 +0200496 return ret;
497 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200498 }
499
Emeric Brunb5997f72017-07-03 11:34:05 +0200500
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100501 list_for_each_entry(lst, &expr->patterns, list) {
502 pattern = &lst->pat;
503
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200504 if (pattern->len != smp->data.u.str.data)
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100505 continue;
506
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200507 icase = expr->mflags & PAT_MF_IGNORE_CASE;
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200508 if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0) ||
509 (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0)) {
Willy Tarreauf3045d22015-04-29 16:24:50 +0200510 ret = pattern;
511 break;
512 }
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100513 }
514
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200515 if (lru)
Emeric Brunb5997f72017-07-03 11:34:05 +0200516 lru64_commit(lru, ret, expr, expr->revision, NULL);
Willy Tarreauf3045d22015-04-29 16:24:50 +0200517
518 return ret;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100519}
520
521/* NB: For two binaries buf to be identical, it is required that their lengths match */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100522struct pattern *pat_match_bin(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100523{
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100524 struct pattern_list *lst;
525 struct pattern *pattern;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200526 struct pattern *ret = NULL;
527 struct lru64 *lru = NULL;
528
529 if (pat_lru_tree) {
Willy Tarreauaee93142015-05-04 17:18:42 +0200530 unsigned long long seed = pat_lru_seed ^ (long)expr;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100531
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200532 lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed),
Willy Tarreauf3045d22015-04-29 16:24:50 +0200533 pat_lru_tree, expr, expr->revision);
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200534 if (lru && lru->domain) {
Emeric Brunb5997f72017-07-03 11:34:05 +0200535 ret = lru->data;
Emeric Brunb5997f72017-07-03 11:34:05 +0200536 return ret;
537 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200538 }
539
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100540 list_for_each_entry(lst, &expr->patterns, list) {
541 pattern = &lst->pat;
542
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200543 if (pattern->len != smp->data.u.str.data)
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100544 continue;
545
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200546 if (memcmp(pattern->ptr.str, smp->data.u.str.area, smp->data.u.str.data) == 0) {
Willy Tarreauf3045d22015-04-29 16:24:50 +0200547 ret = pattern;
548 break;
549 }
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100550 }
551
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200552 if (lru)
Emeric Brunb5997f72017-07-03 11:34:05 +0200553 lru64_commit(lru, ret, expr, expr->revision, NULL);
Willy Tarreauf3045d22015-04-29 16:24:50 +0200554
555 return ret;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100556}
557
558/* Executes a regex. It temporarily changes the data to add a trailing zero,
Thierry Fournier8feaa662016-02-10 22:55:20 +0100559 * and restores the previous character when leaving. This function fills
560 * a matching array.
561 */
562struct pattern *pat_match_regm(struct sample *smp, struct pattern_expr *expr, int fill)
563{
564 struct pattern_list *lst;
565 struct pattern *pattern;
566 struct pattern *ret = NULL;
567
568 list_for_each_entry(lst, &expr->patterns, list) {
569 pattern = &lst->pat;
570
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200571 if (regex_exec_match2(pattern->ptr.reg, smp->data.u.str.area, smp->data.u.str.data,
Thierry Fournier8feaa662016-02-10 22:55:20 +0100572 MAX_MATCH, pmatch, 0)) {
573 ret = pattern;
574 smp->ctx.a[0] = pmatch;
575 break;
576 }
577 }
578
579 return ret;
580}
581
582/* Executes a regex. It temporarily changes the data to add a trailing zero,
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100583 * and restores the previous character when leaving.
584 */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100585struct pattern *pat_match_reg(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100586{
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100587 struct pattern_list *lst;
588 struct pattern *pattern;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200589 struct pattern *ret = NULL;
590 struct lru64 *lru = NULL;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100591
Willy Tarreauf3045d22015-04-29 16:24:50 +0200592 if (pat_lru_tree) {
Willy Tarreauaee93142015-05-04 17:18:42 +0200593 unsigned long long seed = pat_lru_seed ^ (long)expr;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200594
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200595 lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed),
Willy Tarreauf3045d22015-04-29 16:24:50 +0200596 pat_lru_tree, expr, expr->revision);
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200597 if (lru && lru->domain) {
Emeric Brunb5997f72017-07-03 11:34:05 +0200598 ret = lru->data;
Emeric Brunb5997f72017-07-03 11:34:05 +0200599 return ret;
600 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200601 }
602
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100603 list_for_each_entry(lst, &expr->patterns, list) {
604 pattern = &lst->pat;
605
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200606 if (regex_exec2(pattern->ptr.reg, smp->data.u.str.area, smp->data.u.str.data)) {
Willy Tarreauf3045d22015-04-29 16:24:50 +0200607 ret = pattern;
608 break;
609 }
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100610 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200611
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200612 if (lru)
Emeric Brunb5997f72017-07-03 11:34:05 +0200613 lru64_commit(lru, ret, expr, expr->revision, NULL);
Willy Tarreauf3045d22015-04-29 16:24:50 +0200614
615 return ret;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100616}
617
618/* Checks that the pattern matches the beginning of the tested string. */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100619struct pattern *pat_match_beg(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100620{
621 int icase;
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +0200622 struct ebmb_node *node;
623 char prev;
624 struct pattern_tree *elt;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100625 struct pattern_list *lst;
626 struct pattern *pattern;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200627 struct pattern *ret = NULL;
628 struct lru64 *lru = NULL;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100629
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +0200630 /* Lookup a string in the expression's pattern tree. */
631 if (!eb_is_empty(&expr->pattern_tree)) {
632 /* we may have to force a trailing zero on the test pattern */
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200633 prev = smp->data.u.str.area[smp->data.u.str.data];
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +0200634 if (prev)
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200635 smp->data.u.str.area[smp->data.u.str.data] = '\0';
636 node = ebmb_lookup_longest(&expr->pattern_tree,
637 smp->data.u.str.area);
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +0200638 if (prev)
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200639 smp->data.u.str.area[smp->data.u.str.data] = prev;
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +0200640
641 if (node) {
642 if (fill) {
643 elt = ebmb_entry(node, struct pattern_tree, node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +0200644 static_pattern.data = elt->data;
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +0200645 static_pattern.ref = elt->ref;
646 static_pattern.sflags = PAT_SF_TREE;
647 static_pattern.type = SMP_T_STR;
648 static_pattern.ptr.str = (char *)elt->node.key;
649 }
650 return &static_pattern;
651 }
652 }
653
654 /* look in the list */
Willy Tarreauf3045d22015-04-29 16:24:50 +0200655 if (pat_lru_tree) {
Willy Tarreauaee93142015-05-04 17:18:42 +0200656 unsigned long long seed = pat_lru_seed ^ (long)expr;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200657
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200658 lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed),
Willy Tarreauf3045d22015-04-29 16:24:50 +0200659 pat_lru_tree, expr, expr->revision);
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200660 if (lru && lru->domain) {
Emeric Brunb5997f72017-07-03 11:34:05 +0200661 ret = lru->data;
Emeric Brunb5997f72017-07-03 11:34:05 +0200662 return ret;
663 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200664 }
665
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100666 list_for_each_entry(lst, &expr->patterns, list) {
667 pattern = &lst->pat;
668
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200669 if (pattern->len > smp->data.u.str.data)
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100670 continue;
671
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200672 icase = expr->mflags & PAT_MF_IGNORE_CASE;
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200673 if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area, pattern->len) != 0) ||
674 (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area, pattern->len) != 0))
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100675 continue;
676
Willy Tarreauf3045d22015-04-29 16:24:50 +0200677 ret = pattern;
678 break;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100679 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200680
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200681 if (lru)
Emeric Brunb5997f72017-07-03 11:34:05 +0200682 lru64_commit(lru, ret, expr, expr->revision, NULL);
Willy Tarreauf3045d22015-04-29 16:24:50 +0200683
684 return ret;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100685}
686
687/* Checks that the pattern matches the end of the tested string. */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100688struct pattern *pat_match_end(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100689{
690 int icase;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100691 struct pattern_list *lst;
692 struct pattern *pattern;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200693 struct pattern *ret = NULL;
694 struct lru64 *lru = NULL;
695
696 if (pat_lru_tree) {
Willy Tarreauaee93142015-05-04 17:18:42 +0200697 unsigned long long seed = pat_lru_seed ^ (long)expr;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200698
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200699 lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed),
Willy Tarreauf3045d22015-04-29 16:24:50 +0200700 pat_lru_tree, expr, expr->revision);
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200701 if (lru && lru->domain) {
Emeric Brunb5997f72017-07-03 11:34:05 +0200702 ret = lru->data;
Emeric Brunb5997f72017-07-03 11:34:05 +0200703 return ret;
704 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200705 }
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100706
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100707 list_for_each_entry(lst, &expr->patterns, list) {
708 pattern = &lst->pat;
709
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200710 if (pattern->len > smp->data.u.str.data)
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100711 continue;
712
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200713 icase = expr->mflags & PAT_MF_IGNORE_CASE;
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200714 if ((icase && strncasecmp(pattern->ptr.str, smp->data.u.str.area + smp->data.u.str.data - pattern->len, pattern->len) != 0) ||
715 (!icase && strncmp(pattern->ptr.str, smp->data.u.str.area + smp->data.u.str.data - pattern->len, pattern->len) != 0))
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100716 continue;
717
Willy Tarreauf3045d22015-04-29 16:24:50 +0200718 ret = pattern;
719 break;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100720 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200721
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200722 if (lru)
Emeric Brunb5997f72017-07-03 11:34:05 +0200723 lru64_commit(lru, ret, expr, expr->revision, NULL);
Willy Tarreauf3045d22015-04-29 16:24:50 +0200724
725 return ret;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100726}
727
728/* Checks that the pattern is included inside the tested string.
729 * NB: Suboptimal, should be rewritten using a Boyer-Moore method.
730 */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100731struct pattern *pat_match_sub(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100732{
733 int icase;
734 char *end;
735 char *c;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100736 struct pattern_list *lst;
737 struct pattern *pattern;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200738 struct pattern *ret = NULL;
739 struct lru64 *lru = NULL;
740
741 if (pat_lru_tree) {
Willy Tarreauaee93142015-05-04 17:18:42 +0200742 unsigned long long seed = pat_lru_seed ^ (long)expr;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200743
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200744 lru = lru64_get(XXH64(smp->data.u.str.area, smp->data.u.str.data, seed),
Willy Tarreauf3045d22015-04-29 16:24:50 +0200745 pat_lru_tree, expr, expr->revision);
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200746 if (lru && lru->domain) {
Emeric Brunb5997f72017-07-03 11:34:05 +0200747 ret = lru->data;
Emeric Brunb5997f72017-07-03 11:34:05 +0200748 return ret;
749 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200750 }
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100751
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100752 list_for_each_entry(lst, &expr->patterns, list) {
753 pattern = &lst->pat;
754
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200755 if (pattern->len > smp->data.u.str.data)
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100756 continue;
757
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200758 end = smp->data.u.str.area + smp->data.u.str.data - pattern->len;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200759 icase = expr->mflags & PAT_MF_IGNORE_CASE;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100760 if (icase) {
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200761 for (c = smp->data.u.str.area; c <= end; c++) {
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100762 if (tolower(*c) != tolower(*pattern->ptr.str))
763 continue;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200764 if (strncasecmp(pattern->ptr.str, c, pattern->len) == 0) {
765 ret = pattern;
766 goto leave;
767 }
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100768 }
769 } else {
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200770 for (c = smp->data.u.str.area; c <= end; c++) {
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100771 if (*c != *pattern->ptr.str)
772 continue;
Willy Tarreauf3045d22015-04-29 16:24:50 +0200773 if (strncmp(pattern->ptr.str, c, pattern->len) == 0) {
774 ret = pattern;
775 goto leave;
776 }
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100777 }
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100778 }
779 }
Willy Tarreauf3045d22015-04-29 16:24:50 +0200780 leave:
Willy Tarreau403bfbb2019-10-23 06:59:31 +0200781 if (lru)
Emeric Brunb5997f72017-07-03 11:34:05 +0200782 lru64_commit(lru, ret, expr, expr->revision, NULL);
Willy Tarreauf3045d22015-04-29 16:24:50 +0200783
784 return ret;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100785}
786
787/* This one is used by other real functions. It checks that the pattern is
788 * included inside the tested string, but enclosed between the specified
789 * delimiters or at the beginning or end of the string. The delimiters are
790 * provided as an unsigned int made by make_4delim() and match up to 4 different
791 * delimiters. Delimiters are stripped at the beginning and end of the pattern.
792 */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200793static int match_word(struct sample *smp, struct pattern *pattern, int mflags, unsigned int delimiters)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100794{
795 int may_match, icase;
796 char *c, *end;
797 char *ps;
798 int pl;
799
800 pl = pattern->len;
801 ps = pattern->ptr.str;
802
803 while (pl > 0 && is_delimiter(*ps, delimiters)) {
804 pl--;
805 ps++;
806 }
807
808 while (pl > 0 && is_delimiter(ps[pl - 1], delimiters))
809 pl--;
810
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200811 if (pl > smp->data.u.str.data)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100812 return PAT_NOMATCH;
813
814 may_match = 1;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200815 icase = mflags & PAT_MF_IGNORE_CASE;
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200816 end = smp->data.u.str.area + smp->data.u.str.data - pl;
817 for (c = smp->data.u.str.area; c <= end; c++) {
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100818 if (is_delimiter(*c, delimiters)) {
819 may_match = 1;
820 continue;
821 }
822
823 if (!may_match)
824 continue;
825
826 if (icase) {
827 if ((tolower(*c) == tolower(*ps)) &&
828 (strncasecmp(ps, c, pl) == 0) &&
829 (c == end || is_delimiter(c[pl], delimiters)))
830 return PAT_MATCH;
831 } else {
832 if ((*c == *ps) &&
833 (strncmp(ps, c, pl) == 0) &&
834 (c == end || is_delimiter(c[pl], delimiters)))
835 return PAT_MATCH;
836 }
837 may_match = 0;
838 }
839 return PAT_NOMATCH;
840}
841
842/* Checks that the pattern is included inside the tested string, but enclosed
843 * between the delimiters '?' or '/' or at the beginning or end of the string.
844 * Delimiters at the beginning or end of the pattern are ignored.
845 */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100846struct pattern *pat_match_dir(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100847{
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100848 struct pattern_list *lst;
849 struct pattern *pattern;
850
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100851 list_for_each_entry(lst, &expr->patterns, list) {
852 pattern = &lst->pat;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200853 if (match_word(smp, pattern, expr->mflags, make_4delim('/', '?', '?', '?')))
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100854 return pattern;
855 }
856 return NULL;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100857}
858
859/* Checks that the pattern is included inside the tested string, but enclosed
860 * between the delmiters '/', '?', '.' or ":" or at the beginning or end of
861 * the string. Delimiters at the beginning or end of the pattern are ignored.
862 */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100863struct pattern *pat_match_dom(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100864{
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100865 struct pattern_list *lst;
866 struct pattern *pattern;
867
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100868 list_for_each_entry(lst, &expr->patterns, list) {
869 pattern = &lst->pat;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200870 if (match_word(smp, pattern, expr->mflags, make_4delim('/', '?', '.', ':')))
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100871 return pattern;
872 }
873 return NULL;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100874}
875
876/* Checks that the integer in <test> is included between min and max */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100877struct pattern *pat_match_int(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100878{
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100879 struct pattern_list *lst;
880 struct pattern *pattern;
881
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100882 list_for_each_entry(lst, &expr->patterns, list) {
883 pattern = &lst->pat;
Thierry FOURNIER136f9d32015-08-19 09:07:19 +0200884 if ((!pattern->val.range.min_set || pattern->val.range.min <= smp->data.u.sint) &&
885 (!pattern->val.range.max_set || smp->data.u.sint <= pattern->val.range.max))
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100886 return pattern;
887 }
888 return NULL;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100889}
890
891/* Checks that the length of the pattern in <test> is included between min and max */
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100892struct pattern *pat_match_len(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100893{
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100894 struct pattern_list *lst;
895 struct pattern *pattern;
896
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100897 list_for_each_entry(lst, &expr->patterns, list) {
898 pattern = &lst->pat;
Willy Tarreau843b7cb2018-07-13 10:54:26 +0200899 if ((!pattern->val.range.min_set || pattern->val.range.min <= smp->data.u.str.data) &&
900 (!pattern->val.range.max_set || smp->data.u.str.data <= pattern->val.range.max))
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100901 return pattern;
902 }
903 return NULL;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100904}
905
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100906struct pattern *pat_match_ip(struct sample *smp, struct pattern_expr *expr, int fill)
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100907{
908 unsigned int v4; /* in network byte order */
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100909 struct in6_addr tmp6;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100910 struct in_addr *s;
911 struct ebmb_node *node;
912 struct pattern_tree *elt;
913 struct pattern_list *lst;
914 struct pattern *pattern;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100915
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100916 /* The input sample is IPv4. Try to match in the trees. */
Thierry FOURNIER8c542ca2015-08-19 09:00:18 +0200917 if (smp->data.type == SMP_T_IPV4) {
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100918 /* Lookup an IPv4 address in the expression's pattern tree using
919 * the longest match method.
920 */
Thierry FOURNIER136f9d32015-08-19 09:07:19 +0200921 s = &smp->data.u.ipv4;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100922 node = ebmb_lookup_longest(&expr->pattern_tree, &s->s_addr);
923 if (node) {
924 if (fill) {
925 elt = ebmb_entry(node, struct pattern_tree, node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +0200926 static_pattern.data = elt->data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +0100927 static_pattern.ref = elt->ref;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200928 static_pattern.sflags = PAT_SF_TREE;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100929 static_pattern.type = SMP_T_IPV4;
Willy Tarreau296cfd12020-02-25 09:58:41 +0100930 static_pattern.val.ipv4.addr.s_addr = read_u32(elt->node.key);
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100931 if (!cidr2dotted(elt->node.node.pfx, &static_pattern.val.ipv4.mask))
932 return NULL;
933 }
934 return &static_pattern;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100935 }
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100936
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100937 /* The IPv4 sample dont match the IPv4 tree. Convert the IPv4
938 * sample address to IPv6 with the mapping method using the ::ffff:
939 * prefix, and try to lookup in the IPv6 tree.
940 */
941 memset(&tmp6, 0, 10);
Willy Tarreau296cfd12020-02-25 09:58:41 +0100942 write_u16(&tmp6.s6_addr[10], htons(0xffff));
943 write_u32(&tmp6.s6_addr[12], smp->data.u.ipv4.s_addr);
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100944 node = ebmb_lookup_longest(&expr->pattern_tree_2, &tmp6);
945 if (node) {
946 if (fill) {
947 elt = ebmb_entry(node, struct pattern_tree, node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +0200948 static_pattern.data = elt->data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +0100949 static_pattern.ref = elt->ref;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200950 static_pattern.sflags = PAT_SF_TREE;
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100951 static_pattern.type = SMP_T_IPV6;
Willy Tarreau296cfd12020-02-25 09:58:41 +0100952 memcpy(&static_pattern.val.ipv6.addr, elt->node.key, 16);
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100953 static_pattern.val.ipv6.mask = elt->node.node.pfx;
954 }
955 return &static_pattern;
956 }
957 }
Thierry FOURNIER5338eea2013-12-16 14:22:13 +0100958
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100959 /* The input sample is IPv6. Try to match in the trees. */
Thierry FOURNIER8c542ca2015-08-19 09:00:18 +0200960 if (smp->data.type == SMP_T_IPV6) {
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100961 /* Lookup an IPv6 address in the expression's pattern tree using
962 * the longest match method.
963 */
Thierry FOURNIER136f9d32015-08-19 09:07:19 +0200964 node = ebmb_lookup_longest(&expr->pattern_tree_2, &smp->data.u.ipv6);
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100965 if (node) {
966 if (fill) {
967 elt = ebmb_entry(node, struct pattern_tree, node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +0200968 static_pattern.data = elt->data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +0100969 static_pattern.ref = elt->ref;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +0200970 static_pattern.sflags = PAT_SF_TREE;
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100971 static_pattern.type = SMP_T_IPV6;
Willy Tarreau296cfd12020-02-25 09:58:41 +0100972 memcpy(&static_pattern.val.ipv6.addr, elt->node.key, 16);
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100973 static_pattern.val.ipv6.mask = elt->node.node.pfx;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +0100974 }
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100975 return &static_pattern;
976 }
977
978 /* Try to convert 6 to 4 when the start of the ipv6 address match the
979 * following forms :
980 * - ::ffff:ip:v4 (ipv4 mapped)
981 * - ::0000:ip:v4 (old ipv4 mapped)
982 * - 2002:ip:v4:: (6to4)
983 */
Willy Tarreau296cfd12020-02-25 09:58:41 +0100984 if ((read_u64(&smp->data.u.ipv6.s6_addr[0]) == 0 &&
985 (read_u32(&smp->data.u.ipv6.s6_addr[8]) == 0 ||
986 read_u32(&smp->data.u.ipv6.s6_addr[8]) == htonl(0xFFFF))) ||
987 read_u16(&smp->data.u.ipv6.s6_addr[0]) == htons(0x2002)) {
988 if (read_u32(&smp->data.u.ipv6.s6_addr[0]) == 0)
989 v4 = read_u32(&smp->data.u.ipv6.s6_addr[12]);
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100990 else
Willy Tarreau296cfd12020-02-25 09:58:41 +0100991 v4 = htonl((ntohs(read_u16(&smp->data.u.ipv6.s6_addr[2])) << 16) +
992 ntohs(read_u16(&smp->data.u.ipv6.s6_addr[4])));
Thierry FOURNIER33a74332013-12-19 23:54:54 +0100993
994 /* Lookup an IPv4 address in the expression's pattern tree using the longest
995 * match method.
996 */
997 node = ebmb_lookup_longest(&expr->pattern_tree, &v4);
998 if (node) {
999 if (fill) {
1000 elt = ebmb_entry(node, struct pattern_tree, node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001001 static_pattern.data = elt->data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +01001002 static_pattern.ref = elt->ref;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +02001003 static_pattern.sflags = PAT_SF_TREE;
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001004 static_pattern.type = SMP_T_IPV4;
Willy Tarreau296cfd12020-02-25 09:58:41 +01001005 static_pattern.val.ipv4.addr.s_addr = read_u32(elt->node.key);
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001006 if (!cidr2dotted(elt->node.node.pfx, &static_pattern.val.ipv4.mask))
1007 return NULL;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +01001008 }
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001009 return &static_pattern;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +01001010 }
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001011 }
1012 }
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +01001013
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001014 /* Lookup in the list. the list contain only IPv4 patterns */
1015 list_for_each_entry(lst, &expr->patterns, list) {
1016 pattern = &lst->pat;
1017
1018 /* The input sample is IPv4, use it as is. */
Thierry FOURNIER8c542ca2015-08-19 09:00:18 +02001019 if (smp->data.type == SMP_T_IPV4) {
Thierry FOURNIER136f9d32015-08-19 09:07:19 +02001020 v4 = smp->data.u.ipv4.s_addr;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +01001021 }
Thierry FOURNIER8c542ca2015-08-19 09:00:18 +02001022 else if (smp->data.type == SMP_T_IPV6) {
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001023 /* v4 match on a V6 sample. We want to check at least for
1024 * the following forms :
1025 * - ::ffff:ip:v4 (ipv4 mapped)
1026 * - ::0000:ip:v4 (old ipv4 mapped)
1027 * - 2002:ip:v4:: (6to4)
1028 */
Willy Tarreau296cfd12020-02-25 09:58:41 +01001029 if (read_u64(&smp->data.u.ipv6.s6_addr[0]) == 0 &&
1030 (read_u32(&smp->data.u.ipv6.s6_addr[8]) == 0 ||
1031 read_u32(&smp->data.u.ipv6.s6_addr[8]) == htonl(0xFFFF))) {
1032 v4 = read_u32(&smp->data.u.ipv6.s6_addr[12]);
Thierry FOURNIER5338eea2013-12-16 14:22:13 +01001033 }
Willy Tarreau296cfd12020-02-25 09:58:41 +01001034 else if (read_u16(&smp->data.u.ipv6.s6_addr[0]) == htons(0x2002)) {
1035 v4 = htonl((ntohs(read_u16(&smp->data.u.ipv6.s6_addr[2])) << 16) +
1036 ntohs(read_u16(&smp->data.u.ipv6.s6_addr[4])));
Thierry FOURNIER5338eea2013-12-16 14:22:13 +01001037 }
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001038 else
Thierry FOURNIER5338eea2013-12-16 14:22:13 +01001039 continue;
Andreas Seltenreichf0653192016-03-03 20:08:35 +01001040 } else {
1041 /* impossible */
1042 continue;
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001043 }
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +01001044
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001045 /* Check if the input sample match the current pattern. */
1046 if (((v4 ^ pattern->val.ipv4.addr.s_addr) & pattern->val.ipv4.mask.s_addr) == 0)
Thierry FOURNIER5338eea2013-12-16 14:22:13 +01001047 return pattern;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +01001048 }
Thierry FOURNIER5338eea2013-12-16 14:22:13 +01001049 return NULL;
Thierry FOURNIERe7ba2362014-01-21 11:25:41 +01001050}
1051
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001052void free_pattern_tree(struct eb_root *root)
1053{
1054 struct eb_node *node, *next;
Thierry FOURNIERe1bcac52013-12-13 16:09:50 +01001055 struct pattern_tree *elt;
Thierry FOURNIER3ce88c72013-12-09 11:29:46 +01001056
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001057 node = eb_first(root);
1058 while (node) {
1059 next = eb_next(node);
1060 eb_delete(node);
Thierry FOURNIERe1bcac52013-12-13 16:09:50 +01001061 elt = container_of(node, struct pattern_tree, node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001062 free(elt->data);
Thierry FOURNIER3ce88c72013-12-09 11:29:46 +01001063 free(elt);
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001064 node = next;
1065 }
1066}
1067
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01001068void pat_prune_val(struct pattern_expr *expr)
Thierry FOURNIERd163e1c2013-11-28 11:41:23 +01001069{
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01001070 struct pattern_list *pat, *tmp;
1071
1072 list_for_each_entry_safe(pat, tmp, &expr->patterns, list) {
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001073 free(pat->pat.data);
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01001074 free(pat);
1075 }
1076
Thierry FOURNIERd163e1c2013-11-28 11:41:23 +01001077 free_pattern_tree(&expr->pattern_tree);
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001078 free_pattern_tree(&expr->pattern_tree_2);
Thierry FOURNIERd163e1c2013-11-28 11:41:23 +01001079 LIST_INIT(&expr->patterns);
1080}
1081
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01001082void pat_prune_ptr(struct pattern_expr *expr)
1083{
1084 struct pattern_list *pat, *tmp;
1085
1086 list_for_each_entry_safe(pat, tmp, &expr->patterns, list) {
1087 free(pat->pat.ptr.ptr);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001088 free(pat->pat.data);
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01001089 free(pat);
1090 }
1091
1092 free_pattern_tree(&expr->pattern_tree);
1093 free_pattern_tree(&expr->pattern_tree_2);
1094 LIST_INIT(&expr->patterns);
1095}
1096
1097void pat_prune_reg(struct pattern_expr *expr)
1098{
1099 struct pattern_list *pat, *tmp;
1100
1101 list_for_each_entry_safe(pat, tmp, &expr->patterns, list) {
1102 regex_free(pat->pat.ptr.ptr);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001103 free(pat->pat.data);
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01001104 free(pat);
1105 }
1106
1107 free_pattern_tree(&expr->pattern_tree);
1108 free_pattern_tree(&expr->pattern_tree_2);
1109 LIST_INIT(&expr->patterns);
1110}
1111
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001112/*
1113 *
1114 * The following functions are used for the pattern indexation
1115 *
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001116 */
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001117
1118int pat_idx_list_val(struct pattern_expr *expr, struct pattern *pat, char **err)
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001119{
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001120 struct pattern_list *patl;
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001121
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001122 /* allocate pattern */
1123 patl = calloc(1, sizeof(*patl));
1124 if (!patl) {
1125 memprintf(err, "out of memory while indexing pattern");
Thierry FOURNIER972028f2014-01-23 17:53:31 +01001126 return 0;
1127 }
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001128
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001129 /* duplicate pattern */
1130 memcpy(&patl->pat, pat, sizeof(*pat));
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001131
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001132 /* chain pattern in the expression */
1133 LIST_ADDQ(&expr->patterns, &patl->list);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001134 expr->revision = rdtsc();
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001135
1136 /* that's ok */
1137 return 1;
1138}
1139
1140int pat_idx_list_ptr(struct pattern_expr *expr, struct pattern *pat, char **err)
1141{
1142 struct pattern_list *patl;
1143
1144 /* allocate pattern */
1145 patl = calloc(1, sizeof(*patl));
Thierry FOURNIER8aa83842015-02-06 17:50:55 +01001146 if (!patl) {
1147 memprintf(err, "out of memory while indexing pattern");
Thierry FOURNIER972028f2014-01-23 17:53:31 +01001148 return 0;
Thierry FOURNIER8aa83842015-02-06 17:50:55 +01001149 }
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001150
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001151 /* duplicate pattern */
1152 memcpy(&patl->pat, pat, sizeof(*pat));
1153 patl->pat.ptr.ptr = malloc(patl->pat.len);
1154 if (!patl->pat.ptr.ptr) {
1155 free(patl);
1156 memprintf(err, "out of memory while indexing pattern");
1157 return 0;
1158 }
1159 memcpy(patl->pat.ptr.ptr, pat->ptr.ptr, pat->len);
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001160
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001161 /* chain pattern in the expression */
1162 LIST_ADDQ(&expr->patterns, &patl->list);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001163 expr->revision = rdtsc();
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001164
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001165 /* that's ok */
1166 return 1;
1167}
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001168
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001169int pat_idx_list_str(struct pattern_expr *expr, struct pattern *pat, char **err)
1170{
1171 struct pattern_list *patl;
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001172
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001173 /* allocate pattern */
1174 patl = calloc(1, sizeof(*patl));
1175 if (!patl) {
1176 memprintf(err, "out of memory while indexing pattern");
1177 return 0;
1178 }
1179
1180 /* duplicate pattern */
1181 memcpy(&patl->pat, pat, sizeof(*pat));
1182 patl->pat.ptr.str = malloc(patl->pat.len + 1);
1183 if (!patl->pat.ptr.str) {
1184 free(patl);
1185 memprintf(err, "out of memory while indexing pattern");
1186 return 0;
1187 }
1188 memcpy(patl->pat.ptr.ptr, pat->ptr.ptr, pat->len);
1189 patl->pat.ptr.str[patl->pat.len] = '\0';
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001190
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001191 /* chain pattern in the expression */
1192 LIST_ADDQ(&expr->patterns, &patl->list);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001193 expr->revision = rdtsc();
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001194
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001195 /* that's ok */
1196 return 1;
1197}
1198
Thierry Fournier8feaa662016-02-10 22:55:20 +01001199int pat_idx_list_reg_cap(struct pattern_expr *expr, struct pattern *pat, int cap, char **err)
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001200{
1201 struct pattern_list *patl;
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001202
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001203 /* allocate pattern */
1204 patl = calloc(1, sizeof(*patl));
1205 if (!patl) {
1206 memprintf(err, "out of memory while indexing pattern");
1207 return 0;
Thierry FOURNIER972028f2014-01-23 17:53:31 +01001208 }
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001209
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001210 /* duplicate pattern */
1211 memcpy(&patl->pat, pat, sizeof(*pat));
1212
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001213 /* compile regex */
Dragan Dosen26743032019-04-30 15:54:36 +02001214 if (!(patl->pat.ptr.reg = regex_comp(pat->ptr.str, !(expr->mflags & PAT_MF_IGNORE_CASE),
1215 cap, err))) {
Dirkjan Bussink07fcaaa2014-04-28 22:57:16 +00001216 free(patl);
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001217 return 0;
1218 }
1219
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001220 /* chain pattern in the expression */
1221 LIST_ADDQ(&expr->patterns, &patl->list);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001222 expr->revision = rdtsc();
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001223
1224 /* that's ok */
1225 return 1;
1226}
1227
Thierry Fournier8feaa662016-02-10 22:55:20 +01001228int pat_idx_list_reg(struct pattern_expr *expr, struct pattern *pat, char **err)
1229{
1230 return pat_idx_list_reg_cap(expr, pat, 0, err);
1231}
1232
1233int pat_idx_list_regm(struct pattern_expr *expr, struct pattern *pat, char **err)
1234{
1235 return pat_idx_list_reg_cap(expr, pat, 1, err);
1236}
1237
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001238int pat_idx_tree_ip(struct pattern_expr *expr, struct pattern *pat, char **err)
1239{
1240 unsigned int mask;
Thierry FOURNIERe1bcac52013-12-13 16:09:50 +01001241 struct pattern_tree *node;
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001242
1243 /* Only IPv4 can be indexed */
1244 if (pat->type == SMP_T_IPV4) {
Thierry FOURNIER972028f2014-01-23 17:53:31 +01001245 /* in IPv4 case, check if the mask is contiguous so that we can
1246 * insert the network into the tree. A continuous mask has only
1247 * ones on the left. This means that this mask + its lower bit
1248 * added once again is null.
1249 */
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001250 mask = ntohl(pat->val.ipv4.mask.s_addr);
1251 if (mask + (mask & -mask) == 0) {
1252 mask = mask ? 33 - flsnz(mask & -mask) : 0; /* equals cidr value */
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001253
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001254 /* node memory allocation */
1255 node = calloc(1, sizeof(*node) + 4);
1256 if (!node) {
1257 memprintf(err, "out of memory while loading pattern");
1258 return 0;
1259 }
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001260
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001261 /* copy the pointer to sample associated to this node */
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001262 node->data = pat->data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +01001263 node->ref = pat->ref;
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001264
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001265 /* FIXME: insert <addr>/<mask> into the tree here */
1266 memcpy(node->node.key, &pat->val.ipv4.addr, 4); /* network byte order */
1267 node->node.node.pfx = mask;
Thierry FOURNIER31db4ae2014-01-30 00:27:15 +01001268
1269 /* Insert the entry. */
1270 ebmb_insert_prefix(&expr->pattern_tree, &node->node, 4);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001271 expr->revision = rdtsc();
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001272
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001273 /* that's ok */
1274 return 1;
1275 }
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001276 else {
1277 /* If the mask is not contiguous, just add the pattern to the list */
1278 return pat_idx_list_val(expr, pat, err);
1279 }
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001280 }
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001281 else if (pat->type == SMP_T_IPV6) {
1282 /* IPv6 also can be indexed */
1283 node = calloc(1, sizeof(*node) + 16);
1284 if (!node) {
1285 memprintf(err, "out of memory while loading pattern");
1286 return 0;
1287 }
1288
1289 /* copy the pointer to sample associated to this node */
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001290 node->data = pat->data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +01001291 node->ref = pat->ref;
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001292
1293 /* FIXME: insert <addr>/<mask> into the tree here */
1294 memcpy(node->node.key, &pat->val.ipv6.addr, 16); /* network byte order */
1295 node->node.node.pfx = pat->val.ipv6.mask;
Thierry FOURNIER31db4ae2014-01-30 00:27:15 +01001296
1297 /* Insert the entry. */
1298 ebmb_insert_prefix(&expr->pattern_tree_2, &node->node, 16);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001299 expr->revision = rdtsc();
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001300
1301 /* that's ok */
1302 return 1;
1303 }
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001304
Thierry FOURNIER33a74332013-12-19 23:54:54 +01001305 return 0;
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001306}
1307
1308int pat_idx_tree_str(struct pattern_expr *expr, struct pattern *pat, char **err)
1309{
1310 int len;
Thierry FOURNIERe1bcac52013-12-13 16:09:50 +01001311 struct pattern_tree *node;
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001312
1313 /* Only string can be indexed */
Thierry FOURNIER7654c9f2013-12-17 00:20:33 +01001314 if (pat->type != SMP_T_STR) {
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001315 memprintf(err, "internal error: string expected, but the type is '%s'",
1316 smp_to_type[pat->type]);
1317 return 0;
Thierry FOURNIER972028f2014-01-23 17:53:31 +01001318 }
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001319
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001320 /* If the flag PAT_F_IGNORE_CASE is set, we cannot use trees */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +02001321 if (expr->mflags & PAT_MF_IGNORE_CASE)
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001322 return pat_idx_list_str(expr, pat, err);
Thierry FOURNIER7148ce62013-12-06 19:06:43 +01001323
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001324 /* Process the key len */
1325 len = strlen(pat->ptr.str) + 1;
1326
1327 /* node memory allocation */
1328 node = calloc(1, sizeof(*node) + len);
1329 if (!node) {
1330 memprintf(err, "out of memory while loading pattern");
1331 return 0;
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001332 }
1333
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001334 /* copy the pointer to sample associated to this node */
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001335 node->data = pat->data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +01001336 node->ref = pat->ref;
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001337
1338 /* copy the string */
1339 memcpy(node->node.key, pat->ptr.str, len);
1340
1341 /* index the new node */
Thierry FOURNIER31db4ae2014-01-30 00:27:15 +01001342 ebst_insert(&expr->pattern_tree, &node->node);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001343 expr->revision = rdtsc();
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001344
1345 /* that's ok */
Thierry FOURNIERed66c292013-11-28 11:05:19 +01001346 return 1;
1347}
1348
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +02001349int pat_idx_tree_pfx(struct pattern_expr *expr, struct pattern *pat, char **err)
1350{
1351 int len;
1352 struct pattern_tree *node;
1353
1354 /* Only string can be indexed */
1355 if (pat->type != SMP_T_STR) {
1356 memprintf(err, "internal error: string expected, but the type is '%s'",
1357 smp_to_type[pat->type]);
1358 return 0;
1359 }
1360
1361 /* If the flag PAT_F_IGNORE_CASE is set, we cannot use trees */
1362 if (expr->mflags & PAT_MF_IGNORE_CASE)
1363 return pat_idx_list_str(expr, pat, err);
1364
1365 /* Process the key len */
1366 len = strlen(pat->ptr.str);
1367
1368 /* node memory allocation */
1369 node = calloc(1, sizeof(*node) + len + 1);
1370 if (!node) {
1371 memprintf(err, "out of memory while loading pattern");
1372 return 0;
1373 }
1374
1375 /* copy the pointer to sample associated to this node */
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001376 node->data = pat->data;
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +02001377 node->ref = pat->ref;
1378
1379 /* copy the string and the trailing zero */
1380 memcpy(node->node.key, pat->ptr.str, len + 1);
1381 node->node.node.pfx = len * 8;
1382
1383 /* index the new node */
1384 ebmb_insert_prefix(&expr->pattern_tree, &node->node, len);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001385 expr->revision = rdtsc();
Willy Tarreaub1dd9bf2014-05-10 08:53:48 +02001386
1387 /* that's ok */
1388 return 1;
1389}
1390
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001391void pat_del_list_val(struct pattern_expr *expr, struct pat_ref_elt *ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001392{
1393 struct pattern_list *pat;
1394 struct pattern_list *safe;
1395
1396 list_for_each_entry_safe(pat, safe, &expr->patterns, list) {
1397 /* Check equality. */
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001398 if (pat->pat.ref != ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001399 continue;
1400
1401 /* Delete and free entry. */
1402 LIST_DEL(&pat->list);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001403 free(pat->pat.data);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001404 free(pat);
1405 }
Willy Tarreau72f073b2015-04-29 17:53:47 +02001406 expr->revision = rdtsc();
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001407}
1408
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001409void pat_del_tree_ip(struct pattern_expr *expr, struct pat_ref_elt *ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001410{
1411 struct ebmb_node *node, *next_node;
1412 struct pattern_tree *elt;
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001413
1414 /* browse each node of the tree for IPv4 addresses. */
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001415 for (node = ebmb_first(&expr->pattern_tree), next_node = node ? ebmb_next(node) : NULL;
1416 node;
1417 node = next_node, next_node = node ? ebmb_next(node) : NULL) {
1418 /* Extract container of the tree node. */
1419 elt = container_of(node, struct pattern_tree, node);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001420
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001421 /* Check equality. */
1422 if (elt->ref != ref)
1423 continue;
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001424
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001425 /* Delete and free entry. */
1426 ebmb_delete(node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001427 free(elt->data);
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001428 free(elt);
1429 }
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001430
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001431 /* Browse each node of the list for IPv4 addresses. */
1432 pat_del_list_val(expr, ref);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001433
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001434 /* browse each node of the tree for IPv6 addresses. */
1435 for (node = ebmb_first(&expr->pattern_tree_2), next_node = node ? ebmb_next(node) : NULL;
1436 node;
1437 node = next_node, next_node = node ? ebmb_next(node) : NULL) {
1438 /* Extract container of the tree node. */
1439 elt = container_of(node, struct pattern_tree, node);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001440
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001441 /* Check equality. */
1442 if (elt->ref != ref)
1443 continue;
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001444
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001445 /* Delete and free entry. */
1446 ebmb_delete(node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001447 free(elt->data);
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001448 free(elt);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001449 }
Willy Tarreau72f073b2015-04-29 17:53:47 +02001450 expr->revision = rdtsc();
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001451}
1452
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001453void pat_del_list_ptr(struct pattern_expr *expr, struct pat_ref_elt *ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001454{
1455 struct pattern_list *pat;
1456 struct pattern_list *safe;
1457
1458 list_for_each_entry_safe(pat, safe, &expr->patterns, list) {
1459 /* Check equality. */
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001460 if (pat->pat.ref != ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001461 continue;
1462
1463 /* Delete and free entry. */
1464 LIST_DEL(&pat->list);
1465 free(pat->pat.ptr.ptr);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001466 free(pat->pat.data);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001467 free(pat);
1468 }
Willy Tarreau72f073b2015-04-29 17:53:47 +02001469 expr->revision = rdtsc();
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001470}
1471
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001472void pat_del_tree_str(struct pattern_expr *expr, struct pat_ref_elt *ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001473{
1474 struct ebmb_node *node, *next_node;
1475 struct pattern_tree *elt;
1476
Thierry FOURNIER73bc2852015-02-06 17:53:54 +01001477 /* If the flag PAT_F_IGNORE_CASE is set, we cannot use trees */
1478 if (expr->mflags & PAT_MF_IGNORE_CASE)
1479 return pat_del_list_ptr(expr, ref);
1480
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001481 /* browse each node of the tree. */
1482 for (node = ebmb_first(&expr->pattern_tree), next_node = node ? ebmb_next(node) : NULL;
1483 node;
1484 node = next_node, next_node = node ? ebmb_next(node) : NULL) {
1485 /* Extract container of the tree node. */
1486 elt = container_of(node, struct pattern_tree, node);
1487
1488 /* Check equality. */
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001489 if (elt->ref != ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001490 continue;
1491
1492 /* Delete and free entry. */
1493 ebmb_delete(node);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001494 free(elt->data);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001495 free(elt);
1496 }
Willy Tarreau72f073b2015-04-29 17:53:47 +02001497 expr->revision = rdtsc();
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001498}
1499
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001500void pat_del_list_reg(struct pattern_expr *expr, struct pat_ref_elt *ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001501{
1502 struct pattern_list *pat;
1503 struct pattern_list *safe;
1504
1505 list_for_each_entry_safe(pat, safe, &expr->patterns, list) {
1506 /* Check equality. */
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001507 if (pat->pat.ref != ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001508 continue;
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001509
1510 /* Delete and free entry. */
1511 LIST_DEL(&pat->list);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001512 regex_free(pat->pat.ptr.ptr);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001513 free(pat->pat.data);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001514 free(pat);
1515 }
Willy Tarreau72f073b2015-04-29 17:53:47 +02001516 expr->revision = rdtsc();
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001517}
1518
1519void pattern_init_expr(struct pattern_expr *expr)
1520{
1521 LIST_INIT(&expr->patterns);
Willy Tarreau72f073b2015-04-29 17:53:47 +02001522 expr->revision = 0;
Thierry FOURNIER31db4ae2014-01-30 00:27:15 +01001523 expr->pattern_tree = EB_ROOT;
1524 expr->pattern_tree_2 = EB_ROOT;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001525}
1526
1527void pattern_init_head(struct pattern_head *head)
1528{
1529 LIST_INIT(&head->head);
1530}
1531
1532/* The following functions are relative to the management of the reference
1533 * lists. These lists are used to store the original pattern and associated
1534 * value as string form.
1535 *
1536 * This is used with modifiable ACL and MAPS
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01001537 *
1538 * The pattern reference are stored with two identifiers: the unique_id and
1539 * the reference.
1540 *
1541 * The reference identify a file. Each file with the same name point to the
1542 * same reference. We can register many times one file. If the file is modified,
1543 * all his dependencies are also modified. The reference can be used with map or
1544 * acl.
1545 *
1546 * The unique_id identify inline acl. The unique id is unique for each acl.
1547 * You cannot force the same id in the configuration file, because this repoort
1548 * an error.
1549 *
1550 * A particular case appears if the filename is a number. In this case, the
1551 * unique_id is set with the number represented by the filename and the
1552 * reference is also set. This method prevent double unique_id.
1553 *
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001554 */
1555
1556/* This function lookup for reference. If the reference is found, they return
1557 * pointer to the struct pat_ref, else return NULL.
1558 */
1559struct pat_ref *pat_ref_lookup(const char *reference)
1560{
1561 struct pat_ref *ref;
1562
1563 list_for_each_entry(ref, &pattern_reference, list)
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01001564 if (ref->reference && strcmp(reference, ref->reference) == 0)
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001565 return ref;
1566 return NULL;
1567}
1568
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01001569/* This function lookup for unique id. If the reference is found, they return
1570 * pointer to the struct pat_ref, else return NULL.
1571 */
1572struct pat_ref *pat_ref_lookupid(int unique_id)
1573{
1574 struct pat_ref *ref;
1575
1576 list_for_each_entry(ref, &pattern_reference, list)
1577 if (ref->unique_id == unique_id)
1578 return ref;
1579 return NULL;
1580}
1581
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001582/* This function remove all pattern matching the pointer <refelt> from
1583 * the the reference and from each expr member of the reference. This
1584 * function returns 1 if the deletion is done and return 0 is the entry
1585 * is not found.
1586 */
1587int pat_ref_delete_by_id(struct pat_ref *ref, struct pat_ref_elt *refelt)
1588{
1589 struct pattern_expr *expr;
1590 struct pat_ref_elt *elt, *safe;
Emeric Brun8d85aa42017-06-29 15:40:33 +02001591 struct bref *bref, *back;
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001592
1593 /* delete pattern from reference */
1594 list_for_each_entry_safe(elt, safe, &ref->head, list) {
1595 if (elt == refelt) {
Emeric Brun8d85aa42017-06-29 15:40:33 +02001596 list_for_each_entry_safe(bref, back, &elt->back_refs, users) {
1597 /*
1598 * we have to unlink all watchers. We must not relink them if
1599 * this elt was the last one in the list.
1600 */
1601 LIST_DEL(&bref->users);
1602 LIST_INIT(&bref->users);
1603 if (elt->list.n != &ref->head)
Willy Tarreau49ee3b22019-04-30 11:43:43 +02001604 LIST_ADDQ(&LIST_ELEM(elt->list.n, typeof(elt), list)->back_refs, &bref->users);
Emeric Brun8d85aa42017-06-29 15:40:33 +02001605 bref->ref = elt->list.n;
1606 }
peter caiaede6dd2015-10-07 00:07:43 -07001607 list_for_each_entry(expr, &ref->pat, list)
1608 pattern_delete(expr, elt);
1609
Emeric Brunb5997f72017-07-03 11:34:05 +02001610 /* pat_ref_elt is trashed once all expr
1611 are cleaned and there is no ref remaining */
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001612 LIST_DEL(&elt->list);
1613 free(elt->sample);
1614 free(elt->pattern);
1615 free(elt);
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001616 return 1;
1617 }
1618 }
1619 return 0;
1620}
1621
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001622/* This function remove all pattern match <key> from the the reference
Joseph Herlant4189d672018-11-15 10:22:31 -08001623 * and from each expr member of the reference. This function returns 1
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001624 * if the deletion is done and return 0 is the entry is not found.
1625 */
1626int pat_ref_delete(struct pat_ref *ref, const char *key)
1627{
1628 struct pattern_expr *expr;
1629 struct pat_ref_elt *elt, *safe;
Emeric Brun8d85aa42017-06-29 15:40:33 +02001630 struct bref *bref, *back;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001631 int found = 0;
1632
1633 /* delete pattern from reference */
1634 list_for_each_entry_safe(elt, safe, &ref->head, list) {
1635 if (strcmp(key, elt->pattern) == 0) {
Emeric Brun8d85aa42017-06-29 15:40:33 +02001636 list_for_each_entry_safe(bref, back, &elt->back_refs, users) {
1637 /*
1638 * we have to unlink all watchers. We must not relink them if
1639 * this elt was the last one in the list.
1640 */
1641 LIST_DEL(&bref->users);
1642 LIST_INIT(&bref->users);
1643 if (elt->list.n != &ref->head)
Willy Tarreau49ee3b22019-04-30 11:43:43 +02001644 LIST_ADDQ(&LIST_ELEM(elt->list.n, typeof(elt), list)->back_refs, &bref->users);
Emeric Brun8d85aa42017-06-29 15:40:33 +02001645 bref->ref = elt->list.n;
1646 }
Dirkjan Bussink07fcaaa2014-04-28 22:57:16 +00001647 list_for_each_entry(expr, &ref->pat, list)
1648 pattern_delete(expr, elt);
1649
Emeric Brunb5997f72017-07-03 11:34:05 +02001650 /* pat_ref_elt is trashed once all expr
1651 are cleaned and there is no ref remaining */
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001652 LIST_DEL(&elt->list);
1653 free(elt->sample);
1654 free(elt->pattern);
1655 free(elt);
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01001656
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001657 found = 1;
1658 }
1659 }
1660
1661 if (!found)
1662 return 0;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001663 return 1;
1664}
1665
Baptiste Assmann953f74d2014-04-25 16:57:03 +02001666/*
1667 * find and return an element <elt> matching <key> in a reference <ref>
1668 * return NULL if not found
1669 */
1670struct pat_ref_elt *pat_ref_find_elt(struct pat_ref *ref, const char *key)
1671{
1672 struct pat_ref_elt *elt;
1673
1674 list_for_each_entry(elt, &ref->head, list) {
1675 if (strcmp(key, elt->pattern) == 0)
1676 return elt;
1677 }
1678
1679 return NULL;
1680}
1681
1682
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001683 /* This function modify the sample of the first pattern that match the <key>. */
1684static inline int pat_ref_set_elt(struct pat_ref *ref, struct pat_ref_elt *elt,
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001685 const char *value, char **err)
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001686{
1687 struct pattern_expr *expr;
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001688 struct sample_data **data;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001689 char *sample;
Thierry FOURNIER12ba0c22015-08-14 00:02:11 +02001690 struct sample_data test;
Thierry FOURNIER149e0fe2014-01-29 19:35:06 +01001691
1692 /* Try all needed converters. */
1693 list_for_each_entry(expr, &ref->pat, list) {
1694 if (!expr->pat_head->parse_smp)
1695 continue;
1696
1697 if (!expr->pat_head->parse_smp(value, &test)) {
1698 memprintf(err, "unable to parse '%s'", value);
1699 return 0;
1700 }
1701 }
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001702
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001703 /* Modify pattern from reference. */
1704 sample = strdup(value);
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001705 if (!sample) {
1706 memprintf(err, "out of memory error");
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001707 return 0;
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001708 }
Thierry FOURNIER149e0fe2014-01-29 19:35:06 +01001709 /* Load sample in each reference. All the conversion are tested
1710 * below, normally these calls dosn't fail.
1711 */
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01001712 list_for_each_entry(expr, &ref->pat, list) {
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001713 if (!expr->pat_head->parse_smp)
1714 continue;
1715
Christopher Faulet2a944ee2017-11-07 10:42:54 +01001716 HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001717 data = pattern_find_smp(expr, elt);
1718 if (data && *data && !expr->pat_head->parse_smp(sample, *data))
1719 *data = NULL;
Christopher Faulet2a944ee2017-11-07 10:42:54 +01001720 HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001721 }
1722
Emeric Brunb5997f72017-07-03 11:34:05 +02001723 /* free old sample only when all exprs are updated */
1724 free(elt->sample);
1725 elt->sample = sample;
1726
1727
Thierry FOURNIER149e0fe2014-01-29 19:35:06 +01001728 return 1;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001729}
1730
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001731/* This function modify the sample of the first pattern that match the <key>. */
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001732int pat_ref_set_by_id(struct pat_ref *ref, struct pat_ref_elt *refelt, const char *value, char **err)
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001733{
1734 struct pat_ref_elt *elt;
1735
1736 /* Look for pattern in the reference. */
1737 list_for_each_entry(elt, &ref->head, list) {
1738 if (elt == refelt) {
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001739 if (!pat_ref_set_elt(ref, elt, value, err))
1740 return 0;
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001741 return 1;
1742 }
1743 }
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001744
1745 memprintf(err, "key or pattern not found");
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001746 return 0;
1747}
1748
1749/* This function modify the sample of the first pattern that match the <key>. */
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001750int pat_ref_set(struct pat_ref *ref, const char *key, const char *value, char **err)
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001751{
1752 struct pat_ref_elt *elt;
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001753 int found = 0;
1754 char *_merr;
1755 char **merr;
1756
1757 if (err) {
1758 merr = &_merr;
1759 *merr = NULL;
1760 }
1761 else
1762 merr = NULL;
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001763
1764 /* Look for pattern in the reference. */
1765 list_for_each_entry(elt, &ref->head, list) {
1766 if (strcmp(key, elt->pattern) == 0) {
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001767 if (!pat_ref_set_elt(ref, elt, value, merr)) {
William Lallemand579fb252018-06-11 10:53:46 +02001768 if (err && merr) {
1769 if (!found) {
1770 *err = *merr;
1771 } else {
1772 memprintf(err, "%s, %s", *err, *merr);
1773 free(*merr);
1774 *merr = NULL;
1775 }
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001776 }
1777 }
1778 found = 1;
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001779 }
1780 }
Thierry FOURNIER364cfdf2014-01-29 19:08:49 +01001781
1782 if (!found) {
1783 memprintf(err, "entry not found");
1784 return 0;
1785 }
1786 return 1;
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01001787}
1788
Joseph Herlant4189d672018-11-15 10:22:31 -08001789/* This function creates a new reference. <ref> is the reference name.
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001790 * <flags> are PAT_REF_*. /!\ The reference is not checked, and must
1791 * be unique. The user must check the reference with "pat_ref_lookup()"
Joseph Herlant4189d672018-11-15 10:22:31 -08001792 * before calling this function. If the function fail, it return NULL,
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001793 * else return new struct pat_ref.
1794 */
Thierry FOURNIER0d6ba512014-02-11 03:31:34 +01001795struct pat_ref *pat_ref_new(const char *reference, const char *display, unsigned int flags)
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001796{
1797 struct pat_ref *ref;
1798
1799 ref = malloc(sizeof(*ref));
1800 if (!ref)
1801 return NULL;
1802
Thierry FOURNIER0d6ba512014-02-11 03:31:34 +01001803 if (display) {
1804 ref->display = strdup(display);
1805 if (!ref->display) {
1806 free(ref);
1807 return NULL;
1808 }
1809 }
1810 else
1811 ref->display = NULL;
1812
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001813 ref->reference = strdup(reference);
1814 if (!ref->reference) {
Thierry FOURNIER0d6ba512014-02-11 03:31:34 +01001815 free(ref->display);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001816 free(ref);
1817 return NULL;
1818 }
1819
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01001820 ref->flags = flags;
1821 ref->unique_id = -1;
1822
1823 LIST_INIT(&ref->head);
1824 LIST_INIT(&ref->pat);
Christopher Faulet2a944ee2017-11-07 10:42:54 +01001825 HA_SPIN_INIT(&ref->lock);
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01001826 LIST_ADDQ(&pattern_reference, &ref->list);
1827
1828 return ref;
1829}
1830
1831/* This function create new reference. <unique_id> is the unique id. If
1832 * the value of <unique_id> is -1, the unique id is calculated later.
1833 * <flags> are PAT_REF_*. /!\ The reference is not checked, and must
1834 * be unique. The user must check the reference with "pat_ref_lookup()"
1835 * or pat_ref_lookupid before calling this function. If the function
1836 * fail, it return NULL, else return new struct pat_ref.
1837 */
Thierry FOURNIER0d6ba512014-02-11 03:31:34 +01001838struct pat_ref *pat_ref_newid(int unique_id, const char *display, unsigned int flags)
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01001839{
1840 struct pat_ref *ref;
1841
1842 ref = malloc(sizeof(*ref));
1843 if (!ref)
1844 return NULL;
1845
Thierry FOURNIER0d6ba512014-02-11 03:31:34 +01001846 if (display) {
1847 ref->display = strdup(display);
1848 if (!ref->display) {
1849 free(ref);
1850 return NULL;
1851 }
1852 }
1853 else
1854 ref->display = NULL;
1855
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01001856 ref->reference = NULL;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001857 ref->flags = flags;
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01001858 ref->unique_id = unique_id;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001859 LIST_INIT(&ref->head);
1860 LIST_INIT(&ref->pat);
Aurélien Nephtali564d15a2018-04-19 16:56:07 +02001861 HA_SPIN_INIT(&ref->lock);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001862 LIST_ADDQ(&pattern_reference, &ref->list);
1863
1864 return ref;
1865}
1866
1867/* This function adds entry to <ref>. It can failed with memory error.
1868 * If the function fails, it returns 0.
1869 */
1870int pat_ref_append(struct pat_ref *ref, char *pattern, char *sample, int line)
1871{
1872 struct pat_ref_elt *elt;
1873
1874 elt = malloc(sizeof(*elt));
1875 if (!elt)
1876 return 0;
1877
1878 elt->line = line;
1879
1880 elt->pattern = strdup(pattern);
1881 if (!elt->pattern) {
1882 free(elt);
1883 return 0;
1884 }
1885
1886 if (sample) {
1887 elt->sample = strdup(sample);
1888 if (!elt->sample) {
1889 free(elt->pattern);
1890 free(elt);
1891 return 0;
1892 }
1893 }
1894 else
1895 elt->sample = NULL;
1896
Emeric Brun8d85aa42017-06-29 15:40:33 +02001897 LIST_INIT(&elt->back_refs);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001898 LIST_ADDQ(&ref->head, &elt->list);
1899
1900 return 1;
Thierry FOURNIERb1136502014-01-15 11:38:49 +01001901}
1902
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001903/* This function create sample found in <elt>, parse the pattern also
1904 * found in <elt> and insert it in <expr>. The function copy <patflags>
1905 * in <expr>. If the function fails, it returns0 and <err> is filled.
1906 * In succes case, the function returns 1.
1907 */
1908static inline
1909int pat_ref_push(struct pat_ref_elt *elt, struct pattern_expr *expr,
1910 int patflags, char **err)
1911{
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001912 struct sample_data *data;
Thierry FOURNIERd25c8422014-01-28 15:34:35 +01001913 struct pattern pattern;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001914
1915 /* Create sample */
1916 if (elt->sample && expr->pat_head->parse_smp) {
1917 /* New sample. */
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001918 data = malloc(sizeof(*data));
1919 if (!data)
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001920 return 0;
1921
1922 /* Parse value. */
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001923 if (!expr->pat_head->parse_smp(elt->sample, data)) {
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001924 memprintf(err, "unable to parse '%s'", elt->sample);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001925 free(data);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001926 return 0;
1927 }
1928
1929 }
1930 else
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001931 data = NULL;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001932
Thierry FOURNIERd25c8422014-01-28 15:34:35 +01001933 /* initialise pattern */
1934 memset(&pattern, 0, sizeof(pattern));
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001935 pattern.data = data;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +01001936 pattern.ref = elt;
Thierry FOURNIERd25c8422014-01-28 15:34:35 +01001937
1938 /* parse pattern */
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +02001939 if (!expr->pat_head->parse(elt->pattern, &pattern, expr->mflags, err)) {
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001940 free(data);
Thierry FOURNIERd25c8422014-01-28 15:34:35 +01001941 return 0;
1942 }
1943
Christopher Faulet2a944ee2017-11-07 10:42:54 +01001944 HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock);
Thierry FOURNIERd25c8422014-01-28 15:34:35 +01001945 /* index pattern */
1946 if (!expr->pat_head->index(expr, &pattern, err)) {
Christopher Faulet2a944ee2017-11-07 10:42:54 +01001947 HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock);
Thierry FOURNIER503bb092015-08-19 08:35:43 +02001948 free(data);
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001949 return 0;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001950 }
Christopher Faulet2a944ee2017-11-07 10:42:54 +01001951 HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock);
Thierry FOURNIERb9b08462013-12-13 15:12:32 +01001952
1953 return 1;
1954}
1955
Thierry FOURNIER31db4ae2014-01-30 00:27:15 +01001956/* This function adds entry to <ref>. It can failed with memory error. The new
1957 * entry is added at all the pattern_expr registered in this reference. The
1958 * function stop on the first error encountered. It returns 0 and err is
1959 * filled. If an error is encountered, the complete add operation is cancelled.
1960 * If the insertion is a success the function returns 1.
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001961 */
1962int pat_ref_add(struct pat_ref *ref,
1963 const char *pattern, const char *sample,
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +02001964 char **err)
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001965{
1966 struct pat_ref_elt *elt;
1967 struct pattern_expr *expr;
1968
1969 elt = malloc(sizeof(*elt));
1970 if (!elt) {
1971 memprintf(err, "out of memory error");
1972 return 0;
1973 }
1974
1975 elt->line = -1;
1976
1977 elt->pattern = strdup(pattern);
1978 if (!elt->pattern) {
1979 free(elt);
1980 memprintf(err, "out of memory error");
1981 return 0;
1982 }
1983
1984 if (sample) {
1985 elt->sample = strdup(sample);
1986 if (!elt->sample) {
1987 free(elt->pattern);
1988 free(elt);
1989 memprintf(err, "out of memory error");
1990 return 0;
1991 }
1992 }
1993 else
1994 elt->sample = NULL;
1995
Emeric Brun8d85aa42017-06-29 15:40:33 +02001996 LIST_INIT(&elt->back_refs);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01001997 LIST_ADDQ(&ref->head, &elt->list);
1998
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01001999 list_for_each_entry(expr, &ref->pat, list) {
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +02002000 if (!pat_ref_push(elt, expr, 0, err)) {
Thierry FOURNIER31db4ae2014-01-30 00:27:15 +01002001 /* If the insertion fails, try to delete all the added entries. */
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01002002 pat_ref_delete_by_id(ref, elt);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002003 return 0;
2004 }
2005 }
Emeric Brunb5997f72017-07-03 11:34:05 +02002006
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002007 return 1;
2008}
2009
Joseph Herlant4189d672018-11-15 10:22:31 -08002010/* This function prunes <ref>, replaces all references by the references
2011 * of <replace>, and reindexes all the news values.
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002012 *
Joseph Herlant4189d672018-11-15 10:22:31 -08002013 * The patterns are loaded in best effort and the errors are ignored,
2014 * but written in the logs.
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002015 */
2016void pat_ref_reload(struct pat_ref *ref, struct pat_ref *replace)
2017{
2018 struct pattern_expr *expr;
Emeric Brunb5997f72017-07-03 11:34:05 +02002019 struct pat_ref_elt *elt, *safe;
2020 struct bref *bref, *back;
Emeric Brunb5997f72017-07-03 11:34:05 +02002021 struct pattern pattern;
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002022
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002023
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002024 HA_SPIN_LOCK(PATREF_LOCK, &ref->lock);
Emeric Brunb5997f72017-07-03 11:34:05 +02002025 list_for_each_entry(expr, &ref->pat, list) {
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002026 HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock);
Emeric Brunb5997f72017-07-03 11:34:05 +02002027 }
2028
2029 /* all expr are locked, we can safely remove all pat_ref */
2030 list_for_each_entry_safe(elt, safe, &ref->head, list) {
2031 list_for_each_entry_safe(bref, back, &elt->back_refs, users) {
2032 /*
2033 * we have to unlink all watchers. We must not relink them if
2034 * this elt was the last one in the list.
2035 */
2036 LIST_DEL(&bref->users);
2037 LIST_INIT(&bref->users);
2038 if (elt->list.n != &ref->head)
Willy Tarreau49ee3b22019-04-30 11:43:43 +02002039 LIST_ADDQ(&LIST_ELEM(elt->list.n, typeof(elt), list)->back_refs, &bref->users);
Emeric Brunb5997f72017-07-03 11:34:05 +02002040 bref->ref = elt->list.n;
2041 }
2042 LIST_DEL(&elt->list);
2043 free(elt->pattern);
2044 free(elt->sample);
2045 free(elt);
2046 }
2047
2048 /* switch pat_ret_elt lists */
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002049 LIST_ADD(&replace->head, &ref->head);
2050 LIST_DEL(&replace->head);
2051
Emeric Brunb5997f72017-07-03 11:34:05 +02002052 list_for_each_entry(expr, &ref->pat, list) {
2053 expr->pat_head->prune(expr);
2054 list_for_each_entry(elt, &ref->head, list) {
Dragan Dosenf1474792018-09-18 20:18:09 +02002055 char *err = NULL;
2056 struct sample_data *data = NULL;
2057
Emeric Brunb5997f72017-07-03 11:34:05 +02002058 /* Create sample */
2059 if (elt->sample && expr->pat_head->parse_smp) {
2060 /* New sample. */
2061 data = malloc(sizeof(*data));
2062 if (!data)
2063 continue;
2064
2065 /* Parse value. */
2066 if (!expr->pat_head->parse_smp(elt->sample, data)) {
2067 memprintf(&err, "unable to parse '%s'", elt->sample);
2068 send_log(NULL, LOG_NOTICE, "%s", err);
2069 free(err);
2070 free(data);
2071 continue;
2072 }
2073
2074 }
Emeric Brunb5997f72017-07-03 11:34:05 +02002075
2076 /* initialise pattern */
2077 memset(&pattern, 0, sizeof(pattern));
2078 pattern.data = data;
2079 pattern.ref = elt;
2080
2081 /* parse pattern */
2082 if (!expr->pat_head->parse(elt->pattern, &pattern, expr->mflags, &err)) {
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002083 send_log(NULL, LOG_NOTICE, "%s", err);
2084 free(err);
Emeric Brunb5997f72017-07-03 11:34:05 +02002085 free(data);
2086 continue;
2087 }
2088
2089 /* index pattern */
2090 if (!expr->pat_head->index(expr, &pattern, &err)) {
2091 send_log(NULL, LOG_NOTICE, "%s", err);
2092 free(err);
2093 free(data);
2094 continue;
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002095 }
2096 }
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002097 HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock);
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002098 }
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002099 HA_SPIN_UNLOCK(PATREF_LOCK, &ref->lock);
Thierry FOURNIER46006bd2014-03-21 21:45:15 +01002100}
2101
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002102/* This function prune all entries of <ref>. This function
2103 * prune the associated pattern_expr.
2104 */
2105void pat_ref_prune(struct pat_ref *ref)
2106{
2107 struct pat_ref_elt *elt, *safe;
2108 struct pattern_expr *expr;
Emeric Brun8d85aa42017-06-29 15:40:33 +02002109 struct bref *bref, *back;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002110
Emeric Brunb5997f72017-07-03 11:34:05 +02002111 list_for_each_entry(expr, &ref->pat, list) {
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002112 HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock);
Emeric Brunb5997f72017-07-03 11:34:05 +02002113 expr->pat_head->prune(expr);
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002114 HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock);
Emeric Brunb5997f72017-07-03 11:34:05 +02002115 }
2116
2117 /* we trash pat_ref_elt in a second time to ensure that data is
2118 free once there is no ref on it */
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002119 list_for_each_entry_safe(elt, safe, &ref->head, list) {
Emeric Brun8d85aa42017-06-29 15:40:33 +02002120 list_for_each_entry_safe(bref, back, &elt->back_refs, users) {
2121 /*
2122 * we have to unlink all watchers. We must not relink them if
2123 * this elt was the last one in the list.
2124 */
2125 LIST_DEL(&bref->users);
2126 LIST_INIT(&bref->users);
2127 if (elt->list.n != &ref->head)
Willy Tarreau49ee3b22019-04-30 11:43:43 +02002128 LIST_ADDQ(&LIST_ELEM(elt->list.n, typeof(elt), list)->back_refs, &bref->users);
Emeric Brun8d85aa42017-06-29 15:40:33 +02002129 bref->ref = elt->list.n;
2130 }
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002131 LIST_DEL(&elt->list);
2132 free(elt->pattern);
2133 free(elt->sample);
2134 free(elt);
2135 }
2136
Emeric Brunb5997f72017-07-03 11:34:05 +02002137
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002138}
2139
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002140/* This function lookup for existing reference <ref> in pattern_head <head>. */
2141struct pattern_expr *pattern_lookup_expr(struct pattern_head *head, struct pat_ref *ref)
2142{
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002143 struct pattern_expr_list *expr;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002144
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002145 list_for_each_entry(expr, &head->head, list)
2146 if (expr->expr->ref == ref)
2147 return expr->expr;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002148 return NULL;
2149}
2150
Joseph Herlant4189d672018-11-15 10:22:31 -08002151/* This function creates new pattern_expr associated to the reference <ref>.
2152 * <ref> can be NULL. If an error occurs, the function returns NULL and
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002153 * <err> is filled. Otherwise, the function returns new pattern_expr linked
2154 * with <head> and <ref>.
Thierry FOURNIER315ec422014-11-24 11:14:42 +01002155 *
Joseph Herlant4189d672018-11-15 10:22:31 -08002156 * The returned value can be an already filled pattern list, in this case the
Thierry FOURNIER315ec422014-11-24 11:14:42 +01002157 * flag <reuse> is set.
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002158 */
Thierry FOURNIER315ec422014-11-24 11:14:42 +01002159struct pattern_expr *pattern_new_expr(struct pattern_head *head, struct pat_ref *ref,
Emeric Brun7d27f3c2017-07-03 17:54:23 +02002160 int patflags, char **err, int *reuse)
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002161{
2162 struct pattern_expr *expr;
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002163 struct pattern_expr_list *list;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002164
Thierry FOURNIER315ec422014-11-24 11:14:42 +01002165 if (reuse)
2166 *reuse = 0;
2167
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002168 /* Memory and initialization of the chain element. */
2169 list = malloc(sizeof(*list));
2170 if (!list) {
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002171 memprintf(err, "out of memory");
2172 return NULL;
2173 }
2174
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002175 /* Look for existing similar expr. No that only the index, parse and
2176 * parse_smp function must be identical for having similar pattern.
Joseph Herlant4189d672018-11-15 10:22:31 -08002177 * The other function depends of these first.
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002178 */
2179 if (ref) {
2180 list_for_each_entry(expr, &ref->pat, list)
2181 if (expr->pat_head->index == head->index &&
2182 expr->pat_head->parse == head->parse &&
Emeric Brun7d27f3c2017-07-03 17:54:23 +02002183 expr->pat_head->parse_smp == head->parse_smp &&
2184 expr->mflags == patflags)
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002185 break;
2186 if (&expr->list == &ref->pat)
2187 expr = NULL;
2188 }
2189 else
2190 expr = NULL;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002191
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002192 /* If no similar expr was found, we create new expr. */
2193 if (!expr) {
2194 /* Get a lot of memory for the expr struct. */
2195 expr = malloc(sizeof(*expr));
2196 if (!expr) {
Andreas Seltenreiche6e22e82016-03-03 20:20:23 +01002197 free(list);
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002198 memprintf(err, "out of memory");
2199 return NULL;
2200 }
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002201
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002202 /* Initialize this new expr. */
2203 pattern_init_expr(expr);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002204
Emeric Brun7d27f3c2017-07-03 17:54:23 +02002205 /* Copy the pattern matching and indexing flags. */
2206 expr->mflags = patflags;
2207
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002208 /* This new pattern expression reference one of his heads. */
2209 expr->pat_head = head;
2210
2211 /* Link with ref, or to self to facilitate LIST_DEL() */
2212 if (ref)
2213 LIST_ADDQ(&ref->pat, &expr->list);
2214 else
2215 LIST_INIT(&expr->list);
2216
2217 expr->ref = ref;
2218
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002219 HA_RWLOCK_INIT(&expr->lock);
Emeric Brunb5997f72017-07-03 11:34:05 +02002220
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002221 /* We must free this pattern if it is no more used. */
2222 list->do_free = 1;
2223 }
2224 else {
2225 /* If the pattern used already exists, it is already linked
2226 * with ref and we must not free it.
2227 */
2228 list->do_free = 0;
Thierry FOURNIER315ec422014-11-24 11:14:42 +01002229 if (reuse)
2230 *reuse = 1;
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002231 }
2232
2233 /* The new list element reference the pattern_expr. */
2234 list->expr = expr;
2235
2236 /* Link the list element with the pattern_head. */
2237 LIST_ADDQ(&head->head, &list->list);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002238 return expr;
2239}
2240
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002241/* Reads patterns from a file. If <err_msg> is non-NULL, an error message will
2242 * be returned there on errors and the caller will have to free it.
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002243 *
2244 * The file contains one key + value per line. Lines which start with '#' are
2245 * ignored, just like empty lines. Leading tabs/spaces are stripped. The key is
2246 * then the first "word" (series of non-space/tabs characters), and the value is
2247 * what follows this series of space/tab till the end of the line excluding
2248 * trailing spaces/tabs.
2249 *
2250 * Example :
2251 *
2252 * # this is a comment and is ignored
2253 * 62.212.114.60 1wt.eu \n
2254 * <-><-----------><---><----><---->
2255 * | | | | `--- trailing spaces ignored
2256 * | | | `-------- value
2257 * | | `--------------- middle spaces ignored
2258 * | `------------------------ key
2259 * `-------------------------------- leading spaces ignored
2260 *
2261 * Return non-zero in case of succes, otherwise 0.
2262 */
2263int pat_ref_read_from_file_smp(struct pat_ref *ref, const char *filename, char **err)
2264{
2265 FILE *file;
2266 char *c;
2267 int ret = 0;
2268 int line = 0;
2269 char *key_beg;
2270 char *key_end;
2271 char *value_beg;
2272 char *value_end;
2273
2274 file = fopen(filename, "r");
2275 if (!file) {
2276 memprintf(err, "failed to open pattern file <%s>", filename);
2277 return 0;
2278 }
2279
2280 /* now parse all patterns. The file may contain only one pattern
2281 * followed by one value per line. The start spaces, separator spaces
2282 * and and spaces are stripped. Each can contain comment started by '#'
2283 */
Willy Tarreau843b7cb2018-07-13 10:54:26 +02002284 while (fgets(trash.area, trash.size, file) != NULL) {
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002285 line++;
Willy Tarreau843b7cb2018-07-13 10:54:26 +02002286 c = trash.area;
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002287
2288 /* ignore lines beginning with a dash */
2289 if (*c == '#')
2290 continue;
2291
2292 /* strip leading spaces and tabs */
2293 while (*c == ' ' || *c == '\t')
2294 c++;
2295
2296 /* empty lines are ignored too */
2297 if (*c == '\0' || *c == '\r' || *c == '\n')
2298 continue;
2299
2300 /* look for the end of the key */
2301 key_beg = c;
2302 while (*c && *c != ' ' && *c != '\t' && *c != '\n' && *c != '\r')
2303 c++;
2304
2305 key_end = c;
2306
2307 /* strip middle spaces and tabs */
2308 while (*c == ' ' || *c == '\t')
2309 c++;
2310
2311 /* look for the end of the value, it is the end of the line */
2312 value_beg = c;
2313 while (*c && *c != '\n' && *c != '\r')
2314 c++;
2315 value_end = c;
2316
2317 /* trim possibly trailing spaces and tabs */
2318 while (value_end > value_beg && (value_end[-1] == ' ' || value_end[-1] == '\t'))
2319 value_end--;
2320
2321 /* set final \0 and check entries */
2322 *key_end = '\0';
2323 *value_end = '\0';
2324
2325 /* insert values */
2326 if (!pat_ref_append(ref, key_beg, value_beg, line)) {
2327 memprintf(err, "out of memory");
2328 goto out_close;
2329 }
2330 }
2331
Jerome Magnin3c79d4b2020-01-17 16:09:33 +01002332 if (ferror(file)) {
2333 memprintf(err, "error encountered while reading <%s> : %s",
2334 filename, strerror(errno));
2335 goto out_close;
2336 }
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002337 /* succes */
2338 ret = 1;
2339
2340 out_close:
2341 fclose(file);
2342 return ret;
2343}
2344
2345/* Reads patterns from a file. If <err_msg> is non-NULL, an error message will
2346 * be returned there on errors and the caller will have to free it.
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002347 */
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002348int pat_ref_read_from_file(struct pat_ref *ref, const char *filename, char **err)
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002349{
2350 FILE *file;
2351 char *c;
2352 char *arg;
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002353 int ret = 0;
2354 int line = 0;
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002355
2356 file = fopen(filename, "r");
2357 if (!file) {
2358 memprintf(err, "failed to open pattern file <%s>", filename);
2359 return 0;
2360 }
2361
2362 /* now parse all patterns. The file may contain only one pattern per
2363 * line. If the line contains spaces, they will be part of the pattern.
2364 * The pattern stops at the first CR, LF or EOF encountered.
2365 */
Willy Tarreau843b7cb2018-07-13 10:54:26 +02002366 while (fgets(trash.area, trash.size, file) != NULL) {
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002367 line++;
Willy Tarreau843b7cb2018-07-13 10:54:26 +02002368 c = trash.area;
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002369
2370 /* ignore lines beginning with a dash */
2371 if (*c == '#')
2372 continue;
2373
2374 /* strip leading spaces and tabs */
2375 while (*c == ' ' || *c == '\t')
2376 c++;
2377
2378
2379 arg = c;
2380 while (*c && *c != '\n' && *c != '\r')
2381 c++;
2382 *c = 0;
2383
2384 /* empty lines are ignored too */
2385 if (c == arg)
2386 continue;
2387
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002388 if (!pat_ref_append(ref, arg, NULL, line)) {
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002389 memprintf(err, "out of memory when loading patterns from file <%s>", filename);
2390 goto out_close;
2391 }
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002392 }
2393
Jerome Magnin3c79d4b2020-01-17 16:09:33 +01002394 if (ferror(file)) {
2395 memprintf(err, "error encountered while reading <%s> : %s",
2396 filename, strerror(errno));
2397 goto out_close;
2398 }
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002399 ret = 1; /* success */
2400
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002401 out_close:
2402 fclose(file);
2403 return ret;
2404}
2405
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002406int pattern_read_from_file(struct pattern_head *head, unsigned int refflags,
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002407 const char *filename, int patflags, int load_smp,
Thierry FOURNIER94580c92014-02-11 14:36:45 +01002408 char **err, const char *file, int line)
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002409{
2410 struct pat_ref *ref;
2411 struct pattern_expr *expr;
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002412 struct pat_ref_elt *elt;
Willy Tarreau4deaf392014-11-26 13:17:03 +01002413 int reuse = 0;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002414
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002415 /* Lookup for the existing reference. */
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002416 ref = pat_ref_lookup(filename);
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002417
2418 /* If the reference doesn't exists, create it and load associated file. */
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002419 if (!ref) {
Thierry FOURNIER94580c92014-02-11 14:36:45 +01002420 chunk_printf(&trash,
2421 "pattern loaded from file '%s' used by %s at file '%s' line %d",
2422 filename, refflags & PAT_REF_MAP ? "map" : "acl", file, line);
2423
Willy Tarreau843b7cb2018-07-13 10:54:26 +02002424 ref = pat_ref_new(filename, trash.area, refflags);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002425 if (!ref) {
2426 memprintf(err, "out of memory");
2427 return 0;
2428 }
2429
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002430 if (load_smp) {
Thierry FOURNIERc0bd9102014-01-29 12:32:58 +01002431 ref->flags |= PAT_REF_SMP;
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002432 if (!pat_ref_read_from_file_smp(ref, filename, err))
2433 return 0;
2434 }
2435 else {
2436 if (!pat_ref_read_from_file(ref, filename, err))
2437 return 0;
2438 }
2439 }
2440 else {
Thierry FOURNIERc0bd9102014-01-29 12:32:58 +01002441 /* The reference already exists, check the map compatibility. */
2442
2443 /* If the load require samples and the flag PAT_REF_SMP is not set,
2444 * the reference doesn't contain sample, and cannot be used.
2445 */
2446 if (load_smp) {
2447 if (!(ref->flags & PAT_REF_SMP)) {
2448 memprintf(err, "The file \"%s\" is already used as one column file "
2449 "and cannot be used by as two column file.",
2450 filename);
2451 return 0;
2452 }
2453 }
2454 else {
2455 /* The load doesn't require samples. If the flag PAT_REF_SMP is
2456 * set, the reference contains a sample, and cannot be used.
2457 */
2458 if (ref->flags & PAT_REF_SMP) {
2459 memprintf(err, "The file \"%s\" is already used as two column file "
2460 "and cannot be used by as one column file.",
2461 filename);
2462 return 0;
2463 }
2464 }
2465
Thierry FOURNIER94580c92014-02-11 14:36:45 +01002466 /* Extends display */
2467 chunk_printf(&trash, "%s", ref->display);
2468 chunk_appendf(&trash, ", by %s at file '%s' line %d",
2469 refflags & PAT_REF_MAP ? "map" : "acl", file, line);
2470 free(ref->display);
Willy Tarreau843b7cb2018-07-13 10:54:26 +02002471 ref->display = strdup(trash.area);
Thierry FOURNIER94580c92014-02-11 14:36:45 +01002472 if (!ref->display) {
2473 memprintf(err, "out of memory");
2474 return 0;
2475 }
2476
Thierry FOURNIERc0bd9102014-01-29 12:32:58 +01002477 /* Merge flags. */
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002478 ref->flags |= refflags;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002479 }
2480
2481 /* Now, we can loading patterns from the reference. */
2482
2483 /* Lookup for existing reference in the head. If the reference
2484 * doesn't exists, create it.
2485 */
2486 expr = pattern_lookup_expr(head, ref);
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +02002487 if (!expr || (expr->mflags != patflags)) {
Emeric Brun7d27f3c2017-07-03 17:54:23 +02002488 expr = pattern_new_expr(head, ref, patflags, err, &reuse);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002489 if (!expr)
2490 return 0;
2491 }
2492
Thierry FOURNIER315ec422014-11-24 11:14:42 +01002493 /* The returned expression may be not empty, because the function
2494 * "pattern_new_expr" lookup for similar pattern list and can
2495 * reuse a already filled pattern list. In this case, we can not
2496 * reload the patterns.
2497 */
2498 if (reuse)
2499 return 1;
2500
Thierry FOURNIER39bef452014-01-29 13:29:45 +01002501 /* Load reference content in the pattern expression. */
2502 list_for_each_entry(elt, &ref->head, list) {
2503 if (!pat_ref_push(elt, expr, patflags, err)) {
2504 if (elt->line > 0)
2505 memprintf(err, "%s at line %d of file '%s'",
2506 *err, elt->line, filename);
2507 return 0;
2508 }
2509 }
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002510
2511 return 1;
2512}
2513
Thierry FOURNIER1794fdf2014-01-17 15:25:13 +01002514/* This function executes a pattern match on a sample. It applies pattern <expr>
2515 * to sample <smp>. The function returns NULL if the sample dont match. It returns
2516 * non-null if the sample match. If <fill> is true and the sample match, the
2517 * function returns the matched pattern. In many cases, this pattern can be a
2518 * static buffer.
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002519 */
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002520struct pattern *pattern_exec_match(struct pattern_head *head, struct sample *smp, int fill)
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002521{
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002522 struct pattern_expr_list *list;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002523 struct pattern *pat;
2524
2525 if (!head->match) {
Thierry FOURNIER1794fdf2014-01-17 15:25:13 +01002526 if (fill) {
Thierry FOURNIER503bb092015-08-19 08:35:43 +02002527 static_pattern.data = NULL;
Thierry FOURNIER6bb53ff2014-01-28 15:54:36 +01002528 static_pattern.ref = NULL;
Thierry FOURNIERe47e4e22014-04-28 11:18:57 +02002529 static_pattern.sflags = 0;
Thierry FOURNIER07ee64e2015-07-06 23:43:03 +02002530 static_pattern.type = SMP_T_SINT;
Thierry FOURNIER5338eea2013-12-16 14:22:13 +01002531 static_pattern.val.i = 1;
Thierry FOURNIER1794fdf2014-01-17 15:25:13 +01002532 }
Thierry FOURNIER1794fdf2014-01-17 15:25:13 +01002533 return &static_pattern;
2534 }
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002535
Thierry FOURNIER5d344082014-01-27 14:19:53 +01002536 /* convert input to string */
2537 if (!sample_convert(smp, head->expect_type))
2538 return NULL;
2539
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002540 list_for_each_entry(list, &head->head, list) {
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002541 HA_RWLOCK_RDLOCK(PATEXP_LOCK, &list->expr->lock);
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002542 pat = head->match(smp, list->expr, fill);
Emeric Brunb5997f72017-07-03 11:34:05 +02002543 if (pat) {
2544 /* We duplicate the pattern cause it could be modified
2545 by another thread */
2546 if (pat != &static_pattern) {
2547 memcpy(&static_pattern, pat, sizeof(struct pattern));
2548 pat = &static_pattern;
2549 }
2550
2551 /* We also duplicate the sample data for
2552 same reason */
2553 if (pat->data && (pat->data != &static_sample_data)) {
Christopher Faulet09fdf4b2017-11-09 16:14:16 +01002554 switch(pat->data->type) {
Emeric Brunb5997f72017-07-03 11:34:05 +02002555 case SMP_T_STR:
2556 static_sample_data.type = SMP_T_STR;
2557 static_sample_data.u.str = *get_trash_chunk();
Willy Tarreau843b7cb2018-07-13 10:54:26 +02002558 static_sample_data.u.str.data = pat->data->u.str.data;
2559 if (static_sample_data.u.str.data >= static_sample_data.u.str.size)
2560 static_sample_data.u.str.data = static_sample_data.u.str.size - 1;
2561 memcpy(static_sample_data.u.str.area,
2562 pat->data->u.str.area,
2563 static_sample_data.u.str.data);
2564 static_sample_data.u.str.area[static_sample_data.u.str.data] = 0;
Emeric Brunb5997f72017-07-03 11:34:05 +02002565 case SMP_T_IPV4:
2566 case SMP_T_IPV6:
2567 case SMP_T_SINT:
2568 memcpy(&static_sample_data, pat->data, sizeof(struct sample_data));
2569 default:
2570 pat->data = NULL;
2571 }
2572 pat->data = &static_sample_data;
2573 }
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002574 HA_RWLOCK_RDUNLOCK(PATEXP_LOCK, &list->expr->lock);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002575 return pat;
Emeric Brunb5997f72017-07-03 11:34:05 +02002576 }
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002577 HA_RWLOCK_RDUNLOCK(PATEXP_LOCK, &list->expr->lock);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002578 }
2579 return NULL;
Thierry FOURNIERed66c292013-11-28 11:05:19 +01002580}
2581
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01002582/* This function prune the pattern expression. */
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002583void pattern_prune(struct pattern_head *head)
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01002584{
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002585 struct pattern_expr_list *list, *safe;
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002586
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002587 list_for_each_entry_safe(list, safe, &head->head, list) {
2588 LIST_DEL(&list->list);
2589 if (list->do_free) {
2590 LIST_DEL(&list->expr->list);
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002591 HA_RWLOCK_WRLOCK(PATEXP_LOCK, &list->expr->lock);
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002592 head->prune(list->expr);
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002593 HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &list->expr->lock);
Thierry FOURNIERc5959fd2014-01-20 14:29:33 +01002594 free(list->expr);
2595 }
2596 free(list);
Thierry FOURNIER1e00d382014-02-11 11:31:40 +01002597 }
Thierry FOURNIER6f7203d2014-01-14 16:24:51 +01002598}
2599
Thierry FOURNIER55d0b102014-01-15 11:25:26 +01002600/* This function lookup for a pattern matching the <key> and return a
2601 * pointer to a pointer of the sample stoarge. If the <key> dont match,
2602 * the function returns NULL. If the key cannot be parsed, the function
2603 * fill <err>.
2604 */
Thierry FOURNIER12ba0c22015-08-14 00:02:11 +02002605struct sample_data **pattern_find_smp(struct pattern_expr *expr, struct pat_ref_elt *ref)
Thierry FOURNIER55d0b102014-01-15 11:25:26 +01002606{
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01002607 struct ebmb_node *node;
2608 struct pattern_tree *elt;
2609 struct pattern_list *pat;
Thierry FOURNIER55d0b102014-01-15 11:25:26 +01002610
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01002611 for (node = ebmb_first(&expr->pattern_tree);
2612 node;
2613 node = ebmb_next(node)) {
2614 elt = container_of(node, struct pattern_tree, node);
2615 if (elt->ref == ref)
Thierry FOURNIER503bb092015-08-19 08:35:43 +02002616 return &elt->data;
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01002617 }
2618
2619 for (node = ebmb_first(&expr->pattern_tree_2);
2620 node;
2621 node = ebmb_next(node)) {
2622 elt = container_of(node, struct pattern_tree, node);
2623 if (elt->ref == ref)
Thierry FOURNIER503bb092015-08-19 08:35:43 +02002624 return &elt->data;
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01002625 }
2626
2627 list_for_each_entry(pat, &expr->patterns, list)
2628 if (pat->pat.ref == ref)
Thierry FOURNIER503bb092015-08-19 08:35:43 +02002629 return &pat->pat.data;
Thierry FOURNIERe369ca22014-01-29 16:24:55 +01002630
2631 return NULL;
Thierry FOURNIER55d0b102014-01-15 11:25:26 +01002632}
2633
Thierry FOURNIERb1136502014-01-15 11:38:49 +01002634/* This function search all the pattern matching the <key> and delete it.
2635 * If the parsing of the input key fails, the function returns 0 and the
2636 * <err> is filled, else return 1;
2637 */
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01002638int pattern_delete(struct pattern_expr *expr, struct pat_ref_elt *ref)
Thierry FOURNIERb1136502014-01-15 11:38:49 +01002639{
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002640 HA_RWLOCK_WRLOCK(PATEXP_LOCK, &expr->lock);
Thierry FOURNIER7acca4b2014-01-28 16:43:36 +01002641 expr->pat_head->delete(expr, ref);
Christopher Faulet2a944ee2017-11-07 10:42:54 +01002642 HA_RWLOCK_WRUNLOCK(PATEXP_LOCK, &expr->lock);
Thierry FOURNIERb1136502014-01-15 11:38:49 +01002643 return 1;
2644}
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002645
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002646/* This function compares two pat_ref** on unique_id */
2647static int cmp_pat_ref(const void *_a, const void *_b)
2648{
2649 struct pat_ref * const *a = _a;
2650 struct pat_ref * const *b = _b;
2651
2652 if ((*a)->unique_id < (*b)->unique_id)
2653 return -1;
2654 else if ((*a)->unique_id > (*b)->unique_id)
2655 return 1;
2656 return 0;
2657}
2658
2659/* This function finalize the configuration parsing. It sets all the
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002660 * automatic ids
2661 */
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002662int pattern_finalize_config(void)
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002663{
Tim Duesterhusb584b442020-03-17 21:08:24 +01002664 size_t len = 0;
2665 size_t unassigned_pos = 0;
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002666 int next_unique_id = 0;
Tim Duesterhusb584b442020-03-17 21:08:24 +01002667 size_t i, j;
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002668 struct pat_ref *ref, **arr;
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002669 struct list pr = LIST_HEAD_INIT(pr);
2670
Willy Tarreau52bf8392020-03-08 00:42:37 +01002671 pat_lru_seed = ha_random();
Willy Tarreauf3045d22015-04-29 16:24:50 +02002672
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002673 /* Count pat_refs with user defined unique_id and totalt count */
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002674 list_for_each_entry(ref, &pattern_reference, list) {
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002675 len++;
2676 if (ref->unique_id != -1)
2677 unassigned_pos++;
2678 }
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002679
Tim Duesterhusb584b442020-03-17 21:08:24 +01002680 if (len == 0) {
2681 return 0;
2682 }
2683
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002684 arr = calloc(len, sizeof(*arr));
2685 if (arr == NULL) {
2686 ha_alert("Out of memory error.\n");
2687 return ERR_ALERT | ERR_FATAL;
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002688 }
2689
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002690 i = 0;
2691 j = unassigned_pos;
2692 list_for_each_entry(ref, &pattern_reference, list) {
2693 if (ref->unique_id != -1)
2694 arr[i++] = ref;
2695 else
2696 arr[j++] = ref;
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002697 }
2698
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002699 /* Sort first segment of array with user-defined unique ids for
2700 * fast lookup when generating unique ids
2701 */
2702 qsort(arr, unassigned_pos, sizeof(*arr), cmp_pat_ref);
2703
2704 /* Assign unique ids to the rest of the elements */
2705 for (i = unassigned_pos; i < len; i++) {
2706 do {
2707 arr[i]->unique_id = next_unique_id++;
2708 } while (bsearch(&arr[i], arr, unassigned_pos, sizeof(*arr), cmp_pat_ref));
2709 }
2710
2711 /* Sort complete array */
2712 qsort(arr, len, sizeof(*arr), cmp_pat_ref);
2713
2714 /* Convert back to linked list */
2715 for (i = 0; i < len; i++)
2716 LIST_ADDQ(&pr, &arr[i]->list);
2717
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002718 /* swap root */
2719 LIST_ADD(&pr, &pattern_reference);
2720 LIST_DEL(&pr);
Carl Henrik Lundef91ac192020-02-27 16:45:50 +01002721
2722 free(arr);
2723 return 0;
Thierry FOURNIERaf5a29d2014-03-11 14:29:22 +01002724}
Willy Tarreau403bfbb2019-10-23 06:59:31 +02002725
2726static int pattern_per_thread_lru_alloc()
2727{
2728 if (!global.tune.pattern_cache)
2729 return 1;
2730 pat_lru_tree = lru64_new(global.tune.pattern_cache);
2731 return !!pat_lru_tree;
2732}
2733
2734static void pattern_per_thread_lru_free()
2735{
2736 lru64_destroy(pat_lru_tree);
2737}
2738
2739REGISTER_PER_THREAD_ALLOC(pattern_per_thread_lru_alloc);
2740REGISTER_PER_THREAD_FREE(pattern_per_thread_lru_free);