Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 1 | /* |
| 2 | * Buffer management functions. |
| 3 | * |
| 4 | * Copyright 2000-2012 Willy Tarreau <w@1wt.eu> |
| 5 | * |
| 6 | * This program is free software; you can redistribute it and/or |
| 7 | * modify it under the terms of the GNU General Public License |
| 8 | * as published by the Free Software Foundation; either version |
| 9 | * 2 of the License, or (at your option) any later version. |
| 10 | * |
| 11 | */ |
| 12 | |
William Lallemand | be0efd8 | 2012-11-22 18:01:40 +0100 | [diff] [blame] | 13 | #include <ctype.h> |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 14 | #include <stdio.h> |
| 15 | #include <string.h> |
| 16 | |
| 17 | #include <common/config.h> |
| 18 | #include <common/buffer.h> |
Willy Tarreau | 9b28e03 | 2012-10-12 23:49:43 +0200 | [diff] [blame] | 19 | #include <common/memory.h> |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 20 | |
| 21 | #include <types/global.h> |
| 22 | |
/* Pool from which buffers are allocated. It is created by init_buffer() with
 * an element size of sizeof(struct buffer) + global.tune.bufsize and destroyed
 * by deinit_buffer().
 */
struct pool_head *pool2_buffer;

/* These buffers are used to always have a valid pointer to an empty buffer in
 * channels. The first buffer is set once a buffer is empty. The second one is
 * set when a buffer is desired but no more are available. It helps knowing
 * what channel wants a buffer. They can reliably be exchanged, the split
 * between the two is only an optimization.
 */
struct buffer buf_empty = { .p = buf_empty.data };
struct buffer buf_wanted = { .p = buf_wanted.data };

/* list of objects waiting for at least one buffer */
struct list buffer_wq = LIST_HEAD_INIT(buffer_wq);
#ifdef USE_THREAD
/* Lock initialized by init_buffer(); presumably protects <buffer_wq>, but no
 * lock/unlock call is visible in this file - confirm against the callers.
 */
HA_SPINLOCK_T buffer_wq_lock;
#endif

/* this buffer is always the same size as standard buffers and is used for
 * swapping data inside a buffer. It is allocated by init_buffer_per_thread(),
 * released by deinit_buffer_per_thread() and used by buffer_slow_realign().
 */
static THREAD_LOCAL char *swap_buffer = NULL;
| 44 | |
| 45 | static int init_buffer_per_thread() |
| 46 | { |
| 47 | swap_buffer = calloc(1, global.tune.bufsize); |
| 48 | if (swap_buffer == NULL) |
| 49 | return 0; |
| 50 | return 1; |
| 51 | } |
| 52 | |
| 53 | static void deinit_buffer_per_thread() |
| 54 | { |
| 55 | free(swap_buffer); swap_buffer = NULL; |
| 56 | } |
Christopher Faulet | ad405f1 | 2017-08-29 15:30:11 +0200 | [diff] [blame] | 57 | |
Willy Tarreau | 9b28e03 | 2012-10-12 23:49:43 +0200 | [diff] [blame] | 58 | /* perform minimal intializations, report 0 in case of error, 1 if OK. */ |
| 59 | int init_buffer() |
| 60 | { |
Willy Tarreau | a24adf0 | 2014-11-27 01:11:56 +0100 | [diff] [blame] | 61 | void *buffer; |
| 62 | |
Willy Tarreau | 484b53d | 2016-01-25 02:23:25 +0100 | [diff] [blame] | 63 | pool2_buffer = create_pool("buffer", sizeof (struct buffer) + global.tune.bufsize, MEM_F_SHARED|MEM_F_EXACT); |
Willy Tarreau | a24adf0 | 2014-11-27 01:11:56 +0100 | [diff] [blame] | 64 | if (!pool2_buffer) |
| 65 | return 0; |
| 66 | |
| 67 | /* The reserved buffer is what we leave behind us. Thus we always need |
| 68 | * at least one extra buffer in minavail otherwise we'll end up waking |
| 69 | * up tasks with no memory available, causing a lot of useless wakeups. |
| 70 | * That means that we always want to have at least 3 buffers available |
| 71 | * (2 for current session, one for next session that might be needed to |
| 72 | * release a server connection). |
| 73 | */ |
| 74 | pool2_buffer->minavail = MAX(global.tune.reserved_bufs, 3); |
Willy Tarreau | 33cb065 | 2014-12-23 22:52:37 +0100 | [diff] [blame] | 75 | if (global.tune.buf_limit) |
| 76 | pool2_buffer->limit = global.tune.buf_limit; |
Willy Tarreau | a24adf0 | 2014-11-27 01:11:56 +0100 | [diff] [blame] | 77 | |
Emeric Brun | a1dd243 | 2017-06-21 15:42:52 +0200 | [diff] [blame] | 78 | SPIN_INIT(&buffer_wq_lock); |
| 79 | |
Willy Tarreau | a24adf0 | 2014-11-27 01:11:56 +0100 | [diff] [blame] | 80 | buffer = pool_refill_alloc(pool2_buffer, pool2_buffer->minavail - 1); |
| 81 | if (!buffer) |
| 82 | return 0; |
| 83 | |
| 84 | pool_free2(pool2_buffer, buffer); |
Christopher Faulet | ad405f1 | 2017-08-29 15:30:11 +0200 | [diff] [blame] | 85 | |
Christopher Faulet | ba39f23 | 2017-08-29 14:43:04 +0200 | [diff] [blame] | 86 | if (global.nbthread > 1) { |
| 87 | hap_register_per_thread_init(init_buffer_per_thread); |
| 88 | hap_register_per_thread_deinit(deinit_buffer_per_thread); |
| 89 | } |
| 90 | else if (!init_buffer_per_thread()) |
| 91 | return 0; |
Christopher Faulet | ad405f1 | 2017-08-29 15:30:11 +0200 | [diff] [blame] | 92 | |
Willy Tarreau | a24adf0 | 2014-11-27 01:11:56 +0100 | [diff] [blame] | 93 | return 1; |
Willy Tarreau | 9b28e03 | 2012-10-12 23:49:43 +0200 | [diff] [blame] | 94 | } |
| 95 | |
/* Releases what init_buffer() allocated: first the swap buffer as seen from
 * the calling thread, then the whole buffer pool.
 */
void deinit_buffer()
{
	deinit_buffer_per_thread();
	pool_destroy2(pool2_buffer);
}
| 101 | |
Willy Tarreau | af81935 | 2012-08-27 22:08:00 +0200 | [diff] [blame] | 102 | /* This function writes the string <str> at position <pos> which must be in |
| 103 | * buffer <b>, and moves <end> just after the end of <str>. <b>'s parameters |
| 104 | * <l> and <r> are updated to be valid after the shift. The shift value |
| 105 | * (positive or negative) is returned. If there's no space left, the move is |
| 106 | * not done. The function does not adjust ->o because it does not make sense to |
| 107 | * use it on data scheduled to be sent. For the same reason, it does not make |
| 108 | * sense to call this function on unparsed data, so <orig> is not updated. The |
| 109 | * string length is taken from parameter <len>. If <len> is null, the <str> |
| 110 | * pointer is allowed to be null. |
| 111 | */ |
| 112 | int buffer_replace2(struct buffer *b, char *pos, char *end, const char *str, int len) |
| 113 | { |
| 114 | int delta; |
| 115 | |
| 116 | delta = len - (end - pos); |
| 117 | |
Thierry FOURNIER | fdda677 | 2015-03-10 01:55:01 +0100 | [diff] [blame] | 118 | if (bi_end(b) + delta > b->data + b->size) |
Willy Tarreau | af81935 | 2012-08-27 22:08:00 +0200 | [diff] [blame] | 119 | return 0; /* no space left */ |
| 120 | |
| 121 | if (buffer_not_empty(b) && |
| 122 | bi_end(b) + delta > bo_ptr(b) && |
| 123 | bo_ptr(b) >= bi_end(b)) |
| 124 | return 0; /* no space left before wrapping data */ |
| 125 | |
| 126 | /* first, protect the end of the buffer */ |
| 127 | memmove(end + delta, end, bi_end(b) - end); |
| 128 | |
| 129 | /* now, copy str over pos */ |
| 130 | if (len) |
| 131 | memcpy(pos, str, len); |
| 132 | |
| 133 | b->i += delta; |
| 134 | |
Willy Tarreau | 5fb3803 | 2012-12-16 19:39:09 +0100 | [diff] [blame] | 135 | if (buffer_empty(b)) |
Willy Tarreau | af81935 | 2012-08-27 22:08:00 +0200 | [diff] [blame] | 136 | b->p = b->data; |
| 137 | |
| 138 | return delta; |
| 139 | } |
| 140 | |
| 141 | /* |
| 142 | * Inserts <str> followed by "\r\n" at position <pos> in buffer <b>. The <len> |
| 143 | * argument informs about the length of string <str> so that we don't have to |
| 144 | * measure it. It does not include the "\r\n". If <str> is NULL, then the buffer |
| 145 | * is only opened for len+2 bytes but nothing is copied in. It may be useful in |
| 146 | * some circumstances. The send limit is *not* adjusted. Same comments as above |
| 147 | * for the valid use cases. |
| 148 | * |
| 149 | * The number of bytes added is returned on success. 0 is returned on failure. |
| 150 | */ |
| 151 | int buffer_insert_line2(struct buffer *b, char *pos, const char *str, int len) |
| 152 | { |
| 153 | int delta; |
| 154 | |
| 155 | delta = len + 2; |
| 156 | |
| 157 | if (bi_end(b) + delta >= b->data + b->size) |
| 158 | return 0; /* no space left */ |
| 159 | |
Godbach | a6547c1 | 2014-10-31 13:16:37 +0800 | [diff] [blame] | 160 | if (buffer_not_empty(b) && |
| 161 | bi_end(b) + delta > bo_ptr(b) && |
| 162 | bo_ptr(b) >= bi_end(b)) |
| 163 | return 0; /* no space left before wrapping data */ |
| 164 | |
Willy Tarreau | af81935 | 2012-08-27 22:08:00 +0200 | [diff] [blame] | 165 | /* first, protect the end of the buffer */ |
| 166 | memmove(pos + delta, pos, bi_end(b) - pos); |
| 167 | |
| 168 | /* now, copy str over pos */ |
| 169 | if (len && str) { |
| 170 | memcpy(pos, str, len); |
| 171 | pos[len] = '\r'; |
| 172 | pos[len + 1] = '\n'; |
| 173 | } |
| 174 | |
| 175 | b->i += delta; |
| 176 | return delta; |
| 177 | } |
| 178 | |
Willy Tarreau | 27187ab | 2015-07-02 12:50:23 +0200 | [diff] [blame] | 179 | /* This function realigns a possibly wrapping buffer so that the input part is |
| 180 | * contiguous and starts at the beginning of the buffer and the output part |
| 181 | * ends at the end of the buffer. This provides the best conditions since it |
| 182 | * allows the largest inputs to be processed at once and ensures that once the |
| 183 | * output data leaves, the whole buffer is available at once. |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 184 | */ |
| 185 | void buffer_slow_realign(struct buffer *buf) |
| 186 | { |
Willy Tarreau | 27187ab | 2015-07-02 12:50:23 +0200 | [diff] [blame] | 187 | int block1 = buf->o; |
| 188 | int block2 = 0; |
| 189 | |
| 190 | /* process output data in two steps to cover wrapping */ |
| 191 | if (block1 > buf->p - buf->data) { |
| 192 | block2 = buf->p - buf->data; |
| 193 | block1 -= block2; |
| 194 | } |
| 195 | memcpy(swap_buffer + buf->size - buf->o, bo_ptr(buf), block1); |
| 196 | memcpy(swap_buffer + buf->size - block2, buf->data, block2); |
| 197 | |
| 198 | /* process input data in two steps to cover wrapping */ |
| 199 | block1 = buf->i; |
| 200 | block2 = 0; |
| 201 | |
| 202 | if (block1 > buf->data + buf->size - buf->p) { |
| 203 | block1 = buf->data + buf->size - buf->p; |
| 204 | block2 = buf->i - block1; |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 205 | } |
Willy Tarreau | 27187ab | 2015-07-02 12:50:23 +0200 | [diff] [blame] | 206 | memcpy(swap_buffer, bi_ptr(buf), block1); |
| 207 | memcpy(swap_buffer + block1, buf->data, block2); |
| 208 | |
| 209 | /* reinject changes into the buffer */ |
| 210 | memcpy(buf->data, swap_buffer, buf->i); |
| 211 | memcpy(buf->data + buf->size - buf->o, swap_buffer + buf->size - buf->o, buf->o); |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 212 | |
| 213 | buf->p = buf->data; |
| 214 | } |
| 215 | |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 216 | /* |
| 217 | * Dumps part or all of a buffer. |
| 218 | */ |
| 219 | void buffer_dump(FILE *o, struct buffer *b, int from, int to) |
| 220 | { |
| 221 | fprintf(o, "Dumping buffer %p\n", b); |
William Lallemand | be0efd8 | 2012-11-22 18:01:40 +0100 | [diff] [blame] | 222 | fprintf(o, " data=%p o=%d i=%d p=%p\n" |
| 223 | " relative: p=0x%04x\n", |
| 224 | b->data, b->o, b->i, b->p, (unsigned int)(b->p - b->data)); |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 225 | |
| 226 | fprintf(o, "Dumping contents from byte %d to byte %d\n", from, to); |
William Lallemand | be0efd8 | 2012-11-22 18:01:40 +0100 | [diff] [blame] | 227 | fprintf(o, " 0 1 2 3 4 5 6 7 8 9 a b c d e f\n"); |
| 228 | /* dump hexa */ |
| 229 | while (from < to) { |
| 230 | int i; |
| 231 | |
| 232 | fprintf(o, " %04x: ", from); |
| 233 | for (i = 0; ((from + i) < to) && (i < 16) ; i++) { |
| 234 | fprintf(o, "%02x ", (unsigned char)b->data[from + i]); |
| 235 | if (((from + i) & 15) == 7) |
| 236 | fprintf(o, "- "); |
| 237 | } |
Godbach | c08057c | 2013-11-14 10:15:20 +0800 | [diff] [blame] | 238 | if (to - from < 16) { |
Godbach | c3916a7 | 2013-11-21 10:21:22 +0800 | [diff] [blame] | 239 | int j = 0; |
| 240 | |
Godbach | c08057c | 2013-11-14 10:15:20 +0800 | [diff] [blame] | 241 | for (j = 0; j < from + 16 - to; j++) |
| 242 | fprintf(o, " "); |
Godbach | c3916a7 | 2013-11-21 10:21:22 +0800 | [diff] [blame] | 243 | if (j > 8) |
| 244 | fprintf(o, " "); |
Godbach | c08057c | 2013-11-14 10:15:20 +0800 | [diff] [blame] | 245 | } |
William Lallemand | be0efd8 | 2012-11-22 18:01:40 +0100 | [diff] [blame] | 246 | fprintf(o, " "); |
| 247 | for (i = 0; (from + i < to) && (i < 16) ; i++) { |
Willy Tarreau | 95898ac | 2012-11-26 00:57:40 +0100 | [diff] [blame] | 248 | fprintf(o, "%c", isprint((int)b->data[from + i]) ? b->data[from + i] : '.') ; |
William Lallemand | be0efd8 | 2012-11-22 18:01:40 +0100 | [diff] [blame] | 249 | if ((((from + i) & 15) == 15) && ((from + i) != to-1)) |
| 250 | fprintf(o, "\n"); |
| 251 | } |
| 252 | from += i; |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 253 | } |
| 254 | fprintf(o, "\n--\n"); |
William Lallemand | be0efd8 | 2012-11-22 18:01:40 +0100 | [diff] [blame] | 255 | fflush(o); |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 256 | } |
| 257 | |
Christopher Faulet | a73e59b | 2016-12-09 17:30:18 +0100 | [diff] [blame] | 258 | void __offer_buffer(void *from, unsigned int threshold) |
| 259 | { |
| 260 | struct buffer_wait *wait, *bak; |
| 261 | int avail; |
| 262 | |
| 263 | /* For now, we consider that all objects need 1 buffer, so we can stop |
| 264 | * waking up them once we have enough of them to eat all the available |
| 265 | * buffers. Note that we don't really know if they are streams or just |
| 266 | * other tasks, but that's a rough estimate. Similarly, for each cached |
| 267 | * event we'll need 1 buffer. If no buffer is currently used, always |
| 268 | * wake up the number of tasks we can offer a buffer based on what is |
| 269 | * allocated, and in any case at least one task per two reserved |
| 270 | * buffers. |
| 271 | */ |
| 272 | avail = pool2_buffer->allocated - pool2_buffer->used - global.tune.reserved_bufs / 2; |
| 273 | |
| 274 | list_for_each_entry_safe(wait, bak, &buffer_wq, list) { |
| 275 | if (avail <= threshold) |
| 276 | break; |
| 277 | |
| 278 | if (wait->target == from || !wait->wakeup_cb(wait->target)) |
| 279 | continue; |
| 280 | |
| 281 | LIST_DEL(&wait->list); |
| 282 | LIST_INIT(&wait->list); |
| 283 | |
| 284 | avail--; |
| 285 | } |
| 286 | } |
Willy Tarreau | c7e4238 | 2012-08-24 19:22:53 +0200 | [diff] [blame] | 287 | |
| 288 | /* |
| 289 | * Local variables: |
| 290 | * c-indent-level: 8 |
| 291 | * c-basic-offset: 8 |
| 292 | * End: |
| 293 | */ |