Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 1 | /* |
Willy Tarreau | 24f4efa | 2010-08-27 17:56:48 +0200 | [diff] [blame] | 2 | * include/proto/task.h |
| 3 | * Functions for task management. |
| 4 | * |
| 5 | * Copyright (C) 2000-2010 Willy Tarreau - w@1wt.eu |
| 6 | * |
| 7 | * This library is free software; you can redistribute it and/or |
| 8 | * modify it under the terms of the GNU Lesser General Public |
| 9 | * License as published by the Free Software Foundation, version 2.1 |
| 10 | * exclusively. |
| 11 | * |
| 12 | * This library is distributed in the hope that it will be useful, |
| 13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 15 | * Lesser General Public License for more details. |
| 16 | * |
| 17 | * You should have received a copy of the GNU Lesser General Public |
| 18 | * License along with this library; if not, write to the Free Software |
| 19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| 20 | */ |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 21 | |
| 22 | #ifndef _PROTO_TASK_H |
| 23 | #define _PROTO_TASK_H |
| 24 | |
| 25 | |
| 26 | #include <sys/time.h> |
Willy Tarreau | e3ba5f0 | 2006-06-29 18:54:54 +0200 | [diff] [blame] | 27 | |
| 28 | #include <common/config.h> |
Willy Tarreau | 2dd0d47 | 2006-06-29 17:53:05 +0200 | [diff] [blame] | 29 | #include <common/memory.h> |
Willy Tarreau | 96bcfd7 | 2007-04-29 10:41:56 +0200 | [diff] [blame] | 30 | #include <common/mini-clist.h> |
| 31 | #include <common/standard.h> |
Willy Tarreau | d0a201b | 2009-03-08 15:53:06 +0100 | [diff] [blame] | 32 | #include <common/ticks.h> |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 33 | #include <common/hathreads.h> |
| 34 | |
Willy Tarreau | 8d38805 | 2017-11-05 13:34:20 +0100 | [diff] [blame] | 35 | #include <eb32sctree.h> |
Willy Tarreau | 45cb4fb | 2009-10-26 21:10:04 +0100 | [diff] [blame] | 36 | #include <eb32tree.h> |
Willy Tarreau | 96bcfd7 | 2007-04-29 10:41:56 +0200 | [diff] [blame] | 37 | |
Willy Tarreau | eb11889 | 2014-11-13 16:57:19 +0100 | [diff] [blame] | 38 | #include <types/global.h> |
Willy Tarreau | e3ba5f0 | 2006-06-29 18:54:54 +0200 | [diff] [blame] | 39 | #include <types/task.h> |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 40 | |
Willy Tarreau | d0a201b | 2009-03-08 15:53:06 +0100 | [diff] [blame] | 41 | /* Principle of the wait queue. |
| 42 | * |
| 43 | * We want to be able to tell whether an expiration date is before or after the |
| 44 | * current time <now>. We KNOW that expiration dates are never too far apart, |
| 45 | * because they are measured in ticks (milliseconds). We also know that almost |
| 46 | * all dates will be in the future, and that a very small part of them will be |
| 47 | * in the past, they are the ones which have expired since last time we checked |
| 48 | * them. Using ticks, we know if a date is in the future or in the past, but we |
| 49 | * cannot use that to store sorted information because that reference changes |
| 50 | * all the time. |
| 51 | * |
Willy Tarreau | e35c94a | 2009-03-21 10:01:42 +0100 | [diff] [blame] | 52 | * We'll use the fact that the time wraps to sort timers. Timers above <now> |
| 53 | * are in the future, timers below <now> are in the past. Here, "above" and |
| 54 | * "below" are to be considered modulo 2^31. |
Willy Tarreau | d0a201b | 2009-03-08 15:53:06 +0100 | [diff] [blame] | 55 | * |
Willy Tarreau | e35c94a | 2009-03-21 10:01:42 +0100 | [diff] [blame] | 56 | * Timers are stored sorted in an ebtree. We use the new ability for ebtrees to |
| 57 | * lookup values starting from X to only expire tasks between <now> - 2^31 and |
| 58 | * <now>. If the end of the tree is reached while walking over it, we simply |
| 59 | * loop back to the beginning. That way, we have no problem keeping sorted |
| 60 | * wrapping timers in a tree, between (now - 24 days) and (now + 24 days). The |
| 61 | * keys in the tree always reflect their real position, none can be infinite. |
| 62 | * This reduces the number of checks to be performed. |
Willy Tarreau | d0a201b | 2009-03-08 15:53:06 +0100 | [diff] [blame] | 63 | * |
| 64 | * Another nice optimisation is to allow a timer to stay at an old place in the |
| 65 | * queue as long as it's not further than the real expiration date. That way, |
| 66 | * we use the tree as a place holder for a minorant of the real expiration |
| 67 | * date. Since we have a very low chance of hitting a timeout anyway, we can |
| 68 | * bounce the nodes to their right place when we scan the tree if we encounter |
| 69 | * a misplaced node once in a while. This even allows us not to remove the |
| 70 | * infinite timers from the wait queue. |
| 71 | * |
| 72 | * So, to summarize, we have : |
| 73 | * - node->key always defines current position in the wait queue |
| 74 | * - timer is the real expiration date (possibly infinite) |
Willy Tarreau | e35c94a | 2009-03-21 10:01:42 +0100 | [diff] [blame] | 75 | * - node->key is always before or equal to timer |
Willy Tarreau | d0a201b | 2009-03-08 15:53:06 +0100 | [diff] [blame] | 76 | * |
| 77 | * The run queue works similarly to the wait queue except that the current date |
| 78 | * is replaced by an insertion counter which can also wrap without any problem. |
| 79 | */ |
| 80 | |
Willy Tarreau | e35c94a | 2009-03-21 10:01:42 +0100 | [diff] [blame] | 81 | /* The farthest we can look back in a timer tree: 2^31 ticks, which is the <now> - 2^31 expiry window described in the wait queue principle above */ |
| 82 | #define TIMER_LOOK_BACK (1U << 31) |
Willy Tarreau | d0a201b | 2009-03-08 15:53:06 +0100 | [diff] [blame] | 83 | |
| 84 | /* a few exported variables (declared here, defined elsewhere) */ |
Willy Tarreau | a461318 | 2009-03-21 18:13:21 +0100 | [diff] [blame] | 85 | extern unsigned int nb_tasks; /* total number of tasks */ |
Olivier Houchard | 9b03c0c | 2018-07-26 18:45:22 +0200 | [diff] [blame] | 86 | extern volatile unsigned long active_tasks_mask; /* Mask of threads with active tasks */ |
Christopher Faulet | 34c5cc9 | 2016-12-06 09:15:30 +0100 | [diff] [blame] | 87 | extern unsigned int tasks_run_queue; /* run queue size */ |
| 88 | extern unsigned int tasks_run_queue_cur; /* NOTE(review): presumably a snapshot of tasks_run_queue - confirm in the defining file */ |
Willy Tarreau | c7bdf09 | 2009-03-21 18:33:52 +0100 | [diff] [blame] | 89 | extern unsigned int nb_tasks_cur; /* NOTE(review): presumably a snapshot of nb_tasks - confirm in the defining file */ |
Willy Tarreau | 91e9993 | 2008-06-30 07:51:00 +0200 | [diff] [blame] | 90 | extern unsigned int niced_tasks; /* number of niced tasks in the run queue */ |
Willy Tarreau | bafbe01 | 2017-11-24 17:34:44 +0100 | [diff] [blame] | 91 | extern struct pool_head *pool_head_task; /* pool used by task_new() and __task_free() */ |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 92 | extern struct pool_head *pool_head_tasklet; /* pool used by tasklet_new() and tasklet_free() */ |
Willy Tarreau | bafbe01 | 2017-11-24 17:34:44 +0100 | [diff] [blame] | 93 | extern struct pool_head *pool_head_notification; /* pool used by notification_new() and notification_purge() */ |
Olivier Houchard | 9b36cb4 | 2018-05-04 15:46:16 +0200 | [diff] [blame] | 94 | extern THREAD_LOCAL struct task *curr_task; /* task currently running or NULL */ |
| 95 | extern THREAD_LOCAL struct eb32sc_node *rq_next; /* Next task to be potentially run */ |
Olivier Houchard | b1ca58b | 2018-06-06 14:22:03 +0200 | [diff] [blame] | 96 | #ifdef USE_THREAD |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 97 | extern struct eb_root timers; /* sorted timers tree, global */ |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 98 | extern struct eb_root rqueue; /* tree constituting the global run queue */ |
Olivier Houchard | 77551ee | 2018-07-26 15:59:38 +0200 | [diff] [blame] | 99 | extern int global_rqueue_size; /* Number of elements in the global runqueue */ |
Olivier Houchard | b1ca58b | 2018-06-06 14:22:03 +0200 | [diff] [blame] | 100 | #endif |
Olivier Houchard | 77551ee | 2018-07-26 15:59:38 +0200 | [diff] [blame] | 101 | |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 102 | /* Per-thread scheduler state. Forced to split per-thread stuff into separate cache lines. */ |
| 103 | struct task_per_thread { |
| 104 | struct eb_root timers; /* tree constituting the per-thread wait queue */ |
| 105 | struct eb_root rqueue; /* tree constituting the per-thread run queue */ |
| 106 | struct list task_list; /* List of tasks to be run, mixing tasks and tasklets */ |
| 107 | int task_list_size; /* Number of tasks in the task_list */ |
| 108 | int rqueue_size; /* Number of elements in the per-thread run queue */ |
| 109 | __attribute__((aligned(64))) char end[0]; /* zero-sized, 64-byte aligned tail: pads the struct size to a multiple of 64 bytes */ |
| 110 | }; |
| 111 | |
| 112 | extern struct task_per_thread task_per_thread[MAX_THREADS]; /* one entry per thread, indexed by <tid> in this file */ |
Christopher Faulet | 9dcf9b6 | 2017-11-13 10:34:01 +0100 | [diff] [blame] | 113 | |
| 114 | __decl_hathreads(extern HA_SPINLOCK_T rq_lock); /* spin lock related to run queue; taken by task_unlink_rq() for tasks not bound to the current thread only */ |
| 115 | __decl_hathreads(extern HA_SPINLOCK_T wq_lock); /* spin lock related to wait queue; taken around accesses to the global <timers> tree */ |
Willy Tarreau | c6ca1a0 | 2007-05-13 19:43:47 +0200 | [diff] [blame] | 116 | |
Olivier Houchard | 5d18718 | 2018-08-01 15:58:44 +0200 | [diff] [blame] | 117 | |
| 118 | static inline void task_insert_into_tasklet_list(struct task *t); /* forward declaration: tasklet_wakeup() calls it before its definition below */ |
| 119 | |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 120 | /* return 0 if task is in run queue, otherwise non-zero */ |
| 121 | static inline int task_in_rq(struct task *t) |
| 122 | { |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 123 | /* Check if leaf_p is NULL, in case he's not in the runqueue, and if |
| 124 | * it's not 0x1, which would mean it's in the tasklet list. |
| 125 | */ |
| 126 | return t->rq.node.leaf_p != NULL && t->rq.node.leaf_p != (void *)0x1; |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 127 | } |
| 128 | |
| 129 | /* return 0 if task is in wait queue, otherwise non-zero */ |
| 130 | static inline int task_in_wq(struct task *t) |
| 131 | { |
| 132 | return t->wq.node.leaf_p != NULL; |
| 133 | } |
| 134 | |
Willy Tarreau | fdccded | 2008-08-29 18:19:04 +0200 | [diff] [blame] | 135 | /* puts the task <t> in run queue with reason flags <f>, and returns <t> */ |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 136 | /* This will put the task in the local runqueue if the task is only runnable |
| 137 | * by the current thread, in the global runqueue otherwies. |
| 138 | */ |
| 139 | void __task_wakeup(struct task *t, struct eb_root *); |
| 140 | static inline void task_wakeup(struct task *t, unsigned int f) |
Willy Tarreau | 4df8206 | 2008-08-29 15:26:14 +0200 | [diff] [blame] | 141 | { |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 142 | unsigned short state; |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 143 | |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 144 | #ifdef USE_THREAD |
| 145 | struct eb_root *root; |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 146 | |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 147 | if (t->thread_mask == tid_bit || global.nbthread == 1) |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 148 | root = &task_per_thread[tid].rqueue; |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 149 | else |
| 150 | root = &rqueue; |
| 151 | #else |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 152 | struct eb_root *root = &task_per_thread[tid].rqueue; |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 153 | #endif |
| 154 | |
| 155 | state = HA_ATOMIC_OR(&t->state, f); |
| 156 | if (!(state & TASK_RUNNING)) |
| 157 | __task_wakeup(t, root); |
Willy Tarreau | 4df8206 | 2008-08-29 15:26:14 +0200 | [diff] [blame] | 158 | } |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 159 | |
Willy Tarreau | f65610a | 2017-10-31 16:06:06 +0100 | [diff] [blame] | 160 | /* change the thread affinity of a task to <thread_mask> */ |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 161 | static inline void task_set_affinity(struct task *t, unsigned long thread_mask) |
| 162 | { |
Willy Tarreau | f65610a | 2017-10-31 16:06:06 +0100 | [diff] [blame] | 163 | t->thread_mask = thread_mask; |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 164 | } |
Willy Tarreau | f65610a | 2017-10-31 16:06:06 +0100 | [diff] [blame] | 165 | |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 166 | /* |
| 167 | * Unlink the task from the wait queue, and possibly update the last_timer |
| 168 | * pointer. A pointer to the task itself is returned. The task *must* already |
| 169 | * be in the wait queue before calling this function. If unsure, use the safer |
| 170 | * task_unlink_wq() function. |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 171 | */ |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 172 | static inline struct task *__task_unlink_wq(struct task *t) |
| 173 | { |
| 174 | eb32_delete(&t->wq); |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 175 | return t; |
| 176 | } |
| 177 | |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 178 | /* remove a task from its wait queue. It may either be the local wait queue if |
| 179 | * the task is bound to a single thread (in which case there's no locking |
| 180 | * involved) or the global queue, with locking. |
| 181 | */ |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 182 | static inline struct task *task_unlink_wq(struct task *t) |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 183 | { |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 184 | if (likely(task_in_wq(t))) { |
| 185 | if (atleast2(t->thread_mask)) |
| 186 | HA_SPIN_LOCK(TASK_WQ_LOCK, &wq_lock); |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 187 | __task_unlink_wq(t); |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 188 | if (atleast2(t->thread_mask)) |
| 189 | HA_SPIN_UNLOCK(TASK_WQ_LOCK, &wq_lock); |
| 190 | } |
Willy Tarreau | 96bcfd7 | 2007-04-29 10:41:56 +0200 | [diff] [blame] | 191 | return t; |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 192 | } |
| 193 | |
| 194 | /* |
Christopher Faulet | 34c5cc9 | 2016-12-06 09:15:30 +0100 | [diff] [blame] | 195 | * Unlink the task from the run queue. The tasks_run_queue size and number of |
| 196 | * niced tasks are updated too. A pointer to the task itself is returned. The |
| 197 | * task *must* already be in the run queue before calling this function. If |
| 198 | * unsure, use the safer task_unlink_rq() function. Note that the pointer to the |
| 199 | * next run queue entry is neither checked nor updated. |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 200 | */ |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 201 | static inline struct task *__task_unlink_rq(struct task *t) |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 202 | { |
Olivier Houchard | 09eeb76 | 2018-05-28 13:51:06 +0200 | [diff] [blame] | 203 | HA_ATOMIC_SUB(&tasks_run_queue, 1); |
Olivier Houchard | 77551ee | 2018-07-26 15:59:38 +0200 | [diff] [blame] | 204 | #ifdef USE_THREAD |
| 205 | if (t->state & TASK_GLOBAL) { |
Olivier Houchard | 76e4518 | 2018-07-26 16:19:58 +0200 | [diff] [blame] | 206 | HA_ATOMIC_AND(&t->state, ~TASK_GLOBAL); |
Olivier Houchard | 77551ee | 2018-07-26 15:59:38 +0200 | [diff] [blame] | 207 | global_rqueue_size--; |
| 208 | } else |
| 209 | #endif |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 210 | task_per_thread[tid].rqueue_size--; |
Olivier Houchard | 77551ee | 2018-07-26 15:59:38 +0200 | [diff] [blame] | 211 | eb32sc_delete(&t->rq); |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 212 | if (likely(t->nice)) |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 213 | HA_ATOMIC_SUB(&niced_tasks, 1); |
Willy Tarreau | ce44f12 | 2008-07-05 18:16:19 +0200 | [diff] [blame] | 214 | return t; |
| 215 | } |
Willy Tarreau | 9789f7b | 2008-06-24 08:17:16 +0200 | [diff] [blame] | 216 | |
Willy Tarreau | 501260b | 2015-02-23 16:07:01 +0100 | [diff] [blame] | 217 | /* This function unlinks task <t> from the run queue if it is in it. It also |
| 218 | * takes care of updating the next run queue task if it was this task. |
| 219 | */ |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 220 | static inline struct task *task_unlink_rq(struct task *t) |
| 221 | { |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 222 | if (t->thread_mask != tid_bit) |
| 223 | HA_SPIN_LOCK(TASK_RQ_LOCK, &rq_lock); |
Olivier Houchard | 9b36cb4 | 2018-05-04 15:46:16 +0200 | [diff] [blame] | 224 | if (likely(task_in_rq(t))) { |
| 225 | if (&t->rq == rq_next) |
| 226 | rq_next = eb32sc_next(rq_next, tid_bit); |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 227 | __task_unlink_rq(t); |
Olivier Houchard | 9b36cb4 | 2018-05-04 15:46:16 +0200 | [diff] [blame] | 228 | } |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 229 | if (t->thread_mask != tid_bit) |
| 230 | HA_SPIN_UNLOCK(TASK_RQ_LOCK, &rq_lock); |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 231 | return t; |
| 232 | } |
| 233 | |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 234 | static inline void tasklet_wakeup(struct tasklet *tl) |
| 235 | { |
Olivier Houchard | 5d18718 | 2018-08-01 15:58:44 +0200 | [diff] [blame] | 236 | if (!TASK_IS_TASKLET(tl)) { |
| 237 | task_insert_into_tasklet_list((struct task *)tl); |
| 238 | return; |
| 239 | } |
Olivier Houchard | e17c2d3 | 2018-07-17 18:29:22 +0200 | [diff] [blame] | 240 | if (!LIST_ISEMPTY(&tl->list)) |
| 241 | return; |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 242 | LIST_ADDQ(&task_per_thread[tid].task_list, &tl->list); |
| 243 | task_per_thread[tid].task_list_size++; |
Olivier Houchard | abedf5f | 2018-08-17 18:57:51 +0200 | [diff] [blame] | 244 | HA_ATOMIC_OR(&active_tasks_mask, tid_bit); |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 245 | HA_ATOMIC_ADD(&tasks_run_queue, 1); |
| 246 | |
| 247 | } |
| 248 | |
| 249 | static inline void task_insert_into_tasklet_list(struct task *t) |
| 250 | { |
| 251 | struct tasklet *tl; |
| 252 | void *expected = NULL; |
| 253 | |
| 254 | /* Protect ourself against anybody trying to insert the task into |
| 255 | * another runqueue. We set leaf_p to 0x1 to indicate that the node is |
| 256 | * not in a tree but that it's in the tasklet list. See task_in_rq(). |
| 257 | */ |
David Carlier | caa8a37 | 2018-06-01 14:32:39 +0200 | [diff] [blame] | 258 | if (unlikely(!HA_ATOMIC_CAS(&t->rq.node.leaf_p, &expected, (void *)0x1))) |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 259 | return; |
Olivier Houchard | 09eeb76 | 2018-05-28 13:51:06 +0200 | [diff] [blame] | 260 | HA_ATOMIC_ADD(&tasks_run_queue, 1); |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 261 | task_per_thread[tid].task_list_size++; |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 262 | tl = (struct tasklet *)t; |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 263 | LIST_ADDQ(&task_per_thread[tid].task_list, &tl->list); |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 264 | } |
| 265 | |
| 266 | static inline void task_remove_from_task_list(struct task *t) |
| 267 | { |
| 268 | LIST_DEL(&((struct tasklet *)t)->list); |
Olivier Houchard | dcd6f3a | 2018-06-08 17:08:19 +0200 | [diff] [blame] | 269 | LIST_INIT(&((struct tasklet *)t)->list); |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 270 | task_per_thread[tid].task_list_size--; |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 271 | HA_ATOMIC_SUB(&tasks_run_queue, 1); |
| 272 | if (!TASK_IS_TASKLET(t)) { |
| 273 | t->rq.node.leaf_p = NULL; // was 0x1 |
| 274 | __ha_barrier_store(); |
| 275 | } |
| 276 | } |
| 277 | |
/*
 * Unlinks task <t> from the wait queue first, then from the run queue, using
 * the safe variants which check whether the task is queued. Run queue stats
 * are adjusted by task_unlink_rq(). A pointer to the task itself is returned.
 */
static inline struct task *task_delete(struct task *t)
{
	return task_unlink_rq(task_unlink_wq(t));
}
| 288 | |
| 289 | /* |
Willy Tarreau | a461318 | 2009-03-21 18:13:21 +0100 | [diff] [blame] | 290 | * Initialize a new task. The bare minimum is performed (queue pointers and |
| 291 | * state). The task is returned. This function should not be used outside of |
| 292 | * task_new(). |
Willy Tarreau | 9789f7b | 2008-06-24 08:17:16 +0200 | [diff] [blame] | 293 | */ |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 294 | static inline struct task *task_init(struct task *t, unsigned long thread_mask) |
Willy Tarreau | 9789f7b | 2008-06-24 08:17:16 +0200 | [diff] [blame] | 295 | { |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 296 | t->wq.node.leaf_p = NULL; |
| 297 | t->rq.node.leaf_p = NULL; |
Olivier Houchard | f6e6dc1 | 2018-05-18 18:38:23 +0200 | [diff] [blame] | 298 | t->state = TASK_SLEEPING; |
Willy Tarreau | f65610a | 2017-10-31 16:06:06 +0100 | [diff] [blame] | 299 | t->thread_mask = thread_mask; |
Willy Tarreau | 91e9993 | 2008-06-30 07:51:00 +0200 | [diff] [blame] | 300 | t->nice = 0; |
Willy Tarreau | 3884cba | 2009-03-28 17:54:35 +0100 | [diff] [blame] | 301 | t->calls = 0; |
Willy Tarreau | f421999 | 2017-07-24 17:52:58 +0200 | [diff] [blame] | 302 | t->expire = TICK_ETERNITY; |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 303 | return t; |
| 304 | } |
| 305 | |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 306 | static inline void tasklet_init(struct tasklet *t) |
| 307 | { |
| 308 | t->nice = -32768; |
| 309 | t->calls = 0; |
| 310 | t->state = 0; |
Olivier Houchard | 9ddaf79 | 2018-07-19 16:02:16 +0200 | [diff] [blame] | 311 | t->process = NULL; |
Olivier Houchard | dcd6f3a | 2018-06-08 17:08:19 +0200 | [diff] [blame] | 312 | LIST_INIT(&t->list); |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 313 | } |
| 314 | |
| 315 | static inline struct tasklet *tasklet_new(void) |
| 316 | { |
| 317 | struct tasklet *t = pool_alloc(pool_head_tasklet); |
| 318 | |
| 319 | if (t) { |
| 320 | tasklet_init(t); |
| 321 | } |
| 322 | return t; |
| 323 | } |
| 324 | |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 325 | /* |
Willy Tarreau | a461318 | 2009-03-21 18:13:21 +0100 | [diff] [blame] | 326 | * Allocate and initialise a new task. The new task is returned, or NULL in |
| 327 | * case of lack of memory. The task count is incremented. Tasks should only |
| 328 | * be allocated this way, and must be freed using task_free(). |
| 329 | */ |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 330 | static inline struct task *task_new(unsigned long thread_mask) |
Willy Tarreau | a461318 | 2009-03-21 18:13:21 +0100 | [diff] [blame] | 331 | { |
Willy Tarreau | bafbe01 | 2017-11-24 17:34:44 +0100 | [diff] [blame] | 332 | struct task *t = pool_alloc(pool_head_task); |
Willy Tarreau | a461318 | 2009-03-21 18:13:21 +0100 | [diff] [blame] | 333 | if (t) { |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 334 | HA_ATOMIC_ADD(&nb_tasks, 1); |
| 335 | task_init(t, thread_mask); |
Willy Tarreau | a461318 | 2009-03-21 18:13:21 +0100 | [diff] [blame] | 336 | } |
| 337 | return t; |
| 338 | } |
| 339 | |
| 340 | /* |
| 341 | * Free a task. Its context must have been freed since it will be lost. |
| 342 | * The task count is decremented. |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 343 | */ |
Olivier Houchard | 9b36cb4 | 2018-05-04 15:46:16 +0200 | [diff] [blame] | 344 | static inline void __task_free(struct task *t) |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 345 | { |
Willy Tarreau | bafbe01 | 2017-11-24 17:34:44 +0100 | [diff] [blame] | 346 | pool_free(pool_head_task, t); |
Willy Tarreau | eb11889 | 2014-11-13 16:57:19 +0100 | [diff] [blame] | 347 | if (unlikely(stopping)) |
Willy Tarreau | bafbe01 | 2017-11-24 17:34:44 +0100 | [diff] [blame] | 348 | pool_flush(pool_head_task); |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 349 | HA_ATOMIC_SUB(&nb_tasks, 1); |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 350 | } |
| 351 | |
Olivier Houchard | 9b36cb4 | 2018-05-04 15:46:16 +0200 | [diff] [blame] | 352 | static inline void task_free(struct task *t) |
| 353 | { |
| 354 | /* There's no need to protect t->state with a lock, as the task |
| 355 | * has to run on the current thread. |
| 356 | */ |
| 357 | if (t == curr_task || !(t->state & TASK_RUNNING)) |
| 358 | __task_free(t); |
| 359 | else |
| 360 | t->process = NULL; |
| 361 | } |
| 362 | |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 363 | static inline void tasklet_free(struct tasklet *tl) |
| 364 | { |
Olivier Houchard | 931624a | 2018-09-12 14:55:03 +0200 | [diff] [blame] | 365 | if (!LIST_ISEMPTY(&tl->list)) |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 366 | task_per_thread[tid].task_list_size--; |
Olivier Houchard | dcd6f3a | 2018-06-08 17:08:19 +0200 | [diff] [blame] | 367 | LIST_DEL(&tl->list); |
| 368 | |
Olivier Houchard | b0bdae7 | 2018-05-18 18:45:28 +0200 | [diff] [blame] | 369 | pool_free(pool_head_tasklet, tl); |
| 370 | if (unlikely(stopping)) |
| 371 | pool_flush(pool_head_tasklet); |
| 372 | } |
| 373 | |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 374 | void __task_queue(struct task *task, struct eb_root *wq); |
| 375 | |
Willy Tarreau | 4726f53 | 2009-03-07 17:25:21 +0100 | [diff] [blame] | 376 | /* Place <task> into the wait queue, where it may already be. If the expiration |
Willy Tarreau | 531cf0c | 2009-03-08 16:35:27 +0100 | [diff] [blame] | 377 | * timer is infinite, do nothing and rely on wake_expired_task to clean up. |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 378 | * If the task is bound to a single thread, it's assumed to be bound to the |
| 379 | * current thread's queue and is queued without locking. Otherwise it's queued |
| 380 | * into the global wait queue, protected by locks. |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 381 | */ |
Willy Tarreau | 531cf0c | 2009-03-08 16:35:27 +0100 | [diff] [blame] | 382 | static inline void task_queue(struct task *task) |
| 383 | { |
| 384 | /* If we already have a place in the wait queue no later than the |
| 385 | * timeout we're trying to set, we'll stay there, because it is very |
| 386 | * unlikely that we will reach the timeout anyway. If the timeout |
| 387 | * has been disabled, it's useless to leave the queue as well. We'll |
| 388 | * rely on wake_expired_tasks() to catch the node and move it to the |
| 389 | * proper place should it ever happen. Finally we only add the task |
| 390 | * to the queue if it was not there or if it was further than what |
| 391 | * we want. |
| 392 | */ |
| 393 | if (!tick_isset(task->expire)) |
| 394 | return; |
| 395 | |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 396 | #ifdef USE_THREAD |
| 397 | if (atleast2(task->thread_mask)) { |
| 398 | HA_SPIN_LOCK(TASK_WQ_LOCK, &wq_lock); |
| 399 | if (!task_in_wq(task) || tick_is_lt(task->expire, task->wq.key)) |
| 400 | __task_queue(task, &timers); |
| 401 | HA_SPIN_UNLOCK(TASK_WQ_LOCK, &wq_lock); |
| 402 | } else |
| 403 | #endif |
| 404 | { |
| 405 | if (!task_in_wq(task) || tick_is_lt(task->expire, task->wq.key)) |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 406 | __task_queue(task, &task_per_thread[tid].timers); |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 407 | } |
Willy Tarreau | 531cf0c | 2009-03-08 16:35:27 +0100 | [diff] [blame] | 408 | } |
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 409 | |
Willy Tarreau | 26e4881 | 2011-07-25 14:30:42 +0200 | [diff] [blame] | 410 | /* Ensure <task> will be woken up at most at <when>. If the task is already in |
| 411 | * the run queue (but not running), nothing is done. It may be used that way |
| 412 | * with a delay : task_schedule(task, tick_add(now_ms, delay)); |
| 413 | */ |
| 414 | static inline void task_schedule(struct task *task, int when) |
| 415 | { |
Emeric Brun | c60def8 | 2017-09-27 14:59:38 +0200 | [diff] [blame] | 416 | /* TODO: mthread, check if there is no tisk with this test */ |
Willy Tarreau | 26e4881 | 2011-07-25 14:30:42 +0200 | [diff] [blame] | 417 | if (task_in_rq(task)) |
| 418 | return; |
| 419 | |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 420 | #ifdef USE_THREAD |
| 421 | if (atleast2(task->thread_mask)) { |
| 422 | HA_SPIN_LOCK(TASK_WQ_LOCK, &wq_lock); |
| 423 | if (task_in_wq(task)) |
| 424 | when = tick_first(when, task->expire); |
| 425 | |
| 426 | task->expire = when; |
| 427 | if (!task_in_wq(task) || tick_is_lt(task->expire, task->wq.key)) |
| 428 | __task_queue(task, &timers); |
| 429 | HA_SPIN_UNLOCK(TASK_WQ_LOCK, &wq_lock); |
| 430 | } else |
| 431 | #endif |
| 432 | { |
| 433 | if (task_in_wq(task)) |
| 434 | when = tick_first(when, task->expire); |
Willy Tarreau | 26e4881 | 2011-07-25 14:30:42 +0200 | [diff] [blame] | 435 | |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 436 | task->expire = when; |
| 437 | if (!task_in_wq(task) || tick_is_lt(task->expire, task->wq.key)) |
Willy Tarreau | 8d8747a | 2018-10-15 16:12:48 +0200 | [diff] [blame] | 438 | __task_queue(task, &task_per_thread[tid].timers); |
Willy Tarreau | b20aa9e | 2018-10-15 14:52:21 +0200 | [diff] [blame] | 439 | } |
Willy Tarreau | 26e4881 | 2011-07-25 14:30:42 +0200 | [diff] [blame] | 440 | } |
| 441 | |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 442 | /* This function register a new signal. "lua" is the current lua |
| 443 | * execution context. It contains a pointer to the associated task. |
| 444 | * "link" is a list head attached to an other task that must be wake |
| 445 | * the lua task if an event occurs. This is useful with external |
| 446 | * events like TCP I/O or sleep functions. This funcion allocate |
| 447 | * memory for the signal. |
| 448 | */ |
| 449 | static inline struct notification *notification_new(struct list *purge, struct list *event, struct task *wakeup) |
| 450 | { |
Willy Tarreau | bafbe01 | 2017-11-24 17:34:44 +0100 | [diff] [blame] | 451 | struct notification *com = pool_alloc(pool_head_notification); |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 452 | if (!com) |
| 453 | return NULL; |
| 454 | LIST_ADDQ(purge, &com->purge_me); |
| 455 | LIST_ADDQ(event, &com->wake_me); |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 456 | HA_SPIN_INIT(&com->lock); |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 457 | com->task = wakeup; |
| 458 | return com; |
| 459 | } |
| 460 | |
| 461 | /* This function purge all the pending signals when the LUA execution |
| 462 | * is finished. This prevent than a coprocess try to wake a deleted |
| 463 | * task. This function remove the memory associated to the signal. |
Thierry FOURNIER | d5b7983 | 2017-12-10 17:14:07 +0100 | [diff] [blame] | 464 | * The purge list is not locked because it is owned by only one |
| 465 | * process. before browsing this list, the caller must ensure to be |
| 466 | * the only one browser. |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 467 | */ |
| 468 | static inline void notification_purge(struct list *purge) |
| 469 | { |
| 470 | struct notification *com, *back; |
| 471 | |
| 472 | /* Delete all pending communication signals. */ |
| 473 | list_for_each_entry_safe(com, back, purge, purge_me) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 474 | HA_SPIN_LOCK(NOTIF_LOCK, &com->lock); |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 475 | LIST_DEL(&com->purge_me); |
Thierry FOURNIER | 738a6d7 | 2017-07-17 00:14:07 +0200 | [diff] [blame] | 476 | if (!com->task) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 477 | HA_SPIN_UNLOCK(NOTIF_LOCK, &com->lock); |
Willy Tarreau | bafbe01 | 2017-11-24 17:34:44 +0100 | [diff] [blame] | 478 | pool_free(pool_head_notification, com); |
Thierry FOURNIER | 738a6d7 | 2017-07-17 00:14:07 +0200 | [diff] [blame] | 479 | continue; |
| 480 | } |
| 481 | com->task = NULL; |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 482 | HA_SPIN_UNLOCK(NOTIF_LOCK, &com->lock); |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 483 | } |
| 484 | } |
| 485 | |
Thierry FOURNIER | cb14688 | 2017-12-10 17:10:57 +0100 | [diff] [blame] | 486 | /* In some cases, the disconnected notifications must be cleared. |
| 487 | * This function just release memory blocs. The purge list is not |
| 488 | * locked because it is owned by only one process. Before browsing |
| 489 | * this list, the caller must ensure to be the only one browser. |
| 490 | * The "com" is not locked because when com->task is NULL, the |
| 491 | * notification is no longer used. |
| 492 | */ |
| 493 | static inline void notification_gc(struct list *purge) |
| 494 | { |
| 495 | struct notification *com, *back; |
| 496 | |
| 497 | /* Delete all pending communication signals. */ |
| 498 | list_for_each_entry_safe (com, back, purge, purge_me) { |
| 499 | if (com->task) |
| 500 | continue; |
| 501 | LIST_DEL(&com->purge_me); |
| 502 | pool_free(pool_head_notification, com); |
| 503 | } |
| 504 | } |
| 505 | |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 506 | /* This function sends signals. It wakes all the tasks attached |
| 507 | * to a list head, and remove the signal, and free the used |
Thierry FOURNIER | d5b7983 | 2017-12-10 17:14:07 +0100 | [diff] [blame] | 508 | * memory. The wake list is not locked because it is owned by |
| 509 | * only one process. before browsing this list, the caller must |
| 510 | * ensure to be the only one browser. |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 511 | */ |
| 512 | static inline void notification_wake(struct list *wake) |
| 513 | { |
| 514 | struct notification *com, *back; |
| 515 | |
| 516 | /* Wake task and delete all pending communication signals. */ |
| 517 | list_for_each_entry_safe(com, back, wake, wake_me) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 518 | HA_SPIN_LOCK(NOTIF_LOCK, &com->lock); |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 519 | LIST_DEL(&com->wake_me); |
Thierry FOURNIER | 738a6d7 | 2017-07-17 00:14:07 +0200 | [diff] [blame] | 520 | if (!com->task) { |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 521 | HA_SPIN_UNLOCK(NOTIF_LOCK, &com->lock); |
Willy Tarreau | bafbe01 | 2017-11-24 17:34:44 +0100 | [diff] [blame] | 522 | pool_free(pool_head_notification, com); |
Thierry FOURNIER | 738a6d7 | 2017-07-17 00:14:07 +0200 | [diff] [blame] | 523 | continue; |
| 524 | } |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 525 | task_wakeup(com->task, TASK_WOKEN_MSG); |
Thierry FOURNIER | 738a6d7 | 2017-07-17 00:14:07 +0200 | [diff] [blame] | 526 | com->task = NULL; |
Christopher Faulet | 2a944ee | 2017-11-07 10:42:54 +0100 | [diff] [blame] | 527 | HA_SPIN_UNLOCK(NOTIF_LOCK, &com->lock); |
Thierry FOURNIER | d697596 | 2017-07-12 14:31:10 +0200 | [diff] [blame] | 528 | } |
| 529 | } |
| 530 | |
/* Returns 1 if some notifications are pending, that is if the <wake> list
 * is not empty, otherwise 0.
 */
static inline int notification_registered(struct list *wake)
{
	if (LIST_ISEMPTY(wake))
		return 0;
	return 1;
}
| 537 | |
/*
 * Calls the runnable tasks. Takes no argument and returns nothing.
 *
 * NOTE(review): the historical comment here listed three actions (wake up
 * all expired tasks, call all runnable tasks, return the date of the next
 * event in <next> or eternity). This prototype returns void and has no
 * <next> argument, and expiry handling is declared separately as
 * wake_expired_tasks(), so only the second item is kept above; confirm
 * against the implementation.
 *
 * Declared with an explicit (void) so that the compiler rejects calls made
 * with arguments; an empty () leaves the parameters unspecified in C.
 */
void process_runnable_tasks(void);
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 546 | |
/*
 * Extracts all expired timers from the timer queue and wakes up all the
 * associated tasks. Returns the date of the next event (or eternity).
 * Declared with an explicit (void) so that the compiler rejects calls made
 * with arguments; an empty () leaves the parameters unspecified in C.
 */
int wake_expired_tasks(void);
Willy Tarreau | 58b458d | 2008-06-29 22:40:23 +0200 | [diff] [blame] | 552 | |
/* Performs minimal initializations. Reports 0 in case of error, 1 if OK.
 * Declared with an explicit (void) so that the compiler rejects calls made
 * with arguments; an empty () leaves the parameters unspecified in C.
 */
int init_task(void);
Willy Tarreau | baaee00 | 2006-06-26 02:48:02 +0200 | [diff] [blame] | 555 | |
| 556 | #endif /* _PROTO_TASK_H */ |
| 557 | |
| 558 | /* |
| 559 | * Local variables: |
| 560 | * c-indent-level: 8 |
| 561 | * c-basic-offset: 8 |
| 562 | * End: |
| 563 | */ |