blob: c5e0f89d61932abeabf1f1001707b8dcc382b4de [file] [log] [blame]
Willy Tarreauf89c1872009-10-01 11:19:37 +02001/*
2 * Map-based load-balancing (RR and HASH)
3 *
4 * Copyright 2000-2009 Willy Tarreau <w@1wt.eu>
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 */
12
Willy Tarreau4c7e4b72020-05-27 12:58:42 +020013#include <haproxy/api.h>
Willy Tarreau8d2b7772020-05-27 10:58:19 +020014#include <import/eb32tree.h>
Willy Tarreauf89c1872009-10-01 11:19:37 +020015
Willy Tarreauf89c1872009-10-01 11:19:37 +020016#include <types/server.h>
17
18#include <proto/backend.h>
Christopher Faulet5b517552017-06-09 14:17:53 +020019#include <proto/lb_map.h>
Willy Tarreauf89c1872009-10-01 11:19:37 +020020#include <proto/queue.h>
21
Willy Tarreau1b877482018-08-21 19:44:53 +020022/* this function updates the map according to server <srv>'s new state.
23 *
24 * The server's lock must be held. The lbprm's lock will be used.
25 */
Willy Tarreauf89c1872009-10-01 11:19:37 +020026static void map_set_server_status_down(struct server *srv)
27{
28 struct proxy *p = srv->proxy;
29
Willy Tarreauc5150da2014-05-13 19:27:31 +020030 if (!srv_lb_status_changed(srv))
Willy Tarreauf89c1872009-10-01 11:19:37 +020031 return;
32
Emeric Brun52a91d32017-08-31 14:41:55 +020033 if (srv_willbe_usable(srv))
Willy Tarreauf89c1872009-10-01 11:19:37 +020034 goto out_update_state;
35
36 /* FIXME: could be optimized since we know what changed */
Willy Tarreau1b877482018-08-21 19:44:53 +020037 HA_SPIN_LOCK(LBPRM_LOCK, &p->lbprm.lock);
Willy Tarreauf89c1872009-10-01 11:19:37 +020038 recount_servers(p);
39 update_backend_weight(p);
Christopher Faulet5b517552017-06-09 14:17:53 +020040 recalc_server_map(p);
Willy Tarreau1b877482018-08-21 19:44:53 +020041 HA_SPIN_UNLOCK(LBPRM_LOCK, &p->lbprm.lock);
Willy Tarreauf89c1872009-10-01 11:19:37 +020042 out_update_state:
Willy Tarreauc5150da2014-05-13 19:27:31 +020043 srv_lb_commit_status(srv);
Willy Tarreauf89c1872009-10-01 11:19:37 +020044}
45
Willy Tarreau1b877482018-08-21 19:44:53 +020046/* This function updates the map according to server <srv>'s new state.
47 *
48 * The server's lock must be held. The lbprm's lock will be used.
49 */
Willy Tarreauf89c1872009-10-01 11:19:37 +020050static void map_set_server_status_up(struct server *srv)
51{
52 struct proxy *p = srv->proxy;
53
Willy Tarreauc5150da2014-05-13 19:27:31 +020054 if (!srv_lb_status_changed(srv))
Willy Tarreauf89c1872009-10-01 11:19:37 +020055 return;
56
Emeric Brun52a91d32017-08-31 14:41:55 +020057 if (!srv_willbe_usable(srv))
Willy Tarreauf89c1872009-10-01 11:19:37 +020058 goto out_update_state;
59
60 /* FIXME: could be optimized since we know what changed */
Willy Tarreau1b877482018-08-21 19:44:53 +020061 HA_SPIN_LOCK(LBPRM_LOCK, &p->lbprm.lock);
Willy Tarreauf89c1872009-10-01 11:19:37 +020062 recount_servers(p);
63 update_backend_weight(p);
Christopher Faulet5b517552017-06-09 14:17:53 +020064 recalc_server_map(p);
Willy Tarreau1b877482018-08-21 19:44:53 +020065 HA_SPIN_UNLOCK(LBPRM_LOCK, &p->lbprm.lock);
Willy Tarreauf89c1872009-10-01 11:19:37 +020066 out_update_state:
Willy Tarreauc5150da2014-05-13 19:27:31 +020067 srv_lb_commit_status(srv);
Willy Tarreauf89c1872009-10-01 11:19:37 +020068}
69
70/* This function recomputes the server map for proxy px. It relies on
71 * px->lbprm.tot_wact, tot_wbck, tot_used, tot_weight, so it must be
72 * called after recount_servers(). It also expects px->lbprm.map.srv
73 * to be allocated with the largest size needed. It updates tot_weight.
Willy Tarreau1b877482018-08-21 19:44:53 +020074 *
75 * The lbprm's lock must be held.
Willy Tarreauf89c1872009-10-01 11:19:37 +020076 */
77void recalc_server_map(struct proxy *px)
78{
79 int o, tot, flag;
80 struct server *cur, *best;
81
82 switch (px->lbprm.tot_used) {
83 case 0: /* no server */
Willy Tarreauf89c1872009-10-01 11:19:37 +020084 return;
Willy Tarreauf89c1872009-10-01 11:19:37 +020085 default:
86 tot = px->lbprm.tot_weight;
87 break;
88 }
89
90 /* here we *know* that we have some servers */
91 if (px->srv_act)
Willy Tarreauc93cd162014-05-13 15:54:22 +020092 flag = 0;
Willy Tarreauf89c1872009-10-01 11:19:37 +020093 else
Willy Tarreauc93cd162014-05-13 15:54:22 +020094 flag = SRV_F_BACKUP;
Willy Tarreauf89c1872009-10-01 11:19:37 +020095
96 /* this algorithm gives priority to the first server, which means that
97 * it will respect the declaration order for equivalent weights, and
98 * that whatever the weights, the first server called will always be
Ilya Shipitsin6fb0f212020-04-02 15:25:26 +050099 * the first declared. This is an important assumption for the backup
Willy Tarreauf89c1872009-10-01 11:19:37 +0200100 * case, where we want the first server only.
101 */
102 for (cur = px->srv; cur; cur = cur->next)
103 cur->wscore = 0;
104
105 for (o = 0; o < tot; o++) {
106 int max = 0;
107 best = NULL;
108 for (cur = px->srv; cur; cur = cur->next) {
Willy Tarreau9943d312014-05-22 16:20:59 +0200109 if ((cur->flags & SRV_F_BACKUP) == flag &&
Emeric Brun52a91d32017-08-31 14:41:55 +0200110 srv_willbe_usable(cur)) {
Willy Tarreauf89c1872009-10-01 11:19:37 +0200111 int v;
112
113 /* If we are forced to return only one server, we don't want to
114 * go further, because we would return the wrong one due to
115 * divide overflow.
116 */
117 if (tot == 1) {
118 best = cur;
119 /* note that best->wscore will be wrong but we don't care */
120 break;
121 }
122
Olivier Houchard36a8e6f2019-03-08 18:52:46 +0100123 _HA_ATOMIC_ADD(&cur->wscore, cur->next_eweight);
Willy Tarreauf89c1872009-10-01 11:19:37 +0200124 v = (cur->wscore + tot) / tot; /* result between 0 and 3 */
125 if (best == NULL || v > max) {
126 max = v;
127 best = cur;
128 }
129 }
130 }
131 px->lbprm.map.srv[o] = best;
Willy Tarreauc8b476d2018-12-02 19:22:55 +0100132 if (best)
Olivier Houchard36a8e6f2019-03-08 18:52:46 +0100133 _HA_ATOMIC_SUB(&best->wscore, tot);
Willy Tarreauf89c1872009-10-01 11:19:37 +0200134 }
Willy Tarreauf89c1872009-10-01 11:19:37 +0200135}
136
137/* This function is responsible of building the server MAP for map-based LB
138 * algorithms, allocating the map, and setting p->lbprm.wmult to the GCD of the
139 * weights if applicable. It should be called only once per proxy, at config
140 * time.
141 */
142void init_server_map(struct proxy *p)
143{
144 struct server *srv;
145 int pgcd;
146 int act, bck;
147
148 p->lbprm.set_server_status_up = map_set_server_status_up;
149 p->lbprm.set_server_status_down = map_set_server_status_down;
150 p->lbprm.update_server_eweight = NULL;
151
152 if (!p->srv)
153 return;
154
155 /* We will factor the weights to reduce the table,
156 * using Euclide's largest common divisor algorithm.
157 * Since we may have zero weights, we have to first
158 * find a non-zero weight server.
159 */
160 pgcd = 1;
161 srv = p->srv;
162 while (srv && !srv->uweight)
163 srv = srv->next;
164
165 if (srv) {
166 pgcd = srv->uweight; /* note: cannot be zero */
167 while (pgcd > 1 && (srv = srv->next)) {
168 int w = srv->uweight;
169 while (w) {
170 int t = pgcd % w;
171 pgcd = w;
172 w = t;
173 }
174 }
175 }
176
177 /* It is sometimes useful to know what factor to apply
178 * to the backend's effective weight to know its real
179 * weight.
180 */
181 p->lbprm.wmult = pgcd;
182
183 act = bck = 0;
184 for (srv = p->srv; srv; srv = srv->next) {
Emeric Brun52a91d32017-08-31 14:41:55 +0200185 srv->next_eweight = (srv->uweight * p->lbprm.wdiv + p->lbprm.wmult - 1) / p->lbprm.wmult;
Willy Tarreauc5150da2014-05-13 19:27:31 +0200186
Willy Tarreauc93cd162014-05-13 15:54:22 +0200187 if (srv->flags & SRV_F_BACKUP)
Emeric Brun52a91d32017-08-31 14:41:55 +0200188 bck += srv->next_eweight;
Willy Tarreauf89c1872009-10-01 11:19:37 +0200189 else
Emeric Brun52a91d32017-08-31 14:41:55 +0200190 act += srv->next_eweight;
191 srv_lb_commit_status(srv);
Willy Tarreauf89c1872009-10-01 11:19:37 +0200192 }
193
194 /* this is the largest map we will ever need for this servers list */
195 if (act < bck)
196 act = bck;
197
198 if (!act)
199 act = 1;
200
Vincent Bernat3c2f2f22016-04-03 13:48:42 +0200201 p->lbprm.map.srv = calloc(act, sizeof(struct server *));
Willy Tarreauf89c1872009-10-01 11:19:37 +0200202 /* recounts servers and their weights */
Willy Tarreauf89c1872009-10-01 11:19:37 +0200203 recount_servers(p);
204 update_backend_weight(p);
205 recalc_server_map(p);
206}
207
208/*
209 * This function tries to find a running server with free connection slots for
210 * the proxy <px> following the round-robin method.
211 * If any server is found, it will be returned and px->lbprm.map.rr_idx will be updated
212 * to point to the next server. If no valid server is found, NULL is returned.
Willy Tarreau1b877482018-08-21 19:44:53 +0200213 *
214 * The lbprm's lock will be used.
Willy Tarreauf89c1872009-10-01 11:19:37 +0200215 */
216struct server *map_get_server_rr(struct proxy *px, struct server *srvtoavoid)
217{
218 int newidx, avoididx;
219 struct server *srv, *avoided;
220
Christopher Faulet2a944ee2017-11-07 10:42:54 +0100221 HA_SPIN_LOCK(LBPRM_LOCK, &px->lbprm.lock);
Christopher Faulet5b517552017-06-09 14:17:53 +0200222 if (px->lbprm.tot_weight == 0) {
223 avoided = NULL;
224 goto out;
225 }
Willy Tarreauf89c1872009-10-01 11:19:37 +0200226
227 if (px->lbprm.map.rr_idx < 0 || px->lbprm.map.rr_idx >= px->lbprm.tot_weight)
228 px->lbprm.map.rr_idx = 0;
229 newidx = px->lbprm.map.rr_idx;
230
231 avoided = NULL;
232 avoididx = 0; /* shut a gcc warning */
233 do {
234 srv = px->lbprm.map.srv[newidx++];
Godbach8f9fd2f2013-08-07 09:48:23 +0800235 if (!srv->maxconn || (!srv->nbpend && srv->served < srv_dynamic_maxconn(srv))) {
Willy Tarreauf89c1872009-10-01 11:19:37 +0200236 /* make sure it is not the server we are try to exclude... */
Willy Tarreau03071f62017-11-05 10:59:12 +0100237 /* ...but remember that is was selected yet avoided */
238 avoided = srv;
239 avoididx = newidx;
Willy Tarreauf89c1872009-10-01 11:19:37 +0200240 if (srv != srvtoavoid) {
241 px->lbprm.map.rr_idx = newidx;
Willy Tarreau03071f62017-11-05 10:59:12 +0100242 goto out;
Willy Tarreauf89c1872009-10-01 11:19:37 +0200243 }
Willy Tarreauf89c1872009-10-01 11:19:37 +0200244 }
245 if (newidx == px->lbprm.tot_weight)
246 newidx = 0;
247 } while (newidx != px->lbprm.map.rr_idx);
248
249 if (avoided)
250 px->lbprm.map.rr_idx = avoididx;
251
Christopher Faulet5b517552017-06-09 14:17:53 +0200252 out:
Christopher Faulet2a944ee2017-11-07 10:42:54 +0100253 HA_SPIN_UNLOCK(LBPRM_LOCK, &px->lbprm.lock);
Willy Tarreauf89c1872009-10-01 11:19:37 +0200254 /* return NULL or srvtoavoid if found */
255 return avoided;
256}
257
Willy Tarreau39c9ba72009-10-01 21:11:15 +0200258/*
259 * This function returns the running server from the map at the location
260 * pointed to by the result of a modulo operation on <hash>. The server map may
261 * be recomputed if required before being looked up. If any server is found, it
262 * will be returned. If no valid server is found, NULL is returned.
Willy Tarreau1b877482018-08-21 19:44:53 +0200263 *
264 * The lbprm's lock will be used.
Willy Tarreau39c9ba72009-10-01 21:11:15 +0200265 */
266struct server *map_get_server_hash(struct proxy *px, unsigned int hash)
267{
Willy Tarreau1b877482018-08-21 19:44:53 +0200268 struct server *srv = NULL;
269
270 HA_SPIN_LOCK(LBPRM_LOCK, &px->lbprm.lock);
271 if (px->lbprm.tot_weight)
272 srv = px->lbprm.map.srv[hash % px->lbprm.tot_weight];
273 HA_SPIN_UNLOCK(LBPRM_LOCK, &px->lbprm.lock);
274 return srv;
Willy Tarreau39c9ba72009-10-01 21:11:15 +0200275}
276
Willy Tarreauf89c1872009-10-01 11:19:37 +0200277
278/*
279 * Local variables:
280 * c-indent-level: 8
281 * c-basic-offset: 8
282 * End:
283 */