Mercurial > hg > nginx-quic
annotate src/stream/ngx_stream_upstream_hash_module.c @ 7354:1812f1d79d84
Fixed socket leak with "return 444" in error_page (ticket #274).
Socket leak was observed in the following configuration:
error_page 400 = /close;
location = /close {
return 444;
}
The problem is that "return 444" triggers termination of the request,
and due to error_page termination thinks that it needs to use a posted
request to clear stack. But at the early request processing where 400
errors are generated there are no ngx_http_run_posted_requests() calls,
so the request is only terminated after an external event.
Variants of the problem include "error_page 497" instead (ticket #695)
and various other errors generated during early request processing
(405, 414, 421, 494, 495, 496, 501, 505).
The same problem can be also triggered with "return 499" and "return 408"
as both codes trigger ngx_http_terminate_request(), much like "return 444".
To fix this, the patch adds ngx_http_run_posted_requests() calls to
ngx_http_process_request_line() and ngx_http_process_request_headers()
functions, and to ngx_http_v2_run_request() and ngx_http_v2_push_stream()
functions in HTTP/2.
Since the ngx_http_process_request() function is now only called via
other functions which call ngx_http_run_posted_requests(), the call
there is no longer needed and was removed.
author | Maxim Dounin <mdounin@mdounin.ru> |
---|---|
date | Fri, 21 Sep 2018 15:59:30 +0300 |
parents | ed599ea6c1f1 |
children | d964b0aee8e7 |
rev | line source |
---|---|
6115 | 1 |
2 /* | |
3 * Copyright (C) Roman Arutyunyan | |
4 * Copyright (C) Nginx, Inc. | |
5 */ | |
6 | |
7 | |
8 #include <ngx_config.h> | |
9 #include <ngx_core.h> | |
10 #include <ngx_stream.h> | |
11 | |
12 | |
13 typedef struct { | |
14 uint32_t hash; | |
15 ngx_str_t *server; | |
16 } ngx_stream_upstream_chash_point_t; | |
17 | |
18 | |
19 typedef struct { | |
20 ngx_uint_t number; | |
21 ngx_stream_upstream_chash_point_t point[1]; | |
22 } ngx_stream_upstream_chash_points_t; | |
23 | |
24 | |
25 typedef struct { | |
6610
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
26 ngx_stream_complex_value_t key; |
6115 | 27 ngx_stream_upstream_chash_points_t *points; |
28 } ngx_stream_upstream_hash_srv_conf_t; | |
29 | |
30 | |
31 typedef struct { | |
32 /* the round robin data must be first */ | |
33 ngx_stream_upstream_rr_peer_data_t rrp; | |
34 ngx_stream_upstream_hash_srv_conf_t *conf; | |
35 ngx_str_t key; | |
36 ngx_uint_t tries; | |
37 ngx_uint_t rehash; | |
38 uint32_t hash; | |
39 ngx_event_get_peer_pt get_rr_peer; | |
40 } ngx_stream_upstream_hash_peer_data_t; | |
41 | |
42 | |
43 static ngx_int_t ngx_stream_upstream_init_hash(ngx_conf_t *cf, | |
44 ngx_stream_upstream_srv_conf_t *us); | |
45 static ngx_int_t ngx_stream_upstream_init_hash_peer(ngx_stream_session_t *s, | |
46 ngx_stream_upstream_srv_conf_t *us); | |
47 static ngx_int_t ngx_stream_upstream_get_hash_peer(ngx_peer_connection_t *pc, | |
48 void *data); | |
49 | |
50 static ngx_int_t ngx_stream_upstream_init_chash(ngx_conf_t *cf, | |
51 ngx_stream_upstream_srv_conf_t *us); | |
52 static int ngx_libc_cdecl | |
53 ngx_stream_upstream_chash_cmp_points(const void *one, const void *two); | |
54 static ngx_uint_t ngx_stream_upstream_find_chash_point( | |
55 ngx_stream_upstream_chash_points_t *points, uint32_t hash); | |
56 static ngx_int_t ngx_stream_upstream_init_chash_peer(ngx_stream_session_t *s, | |
57 ngx_stream_upstream_srv_conf_t *us); | |
58 static ngx_int_t ngx_stream_upstream_get_chash_peer(ngx_peer_connection_t *pc, | |
59 void *data); | |
60 | |
61 static void *ngx_stream_upstream_hash_create_conf(ngx_conf_t *cf); | |
62 static char *ngx_stream_upstream_hash(ngx_conf_t *cf, ngx_command_t *cmd, | |
63 void *conf); | |
64 | |
65 | |
66 static ngx_command_t ngx_stream_upstream_hash_commands[] = { | |
67 | |
68 { ngx_string("hash"), | |
69 NGX_STREAM_UPS_CONF|NGX_CONF_TAKE12, | |
70 ngx_stream_upstream_hash, | |
71 NGX_STREAM_SRV_CONF_OFFSET, | |
72 0, | |
73 NULL }, | |
74 | |
75 ngx_null_command | |
76 }; | |
77 | |
78 | |
79 static ngx_stream_module_t ngx_stream_upstream_hash_module_ctx = { | |
6606
2f41d383c9c7
Stream: added preconfiguration step.
Vladimir Homutov <vl@nginx.com>
parents:
6174
diff
changeset
|
80 NULL, /* preconfiguration */ |
6174
68c106e6fa0a
Stream: added postconfiguration method to stream modules.
Vladimir Homutov <vl@nginx.com>
parents:
6148
diff
changeset
|
81 NULL, /* postconfiguration */ |
68c106e6fa0a
Stream: added postconfiguration method to stream modules.
Vladimir Homutov <vl@nginx.com>
parents:
6148
diff
changeset
|
82 |
6115 | 83 NULL, /* create main configuration */ |
84 NULL, /* init main configuration */ | |
85 | |
86 ngx_stream_upstream_hash_create_conf, /* create server configuration */ | |
6629 | 87 NULL /* merge server configuration */ |
6115 | 88 }; |
89 | |
90 | |
91 ngx_module_t ngx_stream_upstream_hash_module = { | |
92 NGX_MODULE_V1, | |
93 &ngx_stream_upstream_hash_module_ctx, /* module context */ | |
94 ngx_stream_upstream_hash_commands, /* module directives */ | |
95 NGX_STREAM_MODULE, /* module type */ | |
96 NULL, /* init master */ | |
97 NULL, /* init module */ | |
98 NULL, /* init process */ | |
99 NULL, /* init thread */ | |
100 NULL, /* exit thread */ | |
101 NULL, /* exit process */ | |
102 NULL, /* exit master */ | |
103 NGX_MODULE_V1_PADDING | |
104 }; | |
105 | |
106 | |
107 static ngx_int_t | |
108 ngx_stream_upstream_init_hash(ngx_conf_t *cf, | |
109 ngx_stream_upstream_srv_conf_t *us) | |
110 { | |
111 if (ngx_stream_upstream_init_round_robin(cf, us) != NGX_OK) { | |
112 return NGX_ERROR; | |
113 } | |
114 | |
115 us->peer.init = ngx_stream_upstream_init_hash_peer; | |
116 | |
117 return NGX_OK; | |
118 } | |
119 | |
120 | |
121 static ngx_int_t | |
122 ngx_stream_upstream_init_hash_peer(ngx_stream_session_t *s, | |
123 ngx_stream_upstream_srv_conf_t *us) | |
124 { | |
125 ngx_stream_upstream_hash_srv_conf_t *hcf; | |
126 ngx_stream_upstream_hash_peer_data_t *hp; | |
127 | |
128 hp = ngx_palloc(s->connection->pool, | |
129 sizeof(ngx_stream_upstream_hash_peer_data_t)); | |
130 if (hp == NULL) { | |
131 return NGX_ERROR; | |
132 } | |
133 | |
134 s->upstream->peer.data = &hp->rrp; | |
135 | |
136 if (ngx_stream_upstream_init_round_robin_peer(s, us) != NGX_OK) { | |
137 return NGX_ERROR; | |
138 } | |
139 | |
140 s->upstream->peer.get = ngx_stream_upstream_get_hash_peer; | |
141 | |
142 hcf = ngx_stream_conf_upstream_srv_conf(us, | |
143 ngx_stream_upstream_hash_module); | |
144 | |
6610
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
145 if (ngx_stream_complex_value(s, &hcf->key, &hp->key) != NGX_OK) { |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
146 return NGX_ERROR; |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
147 } |
6115 | 148 |
149 ngx_log_debug1(NGX_LOG_DEBUG_STREAM, s->connection->log, 0, | |
150 "upstream hash key:\"%V\"", &hp->key); | |
151 | |
152 hp->conf = hcf; | |
153 hp->tries = 0; | |
154 hp->rehash = 0; | |
155 hp->hash = 0; | |
156 hp->get_rr_peer = ngx_stream_upstream_get_round_robin_peer; | |
157 | |
158 return NGX_OK; | |
159 } | |
160 | |
161 | |
162 static ngx_int_t | |
163 ngx_stream_upstream_get_hash_peer(ngx_peer_connection_t *pc, void *data) | |
164 { | |
165 ngx_stream_upstream_hash_peer_data_t *hp = data; | |
166 | |
167 time_t now; | |
168 u_char buf[NGX_INT_T_LEN]; | |
169 size_t size; | |
170 uint32_t hash; | |
171 ngx_int_t w; | |
172 uintptr_t m; | |
6121
b6047abf5f30
Upstream: simplified ip_hash and hash peer selection code.
Ruslan Ermilov <ru@nginx.com>
parents:
6115
diff
changeset
|
173 ngx_uint_t n, p; |
6115 | 174 ngx_stream_upstream_rr_peer_t *peer; |
175 | |
176 ngx_log_debug1(NGX_LOG_DEBUG_STREAM, pc->log, 0, | |
177 "get hash peer, try: %ui", pc->tries); | |
178 | |
7300
ed599ea6c1f1
Upstream: improved peer selection concurrency for hash and ip_hash.
Ruslan Ermilov <ru@nginx.com>
parents:
7124
diff
changeset
|
179 ngx_stream_upstream_rr_peers_rlock(hp->rrp.peers); |
6115 | 180 |
181 if (hp->tries > 20 || hp->rrp.peers->single) { | |
182 ngx_stream_upstream_rr_peers_unlock(hp->rrp.peers); | |
183 return hp->get_rr_peer(pc, &hp->rrp); | |
184 } | |
185 | |
186 now = ngx_time(); | |
187 | |
188 pc->connection = NULL; | |
189 | |
190 for ( ;; ) { | |
191 | |
192 /* | |
193 * Hash expression is compatible with Cache::Memcached: | |
194 * ((crc32([REHASH] KEY) >> 16) & 0x7fff) + PREV_HASH | |
195 * with REHASH omitted at the first iteration. | |
196 */ | |
197 | |
198 ngx_crc32_init(hash); | |
199 | |
200 if (hp->rehash > 0) { | |
201 size = ngx_sprintf(buf, "%ui", hp->rehash) - buf; | |
202 ngx_crc32_update(&hash, buf, size); | |
203 } | |
204 | |
205 ngx_crc32_update(&hash, hp->key.data, hp->key.len); | |
206 ngx_crc32_final(hash); | |
207 | |
208 hash = (hash >> 16) & 0x7fff; | |
209 | |
210 hp->hash += hash; | |
211 hp->rehash++; | |
212 | |
6121
b6047abf5f30
Upstream: simplified ip_hash and hash peer selection code.
Ruslan Ermilov <ru@nginx.com>
parents:
6115
diff
changeset
|
213 w = hp->hash % hp->rrp.peers->total_weight; |
b6047abf5f30
Upstream: simplified ip_hash and hash peer selection code.
Ruslan Ermilov <ru@nginx.com>
parents:
6115
diff
changeset
|
214 peer = hp->rrp.peers->peer; |
b6047abf5f30
Upstream: simplified ip_hash and hash peer selection code.
Ruslan Ermilov <ru@nginx.com>
parents:
6115
diff
changeset
|
215 p = 0; |
6115 | 216 |
6121
b6047abf5f30
Upstream: simplified ip_hash and hash peer selection code.
Ruslan Ermilov <ru@nginx.com>
parents:
6115
diff
changeset
|
217 while (w >= peer->weight) { |
b6047abf5f30
Upstream: simplified ip_hash and hash peer selection code.
Ruslan Ermilov <ru@nginx.com>
parents:
6115
diff
changeset
|
218 w -= peer->weight; |
b6047abf5f30
Upstream: simplified ip_hash and hash peer selection code.
Ruslan Ermilov <ru@nginx.com>
parents:
6115
diff
changeset
|
219 peer = peer->next; |
b6047abf5f30
Upstream: simplified ip_hash and hash peer selection code.
Ruslan Ermilov <ru@nginx.com>
parents:
6115
diff
changeset
|
220 p++; |
6115 | 221 } |
222 | |
223 n = p / (8 * sizeof(uintptr_t)); | |
224 m = (uintptr_t) 1 << p % (8 * sizeof(uintptr_t)); | |
225 | |
226 if (hp->rrp.tried[n] & m) { | |
227 goto next; | |
228 } | |
229 | |
7300
ed599ea6c1f1
Upstream: improved peer selection concurrency for hash and ip_hash.
Ruslan Ermilov <ru@nginx.com>
parents:
7124
diff
changeset
|
230 ngx_stream_upstream_rr_peer_lock(hp->rrp.peers, peer); |
ed599ea6c1f1
Upstream: improved peer selection concurrency for hash and ip_hash.
Ruslan Ermilov <ru@nginx.com>
parents:
7124
diff
changeset
|
231 |
6115 | 232 ngx_log_debug2(NGX_LOG_DEBUG_STREAM, pc->log, 0, |
233 "get hash peer, value:%uD, peer:%ui", hp->hash, p); | |
234 | |
235 if (peer->down) { | |
7300
ed599ea6c1f1
Upstream: improved peer selection concurrency for hash and ip_hash.
Ruslan Ermilov <ru@nginx.com>
parents:
7124
diff
changeset
|
236 ngx_stream_upstream_rr_peer_unlock(hp->rrp.peers, peer); |
6115 | 237 goto next; |
238 } | |
239 | |
240 if (peer->max_fails | |
241 && peer->fails >= peer->max_fails | |
242 && now - peer->checked <= peer->fail_timeout) | |
243 { | |
7300
ed599ea6c1f1
Upstream: improved peer selection concurrency for hash and ip_hash.
Ruslan Ermilov <ru@nginx.com>
parents:
7124
diff
changeset
|
244 ngx_stream_upstream_rr_peer_unlock(hp->rrp.peers, peer); |
6115 | 245 goto next; |
246 } | |
247 | |
6705 | 248 if (peer->max_conns && peer->conns >= peer->max_conns) { |
7300
ed599ea6c1f1
Upstream: improved peer selection concurrency for hash and ip_hash.
Ruslan Ermilov <ru@nginx.com>
parents:
7124
diff
changeset
|
249 ngx_stream_upstream_rr_peer_unlock(hp->rrp.peers, peer); |
6705 | 250 goto next; |
251 } | |
252 | |
6115 | 253 break; |
254 | |
255 next: | |
256 | |
257 if (++hp->tries > 20) { | |
258 ngx_stream_upstream_rr_peers_unlock(hp->rrp.peers); | |
259 return hp->get_rr_peer(pc, &hp->rrp); | |
260 } | |
261 } | |
262 | |
263 hp->rrp.current = peer; | |
264 | |
265 pc->sockaddr = peer->sockaddr; | |
266 pc->socklen = peer->socklen; | |
267 pc->name = &peer->name; | |
268 | |
269 peer->conns++; | |
270 | |
271 if (now - peer->checked > peer->fail_timeout) { | |
272 peer->checked = now; | |
273 } | |
274 | |
7300
ed599ea6c1f1
Upstream: improved peer selection concurrency for hash and ip_hash.
Ruslan Ermilov <ru@nginx.com>
parents:
7124
diff
changeset
|
275 ngx_stream_upstream_rr_peer_unlock(hp->rrp.peers, peer); |
6115 | 276 ngx_stream_upstream_rr_peers_unlock(hp->rrp.peers); |
277 | |
278 hp->rrp.tried[n] |= m; | |
279 | |
280 return NGX_OK; | |
281 } | |
282 | |
283 | |
284 static ngx_int_t | |
285 ngx_stream_upstream_init_chash(ngx_conf_t *cf, | |
286 ngx_stream_upstream_srv_conf_t *us) | |
287 { | |
288 u_char *host, *port, c; | |
289 size_t host_len, port_len, size; | |
6148
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
290 uint32_t hash, base_hash; |
6115 | 291 ngx_str_t *server; |
292 ngx_uint_t npoints, i, j; | |
293 ngx_stream_upstream_rr_peer_t *peer; | |
294 ngx_stream_upstream_rr_peers_t *peers; | |
295 ngx_stream_upstream_chash_points_t *points; | |
296 ngx_stream_upstream_hash_srv_conf_t *hcf; | |
6148
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
297 union { |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
298 uint32_t value; |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
299 u_char byte[4]; |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
300 } prev_hash; |
6115 | 301 |
302 if (ngx_stream_upstream_init_round_robin(cf, us) != NGX_OK) { | |
303 return NGX_ERROR; | |
304 } | |
305 | |
306 us->peer.init = ngx_stream_upstream_init_chash_peer; | |
307 | |
308 peers = us->peer.data; | |
309 npoints = peers->total_weight * 160; | |
310 | |
311 size = sizeof(ngx_stream_upstream_chash_points_t) | |
312 + sizeof(ngx_stream_upstream_chash_point_t) * (npoints - 1); | |
313 | |
314 points = ngx_palloc(cf->pool, size); | |
315 if (points == NULL) { | |
316 return NGX_ERROR; | |
317 } | |
318 | |
319 points->number = 0; | |
320 | |
321 for (peer = peers->peer; peer; peer = peer->next) { | |
322 server = &peer->server; | |
323 | |
324 /* | |
325 * Hash expression is compatible with Cache::Memcached::Fast: | |
326 * crc32(HOST \0 PORT PREV_HASH). | |
327 */ | |
328 | |
329 if (server->len >= 5 | |
330 && ngx_strncasecmp(server->data, (u_char *) "unix:", 5) == 0) | |
331 { | |
332 host = server->data + 5; | |
333 host_len = server->len - 5; | |
334 port = NULL; | |
335 port_len = 0; | |
336 goto done; | |
337 } | |
338 | |
339 for (j = 0; j < server->len; j++) { | |
340 c = server->data[server->len - j - 1]; | |
341 | |
342 if (c == ':') { | |
343 host = server->data; | |
344 host_len = server->len - j - 1; | |
345 port = server->data + server->len - j; | |
346 port_len = j; | |
347 goto done; | |
348 } | |
349 | |
350 if (c < '0' || c > '9') { | |
351 break; | |
352 } | |
353 } | |
354 | |
355 host = server->data; | |
356 host_len = server->len; | |
357 port = NULL; | |
358 port_len = 0; | |
359 | |
360 done: | |
361 | |
362 ngx_crc32_init(base_hash); | |
363 ngx_crc32_update(&base_hash, host, host_len); | |
364 ngx_crc32_update(&base_hash, (u_char *) "", 1); | |
365 ngx_crc32_update(&base_hash, port, port_len); | |
366 | |
6148
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
367 prev_hash.value = 0; |
6115 | 368 npoints = peer->weight * 160; |
369 | |
370 for (j = 0; j < npoints; j++) { | |
371 hash = base_hash; | |
372 | |
6148
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
373 ngx_crc32_update(&hash, prev_hash.byte, 4); |
6115 | 374 ngx_crc32_final(hash); |
375 | |
376 points->point[points->number].hash = hash; | |
377 points->point[points->number].server = server; | |
378 points->number++; | |
379 | |
6148
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
380 #if (NGX_HAVE_LITTLE_ENDIAN) |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
381 prev_hash.value = hash; |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
382 #else |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
383 prev_hash.byte[0] = (u_char) (hash & 0xff); |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
384 prev_hash.byte[1] = (u_char) ((hash >> 8) & 0xff); |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
385 prev_hash.byte[2] = (u_char) ((hash >> 16) & 0xff); |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
386 prev_hash.byte[3] = (u_char) ((hash >> 24) & 0xff); |
bf8b6534db3a
Upstream hash: consistency across little/big endianness.
Sergey Kandaurov <pluknet@nginx.com>
parents:
6121
diff
changeset
|
387 #endif |
6115 | 388 } |
389 } | |
390 | |
391 ngx_qsort(points->point, | |
392 points->number, | |
393 sizeof(ngx_stream_upstream_chash_point_t), | |
394 ngx_stream_upstream_chash_cmp_points); | |
395 | |
396 for (i = 0, j = 1; j < points->number; j++) { | |
397 if (points->point[i].hash != points->point[j].hash) { | |
398 points->point[++i] = points->point[j]; | |
399 } | |
400 } | |
401 | |
402 points->number = i + 1; | |
403 | |
404 hcf = ngx_stream_conf_upstream_srv_conf(us, | |
405 ngx_stream_upstream_hash_module); | |
406 hcf->points = points; | |
407 | |
408 return NGX_OK; | |
409 } | |
410 | |
411 | |
412 static int ngx_libc_cdecl | |
413 ngx_stream_upstream_chash_cmp_points(const void *one, const void *two) | |
414 { | |
415 ngx_stream_upstream_chash_point_t *first = | |
416 (ngx_stream_upstream_chash_point_t *) one; | |
417 ngx_stream_upstream_chash_point_t *second = | |
418 (ngx_stream_upstream_chash_point_t *) two; | |
419 | |
420 if (first->hash < second->hash) { | |
421 return -1; | |
422 | |
423 } else if (first->hash > second->hash) { | |
424 return 1; | |
425 | |
426 } else { | |
427 return 0; | |
428 } | |
429 } | |
430 | |
431 | |
432 static ngx_uint_t | |
433 ngx_stream_upstream_find_chash_point(ngx_stream_upstream_chash_points_t *points, | |
434 uint32_t hash) | |
435 { | |
436 ngx_uint_t i, j, k; | |
437 ngx_stream_upstream_chash_point_t *point; | |
438 | |
439 /* find first point >= hash */ | |
440 | |
441 point = &points->point[0]; | |
442 | |
443 i = 0; | |
444 j = points->number; | |
445 | |
446 while (i < j) { | |
447 k = (i + j) / 2; | |
448 | |
449 if (hash > point[k].hash) { | |
450 i = k + 1; | |
451 | |
452 } else if (hash < point[k].hash) { | |
453 j = k; | |
454 | |
455 } else { | |
456 return k; | |
457 } | |
458 } | |
459 | |
460 return i; | |
461 } | |
462 | |
463 | |
464 static ngx_int_t | |
465 ngx_stream_upstream_init_chash_peer(ngx_stream_session_t *s, | |
466 ngx_stream_upstream_srv_conf_t *us) | |
467 { | |
468 uint32_t hash; | |
469 ngx_stream_upstream_hash_srv_conf_t *hcf; | |
470 ngx_stream_upstream_hash_peer_data_t *hp; | |
471 | |
472 if (ngx_stream_upstream_init_hash_peer(s, us) != NGX_OK) { | |
473 return NGX_ERROR; | |
474 } | |
475 | |
476 s->upstream->peer.get = ngx_stream_upstream_get_chash_peer; | |
477 | |
478 hp = s->upstream->peer.data; | |
479 hcf = ngx_stream_conf_upstream_srv_conf(us, | |
480 ngx_stream_upstream_hash_module); | |
481 | |
482 hash = ngx_crc32_long(hp->key.data, hp->key.len); | |
483 | |
484 ngx_stream_upstream_rr_peers_rlock(hp->rrp.peers); | |
485 | |
486 hp->hash = ngx_stream_upstream_find_chash_point(hcf->points, hash); | |
487 | |
488 ngx_stream_upstream_rr_peers_unlock(hp->rrp.peers); | |
489 | |
490 return NGX_OK; | |
491 } | |
492 | |
493 | |
494 static ngx_int_t | |
495 ngx_stream_upstream_get_chash_peer(ngx_peer_connection_t *pc, void *data) | |
496 { | |
497 ngx_stream_upstream_hash_peer_data_t *hp = data; | |
498 | |
499 time_t now; | |
500 intptr_t m; | |
501 ngx_str_t *server; | |
502 ngx_int_t total; | |
503 ngx_uint_t i, n, best_i; | |
504 ngx_stream_upstream_rr_peer_t *peer, *best; | |
505 ngx_stream_upstream_chash_point_t *point; | |
506 ngx_stream_upstream_chash_points_t *points; | |
507 ngx_stream_upstream_hash_srv_conf_t *hcf; | |
508 | |
509 ngx_log_debug1(NGX_LOG_DEBUG_STREAM, pc->log, 0, | |
510 "get consistent hash peer, try: %ui", pc->tries); | |
511 | |
512 ngx_stream_upstream_rr_peers_wlock(hp->rrp.peers); | |
513 | |
7123
6c52b24fcf8e
Upstream hash: limited number of tries in consistent case.
Maxim Dounin <mdounin@mdounin.ru>
parents:
6705
diff
changeset
|
514 if (hp->tries > 20 || hp->rrp.peers->single) { |
6c52b24fcf8e
Upstream hash: limited number of tries in consistent case.
Maxim Dounin <mdounin@mdounin.ru>
parents:
6705
diff
changeset
|
515 ngx_stream_upstream_rr_peers_unlock(hp->rrp.peers); |
6c52b24fcf8e
Upstream hash: limited number of tries in consistent case.
Maxim Dounin <mdounin@mdounin.ru>
parents:
6705
diff
changeset
|
516 return hp->get_rr_peer(pc, &hp->rrp); |
6c52b24fcf8e
Upstream hash: limited number of tries in consistent case.
Maxim Dounin <mdounin@mdounin.ru>
parents:
6705
diff
changeset
|
517 } |
6c52b24fcf8e
Upstream hash: limited number of tries in consistent case.
Maxim Dounin <mdounin@mdounin.ru>
parents:
6705
diff
changeset
|
518 |
6115 | 519 pc->connection = NULL; |
520 | |
521 now = ngx_time(); | |
522 hcf = hp->conf; | |
523 | |
524 points = hcf->points; | |
525 point = &points->point[0]; | |
526 | |
527 for ( ;; ) { | |
528 server = point[hp->hash % points->number].server; | |
529 | |
530 ngx_log_debug2(NGX_LOG_DEBUG_STREAM, pc->log, 0, | |
531 "consistent hash peer:%uD, server:\"%V\"", | |
532 hp->hash, server); | |
533 | |
534 best = NULL; | |
535 best_i = 0; | |
536 total = 0; | |
537 | |
538 for (peer = hp->rrp.peers->peer, i = 0; | |
539 peer; | |
540 peer = peer->next, i++) | |
541 { | |
542 n = i / (8 * sizeof(uintptr_t)); | |
543 m = (uintptr_t) 1 << i % (8 * sizeof(uintptr_t)); | |
544 | |
545 if (hp->rrp.tried[n] & m) { | |
546 continue; | |
547 } | |
548 | |
549 if (peer->down) { | |
550 continue; | |
551 } | |
552 | |
553 if (peer->max_fails | |
554 && peer->fails >= peer->max_fails | |
555 && now - peer->checked <= peer->fail_timeout) | |
556 { | |
557 continue; | |
558 } | |
559 | |
6705 | 560 if (peer->max_conns && peer->conns >= peer->max_conns) { |
561 continue; | |
562 } | |
563 | |
7124
3b4fa572d56d
Upstream hash: reordered peer checks.
Maxim Dounin <mdounin@mdounin.ru>
parents:
7123
diff
changeset
|
564 if (peer->server.len != server->len |
3b4fa572d56d
Upstream hash: reordered peer checks.
Maxim Dounin <mdounin@mdounin.ru>
parents:
7123
diff
changeset
|
565 || ngx_strncmp(peer->server.data, server->data, server->len) |
3b4fa572d56d
Upstream hash: reordered peer checks.
Maxim Dounin <mdounin@mdounin.ru>
parents:
7123
diff
changeset
|
566 != 0) |
3b4fa572d56d
Upstream hash: reordered peer checks.
Maxim Dounin <mdounin@mdounin.ru>
parents:
7123
diff
changeset
|
567 { |
3b4fa572d56d
Upstream hash: reordered peer checks.
Maxim Dounin <mdounin@mdounin.ru>
parents:
7123
diff
changeset
|
568 continue; |
3b4fa572d56d
Upstream hash: reordered peer checks.
Maxim Dounin <mdounin@mdounin.ru>
parents:
7123
diff
changeset
|
569 } |
3b4fa572d56d
Upstream hash: reordered peer checks.
Maxim Dounin <mdounin@mdounin.ru>
parents:
7123
diff
changeset
|
570 |
6115 | 571 peer->current_weight += peer->effective_weight; |
572 total += peer->effective_weight; | |
573 | |
574 if (peer->effective_weight < peer->weight) { | |
575 peer->effective_weight++; | |
576 } | |
577 | |
578 if (best == NULL || peer->current_weight > best->current_weight) { | |
579 best = peer; | |
580 best_i = i; | |
581 } | |
582 } | |
583 | |
584 if (best) { | |
585 best->current_weight -= total; | |
586 break; | |
587 } | |
588 | |
589 hp->hash++; | |
590 hp->tries++; | |
591 | |
7123
6c52b24fcf8e
Upstream hash: limited number of tries in consistent case.
Maxim Dounin <mdounin@mdounin.ru>
parents:
6705
diff
changeset
|
592 if (hp->tries > 20) { |
6115 | 593 ngx_stream_upstream_rr_peers_unlock(hp->rrp.peers); |
7123
6c52b24fcf8e
Upstream hash: limited number of tries in consistent case.
Maxim Dounin <mdounin@mdounin.ru>
parents:
6705
diff
changeset
|
594 return hp->get_rr_peer(pc, &hp->rrp); |
6115 | 595 } |
596 } | |
597 | |
598 hp->rrp.current = best; | |
599 | |
600 pc->sockaddr = best->sockaddr; | |
601 pc->socklen = best->socklen; | |
602 pc->name = &best->name; | |
603 | |
604 best->conns++; | |
605 | |
606 if (now - best->checked > best->fail_timeout) { | |
607 best->checked = now; | |
608 } | |
609 | |
610 ngx_stream_upstream_rr_peers_unlock(hp->rrp.peers); | |
611 | |
612 n = best_i / (8 * sizeof(uintptr_t)); | |
613 m = (uintptr_t) 1 << best_i % (8 * sizeof(uintptr_t)); | |
614 | |
615 hp->rrp.tried[n] |= m; | |
616 | |
617 return NGX_OK; | |
618 } | |
619 | |
620 | |
621 static void * | |
622 ngx_stream_upstream_hash_create_conf(ngx_conf_t *cf) | |
623 { | |
624 ngx_stream_upstream_hash_srv_conf_t *conf; | |
625 | |
626 conf = ngx_palloc(cf->pool, sizeof(ngx_stream_upstream_hash_srv_conf_t)); | |
627 if (conf == NULL) { | |
628 return NULL; | |
629 } | |
630 | |
631 conf->points = NULL; | |
632 | |
633 return conf; | |
634 } | |
635 | |
636 | |
637 static char * | |
638 ngx_stream_upstream_hash(ngx_conf_t *cf, ngx_command_t *cmd, void *conf) | |
639 { | |
6610
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
640 ngx_stream_upstream_hash_srv_conf_t *hcf = conf; |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
641 |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
642 ngx_str_t *value; |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
643 ngx_stream_upstream_srv_conf_t *uscf; |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
644 ngx_stream_compile_complex_value_t ccv; |
6115 | 645 |
646 value = cf->args->elts; | |
647 | |
6610
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
648 ngx_memzero(&ccv, sizeof(ngx_stream_compile_complex_value_t)); |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
649 |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
650 ccv.cf = cf; |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
651 ccv.value = &value[1]; |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
652 ccv.complex_value = &hcf->key; |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
653 |
d5b5866c06c4
Stream: got rid of pseudo variables.
Vladimir Homutov <vl@nginx.com>
parents:
6606
diff
changeset
|
654 if (ngx_stream_compile_complex_value(&ccv) != NGX_OK) { |
6115 | 655 return NGX_CONF_ERROR; |
656 } | |
657 | |
658 uscf = ngx_stream_conf_get_module_srv_conf(cf, ngx_stream_upstream_module); | |
659 | |
660 if (uscf->peer.init_upstream) { | |
661 ngx_conf_log_error(NGX_LOG_WARN, cf, 0, | |
662 "load balancing method redefined"); | |
663 } | |
664 | |
665 uscf->flags = NGX_STREAM_UPSTREAM_CREATE | |
666 |NGX_STREAM_UPSTREAM_WEIGHT | |
6705 | 667 |NGX_STREAM_UPSTREAM_MAX_CONNS |
6115 | 668 |NGX_STREAM_UPSTREAM_MAX_FAILS |
669 |NGX_STREAM_UPSTREAM_FAIL_TIMEOUT | |
670 |NGX_STREAM_UPSTREAM_DOWN; | |
671 | |
672 if (cf->args->nelts == 2) { | |
673 uscf->peer.init_upstream = ngx_stream_upstream_init_hash; | |
674 | |
675 } else if (ngx_strcmp(value[2].data, "consistent") == 0) { | |
676 uscf->peer.init_upstream = ngx_stream_upstream_init_chash; | |
677 | |
678 } else { | |
679 ngx_conf_log_error(NGX_LOG_EMERG, cf, 0, | |
680 "invalid parameter \"%V\"", &value[2]); | |
681 return NGX_CONF_ERROR; | |
682 } | |
683 | |
684 return NGX_CONF_OK; | |
685 } |