337a999aa91c2f397fac641c7a69eaf3fcd22db5
[m6w6/libmemcached] / libmemcached / hosts.cc
1 /* vim:expandtab:shiftwidth=2:tabstop=2:smarttab:
2 *
3 * Libmemcached library
4 *
5 * Copyright (C) 2011 Data Differential, http://datadifferential.com/
6 * Copyright (C) 2006-2010 Brian Aker All rights reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions are
10 * met:
11 *
12 * * Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 *
15 * * Redistributions in binary form must reproduce the above
16 * copyright notice, this list of conditions and the following disclaimer
17 * in the documentation and/or other materials provided with the
18 * distribution.
19 *
20 * * The names of its contributors may not be used to endorse or
21 * promote products derived from this software without specific prior
22 * written permission.
23 *
24 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
25 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
26 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
27 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
28 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
29 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
30 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
31 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
32 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
33 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
34 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
35 *
36 */
37
38 #include <libmemcached/common.h>
39
40 #include <cmath>
41 #include <sys/time.h>
42
43 /* Prototypes (static) */
44 static memcached_return_t update_continuum(memcached_st *ptr);
45
46 static int compare_servers(const void *p1, const void *p2)
47 {
48 memcached_server_instance_st a= (memcached_server_instance_st)p1;
49 memcached_server_instance_st b= (memcached_server_instance_st)p2;
50
51 int return_value= strcmp(a->hostname, b->hostname);
52
53 if (return_value == 0)
54 {
55 return_value= (int) (a->port - b->port);
56 }
57
58 return return_value;
59 }
60
61 static void sort_hosts(memcached_st *ptr)
62 {
63 if (memcached_server_count(ptr))
64 {
65 memcached_server_write_instance_st instance;
66
67 qsort(memcached_server_list(ptr), memcached_server_count(ptr), sizeof(memcached_server_st), compare_servers);
68 instance= memcached_server_instance_fetch(ptr, 0);
69 instance->number_of_hosts= memcached_server_count(ptr);
70 }
71 }
72
73
74 memcached_return_t run_distribution(memcached_st *ptr)
75 {
76 if (ptr->flags.use_sort_hosts)
77 {
78 sort_hosts(ptr);
79 }
80
81 switch (ptr->distribution)
82 {
83 case MEMCACHED_DISTRIBUTION_CONSISTENT:
84 case MEMCACHED_DISTRIBUTION_CONSISTENT_KETAMA:
85 case MEMCACHED_DISTRIBUTION_CONSISTENT_KETAMA_SPY:
86 case MEMCACHED_DISTRIBUTION_CONSISTENT_WEIGHTED:
87 return update_continuum(ptr);
88
89 case MEMCACHED_DISTRIBUTION_VIRTUAL_BUCKET:
90 case MEMCACHED_DISTRIBUTION_MODULA:
91 break;
92
93 case MEMCACHED_DISTRIBUTION_RANDOM:
94 srandom((uint32_t) time(NULL));
95 break;
96
97 case MEMCACHED_DISTRIBUTION_CONSISTENT_MAX:
98 default:
99 assert_msg(0, "Invalid distribution type passed to run_distribution()");
100 }
101
102 return MEMCACHED_SUCCESS;
103 }
104
105 static uint32_t ketama_server_hash(const char *key, size_t key_length, uint32_t alignment)
106 {
107 unsigned char results[16];
108
109 libhashkit_md5_signature((unsigned char*)key, key_length, results);
110
111 return ((uint32_t) (results[3 + alignment * 4] & 0xFF) << 24)
112 | ((uint32_t) (results[2 + alignment * 4] & 0xFF) << 16)
113 | ((uint32_t) (results[1 + alignment * 4] & 0xFF) << 8)
114 | (results[0 + alignment * 4] & 0xFF);
115 }
116
117 static int continuum_item_cmp(const void *t1, const void *t2)
118 {
119 memcached_continuum_item_st *ct1= (memcached_continuum_item_st *)t1;
120 memcached_continuum_item_st *ct2= (memcached_continuum_item_st *)t2;
121
122 /* Why 153? Hmmm... */
123 WATCHPOINT_ASSERT(ct1->value != 153);
124 if (ct1->value == ct2->value)
125 return 0;
126 else if (ct1->value > ct2->value)
127 return 1;
128 else
129 return -1;
130 }
131
132 static memcached_return_t update_continuum(memcached_st *ptr)
133 {
134 uint32_t continuum_index= 0;
135 memcached_server_st *list;
136 uint32_t pointer_counter= 0;
137 uint32_t pointer_per_server= MEMCACHED_POINTS_PER_SERVER;
138 uint32_t pointer_per_hash= 1;
139 uint32_t live_servers= 0;
140 struct timeval now;
141
142 if (gettimeofday(&now, NULL))
143 {
144 return memcached_set_errno(*ptr, errno, MEMCACHED_AT);
145 }
146
147 list= memcached_server_list(ptr);
148
149 /* count live servers (those without a retry delay set) */
150 bool is_auto_ejecting= _is_auto_eject_host(ptr);
151 if (is_auto_ejecting)
152 {
153 live_servers= 0;
154 ptr->ketama.next_distribution_rebuild= 0;
155 for (uint32_t host_index= 0; host_index < memcached_server_count(ptr); ++host_index)
156 {
157 if (list[host_index].next_retry <= now.tv_sec)
158 {
159 live_servers++;
160 }
161 else
162 {
163 if (ptr->ketama.next_distribution_rebuild == 0 or list[host_index].next_retry < ptr->ketama.next_distribution_rebuild)
164 {
165 ptr->ketama.next_distribution_rebuild= list[host_index].next_retry;
166 }
167 }
168 }
169 }
170 else
171 {
172 live_servers= memcached_server_count(ptr);
173 }
174
175 uint64_t is_ketama_weighted= memcached_behavior_get(ptr, MEMCACHED_BEHAVIOR_KETAMA_WEIGHTED);
176 uint32_t points_per_server= (uint32_t) (is_ketama_weighted ? MEMCACHED_POINTS_PER_SERVER_KETAMA : MEMCACHED_POINTS_PER_SERVER);
177
178 if (not live_servers)
179 {
180 return MEMCACHED_SUCCESS;
181 }
182
183 if (live_servers > ptr->ketama.continuum_count)
184 {
185 memcached_continuum_item_st *new_ptr;
186
187 new_ptr= libmemcached_xrealloc(ptr, ptr->ketama.continuum, (live_servers + MEMCACHED_CONTINUUM_ADDITION) * points_per_server, memcached_continuum_item_st);
188
189 if (new_ptr == 0)
190 {
191 return MEMCACHED_MEMORY_ALLOCATION_FAILURE;
192 }
193
194 ptr->ketama.continuum= new_ptr;
195 ptr->ketama.continuum_count= live_servers + MEMCACHED_CONTINUUM_ADDITION;
196 }
197
198 uint64_t total_weight= 0;
199 if (is_ketama_weighted)
200 {
201 for (uint32_t host_index = 0; host_index < memcached_server_count(ptr); ++host_index)
202 {
203 if (is_auto_ejecting == false or list[host_index].next_retry <= now.tv_sec)
204 {
205 total_weight += list[host_index].weight;
206 }
207 }
208 }
209
210 for (uint32_t host_index= 0; host_index < memcached_server_count(ptr); ++host_index)
211 {
212 if (is_auto_ejecting and list[host_index].next_retry > now.tv_sec)
213 {
214 continue;
215 }
216
217 if (is_ketama_weighted)
218 {
219 float pct= (float)list[host_index].weight / (float)total_weight;
220 pointer_per_server= (uint32_t) ((::floor((float) (pct * MEMCACHED_POINTS_PER_SERVER_KETAMA / 4 * (float)live_servers + 0.0000000001))) * 4);
221 pointer_per_hash= 4;
222 if (DEBUG)
223 {
224 printf("ketama_weighted:%s|%d|%llu|%u\n",
225 list[host_index].hostname,
226 list[host_index].port,
227 (unsigned long long)list[host_index].weight,
228 pointer_per_server);
229 }
230 }
231
232
233 if (ptr->distribution == MEMCACHED_DISTRIBUTION_CONSISTENT_KETAMA_SPY)
234 {
235 for (uint32_t pointer_index= 0;
236 pointer_index < pointer_per_server / pointer_per_hash;
237 pointer_index++)
238 {
239 char sort_host[1 +MEMCACHED_NI_MAXHOST +1 +MEMCACHED_NI_MAXSERV +1 + MEMCACHED_NI_MAXSERV ]= "";
240 int sort_host_length;
241
242 // Spymemcached ketema key format is: hostname/ip:port-index
243 // If hostname is not available then: /ip:port-index
244 sort_host_length= snprintf(sort_host, sizeof(sort_host),
245 "/%s:%u-%u",
246 list[host_index].hostname,
247 (uint32_t)list[host_index].port,
248 pointer_index);
249
250 if (size_t(sort_host_length) >= sizeof(sort_host) or sort_host_length < 0)
251 {
252 return memcached_set_error(*ptr, MEMCACHED_MEMORY_ALLOCATION_FAILURE, MEMCACHED_AT,
253 memcached_literal_param("snprintf(sizeof(sort_host))"));
254 }
255
256 if (DEBUG)
257 {
258 fprintf(stdout, "update_continuum: key is %s\n", sort_host);
259 }
260
261 if (is_ketama_weighted)
262 {
263 for (uint32_t x= 0; x < pointer_per_hash; x++)
264 {
265 uint32_t value= ketama_server_hash(sort_host, (size_t)sort_host_length, x);
266 ptr->ketama.continuum[continuum_index].index= host_index;
267 ptr->ketama.continuum[continuum_index++].value= value;
268 }
269 }
270 else
271 {
272 uint32_t value= hashkit_digest(&ptr->hashkit, sort_host, (size_t)sort_host_length);
273 ptr->ketama.continuum[continuum_index].index= host_index;
274 ptr->ketama.continuum[continuum_index++].value= value;
275 }
276 }
277 }
278 else
279 {
280 for (uint32_t pointer_index= 1;
281 pointer_index <= pointer_per_server / pointer_per_hash;
282 pointer_index++)
283 {
284 char sort_host[MEMCACHED_NI_MAXHOST +1 +MEMCACHED_NI_MAXSERV +1 +MEMCACHED_NI_MAXSERV]= "";
285 int sort_host_length;
286
287 if (list[host_index].port == MEMCACHED_DEFAULT_PORT)
288 {
289 sort_host_length= snprintf(sort_host, sizeof(sort_host),
290 "%s-%u",
291 list[host_index].hostname,
292 pointer_index - 1);
293 }
294 else
295 {
296 sort_host_length= snprintf(sort_host, sizeof(sort_host),
297 "%s:%u-%u",
298 list[host_index].hostname,
299 (uint32_t)list[host_index].port,
300 pointer_index - 1);
301 }
302
303 if (size_t(sort_host_length) >= sizeof(sort_host) or sort_host_length < 0)
304 {
305 return memcached_set_error(*ptr, MEMCACHED_MEMORY_ALLOCATION_FAILURE, MEMCACHED_AT,
306 memcached_literal_param("snprintf(sizeof(sort_host)))"));
307 }
308
309 if (is_ketama_weighted)
310 {
311 for (uint32_t x = 0; x < pointer_per_hash; x++)
312 {
313 uint32_t value= ketama_server_hash(sort_host, (size_t)sort_host_length, x);
314 ptr->ketama.continuum[continuum_index].index= host_index;
315 ptr->ketama.continuum[continuum_index++].value= value;
316 }
317 }
318 else
319 {
320 uint32_t value= hashkit_digest(&ptr->hashkit, sort_host, (size_t)sort_host_length);
321 ptr->ketama.continuum[continuum_index].index= host_index;
322 ptr->ketama.continuum[continuum_index++].value= value;
323 }
324 }
325 }
326
327 pointer_counter+= pointer_per_server;
328 }
329
330 WATCHPOINT_ASSERT(ptr);
331 WATCHPOINT_ASSERT(ptr->ketama.continuum);
332 WATCHPOINT_ASSERT(memcached_server_count(ptr) * MEMCACHED_POINTS_PER_SERVER <= MEMCACHED_CONTINUUM_SIZE);
333 ptr->ketama.continuum_points_counter= pointer_counter;
334 qsort(ptr->ketama.continuum, ptr->ketama.continuum_points_counter, sizeof(memcached_continuum_item_st), continuum_item_cmp);
335
336 if (DEBUG)
337 {
338 for (uint32_t pointer_index= 0; memcached_server_count(ptr) && pointer_index < ((live_servers * MEMCACHED_POINTS_PER_SERVER) - 1); pointer_index++)
339 {
340 WATCHPOINT_ASSERT(ptr->ketama.continuum[pointer_index].value <= ptr->ketama.continuum[pointer_index + 1].value);
341 }
342 }
343
344 return MEMCACHED_SUCCESS;
345 }
346
347 static memcached_return_t server_add(memcached_st *ptr,
348 const memcached_string_t& hostname,
349 in_port_t port,
350 uint32_t weight,
351 memcached_connection_t type)
352 {
353 assert_msg(ptr, "Programmer mistake, somehow server_add() was passed a NULL memcached_st");
354
355 memcached_server_st *new_host_list= libmemcached_xrealloc(ptr, memcached_server_list(ptr), (ptr->number_of_hosts + 1), memcached_server_st);
356
357 if (new_host_list == NULL)
358 {
359 return memcached_set_error(*ptr, MEMCACHED_MEMORY_ALLOCATION_FAILURE, MEMCACHED_AT);
360 }
361
362 memcached_server_list_set(ptr, new_host_list);
363
364 /* TODO: Check return type */
365 memcached_server_write_instance_st instance= memcached_server_instance_fetch(ptr, memcached_server_count(ptr));
366
367 if (__server_create_with(ptr, instance, hostname, port, weight, type) == NULL)
368 {
369 return memcached_set_error(*ptr, MEMCACHED_MEMORY_ALLOCATION_FAILURE, MEMCACHED_AT);
370 }
371
372 if (weight > 1)
373 {
374 ptr->ketama.weighted= true;
375 }
376
377 ptr->number_of_hosts++;
378
379 // @note we place the count in the bottom of the server list
380 instance= memcached_server_instance_fetch(ptr, 0);
381 memcached_servers_set_count(instance, memcached_server_count(ptr));
382
383 return run_distribution(ptr);
384 }
385
386
387 memcached_return_t memcached_server_push(memcached_st *ptr, const memcached_server_list_st list)
388 {
389 if (list == NULL)
390 {
391 return MEMCACHED_SUCCESS;
392 }
393
394 uint32_t count= memcached_server_list_count(list);
395
396 memcached_server_st *new_host_list;
397 new_host_list= libmemcached_xrealloc(ptr, memcached_server_list(ptr), (count + memcached_server_count(ptr)), memcached_server_st);
398
399 if (new_host_list == NULL)
400 {
401 return MEMCACHED_MEMORY_ALLOCATION_FAILURE;
402 }
403
404 memcached_server_list_set(ptr, new_host_list);
405
406 for (uint32_t x= 0; x < count; x++)
407 {
408 memcached_server_write_instance_st instance;
409
410 WATCHPOINT_ASSERT(list[x].hostname[0] != 0);
411
412 // We have extended the array, and now we will find it, and use it.
413 instance= memcached_server_instance_fetch(ptr, memcached_server_count(ptr));
414 WATCHPOINT_ASSERT(instance);
415
416 memcached_string_t hostname= { memcached_string_make_from_cstr(list[x].hostname) };
417 if (__server_create_with(ptr, instance,
418 hostname,
419 list[x].port, list[x].weight, list[x].type) == NULL)
420 {
421 return memcached_set_error(*ptr, MEMCACHED_MEMORY_ALLOCATION_FAILURE, MEMCACHED_AT);
422 }
423
424 if (list[x].weight > 1)
425 {
426 ptr->ketama.weighted= true;
427 }
428
429 ptr->number_of_hosts++;
430 }
431
432 // Provides backwards compatibility with server list.
433 {
434 memcached_server_write_instance_st instance;
435 instance= memcached_server_instance_fetch(ptr, 0);
436 instance->number_of_hosts= memcached_server_count(ptr);
437 }
438
439 return run_distribution(ptr);
440 }
441
442 memcached_return_t memcached_server_add_unix_socket(memcached_st *ptr,
443 const char *filename)
444 {
445 return memcached_server_add_unix_socket_with_weight(ptr, filename, 0);
446 }
447
448 memcached_return_t memcached_server_add_unix_socket_with_weight(memcached_st *ptr,
449 const char *filename,
450 uint32_t weight)
451 {
452 if (ptr == NULL)
453 {
454 return MEMCACHED_FAILURE;
455 }
456
457 memcached_string_t _filename= { memcached_string_make_from_cstr(filename) };
458 if (memcached_is_valid_servername(_filename) == false)
459 {
460 memcached_set_error(*ptr, MEMCACHED_INVALID_ARGUMENTS, MEMCACHED_AT, memcached_literal_param("Invalid filename for socket provided"));
461 }
462
463 return server_add(ptr, _filename, 0, weight, MEMCACHED_CONNECTION_UNIX_SOCKET);
464 }
465
466 memcached_return_t memcached_server_add_udp(memcached_st *ptr,
467 const char *hostname,
468 in_port_t port)
469 {
470 return memcached_server_add_udp_with_weight(ptr, hostname, port, 0);
471 }
472
473 memcached_return_t memcached_server_add_udp_with_weight(memcached_st *ptr,
474 const char *,
475 in_port_t,
476 uint32_t)
477 {
478 if (ptr == NULL)
479 {
480 return MEMCACHED_INVALID_ARGUMENTS;
481 }
482
483 return memcached_set_error(*ptr, MEMCACHED_DEPRECATED, MEMCACHED_AT);
484 }
485
486 memcached_return_t memcached_server_add(memcached_st *ptr,
487 const char *hostname,
488 in_port_t port)
489 {
490 return memcached_server_add_with_weight(ptr, hostname, port, 0);
491 }
492
493 memcached_return_t memcached_server_add_with_weight(memcached_st *ptr,
494 const char *hostname,
495 in_port_t port,
496 uint32_t weight)
497 {
498 if (ptr == NULL)
499 {
500 return MEMCACHED_INVALID_ARGUMENTS;
501 }
502
503 if (port == 0)
504 {
505 port= MEMCACHED_DEFAULT_PORT;
506 }
507
508 size_t hostname_length= hostname ? strlen(hostname) : 0;
509 if (hostname_length == 0)
510 {
511 hostname= "localhost";
512 hostname_length= memcached_literal_param_size("localhost");
513 }
514
515 memcached_string_t _hostname= { hostname, hostname_length };
516
517 if (memcached_is_valid_servername(_hostname) == false)
518 {
519 return memcached_set_error(*ptr, MEMCACHED_INVALID_ARGUMENTS, MEMCACHED_AT, memcached_literal_param("Invalid hostname provided"));
520 }
521
522 return server_add(ptr, _hostname, port, weight, _hostname.c_str[0] == '/' ? MEMCACHED_CONNECTION_UNIX_SOCKET : MEMCACHED_CONNECTION_TCP);
523 }
524
525 memcached_return_t memcached_server_add_parsed(memcached_st *ptr,
526 const char *hostname,
527 size_t hostname_length,
528 in_port_t port,
529 uint32_t weight)
530 {
531 char buffer[NI_MAXHOST];
532
533 memcpy(buffer, hostname, hostname_length);
534 buffer[hostname_length]= 0;
535
536 memcached_string_t _hostname= { buffer, hostname_length };
537
538 return server_add(ptr, _hostname,
539 port,
540 weight,
541 MEMCACHED_CONNECTION_TCP);
542 }