0
|
1 /* Distributed Checksum Clearinghouse |
|
2 * |
|
3 * helper processes for DNS blacklists |
|
4 * |
|
5 * Copyright (c) 2008 by Rhyolite Software, LLC |
|
6 * |
|
7 * This agreement is not applicable to any entity which sells anti-spam |
|
8 * solutions to others or provides an anti-spam solution as part of a |
|
9 * security solution sold to other entities, or to a private network |
|
10 * which employs the DCC or uses data provided by operation of the DCC |
|
11 * but does not provide corresponding data to other users. |
|
12 * |
|
13 * Permission to use, copy, modify, and distribute this software without |
|
14 * changes for any purpose with or without fee is hereby granted, provided |
|
15 * that the above copyright notice and this permission notice appear in all |
|
16 * copies and any distributed versions or copies are either unchanged |
|
17 * or not called anything similar to "DCC" or "Distributed Checksum |
|
18 * Clearinghouse". |
|
19 * |
|
20 * Parties not eligible to receive a license under this agreement can |
|
21 * obtain a commercial license to use DCC by contacting Rhyolite Software |
|
22 * at sales@rhyolite.com. |
|
23 * |
|
24 * A commercial license would be for Distributed Checksum and Reputation |
|
25 * Clearinghouse software. That software includes additional features. This |
|
26 * free license for Distributed ChecksumClearinghouse Software does not in any |
|
27 * way grant permision to use Distributed Checksum and Reputation Clearinghouse |
|
28 * software |
|
29 * |
|
30 * THE SOFTWARE IS PROVIDED "AS IS" AND RHYOLITE SOFTWARE, LLC DISCLAIMS ALL |
|
31 * WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES |
|
32 * OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL RHYOLITE SOFTWARE, LLC |
|
33 * BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES |
|
34 * OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, |
|
35 * WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, |
|
36 * ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS |
|
37 * SOFTWARE. |
|
38 * |
|
39 * Rhyolite Software DCC 1.3.103-1.42 $Revision$ |
|
40 */ |
|
41 |
|
42 #include "helper.h" |
|
43 #include "dcc_heap_debug.h" |
|
44 #include <signal.h> |
|
45 #include <sys/wait.h> |
|
46 |
|
47 |
|
48 #ifdef HAVE_HELPERS |
|
49 |
|
50 #define HELPER_MAX_FAILURES 5 /* shutdown & restart these total */ |
|
51 |
|
52 #define MAX_SLOW 2 /* 50% excess for slow DNS resolver */ |
|
53 |
|
54 |
|
55 /* add to the argv list for the helper processes */ |
|
56 void |
|
57 helper_save_arg(const char *flag, const char *value) |
|
58 { |
|
59 char const **new_arg; |
|
60 int i; |
|
61 |
|
62 if (helper.free_args <= 1) { |
|
63 /* reserve space for the argv[0] and the null terminator */ |
|
64 helper.free_args += 5; |
|
65 i = (helper.argc + 2*helper.free_args) * sizeof(char *); |
|
66 new_arg = dcc_malloc(i); |
|
67 memset(new_arg, 0, i); |
|
68 if (helper.argv) { |
|
69 for (i = 0; i < helper.argc; ++i) |
|
70 new_arg[i] = helper.argv[i]; |
|
71 dcc_free(helper.argv); |
|
72 } else { |
|
73 ++helper.argc; |
|
74 } |
|
75 helper.argv = new_arg; |
|
76 } |
|
77 |
|
78 helper.argv[helper.argc] = flag; |
|
79 helper.argv[++helper.argc] = value; |
|
80 helper.argv[++helper.argc] = 0; |
|
81 --helper.free_args; |
|
82 } |
|
83 |
|
84 |
|
85 |
|
86 /* initialize things for the parent or one of the helping children */ |
|
87 void |
|
88 helper_init(int max_helpers) |
|
89 { |
|
90 helper.sn = getpid() + time(0); |
|
91 |
|
92 helper.pipe_write = -1; |
|
93 helper.pipe_read = -1; |
|
94 helper.soc = INVALID_SOCKET; |
|
95 helper.req_len = sizeof(DNSBL_REQ); |
|
96 |
|
97 if (max_helpers) { |
|
98 /* max_helpers=0 if we are starting a child, |
|
99 * but != 0 in the parent after parsing all args |
|
100 * |
|
101 * default to dccifd or dccm max_work */ |
|
102 if (!helper.max_helpers) |
|
103 helper.max_helpers = max_helpers; |
|
104 |
|
105 helper.pids = dcc_malloc(sizeof(pid_t) * helper.max_helpers); |
|
106 memset(helper.pids, 0, sizeof(pid_t) * helper.max_helpers); |
|
107 } |
|
108 |
|
109 have_helpers = helper_lock_init(); |
|
110 } |
|
111 |
|
112 |
|
113 |
|
114 /* collect zombies of helpers that died from boredom or otherwise */ |
|
115 void |
|
116 reap_helpers(u_char locked) |
|
117 { |
|
118 int status; |
|
119 pid_t pid; |
|
120 int pid_inx; |
|
121 |
|
122 if (!locked) |
|
123 helper_lock(); |
|
124 |
|
125 for (;;) { |
|
126 wait_again:; |
|
127 pid = waitpid(0, &status, WNOHANG); |
|
128 if (0 >= pid) { |
|
129 if (!locked) |
|
130 helper_unlock(); |
|
131 return; |
|
132 } |
|
133 |
|
134 for (pid_inx = 0; ; ++pid_inx) { |
|
135 if (pid_inx >= helper.max_helpers) { |
|
136 /* not an acknowledged child */ |
|
137 if (helper.debug >= 1) |
|
138 dcc_trace_msg("not a DNSBL" |
|
139 " helper process reaped"); |
|
140 goto wait_again; |
|
141 } |
|
142 |
|
143 if (helper.pids[pid_inx] == pid) |
|
144 break; |
|
145 } |
|
146 |
|
147 helper.pids[pid_inx] = 0; |
|
148 |
|
149 /* races with dying helpers can confuse us */ |
|
150 if (--helper.total_helpers < 0) { |
|
151 if (helper.debug) |
|
152 dcc_trace_msg("DNSBL total helpers=%d", |
|
153 helper.total_helpers); |
|
154 helper.total_helpers = 0; |
|
155 } |
|
156 |
|
157 if (helper.slow_helpers > helper.total_helpers/MAX_SLOW) |
|
158 helper.slow_helpers = helper.total_helpers/MAX_SLOW; |
|
159 |
|
160 if (--helper.idle_helpers < 0) { |
|
161 /* We cannot be certain that a helper that quit was |
|
162 * idle, but it should have been. */ |
|
163 if (helper.debug) |
|
164 dcc_trace_msg("DNSBL idle helpers=%d", |
|
165 helper.idle_helpers); |
|
166 helper.idle_helpers = 0; |
|
167 } else if (helper.idle_helpers > helper.total_helpers) { |
|
168 /* The limit on the total_helpers can let us |
|
169 * drive idle_helpers<0 |
|
170 * which can make the previous fix wrong */ |
|
171 if (helper.debug) |
|
172 dcc_trace_msg("DNSBL idle helpers=%d" |
|
173 " total helpers=%d", |
|
174 helper.idle_helpers, |
|
175 helper.total_helpers); |
|
176 helper.idle_helpers = helper.total_helpers; |
|
177 } |
|
178 |
|
179 /* this is called from the "totals" thread |
|
180 * and so cannot use thr_error_msg() */ |
|
181 |
|
182 #if defined(WIFEXITED) && defined(WEXITSTATUS) |
|
183 if (WIFEXITED(status)) { |
|
184 if (WEXITSTATUS(status) == 0) { |
|
185 if (helper.debug > 1) |
|
186 dcc_trace_msg("DNSBL helper %d quit," |
|
187 " leaving %d helpers," |
|
188 " %d idle", |
|
189 (int)pid, |
|
190 helper.total_helpers, |
|
191 helper.idle_helpers); |
|
192 continue; |
|
193 } |
|
194 dcc_error_msg("DNSBL helper %d quit with exit(%d)," |
|
195 " leaving %d helpers, %d idle", |
|
196 (int)pid, WEXITSTATUS(status), |
|
197 helper.total_helpers, |
|
198 helper.idle_helpers); |
|
199 continue; |
|
200 } |
|
201 #endif |
|
202 #if defined(WTERMSIG) && defined(WIFSIGNALED) |
|
203 if (WIFSIGNALED(status)) { |
|
204 dcc_error_msg("DNSBL helper %d quit with signal %d," |
|
205 " leaving %d helpers, %d idle", |
|
206 (int)pid, WTERMSIG(status), |
|
207 helper.total_helpers, |
|
208 helper.idle_helpers); |
|
209 continue; |
|
210 } |
|
211 #endif |
|
212 dcc_error_msg("DNSBL helper %d quit with %d," |
|
213 " leaving %d helpers, %d idle", |
|
214 (int)pid, status, |
|
215 helper.total_helpers, helper.idle_helpers); |
|
216 } |
|
217 } |
|
218 |
|
219 |
|
220 |
|
221 /* must be called with the counter mutex */ |
|
222 static void |
|
223 terminate_helpers(void) |
|
224 { |
|
225 if (helper.pipe_write != -1) { |
|
226 close(helper.pipe_write); |
|
227 helper.pipe_write = -1; |
|
228 } |
|
229 if (helper.pipe_read != -1) { |
|
230 close(helper.pipe_read); |
|
231 helper.pipe_read = -1; |
|
232 } |
|
233 if (helper.soc != INVALID_SOCKET) { |
|
234 closesocket(helper.soc); |
|
235 helper.soc = INVALID_SOCKET; |
|
236 } |
|
237 |
|
238 reap_helpers(1); |
|
239 ++helper.gen; |
|
240 memset(helper.pids, 0, sizeof(pid_t) * helper.max_helpers); |
|
241 helper.total_helpers = 0; |
|
242 helper.idle_helpers = 0; |
|
243 helper.slow_helpers = 0; |
|
244 |
|
245 helper.failures = 0; |
|
246 } |
|
247 |
|
248 |
|
249 |
|
250 static void |
|
251 help_finish(u_int gen, u_char ok, u_char counted, u_char locked) |
|
252 { |
|
253 if (!locked) |
|
254 helper_lock(); |
|
255 |
|
256 /* forget it if the children have been restarted */ |
|
257 if (gen == helper.gen) { |
|
258 if (counted) |
|
259 ++helper.idle_helpers; |
|
260 |
|
261 if (!ok) { |
|
262 if (++helper.failures >= HELPER_MAX_FAILURES) { |
|
263 if (helper.debug) |
|
264 dcc_trace_msg("restart DNSBL helpers"); |
|
265 terminate_helpers(); |
|
266 } else { |
|
267 reap_helpers(1); |
|
268 } |
|
269 } |
|
270 } |
|
271 |
|
272 if (!locked) |
|
273 helper_unlock(); |
|
274 } |
|
275 |
|
276 |
|
277 |
|
278 static u_char |
|
279 helper_soc_open(DCC_EMSG emsg, DCC_CLNT_CTXT *ctxt) |
|
280 { |
|
281 u_char result; |
|
282 |
|
283 if (ctxt->soc != INVALID_SOCKET) |
|
284 return 1; |
|
285 |
|
286 dcc_ctxts_lock(); |
|
287 if (!dcc_info_lock(emsg)) { |
|
288 dcc_ctxts_unlock(); |
|
289 return 0; |
|
290 } |
|
291 result = dcc_clnt_soc_reopen(emsg, ctxt); |
|
292 if (!dcc_info_unlock(emsg)) |
|
293 result = 0; |
|
294 dcc_ctxts_unlock(); |
|
295 return result; |
|
296 } |
|
297 |
|
298 |
|
299 |
|
300 static u_char |
|
301 helper_soc_connect(DCC_EMSG emsg, DCC_CLNT_CTXT *ctxt, const DCC_SOCKU *su) |
|
302 { |
|
303 u_char result; |
|
304 |
|
305 #ifdef linux |
|
306 /* since at least some versions of Linux refuse to reconnect, |
|
307 * just disconnect */ |
|
308 su = 0; |
|
309 #endif |
|
310 |
|
311 dcc_ctxts_lock(); |
|
312 if (!dcc_info_lock(emsg)) { |
|
313 dcc_ctxts_unlock(); |
|
314 return 0; |
|
315 } |
|
316 result = dcc_clnt_connect(emsg, ctxt, su); |
|
317 if (!dcc_info_unlock(emsg)) |
|
318 result = 0; |
|
319 dcc_ctxts_unlock(); |
|
320 |
|
321 return result; |
|
322 } |
|
323 |
|
324 |
|
325 |
|
326 /* open the helper socket used to send requests to helper processes |
|
327 * must be called with the counter mutex */ |
|
328 static u_char |
|
329 open_helper(DCC_EMSG emsg, DCC_CLNT_CTXT *ctxt, void *lp) |
|
330 { |
|
331 struct in6_addr ipv6_loopback; |
|
332 struct in_addr ipv4_loopback; |
|
333 DCC_SOCKLEN_T soc_len; |
|
334 static int rcvbuf = 32*1024; |
|
335 static u_char rcvbuf_set = 0; |
|
336 |
|
337 /* We want to create a new socket with the same choice of |
|
338 * IPv4 or IPv6 as the DCC client context's socket. To do that, |
|
339 * we must ensure that the context's socket is healthy. */ |
|
340 if (!helper_soc_open(emsg, ctxt)) { |
|
341 thr_error_msg(lp, "DNSBL helper soc_open(): %s", emsg); |
|
342 return 0; |
|
343 } |
|
344 |
|
345 if (dcc_clnt_info->src.family != AF_UNSPEC) { |
|
346 /* bind to the send-from address if available */ |
|
347 dcc_mk_su(&helper.su, dcc_clnt_info->src.family, |
|
348 &dcc_clnt_info->src.u, 0); |
|
349 } else if (ctxt->flags & DCC_CTXT_USING_IPV4) { |
|
350 ipv4_loopback.s_addr = ntohl(0x7f000001); |
|
351 dcc_mk_su(&helper.su, AF_INET, &ipv4_loopback, 0); |
|
352 } else { |
|
353 memset(&ipv6_loopback, 0, sizeof(ipv6_loopback)); |
|
354 ipv6_loopback.s6_addr32[3] = ntohl(1); |
|
355 dcc_mk_su(&helper.su, AF_INET6, &ipv6_loopback, 0); |
|
356 } |
|
357 clean_stdio(); |
|
358 if (0 >= dcc_udp_bind(emsg, &helper.soc, &helper.su, 0)) { |
|
359 thr_error_msg(lp, "DNSBL helper bind(%s): %s", |
|
360 dcc_su2str_err(&helper.su), emsg); |
|
361 terminate_helpers(); |
|
362 return 0; |
|
363 } |
|
364 soc_len = sizeof(helper.su); |
|
365 if (0 > getsockname(helper.soc, &helper.su.sa, &soc_len)) { |
|
366 thr_error_msg(lp, "DNSBL helper getsockname(%d, %s): %s", |
|
367 helper.soc, dcc_su2str_err(&helper.su), |
|
368 ERROR_STR()); |
|
369 terminate_helpers(); |
|
370 return 0; |
|
371 } |
|
372 for (;;) { |
|
373 if (!setsockopt(helper.soc, SOL_SOCKET, SO_RCVBUF, |
|
374 &rcvbuf, sizeof(rcvbuf))) |
|
375 break; |
|
376 if (rcvbuf_set || rcvbuf <= 4096) { |
|
377 thr_error_msg(lp, |
|
378 "DNSBL setsockopt(%s,SO_RCVBUF=%d): %s", |
|
379 dcc_su2str_err(&helper.su), |
|
380 rcvbuf, ERROR_STR()); |
|
381 break; |
|
382 } |
|
383 rcvbuf -= 4096; |
|
384 } |
|
385 rcvbuf_set = 1; |
|
386 return 1; |
|
387 } |
|
388 |
|
389 |
|
390 |
|
391 /* Create the pipe used to awaken and terminate the helper processes |
|
392 * must be called with the counter mutex */ |
|
393 static u_char |
|
394 ready_helpers(void *lp) |
|
395 { |
|
396 int fds[2]; |
|
397 |
|
398 if (helper.pipe_write >= 0 |
|
399 && helper.pipe_read >= 0) |
|
400 return 1; |
|
401 |
|
402 terminate_helpers(); |
|
403 |
|
404 /* give the helper child processes an FD that will go dead |
|
405 * if the parent dies or otherwise closes the other end */ |
|
406 clean_stdio(); |
|
407 if (0 > pipe(fds)) { |
|
408 thr_error_msg(lp, "DNSBL parent helper pipe(): %s", |
|
409 ERROR_STR()); |
|
410 terminate_helpers(); |
|
411 return 0; |
|
412 } |
|
413 helper.pipe_read = fds[0]; |
|
414 helper.pipe_write = fds[1]; |
|
415 if (0 > fcntl(helper.pipe_write, F_SETFD, FD_CLOEXEC)) { |
|
416 thr_error_msg(lp, "DNSBL helper fcntl(FD_CLOEXEC): %s", |
|
417 ERROR_STR()); |
|
418 terminate_helpers(); |
|
419 return 0; |
|
420 } |
|
421 |
|
422 return 1; |
|
423 } |
|
424 |
|
425 |
|
426 |
|
427 /* Start a new helper process. |
|
428 * The counter mutex must be locked */ |
|
429 static u_char |
|
430 new_helper(DCC_EMSG emsg, DCC_CLNT_CTXT *ctxt, void *lp) |
|
431 { |
|
432 pid_t pid; |
|
433 char arg_buf[sizeof("set:")+sizeof(HELPER_PAT)+8+8+8]; |
|
434 char trace_buf[200]; |
|
435 char *bufp; |
|
436 SOCKET soc; |
|
437 int pid_inx, buf_len, i, j; |
|
438 |
|
439 /* open the socket if necessary */ |
|
440 if (helper.soc == INVALID_SOCKET) { |
|
441 if (!ready_helpers(lp)) |
|
442 return 0; |
|
443 if (!open_helper(emsg, ctxt, lp)) |
|
444 return 0; |
|
445 } |
|
446 |
|
447 reap_helpers(1); |
|
448 for (pid_inx = 0; ; ++pid_inx) { |
|
449 if (pid_inx >= helper.max_helpers) |
|
450 dcc_logbad(EX_SOFTWARE, "no free DNSBL pids[] entry"); |
|
451 if (helper.pids[pid_inx] == 0) |
|
452 break; |
|
453 } |
|
454 |
|
455 fflush(stdout); |
|
456 fflush(stderr); |
|
457 pid = fork(); |
|
458 if (pid < 0) { |
|
459 thr_error_msg(lp, "DNSBL helper fork(): %s", ERROR_STR()); |
|
460 return 0; |
|
461 } |
|
462 |
|
463 if (pid != 0) { |
|
464 /* this is the parent */ |
|
465 helper.pids[pid_inx] = pid; |
|
466 ++helper.total_helpers; |
|
467 return 1; |
|
468 } |
|
469 |
|
470 dcc_rel_priv(); /* no fun or games */ |
|
471 clean_stdio(); |
|
472 |
|
473 /* reset FD_CLOEXEC without affecting parent */ |
|
474 soc = dup(helper.soc); |
|
475 if (soc == INVALID_SOCKET) |
|
476 dcc_logbad(EX_UNAVAILABLE, "DNSBL helper soc dup(%d): %s", |
|
477 helper.soc, ERROR_STR()); |
|
478 |
|
479 snprintf(arg_buf, sizeof(arg_buf), "set:"HELPER_PAT, |
|
480 soc, helper.pipe_read, helper.total_helpers); |
|
481 helper_save_arg("-B", arg_buf); |
|
482 helper.argv[0] = dnsbl_progpath; |
|
483 buf_len = sizeof(trace_buf); |
|
484 bufp = trace_buf; |
|
485 for (i = 0; i < helper.argc && buf_len > 2; ++i) { |
|
486 j = snprintf(bufp, buf_len, "%s ", helper.argv[i]); |
|
487 buf_len -= j; |
|
488 bufp += j; |
|
489 } |
|
490 if (helper.debug >= 4) |
|
491 dcc_trace_msg("DNSBL helper exec %s", trace_buf); |
|
492 |
|
493 execv(helper.argv[0], (char * const *)helper.argv); |
|
494 /* This process should continue at helper_child() */ |
|
495 |
|
496 dcc_logbad(EX_UNAVAILABLE, "exec(%s): %s", |
|
497 trace_buf, ERROR_STR()); |
|
498 } |
|
499 |
|
500 |
|
501 |
|
502 static void NRATTRIB |
|
503 helper_exit(const char *reason) |
|
504 { |
|
505 if (helper.debug > 1) |
|
506 dcc_trace_msg("helper process on %s %s", |
|
507 dcc_su2str_err(&helper.su), reason); |
|
508 |
|
509 exit(0); |
|
510 } |
|
511 |
|
512 |
|
513 |
|
514 static u_char helper_alarm_hit; |
|
515 static void |
|
516 helper_alarm(int s UATTRIB) |
|
517 { |
|
518 helper_alarm_hit = 1; |
|
519 } |
|
520 |
|
521 |
|
522 |
|
523 /* helper processes start here via fork()/exec() in the parent */ |
|
524 void NRATTRIB |
|
525 helper_child(SOCKET soc, int fd, int total_helpers) |
|
526 { |
|
527 sigset_t sigs; |
|
528 DCC_SOCKLEN_T soc_len; |
|
529 DNSBL_REQ req; |
|
530 int req_len; |
|
531 DNSBL_RESP resp; |
|
532 DCC_SOCKU req_su; |
|
533 DCC_SOCKLEN_T su_len; |
|
534 struct timeval now; |
|
535 u_char wake_buf; |
|
536 int secs, i; |
|
537 |
|
538 /* this process inherits via exec() by dccm or dccifd odd signal |
|
539 * blocking from some pthreads implementations including FreeBSD 5.* */ |
|
540 signal(SIGHUP, SIG_IGN); |
|
541 signal(SIGINT, SIG_IGN); |
|
542 signal(SIGTERM, SIG_IGN); |
|
543 sigemptyset(&sigs); |
|
544 sigaddset(&sigs, SIGALRM); |
|
545 sigprocmask(SIG_UNBLOCK, &sigs, 0); |
|
546 |
|
547 helper_init(0); |
|
548 if (have_helpers) |
|
549 dcc_logbad(EX_SOFTWARE, "no threads for DNSBL helpers"); |
|
550 |
|
551 helper.total_helpers = total_helpers; |
|
552 |
|
553 helper.pipe_read = fd; |
|
554 helper.soc = soc; |
|
555 soc_len = sizeof(helper.su); |
|
556 if (0 > getsockname(helper.soc, &helper.su.sa, &soc_len)) |
|
557 dcc_logbad(EX_IOERR, "DNSBL helper getsockname(%d): %s", |
|
558 helper.soc, ERROR_STR()); |
|
559 |
|
560 if (helper.debug > 1) |
|
561 dcc_trace_msg("DNSBL helper process starting on %s", |
|
562 dcc_su2str_err(&helper.su)); |
|
563 |
|
564 for (;;) { |
|
565 /* Use read() and SIGALRM to watch for a wake-up byte |
|
566 * from the parent, the parent ending and closing the pipe, |
|
567 * or enough idle time to require our retirement. This |
|
568 * tactic awakens a single child for each wake-up call |
|
569 * from the parent. Using select() or poll() on the main |
|
570 * socket awakens a thundering herd of children */ |
|
571 secs = HELPER_IDLE_STOP_SECS+1; |
|
572 if (helper.total_helpers > 0) |
|
573 secs /= helper.total_helpers+1; |
|
574 if (secs < 5) |
|
575 secs = 5; |
|
576 signal(SIGALRM, helper_alarm); |
|
577 #ifdef HAVE_SIGINTERRUPT |
|
578 siginterrupt(SIGALRM, 1); |
|
579 #endif |
|
580 helper_alarm_hit = 0; |
|
581 alarm(secs); |
|
582 for (;;) { |
|
583 su_len = sizeof(req_su); |
|
584 req_len = recvfrom(helper.soc, &req, ISZ(req), 0, |
|
585 &req_su.sa, &su_len); |
|
586 |
|
587 /* sleep until awakened if no work is ready */ |
|
588 if (req_len <= 0) { |
|
589 if (req_len == 0) |
|
590 dcc_logbad(EX_IOERR, |
|
591 "DNSBL helper recvfrom()=0"); |
|
592 if (!DCC_BLOCK_ERROR()) |
|
593 dcc_logbad(EX_IOERR, |
|
594 "DNSBL helper recvfrom():" |
|
595 " %s", |
|
596 ERROR_STR()); |
|
597 if (helper_alarm_hit) |
|
598 helper_exit("idle helper exit"); |
|
599 |
|
600 i = read(helper.pipe_read, &wake_buf, 1); |
|
601 |
|
602 /* The other end of the pipe can be marked |
|
603 * non-blocking by some pthreads |
|
604 * implementations. That makes read() on this |
|
605 * end fail with EAGAIN. When that happens, |
|
606 * fall back on select() or poll(). |
|
607 * Even on such pthread implementations, |
|
608 * it rarely happens. */ |
|
609 if (i < 0 && DCC_BLOCK_ERROR()) { |
|
610 DCC_EMSG emsg; |
|
611 i = dcc_select_poll(emsg, |
|
612 helper.pipe_read, 0, |
|
613 -1); |
|
614 if (i < 0) |
|
615 dcc_logbad(EX_IOERR, |
|
616 "dnsbl HELPER select():" |
|
617 " %s", emsg); |
|
618 } |
|
619 |
|
620 /* loof for work after a wake-up call */ |
|
621 if (i > 0) |
|
622 continue; |
|
623 |
|
624 if (helper_alarm_hit) |
|
625 continue; |
|
626 if (i == 0) |
|
627 helper_exit("shutdown"); |
|
628 if (i < 0) { |
|
629 dcc_logbad(EX_OSERR, |
|
630 "DNSBL read(terminate): %s", |
|
631 ERROR_STR()); |
|
632 } |
|
633 } |
|
634 if (req_len != helper.req_len) { |
|
635 if (helper.debug) |
|
636 dcc_trace_msg("DNSBL helper" |
|
637 " recvfrom(parent %s)=%d" |
|
638 " instead of %d", |
|
639 dcc_su2str_err(&req_su), |
|
640 req_len, |
|
641 helper.req_len); |
|
642 continue; |
|
643 } |
|
644 |
|
645 /* we might get stray packets because we cannot |
|
646 * connect to a single port */ |
|
647 if (!DCC_SU_EQ(&helper.su, &helper.su)) { |
|
648 if (helper.debug) |
|
649 dcc_trace_msg("DNSBL helper" |
|
650 " request from" |
|
651 " %s instead of %s", |
|
652 dcc_su2str_err(&req_su), |
|
653 dcc_su2str_err(&helper.su)); |
|
654 continue; |
|
655 } |
|
656 |
|
657 if (req.hdr.magic != HELPER_MAGIC_REQ |
|
658 || req.hdr.version != HELPER_VERSION) { |
|
659 if (helper.debug) |
|
660 dcc_trace_msg("DNSBL helper" |
|
661 " recvfrom(parent %s)" |
|
662 " magic=%#08x", |
|
663 dcc_su2str_err(&req_su), |
|
664 req.hdr.magic); |
|
665 continue; |
|
666 } |
|
667 break; |
|
668 } |
|
669 gettimeofday(&now, 0); |
|
670 alarm(0); |
|
671 |
|
672 /* do not bother working if it is already too late to answer, |
|
673 * perhaps because a previous helper died */ |
|
674 if (tv_diff2us(&now, &req.hdr.start) >= req.hdr.avail_us) { |
|
675 if (helper.debug > 1) |
|
676 dcc_trace_msg("%s DNSBL helper" |
|
677 " already too late to answer", |
|
678 req.hdr.id); |
|
679 continue; |
|
680 } |
|
681 |
|
682 memset(&resp, 0, sizeof(resp)); |
|
683 resp.hdr.magic = HELPER_MAGIC_RESP; |
|
684 resp.hdr.version = HELPER_VERSION; |
|
685 resp.hdr.sn = req.hdr.sn; |
|
686 |
|
687 /* do the work and send an answer if we have one */ |
|
688 if (!dnsbl_work(&req, &resp)) |
|
689 continue; |
|
690 |
|
691 /* do not answer if it is too late */ |
|
692 gettimeofday(&now, 0); |
|
693 if (tv_diff2us(&now, &req.hdr.start) > (req.hdr.avail_us |
|
694 + DCC_US/2)) { |
|
695 if (helper.debug > 1) |
|
696 dcc_trace_msg("%s DNSBL helper" |
|
697 " too late to answer", |
|
698 req.hdr.id); |
|
699 continue; |
|
700 } |
|
701 |
|
702 i = sendto(helper.soc, &resp, sizeof(resp), 0, |
|
703 &req_su.sa, DCC_SU_LEN(&req_su)); |
|
704 if (i != sizeof(resp)) { |
|
705 if (i < 0) |
|
706 dcc_error_msg("%s helper sendto(%s): %s", |
|
707 req.hdr.id, |
|
708 dcc_su2str_err(&req_su), |
|
709 ERROR_STR()); |
|
710 else |
|
711 dcc_error_msg("%s helper sendto(%s)=%d", |
|
712 req.hdr.id, |
|
713 dcc_su2str_err(&req_su), i); |
|
714 } |
|
715 } |
|
716 } |
|
717 |
|
718 |
|
719 |
|
720 /* ask a helper process to do some filtering */ |
|
721 u_char /* 1=got an answer */ |
|
722 ask_helper(DCC_CLNT_CTXT *ctxt, void *log_ctxt, |
|
723 time_t avail_us, /* spend at most this much time */ |
|
724 HELPER_REQ_HDR *req, /* request sent to helper */ |
|
725 int req_len, |
|
726 HELPER_RESP_HDR *resp, /* put answer here */ |
|
727 int resp_len) |
|
728 { |
|
729 DCC_EMSG emsg; |
|
730 DCC_SOCKU send_su; |
|
731 DCC_SOCKLEN_T su_len; |
|
732 DCC_SOCKU recv_su; |
|
733 char sustr[DCC_SU2STR_SIZE]; |
|
734 u_char counted; |
|
735 u_int gen; |
|
736 struct timeval now; |
|
737 time_t us; |
|
738 int i; |
|
739 |
|
740 emsg[0] = '\0'; |
|
741 |
|
742 /* keep the lock until we have sent our request and wake-up call |
|
743 * to ensure that some other thread does not shut down all of |
|
744 * the helpers. */ |
|
745 helper_lock(); |
|
746 gettimeofday(&now, 0); |
|
747 |
|
748 /* If it has been a long time since we used a helper, then the last |
|
749 * of them might be about to die of boredom. Fix that race by |
|
750 * restarting all of them. |
|
751 * Most dying helpers should be reaped by the totals timer thread. */ |
|
752 if (helper.idle_helpers > 0 |
|
753 && DCC_IS_TIME(now.tv_sec, helper.idle_restart, |
|
754 HELPER_IDLE_RESTART)) { |
|
755 reap_helpers(1); |
|
756 if (helper.idle_helpers > 0) |
|
757 terminate_helpers(); |
|
758 gettimeofday(&now, 0); |
|
759 } |
|
760 helper.idle_restart = now.tv_sec + HELPER_IDLE_RESTART; |
|
761 |
|
762 if (helper.idle_helpers - helper.slow_helpers > 0) { |
|
763 /* avoid taking the last idle helper because there are |
|
764 * usually fewer truly idle helpers than we think because |
|
765 * we don't always wait for them to finish */ |
|
766 if (helper.idle_helpers > 2 |
|
767 || helper.total_helpers >= helper.max_helpers |
|
768 || !new_helper(emsg, ctxt, log_ctxt)) |
|
769 --helper.idle_helpers; |
|
770 counted = 1; |
|
771 } else if (helper.total_helpers >= helper.max_helpers) { |
|
772 if (helper.debug > 0) |
|
773 thr_trace_msg(log_ctxt, "%s DNSBL %d idle, %d slow, and" |
|
774 " %d total DNSBL helpers", req->id, |
|
775 helper.idle_helpers, helper.slow_helpers, |
|
776 helper.total_helpers); |
|
777 counted = 0; |
|
778 } else { |
|
779 if (!new_helper(emsg, ctxt, log_ctxt)) { |
|
780 helper_unlock(); |
|
781 return 0; |
|
782 } |
|
783 counted = 1; |
|
784 } |
|
785 |
|
786 /* The resolution of the BIND timeout limits is seconds, so even on |
|
787 * systems where the timeout limits work, the helper might delay |
|
788 * a second or two. To keep the count of idle helpers as accurate |
|
789 * as possible, always wait at least 1 second for an answer |
|
790 * and 2 seconds for an answer to reach the parent. */ |
|
791 req->avail_us = avail_us; |
|
792 avail_us += DCC_US; |
|
793 req->start = now; |
|
794 req->magic = HELPER_MAGIC_REQ; |
|
795 req->version = HELPER_VERSION; |
|
796 |
|
797 req->sn = ++helper.sn; |
|
798 gen = helper.gen; |
|
799 |
|
800 /* snapshot the address in case another thread restarts the helpers */ |
|
801 send_su = helper.su; |
|
802 |
|
803 /* Use sendto() if the socket is not already conencted. |
|
804 * If it is already connected, then on many systems other than Linux, |
|
805 * it is possible and presumably cheap to reconnected it, so do so. */ |
|
806 if (!helper_soc_open(emsg, ctxt)) { |
|
807 thr_trace_msg(log_ctxt, "DNSBL reopen(): %s", emsg); |
|
808 help_finish(gen, 0, counted, 1); |
|
809 helper_unlock(); |
|
810 return 0; |
|
811 } |
|
812 if (ctxt->conn_su.sa.sa_family != AF_UNSPEC |
|
813 && memcmp(&ctxt->conn_su, &send_su, sizeof(ctxt->conn_su)) |
|
814 && !helper_soc_connect(emsg, ctxt, &send_su)) { |
|
815 thr_trace_msg(log_ctxt, "DNSBL soc_connect(): %s", emsg); |
|
816 help_finish(gen, 0, counted, 1); |
|
817 helper_unlock(); |
|
818 return 0; |
|
819 } |
|
820 if (ctxt->conn_su.sa.sa_family == AF_UNSPEC) { |
|
821 i = sendto(ctxt->soc, req, req_len, 0, |
|
822 &send_su.sa, DCC_SU_LEN(&send_su)); |
|
823 } else { |
|
824 i = send(ctxt->soc, req, req_len, 0); |
|
825 } |
|
826 if (i != req_len) { |
|
827 if (i < 0) |
|
828 thr_trace_msg(log_ctxt, "%s DNSBL sendto(%s): %s", |
|
829 req->id, dcc_su2str(sustr, sizeof(sustr), |
|
830 &send_su), |
|
831 ERROR_STR()); |
|
832 else |
|
833 thr_trace_msg(log_ctxt, "%s DNSBL sendto(%s)=%d", |
|
834 req->id, dcc_su2str(sustr, sizeof(sustr), |
|
835 &send_su), |
|
836 i); |
|
837 help_finish(gen, 0, counted, 1); |
|
838 helper_unlock(); |
|
839 return 0; |
|
840 } |
|
841 |
|
842 /* awaken a helper */ |
|
843 i = write(helper.pipe_write, "x", 1); |
|
844 if (i != 1) { |
|
845 if (i < 0) |
|
846 thr_trace_msg(log_ctxt, |
|
847 "%s DNSBL write(pipe_write=%d): %s", |
|
848 req->id, helper.pipe_write, ERROR_STR()); |
|
849 else |
|
850 thr_trace_msg(log_ctxt, |
|
851 "%s DNSBL write(pipe_write)=%d", |
|
852 req->id, i); |
|
853 help_finish(gen, 0, counted, 1); |
|
854 helper_unlock(); |
|
855 return 0; |
|
856 } |
|
857 helper_unlock(); |
|
858 |
|
859 for (;;) { |
|
860 us = avail_us - tv_diff2us(&now, &req->start); |
|
861 if (us < 0) |
|
862 us = 0; |
|
863 i = dcc_select_poll(0, ctxt->soc, 1, us); |
|
864 if (i < 0) { |
|
865 thr_error_msg(log_ctxt, "%s DNSBL select_poll: %s", |
|
866 req->id, ERROR_STR()); |
|
867 help_finish(gen, 0, counted, 0); |
|
868 return 0; |
|
869 } |
|
870 gettimeofday(&now, 0); |
|
871 |
|
872 if (i == 0) { |
|
873 if (helper.debug) |
|
874 thr_trace_msg(log_ctxt, |
|
875 "%s DNSBL no helper answer after" |
|
876 " %1.f sec", req->id, |
|
877 tv_diff2us(&now, &req->start) |
|
878 / (DCC_US*1.0)); |
|
879 helper_lock(); |
|
880 if (helper.slow_helpers<=helper.total_helpers/MAX_SLOW) |
|
881 ++helper.slow_helpers; |
|
882 help_finish(gen, 0, counted, 1); |
|
883 helper_unlock(); |
|
884 return 0; |
|
885 } |
|
886 |
|
887 |
|
888 su_len = sizeof(recv_su); |
|
889 i = recvfrom(ctxt->soc, resp, resp_len, |
|
890 0, &recv_su.sa, &su_len); |
|
891 /* because we are using UDP, we might get stray packets */ |
|
892 if (i != resp_len) { |
|
893 if (i < 0) { |
|
894 thr_trace_msg(log_ctxt, |
|
895 "%s DNSBL recvfrom(): %s", |
|
896 req->id, ERROR_STR()); |
|
897 if (DCC_BLOCK_ERROR()) |
|
898 continue; |
|
899 help_finish(gen, 0, counted, 0); |
|
900 return 0; |
|
901 } |
|
902 if (helper.debug > 1) |
|
903 thr_trace_msg(log_ctxt, |
|
904 "%s DNSBL recvfrom(%s)=%d", |
|
905 req->id, |
|
906 dcc_su2str_err(&recv_su), i); |
|
907 continue; |
|
908 } |
|
909 if (!DCC_SU_EQ(&send_su, &recv_su)) { |
|
910 if (helper.debug != 0) |
|
911 thr_trace_msg(log_ctxt, |
|
912 "%s DNSBL recvfrom(%s)" |
|
913 " instead of %s", |
|
914 req->id, |
|
915 dcc_su2str_err(&recv_su), |
|
916 dcc_su2str_err(&send_su)); |
|
917 continue; |
|
918 } |
|
919 if (resp->magic != HELPER_MAGIC_RESP |
|
920 || resp->version != HELPER_VERSION |
|
921 || resp->sn != req->sn) { |
|
922 if (helper.debug >1 ) |
|
923 thr_trace_msg(log_ctxt, |
|
924 "%s DNSBL recvfrom(%s)" |
|
925 " magic=%#08x sn=%d", |
|
926 req->id, dcc_su2str_err(&recv_su), |
|
927 resp->magic, resp->sn); |
|
928 continue; |
|
929 } |
|
930 |
|
931 help_finish(gen, 1, counted, 0); |
|
932 return 1; |
|
933 } |
|
934 } |
|
935 #endif /* HAVE_HELPERS */ |