Miracle of miracles... it seems to work
[freeradius.git] / src / main / event.c
1 /*
2  * event.c      Server event handling
3  *
4  * Version:     $Id$
5  *
6  *   This program is free software; you can redistribute it and/or modify
7  *   it under the terms of the GNU General Public License as published by
8  *   the Free Software Foundation; either version 2 of the License, or
9  *   (at your option) any later version.
10  *
11  *   This program is distributed in the hope that it will be useful,
12  *   but WITHOUT ANY WARRANTY; without even the implied warranty of
13  *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14  *   GNU General Public License for more details.
15  *
16  *   You should have received a copy of the GNU General Public License
17  *   along with this program; if not, write to the Free Software
18  *   Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
19  *
20  * Copyright 2007  The FreeRADIUS server project
21  * Copyright 2007  Alan DeKok <aland@deployingradius.com>
22  */
23
24 #include <freeradius-devel/ident.h>
25 RCSID("$Id$")
26
27 #include <freeradius-devel/radiusd.h>
28 #include <freeradius-devel/modules.h>
29 #include <freeradius-devel/event.h>
30 #include <freeradius-devel/detail.h>
31
32 #include <freeradius-devel/rad_assert.h>
33
34 #include <signal.h>
35 #include <fcntl.h>
36
37 #ifdef HAVE_SYS_WAIT_H
38 #       include <sys/wait.h>
39 #endif
40
41 #define USEC (1000000)
42
/*
 *	Variables declared "extern" here; their definitions are not in
 *	this part of the file.
 */
43 extern pid_t radius_pid;
44 extern int dont_fork;
45 extern int check_config;
46 extern char *debug_condition;
47
48 /*
 *      Ridiculous amounts of local state.
 *
 *      el                   event list passed to fr_event_insert(),
 *                           fr_event_delete() and fr_event_now().
 *      pl                   packet list that incoming requests are
 *                           yanked from in remove_from_request_hash().
 *      request_num_counter  supplies request->number for the status
 *                           checks built in ping_home_server().
 *      now                  scratch "current time", refreshed by
 *                           fr_event_now() / gettimeofday() before use.
 *      fr_start_time        subtracted from request->timestamp when
 *                           printing "timestamp +N" debug messages.
 *                           Note that it is NOT static.
 *      have_children        gates the mutex macros below, and the
 *                           wait_a_bit() call in proxy_fallback_handler().
 *      just_started         not referenced in the code visible here.
 */
51 static fr_event_list_t  *el = NULL;
52 static fr_packet_list_t *pl = NULL;
53 static int                      request_num_counter = 0;
54 static struct timeval           now;
55 time_t                          fr_start_time;
56 static int                      have_children;
57 static int                      just_started = TRUE;
58
/*
 *	WITH_SELF_PIPE is defined only when pthreads are available and
 *	the build is not MinGW.
 */
59 #ifndef __MINGW32__
60 #ifdef HAVE_PTHREAD_H
61 #define WITH_SELF_PIPE (1)
62 #endif
63 #endif
64
/*
 *	Two descriptors for the self pipe.  They are not used in the
 *	code visible here; presumably they are the read and write ends
 *	-- TODO confirm against the code that opens them.
 */
65 #ifdef WITH_SELF_PIPE
66 static int self_pipe[2];
67 #endif
68
69 #ifdef HAVE_PTHREAD_H
70 #ifdef WITH_PROXY
71 static pthread_mutex_t  proxy_mutex;
72 static rad_listen_t *proxy_listener_list = NULL;
73 static int proxy_no_new_sockets = FALSE;
74 #endif
75
76 #define PTHREAD_MUTEX_LOCK if (have_children) pthread_mutex_lock
77 #define PTHREAD_MUTEX_UNLOCK if (have_children) pthread_mutex_unlock
78
79 static pthread_t NO_SUCH_CHILD_PID;
80 #else
81 /*
82  *      This is easier than ifdef's throughout the code.
83  */
84 #define PTHREAD_MUTEX_LOCK(_x)
85 #define PTHREAD_MUTEX_UNLOCK(_x)
86 int thread_pool_addrequest(REQUEST *request, RAD_REQUEST_FUNP fun)
87 {
88         radius_handle_request(request, fun);
89         return 1;
90 }
91 #endif
92
/*
 *	We need mutexes around the event FD list *only* in certain
 *	cases: pthreads are available, and proxying or TCP is built in.
 *
 *	The real macros lock only when "have_children" is set.  They
 *	are wrapped in do { } while (0) so that each one is a single
 *	statement and cannot capture a caller's "else".
 */
#if defined (HAVE_PTHREAD_H) && (defined(WITH_PROXY) || defined(WITH_TCP))
static pthread_mutex_t	fd_mutex;
#define FD_MUTEX_LOCK(_x) do { if (have_children) pthread_mutex_lock(_x); } while (0)
#define FD_MUTEX_UNLOCK(_x) do { if (have_children) pthread_mutex_unlock(_x); } while (0)
#else
/*
 *	This is easier than ifdef's throughout the code.
 */
#define FD_MUTEX_LOCK(_x)
#define FD_MUTEX_UNLOCK(_x)
#endif
108
109
/*
 *	Schedule _function to run with _ctx at (_ctx)->when, storing the
 *	event handle in (_ctx)->ev.  Failure to insert is fatal.
 *
 *	Wrapped in do { } while (0) so the macro is one statement, and
 *	is safe inside an unbraced if / else.
 */
#define INSERT_EVENT(_function, _ctx) \
	do { \
		if (!fr_event_insert(el, _function, _ctx, &((_ctx)->when), &((_ctx)->ev))) { \
			_rad_panic(__FILE__, __LINE__, "Failed to insert event"); \
		} \
	} while (0)
111
/*
 *	Proxy support: the list of outstanding proxied packets, and
 *	forward declarations for helpers used before their definition.
 *	Without WITH_PROXY, remove_from_proxy_hash() expands to nothing.
 */
112 #ifdef WITH_PROXY
113 static fr_packet_list_t *proxy_list = NULL;
114 static void remove_from_proxy_hash(REQUEST *request);
115
116 static void check_for_zombie_home_server(REQUEST *request);
117 #else
118 #define remove_from_proxy_hash(foo)
119 #endif
120
/*
 *	Forward declarations; the definitions are not in the part of
 *	the file visible here.
 */
121 static void request_post_handler(REQUEST *request);
122 static void wait_a_bit(void *ctx);
123 static void event_socket_handler(fr_event_list_t *xel, UNUSED int fd, void *ctx);
124 #ifdef WITH_DETAIL
125 static void event_poll_detail(void *ctx);
126 #endif
127
128 static void NEVER_RETURNS _rad_panic(const char *file, unsigned int line,
129                                     const char *msg)
130 {
131         radlog(L_ERR, "[%s:%d] %s", file, line, msg);
132         _exit(1);
133 }
134
135 #define rad_panic(x) _rad_panic(__FILE__, __LINE__, x)
136
137
/*
 *	Add a delay, given in microseconds, to a timeval, keeping the
 *	result normalised (tv_usec strictly less than USEC).
 *
 *	tv		timeval to update in place
 *	usec_delay	microseconds to add
 *
 *	Both comparisons are ">=" so that a value of exactly one second
 *	is carried into tv_sec instead of being left in tv_usec.
 */
static void tv_add(struct timeval *tv, int usec_delay)
{
	/* Move whole seconds of the delay straight into tv_sec. */
	if (usec_delay >= USEC) {
		tv->tv_sec += usec_delay / USEC;
		usec_delay %= USEC;
	}
	tv->tv_usec += usec_delay;

	/* Carry any overflow of the microsecond field. */
	if (tv->tv_usec >= USEC) {
		tv->tv_sec += tv->tv_usec / USEC;
		tv->tv_usec %= USEC;
	}
}
151
152 static void remove_from_request_hash(REQUEST *request)
153 {
154         if (!request->in_request_hash) return;
155
156         fr_packet_list_yank(pl, request->packet);
157         request->in_request_hash = FALSE;
158
159         request_stats_final(request);
160
161 #ifdef WITH_TCP
162         request->listener->count--;
163 #endif
164 }
165
166 static void ev_request_free(REQUEST **prequest)
167 {
168         REQUEST *request;
169         
170         if (!prequest || !*prequest) return;
171
172         request = *prequest;
173
174 #ifdef WITH_COA
175         if (request->coa) {
176                 /*
177                  *      Divorce the child from the parent first,
178                  *      then clean up the child.
179                  */
180                 request->coa->parent = NULL;
181                 ev_request_free(&request->coa);
182         }
183
184         /*
185          *      Divorce the parent from the child, and leave the
186          *      parent still alive.
187          */
188         if (request->parent && (request->parent->coa == request)) {
189                 request->parent->coa = NULL;
190         }
191 #endif
192
193         if (request->ev) fr_event_delete(el, &request->ev);
194 #ifdef WITH_PROXY
195         if (request->in_proxy_hash) remove_from_proxy_hash(request);
196 #endif
197         if (request->in_request_hash) remove_from_request_hash(request);
198
199         request_free(prequest);
200 }
201
202 #ifdef WITH_PROXY
203 static REQUEST *lookup_in_proxy_hash(RADIUS_PACKET *reply)
204 {
205         RADIUS_PACKET **proxy_p;
206         REQUEST *request;
207
208         PTHREAD_MUTEX_LOCK(&proxy_mutex);
209         proxy_p = fr_packet_list_find_byreply(proxy_list, reply);
210
211         if (!proxy_p) {
212                 PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
213                 return NULL;
214         }
215
216         request = fr_packet2myptr(REQUEST, proxy, proxy_p);
217         request->num_proxied_responses++; /* needs to be protected by lock */
218
219         PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
220
221         return request;
222 }
223
224
225 static void remove_from_proxy_hash(REQUEST *request)
226 {
227         /*
228          *      Check this without grabbing the mutex because it's a
229          *      lot faster that way.
230          */
231         if (!request->in_proxy_hash) return;
232
233         /*
234          *      The "not in hash" flag is definitive.  However, if the
235          *      flag says that it IS in the hash, there might still be
236          *      a race condition where it isn't.
237          */
238         PTHREAD_MUTEX_LOCK(&proxy_mutex);
239
240         if (!request->in_proxy_hash) {
241                 PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
242                 return;
243         }
244
245         fr_packet_list_yank(proxy_list, request->proxy);
246         fr_packet_list_id_free(proxy_list, request->proxy);
247
248         /*
249          *      On the FIRST reply, decrement the count of outstanding
250          *      requests.  Note that this is NOT the count of sent
251          *      packets, but whether or not the home server has
252          *      responded at all.
253          */
254         if (!request->proxy_reply &&
255             request->home_server &&
256             request->home_server->currently_outstanding) {
257                 request->home_server->currently_outstanding--;
258         }
259
260 #ifdef WITH_TCP
261         request->proxy_listener->count--;
262         request->proxy_listener = NULL;
263 #endif
264
265         /*
266          *      Got from YES in hash, to NO, not in hash while we hold
267          *      the mutex.  This guarantees that when another thread
268          *      grabs the mutex, the "not in hash" flag is correct.
269          */
270         request->in_proxy_hash = FALSE;
271
272         PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
273 }
274 #endif  /* WITH_PROXY */
275
276 #ifdef WITH_TCP
277 static int remove_all_requests(void *ctx, void *data)
278 {
279         rad_listen_t *this = ctx;
280         RADIUS_PACKET **packet_p = data;
281         REQUEST *request;
282         
283         request = fr_packet2myptr(REQUEST, packet, packet_p);
284         if (request->packet->sockfd != this->fd) return 0;
285
286         switch (request->child_state) {
287         case REQUEST_RUNNING:
288                 rad_assert(request->ev != NULL); /* or it's lost forever */
289         case REQUEST_QUEUED:
290                 request->master_state = REQUEST_STOP_PROCESSING;
291                 return 0;
292
293                 /*
294                  *      Waiting for a reply.  There's no point in
295                  *      doing anything else.  We remove it from the
296                  *      request hash so that we can close the upstream
297                  *      socket.
298                  */
299         case REQUEST_PROXIED:
300                 remove_from_request_hash(request);
301                 request->child_state = REQUEST_DONE;
302                 return 0;
303
304         case REQUEST_REJECT_DELAY:
305         case REQUEST_CLEANUP_DELAY:
306         case REQUEST_DONE:
307                 ev_request_free(&request);
308                 break;
309         }
310
311         return 0;
312 }
313
314 #ifdef WITH_PROXY
315 static int remove_all_proxied_requests(void *ctx, void *data)
316 {
317         rad_listen_t *this = ctx;
318         RADIUS_PACKET **proxy_p = data;
319         REQUEST *request;
320         
321         request = fr_packet2myptr(REQUEST, proxy, proxy_p);
322         if (request->proxy->sockfd != this->fd) return 0;
323
324         switch (request->child_state) {
325         case REQUEST_RUNNING:
326                 rad_assert(request->ev != NULL); /* or it's lost forever */
327         case REQUEST_QUEUED:
328                 request->master_state = REQUEST_STOP_PROCESSING;
329                 return 0;
330
331                 /*
332                  *      Eventually we will discover that there is no
333                  *      response to the proxied request.
334                  */
335         case REQUEST_PROXIED:
336                 break;
337
338                 /*
339                  *      Keep it in the cache for duplicate detection.
340                  */
341         case REQUEST_REJECT_DELAY:
342         case REQUEST_CLEANUP_DELAY:
343         case REQUEST_DONE:
344                 break;
345         }
346
347         remove_from_proxy_hash(request);
348         return 0;
349 }
350 #endif  /* WITH_PROXY */
351 #endif  /* WITH_TCP */
352
353
354 #ifdef WITH_PROXY
355 static int insert_into_proxy_hash(REQUEST *request)
356 {
357         char buf[128];
358         int rcode, tries;
359         void *proxy_listener;
360
361         rad_assert(request->proxy != NULL);
362         rad_assert(proxy_list != NULL);
363
364         tries = 1;
365 retry:
366         PTHREAD_MUTEX_LOCK(&proxy_mutex);
367         rcode = fr_packet_list_id_alloc(proxy_list,
368                                         request->home_server->proto,
369                                         request->proxy, &proxy_listener);
370         request->num_proxied_requests = 1;
371         request->num_proxied_responses = 0;
372         PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
373         
374         if (!rcode) {
375                 if (proxy_no_new_sockets) return 0;
376
377                 /*
378                  *      Also locks the proxy mutex, so we have to call
379                  *      it with the mutex unlocked.  Some systems
380                  *      don't support recursive mutexes.
381                  */
382                 if (!proxy_new_listener(request->home_server, 0)) {
383                         radlog(L_ERR, "Failed to create a new socket for proxying requests.");
384                         return 0;
385                 }
386                 request->proxy->src_port = 0; /* Use any new socket */
387
388                 tries++;
389                 if (tries > 2) {
390                         RDEBUG2("ERROR: Failed allocating Id for new socket when proxying requests.");
391                         return 0;
392                 }
393                 
394                 goto retry;
395         }
396
397         request->proxy_listener = proxy_listener;
398
399         PTHREAD_MUTEX_LOCK(&proxy_mutex);
400         if (!fr_packet_list_insert(proxy_list, &request->proxy)) {
401                 fr_packet_list_id_free(proxy_list, request->proxy);
402                 PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
403                 radlog(L_PROXY, "Failed to insert entry into proxy list");
404                 return 0;
405         }
406
407         request->in_proxy_hash = TRUE;
408
409         /*
410          *      Keep track of maximum outstanding requests to a
411          *      particular home server.  'max_outstanding' is
412          *      enforced in home_server_ldb(), in realms.c.
413          */
414         if (request->home_server) {
415                 request->home_server->currently_outstanding++;
416         }
417
418 #ifdef WITH_TCP
419         request->proxy_listener->count++;
420 #endif
421
422         PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
423
424         RDEBUG3(" proxy: allocating destination %s port %d - Id %d",
425                inet_ntop(request->proxy->dst_ipaddr.af,
426                          &request->proxy->dst_ipaddr.ipaddr, buf, sizeof(buf)),
427                request->proxy->dst_port,
428                request->proxy->id);
429
430         return 1;
431 }
432
433
434 /*
435  *      Called as BOTH an event, and in-line from other functions.
436  */
437 static void wait_for_proxy_id_to_expire(void *ctx)
438 {
439         REQUEST *request = ctx;
440
441         rad_assert(request->magic == REQUEST_MAGIC);
442         rad_assert(request->proxy != NULL);
443
444         fr_event_now(el, &now);
445         request->when = request->proxy_when;
446
447 #ifdef WITH_COA
448         if (((request->proxy->code == PW_COA_REQUEST) ||
449              (request->proxy->code == PW_DISCONNECT_REQUEST)) &&
450             (request->packet->code != request->proxy->code)) {
451                 request->when.tv_sec += request->home_server->coa_mrd;
452         } else
453 #endif
454         request->when.tv_sec += request->home_server->response_window;
455
456         if ((request->num_proxied_requests == request->num_proxied_responses) ||
457 #ifdef WITH_TCP
458             (request->home_server->proto == IPPROTO_TCP) ||
459 #endif
460             timercmp(&now, &request->when, >)) {
461                 if (request->packet) {
462                         RDEBUG2("Cleaning up request packet ID %d with timestamp +%d",
463                                request->packet->id,
464                                (unsigned int) (request->timestamp - fr_start_time));
465                 } else {
466                         RDEBUG2("Cleaning up request with timestamp +%d",
467                                (unsigned int) (request->timestamp - fr_start_time));
468                 }
469
470                 ev_request_free(&request);
471                 return;
472         }
473
474         INSERT_EVENT(wait_for_proxy_id_to_expire, request);
475 }
476 #endif
477
478 #ifdef HAVE_PTHREAD_H
479 static void wait_for_child_to_die(void *ctx)
480 {
481         REQUEST *request = ctx;
482
483         rad_assert(request->magic == REQUEST_MAGIC);
484
485         /*
486          *      If it's still queued (waiting for a thread to pick it
487          *      up) OR, it's running AND there's still a child thread
488          *      handling it, THEN delay some more.
489          */
490         if ((request->child_state == REQUEST_QUEUED) ||
491             ((request->child_state == REQUEST_RUNNING) &&
492              (pthread_equal(request->child_pid, NO_SUCH_CHILD_PID) == 0))) {
493
494                 /*
495                  *      Cap delay at five minutes.
496                  */
497                 if (request->delay < (USEC * 60 * 5)) {
498                         request->delay += (request->delay >> 1);
499                         radlog_request(L_INFO, 0, request, "WARNING: Child is hung in component %s module %s.",
500                                request->component, request->module);
501                 } else {
502                         RDEBUG2("Child is still stuck");
503                 }
504                 tv_add(&request->when, request->delay);
505
506                 INSERT_EVENT(wait_for_child_to_die, request);
507                 return;
508         }
509
510         RDEBUG2("Child is finally responsive");
511         remove_from_request_hash(request);
512
513 #ifdef WITH_PROXY
514         if (request->proxy) {
515                 wait_for_proxy_id_to_expire(request);
516                 return;
517         }
518 #endif
519
520         ev_request_free(&request);
521 }
522 #endif
523
524 static void cleanup_delay(void *ctx)
525 {
526         REQUEST *request = ctx;
527
528         rad_assert(request->magic == REQUEST_MAGIC);
529         rad_assert((request->child_state == REQUEST_CLEANUP_DELAY) ||
530                    (request->child_state == REQUEST_DONE));
531
532         remove_from_request_hash(request);
533
534 #ifdef WITH_PROXY
535         if (request->proxy && request->in_proxy_hash) {
536                 wait_for_proxy_id_to_expire(request);
537                 return;
538         }
539 #endif
540
541         RDEBUG2("Cleaning up request packet ID %d with timestamp +%d",
542                 request->packet->id,
543                (unsigned int) (request->timestamp - fr_start_time));
544
545         ev_request_free(&request);
546 }
547
548
/*
 *	In daemon mode, AND this request has debug flags set.
 *
 *	Calls debug_packet(_req, _pkt, _dir) only when the global
 *	debug_flag is off and the request has both "options" and a
 *	"radlog" function.
 *
 *	The macro tests its own first argument instead of whatever
 *	variable named "request" is in the caller's scope.  It is
 *	wrapped in do { } while (0) so that it is a single statement
 *	and cannot capture a caller's "else".
 */
#define DEBUG_PACKET(_req, _pkt, _dir) \
	do { \
		if (!debug_flag && (_req)->options && (_req)->radlog) { \
			debug_packet(_req, _pkt, _dir); \
		} \
	} while (0)
553
554 static void debug_packet(REQUEST *request, RADIUS_PACKET *packet, int direction)
555 {
556         VALUE_PAIR *vp;
557         char buffer[1024];
558         const char *received, *from;
559         const fr_ipaddr_t *ip;
560         int port;
561
562         if (!packet) return;
563
564         rad_assert(request->radlog != NULL);
565
566         if (direction == 0) {
567                 received = "Received";
568                 from = "from";  /* what else? */
569                 ip = &packet->src_ipaddr;
570                 port = packet->src_port;
571
572         } else {
573                 received = "Sending";
574                 from = "to";    /* hah! */
575                 ip = &packet->dst_ipaddr;
576                 port = packet->dst_port;
577         }
578         
579         /*
580          *      Client-specific debugging re-prints the input
581          *      packet into the client log.
582          *
583          *      This really belongs in a utility library
584          */
585         if ((packet->code > 0) && (packet->code < FR_MAX_PACKET_CODE)) {
586                 RDEBUG("%s %s packet %s host %s port %d, id=%d, length=%d",
587                        received, fr_packet_codes[packet->code], from,
588                        inet_ntop(ip->af, &ip->ipaddr, buffer, sizeof(buffer)),
589                        port, packet->id, packet->data_len);
590         } else {
591                 RDEBUG("%s packet %s host %s port %d code=%d, id=%d, length=%d",
592                        received, from,
593                        inet_ntop(ip->af, &ip->ipaddr, buffer, sizeof(buffer)),
594                        port,
595                        packet->code, packet->id, packet->data_len);
596         }
597
598         for (vp = packet->vps; vp != NULL; vp = vp->next) {
599                 vp_prints(buffer, sizeof(buffer), vp);
600                 request->radlog(L_DBG, 0, request, "\t%s", buffer);
601         }
602 }
603
604 static void reject_delay(void *ctx)
605 {
606         REQUEST *request = ctx;
607
608         rad_assert(request->magic == REQUEST_MAGIC);
609         rad_assert(request->child_state == REQUEST_REJECT_DELAY);
610
611         RDEBUG2("Sending delayed reject");
612
613         DEBUG_PACKET(request, request->reply, 1);
614
615         request->listener->send(request->listener, request);
616
617         request->when.tv_sec += request->root->cleanup_delay;
618         request->child_state = REQUEST_CLEANUP_DELAY;
619
620         INSERT_EVENT(cleanup_delay, request);
621 }
622
623
624 #ifdef WITH_PROXY
625 void revive_home_server(void *ctx)
626 {
627         home_server *home = ctx;
628         char buffer[128];
629
630 #ifdef WITH_TCP
631         rad_assert(home->proto != IPPROTO_TCP);
632 #endif
633
634         home->state = HOME_STATE_ALIVE;
635         home->currently_outstanding = 0;
636         home->revive_time = now;
637
638         /*
639          *      Delete any outstanding events.
640          */
641         if (home->ev) fr_event_delete(el, &home->ev);
642
643         radlog(L_PROXY, "Marking home server %s port %d alive again... we have no idea if it really is alive or not.",
644                inet_ntop(home->ipaddr.af, &home->ipaddr.ipaddr,
645                          buffer, sizeof(buffer)),
646                home->port);
647
648 }
649
650
651 static void no_response_to_ping(void *ctx)
652 {
653         REQUEST *request = ctx;
654         home_server *home;
655         char buffer[128];
656
657         rad_assert(request->home_server != NULL);
658
659         home = request->home_server;
660 #ifdef WITH_TCP
661         rad_assert(home->proto != IPPROTO_TCP);
662 #endif
663
664         home->num_received_pings = 0;
665
666         radlog(L_ERR, "No response to status check %d for home server %s port %d",
667                request->number,
668                inet_ntop(request->proxy->dst_ipaddr.af,
669                          &request->proxy->dst_ipaddr.ipaddr,
670                          buffer, sizeof(buffer)),
671                request->proxy->dst_port);
672
673         check_for_zombie_home_server(request);
674
675         wait_for_proxy_id_to_expire(request);
676 }
677
678
679 /*
680  *      Note that we don't care what the value of the code field is.
681  *      If the response has a valid (src ip/port, dst ip/port), id,
682  *      and correctly signed Message-Authenticator, that's good
683  *      enough.
684  */
685 static void received_response_to_ping(REQUEST *request)
686 {
687         home_server *home;
688         char buffer[128];
689
690         rad_assert(request->home_server != NULL);
691
692         home = request->home_server;
693 #ifdef WITH_TCP
694         rad_assert(home->proto != IPPROTO_TCP);
695 #endif
696
697         home->num_received_pings++;
698
699         radlog(L_PROXY, "Received response to status check %d (%d in current sequence)",
700                request->number, home->num_received_pings);
701
702         /*
703          *      Remove the request from any hashes
704          */
705         fr_event_delete(el, &request->ev);
706         remove_from_proxy_hash(request);
707         rad_assert(request->in_request_hash == FALSE);
708
709         /*
710          *      The control socket may have marked the home server as
711          *      alive.  OR, it may have suddenly started responding to
712          *      requests again.  If so, don't re-do the "make alive"
713          *      work.
714          */
715         if (home->state == HOME_STATE_ALIVE) return;
716
717         /*
718          *      We haven't received enough ping responses to mark it
719          *      "alive".  Wait a bit.
720          */
721         if (home->num_received_pings < home->num_pings_to_alive) {
722                 return;
723         }
724
725         home->state = HOME_STATE_ALIVE;
726         home->currently_outstanding = 0;
727         home->revive_time = now;
728
729         if (!fr_event_delete(el, &home->ev)) {
730                 RDEBUG2("Hmm... no event for home server.  Oh well.");
731         }
732
733         radlog(L_PROXY, "Marking home server %s port %d alive",
734                inet_ntop(request->proxy->dst_ipaddr.af,
735                          &request->proxy->dst_ipaddr.ipaddr,
736                          buffer, sizeof(buffer)),
737                request->proxy->dst_port);
738 }
739
740
741 /*
742  *      Called from start of zombie period, OR after control socket
743  *      marks the home server dead.
744  */
745 static void ping_home_server(void *ctx)
746 {
747         uint32_t jitter;
748         home_server *home = ctx;
749         REQUEST *request;
750         VALUE_PAIR *vp;
751
752 #ifdef WITH_TCP
753         rad_assert(home->proto != IPPROTO_TCP);
754 #endif
755
756         if ((home->state == HOME_STATE_ALIVE) ||
757             (home->ping_check == HOME_PING_CHECK_NONE) ||
758             (home->ev != NULL)) {
759                 return;
760         }
761
762         request = request_alloc();
763         request->number = request_num_counter++;
764
765         request->proxy = rad_alloc(1);
766         rad_assert(request->proxy != NULL);
767
768         fr_event_now(el, &request->when);
769         home->when = request->when;
770
771         if (home->ping_check == HOME_PING_CHECK_STATUS_SERVER) {
772                 request->proxy->code = PW_STATUS_SERVER;
773
774                 radius_pairmake(request, &request->proxy->vps,
775                                 "Message-Authenticator", "0x00", T_OP_SET);
776
777         } else if (home->type == HOME_TYPE_AUTH) {
778                 request->proxy->code = PW_AUTHENTICATION_REQUEST;
779
780                 radius_pairmake(request, &request->proxy->vps,
781                                 "User-Name", home->ping_user_name, T_OP_SET);
782                 radius_pairmake(request, &request->proxy->vps,
783                                 "User-Password", home->ping_user_password, T_OP_SET);
784                 radius_pairmake(request, &request->proxy->vps,
785                                 "Service-Type", "Authenticate-Only", T_OP_SET);
786                 radius_pairmake(request, &request->proxy->vps,
787                                 "Message-Authenticator", "0x00", T_OP_SET);
788
789         } else {
790 #ifdef WITH_ACCOUNTING
791                 request->proxy->code = PW_ACCOUNTING_REQUEST;
792                 
793                 radius_pairmake(request, &request->proxy->vps,
794                                 "User-Name", home->ping_user_name, T_OP_SET);
795                 radius_pairmake(request, &request->proxy->vps,
796                                 "Acct-Status-Type", "Stop", T_OP_SET);
797                 radius_pairmake(request, &request->proxy->vps,
798                                 "Acct-Session-Id", "00000000", T_OP_SET);
799                 vp = radius_pairmake(request, &request->proxy->vps,
800                                      "Event-Timestamp", "0", T_OP_SET);
801                 vp->vp_date = now.tv_sec;
802 #else
803                 rad_assert("Internal sanity check failed");
804 #endif
805         }
806
807         radius_pairmake(request, &request->proxy->vps,
808                         "NAS-Identifier", "Status Check. Are you alive?",
809                         T_OP_SET);
810
811         request->proxy->dst_ipaddr = home->ipaddr;
812         request->proxy->dst_port = home->port;
813         request->home_server = home;
814
815         rad_assert(request->proxy_listener == NULL);
816
817         if (!insert_into_proxy_hash(request)) {
818                 radlog(L_PROXY, "Failed inserting status check %d into proxy hash.  Discarding it.",
819                        request->number);
820                 ev_request_free(&request);
821                 return;
822         }
823         rad_assert(request->proxy_listener != NULL);
824         request->proxy_listener->send(request->proxy_listener,
825                                       request);
826
827         request->next_callback = NULL;
828         request->child_state = REQUEST_PROXIED;
829         request->when.tv_sec += home->ping_timeout;;
830
831         INSERT_EVENT(no_response_to_ping, request);
832
833         /*
834          *      Add +/- 2s of jitter, as suggested in RFC 3539
835          *      and in the Issues and Fixes draft.
836          */
837         home->when.tv_sec += home->ping_interval - 2;
838
839         jitter = fr_rand();
840         jitter ^= (jitter >> 10);
841         jitter &= ((1 << 23) - 1); /* 22 bits of 1 */
842
843         tv_add(&home->when, jitter);
844
845         INSERT_EVENT(ping_home_server, home);
846 }
847
848
849 void mark_home_server_dead(home_server *home, struct timeval *when)
850 {
851         int previous_state = home->state;
852         char buffer[128];
853
854         radlog(L_PROXY, "Marking home server %s port %d as dead.",
855                inet_ntop(home->ipaddr.af, &home->ipaddr.ipaddr,
856                          buffer, sizeof(buffer)),
857                home->port);
858
859         home->state = HOME_STATE_IS_DEAD;
860         home->num_received_pings = 0;
861
862         if (home->ping_check != HOME_PING_CHECK_NONE) {
863                 /*
864                  *      If the control socket marks us dead, start
865                  *      pinging.  Otherwise, we already started
866                  *      pinging when it was marked "zombie".
867                  */
868                 if (previous_state == HOME_STATE_ALIVE) {
869                         ping_home_server(home);
870                 }
871
872         } else {
873                 /*
874                  *      Revive it after a fixed period of time.  This
875                  *      is very, very, bad.
876                  */
877                 home->when = *when;
878                 home->when.tv_sec += home->revive_interval;
879
880                 INSERT_EVENT(revive_home_server, home);
881         }
882 }
883
884 static void check_for_zombie_home_server(REQUEST *request)
885 {
886         home_server *home;
887         struct timeval when;
888
889         home = request->home_server;
890
891         if (home->state != HOME_STATE_ZOMBIE) return;
892
893         when = home->zombie_period_start;
894         when.tv_sec += home->zombie_period;
895
896         fr_event_now(el, &now);
897         if (timercmp(&now, &when, <)) {
898                 return;
899         }
900
901         mark_home_server_dead(home, &request->when);
902 }
903
904 static int proxy_to_virtual_server(REQUEST *request);
905
906 static int virtual_server_handler(UNUSED REQUEST *request)
907 {
908         proxy_to_virtual_server(request);
909         return 0;
910 }
911
912 static void proxy_fallback_handler(REQUEST *request)
913 {
914         /*
915          *      A proper time is required for wait_a_bit.
916          */
917         request->delay = USEC / 10;
918         gettimeofday(&now, NULL);
919         request->next_when = now;
920         tv_add(&request->next_when, request->delay);
921         request->next_callback = wait_a_bit;
922
923         /*
924          *      Re-queue the request.
925          */
926         request->child_state = REQUEST_QUEUED;
927         
928         rad_assert(request->proxy != NULL);
929         if (!thread_pool_addrequest(request, virtual_server_handler)) {
930                 request->child_state = REQUEST_DONE;
931         }
932
933 #ifdef HAVE_PTHREAD_H
934         /*
935          *      MAY free the request if we're over max_request_time,
936          *      AND we're not in threaded mode!
937          *
938          *      Note that we call this ONLY if we're threaded, as
939          *      if we're NOT threaded, request_post_handler() calls
940          *      wait_a_bit(), which means that "request" may not
941          *      exist any more...
942          */
943         if (have_children) wait_a_bit(request);
944 #endif
945 }
946
947
948 static int setup_post_proxy_fail(REQUEST *request)
949 {
950         DICT_VALUE *dval = NULL;
951         VALUE_PAIR *vp;
952
953         request->child_state = REQUEST_RUNNING;
954
955         if (request->packet->code == PW_AUTHENTICATION_REQUEST) {
956           dval = dict_valbyname(PW_POST_PROXY_TYPE, 0, "Fail-Authentication");
957
958         } else if (request->packet->code == PW_ACCOUNTING_REQUEST) {
959                 dval = dict_valbyname(PW_POST_PROXY_TYPE, 0, "Fail-Accounting");
960
961 #ifdef WITH_COA
962                 /*
963                  *      See no_response_to_coa_request
964                  */
965         } else if (((request->packet->code >> 8) & 0xff) == PW_COA_REQUEST) {
966                 request->packet->code &= 0xff; /* restore it */
967
968                 if (request->proxy->code == PW_COA_REQUEST) {
969                         dval = dict_valbyname(PW_POST_PROXY_TYPE, 0, "Fail-CoA");
970
971                 } else if (request->proxy->code == PW_DISCONNECT_REQUEST) {
972                         dval = dict_valbyname(PW_POST_PROXY_TYPE, 0, "Fail-Disconnect");
973                 } else {
974                         return 0;
975                 }
976
977 #endif
978         } else {
979                 return 0;
980         }
981
982         if (!dval) dval = dict_valbyname(PW_POST_PROXY_TYPE, 0, "Fail");
983
984         if (!dval) {
985                 pairdelete(&request->config_items, PW_POST_PROXY_TYPE, 0);
986                 return 0;
987         }
988
989         vp = pairfind(request->config_items, PW_POST_PROXY_TYPE, 0);
990         if (!vp) vp = radius_paircreate(request, &request->config_items,
991                                         PW_POST_PROXY_TYPE, 0, PW_TYPE_INTEGER);
992         vp->vp_integer = dval->value;
993
994         rad_assert(request->proxy_reply == NULL);
995
996         return 1;
997 }
998
999
1000 static int null_handler(UNUSED REQUEST *request)
1001 {
1002         return 0;
1003 }
1004
1005 static void post_proxy_fail_handler(REQUEST *request)
1006 {
1007         /*
1008          *      A proper time is required for wait_a_bit.
1009          */
1010         request->delay = USEC / 10;
1011         gettimeofday(&now, NULL);
1012
1013         /*
1014          *      Not set up to run Post-Proxy-Type = Fail.
1015          *
1016          *      Mark the request as still running, and figure out what
1017          *      to do next.
1018          */
1019         if (!setup_post_proxy_fail(request)) {
1020                 request_post_handler(request);
1021
1022         } else {
1023                 /*
1024                  *      Re-queue the request.
1025                  */
1026                 request->child_state = REQUEST_QUEUED;
1027
1028                 /*
1029                  *      There is a post-proxy-type of fail.  We run
1030                  *      the request through the pre/post proxy
1031                  *      handlers, just like it was a real proxied
1032                  *      request.  However, we set the per-request
1033                  *      handler to NULL, as we don't want to do
1034                  *      anything else.
1035                  *
1036                  *      Note that when we're not threaded, this will
1037                  *      process the request even if it's greater than
1038                  *      max_request_time.  That's not fatal.
1039                  */
1040                 request->priority = 0;
1041                 rad_assert(request->proxy != NULL);
1042                 thread_pool_addrequest(request, null_handler);
1043         }
1044
1045         /*
1046          *      MAY free the request if we're over max_request_time,
1047          *      AND we're not in threaded mode!
1048          *
1049          *      Note that we call this ONLY if we're threaded, as
1050          *      if we're NOT threaded, request_post_handler() calls
1051          *      wait_a_bit(), which means that "request" may not
1052          *      exist any more...
1053          */
1054         if (have_children) wait_a_bit(request);
1055 }
1056
1057 /* maybe check this against wait_for_proxy_id_to_expire? */
1058 static void no_response_to_proxied_request(void *ctx)
1059 {
1060         REQUEST *request = ctx;
1061         home_server *home;
1062         char buffer[128];
1063
1064         rad_assert(request->magic == REQUEST_MAGIC);
1065
1066         if (request->master_state == REQUEST_STOP_PROCESSING) {
1067                 ev_request_free(&request);
1068                 return;
1069         }
1070
1071         rad_assert(request->child_state == REQUEST_PROXIED);
1072
1073         /*
1074          *      If we've failed over to an internal home server,
1075          *      replace the callback with the correct one.  This
1076          *      is due to locking issues with child threads...
1077          */
1078         if (request->home_server->server) {
1079                 wait_a_bit(request);
1080                 return;
1081         }
1082
1083 #ifdef WITH_TCP
1084         if (request->home_server->proto != IPPROTO_TCP)
1085 #endif
1086                 check_for_zombie_home_server(request);
1087
1088         home = request->home_server;
1089
1090         /*
1091          *      The default as of 2.1.7 is to allow requests to
1092          *      fail-over to a backup home server when this one does
1093          *      not respond.  The old behavior can be configured as
1094          *      well.
1095          */
1096         if (home->no_response_fail) {
1097                 radlog_request(L_ERR, 0, request, "Rejecting request (proxy Id %d) due to lack of any response from home server %s port %d",
1098                        request->proxy->id,
1099                        inet_ntop(request->proxy->dst_ipaddr.af,
1100                                  &request->proxy->dst_ipaddr.ipaddr,
1101                                  buffer, sizeof(buffer)),
1102                        request->proxy->dst_port);
1103
1104                 post_proxy_fail_handler(request);
1105         } else {
1106                 /*
1107                  *      Enforce max_request_time.
1108                  *
1109                  *      We fail over to another backup home server
1110                  *      when the client re-transmits the request.  If
1111                  *      the client doesn't re-transmit, no fail-over
1112                  *      occurs.
1113                  */
1114                 rad_assert(request->ev == NULL);
1115                 request->child_state = REQUEST_RUNNING;
1116                 wait_a_bit(request);
1117         }
1118
1119         /*
1120          *      Don't touch request due to race conditions
1121          */
1122
1123 #ifdef WITH_TCP
1124         /*
1125          *      Do nothing more.  The home server didn't respond,
1126          *      but that isn't a catastrophic failure.  Some home
1127          *      servers don't respond to packets...
1128          */
1129         if (home->proto == IPPROTO_TCP) {
1130                 /*
1131                  *      FIXME: Set up TCP pinging on this connection.
1132                  *
1133                  *      Maybe the CONNECTION is dead, but the home
1134                  *      server is alive.  In that case, we need to start
1135                  *      pinging on the connection.
1136                  *
1137                  *      This means doing the pinging BEFORE the
1138                  *      post_proxy_fail_handler above, as it may do
1139                  *      something with the request, and cause the
1140                  *      proxy listener to go away!
1141                  */
1142                 return;
1143         }
1144 #endif
1145
1146         if (home->state == HOME_STATE_IS_DEAD) {
1147                 rad_assert(home->ev != NULL); /* or it will never wake up */
1148                 return;
1149         }
1150
1151         /*
1152          *      Enable the zombie period when we notice that the home
1153          *      server hasn't responded.  We do NOT back-date the start
1154          *      of the zombie period.
1155          */
1156         if (home->state == HOME_STATE_ALIVE) {
1157                 home->state = HOME_STATE_ZOMBIE;
1158                 home->zombie_period_start = now;        
1159                 fr_event_delete(el, &home->ev);
1160                 home->currently_outstanding = 0;
1161                 home->num_received_pings = 0;
1162
1163                 radlog(L_PROXY, "Marking home server %s port %d as zombie (it looks like it is dead).",
1164                        inet_ntop(home->ipaddr.af, &home->ipaddr.ipaddr,
1165                                  buffer, sizeof(buffer)),
1166                        home->port);
1167
1168                 /*
1169                  *      Start pinging the home server.
1170                  */
1171                 ping_home_server(home);
1172         }
1173 }
1174 #endif
1175
1176 static void wait_a_bit(void *ctx)
1177 {
1178         struct timeval when;
1179         REQUEST *request = ctx;
1180         fr_event_callback_t callback = NULL;
1181
1182         rad_assert(request->magic == REQUEST_MAGIC);
1183
1184         /*
1185          *      The socket was closed.  Tell the request that
1186          *      there is no point in continuing.
1187          */
1188         if (request->listener->status != RAD_LISTEN_STATUS_KNOWN) {
1189                 goto stop_processing;
1190         }
1191
1192 #ifdef WITH_COA
1193         /*
1194          *      The CoA request is a new (internally generated)
1195          *      request, created in a child thread.  We therefore need
1196          *      some way to tie its events back into the main event
1197          *      handler.
1198          */
1199         if (request->coa && !request->coa->proxy_reply &&
1200             request->coa->next_callback) {
1201                 request->coa->when = request->coa->next_when;
1202                 INSERT_EVENT(request->coa->next_callback, request->coa);
1203                 request->coa->next_callback = NULL;
1204                 request->coa->parent = NULL;
1205                 request->coa = NULL;
1206         }
1207 #endif
1208
1209         switch (request->child_state) {
1210         case REQUEST_QUEUED:
1211         case REQUEST_RUNNING:
1212                 when = request->received;
1213                 when.tv_sec += request->root->max_request_time;
1214
1215                 /*
1216                  *      Normally called from the event loop with the
1217                  *      proper event loop time.  Otherwise, called from
1218                  *      post proxy fail handler, which sets "now", and
1219                  *      this call won't re-set it, because we're not
1220                  *      in the event loop.
1221                  */
1222                 fr_event_now(el, &now);
1223
1224                 /*
1225                  *      Request still has more time.  Continue
1226                  *      waiting.
1227                  */
1228                 if (timercmp(&now, &when, <) ||
1229                     ((request->listener->type == RAD_LISTEN_DETAIL) &&
1230                      (request->child_state == REQUEST_QUEUED))) {
1231                         if (request->delay < (USEC / 10)) {
1232                                 request->delay = USEC / 10;
1233                         }
1234                         request->delay += request->delay >> 1;
1235
1236 #ifdef WITH_DETAIL
1237                         /*
1238                          *      Cap wait at some sane value for detail
1239                          *      files.
1240                          */
1241                         if ((request->listener->type == RAD_LISTEN_DETAIL) &&
1242                             (request->delay > (request->root->max_request_time * USEC))) {
1243                                 request->delay = request->root->max_request_time * USEC;
1244                         }
1245 #endif
1246
1247                         request->when = now;
1248                         tv_add(&request->when, request->delay);
1249                         callback = wait_a_bit;
1250                         break;
1251                 }
1252
1253         stop_processing:
1254 #if defined(HAVE_PTHREAD_H)
1255                 /*
1256                  *      A child thread MAY still be running on the
1257                  *      request.  Ask the thread to stop working on
1258                  *      the request.
1259                  */
1260                 if (have_children &&
1261                     (pthread_equal(request->child_pid, NO_SUCH_CHILD_PID) == 0)) {
1262                         request->master_state = REQUEST_STOP_PROCESSING;
1263
1264                         radlog_request(L_ERR, 0, request, "WARNING: Unresponsive child in module %s component %s",
1265                                request->module ? request->module : "<server core>",
1266                                request->component ? request->component : "<server core>");
1267                         
1268                         request->delay = USEC / 4;
1269                         tv_add(&request->when, request->delay);
1270                         callback = wait_for_child_to_die;
1271                         break;
1272                 }
1273 #endif
1274
1275                 /*
1276                  *      Else no child thread is processing the
1277                  *      request.  We probably should have just marked
1278                  *      the request as 'done' elsewhere, like in the
1279                  *      post-proxy-fail handler.  But doing that would
1280                  *      involve checking for max_request_time in
1281                  *      multiple places, so this may be simplest.
1282                  */
1283                 request->child_state = REQUEST_DONE;
1284                 /* FALL-THROUGH */
1285
1286                 /*
1287                  *      Mark the request as no longer running,
1288                  *      and clean it up.
1289                  */
1290         case REQUEST_DONE:
1291 #ifdef HAVE_PTHREAD_H
1292                 request->child_pid = NO_SUCH_CHILD_PID;
1293 #endif
1294
1295 #ifdef WITH_COA
1296                 /*
1297                  *      This is a CoA request.  It's been divorced
1298                  *      from everything else, so we clean it up now.
1299                  */
1300                 if (!request->in_request_hash &&
1301                     request->proxy &&
1302                     (request->packet->code != request->proxy->code) &&
1303                     ((request->proxy->code == PW_COA_REQUEST) ||
1304                      (request->proxy->code == PW_DISCONNECT_REQUEST))) {
1305                         /*
1306                          *      FIXME: Do CoA MIBs
1307                          */
1308                         ev_request_free(&request);
1309                         return;
1310                 }
1311 #endif
1312                 request_stats_final(request);
1313                 cleanup_delay(request);
1314                 return;
1315
1316         case REQUEST_REJECT_DELAY:
1317         case REQUEST_CLEANUP_DELAY:
1318 #ifdef HAVE_PTHREAD_H
1319                 request->child_pid = NO_SUCH_CHILD_PID;
1320 #endif
1321                 request_stats_final(request);
1322
1323         case REQUEST_PROXIED:
1324                 rad_assert(request->next_callback != NULL);
1325                 rad_assert(request->next_callback != wait_a_bit);
1326
1327                 request->when = request->next_when;
1328                 callback = request->next_callback;
1329                 request->next_callback = NULL;
1330                 break;
1331
1332         default:
1333                 rad_panic("Internal sanity check failure");
1334                 return;
1335         }
1336
1337         /*
1338          *      Something major went wrong.  Discard the request, and
1339          *      keep running.
1340          *
1341          *      FIXME: No idea why this happens or how to fix it...
1342          *      It seems to happen *only* when requests are proxied,
1343          *      and where the home server doesn't respond.  So it looks
1344          *      like a race condition above, but it happens in debug
1345          *      mode, with no threads...
1346          */
1347         if (!callback) {
1348                 RDEBUG("WARNING: Internal sanity check failed in event handler: Discarding the request!");
1349                 ev_request_free(&request);
1350                 return;
1351         }
1352
1353         INSERT_EVENT(callback, request);
1354 }
1355
1356 #ifdef WITH_COA
1357 static void no_response_to_coa_request(void *ctx)
1358 {
1359         REQUEST *request = ctx;
1360         char buffer[128];
1361
1362         rad_assert(request->magic == REQUEST_MAGIC);
1363         rad_assert(request->child_state == REQUEST_PROXIED);
1364         rad_assert(request->home_server != NULL);
1365         rad_assert(!request->in_request_hash);
1366
1367         radlog(L_ERR, "No response to CoA request sent to %s",
1368                inet_ntop(request->proxy->dst_ipaddr.af,
1369                          &request->proxy->dst_ipaddr.ipaddr,
1370                          buffer, sizeof(buffer)));
1371
1372         /*
1373          *      Hack.
1374          */
1375         request->packet->code |= (PW_COA_REQUEST << 8);
1376         post_proxy_fail_handler(request);
1377 }
1378
1379
1380 static int update_event_timestamp(RADIUS_PACKET *packet, time_t when)
1381 {
1382         VALUE_PAIR *vp;
1383
1384         vp = pairfind(packet->vps, PW_EVENT_TIMESTAMP, 0);
1385         if (!vp) return 0;
1386
1387         vp->vp_date = when;
1388
1389         if (packet->data) {
1390                 free(packet->data);
1391                 packet->data = NULL;
1392                 packet->data_len = 0;
1393         }
1394
1395         return 1;               /* time stamp updated */
1396 }
1397
1398
1399 /*
1400  *      Called when we haven't received a response to a CoA request.
1401  */
1402 static void retransmit_coa_request(void *ctx)
1403 {
1404         int delay, frac;
1405         struct timeval mrd;
1406         REQUEST *request = ctx;
1407
1408         rad_assert(request->magic == REQUEST_MAGIC);
1409         rad_assert(request->child_state == REQUEST_PROXIED);
1410         rad_assert(request->home_server != NULL);
1411         rad_assert(!request->in_request_hash);
1412         rad_assert(request->parent == NULL);
1413         
1414         fr_event_now(el, &now);
1415
1416         /*
1417          *      Cap count at MRC, if it is non-zero.
1418          */
1419         if (request->home_server->coa_mrc &&
1420             (request->num_coa_requests >= request->home_server->coa_mrc)) {
1421                 no_response_to_coa_request(request);
1422                 return;
1423         }
1424
1425         /*
1426          *      RFC 5080 Section 2.2.1
1427          *
1428          *      RT = 2*RTprev + RAND*RTprev
1429          *         = 1.9 * RTprev + rand(0,.2) * RTprev
1430          *         = 1.9 * RTprev + rand(0,1) * (RTprev / 5)
1431          */
1432         delay = fr_rand();
1433         delay ^= (delay >> 16);
1434         delay &= 0xffff;
1435         frac = request->delay / 5;
1436         delay = ((frac >> 16) * delay) + (((frac & 0xffff) * delay) >> 16);
1437
1438         delay += (2 * request->delay) - (request->delay / 10);
1439
1440         /*
1441          *      Cap delay at MRT, if MRT is non-zero.
1442          */
1443         if (request->home_server->coa_mrt &&
1444             (delay > (request->home_server->coa_mrt * USEC))) {
1445                 int mrt_usec = request->home_server->coa_mrt * USEC;
1446
1447                 /*
1448                  *      delay = MRT + RAND * MRT
1449                  *            = 0.9 MRT + rand(0,.2)  * MRT
1450                  */
1451                 delay = fr_rand();
1452                 delay ^= (delay >> 15);
1453                 delay &= 0x1ffff;
1454                 delay = ((mrt_usec >> 16) * delay) + (((mrt_usec & 0xffff) * delay) >> 16);
1455                 delay += mrt_usec - (mrt_usec / 10);
1456         }
1457
1458         request->delay = delay;
1459         request->when = now;
1460         tv_add(&request->when, request->delay);
1461         mrd = request->proxy_when;
1462         mrd.tv_sec += request->home_server->coa_mrd;
1463
1464         /*
1465          *      Cap duration at MRD.
1466          */
1467         if (timercmp(&mrd, &request->when, <)) {
1468                 request->when = mrd;
1469                 INSERT_EVENT(no_response_to_coa_request, request);
1470
1471         } else {
1472                 INSERT_EVENT(retransmit_coa_request, request);
1473         }
1474         
1475         if (update_event_timestamp(request->proxy, now.tv_sec)) {
1476                 /*
1477                  *      Keep a copy of the old Id so that the
1478                  *      re-transmitted request doesn't re-use the old
1479                  *      Id.
1480                  */
1481                 RADIUS_PACKET old = *request->proxy;
1482                 home_server *home = request->home_server;
1483                 rad_listen_t *listener = request->proxy_listener;
1484
1485                 /*
1486                  *      Don't free the old Id on error.
1487                  */
1488                 if (!insert_into_proxy_hash(request)) {
1489                         radlog(L_PROXY,"Failed re-inserting CoA request into proxy hash.");
1490                         return;
1491                 }
1492
1493                 /*
1494                  *      Now that we have a new Id, free the old one
1495                  *      and update the various statistics.
1496                  */
1497                 PTHREAD_MUTEX_LOCK(&proxy_mutex);
1498                 fr_packet_list_yank(proxy_list, &old);
1499                 fr_packet_list_id_free(proxy_list, &old);
1500                 if (home) home->currently_outstanding--;
1501 #ifdef WITH_TCP
1502                 if (listener) listener->count--;
1503 #endif
1504                 PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
1505
1506         } else {                /* FIXME: protect by a mutex? */
1507                 request->num_proxied_requests++;
1508         }
1509
1510         request->num_coa_requests++; /* is NOT reset by code 3 lines above! */
1511
1512         request->proxy_listener->send(request->proxy_listener,
1513                                       request);
1514 }
1515
1516
1517 /*
1518  *      The original request is either DONE, or in CLEANUP_DELAY.
1519  */
1520 static int originated_coa_request(REQUEST *request)
1521 {
1522         int delay, rcode, pre_proxy_type = 0;
1523         VALUE_PAIR *vp;
1524         REQUEST *coa;
1525         fr_ipaddr_t ipaddr;
1526         char buffer[256];
1527
1528         rad_assert(request->proxy == NULL);
1529         rad_assert(!request->in_proxy_hash);
1530         rad_assert(request->proxy_reply == NULL);
1531
1532         vp = pairfind(request->config_items, PW_SEND_COA_REQUEST, 0);
1533         if (!vp && request->coa) vp = pairfind(request->coa->proxy->vps, PW_SEND_COA_REQUEST, 0);
1534         if (vp) {
1535                 if (vp->vp_integer == 0) {
1536                         ev_request_free(&request->coa);
1537                         return 1;       /* success */
1538                 }
1539         }
1540
1541         if (!request->coa) request_alloc_coa(request);
1542         if (!request->coa) return 0;
1543
1544         coa = request->coa;
1545
1546         /*
1547          *      src_ipaddr will be set up in proxy_encode.
1548          */
1549         memset(&ipaddr, 0, sizeof(ipaddr));
1550         vp = pairfind(coa->proxy->vps, PW_PACKET_DST_IP_ADDRESS, 0);
1551         if (vp) {
1552                 ipaddr.af = AF_INET;
1553                 ipaddr.ipaddr.ip4addr.s_addr = vp->vp_ipaddr;
1554
1555         } else if ((vp = pairfind(coa->proxy->vps,
1556                                   PW_PACKET_DST_IPV6_ADDRESS, 0)) != NULL) {
1557                 ipaddr.af = AF_INET6;
1558                 ipaddr.ipaddr.ip6addr = vp->vp_ipv6addr;
1559                 
1560         } else if ((vp = pairfind(coa->proxy->vps,
1561                                   PW_HOME_SERVER_POOL, 0)) != NULL) {
1562                 coa->home_pool = home_pool_byname(vp->vp_strvalue,
1563                                                   HOME_TYPE_COA);
1564                 if (!coa->home_pool) {
1565                         RDEBUG2("WARNING: No such home_server_pool %s",
1566                                vp->vp_strvalue);
1567         fail:
1568                         ev_request_free(&request->coa);
1569                         return 0;
1570                 }
1571
1572                 /*
1573                  *      Prefer
1574                  */
1575         } else if (request->client->coa_pool) {
1576                 coa->home_pool = request->client->coa_pool;
1577
1578         } else if (request->client->coa_server) {
1579                 coa->home_server = request->client->coa_server;
1580
1581         } else {
1582                 /*
1583                  *      If all else fails, send it to the client that
1584                  *      originated this request.
1585                  */
1586                 memcpy(&ipaddr, &request->packet->src_ipaddr, sizeof(ipaddr));
1587         }
1588
1589         /*
1590          *      Use the pool, if it exists.
1591          */
1592         if (coa->home_pool) {
1593                 coa->home_server = home_server_ldb(NULL, coa->home_pool, coa);
1594                 if (!coa->home_server) {
1595                         RDEBUG("WARNING: No live home server for home_server_pool %s", vp->vp_strvalue);
1596                         goto fail;
1597                 }
1598
1599         } else if (!coa->home_server) {
1600                 int port = PW_COA_UDP_PORT;
1601
1602                 vp = pairfind(coa->proxy->vps, PW_PACKET_DST_PORT, 0);
1603                 if (vp) port = vp->vp_integer;
1604
1605                 coa->home_server = home_server_find(&ipaddr, port, IPPROTO_UDP);
1606                 if (!coa->home_server) {
1607                         RDEBUG2("WARNING: Unknown destination %s:%d for CoA request.",
1608                                inet_ntop(ipaddr.af, &ipaddr.ipaddr,
1609                                          buffer, sizeof(buffer)), port);
1610                         goto fail;
1611                 }
1612         }
1613
1614         vp = pairfind(coa->proxy->vps, PW_PACKET_TYPE, 0);
1615         if (vp) {
1616                 switch (vp->vp_integer) {
1617                 case PW_COA_REQUEST:
1618                 case PW_DISCONNECT_REQUEST:
1619                         coa->proxy->code = vp->vp_integer;
1620                         break;
1621                         
1622                 default:
1623                         DEBUG("Cannot set CoA Packet-Type to code %d",
1624                               vp->vp_integer);
1625                         goto fail;
1626                 }
1627         }
1628
1629         if (!coa->proxy->code) coa->proxy->code = PW_COA_REQUEST;
1630
1631         /*
1632          *      The rest of the server code assumes that
1633          *      request->packet && request->reply exist.  Copy them
1634          *      from the original request.
1635          */
1636         rad_assert(coa->packet != NULL);
1637         rad_assert(coa->packet->vps == NULL);
1638         memcpy(coa->packet, request->packet, sizeof(*request->packet));
1639         coa->packet->vps = paircopy(request->packet->vps);
1640         coa->packet->data = NULL;
1641         rad_assert(coa->reply != NULL);
1642         rad_assert(coa->reply->vps == NULL);
1643         memcpy(coa->reply, request->reply, sizeof(*request->reply));
1644         coa->reply->vps = paircopy(request->reply->vps);
1645         coa->reply->data = NULL;
1646         coa->config_items = paircopy(request->config_items);
1647
1648         /*
1649          *      Call the pre-proxy routines.
1650          */
1651         vp = pairfind(request->config_items, PW_PRE_PROXY_TYPE, 0);
1652         if (vp) {
1653                 RDEBUG2("  Found Pre-Proxy-Type %s", vp->vp_strvalue);
1654                 pre_proxy_type = vp->vp_integer;
1655         }
1656
1657         if (coa->home_pool && coa->home_pool->virtual_server) {
1658                 const char *old_server = coa->server;
1659                 
1660                 coa->server = coa->home_pool->virtual_server;
1661                 RDEBUG2(" server %s {", coa->server);
1662                 rcode = module_pre_proxy(pre_proxy_type, coa);
1663                 RDEBUG2(" }");
1664                 coa->server = old_server;
1665         } else {
1666                 rcode = module_pre_proxy(pre_proxy_type, coa);
1667         }
1668         switch (rcode) {
1669         default:
1670                 goto fail;
1671
1672         /*
1673          *      Only send the CoA packet if the pre-proxy code succeeded.
1674          */
1675         case RLM_MODULE_NOOP:
1676         case RLM_MODULE_OK:
1677         case RLM_MODULE_UPDATED:
1678                 break;
1679         }
1680
1681         /*
1682          *      Source IP / port is set when the proxy socket
1683          *      is chosen.
1684          */
1685         coa->proxy->dst_ipaddr = coa->home_server->ipaddr;
1686         coa->proxy->dst_port = coa->home_server->port;
1687
1688         if (!insert_into_proxy_hash(coa)) {
1689                 radlog(L_PROXY, "Failed inserting CoA request into proxy hash.");
1690                 goto fail;
1691         }
1692
1693         /*
1694          *      We CANNOT divorce the CoA request from the parent
1695          *      request.  This function is running in a child thread,
1696          *      and we need access to the main event loop in order to
1697          *      to add the timers for the CoA packet.  See
1698          *      wait_a_bit().
1699          */
1700
1701         /*
1702          *      Forget about the original request completely at this
1703          *      point.
1704          */
1705         request = coa;
1706
1707         gettimeofday(&request->proxy_when, NULL);       
1708         request->received = request->next_when = request->proxy_when;
1709         rad_assert(request->proxy_reply == NULL);
1710
1711         /*
1712          *      Implement re-transmit algorithm as per RFC 5080
1713          *      Section 2.2.1.
1714          *
1715          *      We want IRT + RAND*IRT
1716          *      or 0.9 IRT + rand(0,.2) IRT
1717          *
1718          *      2^20 ~ USEC, and we want 2.
1719          *      rand(0,0.2) USEC ~ (rand(0,2^21) / 10)
1720          */
1721         delay = (fr_rand() & ((1 << 22) - 1)) / 10;
1722         request->delay = delay * request->home_server->coa_irt;
1723         delay = request->home_server->coa_irt * USEC;
1724         delay -= delay / 10;
1725         delay += request->delay;
1726      
1727         request->delay = delay;
1728         tv_add(&request->next_when, delay);
1729         request->next_callback = retransmit_coa_request;
1730         
1731         /*
1732          *      Note that we set proxied BEFORE sending the packet.
1733          *
1734          *      Once we send it, the request is tainted, as
1735          *      another thread may have picked it up.  Don't
1736          *      touch it!
1737          */
1738         request->child_pid = NO_SUCH_CHILD_PID;
1739
1740         update_event_timestamp(request->proxy, request->proxy_when.tv_sec);
1741
1742         request->child_state = REQUEST_PROXIED;
1743
1744         DEBUG_PACKET(request, request->proxy, 1);
1745
1746         request->proxy_listener->send(request->proxy_listener,
1747                                       request);
1748         return 1;
1749 }
1750 #endif  /* WITH_COA */
1751
1752 #ifdef WITH_PROXY
1753 static int process_proxy_reply(REQUEST *request)
1754 {
1755         int rcode;
1756         int post_proxy_type = 0;
1757         VALUE_PAIR *vp;
1758         
1759         /*
1760          *      Delete any reply we had accumulated until now.
1761          */
1762         pairfree(&request->reply->vps);
1763         
1764         /*
1765          *      Run the packet through the post-proxy stage,
1766          *      BEFORE playing games with the attributes.
1767          */
1768         vp = pairfind(request->config_items, PW_POST_PROXY_TYPE, 0);
1769         if (vp) {
1770                 RDEBUG2("  Found Post-Proxy-Type %s", vp->vp_strvalue);
1771                 post_proxy_type = vp->vp_integer;
1772         }
1773         
1774         if (request->home_pool && request->home_pool->virtual_server) {
1775                 const char *old_server = request->server;
1776                 
1777                 request->server = request->home_pool->virtual_server;
1778                 RDEBUG2(" server %s {", request->server);
1779                 rcode = module_post_proxy(post_proxy_type, request);
1780                 RDEBUG2(" }");
1781                 request->server = old_server;
1782         } else {
1783                 rcode = module_post_proxy(post_proxy_type, request);
1784         }
1785
1786 #ifdef WITH_COA
1787         if (request->packet->code == request->proxy->code)
1788           /*
1789            *    Don't run the next bit if we originated a CoA
1790            *    packet, after receiving an Access-Request or
1791            *    Accounting-Request.
1792            */
1793 #endif
1794         
1795         /*
1796          *      There may NOT be a proxy reply, as we may be
1797          *      running Post-Proxy-Type = Fail.
1798          */
1799         if (request->proxy_reply) {
1800                 /*
1801                  *      Delete the Proxy-State Attributes from
1802                  *      the reply.  These include Proxy-State
1803                  *      attributes from us and remote server.
1804                  */
1805                 pairdelete(&request->proxy_reply->vps, PW_PROXY_STATE, 0);
1806                 
1807                 /*
1808                  *      Add the attributes left in the proxy
1809                  *      reply to the reply list.
1810                  */
1811                 pairadd(&request->reply->vps, request->proxy_reply->vps);
1812                 request->proxy_reply->vps = NULL;
1813                 
1814                 /*
1815                  *      Free proxy request pairs.
1816                  */
1817                 pairfree(&request->proxy->vps);
1818         }
1819         
1820         switch (rcode) {
1821         default:  /* Don't do anything */
1822                 break;
1823         case RLM_MODULE_FAIL:
1824                 /* FIXME: debug print stuff */
1825                 request->child_state = REQUEST_DONE;
1826                 return 0;
1827                 
1828         case RLM_MODULE_HANDLED:
1829                 /* FIXME: debug print stuff */
1830                 request->child_state = REQUEST_DONE;
1831                 return 0;
1832         }
1833
1834         return 1;
1835 }
1836 #endif
1837
1838 static int request_pre_handler(REQUEST *request)
1839 {
1840         int rcode;
1841
1842         rad_assert(request->magic == REQUEST_MAGIC);
1843         rad_assert(request->packet != NULL);
1844
1845         request->child_state = REQUEST_RUNNING;
1846
1847         /*
1848          *      Don't decode the packet if it's an internal "fake"
1849          *      request.  Instead, just return so that the caller can
1850          *      process it.
1851          */
1852         if (request->packet->dst_port == 0) {
1853                 request->username = pairfind(request->packet->vps,
1854                                              PW_USER_NAME, 0);
1855                 request->password = pairfind(request->packet->vps,
1856                                              PW_USER_PASSWORD, 0);
1857                 return 1;
1858         }
1859
1860 #ifdef WITH_PROXY
1861         /*
1862          *      Put the decoded packet into it's proper place.
1863          */
1864         if (request->proxy_reply != NULL) {
1865                 /*
1866                  *      FIXME: For now, we can only proxy RADIUS packets.
1867                  *
1868                  *      In order to proxy other packets, we need to
1869                  *      somehow cache the "decode" function.
1870                  */
1871                 rcode = rad_decode(request->proxy_reply, request->proxy,
1872                                    request->home_server->secret);
1873                 DEBUG_PACKET(request, request->proxy_reply, 0);
1874         } else
1875 #endif
1876         if (request->packet->vps == NULL) {
1877                 rcode = request->listener->decode(request->listener, request);
1878                 
1879                 if (debug_condition) {
1880                         int result = FALSE;
1881                         const char *my_debug = debug_condition;
1882
1883                         /*
1884                          *      Ignore parse errors.
1885                          */
1886                         radius_evaluate_condition(request, RLM_MODULE_OK, 0,
1887                                                   &my_debug, 1,
1888                                                   &result);
1889                         if (result) {
1890                                 request->options = 2;
1891                                 request->radlog = radlog_request;
1892                         }
1893                 }
1894                 
1895                 DEBUG_PACKET(request, request->packet, 0);
1896         } else {
1897                 rcode = 0;
1898         }
1899
1900         if (rcode < 0) {
1901                 RDEBUG("%s Dropping packet without response.", fr_strerror());
1902                 request->reply->offset = -2; /* bad authenticator */
1903                 request->child_state = REQUEST_DONE;
1904                 return 0;
1905         }
1906
1907         if (!request->username) {
1908                 request->username = pairfind(request->packet->vps,
1909                                              PW_USER_NAME, 0);
1910         }
1911
1912 #ifdef WITH_PROXY
1913         if (request->proxy) {
1914                 return process_proxy_reply(request);
1915 #endif
1916         }
1917
1918         return 1;
1919 }
1920
1921
1922 #ifdef WITH_PROXY
1923 /*
1924  *      Do state handling when we proxy a request.
1925  */
1926 static int proxy_request(REQUEST *request)
1927 {
1928         struct timeval when;
1929         char buffer[128];
1930
1931 #ifdef WITH_COA
1932         if (request->coa) {
1933                 RDEBUG("WARNING: Cannot proxy and originate CoA packets at the same time.  Cancelling CoA request");
1934                 ev_request_free(&request->coa);
1935         }
1936 #endif
1937
1938         if (request->home_server->server) {
1939                 RDEBUG("ERROR: Cannot perform real proxying to a virtual server.");
1940                 return 0;
1941         }
1942
1943         if (!insert_into_proxy_hash(request)) {
1944                 radlog(L_PROXY, "Failed inserting request into proxy hash.");
1945                 return 0;
1946         }
1947
1948         request->proxy_listener->encode(request->proxy_listener, request);
1949
1950         when = request->received;
1951         when.tv_sec += request->root->max_request_time;
1952
1953         gettimeofday(&request->proxy_when, NULL);
1954
1955         request->next_when = request->proxy_when;
1956         request->next_when.tv_sec += request->home_server->response_window;
1957
1958         rad_assert(request->home_server->response_window > 0);
1959
1960         if (timercmp(&when, &request->next_when, <)) {
1961                 request->next_when = when;
1962         }
1963         request->next_callback = no_response_to_proxied_request;
1964
1965         RDEBUG2("Proxying request to home server %s port %d",
1966                inet_ntop(request->proxy->dst_ipaddr.af,
1967                          &request->proxy->dst_ipaddr.ipaddr,
1968                          buffer, sizeof(buffer)),
1969                 request->proxy->dst_port);
1970
1971         /*
1972          *      Note that we set proxied BEFORE sending the packet.
1973          *
1974          *      Once we send it, the request is tainted, as
1975          *      another thread may have picked it up.  Don't
1976          *      touch it!
1977          */
1978 #ifdef HAVE_PTHREAD_H
1979         request->child_pid = NO_SUCH_CHILD_PID;
1980 #endif
1981         request->child_state = REQUEST_PROXIED;
1982
1983         DEBUG_PACKET(request, request->proxy, 1);
1984
1985         request->proxy_listener->send(request->proxy_listener,
1986                                       request);
1987         return 1;
1988 }
1989
1990
1991 /*
1992  *      "Proxy" the request by sending it to a new virtual server.
1993  */
1994 static int proxy_to_virtual_server(REQUEST *request)
1995 {
1996         REQUEST *fake;
1997         RAD_REQUEST_FUNP fun;
1998
1999         if (!request->home_server || !request->home_server->server) return 0;
2000
2001         if (request->parent) {
2002                 RDEBUG2("WARNING: Cancelling proxy request to virtual server %s as this request was itself proxied.", request->home_server->server);
2003                 return 0;
2004         }
2005
2006         fake = request_alloc_fake(request);
2007         if (!fake) {
2008                 RDEBUG2("WARNING: Out of memory");
2009                 return 0;
2010         }
2011
2012         fake->packet->vps = paircopy(request->proxy->vps);
2013         fake->server = request->home_server->server;
2014
2015         if (request->proxy->code == PW_AUTHENTICATION_REQUEST) {
2016                 fun = rad_authenticate;
2017
2018 #ifdef WITH_ACCOUNTING
2019         } else if (request->proxy->code == PW_ACCOUNTING_REQUEST) {
2020                 fun = rad_accounting;
2021 #endif
2022
2023         } else {
2024                 RDEBUG2("Unknown packet type %d", request->proxy->code);
2025                 ev_request_free(&fake);
2026                 return 0;
2027         }
2028
2029         RDEBUG2(">>> Sending proxied request internally to virtual server.");
2030         radius_handle_request(fake, fun);
2031         RDEBUG2("<<< Received proxied response code %d from internal virtual server.", fake->reply->code);
2032
2033         if (fake->reply->code != 0) {
2034                 request->proxy_reply = fake->reply;
2035                 fake->reply = NULL;
2036         } else {
2037                 /*
2038                  *      There was no response
2039                  */
2040                 setup_post_proxy_fail(request);
2041         }
2042
2043         ev_request_free(&fake);
2044
2045         process_proxy_reply(request);
2046
2047         /*
2048          *      Process it through the normal section again, but ONLY
2049          *      if we received a proxy reply..
2050          */
2051         if (request->proxy_reply) {
2052                 if (request->server) RDEBUG("server %s {",
2053                                             request->server != NULL ?
2054                                             request->server : ""); 
2055                 fun(request);
2056                 
2057                 if (request->server) RDEBUG("} # server %s",
2058                                             request->server != NULL ?
2059                                             request->server : "");
2060         }
2061
2062         return 2;               /* success, but NOT '1' !*/
2063 }
2064
2065 /*
2066  *      Return 1 if we did proxy it, or the proxy attempt failed
2067  *      completely.  Either way, the caller doesn't touch the request
2068  *      any more if we return 1.
2069  */
2070 static int successfully_proxied_request(REQUEST *request)
2071 {
2072         int rcode;
2073         int pre_proxy_type = 0;
2074         VALUE_PAIR *realmpair;
2075         VALUE_PAIR *strippedname;
2076         VALUE_PAIR *vp;
2077         char *realmname = NULL;
2078         home_server *home;
2079         REALM *realm = NULL;
2080         home_pool_t *pool;
2081
2082         /*
2083          *      If it was already proxied, do nothing.
2084          *
2085          *      FIXME: This should really be a serious error.
2086          */
2087         if (request->in_proxy_hash ||
2088             (request->proxy_reply && (request->proxy_reply->code != 0))) {
2089                 return 0;
2090         }
2091
2092         realmpair = pairfind(request->config_items, PW_PROXY_TO_REALM, 0);
2093         if (!realmpair || (realmpair->length == 0)) {
2094                 int pool_type;
2095
2096                 vp = pairfind(request->config_items, PW_HOME_SERVER_POOL, 0);
2097                 if (!vp) return 0;
2098
2099                 switch (request->packet->code) {
2100                 case PW_AUTHENTICATION_REQUEST:
2101                         pool_type = HOME_TYPE_AUTH;
2102                         break;
2103
2104 #ifdef WITH_ACCOUNTING
2105                 case PW_ACCOUNTING_REQUEST:
2106                         pool_type = HOME_TYPE_ACCT;
2107                         break;
2108 #endif
2109
2110 #ifdef WITH_COA
2111                 case PW_COA_REQUEST:
2112                 case PW_DISCONNECT_REQUEST:
2113                         pool_type = HOME_TYPE_COA;
2114                         break;
2115 #endif
2116
2117                 default:
2118                         return 0;
2119                 }
2120
2121                 pool = home_pool_byname(vp->vp_strvalue, pool_type);
2122                 if (!pool) {
2123                         RDEBUG2("ERROR: Cannot proxy to unknown pool %s",
2124                                 vp->vp_strvalue);
2125                         return 0;
2126                 }
2127
2128                 realmname = NULL; /* no realms */
2129                 realm = NULL;
2130                 goto found_pool;
2131         }
2132
2133         realmname = (char *) realmpair->vp_strvalue;
2134
2135         realm = realm_find2(realmname);
2136         if (!realm) {
2137                 RDEBUG2("ERROR: Cannot proxy to unknown realm %s", realmname);
2138                 return 0;
2139         }
2140
2141         /*
2142          *      Figure out which pool to use.
2143          */
2144         if (request->packet->code == PW_AUTHENTICATION_REQUEST) {
2145                 pool = realm->auth_pool;
2146
2147 #ifdef WITH_ACCOUNTING
2148         } else if (request->packet->code == PW_ACCOUNTING_REQUEST) {
2149                 pool = realm->acct_pool;
2150 #endif
2151
2152 #ifdef WITH_COA
2153         } else if ((request->packet->code == PW_COA_REQUEST) ||
2154                    (request->packet->code == PW_DISCONNECT_REQUEST)) {
2155                 pool = realm->acct_pool;
2156 #endif
2157
2158         } else {
2159                 rad_panic("Internal sanity check failed");
2160         }
2161
2162         if (!pool) {
2163                 RDEBUG2(" WARNING: Cancelling proxy to Realm %s, as the realm is local.",
2164                        realmname);
2165                 return 0;
2166         }
2167
2168 found_pool:
2169         home = home_server_ldb(realmname, pool, request);
2170         if (!home) {
2171                 RDEBUG2("ERROR: Failed to find live home server for realm %s",
2172                        realmname);
2173                 return -1;
2174         }
2175         request->home_pool = pool;
2176
2177 #ifdef WITH_COA
2178         /*
2179          *      Once we've decided to proxy a request, we cannot send
2180          *      a CoA packet.  So we free up any CoA packet here.
2181          */
2182         ev_request_free(&request->coa);
2183 #endif
2184         /*
2185          *      Remember that we sent the request to a Realm.
2186          */
2187         if (realmname) pairadd(&request->packet->vps,
2188                                pairmake("Realm", realmname, T_OP_EQ));
2189
2190         /*
2191          *      Strip the name, if told to.
2192          *
2193          *      Doing it here catches the case of proxied tunneled
2194          *      requests.
2195          */
2196         if (realm && (realm->striprealm == TRUE) &&
2197            (strippedname = pairfind(request->proxy->vps, PW_STRIPPED_USER_NAME, 0)) != NULL) {
2198                 /*
2199                  *      If there's a Stripped-User-Name attribute in
2200                  *      the request, then use THAT as the User-Name
2201                  *      for the proxied request, instead of the
2202                  *      original name.
2203                  *
2204                  *      This is done by making a copy of the
2205                  *      Stripped-User-Name attribute, turning it into
2206                  *      a User-Name attribute, deleting the
2207                  *      Stripped-User-Name and User-Name attributes
2208                  *      from the vps list, and making the new
2209                  *      User-Name the head of the vps list.
2210                  */
2211                 vp = pairfind(request->proxy->vps, PW_USER_NAME, 0);
2212                 if (!vp) {
2213                         vp = radius_paircreate(request, NULL,
2214                                                PW_USER_NAME, 0, PW_TYPE_STRING);
2215                         rad_assert(vp != NULL); /* handled by above function */
2216                         /* Insert at the START of the list */
2217                         vp->next = request->proxy->vps;
2218                         request->proxy->vps = vp;
2219                 }
2220                 memcpy(vp->vp_strvalue, strippedname->vp_strvalue,
2221                        sizeof(vp->vp_strvalue));
2222                 vp->length = strippedname->length;
2223
2224                 /*
2225                  *      Do NOT delete Stripped-User-Name.
2226                  */
2227         }
2228
2229         /*
2230          *      If there is no PW_CHAP_CHALLENGE attribute but
2231          *      there is a PW_CHAP_PASSWORD we need to add it
2232          *      since we can't use the request authenticator
2233          *      anymore - we changed it.
2234          */
2235         if ((request->packet->code == PW_AUTHENTICATION_REQUEST) &&
2236             pairfind(request->proxy->vps, PW_CHAP_PASSWORD, 0) &&
2237             pairfind(request->proxy->vps, PW_CHAP_CHALLENGE, 0) == NULL) {
2238                 vp = radius_paircreate(request, &request->proxy->vps,
2239                                        PW_CHAP_CHALLENGE, 0, PW_TYPE_OCTETS);
2240                 vp->length = AUTH_VECTOR_LEN;
2241                 memcpy(vp->vp_strvalue, request->packet->vector, AUTH_VECTOR_LEN);
2242         }
2243
2244         /*
2245          *      The RFC's say we have to do this, but FreeRADIUS
2246          *      doesn't need it.
2247          */
2248         vp = radius_paircreate(request, &request->proxy->vps,
2249                                PW_PROXY_STATE, 0, PW_TYPE_OCTETS);
2250         snprintf(vp->vp_strvalue, sizeof(vp->vp_strvalue), "%d",
2251                  request->packet->id);
2252         vp->length = strlen(vp->vp_strvalue);
2253
2254         /*
2255          *      Should be done BEFORE inserting into proxy hash, as
2256          *      pre-proxy may use this information, or change it.
2257          */
2258         request->proxy->code = request->packet->code;
2259
2260         /*
2261          *      Call the pre-proxy routines.
2262          */
2263         vp = pairfind(request->config_items, PW_PRE_PROXY_TYPE, 0);
2264         if (vp) {
2265                 RDEBUG2("  Found Pre-Proxy-Type %s", vp->vp_strvalue);
2266                 pre_proxy_type = vp->vp_integer;
2267         }
2268
2269         rad_assert(request->home_pool != NULL);
2270
2271         if (request->home_pool->virtual_server) {
2272                 const char *old_server = request->server;
2273                 
2274                 request->server = request->home_pool->virtual_server;
2275                 RDEBUG2(" server %s {", request->server);
2276                 rcode = module_pre_proxy(pre_proxy_type, request);
2277                 RDEBUG2(" }");
2278                         request->server = old_server;
2279         } else {
2280                 rcode = module_pre_proxy(pre_proxy_type, request);
2281         }
2282         switch (rcode) {
2283         case RLM_MODULE_FAIL:
2284         case RLM_MODULE_INVALID:
2285         case RLM_MODULE_NOTFOUND:
2286         case RLM_MODULE_USERLOCK:
2287         default:
2288                 /* FIXME: debug print failed stuff */
2289                 return -1;
2290
2291         case RLM_MODULE_REJECT:
2292         case RLM_MODULE_HANDLED:
2293                 return 0;
2294
2295         /*
2296          *      Only proxy the packet if the pre-proxy code succeeded.
2297          */
2298         case RLM_MODULE_NOOP:
2299         case RLM_MODULE_OK:
2300         case RLM_MODULE_UPDATED:
2301                 break;
2302         }
2303
2304         /*
2305          *      If it's a fake request, don't send the proxy
2306          *      packet.  The outer tunnel session will take
2307          *      care of doing that.
2308          */
2309         if (request->packet->dst_port == 0) {
2310                 request->home_server = NULL;
2311                 return 1;
2312         }
2313
2314         if (request->home_server->server) {
2315                 return proxy_to_virtual_server(request);
2316         }
2317
2318         if (!proxy_request(request)) {
2319                 RDEBUG("ERROR: Failed to proxy request");
2320                 return -1;
2321         }
2322         
2323         return 1;
2324 }
2325 #endif
2326
2327 static void request_post_handler(REQUEST *request)
2328 {
2329         int child_state = -1;
2330         struct timeval when;
2331         VALUE_PAIR *vp;
2332
2333         if ((request->master_state == REQUEST_STOP_PROCESSING) ||
2334             (request->parent &&
2335              (request->parent->master_state == REQUEST_STOP_PROCESSING))) {
2336                 RDEBUG2("request was cancelled.");
2337 #ifdef HAVE_PTHREAD_H
2338                 request->child_pid = NO_SUCH_CHILD_PID;
2339 #endif
2340                 child_state = REQUEST_DONE;
2341                 goto cleanup;
2342         }
2343
2344         if (request->child_state != REQUEST_RUNNING) {
2345                 rad_panic("Internal sanity check failed");
2346         }
2347
2348 #ifdef WITH_COA
2349         /*
2350          *      If it's not in the request hash, it's a CoA request.
2351          *      We hope.
2352          */
2353         if (!request->in_request_hash &&
2354             request->proxy &&
2355             ((request->proxy->code == PW_COA_REQUEST) ||
2356              (request->proxy->code == PW_DISCONNECT_REQUEST))) {
2357                 request->next_callback = NULL;
2358                 child_state = REQUEST_DONE;
2359                 goto cleanup;
2360         }
2361 #endif
2362
2363         /*
2364          *      Catch Auth-Type := Reject BEFORE proxying the packet.
2365          */
2366         if ((request->packet->code == PW_AUTHENTICATION_REQUEST) &&
2367             (request->reply->code == 0) &&
2368             ((vp = pairfind(request->config_items, PW_AUTH_TYPE, 0)) != NULL) &&
2369             (vp->vp_integer == PW_AUTHTYPE_REJECT)) {
2370                 request->reply->code = PW_AUTHENTICATION_REJECT;
2371         }
2372
2373 #ifdef WITH_PROXY
2374         if (request->root->proxy_requests &&
2375             !request->in_proxy_hash &&
2376             (request->reply->code == 0) &&
2377             (request->packet->dst_port != 0) &&
2378             (request->packet->code != PW_STATUS_SERVER)) {
2379                 int rcode = successfully_proxied_request(request);
2380
2381                 if (rcode == 1) return; /* request is invalid */
2382
2383                 /*
2384                  *      Failed proxying it (dead home servers, etc.)
2385                  *      Run it through Post-Proxy-Type = Fail, and
2386                  *      respond to the request.
2387                  *
2388                  *      Note that we're in a child thread here, so we
2389                  *      do NOT re-schedule the request.  Instead, we
2390                  *      do what we would have done, which is run the
2391                  *      pre-handler, a NULL request handler, and then
2392                  *      the post handler.
2393                  */
2394                 if ((rcode < 0) && setup_post_proxy_fail(request)) {
2395                         request_pre_handler(request);
2396                 }
2397
2398                 /*
2399                  *      Else we weren't supposed to proxy it,
2400                  *      OR we proxied it internally to a virutal server.
2401                  */
2402         }
2403
2404 #ifdef WITH_COA
2405         else if (request->proxy && request->coa) {
2406                 RDEBUG("WARNING: Cannot proxy and originate CoA packets at the same time.  Cancelling CoA request");
2407                 ev_request_free(&request->coa);
2408         }
2409 #endif
2410 #endif
2411
2412         /*
2413          *      Fake requests don't get encoded or signed.  The caller
2414          *      also requires the reply VP's, so we don't free them
2415          *      here!
2416          */
2417         if (request->packet->dst_port == 0) {
2418                 /* FIXME: RDEBUG going to the next request */
2419 #ifdef HAVE_PTHREAD_H
2420                 request->child_pid = NO_SUCH_CHILD_PID;
2421 #endif
2422                 request->child_state = REQUEST_DONE;
2423                 return;
2424         }
2425
2426 #ifdef WITH_PROXY
2427         /*
2428          *      Copy Proxy-State from the request to the reply.
2429          */
2430         vp = paircopy2(request->packet->vps, PW_PROXY_STATE, 0);
2431         if (vp) pairadd(&request->reply->vps, vp);
2432 #endif
2433
2434         /*
2435          *      Access-Requests get delayed or cached.
2436          */
2437         switch (request->packet->code) {
2438         case PW_AUTHENTICATION_REQUEST:
2439                 gettimeofday(&request->next_when, NULL);
2440
2441                 if (request->reply->code == 0) {
2442                         /*
2443                          *      Check if the lack of response is intentional.
2444                          */
2445                         vp = pairfind(request->config_items,
2446                                       PW_RESPONSE_PACKET_TYPE, 0);
2447                         if (!vp) {
2448                                 RDEBUG2("There was no response configured: rejecting request");
2449                                 request->reply->code = PW_AUTHENTICATION_REJECT;
2450
2451                         } else if (vp->vp_integer == 256) {
2452                                 RDEBUG2("Not responding to request");
2453
2454                                 /*
2455                                  *      Force cleanup after a long
2456                                  *      time, so that we don't
2457                                  *      re-process the packet.
2458                                  */
2459                                 request->next_when.tv_sec += request->root->max_request_time;
2460                                 request->next_callback = cleanup_delay;
2461                                 child_state = REQUEST_CLEANUP_DELAY;
2462                                 break;
2463                         } else {
2464                                 request->reply->code = vp->vp_integer;
2465
2466                         }
2467                 }
2468
2469                 /*
2470                  *      Run rejected packets through
2471                  *
2472                  *      Post-Auth-Type = Reject
2473                  */
2474                 if (request->reply->code == PW_AUTHENTICATION_REJECT) {
2475                         pairdelete(&request->config_items, PW_POST_AUTH_TYPE, 0);
2476                         vp = radius_pairmake(request, &request->config_items,
2477                                              "Post-Auth-Type", "Reject",
2478                                              T_OP_SET);
2479                         if (vp) rad_postauth(request);
2480
2481                         /*
2482                          *      If configured, delay Access-Reject packets.
2483                          *
2484                          *      If request->root->reject_delay = 0, we discover
2485                          *      that we have to send the packet now.
2486                          */
2487                         when = request->received;
2488                         when.tv_sec += request->root->reject_delay;
2489
2490                         if (timercmp(&when, &request->next_when, >)) {
2491                                 RDEBUG2("Delaying reject  for %d seconds",
2492                                        request->root->reject_delay);
2493                                 request->next_when = when;
2494                                 request->next_callback = reject_delay;
2495 #ifdef HAVE_PTHREAD_H
2496                                 request->child_pid = NO_SUCH_CHILD_PID;
2497 #endif
2498                                 request->child_state = REQUEST_REJECT_DELAY;
2499                                 return;
2500                         }
2501                 }
2502
2503 #ifdef WITH_COA
2504         case PW_COA_REQUEST:
2505         case PW_DISCONNECT_REQUEST:
2506 #endif
2507                 request->next_when.tv_sec += request->root->cleanup_delay;
2508                 request->next_callback = cleanup_delay;
2509                 child_state = REQUEST_CLEANUP_DELAY;
2510                 break;
2511
2512         case PW_ACCOUNTING_REQUEST:
2513                 request->next_callback = NULL; /* just to be safe */
2514                 child_state = REQUEST_DONE;
2515                 break;
2516
2517                 /*
2518                  *      FIXME: Status-Server should probably not be
2519                  *      handled here...
2520                  */
2521         case PW_STATUS_SERVER:
2522                 request->next_callback = NULL;
2523                 child_state = REQUEST_DONE;
2524                 break;
2525
2526         default:
2527                 /*
2528                  *      DHCP, VMPS, etc.
2529                  */
2530                 request->next_callback = NULL;
2531                 child_state = REQUEST_DONE;
2532                 break;
2533         }
2534
2535         /*
2536          *      Suppress "no reply" packets here, unless we're reading
2537          *      from the "detail" file.  In that case, we've got to
2538          *      tell the detail file handler that the request is dead,
2539          *      and it should re-send it.
2540          *      If configured, encode, sign, and send.
2541          */
2542         if ((request->reply->code != 0) ||
2543             (request->listener->type == RAD_LISTEN_DETAIL)) {
2544                 DEBUG_PACKET(request, request->reply, 1);
2545                 request->listener->send(request->listener, request);
2546         }
2547
2548 #ifdef WITH_COA
2549         /*
2550          *      Now that we've completely processed the request,
2551          *      see if we need to originate a CoA request.  But ONLY
2552          *      if it wasn't proxied.
2553          */
2554         if (!request->proxy &&
2555             (request->coa ||
2556              (pairfind(request->config_items, PW_SEND_COA_REQUEST, 0) != NULL))) {
2557                 if (!originated_coa_request(request)) {
2558                         RDEBUG2("Do CoA Fail handler here");
2559                 }
2560                 /* request->coa is stil set, so we can update events */
2561         }
2562 #endif
2563
2564  cleanup:
2565         /*
2566          *      Clean up.  These are no longer needed.
2567          */
2568         pairfree(&request->config_items);
2569
2570         pairfree(&request->packet->vps);
2571         request->username = NULL;
2572         request->password = NULL;
2573
2574         pairfree(&request->reply->vps);
2575
2576 #ifdef WITH_PROXY
2577         if (request->proxy) {
2578                 pairfree(&request->proxy->vps);
2579
2580                 if (request->proxy_reply) {
2581                         pairfree(&request->proxy_reply->vps);
2582                 }
2583
2584 #if 0
2585                 /*
2586                  *      We're not tracking responses from the home
2587                  *      server, we can therefore free this memory in
2588                  *      the child thread.
2589                  */
2590                 if (!request->in_proxy_hash) {
2591                         rad_free(&request->proxy);
2592                         rad_free(&request->proxy_reply);
2593                         request->home_server = NULL;
2594                 }
2595 #endif
2596         }
2597 #endif
2598
2599         RDEBUG2("Finished request.");
2600         rad_assert(child_state >= 0);
2601         request->child_state = child_state;
2602
2603         /*
2604          *      Single threaded mode: update timers now.
2605          */
2606         if (!have_children) wait_a_bit(request);
2607 }
2608
2609
2610 static void received_retransmit(REQUEST *request, const RADCLIENT *client)
2611 {
2612 #ifdef WITH_PROXY
2613         char buffer[128];
2614 #endif
2615
2616         RAD_STATS_TYPE_INC(request->listener, total_dup_requests);
2617         RAD_STATS_CLIENT_INC(request->listener, client, total_dup_requests);
2618         
2619         switch (request->child_state) {
2620         case REQUEST_QUEUED:
2621         case REQUEST_RUNNING:
2622 #ifdef WITH_PROXY
2623         discard:
2624 #endif
2625                 radlog(L_ERR, "Discarding duplicate request from "
2626                        "client %s port %d - ID: %d due to unfinished request %u",
2627                        client->shortname,
2628                        request->packet->src_port,request->packet->id,
2629                        request->number);
2630                 break;
2631
2632 #ifdef WITH_PROXY
2633         case REQUEST_PROXIED:
2634                 /*
2635                  *      We're not supposed to have duplicate
2636                  *      accounting packets.  The other states handle
2637                  *      duplicates fine (discard, or send duplicate
2638                  *      reply).  But we do NOT want to retransmit an
2639                  *      accounting request here, because that would
2640                  *      involve updating the Acct-Delay-Time, and
2641                  *      therefore changing the packet Id, etc.
2642                  *
2643                  *      Instead, we just discard the packet.  We may
2644                  *      eventually respond, or the client will send a
2645                  *      new accounting packet.            
2646                  *
2647                  *      The same comments go for Status-Server, and
2648                  *      other packet types.
2649                  *
2650                  *      FIXME: coa: when we proxy CoA && Disconnect
2651                  *      packets, this logic has to be fixed.
2652                  */
2653                 if (request->packet->code != PW_AUTHENTICATION_REQUEST) {
2654                         goto discard;
2655                 }
2656
2657                 check_for_zombie_home_server(request);
2658
2659                 /*
2660                  *      If we've just discovered that the home server
2661                  *      is dead, OR the socket has been closed, look for
2662                  *      another connection to a home server.
2663                  */
2664                 if (((request->packet->dst_port != 0) &&
2665                      (request->home_server->state == HOME_STATE_IS_DEAD)) ||
2666                     (request->proxy_listener->status != RAD_LISTEN_STATUS_KNOWN)) {
2667                         home_server *home;
2668
2669                         remove_from_proxy_hash(request);
2670
2671                         home = home_server_ldb(NULL, request->home_pool, request);
2672                         if (!home) {
2673                                 RDEBUG2("Failed to find live home server for request");
2674                         no_home_servers:
2675                                 /*
2676                                  *      Do post-request processing,
2677                                  *      and any insertion of necessary
2678                                  *      events.
2679                                  */
2680                                 post_proxy_fail_handler(request);
2681                                 return;
2682                         }
2683
2684                         request->proxy->code = request->packet->code;
2685
2686                         /*
2687                          *      Free the old packet, to force re-encoding
2688                          */
2689                         free(request->proxy->data);
2690                         request->proxy->data = NULL;
2691                         request->proxy->data_len = 0;
2692
2693                         /*
2694                          *      This request failed over to a virtual
2695                          *      server.  Push it back onto the queue
2696                          *      to be processed.
2697                          */
2698                         if (request->home_server->server) {
2699                                 proxy_fallback_handler(request);
2700                                 return;
2701                         }
2702
2703                         /*
2704                          *      Try to proxy the request.
2705                          */
2706                         if (!proxy_request(request)) {
2707                                 RDEBUG("ERROR: Failed to re-proxy request");
2708                                 goto no_home_servers;
2709                         }
2710
2711                         /*
2712                          *      This code executes in the main server
2713                          *      thread, so there's no need for locking.
2714                          */
2715                         rad_assert(request->next_callback != NULL);
2716                         INSERT_EVENT(request->next_callback, request);
2717                         request->next_callback = NULL;
2718                         return;
2719                 } /* else the home server is still alive */
2720
2721 #ifdef WITH_TCP
2722                 if (request->home_server->proto == IPPROTO_TCP) {
2723                         DEBUG2("Suppressing duplicate proxied request to home server %s port %d proto TCP - ID: %d",
2724                                inet_ntop(request->proxy->dst_ipaddr.af,
2725                                          &request->proxy->dst_ipaddr.ipaddr,
2726                                          buffer, sizeof(buffer)),
2727                                request->proxy->dst_port,
2728                                request->proxy->id);
2729                         break;
2730                 }
2731 #endif
2732
2733                 RDEBUG2("Sending duplicate proxied request to home server %s port %d - ID: %d",
2734                        inet_ntop(request->proxy->dst_ipaddr.af,
2735                                  &request->proxy->dst_ipaddr.ipaddr,
2736                                  buffer, sizeof(buffer)),
2737                        request->proxy->dst_port,
2738                        request->proxy->id);
2739                 request->num_proxied_requests++;
2740
2741                 DEBUG_PACKET(request, request->proxy, 1);
2742                 request->proxy_listener->send(request->proxy_listener,
2743                                               request);
2744                 break;
2745 #endif
2746
2747         case REQUEST_REJECT_DELAY:
2748                 RDEBUG2("Waiting to send Access-Reject "
2749                        "to client %s port %d - ID: %d",
2750                        client->shortname,
2751                        request->packet->src_port, request->packet->id);
2752                 break;
2753
2754         case REQUEST_CLEANUP_DELAY:
2755         case REQUEST_DONE:
2756                 if (request->reply->code == 0) {
2757                         RDEBUG2("Ignoring retransmit from client %s port %d "
2758                                 "- ID: %d, no reply was configured",
2759                                 client->shortname,
2760                                 request->packet->src_port, request->packet->id);
2761                         return;
2762                 }
2763
2764                 /*
2765                  *      FIXME: This sends duplicate replies to
2766                  *      accounting requests, even if Acct-Delay-Time
2767                  *      or Event-Timestamp is in the packet.  In those
2768                  *      cases, the Id should be changed, and the packet
2769                  *      re-calculated.
2770                  */
2771                 RDEBUG2("Sending duplicate reply "
2772                        "to client %s port %d - ID: %d",
2773                        client->shortname,
2774                        request->packet->src_port, request->packet->id);
2775                 DEBUG_PACKET(request, request->reply, 1);
2776                 request->listener->send(request->listener, request);
2777                 break;
2778         }
2779 }
2780
2781
2782 static void received_conflicting_request(REQUEST *request,
2783                                          const RADCLIENT *client)
2784 {
2785         radlog(L_ERR, "Received conflicting packet from "
2786                "client %s port %d - ID: %d due to unfinished request %u.  Giving up on old request.",
2787                client->shortname,
2788                request->packet->src_port, request->packet->id,
2789                request->number);
2790
2791         /*
2792          *      Nuke it from the request hash, so we can receive new
2793          *      packets.
2794          */
2795         remove_from_request_hash(request);
2796
2797         switch (request->child_state) {
2798                 /*
2799                  *      Tell it to stop, and wait for it to do so.
2800                  */
2801         default:
2802                 request->master_state = REQUEST_STOP_PROCESSING;
2803                 request->delay += request->delay >> 1;
2804
2805                 tv_add(&request->when, request->delay);
2806
2807                 INSERT_EVENT(wait_for_child_to_die, request);
2808                 return;
2809
2810                 /*
2811                  *      Catch race conditions.  It may have switched
2812                  *      from running to done while this code is being
2813                  *      executed.
2814                  */
2815         case REQUEST_REJECT_DELAY:
2816         case REQUEST_CLEANUP_DELAY:
2817         case REQUEST_DONE:
2818                 break;
2819         }
2820 }
2821
2822
2823 static int can_handle_new_request(RADIUS_PACKET *packet,
2824                                   RADCLIENT *client,
2825                                   struct main_config_t *root)
2826 {
2827         /*
2828          *      Count the total number of requests, to see if
2829          *      there are too many.  If so, return with an
2830          *      error.
2831          */
2832         if (root->max_requests) {
2833                 int request_count = fr_packet_list_num_elements(pl);
2834
2835                 /*
2836                  *      This is a new request.  Let's see if
2837                  *      it makes us go over our configured
2838                  *      bounds.
2839                  */
2840                 if (request_count > root->max_requests) {
2841                         radlog(L_ERR, "Dropping request (%d is too many): "
2842                                "from client %s port %d - ID: %d", request_count,
2843                                client->shortname,
2844                                packet->src_port, packet->id);
2845                         radlog(L_INFO, "WARNING: Please check the configuration file.\n"
2846                                "\tThe value for 'max_requests' is probably set too low.\n");
2847                         return 0;
2848                 } /* else there were a small number of requests */
2849         } /* else there was no configured limit for requests */
2850
2851         /*
2852          *      FIXME: Add per-client checks.  If one client is sending
2853          *      too many packets, start discarding them.
2854          *
2855          *      We increment the counters here, and decrement them
2856          *      when the response is sent... somewhere in this file.
2857          */
2858
2859         /*
2860          *      FUTURE: Add checks for system load.  If the system is
2861          *      busy, start dropping requests...
2862          *
2863          *      We can probably keep some statistics ourselves...  if
2864          *      there are more requests coming in than we can handle,
2865          *      start dropping some.
2866          */
2867
2868         return 1;
2869 }
2870
2871
2872 int received_request(rad_listen_t *listener,
2873                      RADIUS_PACKET *packet, REQUEST **prequest,
2874                      RADCLIENT *client)
2875 {
2876         RADIUS_PACKET **packet_p;
2877         REQUEST *request = NULL;
2878         struct main_config_t *root = &mainconfig;
2879
2880         packet_p = fr_packet_list_find(pl, packet);
2881         if (packet_p) {
2882                 request = fr_packet2myptr(REQUEST, packet, packet_p);
2883                 rad_assert(request->in_request_hash);
2884
2885                 if ((request->packet->data_len == packet->data_len) &&
2886                     (memcmp(request->packet->vector, packet->vector,
2887                             sizeof(packet->vector)) == 0)) {
2888                         received_retransmit(request, client);
2889                         return 0;
2890                 }
2891
2892                 /*
2893                  *      The new request is different from the old one,
2894                  *      but maybe the old is finished.  If so, delete
2895                  *      the old one.
2896                  */
2897                 switch (request->child_state) {
2898                         struct timeval when;
2899
2900                 default:
2901                         /*
2902                          *      Special hacks for race conditions.
2903                          *      The reply is encoded, and therefore
2904                          *      likely sent.  We received a *new*
2905                          *      packet from the client, likely before
2906                          *      the next line or two of code which
2907                          *      updated the child state.  In this
2908                          *      case, just accept the new request.
2909                          */
2910                         if ((request->reply->code != 0) &&
2911                             request->reply->data) {
2912                                 radlog(L_INFO, "WARNING: Allowing fast client %s port %d - ID: %d for recent request %u.",
2913                                        client->shortname,
2914                                        packet->src_port, packet->id,
2915                                        request->number);
2916                                 remove_from_request_hash(request);
2917                                 request = NULL;
2918                                 break;
2919                         }
2920
2921                         gettimeofday(&when, NULL);
2922                         when.tv_sec -= 1;
2923
2924                         /*
2925                          *      If the cached request was received
2926                          *      within the last second, then we
2927                          *      discard the NEW request instead of the
2928                          *      old one.  This will happen ONLY when
2929                          *      the client is severely broken, and is
2930                          *      sending conflicting packets very
2931                          *      quickly.
2932                          */
2933                         if (timercmp(&when, &request->received, <)) {
2934                                 radlog(L_ERR, "Discarding conflicting packet from "
2935                                        "client %s port %d - ID: %d due to recent request %u.",
2936                                        client->shortname,
2937                                        packet->src_port, packet->id,
2938                                        request->number);
2939                                 return 0;
2940                         }
2941
2942                         received_conflicting_request(request, client);
2943                         request = NULL;
2944                         break;
2945
2946                 case REQUEST_REJECT_DELAY:
2947                 case REQUEST_CLEANUP_DELAY:
2948                         request->child_state = REQUEST_DONE;
2949                 case REQUEST_DONE:
2950                         cleanup_delay(request);
2951                         request = NULL;
2952                         break;
2953                 }
2954         }
2955
2956         /*
2957          *      We may want to quench the new request.
2958          */
2959         if ((listener->type != RAD_LISTEN_DETAIL) &&
2960             !can_handle_new_request(packet, client, root)) {
2961                 return 0;
2962         }
2963
2964         /*
2965          *      Create and initialize the new request.
2966          */
2967         request = request_alloc(); /* never fails */
2968
2969         if ((request->reply = rad_alloc(0)) == NULL) {
2970                 radlog(L_ERR, "No memory");
2971                 return 0;
2972         }
2973
2974         request->listener = listener;
2975         request->client = client;
2976         request->packet = packet;
2977         request->packet->timestamp = request->timestamp;
2978         request->number = request_num_counter++;
2979         request->priority = listener->type;
2980 #ifdef HAVE_PTHREAD_H
2981         request->child_pid = NO_SUCH_CHILD_PID;
2982 #endif
2983
2984         /*
2985          *      Status-Server packets go to the head of the queue.
2986          */
2987         if (request->packet->code == PW_STATUS_SERVER) request->priority = 0;
2988
2989         /*
2990          *      Set virtual server identity
2991          */
2992         if (client->server) {
2993                 request->server = client->server;
2994         } else if (listener->server) {
2995                 request->server = listener->server;
2996         } else {
2997                 request->server = NULL;
2998         }
2999
3000         /*
3001          *      Remember the request in the list.
3002          */
3003         if (!fr_packet_list_insert(pl, &request->packet)) {
3004                 radlog(L_ERR, "Failed to insert request %u in the list of live requests: discarding", request->number);
3005                 ev_request_free(&request);
3006                 return 0;
3007         }
3008
3009         request->in_request_hash = TRUE;
3010         request->root = root;
3011         root->refcount++;
3012 #ifdef WITH_TCP
3013         request->listener->count++;
3014 #endif
3015
3016         /*
3017          *      The request passes many of our sanity checks.
3018          *      From here on in, if anything goes wrong, we
3019          *      send a reject message, instead of dropping the
3020          *      packet.
3021          */
3022
3023         /*
3024          *      Build the reply template from the request.
3025          */
3026
3027         request->reply->sockfd = request->packet->sockfd;
3028         request->reply->dst_ipaddr = request->packet->src_ipaddr;
3029         request->reply->src_ipaddr = request->packet->dst_ipaddr;
3030         request->reply->dst_port = request->packet->src_port;
3031         request->reply->src_port = request->packet->dst_port;
3032         request->reply->id = request->packet->id;
3033         request->reply->code = 0; /* UNKNOWN code */
3034         memcpy(request->reply->vector, request->packet->vector,
3035                sizeof(request->reply->vector));
3036         request->reply->vps = NULL;
3037         request->reply->data = NULL;
3038         request->reply->data_len = 0;
3039
3040         request->master_state = REQUEST_ACTIVE;
3041         request->child_state = REQUEST_QUEUED;
3042         request->next_callback = NULL;
3043
3044         gettimeofday(&request->received, NULL);
3045         request->timestamp = request->received.tv_sec;
3046         request->when = request->received;
3047
3048         request->delay = USEC;
3049
3050         tv_add(&request->when, request->delay);
3051
3052         INSERT_EVENT(wait_a_bit, request);
3053
3054         *prequest = request;
3055         return 1;
3056 }
3057
3058
3059 #ifdef WITH_PROXY
3060 REQUEST *received_proxy_response(RADIUS_PACKET *packet)
3061 {
3062         char            buffer[128];
3063         REQUEST         *request;
3064
3065         /*
3066          *      Lookup *without* removal.  In versions prior to 2.2.0,
3067          *      this did lookup *and* removal.  That method allowed
3068          *      attackers to spoof replies that caused entries to be
3069          *      removed from the proxy hash prior to validation.
3070          */
3071         request = lookup_in_proxy_hash(packet);
3072
3073         if (!request) {
3074                 radlog(L_PROXY, "No outstanding request was found for reply from host %s port %d - ID %d",
3075                        inet_ntop(packet->src_ipaddr.af,
3076                                  &packet->src_ipaddr.ipaddr,
3077                                  buffer, sizeof(buffer)),
3078                        packet->src_port, packet->id);
3079                 return NULL;
3080         }
3081
3082         /*
3083          *      There's a reply: discard it if it's a conflicting one.
3084          */
3085         if (request->proxy_reply) {
3086                 /*
3087                  *      ? The home server gave us a new proxy
3088                  *      reply which doesn't match the old
3089                  *      one.  Delete it.
3090                  */
3091                 if (memcmp(request->proxy_reply->vector,
3092                            packet->vector,
3093                            sizeof(request->proxy_reply->vector)) != 0) {
3094                         RDEBUG2("Ignoring conflicting proxy reply");
3095                         
3096                 
3097                         /* assert that there's an event queued for request? */
3098                         return NULL;
3099                 } /* else it had previously passed verification */
3100
3101                 /*
3102                  *      Verify the packet before doing ANYTHING with
3103                  *      it.  This means we're doing more MD5 checks in
3104                  *      the server core.  However, we can fix that by
3105                  *      moving to multiple threads listening on
3106                  *      sockets.
3107                  *
3108                  *      We do this AFTER looking the request up in the
3109                  *      hash, and AFTER vhecking if we saw a previous
3110                  *      request.  This helps minimize the DoS effect
3111                  *      of people attacking us with spoofed packets.
3112                  *
3113                  *      FIXME: move the "read from proxy socket" code
3114                  *      into one (or more) threads.  Have it read from
3115                  *      the socket, do the validation, and write a
3116                  *      pointer to the packet into a pipe? Or queue it
3117                  *      to the main server?
3118                  */
3119         } else if (rad_verify(packet, request->proxy,
3120                               request->home_server->secret) != 0) {
3121                 DEBUG("Ignoring spoofed proxy reply.  Signature is invalid");
3122                 return NULL;
3123         }
3124
3125         /*
3126          *      Now that we know it's a good reply, see if we can
3127          *      delete it from the proxy hash.  This lets the source
3128          *      ports && Ids be re-used earlier.
3129          *
3130          *      FIXME: protect by mutex?  This is likely less relevant
3131          *      as if we have the reply, the originating thread knows to
3132          *      avoid touching the request.  Any retransmits are done from
3133          *      the main server thread (i.e. this thread).
3134          */
3135         if (request->num_proxied_requests <= request->num_proxied_responses) {
3136                 remove_from_proxy_hash(request);
3137         }
3138
3139         /*
3140          *      Check (again) if it's a duplicate reply.  We do this
3141          *      after deleting the packet from the proxy hash.
3142          */
3143         if (request->proxy_reply) {
3144                 RDEBUG2("Discarding duplicate reply from host %s port %d  - ID: %d",
3145                         inet_ntop(packet->src_ipaddr.af,
3146                                   &packet->src_ipaddr.ipaddr,
3147                                   buffer, sizeof(buffer)),
3148                         packet->src_port, packet->id);
3149         }
3150
3151         gettimeofday(&now, NULL);
3152
3153         /*
3154          *      Maybe move this earlier in the decision process?
3155          *      Having it here means that late or duplicate proxy
3156          *      replies no longer get the home server marked as
3157          *      "alive".  This might be good for stability, though.
3158          *
3159          *      FIXME: Do we really want to do this whenever we
3160          *      receive a packet?  Setting this here means that we
3161          *      mark it alive on *any* packet, even if it's lost all
3162          *      of the *other* packets in the last 10s.
3163          */
3164         if (request->proxy->code != PW_STATUS_SERVER) {
3165                 request->home_server->state = HOME_STATE_ALIVE;
3166         }
3167         
3168 #ifdef WITH_COA
3169         /*
3170          *      When originating CoA, the "proxy" reply is the reply
3171          *      to the CoA request that we originated.  At this point,
3172          *      the original request is finished, and it has a reply.
3173          *
3174          *      However, if we haven't separated the two requests, do
3175          *      so now.  This is done so that cleaning up the original
3176          *      request won't cause the CoA request to be free'd.  See
3177          *      util.c, request_free()
3178          */
3179         if (request->parent && (request->parent->coa == request)) {
3180                 request->parent->coa = NULL;
3181                 request->parent = NULL;
3182
3183                 /*
3184                  *      The proxied packet was different from the
3185                  *      original packet, AND the proxied packet was
3186                  *      a CoA: allow it.
3187                  */
3188         } else if ((request->packet->code != request->proxy->code) &&
3189                    ((request->proxy->code == PW_COA_REQUEST) ||
3190                     (request->proxy->code == PW_DISCONNECT_REQUEST))) {
3191           /*
3192            *    It's already divorced: do nothing.
3193            */
3194           
3195         } else
3196                 /*
3197                  *      Skip the next set of checks, as the original
3198                  *      reply is cached.  We want to be able to still
3199                  *      process the CoA reply, AND to reference the
3200                  *      original request/reply.
3201                  *
3202                  *      This is getting to be really quite a bit of a
3203                  *      hack.
3204                  */
3205 #endif
3206
3207         /*
3208          *      If there's a reply to the NAS, ignore everything
3209          *      related to proxy responses
3210          */
3211         if (request->reply && request->reply->code != 0) {
3212                 RDEBUG2("Ignoring proxy reply that arrived after we sent a reply to the NAS");
3213                 return NULL;
3214         }
3215         
3216 #ifdef WITH_STATS
3217         /*
3218          *      The average includes our time to receive packets and
3219          *      look them up in the hashes, which should be the same
3220          *      for all packets.
3221          *
3222          *      We update the response time only for the FIRST packet
3223          *      we receive.
3224          */
3225         if (request->home_server->ema.window > 0) {
3226                 radius_stats_ema(&request->home_server->ema,
3227                                  &now, &request->proxy_when);
3228         }
3229 #endif
3230
3231         switch (request->child_state) {
3232         case REQUEST_QUEUED:
3233         case REQUEST_RUNNING:
3234                 radlog(L_ERR, "Internal sanity check failed for child state");
3235                 /* FALL-THROUGH */
3236
3237         case REQUEST_REJECT_DELAY:
3238         case REQUEST_CLEANUP_DELAY:
3239         case REQUEST_DONE:
3240                 radlog(L_ERR, "Reply from home server %s port %d  - ID: %d arrived too late for request %u. Try increasing 'retry_delay' or 'max_request_time'",
3241                        inet_ntop(packet->src_ipaddr.af,
3242                                  &packet->src_ipaddr.ipaddr,
3243                                  buffer, sizeof(buffer)),
3244                        packet->src_port, packet->id,
3245                        request->number);
3246                 /* assert that there's an event queued for request? */
3247                 return NULL;
3248
3249         case REQUEST_PROXIED:
3250                 break;
3251         }
3252
3253         request->proxy_reply = packet;
3254
3255 #if 0
3256         /*
3257          *      Perform RTT calculations, as per RFC 2988 (for TCP).
3258          *      Note that we only do so on the first response.
3259          */
3260         if ((request->num_proxied_responses == 1)
3261                 int rtt;
3262                 home_server *home = request->home_server;
3263
3264                 rtt = now.tv_sec - request->proxy_when.tv_sec;
3265                 rtt *= USEC;
3266                 rtt += now.tv_usec;
3267                 rtt -= request->proxy_when.tv_usec;
3268
3269                 if (!home->has_rtt) {
3270                         home->has_rtt = TRUE;
3271
3272                         home->srtt = rtt;
3273                         home->rttvar = rtt / 2;
3274
3275                 } else {
3276                         home->rttvar -= home->rttvar >> 2;
3277                         home->rttvar += (home->srtt - rtt);
3278                         home->srtt -= home->srtt >> 3;
3279                         home->srtt += rtt >> 3;
3280                 }
3281
3282                 home->rto = home->srtt;
3283                 if (home->rttvar > (USEC / 4)) {
3284                         home->rto += home->rttvar * 4;
3285                 } else {
3286                         home->rto += USEC;
3287                 }
3288         }
3289 #endif
3290
3291         /*
3292          *      There's no incoming request, so it's a proxied packet
3293          *      we originated.
3294          */
3295         if (!request->packet) {
3296                 received_response_to_ping(request);
3297                 request->proxy_reply = NULL; /* caller will free it */
3298                 ev_request_free(&request);
3299                 return NULL;
3300         }
3301
3302         request->child_state = REQUEST_QUEUED;
3303         request->when = now;
3304         request->delay = USEC;
3305         request->priority = RAD_LISTEN_PROXY;
3306         tv_add(&request->when, request->delay);
3307
3308         /*
3309          *      Wait a bit will take care of max_request_time
3310          */
3311         INSERT_EVENT(wait_a_bit, request);
3312
3313         return request;
3314 }
3315
3316 #endif /* WITH_PROXY */
3317
3318 #ifdef WITH_TCP
3319 static void tcp_socket_lifetime(void *ctx)
3320 {
3321         rad_listen_t *listener = ctx;
3322         char buffer[256];
3323
3324         listener->print(listener, buffer, sizeof(buffer));
3325
3326         DEBUG("Reached maximum lifetime on socket %s", buffer);
3327
3328         listener->status = RAD_LISTEN_STATUS_CLOSED;
3329         event_new_fd(listener);
3330 }
3331
3332 static void tcp_socket_idle_timeout(void *ctx)
3333 {
3334         rad_listen_t *listener = ctx;
3335         listen_socket_t *sock = listener->data;
3336         char buffer[256];
3337
3338         fr_event_now(el, &now); /* should always succeed... */
3339
3340         rad_assert(sock->home != NULL);
3341
3342         /*
3343          *      We implement idle timeout by polling, because it's
3344          *      cheaper than resetting the idle timeout every time
3345          *      we send / receive a packet.
3346          */
3347         if ((sock->last_packet + sock->home->idle_timeout) > now.tv_sec) {
3348                 struct timeval when;
3349                 void *fun = tcp_socket_idle_timeout;
3350                 
3351                 when.tv_sec = sock->last_packet;
3352                 when.tv_sec += sock->home->idle_timeout;
3353                 when.tv_usec = 0;
3354
3355                 if (sock->home->lifetime &&
3356                     (sock->opened + sock->home->lifetime < when.tv_sec)) {
3357                         when.tv_sec = sock->opened + sock->home->lifetime;
3358                         fun = tcp_socket_lifetime;
3359                 }
3360                 
3361                 if (!fr_event_insert(el, fun, listener, &when, &sock->ev)) {
3362                         rad_panic("Failed to insert event");
3363                 }
3364
3365                 return;
3366         }
3367
3368         listener->print(listener, buffer, sizeof(buffer));
3369         
3370         DEBUG("Reached idle timeout on socket %s", buffer);
3371
3372         listener->status = RAD_LISTEN_STATUS_CLOSED;
3373         event_new_fd(listener);
3374 }
3375 #endif
3376
3377 int event_new_fd(rad_listen_t *this)
3378 {
3379         char buffer[1024];
3380
3381         if (this->status == RAD_LISTEN_STATUS_KNOWN) return 1;
3382
3383         this->print(this, buffer, sizeof(buffer));
3384
3385         if (this->status == RAD_LISTEN_STATUS_INIT) {
3386                 if (just_started) {
3387                         DEBUG("Listening on %s", buffer);
3388                 } else {
3389                         radlog(L_INFO, " ... adding new socket %s", buffer);
3390                 }
3391
3392 #ifdef WITH_PROXY
3393                 /*
3394                  *      Add it to the list of sockets we can use.
3395                  *      Server sockets (i.e. auth/acct) are never
3396                  *      added to the packet list.
3397                  */
3398                 if (this->type == RAD_LISTEN_PROXY) {
3399                         listen_socket_t *sock = this->data;
3400
3401                         PTHREAD_MUTEX_LOCK(&proxy_mutex);
3402                         if (!fr_packet_list_socket_add(proxy_list, this->fd,
3403                                                        sock->proto,
3404                                                        &sock->other_ipaddr, sock->other_port,
3405                                                        this)) {
3406
3407                                 proxy_no_new_sockets = TRUE;
3408                                 PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
3409
3410                                 /*
3411                                  *      This is bad.  However, the
3412                                  *      packet list now supports 256
3413                                  *      open sockets, which should
3414                                  *      minimize this problem.
3415                                  */
3416                                 radlog(L_ERR, "Failed adding proxy socket: %s",
3417                                        fr_strerror());
3418                                 return 0;
3419                         }
3420
3421                         if (sock->home) {
3422                                 sock->home->num_connections++;
3423                                 
3424                                 /*
3425                                  *      If necessary, add it to the list of
3426                                  *      new proxy listeners.
3427                                  */
3428                                 if (sock->home->lifetime || sock->home->idle_timeout) {
3429                                         this->next = proxy_listener_list;
3430                                         proxy_listener_list = this;
3431                                 }
3432                         }
3433                         PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
3434
3435                         /*
3436                          *      Tell the main thread that we've added
3437                          *      a proxy listener, but only if we need
3438                          *      to update the event list.  Do this
3439                          *      with the mutex unlocked, to reduce
3440                          *      contention.
3441                          */
3442                         if (sock->home) {
3443                                 if (sock->home->lifetime || sock->home->idle_timeout) {
3444                                         radius_signal_self(RADIUS_SIGNAL_SELF_NEW_FD);
3445                                 }
3446                         }
3447                 }
3448 #endif          
3449
3450 #ifdef WITH_DETAIL
3451                 /*
3452                  *      Detail files are always known, and aren't
3453                  *      put into the socket event loop.
3454                  */
3455                 if (this->type == RAD_LISTEN_DETAIL) {
3456                         this->status = RAD_LISTEN_STATUS_KNOWN;
3457                         
3458                         /*
3459                          *      Set up the first poll interval.
3460                          */
3461                         event_poll_detail(this);
3462                         return 1;
3463                 }
3464 #endif
3465
3466                 FD_MUTEX_LOCK(&fd_mutex);
3467                 if (!fr_event_fd_insert(el, 0, this->fd,
3468                                         event_socket_handler, this)) {
3469                         radlog(L_ERR, "Failed adding event handler for proxy socket!");
3470                         exit(1);
3471                 }
3472                 FD_MUTEX_UNLOCK(&fd_mutex);
3473                 
3474                 this->status = RAD_LISTEN_STATUS_KNOWN;
3475                 return 1;
3476         }
3477
3478         /*
3479          *      Something went wrong with the socket: make it harmless.
3480          */
3481         if (this->status == RAD_LISTEN_STATUS_REMOVE_FD) {
3482                 int devnull;
3483
3484                 /*
3485                  *      Remove it from the list of live FD's.
3486                  */
3487                 FD_MUTEX_LOCK(&fd_mutex);
3488                 fr_event_fd_delete(el, 0, this->fd);
3489                 FD_MUTEX_UNLOCK(&fd_mutex);
3490
3491 #ifdef WITH_TCP
3492                 /*
3493                  *      We track requests using this socket only for
3494                  *      TCP.  For UDP, we don't currently close
3495                  *      sockets.
3496                  */
3497 #ifdef WITH_PROXY
3498                 if (this->type != RAD_LISTEN_PROXY)
3499 #endif
3500                 {
3501                         if (this->count != 0) {
3502                                 fr_packet_list_walk(pl, this,
3503                                                     remove_all_requests);
3504                         }
3505
3506                         if (this->count == 0) {
3507                                 this->status = RAD_LISTEN_STATUS_FINISH;
3508                                 goto finish;
3509                         }
3510                 }               
3511 #ifdef WITH_PROXY
3512                 else {
3513                         int count = this->count;
3514
3515                         /*
3516                          *      Duplicate code
3517                          */
3518                         PTHREAD_MUTEX_LOCK(&proxy_mutex);
3519                         if (!fr_packet_list_socket_freeze(proxy_list,
3520                                                           this->fd)) {
3521                                 radlog(L_ERR, "Fatal error freezing socket: %s",
3522                                        fr_strerror());
3523                                 exit(1);
3524                         }
3525
3526                         /*
3527                          *      Doing this with the proxy mutex held
3528                          *      is a Bad Thing.  We should move to
3529                          *      finer-grained mutexes.
3530                          */
3531                         count = this->count;
3532                         if (count > 0) {
3533                                 fr_packet_list_walk(proxy_list, this,
3534                                                     remove_all_proxied_requests);
3535                         }
3536                         count = this->count; /* protected by mutex */
3537                         PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
3538
3539                         if (count == 0) {
3540                                 this->status = RAD_LISTEN_STATUS_FINISH;
3541                                 goto finish;
3542                         }
3543                 }
3544 #endif  /* WITH_PROXY */
3545 #endif  /* WITH_TCP */
3546
3547                 /*
3548                  *      Re-open the socket, pointing it to /dev/null.
3549                  *      This means that all writes proceed without
3550                  *      blocking, and all reads return "no data".
3551                  *
3552                  *      This leaves the socket active, so any child
3553                  *      threads won't go insane.  But it means that
3554                  *      they cannot send or receive any packets.
3555                  *
3556                  *      This is EXTRA work in the normal case, when
3557                  *      sockets are closed without error.  But it lets
3558                  *      us have one simple processing method for all
3559                  *      sockets.
3560                  */
3561                 devnull = open("/dev/null", O_RDWR);
3562                 if (devnull < 0) {
3563                         radlog(L_ERR, "FATAL failure opening /dev/null: %s",
3564                                strerror(errno));
3565                         exit(1);
3566                 }
3567                 if (dup2(devnull, this->fd) < 0) {
3568                         radlog(L_ERR, "FATAL failure closing socket: %s",
3569                                strerror(errno));
3570                         exit(1);
3571                 }
3572                 close(devnull);
3573
3574                 this->status = RAD_LISTEN_STATUS_CLOSED;
3575
3576                 /*
3577                  *      Fall through to the next section.
3578                  */
3579         }
3580
3581 #ifdef WITH_TCP
3582         /*
3583          *      Called ONLY from the main thread.  On the following
3584          *      conditions:
3585          *
3586          *      idle timeout
3587          *      max lifetime
3588          *
3589          *      (and falling through from "forcibly close FD" above)
3590          *      client closed connection on us
3591          *      client sent us a bad packet.
3592          */
3593         if (this->status == RAD_LISTEN_STATUS_CLOSED) {
3594                 int count = this->count;
3595                 rad_assert(this->type != RAD_LISTEN_DETAIL);
3596
3597 #ifdef WITH_PROXY
3598                 /*
3599                  *      Remove it from the list of active sockets, so
3600                  *      that it isn't used when proxying new packets.
3601                  */
3602                 if (this->type == RAD_LISTEN_PROXY) {
3603                         PTHREAD_MUTEX_LOCK(&proxy_mutex);
3604                         if (!fr_packet_list_socket_freeze(proxy_list,
3605                                                           this->fd)) {
3606                                 radlog(L_ERR, "Fatal error freezing socket: %s",
3607                                        fr_strerror());
3608                                 exit(1);
3609                         }
3610                         count = this->count; /* protected by mutex */
3611                         PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
3612                 }
3613 #endif
3614
3615                 /*
3616                  *      Requests are still using the socket.  Wait for
3617                  *      them to finish.
3618                  */
3619                 if (count != 0) {
3620                         struct timeval when;
3621                         listen_socket_t *sock = this->data;
3622
3623                         /*
3624                          *      Try again to clean up the socket in 30
3625                          *      seconds.
3626                          */
3627                         gettimeofday(&when, NULL);
3628                         when.tv_sec += 30;
3629                         
3630                         if (!fr_event_insert(el,
3631                                              (fr_event_callback_t) event_new_fd,
3632                                              this, &when, &sock->ev)) {
3633                                 rad_panic("Failed to insert event");
3634                         }
3635                        
3636                         return 1;
3637                 }
3638
3639                 /*
3640                  *      No one is using this socket: we can delete it
3641                  *      immediately.
3642                  */
3643                 this->status = RAD_LISTEN_STATUS_FINISH;
3644         }
3645         
3646 finish:
3647         if (this->status == RAD_LISTEN_STATUS_FINISH) {
3648                 listen_socket_t *sock = this->data;
3649
3650                 rad_assert(this->count == 0);
3651                 radlog(L_INFO, " ... closing socket %s", buffer);
3652
3653                 /*
3654                  *      Remove it from the list of live FD's.  Note
3655                  *      that it MAY also have been removed above.  We
3656                  *      do it again here, to catch the case of sockets
3657                  *      closing on idle timeout, or max
3658                  *      lifetime... AFTER all requests have finished
3659                  *      using it.
3660                  */
3661                 FD_MUTEX_LOCK(&fd_mutex);
3662                 fr_event_fd_delete(el, 0, this->fd);
3663                 FD_MUTEX_UNLOCK(&fd_mutex);
3664                 
3665 #ifdef WITH_PROXY
3666                 /*
3667                  *      Remove it from the list of sockets to be used
3668                  *      when proxying.
3669                  */
3670                 if (this->type == RAD_LISTEN_PROXY) {
3671                         PTHREAD_MUTEX_LOCK(&proxy_mutex);
3672                         if (!fr_packet_list_socket_remove(proxy_list,
3673                                                           this->fd, NULL)) {
3674                                 radlog(L_ERR, "Fatal error removing socket: %s",
3675                                        fr_strerror());
3676                                 exit(1);
3677                         }
3678                         if (sock->home) sock->home->num_connections--;
3679                         PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
3680                 }
3681 #endif
3682
3683                 /*
3684                  *      Remove any pending cleanups.
3685                  */
3686                 if (sock->ev) fr_event_delete(el, &sock->ev);
3687
3688                 /*
3689                  *      And finally, close the socket.
3690                  */
3691                 listen_free(&this);
3692         }
3693 #endif  /* WITH_TCP */
3694
3695         return 1;
3696 }
3697
3698 static void handle_signal_self(int flag)
3699 {
3700         if ((flag & (RADIUS_SIGNAL_SELF_EXIT | RADIUS_SIGNAL_SELF_TERM)) != 0) {
3701                 if ((flag & RADIUS_SIGNAL_SELF_EXIT) != 0) {
3702                         radlog(L_INFO, "Received TERM signal");
3703                         fr_event_loop_exit(el, 1);
3704                 } else {
3705                         fr_event_loop_exit(el, 2);
3706                 }
3707
3708                 return;
3709         } /* else exit/term flags weren't set */
3710
3711         /*
3712          *      Tell the even loop to stop processing.
3713          */
3714         if ((flag & RADIUS_SIGNAL_SELF_HUP) != 0) {
3715                 time_t when;
3716                 static time_t last_hup = 0;
3717
3718                 when = time(NULL);
3719                 if ((int) (when - last_hup) < 5) {
3720                         radlog(L_INFO, "Ignoring HUP (less than 5s since last one)");
3721                         return;
3722                 }
3723
3724                 radlog(L_INFO, "Received HUP signal.");
3725
3726                 last_hup = when;
3727
3728                 fr_event_loop_exit(el, 0x80);
3729         }
3730
3731 #ifdef WITH_DETAIL
3732         if ((flag & RADIUS_SIGNAL_SELF_DETAIL) != 0) {
3733                 rad_listen_t *this;
3734                 
3735                 /*
3736                  *      FIXME: O(N) loops suck.
3737                  */
3738                 for (this = mainconfig.listen;
3739                      this != NULL;
3740                      this = this->next) {
3741                         if (this->type != RAD_LISTEN_DETAIL) continue;
3742
3743                         /*
3744                          *      This one didn't send the signal, skip
3745                          *      it.
3746                          */
3747                         if (!this->decode(this, NULL)) continue;
3748
3749                         /*
3750                          *      Go service the interrupt.
3751                          */
3752                         event_poll_detail(this);
3753                 }
3754         }
3755 #endif
3756
3757 #ifdef WITH_TCP
3758 #ifdef WITH_PROXY
3759         /*
3760          *      Add event handlers for idle timeouts && maximum lifetime.
3761          */
3762         if ((flag & RADIUS_SIGNAL_SELF_NEW_FD) != 0) {
3763                 struct timeval when;
3764                 void *fun = NULL;
3765
3766                 fr_event_now(el, &now);
3767
3768                 PTHREAD_MUTEX_LOCK(&proxy_mutex);
3769
3770                 while (proxy_listener_list) {
3771                         rad_listen_t *this = proxy_listener_list;
3772                         listen_socket_t *sock = this->data;
3773
3774                         proxy_listener_list = this->next;
3775                         this->next = NULL;
3776
3777                         if (!sock->home) continue; /* skip UDP sockets */
3778
3779                         when = now;
3780
3781                         if (!sock->home->idle_timeout) {
3782                                 rad_assert(sock->home->lifetime != 0);
3783
3784                                 when.tv_sec += sock->home->lifetime;
3785                                 fun = tcp_socket_lifetime;
3786                         } else {
3787                                 rad_assert(sock->home->idle_timeout != 0);
3788
3789                                 when.tv_sec += sock->home->idle_timeout;
3790                                 fun = tcp_socket_idle_timeout;
3791                         }
3792
3793                         if (!fr_event_insert(el, fun, this, &when,
3794                                              &(sock->ev))) {
3795                                 rad_panic("Failed to insert event");
3796                         }
3797                 }
3798
3799                 PTHREAD_MUTEX_UNLOCK(&proxy_mutex);
3800         }
3801 #endif  /* WITH_PROXY */
3802 #endif  /* WITH_TCP */
3803 }
3804
3805 #ifndef WITH_SELF_PIPE
/*
 *      Without a self-pipe, the signal flags are handled directly in
 *      the caller's context.
 */
void radius_signal_self(int flag)
{
        handle_signal_self(flag);
}
3810 #else
3811 /*
3812  *      Inform ourselves that we received a signal.
3813  */
3814 void radius_signal_self(int flag)
3815 {
3816         ssize_t rcode;
3817         uint8_t buffer[16];
3818
3819         /*
3820          *      The read MUST be non-blocking for this to work.
3821          */
3822         rcode = read(self_pipe[0], buffer, sizeof(buffer));
3823         if (rcode > 0) {
3824                 ssize_t i;
3825
3826                 for (i = 0; i < rcode; i++) {
3827                         buffer[0] |= buffer[i];
3828                 }
3829         } else {
3830                 buffer[0] = 0;
3831         }
3832
3833         buffer[0] |= flag;
3834
3835         write(self_pipe[1], buffer, 1);
3836 }
3837
3838
3839 static void event_signal_handler(UNUSED fr_event_list_t *xel,
3840                                  UNUSED int fd, UNUSED void *ctx)
3841 {
3842         ssize_t i, rcode;
3843         uint8_t buffer[32];
3844
3845         rcode = read(self_pipe[0], buffer, sizeof(buffer));
3846         if (rcode <= 0) return;
3847
3848         /*
3849          *      Merge pending signals.
3850          */
3851         for (i = 0; i < rcode; i++) {
3852                 buffer[0] |= buffer[i];
3853         }
3854
3855         handle_signal_self(buffer[0]);
3856 }
3857 #endif
3858
3859
3860 static void event_socket_handler(fr_event_list_t *xel, UNUSED int fd,
3861                                  void *ctx)
3862 {
3863         rad_listen_t *listener = ctx;
3864         RAD_REQUEST_FUNP fun;
3865         REQUEST *request;
3866
3867         rad_assert(xel == el);
3868
3869         xel = xel;
3870
3871         if (listener->fd < 0) rad_panic("Socket was closed on us!");
3872         
3873         if (!listener->recv(listener, &fun, &request)) return;
3874
3875         if (!thread_pool_addrequest(request, fun)) {
3876                 request->child_state = REQUEST_DONE;
3877         }
3878 }
3879
3880
3881 /*
3882  *      This function is called periodically to see if this detail
3883  *      file is available for reading.
3884  */
3885 static void event_poll_detail(void *ctx)
3886 {
3887         int rcode, delay;
3888         RAD_REQUEST_FUNP fun;
3889         REQUEST *request;
3890         rad_listen_t *this = ctx;
3891         struct timeval when;
3892         listen_detail_t *detail = this->data;
3893
3894         rad_assert(this->type == RAD_LISTEN_DETAIL);
3895
3896         /*
3897          *      Try to read something.
3898          *
3899          *      FIXME: This does poll AND receive.
3900          */
3901         rcode = this->recv(this, &fun, &request);
3902         if (rcode != 0) {
3903                 rad_assert(fun != NULL);
3904                 rad_assert(request != NULL);
3905                 
3906                 if (!thread_pool_addrequest(request, fun)) {
3907                         request->child_state = REQUEST_DONE;
3908                 }
3909         }
3910
3911         fr_event_now(el, &now);
3912         when = now;
3913
3914         /*
3915          *      Backdoor API to get the delay until the next poll
3916          *      time.
3917          */
3918         delay = this->encode(this, NULL);
3919         tv_add(&when, delay);
3920
3921         if (!fr_event_insert(el, event_poll_detail, this,
3922                              &when, &detail->ev)) {
3923                 radlog(L_ERR, "Failed creating handler");
3924                 exit(1);
3925         }
3926 }
3927
3928
3929 static void event_status(struct timeval *wake)
3930 {
3931 #if !defined(HAVE_PTHREAD_H) && defined(WNOHANG)
3932         int argval;
3933 #endif
3934
3935         if (debug_flag == 0) {
3936                 if (just_started) {
3937                         radlog(L_INFO, "Ready to process requests.");
3938                         just_started = FALSE;
3939                 }
3940                 return;
3941         }
3942
3943         if (!wake) {
3944                 radlog(L_INFO, "Ready to process requests.");
3945
3946         } else if ((wake->tv_sec != 0) ||
3947                    (wake->tv_usec >= 100000)) {
3948                 DEBUG("Waking up in %d.%01u seconds.",
3949                       (int) wake->tv_sec, (unsigned int) wake->tv_usec / 100000);
3950         }
3951
3952
3953         /*
3954          *      FIXME: Put this somewhere else, where it isn't called
3955          *      all of the time...
3956          */
3957
3958 #if !defined(HAVE_PTHREAD_H) && defined(WNOHANG)
3959         /*
3960          *      If there are no child threads, then there may
3961          *      be child processes.  In that case, wait for
3962          *      their exit status, and throw that exit status
3963          *      away.  This helps get rid of zxombie children.
3964          */
3965         while (waitpid(-1, &argval, WNOHANG) > 0) {
3966                 /* do nothing */
3967         }
3968 #endif
3969
3970 }
3971
3972 /*
3973  *      Externally-visible functions.
3974  */
3975 int radius_event_init(CONF_SECTION *cs, int spawn_flag)
3976 {
3977         rad_listen_t *head = NULL;
3978
3979         if (el) return 0;
3980
3981         time(&fr_start_time);
3982
3983         el = fr_event_list_create(event_status);
3984         if (!el) return 0;
3985
3986         pl = fr_packet_list_create(0);
3987         if (!pl) return 0;      /* leak el */
3988
3989         request_num_counter = 0;
3990
3991 #ifdef WITH_PROXY
3992         if (mainconfig.proxy_requests) {
3993                 /*
3994                  *      Create the tree for managing proxied requests and
3995                  *      responses.
3996                  */
3997                 proxy_list = fr_packet_list_create(1);
3998                 if (!proxy_list) return 0;
3999
4000 #ifdef HAVE_PTHREAD_H
4001                 if (pthread_mutex_init(&proxy_mutex, NULL) != 0) {
4002                         radlog(L_ERR, "FATAL: Failed to initialize proxy mutex: %s",
4003                                strerror(errno));
4004                         exit(1);
4005                 }
4006 #endif
4007         }
4008 #endif
4009
4010 #ifdef HAVE_PTHREAD_H
4011 #ifndef __MINGW32__
4012         NO_SUCH_CHILD_PID = (pthread_t ) (0);
4013 #else
4014         NO_SUCH_CHILD_PID = pthread_self(); /* not a child thread */
4015 #endif
4016         /*
4017          *      Initialize the threads ONLY if we're spawning, AND
4018          *      we're running normally.
4019          */
4020         if (spawn_flag && !check_config &&
4021             (thread_pool_init(cs, &spawn_flag) < 0)) {
4022                 exit(1);
4023         }
4024 #endif
4025
4026         /*
4027          *      Move all of the thread calls to this file?
4028          *
4029          *      It may be best for the mutexes to be in this file...
4030          */
4031         have_children = spawn_flag;
4032
4033         if (check_config) {
4034                 DEBUG("%s: #### Skipping IP addresses and Ports ####",
4035                        mainconfig.name);
4036                 return 1;
4037         }
4038
4039 #ifdef WITH_SELF_PIPE
4040         /*
4041          *      Child threads need a pipe to signal us, as do the
4042          *      signal handlers.
4043          */
4044         if (pipe(self_pipe) < 0) {
4045                 radlog(L_ERR, "radiusd: Error opening internal pipe: %s",
4046                        strerror(errno));
4047                 exit(1);
4048         }
4049         if (fcntl(self_pipe[0], F_SETFL, O_NONBLOCK | FD_CLOEXEC) < 0) {
4050                 radlog(L_ERR, "radiusd: Error setting internal flags: %s",
4051                        strerror(errno));
4052                 exit(1);
4053         }
4054         if (fcntl(self_pipe[1], F_SETFL, O_NONBLOCK | FD_CLOEXEC) < 0) {
4055                 radlog(L_ERR, "radiusd: Error setting internal flags: %s",
4056                        strerror(errno));
4057                 exit(1);
4058         }
4059
4060         if (!fr_event_fd_insert(el, 0, self_pipe[0],
4061                                   event_signal_handler, el)) {
4062                 radlog(L_ERR, "Failed creating handler for signals");
4063                 exit(1);
4064         }
4065 #endif  /* WITH_SELF_PIPE */
4066
4067        DEBUG("%s: #### Opening IP addresses and Ports ####",
4068                mainconfig.name);
4069
4070        /*
4071         *       The server temporarily switches to an unprivileged
4072         *       user very early in the bootstrapping process.
4073         *       However, some sockets MAY require privileged access
4074         *       (bind to device, or to port < 1024, or to raw
4075         *       sockets).  Those sockets need to call suid up/down
4076         *       themselves around the functions that need a privileged
4077         *       uid.
4078         */
4079         if (listen_init(cs, &head) < 0) {
4080                 _exit(1);
4081         }
4082         
4083         mainconfig.listen = head;
4084
4085         /*
4086          *      At this point, no one has any business *ever* going
4087          *      back to root uid.
4088          */
4089         fr_suid_down_permanent();
4090
4091         return 1;
4092 }
4093
4094
4095 static int request_hash_cb(UNUSED void *ctx, void *data)
4096 {
4097         REQUEST *request = fr_packet2myptr(REQUEST, packet, data);
4098
4099 #ifdef WITH_PROXY
4100         rad_assert(request->in_proxy_hash == FALSE);
4101 #endif
4102
4103         ev_request_free(&request);
4104
4105         return 0;
4106 }
4107
4108
4109 #ifdef WITH_PROXY
4110 static int proxy_hash_cb(UNUSED void *ctx, void *data)
4111 {
4112         REQUEST *request = fr_packet2myptr(REQUEST, proxy, data);
4113
4114         ev_request_free(&request);
4115
4116         return 0;
4117 }
4118 #endif
4119
4120 void radius_event_free(void)
4121 {
4122         /*
4123          *      FIXME: Stop all threads, or at least check that
4124          *      they're all waiting on the semaphore, and the queues
4125          *      are empty.
4126          */
4127
4128 #ifdef WITH_PROXY
4129         /*
4130          *      There are requests in the proxy hash that aren't
4131          *      referenced from anywhere else.  Remove them first.
4132          */
4133         if (proxy_list) {
4134                 fr_packet_list_walk(proxy_list, NULL, proxy_hash_cb);
4135                 fr_packet_list_free(proxy_list);
4136                 proxy_list = NULL;
4137         }
4138 #endif
4139
4140         fr_packet_list_walk(pl, NULL, request_hash_cb);
4141
4142         fr_packet_list_free(pl);
4143         pl = NULL;
4144
4145         fr_event_list_free(el);
4146 }
4147
4148 int radius_event_process(void)
4149 {
4150         if (!el) return 0;
4151
4152         return fr_event_loop(el);
4153 }
4154
4155 void radius_handle_request(REQUEST *request, RAD_REQUEST_FUNP fun)
4156 {
4157         request->options = RAD_REQUEST_OPTION_DEBUG2;
4158
4159         if (request_pre_handler(request)) {
4160                 rad_assert(fun != NULL);
4161                 rad_assert(request != NULL);
4162                 
4163                 if (request->server) RDEBUG("server %s {",
4164                                             request->server != NULL ?
4165                                             request->server : ""); 
4166                 fun(request);
4167
4168                 if (request->server) RDEBUG("} # server %s",
4169                                              request->server != NULL ?
4170                                             request->server : "");
4171
4172                 request_post_handler(request);
4173         }
4174
4175         DEBUG2("Going to the next request");
4176         return;
4177 }