2 * detail.c Process the detail file
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
20 * Copyright 2007 The FreeRADIUS server project
21 * Copyright 2007 Alan DeKok <aland@deployingradius.com>
24 #include <freeradius-devel/ident.h>
27 #include <freeradius-devel/radiusd.h>
28 #include <freeradius-devel/modules.h>
29 #include <freeradius-devel/detail.h>
30 #include <freeradius-devel/rad_assert.h>
32 #ifdef HAVE_SYS_STAT_H
44 #define USEC (1000000)
/*
 * Printable names for the listener states.  Looked up with
 * fr_int2str(state_names, data->state, ...) when logging the state.
 */
46 static FR_NAME_NUMBER state_names[] = {
47 { "unopened", STATE_UNOPENED },
48 { "unlocked", STATE_UNLOCKED },
49 { "header", STATE_HEADER },
50 { "reading", STATE_READING },
51 { "queued", STATE_QUEUED },
52 { "running", STATE_RUNNING },
53 { "no-reply", STATE_NO_REPLY },
54 { "replied", STATE_REPLIED },
60 * If we're limiting outstanding packets, then mark the response
/*
 * Record the outcome of a request that was read from the detail file.
 *
 * With no reply code the listener is moved to STATE_NO_REPLY and the
 * next attempt is scheduled retry_interval seconds ahead.  Otherwise
 * the smoothed round trip time is updated, the delay before the next
 * read is derived from load_factor, and the state becomes
 * STATE_REPLIED.  Both paths call
 * radius_signal_self(RADIUS_SIGNAL_SELF_DETAIL).
 */
63 int detail_send(rad_listen_t *listener, REQUEST *request)
67 listen_detail_t *data = listener->data;
69 rad_assert(request->listener == listener);
70 rad_assert(listener->send == detail_send);
73 * This request timed out. Remember that, and tell the
74 * caller it's OK to read more "detail" file stuff.
76 if (request->reply->code == 0) {
/* retry_interval is logged below as seconds; delay_time is kept in microseconds. */
77 data->delay_time = data->retry_interval * USEC;
79 data->state = STATE_NO_REPLY;
81 RDEBUG("Detail - No response configured for request %d. Will retry in %d seconds",
82 request->number, data->retry_interval);
84 radius_signal_self(RADIUS_SIGNAL_SELF_DETAIL);
89 * We call gettimeofday a lot. But it should be OK,
90 * because there's nothing else to do.
92 gettimeofday(&now, NULL);
95 * If we haven't sent a packet in the last second, reset
/* Drop the RTT estimate when last_packet is earlier than the comparison time. */
99 if (timercmp(&data->last_packet, &now, <)) {
100 data->has_rtt = FALSE;
105 * Only one detail packet may be outstanding at a time,
106 * so it's safe to update some entries in the detail
109 * We keep smoothed round trip time (SRTT), but not round
110 * trip timeout (RTO). We use SRTT to calculate a rough
/* NOTE(review): presumably rtt ends up in microseconds; the scaling steps are not visible here - confirm. */
113 rtt = now.tv_sec - request->received.tv_sec;
116 rtt -= request->received.tv_usec;
119 * If we're proxying, the RTT is our processing time,
120 * plus the network delay there and back, plus the time
121 * on the other end to process the packet. Ideally, we
122 * should remove the network delays from the RTT, but we
123 * don't know what they are.
125 * So, to be safe, we over-estimate the total cost of
126 * processing the packet.
128 if (!data->has_rtt) {
129 data->has_rtt = TRUE;
131 data->rttvar = rtt / 2;
/* Exponential smoothing: rttvar decays by 1/4, srtt moves 1/8 of the way towards rtt. */
134 data->rttvar -= data->rttvar >> 2;
135 data->rttvar += (data->srtt - rtt);
136 data->srtt -= data->srtt >> 3;
137 data->srtt += rtt >> 3;
141 * Calculate the time we wait before sending the next
144 * rtt / (rtt + delay) = load_factor / 100
/* The equation above solved for delay.  detail_parse restricts load_factor to 1..100, so the divisor is non-zero. */
146 data->delay_time = (data->srtt * (100 - data->load_factor)) / (data->load_factor);
149 * Cap delay at 4 packets/s. If the end system can't
150 * handle this, then it's very broken.
152 if (data->delay_time > (USEC / 4)) data->delay_time= USEC / 4;
/* NOTE(review): delay_time was just capped at USEC / 4, so delay_time / USEC below is 0 for any non-negative delay and the message always reports 0 seconds. */
154 RDEBUG3("Received response for request %d. Will read the next packet in %d seconds",
155 request->number, data->delay_time / USEC);
157 data->last_packet = now;
159 data->state = STATE_REPLIED;
160 radius_signal_self(RADIUS_SIGNAL_SELF_DETAIL);
167 * Open the detail file, if we can.
169 * FIXME: create it, if it's not already there, so that the main
170 * server select() will wake us up if there's anything to read.
/*
 * Open the file that detail_recv will read.
 *
 * The work file (data->filename_work) is tried first.  The remaining
 * steps look up the detail file with stat(), fall back to glob() and
 * pick a match by st_ctime, open that file and rename it to the work
 * file.  On success the listener state becomes STATE_UNLOCKED and
 * client_ip is reset to AF_UNSPEC.
 *
 * detail_recv treats a zero return as nothing opened.
 */
172 static int detail_open(rad_listen_t *this)
175 listen_detail_t *data = this->data;
176 char *filename = data->filename;
178 rad_assert(data->state == STATE_UNOPENED);
179 data->delay_time = USEC;
182 * Open detail.work first, so we don't lose
183 * accounting packets. It's probably better to
184 * duplicate them than to lose them.
186 * Note that we're not writing to the file, but
187 * we've got to open it for writing in order to
188 * establish the lock, to prevent rlm_detail from
191 * This also means that if we're doing globbing,
192 * this file will be read && processed before the
193 * file globbing is done.
195 this->fd = open(data->filename_work, O_RDWR);
197 DEBUG2("Polling for detail file %s", filename);
200 * Try reading the detail file. If it
201 * doesn't exist, we can't do anything.
203 * Doing the stat will tell us if the file
204 * exists, even if we don't have permissions
207 if (stat(filename, &st) < 0) {
/* The configured name did not stat; treat it as a glob pattern. */
214 memset(&files, 0, sizeof(files));
215 if (glob(filename, 0, NULL, &files) != 0) {
/* Scan the matches, skipping any that cannot be stat()ed, and track the smallest st_ctime seen. */
221 for (i = 0; i < files.gl_pathc; i++) {
222 if (stat(files.gl_pathv[i], &st) < 0) continue;
225 (st.st_ctime < chtime)) {
226 chtime = st.st_ctime;
/* NOTE(review): no NULL check on the strdup() result is visible before it reaches open() - confirm. */
236 filename = strdup(files.gl_pathv[found]);
244 * Open it BEFORE we rename it, just to
247 this->fd = open(filename, O_RDWR);
249 radlog(L_ERR, "Detail - Failed to open %s: %s",
250 filename, strerror(errno));
/* filename differs from data->filename only when it was strdup()ed from a glob match, so only then is it freed. */
251 if (filename != data->filename) free(filename);
256 * Rename detail to detail.work
258 DEBUG("Detail - Renaming %s -> %s", filename, data->filename_work);
259 if (rename(filename, data->filename_work) < 0) {
260 if (filename != data->filename) free(filename);
265 if (filename != data->filename) free(filename);
266 } /* else detail.work existed, and we opened it */
268 rad_assert(data->vps == NULL);
269 rad_assert(data->fp == NULL);
271 data->state = STATE_UNLOCKED;
/* AF_UNSPEC marks that no client address has been read yet; detail_recv tests for it. */
273 data->client_ip.af = AF_UNSPEC;
284 * FIXME: add a configuration "exit when done" so that the detail
285 * file reader can be used as a one-off tool to update stuff.
287 * The time sequence for reading from the detail file is:
289 * t_0 signalled that the server is idle, and we
290 * can read from the detail file.
292 * t_rtt the packet has been processed successfully,
293 * wait for t_delay to enforce load factor.
295 * t_rtt + t_delay wait for signal that the server is idle.
/*
 * Read one record from the detail work file and submit it as an
 * accounting request.
 *
 * The function is driven by data->state.  The visible steps are:
 * open the file with detail_open, take a non-blocking lock, wrap the
 * descriptor in a stdio stream, skip to a date/time header, read
 * attribute lines until a blank line, then build a RADIUS packet from
 * the collected value-pairs and pass it to received_request().
 * At end of file the work file is unlinked and the state returns to
 * STATE_UNOPENED.
 *
 * pfun      receives rad_accounting.
 * prequest  is passed through to received_request().
 *
 * Returns 0 when there is nothing to do yet (the data->signal and
 * detail_open checks below); other return values are not visible in
 * this extract.
 */
298 int detail_recv(rad_listen_t *listener,
299 RAD_REQUEST_FUNP *pfun, REQUEST **prequest)
301 char key[256], op[8], value[1024];
302 VALUE_PAIR *vp, **tail;
303 RADIUS_PACKET *packet;
305 listen_detail_t *data = listener->data;
308 * We may be in the main thread. It needs to update the
309 * timers before we try to read from the file again.
311 if (data->signal) return 0;
313 switch (data->state) {
316 rad_assert(listener->fd < 0);
318 if (!detail_open(listener)) return 0;
320 rad_assert(data->state == STATE_UNLOCKED);
321 rad_assert(listener->fd >= 0);
326 * Try to lock fd. If we can't, return.
327 * If we can, continue. This means that
328 * the server doesn't block while waiting
329 * for the lock to open...
333 * Note that we do NOT block waiting for
334 * the lock. We've re-named the file
335 * above, so we've already guaranteed
336 * that any *new* detail writer will not
337 * be opening this file. The only
338 * purpose of the lock is to catch a race
339 * condition where the execution
340 * "ping-pongs" between radiusd &
343 if (rad_lockfd_nonblock(listener->fd, 0) < 0) {
345 * Close the FD. The main loop
346 * will wake up in a second and
351 data->state = STATE_UNOPENED;
355 data->fp = fdopen(listener->fd, "r");
357 radlog(L_ERR, "FATAL: Failed to re-open detail file %s: %s",
358 data->filename, strerror(errno));
363 * Look for the header
365 data->state = STATE_HEADER;
366 data->delay_time = USEC;
375 data->state = STATE_UNOPENED;
/* Compare the stream position with the file size to detect that everything has been consumed. */
382 fstat(listener->fd, &buf);
383 if (((off_t) ftell(data->fp)) == buf.st_size) {
389 * End of file. Delete it, and re-set
392 if (feof(data->fp)) {
394 DEBUG("Detail - unlinking %s",
395 data->filename_work);
396 unlink(data->filename_work);
397 if (data->fp) fclose(data->fp);
400 data->state = STATE_UNOPENED;
401 rad_assert(data->vps == NULL);
406 * Else go read something.
411 * Read more value-pair's, unless we're
412 * at EOF. In that case, queue whatever
416 if (data->fp && !feof(data->fp)) break;
417 data->state = STATE_QUEUED;
425 * Periodically check what's going on.
426 * If the request is taking too long,
/* data->running holds the timestamp of the packet that was handed off (set at the end of this function). */
430 if (time(NULL) < (data->running + data->retry_interval)) {
434 DEBUG("No response to detail request. Retrying");
435 data->state = STATE_NO_REPLY;
439 * If there's no reply, keep
440 * retransmitting the current packet
444 data->state = STATE_QUEUED;
448 * We have a reply. Clean up the old
449 * request, and go read another one.
452 pairfree(&data->vps);
453 data->state = STATE_HEADER;
/* Advance tail to the end of the list so new pairs are appended. */
458 while (*tail) tail = &(*tail)->next;
461 * Read a header, OR a value-pair.
463 while (fgets(buffer, sizeof(buffer), data->fp)) {
464 data->offset = ftell(data->fp); /* for statistics */
467 * Badly formatted file: delete it.
469 * FIXME: Maybe flag an error?
/* fgets() keeps the newline, so a line without one did not fit in buffer or was cut short. */
471 if (!strchr(buffer, '\n')) {
472 pairfree(&data->vps);
477 * We're reading VP's, and got a blank line.
480 if ((data->state == STATE_READING) &&
481 (buffer[0] == '\n')) {
482 data->state = STATE_QUEUED;
487 * Look for date/time header, and read VP's if
488 * found. If not, keep reading lines until we
491 if (data->state == STATE_HEADER) {
/* NOTE(review): sscanf() returns EOF, which is non-zero, when the line ends before the first conversion, so such lines also pass this test - confirm that is intended. */
494 if (sscanf(buffer, "%*s %*s %*d %*d:%*d:%*d %d", &y)) {
495 data->state = STATE_READING;
501 * We have a full "attribute = value" line.
502 * If it doesn't look reasonable, skip it.
504 * FIXME: print an error for badly formatted attributes?
/*
 * Each field width is one less than its buffer, leaving room for the
 * terminating NUL that sscanf() appends.  op[] is 8 bytes, so its
 * width must be 7; a width of 8 could write 9 bytes.
 */
506 if (sscanf(buffer, "%255s %7s %1023s", key, op, value) != 3) {
507 DEBUG2("WARNING: Skipping badly formatted line %s",
513 * Should be =, :=, +=, ...
515 if (!strchr(op, '=')) continue;
518 * Skip non-protocol attributes.
520 if (!strcasecmp(key, "Request-Authenticator")) continue;
523 * Set the original client IP address, based on
524 * what's in the detail file.
526 * Hmm... we don't set the server IP address.
529 if (!strcasecmp(key, "Client-IP-Address")) {
530 data->client_ip.af = AF_INET;
531 ip_hton(value, AF_INET, &data->client_ip);
536 * The original time at which we received the
537 * packet. We need this to properly calculate
540 if (!strcasecmp(key, "Timestamp")) {
541 data->timestamp = atoi(value);
543 vp = paircreate(PW_PACKET_ORIGINAL_TIMESTAMP, 0,
546 vp->vp_date = (uint32_t) data->timestamp;
556 * FIXME: do we want to check for non-protocol
557 * attributes like radsqlrelay does?
560 if ((userparse(buffer, &vp) > 0) &&
568 * Some kind of error.
570 * FIXME: Leave the file in-place, and warn the
573 if (ferror(data->fp)) goto cleanup;
579 * Process the packet.
585 * The writer doesn't check that the record was
586 * completely written. If the disk is full, this can
587 * result in a truncated record. When that happens,
590 if (data->state != STATE_QUEUED) {
591 radlog(L_ERR, "Truncated record: treating it as EOF for detail file %s", data->filename_work);
596 * We're done reading the file, but we didn't read
597 * anything. Clean up, and don't return anything.
600 data->state = STATE_HEADER;
601 if (feof(data->fp)) goto cleanup;
606 * Allocate the packet. If we fail, it's a serious
609 packet = rad_alloc(1);
611 radlog(L_ERR, "FATAL: Failed allocating memory for detail");
615 memset(packet, 0, sizeof(*packet));
617 packet->src_ipaddr.af = AF_INET;
618 packet->src_ipaddr.ipaddr.ip4addr.s_addr = htonl(INADDR_NONE);
619 packet->code = PW_ACCOUNTING_REQUEST;
620 packet->timestamp = time(NULL);
623 * Remember where it came from, so that we don't
624 * proxy it to the place it came from...
626 if (data->client_ip.af != AF_UNSPEC) {
627 packet->src_ipaddr = data->client_ip;
/* NOTE(review): packet was zeroed by the memset above and packet->vps is only assigned further down (paircopy), so in the visible lines these four pairfind() calls search an empty list - confirm whether data->vps was intended. */
630 vp = pairfind(packet->vps, PW_PACKET_SRC_IP_ADDRESS, 0);
632 packet->src_ipaddr.af = AF_INET;
633 packet->src_ipaddr.ipaddr.ip4addr.s_addr = vp->vp_ipaddr;
635 vp = pairfind(packet->vps, PW_PACKET_SRC_IPV6_ADDRESS, 0);
637 packet->src_ipaddr.af = AF_INET6;
638 memcpy(&packet->src_ipaddr.ipaddr.ip6addr,
639 &vp->vp_ipv6addr, sizeof(vp->vp_ipv6addr));
643 vp = pairfind(packet->vps, PW_PACKET_DST_IP_ADDRESS, 0);
645 packet->dst_ipaddr.af = AF_INET;
646 packet->dst_ipaddr.ipaddr.ip4addr.s_addr = vp->vp_ipaddr;
648 vp = pairfind(packet->vps, PW_PACKET_DST_IPV6_ADDRESS, 0);
650 packet->dst_ipaddr.af = AF_INET6;
651 memcpy(&packet->dst_ipaddr.ipaddr.ip6addr,
652 &vp->vp_ipv6addr, sizeof(vp->vp_ipv6addr));
657 * We've got to give SOME value for Id & ports, so that
658 * the packets can be added to the request queue.
659 * However, we don't want to keep track of used/unused
660 * id's and ports, as that's a lot of work. This hack
661 * ensures that (if we have real random numbers), that
662 * there will be a collision on every 2^(16+15+15+24 - 1)
663 * packets, on average. That means we can read 2^37
664 * packets before having a collision, which means it's
665 * effectively impossible.
667 packet->id = fr_rand() & 0xffff;
668 packet->src_port = 1024 + (fr_rand() & 0x7fff);
669 packet->dst_port = 1024 + (fr_rand() & 0x7fff);
/* NOTE(review): in the visible lines this assignment is unconditional, so it replaces any destination address chosen above - confirm. */
671 packet->dst_ipaddr.af = AF_INET;
672 packet->dst_ipaddr.ipaddr.ip4addr.s_addr = htonl((INADDR_LOOPBACK & ~0xffffff) | (fr_rand() & 0xffffff));
675 * If everything's OK, this is a waste of memory.
676 * Otherwise, it lets us re-send the original packet
677 * contents, unmolested.
679 packet->vps = paircopy(data->vps);
682 * Look for Acct-Delay-Time, and update
683 * based on Acct-Delay-Time += (time(NULL) - timestamp)
685 vp = pairfind(packet->vps, PW_ACCT_DELAY_TIME, 0);
687 vp = paircreate(PW_ACCT_DELAY_TIME, 0, PW_TYPE_INTEGER);
688 rad_assert(vp != NULL);
689 pairadd(&packet->vps, vp);
/* A timestamp of 0 means no Timestamp attribute value was recorded; leave the delay untouched then. */
691 if (data->timestamp != 0) {
692 vp->vp_integer += time(NULL) - data->timestamp;
696 * Set the transmission count.
698 vp = pairfind(packet->vps, PW_PACKET_TRANSMIT_COUNTER, 0);
700 vp = paircreate(PW_PACKET_TRANSMIT_COUNTER, 0, PW_TYPE_INTEGER);
701 rad_assert(vp != NULL);
702 pairadd(&packet->vps, vp);
704 vp->vp_integer = data->tries;
706 *pfun = rad_accounting;
709 fr_printf_log("detail_recv: Read packet from %s\n", data->filename_work);
710 for (vp = packet->vps; vp; vp = vp->next) {
716 * FIXME: many of these checks may not be necessary when
717 * reading from the detail file.
721 if (!received_request(listener, packet, prequest,
722 &data->detail_client)) {
724 data->state = STATE_NO_REPLY; /* try again later */
/* The request was accepted: remember when it started so the retry check above can time it out. */
728 data->state = STATE_RUNNING;
729 data->running = packet->timestamp;
736 * Free detail-specific stuff.
/*
 * Release the per-listener detail state: free the filename string,
 * free the pending value-pair list, then deal with data->fp when it
 * is non-NULL (the body of that branch is not visible here).
 *
 * detail_parse points detail_client.longname, shortname and secret at
 * data->filename, so those pointers are stale once this has run.
 *
 * NOTE(review): data->filename_work and detail_client.nastype are both
 * strdup()ed in detail_parse and are not freed in the visible lines -
 * confirm whether they leak.
 */
738 void detail_free(rad_listen_t *this)
740 listen_detail_t *data = this->data;
742 free(data->filename);
743 data->filename = NULL;
744 pairfree(&data->vps);
746 if (data->fp != NULL) {
/*
 * Write a description of the listener into buffer (at most bufsize
 * bytes) and return the snprintf() result.
 *
 * Two formats are visible: the bare filename, and the filename
 * followed by a server name.  The condition that selects between them
 * is not visible in this extract.
 */
753 int detail_print(const rad_listen_t *this, char *buffer, size_t bufsize)
756 return snprintf(buffer, bufsize, "%s",
757 ((listen_detail_t *)(this->data))->filename);
760 return snprintf(buffer, bufsize, "detail file %s as server %s",
761 ((listen_detail_t *)(this->data))->filename,
766 * Overloaded to return delay times.
/*
 * Report how long to wait before the listener is polled again.
 * request is unused.
 *
 * Two paths are visible.  One computes a jittered delay around
 * poll_interval; the other logs and returns data->delay_time.  Both
 * values are in microseconds (they are printed as value / USEC
 * seconds plus value % USEC).
 */
768 int detail_encode(rad_listen_t *this, UNUSED REQUEST *request)
770 listen_detail_t *data = this->data;
773 * We haven't sent a packet... delay things a bit.
776 int delay = (data->poll_interval - 1) * USEC;
779 * Add +/- 0.25s of jitter
/* (poll_interval - 1) + 0.75 + [0, 0.5) seconds, i.e. poll_interval plus or minus 0.25 s. */
781 delay += (USEC * 3) / 4;
782 delay += fr_rand() % (USEC / 2);
784 DEBUG2("Detail listener %s state %s signalled %d waiting %d.%06d sec",
786 fr_int2str(state_names, data->state, "?"), data->signal,
787 (delay / USEC), delay % USEC);
794 DEBUG2("Detail listener %s state %s signalled %d waiting %d.%06d sec",
795 data->filename, fr_int2str(state_names, data->state, "?"),
797 data->delay_time / USEC,
798 data->delay_time % USEC);
800 return data->delay_time;
805 * Overloaded to return "should we fix delay times"
/*
 * Overloaded decode entry point for the detail listener; request is
 * unused.
 *
 * NOTE(review): only the lookup of the listener data is visible in
 * this extract; the value returned is not shown - confirm before
 * relying on it.
 */
807 int detail_decode(rad_listen_t *this, UNUSED REQUEST *request)
809 listen_detail_t *data = this->data;
/*
 * Configuration items of a detail listen section, parsed into
 * listen_detail_t by cf_section_parse() in detail_parse.
 *
 *   filename        string, no default
 *   load_factor     integer, default 10 (detail_parse accepts 1..100)
 *   poll_interval   integer, default 1  (detail_parse accepts 1..20)
 *   retry_interval  integer, default 30
 */
815 static const CONF_PARSER detail_config[] = {
816 { "filename", PW_TYPE_STRING_PTR,
817 offsetof(listen_detail_t, filename), NULL, NULL },
818 { "load_factor", PW_TYPE_INTEGER,
819 offsetof(listen_detail_t, load_factor), NULL, Stringify(10)},
820 { "poll_interval", PW_TYPE_INTEGER,
821 offsetof(listen_detail_t, poll_interval), NULL, Stringify(1)},
822 { "retry_interval", PW_TYPE_INTEGER,
823 offsetof(listen_detail_t, retry_interval), NULL, Stringify(30)},
825 { NULL, -1, 0, NULL, NULL } /* end the list */
828 extern int check_config;
831 * Parse a detail section.
/*
 * Parse a detail listen section into this->data.
 *
 * Steps visible here: allocate and zero the listener data, read the
 * items in detail_config, require a filename, check load_factor
 * (1..100) and poll_interval (1..20), derive the work file name,
 * set the initial state and delay, and fill in the fake client that
 * is later passed to received_request().
 *
 * Returns 0 immediately when check_config is set.  The return values
 * of the error paths are not visible in this extract.
 */
833 int detail_parse(CONF_SECTION *cs, rad_listen_t *this)
836 listen_detail_t *data;
/* Nothing is allocated or parsed when only checking the configuration. */
840 if (check_config) return 0;
843 this->data = rad_malloc(sizeof(*data));
844 memset(this->data, 0, sizeof(*data));
849 rcode = cf_section_parse(cs, data, detail_config);
851 cf_log_err(cf_sectiontoitem(cs), "Failed parsing listen section");
855 if (!data->filename) {
856 cf_log_err(cf_sectiontoitem(cs), "No detail file specified in listen section");
/* load_factor is used as a divisor in detail_send, so zero must be rejected. */
860 if ((data->load_factor < 1) || (data->load_factor > 100)) {
861 cf_log_err(cf_sectiontoitem(cs), "Load factor must be between 1 and 100");
865 if ((data->poll_interval < 1) || (data->poll_interval > 20)) {
866 cf_log_err(cf_sectiontoitem(cs), "poll_interval must be between 1 and 20");
871 * If the filename is a glob, use "detail.work" as the
874 if ((strchr(data->filename, '*') != NULL) ||
875 (strchr(data->filename, '[') != NULL)) {
879 radlog(L_INFO, "WARNING: Detail file \"%s\" appears to use file globbing, but it is not supported on this system.", data->filename);
/* Keep the directory part of the pattern and append the fixed work file name to it. */
881 strlcpy(buffer, data->filename, sizeof(buffer));
882 p = strrchr(buffer, FR_DIR_SEP);
/*
 * strlcat() takes the total size of the destination buffer, not the
 * space that is left.  Passing the remainder truncated or dropped the
 * suffix once the directory part filled about half of the buffer.
 */
888 strlcat(buffer, "detail.work",
889 sizeof(buffer));
892 snprintf(buffer, sizeof(buffer), "%s.work", data->filename);
895 free(data->filename_work);
896 data->filename_work = strdup(buffer); /* FIXME: leaked */
900 data->state = STATE_UNOPENED;
901 data->delay_time = data->poll_interval * USEC;
905 * Initialize the fake client.
907 client = &data->detail_client;
908 memset(client, 0, sizeof(*client));
909 client->ipaddr.af = AF_INET;
910 client->ipaddr.ipaddr.ip4addr.s_addr = INADDR_NONE;
/* The client name and secret fields all point at data->filename; they are not separate copies. */
912 client->longname = client->shortname = data->filename;
913 client->secret = client->shortname;
914 client->nastype = strdup("none");