2 * detail.c Process the detail file
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
20 * Copyright 2007 The FreeRADIUS server project
21 * Copyright 2007 Alan DeKok <aland@deployingradius.com>
24 #include <freeradius-devel/ident.h>
27 #include <freeradius-devel/radiusd.h>
28 #include <freeradius-devel/modules.h>
29 #include <freeradius-devel/detail.h>
30 #include <freeradius-devel/process.h>
31 #include <freeradius-devel/rad_assert.h>
33 #ifdef HAVE_SYS_STAT_H
45 #define USEC (1000000)
/*
 *  Name table for the detail listener states.  Each entry pairs a short
 *  printable name with one STATE_* constant; detail_encode() passes this
 *  table to fr_int2str() to print the current state in debug output.
 *
 *  NOTE(review): the terminating entry and closing brace of the table
 *  are not visible in this listing.
 */
47 static FR_NAME_NUMBER state_names[] = {
48 { "unopened", STATE_UNOPENED },
49 { "unlocked", STATE_UNLOCKED },
50 { "header", STATE_HEADER },
51 { "reading", STATE_READING },
52 { "queued", STATE_QUEUED },
53 { "running", STATE_RUNNING },
54 { "no-reply", STATE_NO_REPLY },
55 { "replied", STATE_REPLIED },
61 * If we're limiting outstanding packets, then mark the response
/*
 *  detail_send - record the outcome of a request that was read from the
 *  detail file and schedule the next read.
 *
 *  listener  the detail listener; listener->data is the listen_detail_t
 *            that is updated here.
 *  request   the finished request; request->reply->code and
 *            request->packet->timestamp are read.
 *
 *  When request->reply->code is 0 the visible code sets delay_time to
 *  retry_interval * USEC, moves the listener to STATE_NO_REPLY and calls
 *  radius_signal_self(RADIUS_SIGNAL_SELF_DETAIL).
 *
 *  The later visible statements take the current time, clear has_rtt
 *  when last_packet compares older than "now", derive a round trip time
 *  from the packet timestamp, fold it into srtt / rttvar, and compute
 *      delay_time = srtt * (100 - load_factor) / load_factor
 *  capped at USEC / 4.  last_packet is then set to "now", the state
 *  becomes STATE_REPLIED and the listener is signalled again.
 *
 *  NOTE(review): the RDEBUG3 message prints delay_time / USEC as whole
 *  seconds immediately after delay_time has been capped at USEC / 4, so
 *  for a non-negative integer delay it always prints 0 - confirm whether
 *  a finer unit was intended.
 *
 *  NOTE(review): braces, local declarations, return statements and some
 *  arithmetic lines of this function are not visible in this listing, so
 *  the return value is not documented here.
 */
64 int detail_send(rad_listen_t *listener, REQUEST *request)
68 listen_detail_t *data = listener->data;
70 rad_assert(request->listener == listener);
71 rad_assert(listener->send == detail_send);
74 * This request timed out. Remember that, and tell the
75 * caller it's OK to read more "detail" file stuff.
77 if (request->reply->code == 0) {
78 data->delay_time = data->retry_interval * USEC;
80 data->state = STATE_NO_REPLY;
82 RDEBUG("Detail - No response configured for request %d. Will retry in %d seconds",
83 request->number, data->retry_interval);
85 radius_signal_self(RADIUS_SIGNAL_SELF_DETAIL);
90 * We call gettimeofday a lot. But it should be OK,
91 * because there's nothing else to do.
93 gettimeofday(&now, NULL);
96 * If we haven't sent a packet in the last second, reset
100 if (timercmp(&data->last_packet, &now, <)) {
101 data->has_rtt = FALSE;
106 * Only one detail packet may be outstanding at a time,
107 * so it's safe to update some entries in the detail
110 * We keep smoothed round trip time (SRTT), but not round
111 * trip timeout (RTO). We use SRTT to calculate a rough
114 rtt = now.tv_sec - request->packet->timestamp.tv_sec;
117 rtt -= request->packet->timestamp.tv_usec;
120 * If we're proxying, the RTT is our processing time,
121 * plus the network delay there and back, plus the time
122 * on the other end to process the packet. Ideally, we
123 * should remove the network delays from the RTT, but we
124 * don't know what they are.
126 * So, to be safe, we over-estimate the total cost of
127 * processing the packet.
129 if (!data->has_rtt) {
130 data->has_rtt = TRUE;
132 data->rttvar = rtt / 2;
135 data->rttvar -= data->rttvar >> 2;
136 data->rttvar += (data->srtt - rtt);
137 data->srtt -= data->srtt >> 3;
138 data->srtt += rtt >> 3;
142 * Calculate the time we wait before sending the next
145 * rtt / (rtt + delay) = load_factor / 100
147 data->delay_time = (data->srtt * (100 - data->load_factor)) / (data->load_factor);
150 * Cap delay at 4 packets/s. If the end system can't
151 * handle this, then it's very broken.
153 if (data->delay_time > (USEC / 4)) data->delay_time= USEC / 4;
155 RDEBUG3("Received response for request %d. Will read the next packet in %d seconds",
156 request->number, data->delay_time / USEC);
158 data->last_packet = now;
160 data->state = STATE_REPLIED;
162 radius_signal_self(RADIUS_SIGNAL_SELF_DETAIL);
169 * Open the detail file, if we can.
171 * FIXME: create it, if it's not already there, so that the main
172 * server select() will wake us up if there's anything to read.
/*
 *  detail_open - open the file the detail listener should read next.
 *
 *  this  the listener; this->fd receives the descriptor, and this->data
 *        (a listen_detail_t) supplies filename and filename_work.
 *
 *  The function asserts that the listener is in STATE_UNOPENED and sets
 *  delay_time to USEC.  It first tries to open data->filename_work with
 *  O_RDWR.  The remaining visible code stats data->filename, expands it
 *  with glob(), compares st_ctime across the matches, duplicates the
 *  chosen path, opens it with O_RDWR and renames it to filename_work.
 *  The last visible statements assert that data->vps and data->fp are
 *  NULL, set the state to STATE_UNLOCKED and reset client_ip.af to
 *  AF_UNSPEC.
 *
 *  detail_recv() treats a zero return from this function as "nothing to
 *  read yet".
 *
 *  NOTE(review): the strdup() result assigned to filename is not checked
 *  on any visible line before it is handed to open() - confirm.
 *
 *  NOTE(review): the conditions guarding each step, the error returns
 *  and the closing braces are not visible in this listing.
 */
174 static int detail_open(rad_listen_t *this)
177 listen_detail_t *data = this->data;
178 char *filename = data->filename;
180 rad_assert(data->state == STATE_UNOPENED);
181 data->delay_time = USEC;
184 * Open detail.work first, so we don't lose
185 * accounting packets. It's probably better to
186 * duplicate them than to lose them.
188 * Note that we're not writing to the file, but
189 * we've got to open it for writing in order to
190 * establish the lock, to prevent rlm_detail from
193 * This also means that if we're doing globbing,
194 * this file will be read && processed before the
195 * file globbing is done.
197 this->fd = open(data->filename_work, O_RDWR);
199 DEBUG2("Polling for detail file %s", filename);
202 * Try reading the detail file. If it
203 * doesn't exist, we can't do anything.
205 * Doing the stat will tell us if the file
206 * exists, even if we don't have permissions
209 if (stat(filename, &st) < 0) {
216 memset(&files, 0, sizeof(files));
217 if (glob(filename, 0, NULL, &files) != 0) {
224 for (i = 0; i < files.gl_pathc; i++) {
225 if (stat(files.gl_pathv[i], &st) < 0) continue;
228 (st.st_ctime < chtime)) {
229 chtime = st.st_ctime;
239 filename = strdup(files.gl_pathv[found]);
247 * Open it BEFORE we rename it, just to
250 this->fd = open(filename, O_RDWR);
252 radlog(L_ERR, "Detail - Failed to open %s: %s",
253 filename, strerror(errno));
254 if (filename != data->filename) free(filename);
259 * Rename detail to detail.work
261 DEBUG("Detail - Renaming %s -> %s", filename, data->filename_work);
262 if (rename(filename, data->filename_work) < 0) {
263 if (filename != data->filename) free(filename);
268 if (filename != data->filename) free(filename);
269 } /* else detail.work existed, and we opened it */
271 rad_assert(data->vps == NULL);
272 rad_assert(data->fp == NULL);
274 data->state = STATE_UNLOCKED;
276 data->client_ip.af = AF_UNSPEC;
287 * FIXME: add a configuration "exit when done" so that the detail
288 * file reader can be used as a one-off tool to update stuff.
290 * The time sequence for reading from the detail file is:
292 * t_0 signalled that the server is idle, and we
293 * can read from the detail file.
295 * t_rtt the packet has been processed successfully,
296 * wait for t_delay to enforce load factor.
298 * t_rtt + t_delay wait for signal that the server is idle.
/*
 *  detail_recv - advance the detail-file state machine and, once a
 *  complete record has been read, hand it to the server as an
 *  accounting request.
 *
 *  listener  the detail listener; listener->data is its listen_detail_t.
 *
 *  The function returns 0 straight away while data->signal is set, then
 *  switches on data->state: the file is opened through detail_open(),
 *  locked with rad_lockfd_nonblock(), wrapped in a stdio stream with
 *  fdopen(), and unlinked again once feof() reports the end of the file.
 *  Records are read line by line with fgets().  Each attribute line is
 *  split into "key op value"; Client-IP-Address and Timestamp are handled
 *  specially and other lines go through userparse().  For a queued
 *  record a RADIUS_PACKET is allocated with rad_alloc(), given a copy of
 *  data->vps plus PW_ACCT_DELAY_TIME and PW_PACKET_TRANSMIT_COUNTER
 *  attributes, and passed to request_insert() with rad_accounting.  The
 *  listener ends in STATE_RUNNING, or STATE_NO_REPLY when the insert
 *  fails.
 *
 *  The operator field is scanned with a width of 7 because a scanf
 *  field width does not count the terminating NUL and op holds 8 bytes.
 *
 *  NOTE(review): the STATE_HEADER test uses the raw sscanf() result as a
 *  truth value.  sscanf() returns EOF, which is non-zero, on input
 *  failure such as a blank line, so a blank line also switches to
 *  STATE_READING.  Left unchanged because existing files may depend on
 *  it - confirm.
 *
 *  NOTE(review): the PW_PACKET_SRC_* and PW_PACKET_DST_* lookups search
 *  packet->vps, which on the visible lines is assigned by paircopy() only
 *  further down, after memset() cleared the packet.  Presumably these
 *  lookups never match; confirm whether data->vps was intended.  The
 *  destination address is in any case overwritten from data->counter
 *  afterwards.
 *
 *  NOTE(review): Timestamp is converted with atoi(), which cannot report
 *  malformed input.
 *
 *  NOTE(review): case labels, braces, several declarations and the
 *  return statements are not visible in this listing.
 */
301 int detail_recv(rad_listen_t *listener)
303 char key[256], op[8], value[1024];
304 VALUE_PAIR *vp, **tail;
305 RADIUS_PACKET *packet;
307 listen_detail_t *data = listener->data;
311 * We may be in the main thread. It needs to update the
312 * timers before we try to read from the file again.
314 if (data->signal) return 0;
316 switch (data->state) {
319 rad_assert(listener->fd < 0);
321 if (!detail_open(listener)) return 0;
323 rad_assert(data->state == STATE_UNLOCKED);
324 rad_assert(listener->fd >= 0);
329 * Try to lock fd. If we can't, return.
330 * If we can, continue. This means that
331 * the server doesn't block while waiting
332 * for the lock to open...
336 * Note that we do NOT block waiting for
337 * the lock. We've re-named the file
338 * above, so we've already guaranteed
339 * that any *new* detail writer will not
340 * be opening this file. The only
341 * purpose of the lock is to catch a race
342 * condition where the execution
343 * "ping-pongs" between radiusd &
346 if (rad_lockfd_nonblock(listener->fd, 0) < 0) {
348 * Close the FD. The main loop
349 * will wake up in a second and
354 data->state = STATE_UNOPENED;
358 data->fp = fdopen(listener->fd, "r");
360 radlog(L_ERR, "FATAL: Failed to re-open detail file %s: %s",
361 data->filename, strerror(errno));
366 * Look for the header
368 data->state = STATE_HEADER;
369 data->delay_time = USEC;
378 data->state = STATE_UNOPENED;
385 if (fstat(listener->fd, &buf) < 0) {
386 radlog(L_ERR, "Failed to stat "
387 "detail file %s: %s",
393 if (((off_t) ftell(data->fp)) == buf.st_size) {
399 * End of file. Delete it, and re-set
402 if (feof(data->fp)) {
404 DEBUG("Detail - unlinking %s",
405 data->filename_work);
406 unlink(data->filename_work);
407 if (data->fp) fclose(data->fp);
410 data->state = STATE_UNOPENED;
411 rad_assert(data->vps == NULL);
413 if (data->one_shot) {
414 radlog(L_INFO, "Finished reading \"one shot\" detail file - Exiting");
415 radius_signal_self(RADIUS_SIGNAL_SELF_EXIT);
422 * Else go read something.
427 * Read more value-pair's, unless we're
428 * at EOF. In that case, queue whatever
432 if (data->fp && !feof(data->fp)) break;
433 data->state = STATE_QUEUED;
441 * Periodically check what's going on.
442 * If the request is taking too long,
446 if (time(NULL) < (data->running + data->retry_interval)) {
450 DEBUG("No response to detail request. Retrying");
451 data->state = STATE_NO_REPLY;
455 * If there's no reply, keep
456 * retransmitting the current packet
460 data->state = STATE_QUEUED;
464 * We have a reply. Clean up the old
465 * request, and go read another one.
468 pairfree(&data->vps);
469 data->state = STATE_HEADER;
474 while (*tail) tail = &(*tail)->next;
477 * Read a header, OR a value-pair.
479 while (fgets(buffer, sizeof(buffer), data->fp)) {
480 data->offset = ftell(data->fp); /* for statistics */
483 * Badly formatted file: delete it.
485 * FIXME: Maybe flag an error?
487 if (!strchr(buffer, '\n')) {
488 pairfree(&data->vps);
493 * We're reading VP's, and got a blank line.
496 if ((data->state == STATE_READING) &&
497 (buffer[0] == '\n')) {
498 data->state = STATE_QUEUED;
503 * Look for date/time header, and read VP's if
504 * found. If not, keep reading lines until we
507 if (data->state == STATE_HEADER) {
510 if (sscanf(buffer, "%*s %*s %*d %*d:%*d:%*d %d", &y)) {
511 data->state = STATE_READING;
517 * We have a full "attribute = value" line.
518 * If it doesn't look reasonable, skip it.
520 * FIXME: print an error for badly formatted attributes?
522 if (sscanf(buffer, "%255s %7s %1023s", key, op, value) != 3) {
523 DEBUG2("WARNING: Skipping badly formatted line %s",
529 * Should be =, :=, +=, ...
531 if (!strchr(op, '=')) continue;
534 * Skip non-protocol attributes.
536 if (!strcasecmp(key, "Request-Authenticator")) continue;
539 * Set the original client IP address, based on
540 * what's in the detail file.
542 * Hmm... we don't set the server IP address.
545 if (!strcasecmp(key, "Client-IP-Address")) {
546 data->client_ip.af = AF_INET;
547 if (ip_hton(value, AF_INET, &data->client_ip) < 0) {
549 "Failed parsing Client-IP-Address");
551 pairfree(&data->vps);
558 * The original time at which we received the
559 * packet. We need this to properly calculate
562 if (!strcasecmp(key, "Timestamp")) {
563 data->timestamp = atoi(value);
565 vp = paircreate(PW_PACKET_ORIGINAL_TIMESTAMP, 0);
567 vp->vp_date = (uint32_t) data->timestamp;
577 * FIXME: do we want to check for non-protocol
578 * attributes like radsqlrelay does?
581 if ((userparse(buffer, &vp) > 0) &&
589 * Some kind of error.
591 * FIXME: Leave the file in-place, and warn the
594 if (ferror(data->fp)) goto cleanup;
600 * Process the packet.
606 * The writer doesn't check that the record was
607 * completely written. If the disk is full, this can
608 * result in a truncated record. When that happens,
611 if (data->state != STATE_QUEUED) {
612 radlog(L_ERR, "Truncated record: treating it as EOF for detail file %s", data->filename_work);
617 * We're done reading the file, but we didn't read
618 * anything. Clean up, and don't return anything.
621 data->state = STATE_HEADER;
622 if (!data->fp || feof(data->fp)) goto cleanup;
627 * Allocate the packet. If we fail, it's a serious
630 packet = rad_alloc(1);
632 radlog(L_ERR, "FATAL: Failed allocating memory for detail");
636 memset(packet, 0, sizeof(*packet));
638 packet->src_ipaddr.af = AF_INET;
639 packet->src_ipaddr.ipaddr.ip4addr.s_addr = htonl(INADDR_NONE);
640 packet->code = PW_ACCOUNTING_REQUEST;
641 gettimeofday(&packet->timestamp, NULL);
644 * Remember where it came from, so that we don't
645 * proxy it to the place it came from...
647 if (data->client_ip.af != AF_UNSPEC) {
648 packet->src_ipaddr = data->client_ip;
651 vp = pairfind(packet->vps, PW_PACKET_SRC_IP_ADDRESS, 0, TAG_ANY);
653 packet->src_ipaddr.af = AF_INET;
654 packet->src_ipaddr.ipaddr.ip4addr.s_addr = vp->vp_ipaddr;
656 vp = pairfind(packet->vps, PW_PACKET_SRC_IPV6_ADDRESS, 0, TAG_ANY);
658 packet->src_ipaddr.af = AF_INET6;
659 memcpy(&packet->src_ipaddr.ipaddr.ip6addr,
660 &vp->vp_ipv6addr, sizeof(vp->vp_ipv6addr));
664 vp = pairfind(packet->vps, PW_PACKET_DST_IP_ADDRESS, 0, TAG_ANY);
666 packet->dst_ipaddr.af = AF_INET;
667 packet->dst_ipaddr.ipaddr.ip4addr.s_addr = vp->vp_ipaddr;
669 vp = pairfind(packet->vps, PW_PACKET_DST_IPV6_ADDRESS, 0, TAG_ANY);
671 packet->dst_ipaddr.af = AF_INET6;
672 memcpy(&packet->dst_ipaddr.ipaddr.ip6addr,
673 &vp->vp_ipv6addr, sizeof(vp->vp_ipv6addr));
678 * Generate packet ID, ports, IP via a counter.
680 packet->id = data->counter & 0xff;
681 packet->src_port = 1024 + ((data->counter >> 8) & 0xff);
682 packet->dst_port = 1024 + ((data->counter >> 16) & 0xff);
684 packet->dst_ipaddr.af = AF_INET;
685 packet->dst_ipaddr.ipaddr.ip4addr.s_addr = htonl((INADDR_LOOPBACK & ~0xffffff) | ((data->counter >> 24) & 0xff));
688 * If everything's OK, this is a waste of memory.
689 * Otherwise, it lets us re-send the original packet
690 * contents, unmolested.
692 packet->vps = paircopy(data->vps);
695 * Prefer the Event-Timestamp in the packet, if it
696 * exists. That is when the event occurred, whereas the
697 * "Timestamp" field is when we wrote the packet to the
698 * detail file, which could have been much later.
700 vp = pairfind(packet->vps, PW_EVENT_TIMESTAMP, 0, TAG_ANY);
702 data->timestamp = vp->vp_integer;
706 * Look for Acct-Delay-Time, and update
707 * based on Acct-Delay-Time += (time(NULL) - timestamp)
709 vp = pairfind(packet->vps, PW_ACCT_DELAY_TIME, 0, TAG_ANY);
711 vp = paircreate(PW_ACCT_DELAY_TIME, 0);
712 rad_assert(vp != NULL);
713 pairadd(&packet->vps, vp);
715 if (data->timestamp != 0) {
716 vp->vp_integer += time(NULL) - data->timestamp;
720 * Set the transmission count.
722 vp = pairfind(packet->vps, PW_PACKET_TRANSMIT_COUNTER, 0, TAG_ANY);
724 vp = paircreate(PW_PACKET_TRANSMIT_COUNTER, 0);
725 rad_assert(vp != NULL);
726 pairadd(&packet->vps, vp);
728 vp->vp_integer = data->tries;
731 fr_printf_log("detail_recv: Read packet from %s\n", data->filename_work);
732 for (vp = packet->vps; vp; vp = vp->next) {
738 * Don't bother doing limit checks, etc.
740 gettimeofday(&now, NULL);
741 if (!request_insert(listener, packet, &data->detail_client,
742 rad_accounting, &now)) {
744 data->state = STATE_NO_REPLY; /* try again later */
748 data->state = STATE_RUNNING;
749 data->running = packet->timestamp.tv_sec;
756 * Free detail-specific stuff.
758 void detail_free(rad_listen_t *this)
760 listen_detail_t *data = this->data;
762 free(data->filename);
763 data->filename = NULL;
764 pairfree(&data->vps);
766 if (data->fp != NULL) {
/*
 *  detail_print - format a short description of the listener.
 *
 *  this     the listener; its data is read as a listen_detail_t.
 *  buffer   destination for the text.
 *  bufsize  size of buffer, passed straight to snprintf().
 *
 *  Two forms are visible: the bare filename, and
 *  "detail file <filename> as server <...>".  Each returns the value
 *  produced by snprintf().
 *
 *  NOTE(review): the condition selecting between the two forms and the
 *  final argument of the second call are not visible in this listing.
 */
773 int detail_print(const rad_listen_t *this, char *buffer, size_t bufsize)
776 return snprintf(buffer, bufsize, "%s",
777 ((listen_detail_t *)(this->data))->filename);
780 return snprintf(buffer, bufsize, "detail file %s as server %s",
781 ((listen_detail_t *)(this->data))->filename,
786 * Overloaded to return delay times.
/*
 *  detail_encode - listener "encode" hook, reused to report how long to
 *  wait before the detail listener is serviced again.
 *
 *  this     the listener; this->data is its listen_detail_t.
 *  request  unused.
 *
 *  One visible path builds a local delay of
 *      (poll_interval - 1) * USEC + 3/4 * USEC + fr_rand() % (USEC / 2)
 *  which is poll_interval seconds give or take a quarter of a second,
 *  and logs it.  The other visible path logs and returns
 *  data->delay_time.  Both values are in microseconds, since the log
 *  lines split them with / USEC and % USEC.
 *
 *  NOTE(review): the condition choosing between the two paths and the
 *  return statement of the first path are not visible in this listing.
 */
788 int detail_encode(rad_listen_t *this, UNUSED REQUEST *request)
790 listen_detail_t *data = this->data;
793 * We haven't sent a packet... delay things a bit.
796 int delay = (data->poll_interval - 1) * USEC;
799 * Add +/- 0.25s of jitter
801 delay += (USEC * 3) / 4;
802 delay += fr_rand() % (USEC / 2);
804 DEBUG2("Detail listener %s state %s signalled %d waiting %d.%06d sec",
806 fr_int2str(state_names, data->state, "?"), data->signal,
807 (delay / USEC), delay % USEC);
814 DEBUG2("Detail listener %s state %s signalled %d waiting %d.%06d sec",
815 data->filename, fr_int2str(state_names, data->state, "?"),
817 data->delay_time / USEC,
818 data->delay_time % USEC);
820 return data->delay_time;
825 * Overloaded to return "should we fix delay times"
/*
 *  detail_decode - listener "decode" hook for the detail listener.
 *
 *  this     the listener; this->data is read as a listen_detail_t.
 *  request  unused.
 *
 *  NOTE(review): only the signature and the data declaration are visible
 *  in this listing, so the returned value is not documented here.
 */
827 int detail_decode(rad_listen_t *this, UNUSED REQUEST *request)
829 listen_detail_t *data = this->data;
/*
 *  Configuration items accepted in a detail "listen" section.  Each entry
 *  names the item, gives its type, and gives the offset of the
 *  listen_detail_t member that receives the parsed value.  The table
 *  defaults are load_factor 10, poll_interval 1 and retry_interval 30;
 *  filename, one_shot and max_outstanding have no table default.
 *
 *  max_outstanding is stored in its own member, which detail_parse()
 *  reads as data->max_outstanding; pointing it at load_factor would let
 *  the setting overwrite the load factor.
 *
 *  NOTE(review): the closing brace of the table is not visible in this
 *  listing.
 */
835 static const CONF_PARSER detail_config[] = {
836 { "filename", PW_TYPE_STRING_PTR,
837 offsetof(listen_detail_t, filename), NULL, NULL },
838 { "load_factor", PW_TYPE_INTEGER,
839 offsetof(listen_detail_t, load_factor), NULL, Stringify(10)},
840 { "poll_interval", PW_TYPE_INTEGER,
841 offsetof(listen_detail_t, poll_interval), NULL, Stringify(1)},
842 { "retry_interval", PW_TYPE_INTEGER,
843 offsetof(listen_detail_t, retry_interval), NULL, Stringify(30)},
844 { "one_shot", PW_TYPE_BOOLEAN,
845 offsetof(listen_detail_t, one_shot), NULL, NULL},
846 { "max_outstanding", PW_TYPE_INTEGER,
847 offsetof(listen_detail_t, max_outstanding), NULL, NULL},
849 { NULL, -1, 0, NULL, NULL } /* end the list */
852 extern int check_config;
855 * Parse a detail section.
/*
 *  detail_parse - parse a detail "listen" section and initialise the
 *  listener from it.
 *
 *  cs    the configuration section to parse.
 *  this  the listener; this->data is allocated here as a zeroed
 *        listen_detail_t.
 *
 *  When check_config is set the function returns 0 before anything is
 *  allocated.  Otherwise the section is parsed against detail_config and
 *  validated: a filename is required, load_factor must be 1..100,
 *  poll_interval must be 1..20, and max_outstanding of 0 becomes 1.  Each
 *  failed check logs an error through cf_log_err().
 *
 *  The work-file name is then built.  For a filename containing '*' or
 *  '[' it is "detail.work" in the directory of the pattern, otherwise it
 *  is "<filename>.work".  strlcat() is given the full size of the buffer,
 *  as the function expects, so a long directory path still gets the
 *  suffix appended.
 *
 *  Finally the state becomes STATE_UNOPENED, delay_time is set to
 *  poll_interval * USEC, and the embedded fake client is zeroed and
 *  filled in with the filename as its long name, short name and secret.
 *
 *  NOTE(review): only '*' and '[' are treated as glob characters; '?' is
 *  not - confirm whether that is intended.
 *
 *  NOTE(review): the error returns, the platform #ifdef around the glob
 *  warning, several declarations and the end of the function are not
 *  visible in this listing.
 */
857 int detail_parse(CONF_SECTION *cs, rad_listen_t *this)
860 listen_detail_t *data;
864 if (check_config) return 0;
867 this->data = rad_malloc(sizeof(*data));
868 memset(this->data, 0, sizeof(*data));
873 rcode = cf_section_parse(cs, data, detail_config);
875 cf_log_err(cf_sectiontoitem(cs), "Failed parsing listen section");
879 if (!data->filename) {
880 cf_log_err(cf_sectiontoitem(cs), "No detail file specified in listen section");
884 if ((data->load_factor < 1) || (data->load_factor > 100)) {
885 cf_log_err(cf_sectiontoitem(cs), "Load factor must be between 1 and 100");
889 if ((data->poll_interval < 1) || (data->poll_interval > 20)) {
890 cf_log_err(cf_sectiontoitem(cs), "poll_interval must be between 1 and 20");
894 if (data->max_outstanding == 0) data->max_outstanding = 1;
897 * If the filename is a glob, use "detail.work" as the
900 if ((strchr(data->filename, '*') != NULL) ||
901 (strchr(data->filename, '[') != NULL)) {
905 radlog(L_INFO, "WARNING: Detail file \"%s\" appears to use file globbing, but it is not supported on this system.", data->filename);
907 strlcpy(buffer, data->filename, sizeof(buffer));
908 p = strrchr(buffer, FR_DIR_SEP);
914 strlcat(buffer, "detail.work",
915 sizeof(buffer));
918 snprintf(buffer, sizeof(buffer), "%s.work", data->filename);
921 free(data->filename_work);
922 data->filename_work = strdup(buffer); /* FIXME: leaked */
926 data->state = STATE_UNOPENED;
927 data->delay_time = data->poll_interval * USEC;
931 * Initialize the fake client.
933 client = &data->detail_client;
934 memset(client, 0, sizeof(*client));
935 client->ipaddr.af = AF_INET;
936 client->ipaddr.ipaddr.ip4addr.s_addr = INADDR_NONE;
938 client->longname = client->shortname = data->filename;
939 client->secret = client->shortname;
940 client->nastype = strdup("none");