Use struct addr - big cleanup.
[darkstat] / hosts_db.c
1 /* darkstat 3
2 * copyright (c) 2001-2009 Emil Mikulic.
3 *
4 * hosts_db.c: database of hosts, ports, protocols.
5 *
6 * You may use, modify and redistribute this file under the terms of the
7 * GNU General Public License version 2. (see COPYING.GPL)
8 */
9
10 #include "darkstat.h"
11 #include "conv.h"
12 #include "decode.h"
13 #include "dns.h"
14 #include "err.h"
15 #include "hosts_db.h"
16 #include "db.h"
17 #include "html.h"
18 #include "ncache.h"
19 #include "now.h"
20 #include "str.h"
21
22 #include <arpa/inet.h> /* inet_aton() */
23 #include <netdb.h> /* struct addrinfo */
24 #include <assert.h>
25 #include <errno.h>
26 #include <stdio.h>
27 #include <stdlib.h>
28 #include <string.h> /* memset(), strcmp() */
29 #include <unistd.h>
30
/* Settings defined in other translation units. */
extern int want_lastseen;
extern const char *interface;

/* Non-zero adds the MAC address column/line to the host pages. */
int show_mac_addrs = 0;

/* FIXME: specify somewhere more sane/tunable */
/* Rows per page in an HTML table rendered from a hashtable. */
#define MAX_ENTRIES 30
37
/*
 * Callback signatures.  A hashtable stores one pointer of each kind so that
 * the same table code can serve different bucket payloads.
 */
typedef uint32_t hash_func_t(const struct hashtable *ht, const void *key);
typedef void free_func_t(struct bucket *b);
typedef const void *key_func_t(const struct bucket *b);
typedef int find_func_t(const struct bucket *b, const void *key);
typedef struct bucket *make_func_t(const void *key);
typedef void format_cols_func_t(struct str *buf);
typedef void format_row_func_t(struct str *buf, const struct bucket *b,
   const char *css_class);
46
47 struct hashtable {
48 uint8_t bits; /* size of hashtable in bits */
49 uint32_t size, mask;
50 uint32_t count, count_max, count_keep; /* items in table */
51 uint32_t coeff; /* coefficient for Fibonacci hashing */
52 struct bucket **table;
53
54 struct {
55 uint64_t inserts, searches, deletions, rehashes;
56 } stats;
57
58 hash_func_t *hash_func;
59 /* returns hash value of given key (passed as void*) */
60
61 free_func_t *free_func;
62 /* free of bucket payload */
63
64 key_func_t *key_func;
65 /* returns pointer to key of bucket (to pass to hash_func) */
66
67 find_func_t *find_func;
68 /* returns true if given bucket matches key (passed as void*) */
69
70 make_func_t *make_func;
71 /* returns bucket containing new record with key (passed as void*) */
72
73 format_cols_func_t *format_cols_func;
74 /* append table columns to str */
75
76 format_row_func_t *format_row_func;
77 /* format record and append to str */
78 };
79
80 static void hashtable_reduce(struct hashtable *ht);
81 static void hashtable_free(struct hashtable *h);
82
/* Initial table sizes, given as a bit count (table size is 1 << bits). */
#define HOST_BITS  1 /* hosts table */
#define PORT_BITS  1 /* ports tables */
#define PROTO_BITS 1 /* proto table */

/*
 * We only use one hosts_db hashtable and this is it.  It is NULL until
 * hosts_db_init() has run and again after hosts_db_free().
 */
static struct hashtable *hosts_db = NULL;
89
/* phi^-1 (reciprocal of golden ratio) = (sqrt(5) - 1) / 2 */
static const double phi_1 =
   0.61803398874989490252573887119069695472717285156250;

/*
 * Co-prime of u, using phi^-1.
 *
 * Scales u by phi^-1, truncates towards zero and forces the lowest bit on,
 * so the result is always odd (and therefore shares no factor with a
 * power-of-two table size).
 *
 * The storage-class specifier comes first: placing `static' after `inline'
 * is an obsolescent form in ISO C.
 */
static inline uint32_t
coprime(const uint32_t u)
{
   const double scaled = (double)u * phi_1;

   return ((uint32_t)scaled | 1U);
}
100
101 /*
102 * This is the "recommended" IPv4 hash function, as seen in FreeBSD's
103 * src/sys/netinet/tcp_hostcache.c 1.1
104 */
105 inline static uint32_t
106 ipv4_hash(const struct addr *const a)
107 {
108 uint32_t ip = a->ip.v4;
109 return ( (ip) ^ ((ip) >> 7) ^ ((ip) >> 17) );
110 }
111
112 #ifndef s6_addr32
113 /* Covers OpenBSD and FreeBSD. The macro __USE_GNU has
114 * taken care of GNU/Linux and GNU/kfreebsd. */
115 # define s6_addr32 __u6_addr.__u6_addr32
116 #endif
117
118 /*
119 * This is the IPv6 hash function used by FreeBSD in the same file as above,
120 * svn rev 122922.
121 */
122 inline static uint32_t
123 ipv6_hash(const struct addr *const a)
124 {
125 const struct in6_addr *const ip6 = &(a->ip.v6);
126 return ( ip6->s6_addr32[0] ^ ip6->s6_addr32[1] ^
127 ip6->s6_addr32[2] ^ ip6->s6_addr32[3] );
128 }
129
130 /* ---------------------------------------------------------------------------
131 * hash_func collection
132 */
133 static uint32_t
134 hash_func_host(const struct hashtable *h _unused_, const void *key)
135 {
136 const struct addr *a = key;
137 if (a->family == IPv4)
138 return (ipv4_hash(a));
139 else {
140 assert(a->family == IPv6);
141 return (ipv6_hash(a));
142 }
143 }
144
/*
 * Read the object of the given type that `key' points at.  Only usable
 * inside a function that has a `const void *key' in scope.
 */
#define CASTKEY(type) (*(const type *)key)
146
147 static uint32_t
148 hash_func_short(const struct hashtable *h, const void *key)
149 {
150 return (CASTKEY(uint16_t) * h->coeff);
151 }
152
153 static uint32_t
154 hash_func_byte(const struct hashtable *h, const void *key)
155 {
156 return (CASTKEY(uint8_t) * h->coeff);
157 }
158
159 /* ---------------------------------------------------------------------------
160 * key_func collection
161 */
162
163 static const void *
164 key_func_host(const struct bucket *b)
165 {
166 return &(b->u.host.addr);
167 }
168
169 static const void *
170 key_func_port_tcp(const struct bucket *b)
171 {
172 return &(b->u.port_tcp.port);
173 }
174
175 static const void *
176 key_func_port_udp(const struct bucket *b)
177 {
178 return &(b->u.port_udp.port);
179 }
180
181 static const void *
182 key_func_ip_proto(const struct bucket *b)
183 {
184 return &(b->u.ip_proto.proto);
185 }
186
187 /* ---------------------------------------------------------------------------
188 * find_func collection
189 */
190
191 static int
192 find_func_host(const struct bucket *b, const void *key)
193 {
194 return (addr_equal(key, &(b->u.host.addr)));
195 }
196
197 static int
198 find_func_port_tcp(const struct bucket *b, const void *key)
199 {
200 return (b->u.port_tcp.port == CASTKEY(uint16_t));
201 }
202
203 static int
204 find_func_port_udp(const struct bucket *b, const void *key)
205 {
206 return (b->u.port_udp.port == CASTKEY(uint16_t));
207 }
208
209 static int
210 find_func_ip_proto(const struct bucket *b, const void *key)
211 {
212 return (b->u.ip_proto.proto == CASTKEY(uint8_t));
213 }
214
215 /* ---------------------------------------------------------------------------
216 * make_func collection
217 */
218
/*
 * Declares, in the calling scope:
 *   name_bucket  - a freshly xcalloc()ed struct bucket *
 *   name_content - a struct <type> * pointing at name_bucket->u.<type>
 *
 * The allocation is sized from a local stand-in struct whose union holds
 * only struct <type>, not from sizeof(struct bucket).
 * NOTE(review): this assumes the stand-in's leading members mirror those of
 * struct bucket (declared elsewhere) -- confirm when changing either.
 *
 * Expands to declarations followed by statements, so it must be the first
 * thing in a function body.
 */
#define MAKE_BUCKET(name_bucket, name_content, type) \
   struct { \
      struct bucket *next; \
      uint64_t in, out, total; \
      union { struct type t; } u; \
   } _custom_bucket; \
   struct bucket *name_bucket = xcalloc(1, sizeof(_custom_bucket)); \
   struct type *name_content = &(name_bucket->u.type); \
   name_bucket->in = 0; \
   name_bucket->out = 0; \
   name_bucket->total = 0; \
   name_bucket->next = NULL;
227
228 static struct bucket *
229 make_func_host(const void *key)
230 {
231 MAKE_BUCKET(b, h, host);
232 h->addr = CASTKEY(struct addr);
233 h->dns = NULL;
234 h->last_seen = now;
235 memset(&h->mac_addr, 0, sizeof(h->mac_addr));
236 h->ports_tcp = NULL;
237 h->ports_udp = NULL;
238 h->ip_protos = NULL;
239 return (b);
240 }
241
242 static void
243 free_func_host(struct bucket *b)
244 {
245 struct host *h = &(b->u.host);
246 if (h->dns != NULL) free(h->dns);
247 hashtable_free(h->ports_tcp);
248 hashtable_free(h->ports_udp);
249 hashtable_free(h->ip_protos);
250 }
251
252 static struct bucket *
253 make_func_port_tcp(const void *key)
254 {
255 MAKE_BUCKET(b, p, port_tcp);
256 p->port = CASTKEY(uint16_t);
257 p->syn = 0;
258 return (b);
259 }
260
261 static struct bucket *
262 make_func_port_udp(const void *key)
263 {
264 MAKE_BUCKET(b, p, port_udp);
265 p->port = CASTKEY(uint16_t);
266 return (b);
267 }
268
269 static struct bucket *
270 make_func_ip_proto(const void *key)
271 {
272 MAKE_BUCKET(b, p, ip_proto);
273 p->proto = CASTKEY(uint8_t);
274 return (b);
275 }
276
277 static void
278 free_func_simple(struct bucket *b _unused_)
279 {
280 /* nop */
281 }
282
283 /* ---------------------------------------------------------------------------
284 * format_func collection (ordered by struct)
285 */
286
287 static void
288 format_cols_host(struct str *buf)
289 {
290 /* FIXME: don't clobber parts of the query string
291 * specifically "full" and "start"
292 * when setting sort direction
293 */
294 str_append(buf,
295 "<table>\n"
296 "<tr>\n"
297 " <th>IP</th>\n"
298 " <th>Hostname</th>\n");
299 if (show_mac_addrs) str_append(buf,
300 " <th>MAC Address</th>\n");
301 str_append(buf,
302 " <th><a href=\"?sort=in\">In</a></th>\n"
303 " <th><a href=\"?sort=out\">Out</a></th>\n"
304 " <th><a href=\"?sort=total\">Total</a></th>\n");
305 if (want_lastseen) str_append(buf,
306 " <th><a href=\"?sort=lastseen\">Last seen</a></th>\n");
307 str_append(buf,
308 "</tr>\n");
309 }
310
311 static void
312 format_row_host(struct str *buf, const struct bucket *b,
313 const char *css_class)
314 {
315 const char *ip = addr_to_str(&(b->u.host.addr));
316
317 str_appendf(buf,
318 "<tr class=\"%s\">\n"
319 " <td><a href=\"/hosts/%s/\">%s</a></td>\n"
320 " <td>%s</td>\n",
321 css_class,
322 ip, ip,
323 (b->u.host.dns == NULL) ? "" : b->u.host.dns);
324
325 if (show_mac_addrs)
326 str_appendf(buf,
327 " <td><tt>%x:%x:%x:%x:%x:%x</tt></td>\n",
328 b->u.host.mac_addr[0],
329 b->u.host.mac_addr[1],
330 b->u.host.mac_addr[2],
331 b->u.host.mac_addr[3],
332 b->u.host.mac_addr[4],
333 b->u.host.mac_addr[5]);
334
335 str_appendf(buf,
336 " <td class=\"num\">%'qu</td>\n"
337 " <td class=\"num\">%'qu</td>\n"
338 " <td class=\"num\">%'qu</td>\n",
339 b->in, b->out, b->total);
340
341 if (want_lastseen) {
342 time_t last_t = b->u.host.last_seen;
343 struct str *lastseen = NULL;
344
345 if (now >= last_t)
346 lastseen = length_of_time(now - last_t);
347
348 str_append(buf,
349 " <td class=\"num\">");
350 if (lastseen == NULL)
351 str_append(buf, "(clock error)");
352 else {
353 str_appendstr(buf, lastseen);
354 str_free(lastseen);
355 }
356 str_append(buf,
357 "</td>");
358 }
359
360 str_appendf(buf,
361 "</tr>\n");
362
363 /* Only resolve hosts "on demand" */
364 if (b->u.host.dns == NULL)
365 dns_queue(&(b->u.host.addr));
366 }
367
/*
 * Append the opening <table> tag and the header row of a TCP ports table:
 * Port, Service, In, Out, Total, SYNs.
 *
 * Each header cell is closed with </th>; previously the cells were opened
 * with <th> but closed with </td>, which is invalid markup.
 */
static void
format_cols_port_tcp(struct str *buf)
{
   str_append(buf,
      "<table>\n"
      "<tr>\n"
      " <th>Port</th>\n"
      " <th>Service</th>\n"
      " <th>In</th>\n"
      " <th>Out</th>\n"
      " <th>Total</th>\n"
      " <th>SYNs</th>\n"
      "</tr>\n"
   );
}
383
384 static void
385 format_row_port_tcp(struct str *buf, const struct bucket *b,
386 const char *css_class)
387 {
388 const struct port_tcp *p = &(b->u.port_tcp);
389
390 str_appendf(buf,
391 "<tr class=\"%s\">\n"
392 " <td class=\"num\">%u</td>\n"
393 " <td>%s</td>\n"
394 " <td class=\"num\">%'qu</td>\n"
395 " <td class=\"num\">%'qu</td>\n"
396 " <td class=\"num\">%'qu</td>\n"
397 " <td class=\"num\">%'qu</td>\n"
398 "</tr>\n",
399 css_class,
400 p->port, getservtcp(p->port), b->in, b->out, b->total, p->syn
401 );
402 }
403
/*
 * Append the opening <table> tag and the header row of a UDP ports table:
 * Port, Service, In, Out, Total.
 *
 * Each header cell is closed with </th>; previously the cells were opened
 * with <th> but closed with </td>, which is invalid markup.
 */
static void
format_cols_port_udp(struct str *buf)
{
   str_append(buf,
      "<table>\n"
      "<tr>\n"
      " <th>Port</th>\n"
      " <th>Service</th>\n"
      " <th>In</th>\n"
      " <th>Out</th>\n"
      " <th>Total</th>\n"
      "</tr>\n"
   );
}
418
419 static void
420 format_row_port_udp(struct str *buf, const struct bucket *b,
421 const char *css_class)
422 {
423 const struct port_udp *p = &(b->u.port_udp);
424
425 str_appendf(buf,
426 "<tr class=\"%s\">\n"
427 " <td class=\"num\">%u</td>\n"
428 " <td>%s</td>\n"
429 " <td class=\"num\">%'qu</td>\n"
430 " <td class=\"num\">%'qu</td>\n"
431 " <td class=\"num\">%'qu</td>\n"
432 "</tr>\n",
433 css_class,
434 p->port, getservudp(p->port), b->in, b->out, b->total
435 );
436 }
437
/*
 * Append the opening <table> tag and the header row of an IP protocols
 * table: #, Protocol, In, Out, Total.
 *
 * Each header cell is closed with </th>; previously the cells were opened
 * with <th> but closed with </td>, which is invalid markup.
 */
static void
format_cols_ip_proto(struct str *buf)
{
   str_append(buf,
      "<table>\n"
      "<tr>\n"
      " <th>#</th>\n"
      " <th>Protocol</th>\n"
      " <th>In</th>\n"
      " <th>Out</th>\n"
      " <th>Total</th>\n"
      "</tr>\n"
   );
}
452
453 static void
454 format_row_ip_proto(struct str *buf, const struct bucket *b,
455 const char *css_class)
456 {
457 const struct ip_proto *p = &(b->u.ip_proto);
458
459 str_appendf(buf,
460 "<tr class=\"%s\">\n"
461 " <td class=\"num\">%u</td>\n"
462 " <td>%s</td>\n"
463 " <td class=\"num\">%'qu</td>\n"
464 " <td class=\"num\">%'qu</td>\n"
465 " <td class=\"num\">%'qu</td>\n"
466 "</tr>\n",
467 css_class,
468 p->proto, getproto(p->proto),
469 b->in, b->out, b->total
470 );
471 }
472
473 /* ---------------------------------------------------------------------------
474 * Initialise a hashtable.
475 */
476 static struct hashtable *
477 hashtable_make(const uint8_t bits,
478 const unsigned int count_max,
479 const unsigned int count_keep,
480 hash_func_t *hash_func,
481 free_func_t *free_func,
482 key_func_t *key_func,
483 find_func_t *find_func,
484 make_func_t *make_func,
485 format_cols_func_t *format_cols_func,
486 format_row_func_t *format_row_func)
487 {
488 struct hashtable *hash;
489 assert(bits > 0);
490
491 hash = xmalloc(sizeof(*hash));
492 hash->bits = bits;
493 hash->count_max = count_max;
494 hash->count_keep = count_keep;
495 hash->size = 1U << bits;
496 hash->mask = hash->size - 1;
497 hash->coeff = coprime(hash->size);
498 hash->hash_func = hash_func;
499 hash->free_func = free_func;
500 hash->key_func = key_func;
501 hash->find_func = find_func;
502 hash->make_func = make_func;
503 hash->format_cols_func = format_cols_func;
504 hash->format_row_func = format_row_func;
505 hash->count = 0;
506 hash->table = xcalloc(hash->size, sizeof(*hash->table));
507 memset(&(hash->stats), 0, sizeof(hash->stats));
508 return (hash);
509 }
510
511 /* ---------------------------------------------------------------------------
512 * Initialise global hosts_db.
513 */
514 void
515 hosts_db_init(void)
516 {
517 assert(hosts_db == NULL);
518 hosts_db = hashtable_make(HOST_BITS, hosts_max, hosts_keep,
519 hash_func_host, free_func_host, key_func_host, find_func_host,
520 make_func_host, format_cols_host, format_row_host);
521 }
522
523 static void
524 hashtable_rehash(struct hashtable *h, const uint8_t bits)
525 {
526 struct bucket **old_table, **new_table;
527 uint32_t i, old_size;
528 assert(h != NULL);
529 assert(bits > 0);
530
531 h->stats.rehashes++;
532 old_size = h->size;
533 old_table = h->table;
534
535 h->bits = bits;
536 h->size = 1U << bits;
537 h->mask = h->size - 1;
538 h->coeff = coprime(h->size);
539 new_table = xcalloc(h->size, sizeof(*new_table));
540
541 for (i=0; i<old_size; i++) {
542 struct bucket *next, *b = old_table[i];
543 while (b != NULL) {
544 uint32_t pos = h->hash_func(h, h->key_func(b)) & h->mask;
545 next = b->next;
546 b->next = new_table[pos];
547 new_table[pos] = b;
548 b = next;
549 }
550 }
551
552 free(h->table);
553 h->table = new_table;
554 }
555
556 static void
557 hashtable_insert(struct hashtable *h, struct bucket *b)
558 {
559 uint32_t pos;
560 assert(h != NULL);
561 assert(b != NULL);
562 assert(b->next == NULL);
563
564 /* Rehash on 80% occupancy */
565 if ((h->count > h->size) ||
566 ((h->size - h->count) < h->size / 5))
567 hashtable_rehash(h, h->bits+1);
568
569 pos = h->hash_func(h, h->key_func(b)) & h->mask;
570 if (h->table[pos] == NULL)
571 h->table[pos] = b;
572 else {
573 /* Insert at top of chain. */
574 b->next = h->table[pos];
575 h->table[pos] = b;
576 }
577 h->count++;
578 h->stats.inserts++;
579 }
580
581 /* Return bucket matching key, or NULL if no such entry. */
582 static struct bucket *
583 hashtable_search(struct hashtable *h, const void *key)
584 {
585 uint32_t pos;
586 struct bucket *b;
587
588 h->stats.searches++;
589 pos = h->hash_func(h, key) & h->mask;
590 b = h->table[pos];
591 while (b != NULL) {
592 if (h->find_func(b, key))
593 return (b);
594 else
595 b = b->next;
596 }
597 return (NULL);
598 }
599
600 /* Search for a key. If it's not there, make and insert a bucket for it. */
601 static struct bucket *
602 hashtable_find_or_insert(struct hashtable *h, const void *key)
603 {
604 struct bucket *b = hashtable_search(h, key);
605
606 if (b == NULL) {
607 /* Not found, so insert after checking occupancy. */
608 /*assert(h->count <= h->count_max);*/
609 if (h->count >= h->count_max) hashtable_reduce(h);
610 b = h->make_func(key);
611 hashtable_insert(h, b);
612 }
613 return (b);
614 }
615
616 /*
617 * Frees the hashtable and the buckets. The contents are assumed to be
618 * "simple" -- i.e. no "destructor" action is required beyond simply freeing
619 * the bucket.
620 */
621 static void
622 hashtable_free(struct hashtable *h)
623 {
624 uint32_t i;
625
626 if (h == NULL)
627 return;
628 for (i=0; i<h->size; i++) {
629 struct bucket *tmp, *b = h->table[i];
630 while (b != NULL) {
631 tmp = b;
632 b = b->next;
633 h->free_func(tmp);
634 free(tmp);
635 }
636 }
637 free(h->table);
638 free(h);
639 }
640
641 /* ---------------------------------------------------------------------------
642 * Return existing host or insert a new one.
643 */
644 struct bucket *
645 host_get(const struct addr *const a)
646 {
647 return (hashtable_find_or_insert(hosts_db, a));
648 }
649
650 /* ---------------------------------------------------------------------------
651 * Find host, returns NULL if not in DB.
652 */
653 struct bucket *
654 host_find(const struct addr *const a)
655 {
656 return (hashtable_search(hosts_db, a));
657 }
658
/* ---------------------------------------------------------------------------
 * Find a host by its textual address.  ipstr is parsed with getaddrinfo()
 * in numeric-only mode (no name resolution).  Returns NULL if the string is
 * not a valid address, is of an unknown family, or is not in the DB.
 */
static struct bucket *
host_search(const char *ipstr)
{
   struct addrinfo hints, *ai;
   struct addr a;

   memset(&hints, 0, sizeof(hints));
   hints.ai_flags = AI_NUMERICHOST;
   hints.ai_family = AF_UNSPEC;

   if (getaddrinfo(ipstr, NULL, &hints, &ai) != 0)
      return NULL; /* invalid addr */

   switch (ai->ai_family) {
   case AF_INET:
      a.family = IPv4;
      a.ip.v4 = ((const struct sockaddr_in *)ai->ai_addr)->sin_addr.s_addr;
      break;

   case AF_INET6:
      a.family = IPv6;
      memcpy(&(a.ip.v6),
         ((struct sockaddr_in6 *)ai->ai_addr)->sin6_addr.s6_addr,
         sizeof(a.ip.v6));
      break;

   default:
      freeaddrinfo(ai);
      return NULL; /* unknown family */
   }
   freeaddrinfo(ai);

   verbosef("search(%s) turned into %s", ipstr, addr_to_str(&a));
   return hashtable_search(hosts_db, &a);
}
693
694 /* ---------------------------------------------------------------------------
695 * Reduce a hashtable to the top <keep> entries.
696 */
697 static void
698 hashtable_reduce(struct hashtable *ht)
699 {
700 uint32_t i, pos, rmd;
701 const struct bucket **table;
702 uint64_t cutoff;
703
704 assert(ht->count_keep < ht->count);
705
706 /* Fill table with pointers to buckets in hashtable. */
707 table = xcalloc(ht->count, sizeof(*table));
708 for (pos=0, i=0; i<ht->size; i++) {
709 struct bucket *b = ht->table[i];
710 while (b != NULL) {
711 table[pos++] = b;
712 b = b->next;
713 }
714 }
715 assert(pos == ht->count);
716 qsort_buckets(table, ht->count, 0, ht->count_keep, TOTAL);
717 cutoff = table[ht->count_keep]->total;
718 free(table);
719
720 /* Remove all elements with total <= cutoff. */
721 rmd = 0;
722 for (i=0; i<ht->size; i++) {
723 struct bucket *last = NULL, *next, *b = ht->table[i];
724 while (b != NULL) {
725 next = b->next;
726 if (b->total <= cutoff) {
727 /* Remove this one. */
728 ht->free_func(b);
729 free(b);
730 if (last == NULL)
731 ht->table[i] = next;
732 else
733 last->next = next;
734 rmd++;
735 ht->count--;
736 } else {
737 last = b;
738 }
739 b = next;
740 }
741 }
742 verbosef("hashtable_reduce: removed %u buckets, left %u",
743 rmd, ht->count);
744 hashtable_rehash(ht, ht->bits); /* is this needed? */
745 }
746
747 /* ---------------------------------------------------------------------------
748 * Reset hosts_db to empty.
749 */
750 void
751 hosts_db_reset(void)
752 {
753 unsigned int i;
754
755 for (i=0; i<hosts_db->size; i++) {
756 struct bucket *next, *b = hosts_db->table[i];
757 while (b != NULL) {
758 next = b->next;
759 hosts_db->free_func(b);
760 free(b);
761 b = next;
762 }
763 hosts_db->table[i] = NULL;
764 }
765 verbosef("hosts_db reset to empty, freed %u hosts", hosts_db->count);
766 hosts_db->count = 0;
767 }
768
769 /* ---------------------------------------------------------------------------
770 * Deallocate hosts_db.
771 */
772 void hosts_db_free(void)
773 {
774 uint32_t i;
775
776 assert(hosts_db != NULL);
777 for (i=0; i<hosts_db->size; i++) {
778 struct bucket *tmp, *b = hosts_db->table[i];
779 while (b != NULL) {
780 tmp = b;
781 b = b->next;
782 hosts_db->free_func(tmp);
783 free(tmp);
784 }
785 }
786 free(hosts_db->table);
787 free(hosts_db);
788 hosts_db = NULL;
789 }
790
791 /* ---------------------------------------------------------------------------
792 * Find or create a port_tcp inside a host.
793 */
794 struct bucket *
795 host_get_port_tcp(struct bucket *host, const uint16_t port)
796 {
797 struct host *h = &host->u.host;
798 assert(h != NULL);
799 if (h->ports_tcp == NULL)
800 h->ports_tcp = hashtable_make(PORT_BITS, ports_max, ports_keep,
801 hash_func_short, free_func_simple, key_func_port_tcp,
802 find_func_port_tcp, make_func_port_tcp,
803 format_cols_port_tcp, format_row_port_tcp);
804 return (hashtable_find_or_insert(h->ports_tcp, &port));
805 }
806
807 /* ---------------------------------------------------------------------------
808 * Find or create a port_udp inside a host.
809 */
810 struct bucket *
811 host_get_port_udp(struct bucket *host, const uint16_t port)
812 {
813 struct host *h = &host->u.host;
814 assert(h != NULL);
815 if (h->ports_udp == NULL)
816 h->ports_udp = hashtable_make(PORT_BITS, ports_max, ports_keep,
817 hash_func_short, free_func_simple, key_func_port_udp,
818 find_func_port_udp, make_func_port_udp,
819 format_cols_port_udp, format_row_port_udp);
820 return (hashtable_find_or_insert(h->ports_udp, &port));
821 }
822
823 /* ---------------------------------------------------------------------------
824 * Find or create an ip_proto inside a host.
825 */
826 struct bucket *
827 host_get_ip_proto(struct bucket *host, const uint8_t proto)
828 {
829 struct host *h = &host->u.host;
830 static const unsigned int PROTOS_MAX = 512, PROTOS_KEEP = 256;
831 assert(h != NULL);
832 if (h->ip_protos == NULL)
833 h->ip_protos = hashtable_make(PROTO_BITS, PROTOS_MAX, PROTOS_KEEP,
834 hash_func_byte, free_func_simple, key_func_ip_proto,
835 find_func_ip_proto, make_func_ip_proto,
836 format_cols_ip_proto, format_row_ip_proto);
837 return (hashtable_find_or_insert(h->ip_protos, &proto));
838 }
839
840 static struct str *html_hosts_main(const char *qs);
841 static struct str *html_hosts_detail(const char *ip);
842
/* ---------------------------------------------------------------------------
 * Web interface: delegate the /hosts/ space.
 *
 * uri is split on '/'; its first element must be "hosts".  One element
 * selects the hosts table (driven by query), two elements select the detail
 * page of the host named by the second element.  Any other shape yields
 * NULL.
 */
struct str *
html_hosts(const char *uri, const char *query)
{
   int num_elems, idx;
   char **elem = split('/', uri, &num_elems);
   struct str *page;

   assert(num_elems >= 1);
   assert(strcmp(elem[0], "hosts") == 0);

   switch (num_elems) {
   case 1:
      /* /hosts/ */
      page = html_hosts_main(query);
      break;
   case 2:
      /* /hosts/<IP of host>/ */
      page = html_hosts_detail(elem[1]);
      break;
   default:
      page = NULL;
      break;
   }

   for (idx = 0; idx < num_elems; idx++)
      free(elem[idx]);
   free(elem);

   /* FIXME: a NULL here becomes 404 Not Found, we might want
    * other codes to be possible */
   return page;
}
869
870 /* ---------------------------------------------------------------------------
871 * Format hashtable into HTML.
872 */
873 static void
874 format_table(struct str *buf, struct hashtable *ht, int start,
875 const enum sort_dir sort, const int full)
876 {
877 const struct bucket **table;
878 uint32_t i, pos, end;
879 int alt = 0;
880
881 if ((ht == NULL) || (ht->count == 0)) {
882 str_append(buf, "<p>The table is empty.</p>\n");
883 return;
884 }
885
886 /* Fill table with pointers to buckets in hashtable. */
887 table = xcalloc(ht->count, sizeof(*table));
888 for (pos=0, i=0; i<ht->size; i++) {
889 struct bucket *b = ht->table[i];
890 while (b != NULL) {
891 table[pos++] = b;
892 b = b->next;
893 }
894 }
895 assert(pos == ht->count);
896
897 if (full) {
898 /* full report overrides start and end */
899 start = 0;
900 end = ht->count;
901 } else
902 end = min(ht->count, (uint32_t)start+MAX_ENTRIES);
903
904 str_appendf(buf, "(%u-%u of %u)<br/>\n", start+1, end, ht->count);
905 qsort_buckets(table, ht->count, start, end, sort);
906 ht->format_cols_func(buf);
907
908 for (i=start; i<end; i++) {
909 ht->format_row_func(buf, table[i], alt ? "alt1" : "alt2");
910 alt = !alt; /* alternate class for table rows */
911 }
912 free(table);
913 str_append(buf, "</table>\n");
914 }
915
916 /* ---------------------------------------------------------------------------
917 * Web interface: sorted table of hosts.
918 */
919 static struct str *
920 html_hosts_main(const char *qs)
921 {
922 struct str *buf = str_make();
923 char *qs_start, *qs_sort, *qs_full, *ep;
924 const char *sortstr;
925 int start, full = 0;
926 enum sort_dir sort;
927
928 /* parse query string */
929 qs_start = qs_get(qs, "start");
930 qs_sort = qs_get(qs, "sort");
931 qs_full = qs_get(qs, "full");
932 if (qs_full != NULL) {
933 full = 1;
934 free(qs_full);
935 }
936
937 /* validate sort */
938 if (qs_sort == NULL) sort = TOTAL;
939 else if (strcmp(qs_sort, "total") == 0) sort = TOTAL;
940 else if (strcmp(qs_sort, "in") == 0) sort = IN;
941 else if (strcmp(qs_sort, "out") == 0) sort = OUT;
942 else if (strcmp(qs_sort, "lastseen") == 0) sort = LASTSEEN;
943 else {
944 str_append(buf, "Error: invalid value for \"sort\".\n");
945 goto done;
946 }
947
948 /* parse start */
949 if (qs_start == NULL)
950 start = 0;
951 else {
952 start = (int)strtoul(qs_start, &ep, 10);
953 if (*ep != '\0') {
954 str_append(buf, "Error: \"start\" is not a number.\n");
955 goto done;
956 }
957 if ((errno == ERANGE) ||
958 (start < 0) || (start >= (int)hosts_db->count)) {
959 str_append(buf, "Error: \"start\" is out of bounds.\n");
960 goto done;
961 }
962 }
963
964 #define PREV "&lt;&lt;&lt; prev page"
965 #define NEXT "next page &gt;&gt;&gt;"
966 #define FULL "full table"
967
968 str_append(buf, html_header_1);
969 str_appendf(buf, " <title>darkstat3: Hosts (%s)</title>\n", interface);
970 str_append(buf, html_header_2);
971 str_appendf(buf, "<h2 class=\"pageheader\">Hosts (%s)</h2>\n", interface);
972 format_table(buf, hosts_db, start, sort, full);
973
974 /* <prev | full | stats | next> */
975 sortstr = qs_sort;
976 if (sortstr == NULL) sortstr = "total";
977 if (start > 0) {
978 int prev = max(start - MAX_ENTRIES, 0);
979 str_appendf(buf, "<a href=\"?start=%d&sort=%s\">" PREV "</a>",
980 prev, sortstr);
981 } else
982 str_append(buf, PREV);
983
984 if (full)
985 str_append(buf, " | " FULL);
986 else
987 str_appendf(buf, " | <a href=\"?full=yes&sort=%s\">" FULL "</a>",
988 sortstr);
989
990 if (start+MAX_ENTRIES < (int)hosts_db->count)
991 str_appendf(buf, " | <a href=\"?start=%d&sort=%s\">" NEXT "</a>",
992 start+MAX_ENTRIES, sortstr);
993 else
994 str_append(buf, " | " NEXT);
995
996 str_append(buf, "<br/>\n");
997 str_append(buf, html_footer);
998 done:
999 if (qs_start != NULL) free(qs_start);
1000 if (qs_sort != NULL) free(qs_sort);
1001 return buf;
1002 #undef PREV
1003 #undef NEXT
1004 #undef FULL
1005 }
1006
1007 /* ---------------------------------------------------------------------------
1008 * Web interface: detailed view of a single host.
1009 */
1010 static struct str *
1011 html_hosts_detail(const char *ip)
1012 {
1013 struct bucket *h;
1014 struct str *buf, *ls_len;
1015 char ls_when[100];
1016 const char *canonical;
1017 time_t ls;
1018
1019 h = host_search(ip);
1020 if (h == NULL)
1021 return (NULL); /* no such host */
1022
1023 canonical = addr_to_str(&(h->u.host.addr));
1024
1025 /* Overview. */
1026 buf = str_make();
1027 str_append(buf, html_header_1);
1028 str_appendf(buf, " <title>%s</title>\n", ip);
1029 str_append(buf, html_header_2);
1030 str_appendf(buf, "<h2>%s</h2>\n", ip);
1031 if (strcmp(ip, canonical) != 0)
1032 str_appendf(buf, "(canonically <b>%s</b>)\n", canonical);
1033 str_appendf(buf,
1034 "<p>\n"
1035 "<b>Hostname:</b> %s<br/>\n",
1036 (h->u.host.dns == NULL)?"(resolving...)":h->u.host.dns);
1037
1038 /* Resolve host "on demand" */
1039 if (h->u.host.dns == NULL)
1040 dns_queue(&(h->u.host.addr));
1041
1042 if (show_mac_addrs)
1043 str_appendf(buf,
1044 "<b>MAC Address:</b> "
1045 "<tt>%x:%x:%x:%x:%x:%x</tt><br/>\n",
1046 h->u.host.mac_addr[0],
1047 h->u.host.mac_addr[1],
1048 h->u.host.mac_addr[2],
1049 h->u.host.mac_addr[3],
1050 h->u.host.mac_addr[4],
1051 h->u.host.mac_addr[5]);
1052
1053 str_append(buf,
1054 "</p>\n"
1055 "<p>\n"
1056 "<b>Last seen:</b> ");
1057
1058 ls = h->u.host.last_seen;
1059 if (strftime(ls_when, sizeof(ls_when),
1060 "%Y-%m-%d %H:%M:%S %Z%z", localtime(&ls)) != 0)
1061 str_append(buf, ls_when);
1062
1063 if (h->u.host.last_seen <= now) {
1064 ls_len = length_of_time(now - h->u.host.last_seen);
1065 str_append(buf, " (");
1066 str_appendstr(buf, ls_len);
1067 str_free(ls_len);
1068 str_append(buf, " ago)");
1069 } else {
1070 str_append(buf, " (in the future, possible clock problem)");
1071 }
1072
1073 str_appendf(buf,
1074 "</p>\n"
1075 "<p>\n"
1076 " <b>In:</b> %'qu<br/>\n"
1077 " <b>Out:</b> %'qu<br/>\n"
1078 " <b>Total:</b> %'qu<br/>\n"
1079 "</p>\n",
1080 h->in, h->out, h->total);
1081
1082 str_append(buf, "<h3>TCP ports</h3>\n");
1083 format_table(buf, h->u.host.ports_tcp, 0,TOTAL,0);
1084
1085 str_append(buf, "<h3>UDP ports</h3>\n");
1086 format_table(buf, h->u.host.ports_udp, 0,TOTAL,0);
1087
1088 str_append(buf, "<h3>IP protocols</h3>\n");
1089 format_table(buf, h->u.host.ip_protos, 0,TOTAL,0);
1090
1091 str_append(buf, html_footer);
1092 return (buf);
1093 }
1094
1095 /* ---------------------------------------------------------------------------
1096 * Database import and export code:
1097 * Initially written and contributed by Ben Stewart.
1098 * copyright (c) 2007 Ben Stewart, Emil Mikulic.
1099 */
1100 static int hosts_db_export_ip(const struct hashtable *h, const int fd);
1101 static int hosts_db_export_tcp(const struct hashtable *h, const int fd);
1102 static int hosts_db_export_udp(const struct hashtable *h, const int fd);
1103
/* One-byte markers that open a host's IP protocol, TCP and UDP sections. */
static const char export_proto_ip = 'P';
static const char export_proto_tcp = 'T';
static const char export_proto_udp = 'U';

/* Four-byte host record headers; the last byte is the format version. */
static const unsigned char export_tag_host_ver1[] = {'H', 'S', 'T', 0x01};
static const unsigned char export_tag_host_ver2[] = {'H', 'S', 'T', 0x02};
1112
1113 /* ---------------------------------------------------------------------------
1114 * Load a host's ip_proto table from a file.
1115 * Returns 0 on failure, 1 on success.
1116 */
1117 static int
1118 hosts_db_import_ip(const int fd, struct bucket *host)
1119 {
1120 uint8_t count, i;
1121
1122 if (!expect8(fd, export_proto_ip)) return 0;
1123 if (!read8(fd, &count)) return 0;
1124
1125 for (i=0; i<count; i++) {
1126 struct bucket *b;
1127 uint8_t proto;
1128 uint64_t in, out;
1129
1130 if (!read8(fd, &proto)) return 0;
1131 if (!read64(fd, &in)) return 0;
1132 if (!read64(fd, &out)) return 0;
1133
1134 /* Store data */
1135 b = host_get_ip_proto(host, proto);
1136 b->in = in;
1137 b->out = out;
1138 b->total = in + out;
1139 assert(b->u.ip_proto.proto == proto); /* should be done by make fn */
1140 }
1141 return 1;
1142 }
1143
1144 /* ---------------------------------------------------------------------------
1145 * Load a host's port_tcp table from a file.
1146 * Returns 0 on failure, 1 on success.
1147 */
1148 static int
1149 hosts_db_import_tcp(const int fd, struct bucket *host)
1150 {
1151 uint16_t count, i;
1152
1153 if (!expect8(fd, export_proto_tcp)) return 0;
1154 if (!read16(fd, &count)) return 0;
1155
1156 for (i=0; i<count; i++) {
1157 struct bucket *b;
1158 uint16_t port;
1159 uint64_t in, out, syn;
1160
1161 if (!read16(fd, &port)) return 0;
1162 if (!read64(fd, &syn)) return 0;
1163 if (!read64(fd, &in)) return 0;
1164 if (!read64(fd, &out)) return 0;
1165
1166 /* Store data */
1167 b = host_get_port_tcp(host, port);
1168 b->in = in;
1169 b->out = out;
1170 b->total = in + out;
1171 assert(b->u.port_tcp.port == port); /* done by make_func_port_tcp */
1172 b->u.port_tcp.syn = syn;
1173 }
1174 return 1;
1175 }
1176
1177 /* ---------------------------------------------------------------------------
1178 * Load a host's port_tcp table from a file.
1179 * Returns 0 on failure, 1 on success.
1180 */
1181 static int
1182 hosts_db_import_udp(const int fd, struct bucket *host)
1183 {
1184 uint16_t count, i;
1185
1186 if (!expect8(fd, export_proto_udp)) return 0;
1187 if (!read16(fd, &count)) return 0;
1188
1189 for (i=0; i<count; i++) {
1190 struct bucket *b;
1191 uint16_t port;
1192 uint64_t in, out;
1193
1194 if (!read16(fd, &port)) return 0;
1195 if (!read64(fd, &in)) return 0;
1196 if (!read64(fd, &out)) return 0;
1197
1198 /* Store data */
1199 b = host_get_port_udp(host, port);
1200 b->in = in;
1201 b->out = out;
1202 b->total = in + out;
1203 assert(b->u.port_udp.port == port); /* done by make_func */
1204 }
1205 return 1;
1206 }
1207
1208 /* ---------------------------------------------------------------------------
1209 * Load all hosts from a file.
1210 * Returns 0 on failure, 1 on success.
1211 */
1212 static int
1213 hosts_db_import_host(const int fd)
1214 {
1215 struct bucket *host;
1216 struct addr a;
1217 uint8_t hostname_len;
1218 uint64_t in, out;
1219 unsigned int pos = xtell(fd);
1220 char hdr[4];
1221 int ver = 0;
1222
1223 if (!readn(fd, hdr, sizeof(hdr))) return 0;
1224 if (memcmp(hdr, export_tag_host_ver2, sizeof(hdr)) == 0)
1225 ver = 2;
1226 else if (memcmp(hdr, export_tag_host_ver1, sizeof(hdr)) == 0)
1227 ver = 1;
1228 else {
1229 warnx("bad host header: %02x%02x%02x%02x",
1230 hdr[0], hdr[1], hdr[2], hdr[3]);
1231 return 0;
1232 }
1233
1234 if (!readaddr(fd, &a)) return 0;
1235 verbosef("at file pos %u, importing host %s", pos, addr_to_str(&a));
1236 host = host_get(&a);
1237 assert(addr_equal(&(host->u.host.addr), &a));
1238
1239 if (ver > 1) {
1240 uint64_t t;
1241 if (!read64(fd, &t)) return 0;
1242 host->u.host.last_seen = (time_t)t;
1243 }
1244
1245 assert(sizeof(host->u.host.mac_addr) == 6);
1246 if (!readn(fd, host->u.host.mac_addr, sizeof(host->u.host.mac_addr)))
1247 return 0;
1248
1249 /* HOSTNAME */
1250 assert(host->u.host.dns == NULL); /* make fn? */
1251 if (!read8(fd, &hostname_len)) return 0;
1252 if (hostname_len > 0) {
1253 host->u.host.dns = xmalloc(hostname_len + 1);
1254 host->u.host.dns[0] = '\0';
1255
1256 /* At this point, the hostname is attached to a host which is in our
1257 * hosts_db, so if we bail out due to an import error, this pointer
1258 * isn't lost and leaked, it can be cleaned up in hosts_db_{free,reset}
1259 */
1260
1261 if (!readn(fd, host->u.host.dns, hostname_len)) return 0;
1262 host->u.host.dns[hostname_len] = '\0';
1263 }
1264
1265 if (!read64(fd, &in)) return 0;
1266 if (!read64(fd, &out)) return 0;
1267
1268 host->in = in;
1269 host->out = out;
1270 host->total = in + out;
1271
1272 /* Host's port and proto subtables: */
1273 if (!hosts_db_import_ip(fd, host)) return 0;
1274 if (!hosts_db_import_tcp(fd, host)) return 0;
1275 if (!hosts_db_import_udp(fd, host)) return 0;
1276 return 1;
1277 }
1278
/* ---------------------------------------------------------------------------
 * Database Import: read the hosts_db segment from a file supplied by the
 * caller.
 *
 * Only the data is read here, not the segment header: the caller is expected
 * to have validated the header already and to have left the file positioned
 * at the start of the data, which begins with a 32-bit host count followed
 * by that many host records.
 *
 * Returns 1 once every host record was imported, 0 on the first failure.
 */
int hosts_db_import(const int fd)
{
   uint32_t remaining;

   if (!read32(fd, &remaining))
      return 0;

   while (remaining > 0) {
      if (!hosts_db_import_host(fd))
         return 0;
      remaining--;
   }

   return 1;
}
1297
1298 /* ---------------------------------------------------------------------------
1299 * Database Export: Dump hosts_db into a file provided by the caller.
1300 * The caller is responsible for writing out export_tag_hosts_ver1 first.
1301 */
1302 int hosts_db_export(const int fd)
1303 {
1304 uint32_t i;
1305 struct bucket *b;
1306
1307 if (!write32(fd, hosts_db->count)) return 0;
1308
1309 for (i = 0; i<hosts_db->size; i++)
1310 for (b = hosts_db->table[i]; b != NULL; b = b->next) {
1311 /* For each host: */
1312 if (!writen(fd, export_tag_host_ver2, sizeof(export_tag_host_ver2)))
1313 return 0;
1314
1315 if (!writeaddr(fd, &(b->u.host.addr))) return 0;
1316
1317 if (!write64(fd, (uint64_t)(b->u.host.last_seen))) return 0;
1318
1319 assert(sizeof(b->u.host.mac_addr) == 6);
1320 if (!writen(fd, b->u.host.mac_addr, sizeof(b->u.host.mac_addr)))
1321 return 0;
1322
1323 /* HOSTNAME */
1324 if (b->u.host.dns == NULL) {
1325 if (!write8(fd, 0)) return 0;
1326 } else {
1327 int dnslen = strlen(b->u.host.dns);
1328
1329 if (dnslen > 255) {
1330 warnx("found a very long hostname: \"%s\"\n"
1331 "wasn't expecting one longer than 255 chars (this one is %d)",
1332 b->u.host.dns, dnslen);
1333 dnslen = 255;
1334 }
1335
1336 if (!write8(fd, (uint8_t)dnslen)) return 0;
1337 if (!writen(fd, b->u.host.dns, dnslen)) return 0;
1338 }
1339
1340 if (!write64(fd, b->in)) return 0;
1341 if (!write64(fd, b->out)) return 0;
1342
1343 if (!hosts_db_export_ip(b->u.host.ip_protos, fd)) return 0;
1344 if (!hosts_db_export_tcp(b->u.host.ports_tcp, fd)) return 0;
1345 if (!hosts_db_export_udp(b->u.host.ports_udp, fd)) return 0;
1346 }
1347 return 1;
1348 }
1349
1350 /* ---------------------------------------------------------------------------
1351 * Dump the ip_proto table of a host.
1352 */
1353 static int
1354 hosts_db_export_ip(const struct hashtable *h, const int fd)
1355 {
1356 uint32_t i, written = 0;
1357 struct bucket *b;
1358
1359 /* IP DATA */
1360 if (!write8(fd, export_proto_ip)) return 0;
1361
1362 /* If no data, write a IP Proto count of 0 and we're done. */
1363 if (h == NULL) {
1364 if (!write8(fd, 0)) return 0;
1365 return 1;
1366 }
1367
1368 assert(h->count < 256);
1369 if (!write8(fd, (uint8_t)h->count)) return 0;
1370
1371 for (i = 0; i<h->size; i++)
1372 for (b = h->table[i]; b != NULL; b = b->next) {
1373 /* For each ip_proto bucket: */
1374
1375 if (!write8(fd, b->u.ip_proto.proto)) return 0;
1376 if (!write64(fd, b->in)) return 0;
1377 if (!write64(fd, b->out)) return 0;
1378 written++;
1379 }
1380 assert(written == h->count);
1381 return 1;
1382 }
1383
1384 /* ---------------------------------------------------------------------------
1385 * Dump the port_tcp table of a host.
1386 */
1387 static int
1388 hosts_db_export_tcp(const struct hashtable *h, const int fd)
1389 {
1390 struct bucket *b;
1391 uint32_t i, written = 0;
1392
1393 /* TCP DATA */
1394 if (!write8(fd, export_proto_tcp)) return 0;
1395
1396 /* If no data, write a count of 0 and we're done. */
1397 if (h == NULL) {
1398 if (!write16(fd, 0)) return 0;
1399 return 1;
1400 }
1401
1402 assert(h->count < 65536);
1403 if (!write16(fd, (uint16_t)h->count)) return 0;
1404
1405 for (i = 0; i<h->size; i++)
1406 for (b = h->table[i]; b != NULL; b = b->next) {
1407 if (!write16(fd, b->u.port_tcp.port)) return 0;
1408 if (!write64(fd, b->u.port_tcp.syn)) return 0;
1409 if (!write64(fd, b->in)) return 0;
1410 if (!write64(fd, b->out)) return 0;
1411 written++;
1412 }
1413 assert(written == h->count);
1414 return 1;
1415 }
1416
1417 /* ---------------------------------------------------------------------------
1418 * Dump the port_udp table of a host.
1419 */
1420 static int
1421 hosts_db_export_udp(const struct hashtable *h, const int fd)
1422 {
1423 struct bucket *b;
1424 uint32_t i, written = 0;
1425
1426 /* UDP DATA */
1427 if (!write8(fd, export_proto_udp)) return 0;
1428
1429 /* If no data, write a count of 0 and we're done. */
1430 if (h == NULL) {
1431 if (!write16(fd, 0)) return 0;
1432 return 1;
1433 }
1434
1435 assert(h->count < 65536);
1436 if (!write16(fd, (uint16_t)h->count)) return 0;
1437
1438 for (i = 0; i<h->size; i++)
1439 for (b = h->table[i]; b != NULL; b = b->next) {
1440 if (!write16(fd, b->u.port_udp.port)) return 0;
1441 if (!write64(fd, b->in)) return 0;
1442 if (!write64(fd, b->out)) return 0;
1443 written++;
1444 }
1445 assert(written == h->count);
1446 return 1;
1447 }
1448
1449 /* vim:set ts=3 sw=3 tw=78 expandtab: */