[NETFILTER] NAT sequence adjustment: Save eight bytes per conntrack
[linux-block.git] / net / netfilter / nfnetlink_log.c
CommitLineData
0597f268
HW
/*
 * This is a module which is used for logging packets to userspace via
 * nfnetlink.
 *
 * (C) 2005 by Harald Welte <laforge@netfilter.org>
 *
 * Based on the old ipv4-only ipt_ULOG.c:
 * (C) 2000-2004 by Harald Welte <laforge@netfilter.org>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 */
15#include <linux/module.h>
16#include <linux/skbuff.h>
17#include <linux/init.h>
18#include <linux/ip.h>
19#include <linux/ipv6.h>
20#include <linux/netdevice.h>
21#include <linux/netfilter.h>
22#include <linux/netlink.h>
23#include <linux/netfilter/nfnetlink.h>
24#include <linux/netfilter/nfnetlink_log.h>
25#include <linux/spinlock.h>
26#include <linux/sysctl.h>
27#include <linux/proc_fs.h>
28#include <linux/security.h>
29#include <linux/list.h>
30#include <linux/jhash.h>
31#include <linux/random.h>
32#include <net/sock.h>
33
34#include <asm/atomic.h>
35
fbcd923c
HW
36#ifdef CONFIG_BRIDGE_NETFILTER
37#include "../bridge/br_private.h"
38#endif
39
/* Defaults applied to every newly created instance (see instance_create()). */
#define NFULNL_NLBUFSIZ_DEFAULT	NLMSG_GOODSIZE	/* netlink buffer size */
#define NFULNL_TIMEOUT_DEFAULT	100		/* flush timeout in 1/100 s, i.e. one second */
#define NFULNL_QTHRESH_DEFAULT	100		/* flush after 100 queued packets */
43
/*
 * Rate-limited printk(): the message is emitted only when net_ratelimit()
 * allows it.
 *
 * The expansion deliberately does NOT end in a semicolon, so that
 * "PRINTR(...);" is exactly one statement and can be used as the body of
 * an unbraced if/else.
 */
#define PRINTR(x, args...)	do { if (net_ratelimit()) \
				     printk(x, ## args); } while (0)
46
/*
 * Debug tracing.  With the "#if 0" below flipped to "#if 1", UDEBUG()
 * prints at KERN_DEBUG level, prefixed with file, line and function name;
 * as shipped it expands to nothing.
 */
#if 0
#define UDEBUG(x, args ...)					\
	printk(KERN_DEBUG "%s(%d):%s(): " x,			\
	       __FILE__, __LINE__, __FUNCTION__, ## args)
#else
#define UDEBUG(x, ...)
#endif
54
55struct nfulnl_instance {
56 struct hlist_node hlist; /* global list of instances */
57 spinlock_t lock;
58 atomic_t use; /* use count */
59
60 unsigned int qlen; /* number of nlmsgs in skb */
61 struct sk_buff *skb; /* pre-allocatd skb */
62 struct nlmsghdr *lastnlh; /* netlink header of last msg in skb */
63 struct timer_list timer;
64 int peer_pid; /* PID of the peer process */
65
66 /* configurable parameters */
67 unsigned int flushtimeout; /* timeout until queue flush */
68 unsigned int nlbufsiz; /* netlink buffer allocation size */
69 unsigned int qthreshold; /* threshold of the queue */
70 u_int32_t copy_range;
71 u_int16_t group_num; /* number of this queue */
72 u_int8_t copy_mode;
73};
74
75static DEFINE_RWLOCK(instances_lock);
76
77#define INSTANCE_BUCKETS 16
78static struct hlist_head instance_table[INSTANCE_BUCKETS];
79static unsigned int hash_init;
80
81static inline u_int8_t instance_hashfn(u_int16_t group_num)
82{
83 return ((group_num & 0xff) % INSTANCE_BUCKETS);
84}
85
86static struct nfulnl_instance *
87__instance_lookup(u_int16_t group_num)
88{
89 struct hlist_head *head;
90 struct hlist_node *pos;
91 struct nfulnl_instance *inst;
92
93 UDEBUG("entering (group_num=%u)\n", group_num);
94
95 head = &instance_table[instance_hashfn(group_num)];
96 hlist_for_each_entry(inst, pos, head, hlist) {
97 if (inst->group_num == group_num)
98 return inst;
99 }
100 return NULL;
101}
102
103static inline void
104instance_get(struct nfulnl_instance *inst)
105{
106 atomic_inc(&inst->use);
107}
108
109static struct nfulnl_instance *
110instance_lookup_get(u_int16_t group_num)
111{
112 struct nfulnl_instance *inst;
113
114 read_lock_bh(&instances_lock);
115 inst = __instance_lookup(group_num);
116 if (inst)
117 instance_get(inst);
118 read_unlock_bh(&instances_lock);
119
120 return inst;
121}
122
123static void
124instance_put(struct nfulnl_instance *inst)
125{
126 if (inst && atomic_dec_and_test(&inst->use)) {
127 UDEBUG("kfree(inst=%p)\n", inst);
128 kfree(inst);
129 }
130}
131
132static void nfulnl_timer(unsigned long data);
133
134static struct nfulnl_instance *
135instance_create(u_int16_t group_num, int pid)
136{
137 struct nfulnl_instance *inst;
138
139 UDEBUG("entering (group_num=%u, pid=%d)\n", group_num,
140 pid);
141
142 write_lock_bh(&instances_lock);
143 if (__instance_lookup(group_num)) {
144 inst = NULL;
145 UDEBUG("aborting, instance already exists\n");
146 goto out_unlock;
147 }
148
10dfdc69 149 inst = kzalloc(sizeof(*inst), GFP_ATOMIC);
0597f268
HW
150 if (!inst)
151 goto out_unlock;
152
0597f268 153 INIT_HLIST_NODE(&inst->hlist);
181a46a5 154 spin_lock_init(&inst->lock);
0597f268
HW
155 /* needs to be two, since we _put() after creation */
156 atomic_set(&inst->use, 2);
157
158 init_timer(&inst->timer);
159 inst->timer.function = nfulnl_timer;
160 inst->timer.data = (unsigned long)inst;
161 /* don't start timer yet. (re)start it with every packet */
162
163 inst->peer_pid = pid;
164 inst->group_num = group_num;
165
166 inst->qthreshold = NFULNL_QTHRESH_DEFAULT;
167 inst->flushtimeout = NFULNL_TIMEOUT_DEFAULT;
168 inst->nlbufsiz = NFULNL_NLBUFSIZ_DEFAULT;
169 inst->copy_mode = NFULNL_COPY_PACKET;
170 inst->copy_range = 0xffff;
171
172 if (!try_module_get(THIS_MODULE))
173 goto out_free;
174
175 hlist_add_head(&inst->hlist,
176 &instance_table[instance_hashfn(group_num)]);
177
178 UDEBUG("newly added node: %p, next=%p\n", &inst->hlist,
179 inst->hlist.next);
180
181 write_unlock_bh(&instances_lock);
182
183 return inst;
184
185out_free:
186 instance_put(inst);
187out_unlock:
188 write_unlock_bh(&instances_lock);
189 return NULL;
190}
191
192static int __nfulnl_send(struct nfulnl_instance *inst);
193
194static void
195_instance_destroy2(struct nfulnl_instance *inst, int lock)
196{
197 /* first pull it out of the global list */
198 if (lock)
199 write_lock_bh(&instances_lock);
200
201 UDEBUG("removing instance %p (queuenum=%u) from hash\n",
202 inst, inst->group_num);
203
204 hlist_del(&inst->hlist);
205
206 if (lock)
207 write_unlock_bh(&instances_lock);
208
209 /* then flush all pending packets from skb */
210
211 spin_lock_bh(&inst->lock);
212 if (inst->skb) {
213 if (inst->qlen)
214 __nfulnl_send(inst);
215 if (inst->skb) {
216 kfree_skb(inst->skb);
217 inst->skb = NULL;
218 }
219 }
220 spin_unlock_bh(&inst->lock);
221
222 /* and finally put the refcount */
223 instance_put(inst);
224
225 module_put(THIS_MODULE);
226}
227
/* Destroy @inst; the caller already holds instances_lock for writing. */
static inline void __instance_destroy(struct nfulnl_instance *inst)
{
	const int take_lock = 0;

	_instance_destroy2(inst, take_lock);
}
233
/* Destroy @inst, taking instances_lock internally. */
static inline void instance_destroy(struct nfulnl_instance *inst)
{
	const int take_lock = 1;

	_instance_destroy2(inst, take_lock);
}
239
240static int
241nfulnl_set_mode(struct nfulnl_instance *inst, u_int8_t mode,
242 unsigned int range)
243{
244 int status = 0;
245
246 spin_lock_bh(&inst->lock);
247
248 switch (mode) {
249 case NFULNL_COPY_NONE:
250 case NFULNL_COPY_META:
251 inst->copy_mode = mode;
252 inst->copy_range = 0;
253 break;
254
255 case NFULNL_COPY_PACKET:
256 inst->copy_mode = mode;
257 /* we're using struct nfattr which has 16bit nfa_len */
258 if (range > 0xffff)
259 inst->copy_range = 0xffff;
260 else
261 inst->copy_range = range;
262 break;
263
264 default:
265 status = -EINVAL;
266 break;
267 }
268
269 spin_unlock_bh(&inst->lock);
270
271 return status;
272}
273
274static int
275nfulnl_set_nlbufsiz(struct nfulnl_instance *inst, u_int32_t nlbufsiz)
276{
277 int status;
278
279 spin_lock_bh(&inst->lock);
280 if (nlbufsiz < NFULNL_NLBUFSIZ_DEFAULT)
281 status = -ERANGE;
282 else if (nlbufsiz > 131072)
283 status = -ERANGE;
284 else {
285 inst->nlbufsiz = nlbufsiz;
286 status = 0;
287 }
288 spin_unlock_bh(&inst->lock);
289
290 return status;
291}
292
293static int
294nfulnl_set_timeout(struct nfulnl_instance *inst, u_int32_t timeout)
295{
296 spin_lock_bh(&inst->lock);
297 inst->flushtimeout = timeout;
298 spin_unlock_bh(&inst->lock);
299
300 return 0;
301}
302
303static int
304nfulnl_set_qthresh(struct nfulnl_instance *inst, u_int32_t qthresh)
305{
306 spin_lock_bh(&inst->lock);
307 inst->qthreshold = qthresh;
308 spin_unlock_bh(&inst->lock);
309
310 return 0;
311}
312
313static struct sk_buff *nfulnl_alloc_skb(unsigned int inst_size,
314 unsigned int pkt_size)
315{
316 struct sk_buff *skb;
ad2ad0f9 317 unsigned int n;
0597f268
HW
318
319 UDEBUG("entered (%u, %u)\n", inst_size, pkt_size);
320
321 /* alloc skb which should be big enough for a whole multipart
322 * message. WARNING: has to be <= 128k due to slab restrictions */
323
ad2ad0f9
PM
324 n = max(inst_size, pkt_size);
325 skb = alloc_skb(n, GFP_ATOMIC);
0597f268
HW
326 if (!skb) {
327 PRINTR("nfnetlink_log: can't alloc whole buffer (%u bytes)\n",
328 inst_size);
329
ad2ad0f9
PM
330 if (n > pkt_size) {
331 /* try to allocate only as much as we need for current
332 * packet */
0597f268 333
ad2ad0f9
PM
334 skb = alloc_skb(pkt_size, GFP_ATOMIC);
335 if (!skb)
336 PRINTR("nfnetlink_log: can't even alloc %u "
337 "bytes\n", pkt_size);
338 }
0597f268
HW
339 }
340
341 return skb;
342}
343
344static int
345__nfulnl_send(struct nfulnl_instance *inst)
346{
347 int status;
348
349 if (timer_pending(&inst->timer))
350 del_timer(&inst->timer);
351
352 if (inst->qlen > 1)
353 inst->lastnlh->nlmsg_type = NLMSG_DONE;
354
355 status = nfnetlink_unicast(inst->skb, inst->peer_pid, MSG_DONTWAIT);
356 if (status < 0) {
357 UDEBUG("netlink_unicast() failed\n");
358 /* FIXME: statistics */
359 }
360
361 inst->qlen = 0;
362 inst->skb = NULL;
363 inst->lastnlh = NULL;
364
365 return status;
366}
367
368static void nfulnl_timer(unsigned long data)
369{
370 struct nfulnl_instance *inst = (struct nfulnl_instance *)data;
371
372 UDEBUG("timer function called, flushing buffer\n");
373
374 spin_lock_bh(&inst->lock);
375 __nfulnl_send(inst);
376 instance_put(inst);
377 spin_unlock_bh(&inst->lock);
378}
379
380static inline int
381__build_packet_message(struct nfulnl_instance *inst,
382 const struct sk_buff *skb,
383 unsigned int data_len,
384 unsigned int pf,
385 unsigned int hooknum,
386 const struct net_device *indev,
387 const struct net_device *outdev,
388 const struct nf_loginfo *li,
389 const char *prefix)
390{
391 unsigned char *old_tail;
392 struct nfulnl_msg_packet_hdr pmsg;
393 struct nlmsghdr *nlh;
394 struct nfgenmsg *nfmsg;
395 u_int32_t tmp_uint;
396
397 UDEBUG("entered\n");
398
399 old_tail = inst->skb->tail;
400 nlh = NLMSG_PUT(inst->skb, 0, 0,
401 NFNL_SUBSYS_ULOG << 8 | NFULNL_MSG_PACKET,
402 sizeof(struct nfgenmsg));
403 nfmsg = NLMSG_DATA(nlh);
404 nfmsg->nfgen_family = pf;
405 nfmsg->version = NFNETLINK_V0;
406 nfmsg->res_id = htons(inst->group_num);
407
408 pmsg.hw_protocol = htons(skb->protocol);
409 pmsg.hook = hooknum;
410
411 NFA_PUT(inst->skb, NFULA_PACKET_HDR, sizeof(pmsg), &pmsg);
412
413 if (prefix) {
414 int slen = strlen(prefix);
415 if (slen > NFULNL_PREFIXLEN)
416 slen = NFULNL_PREFIXLEN;
417 NFA_PUT(inst->skb, NFULA_PREFIX, slen, prefix);
418 }
419
420 if (indev) {
421 tmp_uint = htonl(indev->ifindex);
fbcd923c 422#ifndef CONFIG_BRIDGE_NETFILTER
0597f268
HW
423 NFA_PUT(inst->skb, NFULA_IFINDEX_INDEV, sizeof(tmp_uint),
424 &tmp_uint);
fbcd923c
HW
425#else
426 if (pf == PF_BRIDGE) {
427 /* Case 1: outdev is physical input device, we need to
428 * look for bridge group (when called from
429 * netfilter_bridge) */
430 NFA_PUT(inst->skb, NFULA_IFINDEX_PHYSINDEV,
431 sizeof(tmp_uint), &tmp_uint);
432 /* this is the bridge group "brX" */
433 tmp_uint = htonl(indev->br_port->br->dev->ifindex);
434 NFA_PUT(inst->skb, NFULA_IFINDEX_INDEV,
435 sizeof(tmp_uint), &tmp_uint);
436 } else {
437 /* Case 2: indev is bridge group, we need to look for
438 * physical device (when called from ipv4) */
439 NFA_PUT(inst->skb, NFULA_IFINDEX_INDEV,
440 sizeof(tmp_uint), &tmp_uint);
441 if (skb->nf_bridge && skb->nf_bridge->physindev) {
442 tmp_uint =
443 htonl(skb->nf_bridge->physindev->ifindex);
444 NFA_PUT(inst->skb, NFULA_IFINDEX_PHYSINDEV,
445 sizeof(tmp_uint), &tmp_uint);
446 }
447 }
448#endif
0597f268
HW
449 }
450
451 if (outdev) {
452 tmp_uint = htonl(outdev->ifindex);
fbcd923c 453#ifndef CONFIG_BRIDGE_NETFILTER
0597f268
HW
454 NFA_PUT(inst->skb, NFULA_IFINDEX_OUTDEV, sizeof(tmp_uint),
455 &tmp_uint);
fbcd923c
HW
456#else
457 if (pf == PF_BRIDGE) {
458 /* Case 1: outdev is physical output device, we need to
459 * look for bridge group (when called from
460 * netfilter_bridge) */
461 NFA_PUT(inst->skb, NFULA_IFINDEX_PHYSOUTDEV,
462 sizeof(tmp_uint), &tmp_uint);
463 /* this is the bridge group "brX" */
464 tmp_uint = htonl(outdev->br_port->br->dev->ifindex);
465 NFA_PUT(inst->skb, NFULA_IFINDEX_OUTDEV,
466 sizeof(tmp_uint), &tmp_uint);
467 } else {
468 /* Case 2: indev is a bridge group, we need to look
469 * for physical device (when called from ipv4) */
470 NFA_PUT(inst->skb, NFULA_IFINDEX_OUTDEV,
471 sizeof(tmp_uint), &tmp_uint);
472 if (skb->nf_bridge) {
473 tmp_uint =
474 htonl(skb->nf_bridge->physoutdev->ifindex);
475 NFA_PUT(inst->skb, NFULA_IFINDEX_PHYSOUTDEV,
476 sizeof(tmp_uint), &tmp_uint);
477 }
478 }
479#endif
0597f268
HW
480 }
481
482 if (skb->nfmark) {
483 tmp_uint = htonl(skb->nfmark);
484 NFA_PUT(inst->skb, NFULA_MARK, sizeof(tmp_uint), &tmp_uint);
485 }
486
487 if (indev && skb->dev && skb->dev->hard_header_parse) {
488 struct nfulnl_msg_packet_hw phw;
489
490 phw.hw_addrlen =
491 skb->dev->hard_header_parse((struct sk_buff *)skb,
492 phw.hw_addr);
493 phw.hw_addrlen = htons(phw.hw_addrlen);
494 NFA_PUT(inst->skb, NFULA_HWADDR, sizeof(phw), &phw);
495 }
496
a61bbcf2 497 if (skb->tstamp.off_sec) {
0597f268
HW
498 struct nfulnl_msg_packet_timestamp ts;
499
325ed823
HX
500 ts.sec = cpu_to_be64(skb->tstamp.off_sec);
501 ts.usec = cpu_to_be64(skb->tstamp.off_usec);
0597f268
HW
502
503 NFA_PUT(inst->skb, NFULA_TIMESTAMP, sizeof(ts), &ts);
504 }
505
506 /* UID */
507 if (skb->sk) {
508 read_lock_bh(&skb->sk->sk_callback_lock);
509 if (skb->sk->sk_socket && skb->sk->sk_socket->file) {
510 u_int32_t uid = htonl(skb->sk->sk_socket->file->f_uid);
511 /* need to unlock here since NFA_PUT may goto */
512 read_unlock_bh(&skb->sk->sk_callback_lock);
513 NFA_PUT(inst->skb, NFULA_UID, sizeof(uid), &uid);
514 } else
515 read_unlock_bh(&skb->sk->sk_callback_lock);
516 }
517
518 if (data_len) {
519 struct nfattr *nfa;
520 int size = NFA_LENGTH(data_len);
521
522 if (skb_tailroom(inst->skb) < (int)NFA_SPACE(data_len)) {
523 printk(KERN_WARNING "nfnetlink_log: no tailroom!\n");
524 goto nlmsg_failure;
525 }
526
527 nfa = (struct nfattr *)skb_put(inst->skb, NFA_ALIGN(size));
528 nfa->nfa_type = NFULA_PAYLOAD;
529 nfa->nfa_len = size;
530
531 if (skb_copy_bits(skb, 0, NFA_DATA(nfa), data_len))
532 BUG();
533 }
534
535 nlh->nlmsg_len = inst->skb->tail - old_tail;
536 return 0;
537
538nlmsg_failure:
539 UDEBUG("nlmsg_failure\n");
540nfattr_failure:
541 PRINTR(KERN_ERR "nfnetlink_log: error creating log nlmsg\n");
542 return -1;
543}
544
/*
 * Acknowledge the current netlink message with error code @err and
 * return from the enclosing void function.  Relies on variables named
 * 'skb' and 'nlh' being in scope at the point of use.
 */
#define RCV_SKB_FAIL(err)				\
	do {						\
		netlink_ack(skb, nlh, (err));		\
		return;					\
	} while (0)
546
547static struct nf_loginfo default_loginfo = {
548 .type = NF_LOG_TYPE_ULOG,
549 .u = {
550 .ulog = {
551 .copy_len = 0xffff,
552 .group = 0,
553 .qthreshold = 1,
554 },
555 },
556};
557
558/* log handler for internal netfilter logging api */
559static void
560nfulnl_log_packet(unsigned int pf,
561 unsigned int hooknum,
562 const struct sk_buff *skb,
563 const struct net_device *in,
564 const struct net_device *out,
565 const struct nf_loginfo *li_user,
566 const char *prefix)
567{
568 unsigned int size, data_len;
569 struct nfulnl_instance *inst;
570 const struct nf_loginfo *li;
571 unsigned int qthreshold;
572 unsigned int nlbufsiz;
573
574 if (li_user && li_user->type == NF_LOG_TYPE_ULOG)
575 li = li_user;
576 else
577 li = &default_loginfo;
578
579 inst = instance_lookup_get(li->u.ulog.group);
580 if (!inst)
581 inst = instance_lookup_get(0);
582 if (!inst) {
583 PRINTR("nfnetlink_log: trying to log packet, "
584 "but no instance for group %u\n", li->u.ulog.group);
585 return;
586 }
587
588 /* all macros expand to constant values at compile time */
589 /* FIXME: do we want to make the size calculation conditional based on
590 * what is actually present? way more branches and checks, but more
591 * memory efficient... */
592 size = NLMSG_SPACE(sizeof(struct nfgenmsg))
593 + NFA_SPACE(sizeof(struct nfulnl_msg_packet_hdr))
594 + NFA_SPACE(sizeof(u_int32_t)) /* ifindex */
595 + NFA_SPACE(sizeof(u_int32_t)) /* ifindex */
fbcd923c
HW
596#ifdef CONFIG_BRIDGE_NETFILTER
597 + NFA_SPACE(sizeof(u_int32_t)) /* ifindex */
598 + NFA_SPACE(sizeof(u_int32_t)) /* ifindex */
599#endif
0597f268
HW
600 + NFA_SPACE(sizeof(u_int32_t)) /* mark */
601 + NFA_SPACE(sizeof(u_int32_t)) /* uid */
602 + NFA_SPACE(NFULNL_PREFIXLEN) /* prefix */
603 + NFA_SPACE(sizeof(struct nfulnl_msg_packet_hw))
604 + NFA_SPACE(sizeof(struct nfulnl_msg_packet_timestamp));
605
606 UDEBUG("initial size=%u\n", size);
607
608 spin_lock_bh(&inst->lock);
609
610 qthreshold = inst->qthreshold;
611 /* per-rule qthreshold overrides per-instance */
612 if (qthreshold > li->u.ulog.qthreshold)
613 qthreshold = li->u.ulog.qthreshold;
614
615 switch (inst->copy_mode) {
616 case NFULNL_COPY_META:
617 case NFULNL_COPY_NONE:
618 data_len = 0;
619 break;
620
621 case NFULNL_COPY_PACKET:
622 if (inst->copy_range == 0
623 || inst->copy_range > skb->len)
624 data_len = skb->len;
625 else
626 data_len = inst->copy_range;
627
628 size += NFA_SPACE(data_len);
629 UDEBUG("copy_packet, therefore size now %u\n", size);
630 break;
631
632 default:
633 spin_unlock_bh(&inst->lock);
634 instance_put(inst);
635 return;
636 }
637
638 if (size > inst->nlbufsiz)
639 nlbufsiz = size;
640 else
641 nlbufsiz = inst->nlbufsiz;
642
643 if (!inst->skb) {
644 if (!(inst->skb = nfulnl_alloc_skb(nlbufsiz, size))) {
645 UDEBUG("error in nfulnl_alloc_skb(%u, %u)\n",
646 inst->nlbufsiz, size);
647 goto alloc_failure;
648 }
649 } else if (inst->qlen >= qthreshold ||
650 size > skb_tailroom(inst->skb)) {
651 /* either the queue len is too high or we don't have
652 * enough room in the skb left. flush to userspace. */
653 UDEBUG("flushing old skb\n");
654
655 __nfulnl_send(inst);
656
657 if (!(inst->skb = nfulnl_alloc_skb(nlbufsiz, size))) {
658 UDEBUG("error in nfulnl_alloc_skb(%u, %u)\n",
659 inst->nlbufsiz, size);
660 goto alloc_failure;
661 }
662 }
663
664 UDEBUG("qlen %d, qthreshold %d\n", inst->qlen, qthreshold);
665 inst->qlen++;
666
667 __build_packet_message(inst, skb, data_len, pf,
668 hooknum, in, out, li, prefix);
669
670 /* timer_pending always called within inst->lock, so there
671 * is no chance of a race here */
672 if (!timer_pending(&inst->timer)) {
673 instance_get(inst);
674 inst->timer.expires = jiffies + (inst->flushtimeout*HZ/100);
675 add_timer(&inst->timer);
676 }
677 spin_unlock_bh(&inst->lock);
678
679 return;
680
681alloc_failure:
682 spin_unlock_bh(&inst->lock);
683 instance_put(inst);
684 UDEBUG("error allocating skb\n");
685 /* FIXME: statistics */
686}
687
688static int
689nfulnl_rcv_nl_event(struct notifier_block *this,
690 unsigned long event, void *ptr)
691{
692 struct netlink_notify *n = ptr;
693
694 if (event == NETLINK_URELEASE &&
695 n->protocol == NETLINK_NETFILTER && n->pid) {
696 int i;
697
698 /* destroy all instances for this pid */
699 write_lock_bh(&instances_lock);
700 for (i = 0; i < INSTANCE_BUCKETS; i++) {
701 struct hlist_node *tmp, *t2;
702 struct nfulnl_instance *inst;
703 struct hlist_head *head = &instance_table[i];
704
705 hlist_for_each_entry_safe(inst, tmp, t2, head, hlist) {
706 UDEBUG("node = %p\n", inst);
707 if (n->pid == inst->peer_pid)
708 __instance_destroy(inst);
709 }
710 }
711 write_unlock_bh(&instances_lock);
712 }
713 return NOTIFY_DONE;
714}
715
716static struct notifier_block nfulnl_rtnl_notifier = {
717 .notifier_call = nfulnl_rcv_nl_event,
718};
719
720static int
721nfulnl_recv_unsupp(struct sock *ctnl, struct sk_buff *skb,
722 struct nlmsghdr *nlh, struct nfattr *nfqa[], int *errp)
723{
724 return -ENOTSUPP;
725}
726
727static struct nf_logger nfulnl_logger = {
728 .name = "nfnetlink_log",
729 .logfn = &nfulnl_log_packet,
730 .me = THIS_MODULE,
731};
732
733static const int nfula_min[NFULA_MAX] = {
734 [NFULA_PACKET_HDR-1] = sizeof(struct nfulnl_msg_packet_hdr),
735 [NFULA_MARK-1] = sizeof(u_int32_t),
736 [NFULA_TIMESTAMP-1] = sizeof(struct nfulnl_msg_packet_timestamp),
737 [NFULA_IFINDEX_INDEV-1] = sizeof(u_int32_t),
738 [NFULA_IFINDEX_OUTDEV-1]= sizeof(u_int32_t),
739 [NFULA_HWADDR-1] = sizeof(struct nfulnl_msg_packet_hw),
740 [NFULA_PAYLOAD-1] = 0,
741 [NFULA_PREFIX-1] = 0,
742 [NFULA_UID-1] = sizeof(u_int32_t),
743};
744
745static const int nfula_cfg_min[NFULA_CFG_MAX] = {
746 [NFULA_CFG_CMD-1] = sizeof(struct nfulnl_msg_config_cmd),
747 [NFULA_CFG_MODE-1] = sizeof(struct nfulnl_msg_config_mode),
748 [NFULA_CFG_TIMEOUT-1] = sizeof(u_int32_t),
749 [NFULA_CFG_QTHRESH-1] = sizeof(u_int32_t),
750 [NFULA_CFG_NLBUFSIZ-1] = sizeof(u_int32_t),
751};
752
753static int
754nfulnl_recv_config(struct sock *ctnl, struct sk_buff *skb,
755 struct nlmsghdr *nlh, struct nfattr *nfula[], int *errp)
756{
757 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
758 u_int16_t group_num = ntohs(nfmsg->res_id);
759 struct nfulnl_instance *inst;
760 int ret = 0;
761
762 UDEBUG("entering for msg %u\n", NFNL_MSG_TYPE(nlh->nlmsg_type));
763
764 if (nfattr_bad_size(nfula, NFULA_CFG_MAX, nfula_cfg_min)) {
765 UDEBUG("bad attribute size\n");
766 return -EINVAL;
767 }
768
769 inst = instance_lookup_get(group_num);
770 if (nfula[NFULA_CFG_CMD-1]) {
771 u_int8_t pf = nfmsg->nfgen_family;
772 struct nfulnl_msg_config_cmd *cmd;
773 cmd = NFA_DATA(nfula[NFULA_CFG_CMD-1]);
774 UDEBUG("found CFG_CMD for\n");
775
776 switch (cmd->command) {
777 case NFULNL_CFG_CMD_BIND:
778 if (inst) {
779 ret = -EBUSY;
780 goto out_put;
781 }
782
783 inst = instance_create(group_num,
784 NETLINK_CB(skb).pid);
785 if (!inst) {
786 ret = -EINVAL;
787 goto out_put;
788 }
789 break;
790 case NFULNL_CFG_CMD_UNBIND:
791 if (!inst) {
792 ret = -ENODEV;
793 goto out_put;
794 }
795
796 if (inst->peer_pid != NETLINK_CB(skb).pid) {
797 ret = -EPERM;
798 goto out_put;
799 }
800
801 instance_destroy(inst);
802 break;
803 case NFULNL_CFG_CMD_PF_BIND:
804 UDEBUG("registering log handler for pf=%u\n", pf);
805 ret = nf_log_register(pf, &nfulnl_logger);
806 break;
807 case NFULNL_CFG_CMD_PF_UNBIND:
808 UDEBUG("unregistering log handler for pf=%u\n", pf);
809 /* This is a bug and a feature. We cannot unregister
810 * other handlers, like nfnetlink_inst can */
811 nf_log_unregister_pf(pf);
812 break;
813 default:
814 ret = -EINVAL;
815 break;
816 }
817 } else {
818 if (!inst) {
819 UDEBUG("no config command, and no instance for "
820 "group=%u pid=%u =>ENOENT\n",
821 group_num, NETLINK_CB(skb).pid);
822 ret = -ENOENT;
823 goto out_put;
824 }
825
826 if (inst->peer_pid != NETLINK_CB(skb).pid) {
827 UDEBUG("no config command, and wrong pid\n");
828 ret = -EPERM;
829 goto out_put;
830 }
831 }
832
833 if (nfula[NFULA_CFG_MODE-1]) {
834 struct nfulnl_msg_config_mode *params;
835 params = NFA_DATA(nfula[NFULA_CFG_MODE-1]);
836
837 nfulnl_set_mode(inst, params->copy_mode,
838 ntohs(params->copy_range));
839 }
840
841 if (nfula[NFULA_CFG_TIMEOUT-1]) {
842 u_int32_t timeout =
843 *(u_int32_t *)NFA_DATA(nfula[NFULA_CFG_TIMEOUT-1]);
844
845 nfulnl_set_timeout(inst, ntohl(timeout));
846 }
847
848 if (nfula[NFULA_CFG_NLBUFSIZ-1]) {
849 u_int32_t nlbufsiz =
850 *(u_int32_t *)NFA_DATA(nfula[NFULA_CFG_NLBUFSIZ-1]);
851
852 nfulnl_set_nlbufsiz(inst, ntohl(nlbufsiz));
853 }
854
855 if (nfula[NFULA_CFG_QTHRESH-1]) {
856 u_int32_t qthresh =
857 *(u_int16_t *)NFA_DATA(nfula[NFULA_CFG_QTHRESH-1]);
858
859 nfulnl_set_qthresh(inst, ntohl(qthresh));
860 }
861
862out_put:
863 instance_put(inst);
864 return ret;
865}
866
867static struct nfnl_callback nfulnl_cb[NFULNL_MSG_MAX] = {
868 [NFULNL_MSG_PACKET] = { .call = nfulnl_recv_unsupp,
37d2e7a2 869 .attr_count = NFULA_MAX, },
0597f268 870 [NFULNL_MSG_CONFIG] = { .call = nfulnl_recv_config,
37d2e7a2 871 .attr_count = NFULA_CFG_MAX, },
0597f268
HW
872};
873
874static struct nfnetlink_subsystem nfulnl_subsys = {
875 .name = "log",
876 .subsys_id = NFNL_SUBSYS_ULOG,
877 .cb_count = NFULNL_MSG_MAX,
0597f268
HW
878 .cb = nfulnl_cb,
879};
880
881#ifdef CONFIG_PROC_FS
/* Per-open state of the /proc seq_file iterator. */
struct iter_state {
	unsigned int bucket;	/* instance_table bucket currently walked */
};
885
886static struct hlist_node *get_first(struct seq_file *seq)
887{
888 struct iter_state *st = seq->private;
889
890 if (!st)
891 return NULL;
892
893 for (st->bucket = 0; st->bucket < INSTANCE_BUCKETS; st->bucket++) {
894 if (!hlist_empty(&instance_table[st->bucket]))
895 return instance_table[st->bucket].first;
896 }
897 return NULL;
898}
899
900static struct hlist_node *get_next(struct seq_file *seq, struct hlist_node *h)
901{
902 struct iter_state *st = seq->private;
903
904 h = h->next;
905 while (!h) {
906 if (++st->bucket >= INSTANCE_BUCKETS)
907 return NULL;
908
909 h = instance_table[st->bucket].first;
910 }
911 return h;
912}
913
914static struct hlist_node *get_idx(struct seq_file *seq, loff_t pos)
915{
916 struct hlist_node *head;
917 head = get_first(seq);
918
919 if (head)
920 while (pos && (head = get_next(seq, head)))
921 pos--;
922 return pos ? NULL : head;
923}
924
925static void *seq_start(struct seq_file *seq, loff_t *pos)
926{
927 read_lock_bh(&instances_lock);
928 return get_idx(seq, *pos);
929}
930
931static void *seq_next(struct seq_file *s, void *v, loff_t *pos)
932{
933 (*pos)++;
934 return get_next(s, v);
935}
936
937static void seq_stop(struct seq_file *s, void *v)
938{
939 read_unlock_bh(&instances_lock);
940}
941
942static int seq_show(struct seq_file *s, void *v)
943{
944 const struct nfulnl_instance *inst = v;
945
946 return seq_printf(s, "%5d %6d %5d %1d %5d %6d %2d\n",
947 inst->group_num,
948 inst->peer_pid, inst->qlen,
949 inst->copy_mode, inst->copy_range,
950 inst->flushtimeout, atomic_read(&inst->use));
951}
952
953static struct seq_operations nful_seq_ops = {
954 .start = seq_start,
955 .next = seq_next,
956 .stop = seq_stop,
957 .show = seq_show,
958};
959
960static int nful_open(struct inode *inode, struct file *file)
961{
962 struct seq_file *seq;
963 struct iter_state *is;
964 int ret;
965
10dfdc69 966 is = kzalloc(sizeof(*is), GFP_KERNEL);
0597f268
HW
967 if (!is)
968 return -ENOMEM;
0597f268
HW
969 ret = seq_open(file, &nful_seq_ops);
970 if (ret < 0)
971 goto out_free;
972 seq = file->private_data;
973 seq->private = is;
974 return ret;
975out_free:
976 kfree(is);
977 return ret;
978}
979
980static struct file_operations nful_file_ops = {
981 .owner = THIS_MODULE,
982 .open = nful_open,
983 .read = seq_read,
984 .llseek = seq_lseek,
985 .release = seq_release_private,
986};
987
988#endif /* PROC_FS */
989
990static int
991init_or_cleanup(int init)
992{
993 int i, status = -ENOMEM;
994#ifdef CONFIG_PROC_FS
995 struct proc_dir_entry *proc_nful;
996#endif
997
998 if (!init)
999 goto cleanup;
1000
1001 for (i = 0; i < INSTANCE_BUCKETS; i++)
1002 INIT_HLIST_HEAD(&instance_table[i]);
1003
1004 /* it's not really all that important to have a random value, so
1005 * we can do this from the init function, even if there hasn't
1006 * been that much entropy yet */
1007 get_random_bytes(&hash_init, sizeof(hash_init));
1008
1009 netlink_register_notifier(&nfulnl_rtnl_notifier);
1010 status = nfnetlink_subsys_register(&nfulnl_subsys);
1011 if (status < 0) {
1012 printk(KERN_ERR "log: failed to create netlink socket\n");
1013 goto cleanup_netlink_notifier;
1014 }
1015
1016#ifdef CONFIG_PROC_FS
1017 proc_nful = create_proc_entry("nfnetlink_log", 0440,
1018 proc_net_netfilter);
1019 if (!proc_nful)
1020 goto cleanup_subsys;
1021 proc_nful->proc_fops = &nful_file_ops;
1022#endif
1023
1024 return status;
1025
1026cleanup:
1027 nf_log_unregister_logger(&nfulnl_logger);
1028#ifdef CONFIG_PROC_FS
1029 remove_proc_entry("nfnetlink_log", proc_net_netfilter);
1030cleanup_subsys:
1031#endif
1032 nfnetlink_subsys_unregister(&nfulnl_subsys);
1033cleanup_netlink_notifier:
1034 netlink_unregister_notifier(&nfulnl_rtnl_notifier);
1035 return status;
1036}
1037
1038static int __init init(void)
1039{
1040
1041 return init_or_cleanup(1);
1042}
1043
1044static void __exit fini(void)
1045{
1046 init_or_cleanup(0);
1047}
1048
1049MODULE_DESCRIPTION("netfilter userspace logging");
1050MODULE_AUTHOR("Harald Welte <laforge@netfilter.org>");
1051MODULE_LICENSE("GPL");
f682faef 1052MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_ULOG);
0597f268
HW
1053
1054module_init(init);
1055module_exit(fini);