1 /* Connection tracking via netlink socket. Allows for user space
2 * protocol helpers and general trouble making from userspace.
4 * (C) 2001 by Jay Schulist <jschlst@samba.org>
5 * (C) 2002-2006 by Harald Welte <laforge@gnumonks.org>
6 * (C) 2003 by Patrick Mchardy <kaber@trash.net>
7 * (C) 2005-2006 by Pablo Neira Ayuso <pablo@eurodev.net>
9 * Initial connection tracking via netlink development funded and
10 * generally made possible by Network Robots, Inc. (www.networkrobots.com)
12 * Further development of this code funded by Astaro AG (http://www.astaro.com)
14 * This software may be used and distributed according to the terms
15 * of the GNU General Public License, incorporated herein by reference.
18 #include <linux/init.h>
19 #include <linux/module.h>
20 #include <linux/kernel.h>
21 #include <linux/types.h>
22 #include <linux/timer.h>
23 #include <linux/skbuff.h>
24 #include <linux/errno.h>
25 #include <linux/netlink.h>
26 #include <linux/spinlock.h>
27 #include <linux/interrupt.h>
28 #include <linux/notifier.h>
30 #include <linux/netfilter.h>
31 #include <net/netlink.h>
32 #include <net/netfilter/nf_conntrack.h>
33 #include <net/netfilter/nf_conntrack_core.h>
34 #include <net/netfilter/nf_conntrack_expect.h>
35 #include <net/netfilter/nf_conntrack_helper.h>
36 #include <net/netfilter/nf_conntrack_l3proto.h>
37 #include <net/netfilter/nf_conntrack_l4proto.h>
38 #include <net/netfilter/nf_conntrack_tuple.h>
39 #ifdef CONFIG_NF_NAT_NEEDED
40 #include <net/netfilter/nf_nat_core.h>
41 #include <net/netfilter/nf_nat_protocol.h>
44 #include <linux/netfilter/nfnetlink.h>
45 #include <linux/netfilter/nfnetlink_conntrack.h>
47 MODULE_LICENSE("GPL");
49 static char __initdata version[] = "0.93";
/* Emit the CTA_TUPLE_PROTO nest for `tuple` into `skb`: the layer-4 protocol
 * number first, then whatever the l4proto's optional tuple_to_nfattr hook
 * adds.  The hook's result is kept in ret. */
52 ctnetlink_dump_tuples_proto(struct sk_buff *skb,
53 const struct nf_conntrack_tuple *tuple,
54 struct nf_conntrack_l4proto *l4proto)
57 struct nfattr *nest_parms = NFA_NEST(skb, CTA_TUPLE_PROTO);
/* The protocol number is a u_int8_t payload read from tuple->dst. */
59 NFA_PUT(skb, CTA_PROTO_NUM, sizeof(u_int8_t), &tuple->dst.protonum);
61 if (likely(l4proto->tuple_to_nfattr))
62 ret = l4proto->tuple_to_nfattr(skb, tuple);
64 NFA_NEST_END(skb, nest_parms);
/* Emit the CTA_TUPLE_IP nest for `tuple` into `skb`.  The attributes inside
 * the nest come from the l3proto's optional tuple_to_nfattr hook, whose
 * result is stored in ret. */
73 ctnetlink_dump_tuples_ip(struct sk_buff *skb,
74 const struct nf_conntrack_tuple *tuple,
75 struct nf_conntrack_l3proto *l3proto)
78 struct nfattr *nest_parms = NFA_NEST(skb, CTA_TUPLE_IP);
80 if (likely(l3proto->tuple_to_nfattr))
81 ret = l3proto->tuple_to_nfattr(skb, tuple);
83 NFA_NEST_END(skb, nest_parms);
/* Dump both halves of `tuple` into `skb`: the layer-3 nest (handler chosen by
 * tuple->src.l3num) and then the layer-4 nest (handler chosen by l3num plus
 * tuple->dst.protonum).  Each handler is obtained with a *_find_get() call
 * and released with the matching *_put() immediately after it has been used.
 * The layer-3 result is tested for < 0 before layer 4 is attempted. */
92 ctnetlink_dump_tuples(struct sk_buff *skb,
93 const struct nf_conntrack_tuple *tuple)
96 struct nf_conntrack_l3proto *l3proto;
97 struct nf_conntrack_l4proto *l4proto;
99 l3proto = nf_ct_l3proto_find_get(tuple->src.l3num);
100 ret = ctnetlink_dump_tuples_ip(skb, tuple, l3proto);
101 nf_ct_l3proto_put(l3proto);
103 if (unlikely(ret < 0))
106 l4proto = nf_ct_l4proto_find_get(tuple->src.l3num, tuple->dst.protonum);
107 ret = ctnetlink_dump_tuples_proto(skb, tuple, l4proto);
108 nf_ct_l4proto_put(l4proto);
/* Add ct->status to `skb` as a CTA_STATUS attribute, truncated to 32 bits
 * and converted to network byte order. */
114 ctnetlink_dump_status(struct sk_buff *skb, const struct nf_conn *ct)
116 __be32 status = htonl((u_int32_t) ct->status);
117 NFA_PUT(skb, CTA_STATUS, sizeof(status), &status);
/* Add the time remaining on the conntrack timer to `skb` as CTA_TIMEOUT. */
125 ctnetlink_dump_timeout(struct sk_buff *skb, const struct nf_conn *ct)
/* Remaining lifetime in jiffies; the type is signed, so an already-expired
 * timer yields a negative value. */
127 long timeout_l = ct->timeout.expires - jiffies;
/* Jiffies divided by HZ, i.e. seconds, stored big-endian. */
133 timeout = htonl(timeout_l / HZ);
135 NFA_PUT(skb, CTA_TIMEOUT, sizeof(timeout), &timeout);
/* Emit the CTA_PROTOINFO nest for `ct`, filled in by the layer-4 protocol's
 * to_nfattr hook.  The l4proto is looked up from the original-direction
 * tuple, and every visible path drops that reference again with
 * nf_ct_l4proto_put(). */
143 ctnetlink_dump_protoinfo(struct sk_buff *skb, const struct nf_conn *ct)
145 struct nf_conntrack_l4proto *l4proto = nf_ct_l4proto_find_get(ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple.src.l3num, ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple.dst.protonum);
146 struct nfattr *nest_proto;
/* No to_nfattr hook: the handler reference is released without opening a nest. */
149 if (!l4proto->to_nfattr) {
150 nf_ct_l4proto_put(l4proto);
154 nest_proto = NFA_NEST(skb, CTA_PROTOINFO);
156 ret = l4proto->to_nfattr(skb, nest_proto, ct);
158 nf_ct_l4proto_put(l4proto);
160 NFA_NEST_END(skb, nest_proto);
165 nf_ct_l4proto_put(l4proto);
/* Emit the CTA_HELP nest for `ct`: the helper's name plus anything the
 * helper's optional to_nfattr hook adds.  The function first checks that the
 * conntrack has a help extension with a helper assigned. */
170 ctnetlink_dump_helpinfo(struct sk_buff *skb, const struct nf_conn *ct)
172 struct nfattr *nest_helper;
173 const struct nf_conn_help *help = nfct_help(ct);
175 if (!help || !help->helper)
178 nest_helper = NFA_NEST(skb, CTA_HELP);
/* NOTE(review): the length is strlen(name), so the attribute payload does not
 * include the terminating NUL -- confirm that receivers expect this. */
179 NFA_PUT(skb, CTA_HELP_NAME, strlen(help->helper->name), help->helper->name);
/* The hook's return value is not examined here. */
181 if (help->helper->to_nfattr)
182 help->helper->to_nfattr(skb, ct);
184 NFA_NEST_END(skb, nest_helper);
/* Per-direction accounting dump, guarded by CONFIG_NF_CT_ACCT.  The #define
 * at the end of this block makes the call evaluate to a constant 0. */
192 #ifdef CONFIG_NF_CT_ACCT
194 ctnetlink_dump_counters(struct sk_buff *skb, const struct nf_conn *ct,
195 enum ip_conntrack_dir dir)
/* A non-zero dir selects the reply-direction nest, zero the original one. */
197 enum ctattr_type type = dir ? CTA_COUNTERS_REPLY: CTA_COUNTERS_ORIG;
198 struct nfattr *nest_count = NFA_NEST(skb, type);
/* Packet and byte counts are each sent as a u_int32_t passed through htonl(). */
201 tmp = htonl(ct->counters[dir].packets);
202 NFA_PUT(skb, CTA_COUNTERS32_PACKETS, sizeof(u_int32_t), &tmp);
204 tmp = htonl(ct->counters[dir].bytes);
205 NFA_PUT(skb, CTA_COUNTERS32_BYTES, sizeof(u_int32_t), &tmp);
207 NFA_NEST_END(skb, nest_count);
215 #define ctnetlink_dump_counters(a, b, c) (0)
/* Connection-mark dump, guarded by CONFIG_NF_CONNTRACK_MARK.  The #define at
 * the end of this block makes the call evaluate to a constant 0. */
218 #ifdef CONFIG_NF_CONNTRACK_MARK
220 ctnetlink_dump_mark(struct sk_buff *skb, const struct nf_conn *ct)
/* ct->mark is sent as a 32-bit big-endian CTA_MARK attribute. */
222 __be32 mark = htonl(ct->mark);
224 NFA_PUT(skb, CTA_MARK, sizeof(u_int32_t), &mark);
231 #define ctnetlink_dump_mark(a, b) (0)
/* Add ct->id to `skb` as a 32-bit big-endian CTA_ID attribute. */
235 ctnetlink_dump_id(struct sk_buff *skb, const struct nf_conn *ct)
237 __be32 id = htonl(ct->id);
238 NFA_PUT(skb, CTA_ID, sizeof(u_int32_t), &id);
/* Add the current value of the conntrack's use counter (ct_general.use, read
 * with atomic_read) to `skb` as a 32-bit big-endian CTA_USE attribute. */
246 ctnetlink_dump_use(struct sk_buff *skb, const struct nf_conn *ct)
248 __be32 use = htonl(atomic_read(&ct->ct_general.use));
250 NFA_PUT(skb, CTA_USE, sizeof(u_int32_t), &use);
/* Shorthand for the address of ct's tuple in direction `dir`.  Only `ct` is
 * parenthesised in the expansion; `dir` is used as an array index. */
257 #define tuple(ct, dir) (&(ct)->tuplehash[dir].tuple)
/* Build one conntrack netlink message for `ct` at the tail of `skb`:
 * nlmsghdr + nfgenmsg, the original and reply tuple nests, then the status,
 * timeout, counters (both directions), protoinfo, helper, mark, id and use
 * attributes.  Every dump helper's result is tested for < 0.  On the visible
 * success path nlmsg_len is set to the number of bytes appended since `b`
 * was sampled on entry. */
260 ctnetlink_fill_info(struct sk_buff *skb, u32 pid, u32 seq,
261 int event, int nowait,
262 const struct nf_conn *ct)
264 struct nlmsghdr *nlh;
265 struct nfgenmsg *nfmsg;
266 struct nfattr *nest_parms;
267 unsigned char *b = skb_tail_pointer(skb);
/* The subsystem id is OR-ed into the message type, shifted left by 8 bits. */
269 event |= NFNL_SUBSYS_CTNETLINK << 8;
270 nlh = NLMSG_PUT(skb, pid, seq, event, sizeof(struct nfgenmsg));
271 nfmsg = NLMSG_DATA(nlh);
/* NLM_F_MULTI is set only when both nowait and pid are non-zero. */
273 nlh->nlmsg_flags = (nowait && pid) ? NLM_F_MULTI : 0;
274 nfmsg->nfgen_family =
275 ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple.src.l3num;
276 nfmsg->version = NFNETLINK_V0;
279 nest_parms = NFA_NEST(skb, CTA_TUPLE_ORIG);
280 if (ctnetlink_dump_tuples(skb, tuple(ct, IP_CT_DIR_ORIGINAL)) < 0)
282 NFA_NEST_END(skb, nest_parms);
284 nest_parms = NFA_NEST(skb, CTA_TUPLE_REPLY);
285 if (ctnetlink_dump_tuples(skb, tuple(ct, IP_CT_DIR_REPLY)) < 0)
287 NFA_NEST_END(skb, nest_parms);
289 if (ctnetlink_dump_status(skb, ct) < 0 ||
290 ctnetlink_dump_timeout(skb, ct) < 0 ||
291 ctnetlink_dump_counters(skb, ct, IP_CT_DIR_ORIGINAL) < 0 ||
292 ctnetlink_dump_counters(skb, ct, IP_CT_DIR_REPLY) < 0 ||
293 ctnetlink_dump_protoinfo(skb, ct) < 0 ||
294 ctnetlink_dump_helpinfo(skb, ct) < 0 ||
295 ctnetlink_dump_mark(skb, ct) < 0 ||
296 ctnetlink_dump_id(skb, ct) < 0 ||
297 ctnetlink_dump_use(skb, ct) < 0)
300 nlh->nlmsg_len = skb_tail_pointer(skb) - b;
/* Conntrack event notifier (CONFIG_NF_CONNTRACK_EVENTS only): converts the
 * event bits for the conntrack passed in `ptr` into an nfnetlink message and
 * sends it to one multicast group.
 *
 * Event bits map to message type / flags / group as follows:
 *   IPCT_DESTROY                 -> IPCTNL_MSG_CT_DELETE, NFNLGRP_CONNTRACK_DESTROY
 *   IPCT_NEW | IPCT_RELATED      -> IPCTNL_MSG_CT_NEW with NLM_F_CREATE|NLM_F_EXCL,
 *                                   NFNLGRP_CONNTRACK_NEW
 *   IPCT_STATUS | IPCT_PROTOINFO -> IPCTNL_MSG_CT_NEW, NFNLGRP_CONNTRACK_UPDATE
 *
 * nfnetlink_has_listeners(group) is consulted before the skb is allocated
 * (GFP_ATOMIC).  Both tuple nests are always written; which of the remaining
 * attributes are written depends on the event bits tested further down.
 *
 * NOTE(review): nlmsg_len is computed from skb->tail here, while
 * ctnetlink_fill_info uses skb_tail_pointer(); the declaration of `b` is not
 * visible in this listing -- confirm the two operand types agree. */
309 #ifdef CONFIG_NF_CONNTRACK_EVENTS
310 static int ctnetlink_conntrack_event(struct notifier_block *this,
311 unsigned long events, void *ptr)
313 struct nlmsghdr *nlh;
314 struct nfgenmsg *nfmsg;
315 struct nfattr *nest_parms;
316 struct nf_conn *ct = (struct nf_conn *)ptr;
320 unsigned int flags = 0, group;
322 /* ignore our fake conntrack entry */
323 if (ct == &nf_conntrack_untracked)
326 if (events & IPCT_DESTROY) {
327 type = IPCTNL_MSG_CT_DELETE;
328 group = NFNLGRP_CONNTRACK_DESTROY;
329 } else if (events & (IPCT_NEW | IPCT_RELATED)) {
330 type = IPCTNL_MSG_CT_NEW;
331 flags = NLM_F_CREATE|NLM_F_EXCL;
332 group = NFNLGRP_CONNTRACK_NEW;
333 } else if (events & (IPCT_STATUS | IPCT_PROTOINFO)) {
334 type = IPCTNL_MSG_CT_NEW;
335 group = NFNLGRP_CONNTRACK_UPDATE;
339 if (!nfnetlink_has_listeners(group))
342 skb = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
348 type |= NFNL_SUBSYS_CTNETLINK << 8;
349 nlh = NLMSG_PUT(skb, 0, 0, type, sizeof(struct nfgenmsg));
350 nfmsg = NLMSG_DATA(nlh);
352 nlh->nlmsg_flags = flags;
353 nfmsg->nfgen_family = ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple.src.l3num;
354 nfmsg->version = NFNETLINK_V0;
357 nest_parms = NFA_NEST(skb, CTA_TUPLE_ORIG);
358 if (ctnetlink_dump_tuples(skb, tuple(ct, IP_CT_DIR_ORIGINAL)) < 0)
360 NFA_NEST_END(skb, nest_parms);
362 nest_parms = NFA_NEST(skb, CTA_TUPLE_REPLY);
363 if (ctnetlink_dump_tuples(skb, tuple(ct, IP_CT_DIR_REPLY)) < 0)
365 NFA_NEST_END(skb, nest_parms);
/* Destroy events carry the counters for both directions. */
367 if (events & IPCT_DESTROY) {
368 if (ctnetlink_dump_counters(skb, ct, IP_CT_DIR_ORIGINAL) < 0 ||
369 ctnetlink_dump_counters(skb, ct, IP_CT_DIR_REPLY) < 0)
372 if (ctnetlink_dump_status(skb, ct) < 0)
375 if (ctnetlink_dump_timeout(skb, ct) < 0)
378 if (events & IPCT_PROTOINFO
379 && ctnetlink_dump_protoinfo(skb, ct) < 0)
382 if ((events & IPCT_HELPER || nfct_help(ct))
383 && ctnetlink_dump_helpinfo(skb, ct) < 0)
386 #ifdef CONFIG_NF_CONNTRACK_MARK
387 if ((events & IPCT_MARK || ct->mark)
388 && ctnetlink_dump_mark(skb, ct) < 0)
392 if (events & IPCT_COUNTER_FILLING &&
393 (ctnetlink_dump_counters(skb, ct, IP_CT_DIR_ORIGINAL) < 0 ||
394 ctnetlink_dump_counters(skb, ct, IP_CT_DIR_REPLY) < 0))
398 nlh->nlmsg_len = skb->tail - b;
399 nfnetlink_send(skb, 0, group, 0);
407 #endif /* CONFIG_NF_CONNTRACK_EVENTS */
/* Dump-completion callback: drops the conntrack reference whose pointer
 * ctnetlink_dump_table() saved in cb->args[1]. */
409 static int ctnetlink_done(struct netlink_callback *cb)
412 nf_ct_put((struct nf_conn *)cb->args[1]);
/* Layer-3 protocol number of ct's original-direction tuple.  The argument is
 * not parenthesised in the expansion, so pass a plain identifier. */
416 #define L3PROTO(ct) ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple.src.l3num
/* Netlink dump callback for the conntrack table.  The walk runs under
 * read_lock_bh(&nf_conntrack_lock) and uses two pieces of per-dump state:
 *   cb->args[0] - index of the hash bucket being visited (advanced by the loop)
 *   cb->args[1] - pointer to a conntrack on which a reference was taken with
 *                 nf_conntrack_get(); read back into `last` on entry
 * Only original-direction hash entries are considered, and entries are
 * filtered by the family given in the request's nfgenmsg (0 means all).
 * With CONFIG_NF_CT_ACCT, an IPCTNL_MSG_CT_GET_CTRZERO request also zeroes
 * the entry's counters. */
419 ctnetlink_dump_table(struct sk_buff *skb, struct netlink_callback *cb)
421 struct nf_conn *ct, *last;
422 struct nf_conntrack_tuple_hash *h;
424 struct nfgenmsg *nfmsg = NLMSG_DATA(cb->nlh);
425 u_int8_t l3proto = nfmsg->nfgen_family;
427 read_lock_bh(&nf_conntrack_lock);
428 last = (struct nf_conn *)cb->args[1];
429 for (; cb->args[0] < nf_conntrack_htable_size; cb->args[0]++) {
/* Each bucket's list is traversed from tail to head. */
431 list_for_each_prev(i, &nf_conntrack_hash[cb->args[0]]) {
432 h = (struct nf_conntrack_tuple_hash *) i;
433 if (NF_CT_DIRECTION(h) != IP_CT_DIR_ORIGINAL)
435 ct = nf_ct_tuplehash_to_ctrack(h);
436 /* Dump entries of a given L3 protocol number.
437 * If it is not specified, ie. l3proto == 0,
438 * then dump everything. */
439 if (l3proto && L3PROTO(ct) != l3proto)
446 if (ctnetlink_fill_info(skb, NETLINK_CB(cb->skb).pid,
450 nf_conntrack_get(&ct->ct_general);
451 cb->args[1] = (unsigned long)ct;
454 #ifdef CONFIG_NF_CT_ACCT
455 if (NFNL_MSG_TYPE(cb->nlh->nlmsg_type) ==
456 IPCTNL_MSG_CT_GET_CTRZERO)
457 memset(&ct->counters, 0, sizeof(ct->counters));
466 read_unlock_bh(&nf_conntrack_lock);
/* Parse the nested CTA_TUPLE_IP attribute `attr` into `tuple`.  The nested
 * attributes are unpacked into tb[] and handed to the nfattr_to_tuple hook of
 * the l3proto selected by tuple->src.l3num, so the caller must have set
 * l3num beforehand.  The l3proto reference is released before returning. */
474 ctnetlink_parse_tuple_ip(struct nfattr *attr, struct nf_conntrack_tuple *tuple)
476 struct nfattr *tb[CTA_IP_MAX];
477 struct nf_conntrack_l3proto *l3proto;
480 nfattr_parse_nested(tb, CTA_IP_MAX, attr);
482 l3proto = nf_ct_l3proto_find_get(tuple->src.l3num);
484 if (likely(l3proto->nfattr_to_tuple))
485 ret = l3proto->nfattr_to_tuple(tb, tuple);
487 nf_ct_l3proto_put(l3proto);
/* Minimum payload sizes for CTA_PROTO_* attributes, indexed by attribute
 * type minus one; passed to nfattr_bad_size(). */
492 static const size_t cta_min_proto[CTA_PROTO_MAX] = {
493 [CTA_PROTO_NUM-1] = sizeof(u_int8_t),
/* Parse the nested CTA_TUPLE_PROTO attribute `attr` into `tuple`.  After a
 * size check against cta_min_proto and a presence check on CTA_PROTO_NUM,
 * the protocol number is copied into tuple->dst.protonum and the remaining
 * attributes are passed to the matching l4proto's optional nfattr_to_tuple
 * hook.  The l4proto reference is released before returning. */
497 ctnetlink_parse_tuple_proto(struct nfattr *attr,
498 struct nf_conntrack_tuple *tuple)
500 struct nfattr *tb[CTA_PROTO_MAX];
501 struct nf_conntrack_l4proto *l4proto;
504 nfattr_parse_nested(tb, CTA_PROTO_MAX, attr);
506 if (nfattr_bad_size(tb, CTA_PROTO_MAX, cta_min_proto))
509 if (!tb[CTA_PROTO_NUM-1])
511 tuple->dst.protonum = *(u_int8_t *)NFA_DATA(tb[CTA_PROTO_NUM-1]);
513 l4proto = nf_ct_l4proto_find_get(tuple->src.l3num, tuple->dst.protonum);
515 if (likely(l4proto->nfattr_to_tuple))
516 ret = l4proto->nfattr_to_tuple(tb, tuple);
518 nf_ct_l4proto_put(l4proto);
/* Fill `tuple` from the nested tuple attribute cda[type-1].
 * The tuple is zeroed first; l3num comes from the caller; the CTA_TUPLE_IP
 * and CTA_TUPLE_PROTO sub-attributes are both checked for presence and then
 * parsed in that order.  Finally the direction is set from `type`. */
524 ctnetlink_parse_tuple(struct nfattr *cda[], struct nf_conntrack_tuple *tuple,
525 enum ctattr_tuple type, u_int8_t l3num)
527 struct nfattr *tb[CTA_TUPLE_MAX];
530 memset(tuple, 0, sizeof(*tuple));
532 nfattr_parse_nested(tb, CTA_TUPLE_MAX, cda[type-1]);
534 if (!tb[CTA_TUPLE_IP-1])
/* l3num must be in place before the IP part is parsed: the l3proto lookup
 * in ctnetlink_parse_tuple_ip() reads it. */
537 tuple->src.l3num = l3num;
539 err = ctnetlink_parse_tuple_ip(tb[CTA_TUPLE_IP-1], tuple);
543 if (!tb[CTA_TUPLE_PROTO-1])
546 err = ctnetlink_parse_tuple_proto(tb[CTA_TUPLE_PROTO-1], tuple);
550 /* orig and expect tuples get DIR_ORIGINAL */
551 if (type == CTA_TUPLE_REPLY)
552 tuple->dst.dir = IP_CT_DIR_REPLY;
554 tuple->dst.dir = IP_CT_DIR_ORIGINAL;
/* NAT parsing support, guarded by CONFIG_NF_NAT_NEEDED.  This table gives the
 * minimum payload sizes for CTA_PROTONAT_* attributes (indexed by type minus
 * one): both port bounds are 16-bit. */
559 #ifdef CONFIG_NF_NAT_NEEDED
560 static const size_t cta_min_protonat[CTA_PROTONAT_MAX] = {
561 [CTA_PROTONAT_PORT_MIN-1] = sizeof(u_int16_t),
562 [CTA_PROTONAT_PORT_MAX-1] = sizeof(u_int16_t),
/* Parse the protocol-specific part of a NAT request (`attr`) into `range`.
 * The NAT protocol handler is chosen by the protocol number of ct's
 * original-direction tuple and is released again on every visible path. */
565 static int nfnetlink_parse_nat_proto(struct nfattr *attr,
566 const struct nf_conn *ct,
567 struct nf_nat_range *range)
569 struct nfattr *tb[CTA_PROTONAT_MAX];
570 struct nf_nat_protocol *npt;
572 nfattr_parse_nested(tb, CTA_PROTONAT_MAX, attr);
574 if (nfattr_bad_size(tb, CTA_PROTONAT_MAX, cta_min_protonat))
577 npt = nf_nat_proto_find_get(ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple.dst.protonum);
/* Handlers without an nfattr_to_range hook cannot parse anything. */
579 if (!npt->nfattr_to_range) {
580 nf_nat_proto_put(npt);
584 /* nfattr_to_range returns 1 if it parsed, 0 if not, neg. on error */
585 if (npt->nfattr_to_range(tb, range) > 0)
586 range->flags |= IP_NAT_RANGE_PROTO_SPECIFIED;
588 nf_nat_proto_put(npt);
/* Minimum payload sizes for CTA_NAT_* attributes (indexed by type minus one):
 * both address bounds are 32-bit. */
593 static const size_t cta_min_nat[CTA_NAT_MAX] = {
594 [CTA_NAT_MINIP-1] = sizeof(u_int32_t),
595 [CTA_NAT_MAXIP-1] = sizeof(u_int32_t),
/* Convert the nested NAT attribute `nat` into `range`.
 * `range` is zeroed first.  Addresses are copied as-is (__be32, no byte
 * swapping).  When CTA_NAT_MAXIP is absent the range collapses to a single
 * address (max_ip = min_ip).  IP_NAT_RANGE_MAP_IPS is OR-ed into the flags,
 * and the optional CTA_NAT_PROTO part is delegated to
 * nfnetlink_parse_nat_proto(). */
599 nfnetlink_parse_nat(struct nfattr *nat,
600 const struct nf_conn *ct, struct nf_nat_range *range)
602 struct nfattr *tb[CTA_NAT_MAX];
605 memset(range, 0, sizeof(*range));
607 nfattr_parse_nested(tb, CTA_NAT_MAX, nat);
609 if (nfattr_bad_size(tb, CTA_NAT_MAX, cta_min_nat))
612 if (tb[CTA_NAT_MINIP-1])
613 range->min_ip = *(__be32 *)NFA_DATA(tb[CTA_NAT_MINIP-1]);
615 if (!tb[CTA_NAT_MAXIP-1])
616 range->max_ip = range->min_ip;
618 range->max_ip = *(__be32 *)NFA_DATA(tb[CTA_NAT_MAXIP-1]);
621 range->flags |= IP_NAT_RANGE_MAP_IPS;
623 if (!tb[CTA_NAT_PROTO-1])
626 err = nfnetlink_parse_nat_proto(tb[CTA_NAT_PROTO-1], ct, range);
/* Extract the helper name from the nested CTA_HELP attribute `attr`.
 * *helper_name is set to point directly at the CTA_HELP_NAME payload inside
 * the message; nothing is copied.
 * NOTE(review): no length or NUL-termination check is visible here -- confirm
 * callers can rely on the string being terminated. */
635 ctnetlink_parse_help(struct nfattr *attr, char **helper_name)
637 struct nfattr *tb[CTA_HELP_MAX];
639 nfattr_parse_nested(tb, CTA_HELP_MAX, attr);
641 if (!tb[CTA_HELP_NAME-1])
644 *helper_name = NFA_DATA(tb[CTA_HELP_NAME-1]);
/* Minimum payload sizes for top-level CTA_* attributes (indexed by type minus
 * one).  Each listed attribute must carry at least a 32-bit value; attributes
 * not listed default to a minimum of 0. */
649 static const size_t cta_min[CTA_MAX] = {
650 [CTA_STATUS-1] = sizeof(u_int32_t),
651 [CTA_TIMEOUT-1] = sizeof(u_int32_t),
652 [CTA_MARK-1] = sizeof(u_int32_t),
653 [CTA_USE-1] = sizeof(u_int32_t),
654 [CTA_ID-1] = sizeof(u_int32_t)
/* Handler for IPCTNL_MSG_CT_DELETE.
 * The entry to delete is identified by the original tuple if present,
 * otherwise by the reply tuple; when neither is supplied the whole table is
 * flushed.  The entry is looked up with nf_conntrack_find_get() and the
 * CTA_ID payload is read for comparison.  The deletion itself is done by
 * stopping the timer and, if it was still pending, invoking the timer's own
 * handler directly. */
658 ctnetlink_del_conntrack(struct sock *ctnl, struct sk_buff *skb,
659 struct nlmsghdr *nlh, struct nfattr *cda[])
661 struct nf_conntrack_tuple_hash *h;
662 struct nf_conntrack_tuple tuple;
664 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
665 u_int8_t u3 = nfmsg->nfgen_family;
668 if (nfattr_bad_size(cda, CTA_MAX, cta_min))
671 if (cda[CTA_TUPLE_ORIG-1])
672 err = ctnetlink_parse_tuple(cda, &tuple, CTA_TUPLE_ORIG, u3);
673 else if (cda[CTA_TUPLE_REPLY-1])
674 err = ctnetlink_parse_tuple(cda, &tuple, CTA_TUPLE_REPLY, u3);
676 /* Flush the whole table */
677 nf_conntrack_flush();
684 h = nf_conntrack_find_get(&tuple, NULL);
688 ct = nf_ct_tuplehash_to_ctrack(h);
691 u_int32_t id = ntohl(*(__be32 *)NFA_DATA(cda[CTA_ID-1]));
/* del_timer() returning non-zero means the timer was pending, so its
 * handler has not run yet and is called by hand here. */
697 if (del_timer(&ct->timeout))
698 ct->timeout.function((unsigned long)ct);
/* Handler for IPCTNL_MSG_CT_GET and IPCTNL_MSG_CT_GET_CTRZERO.
 * With NLM_F_DUMP the request is handed to netlink_dump_start() with
 * ctnetlink_dump_table as the dump routine; the CTRZERO message type is
 * special-cased when CONFIG_NF_CT_ACCT is not defined.  Otherwise a single
 * entry is looked up by original or reply tuple, serialised into a freshly
 * allocated skb via ctnetlink_fill_info() and unicast back to the requesting
 * pid. */
706 ctnetlink_get_conntrack(struct sock *ctnl, struct sk_buff *skb,
707 struct nlmsghdr *nlh, struct nfattr *cda[])
709 struct nf_conntrack_tuple_hash *h;
710 struct nf_conntrack_tuple tuple;
712 struct sk_buff *skb2 = NULL;
713 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
714 u_int8_t u3 = nfmsg->nfgen_family;
717 if (nlh->nlmsg_flags & NLM_F_DUMP) {
718 #ifndef CONFIG_NF_CT_ACCT
719 if (NFNL_MSG_TYPE(nlh->nlmsg_type) == IPCTNL_MSG_CT_GET_CTRZERO)
722 return netlink_dump_start(ctnl, skb, nlh, ctnetlink_dump_table,
726 if (nfattr_bad_size(cda, CTA_MAX, cta_min))
729 if (cda[CTA_TUPLE_ORIG-1])
730 err = ctnetlink_parse_tuple(cda, &tuple, CTA_TUPLE_ORIG, u3);
731 else if (cda[CTA_TUPLE_REPLY-1])
732 err = ctnetlink_parse_tuple(cda, &tuple, CTA_TUPLE_REPLY, u3);
739 h = nf_conntrack_find_get(&tuple, NULL);
743 ct = nf_ct_tuplehash_to_ctrack(h);
746 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
/* The reply reuses the request's sequence number and is typed CT_NEW. */
752 err = ctnetlink_fill_info(skb2, NETLINK_CB(skb).pid, nlh->nlmsg_seq,
753 IPCTNL_MSG_CT_NEW, 1, ct);
758 err = netlink_unicast(ctnl, skb2, NETLINK_CB(skb).pid, MSG_DONTWAIT);
/* Apply the CTA_STATUS attribute to `ct`.
 * `d` holds the bits that differ between the current and requested status.
 * The checks below test for a change to EXPECTED, CONFIRMED or DYING, and
 * for an attempt to clear SEEN_REPLY or ASSURED.  If NAT attributes are
 * present they are parsed and, under CONFIG_NF_NAT_NEEDED, handed to
 * nf_nat_setup_info() for the matching hook.  Finally the requested bits,
 * minus the NAT-related masks, are OR-ed into ct->status, so this function
 * never clears a status bit. */
771 ctnetlink_change_status(struct nf_conn *ct, struct nfattr *cda[])
774 unsigned int status = ntohl(*(__be32 *)NFA_DATA(cda[CTA_STATUS-1]));
775 d = ct->status ^ status;
777 if (d & (IPS_EXPECTED|IPS_CONFIRMED|IPS_DYING))
781 if (d & IPS_SEEN_REPLY && !(status & IPS_SEEN_REPLY))
782 /* SEEN_REPLY bit can only be set */
786 if (d & IPS_ASSURED && !(status & IPS_ASSURED))
787 /* ASSURED bit can only be set */
790 if (cda[CTA_NAT_SRC-1] || cda[CTA_NAT_DST-1]) {
791 #ifndef CONFIG_NF_NAT_NEEDED
794 struct nf_nat_range range;
/* Destination NAT is set up on the PRE_ROUTING hook. */
796 if (cda[CTA_NAT_DST-1]) {
797 if (nfnetlink_parse_nat(cda[CTA_NAT_DST-1], ct,
800 if (nf_nat_initialized(ct,
801 HOOK2MANIP(NF_IP_PRE_ROUTING)))
803 nf_nat_setup_info(ct, &range, NF_IP_PRE_ROUTING);
/* Source NAT is set up on the POST_ROUTING hook. */
805 if (cda[CTA_NAT_SRC-1]) {
806 if (nfnetlink_parse_nat(cda[CTA_NAT_SRC-1], ct,
809 if (nf_nat_initialized(ct,
810 HOOK2MANIP(NF_IP_POST_ROUTING)))
812 nf_nat_setup_info(ct, &range, NF_IP_POST_ROUTING);
817 /* Be careful here, modifying NAT bits can screw up things,
818 * so don't let users modify them directly if they don't pass
820 ct->status |= status & ~(IPS_NAT_DONE_MASK | IPS_NAT_MASK);
/* Change or remove the helper of `ct` according to the CTA_HELP attribute.
 * The helper name is parsed from the attribute and looked up by name; an
 * empty name is tested for separately.  When a helper was already attached,
 * its expectations are removed and the helper-private area in `help` is
 * zeroed before the new helper pointer is stored. */
826 ctnetlink_change_helper(struct nf_conn *ct, struct nfattr *cda[])
828 struct nf_conntrack_helper *helper;
829 struct nf_conn_help *help = nfct_help(ct);
834 /* FIXME: we need to reallocate and rehash */
838 /* don't change helper of sibling connections */
842 err = ctnetlink_parse_help(cda[CTA_HELP-1], &helpname);
846 helper = __nf_conntrack_helper_find_byname(helpname);
848 if (!strcmp(helpname, ""))
856 /* we had a helper before ... */
857 nf_ct_remove_expectations(ct);
860 /* need to zero data of old helper */
861 memset(&help->help, 0, sizeof(help->help));
865 help->helper = helper;
/* Re-arm the timer of `ct` with the value from CTA_TIMEOUT.
 * The attribute is a big-endian 32-bit count that is multiplied by HZ, i.e.
 * it is expressed in seconds.  The timer is stopped with del_timer() before
 * being re-armed, and the result of del_timer() is tested. */
871 ctnetlink_change_timeout(struct nf_conn *ct, struct nfattr *cda[])
873 u_int32_t timeout = ntohl(*(__be32 *)NFA_DATA(cda[CTA_TIMEOUT-1]));
875 if (!del_timer(&ct->timeout))
878 ct->timeout.expires = jiffies + timeout * HZ;
879 add_timer(&ct->timeout);
/* Apply the nested CTA_PROTOINFO attribute to `ct` through the optional
 * from_nfattr hook of the layer-4 protocol taken from ct's original-direction
 * tuple.  The l4proto reference is released after the hook has run. */
885 ctnetlink_change_protoinfo(struct nf_conn *ct, struct nfattr *cda[])
887 struct nfattr *tb[CTA_PROTOINFO_MAX], *attr = cda[CTA_PROTOINFO-1];
888 struct nf_conntrack_l4proto *l4proto;
889 u_int16_t npt = ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple.dst.protonum;
890 u_int16_t l3num = ct->tuplehash[IP_CT_DIR_ORIGINAL].tuple.src.l3num;
893 nfattr_parse_nested(tb, CTA_PROTOINFO_MAX, attr);
895 l4proto = nf_ct_l4proto_find_get(l3num, npt);
897 if (l4proto->from_nfattr)
898 err = l4proto->from_nfattr(tb, ct);
899 nf_ct_l4proto_put(l4proto);
/* Update an existing conntrack from the attributes present in `cda`.
 * The attributes are applied in a fixed order: helper, timeout, status,
 * protoinfo, and -- with CONFIG_NF_CONNTRACK_MARK -- mark.  Each step runs
 * only if its attribute is present and stores its result in err. */
905 ctnetlink_change_conntrack(struct nf_conn *ct, struct nfattr *cda[])
909 if (cda[CTA_HELP-1]) {
910 err = ctnetlink_change_helper(ct, cda);
915 if (cda[CTA_TIMEOUT-1]) {
916 err = ctnetlink_change_timeout(ct, cda);
921 if (cda[CTA_STATUS-1]) {
922 err = ctnetlink_change_status(ct, cda);
927 if (cda[CTA_PROTOINFO-1]) {
928 err = ctnetlink_change_protoinfo(ct, cda);
933 #if defined(CONFIG_NF_CONNTRACK_MARK)
/* The mark is a big-endian 32-bit value. */
935 ct->mark = ntohl(*(__be32 *)NFA_DATA(cda[CTA_MARK-1]));
/* Create a conntrack entry from userspace-supplied attributes.
 * The entry is allocated for the (otuple, rtuple) pair.  CTA_TIMEOUT is
 * checked for presence and read as a big-endian number of seconds, then
 * converted to an absolute jiffies value.  The entry is marked IPS_CONFIRMED,
 * optional status, protoinfo and (with CONFIG_NF_CONNTRACK_MARK) mark
 * attributes are applied, a helper is looked up for the reply tuple, and the
 * entry is armed and inserted into the hash.  The helper reference obtained
 * by nf_ct_helper_find_get() is dropped again after insertion.  The
 * nf_conntrack_free() call at the end belongs to a path whose label is not
 * visible in this listing. */
942 ctnetlink_create_conntrack(struct nfattr *cda[],
943 struct nf_conntrack_tuple *otuple,
944 struct nf_conntrack_tuple *rtuple)
948 struct nf_conn_help *help;
950 ct = nf_conntrack_alloc(otuple, rtuple);
951 if (ct == NULL || IS_ERR(ct))
954 if (!cda[CTA_TIMEOUT-1])
956 ct->timeout.expires = ntohl(*(__be32 *)NFA_DATA(cda[CTA_TIMEOUT-1]));
958 ct->timeout.expires = jiffies + ct->timeout.expires * HZ;
959 ct->status |= IPS_CONFIRMED;
961 if (cda[CTA_STATUS-1]) {
962 err = ctnetlink_change_status(ct, cda);
967 if (cda[CTA_PROTOINFO-1]) {
968 err = ctnetlink_change_protoinfo(ct, cda);
973 #if defined(CONFIG_NF_CONNTRACK_MARK)
975 ct->mark = ntohl(*(__be32 *)NFA_DATA(cda[CTA_MARK-1]));
978 help = nfct_help(ct);
980 help->helper = nf_ct_helper_find_get(rtuple);
982 add_timer(&ct->timeout);
983 nf_conntrack_hash_insert(ct);
985 if (help && help->helper)
986 nf_ct_helper_put(help->helper);
991 nf_conntrack_free(ct);
/* Handler for IPCTNL_MSG_CT_NEW: create a conntrack or update an existing one.
 * Whichever of the original and reply tuples are present get parsed, then
 * the table is searched under write_lock_bh(&nf_conntrack_lock), preferring
 * the original tuple.  One path releases the lock and, if NLM_F_CREATE is
 * set, calls ctnetlink_create_conntrack().  The other path updates the entry
 * in place while still holding the lock, unless NLM_F_EXCL is set; NAT
 * attributes are tested for on that path. */
996 ctnetlink_new_conntrack(struct sock *ctnl, struct sk_buff *skb,
997 struct nlmsghdr *nlh, struct nfattr *cda[])
999 struct nf_conntrack_tuple otuple, rtuple;
1000 struct nf_conntrack_tuple_hash *h = NULL;
1001 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
1002 u_int8_t u3 = nfmsg->nfgen_family;
1005 if (nfattr_bad_size(cda, CTA_MAX, cta_min))
1008 if (cda[CTA_TUPLE_ORIG-1]) {
1009 err = ctnetlink_parse_tuple(cda, &otuple, CTA_TUPLE_ORIG, u3);
1014 if (cda[CTA_TUPLE_REPLY-1]) {
1015 err = ctnetlink_parse_tuple(cda, &rtuple, CTA_TUPLE_REPLY, u3);
1020 write_lock_bh(&nf_conntrack_lock);
1021 if (cda[CTA_TUPLE_ORIG-1])
1022 h = __nf_conntrack_find(&otuple, NULL);
1023 else if (cda[CTA_TUPLE_REPLY-1])
1024 h = __nf_conntrack_find(&rtuple, NULL);
1027 write_unlock_bh(&nf_conntrack_lock);
1029 if (nlh->nlmsg_flags & NLM_F_CREATE)
1030 err = ctnetlink_create_conntrack(cda, &otuple, &rtuple);
1033 /* implicit 'else' */
1035 /* we only allow nat config for new conntracks */
1036 if (cda[CTA_NAT_SRC-1] || cda[CTA_NAT_DST-1]) {
1041 /* We manipulate the conntrack inside the global conntrack table lock,
1042 * so there's no need to increase the refcount */
1044 if (!(nlh->nlmsg_flags & NLM_F_EXCL))
1045 err = ctnetlink_change_conntrack(nf_ct_tuplehash_to_ctrack(h), cda);
1048 write_unlock_bh(&nf_conntrack_lock);
1052 /***********************************************************************
1054 ***********************************************************************/
/* Wrap a full tuple dump of `tuple` in a nest of attribute type `type`.
 * A negative result from ctnetlink_dump_tuples() jumps to nfattr_failure. */
1057 ctnetlink_exp_dump_tuple(struct sk_buff *skb,
1058 const struct nf_conntrack_tuple *tuple,
1059 enum ctattr_expect type)
1061 struct nfattr *nest_parms = NFA_NEST(skb, type);
1063 if (ctnetlink_dump_tuples(skb, tuple) < 0)
1064 goto nfattr_failure;
1066 NFA_NEST_END(skb, nest_parms);
/* Emit the CTA_EXPECT_MASK nest.  The protocol handlers are selected from
 * `tuple` (its l3num and protonum), but the values that get dumped are taken
 * from `mask`.  Each handler reference is released right after use, and a
 * negative result from either dump jumps to nfattr_failure. */
1075 ctnetlink_exp_dump_mask(struct sk_buff *skb,
1076 const struct nf_conntrack_tuple *tuple,
1077 const struct nf_conntrack_tuple *mask)
1080 struct nf_conntrack_l3proto *l3proto;
1081 struct nf_conntrack_l4proto *l4proto;
1082 struct nfattr *nest_parms = NFA_NEST(skb, CTA_EXPECT_MASK);
1084 l3proto = nf_ct_l3proto_find_get(tuple->src.l3num);
1085 ret = ctnetlink_dump_tuples_ip(skb, mask, l3proto);
1086 nf_ct_l3proto_put(l3proto);
1088 if (unlikely(ret < 0))
1089 goto nfattr_failure;
1091 l4proto = nf_ct_l4proto_find_get(tuple->src.l3num, tuple->dst.protonum);
1092 ret = ctnetlink_dump_tuples_proto(skb, mask, l4proto);
1093 nf_ct_l4proto_put(l4proto);
1094 if (unlikely(ret < 0))
1095 goto nfattr_failure;
1097 NFA_NEST_END(skb, nest_parms);
/* Serialise one expectation into `skb`: its tuple, its mask, the
 * original-direction tuple of its master conntrack, the remaining timeout
 * and the expectation id.  Any failing sub-dump jumps to nfattr_failure. */
1106 ctnetlink_exp_dump_expect(struct sk_buff *skb,
1107 const struct nf_conntrack_expect *exp)
1109 struct nf_conn *master = exp->master;
/* Remaining time is jiffies divided by HZ (seconds), stored big-endian.
 * NOTE(review): unlike ctnetlink_dump_timeout() there is no signed
 * intermediate here -- confirm how an already-expired timer should be
 * reported. */
1110 __be32 timeout = htonl((exp->timeout.expires - jiffies) / HZ);
1111 __be32 id = htonl(exp->id);
1113 if (ctnetlink_exp_dump_tuple(skb, &exp->tuple, CTA_EXPECT_TUPLE) < 0)
1114 goto nfattr_failure;
1115 if (ctnetlink_exp_dump_mask(skb, &exp->tuple, &exp->mask) < 0)
1116 goto nfattr_failure;
1117 if (ctnetlink_exp_dump_tuple(skb,
1118 &master->tuplehash[IP_CT_DIR_ORIGINAL].tuple,
1119 CTA_EXPECT_MASTER) < 0)
1120 goto nfattr_failure;
1122 NFA_PUT(skb, CTA_EXPECT_TIMEOUT, sizeof(timeout), &timeout);
1123 NFA_PUT(skb, CTA_EXPECT_ID, sizeof(u_int32_t), &id);
/* Build one expectation netlink message for `exp` at the tail of `skb`:
 * nlmsghdr + nfgenmsg followed by the attributes written by
 * ctnetlink_exp_dump_expect().  On the visible success path nlmsg_len is set
 * to the number of bytes appended since `b` was sampled on entry. */
1132 ctnetlink_exp_fill_info(struct sk_buff *skb, u32 pid, u32 seq,
1135 const struct nf_conntrack_expect *exp)
1137 struct nlmsghdr *nlh;
1138 struct nfgenmsg *nfmsg;
1139 unsigned char *b = skb_tail_pointer(skb);
/* The expectation subsystem id is OR-ed into the type, shifted left by 8. */
1141 event |= NFNL_SUBSYS_CTNETLINK_EXP << 8;
1142 nlh = NLMSG_PUT(skb, pid, seq, event, sizeof(struct nfgenmsg));
1143 nfmsg = NLMSG_DATA(nlh);
/* NLM_F_MULTI is set only when both nowait and pid are non-zero. */
1145 nlh->nlmsg_flags = (nowait && pid) ? NLM_F_MULTI : 0;
1146 nfmsg->nfgen_family = exp->tuple.src.l3num;
1147 nfmsg->version = NFNETLINK_V0;
1150 if (ctnetlink_exp_dump_expect(skb, exp) < 0)
1151 goto nfattr_failure;
1153 nlh->nlmsg_len = skb_tail_pointer(skb) - b;
/* Expectation event notifier (CONFIG_NF_CONNTRACK_EVENTS only).
 * IPEXP_NEW events become an IPCTNL_MSG_EXP_NEW message flagged
 * NLM_F_CREATE|NLM_F_EXCL, which is sent to NFNLGRP_CONNTRACK_EXP_NEW.
 * nfnetlink_has_listeners() is consulted before the skb is allocated
 * (GFP_ATOMIC).
 * NOTE(review): nlmsg_len is computed from skb->tail here, while
 * ctnetlink_exp_fill_info uses skb_tail_pointer(); the declaration of `b` is
 * not visible in this listing -- confirm the two operand types agree. */
1162 #ifdef CONFIG_NF_CONNTRACK_EVENTS
1163 static int ctnetlink_expect_event(struct notifier_block *this,
1164 unsigned long events, void *ptr)
1166 struct nlmsghdr *nlh;
1167 struct nfgenmsg *nfmsg;
1168 struct nf_conntrack_expect *exp = (struct nf_conntrack_expect *)ptr;
1169 struct sk_buff *skb;
1174 if (events & IPEXP_NEW) {
1175 type = IPCTNL_MSG_EXP_NEW;
1176 flags = NLM_F_CREATE|NLM_F_EXCL;
1180 if (!nfnetlink_has_listeners(NFNLGRP_CONNTRACK_EXP_NEW))
1183 skb = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
1189 type |= NFNL_SUBSYS_CTNETLINK_EXP << 8;
1190 nlh = NLMSG_PUT(skb, 0, 0, type, sizeof(struct nfgenmsg));
1191 nfmsg = NLMSG_DATA(nlh);
1193 nlh->nlmsg_flags = flags;
1194 nfmsg->nfgen_family = exp->tuple.src.l3num;
1195 nfmsg->version = NFNETLINK_V0;
1198 if (ctnetlink_exp_dump_expect(skb, exp) < 0)
1199 goto nfattr_failure;
1201 nlh->nlmsg_len = skb->tail - b;
1202 nfnetlink_send(skb, 0, NFNLGRP_CONNTRACK_EXP_NEW, 0);
/* Netlink dump callback for the expectation list.  The list is walked from
 * tail to head under read_lock_bh(&nf_conntrack_lock) and filtered by the
 * family from the request's nfgenmsg (0 means all).  `id` aliases
 * cb->args[0] as a u_int32_t; how it is used as a resume cursor is on lines
 * not visible in this listing. */
1213 ctnetlink_exp_dump_table(struct sk_buff *skb, struct netlink_callback *cb)
1215 struct nf_conntrack_expect *exp = NULL;
1216 struct list_head *i;
1217 u_int32_t *id = (u_int32_t *) &cb->args[0];
1218 struct nfgenmsg *nfmsg = NLMSG_DATA(cb->nlh);
1219 u_int8_t l3proto = nfmsg->nfgen_family;
1221 read_lock_bh(&nf_conntrack_lock);
1222 list_for_each_prev(i, &nf_conntrack_expect_list) {
/* The list node is cast straight to the expectation. */
1223 exp = (struct nf_conntrack_expect *) i;
1224 if (l3proto && exp->tuple.src.l3num != l3proto)
1228 if (ctnetlink_exp_fill_info(skb, NETLINK_CB(cb->skb).pid,
1236 read_unlock_bh(&nf_conntrack_lock);
/* Minimum payload sizes for CTA_EXPECT_* attributes (indexed by type minus
 * one): timeout and id must each carry at least 32 bits. */
1241 static const size_t cta_min_exp[CTA_EXPECT_MAX] = {
1242 [CTA_EXPECT_TIMEOUT-1] = sizeof(u_int32_t),
1243 [CTA_EXPECT_ID-1] = sizeof(u_int32_t)
/* Handler for IPCTNL_MSG_EXP_GET.
 * With NLM_F_DUMP the request is handed to netlink_dump_start() with
 * ctnetlink_exp_dump_table as the dump routine.  Otherwise the tuple is
 * parsed from CTA_EXPECT_MASTER and used to look up one expectation, with an
 * optional CTA_EXPECT_ID cross-check, and the result is serialised into a
 * new skb and unicast to the requester.  The reference obtained by
 * nf_conntrack_expect_find_get() is dropped on each visible exit path. */
1247 ctnetlink_get_expect(struct sock *ctnl, struct sk_buff *skb,
1248 struct nlmsghdr *nlh, struct nfattr *cda[])
1250 struct nf_conntrack_tuple tuple;
1251 struct nf_conntrack_expect *exp;
1252 struct sk_buff *skb2;
1253 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
1254 u_int8_t u3 = nfmsg->nfgen_family;
1257 if (nfattr_bad_size(cda, CTA_EXPECT_MAX, cta_min_exp))
1260 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1261 return netlink_dump_start(ctnl, skb, nlh,
1262 ctnetlink_exp_dump_table,
1266 if (cda[CTA_EXPECT_MASTER-1])
1267 err = ctnetlink_parse_tuple(cda, &tuple, CTA_EXPECT_MASTER, u3);
1274 exp = nf_conntrack_expect_find_get(&tuple);
/* If an id was supplied it must match the expectation that was found. */
1278 if (cda[CTA_EXPECT_ID-1]) {
1279 __be32 id = *(__be32 *)NFA_DATA(cda[CTA_EXPECT_ID-1]);
1280 if (exp->id != ntohl(id)) {
1281 nf_conntrack_expect_put(exp);
1287 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1291 err = ctnetlink_exp_fill_info(skb2, NETLINK_CB(skb).pid,
1292 nlh->nlmsg_seq, IPCTNL_MSG_EXP_NEW,
1297 nf_conntrack_expect_put(exp);
1299 return netlink_unicast(ctnl, skb2, NETLINK_CB(skb).pid, MSG_DONTWAIT);
1304 nf_conntrack_expect_put(exp);
/* Handler for IPCTNL_MSG_EXP_DELETE.  Three modes, chosen by which attribute
 * is present:
 *   CTA_EXPECT_TUPLE     - delete the single expectation matching the tuple
 *                          (optionally cross-checked against CTA_EXPECT_ID)
 *   CTA_EXPECT_HELP_NAME - delete every expectation whose master conntrack
 *                          uses the named helper
 *   neither              - delete every expectation
 * The two bulk modes run under write_lock_bh(&nf_conntrack_lock) and only
 * unlink an expectation when del_timer() reports its timer was still
 * pending. */
1309 ctnetlink_del_expect(struct sock *ctnl, struct sk_buff *skb,
1310 struct nlmsghdr *nlh, struct nfattr *cda[])
1312 struct nf_conntrack_expect *exp, *tmp;
1313 struct nf_conntrack_tuple tuple;
1314 struct nf_conntrack_helper *h;
1315 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
1316 u_int8_t u3 = nfmsg->nfgen_family;
1319 if (nfattr_bad_size(cda, CTA_EXPECT_MAX, cta_min_exp))
1322 if (cda[CTA_EXPECT_TUPLE-1]) {
1323 /* delete a single expect by tuple */
1324 err = ctnetlink_parse_tuple(cda, &tuple, CTA_EXPECT_TUPLE, u3);
1328 /* bump usage count to 2 */
1329 exp = nf_conntrack_expect_find_get(&tuple);
1333 if (cda[CTA_EXPECT_ID-1]) {
1334 __be32 id = *(__be32 *)NFA_DATA(cda[CTA_EXPECT_ID-1]);
1335 if (exp->id != ntohl(id)) {
1336 nf_conntrack_expect_put(exp);
1341 /* after list removal, usage count == 1 */
1342 nf_conntrack_unexpect_related(exp);
1343 /* have to put what we 'get' above.
1344 * after this line usage count == 0 */
1345 nf_conntrack_expect_put(exp);
1346 } else if (cda[CTA_EXPECT_HELP_NAME-1]) {
/* NOTE(review): the name is used straight from the attribute payload; no
 * termination check is visible here. */
1347 char *name = NFA_DATA(cda[CTA_EXPECT_HELP_NAME-1]);
1349 /* delete all expectations for this helper */
1350 write_lock_bh(&nf_conntrack_lock);
1351 h = __nf_conntrack_helper_find_byname(name);
1353 write_unlock_bh(&nf_conntrack_lock);
1356 list_for_each_entry_safe(exp, tmp, &nf_conntrack_expect_list,
1358 struct nf_conn_help *m_help = nfct_help(exp->master);
1359 if (m_help->helper == h
1360 && del_timer(&exp->timeout)) {
1361 nf_ct_unlink_expect(exp);
1362 nf_conntrack_expect_put(exp);
1365 write_unlock_bh(&nf_conntrack_lock);
1367 /* This basically means we have to flush everything*/
1368 write_lock_bh(&nf_conntrack_lock);
1369 list_for_each_entry_safe(exp, tmp, &nf_conntrack_expect_list,
1371 if (del_timer(&exp->timeout)) {
1372 nf_ct_unlink_expect(exp);
1373 nf_conntrack_expect_put(exp);
1376 write_unlock_bh(&nf_conntrack_lock);
/* Update hook for an existing expectation `x`; called from
 * ctnetlink_new_expect() when NLM_F_EXCL is not set.  The body is not
 * visible in this listing. */
1382 ctnetlink_change_expect(struct nf_conntrack_expect *x, struct nfattr *cda[])
/* Create an expectation from CTA_EXPECT_TUPLE, CTA_EXPECT_MASK and
 * CTA_EXPECT_MASTER.  All three are parsed, the master conntrack is looked
 * up from the master tuple and is required to have a helper, then a new
 * expectation is allocated against it, given the tuple and mask, and
 * registered with nf_conntrack_expect_related().  The local expectation
 * reference and the master conntrack reference are both dropped before
 * returning. */
1388 ctnetlink_create_expect(struct nfattr *cda[], u_int8_t u3)
1390 struct nf_conntrack_tuple tuple, mask, master_tuple;
1391 struct nf_conntrack_tuple_hash *h = NULL;
1392 struct nf_conntrack_expect *exp;
1394 struct nf_conn_help *help;
1397 /* caller guarantees that those three CTA_EXPECT_* exist */
1398 err = ctnetlink_parse_tuple(cda, &tuple, CTA_EXPECT_TUPLE, u3);
1401 err = ctnetlink_parse_tuple(cda, &mask, CTA_EXPECT_MASK, u3);
1404 err = ctnetlink_parse_tuple(cda, &master_tuple, CTA_EXPECT_MASTER, u3);
1408 /* Look for master conntrack of this expectation */
1409 h = nf_conntrack_find_get(&master_tuple, NULL);
1412 ct = nf_ct_tuplehash_to_ctrack(h);
1413 help = nfct_help(ct);
1415 if (!help || !help->helper) {
1416 /* such conntrack hasn't got any helper, abort */
1421 exp = nf_conntrack_expect_alloc(ct);
/* No callback is installed for expectations created this way. */
1427 exp->expectfn = NULL;
1431 memcpy(&exp->tuple, &tuple, sizeof(struct nf_conntrack_tuple));
1432 memcpy(&exp->mask, &mask, sizeof(struct nf_conntrack_tuple));
1434 err = nf_conntrack_expect_related(exp);
1435 nf_conntrack_expect_put(exp);
1438 nf_ct_put(nf_ct_tuplehash_to_ctrack(h));
/* Handler for IPCTNL_MSG_EXP_NEW: create an expectation or update an
 * existing one.  The tuple, mask and master attributes are all tested for
 * presence.  The expectation is looked up by tuple under
 * write_lock_bh(&nf_conntrack_lock).  One path releases the lock and, if
 * NLM_F_CREATE is set, calls ctnetlink_create_expect(); the other calls
 * ctnetlink_change_expect() unless NLM_F_EXCL is set, then unlocks. */
1443 ctnetlink_new_expect(struct sock *ctnl, struct sk_buff *skb,
1444 struct nlmsghdr *nlh, struct nfattr *cda[])
1446 struct nf_conntrack_tuple tuple;
1447 struct nf_conntrack_expect *exp;
1448 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
1449 u_int8_t u3 = nfmsg->nfgen_family;
1452 if (nfattr_bad_size(cda, CTA_EXPECT_MAX, cta_min_exp))
1455 if (!cda[CTA_EXPECT_TUPLE-1]
1456 || !cda[CTA_EXPECT_MASK-1]
1457 || !cda[CTA_EXPECT_MASTER-1])
1460 err = ctnetlink_parse_tuple(cda, &tuple, CTA_EXPECT_TUPLE, u3);
1464 write_lock_bh(&nf_conntrack_lock);
1465 exp = __nf_conntrack_expect_find(&tuple);
1468 write_unlock_bh(&nf_conntrack_lock);
1470 if (nlh->nlmsg_flags & NLM_F_CREATE)
1471 err = ctnetlink_create_expect(cda, u3);
1476 if (!(nlh->nlmsg_flags & NLM_F_EXCL))
1477 err = ctnetlink_change_expect(exp, cda);
1478 write_unlock_bh(&nf_conntrack_lock);
/* Notifier block that routes conntrack events to
 * ctnetlink_conntrack_event(); registered in ctnetlink_init(). */
1483 #ifdef CONFIG_NF_CONNTRACK_EVENTS
1484 static struct notifier_block ctnl_notifier = {
1485 .notifier_call = ctnetlink_conntrack_event,
/* Notifier block that routes expectation events to
 * ctnetlink_expect_event(); registered in ctnetlink_init(). */
1488 static struct notifier_block ctnl_notifier_exp = {
1489 .notifier_call = ctnetlink_expect_event,
/* Message-type dispatch table for the conntrack subsystem.  GET and
 * GET_CTRZERO share one handler, which tells them apart by message type.
 * Every entry uses CTA_MAX as its attribute count. */
1493 static struct nfnl_callback ctnl_cb[IPCTNL_MSG_MAX] = {
1494 [IPCTNL_MSG_CT_NEW] = { .call = ctnetlink_new_conntrack,
1495 .attr_count = CTA_MAX, },
1496 [IPCTNL_MSG_CT_GET] = { .call = ctnetlink_get_conntrack,
1497 .attr_count = CTA_MAX, },
1498 [IPCTNL_MSG_CT_DELETE] = { .call = ctnetlink_del_conntrack,
1499 .attr_count = CTA_MAX, },
1500 [IPCTNL_MSG_CT_GET_CTRZERO] = { .call = ctnetlink_get_conntrack,
1501 .attr_count = CTA_MAX, },
/* Message-type dispatch table for the expectation subsystem.  Every entry
 * uses CTA_EXPECT_MAX as its attribute count. */
1504 static struct nfnl_callback ctnl_exp_cb[IPCTNL_MSG_EXP_MAX] = {
1505 [IPCTNL_MSG_EXP_GET] = { .call = ctnetlink_get_expect,
1506 .attr_count = CTA_EXPECT_MAX, },
1507 [IPCTNL_MSG_EXP_NEW] = { .call = ctnetlink_new_expect,
1508 .attr_count = CTA_EXPECT_MAX, },
1509 [IPCTNL_MSG_EXP_DELETE] = { .call = ctnetlink_del_expect,
1510 .attr_count = CTA_EXPECT_MAX, },
/* nfnetlink subsystem descriptor for conntrack messages
 * (NFNL_SUBSYS_CTNETLINK), with IPCTNL_MSG_MAX callback slots. */
1513 static struct nfnetlink_subsystem ctnl_subsys = {
1514 .name = "conntrack",
1515 .subsys_id = NFNL_SUBSYS_CTNETLINK,
1516 .cb_count = IPCTNL_MSG_MAX,
/* nfnetlink subsystem descriptor for expectation messages
 * (NFNL_SUBSYS_CTNETLINK_EXP), with IPCTNL_MSG_EXP_MAX callback slots. */
1520 static struct nfnetlink_subsystem ctnl_exp_subsys = {
1521 .name = "conntrack_expect",
1522 .subsys_id = NFNL_SUBSYS_CTNETLINK_EXP,
1523 .cb_count = IPCTNL_MSG_EXP_MAX,
1527 MODULE_ALIAS("ip_conntrack_netlink");
1528 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_CTNETLINK);
1529 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_CTNETLINK_EXP);
/* Module init.  Registration order: conntrack subsystem, expectation
 * subsystem, then (with CONFIG_NF_CONNTRACK_EVENTS) the conntrack notifier
 * and the expectation notifier.  The error path at the bottom unwinds in
 * the reverse order, each failure jumping to the label that undoes what was
 * registered before it. */
1531 static int __init ctnetlink_init(void)
1535 printk("ctnetlink v%s: registering with nfnetlink.\n", version);
1536 ret = nfnetlink_subsys_register(&ctnl_subsys);
1538 printk("ctnetlink_init: cannot register with nfnetlink.\n");
1542 ret = nfnetlink_subsys_register(&ctnl_exp_subsys);
1544 printk("ctnetlink_init: cannot register exp with nfnetlink.\n");
1545 goto err_unreg_subsys;
1548 #ifdef CONFIG_NF_CONNTRACK_EVENTS
1549 ret = nf_conntrack_register_notifier(&ctnl_notifier);
1551 printk("ctnetlink_init: cannot register notifier.\n");
1552 goto err_unreg_exp_subsys;
1555 ret = nf_conntrack_expect_register_notifier(&ctnl_notifier_exp);
1557 printk("ctnetlink_init: cannot expect register notifier.\n");
1558 goto err_unreg_notifier;
1564 #ifdef CONFIG_NF_CONNTRACK_EVENTS
1566 nf_conntrack_unregister_notifier(&ctnl_notifier);
1567 err_unreg_exp_subsys:
1568 nfnetlink_subsys_unregister(&ctnl_exp_subsys);
1571 nfnetlink_subsys_unregister(&ctnl_subsys);
/* Module exit: undoes ctnetlink_init() in reverse order -- event notifiers
 * first (when CONFIG_NF_CONNTRACK_EVENTS is set), then the expectation and
 * conntrack subsystems. */
1576 static void __exit ctnetlink_exit(void)
1578 printk("ctnetlink: unregistering from nfnetlink.\n");
1580 #ifdef CONFIG_NF_CONNTRACK_EVENTS
1581 nf_conntrack_expect_unregister_notifier(&ctnl_notifier_exp);
1582 nf_conntrack_unregister_notifier(&ctnl_notifier);
1585 nfnetlink_subsys_unregister(&ctnl_exp_subsys);
1586 nfnetlink_subsys_unregister(&ctnl_subsys);
1590 module_init(ctnetlink_init);
1591 module_exit(ctnetlink_exit);