MERGE-master-patchset-edits
[linux-2.6/openmoko-kernel.git] / net / netfilter / nf_conntrack_netlink.c
blobc32a7e8e3a1b0e18a358aa45e3624754346de436
/* Connection tracking via netlink socket. Allows for user space
 * protocol helpers and general trouble making from userspace.
 *
 * (C) 2001 by Jay Schulist <jschlst@samba.org>
 * (C) 2002-2006 by Harald Welte <laforge@gnumonks.org>
 * (C) 2003 by Patrick Mchardy <kaber@trash.net>
 * (C) 2005-2008 by Pablo Neira Ayuso <pablo@netfilter.org>
 *
 * Initial connection tracking via netlink development funded and
 * generally made possible by Network Robots, Inc. (www.networkrobots.com)
 *
 * Further development of this code funded by Astaro AG (http://www.astaro.com)
 *
 * This software may be used and distributed according to the terms
 * of the GNU General Public License, incorporated herein by reference.
 */
18 #include <linux/init.h>
19 #include <linux/module.h>
20 #include <linux/kernel.h>
21 #include <linux/rculist.h>
22 #include <linux/types.h>
23 #include <linux/timer.h>
24 #include <linux/skbuff.h>
25 #include <linux/errno.h>
26 #include <linux/netlink.h>
27 #include <linux/spinlock.h>
28 #include <linux/interrupt.h>
29 #include <linux/notifier.h>
31 #include <linux/netfilter.h>
32 #include <net/netlink.h>
33 #include <net/netfilter/nf_conntrack.h>
34 #include <net/netfilter/nf_conntrack_core.h>
35 #include <net/netfilter/nf_conntrack_expect.h>
36 #include <net/netfilter/nf_conntrack_helper.h>
37 #include <net/netfilter/nf_conntrack_l3proto.h>
38 #include <net/netfilter/nf_conntrack_l4proto.h>
39 #include <net/netfilter/nf_conntrack_tuple.h>
40 #include <net/netfilter/nf_conntrack_acct.h>
41 #ifdef CONFIG_NF_NAT_NEEDED
42 #include <net/netfilter/nf_nat_core.h>
43 #include <net/netfilter/nf_nat_protocol.h>
44 #endif
46 #include <linux/netfilter/nfnetlink.h>
47 #include <linux/netfilter/nfnetlink_conntrack.h>
49 MODULE_LICENSE("GPL");
51 static char __initdata version[] = "0.93";
53 static inline int
54 ctnetlink_dump_tuples_proto(struct sk_buff *skb,
55 const struct nf_conntrack_tuple *tuple,
56 struct nf_conntrack_l4proto *l4proto)
58 int ret = 0;
59 struct nlattr *nest_parms;
61 nest_parms = nla_nest_start(skb, CTA_TUPLE_PROTO | NLA_F_NESTED);
62 if (!nest_parms)
63 goto nla_put_failure;
64 NLA_PUT_U8(skb, CTA_PROTO_NUM, tuple->dst.protonum);
66 if (likely(l4proto->tuple_to_nlattr))
67 ret = l4proto->tuple_to_nlattr(skb, tuple);
69 nla_nest_end(skb, nest_parms);
71 return ret;
73 nla_put_failure:
74 return -1;
77 static inline int
78 ctnetlink_dump_tuples_ip(struct sk_buff *skb,
79 const struct nf_conntrack_tuple *tuple,
80 struct nf_conntrack_l3proto *l3proto)
82 int ret = 0;
83 struct nlattr *nest_parms;
85 nest_parms = nla_nest_start(skb, CTA_TUPLE_IP | NLA_F_NESTED);
86 if (!nest_parms)
87 goto nla_put_failure;
89 if (likely(l3proto->tuple_to_nlattr))
90 ret = l3proto->tuple_to_nlattr(skb, tuple);
92 nla_nest_end(skb, nest_parms);
94 return ret;
96 nla_put_failure:
97 return -1;
100 static int
101 ctnetlink_dump_tuples(struct sk_buff *skb,
102 const struct nf_conntrack_tuple *tuple)
104 int ret;
105 struct nf_conntrack_l3proto *l3proto;
106 struct nf_conntrack_l4proto *l4proto;
108 l3proto = __nf_ct_l3proto_find(tuple->src.l3num);
109 ret = ctnetlink_dump_tuples_ip(skb, tuple, l3proto);
111 if (unlikely(ret < 0))
112 return ret;
114 l4proto = __nf_ct_l4proto_find(tuple->src.l3num, tuple->dst.protonum);
115 ret = ctnetlink_dump_tuples_proto(skb, tuple, l4proto);
117 return ret;
120 static inline int
121 ctnetlink_dump_status(struct sk_buff *skb, const struct nf_conn *ct)
123 NLA_PUT_BE32(skb, CTA_STATUS, htonl(ct->status));
124 return 0;
126 nla_put_failure:
127 return -1;
130 static inline int
131 ctnetlink_dump_timeout(struct sk_buff *skb, const struct nf_conn *ct)
133 long timeout = (ct->timeout.expires - jiffies) / HZ;
135 if (timeout < 0)
136 timeout = 0;
138 NLA_PUT_BE32(skb, CTA_TIMEOUT, htonl(timeout));
139 return 0;
141 nla_put_failure:
142 return -1;
145 static inline int
146 ctnetlink_dump_protoinfo(struct sk_buff *skb, const struct nf_conn *ct)
148 struct nf_conntrack_l4proto *l4proto;
149 struct nlattr *nest_proto;
150 int ret;
152 l4proto = __nf_ct_l4proto_find(nf_ct_l3num(ct), nf_ct_protonum(ct));
153 if (!l4proto->to_nlattr)
154 return 0;
156 nest_proto = nla_nest_start(skb, CTA_PROTOINFO | NLA_F_NESTED);
157 if (!nest_proto)
158 goto nla_put_failure;
160 ret = l4proto->to_nlattr(skb, nest_proto, ct);
162 nla_nest_end(skb, nest_proto);
164 return ret;
166 nla_put_failure:
167 return -1;
170 static inline int
171 ctnetlink_dump_helpinfo(struct sk_buff *skb, const struct nf_conn *ct)
173 struct nlattr *nest_helper;
174 const struct nf_conn_help *help = nfct_help(ct);
175 struct nf_conntrack_helper *helper;
177 if (!help)
178 return 0;
180 helper = rcu_dereference(help->helper);
181 if (!helper)
182 goto out;
184 nest_helper = nla_nest_start(skb, CTA_HELP | NLA_F_NESTED);
185 if (!nest_helper)
186 goto nla_put_failure;
187 NLA_PUT_STRING(skb, CTA_HELP_NAME, helper->name);
189 if (helper->to_nlattr)
190 helper->to_nlattr(skb, ct);
192 nla_nest_end(skb, nest_helper);
193 out:
194 return 0;
196 nla_put_failure:
197 return -1;
200 static int
201 ctnetlink_dump_counters(struct sk_buff *skb, const struct nf_conn *ct,
202 enum ip_conntrack_dir dir)
204 enum ctattr_type type = dir ? CTA_COUNTERS_REPLY: CTA_COUNTERS_ORIG;
205 struct nlattr *nest_count;
206 const struct nf_conn_counter *acct;
208 acct = nf_conn_acct_find(ct);
209 if (!acct)
210 return 0;
212 nest_count = nla_nest_start(skb, type | NLA_F_NESTED);
213 if (!nest_count)
214 goto nla_put_failure;
216 NLA_PUT_BE64(skb, CTA_COUNTERS_PACKETS,
217 cpu_to_be64(acct[dir].packets));
218 NLA_PUT_BE64(skb, CTA_COUNTERS_BYTES,
219 cpu_to_be64(acct[dir].bytes));
221 nla_nest_end(skb, nest_count);
223 return 0;
225 nla_put_failure:
226 return -1;
#ifdef CONFIG_NF_CONNTRACK_MARK
/*
 * Add the mark of @ct to @skb as a big-endian 32-bit CTA_MARK attribute.
 * Returns 0 on success, -1 if the attribute could not be added.
 */
static inline int
ctnetlink_dump_mark(struct sk_buff *skb, const struct nf_conn *ct)
{
	__be32 mark = htonl(ct->mark);

	NLA_PUT_BE32(skb, CTA_MARK, mark);
	return 0;

nla_put_failure:
	return -1;
}
#else
/* no mark field is compiled in: dumping it is a successful no-op */
#define ctnetlink_dump_mark(a, b) (0)
#endif
#ifdef CONFIG_NF_CONNTRACK_SECMARK
/*
 * Add the secmark of @ct to @skb as a big-endian 32-bit CTA_SECMARK
 * attribute. Returns 0 on success, -1 if the attribute could not be added.
 */
static inline int
ctnetlink_dump_secmark(struct sk_buff *skb, const struct nf_conn *ct)
{
	__be32 secmark = htonl(ct->secmark);

	NLA_PUT_BE32(skb, CTA_SECMARK, secmark);
	return 0;

nla_put_failure:
	return -1;
}
#else
/* no secmark field is compiled in: dumping it is a successful no-op */
#define ctnetlink_dump_secmark(a, b) (0)
#endif
257 #define master_tuple(ct) &(ct->master->tuplehash[IP_CT_DIR_ORIGINAL].tuple)
259 static inline int
260 ctnetlink_dump_master(struct sk_buff *skb, const struct nf_conn *ct)
262 struct nlattr *nest_parms;
264 if (!(ct->status & IPS_EXPECTED))
265 return 0;
267 nest_parms = nla_nest_start(skb, CTA_TUPLE_MASTER | NLA_F_NESTED);
268 if (!nest_parms)
269 goto nla_put_failure;
270 if (ctnetlink_dump_tuples(skb, master_tuple(ct)) < 0)
271 goto nla_put_failure;
272 nla_nest_end(skb, nest_parms);
274 return 0;
276 nla_put_failure:
277 return -1;
#ifdef CONFIG_NF_NAT_NEEDED
/*
 * Emit one NAT sequence adjustment record (@natseq) as a nested attribute of
 * the given @type: correction position, offset before and offset after, each
 * as a big-endian 32-bit value.
 *
 * Returns 0 on success, -1 when an attribute cannot be added.
 */
static int
dump_nat_seq_adj(struct sk_buff *skb, const struct nf_nat_seq *natseq, int type)
{
	struct nlattr *nest = nla_nest_start(skb, type | NLA_F_NESTED);

	if (nest == NULL)
		goto nla_put_failure;

	NLA_PUT_BE32(skb, CTA_NAT_SEQ_CORRECTION_POS,
		     htonl(natseq->correction_pos));
	NLA_PUT_BE32(skb, CTA_NAT_SEQ_OFFSET_BEFORE,
		     htonl(natseq->offset_before));
	NLA_PUT_BE32(skb, CTA_NAT_SEQ_OFFSET_AFTER,
		     htonl(natseq->offset_after));

	nla_nest_end(skb, nest);
	return 0;

nla_put_failure:
	return -1;
}

/*
 * Dump the NAT sequence adjustments of @ct for both directions. Nothing is
 * emitted unless IPS_SEQ_ADJUST is set and @ct carries a NAT extension.
 *
 * Returns 0 on success (or when there is nothing to dump), -1 on failure.
 */
static inline int
ctnetlink_dump_nat_seq_adj(struct sk_buff *skb, const struct nf_conn *ct)
{
	struct nf_conn_nat *nat = nfct_nat(ct);

	if (nat == NULL || !(ct->status & IPS_SEQ_ADJUST))
		return 0;

	if (dump_nat_seq_adj(skb, &nat->seq[IP_CT_DIR_ORIGINAL],
			     CTA_NAT_SEQ_ADJ_ORIG) == -1)
		return -1;

	if (dump_nat_seq_adj(skb, &nat->seq[IP_CT_DIR_REPLY],
			     CTA_NAT_SEQ_ADJ_REPLY) == -1)
		return -1;

	return 0;
}
#else
/* no NAT support compiled in: dumping is a successful no-op */
#define ctnetlink_dump_nat_seq_adj(a, b) (0)
#endif
328 static inline int
329 ctnetlink_dump_id(struct sk_buff *skb, const struct nf_conn *ct)
331 NLA_PUT_BE32(skb, CTA_ID, htonl((unsigned long)ct));
332 return 0;
334 nla_put_failure:
335 return -1;
338 static inline int
339 ctnetlink_dump_use(struct sk_buff *skb, const struct nf_conn *ct)
341 NLA_PUT_BE32(skb, CTA_USE, htonl(atomic_read(&ct->ct_general.use)));
342 return 0;
344 nla_put_failure:
345 return -1;
348 #define tuple(ct, dir) (&(ct)->tuplehash[dir].tuple)
350 static int
351 ctnetlink_fill_info(struct sk_buff *skb, u32 pid, u32 seq,
352 int event, int nowait,
353 const struct nf_conn *ct)
355 struct nlmsghdr *nlh;
356 struct nfgenmsg *nfmsg;
357 struct nlattr *nest_parms;
358 unsigned char *b = skb_tail_pointer(skb);
360 event |= NFNL_SUBSYS_CTNETLINK << 8;
361 nlh = NLMSG_PUT(skb, pid, seq, event, sizeof(struct nfgenmsg));
362 nfmsg = NLMSG_DATA(nlh);
364 nlh->nlmsg_flags = (nowait && pid) ? NLM_F_MULTI : 0;
365 nfmsg->nfgen_family = nf_ct_l3num(ct);
366 nfmsg->version = NFNETLINK_V0;
367 nfmsg->res_id = 0;
369 nest_parms = nla_nest_start(skb, CTA_TUPLE_ORIG | NLA_F_NESTED);
370 if (!nest_parms)
371 goto nla_put_failure;
372 if (ctnetlink_dump_tuples(skb, tuple(ct, IP_CT_DIR_ORIGINAL)) < 0)
373 goto nla_put_failure;
374 nla_nest_end(skb, nest_parms);
376 nest_parms = nla_nest_start(skb, CTA_TUPLE_REPLY | NLA_F_NESTED);
377 if (!nest_parms)
378 goto nla_put_failure;
379 if (ctnetlink_dump_tuples(skb, tuple(ct, IP_CT_DIR_REPLY)) < 0)
380 goto nla_put_failure;
381 nla_nest_end(skb, nest_parms);
383 if (ctnetlink_dump_status(skb, ct) < 0 ||
384 ctnetlink_dump_timeout(skb, ct) < 0 ||
385 ctnetlink_dump_counters(skb, ct, IP_CT_DIR_ORIGINAL) < 0 ||
386 ctnetlink_dump_counters(skb, ct, IP_CT_DIR_REPLY) < 0 ||
387 ctnetlink_dump_protoinfo(skb, ct) < 0 ||
388 ctnetlink_dump_helpinfo(skb, ct) < 0 ||
389 ctnetlink_dump_mark(skb, ct) < 0 ||
390 ctnetlink_dump_secmark(skb, ct) < 0 ||
391 ctnetlink_dump_id(skb, ct) < 0 ||
392 ctnetlink_dump_use(skb, ct) < 0 ||
393 ctnetlink_dump_master(skb, ct) < 0 ||
394 ctnetlink_dump_nat_seq_adj(skb, ct) < 0)
395 goto nla_put_failure;
397 nlh->nlmsg_len = skb_tail_pointer(skb) - b;
398 return skb->len;
400 nlmsg_failure:
401 nla_put_failure:
402 nlmsg_trim(skb, b);
403 return -1;
#ifdef CONFIG_NF_CONNTRACK_EVENTS
/*
 * Notifier callback: turn a conntrack event into a netlink message and send
 * it to the matching multicast group.
 *
 * @events is a mask of IPCT_* bits and @ptr points to a struct nf_ct_event.
 * Destroy events map to IPCTNL_MSG_CT_DELETE; new/related and status/
 * protoinfo events map to IPCTNL_MSG_CT_NEW (new entries additionally carry
 * NLM_F_CREATE|NLM_F_EXCL). Other events, events for the untracked dummy
 * entry and events for groups nobody listens to are ignored.
 *
 * Always returns NOTIFY_DONE; on any failure the message is dropped.
 */
static int ctnetlink_conntrack_event(struct notifier_block *this,
				     unsigned long events, void *ptr)
{
	struct nf_ct_event *item = ptr;
	struct nf_conn *ct = item->ct;
	struct nlmsghdr *nlh;
	struct nfgenmsg *nfmsg;
	struct nlattr *nest;
	struct sk_buff *skb;
	unsigned int type;
	unsigned int flags = 0;
	unsigned int group;
	sk_buff_data_t start;

	/* ignore our fake conntrack entry */
	if (ct == &nf_conntrack_untracked)
		return NOTIFY_DONE;

	if (events & IPCT_DESTROY) {
		type = IPCTNL_MSG_CT_DELETE;
		group = NFNLGRP_CONNTRACK_DESTROY;
	} else if (events & (IPCT_NEW | IPCT_RELATED)) {
		type = IPCTNL_MSG_CT_NEW;
		flags = NLM_F_CREATE|NLM_F_EXCL;
		group = NFNLGRP_CONNTRACK_NEW;
	} else if (events & (IPCT_STATUS | IPCT_PROTOINFO)) {
		type = IPCTNL_MSG_CT_NEW;
		group = NFNLGRP_CONNTRACK_UPDATE;
	} else {
		return NOTIFY_DONE;
	}

	if (!nfnetlink_has_listeners(group))
		return NOTIFY_DONE;

	skb = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
	if (skb == NULL)
		return NOTIFY_DONE;

	start = skb->tail;

	type |= NFNL_SUBSYS_CTNETLINK << 8;
	/* NLMSG_PUT bails out through nlmsg_failure (RCU not yet taken) */
	nlh = NLMSG_PUT(skb, item->pid, 0, type, sizeof(struct nfgenmsg));
	nfmsg = NLMSG_DATA(nlh);

	nlh->nlmsg_flags = flags;
	nfmsg->nfgen_family = nf_ct_l3num(ct);
	nfmsg->version = NFNETLINK_V0;
	nfmsg->res_id = 0;

	rcu_read_lock();
	nest = nla_nest_start(skb, CTA_TUPLE_ORIG | NLA_F_NESTED);
	if (nest == NULL)
		goto nla_put_failure;
	if (ctnetlink_dump_tuples(skb, tuple(ct, IP_CT_DIR_ORIGINAL)) < 0)
		goto nla_put_failure;
	nla_nest_end(skb, nest);

	nest = nla_nest_start(skb, CTA_TUPLE_REPLY | NLA_F_NESTED);
	if (nest == NULL)
		goto nla_put_failure;
	if (ctnetlink_dump_tuples(skb, tuple(ct, IP_CT_DIR_REPLY)) < 0)
		goto nla_put_failure;
	nla_nest_end(skb, nest);

	if (ctnetlink_dump_id(skb, ct) < 0)
		goto nla_put_failure;

	if (ctnetlink_dump_status(skb, ct) < 0)
		goto nla_put_failure;

	if (events & IPCT_DESTROY) {
		/* a dying entry only reports its final counters */
		if (ctnetlink_dump_counters(skb, ct, IP_CT_DIR_ORIGINAL) < 0 ||
		    ctnetlink_dump_counters(skb, ct, IP_CT_DIR_REPLY) < 0)
			goto nla_put_failure;
	} else {
		if (ctnetlink_dump_timeout(skb, ct) < 0)
			goto nla_put_failure;

		if ((events & IPCT_PROTOINFO) &&
		    ctnetlink_dump_protoinfo(skb, ct) < 0)
			goto nla_put_failure;

		if (((events & IPCT_HELPER) || nfct_help(ct)) &&
		    ctnetlink_dump_helpinfo(skb, ct) < 0)
			goto nla_put_failure;

#ifdef CONFIG_NF_CONNTRACK_SECMARK
		if (((events & IPCT_SECMARK) || ct->secmark) &&
		    ctnetlink_dump_secmark(skb, ct) < 0)
			goto nla_put_failure;
#endif

		if ((events & IPCT_RELATED) &&
		    ctnetlink_dump_master(skb, ct) < 0)
			goto nla_put_failure;

		if ((events & IPCT_NATSEQADJ) &&
		    ctnetlink_dump_nat_seq_adj(skb, ct) < 0)
			goto nla_put_failure;
	}

#ifdef CONFIG_NF_CONNTRACK_MARK
	if (((events & IPCT_MARK) || ct->mark) &&
	    ctnetlink_dump_mark(skb, ct) < 0)
		goto nla_put_failure;
#endif
	rcu_read_unlock();

	nlh->nlmsg_len = skb->tail - start;
	nfnetlink_send(skb, item->pid, group, item->report);
	return NOTIFY_DONE;

nla_put_failure:
	rcu_read_unlock();
nlmsg_failure:
	kfree_skb(skb);
	return NOTIFY_DONE;
}
#endif /* CONFIG_NF_CONNTRACK_EVENTS */
526 static int ctnetlink_done(struct netlink_callback *cb)
528 if (cb->args[1])
529 nf_ct_put((struct nf_conn *)cb->args[1]);
530 return 0;
533 static int
534 ctnetlink_dump_table(struct sk_buff *skb, struct netlink_callback *cb)
536 struct nf_conn *ct, *last;
537 struct nf_conntrack_tuple_hash *h;
538 struct hlist_node *n;
539 struct nfgenmsg *nfmsg = NLMSG_DATA(cb->nlh);
540 u_int8_t l3proto = nfmsg->nfgen_family;
542 rcu_read_lock();
543 last = (struct nf_conn *)cb->args[1];
544 for (; cb->args[0] < nf_conntrack_htable_size; cb->args[0]++) {
545 restart:
546 hlist_for_each_entry_rcu(h, n, &init_net.ct.hash[cb->args[0]],
547 hnode) {
548 if (NF_CT_DIRECTION(h) != IP_CT_DIR_ORIGINAL)
549 continue;
550 ct = nf_ct_tuplehash_to_ctrack(h);
551 /* Dump entries of a given L3 protocol number.
552 * If it is not specified, ie. l3proto == 0,
553 * then dump everything. */
554 if (l3proto && nf_ct_l3num(ct) != l3proto)
555 continue;
556 if (cb->args[1]) {
557 if (ct != last)
558 continue;
559 cb->args[1] = 0;
561 if (ctnetlink_fill_info(skb, NETLINK_CB(cb->skb).pid,
562 cb->nlh->nlmsg_seq,
563 IPCTNL_MSG_CT_NEW,
564 1, ct) < 0) {
565 if (!atomic_inc_not_zero(&ct->ct_general.use))
566 continue;
567 cb->args[1] = (unsigned long)ct;
568 goto out;
571 if (NFNL_MSG_TYPE(cb->nlh->nlmsg_type) ==
572 IPCTNL_MSG_CT_GET_CTRZERO) {
573 struct nf_conn_counter *acct;
575 acct = nf_conn_acct_find(ct);
576 if (acct)
577 memset(acct, 0, sizeof(struct nf_conn_counter[IP_CT_DIR_MAX]));
580 if (cb->args[1]) {
581 cb->args[1] = 0;
582 goto restart;
585 out:
586 rcu_read_unlock();
587 if (last)
588 nf_ct_put(last);
590 return skb->len;
593 static inline int
594 ctnetlink_parse_tuple_ip(struct nlattr *attr, struct nf_conntrack_tuple *tuple)
596 struct nlattr *tb[CTA_IP_MAX+1];
597 struct nf_conntrack_l3proto *l3proto;
598 int ret = 0;
600 nla_parse_nested(tb, CTA_IP_MAX, attr, NULL);
602 l3proto = nf_ct_l3proto_find_get(tuple->src.l3num);
604 if (likely(l3proto->nlattr_to_tuple)) {
605 ret = nla_validate_nested(attr, CTA_IP_MAX,
606 l3proto->nla_policy);
607 if (ret == 0)
608 ret = l3proto->nlattr_to_tuple(tb, tuple);
611 nf_ct_l3proto_put(l3proto);
613 return ret;
616 static const struct nla_policy proto_nla_policy[CTA_PROTO_MAX+1] = {
617 [CTA_PROTO_NUM] = { .type = NLA_U8 },
620 static inline int
621 ctnetlink_parse_tuple_proto(struct nlattr *attr,
622 struct nf_conntrack_tuple *tuple)
624 struct nlattr *tb[CTA_PROTO_MAX+1];
625 struct nf_conntrack_l4proto *l4proto;
626 int ret = 0;
628 ret = nla_parse_nested(tb, CTA_PROTO_MAX, attr, proto_nla_policy);
629 if (ret < 0)
630 return ret;
632 if (!tb[CTA_PROTO_NUM])
633 return -EINVAL;
634 tuple->dst.protonum = nla_get_u8(tb[CTA_PROTO_NUM]);
636 l4proto = nf_ct_l4proto_find_get(tuple->src.l3num, tuple->dst.protonum);
638 if (likely(l4proto->nlattr_to_tuple)) {
639 ret = nla_validate_nested(attr, CTA_PROTO_MAX,
640 l4proto->nla_policy);
641 if (ret == 0)
642 ret = l4proto->nlattr_to_tuple(tb, tuple);
645 nf_ct_l4proto_put(l4proto);
647 return ret;
650 static int
651 ctnetlink_parse_tuple(struct nlattr *cda[], struct nf_conntrack_tuple *tuple,
652 enum ctattr_tuple type, u_int8_t l3num)
654 struct nlattr *tb[CTA_TUPLE_MAX+1];
655 int err;
657 memset(tuple, 0, sizeof(*tuple));
659 nla_parse_nested(tb, CTA_TUPLE_MAX, cda[type], NULL);
661 if (!tb[CTA_TUPLE_IP])
662 return -EINVAL;
664 tuple->src.l3num = l3num;
666 err = ctnetlink_parse_tuple_ip(tb[CTA_TUPLE_IP], tuple);
667 if (err < 0)
668 return err;
670 if (!tb[CTA_TUPLE_PROTO])
671 return -EINVAL;
673 err = ctnetlink_parse_tuple_proto(tb[CTA_TUPLE_PROTO], tuple);
674 if (err < 0)
675 return err;
677 /* orig and expect tuples get DIR_ORIGINAL */
678 if (type == CTA_TUPLE_REPLY)
679 tuple->dst.dir = IP_CT_DIR_REPLY;
680 else
681 tuple->dst.dir = IP_CT_DIR_ORIGINAL;
683 return 0;
686 static inline int
687 ctnetlink_parse_help(struct nlattr *attr, char **helper_name)
689 struct nlattr *tb[CTA_HELP_MAX+1];
691 nla_parse_nested(tb, CTA_HELP_MAX, attr, NULL);
693 if (!tb[CTA_HELP_NAME])
694 return -EINVAL;
696 *helper_name = nla_data(tb[CTA_HELP_NAME]);
698 return 0;
701 static const struct nla_policy ct_nla_policy[CTA_MAX+1] = {
702 [CTA_STATUS] = { .type = NLA_U32 },
703 [CTA_TIMEOUT] = { .type = NLA_U32 },
704 [CTA_MARK] = { .type = NLA_U32 },
705 [CTA_USE] = { .type = NLA_U32 },
706 [CTA_ID] = { .type = NLA_U32 },
709 static int
710 ctnetlink_del_conntrack(struct sock *ctnl, struct sk_buff *skb,
711 struct nlmsghdr *nlh, struct nlattr *cda[])
713 struct nf_conntrack_tuple_hash *h;
714 struct nf_conntrack_tuple tuple;
715 struct nf_conn *ct;
716 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
717 u_int8_t u3 = nfmsg->nfgen_family;
718 int err = 0;
720 if (cda[CTA_TUPLE_ORIG])
721 err = ctnetlink_parse_tuple(cda, &tuple, CTA_TUPLE_ORIG, u3);
722 else if (cda[CTA_TUPLE_REPLY])
723 err = ctnetlink_parse_tuple(cda, &tuple, CTA_TUPLE_REPLY, u3);
724 else {
725 /* Flush the whole table */
726 nf_conntrack_flush(&init_net,
727 NETLINK_CB(skb).pid,
728 nlmsg_report(nlh));
729 return 0;
732 if (err < 0)
733 return err;
735 h = nf_conntrack_find_get(&init_net, &tuple);
736 if (!h)
737 return -ENOENT;
739 ct = nf_ct_tuplehash_to_ctrack(h);
741 if (cda[CTA_ID]) {
742 u_int32_t id = ntohl(nla_get_be32(cda[CTA_ID]));
743 if (id != (u32)(unsigned long)ct) {
744 nf_ct_put(ct);
745 return -ENOENT;
749 nf_conntrack_event_report(IPCT_DESTROY,
751 NETLINK_CB(skb).pid,
752 nlmsg_report(nlh));
754 /* death_by_timeout would report the event again */
755 set_bit(IPS_DYING_BIT, &ct->status);
757 nf_ct_kill(ct);
758 nf_ct_put(ct);
760 return 0;
763 static int
764 ctnetlink_get_conntrack(struct sock *ctnl, struct sk_buff *skb,
765 struct nlmsghdr *nlh, struct nlattr *cda[])
767 struct nf_conntrack_tuple_hash *h;
768 struct nf_conntrack_tuple tuple;
769 struct nf_conn *ct;
770 struct sk_buff *skb2 = NULL;
771 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
772 u_int8_t u3 = nfmsg->nfgen_family;
773 int err = 0;
775 if (nlh->nlmsg_flags & NLM_F_DUMP)
776 return netlink_dump_start(ctnl, skb, nlh, ctnetlink_dump_table,
777 ctnetlink_done);
779 if (cda[CTA_TUPLE_ORIG])
780 err = ctnetlink_parse_tuple(cda, &tuple, CTA_TUPLE_ORIG, u3);
781 else if (cda[CTA_TUPLE_REPLY])
782 err = ctnetlink_parse_tuple(cda, &tuple, CTA_TUPLE_REPLY, u3);
783 else
784 return -EINVAL;
786 if (err < 0)
787 return err;
789 h = nf_conntrack_find_get(&init_net, &tuple);
790 if (!h)
791 return -ENOENT;
793 ct = nf_ct_tuplehash_to_ctrack(h);
795 err = -ENOMEM;
796 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
797 if (!skb2) {
798 nf_ct_put(ct);
799 return -ENOMEM;
802 rcu_read_lock();
803 err = ctnetlink_fill_info(skb2, NETLINK_CB(skb).pid, nlh->nlmsg_seq,
804 IPCTNL_MSG_CT_NEW, 1, ct);
805 rcu_read_unlock();
806 nf_ct_put(ct);
807 if (err <= 0)
808 goto free;
810 err = netlink_unicast(ctnl, skb2, NETLINK_CB(skb).pid, MSG_DONTWAIT);
811 if (err < 0)
812 goto out;
814 return 0;
816 free:
817 kfree_skb(skb2);
818 out:
819 return err;
#ifdef CONFIG_NF_NAT_NEEDED
/*
 * Apply the NAT setup in @attr to @ct through the registered
 * nfnetlink_parse_nat_setup_hook.
 *
 * When no hook is registered and module loading is available, the RCU read
 * lock, nf_conntrack_lock and the nfnetlink mutex are released (in that
 * order) around a request for the "nf-nat-ipv4" module and re-taken in
 * reverse order afterwards. The hook is never called after such a reload:
 * -EAGAIN is returned when the hook appeared, -EOPNOTSUPP otherwise.
 *
 * Returns the hook's result, -EAGAIN or -EOPNOTSUPP.
 */
static int
ctnetlink_parse_nat_setup(struct nf_conn *ct,
			  enum nf_nat_manip_type manip,
			  struct nlattr *attr)
{
	typeof(nfnetlink_parse_nat_setup_hook) parse_nat_setup;
#ifdef CONFIG_MODULES
	int loaded;
#endif

	parse_nat_setup = rcu_dereference(nfnetlink_parse_nat_setup_hook);
	if (parse_nat_setup)
		return parse_nat_setup(ct, manip, attr);

#ifdef CONFIG_MODULES
	rcu_read_unlock();
	spin_unlock_bh(&nf_conntrack_lock);
	nfnl_unlock();

	loaded = request_module("nf-nat-ipv4");

	nfnl_lock();
	spin_lock_bh(&nf_conntrack_lock);
	rcu_read_lock();

	if (loaded < 0)
		return -EOPNOTSUPP;
	if (nfnetlink_parse_nat_setup_hook)
		return -EAGAIN;
#endif
	return -EOPNOTSUPP;
}
#endif
855 static int
856 ctnetlink_change_status(struct nf_conn *ct, struct nlattr *cda[])
858 unsigned long d;
859 unsigned int status = ntohl(nla_get_be32(cda[CTA_STATUS]));
860 d = ct->status ^ status;
862 if (d & (IPS_EXPECTED|IPS_CONFIRMED|IPS_DYING))
863 /* unchangeable */
864 return -EBUSY;
866 if (d & IPS_SEEN_REPLY && !(status & IPS_SEEN_REPLY))
867 /* SEEN_REPLY bit can only be set */
868 return -EBUSY;
870 if (d & IPS_ASSURED && !(status & IPS_ASSURED))
871 /* ASSURED bit can only be set */
872 return -EBUSY;
874 /* Be careful here, modifying NAT bits can screw up things,
875 * so don't let users modify them directly if they don't pass
876 * nf_nat_range. */
877 ct->status |= status & ~(IPS_NAT_DONE_MASK | IPS_NAT_MASK);
878 return 0;
881 static int
882 ctnetlink_change_nat(struct nf_conn *ct, struct nlattr *cda[])
884 #ifdef CONFIG_NF_NAT_NEEDED
885 int ret;
887 if (cda[CTA_NAT_DST]) {
888 ret = ctnetlink_parse_nat_setup(ct,
889 IP_NAT_MANIP_DST,
890 cda[CTA_NAT_DST]);
891 if (ret < 0)
892 return ret;
894 if (cda[CTA_NAT_SRC]) {
895 ret = ctnetlink_parse_nat_setup(ct,
896 IP_NAT_MANIP_SRC,
897 cda[CTA_NAT_SRC]);
898 if (ret < 0)
899 return ret;
901 return 0;
902 #else
903 return -EOPNOTSUPP;
904 #endif
907 static inline int
908 ctnetlink_change_helper(struct nf_conn *ct, struct nlattr *cda[])
910 struct nf_conntrack_helper *helper;
911 struct nf_conn_help *help = nfct_help(ct);
912 char *helpname;
913 int err;
915 /* don't change helper of sibling connections */
916 if (ct->master)
917 return -EBUSY;
919 err = ctnetlink_parse_help(cda[CTA_HELP], &helpname);
920 if (err < 0)
921 return err;
923 if (!strcmp(helpname, "")) {
924 if (help && help->helper) {
925 /* we had a helper before ... */
926 nf_ct_remove_expectations(ct);
927 rcu_assign_pointer(help->helper, NULL);
930 return 0;
933 helper = __nf_conntrack_helper_find_byname(helpname);
934 if (helper == NULL) {
935 #ifdef CONFIG_MODULES
936 spin_unlock_bh(&nf_conntrack_lock);
938 if (request_module("nfct-helper-%s", helpname) < 0) {
939 spin_lock_bh(&nf_conntrack_lock);
940 return -EOPNOTSUPP;
943 spin_lock_bh(&nf_conntrack_lock);
944 helper = __nf_conntrack_helper_find_byname(helpname);
945 if (helper)
946 return -EAGAIN;
947 #endif
948 return -EOPNOTSUPP;
951 if (help) {
952 if (help->helper == helper)
953 return 0;
954 if (help->helper)
955 return -EBUSY;
956 /* need to zero data of old helper */
957 memset(&help->help, 0, sizeof(help->help));
958 } else {
959 help = nf_ct_helper_ext_add(ct, GFP_ATOMIC);
960 if (help == NULL)
961 return -ENOMEM;
964 rcu_assign_pointer(help->helper, helper);
966 return 0;
969 static inline int
970 ctnetlink_change_timeout(struct nf_conn *ct, struct nlattr *cda[])
972 u_int32_t timeout = ntohl(nla_get_be32(cda[CTA_TIMEOUT]));
974 if (!del_timer(&ct->timeout))
975 return -ETIME;
977 ct->timeout.expires = jiffies + timeout * HZ;
978 add_timer(&ct->timeout);
980 return 0;
983 static inline int
984 ctnetlink_change_protoinfo(struct nf_conn *ct, struct nlattr *cda[])
986 struct nlattr *tb[CTA_PROTOINFO_MAX+1], *attr = cda[CTA_PROTOINFO];
987 struct nf_conntrack_l4proto *l4proto;
988 int err = 0;
990 nla_parse_nested(tb, CTA_PROTOINFO_MAX, attr, NULL);
992 l4proto = nf_ct_l4proto_find_get(nf_ct_l3num(ct), nf_ct_protonum(ct));
993 if (l4proto->from_nlattr)
994 err = l4proto->from_nlattr(tb, ct);
995 nf_ct_l4proto_put(l4proto);
997 return err;
#ifdef CONFIG_NF_NAT_NEEDED
/*
 * All three sequence adjustment values are read with nla_get_be32(), so each
 * attribute must be validated as a 32-bit value before it is accessed.
 */
static const struct nla_policy nat_seq_policy[CTA_NAT_SEQ_MAX+1] = {
	[CTA_NAT_SEQ_CORRECTION_POS]	= { .type = NLA_U32 },
	[CTA_NAT_SEQ_OFFSET_BEFORE]	= { .type = NLA_U32 },
	[CTA_NAT_SEQ_OFFSET_AFTER]	= { .type = NLA_U32 },
};

/*
 * Load one NAT sequence adjustment record from the nested attribute @attr
 * into @natseq.
 *
 * All three values (correction position, offset before, offset after) are
 * required. They are checked before anything is written, so @natseq is left
 * untouched when the request is rejected.
 *
 * Returns 0 on success, -EINVAL when a value is missing, or the parse error
 * for a malformed attribute.
 */
static inline int
change_nat_seq_adj(struct nf_nat_seq *natseq, struct nlattr *attr)
{
	struct nlattr *cda[CTA_NAT_SEQ_MAX+1];
	int err;

	err = nla_parse_nested(cda, CTA_NAT_SEQ_MAX, attr, nat_seq_policy);
	if (err < 0)
		return err;

	if (!cda[CTA_NAT_SEQ_CORRECTION_POS] ||
	    !cda[CTA_NAT_SEQ_OFFSET_BEFORE] ||
	    !cda[CTA_NAT_SEQ_OFFSET_AFTER])
		return -EINVAL;

	natseq->correction_pos =
		ntohl(nla_get_be32(cda[CTA_NAT_SEQ_CORRECTION_POS]));
	natseq->offset_before =
		ntohl(nla_get_be32(cda[CTA_NAT_SEQ_OFFSET_BEFORE]));
	natseq->offset_after =
		ntohl(nla_get_be32(cda[CTA_NAT_SEQ_OFFSET_AFTER]));

	return 0;
}

/*
 * Update the NAT sequence adjustments of @ct from the original and/or reply
 * attributes in @cda and mark the connection IPS_SEQ_ADJUST for every
 * direction that was updated.
 *
 * Returns 0 on success or when @ct has no NAT extension, otherwise the error
 * from loading one of the records.
 */
static int
ctnetlink_change_nat_seq_adj(struct nf_conn *ct, struct nlattr *cda[])
{
	int ret = 0;
	struct nf_conn_nat *nat = nfct_nat(ct);

	if (!nat)
		return 0;

	if (cda[CTA_NAT_SEQ_ADJ_ORIG]) {
		ret = change_nat_seq_adj(&nat->seq[IP_CT_DIR_ORIGINAL],
					 cda[CTA_NAT_SEQ_ADJ_ORIG]);
		if (ret < 0)
			return ret;

		ct->status |= IPS_SEQ_ADJUST;
	}

	if (cda[CTA_NAT_SEQ_ADJ_REPLY]) {
		ret = change_nat_seq_adj(&nat->seq[IP_CT_DIR_REPLY],
					 cda[CTA_NAT_SEQ_ADJ_REPLY]);
		if (ret < 0)
			return ret;

		ct->status |= IPS_SEQ_ADJUST;
	}

	return 0;
}
#endif
1060 static int
1061 ctnetlink_change_conntrack(struct nf_conn *ct, struct nlattr *cda[])
1063 int err;
1065 if (cda[CTA_HELP]) {
1066 err = ctnetlink_change_helper(ct, cda);
1067 if (err < 0)
1068 return err;
1071 if (cda[CTA_TIMEOUT]) {
1072 err = ctnetlink_change_timeout(ct, cda);
1073 if (err < 0)
1074 return err;
1077 if (cda[CTA_STATUS]) {
1078 err = ctnetlink_change_status(ct, cda);
1079 if (err < 0)
1080 return err;
1083 if (cda[CTA_PROTOINFO]) {
1084 err = ctnetlink_change_protoinfo(ct, cda);
1085 if (err < 0)
1086 return err;
1089 #if defined(CONFIG_NF_CONNTRACK_MARK)
1090 if (cda[CTA_MARK])
1091 ct->mark = ntohl(nla_get_be32(cda[CTA_MARK]));
1092 #endif
1094 #ifdef CONFIG_NF_NAT_NEEDED
1095 if (cda[CTA_NAT_SEQ_ADJ_ORIG] || cda[CTA_NAT_SEQ_ADJ_REPLY]) {
1096 err = ctnetlink_change_nat_seq_adj(ct, cda);
1097 if (err < 0)
1098 return err;
1100 #endif
1102 return 0;
1105 static inline void
1106 ctnetlink_event_report(struct nf_conn *ct, u32 pid, int report)
1108 unsigned int events = 0;
1110 if (test_bit(IPS_EXPECTED_BIT, &ct->status))
1111 events |= IPCT_RELATED;
1112 else
1113 events |= IPCT_NEW;
1115 nf_conntrack_event_report(IPCT_STATUS |
1116 IPCT_HELPER |
1117 IPCT_REFRESH |
1118 IPCT_PROTOINFO |
1119 IPCT_NATSEQADJ |
1120 IPCT_MARK |
1121 events,
1123 pid,
1124 report);
1127 static int
1128 ctnetlink_create_conntrack(struct nlattr *cda[],
1129 struct nf_conntrack_tuple *otuple,
1130 struct nf_conntrack_tuple *rtuple,
1131 struct nf_conn *master_ct,
1132 u32 pid,
1133 int report)
1135 struct nf_conn *ct;
1136 int err = -EINVAL;
1137 struct nf_conntrack_helper *helper;
1139 ct = nf_conntrack_alloc(&init_net, otuple, rtuple, GFP_ATOMIC);
1140 if (IS_ERR(ct))
1141 return -ENOMEM;
1143 if (!cda[CTA_TIMEOUT])
1144 goto err;
1145 ct->timeout.expires = ntohl(nla_get_be32(cda[CTA_TIMEOUT]));
1147 ct->timeout.expires = jiffies + ct->timeout.expires * HZ;
1148 ct->status |= IPS_CONFIRMED;
1150 rcu_read_lock();
1151 if (cda[CTA_HELP]) {
1152 char *helpname;
1154 err = ctnetlink_parse_help(cda[CTA_HELP], &helpname);
1155 if (err < 0) {
1156 rcu_read_unlock();
1157 goto err;
1160 helper = __nf_conntrack_helper_find_byname(helpname);
1161 if (helper == NULL) {
1162 rcu_read_unlock();
1163 #ifdef CONFIG_MODULES
1164 if (request_module("nfct-helper-%s", helpname) < 0) {
1165 err = -EOPNOTSUPP;
1166 goto err;
1169 rcu_read_lock();
1170 helper = __nf_conntrack_helper_find_byname(helpname);
1171 if (helper) {
1172 rcu_read_unlock();
1173 err = -EAGAIN;
1174 goto err;
1176 rcu_read_unlock();
1177 #endif
1178 err = -EOPNOTSUPP;
1179 goto err;
1180 } else {
1181 struct nf_conn_help *help;
1183 help = nf_ct_helper_ext_add(ct, GFP_ATOMIC);
1184 if (help == NULL) {
1185 rcu_read_unlock();
1186 err = -ENOMEM;
1187 goto err;
1190 /* not in hash table yet so not strictly necessary */
1191 rcu_assign_pointer(help->helper, helper);
1193 } else {
1194 /* try an implicit helper assignation */
1195 err = __nf_ct_try_assign_helper(ct, GFP_ATOMIC);
1196 if (err < 0) {
1197 rcu_read_unlock();
1198 goto err;
1202 if (cda[CTA_STATUS]) {
1203 err = ctnetlink_change_status(ct, cda);
1204 if (err < 0) {
1205 rcu_read_unlock();
1206 goto err;
1210 if (cda[CTA_NAT_SRC] || cda[CTA_NAT_DST]) {
1211 err = ctnetlink_change_nat(ct, cda);
1212 if (err < 0) {
1213 rcu_read_unlock();
1214 goto err;
1218 if (cda[CTA_PROTOINFO]) {
1219 err = ctnetlink_change_protoinfo(ct, cda);
1220 if (err < 0) {
1221 rcu_read_unlock();
1222 goto err;
1226 nf_ct_acct_ext_add(ct, GFP_ATOMIC);
1228 #if defined(CONFIG_NF_CONNTRACK_MARK)
1229 if (cda[CTA_MARK])
1230 ct->mark = ntohl(nla_get_be32(cda[CTA_MARK]));
1231 #endif
1233 /* setup master conntrack: this is a confirmed expectation */
1234 if (master_ct) {
1235 __set_bit(IPS_EXPECTED_BIT, &ct->status);
1236 ct->master = master_ct;
1239 nf_conntrack_get(&ct->ct_general);
1240 add_timer(&ct->timeout);
1241 nf_conntrack_hash_insert(ct);
1242 rcu_read_unlock();
1243 ctnetlink_event_report(ct, pid, report);
1244 nf_ct_put(ct);
1246 return 0;
1248 err:
1249 nf_conntrack_free(ct);
1250 return err;
1253 static int
1254 ctnetlink_new_conntrack(struct sock *ctnl, struct sk_buff *skb,
1255 struct nlmsghdr *nlh, struct nlattr *cda[])
1257 struct nf_conntrack_tuple otuple, rtuple;
1258 struct nf_conntrack_tuple_hash *h = NULL;
1259 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
1260 u_int8_t u3 = nfmsg->nfgen_family;
1261 int err = 0;
1263 if (cda[CTA_TUPLE_ORIG]) {
1264 err = ctnetlink_parse_tuple(cda, &otuple, CTA_TUPLE_ORIG, u3);
1265 if (err < 0)
1266 return err;
1269 if (cda[CTA_TUPLE_REPLY]) {
1270 err = ctnetlink_parse_tuple(cda, &rtuple, CTA_TUPLE_REPLY, u3);
1271 if (err < 0)
1272 return err;
1275 spin_lock_bh(&nf_conntrack_lock);
1276 if (cda[CTA_TUPLE_ORIG])
1277 h = __nf_conntrack_find(&init_net, &otuple);
1278 else if (cda[CTA_TUPLE_REPLY])
1279 h = __nf_conntrack_find(&init_net, &rtuple);
1281 if (h == NULL) {
1282 struct nf_conntrack_tuple master;
1283 struct nf_conntrack_tuple_hash *master_h = NULL;
1284 struct nf_conn *master_ct = NULL;
1286 if (cda[CTA_TUPLE_MASTER]) {
1287 err = ctnetlink_parse_tuple(cda,
1288 &master,
1289 CTA_TUPLE_MASTER,
1290 u3);
1291 if (err < 0)
1292 goto out_unlock;
1294 master_h = __nf_conntrack_find(&init_net, &master);
1295 if (master_h == NULL) {
1296 err = -ENOENT;
1297 goto out_unlock;
1299 master_ct = nf_ct_tuplehash_to_ctrack(master_h);
1300 nf_conntrack_get(&master_ct->ct_general);
1303 err = -ENOENT;
1304 if (nlh->nlmsg_flags & NLM_F_CREATE)
1305 err = ctnetlink_create_conntrack(cda,
1306 &otuple,
1307 &rtuple,
1308 master_ct,
1309 NETLINK_CB(skb).pid,
1310 nlmsg_report(nlh));
1311 spin_unlock_bh(&nf_conntrack_lock);
1312 if (err < 0 && master_ct)
1313 nf_ct_put(master_ct);
1315 return err;
1317 /* implicit 'else' */
1319 /* We manipulate the conntrack inside the global conntrack table lock,
1320 * so there's no need to increase the refcount */
1321 err = -EEXIST;
1322 if (!(nlh->nlmsg_flags & NLM_F_EXCL)) {
1323 struct nf_conn *ct = nf_ct_tuplehash_to_ctrack(h);
1325 /* we only allow nat config for new conntracks */
1326 if (cda[CTA_NAT_SRC] || cda[CTA_NAT_DST]) {
1327 err = -EOPNOTSUPP;
1328 goto out_unlock;
1330 /* can't link an existing conntrack to a master */
1331 if (cda[CTA_TUPLE_MASTER]) {
1332 err = -EOPNOTSUPP;
1333 goto out_unlock;
1336 err = ctnetlink_change_conntrack(ct, cda);
1337 if (err == 0) {
1338 nf_conntrack_get(&ct->ct_general);
1339 spin_unlock_bh(&nf_conntrack_lock);
1340 ctnetlink_event_report(ct,
1341 NETLINK_CB(skb).pid,
1342 nlmsg_report(nlh));
1343 nf_ct_put(ct);
1344 } else
1345 spin_unlock_bh(&nf_conntrack_lock);
1347 return err;
1350 out_unlock:
1351 spin_unlock_bh(&nf_conntrack_lock);
1352 return err;
1355 /***********************************************************************
1356 * EXPECT
1357 ***********************************************************************/
1359 static inline int
1360 ctnetlink_exp_dump_tuple(struct sk_buff *skb,
1361 const struct nf_conntrack_tuple *tuple,
1362 enum ctattr_expect type)
1364 struct nlattr *nest_parms;
1366 nest_parms = nla_nest_start(skb, type | NLA_F_NESTED);
1367 if (!nest_parms)
1368 goto nla_put_failure;
1369 if (ctnetlink_dump_tuples(skb, tuple) < 0)
1370 goto nla_put_failure;
1371 nla_nest_end(skb, nest_parms);
1373 return 0;
1375 nla_put_failure:
1376 return -1;
1379 static inline int
1380 ctnetlink_exp_dump_mask(struct sk_buff *skb,
1381 const struct nf_conntrack_tuple *tuple,
1382 const struct nf_conntrack_tuple_mask *mask)
1384 int ret;
1385 struct nf_conntrack_l3proto *l3proto;
1386 struct nf_conntrack_l4proto *l4proto;
1387 struct nf_conntrack_tuple m;
1388 struct nlattr *nest_parms;
1390 memset(&m, 0xFF, sizeof(m));
1391 m.src.u.all = mask->src.u.all;
1392 memcpy(&m.src.u3, &mask->src.u3, sizeof(m.src.u3));
1394 nest_parms = nla_nest_start(skb, CTA_EXPECT_MASK | NLA_F_NESTED);
1395 if (!nest_parms)
1396 goto nla_put_failure;
1398 l3proto = __nf_ct_l3proto_find(tuple->src.l3num);
1399 ret = ctnetlink_dump_tuples_ip(skb, &m, l3proto);
1401 if (unlikely(ret < 0))
1402 goto nla_put_failure;
1404 l4proto = __nf_ct_l4proto_find(tuple->src.l3num, tuple->dst.protonum);
1405 ret = ctnetlink_dump_tuples_proto(skb, &m, l4proto);
1406 if (unlikely(ret < 0))
1407 goto nla_put_failure;
1409 nla_nest_end(skb, nest_parms);
1411 return 0;
1413 nla_put_failure:
1414 return -1;
1417 static int
1418 ctnetlink_exp_dump_expect(struct sk_buff *skb,
1419 const struct nf_conntrack_expect *exp)
1421 struct nf_conn *master = exp->master;
1422 long timeout = (exp->timeout.expires - jiffies) / HZ;
1424 if (timeout < 0)
1425 timeout = 0;
1427 if (ctnetlink_exp_dump_tuple(skb, &exp->tuple, CTA_EXPECT_TUPLE) < 0)
1428 goto nla_put_failure;
1429 if (ctnetlink_exp_dump_mask(skb, &exp->tuple, &exp->mask) < 0)
1430 goto nla_put_failure;
1431 if (ctnetlink_exp_dump_tuple(skb,
1432 &master->tuplehash[IP_CT_DIR_ORIGINAL].tuple,
1433 CTA_EXPECT_MASTER) < 0)
1434 goto nla_put_failure;
1436 NLA_PUT_BE32(skb, CTA_EXPECT_TIMEOUT, htonl(timeout));
1437 NLA_PUT_BE32(skb, CTA_EXPECT_ID, htonl((unsigned long)exp));
1439 return 0;
1441 nla_put_failure:
1442 return -1;
1445 static int
1446 ctnetlink_exp_fill_info(struct sk_buff *skb, u32 pid, u32 seq,
1447 int event,
1448 int nowait,
1449 const struct nf_conntrack_expect *exp)
1451 struct nlmsghdr *nlh;
1452 struct nfgenmsg *nfmsg;
1453 unsigned char *b = skb_tail_pointer(skb);
1455 event |= NFNL_SUBSYS_CTNETLINK_EXP << 8;
1456 nlh = NLMSG_PUT(skb, pid, seq, event, sizeof(struct nfgenmsg));
1457 nfmsg = NLMSG_DATA(nlh);
1459 nlh->nlmsg_flags = (nowait && pid) ? NLM_F_MULTI : 0;
1460 nfmsg->nfgen_family = exp->tuple.src.l3num;
1461 nfmsg->version = NFNETLINK_V0;
1462 nfmsg->res_id = 0;
1464 if (ctnetlink_exp_dump_expect(skb, exp) < 0)
1465 goto nla_put_failure;
1467 nlh->nlmsg_len = skb_tail_pointer(skb) - b;
1468 return skb->len;
1470 nlmsg_failure:
1471 nla_put_failure:
1472 nlmsg_trim(skb, b);
1473 return -1;
#ifdef CONFIG_NF_CONNTRACK_EVENTS
/*
 * Notifier callback for expectation events.
 *
 * Only IPEXP_NEW is handled: a message describing the new expectation is
 * built and sent to the NFNLGRP_CONNTRACK_EXP_NEW group.  Nothing is done
 * when that group has no listeners or when the skb cannot be allocated.
 *
 * Always returns NOTIFY_DONE.
 */
static int ctnetlink_expect_event(struct notifier_block *this,
				  unsigned long events, void *ptr)
{
	struct nf_exp_event *item = (struct nf_exp_event *)ptr;
	struct nf_conntrack_expect *exp = item->exp;
	struct nfgenmsg *nfmsg;
	struct nlmsghdr *nlh;
	struct sk_buff *skb;
	sk_buff_data_t start;
	unsigned int type;

	if (!(events & IPEXP_NEW))
		return NOTIFY_DONE;

	if (!nfnetlink_has_listeners(NFNLGRP_CONNTRACK_EXP_NEW))
		return NOTIFY_DONE;

	skb = alloc_skb(NLMSG_GOODSIZE, GFP_ATOMIC);
	if (skb == NULL)
		return NOTIFY_DONE;

	start = skb->tail;

	type = IPCTNL_MSG_EXP_NEW | (NFNL_SUBSYS_CTNETLINK_EXP << 8);
	/* NLMSG_PUT jumps to nlmsg_failure when there is no room */
	nlh = NLMSG_PUT(skb, item->pid, 0, type, sizeof(struct nfgenmsg));
	nlh->nlmsg_flags = NLM_F_CREATE|NLM_F_EXCL;

	nfmsg = NLMSG_DATA(nlh);
	nfmsg->nfgen_family = exp->tuple.src.l3num;
	nfmsg->version = NFNETLINK_V0;
	nfmsg->res_id = 0;

	rcu_read_lock();
	if (ctnetlink_exp_dump_expect(skb, exp) < 0)
		goto nla_put_failure;
	rcu_read_unlock();

	nlh->nlmsg_len = skb->tail - start;
	nfnetlink_send(skb, item->pid, NFNLGRP_CONNTRACK_EXP_NEW, item->report);
	return NOTIFY_DONE;

nla_put_failure:
	rcu_read_unlock();
nlmsg_failure:
	kfree_skb(skb);
	return NOTIFY_DONE;
}
#endif
1529 static int ctnetlink_exp_done(struct netlink_callback *cb)
1531 if (cb->args[1])
1532 nf_ct_expect_put((struct nf_conntrack_expect *)cb->args[1]);
1533 return 0;
1536 static int
1537 ctnetlink_exp_dump_table(struct sk_buff *skb, struct netlink_callback *cb)
1539 struct net *net = &init_net;
1540 struct nf_conntrack_expect *exp, *last;
1541 struct nfgenmsg *nfmsg = NLMSG_DATA(cb->nlh);
1542 struct hlist_node *n;
1543 u_int8_t l3proto = nfmsg->nfgen_family;
1545 rcu_read_lock();
1546 last = (struct nf_conntrack_expect *)cb->args[1];
1547 for (; cb->args[0] < nf_ct_expect_hsize; cb->args[0]++) {
1548 restart:
1549 hlist_for_each_entry(exp, n, &net->ct.expect_hash[cb->args[0]],
1550 hnode) {
1551 if (l3proto && exp->tuple.src.l3num != l3proto)
1552 continue;
1553 if (cb->args[1]) {
1554 if (exp != last)
1555 continue;
1556 cb->args[1] = 0;
1558 if (ctnetlink_exp_fill_info(skb, NETLINK_CB(cb->skb).pid,
1559 cb->nlh->nlmsg_seq,
1560 IPCTNL_MSG_EXP_NEW,
1561 1, exp) < 0) {
1562 if (!atomic_inc_not_zero(&exp->use))
1563 continue;
1564 cb->args[1] = (unsigned long)exp;
1565 goto out;
1568 if (cb->args[1]) {
1569 cb->args[1] = 0;
1570 goto restart;
1573 out:
1574 rcu_read_unlock();
1575 if (last)
1576 nf_ct_expect_put(last);
1578 return skb->len;
1581 static const struct nla_policy exp_nla_policy[CTA_EXPECT_MAX+1] = {
1582 [CTA_EXPECT_TIMEOUT] = { .type = NLA_U32 },
1583 [CTA_EXPECT_ID] = { .type = NLA_U32 },
1586 static int
1587 ctnetlink_get_expect(struct sock *ctnl, struct sk_buff *skb,
1588 struct nlmsghdr *nlh, struct nlattr *cda[])
1590 struct nf_conntrack_tuple tuple;
1591 struct nf_conntrack_expect *exp;
1592 struct sk_buff *skb2;
1593 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
1594 u_int8_t u3 = nfmsg->nfgen_family;
1595 int err = 0;
1597 if (nlh->nlmsg_flags & NLM_F_DUMP) {
1598 return netlink_dump_start(ctnl, skb, nlh,
1599 ctnetlink_exp_dump_table,
1600 ctnetlink_exp_done);
1603 if (cda[CTA_EXPECT_MASTER])
1604 err = ctnetlink_parse_tuple(cda, &tuple, CTA_EXPECT_MASTER, u3);
1605 else
1606 return -EINVAL;
1608 if (err < 0)
1609 return err;
1611 exp = nf_ct_expect_find_get(&init_net, &tuple);
1612 if (!exp)
1613 return -ENOENT;
1615 if (cda[CTA_EXPECT_ID]) {
1616 __be32 id = nla_get_be32(cda[CTA_EXPECT_ID]);
1617 if (ntohl(id) != (u32)(unsigned long)exp) {
1618 nf_ct_expect_put(exp);
1619 return -ENOENT;
1623 err = -ENOMEM;
1624 skb2 = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL);
1625 if (!skb2)
1626 goto out;
1628 rcu_read_lock();
1629 err = ctnetlink_exp_fill_info(skb2, NETLINK_CB(skb).pid,
1630 nlh->nlmsg_seq, IPCTNL_MSG_EXP_NEW,
1631 1, exp);
1632 rcu_read_unlock();
1633 if (err <= 0)
1634 goto free;
1636 nf_ct_expect_put(exp);
1638 return netlink_unicast(ctnl, skb2, NETLINK_CB(skb).pid, MSG_DONTWAIT);
1640 free:
1641 kfree_skb(skb2);
1642 out:
1643 nf_ct_expect_put(exp);
1644 return err;
1647 static int
1648 ctnetlink_del_expect(struct sock *ctnl, struct sk_buff *skb,
1649 struct nlmsghdr *nlh, struct nlattr *cda[])
1651 struct nf_conntrack_expect *exp;
1652 struct nf_conntrack_tuple tuple;
1653 struct nf_conntrack_helper *h;
1654 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
1655 struct hlist_node *n, *next;
1656 u_int8_t u3 = nfmsg->nfgen_family;
1657 unsigned int i;
1658 int err;
1660 if (cda[CTA_EXPECT_TUPLE]) {
1661 /* delete a single expect by tuple */
1662 err = ctnetlink_parse_tuple(cda, &tuple, CTA_EXPECT_TUPLE, u3);
1663 if (err < 0)
1664 return err;
1666 /* bump usage count to 2 */
1667 exp = nf_ct_expect_find_get(&init_net, &tuple);
1668 if (!exp)
1669 return -ENOENT;
1671 if (cda[CTA_EXPECT_ID]) {
1672 __be32 id = nla_get_be32(cda[CTA_EXPECT_ID]);
1673 if (ntohl(id) != (u32)(unsigned long)exp) {
1674 nf_ct_expect_put(exp);
1675 return -ENOENT;
1679 /* after list removal, usage count == 1 */
1680 nf_ct_unexpect_related(exp);
1681 /* have to put what we 'get' above.
1682 * after this line usage count == 0 */
1683 nf_ct_expect_put(exp);
1684 } else if (cda[CTA_EXPECT_HELP_NAME]) {
1685 char *name = nla_data(cda[CTA_EXPECT_HELP_NAME]);
1686 struct nf_conn_help *m_help;
1688 /* delete all expectations for this helper */
1689 spin_lock_bh(&nf_conntrack_lock);
1690 h = __nf_conntrack_helper_find_byname(name);
1691 if (!h) {
1692 spin_unlock_bh(&nf_conntrack_lock);
1693 return -EOPNOTSUPP;
1695 for (i = 0; i < nf_ct_expect_hsize; i++) {
1696 hlist_for_each_entry_safe(exp, n, next,
1697 &init_net.ct.expect_hash[i],
1698 hnode) {
1699 m_help = nfct_help(exp->master);
1700 if (m_help->helper == h
1701 && del_timer(&exp->timeout)) {
1702 nf_ct_unlink_expect(exp);
1703 nf_ct_expect_put(exp);
1707 spin_unlock_bh(&nf_conntrack_lock);
1708 } else {
1709 /* This basically means we have to flush everything*/
1710 spin_lock_bh(&nf_conntrack_lock);
1711 for (i = 0; i < nf_ct_expect_hsize; i++) {
1712 hlist_for_each_entry_safe(exp, n, next,
1713 &init_net.ct.expect_hash[i],
1714 hnode) {
1715 if (del_timer(&exp->timeout)) {
1716 nf_ct_unlink_expect(exp);
1717 nf_ct_expect_put(exp);
1721 spin_unlock_bh(&nf_conntrack_lock);
1724 return 0;
1726 static int
1727 ctnetlink_change_expect(struct nf_conntrack_expect *x, struct nlattr *cda[])
1729 return -EOPNOTSUPP;
1732 static int
1733 ctnetlink_create_expect(struct nlattr *cda[], u_int8_t u3, u32 pid, int report)
1735 struct nf_conntrack_tuple tuple, mask, master_tuple;
1736 struct nf_conntrack_tuple_hash *h = NULL;
1737 struct nf_conntrack_expect *exp;
1738 struct nf_conn *ct;
1739 struct nf_conn_help *help;
1740 int err = 0;
1742 /* caller guarantees that those three CTA_EXPECT_* exist */
1743 err = ctnetlink_parse_tuple(cda, &tuple, CTA_EXPECT_TUPLE, u3);
1744 if (err < 0)
1745 return err;
1746 err = ctnetlink_parse_tuple(cda, &mask, CTA_EXPECT_MASK, u3);
1747 if (err < 0)
1748 return err;
1749 err = ctnetlink_parse_tuple(cda, &master_tuple, CTA_EXPECT_MASTER, u3);
1750 if (err < 0)
1751 return err;
1753 /* Look for master conntrack of this expectation */
1754 h = nf_conntrack_find_get(&init_net, &master_tuple);
1755 if (!h)
1756 return -ENOENT;
1757 ct = nf_ct_tuplehash_to_ctrack(h);
1758 help = nfct_help(ct);
1760 if (!help || !help->helper) {
1761 /* such conntrack hasn't got any helper, abort */
1762 err = -EOPNOTSUPP;
1763 goto out;
1766 exp = nf_ct_expect_alloc(ct);
1767 if (!exp) {
1768 err = -ENOMEM;
1769 goto out;
1772 exp->expectfn = NULL;
1773 exp->flags = 0;
1774 exp->master = ct;
1775 exp->helper = NULL;
1776 memcpy(&exp->tuple, &tuple, sizeof(struct nf_conntrack_tuple));
1777 memcpy(&exp->mask.src.u3, &mask.src.u3, sizeof(exp->mask.src.u3));
1778 exp->mask.src.u.all = mask.src.u.all;
1780 err = nf_ct_expect_related_report(exp, pid, report);
1781 nf_ct_expect_put(exp);
1783 out:
1784 nf_ct_put(nf_ct_tuplehash_to_ctrack(h));
1785 return err;
1788 static int
1789 ctnetlink_new_expect(struct sock *ctnl, struct sk_buff *skb,
1790 struct nlmsghdr *nlh, struct nlattr *cda[])
1792 struct nf_conntrack_tuple tuple;
1793 struct nf_conntrack_expect *exp;
1794 struct nfgenmsg *nfmsg = NLMSG_DATA(nlh);
1795 u_int8_t u3 = nfmsg->nfgen_family;
1796 int err = 0;
1798 if (!cda[CTA_EXPECT_TUPLE]
1799 || !cda[CTA_EXPECT_MASK]
1800 || !cda[CTA_EXPECT_MASTER])
1801 return -EINVAL;
1803 err = ctnetlink_parse_tuple(cda, &tuple, CTA_EXPECT_TUPLE, u3);
1804 if (err < 0)
1805 return err;
1807 spin_lock_bh(&nf_conntrack_lock);
1808 exp = __nf_ct_expect_find(&init_net, &tuple);
1810 if (!exp) {
1811 spin_unlock_bh(&nf_conntrack_lock);
1812 err = -ENOENT;
1813 if (nlh->nlmsg_flags & NLM_F_CREATE) {
1814 err = ctnetlink_create_expect(cda,
1816 NETLINK_CB(skb).pid,
1817 nlmsg_report(nlh));
1819 return err;
1822 err = -EEXIST;
1823 if (!(nlh->nlmsg_flags & NLM_F_EXCL))
1824 err = ctnetlink_change_expect(exp, cda);
1825 spin_unlock_bh(&nf_conntrack_lock);
1827 return err;
#ifdef CONFIG_NF_CONNTRACK_EVENTS
/* Notifier block whose callback is the conntrack event handler. */
static struct notifier_block ctnl_notifier = {
	.notifier_call	= ctnetlink_conntrack_event,
};

/* Notifier block whose callback is the expectation event handler. */
static struct notifier_block ctnl_notifier_exp = {
	.notifier_call	= ctnetlink_expect_event,
};
#endif
1840 static const struct nfnl_callback ctnl_cb[IPCTNL_MSG_MAX] = {
1841 [IPCTNL_MSG_CT_NEW] = { .call = ctnetlink_new_conntrack,
1842 .attr_count = CTA_MAX,
1843 .policy = ct_nla_policy },
1844 [IPCTNL_MSG_CT_GET] = { .call = ctnetlink_get_conntrack,
1845 .attr_count = CTA_MAX,
1846 .policy = ct_nla_policy },
1847 [IPCTNL_MSG_CT_DELETE] = { .call = ctnetlink_del_conntrack,
1848 .attr_count = CTA_MAX,
1849 .policy = ct_nla_policy },
1850 [IPCTNL_MSG_CT_GET_CTRZERO] = { .call = ctnetlink_get_conntrack,
1851 .attr_count = CTA_MAX,
1852 .policy = ct_nla_policy },
1855 static const struct nfnl_callback ctnl_exp_cb[IPCTNL_MSG_EXP_MAX] = {
1856 [IPCTNL_MSG_EXP_GET] = { .call = ctnetlink_get_expect,
1857 .attr_count = CTA_EXPECT_MAX,
1858 .policy = exp_nla_policy },
1859 [IPCTNL_MSG_EXP_NEW] = { .call = ctnetlink_new_expect,
1860 .attr_count = CTA_EXPECT_MAX,
1861 .policy = exp_nla_policy },
1862 [IPCTNL_MSG_EXP_DELETE] = { .call = ctnetlink_del_expect,
1863 .attr_count = CTA_EXPECT_MAX,
1864 .policy = exp_nla_policy },
1867 static const struct nfnetlink_subsystem ctnl_subsys = {
1868 .name = "conntrack",
1869 .subsys_id = NFNL_SUBSYS_CTNETLINK,
1870 .cb_count = IPCTNL_MSG_MAX,
1871 .cb = ctnl_cb,
1874 static const struct nfnetlink_subsystem ctnl_exp_subsys = {
1875 .name = "conntrack_expect",
1876 .subsys_id = NFNL_SUBSYS_CTNETLINK_EXP,
1877 .cb_count = IPCTNL_MSG_EXP_MAX,
1878 .cb = ctnl_exp_cb,
1881 MODULE_ALIAS("ip_conntrack_netlink");
1882 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_CTNETLINK);
1883 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_CTNETLINK_EXP);
1885 static int __init ctnetlink_init(void)
1887 int ret;
1889 printk("ctnetlink v%s: registering with nfnetlink.\n", version);
1890 ret = nfnetlink_subsys_register(&ctnl_subsys);
1891 if (ret < 0) {
1892 printk("ctnetlink_init: cannot register with nfnetlink.\n");
1893 goto err_out;
1896 ret = nfnetlink_subsys_register(&ctnl_exp_subsys);
1897 if (ret < 0) {
1898 printk("ctnetlink_init: cannot register exp with nfnetlink.\n");
1899 goto err_unreg_subsys;
1902 #ifdef CONFIG_NF_CONNTRACK_EVENTS
1903 ret = nf_conntrack_register_notifier(&ctnl_notifier);
1904 if (ret < 0) {
1905 printk("ctnetlink_init: cannot register notifier.\n");
1906 goto err_unreg_exp_subsys;
1909 ret = nf_ct_expect_register_notifier(&ctnl_notifier_exp);
1910 if (ret < 0) {
1911 printk("ctnetlink_init: cannot expect register notifier.\n");
1912 goto err_unreg_notifier;
1914 #endif
1916 return 0;
1918 #ifdef CONFIG_NF_CONNTRACK_EVENTS
1919 err_unreg_notifier:
1920 nf_conntrack_unregister_notifier(&ctnl_notifier);
1921 err_unreg_exp_subsys:
1922 nfnetlink_subsys_unregister(&ctnl_exp_subsys);
1923 #endif
1924 err_unreg_subsys:
1925 nfnetlink_subsys_unregister(&ctnl_subsys);
1926 err_out:
1927 return ret;
1930 static void __exit ctnetlink_exit(void)
1932 printk("ctnetlink: unregistering from nfnetlink.\n");
1934 #ifdef CONFIG_NF_CONNTRACK_EVENTS
1935 nf_ct_expect_unregister_notifier(&ctnl_notifier_exp);
1936 nf_conntrack_unregister_notifier(&ctnl_notifier);
1937 #endif
1939 nfnetlink_subsys_unregister(&ctnl_exp_subsys);
1940 nfnetlink_subsys_unregister(&ctnl_subsys);
1941 return;
1944 module_init(ctnetlink_init);
1945 module_exit(ctnetlink_exit);