3 * (C) 2012 by Vyatta Inc. <http://www.vyatta.com>
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License version 2 as
7 * published by the Free Software Foundation (or any later at your option).
9 #include <linux/init.h>
10 #include <linux/module.h>
11 #include <linux/kernel.h>
12 #include <linux/rculist.h>
13 #include <linux/rculist_nulls.h>
14 #include <linux/types.h>
15 #include <linux/timer.h>
16 #include <linux/security.h>
17 #include <linux/skbuff.h>
18 #include <linux/errno.h>
19 #include <linux/netlink.h>
20 #include <linux/spinlock.h>
21 #include <linux/interrupt.h>
22 #include <linux/slab.h>
24 #include <linux/netfilter.h>
25 #include <net/netlink.h>
27 #include <net/netfilter/nf_conntrack.h>
28 #include <net/netfilter/nf_conntrack_core.h>
29 #include <net/netfilter/nf_conntrack_l3proto.h>
30 #include <net/netfilter/nf_conntrack_l4proto.h>
31 #include <net/netfilter/nf_conntrack_tuple.h>
32 #include <net/netfilter/nf_conntrack_timeout.h>
34 #include <linux/netfilter/nfnetlink.h>
35 #include <linux/netfilter/nfnetlink_cttimeout.h>
/* Module metadata: license and a one-line description. */
37 MODULE_LICENSE("GPL");
39 MODULE_DESCRIPTION("cttimeout: Extended Netfilter Connection Tracking timeout tuning");
/* List of the ctnl_timeout objects handled by this file. Entries are added
 * with list_add_tail_rcu() and removed with list_del_rcu().
 */
41 static LIST_HEAD(cttimeout_list);
/* Validation policy for the CTA_TIMEOUT_* attributes, referenced by every
 * entry of cttimeout_cb: the name is an NLA_NUL_STRING with .len set to
 * CTNL_TIMEOUT_NAME_MAX - 1, the L3 protocol is an NLA_U16, the L4 protocol
 * an NLA_U8 and the timeout data a nested attribute.
 */
43 static const struct nla_policy cttimeout_nla_policy[CTA_TIMEOUT_MAX+1] = {
44 [CTA_TIMEOUT_NAME] = { .type = NLA_NUL_STRING,
45 .len = CTNL_TIMEOUT_NAME_MAX - 1},
46 [CTA_TIMEOUT_L3PROTO] = { .type = NLA_U16 },
47 [CTA_TIMEOUT_L4PROTO] = { .type = NLA_U8 },
48 [CTA_TIMEOUT_DATA] = { .type = NLA_NESTED },
/* Convert the nested netlink attribute @attr into a protocol-specific
 * timeout object stored at @timeouts.
 *
 * When @l4proto provides a ctnl_timeout.nlattr_to_obj callback, @attr is
 * parsed with nla_parse_nested() against the protocol's own nla_policy and
 * the resulting attribute table is handed to that callback together with
 * @net and @timeouts.
 *
 * NOTE(review): the declaration of ret, the check of the parse result and
 * the return statements are not visible in this excerpt; presumably the
 * value left in ret is what the caller receives -- confirm.
 */
52 ctnl_timeout_parse_policy(void *timeouts, struct nf_conntrack_l4proto *l4proto,
53 struct net *net, const struct nlattr *attr)
57 if (likely(l4proto->ctnl_timeout.nlattr_to_obj)) {
/* Attribute table sized at run time from the protocol's nlattr_max. */
58 struct nlattr *tb[l4proto->ctnl_timeout.nlattr_max+1];
60 ret = nla_parse_nested(tb, l4proto->ctnl_timeout.nlattr_max,
61 attr, l4proto->ctnl_timeout.nla_policy);
/* Let the protocol fill in the object at @timeouts from the table. */
65 ret = l4proto->ctnl_timeout.nlattr_to_obj(tb, net, timeouts);
/* Handler wired to IPCTNL_MSG_TIMEOUT_NEW in cttimeout_cb: create a named
 * timeout policy or update an existing one.
 *
 * Visible steps:
 *  - CTA_TIMEOUT_NAME, _L3PROTO, _L4PROTO and _DATA are all tested for
 *    presence.
 *  - cttimeout_list is searched for an entry with the same name; the
 *    NLM_F_EXCL flag is tested when one is found.
 *  - The L4 protocol tracker is looked up with nf_ct_l4proto_find_get() and
 *    its l4proto number is compared against the requested one.
 *  - With NLM_F_REPLACE, the matching entry must have the same l3num and L4
 *    protocol; the new data is then parsed into matching->data.
 *  - Otherwise a ctnl_timeout followed by ctnl_timeout.obj_size bytes is
 *    allocated with kzalloc(), the policy is parsed into timeout->data, the
 *    name, l3num and l4proto are recorded, refcnt is set to 1 and the object
 *    is appended to cttimeout_list with list_add_tail_rcu().
 *
 * The name is copied with strcpy(); cttimeout_nla_policy sets the name
 * attribute's .len to CTNL_TIMEOUT_NAME_MAX - 1.
 * NOTE(review): presumably timeout->name holds CTNL_TIMEOUT_NAME_MAX bytes
 * -- confirm against the struct definition.
 *
 * NOTE(review): the error codes, goto targets and return statements are not
 * visible in this excerpt; the nf_ct_l4proto_put() on the last visible line
 * presumably belongs to an error path -- confirm.
 */
71 cttimeout_new_timeout(struct sock *ctnl, struct sk_buff *skb,
72 const struct nlmsghdr *nlh,
73 const struct nlattr * const cda[])
77 struct nf_conntrack_l4proto *l4proto;
78 struct ctnl_timeout *timeout, *matching = NULL;
79 struct net *net = sock_net(skb->sk);
/* All four attributes are tested here. */
83 if (!cda[CTA_TIMEOUT_NAME] ||
84 !cda[CTA_TIMEOUT_L3PROTO] ||
85 !cda[CTA_TIMEOUT_L4PROTO] ||
86 !cda[CTA_TIMEOUT_DATA])
89 name = nla_data(cda[CTA_TIMEOUT_NAME]);
/* The L3 protocol number is carried in network byte order. */
90 l3num = ntohs(nla_get_be16(cda[CTA_TIMEOUT_L3PROTO]));
91 l4num = nla_get_u8(cda[CTA_TIMEOUT_L4PROTO]);
/* Look for an existing policy with the same name. */
93 list_for_each_entry(timeout, &cttimeout_list, head) {
94 if (strncmp(timeout->name, name, CTNL_TIMEOUT_NAME_MAX) != 0)
97 if (nlh->nlmsg_flags & NLM_F_EXCL)
104 l4proto = nf_ct_l4proto_find_get(l3num, l4num);
106 /* This protocol is not supported, skip. */
107 if (l4proto->l4proto != l4num) {
113 if (nlh->nlmsg_flags & NLM_F_REPLACE) {
114 /* You cannot replace one timeout policy by another of
115 * different kind, sorry.
117 if (matching->l3num != l3num ||
118 matching->l4proto->l4proto != l4num) {
123 ret = ctnl_timeout_parse_policy(&matching->data,
125 cda[CTA_TIMEOUT_DATA]);
132 timeout = kzalloc(sizeof(struct ctnl_timeout) +
133 l4proto->ctnl_timeout.obj_size, GFP_KERNEL);
134 if (timeout == NULL) {
139 ret = ctnl_timeout_parse_policy(&timeout->data, l4proto, net,
140 cda[CTA_TIMEOUT_DATA]);
144 strcpy(timeout->name, nla_data(cda[CTA_TIMEOUT_NAME]));
145 timeout->l3num = l3num;
146 timeout->l4proto = l4proto;
147 atomic_set(&timeout->refcnt, 1);
148 list_add_tail_rcu(&timeout->head, &cttimeout_list);
154 nf_ct_l4proto_put(l4proto);
/* Serialize one timeout policy into @skb as an nfnetlink message.
 *
 * @skb:     buffer the message is appended to
 * @portid:  destination port id; also selects the NLM_F_MULTI flag
 * @seq:     netlink sequence number placed in the header
 * @type:    not referenced in the lines visible here
 * @event:   message type; the NFNL_SUBSYS_CTNETLINK_TIMEOUT subsystem id is
 *           OR'ed into bits 8 and up
 * @timeout: policy object to dump
 *
 * The message carries the name, the L3 protocol number (big endian), the L4
 * protocol number, the current refcnt as CTA_TIMEOUT_USE (big endian) and,
 * when the protocol provides ctnl_timeout.obj_to_nlattr, a nested
 * CTA_TIMEOUT_DATA attribute written by that callback.
 *
 * NOTE(review): the failure checks, the nla_put_failure label and the
 * return statements are not visible in this excerpt; nlmsg_cancel() on the
 * last visible line presumably runs under that label -- confirm.
 */
159 ctnl_timeout_fill_info(struct sk_buff *skb, u32 portid, u32 seq, u32 type,
160 int event, struct ctnl_timeout *timeout)
162 struct nlmsghdr *nlh;
163 struct nfgenmsg *nfmsg;
/* NLM_F_MULTI is set whenever portid is non-zero. */
164 unsigned int flags = portid ? NLM_F_MULTI : 0;
165 struct nf_conntrack_l4proto *l4proto = timeout->l4proto;
167 event |= NFNL_SUBSYS_CTNETLINK_TIMEOUT << 8;
168 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*nfmsg), flags);
/* Fill in the nfnetlink generic header that follows the netlink header. */
172 nfmsg = nlmsg_data(nlh);
173 nfmsg->nfgen_family = AF_UNSPEC;
174 nfmsg->version = NFNETLINK_V0;
177 if (nla_put_string(skb, CTA_TIMEOUT_NAME, timeout->name) ||
178 nla_put_be16(skb, CTA_TIMEOUT_L3PROTO, htons(timeout->l3num)) ||
179 nla_put_u8(skb, CTA_TIMEOUT_L4PROTO, timeout->l4proto->l4proto) ||
180 nla_put_be32(skb, CTA_TIMEOUT_USE,
181 htonl(atomic_read(&timeout->refcnt))))
182 goto nla_put_failure;
/* Protocol-specific timeout values go into a nested attribute. */
184 if (likely(l4proto->ctnl_timeout.obj_to_nlattr)) {
185 struct nlattr *nest_parms;
188 nest_parms = nla_nest_start(skb,
189 CTA_TIMEOUT_DATA | NLA_F_NESTED);
191 goto nla_put_failure;
193 ret = l4proto->ctnl_timeout.obj_to_nlattr(skb, &timeout->data);
195 goto nla_put_failure;
197 nla_nest_end(skb, nest_parms);
205 nlmsg_cancel(skb, nlh);
/* Netlink dump callback (installed by cttimeout_get_timeout): walk
 * cttimeout_list with the RCU list iterator and emit one
 * IPCTNL_MSG_TIMEOUT_NEW message per entry into @skb.
 *
 * cb->args[1] is read into `last` before the walk and is set to the current
 * entry when ctnl_timeout_fill_info() reports a failure.
 *
 * NOTE(review): how `last` is used to resume, the RCU read-side locking and
 * the return value are not visible in this excerpt -- confirm.
 */
210 ctnl_timeout_dump(struct sk_buff *skb, struct netlink_callback *cb)
212 struct ctnl_timeout *cur, *last;
217 last = (struct ctnl_timeout *)cb->args[1];
222 list_for_each_entry_rcu(cur, &cttimeout_list, head) {
229 if (ctnl_timeout_fill_info(skb, NETLINK_CB(cb->skb).portid,
231 NFNL_MSG_TYPE(cb->nlh->nlmsg_type),
232 IPCTNL_MSG_TIMEOUT_NEW, cur) < 0) {
/* Record the entry that could not be written. */
233 cb->args[1] = (unsigned long)cur;
/* Handler wired to IPCTNL_MSG_TIMEOUT_GET in cttimeout_cb.
 *
 * With NLM_F_DUMP set, a netlink dump is started with ctnl_timeout_dump as
 * the dump callback. Otherwise CTA_TIMEOUT_NAME is tested for presence, the
 * policy with that name is looked up in cttimeout_list, serialized into a
 * freshly allocated skb with ctnl_timeout_fill_info() (event
 * IPCTNL_MSG_TIMEOUT_NEW) and unicast back to the port id of the requester.
 *
 * An -EAGAIN result is reported as -ENOBUFS.
 *
 * NOTE(review): the allocation/fill failure handling and the remaining
 * netlink_unicast() arguments are not visible in this excerpt.
 */
244 cttimeout_get_timeout(struct sock *ctnl, struct sk_buff *skb,
245 const struct nlmsghdr *nlh,
246 const struct nlattr * const cda[])
250 struct ctnl_timeout *cur;
252 if (nlh->nlmsg_flags & NLM_F_DUMP) {
253 struct netlink_dump_control c = {
254 .dump = ctnl_timeout_dump,
256 return netlink_dump_start(ctnl, skb, nlh, &c);
259 if (!cda[CTA_TIMEOUT_NAME])
261 name = nla_data(cda[CTA_TIMEOUT_NAME]);
/* Find the policy whose name matches the request. */
263 list_for_each_entry(cur, &cttimeout_list, head) {
264 struct sk_buff *skb2;
266 if (strncmp(cur->name, name, CTNL_TIMEOUT_NAME_MAX) != 0)
/* Reply goes into its own buffer, separate from the request skb. */
269 skb2 = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
275 ret = ctnl_timeout_fill_info(skb2, NETLINK_CB(skb).portid,
277 NFNL_MSG_TYPE(nlh->nlmsg_type),
278 IPCTNL_MSG_TIMEOUT_NEW, cur);
283 ret = netlink_unicast(ctnl, skb2, NETLINK_CB(skb).portid,
288 /* this avoids a loop in nfnetlink. */
289 return ret == -EAGAIN ? -ENOBUFS : ret;
/* Detach a timeout policy from the conntrack entry that owns tuple hash @i.
 *
 * If the conntrack has a timeout extension and either @timeout is NULL or
 * the extension points at @timeout, the extension's timeout pointer is
 * reset to NULL. A NULL @timeout therefore matches every policy.
 */
294 static void untimeout(struct nf_conntrack_tuple_hash *i,
295 struct ctnl_timeout *timeout)
297 struct nf_conn *ct = nf_ct_tuplehash_to_ctrack(i);
298 struct nf_conn_timeout *timeout_ext = nf_ct_timeout_find(ct);
300 if (timeout_ext && (!timeout || timeout_ext->timeout == timeout))
301 RCU_INIT_POINTER(timeout_ext->timeout, NULL);
/* Run untimeout() with @timeout on every entry of the init_net conntrack
 * hash table.
 *
 * Each bucket i is visited while holding the spinlock
 * nf_conntrack_locks[i % CONNTRACK_LOCKS]; the bucket index is compared
 * against init_net.ct.htable_size again once the lock is held.
 *
 * NOTE(review): only init_net's table is walked in the visible lines;
 * whether other network namespaces need the same treatment should be
 * confirmed. Any locking outside the per-bucket spinlock is not visible in
 * this excerpt.
 */
304 static void ctnl_untimeout(struct ctnl_timeout *timeout)
306 struct nf_conntrack_tuple_hash *h;
307 const struct hlist_nulls_node *nn;
311 for (i = 0; i < init_net.ct.htable_size; i++) {
312 spin_lock(&nf_conntrack_locks[i % CONNTRACK_LOCKS]);
/* Second bounds check, this time with the bucket lock held. */
313 if (i < init_net.ct.htable_size) {
314 hlist_nulls_for_each_entry(h, nn, &init_net.ct.hash[i], hnnode)
315 untimeout(h, timeout);
317 spin_unlock(&nf_conntrack_locks[i % CONNTRACK_LOCKS]);
322 /* try to delete object, fail if it is still in use. */
/* The reference taken at creation time (refcnt is initialised to 1 in
 * cttimeout_new_timeout) is dropped here. When that brings refcnt to zero
 * the object is unlinked from the list, its l4proto reference is released,
 * conntrack entries still pointing at it are detached through
 * ctnl_untimeout() and the memory is freed with kfree_rcu(). The visible
 * atomic_inc() restores the counter for the still-in-use case.
 *
 * NOTE(review): the else branch and the return values are not visible in
 * this excerpt -- confirm.
 */
323 static int ctnl_timeout_try_del(struct ctnl_timeout *timeout)
327 /* we want to avoid races with nf_ct_timeout_find_get. */
328 if (atomic_dec_and_test(&timeout->refcnt)) {
329 /* We are protected by nfnl mutex. */
330 list_del_rcu(&timeout->head);
331 nf_ct_l4proto_put(timeout->l4proto);
332 ctnl_untimeout(timeout);
333 kfree_rcu(timeout, rcu_head);
335 /* still in use, restore reference counter. */
336 atomic_inc(&timeout->refcnt);
/* Handler wired to IPCTNL_MSG_TIMEOUT_DELETE in cttimeout_cb.
 *
 * Without CTA_TIMEOUT_NAME, ctnl_timeout_try_del() is called on every entry
 * of cttimeout_list. With a name, only the entry whose name matches is
 * passed to ctnl_timeout_try_del() and its result is stored in ret.
 *
 * NOTE(review): the delete-all loop uses list_for_each_entry() although
 * ctnl_timeout_try_del() may unlink the current entry and queue it for
 * kfree_rcu(); check whether the _safe iterator is needed here.
 *
 * NOTE(review): return statements and the not-found result are not visible
 * in this excerpt.
 */
343 cttimeout_del_timeout(struct sock *ctnl, struct sk_buff *skb,
344 const struct nlmsghdr *nlh,
345 const struct nlattr * const cda[])
348 struct ctnl_timeout *cur;
/* No name given: attempt to delete every policy. */
351 if (!cda[CTA_TIMEOUT_NAME]) {
352 list_for_each_entry(cur, &cttimeout_list, head)
353 ctnl_timeout_try_del(cur);
357 name = nla_data(cda[CTA_TIMEOUT_NAME]);
/* Name given: delete only the matching policy. */
359 list_for_each_entry(cur, &cttimeout_list, head) {
360 if (strncmp(cur->name, name, CTNL_TIMEOUT_NAME_MAX) != 0)
363 ret = ctnl_timeout_try_del(cur);
/* Handler wired to IPCTNL_MSG_TIMEOUT_DEFAULT_SET in cttimeout_cb: update
 * the timeout array that the protocol tracker returns for the requesting
 * socket's network namespace.
 *
 * CTA_TIMEOUT_L3PROTO, _L4PROTO and _DATA are tested for presence. The
 * tracker is looked up with nf_ct_l4proto_find_get() and its l4proto number
 * is compared with the requested one. The array returned by
 * l4proto->get_timeouts(net) is then passed to ctnl_timeout_parse_policy()
 * as the destination object.
 *
 * NOTE(review): two nf_ct_l4proto_put() calls are visible, presumably one
 * per exit path; the return statements and labels between them are not
 * visible in this excerpt -- confirm.
 */
373 cttimeout_default_set(struct sock *ctnl, struct sk_buff *skb,
374 const struct nlmsghdr *nlh,
375 const struct nlattr * const cda[])
379 struct nf_conntrack_l4proto *l4proto;
380 struct net *net = sock_net(skb->sk);
381 unsigned int *timeouts;
384 if (!cda[CTA_TIMEOUT_L3PROTO] ||
385 !cda[CTA_TIMEOUT_L4PROTO] ||
386 !cda[CTA_TIMEOUT_DATA])
/* The L3 protocol number is carried in network byte order. */
389 l3num = ntohs(nla_get_be16(cda[CTA_TIMEOUT_L3PROTO]));
390 l4num = nla_get_u8(cda[CTA_TIMEOUT_L4PROTO]);
391 l4proto = nf_ct_l4proto_find_get(l3num, l4num);
393 /* This protocol is not supported, skip. */
394 if (l4proto->l4proto != l4num) {
/* Parse the new values straight into the per-namespace timeout array. */
399 timeouts = l4proto->get_timeouts(net);
401 ret = ctnl_timeout_parse_policy(timeouts, l4proto, net,
402 cda[CTA_TIMEOUT_DATA]);
406 nf_ct_l4proto_put(l4proto);
409 nf_ct_l4proto_put(l4proto);
/* Serialize the timeouts that @l4proto returns for @net into @skb as an
 * nfnetlink message.
 *
 * @net:     namespace whose timeout array is read via get_timeouts()
 * @skb:     buffer the message is appended to
 * @portid:  destination port id; also selects the NLM_F_MULTI flag
 * @seq:     netlink sequence number placed in the header
 * @type:    not referenced in the lines visible here
 * @event:   message type; the NFNL_SUBSYS_CTNETLINK_TIMEOUT subsystem id is
 *           OR'ed into bits 8 and up
 * @l4proto: protocol tracker whose timeouts are dumped
 *
 * The message carries the tracker's L3 protocol number (big endian), its L4
 * protocol number and, when ctnl_timeout.obj_to_nlattr is provided, a
 * nested CTA_TIMEOUT_DATA attribute written by that callback.
 *
 * NOTE(review): the failure checks, the nla_put_failure label and the
 * return statements are not visible in this excerpt; nlmsg_cancel() on the
 * last visible line presumably runs under that label -- confirm.
 */
414 cttimeout_default_fill_info(struct net *net, struct sk_buff *skb, u32 portid,
415 u32 seq, u32 type, int event,
416 struct nf_conntrack_l4proto *l4proto)
418 struct nlmsghdr *nlh;
419 struct nfgenmsg *nfmsg;
/* NLM_F_MULTI is set whenever portid is non-zero. */
420 unsigned int flags = portid ? NLM_F_MULTI : 0;
422 event |= NFNL_SUBSYS_CTNETLINK_TIMEOUT << 8;
423 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*nfmsg), flags);
/* Fill in the nfnetlink generic header that follows the netlink header. */
427 nfmsg = nlmsg_data(nlh);
428 nfmsg->nfgen_family = AF_UNSPEC;
429 nfmsg->version = NFNETLINK_V0;
432 if (nla_put_be16(skb, CTA_TIMEOUT_L3PROTO, htons(l4proto->l3proto)) ||
433 nla_put_u8(skb, CTA_TIMEOUT_L4PROTO, l4proto->l4proto))
434 goto nla_put_failure;
436 if (likely(l4proto->ctnl_timeout.obj_to_nlattr)) {
437 struct nlattr *nest_parms;
/* Source of the values: the tracker's timeout array for @net. */
438 unsigned int *timeouts = l4proto->get_timeouts(net);
441 nest_parms = nla_nest_start(skb,
442 CTA_TIMEOUT_DATA | NLA_F_NESTED);
444 goto nla_put_failure;
446 ret = l4proto->ctnl_timeout.obj_to_nlattr(skb, timeouts);
448 goto nla_put_failure;
450 nla_nest_end(skb, nest_parms);
458 nlmsg_cancel(skb, nlh);
/* Handler wired to IPCTNL_MSG_TIMEOUT_DEFAULT_GET in cttimeout_cb: report
 * the timeouts of one protocol tracker for the requesting socket's network
 * namespace.
 *
 * CTA_TIMEOUT_L3PROTO and CTA_TIMEOUT_L4PROTO are tested for presence. The
 * tracker is looked up with nf_ct_l4proto_find_get() and its l4proto number
 * is compared with the requested one. The reply is built in a new skb by
 * cttimeout_default_fill_info() using the IPCTNL_MSG_TIMEOUT_DEFAULT_SET
 * event and unicast to the requester with MSG_DONTWAIT. An -EAGAIN result
 * is reported as -ENOBUFS.
 *
 * NOTE(review): the visible return after netlink_unicast() comes before the
 * nf_ct_l4proto_put() call; check whether the success path releases the
 * l4proto reference. Labels and error handling are not visible in this
 * excerpt.
 */
462 static int cttimeout_default_get(struct sock *ctnl, struct sk_buff *skb,
463 const struct nlmsghdr *nlh,
464 const struct nlattr * const cda[])
468 struct nf_conntrack_l4proto *l4proto;
469 struct net *net = sock_net(skb->sk);
470 struct sk_buff *skb2;
473 if (!cda[CTA_TIMEOUT_L3PROTO] || !cda[CTA_TIMEOUT_L4PROTO])
/* The L3 protocol number is carried in network byte order. */
476 l3num = ntohs(nla_get_be16(cda[CTA_TIMEOUT_L3PROTO]));
477 l4num = nla_get_u8(cda[CTA_TIMEOUT_L4PROTO]);
478 l4proto = nf_ct_l4proto_find_get(l3num, l4num);
480 /* This protocol is not supported, skip. */
481 if (l4proto->l4proto != l4num) {
/* Reply goes into its own buffer, separate from the request skb. */
486 skb2 = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
492 ret = cttimeout_default_fill_info(net, skb2, NETLINK_CB(skb).portid,
494 NFNL_MSG_TYPE(nlh->nlmsg_type),
495 IPCTNL_MSG_TIMEOUT_DEFAULT_SET,
502 ret = netlink_unicast(ctnl, skb2, NETLINK_CB(skb).portid, MSG_DONTWAIT);
506 /* this avoids a loop in nfnetlink. */
507 return ret == -EAGAIN ? -ENOBUFS : ret;
509 nf_ct_l4proto_put(l4proto);
513 #ifdef CONFIG_NF_CONNTRACK_TIMEOUT
/* Look up a timeout policy by @name and take references on it.
 *
 * cttimeout_list is walked with the RCU list iterator. For the entry whose
 * name matches, a reference on this module is taken with try_module_get()
 * and the object's refcnt is raised with atomic_inc_not_zero(); if the
 * refcnt cannot be raised the module reference is dropped again.
 * cttimeout_init() installs this function as nf_ct_timeout_find_get_hook.
 *
 * NOTE(review): the RCU read-side locking, the assignment to `matching` and
 * the return statement are not visible in this excerpt; presumably the
 * matching object or NULL is returned -- confirm.
 */
514 static struct ctnl_timeout *ctnl_timeout_find_get(const char *name)
516 struct ctnl_timeout *timeout, *matching = NULL;
519 list_for_each_entry_rcu(timeout, &cttimeout_list, head) {
520 if (strncmp(timeout->name, name, CTNL_TIMEOUT_NAME_MAX) != 0)
/* Take a module reference before taking one on the object. */
523 if (!try_module_get(THIS_MODULE))
526 if (!atomic_inc_not_zero(&timeout->refcnt)) {
527 module_put(THIS_MODULE);
/* Release what ctnl_timeout_find_get() acquired: decrement the object's
 * refcnt and drop the module reference. cttimeout_init() installs this
 * function as nf_ct_timeout_put_hook.
 */
538 static void ctnl_timeout_put(struct ctnl_timeout *timeout)
540 atomic_dec(&timeout->refcnt);
541 module_put(THIS_MODULE);
543 #endif /* CONFIG_NF_CONNTRACK_TIMEOUT */
/* nfnetlink dispatch table, indexed by IPCTNL_MSG_TIMEOUT_* message type.
 * Every entry uses cttimeout_nla_policy with CTA_TIMEOUT_MAX as its
 * attribute count.
 */
545 static const struct nfnl_callback cttimeout_cb[IPCTNL_MSG_TIMEOUT_MAX] = {
546 [IPCTNL_MSG_TIMEOUT_NEW] = { .call = cttimeout_new_timeout,
547 .attr_count = CTA_TIMEOUT_MAX,
548 .policy = cttimeout_nla_policy },
549 [IPCTNL_MSG_TIMEOUT_GET] = { .call = cttimeout_get_timeout,
550 .attr_count = CTA_TIMEOUT_MAX,
551 .policy = cttimeout_nla_policy },
552 [IPCTNL_MSG_TIMEOUT_DELETE] = { .call = cttimeout_del_timeout,
553 .attr_count = CTA_TIMEOUT_MAX,
554 .policy = cttimeout_nla_policy },
555 [IPCTNL_MSG_TIMEOUT_DEFAULT_SET]= { .call = cttimeout_default_set,
556 .attr_count = CTA_TIMEOUT_MAX,
557 .policy = cttimeout_nla_policy },
558 [IPCTNL_MSG_TIMEOUT_DEFAULT_GET]= { .call = cttimeout_default_get,
559 .attr_count = CTA_TIMEOUT_MAX,
560 .policy = cttimeout_nla_policy },
/* nfnetlink subsystem descriptor passed to nfnetlink_subsys_register() and
 * nfnetlink_subsys_unregister() by the module init and exit functions.
 * NOTE(review): the field that points at the callback table is not visible
 * in this excerpt; presumably it references cttimeout_cb -- confirm.
 */
563 static const struct nfnetlink_subsystem cttimeout_subsys = {
564 .name = "conntrack_timeout",
565 .subsys_id = NFNL_SUBSYS_CTNETLINK_TIMEOUT,
566 .cb_count = IPCTNL_MSG_TIMEOUT_MAX,
/* Module alias derived from the subsystem id. */
570 MODULE_ALIAS_NFNL_SUBSYS(NFNL_SUBSYS_CTNETLINK_TIMEOUT);
/* Module init: register cttimeout_subsys with nfnetlink and, when
 * CONFIG_NF_CONNTRACK_TIMEOUT is enabled, publish ctnl_timeout_find_get()
 * and ctnl_timeout_put() through the nf_ct_timeout_*_hook pointers.
 *
 * NOTE(review): the check of the registration result and the return
 * statements are not visible in this excerpt; the pr_err() presumably
 * reports a failed registration -- confirm.
 */
572 static int __init cttimeout_init(void)
576 ret = nfnetlink_subsys_register(&cttimeout_subsys);
578 pr_err("cttimeout_init: cannot register cttimeout with "
582 #ifdef CONFIG_NF_CONNTRACK_TIMEOUT
583 RCU_INIT_POINTER(nf_ct_timeout_find_get_hook, ctnl_timeout_find_get);
584 RCU_INIT_POINTER(nf_ct_timeout_put_hook, ctnl_timeout_put);
585 #endif /* CONFIG_NF_CONNTRACK_TIMEOUT */
/* Module exit: log a message, unregister the subsystem from nfnetlink,
 * detach every timeout policy from the conntrack entries in init_net by
 * calling ctnl_untimeout(NULL), then unlink each object on cttimeout_list,
 * release its l4proto reference and free it with kfree_rcu(). When
 * CONFIG_NF_CONNTRACK_TIMEOUT is enabled the two hook pointers are reset to
 * NULL afterwards.
 */
592 static void __exit cttimeout_exit(void)
594 struct ctnl_timeout *cur, *tmp;
596 pr_info("cttimeout: unregistering from nfnetlink.\n");
598 nfnetlink_subsys_unregister(&cttimeout_subsys);
600 /* Make sure no conntrack objects refer to custom timeouts anymore. */
601 ctnl_untimeout(NULL);
/* The _safe iterator is used because each entry is unlinked in the loop. */
603 list_for_each_entry_safe(cur, tmp, &cttimeout_list, head) {
604 list_del_rcu(&cur->head);
605 /* We are sure that our objects have no clients at this point,
606 * it's safe to release them all without checking refcnt.
608 nf_ct_l4proto_put(cur->l4proto);
609 kfree_rcu(cur, rcu_head);
611 #ifdef CONFIG_NF_CONNTRACK_TIMEOUT
612 RCU_INIT_POINTER(nf_ct_timeout_find_get_hook, NULL);
613 RCU_INIT_POINTER(nf_ct_timeout_put_hook, NULL);
614 #endif /* CONFIG_NF_CONNTRACK_TIMEOUT */
/* Register the module's load and unload entry points. */
618 module_init(cttimeout_init);
619 module_exit(cttimeout_exit);