efb9a8c28c
netns list (just list) is under RTNL. But helper and proto unregistration happen during rmmod when RTNL is not held, and that's how it was tested: modprobe/rmmod vs clone(CLONE_NEWNET)/exit. BUG: unable to handle kernel paging request at 0000000000100100 <=== IP: [<ffffffffa009890f>] nf_conntrack_l4proto_unregister+0x96/0xae [nf_conntrack] PGD 15e300067 PUD 15e1d8067 PMD 0 Oops: 0000 [#1] PREEMPT SMP DEBUG_PAGEALLOC last sysfs file: /sys/kernel/uevent_seqnum CPU 0 Modules linked in: nf_conntrack_proto_sctp(-) nf_conntrack_proto_dccp(-) af_packet iptable_nat nf_nat nf_conntrack_ipv4 nf_conntrack nf_defrag_ipv4 iptable_filter ip_tables xt_tcpudp ip6table_filter ip6_tables x_tables ipv6 sr_mod cdrom [last unloaded: nf_conntrack_proto_sctp] Pid: 16758, comm: rmmod Not tainted 2.6.28-rc2-netns-xfrm #3 RIP: 0010:[<ffffffffa009890f>] [<ffffffffa009890f>] nf_conntrack_l4proto_unregister+0x96/0xae [nf_conntrack] RSP: 0018:ffff88015dc1fec8 EFLAGS: 00010212 RAX: 0000000000000000 RBX: 00000000001000f8 RCX: 0000000000000000 RDX: ffffffffa009575c RSI: 0000000000000003 RDI: ffffffffa00956b5 RBP: ffff88015dc1fed8 R08: 0000000000000002 R09: 0000000000000000 R10: 0000000000000000 R11: ffff88015dc1fe48 R12: ffffffffa0458f60 R13: 0000000000000880 R14: 00007fff4c361d30 R15: 0000000000000880 FS: 00007f624435a6f0(0000) GS:ffffffff80521580(0000) knlGS:0000000000000000 CS: 0010 DS: 0000 ES: 0000 CR0: 000000008005003b CR2: 0000000000100100 CR3: 0000000168969000 CR4: 00000000000006e0 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000 DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400 Process rmmod (pid: 16758, threadinfo ffff88015dc1e000, task ffff880179864218) Stack: ffffffffa0459100 0000000000000000 ffff88015dc1fee8 ffffffffa0457934 ffff88015dc1ff78 ffffffff80253fef 746e6e6f635f666e 6f72705f6b636172 00707463735f6f74 ffffffff8024cb30 00000000023b8010 0000000000000000 Call Trace: [<ffffffffa0457934>] nf_conntrack_proto_sctp_fini+0x10/0x1e 
[nf_conntrack_proto_sctp] [<ffffffff80253fef>] sys_delete_module+0x19f/0x1fe [<ffffffff8024cb30>] ? trace_hardirqs_on_caller+0xf0/0x114 [<ffffffff803ea9b2>] ? trace_hardirqs_on_thunk+0x3a/0x3f [<ffffffff8020b52b>] system_call_fastpath+0x16/0x1b Code: 13 35 e0 e8 c4 6c 1a e0 48 8b 1d 6d c6 46 e0 eb 16 48 89 df 4c 89 e2 48 c7 c6 fc 85 09 a0 e8 61 cd ff ff 48 8b 5b 08 48 83 eb 08 <48> 8b 43 08 0f 18 08 48 8d 43 08 48 3d 60 4f 50 80 75 d3 5b 41 RIP [<ffffffffa009890f>] nf_conntrack_l4proto_unregister+0x96/0xae [nf_conntrack] RSP <ffff88015dc1fec8> CR2: 0000000000100100 ---[ end trace bde8ac82debf7192 ]--- Signed-off-by: Alexey Dobriyan <adobriyan@gmail.com> Signed-off-by: Patrick McHardy <kaber@trash.net> Signed-off-by: David S. Miller <davem@davemloft.net>
371 lines
9.2 KiB
C
371 lines
9.2 KiB
C
/* L3/L4 protocol support for nf_conntrack. */
|
|
|
|
/* (C) 1999-2001 Paul `Rusty' Russell
|
|
* (C) 2002-2006 Netfilter Core Team <coreteam@netfilter.org>
|
|
* (C) 2003,2004 USAGI/WIDE Project <http://www.linux-ipv6.org>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License version 2 as
|
|
* published by the Free Software Foundation.
|
|
*/
|
|
|
|
#include <linux/types.h>
|
|
#include <linux/netfilter.h>
|
|
#include <linux/module.h>
|
|
#include <linux/mutex.h>
|
|
#include <linux/skbuff.h>
|
|
#include <linux/vmalloc.h>
|
|
#include <linux/stddef.h>
|
|
#include <linux/err.h>
|
|
#include <linux/percpu.h>
|
|
#include <linux/moduleparam.h>
|
|
#include <linux/notifier.h>
|
|
#include <linux/kernel.h>
|
|
#include <linux/netdevice.h>
|
|
#include <linux/rtnetlink.h>
|
|
|
|
#include <net/netfilter/nf_conntrack.h>
|
|
#include <net/netfilter/nf_conntrack_l3proto.h>
|
|
#include <net/netfilter/nf_conntrack_l4proto.h>
|
|
#include <net/netfilter/nf_conntrack_core.h>
|
|
|
|
/*
 * L4 protocol trackers, indexed as nf_ct_protos[l3proto][l4proto].
 * The per-l3proto row is allocated by nf_conntrack_l4proto_register() the
 * first time an L4 tracker is registered for that family, with every slot
 * initially pointing at nf_conntrack_l4proto_generic.  Rows are released
 * in nf_conntrack_proto_fini().
 */
static struct nf_conntrack_l4proto **nf_ct_protos[PF_MAX] __read_mostly;
|
|
/*
 * L3 protocol trackers, indexed by l3proto number.
 * nf_conntrack_proto_init() points every slot at
 * nf_conntrack_l3proto_generic; the register/unregister functions swap
 * individual slots with rcu_assign_pointer().
 */
struct nf_conntrack_l3proto *nf_ct_l3protos[AF_MAX] __read_mostly;
|
|
EXPORT_SYMBOL_GPL(nf_ct_l3protos);
|
|
|
|
/*
 * Held by the l3proto/l4proto register and unregister functions while
 * they update the protocol tables and the matching sysctl registrations.
 */
static DEFINE_MUTEX(nf_ct_proto_mutex);
|
|
|
|
#ifdef CONFIG_SYSCTL
|
|
static int
|
|
nf_ct_register_sysctl(struct ctl_table_header **header, struct ctl_path *path,
|
|
struct ctl_table *table, unsigned int *users)
|
|
{
|
|
if (*header == NULL) {
|
|
*header = register_sysctl_paths(path, table);
|
|
if (*header == NULL)
|
|
return -ENOMEM;
|
|
}
|
|
if (users != NULL)
|
|
(*users)++;
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
nf_ct_unregister_sysctl(struct ctl_table_header **header,
|
|
struct ctl_table *table, unsigned int *users)
|
|
{
|
|
if (users != NULL && --*users > 0)
|
|
return;
|
|
|
|
unregister_sysctl_table(*header);
|
|
*header = NULL;
|
|
}
|
|
#endif
|
|
|
|
struct nf_conntrack_l4proto *
|
|
__nf_ct_l4proto_find(u_int16_t l3proto, u_int8_t l4proto)
|
|
{
|
|
if (unlikely(l3proto >= AF_MAX || nf_ct_protos[l3proto] == NULL))
|
|
return &nf_conntrack_l4proto_generic;
|
|
|
|
return rcu_dereference(nf_ct_protos[l3proto][l4proto]);
|
|
}
|
|
EXPORT_SYMBOL_GPL(__nf_ct_l4proto_find);
|
|
|
|
/* this is guaranteed to always return a valid protocol helper, since
|
|
* it falls back to generic_protocol */
|
|
struct nf_conntrack_l4proto *
|
|
nf_ct_l4proto_find_get(u_int16_t l3proto, u_int8_t l4proto)
|
|
{
|
|
struct nf_conntrack_l4proto *p;
|
|
|
|
rcu_read_lock();
|
|
p = __nf_ct_l4proto_find(l3proto, l4proto);
|
|
if (!try_module_get(p->me))
|
|
p = &nf_conntrack_l4proto_generic;
|
|
rcu_read_unlock();
|
|
|
|
return p;
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_ct_l4proto_find_get);
|
|
|
|
void nf_ct_l4proto_put(struct nf_conntrack_l4proto *p)
|
|
{
|
|
module_put(p->me);
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_ct_l4proto_put);
|
|
|
|
struct nf_conntrack_l3proto *
|
|
nf_ct_l3proto_find_get(u_int16_t l3proto)
|
|
{
|
|
struct nf_conntrack_l3proto *p;
|
|
|
|
rcu_read_lock();
|
|
p = __nf_ct_l3proto_find(l3proto);
|
|
if (!try_module_get(p->me))
|
|
p = &nf_conntrack_l3proto_generic;
|
|
rcu_read_unlock();
|
|
|
|
return p;
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_ct_l3proto_find_get);
|
|
|
|
void nf_ct_l3proto_put(struct nf_conntrack_l3proto *p)
|
|
{
|
|
module_put(p->me);
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_ct_l3proto_put);
|
|
|
|
int
|
|
nf_ct_l3proto_try_module_get(unsigned short l3proto)
|
|
{
|
|
int ret;
|
|
struct nf_conntrack_l3proto *p;
|
|
|
|
retry: p = nf_ct_l3proto_find_get(l3proto);
|
|
if (p == &nf_conntrack_l3proto_generic) {
|
|
ret = request_module("nf_conntrack-%d", l3proto);
|
|
if (!ret)
|
|
goto retry;
|
|
|
|
return -EPROTOTYPE;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_ct_l3proto_try_module_get);
|
|
|
|
void nf_ct_l3proto_module_put(unsigned short l3proto)
|
|
{
|
|
struct nf_conntrack_l3proto *p;
|
|
|
|
/* rcu_read_lock not necessary since the caller holds a reference */
|
|
p = __nf_ct_l3proto_find(l3proto);
|
|
module_put(p->me);
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_ct_l3proto_module_put);
|
|
|
|
static int kill_l3proto(struct nf_conn *i, void *data)
|
|
{
|
|
return nf_ct_l3num(i) == ((struct nf_conntrack_l3proto *)data)->l3proto;
|
|
}
|
|
|
|
static int kill_l4proto(struct nf_conn *i, void *data)
|
|
{
|
|
struct nf_conntrack_l4proto *l4proto;
|
|
l4proto = (struct nf_conntrack_l4proto *)data;
|
|
return nf_ct_protonum(i) == l4proto->l4proto &&
|
|
nf_ct_l3num(i) == l4proto->l3proto;
|
|
}
|
|
|
|
/*
 * Register the sysctl table of an L3 tracker, if it has one.
 * Without CONFIG_SYSCTL, or when ctl_table is NULL, this is a no-op
 * returning 0; otherwise the result of nf_ct_register_sysctl() is
 * returned.
 */
static int nf_ct_l3proto_register_sysctl(struct nf_conntrack_l3proto *l3proto)
{
#ifdef CONFIG_SYSCTL
	if (l3proto->ctl_table == NULL)
		return 0;

	return nf_ct_register_sysctl(&l3proto->ctl_table_header,
				     l3proto->ctl_table_path,
				     l3proto->ctl_table, NULL);
#else
	return 0;
#endif
}
|
|
|
|
/*
 * Unregister the sysctl table of an L3 tracker if one is currently
 * registered (ctl_table_header is non-NULL).  No-op without CONFIG_SYSCTL.
 */
static void nf_ct_l3proto_unregister_sysctl(struct nf_conntrack_l3proto *l3proto)
{
#ifdef CONFIG_SYSCTL
	if (l3proto->ctl_table_header == NULL)
		return;

	nf_ct_unregister_sysctl(&l3proto->ctl_table_header,
				l3proto->ctl_table, NULL);
#endif
}
|
|
|
|
int nf_conntrack_l3proto_register(struct nf_conntrack_l3proto *proto)
|
|
{
|
|
int ret = 0;
|
|
|
|
if (proto->l3proto >= AF_MAX)
|
|
return -EBUSY;
|
|
|
|
mutex_lock(&nf_ct_proto_mutex);
|
|
if (nf_ct_l3protos[proto->l3proto] != &nf_conntrack_l3proto_generic) {
|
|
ret = -EBUSY;
|
|
goto out_unlock;
|
|
}
|
|
|
|
ret = nf_ct_l3proto_register_sysctl(proto);
|
|
if (ret < 0)
|
|
goto out_unlock;
|
|
|
|
rcu_assign_pointer(nf_ct_l3protos[proto->l3proto], proto);
|
|
|
|
out_unlock:
|
|
mutex_unlock(&nf_ct_proto_mutex);
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_conntrack_l3proto_register);
|
|
|
|
void nf_conntrack_l3proto_unregister(struct nf_conntrack_l3proto *proto)
|
|
{
|
|
struct net *net;
|
|
|
|
BUG_ON(proto->l3proto >= AF_MAX);
|
|
|
|
mutex_lock(&nf_ct_proto_mutex);
|
|
BUG_ON(nf_ct_l3protos[proto->l3proto] != proto);
|
|
rcu_assign_pointer(nf_ct_l3protos[proto->l3proto],
|
|
&nf_conntrack_l3proto_generic);
|
|
nf_ct_l3proto_unregister_sysctl(proto);
|
|
mutex_unlock(&nf_ct_proto_mutex);
|
|
|
|
synchronize_rcu();
|
|
|
|
/* Remove all contrack entries for this protocol */
|
|
rtnl_lock();
|
|
for_each_net(net)
|
|
nf_ct_iterate_cleanup(net, kill_l3proto, proto);
|
|
rtnl_unlock();
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_conntrack_l3proto_unregister);
|
|
|
|
/*
 * Register the sysctl tables of an L4 tracker.
 *
 * The main table (ctl_table) is registered under
 * nf_net_netfilter_sysctl_path and counted through ctl_table_users.  With
 * CONFIG_NF_CONNTRACK_PROC_COMPAT the compat table is additionally
 * registered under nf_net_ipv4_netfilter_sysctl_path.
 *
 * Returns 0 on success (or when there is nothing to register), otherwise
 * the negative error from nf_ct_register_sysctl().  If the compat
 * registration fails, the main-table registration made by this call is
 * undone before returning.
 */
static int nf_ct_l4proto_register_sysctl(struct nf_conntrack_l4proto *l4proto)
{
	int err = 0;

#ifdef CONFIG_SYSCTL
	if (l4proto->ctl_table != NULL) {
		err = nf_ct_register_sysctl(l4proto->ctl_table_header,
					    nf_net_netfilter_sysctl_path,
					    l4proto->ctl_table,
					    l4proto->ctl_table_users);
		if (err < 0)
			goto out;
	}
#ifdef CONFIG_NF_CONNTRACK_PROC_COMPAT
	if (l4proto->ctl_compat_table != NULL) {
		err = nf_ct_register_sysctl(&l4proto->ctl_compat_table_header,
					    nf_net_ipv4_netfilter_sysctl_path,
					    l4proto->ctl_compat_table, NULL);
		if (err == 0)
			goto out;
		/*
		 * Roll back only what this call registered.  Without a main
		 * table nothing was registered above, and ctl_table_header
		 * must not be dereferenced or have a user dropped from it.
		 */
		if (l4proto->ctl_table != NULL)
			nf_ct_unregister_sysctl(l4proto->ctl_table_header,
						l4proto->ctl_table,
						l4proto->ctl_table_users);
	}
#endif /* CONFIG_NF_CONNTRACK_PROC_COMPAT */
out:
#endif /* CONFIG_SYSCTL */
	return err;
}
|
|
|
|
/*
 * Undo nf_ct_l4proto_register_sysctl(): release the main sysctl table if
 * the tracker has a header slot with a live registration in it, and (with
 * CONFIG_NF_CONNTRACK_PROC_COMPAT) the compat table if it is registered.
 * No-op without CONFIG_SYSCTL.
 */
static void nf_ct_l4proto_unregister_sysctl(struct nf_conntrack_l4proto *l4proto)
{
#ifdef CONFIG_SYSCTL
	struct ctl_table_header **hdr = l4proto->ctl_table_header;

	if (hdr != NULL && *hdr != NULL)
		nf_ct_unregister_sysctl(hdr, l4proto->ctl_table,
					l4proto->ctl_table_users);
#ifdef CONFIG_NF_CONNTRACK_PROC_COMPAT
	if (l4proto->ctl_compat_table_header != NULL)
		nf_ct_unregister_sysctl(&l4proto->ctl_compat_table_header,
					l4proto->ctl_compat_table, NULL);
#endif /* CONFIG_NF_CONNTRACK_PROC_COMPAT */
#endif /* CONFIG_SYSCTL */
}
|
|
|
|
/* FIXME: Allow NULL functions and sub in pointers to generic for
|
|
them. --RR */
|
|
int nf_conntrack_l4proto_register(struct nf_conntrack_l4proto *l4proto)
|
|
{
|
|
int ret = 0;
|
|
|
|
if (l4proto->l3proto >= PF_MAX)
|
|
return -EBUSY;
|
|
|
|
mutex_lock(&nf_ct_proto_mutex);
|
|
if (!nf_ct_protos[l4proto->l3proto]) {
|
|
/* l3proto may be loaded latter. */
|
|
struct nf_conntrack_l4proto **proto_array;
|
|
int i;
|
|
|
|
proto_array = kmalloc(MAX_NF_CT_PROTO *
|
|
sizeof(struct nf_conntrack_l4proto *),
|
|
GFP_KERNEL);
|
|
if (proto_array == NULL) {
|
|
ret = -ENOMEM;
|
|
goto out_unlock;
|
|
}
|
|
|
|
for (i = 0; i < MAX_NF_CT_PROTO; i++)
|
|
proto_array[i] = &nf_conntrack_l4proto_generic;
|
|
nf_ct_protos[l4proto->l3proto] = proto_array;
|
|
} else if (nf_ct_protos[l4proto->l3proto][l4proto->l4proto] !=
|
|
&nf_conntrack_l4proto_generic) {
|
|
ret = -EBUSY;
|
|
goto out_unlock;
|
|
}
|
|
|
|
ret = nf_ct_l4proto_register_sysctl(l4proto);
|
|
if (ret < 0)
|
|
goto out_unlock;
|
|
|
|
rcu_assign_pointer(nf_ct_protos[l4proto->l3proto][l4proto->l4proto],
|
|
l4proto);
|
|
|
|
out_unlock:
|
|
mutex_unlock(&nf_ct_proto_mutex);
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_conntrack_l4proto_register);
|
|
|
|
void nf_conntrack_l4proto_unregister(struct nf_conntrack_l4proto *l4proto)
|
|
{
|
|
struct net *net;
|
|
|
|
BUG_ON(l4proto->l3proto >= PF_MAX);
|
|
|
|
mutex_lock(&nf_ct_proto_mutex);
|
|
BUG_ON(nf_ct_protos[l4proto->l3proto][l4proto->l4proto] != l4proto);
|
|
rcu_assign_pointer(nf_ct_protos[l4proto->l3proto][l4proto->l4proto],
|
|
&nf_conntrack_l4proto_generic);
|
|
nf_ct_l4proto_unregister_sysctl(l4proto);
|
|
mutex_unlock(&nf_ct_proto_mutex);
|
|
|
|
synchronize_rcu();
|
|
|
|
/* Remove all contrack entries for this protocol */
|
|
rtnl_lock();
|
|
for_each_net(net)
|
|
nf_ct_iterate_cleanup(net, kill_l4proto, l4proto);
|
|
rtnl_unlock();
|
|
}
|
|
EXPORT_SYMBOL_GPL(nf_conntrack_l4proto_unregister);
|
|
|
|
int nf_conntrack_proto_init(void)
|
|
{
|
|
unsigned int i;
|
|
int err;
|
|
|
|
err = nf_ct_l4proto_register_sysctl(&nf_conntrack_l4proto_generic);
|
|
if (err < 0)
|
|
return err;
|
|
|
|
for (i = 0; i < AF_MAX; i++)
|
|
rcu_assign_pointer(nf_ct_l3protos[i],
|
|
&nf_conntrack_l3proto_generic);
|
|
return 0;
|
|
}
|
|
|
|
void nf_conntrack_proto_fini(void)
|
|
{
|
|
unsigned int i;
|
|
|
|
nf_ct_l4proto_unregister_sysctl(&nf_conntrack_l4proto_generic);
|
|
|
|
/* free l3proto protocol tables */
|
|
for (i = 0; i < PF_MAX; i++)
|
|
kfree(nf_ct_protos[i]);
|
|
}
|