2007-09-12 13:50:50 +04:00
/*
* Operations on the network namespace
*/
# ifndef __NET_NET_NAMESPACE_H
# define __NET_NET_NAMESPACE_H
2011-07-27 03:09:06 +04:00
# include <linux/atomic.h>
2017-06-30 13:08:08 +03:00
# include <linux/refcount.h>
2007-09-12 13:50:50 +04:00
# include <linux/workqueue.h>
# include <linux/list.h>
2011-05-27 00:40:37 +04:00
# include <linux/sysctl.h>
2007-09-12 13:50:50 +04:00
ipv4, fib: pass LOOPBACK_IFINDEX instead of 0 to flowi4_iif
As suggested by Julian:
Simply, flowi4_iif must not contain 0, it does not
look logical to ignore all ip rules with specified iif.
because in fib_rule_match() we do:
if (rule->iifindex && (rule->iifindex != fl->flowi_iif))
goto out;
flowi4_iif should be LOOPBACK_IFINDEX by default.
We need to move LOOPBACK_IFINDEX to include/net/flow.h:
1) It is mostly used by flowi_iif
2) Fix the following compile error if we use it in flow.h
by the patches latter:
In file included from include/linux/netfilter.h:277:0,
from include/net/netns/netfilter.h:5,
from include/net/net_namespace.h:21,
from include/linux/netdevice.h:43,
from include/linux/icmpv6.h:12,
from include/linux/ipv6.h:61,
from include/net/ipv6.h:16,
from include/linux/sunrpc/clnt.h:27,
from include/linux/nfs_fs.h:30,
from init/do_mounts.c:32:
include/net/flow.h: In function ‘flowi4_init_output’:
include/net/flow.h:84:32: error: ‘LOOPBACK_IFINDEX’ undeclared (first use in this function)
Cc: Eric Biederman <ebiederm@xmission.com>
Cc: Julian Anastasov <ja@ssi.bg>
Cc: David S. Miller <davem@davemloft.net>
Signed-off-by: Cong Wang <xiyou.wangcong@gmail.com>
Signed-off-by: Cong Wang <cwang@twopensource.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2014-04-16 03:25:34 +04:00
# include <net/flow.h>
2008-04-01 06:41:14 +04:00
# include <net/netns/core.h>
2008-07-18 15:01:24 +04:00
# include <net/netns/mib.h>
2007-12-11 15:19:17 +03:00
# include <net/netns/unix.h>
2007-12-11 15:19:54 +03:00
# include <net/netns/packet.h>
2007-12-17 00:29:36 +03:00
# include <net/netns/ipv4.h>
2008-01-10 13:49:06 +03:00
# include <net/netns/ipv6.h>
2014-02-28 10:32:49 +04:00
# include <net/netns/ieee802154_6lowpan.h>
2012-08-06 12:42:04 +04:00
# include <net/netns/sctp.h>
2008-04-14 09:28:42 +04:00
# include <net/netns/dccp.h>
2013-03-25 03:50:39 +04:00
# include <net/netns/netfilter.h>
2008-01-31 15:02:13 +03:00
# include <net/netns/x_tables.h>
2008-10-08 13:35:02 +04:00
# if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
# include <net/netns/conntrack.h>
# endif
2013-10-11 01:28:33 +04:00
# include <net/netns/nftables.h>
2008-11-26 04:14:31 +03:00
# include <net/netns/xfrm.h>
2015-03-04 04:10:47 +03:00
# include <net/netns/mpls.h>
2017-02-21 14:19:47 +03:00
# include <net/netns/can.h>
2014-11-01 05:56:04 +03:00
# include <linux/ns_common.h>
2015-06-17 18:28:25 +03:00
# include <linux/idr.h>
# include <linux/skbuff.h>
2007-12-11 15:19:17 +03:00
2012-06-14 13:31:10 +04:00
struct user_namespace ;
2007-09-12 14:01:34 +04:00
struct proc_dir_entry ;
2007-09-27 09:10:56 +04:00
struct net_device ;
2007-11-20 09:26:51 +03:00
struct sock ;
2007-12-01 15:51:01 +03:00
struct ctl_table_header ;
2008-04-15 11:36:08 +04:00
struct net_generic ;
2009-07-10 13:51:34 +04:00
struct sock ;
2011-03-04 13:18:07 +03:00
struct netns_ipvs ;
2007-12-01 15:51:01 +03:00
2009-10-24 17:13:17 +04:00
# define NETDEV_HASHBITS 8
# define NETDEV_HASHENTRIES (1 << NETDEV_HASHBITS)
2007-09-12 13:50:50 +04:00
struct net {
2017-06-30 13:08:08 +03:00
refcount_t passive ; /* To decided when the network
2011-06-09 05:13:01 +04:00
* namespace should be freed .
*/
2007-09-12 13:50:50 +04:00
atomic_t count ; /* To decided when the network
2011-06-09 05:13:01 +04:00
* namespace should be shut down .
2007-09-12 13:50:50 +04:00
*/
2010-10-14 09:56:18 +04:00
spinlock_t rules_mod_lock ;
2015-03-12 04:53:14 +03:00
atomic64_t cookie_gen ;
2007-09-12 13:50:50 +04:00
struct list_head list ; /* list of network namespaces */
2009-11-30 01:25:27 +03:00
struct list_head cleanup_list ; /* namespaces on death row */
2009-12-03 05:29:03 +03:00
struct list_head exit_list ; /* Use only net_mutex */
2007-09-12 14:01:34 +04:00
2012-06-14 13:31:10 +04:00
struct user_namespace * user_ns ; /* Owning user namespace */
2016-08-08 22:33:23 +03:00
struct ucounts * ucounts ;
2015-05-16 00:47:32 +03:00
spinlock_t nsid_lock ;
2015-01-15 17:11:15 +03:00
struct idr netns_ids ;
2012-06-14 13:31:10 +04:00
2014-11-01 05:56:04 +03:00
struct ns_common ns ;
2011-06-15 21:21:48 +04:00
2007-09-12 14:01:34 +04:00
struct proc_dir_entry * proc_net ;
struct proc_dir_entry * proc_net_stat ;
2007-09-17 22:56:21 +04:00
2008-07-15 05:22:20 +04:00
# ifdef CONFIG_SYSCTL
struct ctl_table_set sysctls ;
# endif
2007-11-30 15:55:42 +03:00
2010-10-14 09:56:18 +04:00
struct sock * rtnl ; /* rtnetlink socket */
struct sock * genl_sock ;
2007-09-27 09:10:56 +04:00
2007-09-17 22:56:21 +04:00
struct list_head dev_base_head ;
struct hlist_head * dev_name_head ;
struct hlist_head * dev_index_head ;
2011-06-21 07:11:20 +04:00
unsigned int dev_base_seq ; /* protected by rtnl_mutex */
2012-08-09 01:53:19 +04:00
int ifindex ;
2013-09-24 08:19:49 +04:00
unsigned int dev_unreg_count ;
2007-11-20 09:26:51 +03:00
2008-01-10 14:20:28 +03:00
/* core fib_rules */
struct list_head rules_ops ;
2017-08-03 14:28:11 +03:00
struct list_head fib_notifier_ops ; /* protected by net_mutex */
2007-11-20 09:28:35 +03:00
2010-10-14 09:56:18 +04:00
struct net_device * loopback_dev ; /* The loopback */
2008-04-01 06:41:14 +04:00
struct netns_core core ;
2008-07-18 15:01:24 +04:00
struct netns_mib mib ;
2007-12-11 15:19:54 +03:00
struct netns_packet packet ;
2007-12-11 15:19:17 +03:00
struct netns_unix unx ;
2007-12-17 00:29:36 +03:00
struct netns_ipv4 ipv4 ;
2011-12-10 13:48:31 +04:00
# if IS_ENABLED(CONFIG_IPV6)
2008-01-10 13:49:06 +03:00
struct netns_ipv6 ipv6 ;
# endif
2014-02-28 10:32:49 +04:00
# if IS_ENABLED(CONFIG_IEEE802154_6LOWPAN)
struct netns_ieee802154_lowpan ieee802154_lowpan ;
# endif
2012-08-06 12:42:04 +04:00
# if defined(CONFIG_IP_SCTP) || defined(CONFIG_IP_SCTP_MODULE)
struct netns_sctp sctp ;
# endif
2008-04-14 09:28:42 +04:00
# if defined(CONFIG_IP_DCCP) || defined(CONFIG_IP_DCCP_MODULE)
struct netns_dccp dccp ;
# endif
2008-01-31 15:02:13 +03:00
# ifdef CONFIG_NETFILTER
2013-03-25 03:50:39 +04:00
struct netns_nf nf ;
2008-01-31 15:02:13 +03:00
struct netns_xt xt ;
2008-10-08 13:35:02 +04:00
# if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
struct netns_ct ct ;
2012-09-18 20:50:08 +04:00
# endif
2013-10-11 01:28:33 +04:00
# if defined(CONFIG_NF_TABLES) || defined(CONFIG_NF_TABLES_MODULE)
struct netns_nftables nft ;
# endif
2012-09-18 20:50:08 +04:00
# if IS_ENABLED(CONFIG_NF_DEFRAG_IPV6)
struct netns_nf_frag nf_frag ;
2008-10-08 13:35:02 +04:00
# endif
2010-01-13 18:02:14 +03:00
struct sock * nfnl ;
struct sock * nfnl_stash ;
2015-08-05 18:51:45 +03:00
# if IS_ENABLED(CONFIG_NETFILTER_NETLINK_ACCT)
struct list_head nfnl_acct_list ;
# endif
2015-12-09 16:07:40 +03:00
# if IS_ENABLED(CONFIG_NF_CT_NETLINK_TIMEOUT)
struct list_head nfct_timeout_list ;
# endif
2008-11-26 04:14:31 +03:00
# endif
2009-09-30 01:27:28 +04:00
# ifdef CONFIG_WEXT_CORE
2009-06-24 05:34:48 +04:00
struct sk_buff_head wext_nlevents ;
2008-01-31 15:02:13 +03:00
# endif
2010-10-25 07:20:11 +04:00
struct net_generic __rcu * gen ;
2010-10-14 09:56:18 +04:00
/* Note : following structs are cache line aligned */
# ifdef CONFIG_XFRM
struct netns_xfrm xfrm ;
# endif
2013-06-26 12:40:06 +04:00
# if IS_ENABLED(CONFIG_IP_VS)
2011-01-03 16:44:42 +03:00
struct netns_ipvs * ipvs ;
2015-03-04 04:10:47 +03:00
# endif
# if IS_ENABLED(CONFIG_MPLS)
struct netns_mpls mpls ;
2017-02-21 14:19:47 +03:00
# endif
# if IS_ENABLED(CONFIG_CAN)
struct netns_can can ;
2013-06-26 12:40:06 +04:00
# endif
2012-07-16 08:28:49 +04:00
struct sock * diag_nlsk ;
2013-05-28 00:46:33 +04:00
atomic_t fnhe_genid ;
2016-10-28 11:22:25 +03:00
} __randomize_layout ;
2007-09-12 13:50:50 +04:00
2008-04-02 11:10:28 +04:00
# include <linux/seq_file_net.h>
2007-09-13 11:16:29 +04:00
/* Init's network namespace */
2007-09-12 13:50:50 +04:00
extern struct net init_net ;
2008-04-04 00:04:33 +04:00
2012-06-14 13:16:42 +04:00
# ifdef CONFIG_NET_NS
2013-09-21 21:22:48 +04:00
struct net * copy_net_ns ( unsigned long flags , struct user_namespace * user_ns ,
struct net * old_net ) ;
2008-04-02 11:09:29 +04:00
2017-05-30 12:38:12 +03:00
void net_ns_barrier ( void ) ;
2012-06-14 13:16:42 +04:00
# else /* CONFIG_NET_NS */
# include <linux/sched.h>
# include <linux/nsproxy.h>
2012-06-14 13:31:10 +04:00
static inline struct net * copy_net_ns ( unsigned long flags ,
struct user_namespace * user_ns , struct net * old_net )
2007-09-27 09:04:26 +04:00
{
2012-06-14 13:16:42 +04:00
if ( flags & CLONE_NEWNET )
return ERR_PTR ( - EINVAL ) ;
return old_net ;
2007-09-27 09:04:26 +04:00
}
2017-05-30 12:38:12 +03:00
static inline void net_ns_barrier ( void ) { }
2012-06-14 13:16:42 +04:00
# endif /* CONFIG_NET_NS */
2008-04-02 11:09:29 +04:00
extern struct list_head net_namespace_list ;
2007-09-27 09:04:26 +04:00
2013-09-21 21:22:48 +04:00
struct net * get_net_ns_by_pid ( pid_t pid ) ;
2016-11-18 12:41:46 +03:00
struct net * get_net_ns_by_fd ( int fd ) ;
2009-07-10 13:51:35 +04:00
2014-02-09 20:59:14 +04:00
# ifdef CONFIG_SYSCTL
void ipx_register_sysctl ( void ) ;
void ipx_unregister_sysctl ( void ) ;
# else
# define ipx_register_sysctl()
# define ipx_unregister_sysctl()
# endif
2007-11-01 10:43:49 +03:00
# ifdef CONFIG_NET_NS
2013-09-21 21:22:48 +04:00
void __put_net ( struct net * net ) ;
2007-09-12 13:50:50 +04:00
static inline struct net * get_net ( struct net * net )
{
atomic_inc ( & net - > count ) ;
return net ;
}
2007-09-13 11:18:57 +04:00
static inline struct net * maybe_get_net ( struct net * net )
{
/* Used when we know struct net exists but we
* aren ' t guaranteed a previous reference count
* exists . If the reference count is zero this
* function fails and returns NULL .
*/
if ( ! atomic_inc_not_zero ( & net - > count ) )
net = NULL ;
return net ;
}
2007-09-12 13:50:50 +04:00
static inline void put_net ( struct net * net )
{
if ( atomic_dec_and_test ( & net - > count ) )
__put_net ( net ) ;
}
2008-03-25 21:57:35 +03:00
static inline
int net_eq ( const struct net * net1 , const struct net * net2 )
{
return net1 = = net2 ;
}
2011-06-09 05:13:01 +04:00
2013-09-21 21:22:48 +04:00
void net_drop_ns ( void * ) ;
2011-06-09 05:13:01 +04:00
2007-11-01 10:43:49 +03:00
# else
2008-06-21 09:16:51 +04:00
2007-11-01 10:43:49 +03:00
static inline struct net * get_net ( struct net * net )
{
return net ;
}
static inline void put_net ( struct net * net )
{
}
2008-04-16 12:58:04 +04:00
static inline struct net * maybe_get_net ( struct net * net )
{
return net ;
}
static inline
int net_eq ( const struct net * net1 , const struct net * net2 )
{
return 1 ;
}
2011-06-09 05:13:01 +04:00
# define net_drop_ns NULL
2008-04-16 12:58:04 +04:00
# endif
2015-03-12 07:06:44 +03:00
typedef struct {
2008-11-12 11:53:30 +03:00
# ifdef CONFIG_NET_NS
2015-03-12 07:06:44 +03:00
struct net * net ;
# endif
} possible_net_t ;
2008-11-12 11:53:30 +03:00
2015-03-12 07:06:44 +03:00
static inline void write_pnet ( possible_net_t * pnet , struct net * net )
2008-11-12 11:53:30 +03:00
{
2015-03-12 07:06:44 +03:00
# ifdef CONFIG_NET_NS
pnet - > net = net ;
# endif
2008-11-12 11:53:30 +03:00
}
2015-03-12 07:06:44 +03:00
static inline struct net * read_pnet ( const possible_net_t * pnet )
2008-11-12 11:53:30 +03:00
{
2015-03-12 07:06:44 +03:00
# ifdef CONFIG_NET_NS
return pnet - > net ;
2008-11-12 11:53:30 +03:00
# else
2015-03-12 07:06:44 +03:00
return & init_net ;
2008-11-12 11:53:30 +03:00
# endif
2015-03-12 07:06:44 +03:00
}
2008-04-16 12:58:04 +04:00
2007-09-12 13:50:50 +04:00
# define for_each_net(VAR) \
list_for_each_entry ( VAR , & net_namespace_list , list )
2009-07-10 13:51:33 +04:00
# define for_each_net_rcu(VAR) \
list_for_each_entry_rcu ( VAR , & net_namespace_list , list )
2007-10-09 07:38:39 +04:00
# ifdef CONFIG_NET_NS
# define __net_init
# define __net_exit
2007-11-13 14:23:50 +03:00
# define __net_initdata
2012-10-05 04:12:11 +04:00
# define __net_initconst
2007-10-09 07:38:39 +04:00
# else
# define __net_init __init
2016-08-03 00:03:33 +03:00
# define __net_exit __ref
2007-11-13 14:23:50 +03:00
# define __net_initdata __initdata
2012-10-05 04:12:11 +04:00
# define __net_initconst __initconst
2007-10-09 07:38:39 +04:00
# endif
2007-09-12 13:50:50 +04:00
2015-05-07 12:02:49 +03:00
int peernet2id_alloc ( struct net * net , struct net * peer ) ;
2015-05-07 12:02:53 +03:00
int peernet2id ( struct net * net , struct net * peer ) ;
bool peernet_has_id ( struct net * net , struct net * peer ) ;
2015-01-15 17:11:15 +03:00
struct net * get_net_ns_by_id ( struct net * net , int id ) ;
2007-09-12 13:50:50 +04:00
struct pernet_operations {
struct list_head list ;
int ( * init ) ( struct net * net ) ;
void ( * exit ) ( struct net * net ) ;
2009-12-03 05:29:03 +03:00
void ( * exit_batch ) ( struct list_head * net_exit_list ) ;
netns: make struct pernet_operations::id unsigned int
Make struct pernet_operations::id unsigned.
There are 2 reasons to do so:
1)
This field is really an index into an zero based array and
thus is unsigned entity. Using negative value is out-of-bound
access by definition.
2)
On x86_64 unsigned 32-bit data which are mixed with pointers
via array indexing or offsets added or subtracted to pointers
are preffered to signed 32-bit data.
"int" being used as an array index needs to be sign-extended
to 64-bit before being used.
void f(long *p, int i)
{
g(p[i]);
}
roughly translates to
movsx rsi, esi
mov rdi, [rsi+...]
call g
MOVSX is 3 byte instruction which isn't necessary if the variable is
unsigned because x86_64 is zero extending by default.
Now, there is net_generic() function which, you guessed it right, uses
"int" as an array index:
static inline void *net_generic(const struct net *net, int id)
{
...
ptr = ng->ptr[id - 1];
...
}
And this function is used a lot, so those sign extensions add up.
Patch snipes ~1730 bytes on allyesconfig kernel (without all junk
messing with code generation):
add/remove: 0/0 grow/shrink: 70/598 up/down: 396/-2126 (-1730)
Unfortunately some functions actually grow bigger.
This is a semmingly random artefact of code generation with register
allocator being used differently. gcc decides that some variable
needs to live in new r8+ registers and every access now requires REX
prefix. Or it is shifted into r12, so [r12+0] addressing mode has to be
used which is longer than [r8]
However, overall balance is in negative direction:
add/remove: 0/0 grow/shrink: 70/598 up/down: 396/-2126 (-1730)
function old new delta
nfsd4_lock 3886 3959 +73
tipc_link_build_proto_msg 1096 1140 +44
mac80211_hwsim_new_radio 2776 2808 +32
tipc_mon_rcv 1032 1058 +26
svcauth_gss_legacy_init 1413 1429 +16
tipc_bcbase_select_primary 379 392 +13
nfsd4_exchange_id 1247 1260 +13
nfsd4_setclientid_confirm 782 793 +11
...
put_client_renew_locked 494 480 -14
ip_set_sockfn_get 730 716 -14
geneve_sock_add 829 813 -16
nfsd4_sequence_done 721 703 -18
nlmclnt_lookup_host 708 686 -22
nfsd4_lockt 1085 1063 -22
nfs_get_client 1077 1050 -27
tcf_bpf_init 1106 1076 -30
nfsd4_encode_fattr 5997 5930 -67
Total: Before=154856051, After=154854321, chg -0.00%
Signed-off-by: Alexey Dobriyan <adobriyan@gmail.com>
Signed-off-by: David S. Miller <davem@davemloft.net>
2016-11-17 04:58:21 +03:00
unsigned int * id ;
2009-11-30 01:25:28 +03:00
size_t size ;
2007-09-12 13:50:50 +04:00
} ;
2009-02-22 11:11:09 +03:00
/*
* Use these carefully . If you implement a network device and it
* needs per network namespace operations use device pernet operations ,
* otherwise use pernet subsys operations .
*
2009-07-15 10:16:34 +04:00
* Network interfaces need to be removed from a dying netns _before_
* subsys notifiers can be called , as most of the network code cleanup
* ( which is done from subsys notifiers ) runs with the assumption that
* dev_remove_pack has been called so no new packets will arrive during
* and after the cleanup functions have been called . dev_remove_pack
* is not per namespace so instead the guarantee of no more packets
* arriving in a network namespace is provided by ensuring that all
* network devices and all sockets have left the network namespace
* before the cleanup methods are called .
2009-02-22 11:11:09 +03:00
*
* For the longest time the ipv4 icmp code was registered as a pernet
* device which caused kernel oops , and panics during network
* namespace cleanup . So please don ' t get this wrong .
*/
2013-09-21 21:22:48 +04:00
int register_pernet_subsys ( struct pernet_operations * ) ;
void unregister_pernet_subsys ( struct pernet_operations * ) ;
int register_pernet_device ( struct pernet_operations * ) ;
void unregister_pernet_device ( struct pernet_operations * ) ;
2009-11-30 01:25:28 +03:00
2007-11-30 15:55:42 +03:00
struct ctl_table ;
struct ctl_table_header ;
2008-05-20 00:45:33 +04:00
2012-04-19 17:20:32 +04:00
# ifdef CONFIG_SYSCTL
2013-09-21 21:22:48 +04:00
int net_sysctl_init ( void ) ;
struct ctl_table_header * register_net_sysctl ( struct net * net , const char * path ,
struct ctl_table * table ) ;
void unregister_net_sysctl_table ( struct ctl_table_header * header ) ;
2012-04-23 16:13:02 +04:00
# else
static inline int net_sysctl_init ( void ) { return 0 ; }
static inline struct ctl_table_header * register_net_sysctl ( struct net * net ,
const char * path , struct ctl_table * table )
{
return NULL ;
}
static inline void unregister_net_sysctl_table ( struct ctl_table_header * header )
{
}
# endif
2013-07-30 04:33:53 +04:00
static inline int rt_genid_ipv4 ( struct net * net )
2012-09-11 02:09:44 +04:00
{
2013-07-30 04:33:53 +04:00
return atomic_read ( & net - > ipv4 . rt_genid ) ;
2012-09-11 02:09:44 +04:00
}
2013-07-30 04:33:53 +04:00
static inline void rt_genid_bump_ipv4 ( struct net * net )
2012-09-11 02:09:44 +04:00
{
2013-07-30 04:33:53 +04:00
atomic_inc ( & net - > ipv4 . rt_genid ) ;
}
2014-09-28 02:46:06 +04:00
extern void ( * __fib6_flush_trees ) ( struct net * net ) ;
2013-07-30 04:33:53 +04:00
static inline void rt_genid_bump_ipv6 ( struct net * net )
{
2014-09-28 02:46:06 +04:00
if ( __fib6_flush_trees )
__fib6_flush_trees ( net ) ;
2013-07-30 04:33:53 +04:00
}
2014-04-18 05:22:54 +04:00
# if IS_ENABLED(CONFIG_IEEE802154_6LOWPAN)
static inline struct netns_ieee802154_lowpan *
net_ieee802154_lowpan ( struct net * net )
{
return & net - > ieee802154_lowpan ;
}
# endif
2013-07-30 04:33:53 +04:00
/* For callers who don't really care about whether it's IPv4 or IPv6 */
static inline void rt_genid_bump_all ( struct net * net )
{
rt_genid_bump_ipv4 ( net ) ;
rt_genid_bump_ipv6 ( net ) ;
2012-09-11 02:09:44 +04:00
}
2007-11-30 15:55:42 +03:00
2013-05-28 00:46:33 +04:00
static inline int fnhe_genid ( struct net * net )
{
return atomic_read ( & net - > fnhe_genid ) ;
}
static inline void fnhe_genid_bump ( struct net * net )
{
atomic_inc ( & net - > fnhe_genid ) ;
}
2007-09-12 13:50:50 +04:00
# endif /* __NET_NET_NAMESPACE_H */