2013-08-19 22:23:34 +04:00
/*
* Copyright ( c ) 2013 Nicira , Inc .
* Copyright ( c ) 2013 Cisco Systems , Inc .
*
* This program is free software ; you can redistribute it and / or
* modify it under the terms of version 2 of the GNU General Public
* License as published by the Free Software Foundation .
*
* This program is distributed in the hope that it will be useful , but
* WITHOUT ANY WARRANTY ; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the GNU
* General Public License for more details .
*
* You should have received a copy of the GNU General Public License
* along with this program ; if not , write to the Free Software
* Foundation , Inc . , 51 Franklin Street , Fifth Floor , Boston , MA
* 02110 - 1301 , USA
*/
# define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
# include <linux/in.h>
# include <linux/ip.h>
# include <linux/net.h>
# include <linux/rculist.h>
# include <linux/udp.h>
# include <net/icmp.h>
# include <net/ip.h>
# include <net/udp.h>
# include <net/ip_tunnels.h>
# include <net/rtnetlink.h>
# include <net/route.h>
# include <net/dsfield.h>
# include <net/inet_ecn.h>
# include <net/net_namespace.h>
# include <net/netns/generic.h>
# include <net/vxlan.h>
# include "datapath.h"
# include "vport.h"
/**
* struct vxlan_port - Keeps track of open UDP ports
* @ vs : vxlan_sock created for the port .
* @ name : vport name .
*/
struct vxlan_port {
struct vxlan_sock * vs ;
char name [ IFNAMSIZ ] ;
} ;
static inline struct vxlan_port * vxlan_vport ( const struct vport * vport )
{
return vport_priv ( vport ) ;
}
/* Called with rcu_read_lock and BH disabled. */
static void vxlan_rcv ( struct vxlan_sock * vs , struct sk_buff * skb , __be32 vx_vni )
{
struct ovs_key_ipv4_tunnel tun_key ;
struct vport * vport = vs - > data ;
struct iphdr * iph ;
__be64 key ;
/* Save outer tunnel values */
iph = ip_hdr ( skb ) ;
key = cpu_to_be64 ( ntohl ( vx_vni ) > > 8 ) ;
ovs_flow_tun_key_init ( & tun_key , iph , key , TUNNEL_KEY ) ;
ovs_vport_receive ( vport , skb , & tun_key ) ;
}
static int vxlan_get_options ( const struct vport * vport , struct sk_buff * skb )
{
struct vxlan_port * vxlan_port = vxlan_vport ( vport ) ;
__be16 dst_port = inet_sk ( vxlan_port - > vs - > sock - > sk ) - > inet_sport ;
if ( nla_put_u16 ( skb , OVS_TUNNEL_ATTR_DST_PORT , ntohs ( dst_port ) ) )
return - EMSGSIZE ;
return 0 ;
}
static void vxlan_tnl_destroy ( struct vport * vport )
{
struct vxlan_port * vxlan_port = vxlan_vport ( vport ) ;
vxlan_sock_release ( vxlan_port - > vs ) ;
ovs_vport_deferred_free ( vport ) ;
}
static struct vport * vxlan_tnl_create ( const struct vport_parms * parms )
{
struct net * net = ovs_dp_get_net ( parms - > dp ) ;
struct nlattr * options = parms - > options ;
struct vxlan_port * vxlan_port ;
struct vxlan_sock * vs ;
struct vport * vport ;
struct nlattr * a ;
u16 dst_port ;
int err ;
if ( ! options ) {
err = - EINVAL ;
goto error ;
}
a = nla_find_nested ( options , OVS_TUNNEL_ATTR_DST_PORT ) ;
if ( a & & nla_len ( a ) = = sizeof ( u16 ) ) {
dst_port = nla_get_u16 ( a ) ;
} else {
/* Require destination port from userspace. */
err = - EINVAL ;
goto error ;
}
vport = ovs_vport_alloc ( sizeof ( struct vxlan_port ) ,
& ovs_vxlan_vport_ops , parms ) ;
if ( IS_ERR ( vport ) )
return vport ;
vxlan_port = vxlan_vport ( vport ) ;
strncpy ( vxlan_port - > name , parms - > name , IFNAMSIZ ) ;
2013-08-31 09:44:33 +04:00
vs = vxlan_sock_add ( net , htons ( dst_port ) , vxlan_rcv , vport , true , false ) ;
2013-08-19 22:23:34 +04:00
if ( IS_ERR ( vs ) ) {
ovs_vport_free ( vport ) ;
return ( void * ) vs ;
}
vxlan_port - > vs = vs ;
return vport ;
error :
return ERR_PTR ( err ) ;
}
static int vxlan_tnl_send ( struct vport * vport , struct sk_buff * skb )
{
struct net * net = ovs_dp_get_net ( vport - > dp ) ;
struct vxlan_port * vxlan_port = vxlan_vport ( vport ) ;
__be16 dst_port = inet_sk ( vxlan_port - > vs - > sock - > sk ) - > inet_sport ;
struct rtable * rt ;
struct flowi4 fl ;
__be16 src_port ;
int port_min ;
int port_max ;
__be16 df ;
int err ;
if ( unlikely ( ! OVS_CB ( skb ) - > tun_key ) ) {
err = - EINVAL ;
goto error ;
}
/* Route lookup */
memset ( & fl , 0 , sizeof ( fl ) ) ;
fl . daddr = OVS_CB ( skb ) - > tun_key - > ipv4_dst ;
fl . saddr = OVS_CB ( skb ) - > tun_key - > ipv4_src ;
fl . flowi4_tos = RT_TOS ( OVS_CB ( skb ) - > tun_key - > ipv4_tos ) ;
fl . flowi4_mark = skb - > mark ;
fl . flowi4_proto = IPPROTO_UDP ;
rt = ip_route_output_key ( net , & fl ) ;
if ( IS_ERR ( rt ) ) {
err = PTR_ERR ( rt ) ;
goto error ;
}
df = OVS_CB ( skb ) - > tun_key - > tun_flags & TUNNEL_DONT_FRAGMENT ?
htons ( IP_DF ) : 0 ;
skb - > local_df = 1 ;
2013-09-29 01:10:59 +04:00
inet_get_local_port_range ( net , & port_min , & port_max ) ;
2013-08-19 22:23:34 +04:00
src_port = vxlan_src_port ( port_min , port_max , skb ) ;
2013-09-02 17:34:55 +04:00
err = vxlan_xmit_skb ( vxlan_port - > vs , rt , skb ,
2013-08-19 22:23:34 +04:00
fl . saddr , OVS_CB ( skb ) - > tun_key - > ipv4_dst ,
OVS_CB ( skb ) - > tun_key - > ipv4_tos ,
OVS_CB ( skb ) - > tun_key - > ipv4_ttl , df ,
src_port , dst_port ,
htonl ( be64_to_cpu ( OVS_CB ( skb ) - > tun_key - > tun_id ) < < 8 ) ) ;
if ( err < 0 )
ip_rt_put ( rt ) ;
error :
return err ;
}
static const char * vxlan_get_name ( const struct vport * vport )
{
struct vxlan_port * vxlan_port = vxlan_vport ( vport ) ;
return vxlan_port - > name ;
}
const struct vport_ops ovs_vxlan_vport_ops = {
. type = OVS_VPORT_TYPE_VXLAN ,
. create = vxlan_tnl_create ,
. destroy = vxlan_tnl_destroy ,
. get_name = vxlan_get_name ,
. get_options = vxlan_get_options ,
. send = vxlan_tnl_send ,
} ;