/*
 * Geneve: Generic Network Virtualization Encapsulation
 *
 * Copyright (c) 2014 Nicira, Inc.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */

#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt

#include <linux/kernel.h>
#include <linux/types.h>
#include <linux/module.h>
#include <linux/errno.h>
#include <linux/err.h>
#include <linux/slab.h>
#include <linux/skbuff.h>
#include <linux/rculist.h>
#include <linux/netdevice.h>
#include <linux/in.h>
#include <linux/ip.h>
#include <linux/udp.h>
#include <linux/igmp.h>
#include <linux/etherdevice.h>
#include <linux/if_ether.h>
#include <linux/if_vlan.h>
#include <linux/hash.h>
#include <linux/ethtool.h>
#include <net/arp.h>
#include <net/ndisc.h>
#include <net/ip.h>
#include <net/ip_tunnels.h>
#include <net/icmp.h>
#include <net/udp.h>
#include <net/rtnetlink.h>
#include <net/route.h>
#include <net/dsfield.h>
#include <net/inet_ecn.h>
#include <net/net_namespace.h>
#include <net/netns/generic.h>
#include <net/geneve.h>
#include <net/protocol.h>
#include <net/sock.h>
#include <net/udp_tunnel.h>
#if IS_ENABLED(CONFIG_IPV6)
#include <net/ipv6.h>
#include <net/addrconf.h>
#include <net/ip6_tunnel.h>
#include <net/ip6_checksum.h>
#endif
520b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 530b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou#define PORT_HASH_BITS 8 540b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou#define PORT_HASH_SIZE (1<<PORT_HASH_BITS) 550b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 560b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou/* per-network namespace private data for this module */ 570b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustruct geneve_net { 580b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct hlist_head sock_list[PORT_HASH_SIZE]; 590b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou spinlock_t sock_lock; /* Protects sock_list */ 600b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou}; 610b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 620b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic int geneve_net_id; 630b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 640b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic struct workqueue_struct *geneve_wq; 650b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 660b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic inline struct genevehdr *geneve_hdr(const struct sk_buff *skb) 670b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 680b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return (struct genevehdr *)(udp_hdr(skb) + 1); 690b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 700b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 710b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic struct hlist_head *gs_head(struct net *net, __be16 port) 720b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 730b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct geneve_net *gn = net_generic(net, geneve_net_id); 740b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 750b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return &gn->sock_list[hash_32(ntohs(port), PORT_HASH_BITS)]; 760b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 770b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 
780b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou/* Find geneve socket based on network namespace and UDP port */ 790b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic struct geneve_sock *geneve_find_sock(struct net *net, __be16 port) 800b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 810b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct geneve_sock *gs; 820b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 830b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou hlist_for_each_entry_rcu(gs, gs_head(net, port), hlist) { 840b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (inet_sk(gs->sock->sk)->inet_sport == port) 850b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return gs; 860b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } 870b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 880b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return NULL; 890b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 900b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 910b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic void geneve_build_header(struct genevehdr *geneveh, 920b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou __be16 tun_flags, u8 vni[3], 930b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou u8 options_len, u8 *options) 940b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 950b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneveh->ver = GENEVE_VER; 960b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneveh->opt_len = options_len / 4; 970b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneveh->oam = !!(tun_flags & TUNNEL_OAM); 980b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneveh->critical = !!(tun_flags & TUNNEL_CRIT_OPT); 990b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneveh->rsvd1 = 0; 1000b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou memcpy(geneveh->vni, vni, 3); 1010b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneveh->proto_type = htons(ETH_P_TEB); 1020b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneveh->rsvd2 = 0; 
1030b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1040b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou memcpy(geneveh->options, options, options_len); 1050b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 1060b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1070b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou/* Transmit a fully formated Geneve frame. 1080b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou * 1090b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou * When calling this function. The skb->data should point 1100b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou * to the geneve header which is fully formed. 1110b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou * 1120b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou * This function will add other UDP tunnel headers. 1130b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou */ 1140b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhouint geneve_xmit_skb(struct geneve_sock *gs, struct rtable *rt, 1150b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct sk_buff *skb, __be32 src, __be32 dst, __u8 tos, 1160b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou __u8 ttl, __be16 df, __be16 src_port, __be16 dst_port, 1170b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou __be16 tun_flags, u8 vni[3], u8 opt_len, u8 *opt, 1180b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou bool xnet) 1190b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 1200b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct genevehdr *gnvh; 1210b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou int min_headroom; 1220b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou int err; 1230b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1240b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou skb = udp_tunnel_handle_offloads(skb, !gs->sock->sk->sk_no_check_tx); 1250b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1260b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou min_headroom = LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len 1270b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 
+ GENEVE_BASE_HLEN + opt_len + sizeof(struct iphdr) 1280b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou + (vlan_tx_tag_present(skb) ? VLAN_HLEN : 0); 1290b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1300b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou err = skb_cow_head(skb, min_headroom); 1310b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (unlikely(err)) 1320b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return err; 1330b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1340b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (vlan_tx_tag_present(skb)) { 1350b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (unlikely(!__vlan_put_tag(skb, 1360b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou skb->vlan_proto, 1370b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou vlan_tx_tag_get(skb)))) { 1380b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou err = -ENOMEM; 1390b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return err; 1400b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } 1410b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou skb->vlan_tci = 0; 1420b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } 1430b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1440b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gnvh = (struct genevehdr *)__skb_push(skb, sizeof(*gnvh) + opt_len); 1450b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneve_build_header(gnvh, tun_flags, vni, opt_len, opt); 1460b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 14745cac46e51da75628ac2a593c70f5144abb9b31dJesse Gross skb_set_inner_protocol(skb, htons(ETH_P_TEB)); 14845cac46e51da75628ac2a593c70f5144abb9b31dJesse Gross 1490b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return udp_tunnel_xmit_skb(gs->sock, rt, skb, src, dst, 1500b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou tos, ttl, df, src_port, dst_port, xnet); 1510b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 1520b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy ZhouEXPORT_SYMBOL_GPL(geneve_xmit_skb); 
1530b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1540b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic void geneve_notify_add_rx_port(struct geneve_sock *gs) 1550b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 1560b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct sock *sk = gs->sock->sk; 1570b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou sa_family_t sa_family = sk->sk_family; 1580b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou int err; 1590b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1600b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (sa_family == AF_INET) { 1610b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou err = udp_add_offload(&gs->udp_offloads); 1620b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (err) 1630b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou pr_warn("geneve: udp_add_offload failed with status %d\n", 1640b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou err); 1650b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } 1660b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 1670b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1680b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou/* Callback from net/ipv4/udp.c to receive packets */ 1690b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic int geneve_udp_encap_recv(struct sock *sk, struct sk_buff *skb) 1700b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 1710b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct genevehdr *geneveh; 1720b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct geneve_sock *gs; 1730b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou int opts_len; 1740b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1750b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou /* Need Geneve and inner Ethernet header to be present */ 1760b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (unlikely(!pskb_may_pull(skb, GENEVE_BASE_HLEN))) 1770b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou goto error; 1780b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 
1790b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou /* Return packets with reserved bits set */ 1800b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneveh = geneve_hdr(skb); 1810b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1820b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (unlikely(geneveh->ver != GENEVE_VER)) 1830b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou goto error; 1840b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1850b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (unlikely(geneveh->proto_type != htons(ETH_P_TEB))) 1860b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou goto error; 1870b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1880b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou opts_len = geneveh->opt_len * 4; 1890b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (iptunnel_pull_header(skb, GENEVE_BASE_HLEN + opts_len, 1900b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou htons(ETH_P_TEB))) 1910b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou goto drop; 1920b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1930b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs = rcu_dereference_sk_user_data(sk); 1940b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (!gs) 1950b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou goto drop; 1960b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 1970b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs->rcv(gs, skb); 1980b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return 0; 1990b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2000b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoudrop: 2010b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou /* Consume bad packet */ 2020b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou kfree_skb(skb); 2030b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return 0; 2040b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2050b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhouerror: 2060b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou /* Let the UDP layer deal with the skb */ 
2070b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return 1; 2080b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 2090b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2100b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic void geneve_del_work(struct work_struct *work) 2110b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 2120b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct geneve_sock *gs = container_of(work, struct geneve_sock, 2130b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou del_work); 2140b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2150b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou udp_tunnel_sock_release(gs->sock); 2160b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou kfree_rcu(gs, rcu); 2170b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 2180b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2190b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic struct socket *geneve_create_sock(struct net *net, bool ipv6, 2200b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou __be16 port) 2210b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 2220b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct socket *sock; 2230b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct udp_port_cfg udp_conf; 2240b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou int err; 2250b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2260b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou memset(&udp_conf, 0, sizeof(udp_conf)); 2270b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2280b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (ipv6) { 2290b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou udp_conf.family = AF_INET6; 2300b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } else { 2310b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou udp_conf.family = AF_INET; 23242350dcaaf1d8d95d58e8b43aee006d62c84bc2eAndy Zhou udp_conf.local_ip.s_addr = htonl(INADDR_ANY); 2330b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } 2340b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 
2350b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou udp_conf.local_udp_port = port; 2360b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2370b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou /* Open UDP socket */ 2380b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou err = udp_sock_create(net, &udp_conf, &sock); 2390b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (err < 0) 2400b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return ERR_PTR(err); 2410b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2420b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return sock; 2430b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 2440b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2450b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou/* Create new listen socket if needed */ 2460b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic struct geneve_sock *geneve_socket_create(struct net *net, __be16 port, 2470b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneve_rcv_t *rcv, void *data, 2480b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou bool ipv6) 2490b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 2500b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct geneve_net *gn = net_generic(net, geneve_net_id); 2510b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct geneve_sock *gs; 2520b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct socket *sock; 2530b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct udp_tunnel_sock_cfg tunnel_cfg; 2540b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2550b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs = kzalloc(sizeof(*gs), GFP_KERNEL); 2560b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (!gs) 2570b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return ERR_PTR(-ENOMEM); 2580b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2590b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou INIT_WORK(&gs->del_work, geneve_del_work); 2600b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2610b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 
sock = geneve_create_sock(net, ipv6, port); 2620b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (IS_ERR(sock)) { 2630b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou kfree(gs); 2640b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return ERR_CAST(sock); 2650b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } 2660b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2670b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs->sock = sock; 2680b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou atomic_set(&gs->refcnt, 1); 2690b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs->rcv = rcv; 2700b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs->rcv_data = data; 2710b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2720b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou /* Initialize the geneve udp offloads structure */ 2730b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs->udp_offloads.port = port; 2740b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs->udp_offloads.callbacks.gro_receive = NULL; 2750b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs->udp_offloads.callbacks.gro_complete = NULL; 2760b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2770b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou spin_lock(&gn->sock_lock); 2780b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou hlist_add_head_rcu(&gs->hlist, gs_head(net, port)); 2790b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneve_notify_add_rx_port(gs); 2800b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou spin_unlock(&gn->sock_lock); 2810b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2820b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou /* Mark socket as an encapsulation socket */ 2830b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou tunnel_cfg.sk_user_data = gs; 2840b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou tunnel_cfg.encap_type = 1; 2850b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou tunnel_cfg.encap_rcv = geneve_udp_encap_recv; 2860b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou tunnel_cfg.encap_destroy = 
NULL; 2870b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou setup_udp_tunnel_sock(net, sock, &tunnel_cfg); 2880b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2890b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return gs; 2900b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 2910b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2920b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustruct geneve_sock *geneve_sock_add(struct net *net, __be16 port, 2930b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneve_rcv_t *rcv, void *data, 2940b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou bool no_share, bool ipv6) 2950b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 2960b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct geneve_sock *gs; 2970b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 2980b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs = geneve_socket_create(net, port, rcv, data, ipv6); 2990b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (!IS_ERR(gs)) 3000b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return gs; 3010b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3020b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (no_share) /* Return error if sharing is not allowed. 
*/ 3030b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return ERR_PTR(-EINVAL); 3040b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3050b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs = geneve_find_sock(net, port); 3060b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (gs) { 3070b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (gs->rcv == rcv) 3080b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou atomic_inc(&gs->refcnt); 3090b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou else 3100b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs = ERR_PTR(-EBUSY); 3110b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } else { 3120b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou gs = ERR_PTR(-EINVAL); 3130b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou } 3140b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3150b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return gs; 3160b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 3170b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy ZhouEXPORT_SYMBOL_GPL(geneve_sock_add); 3180b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3190b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhouvoid geneve_sock_release(struct geneve_sock *gs) 3200b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 3210b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (!atomic_dec_and_test(&gs->refcnt)) 3220b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return; 3230b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3240b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou queue_work(geneve_wq, &gs->del_work); 3250b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 3260b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy ZhouEXPORT_SYMBOL_GPL(geneve_sock_release); 3270b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3280b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic __net_init int geneve_init_net(struct net *net) 3290b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 3300b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou struct geneve_net *gn = net_generic(net, geneve_net_id); 
3310b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou unsigned int h; 3320b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3330b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou spin_lock_init(&gn->sock_lock); 3340b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3350b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou for (h = 0; h < PORT_HASH_SIZE; ++h) 3360b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou INIT_HLIST_HEAD(&gn->sock_list[h]); 3370b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3380b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return 0; 3390b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 3400b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3410b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic struct pernet_operations geneve_net_ops = { 3420b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou .init = geneve_init_net, 3430b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou .exit = NULL, 3440b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou .id = &geneve_net_id, 3450b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou .size = sizeof(struct geneve_net), 3460b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou}; 3470b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3480b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic int __init geneve_init_module(void) 3490b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 3500b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou int rc; 3510b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3520b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou geneve_wq = alloc_workqueue("geneve", 0, 0); 3530b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (!geneve_wq) 3540b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return -ENOMEM; 3550b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3560b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou rc = register_pernet_subsys(&geneve_net_ops); 3570b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou if (rc) 3580b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return rc; 
3590b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3600b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou pr_info("Geneve driver\n"); 3610b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3620b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou return 0; 3630b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 3640b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoulate_initcall(geneve_init_module); 3650b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3660b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoustatic void __exit geneve_cleanup_module(void) 3670b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou{ 3680b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou destroy_workqueue(geneve_wq); 369d3ca9eafc0ed97b8f56fdf23655cfece89c48354Jesse Gross unregister_pernet_subsys(&geneve_net_ops); 3700b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou} 3710b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhoumodule_exit(geneve_cleanup_module); 3720b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy Zhou 3730b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy ZhouMODULE_LICENSE("GPL"); 3740b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy ZhouMODULE_AUTHOR("Jesse Gross <jesse@nicira.com>"); 3750b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy ZhouMODULE_DESCRIPTION("Driver for GENEVE encapsulated traffic"); 3760b5e8b8eeae40bae6ad7c7e91c97c3c0d0e57882Andy ZhouMODULE_ALIAS_RTNL_LINK("geneve"); 377