datapath/tunnel.h

   1 /*
   2  * Copyright (c) 2010, 2011 Nicira Networks.
   3  * Distributed under the terms of the GNU GPL version 2.
   4  *
   5  * Significant portions of this file may be copied from parts of the Linux
   6  * kernel, by Linus Torvalds and others.
   7  */
   8
   9 #ifndef TUNNEL_H
  10 #define TUNNEL_H 1
  11
  12 #include <linux/version.h>
  13
  14 #include "flow.h"
  15 #include "openvswitch/tunnel.h"
  16 #include "table.h"
  17 #include "vport.h"
  18
  19 /*
  20  * The absolute minimum fragment size.  Note that there are many other
  21  * definitions of the minimum MTU.
  22  */
  23 #define IP_MIN_MTU 68
  24
  25 /*
  26  * One of these goes in struct tnl_ops and in tnl_find_port().
  27  * These values are in the same namespace as other TNL_T_* values, so
  28  * only the least significant 10 bits are available to define protocol
  29  * identifiers.
  30  */
  31 #define TNL_T_PROTO_GRE         0
  32 #define TNL_T_PROTO_CAPWAP      1
  33
  34 /* These flags are only needed when calling tnl_find_port(). */
  35 #define TNL_T_KEY_EXACT         (1 << 10)
  36 #define TNL_T_KEY_MATCH         (1 << 11)
  37 #define TNL_T_KEY_EITHER        (TNL_T_KEY_EXACT | TNL_T_KEY_MATCH)
  38
  39 /* Private flags not exposed to userspace in this form. */
  40 #define TNL_F_IN_KEY_MATCH      (1 << 16) /* Store the key in tun_id to match in flow table. */
  41 #define TNL_F_OUT_KEY_ACTION    (1 << 17) /* Get the key from a SET_TUNNEL action. */
  42
  43 /* All public tunnel flags. */
  44 #define TNL_F_PUBLIC (TNL_F_CSUM | TNL_F_TOS_INHERIT | TNL_F_TTL_INHERIT | \
  45                       TNL_F_PMTUD | TNL_F_HDR_CACHE | TNL_F_IPSEC)
  46
  47 /**
  48  * struct tnl_mutable_config - modifiable configuration for a tunnel.
  49  * @rcu: RCU callback head for deferred destruction.
  50  * @seq: Sequence number for distinguishing configuration versions.
  51  * @tunnel_type: Set of TNL_T_* flags that define lookup.
  52  * @tunnel_hlen: Tunnel header length.
  53  * @eth_addr: Source address for packets generated by tunnel itself
  54  * (e.g. ICMP fragmentation needed messages).
  55  * @mtu: MTU of tunnel.
  56  * @in_key: Key to match on input, 0 for wildcard.
  57  * @out_key: Key to use on output, 0 if this tunnel has no fixed output key.
  58  * @flags: TNL_F_* flags.
  59  * @saddr: IPv4 source address to match, 0 to accept any source address.
  60  * @daddr: IPv4 destination of tunnel.
  61  * @tos: IPv4 TOS value to use for tunnel, 0 if no fixed TOS.
  62  * @ttl: IPv4 TTL value to use for tunnel, 0 if no fixed TTL.
  63  */
  64 struct tnl_mutable_config {
  65         struct rcu_head rcu;
  66
  67         unsigned seq;
  68
  69         u32 tunnel_type;
  70         unsigned tunnel_hlen;
  71
  72         unsigned char eth_addr[ETH_ALEN];
  73         unsigned mtu;
  74
  75         /* Configured via ODP_TUNNEL_ATTR_* attributes. */
  76         __be64  in_key;
  77         __be64  out_key;
  78         u32     flags;
  79         __be32  saddr;
  80         __be32  daddr;
  81         u8      tos;
  82         u8      ttl;
  83 };
  84
  85 struct tnl_ops {
  86         u32 tunnel_type;        /* Put the TNL_T_PROTO_* type in here. */
  87         u8 ipproto;             /* The IP protocol for the tunnel. */
  88
  89         /*
  90          * Returns the length of the tunnel header that will be added in
  91          * build_header() (i.e. excludes the IP header).  Returns a negative
  92          * error code if the configuration is invalid.
  93          */
  94         int (*hdr_len)(const struct tnl_mutable_config *);
  95
  96         /*
  97          * Builds the static portion of the tunnel header, which is stored in
  98          * the header cache.  In general the performance of this function is
  99          * not too important as we try to only call it when building the cache
 100          * so it is preferable to shift as much work as possible here.  However,
 101          * in some circumstances caching is disabled and this function will be
 102          * called for every packet, so try not to make it too slow.
 103          */
 104         void (*build_header)(const struct vport *,
 105                              const struct tnl_mutable_config *, void *header);
 106
 107         /*
 108          * Updates the cached header of a packet to match the actual packet
 109          * data.  Typical things that might need to be updated are length,
 110          * checksum, etc.  The IP header will have already been updated and this
 111          * is the final step before transmission.  Returns a linked list of
 112          * completed SKBs (multiple packets may be generated in the event
 113          * of fragmentation).
 114          */
 115         struct sk_buff *(*update_header)(const struct vport *,
 116                                          const struct tnl_mutable_config *,
 117                                          struct dst_entry *, struct sk_buff *);
 118 };
 119
 120 #if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,20)
 121 /*
 122  * On these kernels we have a fast mechanism to tell if the ARP cache for a
 123  * particular destination has changed.
 124  */
 125 #define HAVE_HH_SEQ
 126 #endif
 127 #if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,27)
 128 /*
 129  * On these kernels we have a fast mechanism to tell if the routing table
 130  * has changed.
 131  */
 132 #define HAVE_RT_GENID
 133 #endif
 134 #if !defined(HAVE_HH_SEQ) || !defined(HAVE_RT_GENID)
 135 /* If we can't detect all system changes directly we need to use a timeout. */
 136 #define NEED_CACHE_TIMEOUT
 137 #endif
 138 struct tnl_cache {
 139         struct rcu_head rcu;
 140
 141         int len;                /* Length of data to be memcpy'd from cache. */
 142
 143         /* Sequence number of mutable->seq from which this cache was generated. */
 144         unsigned mutable_seq;
 145
 146 #ifdef HAVE_HH_SEQ
 147         /*
 148          * The sequence number from the seqlock protecting the hardware header
 149          * cache (in the ARP cache).  Since every write increments the counter
 150          * this gives us an easy way to tell if it has changed.
 151          */
 152         unsigned hh_seq;
 153 #endif
 154
 155 #ifdef NEED_CACHE_TIMEOUT
 156         /*
 157          * If we don't have direct mechanisms to detect all important changes in
 158          * the system fall back to an expiration time.  This expiration time
 159          * can be relatively short since at high rates there will be millions of
 160          * packets per second, so we'll still get plenty of benefit from the
 161          * cache.  Note that if something changes we may blackhole packets
 162          * until the expiration time (depending on what changed and the kernel
 163          * version we may be able to detect the change sooner).  Expiration is
 164          * expressed as a time in jiffies.
 165          */
 166         unsigned long expiration;
 167 #endif
 168
 169         /*
 170          * The routing table entry that is the result of looking up the tunnel
 171          * endpoints.  It also contains a sequence number (called a generation
 172          * ID) that can be compared to a global sequence to tell if the routing
 173          * table has changed (and therefore there is a potential that this
 174          * cached route has been invalidated).
 175          */
 176         struct rtable *rt;
 177
 178         /*
 179          * If the output device for tunnel traffic is an OVS internal device,
 180          * the flow of that datapath.  Since all tunnel traffic will have the
 181          * same headers this allows us to cache the flow lookup.  NULL if the
 182          * output device is not OVS or if there is no flow installed.
 183          */
 184         struct sw_flow *flow;
 185
 186         /* The cached header follows after padding for alignment. */
 187 };
 188
 189 struct tnl_vport {
 190         struct rcu_head rcu;
 191         struct tbl_node tbl_node;
 192
 193         char name[IFNAMSIZ];
 194         const struct tnl_ops *tnl_ops;
 195
 196         struct tnl_mutable_config __rcu *mutable;
 197
 198         /*
 199          * ID of last fragment sent (for tunnel protocols with direct support
 200          * fragmentation).  If the protocol relies on IP fragmentation then
 201          * this is not needed.
 202          */
 203         atomic_t frag_id;
 204
 205         spinlock_t cache_lock;
 206         struct tnl_cache __rcu *cache;          /* Protected by RCU/cache_lock. */
 207
 208 #ifdef NEED_CACHE_TIMEOUT
 209         /*
 210          * If we must rely on expiration time to invalidate the cache, this is
 211          * the interval.  It is randomized within a range (defined by
 212          * MAX_CACHE_EXP in tunnel.c) to avoid synchronized expirations caused
 213          * by creation of a large number of tunnels at a one time.
 214          */
 215         unsigned long cache_exp_interval;
 216 #endif
 217 };
 218
 219 struct vport *tnl_create(const struct vport_parms *, const struct vport_ops *,
 220                          const struct tnl_ops *);
 221 int tnl_destroy(struct vport *);
 222
 223 int tnl_set_options(struct vport *, struct nlattr *);
 224 int tnl_get_options(const struct vport *, struct sk_buff *);
 225
 226 int tnl_set_mtu(struct vport *vport, int mtu);
 227 int tnl_set_addr(struct vport *vport, const unsigned char *addr);
 228 const char *tnl_get_name(const struct vport *vport);
 229 const unsigned char *tnl_get_addr(const struct vport *vport);
 230 int tnl_get_mtu(const struct vport *vport);
 231 int tnl_send(struct vport *vport, struct sk_buff *skb);
 232 void tnl_rcv(struct vport *vport, struct sk_buff *skb);
 233
 234 struct vport *tnl_find_port(__be32 saddr, __be32 daddr, __be64 key,
 235                             int tunnel_type,
 236                             const struct tnl_mutable_config **mutable);
 237 bool tnl_frag_needed(struct vport *vport,
 238                      const struct tnl_mutable_config *mutable,
 239                      struct sk_buff *skb, unsigned int mtu, __be64 flow_key);
 240 void tnl_free_linked_skbs(struct sk_buff *skb);
 241
 242 static inline struct tnl_vport *tnl_vport_priv(const struct vport *vport)
 243 {
 244         return vport_priv(vport);
 245 }
 246
 247
 248 #endif /* tunnel.h */