fedora core 6 1.2949 + vserver 2.2.0
[linux-2.6.git] / net / ipv6 / xfrm6_policy.c
index ab4e40b..8dffd4d 100644 (file)
  * 
  */
 
-#include <linux/config.h>
+#include <linux/compiler.h>
+#include <linux/netdevice.h>
+#include <net/addrconf.h>
 #include <net/xfrm.h>
 #include <net/ip.h>
 #include <net/ipv6.h>
 #include <net/ip6_route.h>
+#ifdef CONFIG_IPV6_MIP6
+#include <net/mip6.h>
+#endif
 
-extern struct dst_ops xfrm6_dst_ops;
-extern struct xfrm_policy_afinfo xfrm6_policy_afinfo;
+static struct dst_ops xfrm6_dst_ops;
+static struct xfrm_policy_afinfo xfrm6_policy_afinfo;
 
-static struct xfrm_type_map xfrm6_type_map = { .lock = RW_LOCK_UNLOCKED };
-
-int xfrm6_dst_lookup(struct xfrm_dst **dst, struct flowi *fl)
+static int xfrm6_dst_lookup(struct xfrm_dst **xdst, struct flowi *fl)
 {
-       int err = 0;
-       *dst = (struct xfrm_dst*)ip6_route_output(NULL, fl);
-       if (!*dst)
-               err = -ENETUNREACH;
+       struct dst_entry *dst = ip6_route_output(NULL, fl);
+       int err = dst->error;
+       if (!err)
+               *xdst = (struct xfrm_dst *) dst;
+       else
+               dst_release(dst);
        return err;
 }
 
-/* Check that the bundle accepts the flow and its components are
- * still valid.
- */
-
-static int __xfrm6_bundle_ok(struct xfrm_dst *xdst, struct flowi *fl)
+static int xfrm6_get_saddr(xfrm_address_t *saddr, xfrm_address_t *daddr)
 {
-       do {
-               if (xdst->u.dst.ops != &xfrm6_dst_ops)
-                       return 1;
-
-               if (!xfrm_selector_match(&xdst->u.dst.xfrm->sel, fl, AF_INET6))
-                       return 0;
-               if (xdst->u.dst.xfrm->km.state != XFRM_STATE_VALID ||
-                   xdst->u.dst.path->obsolete > 0)
-                       return 0;
-               xdst = (struct xfrm_dst*)xdst->u.dst.child;
-       } while (xdst);
-       return 0;
+       struct rt6_info *rt;
+       struct flowi fl_tunnel = {
+               .nl_u = {
+                       .ip6_u = {
+                               .daddr = *(struct in6_addr *)&daddr->a6,
+                       },
+               },
+       };
+
+       if (!xfrm6_dst_lookup((struct xfrm_dst **)&rt, &fl_tunnel)) {
+               ipv6_get_saddr(&rt->u.dst, (struct in6_addr *)&daddr->a6,
+                              (struct in6_addr *)&saddr->a6);
+               dst_release(&rt->u.dst);
+               return 0;
+       }
+       return -EHOSTUNREACH;
 }
 
 static struct dst_entry *
@@ -68,9 +73,11 @@ __xfrm6_find_bundle(struct flowi *fl, struct xfrm_policy *policy)
                ipv6_addr_prefix(&fl_src_prefix,
                                 &fl->fl6_src,
                                 xdst->u.rt6.rt6i_src.plen);
-               if (!ipv6_addr_cmp(&xdst->u.rt6.rt6i_dst.addr, &fl_dst_prefix) &&
-                   !ipv6_addr_cmp(&xdst->u.rt6.rt6i_src.addr, &fl_src_prefix) &&
-                   __xfrm6_bundle_ok(xdst, fl)) {
+               if (ipv6_addr_equal(&xdst->u.rt6.rt6i_dst.addr, &fl_dst_prefix) &&
+                   ipv6_addr_equal(&xdst->u.rt6.rt6i_src.addr, &fl_src_prefix) &&
+                   xfrm_bundle_ok(policy, xdst, fl, AF_INET6,
+                                  (xdst->u.rt6.rt6i_dst.plen != 128 ||
+                                   xdst->u.rt6.rt6i_src.plen != 128))) {
                        dst_clone(dst);
                        break;
                }
@@ -79,6 +86,40 @@ __xfrm6_find_bundle(struct flowi *fl, struct xfrm_policy *policy)
        return dst;
 }
 
+static inline struct in6_addr*
+__xfrm6_bundle_addr_remote(struct xfrm_state *x, struct in6_addr *addr)
+{
+       return (x->type->remote_addr) ?
+               (struct in6_addr*)x->type->remote_addr(x, (xfrm_address_t *)addr) :
+               (struct in6_addr*)&x->id.daddr;
+}
+
+static inline struct in6_addr*
+__xfrm6_bundle_addr_local(struct xfrm_state *x, struct in6_addr *addr)
+{
+       return (x->type->local_addr) ?
+               (struct in6_addr*)x->type->local_addr(x, (xfrm_address_t *)addr) :
+               (struct in6_addr*)&x->props.saddr;
+}
+
+static inline void
+__xfrm6_bundle_len_inc(int *len, int *nflen, struct xfrm_state *x)
+{
+       if (x->type->flags & XFRM_TYPE_NON_FRAGMENT)
+               *nflen += x->props.header_len;
+       else
+               *len += x->props.header_len;
+}
+
+static inline void
+__xfrm6_bundle_len_dec(int *len, int *nflen, struct xfrm_state *x)
+{
+       if (x->type->flags & XFRM_TYPE_NON_FRAGMENT)
+               *nflen -= x->props.header_len;
+       else
+               *len -= x->props.header_len;
+}
+
 /* Allocate chain of dst_entry's, attach known xfrm's, calculate
  * all the metrics... Shortly, bundle a bundle.
  */
@@ -92,18 +133,31 @@ __xfrm6_bundle_create(struct xfrm_policy *policy, struct xfrm_state **xfrm, int
        struct rt6_info *rt  = rt0;
        struct in6_addr *remote = &fl->fl6_dst;
        struct in6_addr *local  = &fl->fl6_src;
+       struct flowi fl_tunnel = {
+               .nl_u = {
+                       .ip6_u = {
+                               .saddr = *local,
+                               .daddr = *remote
+                       }
+               }
+       };
        int i;
        int err = 0;
        int header_len = 0;
+       int nfheader_len = 0;
        int trailer_len = 0;
 
        dst = dst_prev = NULL;
+       dst_hold(&rt->u.dst);
 
        for (i = 0; i < nx; i++) {
                struct dst_entry *dst1 = dst_alloc(&xfrm6_dst_ops);
+               struct xfrm_dst *xdst;
+               int tunnel = 0;
 
                if (unlikely(dst1 == NULL)) {
                        err = -ENOBUFS;
+                       dst_release(&rt->u.dst);
                        goto error;
                }
 
@@ -114,32 +168,45 @@ __xfrm6_bundle_create(struct xfrm_policy *policy, struct xfrm_state **xfrm, int
                        dst1->flags |= DST_NOHASH;
                        dst_clone(dst1);
                }
+
+               xdst = (struct xfrm_dst *)dst1;
+               xdst->route = &rt->u.dst;
+               xdst->genid = xfrm[i]->genid;
+               if (rt->rt6i_node)
+                       xdst->route_cookie = rt->rt6i_node->fn_sernum;
+
+               dst1->next = dst_prev;
                dst_prev = dst1;
-               if (xfrm[i]->props.mode) {
-                       remote = (struct in6_addr*)&xfrm[i]->id.daddr;
-                       local  = (struct in6_addr*)&xfrm[i]->props.saddr;
+               if (xfrm[i]->props.mode != XFRM_MODE_TRANSPORT) {
+                       remote = __xfrm6_bundle_addr_remote(xfrm[i], remote);
+                       local  = __xfrm6_bundle_addr_local(xfrm[i], local);
+                       tunnel = 1;
                }
-               header_len += xfrm[i]->props.header_len;
+               __xfrm6_bundle_len_inc(&header_len, &nfheader_len, xfrm[i]);
                trailer_len += xfrm[i]->props.trailer_len;
+
+               if (tunnel) {
+                       ipv6_addr_copy(&fl_tunnel.fl6_dst, remote);
+                       ipv6_addr_copy(&fl_tunnel.fl6_src, local);
+                       err = xfrm_dst_lookup((struct xfrm_dst **) &rt,
+                                             &fl_tunnel, AF_INET6);
+                       if (err)
+                               goto error;
+               } else
+                       dst_hold(&rt->u.dst);
        }
 
-       if (ipv6_addr_cmp(remote, &fl->fl6_dst)) {
-               struct flowi fl_tunnel;
+       dst_prev->child = &rt->u.dst;
+       dst->path = &rt->u.dst;
+       if (rt->rt6i_node)
+               ((struct xfrm_dst *)dst)->path_cookie = rt->rt6i_node->fn_sernum;
 
-               memset(&fl_tunnel, 0, sizeof(fl_tunnel));
-               ipv6_addr_copy(&fl_tunnel.fl6_dst, remote);
-               ipv6_addr_copy(&fl_tunnel.fl6_src, local);
+       *dst_p = dst;
+       dst = dst_prev;
 
-               err = xfrm_dst_lookup((struct xfrm_dst **) &rt,
-                                     &fl_tunnel, AF_INET6);
-               if (err)
-                       goto error;
-       } else {
-               dst_hold(&rt->u.dst);
-       }
-       dst_prev->child = &rt->u.dst;
+       dst_prev = *dst_p;
        i = 0;
-       for (dst_prev = dst; dst_prev != &rt->u.dst; dst_prev = dst_prev->child) {
+       for (; dst_prev != &rt->u.dst; dst_prev = dst_prev->child) {
                struct xfrm_dst *x = (struct xfrm_dst*)dst_prev;
 
                dst_prev->xfrm = xfrm[i++];
@@ -150,9 +217,9 @@ __xfrm6_bundle_create(struct xfrm_policy *policy, struct xfrm_state **xfrm, int
                dst_prev->flags        |= DST_HOST;
                dst_prev->lastuse       = jiffies;
                dst_prev->header_len    = header_len;
+               dst_prev->nfheader_len  = nfheader_len;
                dst_prev->trailer_len   = trailer_len;
-               memcpy(&dst_prev->metrics, &rt->u.dst.metrics, sizeof(dst_prev->metrics));
-               dst_prev->path          = &rt->u.dst;
+               memcpy(&dst_prev->metrics, &x->route->metrics, sizeof(dst_prev->metrics));
 
                /* Copy neighbour for reachability confirmation */
                dst_prev->neighbour     = neigh_clone(rt->u.dst.neighbour);
@@ -167,10 +234,13 @@ __xfrm6_bundle_create(struct xfrm_policy *policy, struct xfrm_state **xfrm, int
                memcpy(&x->u.rt6.rt6i_gateway, &rt0->rt6i_gateway, sizeof(x->u.rt6.rt6i_gateway)); 
                x->u.rt6.rt6i_dst      = rt0->rt6i_dst;
                x->u.rt6.rt6i_src      = rt0->rt6i_src; 
-               header_len -= x->u.dst.xfrm->props.header_len;
+               x->u.rt6.rt6i_idev     = rt0->rt6i_idev;
+               in6_dev_hold(rt0->rt6i_idev);
+               __xfrm6_bundle_len_dec(&header_len, &nfheader_len, x->u.dst.xfrm);
                trailer_len -= x->u.dst.xfrm->props.trailer_len;
        }
-       *dst_p = dst;
+
+       xfrm_init_pmtu(dst);
        return 0;
 
 error:
@@ -182,16 +252,18 @@ error:
 static inline void
 _decode_session6(struct sk_buff *skb, struct flowi *fl)
 {
-       u16 offset = sizeof(struct ipv6hdr);
+       u16 offset = skb->h.raw - skb->nh.raw;
        struct ipv6hdr *hdr = skb->nh.ipv6h;
-       struct ipv6_opt_hdr *exthdr = (struct ipv6_opt_hdr*)(skb->nh.raw + offset);
-       u8 nexthdr = skb->nh.ipv6h->nexthdr;
+       struct ipv6_opt_hdr *exthdr;
+       u8 nexthdr = skb->nh.raw[IP6CB(skb)->nhoff];
 
        memset(fl, 0, sizeof(struct flowi));
        ipv6_addr_copy(&fl->fl6_dst, &hdr->daddr);
        ipv6_addr_copy(&fl->fl6_src, &hdr->saddr);
 
        while (pskb_may_pull(skb, skb->nh.raw + offset + 1 - skb->data)) {
+               exthdr = (struct ipv6_opt_hdr*)(skb->nh.raw + offset);
+
                switch (nexthdr) {
                case NEXTHDR_ROUTING:
                case NEXTHDR_HOP:
@@ -202,10 +274,12 @@ _decode_session6(struct sk_buff *skb, struct flowi *fl)
                        break;
 
                case IPPROTO_UDP:
+               case IPPROTO_UDPLITE:
                case IPPROTO_TCP:
                case IPPROTO_SCTP:
+               case IPPROTO_DCCP:
                        if (pskb_may_pull(skb, skb->nh.raw + offset + 4 - skb->data)) {
-                               u16 *ports = (u16 *)exthdr;
+                               __be16 *ports = (__be16 *)exthdr;
 
                                fl->fl_ip_sport = ports[0];
                                fl->fl_ip_dport = ports[1];
@@ -213,6 +287,28 @@ _decode_session6(struct sk_buff *skb, struct flowi *fl)
                        fl->proto = nexthdr;
                        return;
 
+               case IPPROTO_ICMPV6:
+                       if (pskb_may_pull(skb, skb->nh.raw + offset + 2 - skb->data)) {
+                               u8 *icmp = (u8 *)exthdr;
+
+                               fl->fl_icmp_type = icmp[0];
+                               fl->fl_icmp_code = icmp[1];
+                       }
+                       fl->proto = nexthdr;
+                       return;
+
+#ifdef CONFIG_IPV6_MIP6
+               case IPPROTO_MH:
+                       if (pskb_may_pull(skb, skb->nh.raw + offset + 3 - skb->data)) {
+                               struct ip6_mh *mh;
+                               mh = (struct ip6_mh *)exthdr;
+
+                               fl->fl_mh_type = mh->ip6mh_type;
+                       }
+                       fl->proto = nexthdr;
+                       return;
+#endif
+
                /* XXX Why are there these headers? */
                case IPPROTO_AH:
                case IPPROTO_ESP:
@@ -227,48 +323,80 @@ _decode_session6(struct sk_buff *skb, struct flowi *fl)
 
 static inline int xfrm6_garbage_collect(void)
 {
-       read_lock(&xfrm6_policy_afinfo.lock);
        xfrm6_policy_afinfo.garbage_collect();
-       read_unlock(&xfrm6_policy_afinfo.lock);
        return (atomic_read(&xfrm6_dst_ops.entries) > xfrm6_dst_ops.gc_thresh*2);
 }
 
 static void xfrm6_update_pmtu(struct dst_entry *dst, u32 mtu)
 {
-       struct dst_entry *path = dst->path;
+       struct xfrm_dst *xdst = (struct xfrm_dst *)dst;
+       struct dst_entry *path = xdst->route;
+
+       path->ops->update_pmtu(path, mtu);
+}
+
+static void xfrm6_dst_destroy(struct dst_entry *dst)
+{
+       struct xfrm_dst *xdst = (struct xfrm_dst *)dst;
+
+       if (likely(xdst->u.rt6.rt6i_idev))
+               in6_dev_put(xdst->u.rt6.rt6i_idev);
+       xfrm_dst_destroy(xdst);
+}
+
+static void xfrm6_dst_ifdown(struct dst_entry *dst, struct net_device *dev,
+                            int unregister)
+{
+       struct xfrm_dst *xdst;
+
+       if (!unregister)
+               return;
+
+       xdst = (struct xfrm_dst *)dst;
+       if (xdst->u.rt6.rt6i_idev->dev == dev) {
+               struct inet6_dev *loopback_idev = in6_dev_get(&loopback_dev);
+               BUG_ON(!loopback_idev);
+
+               do {
+                       in6_dev_put(xdst->u.rt6.rt6i_idev);
+                       xdst->u.rt6.rt6i_idev = loopback_idev;
+                       in6_dev_hold(loopback_idev);
+                       xdst = (struct xfrm_dst *)xdst->u.dst.child;
+               } while (xdst->u.dst.xfrm);
+
+               __in6_dev_put(loopback_idev);
+       }
 
-       if (mtu >= IPV6_MIN_MTU && mtu < dst_pmtu(dst))
-               path->ops->update_pmtu(path, mtu);
-       
-       return;
+       xfrm_dst_ifdown(dst, dev);
 }
 
-struct dst_ops xfrm6_dst_ops = {
+static struct dst_ops xfrm6_dst_ops = {
        .family =               AF_INET6,
        .protocol =             __constant_htons(ETH_P_IPV6),
        .gc =                   xfrm6_garbage_collect,
        .update_pmtu =          xfrm6_update_pmtu,
+       .destroy =              xfrm6_dst_destroy,
+       .ifdown =               xfrm6_dst_ifdown,
        .gc_thresh =            1024,
        .entry_size =           sizeof(struct xfrm_dst),
 };
 
-struct xfrm_policy_afinfo xfrm6_policy_afinfo = {
+static struct xfrm_policy_afinfo xfrm6_policy_afinfo = {
        .family =               AF_INET6,
-       .lock =                 RW_LOCK_UNLOCKED,
-       .type_map =             &xfrm6_type_map,
        .dst_ops =              &xfrm6_dst_ops,
        .dst_lookup =           xfrm6_dst_lookup,
+       .get_saddr =            xfrm6_get_saddr,
        .find_bundle =          __xfrm6_find_bundle,
        .bundle_create =        __xfrm6_bundle_create,
        .decode_session =       _decode_session6,
 };
 
-void __init xfrm6_policy_init(void)
+static void __init xfrm6_policy_init(void)
 {
        xfrm_policy_register_afinfo(&xfrm6_policy_afinfo);
 }
 
-void __exit xfrm6_policy_fini(void)
+static void xfrm6_policy_fini(void)
 {
        xfrm_policy_unregister_afinfo(&xfrm6_policy_afinfo);
 }
@@ -277,12 +405,10 @@ void __init xfrm6_init(void)
 {
        xfrm6_policy_init();
        xfrm6_state_init();
-       xfrm6_tunnel_init();
 }
 
-void __exit xfrm6_fini(void)
+void xfrm6_fini(void)
 {
-       xfrm6_tunnel_fini();
        //xfrm6_input_fini();
        xfrm6_policy_fini();
        xfrm6_state_fini();