On Fri, 2015-07-24 at 16:16 +0200, Nicolas Dichtel wrote:
> This patch takes advantage of the newly added lwtunnel framework to
> allow the user to set routes that point to a peer netns.
> 
> Packets are injected to the peer netns via the loopback device. It works
> only when the output device is 'lo'.
> 
> Example:
> ip route add 40.1.1.1/32 encap netns nsid 5 via dev lo
> 

Is this feature so badly wanted to add complexity on lo device ?

> Signed-off-by: Nicolas Dichtel <nicolas.dich...@6wind.com>
> ---
> 
> v2: rework loopback handling part (update stats and call skb_dst_force())
>     fix ipv6 processing
>     check lwtunnel type before converting data to a nsid
> 
>  drivers/net/loopback.c        | 33 +++++++++++++++++++++------
>  include/net/lwtunnel.h        | 27 ++++++++++++++++++++++
>  include/uapi/linux/lwtunnel.h |  1 +
>  net/core/net_namespace.c      | 52 
> +++++++++++++++++++++++++++++++++++++++++++
>  net/ipv6/route.c              |  9 ++++++--
>  5 files changed, 113 insertions(+), 9 deletions(-)
> 
> diff --git a/drivers/net/loopback.c b/drivers/net/loopback.c
> index c76283c2f84a..4358256ff94e 100644
> --- a/drivers/net/loopback.c
> +++ b/drivers/net/loopback.c
> @@ -57,6 +57,7 @@
>  #include <linux/percpu.h>
>  #include <net/net_namespace.h>
>  #include <linux/u64_stats_sync.h>
> +#include <net/lwtunnel.h>
>  
>  struct pcpu_lstats {
>       u64                     packets;
> @@ -71,29 +72,47 @@ struct pcpu_lstats {
>  static netdev_tx_t loopback_xmit(struct sk_buff *skb,
>                                struct net_device *dev)
>  {
> +     int nsid = skb_lwt_netns_info(skb);
>       struct pcpu_lstats *lb_stats;
> -     int len;
> -
> -     skb_orphan(skb);
> +     struct net *peernet = NULL;
> +     int len, ret;
>  
>       /* Before queueing this packet to netif_rx(),
>        * make sure dst is refcounted.
>        */
>       skb_dst_force(skb);
>  
> -     skb->protocol = eth_type_trans(skb, dev);
> +     if (nsid != NETNSA_NSID_NOT_ASSIGNED) {
> +             peernet = get_net_ns_by_id(dev_net(dev), nsid);
> +             if (!peernet) {
> +                     kfree_skb(skb);
> +                     goto end;
> +             }
> +
> +             /* it's OK to use per_cpu_ptr() because BHs are off */
> +             lb_stats = this_cpu_ptr(peernet->loopback_dev->lstats);
> +             ret = dev_forward_skb(peernet->loopback_dev, skb);
> +     } else {
> +             skb_orphan(skb);
>  
> -     /* it's OK to use per_cpu_ptr() because BHs are off */
> -     lb_stats = this_cpu_ptr(dev->lstats);
> +             skb->protocol = eth_type_trans(skb, dev);
> +
> +             /* it's OK to use per_cpu_ptr() because BHs are off */
> +             lb_stats = this_cpu_ptr(dev->lstats);
> +             ret = netif_rx(skb);
> +     }
>  
>       len = skb->len;

<use after free error>  At this point you no longer can access skb

> -     if (likely(netif_rx(skb) == NET_RX_SUCCESS)) {
> +     if (likely(ret == NET_RX_SUCCESS)) {
>               u64_stats_update_begin(&lb_stats->syncp);
>               lb_stats->bytes += len;
>               lb_stats->packets++;
>               u64_stats_update_end(&lb_stats->syncp);
>       }
>  
> +end:
> +     if (peernet)
> +             put_net(peernet);
>       return NETDEV_TX_OK;
>  }
>  



--
To unsubscribe from this list: send the line "unsubscribe netdev" in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Reply via email to