Some more feedback after doing a deeper review.

On Mon,  5 Oct 2015 10:58:17 -0700, Pravin B Shelar wrote:
> --- a/drivers/net/geneve.c
> +++ b/drivers/net/geneve.c
> @@ -703,6 +703,32 @@ err:
>       return NETDEV_TX_OK;
>  }
>  
> +static int geneve_egress_tun_info(struct net_device *dev, struct sk_buff 
> *skb,
> +                               struct ip_tunnel_info *egress_tun_info,
> +                               const void **egress_tun_opts)
> +{
> +     struct geneve_dev *geneve = netdev_priv(dev);
> +     struct ip_tunnel_info *info;
> +     struct rtable *rt;
> +     struct flowi4 fl4;
> +     __be16 sport;
> +
> +     info = skb_tunnel_info(skb);
> +     if (ip_tunnel_info_af(info) != AF_INET)
> +             return -EINVAL;
> +
> +     rt = geneve_get_rt(skb, dev, &fl4, info);

This will increase the dev tx error stats if the lookup fails, which is
probably something we don't want.

[...]
> --- a/include/linux/netdevice.h
> +++ b/include/linux/netdevice.h
> @@ -60,6 +60,7 @@ struct wireless_dev;
>  /* 802.15.4 specific */
>  struct wpan_dev;
>  struct mpls_dev;
> +struct ip_tunnel_info;
>  
>  void netdev_set_default_ethtool_ops(struct net_device *dev,
>                                   const struct ethtool_ops *ops);
> @@ -1054,6 +1055,11 @@ typedef u16 (*select_queue_fallback_t)(struct 
> net_device *dev,
>   *   This function is used to pass protocol port error state information
>   *   to the switch driver. The switch driver can react to the proto_down
>   *      by doing a phys down on the associated switch port.
> + * int (*ndo_get_egress_info)(struct net_device *dev, struct sk_buff *skb,
> + *                         __be32 *saddr, __be16 *sport, __be16 *dport);
> + *   This function is used to get egress tunnel information for given skb.
> + *   This is useful for retrieving outer tunnel header parameters while
> + *   sampling packet.
>   *
>   */
>  struct net_device_ops {
> @@ -1227,6 +1233,10 @@ struct net_device_ops {
>       int                     (*ndo_get_iflink)(const struct net_device *dev);
>       int                     (*ndo_change_proto_down)(struct net_device *dev,
>                                                        bool proto_down);
> +     int                     (*ndo_get_egress_info)(struct net_device *dev,
> +                                                    struct sk_buff *skb,
> +                                                    struct ip_tunnel_info 
> *egress_tun_info,
> +                                                    const void 
> **egress_tun_opts);

This should at least have a better name to reflect that it is about IP
tunnels.

But I don't like having an IP tunnel specific ndo, that doesn't sound
right. The real thing that is wanted here is to complete the dst
metadata. What about:

int (*ndo_fill_metadata_dst)(struct net_device *dev, struct sk_buff *skb);

The function will use skb_tunnel_info to get the template info, then
call skb_dst_drop and allocate and attach a fully populated metadata_dst.
The egress_tun_info in struct dp_upcall_info can then be completely
dropped, as all the necessary tunnel information will be available
through skb_tunnel_info(skb). Also, when implemented correctly, such
an skb will simply be sent out without route lookups etc. if it is
afterwards handed to ndo_start_xmit.

[...]
> --- a/include/net/ip_tunnels.h
> +++ b/include/net/ip_tunnels.h
> @@ -337,6 +337,11 @@ void __init ip_tunnel_core_init(void);
>  void ip_tunnel_need_metadata(void);
>  void ip_tunnel_unneed_metadata(void);
>  
> +void ipv4_egress_info_init(struct ip_tunnel_info *egress_tun_info,
> +                        const void **egress_tun_opts,
> +                        struct ip_tunnel_info *info, __be32 saddr,
> +                        __be16 sport, __be16 dport);

Please use the ip_tunnel prefix like the rest of the functions; this is
not ipv4 egress info but ip *tunnel* egress info.

Also, it's not clear what the difference between "egress_tun_info" and
"info" is. I'd suggest using "dst_info" and "src_info" or something
similar.

[...]
> --- a/net/ipv4/ip_tunnel_core.c
> +++ b/net/ipv4/ip_tunnel_core.c
> @@ -424,3 +424,40 @@ void ip_tunnel_unneed_metadata(void)
>       static_key_slow_dec(&ip_tunnel_metadata_cnt);
>  }
>  EXPORT_SYMBOL_GPL(ip_tunnel_unneed_metadata);
> +
> +static void tnl_egress_opts_init(struct ip_tunnel_info *egress_tun_info,
> +                              const void **egress_tun_opts,
> +                              struct ip_tunnel_info *info)
> +{
> +     egress_tun_info->options_len = info->options_len;
> +     egress_tun_info->mode = info->mode;
> +
> +     /* Tunnel options. */
> +     if (info->options_len)
> +             *egress_tun_opts = ip_tunnel_info_opts(info);
> +     else
> +             *egress_tun_opts = NULL;
> +}
> +
> +void ipv4_egress_info_init(struct ip_tunnel_info *egress_tun_info,
> +                        const void **egress_tun_opts,
> +                        struct ip_tunnel_info *info, __be32 saddr,
> +                        __be16 sport, __be16 dport)
> +{
> +     const struct ip_tunnel_key *tun_key;
> +
> +     /* Generate egress_tun_info based on tun_info,
> +      * saddr, tp_src and tp_dst
> +      */
> +     tun_key = &egress_tun_info->key;
> +     ip_tunnel_key_init(&egress_tun_info->key,

Just pass tun_key as the first parameter, it will be clearer what's
going on. (I believe the assignments that have no effect will be
optimized out by the compiler, since ip_tunnel_key_init is an inline
function.)

> +                        saddr, tun_key->u.ipv4.dst,
> +                        tun_key->tos,
> +                        tun_key->ttl,
> +                        sport, dport,
> +                        tun_key->tun_id,
> +                        tun_key->tun_flags);

-- 
Jiri Benc
--
To unsubscribe from this list: send the line "unsubscribe netdev" in
the body of a message to majord...@vger.kernel.org
More majordomo info at  http://vger.kernel.org/majordomo-info.html

Reply via email to