On 2018/11/10 3:43, Cong Wang wrote:
> Currently netdev_rx_csum_fault() only shows a device name,
> we need more information about the skb for debugging.
> 
> Sample output:
> 
>  ens3: hw csum failure
>  dev features: 0x0000000000014b89
>  skb len=84 data_len=0 gso_size=0 gso_type=0 ip_summed=0 csum=0, csum_complete_sw=0, csum_valid=0
> 
> Signed-off-by: Cong Wang <xiyou.wangc...@gmail.com>
> ---
>  include/linux/netdevice.h |  5 +++--
>  net/core/datagram.c       |  6 +++---
>  net/core/dev.c            | 10 ++++++++--
>  net/sunrpc/socklib.c      |  2 +-
>  4 files changed, 15 insertions(+), 8 deletions(-)
> 
> diff --git a/include/linux/netdevice.h b/include/linux/netdevice.h
> index 857f8abf7b91..fabcd9fa6cf7 100644
> --- a/include/linux/netdevice.h
> +++ b/include/linux/netdevice.h
> @@ -4332,9 +4332,10 @@ static inline bool can_checksum_protocol(netdev_features_t features,
>  }
>  
>  #ifdef CONFIG_BUG
> -void netdev_rx_csum_fault(struct net_device *dev);
> +void netdev_rx_csum_fault(struct net_device *dev, struct sk_buff *skb);
>  #else
> -static inline void netdev_rx_csum_fault(struct net_device *dev)
> +static inline void netdev_rx_csum_fault(struct net_device *dev,
> +                                     struct sk_buff *skb)
>  {
>  }
>  #endif
> diff --git a/net/core/datagram.c b/net/core/datagram.c
> index 57f3a6fcfc1e..d8f4d55cd6c5 100644
> --- a/net/core/datagram.c
> +++ b/net/core/datagram.c
> @@ -736,7 +736,7 @@ __sum16 __skb_checksum_complete_head(struct sk_buff *skb, int len)
>       if (likely(!sum)) {
>               if (unlikely(skb->ip_summed == CHECKSUM_COMPLETE) &&
>                   !skb->csum_complete_sw)
> -                     netdev_rx_csum_fault(skb->dev);
> +                     netdev_rx_csum_fault(skb->dev, skb);
>       }
>       if (!skb_shared(skb))
>               skb->csum_valid = !sum;
> @@ -756,7 +756,7 @@ __sum16 __skb_checksum_complete(struct sk_buff *skb)
>       if (likely(!sum)) {
>               if (unlikely(skb->ip_summed == CHECKSUM_COMPLETE) &&
>                   !skb->csum_complete_sw)
> -                     netdev_rx_csum_fault(skb->dev);
> +                     netdev_rx_csum_fault(skb->dev, skb);
>       }
>  
>       if (!skb_shared(skb)) {
> @@ -810,7 +810,7 @@ int skb_copy_and_csum_datagram_msg(struct sk_buff *skb,
>  
>               if (unlikely(skb->ip_summed == CHECKSUM_COMPLETE) &&
>                   !skb->csum_complete_sw)
> -                     netdev_rx_csum_fault(NULL);
> +                     netdev_rx_csum_fault(NULL, skb);
>       }
>       return 0;
>  fault:
> diff --git a/net/core/dev.c b/net/core/dev.c
> index 0ffcbdd55fa9..2b337df26117 100644
> --- a/net/core/dev.c
> +++ b/net/core/dev.c
> @@ -3091,10 +3091,16 @@ EXPORT_SYMBOL(__skb_gso_segment);
>  
>  /* Take action when hardware reception checksum errors are detected. */
>  #ifdef CONFIG_BUG
> -void netdev_rx_csum_fault(struct net_device *dev)
> +void netdev_rx_csum_fault(struct net_device *dev, struct sk_buff *skb)
>  {
>       if (net_ratelimit()) {
>               pr_err("%s: hw csum failure\n", dev ? dev->name : "<unknown>");
> +             if (dev)
> +                     pr_err("dev features: %pNF\n", &dev->features);
> +             pr_err("skb len=%d data_len=%d gso_size=%d gso_type=%d ip_summed=%d csum=%x, csum_complete_sw=%d, csum_valid=%d\n",
> +                    skb->len, skb->data_len, skb_shinfo(skb)->gso_size,
> +                    skb_shinfo(skb)->gso_type, skb->ip_summed, skb->csum,
> +                    skb->csum_complete_sw, skb->csum_valid);


This function also has the netdev available; could it use netdev_err() to log the error?

Also, dev->features was dumped before this patch; why remove it?


>               dump_stack();
>       }
>  }
> @@ -5779,7 +5785,7 @@ __sum16 __skb_gro_checksum_complete(struct sk_buff *skb)
>       if (likely(!sum)) {
>               if (unlikely(skb->ip_summed == CHECKSUM_COMPLETE) &&
>                   !skb->csum_complete_sw)
> -                     netdev_rx_csum_fault(skb->dev);
> +                     netdev_rx_csum_fault(skb->dev, skb);
>       }
>  
>       NAPI_GRO_CB(skb)->csum = wsum;
> diff --git a/net/sunrpc/socklib.c b/net/sunrpc/socklib.c
> index 9062967575c4..7e55cfc69697 100644
> --- a/net/sunrpc/socklib.c
> +++ b/net/sunrpc/socklib.c
> @@ -175,7 +175,7 @@ int csum_partial_copy_to_xdr(struct xdr_buf *xdr, struct sk_buff *skb)
>               return -1;
>       if (unlikely(skb->ip_summed == CHECKSUM_COMPLETE) &&
>           !skb->csum_complete_sw)
> -             netdev_rx_csum_fault(skb->dev);
> +             netdev_rx_csum_fault(skb->dev, skb);
>       return 0;
>  no_checksum:
>       if (xdr_partial_copy_from_skb(xdr, 0, &desc, xdr_skb_read_bits) < 0)
> 

Reply via email to