GRO: Add support for TCP with fixed IPv4 ID field, limit tunnel IP ID values

author Alexander Duyck <aduyck@mirantis.com>

Mon, 11 Apr 2016 01:44:57 +0000 (21:44 -0400)

committer David S. Miller <davem@davemloft.net>

Thu, 14 Apr 2016 20:23:41 +0000 (16:23 -0400)
author Alexander Duyck <aduyck@mirantis.com>
Mon, 11 Apr 2016 01:44:57 +0000 (21:44 -0400)
committer David S. Miller <davem@davemloft.net>
Thu, 14 Apr 2016 20:23:41 +0000 (16:23 -0400)
diff --git a/include/linux/netdevice.h b/include/linux/netdevice.h

index 8e372d0..2d70c52 100644 (file)
--- a/include/linux/netdevice.h
+++ b/include/linux/netdevice.h
@@ -2121,7 +2121,10 @@ struct napi_gro_cb {
         /* Used in GRE, set in fou/gue_gro_receive */
         u8      is_fou:1;
  
-       /* 6 bit hole */
+       /* Used to determine if flush_id can be ignored */
+       u8      is_atomic:1;
+
+       /* 5 bit hole */
  
         /* used to support CHECKSUM_COMPLETE for tunneling protocols */
         __wsum  csum;
diff --git a/net/core/dev.c b/net/core/dev.c

index e896b19..b78b586 100644 (file)
--- a/net/core/dev.c
+++ b/net/core/dev.c
@@ -4462,6 +4462,7 @@ static enum gro_result dev_gro_receive(struct napi_struct *napi, struct sk_buff
                 NAPI_GRO_CB(skb)->free = 0;
                 NAPI_GRO_CB(skb)->encap_mark = 0;
                 NAPI_GRO_CB(skb)->is_fou = 0;
+               NAPI_GRO_CB(skb)->is_atomic = 1;
                 NAPI_GRO_CB(skb)->gro_remcsum_start = 0;
  
                 /* Setup for GRO checksum validation */
diff --git a/net/ipv4/af_inet.c b/net/ipv4/af_inet.c

index 5bbea9a..8564cab 100644 (file)
--- a/net/ipv4/af_inet.c
+++ b/net/ipv4/af_inet.c
@@ -1328,6 +1328,7 @@ static struct sk_buff **inet_gro_receive(struct sk_buff **head,
  
         for (p = *head; p; p = p->next) {
                 struct iphdr *iph2;
+               u16 flush_id;
  
                 if (!NAPI_GRO_CB(p)->same_flow)
                         continue;
@@ -1351,16 +1352,36 @@ static struct sk_buff **inet_gro_receive(struct sk_buff **head,
                         (iph->tos ^ iph2->tos) |
                         ((iph->frag_off ^ iph2->frag_off) & htons(IP_DF));
  
-               /* Save the IP ID check to be included later when we get to
-                * the transport layer so only the inner most IP ID is checked.
-                * This is because some GSO/TSO implementations do not
-                * correctly increment the IP ID for the outer hdrs.
-                */
-               NAPI_GRO_CB(p)->flush_id =
-                           ((u16)(ntohs(iph2->id) + NAPI_GRO_CB(p)->count) ^ id);
                 NAPI_GRO_CB(p)->flush |= flush;
+
+               /* We need to store of the IP ID check to be included later
+                * when we can verify that this packet does in fact belong
+                * to a given flow.
+                */
+               flush_id = (u16)(id - ntohs(iph2->id));
+
+               /* This bit of code makes it much easier for us to identify
+                * the cases where we are doing atomic vs non-atomic IP ID
+                * checks.  Specifically an atomic check can return IP ID
+                * values 0 - 0xFFFF, while a non-atomic check can only
+                * return 0 or 0xFFFF.
+                */
+               if (!NAPI_GRO_CB(p)->is_atomic ||
+                   !(iph->frag_off & htons(IP_DF))) {
+                       flush_id ^= NAPI_GRO_CB(p)->count;
+                       flush_id = flush_id ? 0xFFFF : 0;
+               }
+
+               /* If the previous IP ID value was based on an atomic
+                * datagram we can overwrite the value and ignore it.
+                */
+               if (NAPI_GRO_CB(skb)->is_atomic)
+                       NAPI_GRO_CB(p)->flush_id = flush_id;
+               else
+                       NAPI_GRO_CB(p)->flush_id |= flush_id;
         }
  
+       NAPI_GRO_CB(skb)->is_atomic = !!(iph->frag_off & htons(IP_DF));
         NAPI_GRO_CB(skb)->flush |= flush;
         skb_set_network_header(skb, off);
         /* The above will be needed by the transport layer if there is one
diff --git a/net/ipv4/tcp_offload.c b/net/ipv4/tcp_offload.c

index 08dd25d..d1ffd55 100644 (file)
--- a/net/ipv4/tcp_offload.c
+++ b/net/ipv4/tcp_offload.c
@@ -239,7 +239,7 @@ struct sk_buff **tcp_gro_receive(struct sk_buff **head, struct sk_buff *skb)
  
  found:
         /* Include the IP ID check below from the inner most IP hdr */
-       flush = NAPI_GRO_CB(p)->flush | NAPI_GRO_CB(p)->flush_id;
+       flush = NAPI_GRO_CB(p)->flush;
         flush |= (__force int)(flags & TCP_FLAG_CWR);
         flush |= (__force int)((flags ^ tcp_flag_word(th2)) &
                   ~(TCP_FLAG_CWR | TCP_FLAG_FIN | TCP_FLAG_PSH));
@@ -248,6 +248,17 @@ found:
                 flush |= *(u32 *)((u8 *)th + i) ^
                          *(u32 *)((u8 *)th2 + i);
  
+       /* When we receive our second frame we can made a decision on if we
+        * continue this flow as an atomic flow with a fixed ID or if we use
+        * an incrementing ID.
+        */
+       if (NAPI_GRO_CB(p)->flush_id != 1 ||
+           NAPI_GRO_CB(p)->count != 1 ||
+           !NAPI_GRO_CB(p)->is_atomic)
+               flush |= NAPI_GRO_CB(p)->flush_id;
+       else
+               NAPI_GRO_CB(p)->is_atomic = false;
+
         mss = skb_shinfo(p)->gso_size;
  
         flush |= (len - 1) >= mss;
@@ -316,6 +327,9 @@ static int tcp4_gro_complete(struct sk_buff *skb, int thoff)
                                   iph->daddr, 0);
         skb_shinfo(skb)->gso_type |= SKB_GSO_TCPV4;
  
+       if (NAPI_GRO_CB(skb)->is_atomic)
+               skb_shinfo(skb)->gso_type |= SKB_GSO_TCP_FIXEDID;
+
         return tcp_gro_complete(skb);
  }
  
diff --git a/net/ipv6/ip6_offload.c b/net/ipv6/ip6_offload.c

index b3a7793..061adcd 100644 (file)
--- a/net/ipv6/ip6_offload.c
+++ b/net/ipv6/ip6_offload.c
@@ -240,10 +240,14 @@ static struct sk_buff **ipv6_gro_receive(struct sk_buff **head,
                 NAPI_GRO_CB(p)->flush |= !!(first_word & htonl(0x0FF00000));
                 NAPI_GRO_CB(p)->flush |= flush;
  
-               /* Clear flush_id, there's really no concept of ID in IPv6. */
-               NAPI_GRO_CB(p)->flush_id = 0;
+               /* If the previous IP ID value was based on an atomic
+                * datagram we can overwrite the value and ignore it.
+                */
+               if (NAPI_GRO_CB(skb)->is_atomic)
+                       NAPI_GRO_CB(p)->flush_id = 0;
         }
  
+       NAPI_GRO_CB(skb)->is_atomic = true;
         NAPI_GRO_CB(skb)->flush |= flush;
  
         skb_gro_postpull_rcsum(skb, iph, nlen);
author	Alexander Duyck <aduyck@mirantis.com>
	Mon, 11 Apr 2016 01:44:57 +0000 (21:44 -0400)
committer	David S. Miller <davem@davemloft.net>
	Thu, 14 Apr 2016 20:23:41 +0000 (16:23 -0400)
include/linux/netdevice.h		patch \| blob \| history
net/core/dev.c		patch \| blob \| history
net/ipv4/af_inet.c		patch \| blob \| history
net/ipv4/tcp_offload.c		patch \| blob \| history
net/ipv6/ip6_offload.c		patch \| blob \| history