Thanks Li,Rongqing

On Mon, Nov 18, 2019 at 9:35 PM Li,Rongqing <lirongq...@baidu.com> wrote:
> Thanks, Darrell
>
> I can try to test it

Thanks! Can you try this 2-patch series?

dball@ubuntu:~/openvswitch/ovs$ cat outgoing2/0001-dp-packet-Cache-batch-action-list-in-batch.patch
From 80436fb57a54ecfd532e99086dbb0e5142415070 Mon Sep 17 00:00:00 2001
From: Darrell Ball <dlu...@gmail.com>
Date: Sun, 24 Nov 2019 17:29:07 -0800
Subject: [patch v1 1/2] dp-packet: Cache batch action list in batch.
To: d...@openvswitch.org

Cache the batch action list in the batch itself.  This will be used in
a subsequent patch.

Signed-off-by: Darrell Ball <dlu...@gmail.com>
---
 lib/dp-packet.h | 27 ++++++++++++++++++++++++++-
 1 file changed, 26 insertions(+), 1 deletion(-)

diff --git a/lib/dp-packet.h b/lib/dp-packet.h
index 14f0897..77df801 100644
--- a/lib/dp-packet.h
+++ b/lib/dp-packet.h
@@ -775,9 +775,11 @@ enum { NETDEV_MAX_BURST = 32 }; /* Maximum number packets in a batch. */
 
 struct dp_packet_batch {
     size_t count;
+    size_t actions_len;
+    const struct nlattr *actions;
+    struct dp_packet *packets[NETDEV_MAX_BURST];
     bool trunc;         /* true if the batch needs truncate. */
     bool do_not_steal;  /* Indicate that the packets should not be stolen. */
-    struct dp_packet *packets[NETDEV_MAX_BURST];
 };
 
 static inline void
@@ -786,6 +788,8 @@ dp_packet_batch_init(struct dp_packet_batch *batch)
     batch->count = 0;
     batch->trunc = false;
     batch->do_not_steal = false;
+    batch->actions = NULL;
+    batch->actions_len = 0;
 }
 
 static inline void
@@ -930,6 +934,27 @@ dp_packet_batch_reset_cutlen(struct dp_packet_batch *batch)
     }
 }
 
+static inline void
+dp_packet_batch_set_action_ctx(struct dp_packet_batch *batch,
+                               const struct nlattr *actions,
+                               size_t actions_len)
+{
+    batch->actions = actions;
+    batch->actions_len = actions_len;
+}
+
+static inline const struct nlattr *
+dp_packet_batch_get_actions(struct dp_packet_batch *batch)
+{
+    return batch->actions;
+}
+
+static inline size_t
+dp_packet_batch_get_action_len(struct dp_packet_batch *batch)
+{
+    return batch->actions_len;
+}
+
 #ifdef __cplusplus
 }
 #endif
--
1.9.1

dball@ubuntu:~/openvswitch/ovs$ cat outgoing2/0002-ipf-Resume-fragments-in-same-action-list.patch
From 4aefd4e791f9d7b6ef916e41136cb59e6020bb22 Mon Sep 17 00:00:00 2001
From: Darrell Ball <dlu...@gmail.com>
Date: Sun, 24 Nov 2019 17:33:58 -0800
Subject: [patch v1 2/2] ipf: Resume fragments in same action list.
To: d...@openvswitch.org

Once fragments are reassembled and go through conntrack, the fragments
need to resume processing in the same action list.  There is a semantic
requirement that the list have, at most, one conntrack action, so this
specifies the resume point in the list as well.

A memcmp is used to compare pre and post processing lists as padding is
zeroed out, therefore having predictable values.

Signed-off-by: Darrell Ball <dlu...@gmail.com>
---
 lib/dpif-netdev.c |  1 +
 lib/ipf.c         | 49 ++++++++++++++++++++++++++++++++++++-------------
 2 files changed, 37 insertions(+), 13 deletions(-)

diff --git a/lib/dpif-netdev.c b/lib/dpif-netdev.c
index 5142bad..3ddca5b 100644
--- a/lib/dpif-netdev.c
+++ b/lib/dpif-netdev.c
@@ -7363,6 +7363,7 @@ dp_netdev_execute_actions(struct dp_netdev_pmd_thread *pmd,
 {
     struct dp_netdev_execute_aux aux = { pmd, flow };
 
+    dp_packet_batch_set_action_ctx(packets, actions, actions_len);
     odp_execute_actions(&aux, packets, should_steal, actions, actions_len,
                         dp_execute_cb);
 }
diff --git a/lib/ipf.c b/lib/ipf.c
index 45c4891..ad82620 100644
--- a/lib/ipf.c
+++ b/lib/ipf.c
@@ -91,6 +91,8 @@ union ipf_addr {
 /* Represents a single fragment; part of a list of fragments. */
 struct ipf_frag {
     struct dp_packet *pkt;
+    struct nlattr *actions;
+    size_t actions_len;
     uint16_t start_data_byte;
     uint16_t end_data_byte;
     bool dnsteal; /* 'do not steal': if true, ipf should not free packet. */
@@ -261,7 +263,12 @@ ipf_list_clean(struct hmap *frag_lists,
 {
     ovs_list_remove(&ipf_list->list_node);
     hmap_remove(frag_lists, &ipf_list->node);
-    free(ipf_list->frag_list);
+    struct ipf_frag *frag_list = ipf_list->frag_list;
+    ovs_assert(frag_list);
+    for (int i = 0; i <= ipf_list->last_inuse_idx; i++) {
+        free(frag_list[i].actions);
+    }
+    free(frag_list);
     free(ipf_list);
 }
 
@@ -793,7 +800,7 @@ static bool
 ipf_process_frag(struct ipf *ipf, struct ipf_list *ipf_list,
                  struct dp_packet *pkt, uint16_t start_data_byte,
                  uint16_t end_data_byte, bool ff, bool lf, bool v6,
-                 bool dnsteal)
+                 struct dp_packet_batch *pb)
     OVS_REQUIRES(ipf->ipf_lock)
 {
     bool duped_frag = ipf_is_frag_duped(ipf_list->frag_list,
@@ -811,7 +818,11 @@ ipf_process_frag(struct ipf *ipf, struct ipf_list *ipf_list,
     frag->pkt = pkt;
     frag->start_data_byte = start_data_byte;
     frag->end_data_byte = end_data_byte;
-    frag->dnsteal = dnsteal;
+    frag->dnsteal = pb->do_not_steal;
+    frag->actions_len = dp_packet_batch_get_action_len(pb);
+    ovs_assert(dp_packet_batch_get_actions(pb));
+    frag->actions = xmemdup(dp_packet_batch_get_actions(pb),
+                            frag->actions_len);
     ipf_list->last_inuse_idx++;
     atomic_count_inc(&ipf->nfrag);
     ipf_count(ipf, v6, IPF_NFRAGS_ACCEPTED);
@@ -849,7 +860,7 @@ ipf_list_init(struct ipf_list *ipf_list, struct ipf_list_key *key,
 static bool
 ipf_handle_frag(struct ipf *ipf, struct dp_packet *pkt, ovs_be16 dl_type,
                 uint16_t zone, long long now, uint32_t hash_basis,
-                bool dnsteal)
+                struct dp_packet_batch *pb)
     OVS_REQUIRES(ipf->ipf_lock)
 {
     struct ipf_list_key key;
@@ -918,7 +929,7 @@ ipf_handle_frag(struct ipf *ipf, struct dp_packet *pkt, ovs_be16 dl_type,
     }
 
     return ipf_process_frag(ipf, ipf_list, pkt, start_data_byte,
-                            end_data_byte, ff, lf, v6, dnsteal);
+                            end_data_byte, ff, lf, v6, pb);
 }
 
 /* Filters out fragments from a batch of fragments and adjust the batch. */
@@ -940,7 +951,7 @@ ipf_extract_frags_from_batch(struct ipf *ipf, struct dp_packet_batch *pb,
             ovs_mutex_lock(&ipf->ipf_lock);
             if (!ipf_handle_frag(ipf, pkt, dl_type, zone, now, hash_basis,
-                                 pb->do_not_steal)) {
+                                 pb)) {
                 dp_packet_batch_refill(pb, pkt, pb_idx);
             }
             ovs_mutex_unlock(&ipf->ipf_lock);
@@ -954,20 +965,30 @@ ipf_extract_frags_from_batch(struct ipf *ipf, struct dp_packet_batch *pb,
  * management has trouble dealing with multiple source types. The
  * check_source paramater is used to indicate when this check is needed. */
 static bool
-ipf_dp_packet_batch_add(struct dp_packet_batch *pb , struct dp_packet *pkt,
-                        bool check_source OVS_UNUSED)
+ipf_dp_packet_batch_add(struct dp_packet_batch *pb, struct dp_packet *pkt,
+                        struct ipf_frag *frag, bool check_source OVS_UNUSED)
 {
 #ifdef DPDK_NETDEV
     if ((dp_packet_batch_is_full(pb)) ||
         /* DPDK cannot handle multiple sources in a batch. */
         (check_source && !dp_packet_batch_is_empty(pb)
-         && pb->packets[0]->source != pkt->source)) {
+         && pb->packets[0]->source != frag->pkt->source)) {
 #else
     if (dp_packet_batch_is_full(pb)) {
 #endif
         return false;
     }
 
+    /* Make sure that the fragment resumes processing in the same action list.
+     * There is a semantic requirement that an action list have, at most, one
+     * conntrack action, which could be enforced when the action list is
+     * generated.  Netlink padding is predictably zero, hence memcmp should
+     * be reliable to compare action lists. */
+    if ((dp_packet_batch_get_action_len(pb) != frag->actions_len) ||
+        (memcmp(dp_packet_batch_get_actions(pb), frag->actions,
+                frag->actions_len))) {
+        return false;
+    }
     dp_packet_batch_add(pb, pkt);
     return true;
 }
 
@@ -1020,9 +1041,11 @@ ipf_send_frags_in_list(struct ipf *ipf, struct ipf_list *ipf_list,
     }
 
     while (ipf_list->last_sent_idx < ipf_list->last_inuse_idx) {
-        struct dp_packet *pkt
-            = ipf_list->frag_list[ipf_list->last_sent_idx + 1].pkt;
-        if (ipf_dp_packet_batch_add(pb, pkt, true)) {
+        struct ipf_frag *frag =
+            &ipf_list->frag_list[ipf_list->last_sent_idx + 1];
+        struct dp_packet *pkt = frag->pkt;
+
+        if (ipf_dp_packet_batch_add(pb, pkt, frag, true)) {
             ipf_list->last_sent_idx++;
             atomic_count_dec(&ipf->nfrag);
 
@@ -1122,7 +1145,7 @@ ipf_execute_reass_pkts(struct ipf *ipf, struct dp_packet_batch *pb)
     LIST_FOR_EACH_SAFE (rp, next, rp_list_node, &ipf->reassembled_pkt_list) {
         if (!rp->list->reass_execute_ctx &&
-            ipf_dp_packet_batch_add(pb, rp->pkt, false)) {
+            ipf_dp_packet_batch_add(pb, rp->pkt, rp->list->frag_list, false)) {
             rp->list->reass_execute_ctx = rp->pkt;
         }
     }
--
1.9.1

> Other question: it seems that ipf is driven by input packets, with no
> timer. If a packet has 40 fragments and, the first time, 32 fragments
> are received and, the next time, 8 fragments are received, reassembly
> succeeds and 32 fragments are sent out. After that, if no new packets
> are received, the remaining 8 fragments will stay in the complete list
> and cannot be sent out until they expire and are cleaned up. Is that
> true?

Fragments will continually be retried for sending, so that they resume in
a batch executing the same action list, and at the same point of
processing, as where they were received; at a minimum, subsequent batches
provide retry opportunities.

> -RongQing
>
> *From:* Darrell Ball [mailto:dlu...@gmail.com]
> *Sent:* November 19, 2019 10:22
> *To:* Li,Rongqing <lirongq...@baidu.com>
> *Cc:* ovs dev <d...@openvswitch.org>
> *Subject:* Re: ipf question
>
> Thanks; I had a look and I noticed ipf does not keep all the context it
> needs to properly resume fragment processing in the general case; I have
> a potential fix, but won't get to it this week.
>
> On Sun, Nov 17, 2019 at 11:08 PM Darrell Ball <dlu...@gmail.com> wrote:
>
> On Fri, Nov 15, 2019 at 6:03 PM Li,Rongqing <lirongq...@baidu.com> wrote:
>
> From: Darrell Ball <dlu...@gmail.com>
> Sent: November 15, 2019 22:58
> To: Li,Rongqing
> Cc: ovs dev
> Subject: Re: ipf question
>
> >Let me paraphrase, just to confirm we are on the same page.
> >IIUC, for example, in the case of a 33 fragment packet, in the first pass
> >all 33 fragments enter ipf, then are reassembled, pass thru conntrack
> >and then the frags are sent out, while in the second pass, only 32
> >fragments enter conntrack/ipf, while the index 32 fragment is being
> >forwarded out without going thru conntrack/ipf?
>
> true.
> the second pass is recirculation
> and the index 32 fragment is not put into conntrack/ipf, and is sent out
> to the vm directly.
>
> can you check what rule is being hit by that fragment packet vs others
> and then compare the pkt metadata
>
> > if I change NETDEV_MAX_BURST to 64, it works
>
> good test
>
> thanks
> -RongQing
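To summarize the mechanism the two patches add, a rough standalone sketch is
below. It only illustrates the idea (cache the netlink-encoded action list
with the batch, copy it into each buffered fragment, and later let a fragment
rejoin a batch only if the batch's action list matches byte for byte); the
struct and function names are invented for the example and are not the OVS
APIs.

#include <stdbool.h>
#include <stddef.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

/* Batch-side context: patch 1 caches the netlink-encoded action list
 * (pointer + length) alongside the batch. */
struct batch_ctx {
    const uint8_t *actions;
    size_t actions_len;
};

/* Fragment-side context: patch 2 copies the action list into each
 * buffered fragment so it survives until the fragment is resumed. */
struct frag_ctx {
    uint8_t *actions;
    size_t actions_len;
};

static void
frag_save_actions(struct frag_ctx *frag, const struct batch_ctx *batch)
{
    frag->actions_len = batch->actions_len;
    frag->actions = malloc(batch->actions_len);  /* xmemdup() in OVS;
                                                  * error handling omitted
                                                  * in this sketch. */
    memcpy(frag->actions, batch->actions, batch->actions_len);
}

/* A fragment may only rejoin a batch executing the same action list;
 * netlink padding is zeroed, so a length check plus memcmp is a
 * reliable equality test. */
static bool
frag_matches_batch(const struct frag_ctx *frag, const struct batch_ctx *batch)
{
    return frag->actions_len == batch->actions_len
           && !memcmp(frag->actions, batch->actions, frag->actions_len);
}

int
main(void)
{
    /* Two made-up netlink-style action buffers that differ in one byte. */
    uint8_t acts_a[] = { 0x08, 0x00, 0x01, 0x00, 0x02, 0x00, 0x00, 0x00 };
    uint8_t acts_b[] = { 0x08, 0x00, 0x01, 0x00, 0x03, 0x00, 0x00, 0x00 };
    struct batch_ctx rx_batch = { acts_a, sizeof acts_a };
    struct frag_ctx frag;

    frag_save_actions(&frag, &rx_batch);   /* At fragment intake. */

    struct batch_ctx same = { acts_a, sizeof acts_a };
    struct batch_ctx other = { acts_b, sizeof acts_b };
    printf("same action list:      %d\n", frag_matches_batch(&frag, &same));
    printf("different action list: %d\n", frag_matches_batch(&frag, &other));

    free(frag.actions);                    /* As in ipf_list_clean(). */
    return 0;
}

In the series itself, the cached pointer and length live in struct
dp_packet_batch, the per-fragment copy is made with xmemdup() in
ipf_process_frag(), and the length-plus-memcmp check is done in
ipf_dp_packet_batch_add().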