The ARP/ND responder stage (ls_in_arp_rsp) unconditionally
bypassed all traffic arriving from localnet ports via a
priority-100 "next;" flow.  This caused broadcast ARP/ND
requests from the physical network to be flooded to every
logical switch port instead of being handled by proxy
ARP/ND.  On switches with roughly 200 or more ports, the
resulting multicast replication exceeded the OVS 4K resubmit
limit, so the packets were dropped and connectivity broke.

Replace the bypass with a targeted mechanism:

  - In ls_in_lookup_fdb, add a priority-50 fallback flow
    that sets flags.localnet = 1 for packets arriving from
    localnet ports (the existing priority-100 FDB-learning
    flow already sets this flag when FDB learning is
    enabled).

  - In the priority-50 ARP/ND reply flows, append the
    condition
    "((flags.localnet == 1 && is_chassis_resident(port))
     || flags.localnet == 0)" on switches that have
    localnet ports.

This ensures that ARP/ND requests from localnet are only
answered on the chassis hosting the target VIF, preventing
both the flood and duplicate replies from multiple
hypervisors.  VIF-to-VIF proxy ARP/ND is unchanged because
flags.localnet is 0 for non-localnet-sourced traffic.

Fixes: f763a3273b84 ("ovn: Avoid ARP responder for packets from localnet port")
Reported-at: https://redhat.atlassian.net/browse/FDP-3436
Assisted-by: Claude Opus 4.6, Claude Code
Signed-off-by: Dumitru Ceara <[email protected]>
---
 northd/northd.c         |  44 +++++++---
 northd/ovn-northd.8.xml |  76 +++++++++++-----
 tests/ovn-northd.at     | 111 ++++++++++++++++++++++-
 tests/ovn.at            | 189 ++++++++++++++++++++++++++++++++++++++++
 4 files changed, 389 insertions(+), 31 deletions(-)

diff --git a/northd/northd.c b/northd/northd.c
index 02c7e7e54e..8305e0428b 100644
--- a/northd/northd.c
+++ b/northd/northd.c
@@ -10402,25 +10402,43 @@ build_arp_nd_service_monitor_lflow(const char *svc_monitor_mac,
     }
 }
 
-/* Ingress table 24: ARP/ND responder, skip requests coming from localnet
- * ports. (priority 100); see ovn-northd.8.xml for the rationale. */
-
+/* Ingress table: Lookup FDB.  Set flags.localnet for packets arriving from
+ * localnet ports so that downstream stages (e.g., ARP/ND responder) can
+ * condition their behavior on whether the packet came from localnet. */
 static void
-build_lswitch_arp_nd_responder_skip_local(struct ovn_port *op,
-                                          struct lflow_table *lflows,
-                                          struct ds *match)
+build_lswitch_from_localnet_op(struct ovn_port *op,
+                               struct lflow_table *lflows,
+                               struct ds *match)
 {
     ovs_assert(op->nbsp);
-    if (!lsp_is_localnet(op->nbsp) || op->od->has_arp_proxy_port) {
+    if (!lsp_is_localnet(op->nbsp)) {
         return;
     }
     ds_clear(match);
     ds_put_format(match, "inport == %s", op->json_key);
-    ovn_lflow_add(lflows, op->od, S_SWITCH_IN_ARP_ND_RSP, 100, ds_cstr(match),
-                  "next;", op->lflow_ref, WITH_IO_PORT(op->key),
+    ovn_lflow_add(lflows, op->od, S_SWITCH_IN_LOOKUP_FDB, 50,
+                  ds_cstr(match), "flags.localnet = 1; next;",
+                  op->lflow_ref, WITH_IO_PORT(op->key),
                   WITH_HINT(&op->nbsp->header_));
 }
 
+/* On switches with localnet ports, restrict ARP/ND replies for
+ * localnet-sourced requests to the chassis hosting the target VIF
+ * (preventing duplicate replies from every hypervisor).  Non-localnet
+ * requests (VIF-to-VIF) are answered unconditionally as before. */
+static void
+build_lswitch_arp_nd_local_resp_match(struct ds *match,
+                                      const struct ovn_port *op)
+{
+    if (!ls_has_localnet_port(op->od)) {
+        return;
+    }
+
+    ds_put_format(match,
+        " && ((flags.localnet == 1 && is_chassis_resident(%s))"
+            " || flags.localnet == 0)", op->json_key);
+}
+
 /* Ingress table 24: ARP/ND responder, reply for known IPs.
  * (priority 50). */
 static void
@@ -10562,6 +10580,8 @@ build_lswitch_arp_nd_responder_known_ips(struct ovn_port *op,
                     ds_truncate(match, match_len);
                 }
                 ds_put_cstr(match, " && eth.dst == ff:ff:ff:ff:ff:ff");
+                size_t match_arp_len = match->length;
+                build_lswitch_arp_nd_local_resp_match(match, op);
 
                 ds_clear(actions);
                 ds_put_format(actions,
@@ -10593,6 +10613,7 @@ build_lswitch_arp_nd_responder_known_ips(struct ovn_port *op,
                  * address is intended to detect situations where the
                  * network is not working as configured, so dropping the
                  * request would frustrate that intent.) */
+                ds_truncate(match, match_arp_len);
                 ds_put_format(match, " && inport == %s", op->json_key);
                 ovn_lflow_add(lflows, op->od, S_SWITCH_IN_ARP_ND_RSP, 100,
                               ds_cstr(match), "next;", op->lflow_ref,
@@ -10632,6 +10653,8 @@ build_lswitch_arp_nd_responder_known_ips(struct ovn_port *op,
                     "nd_ns_mcast && ip6.dst == %s && nd.target == %s",
                     op->lsp_addrs[i].ipv6_addrs[j].sn_addr_s,
                     op->lsp_addrs[i].ipv6_addrs[j].addr_s);
+                size_t match_nd_len = match->length;
+                build_lswitch_arp_nd_local_resp_match(match, op);
 
                 ds_clear(actions);
                 ds_put_format(actions,
@@ -10658,6 +10681,7 @@ build_lswitch_arp_nd_responder_known_ips(struct ovn_port *op,
 
                 /* Do not reply to a solicitation from the port that owns
                  * the address (otherwise DAD detection will fail). */
+                ds_truncate(match, match_nd_len);
                 ds_put_format(match, " && inport == %s", op->json_key);
                 ovn_lflow_add(lflows, op->od, S_SWITCH_IN_ARP_ND_RSP, 100,
                               ds_cstr(match), "next;", op->lflow_ref,
@@ -19554,7 +19578,7 @@ build_lswitch_and_lrouter_iterate_by_lsp(struct ovn_port *op,
     build_mirror_lflows(op, ls_ports, lflows);
     build_lswitch_port_sec_op(op, lflows, actions, match);
     build_lswitch_learn_fdb_op(op, lflows, actions, match);
-    build_lswitch_arp_nd_responder_skip_local(op, lflows, match);
+    build_lswitch_from_localnet_op(op, lflows, match);
     build_lswitch_arp_nd_responder_known_ips(op, lflows, ls_ports,
                                              meter_groups, actions, match);
     build_lswitch_dhcp_options_and_response(op, lflows, meter_groups);
diff --git a/northd/ovn-northd.8.xml b/northd/ovn-northd.8.xml
index 4d6370da6b..4ba4ab3cd1 100644
--- a/northd/ovn-northd.8.xml
+++ b/northd/ovn-northd.8.xml
@@ -488,6 +488,21 @@
         </ul>
       </li>
 
+      <li>
+        <p>
+          For each localnet logical port <var>p</var>, a priority-50
+          fallback flow is added with the match
+          <code>inport == <var>p</var></code> and action
+          <code>flags.localnet = 1; next;</code>.  This marks traffic
+          arriving from localnet ports so that downstream stages (e.g.,
+          ARP/ND responder) can condition their behavior.  When FDB
+          learning is enabled on the localnet port, the priority-100
+          flow described above already sets <code>flags.localnet</code>,
+          so this priority-50 flow only takes effect when FDB learning
+          is not configured.
+        </p>
+      </li>
+
       <li>
         One priority-0 fallback flow that matches all packets and advances to
         the next table.
@@ -1734,12 +1749,16 @@
     </p>
 
     <p>
-      Note that ARP requests received from <code>localnet</code> logical
-      inports can either go directly to VMs, in which case the VM responds or
-      can hit an ARP responder for a logical router port if the packet is used
-      to resolve a logical router port next hop address.  In either case,
-      logical switch ARP responder rules will not be hit.  It contains these
-      logical flows:
+      ARP/ND requests received from <code>localnet</code> logical inports
+      do hit the ARP/ND responder, but the response is limited to the
+      chassis that hosts the target VIF.  This is achieved by adding
+      a <code>flags.localnet</code> check to the priority-50 reply flows
+      (see below): when the request arrives from a localnet port
+      (<code>flags.localnet == 1</code>), only the chassis on which the
+      target port is resident will reply.  When the request arrives from
+      a non-localnet port (<code>flags.localnet == 0</code>), the
+      response is unconditional, preserving VIF-to-VIF proxy ARP/ND
+      behavior.  This table contains these logical flows:
      </p>
 
     <ul>
@@ -1750,18 +1769,10 @@
         router ingress pipeline.
       </li>
       <li>
-        If the logical switch has no router ports with options:arp_proxy
-        configured add a priority-100 flows to skip the ARP responder if inport
-        is of type <code>localnet</code> advances directly to the next table.
-        ARP requests sent to <code>localnet</code> ports can be received by
-        multiple hypervisors.  Now, because the same mac binding rules are
-        downloaded to all hypervisors, each of the multiple hypervisors will
-        respond.  This will confuse L2 learning on the source of the ARP
-        requests.  ARP requests received on an inport of type
-        <code>router</code> are not expected to hit any logical switch ARP
-        responder flows.  However, no skip flows are installed for these
-        packets, as there would be some additional flow cost for this and the
-        value appears limited.
+        ARP/ND requests received on an inport of type <code>router</code> are
+        not expected to hit any logical switch ARP responder flows.  However,
+        no skip flows are installed for these packets, as there would be some
+        additional flow cost for this and the value appears limited.
       </li>
 
       <li>
@@ -1816,6 +1827,18 @@ flags.loopback = 1;
 output;
         </pre>
 
+        <p>
+          On logical switches that have a localnet port, the match for
+          these flows includes an additional condition:
+          <code>((flags.localnet == 1 &amp;&amp;
+          is_chassis_resident(<var>port</var>)) ||
+          flags.localnet == 0)</code>.
+          This ensures that when an ARP request arrives from a localnet
+          port, only the chassis hosting the target VIF responds.  When
+          the request arrives from a non-localnet port, the response is
+          unconditional, preserving VIF-to-VIF proxy ARP behavior.
+        </p>
+
         <p>
           These flows are omitted for logical ports (other than router ports or
           <code>localport</code> ports) that are down (unless <code>
@@ -1877,6 +1900,19 @@ nd_na_router {
 };
         </pre>
 
+        <p>
+          On logical switches that have a localnet port, the match for
+          these flows includes an additional condition:
+          <code>((flags.localnet == 1 &amp;&amp;
+          is_chassis_resident(<var>port</var>)) ||
+          flags.localnet == 0)</code>.
+          This ensures that when an ND solicitation arrives from a
+          localnet port, only the chassis hosting the target VIF
+          responds.  When the solicitation arrives from a non-localnet
+          port, the response is unconditional, preserving VIF-to-VIF
+          proxy ND behavior.
+        </p>
+
         <p>
           These flows are omitted for logical ports (other than router ports or
           <code>localport</code> ports) that are down (unless <code>
@@ -1896,8 +1932,8 @@ nd_na_router {
 
       <li>
         <p>
-          Priority-100 flows with match criteria like the ARP and ND flows
-          above, except that they only match packets from the
+          Priority-100 flows with match criteria similar to the ARP and ND
+          flows above, except that they only match packets from the
           <code>inport</code> that owns the IP addresses in question, with
           action <code>next;</code>.  These flows prevent OVN from replying to,
           for example, an ARP request emitted by a VM for its own IP address.
diff --git a/tests/ovn-northd.at b/tests/ovn-northd.at
index 1d7bd6c288..df7bac1529 100644
--- a/tests/ovn-northd.at
+++ b/tests/ovn-northd.at
@@ -7730,7 +7730,9 @@ AT_CHECK([grep -e "ls_in_.*_fdb.*S1-vm1" S1flows | ovn_strip_lflows], [0], [dnl
 ])
 
 #Verify the flows for a non-default port type (localnet port)
-AT_CHECK([grep -e "ls_in_.*_fdb.*S1-localnet" S1flows], [1], [])
+AT_CHECK([grep -e "ls_in_.*_fdb.*S1-localnet" S1flows | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_lookup_fdb   ), priority=50   , match=(inport == "S1-localnet"), action=(flags.localnet = 1; next;)
+])
 
 OVN_CLEANUP_NORTHD
 AT_CLEANUP
@@ -10039,6 +10041,7 @@ AT_CHECK([ovn-nbctl --wait=sb sync])
 # Check MAC learning flows with 'localnet_learn_fdb' default (false)
 AT_CHECK([ovn-sbctl dump-flows ls0 | grep -e 'ls_in_\(put\|lookup\)_fdb' | ovn_strip_lflows], [0], [dnl
   table=??(ls_in_lookup_fdb   ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_lookup_fdb   ), priority=50   , match=(inport == "ln_port"), action=(flags.localnet = 1; next;)
   table=??(ls_in_put_fdb      ), priority=0    , match=(1), action=(next;)
 ])
 
@@ -10047,6 +10050,7 @@ AT_CHECK([ovn-nbctl --wait=sb lsp-set-options ln_port localnet_learn_fdb=true])
 AT_CHECK([ovn-sbctl dump-flows ls0 | grep -e 'ls_in_\(put\|lookup\)_fdb' | ovn_strip_lflows], [0], [dnl
   table=??(ls_in_lookup_fdb   ), priority=0    , match=(1), action=(next;)
   table=??(ls_in_lookup_fdb   ), priority=100  , match=(inport == "ln_port"), action=(flags.localnet = 1; reg0[[11]] = lookup_fdb(inport, eth.src); next;)
+  table=??(ls_in_lookup_fdb   ), priority=50   , match=(inport == "ln_port"), action=(flags.localnet = 1; next;)
   table=??(ls_in_put_fdb      ), priority=0    , match=(1), action=(next;)
   table=??(ls_in_put_fdb      ), priority=100  , match=(inport == "ln_port" && reg0[[11]] == 0), action=(put_fdb(inport, eth.src); next;)
 ])
@@ -10055,6 +10059,7 @@ AT_CHECK([ovn-sbctl dump-flows ls0 | grep -e 'ls_in_\(put\|lookup\)_fdb' | ovn_s
 AT_CHECK([ovn-nbctl --wait=sb lsp-set-options ln_port localnet_learn_fdb=false])
 AT_CHECK([ovn-sbctl dump-flows ls0 | grep -e 'ls_in_\(put\|lookup\)_fdb' | ovn_strip_lflows], [0], [dnl
   table=??(ls_in_lookup_fdb   ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_lookup_fdb   ), priority=50   , match=(inport == "ln_port"), action=(flags.localnet = 1; next;)
   table=??(ls_in_put_fdb      ), priority=0    , match=(1), action=(next;)
 ])
 
@@ -10404,6 +10409,110 @@ OVN_CLEANUP_NORTHD
 AT_CLEANUP
 ])
 
+OVN_FOR_EACH_NORTHD_NO_HV([
+AT_SETUP([ARP/ND responder for localnet-sourced requests])
+ovn_start
+
+dnl Switch with localnet port.
+check ovn-nbctl ls-add ls1
+check ovn-nbctl lsp-add-localnet-port ls1 ln1 physnet1
+check ovn-nbctl lsp-add ls1 vm1 \
+    -- lsp-set-addresses vm1 "00:00:00:00:00:01 10.0.0.1 fd01::1"
+check ovn-nbctl lsp-add ls1 vm2 \
+    -- lsp-set-addresses vm2 "00:00:00:00:00:02 10.0.0.2 fd01::2"
+
+dnl Switch without localnet port.
+check ovn-nbctl ls-add ls2
+check ovn-nbctl --wait=sb lsp-add ls2 vm3 \
+    -- lsp-set-addresses vm3 "00:00:00:00:00:03 10.0.0.3 fd01::3"
+
+AS_BOX([FDB learning disabled])
+
+dnl ls1: ls_in_lookup_fdb should have priority 0 default +
+dnl priority 50 flags.localnet.
+AT_CHECK([ovn-sbctl dump-flows ls1 | grep -e 'ls_in_lookup_fdb' | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_lookup_fdb   ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_lookup_fdb   ), priority=50   , match=(inport == "ln1"), action=(flags.localnet = 1; next;)
+])
+
+dnl ls1: ls_in_arp_rsp should include flags.localnet condition for
+dnl priority 50 ARP/ND reply flows but NOT for priority 100 self-reply
+dnl flows (since those match on inport == VIF, flags.localnet is always 0).
+AT_CHECK([ovn-sbctl dump-flows ls1 | grep -e 'ls_in_arp_rsp' | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_arp_rsp      ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(arp.tpa == 10.0.0.1 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && inport == "vm1"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(arp.tpa == 10.0.0.2 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && inport == "vm2"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:1 && nd.target == fd01::1 && inport == "vm1"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:2 && nd.target == fd01::2 && inport == "vm2"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(arp.tpa == 10.0.0.1 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && ((flags.localnet == 1 && is_chassis_resident("vm1")) || flags.localnet == 0)), action=(eth.dst = eth.src; eth.src = 00:00:00:00:00:01; arp.op = 2; /* ARP reply */ arp.tha = arp.sha; arp.sha = 00:00:00:00:00:01; arp.tpa = arp.spa; arp.spa = 10.0.0.1; outport = inport; flags.loopback = 1; output;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(arp.tpa == 10.0.0.2 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && ((flags.localnet == 1 && is_chassis_resident("vm2")) || flags.localnet == 0)), action=(eth.dst = eth.src; eth.src = 00:00:00:00:00:02; arp.op = 2; /* ARP reply */ arp.tha = arp.sha; arp.sha = 00:00:00:00:00:02; arp.tpa = arp.spa; arp.spa = 10.0.0.2; outport = inport; flags.loopback = 1; output;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:1 && nd.target == fd01::1 && ((flags.localnet == 1 && is_chassis_resident("vm1")) || flags.localnet == 0)), action=(nd_na { eth.src = 00:00:00:00:00:01; ip6.src = fd01::1; nd.target = fd01::1; nd.tll = 00:00:00:00:00:01; outport = inport; flags.loopback = 1; output; };)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:2 && nd.target == fd01::2 && ((flags.localnet == 1 && is_chassis_resident("vm2")) || flags.localnet == 0)), action=(nd_na { eth.src = 00:00:00:00:00:02; ip6.src = fd01::2; nd.target = fd01::2; nd.tll = 00:00:00:00:00:02; outport = inport; flags.loopback = 1; output; };)
+])
+
+dnl ls2: ls_in_arp_rsp should NOT include flags.localnet condition.
+AT_CHECK([ovn-sbctl dump-flows ls2 | grep -e 'ls_in_arp_rsp' | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_arp_rsp      ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(arp.tpa == 10.0.0.3 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && inport == "vm3"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:3 && nd.target == fd01::3 && inport == "vm3"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(arp.tpa == 10.0.0.3 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff), action=(eth.dst = eth.src; eth.src = 00:00:00:00:00:03; arp.op = 2; /* ARP reply */ arp.tha = arp.sha; arp.sha = 00:00:00:00:00:03; arp.tpa = arp.spa; arp.spa = 10.0.0.3; outport = inport; flags.loopback = 1; output;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:3 && nd.target == fd01::3), action=(nd_na { eth.src = 00:00:00:00:00:03; ip6.src = fd01::3; nd.target = fd01::3; nd.tll = 00:00:00:00:00:03; outport = inport; flags.loopback = 1; output; };)
+])
+
+dnl ls2: ls_in_lookup_fdb should only have priority 0 default,
+dnl no priority 50 flags.localnet.
+AT_CHECK([ovn-sbctl dump-flows ls2 | grep -e 'ls_in_lookup_fdb' | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_lookup_fdb   ), priority=0    , match=(1), action=(next;)
+])
+
+AS_BOX([Enable FDB learning on ln1])
+check ovn-nbctl --wait=sb lsp-set-options ln1 localnet_learn_fdb=true
+
+dnl ls1: ls_in_lookup_fdb should have priority 100 FDB +
+dnl priority 50 fallback.
+AT_CHECK([ovn-sbctl dump-flows ls1 | grep -e 'ls_in_lookup_fdb' | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_lookup_fdb   ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_lookup_fdb   ), priority=100  , match=(inport == "ln1"), action=(flags.localnet = 1; reg0[[11]] = lookup_fdb(inport, eth.src); next;)
+  table=??(ls_in_lookup_fdb   ), priority=50   , match=(inport == "ln1"), action=(flags.localnet = 1; next;)
+])
+
+dnl ls1: ls_in_arp_rsp should be unchanged.
+AT_CHECK([ovn-sbctl dump-flows ls1 | grep -e 'ls_in_arp_rsp' | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_arp_rsp      ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(arp.tpa == 10.0.0.1 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && inport == "vm1"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(arp.tpa == 10.0.0.2 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && inport == "vm2"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:1 && nd.target == fd01::1 && inport == "vm1"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:2 && nd.target == fd01::2 && inport == "vm2"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(arp.tpa == 10.0.0.1 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && ((flags.localnet == 1 && is_chassis_resident("vm1")) || flags.localnet == 0)), action=(eth.dst = eth.src; eth.src = 00:00:00:00:00:01; arp.op = 2; /* ARP reply */ arp.tha = arp.sha; arp.sha = 00:00:00:00:00:01; arp.tpa = arp.spa; arp.spa = 10.0.0.1; outport = inport; flags.loopback = 1; output;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(arp.tpa == 10.0.0.2 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && ((flags.localnet == 1 && is_chassis_resident("vm2")) || flags.localnet == 0)), action=(eth.dst = eth.src; eth.src = 00:00:00:00:00:02; arp.op = 2; /* ARP reply */ arp.tha = arp.sha; arp.sha = 00:00:00:00:00:02; arp.tpa = arp.spa; arp.spa = 10.0.0.2; outport = inport; flags.loopback = 1; output;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:1 && nd.target == fd01::1 && ((flags.localnet == 1 && is_chassis_resident("vm1")) || flags.localnet == 0)), action=(nd_na { eth.src = 00:00:00:00:00:01; ip6.src = fd01::1; nd.target = fd01::1; nd.tll = 00:00:00:00:00:01; outport = inport; flags.loopback = 1; output; };)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:2 && nd.target == fd01::2 && ((flags.localnet == 1 && is_chassis_resident("vm2")) || flags.localnet == 0)), action=(nd_na { eth.src = 00:00:00:00:00:02; ip6.src = fd01::2; nd.target = fd01::2; nd.tll = 00:00:00:00:00:02; outport = inport; flags.loopback = 1; output; };)
+])
+
+AS_BOX([Disable FDB learning])
+check ovn-nbctl --wait=sb lsp-set-options ln1 localnet_learn_fdb=false
+
+AT_CHECK([ovn-sbctl dump-flows ls1 | grep -e 'ls_in_lookup_fdb' | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_lookup_fdb   ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_lookup_fdb   ), priority=50   , match=(inport == "ln1"), action=(flags.localnet = 1; next;)
+])
+
+AT_CHECK([ovn-sbctl dump-flows ls1 | grep -e 'ls_in_arp_rsp' | ovn_strip_lflows], [0], [dnl
+  table=??(ls_in_arp_rsp      ), priority=0    , match=(1), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(arp.tpa == 10.0.0.1 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && inport == "vm1"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(arp.tpa == 10.0.0.2 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && inport == "vm2"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:1 && nd.target == fd01::1 && inport == "vm1"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=100  , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:2 && nd.target == fd01::2 && inport == "vm2"), action=(next;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(arp.tpa == 10.0.0.1 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && ((flags.localnet == 1 && is_chassis_resident("vm1")) || flags.localnet == 0)), action=(eth.dst = eth.src; eth.src = 00:00:00:00:00:01; arp.op = 2; /* ARP reply */ arp.tha = arp.sha; arp.sha = 00:00:00:00:00:01; arp.tpa = arp.spa; arp.spa = 10.0.0.1; outport = inport; flags.loopback = 1; output;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(arp.tpa == 10.0.0.2 && arp.op == 1 && eth.dst == ff:ff:ff:ff:ff:ff && ((flags.localnet == 1 && is_chassis_resident("vm2")) || flags.localnet == 0)), action=(eth.dst = eth.src; eth.src = 00:00:00:00:00:02; arp.op = 2; /* ARP reply */ arp.tha = arp.sha; arp.sha = 00:00:00:00:00:02; arp.tpa = arp.spa; arp.spa = 10.0.0.2; outport = inport; flags.loopback = 1; output;)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:1 && nd.target == fd01::1 && ((flags.localnet == 1 && is_chassis_resident("vm1")) || flags.localnet == 0)), action=(nd_na { eth.src = 00:00:00:00:00:01; ip6.src = fd01::1; nd.target = fd01::1; nd.tll = 00:00:00:00:00:01; outport = inport; flags.loopback = 1; output; };)
+  table=??(ls_in_arp_rsp      ), priority=50   , match=(nd_ns_mcast && ip6.dst == ff02::1:ff00:2 && nd.target == fd01::2 && ((flags.localnet == 1 && is_chassis_resident("vm2")) || flags.localnet == 0)), action=(nd_na { eth.src = 00:00:00:00:00:02; ip6.src = fd01::2; nd.target = fd01::2; nd.tll = 00:00:00:00:00:02; outport = inport; flags.loopback = 1; output; };)
+])
+
+OVN_CLEANUP_NORTHD
+AT_CLEANUP
+])
+
 OVN_FOR_EACH_NORTHD_NO_HV([
 AT_SETUP([Address set incremental processing])
 ovn_start
diff --git a/tests/ovn.at b/tests/ovn.at
index c0ae611bc9..fbaa63d99c 100644
--- a/tests/ovn.at
+++ b/tests/ovn.at
@@ -10190,6 +10190,195 @@ OVN_CLEANUP([hv1])
 AT_CLEANUP
 ])
 
+OVN_FOR_EACH_NORTHD([
+AT_SETUP([ARP/ND from localnet -- proxy reply on resident chassis only])
+AT_SKIP_IF([test $HAVE_SCAPY = no])
+ovn_start
+
+dnl Create logical switch with localnet port.
+check ovn-nbctl ls-add ls1
+check ovn-nbctl lsp-add-localnet-port ls1 ln1 physnet1
+check ovn-nbctl lsp-add ls1 vm1 \
+    -- lsp-set-addresses vm1 "f0:00:00:00:00:01 10.0.0.1 fd01::1"
+check ovn-nbctl lsp-add ls1 vm2 \
+    -- lsp-set-addresses vm2 "f0:00:00:00:00:02 10.0.0.2 fd01::2"
+
+dnl Two hypervisors with bridge-mappings.
+net_add n1
+
+sim_add hv1
+as hv1
+ovs-vsctl \
+    -- add-br br-phys \
+    -- add-br br-eth0
+ovn_attach n1 br-phys 192.168.0.1
+check ovs-vsctl set Open_vSwitch . external-ids:ovn-bridge-mappings=physnet1:br-eth0
+check ovs-vsctl add-port br-eth0 snoopvif1 \
+    -- set Interface snoopvif1 options:tx_pcap=hv1/snoopvif-tx.pcap \
+                                options:rxq_pcap=hv1/snoopvif-rx.pcap
+check ovs-vsctl add-port br-int vm1 \
+    -- set Interface vm1 external-ids:iface-id=vm1 \
+                         options:tx_pcap=hv1/vm1-tx.pcap \
+                         options:rxq_pcap=hv1/vm1-rx.pcap
+
+sim_add hv2
+as hv2
+ovs-vsctl \
+    -- add-br br-phys \
+    -- add-br br-eth0
+ovn_attach n1 br-phys 192.168.0.2
+check ovs-vsctl set Open_vSwitch . external-ids:ovn-bridge-mappings=physnet1:br-eth0
+check ovs-vsctl add-port br-eth0 snoopvif2 \
+    -- set Interface snoopvif2 options:tx_pcap=hv2/snoopvif-tx.pcap \
+                                options:rxq_pcap=hv2/snoopvif-rx.pcap
+check ovs-vsctl add-port br-int vm2 \
+    -- set Interface vm2 external-ids:iface-id=vm2 \
+                         options:tx_pcap=hv2/vm2-tx.pcap \
+                         options:rxq_pcap=hv2/vm2-rx.pcap
+
+wait_for_ports_up vm1 vm2
+OVN_POPULATE_ARP
+check ovn-nbctl --wait=hv sync
+
+dnl Helper: construct ARP request.
+build_arp_request() {
+    local sha=$1 spa=$2 tpa=$3
+    fmt_pkt "Ether(dst='ff:ff:ff:ff:ff:ff', src='${sha}')/ \
+             ARP(hwsrc='${sha}', hwdst='ff:ff:ff:ff:ff:ff', \
+                 psrc='${spa}', pdst='${tpa}')"
+}
+
+dnl Helper: construct expected ARP reply.
+build_arp_reply() {
+    local req_sha=$1 req_spa=$2 reply_sha=$3 reply_spa=$4
+    fmt_pkt "Ether(dst='${req_sha}', src='${reply_sha}')/ \
+             ARP(op=2, hwsrc='${reply_sha}', hwdst='${req_sha}', \
+                 psrc='${reply_spa}', pdst='${req_spa}')"
+}
+
+dnl Helper: construct ND solicitation.
+build_nd_ns() {
+    local sha=$1 spa=$2 tpa=$3 sol_mcast=$4
+    fmt_pkt "Ether(dst='33:33:ff:00:00:0${tpa##*:}', src='${sha}')/ \
+             IPv6(src='${spa}', dst='${sol_mcast}')/ \
+             ICMPv6ND_NS(tgt='${tpa}')/ \
+             ICMPv6NDOptSrcLLAddr(lladdr='${sha}')"
+}
+
+dnl Helper: construct expected ND advertisement.
+build_nd_na() {
+    local req_sha=$1 req_spa=$2 reply_sha=$3 reply_tgt=$4
+    fmt_pkt "Ether(dst='${req_sha}', src='${reply_sha}')/ \
+             IPv6(src='${reply_tgt}', dst='${req_spa}')/ \
+             ICMPv6ND_NA(tgt='${reply_tgt}', R=0, S=1, O=1)/ \
+             ICMPv6NDOptDstLLAddr(lladdr='${reply_sha}')"
+}
+
+test_arp_nd_localnet() {
+    AS_BOX([ARP from localnet on hv1 for vm1 - expect reply])
+    as hv1 reset_pcap_file snoopvif1 hv1/snoopvif
+    as hv2 reset_pcap_file snoopvif2 hv2/snoopvif
+    as hv1 reset_pcap_file vm1 hv1/vm1
+    as hv2 reset_pcap_file vm2 hv2/vm2
+
+    dnl ARP request from br-eth0 on hv1 for vm1 (10.0.0.1).
+    dnl vm1 is resident on hv1, so hv1 should reply.
+    local arp_req=$(build_arp_request "f0:00:00:00:00:99" "10.0.0.99" "10.0.0.1")
+    as hv1 ovs-appctl netdev-dummy/receive snoopvif1 $arp_req
+    local arp_rep=$(build_arp_reply "f0:00:00:00:00:99" "10.0.0.99" \
+                                    "f0:00:00:00:00:01" "10.0.0.1")
+    echo $arp_rep > expected_arp_reply
+    OVN_CHECK_PACKETS_CONTAIN([hv1/snoopvif-tx.pcap], [expected_arp_reply])
+
+    AS_BOX([ARP from localnet on hv2 for vm1 - expect no reply])
+    as hv2 reset_pcap_file snoopvif2 hv2/snoopvif
+
+    dnl ARP request from br-eth0 on hv2 for vm1 (10.0.0.1).
+    dnl vm1 is NOT resident on hv2, so hv2 should NOT reply.
+    dnl To avoid relying on sleep, we also send an ARP request for vm2
+    dnl (which IS resident on hv2) and wait for that reply.  This proves
+    dnl the pipeline is running and any reply for vm1 would have appeared.
+    as hv2 ovs-appctl netdev-dummy/receive snoopvif2 $arp_req
+
+    local arp_req_vm2=$(build_arp_request "f0:00:00:00:00:99" "10.0.0.99" "10.0.0.2")
+    as hv2 ovs-appctl netdev-dummy/receive snoopvif2 $arp_req_vm2
+    local arp_rep_vm2=$(build_arp_reply "f0:00:00:00:00:99" "10.0.0.99" \
+                                        "f0:00:00:00:00:02" "10.0.0.2")
+    echo $arp_rep_vm2 > expected_arp_vm2
+    OVN_CHECK_PACKETS_CONTAIN([hv2/snoopvif-tx.pcap], [expected_arp_vm2])
+
+    dnl Now verify that no ARP reply for vm1 was generated on hv2.
+    AT_CHECK([$PYTHON "$ovs_srcdir/utilities/ovs-pcap.in" hv2/snoopvif-tx.pcap | \
+              grep -c "$arp_rep"], [1], [dnl
+0
+])
+
+    AS_BOX([ARP from vm2 VIF for vm1 - expect proxy reply])
+    as hv2 reset_pcap_file vm2 hv2/vm2
+    local arp_req2=$(build_arp_request "f0:00:00:00:00:02" "10.0.0.2" "10.0.0.1")
+    as hv2 ovs-appctl netdev-dummy/receive vm2 $arp_req2
+    local arp_rep2=$(build_arp_reply "f0:00:00:00:00:02" "10.0.0.2" \
+                                     "f0:00:00:00:00:01" "10.0.0.1")
+    echo $arp_rep2 > expected_arp_proxy
+    OVN_CHECK_PACKETS_CONTAIN([hv2/vm2-tx.pcap], [expected_arp_proxy])
+
+    AS_BOX([ND from localnet on hv1 for vm1 - expect reply])
+    as hv1 reset_pcap_file snoopvif1 hv1/snoopvif
+    as hv2 reset_pcap_file snoopvif2 hv2/snoopvif
+
+    dnl ND solicitation from br-eth0 on hv1 for vm1 IPv6 (fd01::1).
+    dnl vm1 is resident on hv1, so hv1 should reply.
+    local nd_ns=$(build_nd_ns "f0:00:00:00:00:99" "fd01::99" "fd01::1" "ff02::1:ff00:1")
+    as hv1 ovs-appctl netdev-dummy/receive snoopvif1 $nd_ns
+    local nd_na=$(build_nd_na "f0:00:00:00:00:99" "fd01::99" \
+                               "f0:00:00:00:00:01" "fd01::1")
+    echo $nd_na > expected_nd_reply
+    OVN_CHECK_PACKETS_CONTAIN([hv1/snoopvif-tx.pcap], [expected_nd_reply])
+
+    AS_BOX([ND from localnet on hv2 for vm1 - expect no reply])
+    as hv2 reset_pcap_file snoopvif2 hv2/snoopvif
+
+    dnl ND solicitation from br-eth0 on hv2 for vm1 IPv6 (fd01::1).
+    dnl vm1 is NOT resident on hv2, so hv2 should NOT reply.
+    dnl Same technique: send ND for vm2 (resident) and wait for that reply.
+    as hv2 ovs-appctl netdev-dummy/receive snoopvif2 $nd_ns
+
+    local nd_ns_vm2=$(build_nd_ns "f0:00:00:00:00:99" "fd01::99" "fd01::2" "ff02::1:ff00:2")
+    as hv2 ovs-appctl netdev-dummy/receive snoopvif2 $nd_ns_vm2
+    local nd_na_vm2=$(build_nd_na "f0:00:00:00:00:99" "fd01::99" \
+                                   "f0:00:00:00:00:02" "fd01::2")
+    echo $nd_na_vm2 > expected_nd_vm2
+    OVN_CHECK_PACKETS_CONTAIN([hv2/snoopvif-tx.pcap], [expected_nd_vm2])
+
+    dnl Now verify that no ND advertisement for vm1 was generated on hv2.
+    AT_CHECK([$PYTHON "$ovs_srcdir/utilities/ovs-pcap.in" hv2/snoopvif-tx.pcap | \
+              grep -c "$nd_na"], [1], [dnl
+0
+])
+
+    AS_BOX([ND from vm2 VIF for vm1 - expect proxy reply])
+    as hv2 reset_pcap_file vm2 hv2/vm2
+    local nd_ns2=$(build_nd_ns "f0:00:00:00:00:02" "fd01::2" "fd01::1" "ff02::1:ff00:1")
+    as hv2 ovs-appctl netdev-dummy/receive vm2 $nd_ns2
+    local nd_na2=$(build_nd_na "f0:00:00:00:00:02" "fd01::2" \
+                                "f0:00:00:00:00:01" "fd01::1")
+    echo $nd_na2 > expected_nd_proxy
+    OVN_CHECK_PACKETS_CONTAIN([hv2/vm2-tx.pcap], [expected_nd_proxy])
+}
+
+AS_BOX([FDB learning disabled])
+test_arp_nd_localnet
+
+AS_BOX([FDB learning enabled])
+dnl Use 'set' instead of 'lsp-set-options' to preserve network_name.
+check ovn-nbctl --wait=hv set Logical_Switch_Port ln1 \
+    options:localnet_learn_fdb=true
+test_arp_nd_localnet
+
+OVN_CLEANUP([hv1],[hv2])
+AT_CLEANUP
+])
+
 OVN_FOR_EACH_NORTHD([
 AT_SETUP([send reverse arp for router without ipv4 address])
 ovn_start
-- 
2.53.0

_______________________________________________
dev mailing list
[email protected]
https://mail.openvswitch.org/mailman/listinfo/ovs-dev

Reply via email to