VFs should continue normal packet Rx/Tx after PF ifconfig down/up. When mailbox messages lack the TXGBE_VT_MSGTYPE_CTS flag, the PF is considered down. In this state, the VF reports link down and stops transmitting. Upon detecting the loss of CTS, the VF sends a reset request to the PF. If the request succeeds (indicating PF recovery), the VF triggers an RTE_ETH_EVENT_INTR_RESET event to notify the application or users to reset the VF.
The write_posted() based VF_RESET request is the only recovery path: the PF only marks this VF as ready (and starts sending CTS) after it processes VF_RESET, so this request is required for the VF to recover. write_posted() may busy-wait for the ACK in the interrupt thread, but the PF does not send further mailbox messages once it is down, so this blocking is not continuously triggered. Additionally, hw->rx_loaded and hw->offset_loaded must be reset when PF ifconfig down; otherwise, because hardware counter registers are cleared during PF reset, the VF's software counters will overflow to 0xFFFFFFFF. Signed-off-by: Zaiyu Wang <[email protected]> --- doc/guides/rel_notes/release_26_07.rst | 5 ++ drivers/net/txgbe/base/txgbe_type.h | 1 + drivers/net/txgbe/txgbe_ethdev.c | 4 +- drivers/net/txgbe/txgbe_ethdev_vf.c | 86 ++++++++++++++++++++++---- 4 files changed, 83 insertions(+), 13 deletions(-) diff --git a/doc/guides/rel_notes/release_26_07.rst b/doc/guides/rel_notes/release_26_07.rst index 06cd52b777..46935ba872 100644 --- a/doc/guides/rel_notes/release_26_07.rst +++ b/doc/guides/rel_notes/release_26_07.rst @@ -190,6 +190,11 @@ New Features The ``RTE_ETH_TX_OFFLOAD_UDP_TSO`` capability was advertised since the driver's initial integration but the data path was missing; it is now functional. + * Added support for VF sensing PF down. VFs now detect when the PF goes + down (via the mailbox ``TXGBE_VT_MSGTYPE_CTS`` flag) and report link + down. When the PF comes back, the VF triggers an + ``RTE_ETH_EVENT_INTR_RESET`` event so the application can reset the VF + and resume normal packet Rx/Tx. Removed Items diff --git a/drivers/net/txgbe/base/txgbe_type.h b/drivers/net/txgbe/base/txgbe_type.h index ede780321f..c73a9ebcb4 100644 --- a/drivers/net/txgbe/base/txgbe_type.h +++ b/drivers/net/txgbe/base/txgbe_type.h @@ -883,6 +883,7 @@ struct txgbe_hw { rte_atomic32_t swfw_busy; u32 fec_mode; u32 cur_fec_link; + RTE_ATOMIC(bool) pf_running; }; struct txgbe_backplane_ability { diff --git a/drivers/net/txgbe/txgbe_ethdev.c b/drivers/net/txgbe/txgbe_ethdev.c index 0f484dfe91..c99734cced 100644 --- a/drivers/net/txgbe/txgbe_ethdev.c +++ b/drivers/net/txgbe/txgbe_ethdev.c @@ -3150,7 +3150,9 @@ txgbe_dev_link_update_share(struct rte_eth_dev *dev, hw->mac.get_link_status = true; - if (intr->flags & TXGBE_FLAG_NEED_LINK_CONFIG) + if (intr->flags & TXGBE_FLAG_NEED_LINK_CONFIG || + (txgbe_is_vf(hw) && !rte_atomic_load_explicit(&hw->pf_running, + rte_memory_order_acquire))) return rte_eth_linkstatus_set(dev, &link); /* check if it needs to wait to complete, if lsc interrupt is enabled */ diff --git a/drivers/net/txgbe/txgbe_ethdev_vf.c b/drivers/net/txgbe/txgbe_ethdev_vf.c index 7a50c7a855..c57ac57141 100644 --- a/drivers/net/txgbe/txgbe_ethdev_vf.c +++ b/drivers/net/txgbe/txgbe_ethdev_vf.c @@ -281,6 +281,8 @@ eth_txgbevf_dev_init(struct rte_eth_dev *eth_dev) hw->subsystem_device_id = pci_dev->id.subsystem_device_id; hw->subsystem_vendor_id = pci_dev->id.subsystem_vendor_id; hw->hw_addr = (void *)pci_dev->mem_resource[0].addr; + rte_atomic_store_explicit(&hw->pf_running, true, + rte_memory_order_release); /* initialize the vfta */ memset(shadow_vfta, 0, sizeof(*shadow_vfta)); @@ -1405,10 +1407,21 @@ static s32 txgbevf_get_pf_link_status(struct rte_eth_dev *dev) if (retval) return 0; + if (!(msgbuf[0] & TXGBE_NOFITY_VF_LINK_STATUS)) + return 0; + rte_eth_linkstatus_get(dev, &link); + if (!rte_atomic_load_explicit(&hw->pf_running, + rte_memory_order_acquire)) { + link.link_status = RTE_ETH_LINK_DOWN; + link.link_speed = RTE_ETH_SPEED_NUM_NONE; + link.link_duplex = RTE_ETH_LINK_HALF_DUPLEX; + return rte_eth_linkstatus_set(dev, &link); + } + link_up = msgbuf[1] & TXGBE_VFSTATUS_UP; - link_speed = (msgbuf[1] & 0xFFF0) >> 1; + link_speed = (msgbuf[1] & 0x1FFFFE) >> 1; if (link_up == link.link_status && link_speed == link.link_speed) return 0; @@ -1434,10 +1447,23 @@ static s32 txgbevf_get_pf_link_status(struct rte_eth_dev *dev) static void txgbevf_check_link_for_intr(struct rte_eth_dev *dev) { struct rte_eth_link orig_link, new_link; + struct txgbe_hw *hw = TXGBE_DEV_HW(dev); rte_eth_linkstatus_get(dev, &orig_link); - txgbevf_dev_link_update(dev, 0); - rte_eth_linkstatus_get(dev, &new_link); + + if (rte_atomic_load_explicit(&hw->pf_running, + rte_memory_order_acquire)) { + txgbevf_dev_link_update(dev, 0); + rte_eth_linkstatus_get(dev, &new_link); + } else { + DEBUGOUT("PF ifconfig down, so VF link down"); + new_link.link_status = RTE_ETH_LINK_DOWN; + new_link.link_speed = RTE_ETH_SPEED_NUM_NONE; + new_link.link_duplex = RTE_ETH_LINK_HALF_DUPLEX; + new_link.link_autoneg = !(dev->data->dev_conf.link_speeds & + RTE_ETH_LINK_SPEED_FIXED); + rte_eth_linkstatus_set(dev, &new_link); + } PMD_DRV_LOG(INFO, "orig_link: %d, new_link: %d", orig_link.link_status, new_link.link_status); @@ -1450,22 +1476,58 @@ static void txgbevf_check_link_for_intr(struct rte_eth_dev *dev) static void txgbevf_mbx_process(struct rte_eth_dev *dev) { struct txgbe_hw *hw = TXGBE_DEV_HW(dev); + struct txgbe_mbx_info *mbx = &hw->mbx; + u32 msgbuf = 0; u32 in_msg = 0; - /* peek the message first */ + /* Peek the message first */ in_msg = rd32(hw, TXGBE_VFMBX); - /* PF reset VF event */ - if (in_msg & TXGBE_PF_CONTROL_MSG) { - if (in_msg & TXGBE_NOFITY_VF_LINK_STATUS) { - txgbevf_get_pf_link_status(dev); - } else { - /* dummy mbx read to ack pf */ - txgbe_read_mbx(hw, &in_msg, 1, 0); - /* check link status if pf ping vf */ + /* PF control message */ + if (!(in_msg & TXGBE_PF_CONTROL_MSG)) + return; + + txgbevf_get_pf_link_status(dev); + + if (!(in_msg & TXGBE_VT_MSGTYPE_CTS)) { + /* + * PF is not ready for this VF (e.g. PF ifconfig down). + * + * Send VF_RESET to ask the PF to reconfigure us. The PF only + * marks this VF as ready (and starts sending CTS) after it + * processes VF_RESET, so this request is the only way to + * recover. If write_posted() succeeds the PF is back up and + * we notify the application to reset the VF; otherwise the PF + * is still down, so we mark it down and reset the stats + * baselines (hardware counters are cleared during PF reset). + * + * write_posted() may busy-wait for the ACK in the interrupt + * thread, but the PF does not send further mailbox messages + * once it is down, so this blocking is not continuously + * triggered. + */ + int err; + + msgbuf = TXGBE_VF_RESET; + err = mbx->write_posted(hw, &msgbuf, 1, 0); + if (err) { + rte_atomic_store_explicit(&hw->pf_running, false, + rte_memory_order_release); txgbevf_check_link_for_intr(dev); + hw->rx_loaded = true; + hw->offset_loaded = true; + } else { + rte_atomic_store_explicit(&hw->pf_running, true, + rte_memory_order_release); + rte_eth_dev_callback_process(dev, + RTE_ETH_EVENT_INTR_RESET, NULL); } + return; } + + /* Check link status if pf only ping vf */ + if (!(in_msg & TXGBE_NOFITY_VF_LINK_STATUS)) + txgbevf_check_link_for_intr(dev); } static int -- 2.21.0.windows.1

