Author: mw
Date: Tue May 26 15:58:48 2020
New Revision: 361526
URL: https://svnweb.freebsd.org/changeset/base/361526

Log:
  Create ENA IO queues with optional backoff
  
  If requested size of IO queues is not supported try to decrease it until
  finding the highest value that can be satisfied.
  
  Submitted by:  Maciej Bielski <m...@semihalf.com>
  Obtained from: Semihalf
  Sponsored by:  Amazon, Inc.

Modified:
  head/sys/dev/ena/ena.c
  head/sys/dev/ena/ena.h
  head/sys/dev/ena/ena_netmap.c
  head/sys/dev/ena/ena_sysctl.c

Modified: head/sys/dev/ena/ena.c
==============================================================================
--- head/sys/dev/ena/ena.c      Tue May 26 15:57:02 2020        (r361525)
+++ head/sys/dev/ena/ena.c      Tue May 26 15:58:48 2020        (r361526)
@@ -408,13 +408,9 @@ ena_init_io_rings_basic(struct ena_adapter *adapter)
                ena_init_io_rings_common(adapter, rxr, i);
 
                /* TX specific ring state */
-               txr->ring_size = adapter->tx_ring_size;
                txr->tx_max_header_size = ena_dev->tx_max_header_size;
                txr->tx_mem_queue_type = ena_dev->tx_mem_queue_type;
 
-               /* RX specific ring state */
-               rxr->ring_size = adapter->rx_ring_size;
-
                que = &adapter->que[i];
                que->adapter = adapter;
                que->id = i;
@@ -1193,10 +1189,10 @@ ena_update_queue_size(struct ena_adapter *adapter, uin
 
        ENA_LOCK_LOCK(adapter);
 
-       old_tx_size = adapter->tx_ring_size;
-       old_rx_size = adapter->rx_ring_size;
-       adapter->tx_ring_size = new_tx_size;
-       adapter->rx_ring_size = new_rx_size;
+       old_tx_size = adapter->requested_tx_ring_size;
+       old_rx_size = adapter->requested_rx_ring_size;
+       adapter->requested_tx_ring_size = new_tx_size;
+       adapter->requested_rx_ring_size = new_rx_size;
 
        dev_was_up = ENA_FLAG_ISSET(ENA_FLAG_DEV_UP, adapter);
        ena_down(adapter);
@@ -1211,8 +1207,8 @@ ena_update_queue_size(struct ena_adapter *adapter, uin
                            new_tx_size, new_rx_size, old_tx_size, old_rx_size);
 
                        /* Revert old size. */
-                       adapter->tx_ring_size = old_tx_size;
-                       adapter->rx_ring_size = old_rx_size;
+                       adapter->requested_tx_ring_size = old_tx_size;
+                       adapter->requested_rx_ring_size = old_rx_size;
                        ena_init_io_rings_basic(adapter);
 
                        /* And try again. */
@@ -1455,7 +1451,7 @@ ena_create_io_queues(struct ena_adapter *adapter)
                ena_qid = ENA_IO_TXQ_IDX(i);
                ctx.mem_queue_type = ena_dev->tx_mem_queue_type;
                ctx.direction = ENA_COM_IO_QUEUE_DIRECTION_TX;
-               ctx.queue_size = adapter->tx_ring_size;
+               ctx.queue_size = adapter->requested_tx_ring_size;
                ctx.msix_vector = msix_vector;
                ctx.qid = ena_qid;
                rc = ena_com_create_io_queue(ena_dev, &ctx);
@@ -1483,7 +1479,7 @@ ena_create_io_queues(struct ena_adapter *adapter)
                ena_qid = ENA_IO_RXQ_IDX(i);
                ctx.mem_queue_type = ENA_ADMIN_PLACEMENT_POLICY_HOST;
                ctx.direction = ENA_COM_IO_QUEUE_DIRECTION_RX;
-               ctx.queue_size = adapter->rx_ring_size;
+               ctx.queue_size = adapter->requested_rx_ring_size;
                ctx.msix_vector = msix_vector;
                ctx.qid = ena_qid;
                rc = ena_com_create_io_queue(ena_dev, &ctx);
@@ -1975,6 +1971,104 @@ ena_up_complete(struct ena_adapter *adapter)
        return (0);
 }
 
+static void
+set_io_rings_size(struct ena_adapter *adapter, int new_tx_size,
+    int new_rx_size)
+{
+       int i;
+
+       for (i = 0; i < adapter->num_io_queues; i++) {
+               adapter->tx_ring[i].ring_size = new_tx_size;
+               adapter->rx_ring[i].ring_size = new_rx_size;
+       }
+}
+
+static int
+create_queues_with_size_backoff(struct ena_adapter *adapter)
+{
+       int rc;
+       uint32_t cur_rx_ring_size, cur_tx_ring_size;
+       uint32_t new_rx_ring_size, new_tx_ring_size;
+
+       /*
+        * Current queue sizes might be set to smaller than the requested
+        * ones due to past queue allocation failures.
+        */
+       set_io_rings_size(adapter, adapter->requested_tx_ring_size,
+           adapter->requested_rx_ring_size);
+
+       while (1) {
+               /* Allocate transmit descriptors */
+               rc = ena_setup_all_tx_resources(adapter);
+               if (unlikely(rc != 0)) {
+                       ena_trace(ENA_ALERT, "err_setup_tx\n");
+                       goto err_setup_tx;
+               }
+
+               /* Allocate receive descriptors */
+               rc = ena_setup_all_rx_resources(adapter);
+               if (unlikely(rc != 0)) {
+                       ena_trace(ENA_ALERT, "err_setup_rx\n");
+                       goto err_setup_rx;
+               }
+
+               /* Create IO queues for Rx & Tx */
+               rc = ena_create_io_queues(adapter);
+               if (unlikely(rc != 0)) {
+                       ena_trace(ENA_ALERT,
+                           "create IO queues failed\n");
+                       goto err_io_que;
+               }
+
+               return (0);
+
+err_io_que:
+               ena_free_all_rx_resources(adapter);
+err_setup_rx:
+               ena_free_all_tx_resources(adapter);
+err_setup_tx:
+               /*
+                * Lower the ring size if ENOMEM. Otherwise, return the
+                * error straightaway.
+                */
+               if (unlikely(rc != ENOMEM)) {
+                       ena_trace(ENA_ALERT,
+                           "Queue creation failed with error code: %d\n", rc);
+                       return (rc);
+               }
+
+               cur_tx_ring_size = adapter->tx_ring[0].ring_size;
+               cur_rx_ring_size = adapter->rx_ring[0].ring_size;
+
+               device_printf(adapter->pdev,
+                   "Not enough memory to create queues with sizes TX=%d, 
RX=%d\n",
+                   cur_tx_ring_size, cur_rx_ring_size);
+
+               new_tx_ring_size = cur_tx_ring_size;
+               new_rx_ring_size = cur_rx_ring_size;
+
+               /*
+                * Decrease the size of a larger queue, or decrease both if 
they are
+                * the same size.
+                */
+               if (cur_rx_ring_size <= cur_tx_ring_size)
+                       new_tx_ring_size = cur_tx_ring_size / 2;
+               if (cur_rx_ring_size >= cur_tx_ring_size)
+                       new_rx_ring_size = cur_rx_ring_size / 2;
+
+               if (new_tx_ring_size < ENA_MIN_RING_SIZE ||
+                   new_rx_ring_size < ENA_MIN_RING_SIZE) {
+                       device_printf(adapter->pdev,
+                           "Queue creation failed with the smallest possible 
queue size"
+                           "of %d for both queues. Not retrying with smaller 
queues\n",
+                           ENA_MIN_RING_SIZE);
+                       return (rc);
+               }
+
+               set_io_rings_size(adapter, new_tx_ring_size, new_rx_ring_size);
+       }
+}
+
 int
 ena_up(struct ena_adapter *adapter)
 {
@@ -2003,33 +2097,19 @@ ena_up(struct ena_adapter *adapter)
        }
 
        device_printf(adapter->pdev,
-           "Creating %u IO queues. Rx queue size: %d, Tx queue size: %d, LLQ 
is %s\n",
+           "Creating %u IO queues. Rx queue size: %d, Tx queue size: %d, "
+           "LLQ is %s\n",
            adapter->num_io_queues,
-           adapter->rx_ring_size,
-           adapter->tx_ring_size,
-           (adapter->ena_dev->tx_mem_queue_type == 
ENA_ADMIN_PLACEMENT_POLICY_DEV) ?
-           "ENABLED" : "DISABLED");
+           adapter->requested_rx_ring_size,
+           adapter->requested_tx_ring_size,
+           (adapter->ena_dev->tx_mem_queue_type ==
+               ENA_ADMIN_PLACEMENT_POLICY_DEV) ?  "ENABLED" : "DISABLED");
 
-       /* allocate transmit descriptors */
-       rc = ena_setup_all_tx_resources(adapter);
+       rc = create_queues_with_size_backoff(adapter);
        if (unlikely(rc != 0)) {
-               ena_trace(ENA_ALERT, "err_setup_tx\n");
-               goto err_setup_tx;
-       }
-
-       /* allocate receive descriptors */
-       rc = ena_setup_all_rx_resources(adapter);
-       if (unlikely(rc != 0)) {
-               ena_trace(ENA_ALERT, "err_setup_rx\n");
-               goto err_setup_rx;
-       }
-
-       /* create IO queues for Rx & Tx */
-       rc = ena_create_io_queues(adapter);
-       if (unlikely(rc != 0)) {
                ena_trace(ENA_ALERT,
-                       "create IO queues failed\n");
-               goto err_io_que;
+                   "error creating queues with size backoff\n");
+               goto err_create_queues_with_backoff;
        }
 
        if (ENA_FLAG_ISSET(ENA_FLAG_LINK_UP, adapter))
@@ -2063,11 +2143,9 @@ ena_up(struct ena_adapter *adapter)
 
 err_up_complete:
        ena_destroy_all_io_queues(adapter);
-err_io_que:
        ena_free_all_rx_resources(adapter);
-err_setup_rx:
        ena_free_all_tx_resources(adapter);
-err_setup_tx:
+err_create_queues_with_backoff:
        ena_free_io_irq(adapter);
 error:
        return (rc);
@@ -2329,7 +2407,7 @@ ena_setup_ifnet(device_t pdev, struct ena_adapter *ada
        if_setioctlfn(ifp, ena_ioctl);
        if_setgetcounterfn(ifp, ena_get_counter);
 
-       if_setsendqlen(ifp, adapter->tx_ring_size);
+       if_setsendqlen(ifp, adapter->requested_tx_ring_size);
        if_setsendqready(ifp);
        if_setmtu(ifp, ETHERMTU);
        if_setbaudrate(ifp, 0);
@@ -3461,8 +3539,8 @@ ena_attach(device_t pdev)
                goto err_com_free;
        }
 
-       adapter->tx_ring_size = calc_queue_ctx.tx_queue_size;
-       adapter->rx_ring_size = calc_queue_ctx.rx_queue_size;
+       adapter->requested_tx_ring_size = calc_queue_ctx.tx_queue_size;
+       adapter->requested_rx_ring_size = calc_queue_ctx.rx_queue_size;
        adapter->max_tx_ring_size = calc_queue_ctx.max_tx_queue_size;
        adapter->max_rx_ring_size = calc_queue_ctx.max_rx_queue_size;
        adapter->max_tx_sgl_size = calc_queue_ctx.max_tx_sgl_size;

Modified: head/sys/dev/ena/ena.h
==============================================================================
--- head/sys/dev/ena/ena.h      Tue May 26 15:57:02 2020        (r361525)
+++ head/sys/dev/ena/ena.h      Tue May 26 15:58:48 2020        (r361526)
@@ -415,8 +415,8 @@ struct ena_adapter {
        uint32_t num_io_queues;
        uint32_t max_num_io_queues;
 
-       uint32_t tx_ring_size;
-       uint32_t rx_ring_size;
+       uint32_t requested_tx_ring_size;
+       uint32_t requested_rx_ring_size;
 
        uint32_t max_tx_ring_size;
        uint32_t max_rx_ring_size;

Modified: head/sys/dev/ena/ena_netmap.c
==============================================================================
--- head/sys/dev/ena/ena_netmap.c       Tue May 26 15:57:02 2020        
(r361525)
+++ head/sys/dev/ena/ena_netmap.c       Tue May 26 15:58:48 2020        
(r361526)
@@ -93,8 +93,8 @@ ena_netmap_attach(struct ena_adapter *adapter)
        bzero(&na, sizeof(na));
        na.na_flags = NAF_MOREFRAG;
        na.ifp = adapter->ifp;
-       na.num_tx_desc = adapter->tx_ring_size;
-       na.num_rx_desc = adapter->rx_ring_size;
+       na.num_tx_desc = adapter->requested_tx_ring_size;
+       na.num_rx_desc = adapter->requested_rx_ring_size;
        na.num_tx_rings = adapter->num_io_queues;
        na.num_rx_rings = adapter->num_io_queues;
        na.rx_buf_maxsize = adapter->buf_ring_size;

Modified: head/sys/dev/ena/ena_sysctl.c
==============================================================================
--- head/sys/dev/ena/ena_sysctl.c       Tue May 26 15:57:02 2020        
(r361525)
+++ head/sys/dev/ena/ena_sysctl.c       Tue May 26 15:58:48 2020        
(r361526)
@@ -373,7 +373,7 @@ ena_sysctl_rx_queue_size(SYSCTL_HANDLER_ARGS)
        val = 0;
        error = sysctl_wire_old_buffer(req, sizeof(val));
        if (error == 0) {
-               val = adapter->rx_ring_size;
+               val = adapter->requested_rx_ring_size;
                error = sysctl_handle_32(oidp, &val, 0, req);
        }
        if (error != 0 || req->newptr == NULL)
@@ -394,17 +394,17 @@ ena_sysctl_rx_queue_size(SYSCTL_HANDLER_ARGS)
                return (EINVAL);
        }
 
-       if (val != adapter->rx_ring_size) {
+       if (val != adapter->requested_rx_ring_size) {
                device_printf(adapter->pdev,
                    "Requested new Rx queue size: %u. Old size: %u\n",
-                   val, adapter->rx_ring_size);
+                   val, adapter->requested_rx_ring_size);
 
-               error = ena_update_queue_size(adapter, adapter->tx_ring_size,
-                   val);
+               error = ena_update_queue_size(adapter,
+                   adapter->requested_tx_ring_size, val);
        } else {
                device_printf(adapter->pdev,
                    "New Rx queue size is the same as already used: %u\n",
-                   adapter->rx_ring_size);
+                   adapter->requested_rx_ring_size);
        }
 
        return (error);
_______________________________________________
svn-src-all@freebsd.org mailing list
https://lists.freebsd.org/mailman/listinfo/svn-src-all
To unsubscribe, send any mail to "svn-src-all-unsubscr...@freebsd.org"

Reply via email to