On 07/14/2017 01:48 PM, Moritz Fischer wrote:
> Add support for the National Instruments XGE 1/10G network device.
> 
> It uses the EEPROM on the board via NVMEM.
> 
> Signed-off-by: Moritz Fischer <m...@kernel.org>
> ---

> +
> +static void nixge_handle_link_change(struct net_device *ndev)
> +{
> +     struct nixge_priv *priv = netdev_priv(ndev);
> +     struct phy_device *phydev = ndev->phydev;
> +     unsigned long flags;
> +     int status_change = 0;
> +
> +     spin_lock_irqsave(&priv->lock, flags);

The adjust_link function is called with the PHY device mutex held so the
spinlock here looks completely unnecessary.

> +
> +     if (phydev->link != priv->link || phydev->speed != priv->speed ||
> +         phydev->duplex != priv->duplex) {
> +             priv->link = phydev->link;
> +             priv->speed = phydev->speed;
> +             priv->duplex = phydev->duplex;
> +             status_change = 1;
> +     }
> +
> +     spin_unlock_irqrestore(&priv->lock, flags);
> +
> +     if (status_change)
> +             phy_print_status(phydev);

It's fine to print what changed, but surely the hardware should also
react to link changes, like change of duplex, speed, pause etc.

> +}
> +
> +static void nixge_start_xmit_done(struct net_device *ndev)
> +{

This should be done in a NAPI context (soft IRQ) as well, except that
for TX you don't need to bind the reclaiming process against the NAPI
budget.

> +     u32 size = 0;
> +     u32 packets = 0;
> +     struct nixge_priv *priv = netdev_priv(ndev);
> +     struct nixge_dma_bd *cur_p;
> +     unsigned int status = 0;
> +
> +     cur_p = &priv->tx_bd_v[priv->tx_bd_ci];
> +     status = cur_p->status;
> +
> +     while (status & XAXIDMA_BD_STS_COMPLETE_MASK) {
> +             dma_unmap_single(ndev->dev.parent, cur_p->phys,
> +                              (cur_p->cntrl & XAXIDMA_BD_CTRL_LENGTH_MASK),
> +                             DMA_TO_DEVICE);

Fragments are unmapped with dma_unmap_page(), how are you unmapping them
at the moment?

> +             if (cur_p->app4)
> +                     dev_kfree_skb_irq((struct sk_buff *)cur_p->app4);
> +             /*cur_p->phys = 0;*/
> +             cur_p->app0 = 0;
> +             cur_p->app1 = 0;
> +             cur_p->app2 = 0;
> +             cur_p->app4 = 0;
> +             cur_p->status = 0;

Is this really necessary? Your descriptor is in coherent memory which
means that you are doing slow uncached/writethrough accesses to the
memory that holds them. Can't you just set status to 0 for the HW to
ignore this descriptor?

> +
> +             size += status & XAXIDMA_BD_STS_ACTUAL_LEN_MASK;
> +             packets++;
> +
> +             ++priv->tx_bd_ci;
> +             priv->tx_bd_ci %= TX_BD_NUM;
> +             cur_p = &priv->tx_bd_v[priv->tx_bd_ci];
> +             status = cur_p->status;
> +     }
> +
> +     ndev->stats.tx_packets += packets;
> +     ndev->stats.tx_bytes += size;
> +     netif_wake_queue(ndev);

You can only wake the queue if you were successful transmitting packets.

> +}
> +
> +static inline int nixge_check_tx_bd_space(struct nixge_priv *priv,
> +                                       int num_frag)
> +{
> +     struct nixge_dma_bd *cur_p;
> +
> +     cur_p = &priv->tx_bd_v[(priv->tx_bd_tail + num_frag) % TX_BD_NUM];
> +     if (cur_p->status & XAXIDMA_BD_STS_ALL_MASK)
> +             return NETDEV_TX_BUSY;

You are not propagating this to the caller, so just return a boolean for
this.

> +     return 0;
> +}
> +
> +static int nixge_start_xmit(struct sk_buff *skb, struct net_device *ndev)
> +{
> +     u32 ii;
> +     u32 num_frag;
> +     skb_frag_t *frag;
> +     dma_addr_t tail_p;
> +     struct nixge_priv *priv = netdev_priv(ndev);
> +     struct nixge_dma_bd *cur_p;
> +
> +     num_frag = skb_shinfo(skb)->nr_frags;
> +     cur_p = &priv->tx_bd_v[priv->tx_bd_tail];
> +
> +     if (nixge_check_tx_bd_space(priv, num_frag)) {
> +             if (!netif_queue_stopped(ndev))
> +                     netif_stop_queue(ndev);
> +             return NETDEV_TX_BUSY;

NETDEV_TX_OK is what you should return since you properly asserted flow
control with netif_stop_queue().

> +     }
> +
> +     cur_p->cntrl = skb_headlen(skb) | XAXIDMA_BD_CTRL_TXSOF_MASK;
> +     cur_p->phys = dma_map_single(ndev->dev.parent, skb->data,
> +                                  skb_headlen(skb), DMA_TO_DEVICE);

This needs to be checked with dma_mapping_error().

> +
> +     for (ii = 0; ii < num_frag; ii++) {
> +             ++priv->tx_bd_tail;
> +             priv->tx_bd_tail %= TX_BD_NUM;
> +             cur_p = &priv->tx_bd_v[priv->tx_bd_tail];
> +             frag = &skb_shinfo(skb)->frags[ii];
> +             cur_p->phys = dma_map_single(ndev->dev.parent,
> +                                          skb_frag_address(frag),
> +                                          skb_frag_size(frag),
> +                                          DMA_TO_DEVICE);

Needs to be checked against dma_mapping_error() and you would have to
unwind the whole SKB linear + fragments mappings and buffer descriptors.

> +             cur_p->cntrl = skb_frag_size(frag);
> +     }
> +
> +     cur_p->cntrl |= XAXIDMA_BD_CTRL_TXEOF_MASK;
> +     cur_p->app4 = (unsigned long)skb;
> +
> +     tail_p = priv->tx_bd_p + sizeof(*priv->tx_bd_v) * priv->tx_bd_tail;
> +     /* Start the transfer */

You might be able to check for (!skb->xmit_more ||
netif_queue_stopped()) here to only do the write when you know for sure
there is nothing more coming.

> +     nixge_dma_write_reg(priv, XAXIDMA_TX_TDESC_OFFSET, tail_p);
> +     ++priv->tx_bd_tail;
> +     priv->tx_bd_tail %= TX_BD_NUM;
> +
> +     return NETDEV_TX_OK;
> +}
> +
> +static void nixge_recv(struct net_device *ndev)
> +{
> +     u32 length;
> +     u32 size = 0;
> +     u32 packets = 0;
> +     dma_addr_t tail_p = 0;
> +     struct nixge_priv *priv = netdev_priv(ndev);
> +     struct sk_buff *skb, *new_skb;
> +     struct nixge_dma_bd *cur_p;
> +
> +     cur_p = &priv->rx_bd_v[priv->rx_bd_ci];

Please do this in a NAPI context and bound the reception to the NAPI budget.

> +
> +     while ((cur_p->status & XAXIDMA_BD_STS_COMPLETE_MASK)) {
> +             tail_p = priv->rx_bd_p
> +                     + sizeof(*priv->rx_bd_v) * priv->rx_bd_ci;
> +             skb = (struct sk_buff *)(cur_p->sw_id_offset);
> +
> +             length = cur_p->status & 0x7fffff;

You can't trust the HW to return a length that is correct, you need to
check that length is smaller than or equal to priv->max_frm_size here,
otherwise you will overflow your skb size.

> +             dma_unmap_single(ndev->dev.parent, cur_p->phys,
> +                              priv->max_frm_size,
> +                              DMA_FROM_DEVICE);
> +
> +             skb_put(skb, length);
> +
> +             skb->protocol = eth_type_trans(skb, ndev);
> +             skb_checksum_none_assert(skb);
> +
> +             /* For now mark them as CHECKSUM_NONE since
> +              * we don't have offload capabilities
> +              */
> +             skb->ip_summed = CHECKSUM_NONE;
> +
> +             netif_rx(skb);

napi_gro_receive() or netif_receive_skb() at the very least, but that
needs a conversion to NAPI first.

> +
> +             size += length;
> +             packets++;
> +
> +             new_skb = netdev_alloc_skb_ip_align(ndev, priv->max_frm_size);
> +             if (!new_skb)
> +                     return;
> +
> +             cur_p->phys = dma_map_single(ndev->dev.parent, new_skb->data,
> +                                          priv->max_frm_size,
> +                                          DMA_FROM_DEVICE);

You need to check for dma_mapping_error() here.

> +             cur_p->cntrl = priv->max_frm_size;
> +             cur_p->status = 0;
> +             cur_p->sw_id_offset = (u32)new_skb;
> +
> +             ++priv->rx_bd_ci;
> +             priv->rx_bd_ci %= RX_BD_NUM;
> +             cur_p = &priv->rx_bd_v[priv->rx_bd_ci];
> +     }
> +
> +     ndev->stats.rx_packets += packets;
> +     ndev->stats.rx_bytes += size;
> +
> +     if (tail_p)
> +             nixge_dma_write_reg(priv, XAXIDMA_RX_TDESC_OFFSET, tail_p);
> +}

> +static int nixge_open(struct net_device *ndev)
> +{
> +     struct nixge_priv *priv = netdev_priv(ndev);
> +     struct phy_device *phy;
> +     int ret;
> +
> +     nixge_device_reset(ndev);
> +
> +     phy = of_phy_connect(ndev, priv->phy_node,
> +                          &nixge_handle_link_change, 0, priv->phy_mode);
> +     if (!phy)
> +             return -ENODEV;
> +
> +     phy_start(phy);
> +
> +     /* Enable tasklets for Axi DMA error handling */
> +     tasklet_init(&priv->dma_err_tasklet, nixge_dma_err_handler,
> +                  (unsigned long)priv);
> +
> +     /* Enable interrupts for Axi DMA Tx */
> +     ret = request_irq(priv->tx_irq, nixge_tx_irq, 0, ndev->name, ndev);
> +     if (ret)
> +             goto err_tx_irq;
> +     /* Enable interrupts for Axi DMA Rx */
> +     ret = request_irq(priv->rx_irq, nixge_rx_irq, 0, ndev->name, ndev);
> +     if (ret)
> +             goto err_rx_irq;

netif_start_queue() is missing, if your queues were stopped before (try
several up/down/up/down sequences to check) then it would never transmit.

> +
> +     return 0;
> +
> +err_rx_irq:
> +     free_irq(priv->tx_irq, ndev);
> +err_tx_irq:
> +     tasklet_kill(&priv->dma_err_tasklet);
> +     netdev_err(ndev, "request_irq() failed\n");

You are not stopping nor disconnecting the PHY in case of error.

> +     return ret;
> +}
> +
> +static int nixge_stop(struct net_device *ndev)
> +{
> +     u32 cr;
> +     struct nixge_priv *priv = netdev_priv(ndev);

First thing is probably to stop the transmit queue(s) with
netif_stop_queue() to avoid submitting new packets.

> +
> +     cr = nixge_dma_read_reg(priv, XAXIDMA_RX_CR_OFFSET);
> +     nixge_dma_write_reg(priv, XAXIDMA_RX_CR_OFFSET,
> +                         cr & (~XAXIDMA_CR_RUNSTOP_MASK));
> +     cr = nixge_dma_read_reg(priv, XAXIDMA_TX_CR_OFFSET);
> +     nixge_dma_write_reg(priv, XAXIDMA_TX_CR_OFFSET,
> +                         cr & (~XAXIDMA_CR_RUNSTOP_MASK));
> +
> +     tasklet_kill(&priv->dma_err_tasklet);
> +
> +     free_irq(priv->tx_irq, ndev);
> +     free_irq(priv->rx_irq, ndev);
> +
> +     nixge_dma_bd_release(ndev);
> +
> +     if (ndev->phydev) {
> +             phy_stop(ndev->phydev);
> +             phy_disconnect(ndev->phydev);
> +     }
> +
> +     return 0;
> +}
> +

> +
> +static void nixge_ethtools_get_drvinfo(struct net_device *ndev,
> +                                    struct ethtool_drvinfo *ed)
> +{
> +     strlcpy(ed->driver, "nixge", sizeof(ed->driver));

You might want to return the bus type as well (e.g: platform).

> +}
> +
> +static int nixge_ethtools_get_coalesce(struct net_device *ndev,
> +                                    struct ethtool_coalesce *ecoalesce)
> +{
> +     u32 regval = 0;
> +     struct nixge_priv *priv = netdev_priv(ndev);

Please order these declarations in reverse Christmas tree style (longest
line first).

> +
> +     regval = nixge_dma_read_reg(priv, XAXIDMA_RX_CR_OFFSET);
> +     ecoalesce->rx_max_coalesced_frames = (regval & XAXIDMA_COALESCE_MASK)
> +                                          >> XAXIDMA_COALESCE_SHIFT;
> +     regval = nixge_dma_read_reg(priv, XAXIDMA_TX_CR_OFFSET);
> +     ecoalesce->tx_max_coalesced_frames = (regval & XAXIDMA_COALESCE_MASK)
> +                                          >> XAXIDMA_COALESCE_SHIFT;
> +     return 0;
> +}
> +
> +static int nixge_ethtools_set_coalesce(struct net_device *ndev,
> +                                    struct ethtool_coalesce *ecoalesce)
> +{
> +     struct nixge_priv *priv = netdev_priv(ndev);
> +
> +     if (netif_running(ndev)) {
> +             netdev_err(ndev,
> +                        "Please stop netif before applying configuration\n");
> +             return -EFAULT;

-EBUSY maybe, or -EINVAL? You are supposed to allow changing coalescing
parameters while the interface is running.

> +     }

> +     err = nixge_ctrl_poll_timeout(priv, NIXGE_REG_MDIO_CTRL, status,
> +                                   !status, 10, 1000);
> +     if (err) {
> +             dev_err(priv->dev, "timeout setting read command");
> +             return err;
> +     }
> +
> +     status = nixge_ctrl_read_reg(priv, NIXGE_REG_MDIO_DATA);
> +
> +     dev_dbg(priv->dev, "%s: phy_id = %x reg = %x got %x\n", __func__,
> +             phy_id, reg & 0xffff, status);

mdiobus_read() already contains trace points that would return the same
information.

> +
> +     return status;
> +}
> +
> +static int nixge_mdio_write(struct mii_bus *bus, int phy_id, int reg, u16 
> val)
> +{
> +     struct nixge_priv *priv = bus->priv;
> +     u32 status, tmp;
> +     int err;
> +     u16 device;
> +
> +     /* FIXME: Currently don't do writes */
> +     if (reg & MII_ADDR_C45)
> +             return -EOPNOTSUPP;

Then you might as well remove Clause 45 read support, because it's not
going to be very useful if you can't do writes. I could see how this
allows you to get e.g: a 10GB PHY working with little to no intervention.

> +
> +     device = reg & 0x1f;
> +
> +     tmp = NIXGE_MDIO_CLAUSE22 | NIXGE_MDIO_OP(MDIO_C22_WRITE) |
> +             NIXGE_MDIO_ADDR(phy_id) | NIXGE_MDIO_MMD(device);
> +
> +     nixge_ctrl_write_reg(priv, NIXGE_REG_MDIO_DATA, val);
> +     nixge_ctrl_write_reg(priv, NIXGE_REG_MDIO_OP, tmp);
> +     nixge_ctrl_write_reg(priv, NIXGE_REG_MDIO_CTRL, 1);
> +
> +     err = nixge_ctrl_poll_timeout(priv, NIXGE_REG_MDIO_CTRL, status,
> +                                   !status, 10, 1000);
> +     if (err) {
> +             dev_err(priv->dev, "timeout setting write command");
> +             return -ETIMEDOUT;
> +     }
> +
> +     dev_dbg(priv->dev, "%x %x <- %x\n", phy_id, reg, val);
> +
> +     return 0;
> +}
> +
> +static int nixge_mdio_setup(struct nixge_priv *priv, struct device_node *np)
> +{
> +     struct mii_bus *bus;
> +     struct resource res;
> +     int err;
> +
> +     bus = mdiobus_alloc();
> +     if (!bus)
> +             return -ENOMEM;
> +
> +     of_address_to_resource(np, 0, &res);

You don't appear to be using this resource.

> +     snprintf(bus->id, MII_BUS_ID_SIZE, "%s-mii", dev_name(priv->dev));
> +     bus->priv = priv;
> +     bus->name = "nixge_mii_bus";
> +     bus->read = nixge_mdio_read;
> +     bus->write = nixge_mdio_write;
> +     bus->parent = priv->dev;
> +
> +     priv->mii_bus = bus;
> +     err = of_mdiobus_register(bus, np);
> +     if (err)
> +             goto err_register;
> +
> +     dev_info(priv->dev, "MDIO bus registered\n");

This is redundant with what you can obtain from of_mdiobus_register()
and a "... MDIO bus probed" type of message.

> +
> +     return 0;
> +
> +err_register:
> +     mdiobus_free(bus);
> +     return err;
> +}
> +
> +static void *nixge_get_nvmem_address(struct device *dev)
> +{
> +     struct nvmem_cell *cell;
> +     size_t cell_size;
> +     char *mac;
> +
> +     cell = nvmem_cell_get(dev, "address");
> +     if (IS_ERR(cell))
> +             return cell;
> +
> +     mac = nvmem_cell_read(cell, &cell_size);
> +     nvmem_cell_put(cell);
> +
> +     return mac;
> +}

I wonder if this could be a candidate for some kind of generic helper
function that would retrieve the MAC address, food for thought.

> +
> +static int nixge_probe(struct platform_device *pdev)
> +{
> +     int err;
> +     struct nixge_priv *priv;
> +     struct net_device *ndev;
> +     struct resource *dmares;
> +     const char *mac_addr;
> +
> +     ndev = alloc_etherdev(sizeof(*priv));
> +     if (!ndev)
> +             return -ENOMEM;
> +
> +     platform_set_drvdata(pdev, ndev);
> +     SET_NETDEV_DEV(ndev, &pdev->dev);
> +
> +     ndev->flags &= ~IFF_MULTICAST;  /* clear multicast */
> +     ndev->features = NETIF_F_SG;
> +     ndev->netdev_ops = &nixge_netdev_ops;
> +     ndev->ethtool_ops = &nixge_ethtool_ops;
> +
> +     /* MTU range: 64 - 9000 */
> +     ndev->min_mtu = 64;
> +     ndev->max_mtu = NIXGE_JUMBO_MTU;
> +
> +     mac_addr = nixge_get_nvmem_address(&pdev->dev);
> +     if (mac_addr && is_valid_ether_addr(mac_addr))
> +             ether_addr_copy(ndev->dev_addr, mac_addr);
> +     else
> +             eth_hw_addr_random(ndev);
> +
> +     priv = netdev_priv(ndev);
> +     priv->ndev = ndev;
> +     priv->dev = &pdev->dev;
> +     priv->rxmem = NIXGE_DEFAULT_RX_MEM;
> +
> +     dmares = platform_get_resource(pdev, IORESOURCE_MEM, 0);
> +     priv->dma_regs = devm_ioremap_resource(&pdev->dev, dmares);
> +     if (IS_ERR(priv->dma_regs)) {
> +             netdev_err(ndev, "failed to map dma regs\n");
> +             return PTR_ERR(priv->dma_regs);
> +     }
> +     priv->ctrl_regs = priv->dma_regs + NIXGE_REG_CTRL_OFFSET;
> +     __nixge_hw_set_mac_address(ndev);
> +
> +     priv->tx_irq = platform_get_irq_byname(pdev, "tx-irq");
> +     if (priv->tx_irq < 0) {
> +             netdev_err(ndev, "no tx irq available");
> +             return priv->tx_irq;
> +     }
> +
> +     priv->rx_irq = platform_get_irq_byname(pdev, "rx-irq");
> +     if (priv->rx_irq < 0) {
> +             netdev_err(ndev, "no rx irq available");
> +             return priv->rx_irq;
> +     }
> +
> +     priv->coalesce_count_rx = XAXIDMA_DFT_RX_THRESHOLD;
> +     priv->coalesce_count_tx = XAXIDMA_DFT_TX_THRESHOLD;
> +
> +     spin_lock_init(&priv->lock);
> +
> +     err = nixge_mdio_setup(priv, pdev->dev.of_node);
> +     if (err) {
> +             netdev_err(ndev, "error registering mdio bus");
> +             goto free_netdev;
> +     }
> +
> +     priv->phy_mode = of_get_phy_mode(pdev->dev.of_node);
> +     if (priv->phy_mode < 0) {
> +             netdev_err(ndev, "not find phy-mode\n");

"Could not find \"phy-mode\" property" maybe?

> +             err = -EINVAL;
> +             goto unregister_mdio;
> +     }
> +
> +     priv->phy_node = of_parse_phandle(pdev->dev.of_node, "phy-handle", 0);
> +     if (!priv->phy_node) {
> +             netdev_err(ndev, "not find phy-handle\n");

Same here.

> +             err = -EINVAL;
> +             goto unregister_mdio;
> +     }
> +
> +     err = register_netdev(priv->ndev);
> +     if (err) {
> +             netdev_err(ndev, "register_netdev() error (%i)\n", err);
> +             goto unregister_mdio;
> +     }
> +
> +     return 0;
> +
> +unregister_mdio:
> +     mdiobus_unregister(priv->mii_bus);
> +     mdiobus_free(priv->mii_bus);
> +
> +free_netdev:
> +     free_netdev(ndev);
> +
> +     return err;
> +}
> +
> +static int nixge_remove(struct platform_device *pdev)
> +{
> +     struct net_device *ndev = platform_get_drvdata(pdev);
> +     struct nixge_priv *priv = netdev_priv(ndev);
> +
> +     if (ndev->phydev)
> +             phy_disconnect(ndev->phydev);

You should consider moving this to the ndo_stop() for mainly two reasons:

- to be strictly symmetrical with your ndo_open() function which does
the of_phy_connect() call
- to leverage possible power savings by suspending the PHY when the
interface is not used

> +     ndev->phydev = NULL;

phy_disconnect() does NULLify dev->phydev already

> +
> +     mdiobus_unregister(priv->mii_bus);
> +     mdiobus_free(priv->mii_bus);
> +     priv->mii_bus = NULL;

This is not necessary, probe() and remove() won't be called with
partially initialized private structure data.

> +
> +     unregister_netdev(ndev);
> +
> +     free_netdev(ndev);
> +
> +     return 0;
> +}
> +
> +/* Match table for of_platform binding */
> +static const struct of_device_id nixge_dt_ids[] = {
> +     { .compatible = "ni,xge-enet-2.00", },
> +     {},
> +};
> +MODULE_DEVICE_TABLE(of, nixge_dt_ids);
> +
> +static struct platform_driver nixge_driver = {
> +     .probe          = nixge_probe,
> +     .remove         = nixge_remove,
> +     .driver         = {
> +             .name           = "nixge",
> +             .of_match_table = of_match_ptr(nixge_dt_ids),
> +     },
> +};
> +module_platform_driver(nixge_driver);
> +
> +MODULE_LICENSE("GPL");
> +MODULE_DESCRIPTION("National Instruments XGE Management MAC");
> +MODULE_AUTHOR("Moritz Fischer <m...@kernel.org>");
> 


-- 
Florian

Reply via email to