On 09-04-19, 15:22, Peng Ma wrote:
> DPPA2(Data Path Acceleration Architecture 2) qDMA
> The qDMA supports channel virtualization by allowing DMA jobs to be enqueued
> into different frame queues. Core can initiate a DMA transaction by preparing
> a frame descriptor(FD) for each DMA job and enqueuing this job to a frame 
> queue.
> through a hardware portal. The qDMA prefetches DMA jobs from the frame queues.
> It then schedules and dispatches to internal DMA hardware engines, which
> generate read and write requests. Both qDMA source data and destination data 
> can
> be either contiguous or non-contiguous using one or more scatter/gather 
> tables.
> The qDMA supports global bandwidth flow control where all DMA transactions are
> stalled if the bandwidth threshold has been reached. Also supported are
> transaction based read throttling.
> 
> Add NXP dppa2 qDMA to support some of Layerscape SoCs.
> such as: LS1088A, LS208xA, LX2, etc.
> 
> Signed-off-by: Peng Ma <peng...@nxp.com>
> ---
> changed for v3:
>       - Add depends on arm64 for dpaa2 qdma driver 
>       - The dpaa2_io_service_[de]register functions have a new parameter
>       So update all calls to some functions
> 
>  drivers/dma/Kconfig                     |    2 +
>  drivers/dma/Makefile                    |    1 +
>  drivers/dma/fsl-dpaa2-qdma/Kconfig      |    9 +
>  drivers/dma/fsl-dpaa2-qdma/Makefile     |    3 +
>  drivers/dma/fsl-dpaa2-qdma/dpaa2-qdma.c |  782 
> +++++++++++++++++++++++++++++++
>  drivers/dma/fsl-dpaa2-qdma/dpaa2-qdma.h |  152 ++++++
>  6 files changed, 949 insertions(+), 0 deletions(-)
>  create mode 100644 drivers/dma/fsl-dpaa2-qdma/Kconfig
>  create mode 100644 drivers/dma/fsl-dpaa2-qdma/Makefile
>  create mode 100644 drivers/dma/fsl-dpaa2-qdma/dpaa2-qdma.c
>  create mode 100644 drivers/dma/fsl-dpaa2-qdma/dpaa2-qdma.h
> 
> diff --git a/drivers/dma/Kconfig b/drivers/dma/Kconfig
> index eaf78f4..08aae01 100644
> --- a/drivers/dma/Kconfig
> +++ b/drivers/dma/Kconfig
> @@ -671,6 +671,8 @@ source "drivers/dma/sh/Kconfig"
>  
>  source "drivers/dma/ti/Kconfig"
>  
> +source "drivers/dma/fsl-dpaa2-qdma/Kconfig"
> +
>  # clients
>  comment "DMA Clients"
>       depends on DMA_ENGINE
> diff --git a/drivers/dma/Makefile b/drivers/dma/Makefile
> index 6126e1c..2499ed8 100644
> --- a/drivers/dma/Makefile
> +++ b/drivers/dma/Makefile
> @@ -75,6 +75,7 @@ obj-$(CONFIG_UNIPHIER_MDMAC) += uniphier-mdmac.o
>  obj-$(CONFIG_XGENE_DMA) += xgene-dma.o
>  obj-$(CONFIG_ZX_DMA) += zx_dma.o
>  obj-$(CONFIG_ST_FDMA) += st_fdma.o
> +obj-$(CONFIG_FSL_DPAA2_QDMA) += fsl-dpaa2-qdma/
>  
>  obj-y += mediatek/
>  obj-y += qcom/
> diff --git a/drivers/dma/fsl-dpaa2-qdma/Kconfig 
> b/drivers/dma/fsl-dpaa2-qdma/Kconfig
> new file mode 100644
> index 0000000..258ed6b
> --- /dev/null
> +++ b/drivers/dma/fsl-dpaa2-qdma/Kconfig
> @@ -0,0 +1,9 @@
> +menuconfig FSL_DPAA2_QDMA
> +     tristate "NXP DPAA2 QDMA"
> +     depends on ARM64
> +     depends on FSL_MC_BUS && FSL_MC_DPIO
> +     select DMA_ENGINE
> +     select DMA_VIRTUAL_CHANNELS
> +     help
> +       NXP Data Path Acceleration Architecture 2 QDMA driver,
> +       using the NXP MC bus driver.
> diff --git a/drivers/dma/fsl-dpaa2-qdma/Makefile 
> b/drivers/dma/fsl-dpaa2-qdma/Makefile
> new file mode 100644
> index 0000000..c1d0226
> --- /dev/null
> +++ b/drivers/dma/fsl-dpaa2-qdma/Makefile
> @@ -0,0 +1,3 @@
> +# SPDX-License-Identifier: GPL-2.0
> +# Makefile for the NXP DPAA2 qDMA controllers
> +obj-$(CONFIG_FSL_DPAA2_QDMA) += dpaa2-qdma.o dpdmai.o
> diff --git a/drivers/dma/fsl-dpaa2-qdma/dpaa2-qdma.c 
> b/drivers/dma/fsl-dpaa2-qdma/dpaa2-qdma.c
> new file mode 100644
> index 0000000..0cdde0f
> --- /dev/null
> +++ b/drivers/dma/fsl-dpaa2-qdma/dpaa2-qdma.c
> @@ -0,0 +1,782 @@
> +// SPDX-License-Identifier: GPL-2.0
> +// Copyright 2014-2018 NXP
> +
> +/*
> + * Author: Changming Huang <jerry.hu...@nxp.com>
> + *
> + * Driver for the NXP QDMA engine with QMan mode.
> + * Channel virtualization is supported through enqueuing of DMA jobs to,
> + * or dequeuing DMA jobs from different work queues with QMan portal.
> + * This module can be found on NXP LS2 SoCs.
> + *
> + */
> +
> +#include <linux/init.h>
> +#include <linux/module.h>
> +#include <linux/dmapool.h>
> +#include <linux/of_irq.h>
> +#include <linux/iommu.h>
> +#include <linux/sys_soc.h>
> +#include <linux/fsl/mc.h>
> +#include <soc/fsl/dpaa2-io.h>
> +
> +#include "../virt-dma.h"
> +#include "dpdmai_cmd.h"
> +#include "dpdmai.h"
> +#include "dpaa2-qdma.h"
> +
> +static bool smmu_disable = true;
> +
> +static struct dpaa2_qdma_chan *to_dpaa2_qdma_chan(struct dma_chan *chan)
> +{
> +     return container_of(chan, struct dpaa2_qdma_chan, vchan.chan);
> +}
> +
> +static struct dpaa2_qdma_comp *to_fsl_qdma_comp(struct virt_dma_desc *vd)
> +{
> +     return container_of(vd, struct dpaa2_qdma_comp, vdesc);
> +}
> +
> +static int dpaa2_qdma_alloc_chan_resources(struct dma_chan *chan)
> +{
> +     struct dpaa2_qdma_chan *dpaa2_chan = to_dpaa2_qdma_chan(chan);
> +     struct dpaa2_qdma_engine *dpaa2_qdma = dpaa2_chan->qdma;
> +     struct device *dev = &dpaa2_qdma->priv->dpdmai_dev->dev;
> +
> +     dpaa2_chan->fd_pool = dma_pool_create("fd_pool", dev,
> +                                           FD_POOL_SIZE, 32, 0);
> +     if (!dpaa2_chan->fd_pool)
> +             return -ENOMEM;
> +
> +     return dpaa2_qdma->desc_allocated++;
> +}
> +
> +static void dpaa2_qdma_free_chan_resources(struct dma_chan *chan)
> +{
> +     struct dpaa2_qdma_chan *dpaa2_chan = to_dpaa2_qdma_chan(chan);
> +     struct dpaa2_qdma_engine *dpaa2_qdma = dpaa2_chan->qdma;
> +     unsigned long flags;
> +
> +     LIST_HEAD(head);
> +
> +     spin_lock_irqsave(&dpaa2_chan->vchan.lock, flags);
> +     vchan_get_all_descriptors(&dpaa2_chan->vchan, &head);
> +     spin_unlock_irqrestore(&dpaa2_chan->vchan.lock, flags);
> +
> +     vchan_dma_desc_free_list(&dpaa2_chan->vchan, &head);
> +
> +     dpaa2_dpdmai_free_comp(dpaa2_chan, &dpaa2_chan->comp_used);
> +     dpaa2_dpdmai_free_comp(dpaa2_chan, &dpaa2_chan->comp_free);
> +
> +     dma_pool_destroy(dpaa2_chan->fd_pool);
> +     dpaa2_qdma->desc_allocated--;
> +}
> +
> +/*
> + * Request a command descriptor for enqueue.
> + */
> +static struct dpaa2_qdma_comp *
> +dpaa2_qdma_request_desc(struct dpaa2_qdma_chan *dpaa2_chan)
> +{
> +     struct dpaa2_qdma_comp *comp_temp = NULL;
> +     unsigned long flags;
> +
> +     spin_lock_irqsave(&dpaa2_chan->queue_lock, flags);
> +     if (list_empty(&dpaa2_chan->comp_free)) {
> +             spin_unlock_irqrestore(&dpaa2_chan->queue_lock, flags);
> +             comp_temp = kzalloc(sizeof(*comp_temp), GFP_KERNEL);

GFP_NOWAIT?

> +             if (!comp_temp)
> +                     goto err;
> +             comp_temp->fd_virt_addr =
> +                     dma_pool_alloc(dpaa2_chan->fd_pool, GFP_NOWAIT,
> +                                    &comp_temp->fd_bus_addr);
> +             if (!comp_temp->fd_virt_addr)

err handling seems incorrect, you dont clean up, caller doesnt check
return!

> +                     goto err;
> +
> +             comp_temp->fl_virt_addr =
> +                     (void *)((struct dpaa2_fd *)
> +                             comp_temp->fd_virt_addr + 1);

casts and pointer math, what could go wrong!! This doesnt smell right!

> +             comp_temp->fl_bus_addr = comp_temp->fd_bus_addr +
> +                                     sizeof(struct dpaa2_fd);

why not use fl_virt_addr and get the bus_address?

> +             comp_temp->desc_virt_addr =
> +                     (void *)((struct dpaa2_fl_entry *)
> +                             comp_temp->fl_virt_addr + 3);
> +             comp_temp->desc_bus_addr = comp_temp->fl_bus_addr +
> +                             sizeof(struct dpaa2_fl_entry) * 3;

pointer math in the two calls doesnt match and as I said doesnt look
good...

> +
> +             comp_temp->qchan = dpaa2_chan;
> +             return comp_temp;
> +     }
> +     comp_temp = list_first_entry(&dpaa2_chan->comp_free,
> +                                  struct dpaa2_qdma_comp, list);
> +     list_del(&comp_temp->list);
> +     spin_unlock_irqrestore(&dpaa2_chan->queue_lock, flags);
> +
> +     comp_temp->qchan = dpaa2_chan;
> +err:
> +     return comp_temp;
> +}
> +
> +static void
> +dpaa2_qdma_populate_fd(u32 format, struct dpaa2_qdma_comp *dpaa2_comp)
> +{
> +     struct dpaa2_fd *fd;
> +
> +     fd = (struct dpaa2_fd *)dpaa2_comp->fd_virt_addr;

whats with the casts! you seem to like them! You are casting away from
void!

> +     memset(fd, 0, sizeof(struct dpaa2_fd));
> +
> +     /* fd populated */
> +     dpaa2_fd_set_addr(fd, dpaa2_comp->fl_bus_addr);
> +     /* Bypass memory translation, Frame list format, short length disable */
> +     /* we need to disable BMT if fsl-mc use iova addr */
> +     if (smmu_disable)
> +             dpaa2_fd_set_bpid(fd, QMAN_FD_BMT_ENABLE);
> +     dpaa2_fd_set_format(fd, QMAN_FD_FMT_ENABLE | QMAN_FD_SL_DISABLE);
> +
> +     dpaa2_fd_set_frc(fd, format | QDMA_SER_CTX);
> +}
> +
> +/* first frame list for descriptor buffer */
> +static void
> +dpaa2_qdma_populate_first_framel(struct dpaa2_fl_entry *f_list,
> +                              struct dpaa2_qdma_comp *dpaa2_comp,
> +                              bool wrt_changed)
> +{
> +     struct dpaa2_qdma_sd_d *sdd;
> +
> +     sdd = (struct dpaa2_qdma_sd_d *)dpaa2_comp->desc_virt_addr;

again

> +     memset(sdd, 0, 2 * (sizeof(*sdd)));
> +
> +     /* source descriptor CMD */
> +     sdd->cmd = cpu_to_le32(QDMA_SD_CMD_RDTTYPE_COHERENT);
> +     sdd++;
> +
> +     /* dest descriptor CMD */
> +     if (wrt_changed)
> +             sdd->cmd = cpu_to_le32(LX2160_QDMA_DD_CMD_WRTTYPE_COHERENT);
> +     else
> +             sdd->cmd = cpu_to_le32(QDMA_DD_CMD_WRTTYPE_COHERENT);
> +
> +     memset(f_list, 0, sizeof(struct dpaa2_fl_entry));
> +
> +     /* first frame list to source descriptor */
> +     dpaa2_fl_set_addr(f_list, dpaa2_comp->desc_bus_addr);
> +     dpaa2_fl_set_len(f_list, 0x20);
> +     dpaa2_fl_set_format(f_list, QDMA_FL_FMT_SBF | QDMA_FL_SL_LONG);
> +
> +     /* bypass memory translation */
> +     if (smmu_disable)
> +             f_list->bpid = cpu_to_le16(QDMA_FL_BMT_ENABLE);
> +}
> +
> +/* source and destination frame list */
> +static void
> +dpaa2_qdma_populate_frames(struct dpaa2_fl_entry *f_list,
> +                        dma_addr_t dst, dma_addr_t src,
> +                        size_t len, uint8_t fmt)
> +{
> +     /* source frame list to source buffer */
> +     memset(f_list, 0, sizeof(struct dpaa2_fl_entry));
> +
> +     dpaa2_fl_set_addr(f_list, src);
> +     dpaa2_fl_set_len(f_list, len);
> +
> +     /* single buffer frame or scatter gather frame */
> +     dpaa2_fl_set_format(f_list, (fmt | QDMA_FL_SL_LONG));
> +
> +     /* bypass memory translation */
> +     if (smmu_disable)
> +             f_list->bpid = cpu_to_le16(QDMA_FL_BMT_ENABLE);
> +
> +     f_list++;
> +
> +     /* destination frame list to destination buffer */
> +     memset(f_list, 0, sizeof(struct dpaa2_fl_entry));
> +
> +     dpaa2_fl_set_addr(f_list, dst);
> +     dpaa2_fl_set_len(f_list, len);
> +     dpaa2_fl_set_format(f_list, (fmt | QDMA_FL_SL_LONG));
> +     /* single buffer frame or scatter gather frame */
> +     dpaa2_fl_set_final(f_list, QDMA_FL_F);
> +     /* bypass memory translation */
> +     if (smmu_disable)
> +             f_list->bpid = cpu_to_le16(QDMA_FL_BMT_ENABLE);
> +}
> +
> +static struct dma_async_tx_descriptor
> +*dpaa2_qdma_prep_memcpy(struct dma_chan *chan, dma_addr_t dst,
> +                     dma_addr_t src, size_t len, ulong flags)
> +{
> +     struct dpaa2_qdma_chan *dpaa2_chan = to_dpaa2_qdma_chan(chan);
> +     struct dpaa2_qdma_engine *dpaa2_qdma;
> +     struct dpaa2_qdma_comp *dpaa2_comp;
> +     struct dpaa2_fl_entry *f_list;
> +     bool wrt_changed;
> +     u32 format;
> +
> +     dpaa2_qdma = dpaa2_chan->qdma;
> +     dpaa2_comp = dpaa2_qdma_request_desc(dpaa2_chan);
> +     wrt_changed = (bool)dpaa2_qdma->qdma_wrtype_fixup;
> +
> +#ifdef LONG_FORMAT

 compile flag and define, so else part is dead code??

> +     format = QDMA_FD_LONG_FORMAT;
> +#else
> +     format = QDMA_FD_SHORT_FORMAT;
> +#endif
> +     /* populate Frame descriptor */
> +     dpaa2_qdma_populate_fd(format, dpaa2_comp);
> +
> +     f_list = (struct dpaa2_fl_entry *)dpaa2_comp->fl_virt_addr;
> +
> +#ifdef LONG_FORMAT
> +     /* first frame list for descriptor buffer (logn format) */
> +     dpaa2_qdma_populate_first_framel(f_list, dpaa2_comp, wrt_changed);
> +
> +     f_list++;
> +#endif
> +
> +     dpaa2_qdma_populate_frames(f_list, dst, src, len, QDMA_FL_FMT_SBF);
> +
> +     return vchan_tx_prep(&dpaa2_chan->vchan, &dpaa2_comp->vdesc, flags);
> +}
> +
> +static enum
> +dma_status dpaa2_qdma_tx_status(struct dma_chan *chan,
> +                             dma_cookie_t cookie,
> +                             struct dma_tx_state *txstate)
> +{
> +     return dma_cookie_status(chan, cookie, txstate);
> +}
> +
> +static void dpaa2_qdma_issue_pending(struct dma_chan *chan)
> +{
> +     struct dpaa2_qdma_chan *dpaa2_chan = to_dpaa2_qdma_chan(chan);
> +     struct dpaa2_qdma_engine *dpaa2_qdma = dpaa2_chan->qdma;
> +     struct dpaa2_qdma_priv *priv = dpaa2_qdma->priv;
> +     struct dpaa2_qdma_comp *dpaa2_comp;
> +     struct virt_dma_desc *vdesc;
> +     struct dpaa2_fd *fd;
> +     unsigned long flags;
> +     int err;
> +
> +     spin_lock_irqsave(&dpaa2_chan->queue_lock, flags);
> +     spin_lock(&dpaa2_chan->vchan.lock);
> +     if (vchan_issue_pending(&dpaa2_chan->vchan)) {
> +             vdesc = vchan_next_desc(&dpaa2_chan->vchan);
> +             if (!vdesc)
> +                     goto err_enqueue;
> +             dpaa2_comp = to_fsl_qdma_comp(vdesc);
> +
> +             fd = (struct dpaa2_fd *)dpaa2_comp->fd_virt_addr;
> +
> +             list_del(&vdesc->node);
> +             list_add_tail(&dpaa2_comp->list, &dpaa2_chan->comp_used);

what does this list do?

> +
> +             /* TOBO: priority hard-coded to zero */

You mean TODO?

> +             err = dpaa2_io_service_enqueue_fq(NULL,
> +                             priv->tx_queue_attr[0].fqid, fd);
> +             if (err) {
> +                     list_del(&dpaa2_comp->list);
> +                     list_add_tail(&dpaa2_comp->list,
> +                                   &dpaa2_chan->comp_free);
> +             }
> +     }
> +err_enqueue:
> +     spin_unlock(&dpaa2_chan->vchan.lock);
> +     spin_unlock_irqrestore(&dpaa2_chan->queue_lock, flags);
> +}
> +
> +static int __cold dpaa2_qdma_setup(struct fsl_mc_device *ls_dev)
> +{
> +     struct dpaa2_qdma_priv_per_prio *ppriv;
> +     struct device *dev = &ls_dev->dev;
> +     struct dpaa2_qdma_priv *priv;
> +     u8 prio_def = DPDMAI_PRIO_NUM;
> +     int err;
> +     int i;
> +
> +     priv = dev_get_drvdata(dev);
> +
> +     priv->dev = dev;
> +     priv->dpqdma_id = ls_dev->obj_desc.id;
> +
> +     /*Get the handle for the DPDMAI this interface is associate with */

Please run checkpatch, it should have told you that you need space after
comment marker /* foo...

> +     err = dpdmai_open(priv->mc_io, 0, priv->dpqdma_id, &ls_dev->mc_handle);
> +     if (err) {
> +             dev_err(dev, "dpdmai_open() failed\n");
> +             return err;
> +     }
> +     dev_info(dev, "Opened dpdmai object successfully\n");
> +
> +     err = dpdmai_get_attributes(priv->mc_io, 0, ls_dev->mc_handle,
> +                                 &priv->dpdmai_attr);
> +     if (err) {
> +             dev_err(dev, "dpdmai_get_attributes() failed\n");
> +             return err;

so you dont close what you opened in dpdmai_open() Please give a serious
thought and testing to this driver

> +     }
> +
> +     if (priv->dpdmai_attr.version.major > DPDMAI_VER_MAJOR) {
> +             dev_err(dev, "DPDMAI major version mismatch\n"
> +                          "Found %u.%u, supported version is %u.%u\n",
> +                             priv->dpdmai_attr.version.major,
> +                             priv->dpdmai_attr.version.minor,
> +                             DPDMAI_VER_MAJOR, DPDMAI_VER_MINOR);
> +     }
> +
> +     if (priv->dpdmai_attr.version.minor > DPDMAI_VER_MINOR) {
> +             dev_err(dev, "DPDMAI minor version mismatch\n"
> +                          "Found %u.%u, supported version is %u.%u\n",
> +                             priv->dpdmai_attr.version.major,
> +                             priv->dpdmai_attr.version.minor,
> +                             DPDMAI_VER_MAJOR, DPDMAI_VER_MINOR);

what is the implication of these error, why not bail out on these?

> +     }
> +
> +     priv->num_pairs = min(priv->dpdmai_attr.num_of_priorities, prio_def);
> +     ppriv = kcalloc(priv->num_pairs, sizeof(*ppriv), GFP_KERNEL);

what is the context of the fn, sleepy, atomic?

> +     if (!ppriv) {
> +             dev_err(dev, "kzalloc for ppriv failed\n");

this need not be logged, core will do so

> +             return -1;

really -1??

I think this driver needs more work, please fix these issues in the
comments above and also see in rest of the code

-- 
~Vinod

Reply via email to