Hi Evan,

Thanks for taking the time to review and feedback!


On 7/27/2018 2:12 PM, Evan Green wrote:
Hi David,

On Thu, Jul 26, 2018 at 4:30 PM David Dai <daidav...@codeaurora.org> wrote:
Introduce Qualcomm SDM845 specific provider driver using the
interconnect framework.

Signed-off-by: David Dai <daidav...@codeaurora.org>
---
  .../bindings/interconnect/qcom-sdm845.txt          |  22 +
  drivers/interconnect/qcom/Kconfig                  |   8 +
  drivers/interconnect/qcom/Makefile                 |   1 +
  drivers/interconnect/qcom/qcom-icc-ids.h           | 142 ++++
  drivers/interconnect/qcom/sdm845.c                 | 826 +++++++++++++++++++++
  5 files changed, 999 insertions(+)
  create mode 100644 
Documentation/devicetree/bindings/interconnect/qcom-sdm845.txt
  create mode 100644 drivers/interconnect/qcom/qcom-icc-ids.h
  create mode 100644 drivers/interconnect/qcom/sdm845.c

...
diff --git a/drivers/interconnect/qcom/sdm845.c 
b/drivers/interconnect/qcom/sdm845.c
new file mode 100644
index 0000000..bf13053
--- /dev/null
+++ b/drivers/interconnect/qcom/sdm845.c
@@ -0,0 +1,826 @@
+/* SPDX-License-Identifier: GPL-2.0 */
+/*
+ * Copyright (c) 2018, The Linux Foundation. All rights reserved.
+ *
+ */
+
+#include <linux/device.h>
+#include <linux/io.h>
+#include <linux/interconnect.h>
+#include <linux/interconnect-provider.h>
+#include <linux/module.h>
+#include <linux/of_device.h>
+#include <linux/of_platform.h>
+#include <linux/platform_device.h>
+#include <linux/slab.h>
+#include <linux/sort.h>
+
+#include <soc/qcom/cmd-db.h>
+#include <soc/qcom/rpmh.h>
+#include <soc/qcom/tcs.h>
+
+#include "qcom-icc-ids.h"
+
+#define BCM_TCS_CMD_COMMIT_SHFT                30
+#define BCM_TCS_CMD_COMMIT_MASK                0x40000000
+#define BCM_TCS_CMD_VALID_SHFT         29
+#define BCM_TCS_CMD_VALID_MASK         0x200010000
+#define BCM_TCS_CMD_VOTE_X_SHFT                14
+#define BCM_TCS_CMD_VOTE_MASK          0x3fff
+#define BCM_TCS_CMD_VOTE_Y_SHFT                0
+#define BCM_TCS_CMD_VOTE_Y_MASK                0xfffc000
+
+#define BCM_TCS_CMD(commit, valid, vote_x, vote_y) \
+       ((commit << BCM_TCS_CMD_COMMIT_SHFT) |\
+       (valid << BCM_TCS_CMD_VALID_SHFT) |\
+       ((vote_x & BCM_TCS_CMD_VOTE_MASK) << BCM_TCS_CMD_VOTE_X_SHFT) |\
+       ((vote_y & BCM_TCS_CMD_VOTE_MASK) << BCM_TCS_CMD_VOTE_Y_SHFT))
These values that are >8 bits (vote_x and vote_y) should be converted
from cpu to little endian.
Done.

+
+#define to_qcom_provider(_provider) \
+       container_of(_provider, struct qcom_icc_provider, provider)
+
+#define DEFINE_QNODE(_name, _id, _channels, _buswidth,                 \
+                       _numlinks, ...)                                 \
+               static struct qcom_icc_node _name = {                   \
+               .id = _id,                                              \
+               .name = #_name,                                         \
+               .channels = _channels,                                  \
+               .buswidth = _buswidth,                                  \
+               .num_links = _numlinks,                                 \
+               .links = { __VA_ARGS__ },                               \
+       }
+
+#define DEFINE_QBCM(_name, _bcmname, _keepalive, _numnodes, ...)       \
+               static struct qcom_icc_bcm _name = {                    \
+               .name = _bcmname,                                       \
+               .keepalive = _keepalive,                                \
+               .num_nodes = _numnodes,                                 \
+               .nodes = { __VA_ARGS__ },                               \
+       }
+
+struct qcom_icc_provider {
+       struct icc_provider     provider;
+       void __iomem            *base;
+       struct device           *dev;
+       struct qcom_icc_bcm     **bcms;
+       size_t num_bcms;
+};
+
+/**
+ * struct bcm_db - Auxiliary data pertaining to each Bus Clock Manager(BCM)
+ * @unit: bcm threshold values are in magnitudes of this
+ * @width: prototype width
+ * @vcd: virtual clock domain that this bcm belongs to
+ */
+
+struct bcm_db {
+       u32 unit;
+       u16 width;
+       u8 vcd;
+       u8 reserved;
+};
+
+#define SDM845_MAX_LINKS       43
+#define SDM845_MAX_BCMS                30
+#define SDM845_MAX_BCM_PER_NODE        2
+#define SDM845_MAX_VCD         10
+
+/**
+ * struct qcom_icc_node - Qualcomm specific interconnect nodes
+ * @name: the node name used in debugfs
+ * @links: an array of nodes where we can go next while traversing
+ * @id: a unique node identifier
+ * @num_links: the total number of @links
+ * @channels: num of channels at this node
+ * @buswidth: width of the interconnect between a node and the bus
+ * @sum_avg: current sum aggregate value of all avg bw requests
+ * @max_peak: current max aggregate value of all peak bw requests
+ * @bcms: list of bcms associated with this logical node
+ * @num_bcm: num of @bcms
+ */
+struct qcom_icc_node {
+       const char *name;
+       u16 links[SDM845_MAX_LINKS];
+       u16 id;
+       u16 num_links;
+       u16 channels;
+       u16 buswidth;
+       u64 sum_avg;
+       u64 max_peak;
+       struct qcom_icc_bcm *bcms[SDM845_MAX_BCM_PER_NODE];
+       size_t num_bcms;
+};
+
+/**
+ * struct qcom_icc_bcm - Qualcomm specific hardware accelerator nodes
+ * known as Bus Clock Manager(BCM)
+ * @name: the bcm node name used to fetch BCM data from command db
+ * @type: latency or bandwidth bcm
+ * @addr: address offsets used when voting to RPMH
+ * @vote_x: aggregated threshold values, represents sum_bw when @type is bw bcm
+ * @vote_y: aggregated threshold values, represents peak_bw when @type is bw 
bcm
+ * @dirty: flag used to indicate whether or bcm needs to be committed
+ * @aux_data: auxiliary data used when calculating threshold values and
+ * communicating with RPMh
+ * @list: used to link to other bcms when compiling lists for commit
+ * @num_nodes: total number of @num_nodes
+ * @nodes: list of qcom_icc_nodes that this BCM encapsulates
+ */
+
+struct qcom_icc_bcm {
+       const char *name;
+       u32 type;
+       u32 addr;
+       u64 vote_x;
+       u64 vote_y;
+       bool dirty;
+       bool keepalive;
+       struct bcm_db aux_data;
+       struct list_head list;
+       size_t num_nodes;
+       struct qcom_icc_node *nodes[];
+};
+
+struct qcom_icc_fabric {
+       struct qcom_icc_node **nodes;
+       size_t num_nodes;
+       u32 base_offset;
+       u32 qos_offset;
+};
+
+struct qcom_icc_desc {
+       struct qcom_icc_node **nodes;
+       size_t num_nodes;
+       struct qcom_icc_bcm **bcms;
+       size_t num_bcms;
+};
+
...
+
+static int qcom_icc_init(struct icc_node *node)
+{
+       /* TODO: init qos and priority */
+
+       return 0;
+}
+
+static int qcom_icc_bcm_init(struct qcom_icc_bcm *bcm, struct device *dev)
+{
+       struct qcom_icc_node *qn;
+       int ret, i;
+
+       bcm->addr = cmd_db_read_addr(bcm->name);
+       if (!bcm->addr) {
+               dev_err(dev, "%s could not find RPMh address\n",
+                       bcm->name);
+               return -EINVAL;
+       }
+
+       if (!cmd_db_read_aux_data_len(bcm->name)) {
I think you should validate that the aux data length being returned is
the length you expect it to be. Or maybe "at least" the length you
expect it to be, if this structure is meant to be backwards
compatible?
Done.
+               dev_err(dev, "%s command db missing aux data\n",
+                       bcm->name);
+               return -EINVAL;
+       }
+
+       ret = cmd_db_read_aux_data(bcm->name, (u8 *)&bcm->aux_data,
+                                  sizeof(struct bcm_db));
This still doesn't work for big endian, after being read the
multi-byte members of this structure need to be converted from little
endian to cpu format.
Done. I'll convert the values to cpu format.
+       if (ret < 0) {
+               dev_err(dev, "%s command db read error (%d)\n",
+                       bcm->name, ret);
+               return ret;
+       }
+
+       for (i = 0; i < bcm->num_nodes; i++) {
This loop could use a comment describing what it's doing, which I
understand to be: Add links back to the BCM for each node in the BCM.
Done.
+               qn = bcm->nodes[i];
+               qn->bcms[qn->num_bcms] = bcm;
+               qn->num_bcms++;
+       }
+
+       return 0;
+}
+
+static int qcom_tcs_cmd_gen(struct tcs_cmd *cmd, u64 vote_x,
+                                       u64 vote_y, u32 addr, bool commit)
+{
+       int ret = 0;
+       bool valid = true;
+
+       if (!cmd)
+               return ret;
+
+       if (vote_x == 0 && vote_y == 0)
+               valid = false;
+
+       if (vote_x > BCM_TCS_CMD_VOTE_MASK)
+               vote_x = BCM_TCS_CMD_VOTE_MASK;
+
+       if (vote_y > BCM_TCS_CMD_VOTE_MASK)
+               vote_y = BCM_TCS_CMD_VOTE_MASK;
+
+       cmd->addr = addr;
+       cmd->data = BCM_TCS_CMD(commit, valid, vote_x, vote_y);
+
+       /* Set the wait for completion flag on commands that have the commit
I think the preferred style of multiline commenting has /* on its own line.
Done.
+        * set, in order to indicate to the RSC to not release the TCS slot
+        * until hardware has acknowledged that this transaction has completed
+        */
+       if (commit)
+               cmd->wait = true;
+
+       return ret;
+}
+
+static void qcom_tcs_list_gen(struct list_head *bcm_list,
+                                       struct tcs_cmd *tcs_list, int *n)
+{
+       struct qcom_icc_bcm *bcm;
+       bool commit;
+       size_t idx = 0, batch = 0, cur_vcd_size = 0;
+
+       memset(n, 0, sizeof(int) * SDM845_MAX_VCD);
+
+       list_for_each_entry(bcm, bcm_list, list) {
+               commit = false;
+               cur_vcd_size++;
+               if ((bcm->aux_data.vcd !=
+                       list_next_entry(bcm, list)->aux_data.vcd) ||
+                       list_is_last(&bcm->list, bcm_list)) {
You should switch the order of these conditions. Otherwise for the
last node you end up reaching through the list head object to get
aux_data.vcd, which is a wild memory access.
In my mind at the time, it didn't really matter that the last member compared itself against head, since it would have a different VCD anyways unless there's only a single VCD in the entire commit list, which is what the list_is_list check takes care of. Though now that you mention it, it shouldn't need to compare at all if it sees that it's the last entry. I'll swap them.
+                       commit = true;
+                       cur_vcd_size = 0;
+               }
+               qcom_tcs_cmd_gen(&tcs_list[idx], bcm->vote_x, bcm->vote_y,
+                               bcm->addr, commit);
+               idx++;
+               n[batch]++;
+               if (n[batch] >= MAX_RPMH_PAYLOAD) {
+                       if (!commit) {
+                               n[batch] -= cur_vcd_size;
+                               n[batch+1] = cur_vcd_size;
+                       }
+                       batch++;
I think I have my head around this, but it at least needs a comment
describing what it's doing, because it's still mind boggling. My
understanding is: "Avoid splitting requests for the same BCM across
multiple RPMh payloads. If the current set of BCM requests would be
split, move it to the next batch."
I agree that the logic here gets a bit busy, will add comments to clarify.

I would also include a warning if cur_vcd_size is > MAX_RPMH_PAYLOAD,
or if n[batch] <= cur_vcd_size. This would help with readability, and
help catch any sort of crazy situation not anticipated by this logic.
hm, I think cur_vcd_size is > MAX_RPMH_PAYLOAD is a useful check if somehow we got bad data to begin with, n[batch] <= cur_vcd_size is only a useful check when cur_vcd_size is > MAX_RPMH_PAYLOAD, since n[batch] == cur_vcd_size can be valid if cur_vcd_size == MAX_RPMH_PAYLOAD.
+               }
+       }
+}
+
+static void qcom_icc_bcm_aggregate(struct qcom_icc_bcm *bcm)
+{
+       size_t i;
+       u64 agg_avg = 0;
+       u64 agg_peak = 0;
+
+       for (i = 0; i < bcm->num_nodes; i++) {
+               agg_avg = max(agg_avg,
+                       bcm->nodes[i]->sum_avg * bcm->aux_data.width /
+                       (bcm->nodes[i]->buswidth * bcm->nodes[i]->channels));
+               agg_peak = max(agg_peak,
+                       bcm->nodes[i]->max_peak * bcm->aux_data.width /
+                       bcm->nodes[i]->buswidth);
+       }
+
+       bcm->vote_x = (u64)(agg_avg * 1000ULL / bcm->aux_data.unit);
+       bcm->vote_y = (u64)(agg_peak * 1000ULL / bcm->aux_data.unit);
+
+       if (bcm->keepalive && bcm->vote_x == 0 && bcm->vote_y == 0) {
+               bcm->vote_x = 1;
+               bcm->vote_y = 1;
+       }
+
+       bcm->dirty = false;
+}
+
+static int qcom_icc_aggregate(struct icc_node *node, u32 avg_bw,
+                               u32 peak_bw, u32 *agg_avg, u32 *agg_peak)
+{
+       size_t i;
+       struct qcom_icc_node *qn;
+
+       qn = node->data;
+
+       *agg_avg += avg_bw;
+       *agg_peak = max_t(u64, agg_peak, peak_bw);
+
+       qn->sum_avg = *agg_avg;
+       qn->max_peak = *agg_peak;
+
+       for (i = 0; i < qn->num_bcms; i++)
+               qn->bcms[i]->dirty = true;
+
+       return 0;
+}
+
+static int qcom_icc_set(struct icc_node *src, struct icc_node *dst,
+                       u32 avg, u32 peak)
+{
+       struct qcom_icc_provider *qp;
+       struct qcom_icc_node *qn;
+       struct icc_node *node;
+       struct icc_provider *provider;
+       struct tcs_cmd cmds[SDM845_MAX_BCMS];
+       struct list_head commit_list;
+       int commit_idx[SDM845_MAX_VCD];
+       int ret = 0, i;
+
+       if (!src)
+               node = dst;
+       else
+               node = src;
+
+       qn = node->data;
+       provider = node->provider;
+       qp = to_qcom_provider(node->provider);
+
+       INIT_LIST_HEAD(&commit_list);
+
+       for (i = 0; i < qp->num_bcms; i++) {
+               if (qp->bcms[i]->dirty) {
+                       qcom_icc_bcm_aggregate(qp->bcms[i]);
+                       list_add_tail(&qp->bcms[i]->list, &commit_list);
+               }
+       }
+
+       /* Construct the command list based on a pre ordered list of BCMs
Another networking-style comment.
Done.

+        * based on VCD
period?
Done.

+        */
+       qcom_tcs_list_gen(&commit_list, cmds, commit_idx);
+
+       if (!commit_idx[0])
+               return ret;
+
+       ret = rpmh_invalidate(qp->dev);
+       if (ret) {
+               pr_err("Error invalidating RPMH client (%d)\n", ret);
+               return ret;
+       }
+
+       ret = rpmh_write_batch(qp->dev, RPMH_ACTIVE_ONLY_STATE,
+                              cmds, commit_idx);
+       if (ret) {
+               pr_err("Error sending AMC RPMH requests (%d)\n", ret);
+               return ret;
+       }
+
+       /* TODO: collect and send wake and sleep sets */
+       return ret;
+}
+
+static int cmp_vcd(const void *_l, const void *_r)
+{
+       const struct qcom_icc_bcm **l = (const struct qcom_icc_bcm **)_l;
+       const struct qcom_icc_bcm **r = (const struct qcom_icc_bcm **)_r;
+
+       if (l[0]->aux_data.vcd < r[0]->aux_data.vcd)
+               return -1;
+       else if (l[0]->aux_data.vcd == r[0]->aux_data.vcd)
+               return 0;
+       else
+               return 1;
+}
+
+static int qnoc_probe(struct platform_device *pdev)
+{
+       const struct qcom_icc_desc *desc;
+       struct qcom_icc_node **qnodes;
+       struct qcom_icc_provider *qp;
+       struct icc_provider *provider;
+       size_t num_nodes, i;
+       int ret;
+
+       desc = of_device_get_match_data(&pdev->dev);
+       if (!desc)
+               return -EINVAL;
+
+       qnodes = desc->nodes;
+       num_nodes = desc->num_nodes;
+
+       qp = devm_kzalloc(&pdev->dev, sizeof(*qp), GFP_KERNEL);
+       if (!qp)
+               return -ENOMEM;
+
+       provider = &qp->provider;
+       provider->dev = &pdev->dev;
+       provider->set = &qcom_icc_set;
+       provider->aggregate = &qcom_icc_aggregate;
+       INIT_LIST_HEAD(&provider->nodes);
+       provider->data = qp;
+
+       qp->dev = &pdev->dev;
+       qp->bcms = desc->bcms;
+       qp->num_bcms = desc->num_bcms;
+
+       ret = icc_provider_add(provider);
+       if (ret) {
+               dev_err(&pdev->dev, "error adding interconnect provider\n");
+               return ret;
+       }
+
+       for (i = 0; i < num_nodes; i++) {
+               struct icc_node *node;
+               int ret;
+               size_t j;
+
+               node = icc_node_create(qnodes[i]->id);
+               if (IS_ERR(node)) {
+                       ret = PTR_ERR(node);
+                       goto err;
I think you need to clean up the nodes you've already created and
added, otherwise provider_del will end up printing a warning and
failing.
Done.
+               }
+
+               node->name = qnodes[i]->name;
+               node->data = qnodes[i];
+               icc_node_add(node, provider);
+
+               dev_dbg(&pdev->dev, "registered node %p %s %d\n", node,
+                       qnodes[i]->name, node->id);
+
+               ret = qcom_icc_init(node);
+               if (ret)
+                       dev_err(&pdev->dev, "%s init error (%d)\n", node->name,
+                               ret);
+
+               /* populate links */
+               for (j = 0; j < qnodes[i]->num_links; j++)
+                       if (qnodes[i]->links[j])
+                               icc_link_create(node, qnodes[i]->links[j]);
+       }
+
+       for (i = 0; i < qp->num_bcms; i++)
+               qcom_icc_bcm_init(qp->bcms[i], &pdev->dev);
+
+       /* Pre sort the BCMs based on VCD for ease of generating a command list
Another comment that needs the /* line on its own. It turns out I do
this a lot too :)
Done.
+        * that groups the BCMs with the same VCD together. VCDs are numbered
+        * with lowest being the most expensive time wise, ensuring that
+        * those commands are being sent the earliest in the queue.
+        */
+       sort(qp->bcms, qp->num_bcms, sizeof(*qp->bcms), cmp_vcd, NULL);
+
+       platform_set_drvdata(pdev, provider);
+       dev_info(&pdev->dev, "Registered SDM845 ICC\n");
+
+       return ret;
+err:
+       icc_provider_del(provider);
+       return ret;
+}
+
+static int qnoc_remove(struct platform_device *pdev)
+{
+       struct icc_provider *provider = platform_get_drvdata(pdev);
+
+       icc_provider_del(provider);
Don't you need to tear all the nodes down too? Otherwise this function
will fail. Should you check the return value as well and complain at
least, or maybe fail qnoc_remove entirely?
Done.
+
+       return 0;
+}
+
+static const struct of_device_id qnoc_of_match[] = {
+       { .compatible = "qcom,sdm845-rsc-hlos", .data = &sdm845_rsc_hlos },
+       { },
+};
+MODULE_DEVICE_TABLE(of, qnoc_of_match);
+
+static struct platform_driver qnoc_driver = {
+       .probe = qnoc_probe,
+       .remove = qnoc_remove,
+       .driver = {
+               .name = "qnoc-sdm845",
+               .of_match_table = qnoc_of_match,
+       },
+};
+module_platform_driver(qnoc_driver);
+
+MODULE_AUTHOR("David Dai <daidav...@codeaurora.org>");
+MODULE_DESCRIPTION("Qualcomm sdm845 NoC driver");
+MODULE_LICENSE("GPL v2");

--
The Qualcomm Innovation Center, Inc. is a member of the Code Aurora Forum,
a Linux Foundation Collaborative Project

Reply via email to