Hi Evan, Thanks for helping to improve this!
On 07/11/2018 01:34 AM, Evan Green wrote: > Ahoy Georgi! > On Mon, Jul 9, 2018 at 8:51 AM Georgi Djakov <georgi.dja...@linaro.org> wrote: >> >> This patch introduces a new API to get requirements and configure the >> interconnect buses across the entire chipset to fit with the current >> demand. >> >> The API is using a consumer/provider-based model, where the providers are >> the interconnect buses and the consumers could be various drivers. >> The consumers request interconnect resources (path) between endpoints and >> set the desired constraints on this data flow path. The providers receive >> requests from consumers and aggregate these requests for all master-slave >> pairs on that path. Then the providers configure each participating in the >> topology node according to the requested data flow path, physical links and >> constraints. The topology could be complicated and multi-tiered and is SoC >> specific. >> >> Signed-off-by: Georgi Djakov <georgi.dja...@linaro.org> >> --- [..] >> +Interconnect node is the software definition of the interconnect hardware >> +port. Each interconnect provider consists of multiple interconnect nodes, >> +which are connected to other SoC components including other interconnect >> +providers. The point on the diagram where the CPUs connects to the memory is > > CPUs connect Ok. [..] >> + >> +#include <linux/device.h> >> +#include <linux/idr.h> >> +#include <linux/init.h> >> +#include <linux/interconnect.h> >> +#include <linux/interconnect-provider.h> >> +#include <linux/list.h> >> +#include <linux/module.h> >> +#include <linux/mutex.h> > > I needed to add #include <linux/overflow.h> to get struct_size() (used > in path_init) in order to get this to compile, but maybe my kernel is > missing some upstream picks. Yes, should be included. >> +#include <linux/slab.h> >> + >> +static DEFINE_IDR(icc_idr); >> +static LIST_HEAD(icc_provider_list); >> +static DEFINE_MUTEX(icc_lock); >> + >> +/** >> + * struct icc_req - constraints that are attached to each node >> + * >> + * @req_node: entry in list of requests for the particular @node >> + * @node: the interconnect node to which this constraint applies >> + * @dev: reference to the device that sets the constraints >> + * @avg_bw: an integer describing the average bandwidth in kbps >> + * @peak_bw: an integer describing the peak bandwidth in kbps >> + */ >> +struct icc_req { >> + struct hlist_node req_node; >> + struct icc_node *node; >> + struct device *dev; >> + u32 avg_bw; >> + u32 peak_bw; >> +}; >> + >> +/** >> + * struct icc_path - interconnect path structure >> + * @num_nodes: number of hops (nodes) >> + * @reqs: array of the requests applicable to this path of nodes >> + */ >> +struct icc_path { >> + size_t num_nodes; >> + struct icc_req reqs[]; >> +}; >> + >> +static struct icc_node *node_find(const int id) >> +{ >> + return idr_find(&icc_idr, id); > > Wasn't there going to be a warning if the mutex is not held? I think that it would be really useful if the functions are exported, but for now let's skip it. >> +} >> + >> +static struct icc_path *path_init(struct device *dev, struct icc_node *dst, >> + ssize_t num_nodes) >> +{ >> + struct icc_node *node = dst; >> + struct icc_path *path; >> + size_t i; >> + >> + path = kzalloc(struct_size(path, reqs, num_nodes), GFP_KERNEL); >> + if (!path) >> + return ERR_PTR(-ENOMEM); >> + >> + path->num_nodes = num_nodes; >> + > > There should probably also be a warning here about holding the lock, > since you're modifying node->req_list. This is called only by path_find() with the lock held. >> + for (i = 0; i < num_nodes; i++) { >> + hlist_add_head(&path->reqs[i].req_node, &node->req_list); >> + >> + path->reqs[i].node = node; >> + path->reqs[i].dev = dev; >> + /* reference to previous node was saved during path >> traversal */ >> + node = node->reverse; >> + } >> + >> + return path; >> +} >> + >> +static struct icc_path *path_find(struct device *dev, struct icc_node *src, >> + struct icc_node *dst) >> +{ >> + struct icc_node *n, *node = NULL; >> + struct icc_provider *provider; >> + struct list_head traverse_list; >> + struct list_head edge_list; >> + struct list_head visited_list; >> + size_t i, depth = 1; >> + bool found = false; >> + int ret = -EPROBE_DEFER; >> + >> + INIT_LIST_HEAD(&traverse_list); >> + INIT_LIST_HEAD(&edge_list); >> + INIT_LIST_HEAD(&visited_list); >> + > > A warning here too about holding the lock would also be good, since > multiple people in here at once would be bad. This is only called by icc_get() with locked mutex. >> + list_add_tail(&src->search_list, &traverse_list); >> + src->reverse = NULL; >> + >> + do { >> + list_for_each_entry_safe(node, n, &traverse_list, >> search_list) { >> + if (node == dst) { >> + found = true; >> + list_add(&node->search_list, &visited_list); >> + break; >> + } >> + for (i = 0; i < node->num_links; i++) { >> + struct icc_node *tmp = node->links[i]; >> + >> + if (!tmp) { >> + ret = -ENOENT; >> + goto out; >> + } >> + >> + if (tmp->is_traversed) >> + continue; >> + >> + tmp->is_traversed = true; >> + tmp->reverse = node; >> + list_add(&tmp->search_list, &edge_list); >> + } >> + } >> + if (found) >> + break; >> + >> + list_splice_init(&traverse_list, &visited_list); >> + list_splice_init(&edge_list, &traverse_list); >> + >> + /* count the hops including the source */ >> + depth++; >> + >> + } while (!list_empty(&traverse_list)); >> + >> +out: >> + /* reset the traversed state */ >> + list_for_each_entry(provider, &icc_provider_list, provider_list) >> + list_for_each_entry(n, &provider->nodes, node_list) >> + n->is_traversed = false; > > I think I missed this on the last round. I thought you had been > keeping visited_list specifically so you could use it to reset > is_traversed here. But now it looks like you're going through the > entire graph. What happened? Hm, will review and fix. >> + >> + if (found) { >> + struct icc_path *path = path_init(dev, dst, depth); >> + >> + if (IS_ERR(path)) >> + return path; >> + >> + for (i = 0; i < path->num_nodes; i++) { >> + node = path->reqs[i].node; >> + node->provider->users++; > > Hm, should this go in path_init as well? What do you think? You sort > of become a user once you tack your path.req_node on the > node.req_list. Ok, will move it. >> + } >> + return path; >> + } >> + >> + return ERR_PTR(ret); >> +} >> + >> +/* >> + * We want the path to honor all bandwidth requests, so the average >> + * bandwidth requirements from each consumer are aggregated at each node >> + * and provider level. By default the average bandwidth is the sum of all >> + * averages and the peak will be the highest of all peak bandwidth requests. >> + */ >> + >> +static int aggregate_requests(struct icc_node *node) >> +{ >> + struct icc_provider *p = node->provider; >> + struct icc_req *r; >> + >> + node->avg_bw = 0; >> + node->peak_bw = 0; >> + >> + hlist_for_each_entry(r, &node->req_list, req_node) >> + p->aggregate(node, r->avg_bw, r->peak_bw, >> + &node->avg_bw, &node->peak_bw); >> + >> + return 0; >> +} > > This doesn't have to be addressed in this series, but I wonder if the > aggregate() callback should be made aware of whether its aggregating > requests within a node, or nodes within a provider? Right now the > aggregate callback has no way of knowing what it's aggregating for; I > guess the question is: might it need to? I'm unsure. Currently the platforms that would be using this do not need this differentiation, but this can be revised if needed in the future. >> + >> +static void aggregate_provider(struct icc_provider *p) >> +{ >> + struct icc_node *n; >> + >> + p->avg_bw = 0; >> + p->peak_bw = 0; >> + >> + list_for_each_entry(n, &p->nodes, node_list) >> + p->aggregate(n, n->avg_bw, n->peak_bw, >> + &p->avg_bw, &p->peak_bw); >> +} >> + >> +static int apply_constraints(struct icc_path *path) >> +{ >> + struct icc_node *next, *prev = NULL; >> + int ret; >> + int i; >> + >> + for (i = 0; i < path->num_nodes; i++, prev = next) { >> + struct icc_provider *p; >> + >> + next = path->reqs[i].node; >> + /* >> + * Both endpoints should be valid master-slave pairs of the >> + * same interconnect provider that will be configured. >> + */ >> + if (!prev || next->provider != prev->provider) >> + continue; >> + >> + p = next->provider; >> + >> + aggregate_provider(p); >> + >> + /* set the constraints */ >> + ret = p->set(prev, next, p->avg_bw, p->peak_bw); >> + if (ret) >> + goto out; >> + } >> +out: >> + return ret; >> +} >> + >> +/** >> + * icc_set() - set constraints on an interconnect path between two endpoints >> + * @path: reference to the path returned by icc_get() >> + * @avg_bw: average bandwidth in kbps >> + * @peak_bw: peak bandwidth in kbps >> + * >> + * This function is used by an interconnect consumer to express its own >> needs >> + * in terms of bandwidth for a previously requested path between two >> endpoints. >> + * The requests are aggregated and each node is updated accordingly. The >> entire >> + * path is locked by a mutex to ensure that the set() is completed. >> + * The @path can be NULL when the "interconnects" DT properties is missing, >> + * which will mean that no constraints will be set. >> + * >> + * Returns 0 on success, or an appropriate error code otherwise. >> + */ >> +int icc_set(struct icc_path *path, u32 avg_bw, u32 peak_bw) >> +{ >> + struct icc_node *node; >> + struct icc_provider *p; >> + size_t i; >> + int ret; >> + >> + if (!path) >> + return 0; >> + >> + mutex_lock(&icc_lock); >> + >> + for (i = 0; i < path->num_nodes; i++) { >> + node = path->reqs[i].node; >> + p = node->provider; >> + >> + /* update the consumer request for this path */ >> + path->reqs[i].avg_bw = avg_bw; >> + path->reqs[i].peak_bw = peak_bw; >> + >> + /* aggregate requests for this node */ >> + aggregate_requests(node); >> + } >> + >> + ret = apply_constraints(path); >> + if (ret) >> + pr_err("interconnect: error applying constraints (%d)", ret); >> + >> + mutex_unlock(&icc_lock); >> + >> + return ret; >> +} >> +EXPORT_SYMBOL_GPL(icc_set); >> + >> +/** >> + * icc_get() - return a handle for path between two endpoints >> + * @dev: the device requesting the path >> + * @src_id: source device port id >> + * @dst_id: destination device port id >> + * >> + * This function will search for a path between two endpoints and return an >> + * icc_path handle on success. Use icc_put() to release >> + * constraints when the they are not needed anymore. >> + * >> + * Return: icc_path pointer on success, or ERR_PTR() on error >> + */ >> +struct icc_path *icc_get(struct device *dev, const int src_id, const int >> dst_id) >> +{ >> + struct icc_node *src, *dst; >> + struct icc_path *path = ERR_PTR(-EPROBE_DEFER); >> + >> + mutex_lock(&icc_lock); >> + >> + src = node_find(src_id); >> + if (!src) >> + goto out; >> + >> + dst = node_find(dst_id); >> + if (!dst) >> + goto out; >> + >> + path = path_find(dev, src, dst); >> + if (IS_ERR(path)) >> + dev_err(dev, "%s: invalid path=%ld\n", __func__, >> PTR_ERR(path)); >> + >> +out: >> + mutex_unlock(&icc_lock); >> + return path; >> +} >> +EXPORT_SYMBOL_GPL(icc_get); >> + >> +/** >> + * icc_put() - release the reference to the icc_path >> + * @path: interconnect path >> + * >> + * Use this function to release the constraints on a path when the path is >> + * no longer needed. The constraints will be re-aggregated. >> + */ >> +void icc_put(struct icc_path *path) >> +{ >> + struct icc_node *node; >> + size_t i; >> + int ret; >> + >> + if (!path || WARN_ON(IS_ERR(path))) >> + return; >> + >> + ret = icc_set(path, 0, 0); >> + if (ret) >> + pr_err("%s: error (%d)\n", __func__, ret); >> + >> + mutex_lock(&icc_lock); >> + for (i = 0; i < path->num_nodes; i++) { >> + node = path->reqs[i].node; >> + hlist_del(&path->reqs[i].req_node); >> + > > Maybe a warning if users is zero? Yes, good idea. >> + node->provider->users--; >> + } >> + mutex_unlock(&icc_lock); >> + >> + kfree(path); >> +} >> +EXPORT_SYMBOL_GPL(icc_put); >> + >> +static struct icc_node *icc_node_create_nolock(int id) >> +{ >> + struct icc_node *node; >> + >> + /* check if node already exists */ >> + node = node_find(id); >> + if (node) >> + goto out; >> + >> + node = kzalloc(sizeof(*node), GFP_KERNEL); >> + if (!node) { >> + node = ERR_PTR(-ENOMEM); >> + goto out; >> + } >> + >> + id = idr_alloc(&icc_idr, node, id, id + 1, GFP_KERNEL); >> + if (WARN(id < 0, "couldn't get idr")) { >> + kfree(node); >> + node = ERR_PTR(id); >> + goto out; >> + } >> + >> + node->id = id; >> + >> +out: >> + return node; >> +} >> + >> +/** >> + * icc_node_create() - create a node >> + * @id: node id >> + * >> + * Return: icc_node pointer on success, or ERR_PTR() on error >> + */ >> +struct icc_node *icc_node_create(int id) >> +{ >> + struct icc_node *node; >> + >> + mutex_lock(&icc_lock); >> + >> + node = icc_node_create_nolock(id); >> + >> + mutex_unlock(&icc_lock); >> + >> + return node; >> +} >> +EXPORT_SYMBOL_GPL(icc_node_create); >> + >> +/** >> + * icc_node_destroy() - destroy a node >> + * @id: node id >> + * >> + */ >> +void icc_node_destroy(int id) >> +{ >> + struct icc_node *node; >> + >> + node = node_find(id); >> + if (node) { >> + mutex_lock(&icc_lock); > > mutex_lock should be moved above node_find, since node_find needs the lock > held. Ok. >> + idr_remove(&icc_idr, node->id); >> + WARN_ON(!hlist_empty(&node->req_list)); >> + mutex_unlock(&icc_lock); >> + } >> + >> + kfree(node); >> +} >> +EXPORT_SYMBOL_GPL(icc_node_destroy); >> + >> +/** >> + * icc_link_create() - create a link between two nodes >> + * @src_id: source node id >> + * @dst_id: destination node id >> + * >> + * Create a link between two nodes. The nodes might belong to different >> + * interconnect providers and the @dst_id node might not exist (if the >> + * provider driver has not probed yet). So just create the @dst_id node >> + * and when the actual provider driver is probed, the rest of the node >> + * data is filled. >> + * >> + * Return: 0 on success, or an error code otherwise >> + */ >> +int icc_link_create(struct icc_node *node, const int dst_id) >> +{ >> + struct icc_node *dst; >> + struct icc_node **new; >> + int ret = 0; >> + >> + if (!node->provider) >> + return -EINVAL; >> + >> + mutex_lock(&icc_lock); >> + >> + dst = node_find(dst_id); >> + if (!dst) { >> + dst = icc_node_create_nolock(dst_id); >> + >> + if (IS_ERR(dst)) { >> + ret = PTR_ERR(dst); >> + goto out; >> + } >> + } >> + >> + new = krealloc(node->links, >> + (node->num_links + 1) * sizeof(*node->links), >> + GFP_KERNEL); >> + if (!new) { >> + ret = -ENOMEM; >> + goto out; >> + } >> + >> + node->links = new; >> + node->links[node->num_links++] = dst; >> + >> +out: >> + mutex_unlock(&icc_lock); >> + >> + return ret; >> +} >> +EXPORT_SYMBOL_GPL(icc_link_create); >> + >> +/** >> + * icc_link_destroy() - destroy a link between two nodes >> + * @src: pointer to source node >> + * @dst: pointer to destination node >> + * >> + * Return: 0 on success, or an error code otherwise >> + */ >> +int icc_link_destroy(struct icc_node *src, struct icc_node *dst) >> +{ >> + struct icc_node **new; >> + struct icc_node *last; >> + int ret = 0; >> + size_t slot; >> + >> + if (IS_ERR_OR_NULL(src)) >> + return -EINVAL; >> + >> + if (IS_ERR_OR_NULL(dst)) >> + return -EINVAL; >> + >> + mutex_lock(&icc_lock); >> + >> + for (slot = 0; slot < src->num_links; slot++) >> + if (src->links[slot] == dst) >> + break; >> + > > How about a warning or failure if slot == src->num_links, meaning > someone is trying to tear down a link they never set up. Ok. >> + last = src->links[src->num_links]; > > Shouldn't it be src->num_links - 1? Yes, indeed. >> + >> + new = krealloc(src->links, >> + (src->num_links - 1) * sizeof(*src->links), >> + GFP_KERNEL); >> + if (!new) { >> + ret = -ENOMEM; >> + goto out; > > It's technically not really a problem if this realloc fails, right? > Your old array should still be valid, and it's big enough to hold > everything you wanted. Just only assign src->link = new if realloc > succeeds. > >> + } >> + >> + src->links = new; >> + >> + if (slot < src->num_links - 1) >> + /* move the last element to the slot that was freed */ >> + src->links[slot] = last; > > If you moved this above the realloc, then you could do away with the > conditional part of it, since at worst it would end up being: > src->links[num_links - 1] = src->links[num_links - 1]; which is a > no-op. You also wouldn't need the "last" local either. Ok. Will simplify it! Thanks, Georgi