dlock-list: Distributed and lock-protected lists

Boqun Feng Mon, 09 Oct 2017 22:35:12 -0700

On Thu, Oct 05, 2017 at 06:43:23PM +0000, Waiman Long wrote:
[...]
> +/*
> + * As all the locks in the dlock list are dynamically allocated, they need
> + * to belong to their own special lock class to avoid warning and stack
> + * trace in kernel log when lockdep is enabled. Statically allocated locks
> + * don't have this problem.
> + */
> +static struct lock_class_key dlock_list_key;
> +


So in this way, you make all dlock_lists share the same lock_class_key,
which means if there are two structures:

        struct some_a {
                ...
                struct dlock_list_heads dlists;
        };

        struct some_b {
                ...
                struct dlock_list_heads dlists;
        };

some_a::dlists and some_b::dlists are going to have the same lockdep
key, is this what you want? If not, you may want to do something like
init_srcu_struct() does.

> +/*
> + * Initialize cpu2idx mapping table
> + *
> + * It is possible that a dlock-list can be allocated before the cpu2idx is
> + * initialized. In this case, all the cpus are mapped to the first entry
> + * before initialization.
> + *
> + */
> +static int __init cpu2idx_init(void)
> +{
> +     int idx, cpu;
> +
> +     idx = 0;
> +     for_each_possible_cpu(cpu)
> +             per_cpu(cpu2idx, cpu) = idx++;
> +     return 0;
> +}
> +postcore_initcall(cpu2idx_init);
> +
> +/**
> + * alloc_dlock_list_heads - Initialize and allocate the list of head entries
> + * @dlist: Pointer to the dlock_list_heads structure to be initialized
> + * Return: 0 if successful, -ENOMEM if memory allocation error
> + *
> + * This function does not allocate the dlock_list_heads structure itself. The
> + * callers will have to do their own memory allocation, if necessary. 
> However,
> + * this allows embedding the dlock_list_heads structure directly into other
> + * structures.
> + */
> +int alloc_dlock_list_heads(struct dlock_list_heads *dlist)
> +{
> +     int idx;
> +
> +     dlist->heads = kcalloc(nr_cpu_ids, sizeof(struct dlock_list_head),
> +                            GFP_KERNEL);
> +
> +     if (!dlist->heads)
> +             return -ENOMEM;
> +
> +     for (idx = 0; idx < nr_cpu_ids; idx++) {
> +             struct dlock_list_head *head = &dlist->heads[idx];
> +
> +             INIT_LIST_HEAD(&head->list);
> +             head->lock = __SPIN_LOCK_UNLOCKED(&head->lock);
> +             lockdep_set_class(&head->lock, &dlock_list_key);
> +     }
> +     return 0;
> +}
> +
> +/**
> + * free_dlock_list_heads - Free all the heads entries of the dlock list
> + * @dlist: Pointer of the dlock_list_heads structure to be freed
> + *
> + * This function doesn't free the dlock_list_heads structure itself. So
> + * the caller will have to do it, if necessary.
> + */
> +void free_dlock_list_heads(struct dlock_list_heads *dlist)
> +{
> +     kfree(dlist->heads);
> +     dlist->heads = NULL;
> +}
> +
> +/**
> + * dlock_lists_empty - Check if all the dlock lists are empty
> + * @dlist: Pointer to the dlock_list_heads structure
> + * Return: true if list is empty, false otherwise.
> + *
> + * This can be a pretty expensive function call. If this function is required
> + * in a performance critical path, we may have to maintain a global count
> + * of the list entries in the global dlock_list_heads structure instead.
> + */
> +bool dlock_lists_empty(struct dlock_list_heads *dlist)
> +{
> +     int idx;
> +
> +     for (idx = 0; idx < nr_cpu_ids; idx++)
> +             if (!list_empty(&dlist->heads[idx].list))
> +                     return false;
> +     return true;
> +}
> +
> +/**
> + * dlock_lists_add - Adds a node to the given dlock list
> + * @node : The node to be added
> + * @dlist: The dlock list where the node is to be added
> + *
> + * List selection is based on the CPU being used when the dlock_list_add()
> + * function is called. However, deletion may be done by a different CPU.
> + */
> +void dlock_lists_add(struct dlock_list_node *node,
> +                  struct dlock_list_heads *dlist)
> +{
> +     struct dlock_list_head *head = &dlist->heads[this_cpu_read(cpu2idx)];
> +
> +     /*
> +      * There is no need to disable preemption
> +      */
> +     spin_lock(&head->lock);
> +     node->head = head;
> +     list_add(&node->list, &head->list);
> +     spin_unlock(&head->lock);
> +}
> +
> +/**
> + * dlock_lists_del - Delete a node from a dlock list
> + * @node : The node to be deleted
> + *
> + * We need to check the lock pointer again after taking the lock to guard
> + * against concurrent deletion of the same node. If the lock pointer changes
> + * (becomes NULL or to a different one), we assume that the deletion was done
> + * elsewhere. A warning will be printed if this happens as it is likely to be
> + * a bug.
> + */
> +void dlock_lists_del(struct dlock_list_node *node)
> +{
> +     struct dlock_list_head *head;
> +     bool retry;
> +
> +     do {
> +             head = READ_ONCE(node->head);

Since we read node->head locklessly here, I think we should use
WRITE_ONCE() for all the stores of node->head, to avoid store tearings?

Regards,
Boqun

> +             if (WARN_ONCE(!head, "%s: node 0x%lx has no associated head\n",
> +                           __func__, (unsigned long)node))
> +                     return;
> +
> +             spin_lock(&head->lock);
> +             if (likely(head == node->head)) {
> +                     list_del_init(&node->list);
> +                     node->head = NULL;
> +                     retry = false;
> +             } else {
> +                     /*
> +                      * The lock has somehow changed. Retry again if it is
> +                      * not NULL. Otherwise, just ignore the delete
> +                      * operation.
> +                      */
> +                     retry = (node->head != NULL);
> +             }
> +             spin_unlock(&head->lock);
> +     } while (retry);
> +}
> +
[...]

signature.asc
Description: PGP signature

Re: [PATCH v7 1/6] lib/dlock-list: Distributed and lock-protected lists

Reply via email to