On Tue, 2009-02-17 at 16:59 -0800, Eric Anholt wrote:
> The basic problem was
> mmap_sem (do_mmap()) -> struct_mutex (drm_gem_mmap(), i915_gem_fault())
> struct_mutex (i915_gem_execbuffer()) -> mmap_sem (copy_from/to_user())

That's not the only problem, there's also:

dup_mmap()
  down_write(mmap_sem)
  vm_ops->open() -> drm_vm_open()
    mutex_lock(struct_mutex);

> We have plenty of places where we want to hold device state the same
> (struct_mutex) while we move a non-trivial amount of data
> (copy_from/to_user()), such as i915_gem_pwrite().  Solve this by moving the
> easy things that needed struct_mutex with mmap_sem held to using a lock to
> cover just those data structures (offset hash and offset manager), and do
> trylock and reschedule in fault.

So we establish,

  mmap_sem
    offset_mutex

  i915_gem_mmap_gtt_ioctl()
    mutex_lock(struct_mutex)
    i915_gem_create_mmap_offset()
      mutex_lock(offset_mutex)

However we still have

  struct_mutex
    mmap_sem

in basically every copy_*_user() case

But you cannot seem to switch ->fault() to use offset_mutex, which would
work out the inversion because you then have:

  struct_mutex
    mmap_sem
      offset_mutex

So why bother with the offset_mutex? Instead you make your ->fault()
fail randomly.

I'm not sure what Wang Chen sees after this patch, but I should not be
the exact same splat, still it would not at all surprise me if there's
plenty left.

The locking looks very fragile and I don't think this patch is helping
anything, sorry.

> Signed-off-by: Eric Anholt <e...@anholt.net>
> ---
>  drivers/gpu/drm/drm_gem.c       |    8 ++++----
>  drivers/gpu/drm/i915/i915_gem.c |   15 ++++++++++++++-
>  include/drm/drmP.h              |    1 +
>  3 files changed, 19 insertions(+), 5 deletions(-)
> 
> diff --git a/drivers/gpu/drm/drm_gem.c b/drivers/gpu/drm/drm_gem.c
> index 88d3368..13a0184 100644
> --- a/drivers/gpu/drm/drm_gem.c
> +++ b/drivers/gpu/drm/drm_gem.c
> @@ -97,6 +97,7 @@ drm_gem_init(struct drm_device *dev)
>  
>       dev->mm_private = mm;
>  
> +     mutex_init(&mm->offset_mutex);
>       if (drm_ht_create(&mm->offset_hash, 19)) {
>               drm_free(mm, sizeof(struct drm_gem_mm), DRM_MEM_MM);
>               return -ENOMEM;
> @@ -508,10 +509,9 @@ int drm_gem_mmap(struct file *filp, struct 
> vm_area_struct *vma)
>       unsigned long prot;
>       int ret = 0;
>  
> -     mutex_lock(&dev->struct_mutex);
> -
> +     mutex_lock(&mm->offset_mutex);
>       if (drm_ht_find_item(&mm->offset_hash, vma->vm_pgoff, &hash)) {
> -             mutex_unlock(&dev->struct_mutex);
> +             mutex_unlock(&mm->offset_mutex);
>               return drm_mmap(filp, vma);
>       }
>  
> @@ -556,7 +556,7 @@ int drm_gem_mmap(struct file *filp, struct vm_area_struct 
> *vma)
>       drm_vm_open_locked(vma);
>  
>  out_unlock:
> -     mutex_unlock(&dev->struct_mutex);
> +     mutex_unlock(&mm->offset_mutex);
>  
>       return ret;
>  }
> diff --git a/drivers/gpu/drm/i915/i915_gem.c b/drivers/gpu/drm/i915/i915_gem.c
> index ac534c9..da9a2cb 100644
> --- a/drivers/gpu/drm/i915/i915_gem.c
> +++ b/drivers/gpu/drm/i915/i915_gem.c
> @@ -573,8 +573,16 @@ int i915_gem_fault(struct vm_area_struct *vma, struct 
> vm_fault *vmf)
>       page_offset = ((unsigned long)vmf->virtual_address - vma->vm_start) >>
>               PAGE_SHIFT;
>  
> +     /* Get the struct mutex before accessing GEM data structures, but
> +      * keep the struct_mutex -> mmap_sem lock ordering so that we don't
> +      * need to mangle pwrite/pread to allow mmap_sem -> struct_mutex.
> +      */
> +     if (!mutex_trylock(&dev->struct_mutex)) {
> +             need_resched();
> +             return VM_FAULT_NOPAGE;
> +     }

So we just fail the fault if someone happens to hold the struct_mutex?
Seems rather fragile, could be another thread doing an ioctl.

>       /* Now bind it into the GTT if needed */
> -     mutex_lock(&dev->struct_mutex);
>       if (!obj_priv->gtt_space) {
>               ret = i915_gem_object_bind_to_gtt(obj, obj_priv->gtt_alignment);
>               if (ret) {


> @@ -646,6 +654,7 @@ i915_gem_create_mmap_offset(struct drm_gem_object *obj)
>       map->size = obj->size;
>       map->handle = obj;
>  
> +     mutex_lock(&mm->offset_mutex);
>       /* Get a DRM GEM mmap offset allocated... */
>       list->file_offset_node = drm_mm_search_free(&mm->offset_manager,
>                                                   obj->size / PAGE_SIZE, 0, 
> 0);
> @@ -671,12 +680,14 @@ i915_gem_create_mmap_offset(struct drm_gem_object *obj)
>       /* By now we should be all set, any drm_mmap request on the offset
>        * below will get to our mmap & fault handler */
>       obj_priv->mmap_offset = ((uint64_t) list->hash.key) << PAGE_SHIFT;
> +     mutex_unlock(&mm->offset_mutex);
>  
>       return 0;
>  
>  out_free_mm:
>       drm_mm_put_block(list->file_offset_node);
>  out_free_list:
> +     mutex_unlock(&mm->offset_mutex);
>       drm_free(list->map, sizeof(struct drm_map_list), DRM_MEM_DRIVER);
>  
>       return ret;
> @@ -690,6 +701,7 @@ i915_gem_free_mmap_offset(struct drm_gem_object *obj)
>       struct drm_gem_mm *mm = dev->mm_private;
>       struct drm_map_list *list;
>  
> +     mutex_lock(&mm->offset_mutex);
>       list = &obj->map_list;
>       drm_ht_remove_item(&mm->offset_hash, &list->hash);
>  
> @@ -704,6 +716,7 @@ i915_gem_free_mmap_offset(struct drm_gem_object *obj)
>       }
>  
>       obj_priv->mmap_offset = 0;
> +     mutex_unlock(&mm->offset_mutex);
>  }
>  
>  /**
> diff --git a/include/drm/drmP.h b/include/drm/drmP.h
> index e5f4ae9..04f765b 100644
> --- a/include/drm/drmP.h
> +++ b/include/drm/drmP.h
> @@ -570,6 +570,7 @@ struct drm_ati_pcigart_info {
>  struct drm_gem_mm {
>       struct drm_mm offset_manager;   /**< Offset mgmt for buffer objects */
>       struct drm_open_hash offset_hash; /**< User token hash table for maps */
> +     struct mutex offset_mutex; /**< covers offset_manager and offset_hash */
>  };
>  
>  /**


------------------------------------------------------------------------------
Open Source Business Conference (OSBC), March 24-25, 2009, San Francisco, CA
-OSBC tackles the biggest issue in open source: Open Sourcing the Enterprise
-Strategies to boost innovation and cut costs with open source participation
-Receive a $600 discount off the registration fee with the source code: SFAD
http://p.sf.net/sfu/XcvMzF8H
--
_______________________________________________
Dri-devel mailing list
Dri-devel@lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/dri-devel

Reply via email to