On 16/01/2026 12:57, Nicolas Frattaroli wrote:
> The current IRQ helpers do not guarantee mutual exclusion covering the
> entire transaction, from accessing the mask member to modifying the
> mask register.
> 
> This makes it hard, if not impossible, to implement mask modification
> helpers that may change one of these outside the normal
> suspend/resume/isr code paths.
> 
> Add a spinlock to struct panthor_irq that protects both the mask member
> and the register. Acquire it in all code paths that access these, but
> drop it while the threaded handler's processing function runs. Then,
> add the aforementioned new helpers: enable_events and disable_events.
> They work by ORing bits into the mask and clearing them with an
> AND-NOT, respectively.
> 
> resume is changed to no longer take a mask argument, as pirq->mask is
> now supposed to be the user-requested mask rather than a mirror of the
> INT_MASK register contents. Users of the resume helper are adjusted
> accordingly, including a rather painful refactor in panthor_mmu.c.
> 
> In panthor_mmu.c, the bespoke mask modification is excised and replaced
> with enable_events/disable_events in as_enable/as_disable.
> 
> Co-developed-by: Boris Brezillon <[email protected]>
> Signed-off-by: Boris Brezillon <[email protected]>
> Signed-off-by: Nicolas Frattaroli <[email protected]>
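
For readers untangling the macro soup below: stripped of the token-pasting
plumbing, the two new helpers boil down to a locked read-modify-write of the
software mask, with a conditional write-through to the hardware register.
A de-macroized sketch, not the literal macro output (names shortened for
illustration, and REG_INT_MASK standing in for the generated
__reg_prefix ## _INT_MASK access):

	static inline void irq_enable_events(struct panthor_irq *pirq, u32 events)
	{
		guard(spinlock_irqsave)(&pirq->mask_lock);

		/* OR the requested bits into the software mask. */
		pirq->mask |= events;
		if (atomic_read(&pirq->state) == PANTHOR_IRQ_STATE_ACTIVE)
			gpu_write(pirq->ptdev, REG_INT_MASK, pirq->mask);
	}

	static inline void irq_disable_events(struct panthor_irq *pirq, u32 events)
	{
		guard(spinlock_irqsave)(&pirq->mask_lock);

		/* AND-NOT the bits out of the software mask. */
		pirq->mask &= ~events;
		if (atomic_read(&pirq->state) == PANTHOR_IRQ_STATE_ACTIVE)
			gpu_write(pirq->ptdev, REG_INT_MASK, pirq->mask);
	}

The hardware register is only touched in the ACTIVE state; every other state
re-applies pirq->mask on the transition that leaves it, as the comments in
the patch spell out.
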
Reviewed-by: Steven Price <[email protected]>

> ---
>  drivers/gpu/drm/panthor/panthor_device.h | 86 ++++++++++++++++++++++++++------
>  drivers/gpu/drm/panthor/panthor_fw.c     |  3 +-
>  drivers/gpu/drm/panthor/panthor_gpu.c    |  2 +-
>  drivers/gpu/drm/panthor/panthor_mmu.c    | 47 ++++++++---------
>  drivers/gpu/drm/panthor/panthor_pwr.c    |  2 +-
>  5 files changed, 98 insertions(+), 42 deletions(-)
> 
> diff --git a/drivers/gpu/drm/panthor/panthor_device.h b/drivers/gpu/drm/panthor/panthor_device.h
> index 8597b388cc40..8664adb1febf 100644
> --- a/drivers/gpu/drm/panthor/panthor_device.h
> +++ b/drivers/gpu/drm/panthor/panthor_device.h
> @@ -84,9 +84,19 @@ struct panthor_irq {
>  	/** @irq: IRQ number. */
>  	int irq;
>  
> -	/** @mask: Current mask being applied to xxx_INT_MASK. */
> +	/** @mask: Values to write to xxx_INT_MASK if active. */
>  	u32 mask;
>  
> +	/**
> +	 * @mask_lock: protects modifications to _INT_MASK and @mask.
> +	 *
> +	 * In paths where _INT_MASK is updated based on a state
> +	 * transition/check, it's crucial for the state update/check to be
> +	 * inside the locked section, otherwise it introduces a race window
> +	 * leading to potential _INT_MASK inconsistencies.
> +	 */
> +	spinlock_t mask_lock;
> +
>  	/** @state: one of &enum panthor_irq_state reflecting the current state. */
>  	atomic_t state;
>  };
> @@ -425,13 +435,14 @@ static irqreturn_t panthor_ ## __name ## _irq_raw_handler(int irq, void *data)
>  	if (!gpu_read(ptdev, __reg_prefix ## _INT_STAT))		\
>  		return IRQ_NONE;					\
>  									\
> +	guard(spinlock_irqsave)(&pirq->mask_lock);			\
> +	gpu_write(ptdev, __reg_prefix ## _INT_MASK, 0);			\
>  	old_state = atomic_cmpxchg(&pirq->state,			\
>  				   PANTHOR_IRQ_STATE_ACTIVE,		\
>  				   PANTHOR_IRQ_STATE_PROCESSING);	\
>  	if (old_state != PANTHOR_IRQ_STATE_ACTIVE)			\
>  		return IRQ_NONE;					\
>  									\
> -	gpu_write(ptdev, __reg_prefix ## _INT_MASK, 0);			\
>  	return IRQ_WAKE_THREAD;						\
>  }									\
>  									\
> @@ -439,10 +450,17 @@ static irqreturn_t panthor_ ## __name ## _irq_threaded_handler(int irq, void *da
>  {									\
>  	struct panthor_irq *pirq = data;				\
>  	struct panthor_device *ptdev = pirq->ptdev;			\
> -	enum panthor_irq_state old_state;				\
>  	irqreturn_t ret = IRQ_NONE;					\
>  									\
>  	while (true) {							\
> +		/* It's safe to access pirq->mask without the lock held here. If a new \
> +		 * event gets added to the mask and the corresponding IRQ is pending, \
> +		 * we'll process it right away instead of adding an extra raw -> threaded \
> +		 * round trip. If an event is removed and the status bit is set, it will \
> +		 * be ignored, just like it would have been if the mask had been adjusted \
> +		 * right before the HW event kicks in. TLDR; it's all expected races we're \
> +		 * covered for.						\
> +		 */							\
>  		u32 status = gpu_read(ptdev, __reg_prefix ## _INT_RAWSTAT) & pirq->mask; \
>  									\
>  		if (!status)						\
> @@ -452,30 +470,36 @@ static irqreturn_t panthor_ ## __name ## _irq_threaded_handler(int irq, void *da
>  		ret = IRQ_HANDLED;					\
>  	}								\
>  									\
> -	old_state = atomic_cmpxchg(&pirq->state,			\
> -				   PANTHOR_IRQ_STATE_PROCESSING,	\
> -				   PANTHOR_IRQ_STATE_ACTIVE);		\
> -	if (old_state == PANTHOR_IRQ_STATE_PROCESSING)			\
> -		gpu_write(ptdev, __reg_prefix ## _INT_MASK, pirq->mask); \
> +	scoped_guard(spinlock_irqsave, &pirq->mask_lock) {		\
> +		enum panthor_irq_state old_state;			\
> +									\
> +		old_state = atomic_cmpxchg(&pirq->state,		\
> +					   PANTHOR_IRQ_STATE_PROCESSING, \
> +					   PANTHOR_IRQ_STATE_ACTIVE);	\
> +		if (old_state == PANTHOR_IRQ_STATE_PROCESSING)		\
> +			gpu_write(ptdev, __reg_prefix ## _INT_MASK, pirq->mask); \
> +	}								\
>  									\
>  	return ret;							\
>  }									\
>  									\
>  static inline void panthor_ ## __name ## _irq_suspend(struct panthor_irq *pirq) \
>  {									\
> -	pirq->mask = 0;							\
> -	gpu_write(pirq->ptdev, __reg_prefix ## _INT_MASK, 0);		\
> -	atomic_set(&pirq->state, PANTHOR_IRQ_STATE_SUSPENDING);		\
> +	scoped_guard(spinlock_irqsave, &pirq->mask_lock) {		\
> +		atomic_set(&pirq->state, PANTHOR_IRQ_STATE_SUSPENDING);	\
> +		gpu_write(pirq->ptdev, __reg_prefix ## _INT_MASK, 0);	\
> +	}								\
>  	synchronize_irq(pirq->irq);					\
>  	atomic_set(&pirq->state, PANTHOR_IRQ_STATE_SUSPENDED);		\
>  }									\
>  									\
> -static inline void panthor_ ## __name ## _irq_resume(struct panthor_irq *pirq, u32 mask) \
> +static inline void panthor_ ## __name ## _irq_resume(struct panthor_irq *pirq) \
>  {									\
> -	pirq->mask = mask;						\
> +	guard(spinlock_irqsave)(&pirq->mask_lock);			\
> +									\
>  	atomic_set(&pirq->state, PANTHOR_IRQ_STATE_ACTIVE);		\
> -	gpu_write(pirq->ptdev, __reg_prefix ## _INT_CLEAR, mask);	\
> -	gpu_write(pirq->ptdev, __reg_prefix ## _INT_MASK, mask);	\
> +	gpu_write(pirq->ptdev, __reg_prefix ## _INT_CLEAR, pirq->mask);	\
> +	gpu_write(pirq->ptdev, __reg_prefix ## _INT_MASK, pirq->mask);	\
>  }									\
>  									\
>  static int panthor_request_ ## __name ## _irq(struct panthor_device *ptdev, \
> @@ -484,13 +508,43 @@ static int panthor_request_ ## __name ## _irq(struct panthor_device *ptdev, \
>  {									\
>  	pirq->ptdev = ptdev;						\
>  	pirq->irq = irq;						\
> -	panthor_ ## __name ## _irq_resume(pirq, mask);			\
> +	pirq->mask = mask;						\
> +	spin_lock_init(&pirq->mask_lock);				\
> +	panthor_ ## __name ## _irq_resume(pirq);			\
>  									\
>  	return devm_request_threaded_irq(ptdev->base.dev, irq,		\
>  					 panthor_ ## __name ## _irq_raw_handler, \
>  					 panthor_ ## __name ## _irq_threaded_handler, \
>  					 IRQF_SHARED, KBUILD_MODNAME "-" # __name, \
>  					 pirq);				\
> +}									\
> +									\
> +static inline void panthor_ ## __name ## _irq_enable_events(struct panthor_irq *pirq, u32 mask) \
> +{									\
> +	guard(spinlock_irqsave)(&pirq->mask_lock);			\
> +	pirq->mask |= mask;						\
> +									\
> +	/* The only situation where we need to write the new mask is if the IRQ is active. \
> +	 * If it's being processed, the mask will be restored for us in _irq_threaded_handler() \
> +	 * on the PROCESSING -> ACTIVE transition.			\
> +	 * If the IRQ is suspended/suspending, the mask is restored at resume time. \
> +	 */								\
> +	if (atomic_read(&pirq->state) == PANTHOR_IRQ_STATE_ACTIVE)	\
> +		gpu_write(pirq->ptdev, __reg_prefix ## _INT_MASK, pirq->mask); \
> +}									\
> +									\
> +static inline void panthor_ ## __name ## _irq_disable_events(struct panthor_irq *pirq, u32 mask)\
> +{									\
> +	guard(spinlock_irqsave)(&pirq->mask_lock);			\
> +	pirq->mask &= ~mask;						\
> +									\
> +	/* The only situation where we need to write the new mask is if the IRQ is active. \
> +	 * If it's being processed, the mask will be restored for us in _irq_threaded_handler() \
> +	 * on the PROCESSING -> ACTIVE transition.			\
> +	 * If the IRQ is suspended/suspending, the mask is restored at resume time. \
> +	 */								\
> +	if (atomic_read(&pirq->state) == PANTHOR_IRQ_STATE_ACTIVE)	\
> +		gpu_write(pirq->ptdev, __reg_prefix ## _INT_MASK, pirq->mask); \
> +}
>  
>  extern struct workqueue_struct *panthor_cleanup_wq;
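
A note for future readers, since the state handling is easy to lose in the
macro: the lock now covers a small handshake between the two handler halves.
My reading of it, roughly (a sketch, not authoritative):

	               raw handler: INT_MASK := 0
	   ACTIVE -------------------------------------> PROCESSING
	      ^                                               |
	      |    threaded handler: INT_MASK := pirq->mask   |
	      +-----------------------------------------------+

	   suspend: state := SUSPENDING, INT_MASK := 0, then SUSPENDED
	   resume:  state := ACTIVE, INT_CLEAR := pirq->mask,
	            INT_MASK := pirq->mask

enable_events/disable_events write the register only in ACTIVE; in every
other state, the transition back to ACTIVE (or resume) re-applies whatever
pirq->mask has accumulated in the meantime.
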
> diff --git a/drivers/gpu/drm/panthor/panthor_fw.c b/drivers/gpu/drm/panthor/panthor_fw.c
> index a64ec8756bed..0e46625f7621 100644
> --- a/drivers/gpu/drm/panthor/panthor_fw.c
> +++ b/drivers/gpu/drm/panthor/panthor_fw.c
> @@ -1080,7 +1080,8 @@ static int panthor_fw_start(struct panthor_device *ptdev)
>  	bool timedout = false;
>  
>  	ptdev->fw->booted = false;
> -	panthor_job_irq_resume(&ptdev->fw->irq, ~0);
> +	panthor_job_irq_enable_events(&ptdev->fw->irq, ~0);
> +	panthor_job_irq_resume(&ptdev->fw->irq);
>  	gpu_write(ptdev, MCU_CONTROL, MCU_CONTROL_AUTO);
>  
>  	if (!wait_event_timeout(ptdev->fw->req_waitqueue,
> diff --git a/drivers/gpu/drm/panthor/panthor_gpu.c b/drivers/gpu/drm/panthor/panthor_gpu.c
> index 057e167468d0..9304469a711a 100644
> --- a/drivers/gpu/drm/panthor/panthor_gpu.c
> +++ b/drivers/gpu/drm/panthor/panthor_gpu.c
> @@ -395,7 +395,7 @@ void panthor_gpu_suspend(struct panthor_device *ptdev)
>   */
>  void panthor_gpu_resume(struct panthor_device *ptdev)
>  {
> -	panthor_gpu_irq_resume(&ptdev->gpu->irq, GPU_INTERRUPTS_MASK);
> +	panthor_gpu_irq_resume(&ptdev->gpu->irq);
>  	panthor_hw_l2_power_on(ptdev);
>  }
>  
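
Worth spelling out the calling-convention change visible in the two hunks
above: since resume no longer takes a mask, a caller that wants a specific
set of events live after resume requests them explicitly, and resume then
applies the accumulated pirq->mask to the hardware. The panthor_fw_start()
hunk is the pattern to copy (a sketch of those same two calls):

	/* Request all events; only pirq->mask is updated while suspended. */
	panthor_job_irq_enable_events(&ptdev->fw->irq, ~0);
	/* ACTIVE again: clears pending bits, then writes pirq->mask to INT_MASK. */
	panthor_job_irq_resume(&ptdev->fw->irq);
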
> diff --git a/drivers/gpu/drm/panthor/panthor_mmu.c b/drivers/gpu/drm/panthor/panthor_mmu.c
> index 198d59f42578..a1b7917a31b1 100644
> --- a/drivers/gpu/drm/panthor/panthor_mmu.c
> +++ b/drivers/gpu/drm/panthor/panthor_mmu.c
> @@ -562,9 +562,21 @@ static u64 pack_region_range(struct panthor_device *ptdev, u64 *region_start, u6
>  	return region_width | *region_start;
>  }
>  
> +static u32 panthor_mmu_as_fault_mask(struct panthor_device *ptdev, u32 as)
> +{
> +	return BIT(as);
> +}
> +
> +/* Forward declaration to call helpers within as_enable/disable */
> +static void panthor_mmu_irq_handler(struct panthor_device *ptdev, u32 status);
> +PANTHOR_IRQ_HANDLER(mmu, MMU, panthor_mmu_irq_handler);
> +
>  static int panthor_mmu_as_enable(struct panthor_device *ptdev, u32 as_nr,
>  				 u64 transtab, u64 transcfg, u64 memattr)
>  {
> +	panthor_mmu_irq_enable_events(&ptdev->mmu->irq,
> +				      panthor_mmu_as_fault_mask(ptdev, as_nr));
> +
>  	gpu_write64(ptdev, AS_TRANSTAB(as_nr), transtab);
>  	gpu_write64(ptdev, AS_MEMATTR(as_nr), memattr);
>  	gpu_write64(ptdev, AS_TRANSCFG(as_nr), transcfg);
> @@ -580,6 +592,9 @@ static int panthor_mmu_as_disable(struct panthor_device *ptdev, u32 as_nr,
>  
>  	lockdep_assert_held(&ptdev->mmu->as.slots_lock);
>  
> +	panthor_mmu_irq_disable_events(&ptdev->mmu->irq,
> +				       panthor_mmu_as_fault_mask(ptdev, as_nr));
> +
>  	/* Flush+invalidate RW caches, invalidate RO ones. */
>  	ret = panthor_gpu_flush_caches(ptdev, CACHE_CLEAN | CACHE_INV,
>  				       CACHE_CLEAN | CACHE_INV, CACHE_INV);
> @@ -612,11 +627,6 @@ static u32 panthor_mmu_fault_mask(struct panthor_device *ptdev, u32 value)
>  	return value & GENMASK(15, 0);
>  }
>  
> -static u32 panthor_mmu_as_fault_mask(struct panthor_device *ptdev, u32 as)
> -{
> -	return BIT(as);
> -}
> -
>  /**
>   * panthor_vm_has_unhandled_faults() - Check if a VM has unhandled faults
>   * @vm: VM to check.
> @@ -670,6 +680,7 @@ int panthor_vm_active(struct panthor_vm *vm)
>  	struct io_pgtable_cfg *cfg = &io_pgtable_ops_to_pgtable(vm->pgtbl_ops)->cfg;
>  	int ret = 0, as, cookie;
>  	u64 transtab, transcfg;
> +	u32 fault_mask;
>  
>  	if (!drm_dev_enter(&ptdev->base, &cookie))
>  		return -ENODEV;
> @@ -743,14 +754,13 @@ int panthor_vm_active(struct panthor_vm *vm)
>  	/* If the VM is re-activated, we clear the fault. */
>  	vm->unhandled_fault = false;
>  
> -	/* Unhandled pagefault on this AS, clear the fault and re-enable interrupts
> -	 * before enabling the AS.
> +	/* Unhandled pagefault on this AS, clear the fault and enable the AS,
> +	 * which re-enables interrupts.
>  	 */
> -	if (ptdev->mmu->as.faulty_mask & panthor_mmu_as_fault_mask(ptdev, as)) {
> -		gpu_write(ptdev, MMU_INT_CLEAR, panthor_mmu_as_fault_mask(ptdev, as));
> -		ptdev->mmu->as.faulty_mask &= ~panthor_mmu_as_fault_mask(ptdev, as);
> -		ptdev->mmu->irq.mask |= panthor_mmu_as_fault_mask(ptdev, as);
> -		gpu_write(ptdev, MMU_INT_MASK, ~ptdev->mmu->as.faulty_mask);
> +	fault_mask = panthor_mmu_as_fault_mask(ptdev, as);
> +	if (ptdev->mmu->as.faulty_mask & fault_mask) {
> +		gpu_write(ptdev, MMU_INT_CLEAR, fault_mask);
> +		ptdev->mmu->as.faulty_mask &= ~fault_mask;
>  	}
>  
>  	/* The VM update is guarded by ::op_lock, which we take at the beginning
> @@ -1698,7 +1708,6 @@ static void panthor_mmu_irq_handler(struct panthor_device *ptdev, u32 status)
>  	while (status) {
>  		u32 as = ffs(status | (status >> 16)) - 1;
>  		u32 mask = panthor_mmu_as_fault_mask(ptdev, as);
> -		u32 new_int_mask;
>  		u64 addr;
>  		u32 fault_status;
>  		u32 exception_type;
> @@ -1716,8 +1725,6 @@ static void panthor_mmu_irq_handler(struct panthor_device *ptdev, u32 status)
>  		mutex_lock(&ptdev->mmu->as.slots_lock);
>  
>  		ptdev->mmu->as.faulty_mask |= mask;
> -		new_int_mask =
> -			panthor_mmu_fault_mask(ptdev, ~ptdev->mmu->as.faulty_mask);
>  
>  		/* terminal fault, print info about the fault */
>  		drm_err(&ptdev->base,
> @@ -1741,11 +1748,6 @@ static void panthor_mmu_irq_handler(struct panthor_device *ptdev, u32 status)
>  		 */
>  		gpu_write(ptdev, MMU_INT_CLEAR, mask);
>  
> -		/* Ignore MMU interrupts on this AS until it's been
> -		 * re-enabled.
> -		 */
> -		ptdev->mmu->irq.mask = new_int_mask;
> -
>  		if (ptdev->mmu->as.slots[as].vm)
>  			ptdev->mmu->as.slots[as].vm->unhandled_fault = true;
>  
> @@ -1760,7 +1762,6 @@ static void panthor_mmu_irq_handler(struct panthor_device *ptdev, u32 status)
>  	if (has_unhandled_faults)
>  		panthor_sched_report_mmu_fault(ptdev);
>  }
> -PANTHOR_IRQ_HANDLER(mmu, MMU, panthor_mmu_irq_handler);
>  
>  /**
>   * panthor_mmu_suspend() - Suspend the MMU logic
> @@ -1805,7 +1806,7 @@ void panthor_mmu_resume(struct panthor_device *ptdev)
>  	ptdev->mmu->as.faulty_mask = 0;
>  	mutex_unlock(&ptdev->mmu->as.slots_lock);
>  
> -	panthor_mmu_irq_resume(&ptdev->mmu->irq, panthor_mmu_fault_mask(ptdev, ~0));
> +	panthor_mmu_irq_resume(&ptdev->mmu->irq);
>  }
>  
>  /**
> @@ -1859,7 +1860,7 @@ void panthor_mmu_post_reset(struct panthor_device *ptdev)
>  
>  	mutex_unlock(&ptdev->mmu->as.slots_lock);
>  
> -	panthor_mmu_irq_resume(&ptdev->mmu->irq, panthor_mmu_fault_mask(ptdev, ~0));
> +	panthor_mmu_irq_resume(&ptdev->mmu->irq);
>  
>  	/* Restart the VM_BIND queues. */
>  	mutex_lock(&ptdev->mmu->vm.lock);
> diff --git a/drivers/gpu/drm/panthor/panthor_pwr.c b/drivers/gpu/drm/panthor/panthor_pwr.c
> index 57cfc7ce715b..ed3b2b4479ca 100644
> --- a/drivers/gpu/drm/panthor/panthor_pwr.c
> +++ b/drivers/gpu/drm/panthor/panthor_pwr.c
> @@ -545,5 +545,5 @@ void panthor_pwr_resume(struct panthor_device *ptdev)
>  	if (!ptdev->pwr)
>  		return;
>  
> -	panthor_pwr_irq_resume(&ptdev->pwr->irq, PWR_INTERRUPTS_MASK);
> +	panthor_pwr_irq_resume(&ptdev->pwr->irq);
>  }
> 
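
One more remark for the archives, on why the state check has to sit inside
the locked section (the kdoc on @mask_lock hints at it): without the lock,
a mask update could interleave with the raw handler like this (hypothetical
trace, not from the patch):

	CPU0: enable_events()                CPU1: raw handler
	------------------------------       ------------------------------
	atomic_read(state) == ACTIVE
	                                     INT_MASK := 0
	                                     state: ACTIVE -> PROCESSING
	INT_MASK := pirq->mask

CPU0 would re-open the interrupt right after the raw handler masked it, so
the line could fire again while the threaded handler still owns the mask.
With both the register write and the state check under mask_lock, the two
sequences serialize and INT_MASK stays consistent with the state machine.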
