On 11/06/2026 17:11, Karunika Choo wrote:
> On 11/06/2026 15:45, Steven Price wrote:
>> On 28/05/2026 16:05, Karunika Choo wrote:
>>> Move the MMU address-space register layout into the hardware description
>>> by storing the MMU_AS base offset and per-AS stride in the Panthor HW
>>> map.
>>>
>>> Use those values to compute the iomem pointer for each AS slot and make
>>> the MMU AS register definitions relative to the per-slot register window
>>> instead of hard-coding the slot offset in every register macro.
>>>
>>> This prepares the MMU code for GPUs where the MMU AS register region is
>>> not at a fixed offset while keeping the existing register accesses
>>> scoped to a single AS window.
>>>
>>> Signed-off-by: Karunika Choo <[email protected]>
>>> ---
>>>  drivers/gpu/drm/panthor/panthor_hw.c       |  8 +++++
>>>  drivers/gpu/drm/panthor/panthor_hw.h       |  8 +++++
>>>  drivers/gpu/drm/panthor/panthor_mmu.c      | 35 ++++++++++++++--------
>>>  drivers/gpu/drm/panthor/panthor_mmu_regs.h | 23 ++++++--------
>>>  4 files changed, 47 insertions(+), 27 deletions(-)
>>>
>>> diff --git a/drivers/gpu/drm/panthor/panthor_hw.c 
>>> b/drivers/gpu/drm/panthor/panthor_hw.c
>>> index 1f7fab4caf4d..e677f1a8f488 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_hw.c
>>> +++ b/drivers/gpu/drm/panthor/panthor_hw.c
>>> @@ -41,6 +41,10 @@ static struct panthor_hw panthor_hw_arch_v10 = {
>>>     .map = {
>>>             .gpu_control_base = 0x0,
>>>             .mcu_control_base = 0x700,
>>> +           .mmu_as = {
>>> +                   .base = 0x2400,
>>> +                   .stride = 0x40,
>>> +           },
>>>     },
>>>  };
>>>  
>>> @@ -54,6 +58,10 @@ static struct panthor_hw panthor_hw_arch_v14 = {
>>>             .gpu_control_base = 0x0,
>>>             .pwr_control_base = 0x800,
>>>             .mcu_control_base = 0x700,
>>> +           .mmu_as = {
>>> +                   .base = 0x2400,
>>> +                   .stride = 0x40,
>>> +           },
>>>     },
>>>  };
>>>  
>>> diff --git a/drivers/gpu/drm/panthor/panthor_hw.h 
>>> b/drivers/gpu/drm/panthor/panthor_hw.h
>>> index 58673a427bc9..0ae11b78c77e 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_hw.h
>>> +++ b/drivers/gpu/drm/panthor/panthor_hw.h
>>> @@ -38,6 +38,14 @@ struct panthor_hw_regmap {
>>>  
>>>     /** @mcu_control_base: MCU_CONTROL base address */
>>>     u32 mcu_control_base;
>>> +
>>> +   struct {
>>> +           /** @mmu_as.base: MMU_AS base address */
>>> +           u32 base;
>>> +
>>> +           /** @mmu_as.stride: Stride between subsequent MMU_AS register 
>>> blocks */
>>> +           u32 stride;
>>> +   } mmu_as;
>>>  };
>>>  
>>>  /**
>>> diff --git a/drivers/gpu/drm/panthor/panthor_mmu.c 
>>> b/drivers/gpu/drm/panthor/panthor_mmu.c
>>> index 48127313332f..9a64f977d28c 100644
>>> --- a/drivers/gpu/drm/panthor/panthor_mmu.c
>>> +++ b/drivers/gpu/drm/panthor/panthor_mmu.c
>>> @@ -36,6 +36,7 @@
>>>  #include "panthor_gpu.h"
>>>  #include "panthor_gpu_regs.h"
>>>  #include "panthor_heap.h"
>>> +#include "panthor_hw.h"
>>>  #include "panthor_mmu.h"
>>>  #include "panthor_mmu_regs.h"
>>>  #include "panthor_sched.h"
>>> @@ -57,7 +58,7 @@ struct panthor_as_slot {
>>>   */
>>>  struct panthor_mmu {
>>>     /** @iomem: CPU mapping of MMU_AS_CONTROL iomem region */
>>> -   void __iomem *iomem;
>>> +   void __iomem *iomem[MAX_AS_SLOTS];
>>
>> I'm not convinced that having a iomem pointer per AS is worth it. It 
>> seems excessive.
>>
>> Boris's suggestion of moving it to panthor_as_slot at least avoids the 
>> array indexing, but I did wonder about just having a helper function. AI 
>> cooked up the below diff (untested, applies on top) which demonstrates
>> the idea.
>>
>> I think the AI was a bit over the top with the as_present check in the
>> helper, although that would clearly indicate a serious bug if it
>> triggered.
>>
>> What do you think?
>>
>> Thanks,
>> Steve
> 
> TBF, with Boris's suggestion, I included a new as_iomem() helper
> anyways, this isn't that far off as an option. Perhaps maybe
> rename `iomem` to `as_iomem` to clarify that this isn't the
> MMU_CONTROL iomem. 
> 
> I don't really mind either way, this option has the ambiguity
> of where the iomem belongs to, while Boris' solution adds a
> little more baggage to the struct but ownership is clear.

Yeah I wasn't really happy with the AI's output - I just wanted to see
what it would look like and it was a quick way of doing that. There's
definitely some cases where the helper makes the code easier to read and
I disliked the array.

It sounds like you've already got something with Boris's suggestion and
a helper, so I think we're probably good to stick with that.

Thanks,
Steve

> Kind regards,
> Karunika
> 
>>
>> ----8<-----
>> diff --git a/drivers/gpu/drm/panthor/panthor_mmu.c 
>> b/drivers/gpu/drm/panthor/panthor_mmu.c
>> index 53c5744609fa..6127df893476 100644
>> --- a/drivers/gpu/drm/panthor/panthor_mmu.c
>> +++ b/drivers/gpu/drm/panthor/panthor_mmu.c
>> @@ -58,7 +58,7 @@ struct panthor_as_slot {
>>   */
>>  struct panthor_mmu {
>>      /** @iomem: CPU mapping of MMU_AS_CONTROL iomem region */
>> -    void __iomem *iomem[MAX_AS_SLOTS];
>> +    void __iomem *iomem;
>>  
>>      /** @irq: The MMU irq. */
>>      struct panthor_irq irq;
>> @@ -112,6 +112,20 @@ struct panthor_mmu {
>>      } vm;
>>  };
>>  
>> +static void __iomem *
>> +panthor_mmu_as_iomem(struct panthor_device *ptdev, u32 as_nr)
>> +{
>> +    struct panthor_mmu *mmu = ptdev->mmu;
>> +
>> +    if (drm_WARN_ON(&ptdev->base, as_nr >= MAX_AS_SLOTS))
>> +            return mmu->iomem;
>> +
>> +    if (drm_WARN_ON(&ptdev->base, !(ptdev->gpu_info.as_present & 
>> BIT(as_nr))))
>> +            return mmu->iomem;
>> +
>> +    return mmu->iomem + (ptdev->hw->map.mmu_as.stride * as_nr);
>> +}
>> +
>>  /**
>>   * struct panthor_vm_pool - VM pool object
>>   */
>> @@ -522,14 +536,14 @@ static void free_pt(void *cookie, void *data, size_t 
>> size)
>>  
>>  static int wait_ready(struct panthor_device *ptdev, u32 as_nr)
>>  {
>> -    struct panthor_mmu *mmu = ptdev->mmu;
>> +    void __iomem *as_iomem = panthor_mmu_as_iomem(ptdev, as_nr);
>>      int ret;
>>      u32 val;
>>  
>>      /* Wait for the MMU status to indicate there is no active command, in
>>       * case one is pending.
>>       */
>> -    ret = gpu_read_relaxed_poll_timeout_atomic(mmu->iomem[as_nr], 
>> AS_STATUS, val,
>> +    ret = gpu_read_relaxed_poll_timeout_atomic(as_iomem, AS_STATUS, val,
>>                                                 !(val & 
>> AS_STATUS_AS_ACTIVE), 10, 100000);
>>  
>>      if (ret) {
>> @@ -542,12 +556,13 @@ static int wait_ready(struct panthor_device *ptdev, 
>> u32 as_nr)
>>  
>>  static int as_send_cmd_and_wait(struct panthor_device *ptdev, u32 as_nr, 
>> u32 cmd)
>>  {
>> +    void __iomem *as_iomem = panthor_mmu_as_iomem(ptdev, as_nr);
>>      int status;
>>  
>>      /* write AS_COMMAND when MMU is ready to accept another command */
>>      status = wait_ready(ptdev, as_nr);
>>      if (!status) {
>> -            gpu_write(ptdev->mmu->iomem[as_nr], AS_COMMAND, cmd);
>> +            gpu_write(as_iomem, AS_COMMAND, cmd);
>>              status = wait_ready(ptdev, as_nr);
>>      }
>>  
>> @@ -595,14 +610,14 @@ PANTHOR_IRQ_HANDLER(mmu, panthor_mmu_irq_handler);
>>  static int panthor_mmu_as_enable(struct panthor_device *ptdev, u32 as_nr,
>>                               u64 transtab, u64 transcfg, u64 memattr)
>>  {
>> -    struct panthor_mmu *mmu = ptdev->mmu;
>> +    void __iomem *as_iomem = panthor_mmu_as_iomem(ptdev, as_nr);
>>  
>>      panthor_mmu_irq_enable_events(&ptdev->mmu->irq,
>>                                    panthor_mmu_as_fault_mask(ptdev, as_nr));
>>  
>> -    gpu_write64(mmu->iomem[as_nr], AS_TRANSTAB, transtab);
>> -    gpu_write64(mmu->iomem[as_nr], AS_MEMATTR, memattr);
>> -    gpu_write64(mmu->iomem[as_nr], AS_TRANSCFG, transcfg);
>> +    gpu_write64(as_iomem, AS_TRANSTAB, transtab);
>> +    gpu_write64(as_iomem, AS_MEMATTR, memattr);
>> +    gpu_write64(as_iomem, AS_TRANSCFG, transcfg);
>>  
>>      return as_send_cmd_and_wait(ptdev, as_nr, AS_COMMAND_UPDATE);
>>  }
>> @@ -610,8 +625,8 @@ static int panthor_mmu_as_enable(struct panthor_device 
>> *ptdev, u32 as_nr,
>>  static int panthor_mmu_as_disable(struct panthor_device *ptdev, u32 as_nr,
>>                                bool recycle_slot)
>>  {
>> -    struct panthor_mmu *mmu = ptdev->mmu;
>>      struct panthor_vm *vm = ptdev->mmu->as.slots[as_nr].vm;
>> +    void __iomem *as_iomem = panthor_mmu_as_iomem(ptdev, as_nr);
>>      int ret;
>>  
>>      lockdep_assert_held(&ptdev->mmu->as.slots_lock);
>> @@ -638,9 +653,9 @@ static int panthor_mmu_as_disable(struct panthor_device 
>> *ptdev, u32 as_nr,
>>      if (recycle_slot)
>>              return 0;
>>  
>> -    gpu_write64(mmu->iomem[as_nr], AS_TRANSTAB, 0);
>> -    gpu_write64(mmu->iomem[as_nr], AS_MEMATTR, 0);
>> -    gpu_write64(mmu->iomem[as_nr], AS_TRANSCFG, 
>> AS_TRANSCFG_ADRMODE_UNMAPPED);
>> +    gpu_write64(as_iomem, AS_TRANSTAB, 0);
>> +    gpu_write64(as_iomem, AS_MEMATTR, 0);
>> +    gpu_write64(as_iomem, AS_TRANSCFG, AS_TRANSCFG_ADRMODE_UNMAPPED);
>>  
>>      return as_send_cmd_and_wait(ptdev, as_nr, AS_COMMAND_UPDATE);
>>  }
>> @@ -1740,7 +1755,7 @@ static int panthor_vm_lock_region(struct panthor_vm 
>> *vm, u64 start, u64 size)
>>      mutex_lock(&ptdev->mmu->as.slots_lock);
>>      if (vm->as.id >= 0 && size) {
>>              /* Lock the region that needs to be updated */
>> -            gpu_write64(ptdev->mmu->iomem[vm->as.id], AS_LOCKADDR,
>> +            gpu_write64(panthor_mmu_as_iomem(ptdev, vm->as.id), AS_LOCKADDR,
>>                          pack_region_range(ptdev, &start, &size));
>>  
>>              /* If the lock succeeded, update the locked_region info. */
>> @@ -1789,21 +1804,21 @@ static void panthor_vm_unlock_region(struct 
>> panthor_vm *vm)
>>  
>>  static void panthor_mmu_irq_handler(struct panthor_device *ptdev, u32 
>> status)
>>  {
>> -    struct panthor_mmu *mmu = ptdev->mmu;
>>      bool has_unhandled_faults = false;
>>  
>>      status = panthor_mmu_fault_mask(ptdev, status);
>>      while (status) {
>>              u32 as = ffs(status | (status >> 16)) - 1;
>>              u32 mask = panthor_mmu_as_fault_mask(ptdev, as);
>> +            void __iomem *as_iomem = panthor_mmu_as_iomem(ptdev, as);
>>              u64 addr;
>>              u32 fault_status;
>>              u32 exception_type;
>>              u32 access_type;
>>              u32 source_id;
>>  
>> -            fault_status = gpu_read(mmu->iomem[as], AS_FAULTSTATUS);
>> -            addr = gpu_read64(mmu->iomem[as], AS_FAULTADDRESS);
>> +            fault_status = gpu_read(as_iomem, AS_FAULTSTATUS);
>> +            addr = gpu_read64(as_iomem, AS_FAULTADDRESS);
>>  
>>              /* decode the fault status */
>>              exception_type = fault_status & 0xFF;
>> @@ -1834,7 +1849,7 @@ static void panthor_mmu_irq_handler(struct 
>> panthor_device *ptdev, u32 status)
>>               * Note that COMPLETED irqs are never cleared, but this is fine
>>               * because they are always masked.
>>               */
>> -            gpu_write(mmu->irq.iomem, INT_CLEAR, mask);
>> +            gpu_write(ptdev->mmu->irq.iomem, INT_CLEAR, mask);
>>  
>>              if (ptdev->mmu->as.slots[as].vm)
>>                      ptdev->mmu->as.slots[as].vm->unhandled_fault = true;
>> @@ -3239,11 +3254,8 @@ static void panthor_mmu_release_wq(struct drm_device 
>> *ddev, void *res)
>>  int panthor_mmu_init(struct panthor_device *ptdev)
>>  {
>>      u32 va_bits = GPU_MMU_FEATURES_VA_BITS(ptdev->gpu_info.mmu_features);
>> -    unsigned long as_present_mask = ptdev->gpu_info.as_present;
>> -    struct panthor_hw_regmap *regmap = &ptdev->hw->map;
>>      struct panthor_mmu *mmu;
>>      int ret, irq;
>> -    u32 as_id;
>>  
>>      mmu = drmm_kzalloc(&ptdev->base, sizeof(*mmu), GFP_KERNEL);
>>      if (!mmu)
>> @@ -3260,12 +3272,7 @@ int panthor_mmu_init(struct panthor_device *ptdev)
>>      if (ret)
>>              return ret;
>>  
>> -    for_each_set_bit(as_id, &as_present_mask, MAX_AS_SLOTS) {
>> -            u64 offset = regmap->mmu_as.base + (regmap->mmu_as.stride * 
>> as_id);
>> -
>> -            mmu->iomem[as_id] = ptdev->iomem + offset;
>> -    }
>> -
>> +    mmu->iomem = ptdev->iomem + ptdev->hw->map.mmu_as.base;
>>      ptdev->mmu = mmu;
>>  
>>      irq = platform_get_irq_byname(to_platform_device(ptdev->base.dev), 
>> "mmu");
>>
> 

Reply via email to