Hi Christoffer,

On 17/10/2017 23:40, Christoffer Dall wrote:
> On Tue, Oct 17, 2017 at 09:09:59AM +0200, Eric Auger wrote:
>> AT the moment if ITT only contains invalid entries,
>> vgic_its_restore_itt returns 1 and this is considered as
>> an an error in vgic_its_restore_dte.
>>
>> Also in case the device table only contains invalid entries,
>> the table restore fails and this is not correct.
>>
>> This patch fully revisits the errror handling while fixing those
>> 2 bugs.
>>
>> - entry_fn_t now takes a valid output paraleter
> 
>                                         parameter
> 
>> - scan_its_table() now returns <= 0 values and output 2 booleans,
>                                                  outputs
>>   valid and last.
>> - vgic_its_restore_itt() now returns <= 0 values.
>> - vgic_its_restore_device_tables() also returns <= 0 values.
>>
>> With that patch we are able to properly handle the case where
>> all data are invalid but we still are able to detect the case
>> where a next entry was referenced by some valid entry and
>> never found.
>>
>> Fixes: 57a9a117154c93 (KVM: arm64: vgic-its: Device table save/restore)
>> Fixes: eff484e0298da5 (KVM: arm64: vgic-its: ITT save and restore)
>> Signed-off-by: Eric Auger <[email protected]>
>> Reported-by: wanghaibin <[email protected]>
>>
>> ---
>>
>> need to CC stable
>>
>> v3 -> v4:
>> - set *valid at beginning of handle_l1_dte
>>
>> v2 -> v3:
>> - add comments
>> - added valid parameter
>> - vgic_its_restore_itt don't return +1 anymore
>> - reword the commit message
>>
>> v1 -> v2:
>> - if (ret > 0) ret = 0
>> ---
>>  virt/kvm/arm/vgic/vgic-its.c | 95 
>> ++++++++++++++++++++++++++++++++------------
>>  1 file changed, 70 insertions(+), 25 deletions(-)
>>
>> diff --git a/virt/kvm/arm/vgic/vgic-its.c b/virt/kvm/arm/vgic/vgic-its.c
>> index f51c1e1..eea14a1 100644
>> --- a/virt/kvm/arm/vgic/vgic-its.c
>> +++ b/virt/kvm/arm/vgic/vgic-its.c
>> @@ -1772,16 +1772,20 @@ static u32 compute_next_eventid_offset(struct 
>> list_head *h, struct its_ite *ite)
>>  
>>  /**
>>   * entry_fn_t - Callback called on a table entry restore path
>> + *
>>   * @its: its handle
>>   * @id: id of the entry
>>   * @entry: pointer to the entry
>>   * @opaque: pointer to an opaque data
>> + * @valid: indicates whether valid data is associated to this entry
>> + * (the entry itself in case of linear table or entries in the next level,
>> + * in case of hierachical tables)
>>   *
>>   * Return: < 0 on error, 0 if last element was identified, id offset to next
>>   * element otherwise
>>   */
>>  typedef int (*entry_fn_t)(struct vgic_its *its, u32 id, void *entry,
>> -                      void *opaque);
>> +                      void *opaque, bool *valid);
>>  
>>  /**
>>   * scan_its_table - Scan a contiguous table in guest RAM and applies a 
>> function
>> @@ -1794,29 +1798,34 @@ typedef int (*entry_fn_t)(struct vgic_its *its, u32 
>> id, void *entry,
>>   * @start_id: the ID of the first entry in the table
>>   * (non zero for 2d level tables)
>>   * @fn: function to apply on each entry
>> + * @opaque: opaque data passed to @fn
>> + * @valid: indicates whether the table contains any valid data
>> + * @last: returns whether the last valid entry was decoded
>>   *
>> - * Return: < 0 on error, 0 if last element was identified, 1 otherwise
>> - * (the last element may not be found on second level tables)
>> + * Return: < 0 on error, 0 on success
>>   */
>>  static int scan_its_table(struct vgic_its *its, gpa_t base, int size, int 
>> esz,
>> -                      int start_id, entry_fn_t fn, void *opaque)
>> +                      int start_id, entry_fn_t fn, void *opaque,
>> +                      bool *valid, bool *last)
>>  {
>>      void *entry = kzalloc(esz, GFP_KERNEL);
>>      struct kvm *kvm = its->dev->kvm;
>>      unsigned long len = size;
>>      int id = start_id;
>>      gpa_t gpa = base;
>> +    int next_offset = 0;
>>      int ret;
>>  
>>      while (len > 0) {
>> -            int next_offset;
>>              size_t byte_offset;
>> +            bool entry_valid;
>>  
>>              ret = kvm_read_guest(kvm, gpa, entry, esz);
>>              if (ret)
>>                      goto out;
>>  
>> -            next_offset = fn(its, id, entry, opaque);
>> +            next_offset = fn(its, id, entry, opaque, &entry_valid);
>> +            *valid |= entry_valid;
>>              if (next_offset <= 0) {
>>                      ret = next_offset;
>>                      goto out;
>> @@ -1827,9 +1836,15 @@ static int scan_its_table(struct vgic_its *its, gpa_t 
>> base, int size, int esz,
>>              gpa += byte_offset;
>>              len -= byte_offset;
>>      }
>> -    ret =  1;
>> -
>> +    /*
>> +     * the table lookup was completed without identifying the
>> +     * last valid entry (ie. next_offset > 0).
>> +     */
> 
> but you never set last to false?  If you require the caller to set the
> variable to false, that should be documented, but it's weird.
> 
>> +    ret = 0;
>>  out:
>> +    if (!next_offset)
>> +            *last = true;
>> +
> 
> so if we scan the entire table to the end we won't set last?  Isn't that
> a bit strange?
> 
> Also, if we can get id of the valid out parameter and instead handle
> that within this function, I don't think you'll need the 'last' return
> value in vgic_its_restore_device_tables, and you could make this:
> 
>       if (!next_offset && last)
>               *last = true;
>       else if (last)
>               *last = false;
> 
>>      kfree(entry);
>>      return ret;
>>  }
>> @@ -1854,12 +1869,14 @@ static int vgic_its_save_ite(struct vgic_its *its, 
>> struct its_device *dev,
>>  
>>  /**
>>   * vgic_its_restore_ite - restore an interrupt translation entry
>> + *
>>   * @event_id: id used for indexing
>>   * @ptr: pointer to the ITE entry
>>   * @opaque: pointer to the its_device
>> + * @valid: indicates whether the ite is valid
>>   */
>>  static int vgic_its_restore_ite(struct vgic_its *its, u32 event_id,
>> -                            void *ptr, void *opaque)
>> +                            void *ptr, void *opaque, bool *valid)
>>  {
>>      struct its_device *dev = (struct its_device *)opaque;
>>      struct its_collection *collection;
>> @@ -1879,7 +1896,9 @@ static int vgic_its_restore_ite(struct vgic_its *its, 
>> u32 event_id,
>>      coll_id = val & KVM_ITS_ITE_ICID_MASK;
>>      lpi_id = (val & KVM_ITS_ITE_PINTID_MASK) >> KVM_ITS_ITE_PINTID_SHIFT;
>>  
>> -    if (!lpi_id)
>> +    *valid = !!lpi_id;
>> +
>> +    if (!*valid)
>>              return 1; /* invalid entry, no choice but to scan next entry */
>>  
>>      if (lpi_id < VGIC_MIN_LPI)
>> @@ -1940,6 +1959,14 @@ static int vgic_its_save_itt(struct vgic_its *its, 
>> struct its_device *device)
>>      return 0;
>>  }
>>  
>> +/**
>> + * vgic_its_restore_itt - restore the ITT of a device
>> + *
>> + * @its: its handle
>> + * @dev: device handle
>> + *
>> + * Return 0 on success, < 0 on error
>> + */
>>  static int vgic_its_restore_itt(struct vgic_its *its, struct its_device 
>> *dev)
>>  {
>>      const struct vgic_its_abi *abi = vgic_its_get_abi(its);
>> @@ -1947,9 +1974,15 @@ static int vgic_its_restore_itt(struct vgic_its *its, 
>> struct its_device *dev)
>>      int ret;
>>      int ite_esz = abi->ite_esz;
>>      size_t max_size = BIT_ULL(dev->num_eventid_bits) * ite_esz;
>> +    bool valid = false, last = false;
>>  
>>      ret = scan_its_table(its, base, max_size, ite_esz, 0,
>> -                         vgic_its_restore_ite, dev);
>> +                         vgic_its_restore_ite, dev, &valid, &last);
>> +
>> +    if (!ret && valid && !last) {
>> +            /* a next element was referenced but not found */
>> +            return -EINVAL;
> 
> So this is if we ever found a valid entry, but somehow it didn't lead us
> to the last entry, right?  Can't you handle that within the
> scan_its_table?
> 
> As I understand it, scan_its_table is in one of two modes, either it's
> linearly scanning, or it found a valid entry, and it's jumping from one
> entry to the next, given the offsets.  If it's in the second mode, and
> finds an invalid entry, it should return an error.
> 
> I think you can also get rid of the '*valid = false; return 1;' thing,
> which looks a bit strange.

Given the number of changes this rework will produce I guess this patch
wouldn't be candidate for cc'ed stable. Then shouldn't we consider to
first apply the fix proposed by Wanghaibin (cc'ed stable) and then apply
the rework in a second and subsequent patch?

Thanks

Eric
> 
>> +    }
>>  
>>      return ret;
>>  }
>> @@ -1985,29 +2018,29 @@ static int vgic_its_save_dte(struct vgic_its *its, 
>> struct its_device *dev,
>>   * @id: device id the DTE corresponds to
>>   * @ptr: kernel VA where the 8 byte DTE is located
>>   * @opaque: unused
>> + * @valid: indicates whether the dte is valid
>>   *
>>   * Return: < 0 on error, 0 if the dte is the last one, id offset to the
>>   * next dte otherwise
>>   */
>>  static int vgic_its_restore_dte(struct vgic_its *its, u32 id,
>> -                            void *ptr, void *opaque)
>> +                            void *ptr, void *opaque, bool *valid)
>>  {
>>      struct its_device *dev;
>>      gpa_t itt_addr;
>>      u8 num_eventid_bits;
>>      u64 entry = *(u64 *)ptr;
>> -    bool valid;
>>      u32 offset;
>>      int ret;
>>  
>>      entry = le64_to_cpu(entry);
>>  
>> -    valid = entry >> KVM_ITS_DTE_VALID_SHIFT;
>> +    *valid = entry >> KVM_ITS_DTE_VALID_SHIFT;
>>      num_eventid_bits = (entry & KVM_ITS_DTE_SIZE_MASK) + 1;
>>      itt_addr = ((entry & KVM_ITS_DTE_ITTADDR_MASK)
>>                      >> KVM_ITS_DTE_ITTADDR_SHIFT) << 8;
>>  
>> -    if (!valid)
>> +    if (!*valid)
>>              return 1;
>>  
>>      /* dte entry is valid */
>> @@ -2082,13 +2115,14 @@ static int vgic_its_save_device_tables(struct 
>> vgic_its *its)
>>   * @id: index of the entry in the L1 table
>>   * @addr: kernel VA
>>   * @opaque: unused
>> + * @valid: indicates whether any dte entry was found
>>   *
>>   * L1 table entries are scanned by steps of 1 entry
>>   * Return < 0 if error, 0 if last dte was found when scanning the L2
>>   * table, +1 otherwise (meaning next L1 entry must be scanned)
>>   */
>>  static int handle_l1_dte(struct vgic_its *its, u32 id, void *addr,
>> -                     void *opaque)
>> +                     void *opaque, bool *valid)
>>  {
>>      const struct vgic_its_abi *abi = vgic_its_get_abi(its);
>>      int l2_start_id = id * (SZ_64K / abi->dte_esz);
>> @@ -2096,21 +2130,29 @@ static int handle_l1_dte(struct vgic_its *its, u32 
>> id, void *addr,
>>      int dte_esz = abi->dte_esz;
>>      gpa_t gpa;
>>      int ret;
>> +    bool last;
>>  
>>      entry = le64_to_cpu(entry);
>>  
>> -    if (!(entry & KVM_ITS_L1E_VALID_MASK))
>> +    *valid = entry & KVM_ITS_L1E_VALID_MASK;
>> +
>> +    if (!*valid)
>>              return 1;
>>  
>>      gpa = entry & KVM_ITS_L1E_ADDR_MASK;
>>  
>>      ret = scan_its_table(its, gpa, SZ_64K, dte_esz,
>> -                         l2_start_id, vgic_its_restore_dte, NULL);
>> +                         l2_start_id, vgic_its_restore_dte, NULL,
>> +                         valid, &last);
>>  
>> -    if (ret <= 0)
>> -            return ret;
>> +    /*
>> +     * if the last dte has not been found in this L2 table, we
>> +     * need to scan the next L1 entry
>> +     */
>> +    if (!ret && !last)
>> +            return 1;
>>  
>> -    return 1;
>> +    return ret;
>>  }
>>  
>>  /**
>> @@ -2124,6 +2166,7 @@ static int vgic_its_restore_device_tables(struct 
>> vgic_its *its)
>>      int l1_esz, ret;
>>      int l1_tbl_size = GITS_BASER_NR_PAGES(baser) * SZ_64K;
>>      gpa_t l1_gpa;
>> +    bool valid = false, last = false;
>>  
>>      if (!(baser & GITS_BASER_VALID))
>>              return 0;
>> @@ -2133,15 +2176,17 @@ static int vgic_its_restore_device_tables(struct 
>> vgic_its *its)
>>      if (baser & GITS_BASER_INDIRECT) {
>>              l1_esz = GITS_LVL1_ENTRY_SIZE;
>>              ret = scan_its_table(its, l1_gpa, l1_tbl_size, l1_esz, 0,
>> -                                 handle_l1_dte, NULL);
>> +                                 handle_l1_dte, NULL, &valid, &last);
>>      } else {
>>              l1_esz = abi->dte_esz;
>>              ret = scan_its_table(its, l1_gpa, l1_tbl_size, l1_esz, 0,
>> -                                 vgic_its_restore_dte, NULL);
>> +                                 vgic_its_restore_dte, NULL, &valid, &last);
>>      }
>>  
>> -    if (ret > 0)
>> -            ret = -EINVAL;
>> +    if (!ret && valid && !last) {
>> +            /* a next element was referenced but not found */
>> +            return -EINVAL;
>> +    }
> 
> Same comment as above.
> 
>>  
>>      return ret;
>>  }
>> -- 
>> 2.5.5
>>
> Thanks,
> -Christoffer
> 

Reply via email to