On Thu, Jan 13, 2022 at 01:06:09PM +0800, Peter Xu wrote:
> On Wed, Jan 05, 2022 at 12:19:45PM +0800, Jason Wang wrote:
> > @@ -1725,11 +1780,16 @@ static bool vtd_do_iommu_translate(VTDAddressSpace 
> > *vtd_as, PCIBus *bus,
> >          cc_entry->context_cache_gen = s->context_cache_gen;
> >      }
> >  
> > +    /* Try to fetch slpte form IOTLB */
> > +    if ((pasid == PCI_NO_PASID) && s->root_scalable) {
> > +        pasid = VTD_CE_GET_RID2PASID(&ce);
> > +    }
> > +
> >      /*
> >       * We don't need to translate for pass-through context entries.
> >       * Also, let's ignore IOTLB caching as well for PT devices.
> >       */
> > -    if (vtd_dev_pt_enabled(s, &ce)) {
> > +    if (vtd_dev_pt_enabled(s, &ce, pasid)) {
> >          entry->iova = addr & VTD_PAGE_MASK_4K;
> >          entry->translated_addr = entry->iova;
> >          entry->addr_mask = ~VTD_PAGE_MASK_4K;
> > @@ -1750,14 +1810,24 @@ static bool vtd_do_iommu_translate(VTDAddressSpace 
> > *vtd_as, PCIBus *bus,
> >          return true;
> >      }
> >  
> > +    iotlb_entry = vtd_lookup_iotlb(s, source_id, addr, pasid);
> > +    if (iotlb_entry) {
> > +        trace_vtd_iotlb_page_hit(source_id, addr, iotlb_entry->slpte,
> > +                                 iotlb_entry->domain_id);
> > +        slpte = iotlb_entry->slpte;
> > +        access_flags = iotlb_entry->access_flags;
> > +        page_mask = iotlb_entry->mask;
> > +        goto out;
> > +    }
> 
> IIUC the iotlb lookup moved down just because the pasid==NO_PASID case then
> we'll need to fetch the default pasid from the context entry.  That looks
> reasonable.
> 
> It's just a bit of pity because logically it'll slow down iotlb hits due to
> context entry operations.  When NO_PASID we could have looked up iotlb without
> checking pasid at all, assuming that "default pasid" will always match.  But
> that is a little bit hacky.

Maybe that's not a bad idea for an optimization.


> vIOMMU seems to be mostly used for assigned devices and dpdk in production in
> the future due to its slowness otherwise.. so maybe not a big deal at all.
> 
> [...]
> 
> > @@ -2011,7 +2083,52 @@ static void 
> > vtd_iotlb_page_invalidate(IntelIOMMUState *s, uint16_t domain_id,
> >      vtd_iommu_lock(s);
> >      g_hash_table_foreach_remove(s->iotlb, vtd_hash_remove_by_page, &info);
> >      vtd_iommu_unlock(s);
> > -    vtd_iotlb_page_invalidate_notify(s, domain_id, addr, am);
> > +    vtd_iotlb_page_invalidate_notify(s, domain_id, addr, am, PCI_NO_PASID);
> > +}
> > +
> > +static void vtd_iotlb_page_pasid_invalidate(IntelIOMMUState *s,
> > +                                            uint16_t domain_id,
> > +                                            hwaddr addr, uint8_t am,
> > +                                            uint32_t pasid)
> > +{
> > +    VTDIOTLBPageInvInfo info;
> > +
> > +    trace_vtd_inv_desc_iotlb_pasid_pages(domain_id, addr, am, pasid);
> > +
> > +    assert(am <= VTD_MAMV);
> > +    info.domain_id = domain_id;
> > +    info.addr = addr;
> > +    info.mask = ~((1 << am) - 1);
> > +    info.pasid = pasid;
> > +    vtd_iommu_lock(s);
> > +    g_hash_table_foreach_remove(s->iotlb, vtd_hash_remove_by_page_pasid, 
> > &info);
> > +    vtd_iommu_unlock(s);
> > +    vtd_iotlb_page_invalidate_notify(s, domain_id, addr, am, pasid);
> 
> Hmm, I think indeed we need a notification, but it'll be unnecessary for
> e.g. vfio map notifiers, because this is 1st level invalidation and at least 
> so
> far vfio map notifiers are rewalking only the 2nd level page table, so it'll 
> be
> destined to be a no-op and pure overhead.
> 
> > +}
> > +
> > +static void vtd_iotlb_pasid_invalidate(IntelIOMMUState *s, uint16_t 
> > domain_id,
> > +                                       uint32_t pasid)
> > +{
> > +    VTDIOTLBPageInvInfo info;
> > +    VTDAddressSpace *vtd_as;
> > +    VTDContextEntry ce;
> > +
> > +    trace_vtd_inv_desc_iotlb_pasid(domain_id, pasid);
> > +
> > +    info.domain_id = domain_id;
> > +    info.pasid = pasid;
> > +    vtd_iommu_lock(s);
> > +    g_hash_table_foreach_remove(s->iotlb, vtd_hash_remove_by_pasid, &info);
> > +    vtd_iommu_unlock(s);
> > +
> > +    QLIST_FOREACH(vtd_as, &s->vtd_as_with_notifiers, next) {
> > +        if (!vtd_dev_to_context_entry(s, pci_bus_num(vtd_as->bus),
> > +                                      vtd_as->devfn, &ce) &&
> > +            domain_id == vtd_get_domain_id(s, &ce, vtd_as->pasid) &&
> > +            pasid == vtd_as->pasid) {
> > +            vtd_sync_shadow_page_table(vtd_as);
> 
> Do we need to rewalk the shadow pgtable (which is the 2nd level, afaict) even
> if we got the 1st level pgtable invalidated?
> 
> > +        }
> > +    }
> >  }
> 
> The rest looks mostly good to me; thanks.
> 
> -- 
> Peter Xu


Reply via email to