
Re: [Xen-devel] [PATCH v2 13/13] [RFC] iommu: AMD-Vi: Squash map_pages/unmap_pages with map_page/unmap_page



Hi, all.

Any comments?
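
In case it helps review, the essence of the patch below is to fold the
old per-page map/unmap helpers into the multi-page entry points while
keeping the existing "undo whatever was already mapped on failure"
behaviour. Below is a minimal, standalone sketch of that rollback
pattern. It is purely illustrative and not Xen code: map_one() and
unmap_one() are made-up stand-ins for the per-frame work, and locking
and TLB flushing are elided.

#include <stdio.h>

/* Hypothetical per-frame helpers standing in for the real IOMMU work. */
static int map_one(unsigned long gfn, unsigned long mfn)
{
    (void)mfn;
    /* Simulate a failure on one particular frame. */
    return (gfn == 6) ? -1 : 0;
}

static void unmap_one(unsigned long gfn)
{
    printf("rolled back gfn %lu\n", gfn);
}

/* Map 2^order frames; on failure, unmap what was already mapped. */
static int map_pages(unsigned long gfn, unsigned long mfn, unsigned int order)
{
    unsigned long i;

    for ( i = 0; i < (1UL << order); i++ )
    {
        if ( map_one(gfn + i, mfn + i) )
        {
            while ( i-- )
                unmap_one(gfn + i);
            return -1;
        }
    }

    return 0;
}

int main(void)
{
    /* gfns 4..7; frame 6 fails, so frames 5 and 4 get rolled back. */
    return map_pages(4, 100, 2) ? 1 : 0;
}

The real amd_iommu_map_pages() in the patch does the same thing, but
additionally takes the mapping lock per iteration and performs the
flush/merge handling that was already there.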

On Tue, Jul 25, 2017 at 8:26 PM, Oleksandr Tyshchenko
<olekstysh@xxxxxxxxx> wrote:
> From: Oleksandr Tyshchenko <oleksandr_tyshchenko@xxxxxxxx>
>
> Reduce the scope of the TODO by squashing the single-page handling with
> the multi-page one. The next target is to use large pages whenever
> possible when the hardware supports them.
>
> Signed-off-by: Oleksandr Tyshchenko <oleksandr_tyshchenko@xxxxxxxx>
> CC: Jan Beulich <jbeulich@xxxxxxxx>
> CC: Suravee Suthikulpanit <suravee.suthikulpanit@xxxxxxx>
>
> ---
>    Changes in v1:
>       -
>
>    Changes in v2:
>       -
>
> ---
>  xen/drivers/passthrough/amd/iommu_map.c | 250 ++++++++++++++++----------------
>  1 file changed, 121 insertions(+), 129 deletions(-)
>
> diff --git a/xen/drivers/passthrough/amd/iommu_map.c b/xen/drivers/passthrough/amd/iommu_map.c
> index ea3a728..22d0cc6 100644
> --- a/xen/drivers/passthrough/amd/iommu_map.c
> +++ b/xen/drivers/passthrough/amd/iommu_map.c
> @@ -631,188 +631,180 @@ static int update_paging_mode(struct domain *d, unsigned long gfn)
>      return 0;
>  }
>
> -static int __must_check amd_iommu_map_page(struct domain *d, unsigned long gfn,
> -                                           unsigned long mfn,
> -                                           unsigned int flags)
> +/*
> + * TODO: Optimize by using large pages whenever possible in the case
> + * that hardware supports them.
> + */
> +int __must_check amd_iommu_map_pages(struct domain *d, unsigned long gfn,
> +                                     unsigned long mfn,
> +                                     unsigned int order,
> +                                     unsigned int flags)
>  {
> -    bool_t need_flush = 0;
>      struct domain_iommu *hd = dom_iommu(d);
>      int rc;
> -    unsigned long pt_mfn[7];
> -    unsigned int merge_level;
> +    unsigned long orig_gfn = gfn;
> +    unsigned long i;
>
>      if ( iommu_use_hap_pt(d) )
>          return 0;
>
> -    memset(pt_mfn, 0, sizeof(pt_mfn));
> -
>      spin_lock(&hd->arch.mapping_lock);
> -
>      rc = amd_iommu_alloc_root(hd);
> +    spin_unlock(&hd->arch.mapping_lock);
>      if ( rc )
>      {
> -        spin_unlock(&hd->arch.mapping_lock);
>          AMD_IOMMU_DEBUG("Root table alloc failed, gfn = %lx\n", gfn);
>          domain_crash(d);
>          return rc;
>      }
>
> -    /* Since HVM domain is initialized with 2 level IO page table,
> -     * we might need a deeper page table for lager gfn now */
> -    if ( is_hvm_domain(d) )
> +    for ( i = 0; i < (1UL << order); i++, gfn++, mfn++ )
>      {
> -        if ( update_paging_mode(d, gfn) )
> +        bool_t need_flush = 0;
> +        unsigned long pt_mfn[7];
> +        unsigned int merge_level;
> +
> +        memset(pt_mfn, 0, sizeof(pt_mfn));
> +
> +        spin_lock(&hd->arch.mapping_lock);
> +
> +        /* Since HVM domain is initialized with 2 level IO page table,
> +         * we might need a deeper page table for larger gfn now */
> +        if ( is_hvm_domain(d) )
> +        {
> +            if ( update_paging_mode(d, gfn) )
> +            {
> +                spin_unlock(&hd->arch.mapping_lock);
> +                AMD_IOMMU_DEBUG("Update page mode failed gfn = %lx\n", gfn);
> +                domain_crash(d);
> +                rc = -EFAULT;
> +                goto err;
> +            }
> +        }
> +
> +        if ( iommu_pde_from_gfn(d, gfn, pt_mfn) || (pt_mfn[1] == 0) )
>          {
>              spin_unlock(&hd->arch.mapping_lock);
> -            AMD_IOMMU_DEBUG("Update page mode failed gfn = %lx\n", gfn);
> +            AMD_IOMMU_DEBUG("Invalid IO pagetable entry gfn = %lx\n", gfn);
>              domain_crash(d);
> -            return -EFAULT;
> +            rc = -EFAULT;
> +            goto err;
>          }
> -    }
>
> -    if ( iommu_pde_from_gfn(d, gfn, pt_mfn) || (pt_mfn[1] == 0) )
> -    {
> -        spin_unlock(&hd->arch.mapping_lock);
> -        AMD_IOMMU_DEBUG("Invalid IO pagetable entry gfn = %lx\n", gfn);
> -        domain_crash(d);
> -        return -EFAULT;
> -    }
> +        /* Install 4k mapping first */
> +        need_flush = set_iommu_pte_present(pt_mfn[1], gfn, mfn,
> +                                           IOMMU_PAGING_MODE_LEVEL_1,
> +                                           !!(flags & IOMMUF_writable),
> +                                           !!(flags & IOMMUF_readable));
>
> -    /* Install 4k mapping first */
> -    need_flush = set_iommu_pte_present(pt_mfn[1], gfn, mfn,
> -                                       IOMMU_PAGING_MODE_LEVEL_1,
> -                                       !!(flags & IOMMUF_writable),
> -                                       !!(flags & IOMMUF_readable));
> +        /* Do not increase pde count if io mapping has not been changed */
> +        if ( !need_flush )
> +        {
> +            spin_unlock(&hd->arch.mapping_lock);
> +            continue;
> +        }
>
> -    /* Do not increase pde count if io mapping has not been changed */
> -    if ( !need_flush )
> -        goto out;
> +        /* 4K mapping for PV guests never changes,
> +         * no need to flush if we trust non-present bits */
> +        if ( is_hvm_domain(d) )
> +            amd_iommu_flush_pages(d, gfn, 0);
>
> -    /* 4K mapping for PV guests never changes,
> -     * no need to flush if we trust non-present bits */
> -    if ( is_hvm_domain(d) )
> -        amd_iommu_flush_pages(d, gfn, 0);
> -
> -    for ( merge_level = IOMMU_PAGING_MODE_LEVEL_2;
> -          merge_level <= hd->arch.paging_mode; merge_level++ )
> -    {
> -        if ( pt_mfn[merge_level] == 0 )
> -            break;
> -        if ( !iommu_update_pde_count(d, pt_mfn[merge_level],
> -                                     gfn, mfn, merge_level) )
> -            break;
> -
> -        if ( iommu_merge_pages(d, pt_mfn[merge_level], gfn,
> -                               flags, merge_level) )
> +        for ( merge_level = IOMMU_PAGING_MODE_LEVEL_2;
> +              merge_level <= hd->arch.paging_mode; merge_level++ )
>          {
> -            spin_unlock(&hd->arch.mapping_lock);
> -            AMD_IOMMU_DEBUG("Merge iommu page failed at level %d, "
> -                            "gfn = %lx mfn = %lx\n", merge_level, gfn, mfn);
> -            domain_crash(d);
> -            return -EFAULT;
> +            if ( pt_mfn[merge_level] == 0 )
> +                break;
> +            if ( !iommu_update_pde_count(d, pt_mfn[merge_level],
> +                                         gfn, mfn, merge_level) )
> +                break;
> +
> +            if ( iommu_merge_pages(d, pt_mfn[merge_level], gfn,
> +                                   flags, merge_level) )
> +            {
> +                spin_unlock(&hd->arch.mapping_lock);
> +                AMD_IOMMU_DEBUG("Merge iommu page failed at level %d, "
> +                                "gfn = %lx mfn = %lx\n", merge_level, gfn, mfn);
> +                domain_crash(d);
> +                rc = -EFAULT;
> +                goto err;
> +            }
> +
> +            /* Deallocate lower level page table */
> +            free_amd_iommu_pgtable(mfn_to_page(pt_mfn[merge_level - 1]));
>          }
>
> -        /* Deallocate lower level page table */
> -        free_amd_iommu_pgtable(mfn_to_page(pt_mfn[merge_level - 1]));
> +        spin_unlock(&hd->arch.mapping_lock);
>      }
>
> -out:
> -    spin_unlock(&hd->arch.mapping_lock);
>      return 0;
> +
> +err:
> +    while ( i-- )
> +        /* If statement to satisfy __must_check. */
> +        if ( amd_iommu_unmap_pages(d, orig_gfn + i, 0) )
> +            continue;
> +
> +    return rc;
>  }
>
> -static int __must_check amd_iommu_unmap_page(struct domain *d,
> -                                             unsigned long gfn)
> +int __must_check amd_iommu_unmap_pages(struct domain *d,
> +                                       unsigned long gfn,
> +                                       unsigned int order)
>  {
> -    unsigned long pt_mfn[7];
>      struct domain_iommu *hd = dom_iommu(d);
> +    int rt = 0;
> +    unsigned long i;
>
>      if ( iommu_use_hap_pt(d) )
>          return 0;
>
> -    memset(pt_mfn, 0, sizeof(pt_mfn));
> -
> -    spin_lock(&hd->arch.mapping_lock);
> -
>      if ( !hd->arch.root_table )
> -    {
> -        spin_unlock(&hd->arch.mapping_lock);
>          return 0;
> -    }
>
> -    /* Since HVM domain is initialized with 2 level IO page table,
> -     * we might need a deeper page table for lager gfn now */
> -    if ( is_hvm_domain(d) )
> +    for ( i = 0; i < (1UL << order); i++, gfn++ )
>      {
> -        int rc = update_paging_mode(d, gfn);
> +        unsigned long pt_mfn[7];
>
> -        if ( rc )
> -        {
> -            spin_unlock(&hd->arch.mapping_lock);
> -            AMD_IOMMU_DEBUG("Update page mode failed gfn = %lx\n", gfn);
> -            if ( rc != -EADDRNOTAVAIL )
> -                domain_crash(d);
> -            return rc;
> -        }
> -    }
> +        memset(pt_mfn, 0, sizeof(pt_mfn));
>
> -    if ( iommu_pde_from_gfn(d, gfn, pt_mfn) || (pt_mfn[1] == 0) )
> -    {
> -        spin_unlock(&hd->arch.mapping_lock);
> -        AMD_IOMMU_DEBUG("Invalid IO pagetable entry gfn = %lx\n", gfn);
> -        domain_crash(d);
> -        return -EFAULT;
> -    }
> -
> -    /* mark PTE as 'page not present' */
> -    clear_iommu_pte_present(pt_mfn[1], gfn);
> -    spin_unlock(&hd->arch.mapping_lock);
> +        spin_lock(&hd->arch.mapping_lock);
>
> -    amd_iommu_flush_pages(d, gfn, 0);
> -
> -    return 0;
> -}
> -
> -/* TODO: Optimize by squashing map_pages/unmap_pages with map_page/unmap_page */
> -int __must_check amd_iommu_map_pages(struct domain *d, unsigned long gfn,
> -                                     unsigned long mfn, unsigned int order,
> -                                     unsigned int flags)
> -{
> -    unsigned long i;
> -    int rc = 0;
> -
> -    for ( i = 0; i < (1UL << order); i++ )
> -    {
> -        rc = amd_iommu_map_page(d, gfn + i, mfn + i, flags);
> -        if ( unlikely(rc) )
> +        /* Since HVM domain is initialized with 2 level IO page table,
> +         * we might need a deeper page table for larger gfn now */
> +        if ( is_hvm_domain(d) )
>          {
> -            while ( i-- )
> -                /* If statement to satisfy __must_check. */
> -                if ( amd_iommu_unmap_page(d, gfn + i) )
> -                    continue;
> +            int rc = update_paging_mode(d, gfn);
>
> -            break;
> +            if ( rc )
> +            {
> +                spin_unlock(&hd->arch.mapping_lock);
> +                AMD_IOMMU_DEBUG("Update page mode failed gfn = %lx\n", gfn);
> +                if ( rc != -EADDRNOTAVAIL )
> +                    domain_crash(d);
> +                if ( !rt )
> +                    rt = rc;
> +                continue;
> +            }
>          }
> -    }
> -
> -    return rc;
> -}
>
> -int __must_check amd_iommu_unmap_pages(struct domain *d, unsigned long gfn,
> -                                       unsigned int order)
> -{
> -    unsigned long i;
> -    int rc = 0;
> +        if ( iommu_pde_from_gfn(d, gfn, pt_mfn) || (pt_mfn[1] == 0) )
> +        {
> +            spin_unlock(&hd->arch.mapping_lock);
> +            AMD_IOMMU_DEBUG("Invalid IO pagetable entry gfn = %lx\n", gfn);
> +            domain_crash(d);
> +            if ( !rt )
> +                rt = -EFAULT;
> +            continue;
> +        }
>
> -    for ( i = 0; i < (1UL << order); i++ )
> -    {
> -        int ret = amd_iommu_unmap_page(d, gfn + i);
> +        /* mark PTE as 'page not present' */
> +        clear_iommu_pte_present(pt_mfn[1], gfn);
> +        spin_unlock(&hd->arch.mapping_lock);
>
> -        if ( !rc )
> -            rc = ret;
> +        amd_iommu_flush_pages(d, gfn, 0);
>      }
>
> -    return rc;
> +    return rt;
>  }
>
>  int amd_iommu_reserve_domain_unity_map(struct domain *domain,
> @@ -831,7 +823,7 @@ int amd_iommu_reserve_domain_unity_map(struct domain *domain,
>      gfn = phys_addr >> PAGE_SHIFT;
>      for ( i = 0; i < npages; i++ )
>      {
> -        rt = amd_iommu_map_page(domain, gfn +i, gfn +i, flags);
> +        rt = amd_iommu_map_pages(domain, gfn + i, gfn + i, 0, flags);
>          if ( rt != 0 )
>              return rt;
>      }
> --
> 2.7.4
>



-- 
Regards,

Oleksandr Tyshchenko

_______________________________________________
Xen-devel mailing list
Xen-devel@xxxxxxxxxxxxx
https://lists.xen.org/xen-devel

 

