Commit 9009f256, authored by Laurent Pinchart, committed by Joerg Roedel

iommu/ipmmu-vmsa: Rewrite page table management

The IOMMU core will only call us with page sizes advertised as supported
by the driver. We can thus simplify the code by removing loops over PGD
and PMD entries.
Signed-off-by: Laurent Pinchart <laurent.pinchart+renesas@ideasonboard.com>
Signed-off-by: Joerg Roedel <jroedel@suse.de>
Parent: 14e5123e
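
The simplification leans on the IOMMU core's splitting contract: iommu_map() breaks every request into chunks whose sizes come from the driver's pgsize_bitmap and calls the driver's map callback once per chunk. With only SZ_4K and SZ_64K advertised, each call therefore stays within a single second-level (PTE) table, which is why the PGD/PMD loops could go. The sketch below is a minimal userspace model of that contract, not the kernel's iommu_map() code; pick_pgsize(), the sample addresses, and the 136 KiB request are made up for illustration.

#include <stdio.h>
#include <stddef.h>

#define SZ_4K   0x00001000UL
#define SZ_64K  0x00010000UL

/*
 * Hypothetical helper (not kernel API): pick the largest advertised page
 * size that fits both the remaining length and the current alignment of
 * the IOVA/physical address pair, the way the IOMMU core does before
 * calling a driver's map callback.
 */
static unsigned long pick_pgsize(unsigned long pgsize_bitmap,
                                 unsigned long iova, unsigned long paddr,
                                 size_t size)
{
        unsigned long addr_merge = iova | paddr;
        int bit;

        for (bit = 8 * sizeof(unsigned long) - 1; bit >= 0; bit--) {
                unsigned long pgsize = 1UL << bit;

                if (!(pgsize_bitmap & pgsize))
                        continue;       /* size not advertised by the driver */
                if (pgsize > size)
                        continue;       /* larger than what is left to map */
                if (addr_merge & (pgsize - 1))
                        continue;       /* addresses not aligned to this size */
                return pgsize;
        }
        return 0;
}

int main(void)
{
        /* The ipmmu-vmsa driver now advertises only these two sizes. */
        const unsigned long pgsize_bitmap = SZ_64K | SZ_4K;
        /* Sample request: 136 KiB at 64 KiB-aligned addresses (made up). */
        unsigned long iova = 0x100000UL, paddr = 0x40000000UL;
        size_t size = 0x22000;

        while (size) {
                unsigned long pgsize = pick_pgsize(pgsize_bitmap, iova, paddr, size);

                /* Each iteration models one call into the driver's map op. */
                printf("map iova=%#lx paddr=%#lx size=%#lx\n", iova, paddr, pgsize);
                iova += pgsize;
                paddr += pgsize;
                size -= pgsize;
        }
        return 0;
}

Running it prints one line per modelled driver call: two 64 KiB chunks followed by two 4 KiB chunks, which is exactly the granularity the rewritten ipmmu_alloc_init_pte() handles without walking higher-level tables.
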
@@ -517,118 +517,97 @@ static void ipmmu_free_pgtables(struct ipmmu_vmsa_domain *domain)
  * functions as they would flush the CPU TLB.
  */
 
-static int ipmmu_alloc_init_pte(struct ipmmu_vmsa_device *mmu, pmd_t *pmd,
-                                unsigned long addr, unsigned long end,
-                                phys_addr_t phys, int prot)
-{
-        unsigned long pfn = __phys_to_pfn(phys);
-        pteval_t pteval = ARM_VMSA_PTE_PAGE | ARM_VMSA_PTE_NS | ARM_VMSA_PTE_AF
-                        | ARM_VMSA_PTE_XN;
-        pte_t *pte, *start;
-
-        if (pmd_none(*pmd)) {
-                /* Allocate a new set of tables */
-                pte = (pte_t *)get_zeroed_page(GFP_ATOMIC);
-                if (!pte)
-                        return -ENOMEM;
-
-                ipmmu_flush_pgtable(mmu, pte, PAGE_SIZE);
-                *pmd = __pmd(__pa(pte) | PMD_NSTABLE | PMD_TYPE_TABLE);
-                ipmmu_flush_pgtable(mmu, pmd, sizeof(*pmd));
-
-                pte += pte_index(addr);
-        } else
-                pte = pte_offset_kernel(pmd, addr);
-
-        pteval |= ARM_VMSA_PTE_AP_UNPRIV | ARM_VMSA_PTE_nG;
-        if (!(prot & IOMMU_WRITE) && (prot & IOMMU_READ))
-                pteval |= ARM_VMSA_PTE_AP_RDONLY;
-
-        if (prot & IOMMU_CACHE)
-                pteval |= (IMMAIR_ATTR_IDX_WBRWA <<
-                           ARM_VMSA_PTE_ATTRINDX_SHIFT);
-
-        /* If no access, create a faulting entry to avoid TLB fills */
-        if (prot & IOMMU_EXEC)
-                pteval &= ~ARM_VMSA_PTE_XN;
-        else if (!(prot & (IOMMU_READ | IOMMU_WRITE)))
-                pteval &= ~ARM_VMSA_PTE_PAGE;
-
-        pteval |= ARM_VMSA_PTE_SH_IS;
-        start = pte;
-
-        /*
-         * Install the page table entries.
-         *
-         * Set the contiguous hint in the PTEs where possible. The hint
-         * indicates a series of ARM_VMSA_PTE_CONT_ENTRIES PTEs mapping a
-         * physically contiguous region with the following constraints:
-         *
-         * - The region start is aligned to ARM_VMSA_PTE_CONT_SIZE
-         * - Each PTE in the region has the contiguous hint bit set
-         *
-         * We don't support partial unmapping so there's no need to care about
-         * clearing the contiguous hint from neighbour PTEs.
-         */
-        do {
-                unsigned long chunk_end;
-
-                /*
-                 * If the address is aligned to a contiguous region size and the
-                 * mapping size is large enough, process the largest possible
-                 * number of PTEs multiple of ARM_VMSA_PTE_CONT_ENTRIES.
-                 * Otherwise process the smallest number of PTEs to align the
-                 * address to a contiguous region size or to complete the
-                 * mapping.
-                 */
-                if (IS_ALIGNED(addr, ARM_VMSA_PTE_CONT_SIZE) &&
-                    end - addr >= ARM_VMSA_PTE_CONT_SIZE) {
-                        chunk_end = round_down(end, ARM_VMSA_PTE_CONT_SIZE);
-                        pteval |= ARM_VMSA_PTE_CONT;
-                } else {
-                        chunk_end = min(ALIGN(addr, ARM_VMSA_PTE_CONT_SIZE),
-                                        end);
-                        pteval &= ~ARM_VMSA_PTE_CONT;
-                }
-
-                do {
-                        *pte++ = pfn_pte(pfn++, __pgprot(pteval));
-                        addr += PAGE_SIZE;
-                } while (addr != chunk_end);
-        } while (addr != end);
-
-        ipmmu_flush_pgtable(mmu, start, sizeof(*pte) * (pte - start));
-
-        return 0;
-}
-
-static int ipmmu_alloc_init_pmd(struct ipmmu_vmsa_device *mmu, pud_t *pud,
-                                unsigned long addr, unsigned long end,
-                                phys_addr_t phys, int prot)
-{
-        unsigned long next;
-        pmd_t *pmd;
-        int ret;
-
-        if (pud_none(*pud)) {
-                pmd = (pmd_t *)get_zeroed_page(GFP_ATOMIC);
-                if (!pmd)
-                        return -ENOMEM;
-
-                ipmmu_flush_pgtable(mmu, pmd, PAGE_SIZE);
-                *pud = __pud(__pa(pmd) | PMD_NSTABLE | PMD_TYPE_TABLE);
-                ipmmu_flush_pgtable(mmu, pud, sizeof(*pud));
-
-                pmd += pmd_index(addr);
-        } else
-                pmd = pmd_offset(pud, addr);
-
-        do {
-                next = pmd_addr_end(addr, end);
-                ret = ipmmu_alloc_init_pte(mmu, pmd, addr, end, phys, prot);
-                phys += next - addr;
-        } while (pmd++, addr = next, addr < end);
-
-        return ret;
-}
+static pte_t *ipmmu_alloc_pte(struct ipmmu_vmsa_device *mmu, pmd_t *pmd,
+                              unsigned long iova)
+{
+        pte_t *pte;
+
+        if (!pmd_none(*pmd))
+                return pte_offset_kernel(pmd, iova);
+
+        pte = (pte_t *)get_zeroed_page(GFP_ATOMIC);
+        if (!pte)
+                return NULL;
+
+        ipmmu_flush_pgtable(mmu, pte, PAGE_SIZE);
+        *pmd = __pmd(__pa(pte) | PMD_NSTABLE | PMD_TYPE_TABLE);
+        ipmmu_flush_pgtable(mmu, pmd, sizeof(*pmd));
+
+        return pte + pte_index(iova);
+}
+
+static pmd_t *ipmmu_alloc_pmd(struct ipmmu_vmsa_device *mmu, pgd_t *pgd,
+                              unsigned long iova)
+{
+        pud_t *pud = (pud_t *)pgd;
+        pmd_t *pmd;
+
+        if (!pud_none(*pud))
+                return pmd_offset(pud, iova);
+
+        pmd = (pmd_t *)get_zeroed_page(GFP_ATOMIC);
+        if (!pmd)
+                return NULL;
+
+        ipmmu_flush_pgtable(mmu, pmd, PAGE_SIZE);
+        *pud = __pud(__pa(pmd) | PMD_NSTABLE | PMD_TYPE_TABLE);
+        ipmmu_flush_pgtable(mmu, pud, sizeof(*pud));
+
+        return pmd + pmd_index(iova);
+}
+
+static u64 ipmmu_page_prot(unsigned int prot, u64 type)
+{
+        u64 pgprot = ARM_VMSA_PTE_XN | ARM_VMSA_PTE_nG | ARM_VMSA_PTE_AF
+                   | ARM_VMSA_PTE_SH_IS | ARM_VMSA_PTE_AP_UNPRIV
+                   | ARM_VMSA_PTE_NS | type;
+
+        if (!(prot & IOMMU_WRITE) && (prot & IOMMU_READ))
+                pgprot |= ARM_VMSA_PTE_AP_RDONLY;
+
+        if (prot & IOMMU_CACHE)
+                pgprot |= IMMAIR_ATTR_IDX_WBRWA << ARM_VMSA_PTE_ATTRINDX_SHIFT;
+
+        if (prot & IOMMU_EXEC)
+                pgprot &= ~ARM_VMSA_PTE_XN;
+        else if (!(prot & (IOMMU_READ | IOMMU_WRITE)))
+                /* If no access create a faulting entry to avoid TLB fills. */
+                pgprot &= ~ARM_VMSA_PTE_PAGE;
+
+        return pgprot;
+}
+
+static int ipmmu_alloc_init_pte(struct ipmmu_vmsa_device *mmu, pmd_t *pmd,
+                                unsigned long iova, unsigned long pfn,
+                                size_t size, int prot)
+{
+        pteval_t pteval = ipmmu_page_prot(prot, ARM_VMSA_PTE_PAGE);
+        unsigned int num_ptes = 1;
+        pte_t *pte, *start;
+        unsigned int i;
+
+        pte = ipmmu_alloc_pte(mmu, pmd, iova);
+        if (!pte)
+                return -ENOMEM;
+
+        start = pte;
+
+        /*
+         * Install the page table entries. We can be called both for a single
+         * page or for a block of 16 physically contiguous pages. In the latter
+         * case set the PTE contiguous hint.
+         */
+        if (size == SZ_64K) {
+                pteval |= ARM_VMSA_PTE_CONT;
+                num_ptes = ARM_VMSA_PTE_CONT_ENTRIES;
+        }
+
+        for (i = num_ptes; i; --i)
+                *pte++ = pfn_pte(pfn++, __pgprot(pteval));
+
+        ipmmu_flush_pgtable(mmu, start, sizeof(*pte) * num_ptes);
+
+        return 0;
+}
 
 static int ipmmu_handle_mapping(struct ipmmu_vmsa_domain *domain,
@@ -638,7 +617,8 @@ static int ipmmu_handle_mapping(struct ipmmu_vmsa_domain *domain,
         struct ipmmu_vmsa_device *mmu = domain->mmu;
         pgd_t *pgd = domain->pgd;
         unsigned long flags;
-        unsigned long end;
+        unsigned long pfn;
+        pmd_t *pmd;
         int ret;
 
         if (!pgd)
@@ -650,25 +630,24 @@ static int ipmmu_handle_mapping(struct ipmmu_vmsa_domain *domain,
         if (paddr & ~((1ULL << 40) - 1))
                 return -ERANGE;
 
-        spin_lock_irqsave(&domain->lock, flags);
-
+        pfn = __phys_to_pfn(paddr);
         pgd += pgd_index(iova);
-        end = iova + size;
 
-        do {
-                unsigned long next = pgd_addr_end(iova, end);
-
-                ret = ipmmu_alloc_init_pmd(mmu, (pud_t *)pgd, iova, next, paddr,
-                                           prot);
-                if (ret)
-                        break;
-
-                paddr += next - iova;
-                iova = next;
-        } while (pgd++, iova != end);
+        /* Update the page tables. */
+        spin_lock_irqsave(&domain->lock, flags);
+
+        pmd = ipmmu_alloc_pmd(mmu, pgd, iova);
+        if (!pmd) {
+                ret = -ENOMEM;
+                goto done;
+        }
+
+        ret = ipmmu_alloc_init_pte(mmu, pmd, iova, pfn, size, prot);
 
+done:
         spin_unlock_irqrestore(&domain->lock, flags);
 
         if (!ret)
                 ipmmu_tlb_invalidate(domain);
 
         return ret;
@@ -951,7 +930,7 @@ static struct iommu_ops ipmmu_ops = {
         .iova_to_phys = ipmmu_iova_to_phys,
         .add_device = ipmmu_add_device,
         .remove_device = ipmmu_remove_device,
-        .pgsize_bitmap = SZ_2M | SZ_64K | SZ_4K,
+        .pgsize_bitmap = SZ_64K | SZ_4K,
 };
 
 /* -----------------------------------------------------------------------------
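
For the 64 KiB case, the new ipmmu_alloc_init_pte() installs ARM_VMSA_PTE_CONT_ENTRIES page table entries with the contiguous hint set and then flushes exactly that many entries. The standalone check below only restates that arithmetic (16 contiguous 4 KiB PTEs per 64 KiB block); num_ptes_for() is a hypothetical helper written for this note, not driver code.

#include <assert.h>
#include <stddef.h>
#include <stdio.h>

#define SZ_4K   0x1000UL
#define SZ_64K  0x10000UL

/* Value used by the driver: a 64 KiB block is 16 contiguous 4 KiB PTEs. */
#define ARM_VMSA_PTE_CONT_ENTRIES 16

/* Mirrors the sizing decision in the new ipmmu_alloc_init_pte(). */
static unsigned int num_ptes_for(size_t size)
{
        return size == SZ_64K ? ARM_VMSA_PTE_CONT_ENTRIES : 1;
}

int main(void)
{
        /* A 4 KiB map installs one PTE; a 64 KiB map installs 16 of them. */
        assert(num_ptes_for(SZ_4K) == 1);
        assert(num_ptes_for(SZ_64K) * SZ_4K == SZ_64K);

        printf("64 KiB block = %u contiguous 4 KiB PTEs\n",
               num_ptes_for(SZ_64K));
        return 0;
}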