Inter-revision diff: patch 2

Comparing v1 (message) to v4 (message)

--- v1
+++ v4
@@ -1,212 +1,43 @@
-At the moment pnv_pci_ioda_tce_invalidate() gets the PE pointer via
-container_of(tbl). Since we are going to have to add Dynamic DMA windows
-and that means having 2 IOMMU tables per PE, this is not going to work.
-
-This implements pnv_pci_ioda(1|2)_tce_invalidate as a pnv_ioda_pe callback.
-
-This adds a pnv_iommu_table wrapper around iommu_table and stores a pointer
-to PE there. PNV's ppc_md.tce_build() call uses this to find PE and
-do the invalidation. This will be used later for Dynamic DMA windows too.
-
-This registers invalidate() callbacks for IODA1 and IODA2:
-- pnv_pci_ioda1_tce_invalidate;
-- pnv_pci_ioda2_tce_invalidate.
+This clears the TCE table when a container is being closed as this is
+a good thing to leave the table clean before passing the ownership
+back to the host kernel.
 
 Signed-off-by: Alexey Kardashevskiy <aik@ozlabs.ru>
 ---
- arch/powerpc/platforms/powernv/pci-ioda.c | 35 ++++++++++++-------------------
- arch/powerpc/platforms/powernv/pci.c      | 31 ++++++++++++++++++++-------
- arch/powerpc/platforms/powernv/pci.h      | 13 +++++++++++-
- 3 files changed, 48 insertions(+), 31 deletions(-)
+ drivers/vfio/vfio_iommu_spapr_tce.c | 14 +++++++++++---
+ 1 file changed, 11 insertions(+), 3 deletions(-)
 
-diff --git a/arch/powerpc/platforms/powernv/pci-ioda.c b/arch/powerpc/platforms/powernv/pci-ioda.c
-index df241b1..136e765 100644
---- a/arch/powerpc/platforms/powernv/pci-ioda.c
-+++ b/arch/powerpc/platforms/powernv/pci-ioda.c
-@@ -857,7 +857,7 @@ static void pnv_pci_ioda_dma_dev_setup(struct pnv_phb *phb, struct pci_dev *pdev
- 
- 	pe = &phb->ioda.pe_array[pdn->pe_number];
- 	WARN_ON(get_dma_ops(&pdev->dev) != &dma_iommu_ops);
--	set_iommu_table_base_and_group(&pdev->dev, &pe->tce32_table);
-+	set_iommu_table_base_and_group(&pdev->dev, &pe->tce32.table);
+diff --git a/drivers/vfio/vfio_iommu_spapr_tce.c b/drivers/vfio/vfio_iommu_spapr_tce.c
+index 1ef46c3..daf2e2c 100644
+--- a/drivers/vfio/vfio_iommu_spapr_tce.c
++++ b/drivers/vfio/vfio_iommu_spapr_tce.c
+@@ -134,16 +134,24 @@ static void *tce_iommu_open(unsigned long arg)
+ 	return container;
  }
  
- static int pnv_pci_ioda_dma_set_mask(struct pnv_phb *phb,
-@@ -884,7 +884,7 @@ static int pnv_pci_ioda_dma_set_mask(struct pnv_phb *phb,
- 	} else {
- 		dev_info(&pdev->dev, "Using 32-bit DMA via iommu\n");
- 		set_dma_ops(&pdev->dev, &dma_iommu_ops);
--		set_iommu_table_base(&pdev->dev, &pe->tce32_table);
-+		set_iommu_table_base(&pdev->dev, &pe->tce32.table);
- 	}
- 	*pdev->dev.dma_mask = dma_mask;
- 	return 0;
-@@ -899,9 +899,9 @@ static void pnv_ioda_setup_bus_dma(struct pnv_ioda_pe *pe,
- 	list_for_each_entry(dev, &bus->devices, bus_list) {
- 		if (add_to_iommu_group)
- 			set_iommu_table_base_and_group(&dev->dev,
--						       &pe->tce32_table);
-+						       &pe->tce32.table);
- 		else
--			set_iommu_table_base(&dev->dev, &pe->tce32_table);
-+			set_iommu_table_base(&dev->dev, &pe->tce32.table);
++static int tce_iommu_clear(struct tce_container *container,
++		struct iommu_table *tbl,
++		unsigned long entry, unsigned long pages);
++
+ static void tce_iommu_release(void *iommu_data)
+ {
+ 	struct tce_container *container = iommu_data;
++	struct iommu_table *tbl = container->tbl;
  
- 		if (dev->subordinate)
- 			pnv_ioda_setup_bus_dma(pe, dev->subordinate,
-@@ -988,19 +988,6 @@ static void pnv_pci_ioda2_tce_invalidate(struct pnv_ioda_pe *pe,
- 	}
- }
+-	WARN_ON(container->tbl && !container->tbl->it_group);
++	WARN_ON(tbl && !tbl->it_group);
+ 	tce_iommu_disable(container);
  
--void pnv_pci_ioda_tce_invalidate(struct iommu_table *tbl,
--				 __be64 *startp, __be64 *endp, bool rm)
--{
--	struct pnv_ioda_pe *pe = container_of(tbl, struct pnv_ioda_pe,
--					      tce32_table);
--	struct pnv_phb *phb = pe->phb;
--
--	if (phb->type == PNV_PHB_IODA1)
--		pnv_pci_ioda1_tce_invalidate(pe, tbl, startp, endp, rm);
--	else
--		pnv_pci_ioda2_tce_invalidate(pe, tbl, startp, endp, rm);
--}
--
- static void pnv_pci_ioda_setup_dma_pe(struct pnv_phb *phb,
- 				      struct pnv_ioda_pe *pe, unsigned int base,
- 				      unsigned int segs)
-@@ -1058,9 +1045,11 @@ static void pnv_pci_ioda_setup_dma_pe(struct pnv_phb *phb,
- 	}
+-	if (container->tbl && container->tbl->it_group)
+-		tce_iommu_detach_group(iommu_data, container->tbl->it_group);
++	if (tbl) {
++		tce_iommu_clear(container, tbl,	tbl->it_offset, tbl->it_size);
  
- 	/* Setup linux iommu table */
--	tbl = &pe->tce32_table;
-+	tbl = &pe->tce32.table;
- 	pnv_pci_setup_iommu_table(tbl, addr, TCE32_TABLE_SIZE * segs,
- 				  base << 28, IOMMU_PAGE_SHIFT_4K);
-+	pe->tce32.pe = pe;
-+	pe->tce32.invalidate_fn = pnv_pci_ioda1_tce_invalidate;
++		if (tbl->it_group)
++			tce_iommu_detach_group(iommu_data, tbl->it_group);
++	}
+ 	mutex_destroy(&container->lock);
  
- 	/* OPAL variant of P7IOC SW invalidated TCEs */
- 	swinvp = of_get_property(phb->hose->dn, "ibm,opal-tce-kill", NULL);
-@@ -1097,7 +1086,7 @@ static void pnv_pci_ioda_setup_dma_pe(struct pnv_phb *phb,
- static void pnv_pci_ioda2_set_bypass(struct iommu_table *tbl, bool enable)
- {
- 	struct pnv_ioda_pe *pe = container_of(tbl, struct pnv_ioda_pe,
--					      tce32_table);
-+					      tce32.table);
- 	uint16_t window_id = (pe->pe_number << 1 ) + 1;
- 	int64_t rc;
- 
-@@ -1142,10 +1131,10 @@ static void pnv_pci_ioda2_setup_bypass_pe(struct pnv_phb *phb,
- 	pe->tce_bypass_base = 1ull << 59;
- 
- 	/* Install set_bypass callback for VFIO */
--	pe->tce32_table.set_bypass = pnv_pci_ioda2_set_bypass;
-+	pe->tce32.table.set_bypass = pnv_pci_ioda2_set_bypass;
- 
- 	/* Enable bypass by default */
--	pnv_pci_ioda2_set_bypass(&pe->tce32_table, true);
-+	pnv_pci_ioda2_set_bypass(&pe->tce32.table, true);
- }
- 
- static void pnv_pci_ioda2_setup_dma_pe(struct pnv_phb *phb,
-@@ -1193,9 +1182,11 @@ static void pnv_pci_ioda2_setup_dma_pe(struct pnv_phb *phb,
- 	}
- 
- 	/* Setup linux iommu table */
--	tbl = &pe->tce32_table;
-+	tbl = &pe->tce32.table;
- 	pnv_pci_setup_iommu_table(tbl, addr, tce_table_size, 0,
- 			IOMMU_PAGE_SHIFT_4K);
-+	pe->tce32.pe = pe;
-+	pe->tce32.invalidate_fn = pnv_pci_ioda2_tce_invalidate;
- 
- 	/* OPAL variant of PHB3 invalidated TCEs */
- 	swinvp = of_get_property(phb->hose->dn, "ibm,opal-tce-kill", NULL);
-diff --git a/arch/powerpc/platforms/powernv/pci.c b/arch/powerpc/platforms/powernv/pci.c
-index b854b57..97895d4 100644
---- a/arch/powerpc/platforms/powernv/pci.c
-+++ b/arch/powerpc/platforms/powernv/pci.c
-@@ -599,6 +599,27 @@ struct pci_ops pnv_pci_ops = {
- 	.write = pnv_pci_write_config,
- };
- 
-+static void pnv_tce_invalidate(struct iommu_table *tbl, __be64 *startp,
-+	__be64 *endp, bool rm)
-+{
-+	struct pnv_iommu_table *ptbl = container_of(tbl,
-+			struct pnv_iommu_table, table);
-+	struct pnv_ioda_pe *pe = ptbl->pe;
-+
-+	/*
-+	 * Some implementations won't cache invalid TCEs and thus may not
-+	 * need that flush. We'll probably turn it_type into a bit mask
-+	 * of flags if that becomes the case
-+	 */
-+	if (!(tbl->it_type & TCE_PCI_SWINV_FREE))
-+		return;
-+
-+	if (!pe || !ptbl->invalidate_fn)
-+		return;
-+
-+	ptbl->invalidate_fn(pe, tbl, startp, endp, rm);
-+}
-+
- static int pnv_tce_build(struct iommu_table *tbl, long index, long npages,
- 			 unsigned long uaddr, enum dma_data_direction direction,
- 			 struct dma_attrs *attrs, bool rm)
-@@ -619,12 +640,7 @@ static int pnv_tce_build(struct iommu_table *tbl, long index, long npages,
- 		*(tcep++) = cpu_to_be64(proto_tce |
- 				(rpn++ << tbl->it_page_shift));
- 
--	/* Some implementations won't cache invalid TCEs and thus may not
--	 * need that flush. We'll probably turn it_type into a bit mask
--	 * of flags if that becomes the case
--	 */
--	if (tbl->it_type & TCE_PCI_SWINV_CREATE)
--		pnv_pci_ioda_tce_invalidate(tbl, tces, tcep - 1, rm);
-+	pnv_tce_invalidate(tbl, tces, tcep - 1, rm);
- 
- 	return 0;
- }
-@@ -648,8 +664,7 @@ static void pnv_tce_free(struct iommu_table *tbl, long index, long npages,
- 	while (npages--)
- 		*(tcep++) = cpu_to_be64(0);
- 
--	if (tbl->it_type & TCE_PCI_SWINV_FREE)
--		pnv_pci_ioda_tce_invalidate(tbl, tces, tcep - 1, rm);
-+	pnv_tce_invalidate(tbl, tces, tcep - 1, rm);
- }
- 
- static void pnv_tce_free_vm(struct iommu_table *tbl, long index, long npages)
-diff --git a/arch/powerpc/platforms/powernv/pci.h b/arch/powerpc/platforms/powernv/pci.h
-index 48494d4..095db43 100644
---- a/arch/powerpc/platforms/powernv/pci.h
-+++ b/arch/powerpc/platforms/powernv/pci.h
-@@ -24,6 +24,17 @@ enum pnv_phb_model {
- #define PNV_IODA_PE_MASTER	(1 << 3)	/* Master PE in compound case	*/
- #define PNV_IODA_PE_SLAVE	(1 << 4)	/* Slave PE in compound case	*/
- 
-+struct pnv_ioda_pe;
-+typedef void (*pnv_invalidate_fn)(struct pnv_ioda_pe *pe,
-+		struct iommu_table *tbl,
-+		__be64 *startp, __be64 *endp, bool rm);
-+
-+struct pnv_iommu_table {
-+	struct iommu_table	table;
-+	struct pnv_ioda_pe	*pe;
-+	pnv_invalidate_fn	invalidate_fn;
-+};
-+
- /* Data associated with a PE, including IOMMU tracking etc.. */
- struct pnv_phb;
- struct pnv_ioda_pe {
-@@ -53,7 +64,7 @@ struct pnv_ioda_pe {
- 	/* "Base" iommu table, ie, 4K TCEs, 32-bit DMA */
- 	int			tce32_seg;
- 	int			tce32_segcount;
--	struct iommu_table	tce32_table;
-+	struct pnv_iommu_table	tce32;
- 	phys_addr_t		tce_inval_reg_phys;
- 
- 	/* 64-bit TCE bypass region */
+ 	kfree(container);
 -- 
 2.0.0
Keyboard shortcuts
hback out one level
jnext message in thread
kprevious message in thread
ldrill in
Escclose help / fold thread tree
?toggle this help