Inter-revision diff: patch 4

Comparing v2 (message) to v5 (message)

--- v2
+++ v5
@@ -1,293 +1,189 @@
-__ioremap(), ioremap(), ioremap_wc() et ioremap_prot() are
-very similar between PPC32 and PPC64, they can easily be
-made common.
+The 8xx TLB miss routines are patched when (de)activating
+perf counters.
 
-_PAGE_WRITE equals to _PAGE_RW on PPC32
-_PAGE_RO and _PAGE_HWWRITE are 0 on PPC64
-
-iounmap() can also be made common by renaming the PPC32
-iounmap() as __iounmap() then __iounmap() can also
-be made common to PPC32 and PPC64.
-
-This patch also makes __ioremap_caller() common to PPC32 and PPC64
+This patch uses the new patch_site functionality in order
+to get a better code readability and avoid a label mess when
+dumping the code with 'objdump -d'
 
 Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
 ---
- arch/powerpc/include/asm/book3s/64/pgtable.h |   2 +
- arch/powerpc/include/asm/machdep.h           |   2 +-
- arch/powerpc/mm/ioremap.c                    | 190 ++++++---------------------
- 3 files changed, 46 insertions(+), 148 deletions(-)
+ arch/powerpc/include/asm/mmu-8xx.h |  4 ++++
+ arch/powerpc/kernel/head_8xx.S     | 33 +++++++++++++++++++--------------
+ arch/powerpc/perf/8xx-pmu.c        | 27 ++++++++++++---------------
+ 3 files changed, 35 insertions(+), 29 deletions(-)
 
-diff --git a/arch/powerpc/include/asm/book3s/64/pgtable.h b/arch/powerpc/include/asm/book3s/64/pgtable.h
-index 47b5ffc8715d..2bebdd8302cb 100644
---- a/arch/powerpc/include/asm/book3s/64/pgtable.h
-+++ b/arch/powerpc/include/asm/book3s/64/pgtable.h
-@@ -17,6 +17,8 @@
- #define _PAGE_NA		0
- #define _PAGE_RO		0
- #define _PAGE_USER		0
-+#define _PAGE_HWWRITE		0
-+#define _PAGE_COHERENT		0
+diff --git a/arch/powerpc/include/asm/mmu-8xx.h b/arch/powerpc/include/asm/mmu-8xx.h
+index 3a15d6647d47..fa05aa566ece 100644
+--- a/arch/powerpc/include/asm/mmu-8xx.h
++++ b/arch/powerpc/include/asm/mmu-8xx.h
+@@ -234,6 +234,10 @@ extern s32 patch__itlbmiss_linmem_top;
+ extern s32 patch__dtlbmiss_linmem_top, patch__dtlbmiss_immr_jmp;
+ extern s32 patch__fixupdar_linmem_top;
  
- #define _PAGE_EXEC		0x00001 /* execute permission */
- #define _PAGE_WRITE		0x00002 /* write access allowed */
-diff --git a/arch/powerpc/include/asm/machdep.h b/arch/powerpc/include/asm/machdep.h
-index ffe7c71e1132..84d99ed82d5d 100644
---- a/arch/powerpc/include/asm/machdep.h
-+++ b/arch/powerpc/include/asm/machdep.h
-@@ -33,11 +33,11 @@ struct pci_host_bridge;
++extern s32 patch__itlbmiss_exit_1, patch__itlbmiss_exit_2;
++extern s32 patch__dtlbmiss_exit_1, patch__dtlbmiss_exit_2, patch__dtlbmiss_exit_3;
++extern s32 patch__itlbmiss_perf, patch__dtlbmiss_perf;
++
+ #endif /* !__ASSEMBLY__ */
  
- struct machdep_calls {
- 	char		*name;
--#ifdef CONFIG_PPC64
- 	void __iomem *	(*ioremap)(phys_addr_t addr, unsigned long size,
- 				   unsigned long flags, void *caller);
- 	void		(*iounmap)(volatile void __iomem *token);
+ #if defined(CONFIG_PPC_4K_PAGES)
+diff --git a/arch/powerpc/kernel/head_8xx.S b/arch/powerpc/kernel/head_8xx.S
+index 0425571a533d..3b67b9533c82 100644
+--- a/arch/powerpc/kernel/head_8xx.S
++++ b/arch/powerpc/kernel/head_8xx.S
+@@ -374,16 +374,17 @@ InstructionTLBMiss:
+ 	mtspr	SPRN_MI_RPN, r10	/* Update TLB entry */
  
-+#ifdef CONFIG_PPC64
- #ifdef CONFIG_PM
- 	void		(*iommu_save)(void);
- 	void		(*iommu_restore)(void);
-diff --git a/arch/powerpc/mm/ioremap.c b/arch/powerpc/mm/ioremap.c
-index a498e3cade9e..a140feec2f8a 100644
---- a/arch/powerpc/mm/ioremap.c
-+++ b/arch/powerpc/mm/ioremap.c
-@@ -35,147 +35,6 @@ unsigned long ioremap_bot = IOREMAP_BASE;
+ 	/* Restore registers */
+-_ENTRY(itlb_miss_exit_1)
+-	mfspr	r10, SPRN_SPRG_SCRATCH0
++0:	mfspr	r10, SPRN_SPRG_SCRATCH0
+ 	mfspr	r11, SPRN_SPRG_SCRATCH1
+ #if defined(ITLB_MISS_KERNEL) || defined(CONFIG_HUGETLB_PAGE)
+ 	mfspr	r12, SPRN_SPRG_SCRATCH2
  #endif
- EXPORT_SYMBOL(ioremap_bot);	/* aka VMALLOC_END */
+ 	rfi
++	patch_site	0b, patch__itlbmiss_exit_1
++
+ #ifdef CONFIG_PERF_EVENTS
+-_ENTRY(itlb_miss_perf)
+-	lis	r10, (itlb_miss_counter - PAGE_OFFSET)@ha
++	patch_site	0f, patch__itlbmiss_perf
++0:	lis	r10, (itlb_miss_counter - PAGE_OFFSET)@ha
+ 	lwz	r11, (itlb_miss_counter - PAGE_OFFSET)@l(r10)
+ 	addi	r11, r11, 1
+ 	stw	r11, (itlb_miss_counter - PAGE_OFFSET)@l(r10)
+@@ -499,14 +500,16 @@ DataStoreTLBMiss:
  
--#ifdef CONFIG_PPC32
--
--void __iomem *
--ioremap(phys_addr_t addr, unsigned long size)
--{
--	return __ioremap_caller(addr, size, _PAGE_NO_CACHE | _PAGE_GUARDED,
--				__builtin_return_address(0));
--}
--EXPORT_SYMBOL(ioremap);
--
--void __iomem *
--ioremap_wc(phys_addr_t addr, unsigned long size)
--{
--	return __ioremap_caller(addr, size, _PAGE_NO_CACHE,
--				__builtin_return_address(0));
--}
--EXPORT_SYMBOL(ioremap_wc);
--
--void __iomem *
--ioremap_prot(phys_addr_t addr, unsigned long size, unsigned long flags)
--{
--	/* writeable implies dirty for kernel addresses */
--	if ((flags & (_PAGE_RW | _PAGE_RO)) != _PAGE_RO)
--		flags |= _PAGE_DIRTY | _PAGE_HWWRITE;
--
--	/* we don't want to let _PAGE_USER and _PAGE_EXEC leak out */
--	flags &= ~(_PAGE_USER | _PAGE_EXEC);
--	flags |= _PAGE_PRIVILEGED;
--
--	return __ioremap_caller(addr, size, flags, __builtin_return_address(0));
--}
--EXPORT_SYMBOL(ioremap_prot);
--
--void __iomem *
--__ioremap(phys_addr_t addr, unsigned long size, unsigned long flags)
--{
--	return __ioremap_caller(addr, size, flags, __builtin_return_address(0));
--}
--EXPORT_SYMBOL(__ioremap);
--
--void __iomem *
--__ioremap_caller(phys_addr_t addr, unsigned long size, unsigned long flags,
--		 void *caller)
--{
--	unsigned long v, i;
--	phys_addr_t p;
--	int err;
--
--	/* Make sure we have the base flags */
--	if ((flags & _PAGE_PRESENT) == 0)
--		flags |= pgprot_val(PAGE_KERNEL);
--
--	/* Non-cacheable page cannot be coherent */
--	if (flags & _PAGE_NO_CACHE)
--		flags &= ~_PAGE_COHERENT;
--
--	/*
--	 * Choose an address to map it to.
--	 * Once the vmalloc system is running, we use it.
--	 * Before then, we use space going up from IOREMAP_BASE
--	 * (ioremap_bot records where we're up to).
--	 */
--	p = addr & PAGE_MASK;
--	size = PAGE_ALIGN(addr + size) - p;
--
--	/*
--	 * If the address lies within the first 16 MB, assume it's in ISA
--	 * memory space
--	 */
--	if (p < 16*1024*1024)
--		p += _ISA_MEM_BASE;
--
--#ifndef CONFIG_CRASH_DUMP
--	/*
--	 * Don't allow anybody to remap normal RAM that we're using.
--	 * mem_init() sets high_memory so only do the check after that.
--	 */
--	if (slab_is_available() && (p < virt_to_phys(high_memory)) &&
--	    page_is_ram(__phys_to_pfn(p))) {
--		printk("__ioremap(): phys addr 0x%llx is RAM lr %ps\n",
--		       (unsigned long long)p, __builtin_return_address(0));
--		return NULL;
--	}
--#endif
--
--	if (size == 0)
--		return NULL;
--
--	/*
--	 * Is it already mapped?  Perhaps overlapped by a previous
--	 * mapping.
--	 */
--	v = p_block_mapped(p);
--	if (v)
--		goto out;
--
--	if (slab_is_available()) {
--		struct vm_struct *area;
--		area = get_vm_area_caller(size, VM_IOREMAP, caller);
--		if (area == 0)
--			return NULL;
--		area->phys_addr = p;
--		v = (unsigned long) area->addr;
--	} else {
--		v = ioremap_bot;
--		ioremap_bot += size;
--	}
--
--	/*
--	 * Should check if it is a candidate for a BAT mapping
--	 */
--
--	err = 0;
--	for (i = 0; i < size && err == 0; i += PAGE_SIZE)
--		err = map_kernel_page(v+i, p+i, flags);
--	if (err) {
--		if (slab_is_available())
--			vunmap((void *)v);
--		return NULL;
--	}
--
--out:
--	return (void __iomem *) (v + ((unsigned long)addr & ~PAGE_MASK));
--}
--
--void iounmap(volatile void __iomem *addr)
--{
--	/*
--	 * If mapped by BATs then there is nothing to do.
--	 * Calling vfree() generates a benign warning.
--	 */
--	if (v_block_mapped((unsigned long)addr))
--		return;
--
--	if ((unsigned long) addr >= ioremap_bot)
--		vunmap((void *) (PAGE_MASK & (unsigned long)addr));
--}
--EXPORT_SYMBOL(iounmap);
--
--#else
--
- /**
-  * __ioremap_at - Low level function to establish the page tables
-  *                for an IO mapping
-@@ -189,6 +48,10 @@ void __iomem * __ioremap_at(phys_addr_t pa, void *ea, unsigned long size,
- 	if ((flags & _PAGE_PRESENT) == 0)
- 		flags |= pgprot_val(PAGE_KERNEL);
+ 	/* Restore registers */
+ 	mtspr	SPRN_DAR, r11	/* Tag DAR */
+-_ENTRY(dtlb_miss_exit_1)
+-	mfspr	r10, SPRN_SPRG_SCRATCH0
++
++0:	mfspr	r10, SPRN_SPRG_SCRATCH0
+ 	mfspr	r11, SPRN_SPRG_SCRATCH1
+ 	mfspr	r12, SPRN_SPRG_SCRATCH2
+ 	rfi
++	patch_site	0b, patch__dtlbmiss_exit_1
++
+ #ifdef CONFIG_PERF_EVENTS
+-_ENTRY(dtlb_miss_perf)
+-	lis	r10, (dtlb_miss_counter - PAGE_OFFSET)@ha
++	patch_site	0f, patch__dtlbmiss_perf
++0:	lis	r10, (dtlb_miss_counter - PAGE_OFFSET)@ha
+ 	lwz	r11, (dtlb_miss_counter - PAGE_OFFSET)@l(r10)
+ 	addi	r11, r11, 1
+ 	stw	r11, (dtlb_miss_counter - PAGE_OFFSET)@l(r10)
+@@ -658,11 +661,12 @@ DTLBMissIMMR:
  
-+	/* Non-cacheable page cannot be coherent */
-+	if (flags & _PAGE_NO_CACHE)
-+		flags &= ~_PAGE_COHERENT;
+ 	li	r11, RPN_PATTERN
+ 	mtspr	SPRN_DAR, r11	/* Tag DAR */
+-_ENTRY(dtlb_miss_exit_2)
+-	mfspr	r10, SPRN_SPRG_SCRATCH0
 +
- 	/* We don't support the 4K PFN hack with ioremap */
- 	if (flags & H_PAGE_4K_PFN)
- 		return NULL;
-@@ -241,6 +104,33 @@ void __iomem * __ioremap_caller(phys_addr_t addr, unsigned long size,
- 	if ((size == 0) || (paligned == 0))
- 		return NULL;
++0:	mfspr	r10, SPRN_SPRG_SCRATCH0
+ 	mfspr	r11, SPRN_SPRG_SCRATCH1
+ 	mfspr	r12, SPRN_SPRG_SCRATCH2
+ 	rfi
++	patch_site	0b, patch__dtlbmiss_exit_2
  
-+	/*
-+	 * If the address lies within the first 16 MB, assume it's in ISA
-+	 * memory space
-+	 */
-+	if (IS_ENABLED(CONFIG_PPC32) && paligned < 16*1024*1024)
-+		paligned += _ISA_MEM_BASE;
+ DTLBMissLinear:
+ 	mtcr	r12
+@@ -676,11 +680,12 @@ DTLBMissLinear:
+ 
+ 	li	r11, RPN_PATTERN
+ 	mtspr	SPRN_DAR, r11	/* Tag DAR */
+-_ENTRY(dtlb_miss_exit_3)
+-	mfspr	r10, SPRN_SPRG_SCRATCH0
 +
-+	/*
-+	 * Don't allow anybody to remap normal RAM that we're using.
-+	 * mem_init() sets high_memory so only do the check after that.
-+	 */
-+	if (!IS_ENABLED(CONFIG_CRASH_DUMP) &&
-+	    slab_is_available() && (paligned < virt_to_phys(high_memory)) &&
-+	    page_is_ram(__phys_to_pfn(paligned))) {
-+		printk("__ioremap(): phys addr 0x%llx is RAM lr %ps\n",
-+		       (u64)paligned, __builtin_return_address(0));
-+		return NULL;
-+	}
-+
-+	/*
-+	 * Is it already mapped?  Perhaps overlapped by a previous
-+	 * mapping.
-+	 */
-+	ret = (void __iomem *)p_block_mapped(paligned);
-+	if (ret)
-+		goto out;
-+
- 	if (slab_is_available()) {
- 		struct vm_struct *area;
++0:	mfspr	r10, SPRN_SPRG_SCRATCH0
+ 	mfspr	r11, SPRN_SPRG_SCRATCH1
+ 	mfspr	r12, SPRN_SPRG_SCRATCH2
+ 	rfi
++	patch_site	0b, patch__dtlbmiss_exit_3
  
-@@ -259,9 +149,9 @@ void __iomem * __ioremap_caller(phys_addr_t addr, unsigned long size,
- 		if (ret)
- 			ioremap_bot += size;
+ #ifndef CONFIG_PIN_TLB_TEXT
+ ITLBMissLinear:
+@@ -693,11 +698,11 @@ ITLBMissLinear:
+ 			  _PAGE_PRESENT
+ 	mtspr	SPRN_MI_RPN, r10	/* Update TLB entry */
+ 
+-_ENTRY(itlb_miss_exit_2)
+-	mfspr	r10, SPRN_SPRG_SCRATCH0
++0:	mfspr	r10, SPRN_SPRG_SCRATCH0
+ 	mfspr	r11, SPRN_SPRG_SCRATCH1
+ 	mfspr	r12, SPRN_SPRG_SCRATCH2
+ 	rfi
++	patch_site	0b, patch__itlbmiss_exit_2
+ #endif
+ 
+ /* This is the procedure to calculate the data EA for buggy dcbx,dcbi instructions
+diff --git a/arch/powerpc/perf/8xx-pmu.c b/arch/powerpc/perf/8xx-pmu.c
+index 6c0020d1c561..808f1873de61 100644
+--- a/arch/powerpc/perf/8xx-pmu.c
++++ b/arch/powerpc/perf/8xx-pmu.c
+@@ -31,9 +31,6 @@
+ 
+ extern unsigned long itlb_miss_counter, dtlb_miss_counter;
+ extern atomic_t instruction_counter;
+-extern unsigned int itlb_miss_perf, dtlb_miss_perf;
+-extern unsigned int itlb_miss_exit_1, itlb_miss_exit_2;
+-extern unsigned int dtlb_miss_exit_1, dtlb_miss_exit_2, dtlb_miss_exit_3;
+ 
+ static atomic_t insn_ctr_ref;
+ static atomic_t itlb_miss_ref;
+@@ -103,22 +100,22 @@ static int mpc8xx_pmu_add(struct perf_event *event, int flags)
+ 		break;
+ 	case PERF_8xx_ID_ITLB_LOAD_MISS:
+ 		if (atomic_inc_return(&itlb_miss_ref) == 1) {
+-			unsigned long target = (unsigned long)&itlb_miss_perf;
++			unsigned long target = site_addr(&patch__itlbmiss_perf);
+ 
+-			patch_branch(&itlb_miss_exit_1, target, 0);
++			patch_branch_site(&patch__itlbmiss_exit_1, target, 0);
+ #ifndef CONFIG_PIN_TLB_TEXT
+-			patch_branch(&itlb_miss_exit_2, target, 0);
++			patch_branch_site(&patch__itlbmiss_exit_2, target, 0);
+ #endif
+ 		}
+ 		val = itlb_miss_counter;
+ 		break;
+ 	case PERF_8xx_ID_DTLB_LOAD_MISS:
+ 		if (atomic_inc_return(&dtlb_miss_ref) == 1) {
+-			unsigned long target = (unsigned long)&dtlb_miss_perf;
++			unsigned long target = site_addr(&patch__dtlbmiss_perf);
+ 
+-			patch_branch(&dtlb_miss_exit_1, target, 0);
+-			patch_branch(&dtlb_miss_exit_2, target, 0);
+-			patch_branch(&dtlb_miss_exit_3, target, 0);
++			patch_branch_site(&patch__dtlbmiss_exit_1, target, 0);
++			patch_branch_site(&patch__dtlbmiss_exit_2, target, 0);
++			patch_branch_site(&patch__dtlbmiss_exit_3, target, 0);
+ 		}
+ 		val = dtlb_miss_counter;
+ 		break;
+@@ -180,17 +177,17 @@ static void mpc8xx_pmu_del(struct perf_event *event, int flags)
+ 		break;
+ 	case PERF_8xx_ID_ITLB_LOAD_MISS:
+ 		if (atomic_dec_return(&itlb_miss_ref) == 0) {
+-			patch_instruction(&itlb_miss_exit_1, insn);
++			patch_instruction_site(&patch__itlbmiss_exit_1, insn);
+ #ifndef CONFIG_PIN_TLB_TEXT
+-			patch_instruction(&itlb_miss_exit_2, insn);
++			patch_instruction_site(&patch__itlbmiss_exit_2, insn);
+ #endif
+ 		}
+ 		break;
+ 	case PERF_8xx_ID_DTLB_LOAD_MISS:
+ 		if (atomic_dec_return(&dtlb_miss_ref) == 0) {
+-			patch_instruction(&dtlb_miss_exit_1, insn);
+-			patch_instruction(&dtlb_miss_exit_2, insn);
+-			patch_instruction(&dtlb_miss_exit_3, insn);
++			patch_instruction_site(&patch__dtlbmiss_exit_1, insn);
++			patch_instruction_site(&patch__dtlbmiss_exit_2, insn);
++			patch_instruction_site(&patch__dtlbmiss_exit_3, insn);
+ 		}
+ 		break;
  	}
--
-+out:
- 	if (ret)
--		ret += addr & ~PAGE_MASK;
-+		ret += (unsigned long)addr & ~PAGE_MASK;
- 	return ret;
- }
- 
-@@ -300,8 +190,8 @@ void __iomem * ioremap_prot(phys_addr_t addr, unsigned long size,
- 	void *caller = __builtin_return_address(0);
- 
- 	/* writeable implies dirty for kernel addresses */
--	if (flags & _PAGE_WRITE)
--		flags |= _PAGE_DIRTY;
-+	if ((flags & (_PAGE_WRITE | _PAGE_RO)) != _PAGE_RO)
-+		flags |= _PAGE_DIRTY | _PAGE_HWWRITE;
- 
- 	/* we don't want to let _PAGE_EXEC leak out */
- 	flags &= ~_PAGE_EXEC;
-@@ -330,6 +220,14 @@ void __iounmap(volatile void __iomem *token)
- 
- 	addr = (void *) ((unsigned long __force)
- 			 PCI_FIX_ADDR(token) & PAGE_MASK);
-+
-+	/*
-+	 * If mapped by BATs then there is nothing to do.
-+	 * Calling vfree() generates a benign warning.
-+	 */
-+	if (v_block_mapped((unsigned long)addr))
-+		return;
-+
- 	if ((unsigned long)addr < ioremap_bot) {
- 		printk(KERN_WARNING "Attempt to iounmap early bolted mapping"
- 		       " at 0x%p\n", addr);
-@@ -347,5 +245,3 @@ void iounmap(volatile void __iomem *token)
- 		__iounmap(token);
- }
- EXPORT_SYMBOL(iounmap);
--
--#endif
 -- 
 2.13.3
Keyboard shortcuts
hback out one level
jnext message in thread
kprevious message in thread
ldrill in
Escclose help / fold thread tree
?toggle this help