diff options
Diffstat (limited to 'arch/sparc/kernel')
28 files changed, 649 insertions, 239 deletions
| diff --git a/arch/sparc/kernel/Makefile b/arch/sparc/kernel/Makefile index fdb13327fded..fa3c02d41138 100644 --- a/arch/sparc/kernel/Makefile +++ b/arch/sparc/kernel/Makefile @@ -86,7 +86,7 @@ obj-y                     += auxio_$(BITS).o  obj-$(CONFIG_SUN_PM)      += apc.o pmc.o  obj-$(CONFIG_MODULES)     += module.o -obj-$(CONFIG_MODULES)     += sparc_ksyms_$(BITS).o +obj-$(CONFIG_MODULES)     += sparc_ksyms.o  obj-$(CONFIG_SPARC_LED)   += led.o  obj-$(CONFIG_KGDB)        += kgdb_$(BITS).o diff --git a/arch/sparc/kernel/entry.S b/arch/sparc/kernel/entry.S index 07918ab3062e..d85bdb999819 100644 --- a/arch/sparc/kernel/entry.S +++ b/arch/sparc/kernel/entry.S @@ -29,6 +29,7 @@  #include <asm/unistd.h>  #include <asm/asmmacro.h> +#include <asm/export.h>  #define curptr      g6 @@ -1207,6 +1208,8 @@ delay_continue:  	ret  	restore +EXPORT_SYMBOL(__udelay) +EXPORT_SYMBOL(__ndelay)  	/* Handle a software breakpoint */  	/* We have to inform parent that child has stopped */ diff --git a/arch/sparc/kernel/ftrace.c b/arch/sparc/kernel/ftrace.c index 0a2d2ddff543..6bcff698069b 100644 --- a/arch/sparc/kernel/ftrace.c +++ b/arch/sparc/kernel/ftrace.c @@ -131,7 +131,7 @@ unsigned long prepare_ftrace_return(unsigned long parent,  		return parent + 8UL;  	if (ftrace_push_return_trace(parent, self_addr, &trace.depth, -				     frame_pointer) == -EBUSY) +				     frame_pointer, NULL) == -EBUSY)  		return parent + 8UL;  	trace.func = self_addr; diff --git a/arch/sparc/kernel/head_32.S b/arch/sparc/kernel/head_32.S index 3d92c0a8f6c4..7bb317b87dde 100644 --- a/arch/sparc/kernel/head_32.S +++ b/arch/sparc/kernel/head_32.S @@ -24,6 +24,7 @@  #include <asm/thread_info.h>	/* TI_UWINMASK */  #include <asm/errno.h>  #include <asm/pgtsrmmu.h>	/* SRMMU_PGDIR_SHIFT */ +#include <asm/export.h>  	.data  /* The following are used with the prom_vector node-ops to figure out @@ -60,6 +61,7 @@ sun4e_notsup:   */  	.globl empty_zero_page  empty_zero_page:	.skip PAGE_SIZE +EXPORT_SYMBOL(empty_zero_page)  	.global root_flags  	.global ram_flags @@ -813,3 +815,4 @@ lvl14_save:  __ret_efault:          ret           restore %g0, -EFAULT, %o0 +EXPORT_SYMBOL(__ret_efault) diff --git a/arch/sparc/kernel/head_64.S b/arch/sparc/kernel/head_64.S index a076b4249e62..6aa3da152c20 100644 --- a/arch/sparc/kernel/head_64.S +++ b/arch/sparc/kernel/head_64.S @@ -32,7 +32,8 @@  #include <asm/estate.h>  #include <asm/sfafsr.h>  #include <asm/unistd.h> -	 +#include <asm/export.h> +  /* This section from from _start to sparc64_boot_end should fit into   * 0x0000000000404000 to 0x0000000000408000.   */ @@ -143,6 +144,7 @@ prom_cpu_compatible:  	.skip	64  prom_root_node:  	.word	0 +EXPORT_SYMBOL(prom_root_node)  prom_mmu_ihandle_cache:  	.word	0  prom_boot_mapped_pc: @@ -158,6 +160,7 @@ is_sun4v:  	.word	0  sun4v_chip_type:  	.word	SUN4V_CHIP_INVALID +EXPORT_SYMBOL(sun4v_chip_type)  1:  	rd	%pc, %l0 @@ -920,49 +923,14 @@ swapper_4m_tsb:  	.globl	prom_tba, tlb_type  prom_tba:	.xword	0  tlb_type:	.word	0	/* Must NOT end up in BSS */ +EXPORT_SYMBOL(tlb_type)  	.section	".fixup",#alloc,#execinstr -	.globl	__ret_efault, __retl_efault, __ret_one, __retl_one -ENTRY(__ret_efault) -	ret -	 restore %g0, -EFAULT, %o0 -ENDPROC(__ret_efault) -  ENTRY(__retl_efault)  	retl  	 mov	-EFAULT, %o0  ENDPROC(__retl_efault) -ENTRY(__retl_one) -	retl -	 mov	1, %o0 -ENDPROC(__retl_one) - -ENTRY(__retl_one_fp) -	VISExitHalf -	retl -	 mov	1, %o0 -ENDPROC(__retl_one_fp) - -ENTRY(__ret_one_asi) -	wr	%g0, ASI_AIUS, %asi -	ret -	 restore %g0, 1, %o0 -ENDPROC(__ret_one_asi) - -ENTRY(__retl_one_asi) -	wr	%g0, ASI_AIUS, %asi -	retl -	 mov	1, %o0 -ENDPROC(__retl_one_asi) - -ENTRY(__retl_one_asi_fp) -	wr	%g0, ASI_AIUS, %asi -	VISExitHalf -	retl -	 mov	1, %o0 -ENDPROC(__retl_one_asi_fp) -  ENTRY(__retl_o1)  	retl  	 mov	%o1, %o0 diff --git a/arch/sparc/kernel/helpers.S b/arch/sparc/kernel/helpers.S index 314dd0c9fc5b..e4e5b832fcb6 100644 --- a/arch/sparc/kernel/helpers.S +++ b/arch/sparc/kernel/helpers.S @@ -15,6 +15,7 @@ __flushw_user:  2:	retl  	 nop  	.size	__flushw_user,.-__flushw_user +EXPORT_SYMBOL(__flushw_user)  	/* Flush %fp and %i7 to the stack for all register  	 * windows active inside of the cpu.  This allows @@ -61,3 +62,4 @@ real_hard_smp_processor_id:  	.size		hard_smp_processor_id,.-hard_smp_processor_id  #endif  	.size		real_hard_smp_processor_id,.-real_hard_smp_processor_id +EXPORT_SYMBOL_GPL(real_hard_smp_processor_id) diff --git a/arch/sparc/kernel/hvapi.c b/arch/sparc/kernel/hvapi.c index 662500fa555f..267731234ce8 100644 --- a/arch/sparc/kernel/hvapi.c +++ b/arch/sparc/kernel/hvapi.c @@ -39,6 +39,7 @@ static struct api_info api_table[] = {  	{ .group = HV_GRP_SDIO,					},  	{ .group = HV_GRP_SDIO_ERR,				},  	{ .group = HV_GRP_REBOOT_DATA,				}, +	{ .group = HV_GRP_ATU,		.flags = FLAG_PRE_API	},  	{ .group = HV_GRP_NIAG_PERF,	.flags = FLAG_PRE_API	},  	{ .group = HV_GRP_FIRE_PERF,				},  	{ .group = HV_GRP_N2_CPU,				}, diff --git a/arch/sparc/kernel/hvcalls.S b/arch/sparc/kernel/hvcalls.S index d127130bf424..4116ee5c7791 100644 --- a/arch/sparc/kernel/hvcalls.S +++ b/arch/sparc/kernel/hvcalls.S @@ -343,6 +343,7 @@ ENTRY(sun4v_mach_set_watchdog)  0:	retl  	 nop  ENDPROC(sun4v_mach_set_watchdog) +EXPORT_SYMBOL(sun4v_mach_set_watchdog)  	/* No inputs and does not return.  */  ENTRY(sun4v_mach_sir) @@ -776,6 +777,7 @@ ENTRY(sun4v_niagara_getperf)  	retl  	 nop  ENDPROC(sun4v_niagara_getperf) +EXPORT_SYMBOL(sun4v_niagara_getperf)  ENTRY(sun4v_niagara_setperf)  	mov	HV_FAST_SET_PERFREG, %o5 @@ -783,6 +785,7 @@ ENTRY(sun4v_niagara_setperf)  	retl  	 nop  ENDPROC(sun4v_niagara_setperf) +EXPORT_SYMBOL(sun4v_niagara_setperf)  ENTRY(sun4v_niagara2_getperf)  	mov	%o0, %o4 @@ -792,6 +795,7 @@ ENTRY(sun4v_niagara2_getperf)  	retl  	 nop  ENDPROC(sun4v_niagara2_getperf) +EXPORT_SYMBOL(sun4v_niagara2_getperf)  ENTRY(sun4v_niagara2_setperf)  	mov	HV_FAST_N2_SET_PERFREG, %o5 @@ -799,6 +803,7 @@ ENTRY(sun4v_niagara2_setperf)  	retl  	 nop  ENDPROC(sun4v_niagara2_setperf) +EXPORT_SYMBOL(sun4v_niagara2_setperf)  ENTRY(sun4v_reboot_data_set)  	mov	HV_FAST_REBOOT_DATA_SET, %o5 diff --git a/arch/sparc/kernel/iommu.c b/arch/sparc/kernel/iommu.c index 5c615abff030..852a3291db96 100644 --- a/arch/sparc/kernel/iommu.c +++ b/arch/sparc/kernel/iommu.c @@ -760,8 +760,12 @@ int dma_supported(struct device *dev, u64 device_mask)  	struct iommu *iommu = dev->archdata.iommu;  	u64 dma_addr_mask = iommu->dma_addr_mask; -	if (device_mask >= (1UL << 32UL)) -		return 0; +	if (device_mask > DMA_BIT_MASK(32)) { +		if (iommu->atu) +			dma_addr_mask = iommu->atu->dma_addr_mask; +		else +			return 0; +	}  	if ((device_mask & dma_addr_mask) == dma_addr_mask)  		return 1; diff --git a/arch/sparc/kernel/iommu_common.h b/arch/sparc/kernel/iommu_common.h index b40cec252905..828493329f68 100644 --- a/arch/sparc/kernel/iommu_common.h +++ b/arch/sparc/kernel/iommu_common.h @@ -13,7 +13,6 @@  #include <linux/scatterlist.h>  #include <linux/device.h>  #include <linux/iommu-helper.h> -#include <linux/scatterlist.h>  #include <asm/iommu.h> diff --git a/arch/sparc/kernel/jump_label.c b/arch/sparc/kernel/jump_label.c index 59bbeff55024..07933b9e9ce0 100644 --- a/arch/sparc/kernel/jump_label.c +++ b/arch/sparc/kernel/jump_label.c @@ -13,19 +13,30 @@  void arch_jump_label_transform(struct jump_entry *entry,  			       enum jump_label_type type)  { -	u32 val;  	u32 *insn = (u32 *) (unsigned long) entry->code; +	u32 val;  	if (type == JUMP_LABEL_JMP) {  		s32 off = (s32)entry->target - (s32)entry->code; +		bool use_v9_branch = false; + +		BUG_ON(off & 3);  #ifdef CONFIG_SPARC64 -		/* ba,pt %xcc, . + (off << 2) */ -		val = 0x10680000 | ((u32) off >> 2); -#else -		/* ba . + (off << 2) */ -		val = 0x10800000 | ((u32) off >> 2); +		if (off <= 0xfffff && off >= -0x100000) +			use_v9_branch = true;  #endif +		if (use_v9_branch) { +			/* WDISP19 - target is . + immed << 2 */ +			/* ba,pt %xcc, . + off */ +			val = 0x10680000 | (((u32) off >> 2) & 0x7ffff); +		} else { +			/* WDISP22 - target is . + immed << 2 */ +			BUG_ON(off > 0x7fffff); +			BUG_ON(off < -0x800000); +			/* ba . + off */ +			val = 0x10800000 | (((u32) off >> 2) & 0x3fffff); +		}  	} else {  		val = 0x01000000;  	} diff --git a/arch/sparc/kernel/kprobes.c b/arch/sparc/kernel/kprobes.c index cd83be527586..b0377db12d83 100644 --- a/arch/sparc/kernel/kprobes.c +++ b/arch/sparc/kernel/kprobes.c @@ -5,7 +5,7 @@  #include <linux/kernel.h>  #include <linux/kprobes.h> -#include <linux/module.h> +#include <linux/extable.h>  #include <linux/kdebug.h>  #include <linux/slab.h>  #include <linux/context_tracking.h> diff --git a/arch/sparc/kernel/mdesc.c b/arch/sparc/kernel/mdesc.c index 11228861d9b4..8a6982dfd733 100644 --- a/arch/sparc/kernel/mdesc.c +++ b/arch/sparc/kernel/mdesc.c @@ -645,13 +645,20 @@ static void __mark_core_id(struct mdesc_handle *hp, u64 node,  		cpu_data(*id).core_id = core_id;  } -static void __mark_sock_id(struct mdesc_handle *hp, u64 node, -			   int sock_id) +static void __mark_max_cache_id(struct mdesc_handle *hp, u64 node, +				int max_cache_id)  {  	const u64 *id = mdesc_get_property(hp, node, "id", NULL); -	if (*id < num_possible_cpus()) -		cpu_data(*id).sock_id = sock_id; +	if (*id < num_possible_cpus()) { +		cpu_data(*id).max_cache_id = max_cache_id; + +		/** +		 * On systems without explicit socket descriptions socket +		 * is max_cache_id +		 */ +		cpu_data(*id).sock_id = max_cache_id; +	}  }  static void mark_core_ids(struct mdesc_handle *hp, u64 mp, @@ -660,10 +667,11 @@ static void mark_core_ids(struct mdesc_handle *hp, u64 mp,  	find_back_node_value(hp, mp, "cpu", __mark_core_id, core_id, 10);  } -static void mark_sock_ids(struct mdesc_handle *hp, u64 mp, -			  int sock_id) +static void mark_max_cache_ids(struct mdesc_handle *hp, u64 mp, +			       int max_cache_id)  { -	find_back_node_value(hp, mp, "cpu", __mark_sock_id, sock_id, 10); +	find_back_node_value(hp, mp, "cpu", __mark_max_cache_id, +			     max_cache_id, 10);  }  static void set_core_ids(struct mdesc_handle *hp) @@ -694,14 +702,15 @@ static void set_core_ids(struct mdesc_handle *hp)  	}  } -static int set_sock_ids_by_cache(struct mdesc_handle *hp, int level) +static int set_max_cache_ids_by_cache(struct mdesc_handle *hp, int level)  {  	u64 mp;  	int idx = 1;  	int fnd = 0; -	/* Identify unique sockets by looking for cpus backpointed to by -	 * shared level n caches. +	/** +	 * Identify unique highest level of shared cache by looking for cpus +	 * backpointed to by shared level N caches.  	 */  	mdesc_for_each_node_by_name(hp, mp, "cache") {  		const u64 *cur_lvl; @@ -709,8 +718,7 @@ static int set_sock_ids_by_cache(struct mdesc_handle *hp, int level)  		cur_lvl = mdesc_get_property(hp, mp, "level", NULL);  		if (*cur_lvl != level)  			continue; - -		mark_sock_ids(hp, mp, idx); +		mark_max_cache_ids(hp, mp, idx);  		idx++;  		fnd = 1;  	} @@ -745,15 +753,17 @@ static void set_sock_ids(struct mdesc_handle *hp)  {  	u64 mp; -	/* If machine description exposes sockets data use it. -	 * Otherwise fallback to use shared L3 or L2 caches. +	/** +	 * Find the highest level of shared cache which pre-T7 is also +	 * the socket.  	 */ +	if (!set_max_cache_ids_by_cache(hp, 3)) +		set_max_cache_ids_by_cache(hp, 2); + +	/* If machine description exposes sockets data use it.*/  	mp = mdesc_node_by_name(hp, MDESC_NODE_NULL, "sockets");  	if (mp != MDESC_NODE_NULL) -		return set_sock_ids_by_socket(hp, mp); - -	if (!set_sock_ids_by_cache(hp, 3)) -		set_sock_ids_by_cache(hp, 2); +		set_sock_ids_by_socket(hp, mp);  }  static void mark_proc_ids(struct mdesc_handle *hp, u64 mp, int proc_id) diff --git a/arch/sparc/kernel/pci_sun4v.c b/arch/sparc/kernel/pci_sun4v.c index 61c6f935accc..06981cc716b6 100644 --- a/arch/sparc/kernel/pci_sun4v.c +++ b/arch/sparc/kernel/pci_sun4v.c @@ -30,8 +30,22 @@  #define DRIVER_NAME	"pci_sun4v"  #define PFX		DRIVER_NAME ": " -static unsigned long vpci_major = 1; -static unsigned long vpci_minor = 1; +static unsigned long vpci_major; +static unsigned long vpci_minor; + +struct vpci_version { +	unsigned long major; +	unsigned long minor; +}; + +/* Ordered from largest major to lowest */ +static struct vpci_version vpci_versions[] = { +	{ .major = 2, .minor = 0 }, +	{ .major = 1, .minor = 1 }, +}; + +static unsigned long vatu_major = 1; +static unsigned long vatu_minor = 1;  #define PGLIST_NENTS	(PAGE_SIZE / sizeof(u64)) @@ -58,30 +72,57 @@ static inline void iommu_batch_start(struct device *dev, unsigned long prot, uns  }  /* Interrupts must be disabled.  */ -static long iommu_batch_flush(struct iommu_batch *p) +static long iommu_batch_flush(struct iommu_batch *p, u64 mask)  {  	struct pci_pbm_info *pbm = p->dev->archdata.host_controller; +	u64 *pglist = p->pglist; +	u64 index_count;  	unsigned long devhandle = pbm->devhandle;  	unsigned long prot = p->prot;  	unsigned long entry = p->entry; -	u64 *pglist = p->pglist;  	unsigned long npages = p->npages; +	unsigned long iotsb_num; +	unsigned long ret; +	long num; + +	/* VPCI maj=1, min=[0,1] only supports read and write */ +	if (vpci_major < 2) +		prot &= (HV_PCI_MAP_ATTR_READ | HV_PCI_MAP_ATTR_WRITE);  	while (npages != 0) { -		long num; - -		num = pci_sun4v_iommu_map(devhandle, HV_PCI_TSBID(0, entry), -					  npages, prot, __pa(pglist)); -		if (unlikely(num < 0)) { -			if (printk_ratelimit()) -				printk("iommu_batch_flush: IOMMU map of " -				       "[%08lx:%08llx:%lx:%lx:%lx] failed with " -				       "status %ld\n", -				       devhandle, HV_PCI_TSBID(0, entry), -				       npages, prot, __pa(pglist), num); -			return -1; +		if (mask <= DMA_BIT_MASK(32)) { +			num = pci_sun4v_iommu_map(devhandle, +						  HV_PCI_TSBID(0, entry), +						  npages, +						  prot, +						  __pa(pglist)); +			if (unlikely(num < 0)) { +				pr_err_ratelimited("%s: IOMMU map of [%08lx:%08llx:%lx:%lx:%lx] failed with status %ld\n", +						   __func__, +						   devhandle, +						   HV_PCI_TSBID(0, entry), +						   npages, prot, __pa(pglist), +						   num); +				return -1; +			} +		} else { +			index_count = HV_PCI_IOTSB_INDEX_COUNT(npages, entry), +			iotsb_num = pbm->iommu->atu->iotsb->iotsb_num; +			ret = pci_sun4v_iotsb_map(devhandle, +						  iotsb_num, +						  index_count, +						  prot, +						  __pa(pglist), +						  &num); +			if (unlikely(ret != HV_EOK)) { +				pr_err_ratelimited("%s: ATU map of [%08lx:%lx:%llx:%lx:%lx] failed with status %ld\n", +						   __func__, +						   devhandle, iotsb_num, +						   index_count, prot, +						   __pa(pglist), ret); +				return -1; +			}  		} -  		entry += num;  		npages -= num;  		pglist += num; @@ -93,19 +134,19 @@ static long iommu_batch_flush(struct iommu_batch *p)  	return 0;  } -static inline void iommu_batch_new_entry(unsigned long entry) +static inline void iommu_batch_new_entry(unsigned long entry, u64 mask)  {  	struct iommu_batch *p = this_cpu_ptr(&iommu_batch);  	if (p->entry + p->npages == entry)  		return;  	if (p->entry != ~0UL) -		iommu_batch_flush(p); +		iommu_batch_flush(p, mask);  	p->entry = entry;  }  /* Interrupts must be disabled.  */ -static inline long iommu_batch_add(u64 phys_page) +static inline long iommu_batch_add(u64 phys_page, u64 mask)  {  	struct iommu_batch *p = this_cpu_ptr(&iommu_batch); @@ -113,27 +154,31 @@ static inline long iommu_batch_add(u64 phys_page)  	p->pglist[p->npages++] = phys_page;  	if (p->npages == PGLIST_NENTS) -		return iommu_batch_flush(p); +		return iommu_batch_flush(p, mask);  	return 0;  }  /* Interrupts must be disabled.  */ -static inline long iommu_batch_end(void) +static inline long iommu_batch_end(u64 mask)  {  	struct iommu_batch *p = this_cpu_ptr(&iommu_batch);  	BUG_ON(p->npages >= PGLIST_NENTS); -	return iommu_batch_flush(p); +	return iommu_batch_flush(p, mask);  }  static void *dma_4v_alloc_coherent(struct device *dev, size_t size,  				   dma_addr_t *dma_addrp, gfp_t gfp,  				   unsigned long attrs)  { +	u64 mask;  	unsigned long flags, order, first_page, npages, n; +	unsigned long prot = 0;  	struct iommu *iommu; +	struct atu *atu; +	struct iommu_map_table *tbl;  	struct page *page;  	void *ret;  	long entry; @@ -146,6 +191,9 @@ static void *dma_4v_alloc_coherent(struct device *dev, size_t size,  	npages = size >> IO_PAGE_SHIFT; +	if (attrs & DMA_ATTR_WEAK_ORDERING) +		prot = HV_PCI_MAP_ATTR_RELAXED_ORDER; +  	nid = dev->archdata.numa_node;  	page = alloc_pages_node(nid, gfp, order);  	if (unlikely(!page)) @@ -155,31 +203,38 @@ static void *dma_4v_alloc_coherent(struct device *dev, size_t size,  	memset((char *)first_page, 0, PAGE_SIZE << order);  	iommu = dev->archdata.iommu; +	atu = iommu->atu; + +	mask = dev->coherent_dma_mask; +	if (mask <= DMA_BIT_MASK(32)) +		tbl = &iommu->tbl; +	else +		tbl = &atu->tbl; -	entry = iommu_tbl_range_alloc(dev, &iommu->tbl, npages, NULL, +	entry = iommu_tbl_range_alloc(dev, tbl, npages, NULL,  				      (unsigned long)(-1), 0);  	if (unlikely(entry == IOMMU_ERROR_CODE))  		goto range_alloc_fail; -	*dma_addrp = (iommu->tbl.table_map_base + (entry << IO_PAGE_SHIFT)); +	*dma_addrp = (tbl->table_map_base + (entry << IO_PAGE_SHIFT));  	ret = (void *) first_page;  	first_page = __pa(first_page);  	local_irq_save(flags);  	iommu_batch_start(dev, -			  (HV_PCI_MAP_ATTR_READ | +			  (HV_PCI_MAP_ATTR_READ | prot |  			   HV_PCI_MAP_ATTR_WRITE),  			  entry);  	for (n = 0; n < npages; n++) { -		long err = iommu_batch_add(first_page + (n * PAGE_SIZE)); +		long err = iommu_batch_add(first_page + (n * PAGE_SIZE), mask);  		if (unlikely(err < 0L))  			goto iommu_map_fail;  	} -	if (unlikely(iommu_batch_end() < 0L)) +	if (unlikely(iommu_batch_end(mask) < 0L))  		goto iommu_map_fail;  	local_irq_restore(flags); @@ -187,25 +242,71 @@ static void *dma_4v_alloc_coherent(struct device *dev, size_t size,  	return ret;  iommu_map_fail: -	iommu_tbl_range_free(&iommu->tbl, *dma_addrp, npages, IOMMU_ERROR_CODE); +	iommu_tbl_range_free(tbl, *dma_addrp, npages, IOMMU_ERROR_CODE);  range_alloc_fail:  	free_pages(first_page, order);  	return NULL;  } -static void dma_4v_iommu_demap(void *demap_arg, unsigned long entry, -			       unsigned long npages) +unsigned long dma_4v_iotsb_bind(unsigned long devhandle, +				unsigned long iotsb_num, +				struct pci_bus *bus_dev) +{ +	struct pci_dev *pdev; +	unsigned long err; +	unsigned int bus; +	unsigned int device; +	unsigned int fun; + +	list_for_each_entry(pdev, &bus_dev->devices, bus_list) { +		if (pdev->subordinate) { +			/* No need to bind pci bridge */ +			dma_4v_iotsb_bind(devhandle, iotsb_num, +					  pdev->subordinate); +		} else { +			bus = bus_dev->number; +			device = PCI_SLOT(pdev->devfn); +			fun = PCI_FUNC(pdev->devfn); +			err = pci_sun4v_iotsb_bind(devhandle, iotsb_num, +						   HV_PCI_DEVICE_BUILD(bus, +								       device, +								       fun)); + +			/* If bind fails for one device it is going to fail +			 * for rest of the devices because we are sharing +			 * IOTSB. So in case of failure simply return with +			 * error. +			 */ +			if (err) +				return err; +		} +	} + +	return 0; +} + +static void dma_4v_iommu_demap(struct device *dev, unsigned long devhandle, +			       dma_addr_t dvma, unsigned long iotsb_num, +			       unsigned long entry, unsigned long npages)  { -	u32 devhandle = *(u32 *)demap_arg;  	unsigned long num, flags; +	unsigned long ret;  	local_irq_save(flags);  	do { -		num = pci_sun4v_iommu_demap(devhandle, -					    HV_PCI_TSBID(0, entry), -					    npages); - +		if (dvma <= DMA_BIT_MASK(32)) { +			num = pci_sun4v_iommu_demap(devhandle, +						    HV_PCI_TSBID(0, entry), +						    npages); +		} else { +			ret = pci_sun4v_iotsb_demap(devhandle, iotsb_num, +						    entry, npages, &num); +			if (unlikely(ret != HV_EOK)) { +				pr_err_ratelimited("pci_iotsb_demap() failed with error: %ld\n", +						   ret); +			} +		}  		entry += num;  		npages -= num;  	} while (npages != 0); @@ -217,16 +318,28 @@ static void dma_4v_free_coherent(struct device *dev, size_t size, void *cpu,  {  	struct pci_pbm_info *pbm;  	struct iommu *iommu; +	struct atu *atu; +	struct iommu_map_table *tbl;  	unsigned long order, npages, entry; +	unsigned long iotsb_num;  	u32 devhandle;  	npages = IO_PAGE_ALIGN(size) >> IO_PAGE_SHIFT;  	iommu = dev->archdata.iommu;  	pbm = dev->archdata.host_controller; +	atu = iommu->atu;  	devhandle = pbm->devhandle; -	entry = ((dvma - iommu->tbl.table_map_base) >> IO_PAGE_SHIFT); -	dma_4v_iommu_demap(&devhandle, entry, npages); -	iommu_tbl_range_free(&iommu->tbl, dvma, npages, IOMMU_ERROR_CODE); + +	if (dvma <= DMA_BIT_MASK(32)) { +		tbl = &iommu->tbl; +		iotsb_num = 0; /* we don't care for legacy iommu */ +	} else { +		tbl = &atu->tbl; +		iotsb_num = atu->iotsb->iotsb_num; +	} +	entry = ((dvma - tbl->table_map_base) >> IO_PAGE_SHIFT); +	dma_4v_iommu_demap(dev, devhandle, dvma, iotsb_num, entry, npages); +	iommu_tbl_range_free(tbl, dvma, npages, IOMMU_ERROR_CODE);  	order = get_order(size);  	if (order < 10)  		free_pages((unsigned long)cpu, order); @@ -238,13 +351,17 @@ static dma_addr_t dma_4v_map_page(struct device *dev, struct page *page,  				  unsigned long attrs)  {  	struct iommu *iommu; +	struct atu *atu; +	struct iommu_map_table *tbl; +	u64 mask;  	unsigned long flags, npages, oaddr;  	unsigned long i, base_paddr; -	u32 bus_addr, ret;  	unsigned long prot; +	dma_addr_t bus_addr, ret;  	long entry;  	iommu = dev->archdata.iommu; +	atu = iommu->atu;  	if (unlikely(direction == DMA_NONE))  		goto bad; @@ -253,29 +370,38 @@ static dma_addr_t dma_4v_map_page(struct device *dev, struct page *page,  	npages = IO_PAGE_ALIGN(oaddr + sz) - (oaddr & IO_PAGE_MASK);  	npages >>= IO_PAGE_SHIFT; -	entry = iommu_tbl_range_alloc(dev, &iommu->tbl, npages, NULL, +	mask = *dev->dma_mask; +	if (mask <= DMA_BIT_MASK(32)) +		tbl = &iommu->tbl; +	else +		tbl = &atu->tbl; + +	entry = iommu_tbl_range_alloc(dev, tbl, npages, NULL,  				      (unsigned long)(-1), 0);  	if (unlikely(entry == IOMMU_ERROR_CODE))  		goto bad; -	bus_addr = (iommu->tbl.table_map_base + (entry << IO_PAGE_SHIFT)); +	bus_addr = (tbl->table_map_base + (entry << IO_PAGE_SHIFT));  	ret = bus_addr | (oaddr & ~IO_PAGE_MASK);  	base_paddr = __pa(oaddr & IO_PAGE_MASK);  	prot = HV_PCI_MAP_ATTR_READ;  	if (direction != DMA_TO_DEVICE)  		prot |= HV_PCI_MAP_ATTR_WRITE; +	if (attrs & DMA_ATTR_WEAK_ORDERING) +		prot |= HV_PCI_MAP_ATTR_RELAXED_ORDER; +  	local_irq_save(flags);  	iommu_batch_start(dev, prot, entry);  	for (i = 0; i < npages; i++, base_paddr += IO_PAGE_SIZE) { -		long err = iommu_batch_add(base_paddr); +		long err = iommu_batch_add(base_paddr, mask);  		if (unlikely(err < 0L))  			goto iommu_map_fail;  	} -	if (unlikely(iommu_batch_end() < 0L)) +	if (unlikely(iommu_batch_end(mask) < 0L))  		goto iommu_map_fail;  	local_irq_restore(flags); @@ -288,7 +414,7 @@ bad:  	return DMA_ERROR_CODE;  iommu_map_fail: -	iommu_tbl_range_free(&iommu->tbl, bus_addr, npages, IOMMU_ERROR_CODE); +	iommu_tbl_range_free(tbl, bus_addr, npages, IOMMU_ERROR_CODE);  	return DMA_ERROR_CODE;  } @@ -298,7 +424,10 @@ static void dma_4v_unmap_page(struct device *dev, dma_addr_t bus_addr,  {  	struct pci_pbm_info *pbm;  	struct iommu *iommu; +	struct atu *atu; +	struct iommu_map_table *tbl;  	unsigned long npages; +	unsigned long iotsb_num;  	long entry;  	u32 devhandle; @@ -310,14 +439,23 @@ static void dma_4v_unmap_page(struct device *dev, dma_addr_t bus_addr,  	iommu = dev->archdata.iommu;  	pbm = dev->archdata.host_controller; +	atu = iommu->atu;  	devhandle = pbm->devhandle;  	npages = IO_PAGE_ALIGN(bus_addr + sz) - (bus_addr & IO_PAGE_MASK);  	npages >>= IO_PAGE_SHIFT;  	bus_addr &= IO_PAGE_MASK; -	entry = (bus_addr - iommu->tbl.table_map_base) >> IO_PAGE_SHIFT; -	dma_4v_iommu_demap(&devhandle, entry, npages); -	iommu_tbl_range_free(&iommu->tbl, bus_addr, npages, IOMMU_ERROR_CODE); + +	if (bus_addr <= DMA_BIT_MASK(32)) { +		iotsb_num = 0; /* we don't care for legacy iommu */ +		tbl = &iommu->tbl; +	} else { +		iotsb_num = atu->iotsb->iotsb_num; +		tbl = &atu->tbl; +	} +	entry = (bus_addr - tbl->table_map_base) >> IO_PAGE_SHIFT; +	dma_4v_iommu_demap(dev, devhandle, bus_addr, iotsb_num, entry, npages); +	iommu_tbl_range_free(tbl, bus_addr, npages, IOMMU_ERROR_CODE);  }  static int dma_4v_map_sg(struct device *dev, struct scatterlist *sglist, @@ -331,12 +469,17 @@ static int dma_4v_map_sg(struct device *dev, struct scatterlist *sglist,  	unsigned long seg_boundary_size;  	int outcount, incount, i;  	struct iommu *iommu; +	struct atu *atu; +	struct iommu_map_table *tbl; +	u64 mask;  	unsigned long base_shift;  	long err;  	BUG_ON(direction == DMA_NONE);  	iommu = dev->archdata.iommu; +	atu = iommu->atu; +  	if (nelems == 0 || !iommu)  		return 0; @@ -344,6 +487,9 @@ static int dma_4v_map_sg(struct device *dev, struct scatterlist *sglist,  	if (direction != DMA_TO_DEVICE)  		prot |= HV_PCI_MAP_ATTR_WRITE; +	if (attrs & DMA_ATTR_WEAK_ORDERING) +		prot |= HV_PCI_MAP_ATTR_RELAXED_ORDER; +  	outs = s = segstart = &sglist[0];  	outcount = 1;  	incount = nelems; @@ -359,7 +505,15 @@ static int dma_4v_map_sg(struct device *dev, struct scatterlist *sglist,  	max_seg_size = dma_get_max_seg_size(dev);  	seg_boundary_size = ALIGN(dma_get_seg_boundary(dev) + 1,  				  IO_PAGE_SIZE) >> IO_PAGE_SHIFT; -	base_shift = iommu->tbl.table_map_base >> IO_PAGE_SHIFT; + +	mask = *dev->dma_mask; +	if (mask <= DMA_BIT_MASK(32)) +		tbl = &iommu->tbl; +	else +		tbl = &atu->tbl; + +	base_shift = tbl->table_map_base >> IO_PAGE_SHIFT; +  	for_each_sg(sglist, s, nelems, i) {  		unsigned long paddr, npages, entry, out_entry = 0, slen; @@ -372,27 +526,26 @@ static int dma_4v_map_sg(struct device *dev, struct scatterlist *sglist,  		/* Allocate iommu entries for that segment */  		paddr = (unsigned long) SG_ENT_PHYS_ADDRESS(s);  		npages = iommu_num_pages(paddr, slen, IO_PAGE_SIZE); -		entry = iommu_tbl_range_alloc(dev, &iommu->tbl, npages, +		entry = iommu_tbl_range_alloc(dev, tbl, npages,  					      &handle, (unsigned long)(-1), 0);  		/* Handle failure */  		if (unlikely(entry == IOMMU_ERROR_CODE)) { -			if (printk_ratelimit()) -				printk(KERN_INFO "iommu_alloc failed, iommu %p paddr %lx" -				       " npages %lx\n", iommu, paddr, npages); +			pr_err_ratelimited("iommu_alloc failed, iommu %p paddr %lx npages %lx\n", +					   tbl, paddr, npages);  			goto iommu_map_failed;  		} -		iommu_batch_new_entry(entry); +		iommu_batch_new_entry(entry, mask);  		/* Convert entry to a dma_addr_t */ -		dma_addr = iommu->tbl.table_map_base + (entry << IO_PAGE_SHIFT); +		dma_addr = tbl->table_map_base + (entry << IO_PAGE_SHIFT);  		dma_addr |= (s->offset & ~IO_PAGE_MASK);  		/* Insert into HW table */  		paddr &= IO_PAGE_MASK;  		while (npages--) { -			err = iommu_batch_add(paddr); +			err = iommu_batch_add(paddr, mask);  			if (unlikely(err < 0L))  				goto iommu_map_failed;  			paddr += IO_PAGE_SIZE; @@ -427,7 +580,7 @@ static int dma_4v_map_sg(struct device *dev, struct scatterlist *sglist,  		dma_next = dma_addr + slen;  	} -	err = iommu_batch_end(); +	err = iommu_batch_end(mask);  	if (unlikely(err < 0L))  		goto iommu_map_failed; @@ -450,7 +603,7 @@ iommu_map_failed:  			vaddr = s->dma_address & IO_PAGE_MASK;  			npages = iommu_num_pages(s->dma_address, s->dma_length,  						 IO_PAGE_SIZE); -			iommu_tbl_range_free(&iommu->tbl, vaddr, npages, +			iommu_tbl_range_free(tbl, vaddr, npages,  					     IOMMU_ERROR_CODE);  			/* XXX demap? XXX */  			s->dma_address = DMA_ERROR_CODE; @@ -471,13 +624,16 @@ static void dma_4v_unmap_sg(struct device *dev, struct scatterlist *sglist,  	struct pci_pbm_info *pbm;  	struct scatterlist *sg;  	struct iommu *iommu; +	struct atu *atu;  	unsigned long flags, entry; +	unsigned long iotsb_num;  	u32 devhandle;  	BUG_ON(direction == DMA_NONE);  	iommu = dev->archdata.iommu;  	pbm = dev->archdata.host_controller; +	atu = iommu->atu;  	devhandle = pbm->devhandle;  	local_irq_save(flags); @@ -487,15 +643,24 @@ static void dma_4v_unmap_sg(struct device *dev, struct scatterlist *sglist,  		dma_addr_t dma_handle = sg->dma_address;  		unsigned int len = sg->dma_length;  		unsigned long npages; -		struct iommu_map_table *tbl = &iommu->tbl; +		struct iommu_map_table *tbl;  		unsigned long shift = IO_PAGE_SHIFT;  		if (!len)  			break;  		npages = iommu_num_pages(dma_handle, len, IO_PAGE_SIZE); + +		if (dma_handle <= DMA_BIT_MASK(32)) { +			iotsb_num = 0; /* we don't care for legacy iommu */ +			tbl = &iommu->tbl; +		} else { +			iotsb_num = atu->iotsb->iotsb_num; +			tbl = &atu->tbl; +		}  		entry = ((dma_handle - tbl->table_map_base) >> shift); -		dma_4v_iommu_demap(&devhandle, entry, npages); -		iommu_tbl_range_free(&iommu->tbl, dma_handle, npages, +		dma_4v_iommu_demap(dev, devhandle, dma_handle, iotsb_num, +				   entry, npages); +		iommu_tbl_range_free(tbl, dma_handle, npages,  				     IOMMU_ERROR_CODE);  		sg = sg_next(sg);  	} @@ -556,6 +721,132 @@ static unsigned long probe_existing_entries(struct pci_pbm_info *pbm,  	return cnt;  } +static int pci_sun4v_atu_alloc_iotsb(struct pci_pbm_info *pbm) +{ +	struct atu *atu = pbm->iommu->atu; +	struct atu_iotsb *iotsb; +	void *table; +	u64 table_size; +	u64 iotsb_num; +	unsigned long order; +	unsigned long err; + +	iotsb = kzalloc(sizeof(*iotsb), GFP_KERNEL); +	if (!iotsb) { +		err = -ENOMEM; +		goto out_err; +	} +	atu->iotsb = iotsb; + +	/* calculate size of IOTSB */ +	table_size = (atu->size / IO_PAGE_SIZE) * 8; +	order = get_order(table_size); +	table = (void *)__get_free_pages(GFP_KERNEL | __GFP_ZERO, order); +	if (!table) { +		err = -ENOMEM; +		goto table_failed; +	} +	iotsb->table = table; +	iotsb->ra = __pa(table); +	iotsb->dvma_size = atu->size; +	iotsb->dvma_base = atu->base; +	iotsb->table_size = table_size; +	iotsb->page_size = IO_PAGE_SIZE; + +	/* configure and register IOTSB with HV */ +	err = pci_sun4v_iotsb_conf(pbm->devhandle, +				   iotsb->ra, +				   iotsb->table_size, +				   iotsb->page_size, +				   iotsb->dvma_base, +				   &iotsb_num); +	if (err) { +		pr_err(PFX "pci_iotsb_conf failed error: %ld\n", err); +		goto iotsb_conf_failed; +	} +	iotsb->iotsb_num = iotsb_num; + +	err = dma_4v_iotsb_bind(pbm->devhandle, iotsb_num, pbm->pci_bus); +	if (err) { +		pr_err(PFX "pci_iotsb_bind failed error: %ld\n", err); +		goto iotsb_conf_failed; +	} + +	return 0; + +iotsb_conf_failed: +	free_pages((unsigned long)table, order); +table_failed: +	kfree(iotsb); +out_err: +	return err; +} + +static int pci_sun4v_atu_init(struct pci_pbm_info *pbm) +{ +	struct atu *atu = pbm->iommu->atu; +	unsigned long err; +	const u64 *ranges; +	u64 map_size, num_iotte; +	u64 dma_mask; +	const u32 *page_size; +	int len; + +	ranges = of_get_property(pbm->op->dev.of_node, "iommu-address-ranges", +				 &len); +	if (!ranges) { +		pr_err(PFX "No iommu-address-ranges\n"); +		return -EINVAL; +	} + +	page_size = of_get_property(pbm->op->dev.of_node, "iommu-pagesizes", +				    NULL); +	if (!page_size) { +		pr_err(PFX "No iommu-pagesizes\n"); +		return -EINVAL; +	} + +	/* There are 4 iommu-address-ranges supported. Each range is pair of +	 * {base, size}. The ranges[0] and ranges[1] are 32bit address space +	 * while ranges[2] and ranges[3] are 64bit space.  We want to use 64bit +	 * address ranges to support 64bit addressing. Because 'size' for +	 * address ranges[2] and ranges[3] are same we can select either of +	 * ranges[2] or ranges[3] for mapping. However due to 'size' is too +	 * large for OS to allocate IOTSB we are using fix size 32G +	 * (ATU_64_SPACE_SIZE) which is more than enough for all PCIe devices +	 * to share. +	 */ +	atu->ranges = (struct atu_ranges *)ranges; +	atu->base = atu->ranges[3].base; +	atu->size = ATU_64_SPACE_SIZE; + +	/* Create IOTSB */ +	err = pci_sun4v_atu_alloc_iotsb(pbm); +	if (err) { +		pr_err(PFX "Error creating ATU IOTSB\n"); +		return err; +	} + +	/* Create ATU iommu map. +	 * One bit represents one iotte in IOTSB table. +	 */ +	dma_mask = (roundup_pow_of_two(atu->size) - 1UL); +	num_iotte = atu->size / IO_PAGE_SIZE; +	map_size = num_iotte / 8; +	atu->tbl.table_map_base = atu->base; +	atu->dma_addr_mask = dma_mask; +	atu->tbl.map = kzalloc(map_size, GFP_KERNEL); +	if (!atu->tbl.map) +		return -ENOMEM; + +	iommu_tbl_pool_init(&atu->tbl, num_iotte, IO_PAGE_SHIFT, +			    NULL, false /* no large_pool */, +			    0 /* default npools */, +			    false /* want span boundary checking */); + +	return 0; +} +  static int pci_sun4v_iommu_init(struct pci_pbm_info *pbm)  {  	static const u32 vdma_default[] = { 0x80000000, 0x80000000 }; @@ -893,6 +1184,18 @@ static int pci_sun4v_pbm_init(struct pci_pbm_info *pbm,  	pci_sun4v_scan_bus(pbm, &op->dev); +	/* if atu_init fails its not complete failure. +	 * we can still continue using legacy iommu. +	 */ +	if (pbm->iommu->atu) { +		err = pci_sun4v_atu_init(pbm); +		if (err) { +			kfree(pbm->iommu->atu); +			pbm->iommu->atu = NULL; +			pr_err(PFX "ATU init failed, err=%d\n", err); +		} +	} +  	pbm->next = pci_pbm_root;  	pci_pbm_root = pbm; @@ -906,23 +1209,43 @@ static int pci_sun4v_probe(struct platform_device *op)  	struct pci_pbm_info *pbm;  	struct device_node *dp;  	struct iommu *iommu; +	struct atu *atu;  	u32 devhandle; -	int i, err; +	int i, err = -ENODEV; +	static bool hv_atu = true;  	dp = op->dev.of_node;  	if (!hvapi_negotiated++) { -		err = sun4v_hvapi_register(HV_GRP_PCI, -					   vpci_major, -					   &vpci_minor); +		for (i = 0; i < ARRAY_SIZE(vpci_versions); i++) { +			vpci_major = vpci_versions[i].major; +			vpci_minor = vpci_versions[i].minor; + +			err = sun4v_hvapi_register(HV_GRP_PCI, vpci_major, +						   &vpci_minor); +			if (!err) +				break; +		}  		if (err) { -			printk(KERN_ERR PFX "Could not register hvapi, " -			       "err=%d\n", err); +			pr_err(PFX "Could not register hvapi, err=%d\n", err);  			return err;  		} -		printk(KERN_INFO PFX "Registered hvapi major[%lu] minor[%lu]\n", -		       vpci_major, vpci_minor); +		pr_info(PFX "Registered hvapi major[%lu] minor[%lu]\n", +			vpci_major, vpci_minor); + +		err = sun4v_hvapi_register(HV_GRP_ATU, vatu_major, &vatu_minor); +		if (err) { +			/* don't return an error if we fail to register the +			 * ATU group, but ATU hcalls won't be available. +			 */ +			hv_atu = false; +			pr_err(PFX "Could not register hvapi ATU err=%d\n", +			       err); +		} else { +			pr_info(PFX "Registered hvapi ATU major[%lu] minor[%lu]\n", +				vatu_major, vatu_minor); +		}  		dma_ops = &sun4v_dma_ops;  	} @@ -961,6 +1284,14 @@ static int pci_sun4v_probe(struct platform_device *op)  	}  	pbm->iommu = iommu; +	iommu->atu = NULL; +	if (hv_atu) { +		atu = kzalloc(sizeof(*atu), GFP_KERNEL); +		if (!atu) +			pr_err(PFX "Could not allocate atu\n"); +		else +			iommu->atu = atu; +	}  	err = pci_sun4v_pbm_init(pbm, op, devhandle);  	if (err) @@ -971,6 +1302,7 @@ static int pci_sun4v_probe(struct platform_device *op)  	return 0;  out_free_iommu: +	kfree(iommu->atu);  	kfree(pbm->iommu);  out_free_controller: diff --git a/arch/sparc/kernel/pci_sun4v.h b/arch/sparc/kernel/pci_sun4v.h index 5642212390b2..22603a4e48bf 100644 --- a/arch/sparc/kernel/pci_sun4v.h +++ b/arch/sparc/kernel/pci_sun4v.h @@ -89,4 +89,25 @@ unsigned long pci_sun4v_msg_setvalid(unsigned long devhandle,  				     unsigned long msinum,  				     unsigned long valid); +/* Sun4v HV IOMMU v2 APIs */ +unsigned long pci_sun4v_iotsb_conf(unsigned long devhandle, +				   unsigned long ra, +				   unsigned long table_size, +				   unsigned long page_size, +				   unsigned long dvma_base, +				   u64 *iotsb_num); +unsigned long pci_sun4v_iotsb_bind(unsigned long devhandle, +				   unsigned long iotsb_num, +				   unsigned int pci_device); +unsigned long pci_sun4v_iotsb_map(unsigned long devhandle, +				  unsigned long iotsb_num, +				  unsigned long iotsb_index_iottes, +				  unsigned long io_attributes, +				  unsigned long io_page_list_pa, +				  long *mapped); +unsigned long pci_sun4v_iotsb_demap(unsigned long devhandle, +				    unsigned long iotsb_num, +				    unsigned long iotsb_index, +				    unsigned long iottes, +				    unsigned long *demapped);  #endif /* !(_PCI_SUN4V_H) */ diff --git a/arch/sparc/kernel/pci_sun4v_asm.S b/arch/sparc/kernel/pci_sun4v_asm.S index e606d46c6815..578f09657916 100644 --- a/arch/sparc/kernel/pci_sun4v_asm.S +++ b/arch/sparc/kernel/pci_sun4v_asm.S @@ -360,3 +360,71 @@ ENTRY(pci_sun4v_msg_setvalid)  	 mov	%o0, %o0  ENDPROC(pci_sun4v_msg_setvalid) +	/* +	 * %o0:	devhandle +	 * %o1:	r_addr +	 * %o2:	size +	 * %o3:	pagesize +	 * %o4:	virt +	 * %o5: &iotsb_num/&iotsb_handle +	 * +	 * returns %o0:	status +	 *         %o1:	iotsb_num/iotsb_handle +	 */ +ENTRY(pci_sun4v_iotsb_conf) +	mov	%o5, %g1 +	mov	HV_FAST_PCI_IOTSB_CONF, %o5 +	ta	HV_FAST_TRAP +	retl +	 stx	%o1, [%g1] +ENDPROC(pci_sun4v_iotsb_conf) + +	/* +	 * %o0:	devhandle +	 * %o1:	iotsb_num/iotsb_handle +	 * %o2:	pci_device +	 * +	 * returns %o0:	status +	 */ +ENTRY(pci_sun4v_iotsb_bind) +	mov	HV_FAST_PCI_IOTSB_BIND, %o5 +	ta	HV_FAST_TRAP +	retl +	 nop +ENDPROC(pci_sun4v_iotsb_bind) + +	/* +	 * %o0:	devhandle +	 * %o1:	iotsb_num/iotsb_handle +	 * %o2:	index_count +	 * %o3:	iotte_attributes +	 * %o4:	io_page_list_p +	 * %o5: &mapped +	 * +	 * returns %o0:	status +	 *         %o1:	#mapped +	 */ +ENTRY(pci_sun4v_iotsb_map) +	mov	%o5, %g1 +	mov	HV_FAST_PCI_IOTSB_MAP, %o5 +	ta	HV_FAST_TRAP +	retl +	 stx	%o1, [%g1] +ENDPROC(pci_sun4v_iotsb_map) + +	/* +	 * %o0:	devhandle +	 * %o1:	iotsb_num/iotsb_handle +	 * %o2:	iotsb_index +	 * %o3:	#iottes +	 * %o4: &demapped +	 * +	 * returns %o0:	status +	 *         %o1:	#demapped +	 */ +ENTRY(pci_sun4v_iotsb_demap) +	mov	HV_FAST_PCI_IOTSB_DEMAP, %o5 +	ta	HV_FAST_TRAP +	retl +	 stx	%o1, [%o4] +ENDPROC(pci_sun4v_iotsb_demap) diff --git a/arch/sparc/kernel/process_64.c b/arch/sparc/kernel/process_64.c index fa14402b33f9..47ff5588e521 100644 --- a/arch/sparc/kernel/process_64.c +++ b/arch/sparc/kernel/process_64.c @@ -239,7 +239,7 @@ static void __global_reg_poll(struct global_reg_snapshot *gp)  	}  } -void arch_trigger_all_cpu_backtrace(bool include_self) +void arch_trigger_cpumask_backtrace(const cpumask_t *mask, bool exclude_self)  {  	struct thread_info *tp = current_thread_info();  	struct pt_regs *regs = get_irq_regs(); @@ -255,15 +255,15 @@ void arch_trigger_all_cpu_backtrace(bool include_self)  	memset(global_cpu_snapshot, 0, sizeof(global_cpu_snapshot)); -	if (include_self) +	if (cpumask_test_cpu(this_cpu, mask) && !exclude_self)  		__global_reg_self(tp, regs, this_cpu);  	smp_fetch_global_regs(); -	for_each_online_cpu(cpu) { +	for_each_cpu(cpu, mask) {  		struct global_reg_snapshot *gp; -		if (!include_self && cpu == this_cpu) +		if (exclude_self && cpu == this_cpu)  			continue;  		gp = &global_cpu_snapshot[cpu].reg; @@ -300,7 +300,7 @@ void arch_trigger_all_cpu_backtrace(bool include_self)  static void sysrq_handle_globreg(int key)  { -	arch_trigger_all_cpu_backtrace(true); +	trigger_all_cpu_backtrace();  }  static struct sysrq_key_op sparc_globalreg_op = { diff --git a/arch/sparc/kernel/ptrace_64.c b/arch/sparc/kernel/ptrace_64.c index 9ddc4928a089..ac082dd8c67d 100644 --- a/arch/sparc/kernel/ptrace_64.c +++ b/arch/sparc/kernel/ptrace_64.c @@ -127,7 +127,8 @@ static int get_from_target(struct task_struct *target, unsigned long uaddr,  		if (copy_from_user(kbuf, (void __user *) uaddr, len))  			return -EFAULT;  	} else { -		int len2 = access_process_vm(target, uaddr, kbuf, len, 0); +		int len2 = access_process_vm(target, uaddr, kbuf, len, +				FOLL_FORCE);  		if (len2 != len)  			return -EFAULT;  	} @@ -141,7 +142,8 @@ static int set_to_target(struct task_struct *target, unsigned long uaddr,  		if (copy_to_user((void __user *) uaddr, kbuf, len))  			return -EFAULT;  	} else { -		int len2 = access_process_vm(target, uaddr, kbuf, len, 1); +		int len2 = access_process_vm(target, uaddr, kbuf, len, +				FOLL_FORCE | FOLL_WRITE);  		if (len2 != len)  			return -EFAULT;  	} @@ -505,7 +507,8 @@ static int genregs32_get(struct task_struct *target,  				if (access_process_vm(target,  						      (unsigned long)  						      ®_window[pos], -						      k, sizeof(*k), 0) +						      k, sizeof(*k), +						      FOLL_FORCE)  				    != sizeof(*k))  					return -EFAULT;  				k++; @@ -531,12 +534,14 @@ static int genregs32_get(struct task_struct *target,  				if (access_process_vm(target,  						      (unsigned long)  						      ®_window[pos], -						      ®, sizeof(reg), 0) +						      ®, sizeof(reg), +						      FOLL_FORCE)  				    != sizeof(reg))  					return -EFAULT;  				if (access_process_vm(target,  						      (unsigned long) u, -						      ®, sizeof(reg), 1) +						      ®, sizeof(reg), +						      FOLL_FORCE | FOLL_WRITE)  				    != sizeof(reg))  					return -EFAULT;  				pos++; @@ -615,7 +620,8 @@ static int genregs32_set(struct task_struct *target,  						      (unsigned long)  						      ®_window[pos],  						      (void *) k, -						      sizeof(*k), 1) +						      sizeof(*k), +						      FOLL_FORCE | FOLL_WRITE)  				    != sizeof(*k))  					return -EFAULT;  				k++; @@ -642,13 +648,15 @@ static int genregs32_set(struct task_struct *target,  				if (access_process_vm(target,  						      (unsigned long)  						      u, -						      ®, sizeof(reg), 0) +						      ®, sizeof(reg), +						      FOLL_FORCE)  				    != sizeof(reg))  					return -EFAULT;  				if (access_process_vm(target,  						      (unsigned long)  						      ®_window[pos], -						      ®, sizeof(reg), 1) +						      ®, sizeof(reg), +						      FOLL_FORCE | FOLL_WRITE)  				    != sizeof(reg))  					return -EFAULT;  				pos++; diff --git a/arch/sparc/kernel/setup_64.c b/arch/sparc/kernel/setup_64.c index 599f1207eed2..6b7331d198e9 100644 --- a/arch/sparc/kernel/setup_64.c +++ b/arch/sparc/kernel/setup_64.c @@ -31,6 +31,7 @@  #include <linux/initrd.h>  #include <linux/module.h>  #include <linux/start_kernel.h> +#include <linux/bootmem.h>  #include <asm/io.h>  #include <asm/processor.h> @@ -50,6 +51,8 @@  #include <asm/elf.h>  #include <asm/mdesc.h>  #include <asm/cacheflush.h> +#include <asm/dma.h> +#include <asm/irq.h>  #ifdef CONFIG_IP_PNP  #include <net/ipconfig.h> @@ -590,6 +593,22 @@ static void __init init_sparc64_elf_hwcap(void)  		pause_patch();  } +void __init alloc_irqstack_bootmem(void) +{ +	unsigned int i, node; + +	for_each_possible_cpu(i) { +		node = cpu_to_node(i); + +		softirq_stack[i] = __alloc_bootmem_node(NODE_DATA(node), +							THREAD_SIZE, +							THREAD_SIZE, 0); +		hardirq_stack[i] = __alloc_bootmem_node(NODE_DATA(node), +							THREAD_SIZE, +							THREAD_SIZE, 0); +	} +} +  void __init setup_arch(char **cmdline_p)  {  	/* Initialize PROM console and command line. */ @@ -650,6 +669,13 @@ void __init setup_arch(char **cmdline_p)  	paging_init();  	init_sparc64_elf_hwcap(); +	smp_fill_in_cpu_possible_map(); +	/* +	 * Once the OF device tree and MDESC have been setup and nr_cpus has +	 * been parsed, we know the list of possible cpus.  Therefore we can +	 * allocate the IRQ stacks. +	 */ +	alloc_irqstack_bootmem();  }  extern int stop_a_enabled; diff --git a/arch/sparc/kernel/signal_32.c b/arch/sparc/kernel/signal_32.c index c3c12efe0bc0..9c0c8fd0b292 100644 --- a/arch/sparc/kernel/signal_32.c +++ b/arch/sparc/kernel/signal_32.c @@ -89,7 +89,7 @@ asmlinkage void do_sigreturn(struct pt_regs *regs)  	sf = (struct signal_frame __user *) regs->u_regs[UREG_FP];  	/* 1. Make sure we are not getting garbage from the user */ -	if (!invalid_frame_pointer(sf, sizeof(*sf))) +	if (invalid_frame_pointer(sf, sizeof(*sf)))  		goto segv_and_exit;  	if (get_user(ufp, &sf->info.si_regs.u_regs[UREG_FP])) @@ -150,7 +150,7 @@ asmlinkage void do_rt_sigreturn(struct pt_regs *regs)  	synchronize_user_stack();  	sf = (struct rt_signal_frame __user *) regs->u_regs[UREG_FP]; -	if (!invalid_frame_pointer(sf, sizeof(*sf))) +	if (invalid_frame_pointer(sf, sizeof(*sf)))  		goto segv;  	if (get_user(ufp, &sf->regs.u_regs[UREG_FP])) diff --git a/arch/sparc/kernel/smp_32.c b/arch/sparc/kernel/smp_32.c index fb30e7c6a5b1..e80e6ba3d500 100644 --- a/arch/sparc/kernel/smp_32.c +++ b/arch/sparc/kernel/smp_32.c @@ -352,9 +352,7 @@ static void sparc_start_secondary(void *arg)  	preempt_disable();  	cpu = smp_processor_id(); -	/* Invoke the CPU_STARTING notifier callbacks */  	notify_cpu_starting(cpu); -  	arch_cpu_pre_online(arg);  	/* Set the CPU in the cpu_online_mask */ diff --git a/arch/sparc/kernel/smp_64.c b/arch/sparc/kernel/smp_64.c index 8a6151a628ce..8182f7caf5b1 100644 --- a/arch/sparc/kernel/smp_64.c +++ b/arch/sparc/kernel/smp_64.c @@ -63,9 +63,13 @@ cpumask_t cpu_core_map[NR_CPUS] __read_mostly =  cpumask_t cpu_core_sib_map[NR_CPUS] __read_mostly = {  	[0 ... NR_CPUS-1] = CPU_MASK_NONE }; +cpumask_t cpu_core_sib_cache_map[NR_CPUS] __read_mostly = { +	[0 ... NR_CPUS - 1] = CPU_MASK_NONE }; +  EXPORT_PER_CPU_SYMBOL(cpu_sibling_map);  EXPORT_SYMBOL(cpu_core_map);  EXPORT_SYMBOL(cpu_core_sib_map); +EXPORT_SYMBOL(cpu_core_sib_cache_map);  static cpumask_t smp_commenced_mask; @@ -1227,6 +1231,20 @@ void __init smp_setup_processor_id(void)  		xcall_deliver_impl = hypervisor_xcall_deliver;  } +void __init smp_fill_in_cpu_possible_map(void) +{ +	int possible_cpus = num_possible_cpus(); +	int i; + +	if (possible_cpus > nr_cpu_ids) +		possible_cpus = nr_cpu_ids; + +	for (i = 0; i < possible_cpus; i++) +		set_cpu_possible(i, true); +	for (; i < NR_CPUS; i++) +		set_cpu_possible(i, false); +} +  void smp_fill_in_sib_core_maps(void)  {  	unsigned int i; @@ -1251,6 +1269,10 @@ void smp_fill_in_sib_core_maps(void)  		unsigned int j;  		for_each_present_cpu(j)  { +			if (cpu_data(i).max_cache_id == +			    cpu_data(j).max_cache_id) +				cpumask_set_cpu(j, &cpu_core_sib_cache_map[i]); +  			if (cpu_data(i).sock_id == cpu_data(j).sock_id)  				cpumask_set_cpu(j, &cpu_core_sib_map[i]);  		} diff --git a/arch/sparc/kernel/sparc_ksyms.c b/arch/sparc/kernel/sparc_ksyms.c new file mode 100644 index 000000000000..09aa69e422e5 --- /dev/null +++ b/arch/sparc/kernel/sparc_ksyms.c @@ -0,0 +1,12 @@ +/* + * arch/sparc/kernel/ksyms.c: Sparc specific ksyms support. + * + * Copyright (C) 1996 David S. Miller ([email protected]) + * Copyright (C) 1996 Eddie C. Dost ([email protected]) + */ + +#include <linux/init.h> +#include <linux/export.h> + +/* This is needed only for drivers/sbus/char/openprom.c */ +EXPORT_SYMBOL(saved_command_line); diff --git a/arch/sparc/kernel/sparc_ksyms_32.c b/arch/sparc/kernel/sparc_ksyms_32.c deleted file mode 100644 index bf4ccb10a78c..000000000000 --- a/arch/sparc/kernel/sparc_ksyms_32.c +++ /dev/null @@ -1,31 +0,0 @@ -/* - * arch/sparc/kernel/ksyms.c: Sparc specific ksyms support. - * - * Copyright (C) 1996 David S. Miller ([email protected]) - * Copyright (C) 1996 Eddie C. Dost ([email protected]) - */ - -#include <linux/module.h> - -#include <asm/pgtable.h> -#include <asm/uaccess.h> -#include <asm/delay.h> -#include <asm/head.h> -#include <asm/dma.h> - -struct poll { -	int fd; -	short events; -	short revents; -}; - -/* from entry.S */ -EXPORT_SYMBOL(__udelay); -EXPORT_SYMBOL(__ndelay); - -/* from head_32.S */ -EXPORT_SYMBOL(__ret_efault); -EXPORT_SYMBOL(empty_zero_page); - -/* Exporting a symbol from /init/main.c */ -EXPORT_SYMBOL(saved_command_line); diff --git a/arch/sparc/kernel/sparc_ksyms_64.c b/arch/sparc/kernel/sparc_ksyms_64.c deleted file mode 100644 index 9e034f29dcc5..000000000000 --- a/arch/sparc/kernel/sparc_ksyms_64.c +++ /dev/null @@ -1,53 +0,0 @@ -/* arch/sparc64/kernel/sparc64_ksyms.c: Sparc64 specific ksyms support. - * - * Copyright (C) 1996, 2007 David S. Miller ([email protected]) - * Copyright (C) 1996 Eddie C. Dost ([email protected]) - * Copyright (C) 1999 Jakub Jelinek ([email protected]) - */ - -#include <linux/export.h> -#include <linux/pci.h> -#include <linux/bitops.h> - -#include <asm/cpudata.h> -#include <asm/uaccess.h> -#include <asm/spitfire.h> -#include <asm/oplib.h> -#include <asm/hypervisor.h> -#include <asm/cacheflush.h> - -struct poll { -	int fd; -	short events; -	short revents; -}; - -/* from helpers.S */ -EXPORT_SYMBOL(__flushw_user); -EXPORT_SYMBOL_GPL(real_hard_smp_processor_id); - -/* from head_64.S */ -EXPORT_SYMBOL(__ret_efault); -EXPORT_SYMBOL(tlb_type); -EXPORT_SYMBOL(sun4v_chip_type); -EXPORT_SYMBOL(prom_root_node); - -/* from hvcalls.S */ -EXPORT_SYMBOL(sun4v_niagara_getperf); -EXPORT_SYMBOL(sun4v_niagara_setperf); -EXPORT_SYMBOL(sun4v_niagara2_getperf); -EXPORT_SYMBOL(sun4v_niagara2_setperf); -EXPORT_SYMBOL(sun4v_mach_set_watchdog); - -/* from hweight.S */ -EXPORT_SYMBOL(__arch_hweight8); -EXPORT_SYMBOL(__arch_hweight16); -EXPORT_SYMBOL(__arch_hweight32); -EXPORT_SYMBOL(__arch_hweight64); - -/* from ffs_ffz.S */ -EXPORT_SYMBOL(ffs); -EXPORT_SYMBOL(__ffs); - -/* Exporting a symbol from /init/main.c */ -EXPORT_SYMBOL(saved_command_line); diff --git a/arch/sparc/kernel/traps_64.c b/arch/sparc/kernel/traps_64.c index d21cd625c0de..4094a51b1970 100644 --- a/arch/sparc/kernel/traps_64.c +++ b/arch/sparc/kernel/traps_64.c @@ -8,7 +8,7 @@   * I like traps on v9, :))))   */ -#include <linux/module.h> +#include <linux/extable.h>  #include <linux/sched.h>  #include <linux/linkage.h>  #include <linux/kernel.h> diff --git a/arch/sparc/kernel/unaligned_64.c b/arch/sparc/kernel/unaligned_64.c index 9aacb9159262..52c00d90d4b4 100644 --- a/arch/sparc/kernel/unaligned_64.c +++ b/arch/sparc/kernel/unaligned_64.c @@ -11,7 +11,7 @@  #include <linux/kernel.h>  #include <linux/sched.h>  #include <linux/mm.h> -#include <linux/module.h> +#include <linux/extable.h>  #include <asm/asi.h>  #include <asm/ptrace.h>  #include <asm/pstate.h> diff --git a/arch/sparc/kernel/vmlinux.lds.S b/arch/sparc/kernel/vmlinux.lds.S index d79b3b734245..572db686f845 100644 --- a/arch/sparc/kernel/vmlinux.lds.S +++ b/arch/sparc/kernel/vmlinux.lds.S @@ -49,6 +49,7 @@ SECTIONS  		HEAD_TEXT  		TEXT_TEXT  		SCHED_TEXT +		CPUIDLE_TEXT  		LOCK_TEXT  		KPROBES_TEXT  		IRQENTRY_TEXT |