| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516 | /* *	linux/arch/alpha/kernel/core_t2.c * * Written by Jay A Estabrook (jestabro@amt.tay1.dec.com). * December 1996. * * based on CIA code by David A Rusling (david.rusling@reo.mts.dec.com) * * Code common to all T2 core logic chips. */#define __EXTERN_INLINE#include <asm/io.h>#include <asm/core_t2.h>#undef __EXTERN_INLINE#include <linux/types.h>#include <linux/pci.h>#include <linux/sched.h>#include <linux/init.h>#include <asm/ptrace.h>#include <asm/delay.h>#include <asm/mce.h>#include "proto.h"#include "pci_impl.h"/* For dumping initial DMA window settings. */#define DEBUG_PRINT_INITIAL_SETTINGS 0/* For dumping final DMA window settings. */#define DEBUG_PRINT_FINAL_SETTINGS 0/* * By default, we direct-map starting at 2GB, in order to allow the * maximum size direct-map window (2GB) to match the maximum amount of * memory (2GB) that can be present on SABLEs. But that limits the * floppy to DMA only via the scatter/gather window set up for 8MB * ISA DMA, since the maximum ISA DMA address is 2GB-1. * * For now, this seems a reasonable trade-off: even though most SABLEs * have less than 1GB of memory, floppy usage/performance will not * really be affected by forcing it to go via scatter/gather... */#define T2_DIRECTMAP_2G 1#if T2_DIRECTMAP_2G# define T2_DIRECTMAP_START	0x80000000UL# define T2_DIRECTMAP_LENGTH	0x80000000UL#else# define T2_DIRECTMAP_START	0x40000000UL# define T2_DIRECTMAP_LENGTH	0x40000000UL#endif/* The ISA scatter/gather window settings. */#define T2_ISA_SG_START		0x00800000UL#define T2_ISA_SG_LENGTH	0x00800000UL/* * NOTE: Herein lie back-to-back mb instructions.  They are magic.  * One plausible explanation is that the i/o controller does not properly * handle the system transaction.  Another involves timing.  Ho hum. *//* * BIOS32-style PCI interface: */#define DEBUG_CONFIG 0#if DEBUG_CONFIG# define DBG(args)	printk args#else# define DBG(args)#endifstatic volatile unsigned int t2_mcheck_any_expected;static volatile unsigned int t2_mcheck_last_taken;/* Place to save the DMA Window registers as set up by SRM   for restoration during shutdown. */static struct{	struct {		unsigned long wbase;		unsigned long wmask;		unsigned long tbase;	} window[2];	unsigned long hae_1;  	unsigned long hae_2;	unsigned long hae_3;	unsigned long hae_4;	unsigned long hbase;} t2_saved_config __attribute((common));/* * Given a bus, device, and function number, compute resulting * configuration space address and setup the T2_HAXR2 register * accordingly.  It is therefore not safe to have concurrent * invocations to configuration space access routines, but there * really shouldn't be any need for this. * * Type 0: * *  3 3|3 3 2 2|2 2 2 2|2 2 2 2|1 1 1 1|1 1 1 1|1 1  *  3 2|1 0 9 8|7 6 5 4|3 2 1 0|9 8 7 6|5 4 3 2|1 0 9 8|7 6 5 4|3 2 1 0 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ * | | |D|D|D|D|D|D|D|D|D|D|D|D|D|D|D|D|D|D|D|D|D|F|F|F|R|R|R|R|R|R|0|0| * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ * *	31:11	Device select bit. * 	10:8	Function number * 	 7:2	Register number * * Type 1: * *  3 3|3 3 2 2|2 2 2 2|2 2 2 2|1 1 1 1|1 1 1 1|1 1  *  3 2|1 0 9 8|7 6 5 4|3 2 1 0|9 8 7 6|5 4 3 2|1 0 9 8|7 6 5 4|3 2 1 0 * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ * | | | | | | | | | | |B|B|B|B|B|B|B|B|D|D|D|D|D|F|F|F|R|R|R|R|R|R|0|1| * +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+ * *	31:24	reserved *	23:16	bus number (8 bits = 128 possible buses) *	15:11	Device number (5 bits) *	10:8	function number *	 7:2	register number *   * Notes: *	The function number selects which function of a multi-function device  *	(e.g., SCSI and Ethernet). *  *	The register selects a DWORD (32 bit) register offset.  Hence it *	doesn't get shifted by 2 bits as we want to "drop" the bottom two *	bits. */static intmk_conf_addr(struct pci_bus *pbus, unsigned int device_fn, int where,	     unsigned long *pci_addr, unsigned char *type1){	unsigned long addr;	u8 bus = pbus->number;	DBG(("mk_conf_addr(bus=%d, dfn=0x%x, where=0x%x,"	     " addr=0x%lx, type1=0x%x)\n",	     bus, device_fn, where, pci_addr, type1));	if (bus == 0) {		int device = device_fn >> 3;		/* Type 0 configuration cycle.  */		if (device > 8) {			DBG(("mk_conf_addr: device (%d)>20, returning -1\n",			     device));			return -1;		}		*type1 = 0;		addr = (0x0800L << device) | ((device_fn & 7) << 8) | (where);	} else {		/* Type 1 configuration cycle.  */		*type1 = 1;		addr = (bus << 16) | (device_fn << 8) | (where);	}	*pci_addr = addr;	DBG(("mk_conf_addr: returning pci_addr 0x%lx\n", addr));	return 0;}/* * NOTE: both conf_read() and conf_write() may set HAE_3 when needing *       to do type1 access. This is protected by the use of spinlock IRQ *       primitives in the wrapper functions pci_{read,write}_config_*() *       defined in drivers/pci/pci.c. */static unsigned intconf_read(unsigned long addr, unsigned char type1){	unsigned int value, cpu, taken;	unsigned long t2_cfg = 0;	cpu = smp_processor_id();	DBG(("conf_read(addr=0x%lx, type1=%d)\n", addr, type1));	/* If Type1 access, must set T2 CFG.  */	if (type1) {		t2_cfg = *(vulp)T2_HAE_3 & ~0xc0000000UL;		*(vulp)T2_HAE_3 = 0x40000000UL | t2_cfg;		mb();	}	mb();	draina();	mcheck_expected(cpu) = 1;	mcheck_taken(cpu) = 0;	t2_mcheck_any_expected |= (1 << cpu);	mb();	/* Access configuration space. */	value = *(vuip)addr;	mb();	mb();  /* magic */	/* Wait for possible mcheck. Also, this lets other CPUs clear	   their mchecks as well, as they can reliably tell when	   another CPU is in the midst of handling a real mcheck via	   the "taken" function. */	udelay(100);	if ((taken = mcheck_taken(cpu))) {		mcheck_taken(cpu) = 0;		t2_mcheck_last_taken |= (1 << cpu);		value = 0xffffffffU;		mb();	}	mcheck_expected(cpu) = 0;	t2_mcheck_any_expected = 0;	mb();	/* If Type1 access, must reset T2 CFG so normal IO space ops work.  */	if (type1) {		*(vulp)T2_HAE_3 = t2_cfg;		mb();	}	return value;}static voidconf_write(unsigned long addr, unsigned int value, unsigned char type1){	unsigned int cpu, taken;	unsigned long t2_cfg = 0;	cpu = smp_processor_id();	/* If Type1 access, must set T2 CFG.  */	if (type1) {		t2_cfg = *(vulp)T2_HAE_3 & ~0xc0000000UL;		*(vulp)T2_HAE_3 = t2_cfg | 0x40000000UL;		mb();	}	mb();	draina();	mcheck_expected(cpu) = 1;	mcheck_taken(cpu) = 0;	t2_mcheck_any_expected |= (1 << cpu);	mb();	/* Access configuration space.  */	*(vuip)addr = value;	mb();	mb();  /* magic */	/* Wait for possible mcheck. Also, this lets other CPUs clear	   their mchecks as well, as they can reliably tell when	   this CPU is in the midst of handling a real mcheck via	   the "taken" function. */	udelay(100);	if ((taken = mcheck_taken(cpu))) {		mcheck_taken(cpu) = 0;		t2_mcheck_last_taken |= (1 << cpu);		mb();	}	mcheck_expected(cpu) = 0;	t2_mcheck_any_expected = 0;	mb();	/* If Type1 access, must reset T2 CFG so normal IO space ops work.  */	if (type1) {		*(vulp)T2_HAE_3 = t2_cfg;		mb();	}}static intt2_read_config(struct pci_bus *bus, unsigned int devfn, int where,	       int size, u32 *value){	unsigned long addr, pci_addr;	unsigned char type1;	int shift;	long mask;	if (mk_conf_addr(bus, devfn, where, &pci_addr, &type1))		return PCIBIOS_DEVICE_NOT_FOUND;	mask = (size - 1) * 8;	shift = (where & 3) * 8;	addr = (pci_addr << 5) + mask + T2_CONF;	*value = conf_read(addr, type1) >> (shift);	return PCIBIOS_SUCCESSFUL;}static int t2_write_config(struct pci_bus *bus, unsigned int devfn, int where, int size,		u32 value){	unsigned long addr, pci_addr;	unsigned char type1;	long mask;	if (mk_conf_addr(bus, devfn, where, &pci_addr, &type1))		return PCIBIOS_DEVICE_NOT_FOUND;	mask = (size - 1) * 8;	addr = (pci_addr << 5) + mask + T2_CONF;	conf_write(addr, value << ((where & 3) * 8), type1);	return PCIBIOS_SUCCESSFUL;}struct pci_ops t2_pci_ops = {	.read =		t2_read_config,	.write =	t2_write_config,};static void __initt2_direct_map_window1(unsigned long base, unsigned long length){	unsigned long temp;	__direct_map_base = base;	__direct_map_size = length;	temp = (base & 0xfff00000UL) | ((base + length - 1) >> 20);	*(vulp)T2_WBASE1 = temp | 0x80000UL; /* OR in ENABLE bit */	temp = (length - 1) & 0xfff00000UL;	*(vulp)T2_WMASK1 = temp;	*(vulp)T2_TBASE1 = 0;#if DEBUG_PRINT_FINAL_SETTINGS	printk("%s: setting WBASE1=0x%lx WMASK1=0x%lx TBASE1=0x%lx\n",	       __func__, *(vulp)T2_WBASE1, *(vulp)T2_WMASK1, *(vulp)T2_TBASE1);#endif}static void __initt2_sg_map_window2(struct pci_controller *hose,		  unsigned long base,		  unsigned long length){	unsigned long temp;	/* Note we can only do 1 SG window, as the other is for direct, so	   do an ISA SG area, especially for the floppy. */	hose->sg_isa = iommu_arena_new(hose, base, length, 0);	hose->sg_pci = NULL;	temp = (base & 0xfff00000UL) | ((base + length - 1) >> 20);	*(vulp)T2_WBASE2 = temp | 0xc0000UL; /* OR in ENABLE/SG bits */	temp = (length - 1) & 0xfff00000UL;	*(vulp)T2_WMASK2 = temp;	*(vulp)T2_TBASE2 = virt_to_phys(hose->sg_isa->ptes) >> 1;	mb();	t2_pci_tbi(hose, 0, -1); /* flush TLB all */#if DEBUG_PRINT_FINAL_SETTINGS	printk("%s: setting WBASE2=0x%lx WMASK2=0x%lx TBASE2=0x%lx\n",	       __func__, *(vulp)T2_WBASE2, *(vulp)T2_WMASK2, *(vulp)T2_TBASE2);#endif}static void __initt2_save_configuration(void){#if DEBUG_PRINT_INITIAL_SETTINGS	printk("%s: HAE_1 was 0x%lx\n", __func__, srm_hae); /* HW is 0 */	printk("%s: HAE_2 was 0x%lx\n", __func__, *(vulp)T2_HAE_2);	printk("%s: HAE_3 was 0x%lx\n", __func__, *(vulp)T2_HAE_3);	printk("%s: HAE_4 was 0x%lx\n", __func__, *(vulp)T2_HAE_4);	printk("%s: HBASE was 0x%lx\n", __func__, *(vulp)T2_HBASE);	printk("%s: WBASE1=0x%lx WMASK1=0x%lx TBASE1=0x%lx\n", __func__,	       *(vulp)T2_WBASE1, *(vulp)T2_WMASK1, *(vulp)T2_TBASE1);	printk("%s: WBASE2=0x%lx WMASK2=0x%lx TBASE2=0x%lx\n", __func__,	       *(vulp)T2_WBASE2, *(vulp)T2_WMASK2, *(vulp)T2_TBASE2);#endif	/*	 * Save the DMA Window registers.	 */	t2_saved_config.window[0].wbase = *(vulp)T2_WBASE1;	t2_saved_config.window[0].wmask = *(vulp)T2_WMASK1;	t2_saved_config.window[0].tbase = *(vulp)T2_TBASE1;	t2_saved_config.window[1].wbase = *(vulp)T2_WBASE2;	t2_saved_config.window[1].wmask = *(vulp)T2_WMASK2;	t2_saved_config.window[1].tbase = *(vulp)T2_TBASE2;	t2_saved_config.hae_1 = srm_hae; /* HW is already set to 0 */	t2_saved_config.hae_2 = *(vulp)T2_HAE_2;	t2_saved_config.hae_3 = *(vulp)T2_HAE_3;	t2_saved_config.hae_4 = *(vulp)T2_HAE_4;	t2_saved_config.hbase = *(vulp)T2_HBASE;}void __initt2_init_arch(void){	struct pci_controller *hose;	struct resource *hae_mem;	unsigned long temp;	unsigned int i;	for (i = 0; i < NR_CPUS; i++) {		mcheck_expected(i) = 0;		mcheck_taken(i) = 0;	}	t2_mcheck_any_expected = 0;	t2_mcheck_last_taken = 0;	/* Enable scatter/gather TLB use.  */	temp = *(vulp)T2_IOCSR;	if (!(temp & (0x1UL << 26))) {		printk("t2_init_arch: enabling SG TLB, IOCSR was 0x%lx\n",		       temp);		*(vulp)T2_IOCSR = temp | (0x1UL << 26);		mb();			*(vulp)T2_IOCSR; /* read it back to make sure */	}	t2_save_configuration();	/*	 * Create our single hose.	 */	pci_isa_hose = hose = alloc_pci_controller();	hose->io_space = &ioport_resource;	hae_mem = alloc_resource();	hae_mem->start = 0;	hae_mem->end = T2_MEM_R1_MASK;	hae_mem->name = pci_hae0_name;	if (request_resource(&iomem_resource, hae_mem) < 0)		printk(KERN_ERR "Failed to request HAE_MEM\n");	hose->mem_space = hae_mem;	hose->index = 0;	hose->sparse_mem_base = T2_SPARSE_MEM - IDENT_ADDR;	hose->dense_mem_base = T2_DENSE_MEM - IDENT_ADDR;	hose->sparse_io_base = T2_IO - IDENT_ADDR;	hose->dense_io_base = 0;	/*	 * Set up the PCI->physical memory translation windows.	 *	 * Window 1 is direct mapped.	 * Window 2 is scatter/gather (for ISA).	 */	t2_direct_map_window1(T2_DIRECTMAP_START, T2_DIRECTMAP_LENGTH);	/* Always make an ISA DMA window. */	t2_sg_map_window2(hose, T2_ISA_SG_START, T2_ISA_SG_LENGTH);	*(vulp)T2_HBASE = 0x0; /* Disable HOLES. */	/* Zero HAE.  */	*(vulp)T2_HAE_1 = 0; mb(); /* Sparse MEM HAE */	*(vulp)T2_HAE_2 = 0; mb(); /* Sparse I/O HAE */	*(vulp)T2_HAE_3 = 0; mb(); /* Config Space HAE */	/*	 * We also now zero out HAE_4, the dense memory HAE, so that	 * we need not account for its "offset" when accessing dense	 * memory resources which we allocated in our normal way. This	 * HAE would need to stay untouched were we to keep the SRM	 * resource settings.	 *	 * Thus we can now run standard X servers on SABLE/LYNX. :-)	 */	*(vulp)T2_HAE_4 = 0; mb();}voidt2_kill_arch(int mode){	/*	 * Restore the DMA Window registers.	 */	*(vulp)T2_WBASE1 = t2_saved_config.window[0].wbase;	*(vulp)T2_WMASK1 = t2_saved_config.window[0].wmask;	*(vulp)T2_TBASE1 = t2_saved_config.window[0].tbase;	*(vulp)T2_WBASE2 = t2_saved_config.window[1].wbase;	*(vulp)T2_WMASK2 = t2_saved_config.window[1].wmask;	*(vulp)T2_TBASE2 = t2_saved_config.window[1].tbase;	mb();	*(vulp)T2_HAE_1 = srm_hae;	*(vulp)T2_HAE_2 = t2_saved_config.hae_2;	*(vulp)T2_HAE_3 = t2_saved_config.hae_3;	*(vulp)T2_HAE_4 = t2_saved_config.hae_4;	*(vulp)T2_HBASE = t2_saved_config.hbase;	mb();	*(vulp)T2_HBASE; /* READ it back to ensure WRITE occurred. */}voidt2_pci_tbi(struct pci_controller *hose, dma_addr_t start, dma_addr_t end){	unsigned long t2_iocsr;	t2_iocsr = *(vulp)T2_IOCSR;	/* set the TLB Clear bit */	*(vulp)T2_IOCSR = t2_iocsr | (0x1UL << 28);	mb();	*(vulp)T2_IOCSR; /* read it back to make sure */	/* clear the TLB Clear bit */
 |