/* * AMD K8 NUMA support. * Discover the memory map and associated nodes. * * Doesn't use the ACPI SRAT table because it has a questionable license. * Instead the northbridge registers are read directly. * * Copyright 2002 Andi Kleen, SuSE Labs. * $Id: k8topology.c,v 1.12 2004/01/29 00:51:01 ak Exp $ */ #include #include #include #include #include #include #include #include #include #include #include #define Dprintk(x...) int memnode_shift; u8 memnodemap[NODEMAPSIZE]; static __init int find_northbridge(void) { int num; for (num = 0; num < 32; num++) { u32 header; header = read_pci_config(0, num, 0, 0x00); if (header != (PCI_VENDOR_ID_AMD | (0x1100<<16))) continue; header = read_pci_config(0, num, 1, 0x00); if (header != (PCI_VENDOR_ID_AMD | (0x1101<<16))) continue; return num; } return -1; } #define MAXNODE 8 #define NODEMASK 0xff struct node { u64 start,end; }; #define for_all_nodes(n) \ for (n=0; n> shift] != 0xff && memnodemap[addr >> shift] != i) { printk("node %d shift %d addr %Lx conflict %d\n", i, shift, addr, memnodemap[addr>>shift]); goto next; } memnodemap[addr >> shift] = i; } } return shift; next: shift++; } memset(memnodemap,0,sizeof(*memnodemap) * NODEMAPSIZE); return -1; } extern unsigned long nodes_present; extern unsigned long end_pfn; int __init k8_scan_nodes(unsigned long start, unsigned long end) { unsigned long prevbase; struct node nodes[MAXNODE]; int nodeid, numnodes, maxnode, i, nb; nb = find_northbridge(); if (nb < 0) return nb; printk(KERN_INFO "Scanning NUMA topology in Northbridge %d\n", nb); numnodes = (read_pci_config(0, nb, 0, 0x60 ) >> 4) & 7; memset(&nodes,0,sizeof(nodes)); prevbase = 0; maxnode = -1; for (i = 0; i < MAXNODE; i++) { unsigned long base,limit; base = read_pci_config(0, nb, 1, 0x40 + i*8); limit = read_pci_config(0, nb, 1, 0x44 + i*8); nodeid = limit & 7; if ((base & 3) == 0) { continue; } if (!limit) { printk(KERN_INFO "Skipping node entry %d (base %lx)\n", i, base); continue; } if ((base >> 8) & 3 || (limit >> 8) & 3) { printk(KERN_ERR "Node %d using interleaving mode %lx/%lx\n", nodeid, (base>>8)&3, (limit>>8) & 3); return -1; } if (nodeid > maxnode) maxnode = nodeid; if ((1UL << nodeid) & nodes_present) { printk("Node %d already present. Skipping\n", nodeid); continue; } limit >>= 16; limit <<= 24; limit |= (1<<24)-1; if (limit > end_pfn << PAGE_SHIFT) limit = end_pfn << PAGE_SHIFT; if (limit <= base) continue; base >>= 16; base <<= 24; if (base < start) base = start; if (limit > end) limit = end; if (limit == base) continue; if (limit < base) { Dprintk(KERN_INFO"Node %d bogus settings %lx-%lx. Ignored.\n", nodeid, base, limit); continue; } /* Could sort here, but pun for now. Should not happen anyroads. */ if (prevbase > base) { printk(KERN_INFO "Node map not sorted %lx,%lx\n", prevbase,base); return -1; } printk(KERN_INFO "Node %d MemBase %016lx Limit %016lx\n", nodeid, base, limit); nodes[nodeid].start = base; nodes[nodeid].end = limit; prevbase = base; } if (maxnode <= 0) return -1; memnode_shift = compute_hash_shift(nodes,maxnode,end); if (memnode_shift < 0) { printk(KERN_ERR "No NUMA node hash function found. Contact maintainer\n"); return -1; } printk(KERN_INFO "Using node hash shift of %d\n", memnode_shift); for (i = 0; i < MAXNODE; i++) { if (nodes[i].start != nodes[i].end) setup_node_bootmem(i, nodes[i].start, nodes[i].end); } /* There are unfortunately some poorly designed mainboards around that only connect memory to a single CPU. This breaks the 1:1 cpu->node mapping. To avoid this fill in the mapping for all possible CPUs, as the number of CPUs is not known yet. We round robin the existing nodes. */ int rr = 0; for (i = 0; i < MAXNODE; i++) { if (nodes[i].start != nodes[i].end) continue; if ((nodes_present >> rr) == 0) rr = 0; rr += ffz(~nodes_present >> rr); PLAT_NODE_DATA(i) = PLAT_NODE_DATA(rr); rr++; } return 0; }