1/* 2 * srmmu.c: SRMMU specific routines for memory management. 3 * 4 * Copyright (C) 1995 David S. Miller (davem@caip.rutgers.edu) 5 * Copyright (C) 1995,2002 Pete Zaitcev (zaitcev@yahoo.com) 6 * Copyright (C) 1996 Eddie C. Dost (ecd@skynet.be) 7 * Copyright (C) 1997,1998 Jakub Jelinek (jj@sunsite.mff.cuni.cz) 8 * Copyright (C) 1999,2000 Anton Blanchard (anton@samba.org) 9 */ 10 11#include <linux/seq_file.h> 12#include <linux/spinlock.h> 13#include <linux/bootmem.h> 14#include <linux/pagemap.h> 15#include <linux/vmalloc.h> 16#include <linux/kdebug.h> 17#include <linux/export.h> 18#include <linux/kernel.h> 19#include <linux/init.h> 20#include <linux/log2.h> 21#include <linux/gfp.h> 22#include <linux/fs.h> 23#include <linux/mm.h> 24 25#include <asm/mmu_context.h> 26#include <asm/cacheflush.h> 27#include <asm/tlbflush.h> 28#include <asm/io-unit.h> 29#include <asm/pgalloc.h> 30#include <asm/pgtable.h> 31#include <asm/bitext.h> 32#include <asm/vaddrs.h> 33#include <asm/cache.h> 34#include <asm/traps.h> 35#include <asm/oplib.h> 36#include <asm/mbus.h> 37#include <asm/page.h> 38#include <asm/asi.h> 39#include <asm/msi.h> 40#include <asm/smp.h> 41#include <asm/io.h> 42 43/* Now the cpu specific definitions. */ 44#include <asm/turbosparc.h> 45#include <asm/tsunami.h> 46#include <asm/viking.h> 47#include <asm/swift.h> 48#include <asm/leon.h> 49#include <asm/mxcc.h> 50#include <asm/ross.h> 51 52#include "mm_32.h" 53 54enum mbus_module srmmu_modtype; 55static unsigned int hwbug_bitmask; 56int vac_cache_size; 57int vac_line_size; 58 59extern struct resource sparc_iomap; 60 61extern unsigned long last_valid_pfn; 62 63static pgd_t *srmmu_swapper_pg_dir; 64 65const struct sparc32_cachetlb_ops *sparc32_cachetlb_ops; 66EXPORT_SYMBOL(sparc32_cachetlb_ops); 67 68#ifdef CONFIG_SMP 69const struct sparc32_cachetlb_ops *local_ops; 70 71#define FLUSH_BEGIN(mm) 72#define FLUSH_END 73#else 74#define FLUSH_BEGIN(mm) if ((mm)->context != NO_CONTEXT) { 75#define FLUSH_END } 76#endif 77 78int flush_page_for_dma_global = 1; 79 80char *srmmu_name; 81 82ctxd_t *srmmu_ctx_table_phys; 83static ctxd_t *srmmu_context_table; 84 85int viking_mxcc_present; 86static DEFINE_SPINLOCK(srmmu_context_spinlock); 87 88static int is_hypersparc; 89 90static int srmmu_cache_pagetables; 91 92/* these will be initialized in srmmu_nocache_calcsize() */ 93static unsigned long srmmu_nocache_size; 94static unsigned long srmmu_nocache_end; 95 96/* 1 bit <=> 256 bytes of nocache <=> 64 PTEs */ 97#define SRMMU_NOCACHE_BITMAP_SHIFT (PAGE_SHIFT - 4) 98 99/* The context table is a nocache user with the biggest alignment needs. */ 100#define SRMMU_NOCACHE_ALIGN_MAX (sizeof(ctxd_t)*SRMMU_MAX_CONTEXTS) 101 102void *srmmu_nocache_pool; 103static struct bit_map srmmu_nocache_map; 104 105static inline int srmmu_pmd_none(pmd_t pmd) 106{ return !(pmd_val(pmd) & 0xFFFFFFF); } 107 108/* XXX should we hyper_flush_whole_icache here - Anton */ 109static inline void srmmu_ctxd_set(ctxd_t *ctxp, pgd_t *pgdp) 110{ set_pte((pte_t *)ctxp, (SRMMU_ET_PTD | (__nocache_pa((unsigned long) pgdp) >> 4))); } 111 112void pmd_set(pmd_t *pmdp, pte_t *ptep) 113{ 114 unsigned long ptp; /* Physical address, shifted right by 4 */ 115 int i; 116 117 ptp = __nocache_pa((unsigned long) ptep) >> 4; 118 for (i = 0; i < PTRS_PER_PTE/SRMMU_REAL_PTRS_PER_PTE; i++) { 119 set_pte((pte_t *)&pmdp->pmdv[i], SRMMU_ET_PTD | ptp); 120 ptp += (SRMMU_REAL_PTRS_PER_PTE*sizeof(pte_t) >> 4); 121 } 122} 123 124void pmd_populate(struct mm_struct *mm, pmd_t *pmdp, struct page *ptep) 125{ 126 unsigned long ptp; /* Physical address, shifted right by 4 */ 127 int i; 128 129 ptp = page_to_pfn(ptep) << (PAGE_SHIFT-4); /* watch for overflow */ 130 for (i = 0; i < PTRS_PER_PTE/SRMMU_REAL_PTRS_PER_PTE; i++) { 131 set_pte((pte_t *)&pmdp->pmdv[i], SRMMU_ET_PTD | ptp); 132 ptp += (SRMMU_REAL_PTRS_PER_PTE*sizeof(pte_t) >> 4); 133 } 134} 135 136/* Find an entry in the third-level page table.. */ 137pte_t *pte_offset_kernel(pmd_t *dir, unsigned long address) 138{ 139 void *pte; 140 141 pte = __nocache_va((dir->pmdv[0] & SRMMU_PTD_PMASK) << 4); 142 return (pte_t *) pte + 143 ((address >> PAGE_SHIFT) & (PTRS_PER_PTE - 1)); 144} 145 146/* 147 * size: bytes to allocate in the nocache area. 148 * align: bytes, number to align at. 149 * Returns the virtual address of the allocated area. 150 */ 151static void *__srmmu_get_nocache(int size, int align) 152{ 153 int offset; 154 unsigned long addr; 155 156 if (size < SRMMU_NOCACHE_BITMAP_SHIFT) { 157 printk(KERN_ERR "Size 0x%x too small for nocache request\n", 158 size); 159 size = SRMMU_NOCACHE_BITMAP_SHIFT; 160 } 161 if (size & (SRMMU_NOCACHE_BITMAP_SHIFT - 1)) { 162 printk(KERN_ERR "Size 0x%x unaligned int nocache request\n", 163 size); 164 size += SRMMU_NOCACHE_BITMAP_SHIFT - 1; 165 } 166 BUG_ON(align > SRMMU_NOCACHE_ALIGN_MAX); 167 168 offset = bit_map_string_get(&srmmu_nocache_map, 169 size >> SRMMU_NOCACHE_BITMAP_SHIFT, 170 align >> SRMMU_NOCACHE_BITMAP_SHIFT); 171 if (offset == -1) { 172 printk(KERN_ERR "srmmu: out of nocache %d: %d/%d\n", 173 size, (int) srmmu_nocache_size, 174 srmmu_nocache_map.used << SRMMU_NOCACHE_BITMAP_SHIFT); 175 return NULL; 176 } 177 178 addr = SRMMU_NOCACHE_VADDR + (offset << SRMMU_NOCACHE_BITMAP_SHIFT); 179 return (void *)addr; 180} 181 182void *srmmu_get_nocache(int size, int align) 183{ 184 void *tmp; 185 186 tmp = __srmmu_get_nocache(size, align); 187 188 if (tmp) 189 memset(tmp, 0, size); 190 191 return tmp; 192} 193 194void srmmu_free_nocache(void *addr, int size) 195{ 196 unsigned long vaddr; 197 int offset; 198 199 vaddr = (unsigned long)addr; 200 if (vaddr < SRMMU_NOCACHE_VADDR) { 201 printk("Vaddr %lx is smaller than nocache base 0x%lx\n", 202 vaddr, (unsigned long)SRMMU_NOCACHE_VADDR); 203 BUG(); 204 } 205 if (vaddr + size > srmmu_nocache_end) { 206 printk("Vaddr %lx is bigger than nocache end 0x%lx\n", 207 vaddr, srmmu_nocache_end); 208 BUG(); 209 } 210 if (!is_power_of_2(size)) { 211 printk("Size 0x%x is not a power of 2\n", size); 212 BUG(); 213 } 214 if (size < SRMMU_NOCACHE_BITMAP_SHIFT) { 215 printk("Size 0x%x is too small\n", size); 216 BUG(); 217 } 218 if (vaddr & (size - 1)) { 219 printk("Vaddr %lx is not aligned to size 0x%x\n", vaddr, size); 220 BUG(); 221 } 222 223 offset = (vaddr - SRMMU_NOCACHE_VADDR) >> SRMMU_NOCACHE_BITMAP_SHIFT; 224 size = size >> SRMMU_NOCACHE_BITMAP_SHIFT; 225 226 bit_map_clear(&srmmu_nocache_map, offset, size); 227} 228 229static void srmmu_early_allocate_ptable_skeleton(unsigned long start, 230 unsigned long end); 231 232/* Return how much physical memory we have. */ 233static unsigned long __init probe_memory(void) 234{ 235 unsigned long total = 0; 236 int i; 237 238 for (i = 0; sp_banks[i].num_bytes; i++) 239 total += sp_banks[i].num_bytes; 240 241 return total; 242} 243 244/* 245 * Reserve nocache dynamically proportionally to the amount of 246 * system RAM. -- Tomas Szepe <szepe@pinerecords.com>, June 2002 247 */ 248static void __init srmmu_nocache_calcsize(void) 249{ 250 unsigned long sysmemavail = probe_memory() / 1024; 251 int srmmu_nocache_npages; 252 253 srmmu_nocache_npages = 254 sysmemavail / SRMMU_NOCACHE_ALCRATIO / 1024 * 256; 255 256 /* P3 XXX The 4x overuse: corroborated by /proc/meminfo. */ 257 // if (srmmu_nocache_npages < 256) srmmu_nocache_npages = 256; 258 if (srmmu_nocache_npages < SRMMU_MIN_NOCACHE_PAGES) 259 srmmu_nocache_npages = SRMMU_MIN_NOCACHE_PAGES; 260 261 /* anything above 1280 blows up */ 262 if (srmmu_nocache_npages > SRMMU_MAX_NOCACHE_PAGES) 263 srmmu_nocache_npages = SRMMU_MAX_NOCACHE_PAGES; 264 265 srmmu_nocache_size = srmmu_nocache_npages * PAGE_SIZE; 266 srmmu_nocache_end = SRMMU_NOCACHE_VADDR + srmmu_nocache_size; 267} 268 269static void __init srmmu_nocache_init(void) 270{ 271 void *srmmu_nocache_bitmap; 272 unsigned int bitmap_bits; 273 pgd_t *pgd; 274 pmd_t *pmd; 275 pte_t *pte; 276 unsigned long paddr, vaddr; 277 unsigned long pteval; 278 279 bitmap_bits = srmmu_nocache_size >> SRMMU_NOCACHE_BITMAP_SHIFT; 280 281 srmmu_nocache_pool = __alloc_bootmem(srmmu_nocache_size, 282 SRMMU_NOCACHE_ALIGN_MAX, 0UL); 283 memset(srmmu_nocache_pool, 0, srmmu_nocache_size); 284 285 srmmu_nocache_bitmap = 286 __alloc_bootmem(BITS_TO_LONGS(bitmap_bits) * sizeof(long), 287 SMP_CACHE_BYTES, 0UL); 288 bit_map_init(&srmmu_nocache_map, srmmu_nocache_bitmap, bitmap_bits); 289 290 srmmu_swapper_pg_dir = __srmmu_get_nocache(SRMMU_PGD_TABLE_SIZE, SRMMU_PGD_TABLE_SIZE); 291 memset(__nocache_fix(srmmu_swapper_pg_dir), 0, SRMMU_PGD_TABLE_SIZE); 292 init_mm.pgd = srmmu_swapper_pg_dir; 293 294 srmmu_early_allocate_ptable_skeleton(SRMMU_NOCACHE_VADDR, srmmu_nocache_end); 295 296 paddr = __pa((unsigned long)srmmu_nocache_pool); 297 vaddr = SRMMU_NOCACHE_VADDR; 298 299 while (vaddr < srmmu_nocache_end) { 300 pgd = pgd_offset_k(vaddr); 301 pmd = pmd_offset(__nocache_fix(pgd), vaddr); 302 pte = pte_offset_kernel(__nocache_fix(pmd), vaddr); 303 304 pteval = ((paddr >> 4) | SRMMU_ET_PTE | SRMMU_PRIV); 305 306 if (srmmu_cache_pagetables) 307 pteval |= SRMMU_CACHE; 308 309 set_pte(__nocache_fix(pte), __pte(pteval)); 310 311 vaddr += PAGE_SIZE; 312 paddr += PAGE_SIZE; 313 } 314 315 flush_cache_all(); 316 flush_tlb_all(); 317} 318 319pgd_t *get_pgd_fast(void) 320{ 321 pgd_t *pgd = NULL; 322 323 pgd = __srmmu_get_nocache(SRMMU_PGD_TABLE_SIZE, SRMMU_PGD_TABLE_SIZE); 324 if (pgd) { 325 pgd_t *init = pgd_offset_k(0); 326 memset(pgd, 0, USER_PTRS_PER_PGD * sizeof(pgd_t)); 327 memcpy(pgd + USER_PTRS_PER_PGD, init + USER_PTRS_PER_PGD, 328 (PTRS_PER_PGD - USER_PTRS_PER_PGD) * sizeof(pgd_t)); 329 } 330 331 return pgd; 332} 333 334/* 335 * Hardware needs alignment to 256 only, but we align to whole page size 336 * to reduce fragmentation problems due to the buddy principle. 337 * XXX Provide actual fragmentation statistics in /proc. 338 * 339 * Alignments up to the page size are the same for physical and virtual 340 * addresses of the nocache area. 341 */ 342pgtable_t pte_alloc_one(struct mm_struct *mm, unsigned long address) 343{ 344 unsigned long pte; 345 struct page *page; 346 347 if ((pte = (unsigned long)pte_alloc_one_kernel(mm, address)) == 0) 348 return NULL; 349 page = pfn_to_page(__nocache_pa(pte) >> PAGE_SHIFT); 350 if (!pgtable_page_ctor(page)) { 351 __free_page(page); 352 return NULL; 353 } 354 return page; 355} 356 357void pte_free(struct mm_struct *mm, pgtable_t pte) 358{ 359 unsigned long p; 360 361 pgtable_page_dtor(pte); 362 p = (unsigned long)page_address(pte); /* Cached address (for test) */ 363 if (p == 0) 364 BUG(); 365 p = page_to_pfn(pte) << PAGE_SHIFT; /* Physical address */ 366 367 /* free non cached virtual address*/ 368 srmmu_free_nocache(__nocache_va(p), PTE_SIZE); 369} 370 371/* context handling - a dynamically sized pool is used */ 372#define NO_CONTEXT -1 373 374struct ctx_list { 375 struct ctx_list *next; 376 struct ctx_list *prev; 377 unsigned int ctx_number; 378 struct mm_struct *ctx_mm; 379}; 380 381static struct ctx_list *ctx_list_pool; 382static struct ctx_list ctx_free; 383static struct ctx_list ctx_used; 384 385/* At boot time we determine the number of contexts */ 386static int num_contexts; 387 388static inline void remove_from_ctx_list(struct ctx_list *entry) 389{ 390 entry->next->prev = entry->prev; 391 entry->prev->next = entry->next; 392} 393 394static inline void add_to_ctx_list(struct ctx_list *head, struct ctx_list *entry) 395{ 396 entry->next = head; 397 (entry->prev = head->prev)->next = entry; 398 head->prev = entry; 399} 400#define add_to_free_ctxlist(entry) add_to_ctx_list(&ctx_free, entry) 401#define add_to_used_ctxlist(entry) add_to_ctx_list(&ctx_used, entry) 402 403 404static inline void alloc_context(struct mm_struct *old_mm, struct mm_struct *mm) 405{ 406 struct ctx_list *ctxp; 407 408 ctxp = ctx_free.next; 409 if (ctxp != &ctx_free) { 410 remove_from_ctx_list(ctxp); 411 add_to_used_ctxlist(ctxp); 412 mm->context = ctxp->ctx_number; 413 ctxp->ctx_mm = mm; 414 return; 415 } 416 ctxp = ctx_used.next; 417 if (ctxp->ctx_mm == old_mm) 418 ctxp = ctxp->next; 419 if (ctxp == &ctx_used) 420 panic("out of mmu contexts"); 421 flush_cache_mm(ctxp->ctx_mm); 422 flush_tlb_mm(ctxp->ctx_mm); 423 remove_from_ctx_list(ctxp); 424 add_to_used_ctxlist(ctxp); 425 ctxp->ctx_mm->context = NO_CONTEXT; 426 ctxp->ctx_mm = mm; 427 mm->context = ctxp->ctx_number; 428} 429 430static inline void free_context(int context) 431{ 432 struct ctx_list *ctx_old; 433 434 ctx_old = ctx_list_pool + context; 435 remove_from_ctx_list(ctx_old); 436 add_to_free_ctxlist(ctx_old); 437} 438 439static void __init sparc_context_init(int numctx) 440{ 441 int ctx; 442 unsigned long size; 443 444 size = numctx * sizeof(struct ctx_list); 445 ctx_list_pool = __alloc_bootmem(size, SMP_CACHE_BYTES, 0UL); 446 447 for (ctx = 0; ctx < numctx; ctx++) { 448 struct ctx_list *clist; 449 450 clist = (ctx_list_pool + ctx); 451 clist->ctx_number = ctx; 452 clist->ctx_mm = NULL; 453 } 454 ctx_free.next = ctx_free.prev = &ctx_free; 455 ctx_used.next = ctx_used.prev = &ctx_used; 456 for (ctx = 0; ctx < numctx; ctx++) 457 add_to_free_ctxlist(ctx_list_pool + ctx); 458} 459 460void switch_mm(struct mm_struct *old_mm, struct mm_struct *mm, 461 struct task_struct *tsk) 462{ 463 unsigned long flags; 464 465 if (mm->context == NO_CONTEXT) { 466 spin_lock_irqsave(&srmmu_context_spinlock, flags); 467 alloc_context(old_mm, mm); 468 spin_unlock_irqrestore(&srmmu_context_spinlock, flags); 469 srmmu_ctxd_set(&srmmu_context_table[mm->context], mm->pgd); 470 } 471 472 if (sparc_cpu_model == sparc_leon) 473 leon_switch_mm(); 474 475 if (is_hypersparc) 476 hyper_flush_whole_icache(); 477 478 srmmu_set_context(mm->context); 479} 480 481/* Low level IO area allocation on the SRMMU. */ 482static inline void srmmu_mapioaddr(unsigned long physaddr, 483 unsigned long virt_addr, int bus_type) 484{ 485 pgd_t *pgdp; 486 pmd_t *pmdp; 487 pte_t *ptep; 488 unsigned long tmp; 489 490 physaddr &= PAGE_MASK; 491 pgdp = pgd_offset_k(virt_addr); 492 pmdp = pmd_offset(pgdp, virt_addr); 493 ptep = pte_offset_kernel(pmdp, virt_addr); 494 tmp = (physaddr >> 4) | SRMMU_ET_PTE; 495 496 /* I need to test whether this is consistent over all 497 * sun4m's. The bus_type represents the upper 4 bits of 498 * 36-bit physical address on the I/O space lines... 499 */ 500 tmp |= (bus_type << 28); 501 tmp |= SRMMU_PRIV; 502 __flush_page_to_ram(virt_addr); 503 set_pte(ptep, __pte(tmp)); 504} 505 506void srmmu_mapiorange(unsigned int bus, unsigned long xpa, 507 unsigned long xva, unsigned int len) 508{ 509 while (len != 0) { 510 len -= PAGE_SIZE; 511 srmmu_mapioaddr(xpa, xva, bus); 512 xva += PAGE_SIZE; 513 xpa += PAGE_SIZE; 514 } 515 flush_tlb_all(); 516} 517 518static inline void srmmu_unmapioaddr(unsigned long virt_addr) 519{ 520 pgd_t *pgdp; 521 pmd_t *pmdp; 522 pte_t *ptep; 523 524 pgdp = pgd_offset_k(virt_addr); 525 pmdp = pmd_offset(pgdp, virt_addr); 526 ptep = pte_offset_kernel(pmdp, virt_addr); 527 528 /* No need to flush uncacheable page. */ 529 __pte_clear(ptep); 530} 531 532void srmmu_unmapiorange(unsigned long virt_addr, unsigned int len) 533{ 534 while (len != 0) { 535 len -= PAGE_SIZE; 536 srmmu_unmapioaddr(virt_addr); 537 virt_addr += PAGE_SIZE; 538 } 539 flush_tlb_all(); 540} 541 542/* tsunami.S */ 543extern void tsunami_flush_cache_all(void); 544extern void tsunami_flush_cache_mm(struct mm_struct *mm); 545extern void tsunami_flush_cache_range(struct vm_area_struct *vma, unsigned long start, unsigned long end); 546extern void tsunami_flush_cache_page(struct vm_area_struct *vma, unsigned long page); 547extern void tsunami_flush_page_to_ram(unsigned long page); 548extern void tsunami_flush_page_for_dma(unsigned long page); 549extern void tsunami_flush_sig_insns(struct mm_struct *mm, unsigned long insn_addr); 550extern void tsunami_flush_tlb_all(void); 551extern void tsunami_flush_tlb_mm(struct mm_struct *mm); 552extern void tsunami_flush_tlb_range(struct vm_area_struct *vma, unsigned long start, unsigned long end); 553extern void tsunami_flush_tlb_page(struct vm_area_struct *vma, unsigned long page); 554extern void tsunami_setup_blockops(void); 555 556/* swift.S */ 557extern void swift_flush_cache_all(void); 558extern void swift_flush_cache_mm(struct mm_struct *mm); 559extern void swift_flush_cache_range(struct vm_area_struct *vma, 560 unsigned long start, unsigned long end); 561extern void swift_flush_cache_page(struct vm_area_struct *vma, unsigned long page); 562extern void swift_flush_page_to_ram(unsigned long page); 563extern void swift_flush_page_for_dma(unsigned long page); 564extern void swift_flush_sig_insns(struct mm_struct *mm, unsigned long insn_addr); 565extern void swift_flush_tlb_all(void); 566extern void swift_flush_tlb_mm(struct mm_struct *mm); 567extern void swift_flush_tlb_range(struct vm_area_struct *vma, 568 unsigned long start, unsigned long end); 569extern void swift_flush_tlb_page(struct vm_area_struct *vma, unsigned long page); 570 571#if 0 /* P3: deadwood to debug precise flushes on Swift. */ 572void swift_flush_tlb_page(struct vm_area_struct *vma, unsigned long page) 573{ 574 int cctx, ctx1; 575 576 page &= PAGE_MASK; 577 if ((ctx1 = vma->vm_mm->context) != -1) { 578 cctx = srmmu_get_context(); 579/* Is context # ever different from current context? P3 */ 580 if (cctx != ctx1) { 581 printk("flush ctx %02x curr %02x\n", ctx1, cctx); 582 srmmu_set_context(ctx1); 583 swift_flush_page(page); 584 __asm__ __volatile__("sta %%g0, [%0] %1\n\t" : : 585 "r" (page), "i" (ASI_M_FLUSH_PROBE)); 586 srmmu_set_context(cctx); 587 } else { 588 /* Rm. prot. bits from virt. c. */ 589 /* swift_flush_cache_all(); */ 590 /* swift_flush_cache_page(vma, page); */ 591 swift_flush_page(page); 592 593 __asm__ __volatile__("sta %%g0, [%0] %1\n\t" : : 594 "r" (page), "i" (ASI_M_FLUSH_PROBE)); 595 /* same as above: srmmu_flush_tlb_page() */ 596 } 597 } 598} 599#endif 600 601/* 602 * The following are all MBUS based SRMMU modules, and therefore could 603 * be found in a multiprocessor configuration. On the whole, these 604 * chips seems to be much more touchy about DVMA and page tables 605 * with respect to cache coherency. 606 */ 607 608/* viking.S */ 609extern void viking_flush_cache_all(void); 610extern void viking_flush_cache_mm(struct mm_struct *mm); 611extern void viking_flush_cache_range(struct vm_area_struct *vma, unsigned long start, 612 unsigned long end); 613extern void viking_flush_cache_page(struct vm_area_struct *vma, unsigned long page); 614extern void viking_flush_page_to_ram(unsigned long page); 615extern void viking_flush_page_for_dma(unsigned long page); 616extern void viking_flush_sig_insns(struct mm_struct *mm, unsigned long addr); 617extern void viking_flush_page(unsigned long page); 618extern void viking_mxcc_flush_page(unsigned long page); 619extern void viking_flush_tlb_all(void); 620extern void viking_flush_tlb_mm(struct mm_struct *mm); 621extern void viking_flush_tlb_range(struct vm_area_struct *vma, unsigned long start, 622 unsigned long end); 623extern void viking_flush_tlb_page(struct vm_area_struct *vma, 624 unsigned long page); 625extern void sun4dsmp_flush_tlb_all(void); 626extern void sun4dsmp_flush_tlb_mm(struct mm_struct *mm); 627extern void sun4dsmp_flush_tlb_range(struct vm_area_struct *vma, unsigned long start, 628 unsigned long end); 629extern void sun4dsmp_flush_tlb_page(struct vm_area_struct *vma, 630 unsigned long page); 631 632/* hypersparc.S */ 633extern void hypersparc_flush_cache_all(void); 634extern void hypersparc_flush_cache_mm(struct mm_struct *mm); 635extern void hypersparc_flush_cache_range(struct vm_area_struct *vma, unsigned long start, unsigned long end); 636extern void hypersparc_flush_cache_page(struct vm_area_struct *vma, unsigned long page); 637extern void hypersparc_flush_page_to_ram(unsigned long page); 638extern void hypersparc_flush_page_for_dma(unsigned long page); 639extern void hypersparc_flush_sig_insns(struct mm_struct *mm, unsigned long insn_addr); 640extern void hypersparc_flush_tlb_all(void); 641extern void hypersparc_flush_tlb_mm(struct mm_struct *mm); 642extern void hypersparc_flush_tlb_range(struct vm_area_struct *vma, unsigned long start, unsigned long end); 643extern void hypersparc_flush_tlb_page(struct vm_area_struct *vma, unsigned long page); 644extern void hypersparc_setup_blockops(void); 645 646/* 647 * NOTE: All of this startup code assumes the low 16mb (approx.) of 648 * kernel mappings are done with one single contiguous chunk of 649 * ram. On small ram machines (classics mainly) we only get 650 * around 8mb mapped for us. 651 */ 652 653static void __init early_pgtable_allocfail(char *type) 654{ 655 prom_printf("inherit_prom_mappings: Cannot alloc kernel %s.\n", type); 656 prom_halt(); 657} 658 659static void __init srmmu_early_allocate_ptable_skeleton(unsigned long start, 660 unsigned long end) 661{ 662 pgd_t *pgdp; 663 pmd_t *pmdp; 664 pte_t *ptep; 665 666 while (start < end) { 667 pgdp = pgd_offset_k(start); 668 if (pgd_none(*(pgd_t *)__nocache_fix(pgdp))) { 669 pmdp = __srmmu_get_nocache( 670 SRMMU_PMD_TABLE_SIZE, SRMMU_PMD_TABLE_SIZE); 671 if (pmdp == NULL) 672 early_pgtable_allocfail("pmd"); 673 memset(__nocache_fix(pmdp), 0, SRMMU_PMD_TABLE_SIZE); 674 pgd_set(__nocache_fix(pgdp), pmdp); 675 } 676 pmdp = pmd_offset(__nocache_fix(pgdp), start); 677 if (srmmu_pmd_none(*(pmd_t *)__nocache_fix(pmdp))) { 678 ptep = __srmmu_get_nocache(PTE_SIZE, PTE_SIZE); 679 if (ptep == NULL) 680 early_pgtable_allocfail("pte"); 681 memset(__nocache_fix(ptep), 0, PTE_SIZE); 682 pmd_set(__nocache_fix(pmdp), ptep); 683 } 684 if (start > (0xffffffffUL - PMD_SIZE)) 685 break; 686 start = (start + PMD_SIZE) & PMD_MASK; 687 } 688} 689 690static void __init srmmu_allocate_ptable_skeleton(unsigned long start, 691 unsigned long end) 692{ 693 pgd_t *pgdp; 694 pmd_t *pmdp; 695 pte_t *ptep; 696 697 while (start < end) { 698 pgdp = pgd_offset_k(start); 699 if (pgd_none(*pgdp)) { 700 pmdp = __srmmu_get_nocache(SRMMU_PMD_TABLE_SIZE, SRMMU_PMD_TABLE_SIZE); 701 if (pmdp == NULL) 702 early_pgtable_allocfail("pmd"); 703 memset(pmdp, 0, SRMMU_PMD_TABLE_SIZE); 704 pgd_set(pgdp, pmdp); 705 } 706 pmdp = pmd_offset(pgdp, start); 707 if (srmmu_pmd_none(*pmdp)) { 708 ptep = __srmmu_get_nocache(PTE_SIZE, 709 PTE_SIZE); 710 if (ptep == NULL) 711 early_pgtable_allocfail("pte"); 712 memset(ptep, 0, PTE_SIZE); 713 pmd_set(pmdp, ptep); 714 } 715 if (start > (0xffffffffUL - PMD_SIZE)) 716 break; 717 start = (start + PMD_SIZE) & PMD_MASK; 718 } 719} 720 721/* These flush types are not available on all chips... */ 722static inline unsigned long srmmu_probe(unsigned long vaddr) 723{ 724 unsigned long retval; 725 726 if (sparc_cpu_model != sparc_leon) { 727 728 vaddr &= PAGE_MASK; 729 __asm__ __volatile__("lda [%1] %2, %0\n\t" : 730 "=r" (retval) : 731 "r" (vaddr | 0x400), "i" (ASI_M_FLUSH_PROBE)); 732 } else { 733 retval = leon_swprobe(vaddr, NULL); 734 } 735 return retval; 736} 737 738/* 739 * This is much cleaner than poking around physical address space 740 * looking at the prom's page table directly which is what most 741 * other OS's do. Yuck... this is much better. 742 */ 743static void __init srmmu_inherit_prom_mappings(unsigned long start, 744 unsigned long end) 745{ 746 unsigned long probed; 747 unsigned long addr; 748 pgd_t *pgdp; 749 pmd_t *pmdp; 750 pte_t *ptep; 751 int what; /* 0 = normal-pte, 1 = pmd-level pte, 2 = pgd-level pte */ 752 753 while (start <= end) { 754 if (start == 0) 755 break; /* probably wrap around */ 756 if (start == 0xfef00000) 757 start = KADB_DEBUGGER_BEGVM; 758 probed = srmmu_probe(start); 759 if (!probed) { 760 /* continue probing until we find an entry */ 761 start += PAGE_SIZE; 762 continue; 763 } 764 765 /* A red snapper, see what it really is. */ 766 what = 0; 767 addr = start - PAGE_SIZE; 768 769 if (!(start & ~(SRMMU_REAL_PMD_MASK))) { 770 if (srmmu_probe(addr + SRMMU_REAL_PMD_SIZE) == probed) 771 what = 1; 772 } 773 774 if (!(start & ~(SRMMU_PGDIR_MASK))) { 775 if (srmmu_probe(addr + SRMMU_PGDIR_SIZE) == probed) 776 what = 2; 777 } 778 779 pgdp = pgd_offset_k(start); 780 if (what == 2) { 781 *(pgd_t *)__nocache_fix(pgdp) = __pgd(probed); 782 start += SRMMU_PGDIR_SIZE; 783 continue; 784 } 785 if (pgd_none(*(pgd_t *)__nocache_fix(pgdp))) { 786 pmdp = __srmmu_get_nocache(SRMMU_PMD_TABLE_SIZE, 787 SRMMU_PMD_TABLE_SIZE); 788 if (pmdp == NULL) 789 early_pgtable_allocfail("pmd"); 790 memset(__nocache_fix(pmdp), 0, SRMMU_PMD_TABLE_SIZE); 791 pgd_set(__nocache_fix(pgdp), pmdp); 792 } 793 pmdp = pmd_offset(__nocache_fix(pgdp), start); 794 if (srmmu_pmd_none(*(pmd_t *)__nocache_fix(pmdp))) { 795 ptep = __srmmu_get_nocache(PTE_SIZE, PTE_SIZE); 796 if (ptep == NULL) 797 early_pgtable_allocfail("pte"); 798 memset(__nocache_fix(ptep), 0, PTE_SIZE); 799 pmd_set(__nocache_fix(pmdp), ptep); 800 } 801 if (what == 1) { 802 /* We bend the rule where all 16 PTPs in a pmd_t point 803 * inside the same PTE page, and we leak a perfectly 804 * good hardware PTE piece. Alternatives seem worse. 805 */ 806 unsigned int x; /* Index of HW PMD in soft cluster */ 807 unsigned long *val; 808 x = (start >> PMD_SHIFT) & 15; 809 val = &pmdp->pmdv[x]; 810 *(unsigned long *)__nocache_fix(val) = probed; 811 start += SRMMU_REAL_PMD_SIZE; 812 continue; 813 } 814 ptep = pte_offset_kernel(__nocache_fix(pmdp), start); 815 *(pte_t *)__nocache_fix(ptep) = __pte(probed); 816 start += PAGE_SIZE; 817 } 818} 819 820#define KERNEL_PTE(page_shifted) ((page_shifted)|SRMMU_CACHE|SRMMU_PRIV|SRMMU_VALID) 821 822/* Create a third-level SRMMU 16MB page mapping. */ 823static void __init do_large_mapping(unsigned long vaddr, unsigned long phys_base) 824{ 825 pgd_t *pgdp = pgd_offset_k(vaddr); 826 unsigned long big_pte; 827 828 big_pte = KERNEL_PTE(phys_base >> 4); 829 *(pgd_t *)__nocache_fix(pgdp) = __pgd(big_pte); 830} 831 832/* Map sp_bank entry SP_ENTRY, starting at virtual address VBASE. */ 833static unsigned long __init map_spbank(unsigned long vbase, int sp_entry) 834{ 835 unsigned long pstart = (sp_banks[sp_entry].base_addr & SRMMU_PGDIR_MASK); 836 unsigned long vstart = (vbase & SRMMU_PGDIR_MASK); 837 unsigned long vend = SRMMU_PGDIR_ALIGN(vbase + sp_banks[sp_entry].num_bytes); 838 /* Map "low" memory only */ 839 const unsigned long min_vaddr = PAGE_OFFSET; 840 const unsigned long max_vaddr = PAGE_OFFSET + SRMMU_MAXMEM; 841 842 if (vstart < min_vaddr || vstart >= max_vaddr) 843 return vstart; 844 845 if (vend > max_vaddr || vend < min_vaddr) 846 vend = max_vaddr; 847 848 while (vstart < vend) { 849 do_large_mapping(vstart, pstart); 850 vstart += SRMMU_PGDIR_SIZE; pstart += SRMMU_PGDIR_SIZE; 851 } 852 return vstart; 853} 854 855static void __init map_kernel(void) 856{ 857 int i; 858 859 if (phys_base > 0) { 860 do_large_mapping(PAGE_OFFSET, phys_base); 861 } 862 863 for (i = 0; sp_banks[i].num_bytes != 0; i++) { 864 map_spbank((unsigned long)__va(sp_banks[i].base_addr), i); 865 } 866} 867 868void (*poke_srmmu)(void) = NULL; 869 870void __init srmmu_paging_init(void) 871{ 872 int i; 873 phandle cpunode; 874 char node_str[128]; 875 pgd_t *pgd; 876 pmd_t *pmd; 877 pte_t *pte; 878 unsigned long pages_avail; 879 880 init_mm.context = (unsigned long) NO_CONTEXT; 881 sparc_iomap.start = SUN4M_IOBASE_VADDR; /* 16MB of IOSPACE on all sun4m's. */ 882 883 if (sparc_cpu_model == sun4d) 884 num_contexts = 65536; /* We know it is Viking */ 885 else { 886 /* Find the number of contexts on the srmmu. */ 887 cpunode = prom_getchild(prom_root_node); 888 num_contexts = 0; 889 while (cpunode != 0) { 890 prom_getstring(cpunode, "device_type", node_str, sizeof(node_str)); 891 if (!strcmp(node_str, "cpu")) { 892 num_contexts = prom_getintdefault(cpunode, "mmu-nctx", 0x8); 893 break; 894 } 895 cpunode = prom_getsibling(cpunode); 896 } 897 } 898 899 if (!num_contexts) { 900 prom_printf("Something wrong, can't find cpu node in paging_init.\n"); 901 prom_halt(); 902 } 903 904 pages_avail = 0; 905 last_valid_pfn = bootmem_init(&pages_avail); 906 907 srmmu_nocache_calcsize(); 908 srmmu_nocache_init(); 909 srmmu_inherit_prom_mappings(0xfe400000, (LINUX_OPPROM_ENDVM - PAGE_SIZE)); 910 map_kernel(); 911 912 /* ctx table has to be physically aligned to its size */ 913 srmmu_context_table = __srmmu_get_nocache(num_contexts * sizeof(ctxd_t), num_contexts * sizeof(ctxd_t)); 914 srmmu_ctx_table_phys = (ctxd_t *)__nocache_pa((unsigned long)srmmu_context_table); 915 916 for (i = 0; i < num_contexts; i++) 917 srmmu_ctxd_set((ctxd_t *)__nocache_fix(&srmmu_context_table[i]), srmmu_swapper_pg_dir); 918 919 flush_cache_all(); 920 srmmu_set_ctable_ptr((unsigned long)srmmu_ctx_table_phys); 921#ifdef CONFIG_SMP 922 /* Stop from hanging here... */ 923 local_ops->tlb_all(); 924#else 925 flush_tlb_all(); 926#endif 927 poke_srmmu(); 928 929 srmmu_allocate_ptable_skeleton(sparc_iomap.start, IOBASE_END); 930 srmmu_allocate_ptable_skeleton(DVMA_VADDR, DVMA_END); 931 932 srmmu_allocate_ptable_skeleton( 933 __fix_to_virt(__end_of_fixed_addresses - 1), FIXADDR_TOP); 934 srmmu_allocate_ptable_skeleton(PKMAP_BASE, PKMAP_END); 935 936 pgd = pgd_offset_k(PKMAP_BASE); 937 pmd = pmd_offset(pgd, PKMAP_BASE); 938 pte = pte_offset_kernel(pmd, PKMAP_BASE); 939 pkmap_page_table = pte; 940 941 flush_cache_all(); 942 flush_tlb_all(); 943 944 sparc_context_init(num_contexts); 945 946 kmap_init(); 947 948 { 949 unsigned long zones_size[MAX_NR_ZONES]; 950 unsigned long zholes_size[MAX_NR_ZONES]; 951 unsigned long npages; 952 int znum; 953 954 for (znum = 0; znum < MAX_NR_ZONES; znum++) 955 zones_size[znum] = zholes_size[znum] = 0; 956 957 npages = max_low_pfn - pfn_base; 958 959 zones_size[ZONE_DMA] = npages; 960 zholes_size[ZONE_DMA] = npages - pages_avail; 961 962 npages = highend_pfn - max_low_pfn; 963 zones_size[ZONE_HIGHMEM] = npages; 964 zholes_size[ZONE_HIGHMEM] = npages - calc_highpages(); 965 966 free_area_init_node(0, zones_size, pfn_base, zholes_size); 967 } 968} 969 970void mmu_info(struct seq_file *m) 971{ 972 seq_printf(m, 973 "MMU type\t: %s\n" 974 "contexts\t: %d\n" 975 "nocache total\t: %ld\n" 976 "nocache used\t: %d\n", 977 srmmu_name, 978 num_contexts, 979 srmmu_nocache_size, 980 srmmu_nocache_map.used << SRMMU_NOCACHE_BITMAP_SHIFT); 981} 982 983int init_new_context(struct task_struct *tsk, struct mm_struct *mm) 984{ 985 mm->context = NO_CONTEXT; 986 return 0; 987} 988 989void destroy_context(struct mm_struct *mm) 990{ 991 unsigned long flags; 992 993 if (mm->context != NO_CONTEXT) { 994 flush_cache_mm(mm); 995 srmmu_ctxd_set(&srmmu_context_table[mm->context], srmmu_swapper_pg_dir); 996 flush_tlb_mm(mm); 997 spin_lock_irqsave(&srmmu_context_spinlock, flags); 998 free_context(mm->context); 999 spin_unlock_irqrestore(&srmmu_context_spinlock, flags); 1000 mm->context = NO_CONTEXT; 1001 } 1002} 1003 1004/* Init various srmmu chip types. */ 1005static void __init srmmu_is_bad(void) 1006{ 1007 prom_printf("Could not determine SRMMU chip type.\n"); 1008 prom_halt(); 1009} 1010 1011static void __init init_vac_layout(void) 1012{ 1013 phandle nd; 1014 int cache_lines; 1015 char node_str[128]; 1016#ifdef CONFIG_SMP 1017 int cpu = 0; 1018 unsigned long max_size = 0; 1019 unsigned long min_line_size = 0x10000000; 1020#endif 1021 1022 nd = prom_getchild(prom_root_node); 1023 while ((nd = prom_getsibling(nd)) != 0) { 1024 prom_getstring(nd, "device_type", node_str, sizeof(node_str)); 1025 if (!strcmp(node_str, "cpu")) { 1026 vac_line_size = prom_getint(nd, "cache-line-size"); 1027 if (vac_line_size == -1) { 1028 prom_printf("can't determine cache-line-size, halting.\n"); 1029 prom_halt(); 1030 } 1031 cache_lines = prom_getint(nd, "cache-nlines"); 1032 if (cache_lines == -1) { 1033 prom_printf("can't determine cache-nlines, halting.\n"); 1034 prom_halt(); 1035 } 1036 1037 vac_cache_size = cache_lines * vac_line_size; 1038#ifdef CONFIG_SMP 1039 if (vac_cache_size > max_size) 1040 max_size = vac_cache_size; 1041 if (vac_line_size < min_line_size) 1042 min_line_size = vac_line_size; 1043 //FIXME: cpus not contiguous!! 1044 cpu++; 1045 if (cpu >= nr_cpu_ids || !cpu_online(cpu)) 1046 break; 1047#else 1048 break; 1049#endif 1050 } 1051 } 1052 if (nd == 0) { 1053 prom_printf("No CPU nodes found, halting.\n"); 1054 prom_halt(); 1055 } 1056#ifdef CONFIG_SMP 1057 vac_cache_size = max_size; 1058 vac_line_size = min_line_size; 1059#endif 1060 printk("SRMMU: Using VAC size of %d bytes, line size %d bytes.\n", 1061 (int)vac_cache_size, (int)vac_line_size); 1062} 1063 1064static void poke_hypersparc(void) 1065{ 1066 volatile unsigned long clear; 1067 unsigned long mreg = srmmu_get_mmureg(); 1068 1069 hyper_flush_unconditional_combined(); 1070 1071 mreg &= ~(HYPERSPARC_CWENABLE); 1072 mreg |= (HYPERSPARC_CENABLE | HYPERSPARC_WBENABLE); 1073 mreg |= (HYPERSPARC_CMODE); 1074 1075 srmmu_set_mmureg(mreg); 1076 1077#if 0 /* XXX I think this is bad news... -DaveM */ 1078 hyper_clear_all_tags(); 1079#endif 1080 1081 put_ross_icr(HYPERSPARC_ICCR_FTD | HYPERSPARC_ICCR_ICE); 1082 hyper_flush_whole_icache(); 1083 clear = srmmu_get_faddr(); 1084 clear = srmmu_get_fstatus(); 1085} 1086 1087static const struct sparc32_cachetlb_ops hypersparc_ops = { 1088 .cache_all = hypersparc_flush_cache_all, 1089 .cache_mm = hypersparc_flush_cache_mm, 1090 .cache_page = hypersparc_flush_cache_page, 1091 .cache_range = hypersparc_flush_cache_range, 1092 .tlb_all = hypersparc_flush_tlb_all, 1093 .tlb_mm = hypersparc_flush_tlb_mm, 1094 .tlb_page = hypersparc_flush_tlb_page, 1095 .tlb_range = hypersparc_flush_tlb_range, 1096 .page_to_ram = hypersparc_flush_page_to_ram, 1097 .sig_insns = hypersparc_flush_sig_insns, 1098 .page_for_dma = hypersparc_flush_page_for_dma, 1099}; 1100 1101static void __init init_hypersparc(void) 1102{ 1103 srmmu_name = "ROSS HyperSparc"; 1104 srmmu_modtype = HyperSparc; 1105 1106 init_vac_layout(); 1107 1108 is_hypersparc = 1; 1109 sparc32_cachetlb_ops = &hypersparc_ops; 1110 1111 poke_srmmu = poke_hypersparc; 1112 1113 hypersparc_setup_blockops(); 1114} 1115 1116static void poke_swift(void) 1117{ 1118 unsigned long mreg; 1119 1120 /* Clear any crap from the cache or else... */ 1121 swift_flush_cache_all(); 1122 1123 /* Enable I & D caches */ 1124 mreg = srmmu_get_mmureg(); 1125 mreg |= (SWIFT_IE | SWIFT_DE); 1126 /* 1127 * The Swift branch folding logic is completely broken. At 1128 * trap time, if things are just right, if can mistakenly 1129 * think that a trap is coming from kernel mode when in fact 1130 * it is coming from user mode (it mis-executes the branch in 1131 * the trap code). So you see things like crashme completely 1132 * hosing your machine which is completely unacceptable. Turn 1133 * this shit off... nice job Fujitsu. 1134 */ 1135 mreg &= ~(SWIFT_BF); 1136 srmmu_set_mmureg(mreg); 1137} 1138 1139static const struct sparc32_cachetlb_ops swift_ops = { 1140 .cache_all = swift_flush_cache_all, 1141 .cache_mm = swift_flush_cache_mm, 1142 .cache_page = swift_flush_cache_page, 1143 .cache_range = swift_flush_cache_range, 1144 .tlb_all = swift_flush_tlb_all, 1145 .tlb_mm = swift_flush_tlb_mm, 1146 .tlb_page = swift_flush_tlb_page, 1147 .tlb_range = swift_flush_tlb_range, 1148 .page_to_ram = swift_flush_page_to_ram, 1149 .sig_insns = swift_flush_sig_insns, 1150 .page_for_dma = swift_flush_page_for_dma, 1151}; 1152 1153#define SWIFT_MASKID_ADDR 0x10003018 1154static void __init init_swift(void) 1155{ 1156 unsigned long swift_rev; 1157 1158 __asm__ __volatile__("lda [%1] %2, %0\n\t" 1159 "srl %0, 0x18, %0\n\t" : 1160 "=r" (swift_rev) : 1161 "r" (SWIFT_MASKID_ADDR), "i" (ASI_M_BYPASS)); 1162 srmmu_name = "Fujitsu Swift"; 1163 switch (swift_rev) { 1164 case 0x11: 1165 case 0x20: 1166 case 0x23: 1167 case 0x30: 1168 srmmu_modtype = Swift_lots_o_bugs; 1169 hwbug_bitmask |= (HWBUG_KERN_ACCBROKEN | HWBUG_KERN_CBITBROKEN); 1170 /* 1171 * Gee george, I wonder why Sun is so hush hush about 1172 * this hardware bug... really braindamage stuff going 1173 * on here. However I think we can find a way to avoid 1174 * all of the workaround overhead under Linux. Basically, 1175 * any page fault can cause kernel pages to become user 1176 * accessible (the mmu gets confused and clears some of 1177 * the ACC bits in kernel ptes). Aha, sounds pretty 1178 * horrible eh? But wait, after extensive testing it appears 1179 * that if you use pgd_t level large kernel pte's (like the 1180 * 4MB pages on the Pentium) the bug does not get tripped 1181 * at all. This avoids almost all of the major overhead. 1182 * Welcome to a world where your vendor tells you to, 1183 * "apply this kernel patch" instead of "sorry for the 1184 * broken hardware, send it back and we'll give you 1185 * properly functioning parts" 1186 */ 1187 break; 1188 case 0x25: 1189 case 0x31: 1190 srmmu_modtype = Swift_bad_c; 1191 hwbug_bitmask |= HWBUG_KERN_CBITBROKEN; 1192 /* 1193 * You see Sun allude to this hardware bug but never 1194 * admit things directly, they'll say things like, 1195 * "the Swift chip cache problems" or similar. 1196 */ 1197 break; 1198 default: 1199 srmmu_modtype = Swift_ok; 1200 break; 1201 } 1202 1203 sparc32_cachetlb_ops = &swift_ops; 1204 flush_page_for_dma_global = 0; 1205 1206 /* 1207 * Are you now convinced that the Swift is one of the 1208 * biggest VLSI abortions of all time? Bravo Fujitsu! 1209 * Fujitsu, the !#?!%$'d up processor people. I bet if 1210 * you examined the microcode of the Swift you'd find 1211 * XXX's all over the place. 1212 */ 1213 poke_srmmu = poke_swift; 1214} 1215 1216static void turbosparc_flush_cache_all(void) 1217{ 1218 flush_user_windows(); 1219 turbosparc_idflash_clear(); 1220} 1221 1222static void turbosparc_flush_cache_mm(struct mm_struct *mm) 1223{ 1224 FLUSH_BEGIN(mm) 1225 flush_user_windows(); 1226 turbosparc_idflash_clear(); 1227 FLUSH_END 1228} 1229 1230static void turbosparc_flush_cache_range(struct vm_area_struct *vma, unsigned long start, unsigned long end) 1231{ 1232 FLUSH_BEGIN(vma->vm_mm) 1233 flush_user_windows(); 1234 turbosparc_idflash_clear(); 1235 FLUSH_END 1236} 1237 1238static void turbosparc_flush_cache_page(struct vm_area_struct *vma, unsigned long page) 1239{ 1240 FLUSH_BEGIN(vma->vm_mm) 1241 flush_user_windows(); 1242 if (vma->vm_flags & VM_EXEC) 1243 turbosparc_flush_icache(); 1244 turbosparc_flush_dcache(); 1245 FLUSH_END 1246} 1247 1248/* TurboSparc is copy-back, if we turn it on, but this does not work. */ 1249static void turbosparc_flush_page_to_ram(unsigned long page) 1250{ 1251#ifdef TURBOSPARC_WRITEBACK 1252 volatile unsigned long clear; 1253 1254 if (srmmu_probe(page)) 1255 turbosparc_flush_page_cache(page); 1256 clear = srmmu_get_fstatus(); 1257#endif 1258} 1259 1260static void turbosparc_flush_sig_insns(struct mm_struct *mm, unsigned long insn_addr) 1261{ 1262} 1263 1264static void turbosparc_flush_page_for_dma(unsigned long page) 1265{ 1266 turbosparc_flush_dcache(); 1267} 1268 1269static void turbosparc_flush_tlb_all(void) 1270{ 1271 srmmu_flush_whole_tlb(); 1272} 1273 1274static void turbosparc_flush_tlb_mm(struct mm_struct *mm) 1275{ 1276 FLUSH_BEGIN(mm) 1277 srmmu_flush_whole_tlb(); 1278 FLUSH_END 1279} 1280 1281static void turbosparc_flush_tlb_range(struct vm_area_struct *vma, unsigned long start, unsigned long end) 1282{ 1283 FLUSH_BEGIN(vma->vm_mm) 1284 srmmu_flush_whole_tlb(); 1285 FLUSH_END 1286} 1287 1288static void turbosparc_flush_tlb_page(struct vm_area_struct *vma, unsigned long page) 1289{ 1290 FLUSH_BEGIN(vma->vm_mm) 1291 srmmu_flush_whole_tlb(); 1292 FLUSH_END 1293} 1294 1295 1296static void poke_turbosparc(void) 1297{ 1298 unsigned long mreg = srmmu_get_mmureg(); 1299 unsigned long ccreg; 1300 1301 /* Clear any crap from the cache or else... */ 1302 turbosparc_flush_cache_all(); 1303 /* Temporarily disable I & D caches */ 1304 mreg &= ~(TURBOSPARC_ICENABLE | TURBOSPARC_DCENABLE); 1305 mreg &= ~(TURBOSPARC_PCENABLE); /* Don't check parity */ 1306 srmmu_set_mmureg(mreg); 1307 1308 ccreg = turbosparc_get_ccreg(); 1309 1310#ifdef TURBOSPARC_WRITEBACK 1311 ccreg |= (TURBOSPARC_SNENABLE); /* Do DVMA snooping in Dcache */ 1312 ccreg &= ~(TURBOSPARC_uS2 | TURBOSPARC_WTENABLE); 1313 /* Write-back D-cache, emulate VLSI 1314 * abortion number three, not number one */ 1315#else 1316 /* For now let's play safe, optimize later */ 1317 ccreg |= (TURBOSPARC_SNENABLE | TURBOSPARC_WTENABLE); 1318 /* Do DVMA snooping in Dcache, Write-thru D-cache */ 1319 ccreg &= ~(TURBOSPARC_uS2); 1320 /* Emulate VLSI abortion number three, not number one */ 1321#endif 1322 1323 switch (ccreg & 7) { 1324 case 0: /* No SE cache */ 1325 case 7: /* Test mode */ 1326 break; 1327 default: 1328 ccreg |= (TURBOSPARC_SCENABLE); 1329 } 1330 turbosparc_set_ccreg(ccreg); 1331 1332 mreg |= (TURBOSPARC_ICENABLE | TURBOSPARC_DCENABLE); /* I & D caches on */ 1333 mreg |= (TURBOSPARC_ICSNOOP); /* Icache snooping on */ 1334 srmmu_set_mmureg(mreg); 1335} 1336 1337static const struct sparc32_cachetlb_ops turbosparc_ops = { 1338 .cache_all = turbosparc_flush_cache_all, 1339 .cache_mm = turbosparc_flush_cache_mm, 1340 .cache_page = turbosparc_flush_cache_page, 1341 .cache_range = turbosparc_flush_cache_range, 1342 .tlb_all = turbosparc_flush_tlb_all, 1343 .tlb_mm = turbosparc_flush_tlb_mm, 1344 .tlb_page = turbosparc_flush_tlb_page, 1345 .tlb_range = turbosparc_flush_tlb_range, 1346 .page_to_ram = turbosparc_flush_page_to_ram, 1347 .sig_insns = turbosparc_flush_sig_insns, 1348 .page_for_dma = turbosparc_flush_page_for_dma, 1349}; 1350 1351static void __init init_turbosparc(void) 1352{ 1353 srmmu_name = "Fujitsu TurboSparc"; 1354 srmmu_modtype = TurboSparc; 1355 sparc32_cachetlb_ops = &turbosparc_ops; 1356 poke_srmmu = poke_turbosparc; 1357} 1358 1359static void poke_tsunami(void) 1360{ 1361 unsigned long mreg = srmmu_get_mmureg(); 1362 1363 tsunami_flush_icache(); 1364 tsunami_flush_dcache(); 1365 mreg &= ~TSUNAMI_ITD; 1366 mreg |= (TSUNAMI_IENAB | TSUNAMI_DENAB); 1367 srmmu_set_mmureg(mreg); 1368} 1369 1370static const struct sparc32_cachetlb_ops tsunami_ops = { 1371 .cache_all = tsunami_flush_cache_all, 1372 .cache_mm = tsunami_flush_cache_mm, 1373 .cache_page = tsunami_flush_cache_page, 1374 .cache_range = tsunami_flush_cache_range, 1375 .tlb_all = tsunami_flush_tlb_all, 1376 .tlb_mm = tsunami_flush_tlb_mm, 1377 .tlb_page = tsunami_flush_tlb_page, 1378 .tlb_range = tsunami_flush_tlb_range, 1379 .page_to_ram = tsunami_flush_page_to_ram, 1380 .sig_insns = tsunami_flush_sig_insns, 1381 .page_for_dma = tsunami_flush_page_for_dma, 1382}; 1383 1384static void __init init_tsunami(void) 1385{ 1386 /* 1387 * Tsunami's pretty sane, Sun and TI actually got it 1388 * somewhat right this time. Fujitsu should have 1389 * taken some lessons from them. 1390 */ 1391 1392 srmmu_name = "TI Tsunami"; 1393 srmmu_modtype = Tsunami; 1394 sparc32_cachetlb_ops = &tsunami_ops; 1395 poke_srmmu = poke_tsunami; 1396 1397 tsunami_setup_blockops(); 1398} 1399 1400static void poke_viking(void) 1401{ 1402 unsigned long mreg = srmmu_get_mmureg(); 1403 static int smp_catch; 1404 1405 if (viking_mxcc_present) { 1406 unsigned long mxcc_control = mxcc_get_creg(); 1407 1408 mxcc_control |= (MXCC_CTL_ECE | MXCC_CTL_PRE | MXCC_CTL_MCE); 1409 mxcc_control &= ~(MXCC_CTL_RRC); 1410 mxcc_set_creg(mxcc_control); 1411 1412 /* 1413 * We don't need memory parity checks. 1414 * XXX This is a mess, have to dig out later. ecd. 1415 viking_mxcc_turn_off_parity(&mreg, &mxcc_control); 1416 */ 1417 1418 /* We do cache ptables on MXCC. */ 1419 mreg |= VIKING_TCENABLE; 1420 } else { 1421 unsigned long bpreg; 1422 1423 mreg &= ~(VIKING_TCENABLE); 1424 if (smp_catch++) { 1425 /* Must disable mixed-cmd mode here for other cpu's. */ 1426 bpreg = viking_get_bpreg(); 1427 bpreg &= ~(VIKING_ACTION_MIX); 1428 viking_set_bpreg(bpreg); 1429 1430 /* Just in case PROM does something funny. */ 1431 msi_set_sync(); 1432 } 1433 } 1434 1435 mreg |= VIKING_SPENABLE; 1436 mreg |= (VIKING_ICENABLE | VIKING_DCENABLE); 1437 mreg |= VIKING_SBENABLE; 1438 mreg &= ~(VIKING_ACENABLE); 1439 srmmu_set_mmureg(mreg); 1440} 1441 1442static struct sparc32_cachetlb_ops viking_ops = { 1443 .cache_all = viking_flush_cache_all, 1444 .cache_mm = viking_flush_cache_mm, 1445 .cache_page = viking_flush_cache_page, 1446 .cache_range = viking_flush_cache_range, 1447 .tlb_all = viking_flush_tlb_all, 1448 .tlb_mm = viking_flush_tlb_mm, 1449 .tlb_page = viking_flush_tlb_page, 1450 .tlb_range = viking_flush_tlb_range, 1451 .page_to_ram = viking_flush_page_to_ram, 1452 .sig_insns = viking_flush_sig_insns, 1453 .page_for_dma = viking_flush_page_for_dma, 1454}; 1455 1456#ifdef CONFIG_SMP 1457/* On sun4d the cpu broadcasts local TLB flushes, so we can just 1458 * perform the local TLB flush and all the other cpus will see it. 1459 * But, unfortunately, there is a bug in the sun4d XBUS backplane 1460 * that requires that we add some synchronization to these flushes. 1461 * 1462 * The bug is that the fifo which keeps track of all the pending TLB 1463 * broadcasts in the system is an entry or two too small, so if we 1464 * have too many going at once we'll overflow that fifo and lose a TLB 1465 * flush resulting in corruption. 1466 * 1467 * Our workaround is to take a global spinlock around the TLB flushes, 1468 * which guarentees we won't ever have too many pending. It's a big 1469 * hammer, but a semaphore like system to make sure we only have N TLB 1470 * flushes going at once will require SMP locking anyways so there's 1471 * no real value in trying any harder than this. 1472 */ 1473static struct sparc32_cachetlb_ops viking_sun4d_smp_ops = { 1474 .cache_all = viking_flush_cache_all, 1475 .cache_mm = viking_flush_cache_mm, 1476 .cache_page = viking_flush_cache_page, 1477 .cache_range = viking_flush_cache_range, 1478 .tlb_all = sun4dsmp_flush_tlb_all, 1479 .tlb_mm = sun4dsmp_flush_tlb_mm, 1480 .tlb_page = sun4dsmp_flush_tlb_page, 1481 .tlb_range = sun4dsmp_flush_tlb_range, 1482 .page_to_ram = viking_flush_page_to_ram, 1483 .sig_insns = viking_flush_sig_insns, 1484 .page_for_dma = viking_flush_page_for_dma, 1485}; 1486#endif 1487 1488static void __init init_viking(void) 1489{ 1490 unsigned long mreg = srmmu_get_mmureg(); 1491 1492 /* Ahhh, the viking. SRMMU VLSI abortion number two... */ 1493 if (mreg & VIKING_MMODE) { 1494 srmmu_name = "TI Viking"; 1495 viking_mxcc_present = 0; 1496 msi_set_sync(); 1497 1498 /* 1499 * We need this to make sure old viking takes no hits 1500 * on it's cache for dma snoops to workaround the 1501 * "load from non-cacheable memory" interrupt bug. 1502 * This is only necessary because of the new way in 1503 * which we use the IOMMU. 1504 */ 1505 viking_ops.page_for_dma = viking_flush_page; 1506#ifdef CONFIG_SMP 1507 viking_sun4d_smp_ops.page_for_dma = viking_flush_page; 1508#endif 1509 flush_page_for_dma_global = 0; 1510 } else { 1511 srmmu_name = "TI Viking/MXCC"; 1512 viking_mxcc_present = 1; 1513 srmmu_cache_pagetables = 1; 1514 } 1515 1516 sparc32_cachetlb_ops = (const struct sparc32_cachetlb_ops *) 1517 &viking_ops; 1518#ifdef CONFIG_SMP 1519 if (sparc_cpu_model == sun4d) 1520 sparc32_cachetlb_ops = (const struct sparc32_cachetlb_ops *) 1521 &viking_sun4d_smp_ops; 1522#endif 1523 1524 poke_srmmu = poke_viking; 1525} 1526 1527/* Probe for the srmmu chip version. */ 1528static void __init get_srmmu_type(void) 1529{ 1530 unsigned long mreg, psr; 1531 unsigned long mod_typ, mod_rev, psr_typ, psr_vers; 1532 1533 srmmu_modtype = SRMMU_INVAL_MOD; 1534 hwbug_bitmask = 0; 1535 1536 mreg = srmmu_get_mmureg(); psr = get_psr(); 1537 mod_typ = (mreg & 0xf0000000) >> 28; 1538 mod_rev = (mreg & 0x0f000000) >> 24; 1539 psr_typ = (psr >> 28) & 0xf; 1540 psr_vers = (psr >> 24) & 0xf; 1541 1542 /* First, check for sparc-leon. */ 1543 if (sparc_cpu_model == sparc_leon) { 1544 init_leon(); 1545 return; 1546 } 1547 1548 /* Second, check for HyperSparc or Cypress. */ 1549 if (mod_typ == 1) { 1550 switch (mod_rev) { 1551 case 7: 1552 /* UP or MP Hypersparc */ 1553 init_hypersparc(); 1554 break; 1555 case 0: 1556 case 2: 1557 case 10: 1558 case 11: 1559 case 12: 1560 case 13: 1561 case 14: 1562 case 15: 1563 default: 1564 prom_printf("Sparc-Linux Cypress support does not longer exit.\n"); 1565 prom_halt(); 1566 break; 1567 } 1568 return; 1569 } 1570 1571 /* Now Fujitsu TurboSparc. It might happen that it is 1572 * in Swift emulation mode, so we will check later... 1573 */ 1574 if (psr_typ == 0 && psr_vers == 5) { 1575 init_turbosparc(); 1576 return; 1577 } 1578 1579 /* Next check for Fujitsu Swift. */ 1580 if (psr_typ == 0 && psr_vers == 4) { 1581 phandle cpunode; 1582 char node_str[128]; 1583 1584 /* Look if it is not a TurboSparc emulating Swift... */ 1585 cpunode = prom_getchild(prom_root_node); 1586 while ((cpunode = prom_getsibling(cpunode)) != 0) { 1587 prom_getstring(cpunode, "device_type", node_str, sizeof(node_str)); 1588 if (!strcmp(node_str, "cpu")) { 1589 if (!prom_getintdefault(cpunode, "psr-implementation", 1) && 1590 prom_getintdefault(cpunode, "psr-version", 1) == 5) { 1591 init_turbosparc(); 1592 return; 1593 } 1594 break; 1595 } 1596 } 1597 1598 init_swift(); 1599 return; 1600 } 1601 1602 /* Now the Viking family of srmmu. */ 1603 if (psr_typ == 4 && 1604 ((psr_vers == 0) || 1605 ((psr_vers == 1) && (mod_typ == 0) && (mod_rev == 0)))) { 1606 init_viking(); 1607 return; 1608 } 1609 1610 /* Finally the Tsunami. */ 1611 if (psr_typ == 4 && psr_vers == 1 && (mod_typ || mod_rev)) { 1612 init_tsunami(); 1613 return; 1614 } 1615 1616 /* Oh well */ 1617 srmmu_is_bad(); 1618} 1619 1620#ifdef CONFIG_SMP 1621/* Local cross-calls. */ 1622static void smp_flush_page_for_dma(unsigned long page) 1623{ 1624 xc1((smpfunc_t) local_ops->page_for_dma, page); 1625 local_ops->page_for_dma(page); 1626} 1627 1628static void smp_flush_cache_all(void) 1629{ 1630 xc0((smpfunc_t) local_ops->cache_all); 1631 local_ops->cache_all(); 1632} 1633 1634static void smp_flush_tlb_all(void) 1635{ 1636 xc0((smpfunc_t) local_ops->tlb_all); 1637 local_ops->tlb_all(); 1638} 1639 1640static void smp_flush_cache_mm(struct mm_struct *mm) 1641{ 1642 if (mm->context != NO_CONTEXT) { 1643 cpumask_t cpu_mask; 1644 cpumask_copy(&cpu_mask, mm_cpumask(mm)); 1645 cpumask_clear_cpu(smp_processor_id(), &cpu_mask); 1646 if (!cpumask_empty(&cpu_mask)) 1647 xc1((smpfunc_t) local_ops->cache_mm, (unsigned long) mm); 1648 local_ops->cache_mm(mm); 1649 } 1650} 1651 1652static void smp_flush_tlb_mm(struct mm_struct *mm) 1653{ 1654 if (mm->context != NO_CONTEXT) { 1655 cpumask_t cpu_mask; 1656 cpumask_copy(&cpu_mask, mm_cpumask(mm)); 1657 cpumask_clear_cpu(smp_processor_id(), &cpu_mask); 1658 if (!cpumask_empty(&cpu_mask)) { 1659 xc1((smpfunc_t) local_ops->tlb_mm, (unsigned long) mm); 1660 if (atomic_read(&mm->mm_users) == 1 && current->active_mm == mm) 1661 cpumask_copy(mm_cpumask(mm), 1662 cpumask_of(smp_processor_id())); 1663 } 1664 local_ops->tlb_mm(mm); 1665 } 1666} 1667 1668static void smp_flush_cache_range(struct vm_area_struct *vma, 1669 unsigned long start, 1670 unsigned long end) 1671{ 1672 struct mm_struct *mm = vma->vm_mm; 1673 1674 if (mm->context != NO_CONTEXT) { 1675 cpumask_t cpu_mask; 1676 cpumask_copy(&cpu_mask, mm_cpumask(mm)); 1677 cpumask_clear_cpu(smp_processor_id(), &cpu_mask); 1678 if (!cpumask_empty(&cpu_mask)) 1679 xc3((smpfunc_t) local_ops->cache_range, 1680 (unsigned long) vma, start, end); 1681 local_ops->cache_range(vma, start, end); 1682 } 1683} 1684 1685static void smp_flush_tlb_range(struct vm_area_struct *vma, 1686 unsigned long start, 1687 unsigned long end) 1688{ 1689 struct mm_struct *mm = vma->vm_mm; 1690 1691 if (mm->context != NO_CONTEXT) { 1692 cpumask_t cpu_mask; 1693 cpumask_copy(&cpu_mask, mm_cpumask(mm)); 1694 cpumask_clear_cpu(smp_processor_id(), &cpu_mask); 1695 if (!cpumask_empty(&cpu_mask)) 1696 xc3((smpfunc_t) local_ops->tlb_range, 1697 (unsigned long) vma, start, end); 1698 local_ops->tlb_range(vma, start, end); 1699 } 1700} 1701 1702static void smp_flush_cache_page(struct vm_area_struct *vma, unsigned long page) 1703{ 1704 struct mm_struct *mm = vma->vm_mm; 1705 1706 if (mm->context != NO_CONTEXT) { 1707 cpumask_t cpu_mask; 1708 cpumask_copy(&cpu_mask, mm_cpumask(mm)); 1709 cpumask_clear_cpu(smp_processor_id(), &cpu_mask); 1710 if (!cpumask_empty(&cpu_mask)) 1711 xc2((smpfunc_t) local_ops->cache_page, 1712 (unsigned long) vma, page); 1713 local_ops->cache_page(vma, page); 1714 } 1715} 1716 1717static void smp_flush_tlb_page(struct vm_area_struct *vma, unsigned long page) 1718{ 1719 struct mm_struct *mm = vma->vm_mm; 1720 1721 if (mm->context != NO_CONTEXT) { 1722 cpumask_t cpu_mask; 1723 cpumask_copy(&cpu_mask, mm_cpumask(mm)); 1724 cpumask_clear_cpu(smp_processor_id(), &cpu_mask); 1725 if (!cpumask_empty(&cpu_mask)) 1726 xc2((smpfunc_t) local_ops->tlb_page, 1727 (unsigned long) vma, page); 1728 local_ops->tlb_page(vma, page); 1729 } 1730} 1731 1732static void smp_flush_page_to_ram(unsigned long page) 1733{ 1734 /* Current theory is that those who call this are the one's 1735 * who have just dirtied their cache with the pages contents 1736 * in kernel space, therefore we only run this on local cpu. 1737 * 1738 * XXX This experiment failed, research further... -DaveM 1739 */ 1740#if 1 1741 xc1((smpfunc_t) local_ops->page_to_ram, page); 1742#endif 1743 local_ops->page_to_ram(page); 1744} 1745 1746static void smp_flush_sig_insns(struct mm_struct *mm, unsigned long insn_addr) 1747{ 1748 cpumask_t cpu_mask; 1749 cpumask_copy(&cpu_mask, mm_cpumask(mm)); 1750 cpumask_clear_cpu(smp_processor_id(), &cpu_mask); 1751 if (!cpumask_empty(&cpu_mask)) 1752 xc2((smpfunc_t) local_ops->sig_insns, 1753 (unsigned long) mm, insn_addr); 1754 local_ops->sig_insns(mm, insn_addr); 1755} 1756 1757static struct sparc32_cachetlb_ops smp_cachetlb_ops = { 1758 .cache_all = smp_flush_cache_all, 1759 .cache_mm = smp_flush_cache_mm, 1760 .cache_page = smp_flush_cache_page, 1761 .cache_range = smp_flush_cache_range, 1762 .tlb_all = smp_flush_tlb_all, 1763 .tlb_mm = smp_flush_tlb_mm, 1764 .tlb_page = smp_flush_tlb_page, 1765 .tlb_range = smp_flush_tlb_range, 1766 .page_to_ram = smp_flush_page_to_ram, 1767 .sig_insns = smp_flush_sig_insns, 1768 .page_for_dma = smp_flush_page_for_dma, 1769}; 1770#endif 1771 1772/* Load up routines and constants for sun4m and sun4d mmu */ 1773void __init load_mmu(void) 1774{ 1775 /* Functions */ 1776 get_srmmu_type(); 1777 1778#ifdef CONFIG_SMP 1779 /* El switcheroo... */ 1780 local_ops = sparc32_cachetlb_ops; 1781 1782 if (sparc_cpu_model == sun4d || sparc_cpu_model == sparc_leon) { 1783 smp_cachetlb_ops.tlb_all = local_ops->tlb_all; 1784 smp_cachetlb_ops.tlb_mm = local_ops->tlb_mm; 1785 smp_cachetlb_ops.tlb_range = local_ops->tlb_range; 1786 smp_cachetlb_ops.tlb_page = local_ops->tlb_page; 1787 } 1788 1789 if (poke_srmmu == poke_viking) { 1790 /* Avoid unnecessary cross calls. */ 1791 smp_cachetlb_ops.cache_all = local_ops->cache_all; 1792 smp_cachetlb_ops.cache_mm = local_ops->cache_mm; 1793 smp_cachetlb_ops.cache_range = local_ops->cache_range; 1794 smp_cachetlb_ops.cache_page = local_ops->cache_page; 1795 1796 smp_cachetlb_ops.page_to_ram = local_ops->page_to_ram; 1797 smp_cachetlb_ops.sig_insns = local_ops->sig_insns; 1798 smp_cachetlb_ops.page_for_dma = local_ops->page_for_dma; 1799 } 1800 1801 /* It really is const after this point. */ 1802 sparc32_cachetlb_ops = (const struct sparc32_cachetlb_ops *) 1803 &smp_cachetlb_ops; 1804#endif 1805 1806 if (sparc_cpu_model == sun4d) 1807 ld_mmu_iounit(); 1808 else 1809 ld_mmu_iommu(); 1810#ifdef CONFIG_SMP 1811 if (sparc_cpu_model == sun4d) 1812 sun4d_init_smp(); 1813 else if (sparc_cpu_model == sparc_leon) 1814 leon_init_smp(); 1815 else 1816 sun4m_init_smp(); 1817#endif 1818} 1819