init.c 13.3 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10
/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * Copyright (C) 1994 - 2000 Ralf Baechle
 * Copyright (C) 1999, 2000 Silicon Graphics, Inc.
 * Kevin D. Kissell, kevink@mips.com and Carsten Langgaard, carstenl@mips.com
 * Copyright (C) 2000 MIPS Technologies, Inc.  All rights reserved.
 */
11
#include <linux/bug.h>
L
Linus Torvalds 已提交
12
#include <linux/init.h>
13
#include <linux/export.h>
L
Linus Torvalds 已提交
14 15
#include <linux/signal.h>
#include <linux/sched.h>
16
#include <linux/smp.h>
L
Linus Torvalds 已提交
17 18 19 20 21 22 23 24 25 26 27
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/string.h>
#include <linux/types.h>
#include <linux/pagemap.h>
#include <linux/ptrace.h>
#include <linux/mman.h>
#include <linux/mm.h>
#include <linux/bootmem.h>
#include <linux/highmem.h>
#include <linux/swap.h>
28
#include <linux/proc_fs.h>
D
Dave Hansen 已提交
29
#include <linux/pfn.h>
30
#include <linux/hardirq.h>
31
#include <linux/gfp.h>
32
#include <linux/kcore.h>
33
#include <linux/initrd.h>
L
Linus Torvalds 已提交
34

R
Ralf Baechle 已提交
35
#include <asm/asm-offsets.h>
L
Linus Torvalds 已提交
36 37 38 39
#include <asm/bootinfo.h>
#include <asm/cachectl.h>
#include <asm/cpu.h>
#include <asm/dma.h>
40
#include <asm/kmap_types.h>
41
#include <asm/maar.h>
L
Linus Torvalds 已提交
42 43 44 45 46
#include <asm/mmu_context.h>
#include <asm/sections.h>
#include <asm/pgtable.h>
#include <asm/pgalloc.h>
#include <asm/tlb.h>
47 48
#include <asm/fixmap.h>

L
Linus Torvalds 已提交
49 50
/*
 * Up to 8 zero-filled pages are kept so that one of the right cache colour
 * can be mapped when required.  Only the R4000 / R4400 SC and MC versions
 * need this, because VCED / VCEI exceptions have to be avoided there for
 * good performance at any price.  The pages are never written after
 * initialization, so aliases on other CPUs are not a concern.
 *
 * Both variables are filled in by setup_zero_pages().
 */
unsigned long empty_zero_page;
unsigned long zero_page_mask;
EXPORT_SYMBOL_GPL(empty_zero_page);
EXPORT_SYMBOL(zero_page_mask);
L
Linus Torvalds 已提交
59 60 61 62

/*
 * Not static inline because used by IP27 special magic initialization code
 */
63
void setup_zero_pages(void)
L
Linus Torvalds 已提交
64
{
65
	unsigned int order, i;
L
Linus Torvalds 已提交
66 67 68 69 70 71 72 73 74 75 76
	struct page *page;

	if (cpu_has_vce)
		order = 3;
	else
		order = 0;

	empty_zero_page = __get_free_pages(GFP_KERNEL | __GFP_ZERO, order);
	if (!empty_zero_page)
		panic("Oh boy, that early out of memory?");

77
	page = virt_to_page((void *)empty_zero_page);
N
Nick Piggin 已提交
78
	split_page(page, order);
79 80
	for (i = 0; i < (1 << order); i++, page++)
		mark_page_reserved(page);
L
Linus Torvalds 已提交
81

82
	zero_page_mask = ((PAGE_SIZE << order) - 1) & PAGE_MASK;
L
Linus Torvalds 已提交
83 84
}

85
/*
 * Map @page with protection @prot at a fixmap slot chosen from @addr and
 * return the virtual address of that slot.
 *
 * The slot is picked from the page-number bits of @addr masked with
 * FIX_N_COLOURS - 1; when called in interrupt context the slot is offset
 * by FIX_N_COLOURS.  The mapping is installed by writing a TLB entry at
 * the index given by the current wired count and then raising the wired
 * count by one.  EntryLo0 and EntryLo1 both receive the same value.
 *
 * The page must not be marked dcache-dirty (BUG otherwise).  Preemption and
 * page faults are disabled here and are NOT re-enabled before returning;
 * kunmap_coherent() re-enables them.
 */
static void *__kmap_pgprot(struct page *page, unsigned long addr, pgprot_t prot)
{
	enum fixed_addresses slot;
	unsigned long kaddr, irqflags, lo;
	unsigned long saved_entryhi;
	pte_t entry;
	int wired_idx;

	BUG_ON(Page_dcache_dirty(page));

	preempt_disable();
	pagefault_disable();

	slot = (addr >> PAGE_SHIFT) & (FIX_N_COLOURS - 1);
	if (in_interrupt())
		slot += FIX_N_COLOURS;
	kaddr = __fix_to_virt(FIX_CMAP_END - slot);

	entry = mk_pte(page, prot);
#if defined(CONFIG_XPA)
	lo = pte_to_entrylo(entry.pte_high);
#elif defined(CONFIG_PHYS_ADDR_T_64BIT) && defined(CONFIG_CPU_MIPS32)
	lo = entry.pte_high;
#else
	lo = pte_to_entrylo(pte_val(entry));
#endif

	/* The CP0 register sequence below must not be interrupted. */
	local_irq_save(irqflags);
	saved_entryhi = read_c0_entryhi();
	write_c0_entryhi(kaddr & (PAGE_MASK << 1));
	write_c0_entrylo0(lo);
	write_c0_entrylo1(lo);
#ifdef CONFIG_XPA
	if (cpu_has_xpa) {
		lo = (entry.pte_low & _PFNX_MASK);
		writex_c0_entrylo0(lo);
		writex_c0_entrylo1(lo);
	}
#endif
	/* Write the entry at the first non-wired index and wire it. */
	wired_idx = num_wired_entries();
	write_c0_wired(wired_idx + 1);
	write_c0_index(wired_idx);
	mtc0_tlbw_hazard();
	tlb_write_indexed();
	tlbw_use_hazard();
	write_c0_entryhi(saved_entryhi);
	local_irq_restore(irqflags);

	return (void *)kaddr;
}

133 134 135 136 137 138 139 140 141 142
/*
 * Map @page via __kmap_pgprot() using PAGE_KERNEL protection; @addr selects
 * the fixmap slot.  Returns the mapped virtual address.
 */
void *kmap_coherent(struct page *page, unsigned long addr)
{
	void *mapping = __kmap_pgprot(page, addr, PAGE_KERNEL);

	return mapping;
}

/*
 * Map @page via __kmap_pgprot() using PAGE_KERNEL_NC protection; @addr
 * selects the fixmap slot.  Returns the mapped virtual address.
 */
void *kmap_noncoherent(struct page *page, unsigned long addr)
{
	void *mapping = __kmap_pgprot(page, addr, PAGE_KERNEL_NC);

	return mapping;
}

143
/*
 * Tear down the most recently wired TLB entry: lower the wired count by
 * one, overwrite that index with UNIQUE_ENTRYHI() and zero EntryLo values,
 * then re-enable page faults and preemption.
 */
void kunmap_coherent(void)
{
	unsigned long irqflags, saved_entryhi;
	unsigned int slot;

	local_irq_save(irqflags);
	saved_entryhi = read_c0_entryhi();

	/* The entry to drop is the last wired one. */
	slot = num_wired_entries() - 1;
	write_c0_wired(slot);
	write_c0_index(slot);
	write_c0_entryhi(UNIQUE_ENTRYHI(slot));
	write_c0_entrylo0(0);
	write_c0_entrylo1(0);
	mtc0_tlbw_hazard();
	tlb_write_indexed();
	tlbw_use_hazard();

	write_c0_entryhi(saved_entryhi);
	local_irq_restore(irqflags);

	pagefault_enable();
	preempt_enable();
}

165 166 167 168 169
void copy_user_highpage(struct page *to, struct page *from,
	unsigned long vaddr, struct vm_area_struct *vma)
{
	void *vfrom, *vto;

170
	vto = kmap_atomic(to);
171
	if (cpu_has_dc_aliases &&
172
	    page_mapcount(from) && !Page_dcache_dirty(from)) {
173 174
		vfrom = kmap_coherent(from, vaddr);
		copy_page(vto, vfrom);
175
		kunmap_coherent();
176
	} else {
177
		vfrom = kmap_atomic(from);
178
		copy_page(vto, vfrom);
179
		kunmap_atomic(vfrom);
180
	}
181
	if ((!cpu_has_ic_fills_f_dc) ||
182 183
	    pages_do_alias((unsigned long)vto, vaddr & PAGE_MASK))
		flush_data_cache_page((unsigned long)vto);
184
	kunmap_atomic(vto);
185 186 187 188
	/* Make sure this page is cleared on other CPU's too before using it */
	smp_wmb();
}

189 190 191 192
void copy_to_user_page(struct vm_area_struct *vma,
	struct page *page, unsigned long vaddr, void *dst, const void *src,
	unsigned long len)
{
193
	if (cpu_has_dc_aliases &&
194
	    page_mapcount(page) && !Page_dcache_dirty(page)) {
195 196
		void *vto = kmap_coherent(page, vaddr) + (vaddr & ~PAGE_MASK);
		memcpy(vto, src, len);
197
		kunmap_coherent();
198
	} else {
199
		memcpy(dst, src, len);
200 201 202
		if (cpu_has_dc_aliases)
			SetPageDcacheDirty(page);
	}
203
	if (vma->vm_flags & VM_EXEC)
204 205 206 207 208 209 210
		flush_cache_page(vma, vaddr, page_to_pfn(page));
}

void copy_from_user_page(struct vm_area_struct *vma,
	struct page *page, unsigned long vaddr, void *dst, const void *src,
	unsigned long len)
{
211
	if (cpu_has_dc_aliases &&
212
	    page_mapcount(page) && !Page_dcache_dirty(page)) {
213
		void *vfrom = kmap_coherent(page, vaddr) + (vaddr & ~PAGE_MASK);
214
		memcpy(dst, vfrom, len);
215
		kunmap_coherent();
216
	} else {
217
		memcpy(dst, src, len);
218 219 220
		if (cpu_has_dc_aliases)
			SetPageDcacheDirty(page);
	}
221
}
222
EXPORT_SYMBOL_GPL(copy_from_user_page);
223

224
/*
 * Make sure a page table is present for every PMD entry covering the
 * virtual range [@start, @end) under @pgd_base.
 *
 * Entries that are pmd_none() get a freshly allocated low bootmem page as
 * their page table; existing entries are left alone.  The walk advances in
 * PMD_SIZE steps.  The function body is empty unless CONFIG_HIGHMEM is set.
 */
void __init fixrange_init(unsigned long start, unsigned long end,
	pgd_t *pgd_base)
{
#ifdef CONFIG_HIGHMEM
	unsigned long va = start;
	int pgd_idx = __pgd_offset(va);
	int pud_idx = __pud_offset(va);
	int pmd_idx = __pmd_offset(va);
	pgd_t *pgd = pgd_base + pgd_idx;
	pud_t *pud;
	pmd_t *pmd;
	pte_t *pte;

	while (pgd_idx < PTRS_PER_PGD && va < end) {
		pud = (pud_t *)pgd;
		while (pud_idx < PTRS_PER_PUD && va < end) {
			pmd = (pmd_t *)pud;
			while (pmd_idx < PTRS_PER_PMD && va < end) {
				if (pmd_none(*pmd)) {
					pte = (pte_t *) alloc_bootmem_low_pages(PAGE_SIZE);
					set_pmd(pmd, __pmd((unsigned long)pte));
					BUG_ON(pte != pte_offset_kernel(pmd, 0));
				}
				va += PMD_SIZE;
				pmd++;
				pmd_idx++;
			}
			/* Only the first pass starts part-way into a table. */
			pmd_idx = 0;
			pud++;
			pud_idx++;
		}
		pud_idx = 0;
		pgd++;
		pgd_idx++;
	}
#endif
}

260 261 262 263 264 265 266 267 268 269 270 271 272 273
/*
 * Default (weak) MAAR setup: build one configuration entry for each
 * BOOT_MEM_RAM / BOOT_MEM_INIT_RAM region of boot_mem_map and hand the list
 * to maar_config().
 *
 * Region bounds are shrunk inwards to 64KiB boundaries (lower rounded up,
 * upper rounded down, then made inclusive by subtracting one).  Every entry
 * gets the MIPS_MAAR_S attribute.
 *
 * @num_pairs: number of MAAR pairs available.
 *
 * Returns the value returned by maar_config(); a warning is logged when it
 * is smaller than the number of entries built.
 */
unsigned __weak platform_maar_init(unsigned num_pairs)
{
	struct maar_config cfg[BOOT_MEM_MAP_MAX];
	unsigned idx, nr_done, nr_cfg = 0;

	for (idx = 0; idx < boot_mem_map.nr_map; idx++) {
		struct maar_config *c = &cfg[nr_cfg];

		if (boot_mem_map.map[idx].type != BOOT_MEM_RAM &&
		    boot_mem_map.map[idx].type != BOOT_MEM_INIT_RAM)
			continue;

		/* Round lower up */
		c->lower = boot_mem_map.map[idx].addr;
		c->lower = (c->lower + 0xffff) & ~0xffff;

		/* Round upper down */
		c->upper = boot_mem_map.map[idx].addr +
				boot_mem_map.map[idx].size;
		c->upper = (c->upper & ~0xffff) - 1;

		c->attrs = MIPS_MAAR_S;
		nr_cfg++;
	}

	nr_done = maar_config(cfg, nr_cfg, num_pairs);
	if (nr_done < nr_cfg)
		pr_warn("Not enough MAAR pairs (%u) for all bootmem regions (%u)\n",
			num_pairs, nr_cfg);

	return nr_done;
}

295
void maar_init(void)
296 297
{
	unsigned num_maars, used, i;
298
	phys_addr_t lower, upper, attr;
299 300 301 302
	static struct {
		struct maar_config cfgs[3];
		unsigned used;
	} recorded = { { { 0 } }, 0 };
303 304 305 306 307 308 309 310 311 312 313 314

	if (!cpu_has_maar)
		return;

	/* Detect the number of MAARs */
	write_c0_maari(~0);
	back_to_back_c0_hazard();
	num_maars = read_c0_maari() + 1;

	/* MAARs should be in pairs */
	WARN_ON(num_maars % 2);

315 316 317 318 319 320 321 322
	/* Set MAARs using values we recorded already */
	if (recorded.used) {
		used = maar_config(recorded.cfgs, recorded.used, num_maars / 2);
		BUG_ON(used != recorded.used);
	} else {
		/* Configure the required MAARs */
		used = platform_maar_init(num_maars / 2);
	}
323 324 325 326 327 328 329 330

	/* Disable any further MAARs */
	for (i = (used * 2); i < num_maars; i++) {
		write_c0_maari(i);
		back_to_back_c0_hazard();
		write_c0_maar(0);
		back_to_back_c0_hazard();
	}
331

332 333 334
	if (recorded.used)
		return;

335 336 337 338 339 340 341 342 343 344 345 346 347 348 349
	pr_info("MAAR configuration:\n");
	for (i = 0; i < num_maars; i += 2) {
		write_c0_maari(i);
		back_to_back_c0_hazard();
		upper = read_c0_maar();

		write_c0_maari(i + 1);
		back_to_back_c0_hazard();
		lower = read_c0_maar();

		attr = lower & upper;
		lower = (lower & MIPS_MAAR_ADDR) << 4;
		upper = ((upper & MIPS_MAAR_ADDR) << 4) | 0xffff;

		pr_info("  [%d]: ", i / 2);
350
		if (!(attr & MIPS_MAAR_VL)) {
351 352 353 354 355 356 357 358 359 360
			pr_cont("disabled\n");
			continue;
		}

		pr_cont("%pa-%pa", &lower, &upper);

		if (attr & MIPS_MAAR_S)
			pr_cont(" speculate");

		pr_cont("\n");
361 362 363 364 365 366 367 368

		/* Record the setup for use on secondary CPUs */
		if (used <= ARRAY_SIZE(recorded.cfgs)) {
			recorded.cfgs[recorded.used].lower = lower;
			recorded.cfgs[recorded.used].upper = upper;
			recorded.cfgs[recorded.used].attrs = attr;
			recorded.used++;
		}
369
	}
370 371
}

372
#ifndef CONFIG_NEED_MULTIPLE_NODES
373
int page_is_ram(unsigned long pagenr)
374 375 376 377 378 379
{
	int i;

	for (i = 0; i < boot_mem_map.nr_map; i++) {
		unsigned long addr, end;

380 381 382 383 384
		switch (boot_mem_map.map[i].type) {
		case BOOT_MEM_RAM:
		case BOOT_MEM_INIT_RAM:
			break;
		default:
385 386
			/* not usable memory */
			continue;
387
		}
388 389 390 391 392 393 394 395 396 397 398 399

		addr = PFN_UP(boot_mem_map.map[i].addr);
		end = PFN_DOWN(boot_mem_map.map[i].addr +
			       boot_mem_map.map[i].size);

		if (pagenr >= addr && pagenr < end)
			return 1;
	}

	return 0;
}

L
Linus Torvalds 已提交
400 401
/*
 * Set up the kernel page tables and hand the per-zone upper PFN limits to
 * free_area_init_nodes().
 *
 * With CONFIG_HIGHMEM, high memory is ignored (ZONE_HIGHMEM is capped at
 * max_low_pfn and a warning is logged) on CPUs with dcache aliases.
 */
void __init paging_init(void)
{
	/*
	 * Start from all-zero limits: only the zones configured below are
	 * assigned, so without this any remaining slot would be passed on
	 * as uninitialised stack data.
	 */
	unsigned long max_zone_pfns[MAX_NR_ZONES] = { 0 };

	pagetable_init();

#ifdef CONFIG_HIGHMEM
	kmap_init();
#endif
#ifdef CONFIG_ZONE_DMA
	max_zone_pfns[ZONE_DMA] = MAX_DMA_PFN;
#endif
#ifdef CONFIG_ZONE_DMA32
	max_zone_pfns[ZONE_DMA32] = MAX_DMA32_PFN;
#endif
	max_zone_pfns[ZONE_NORMAL] = max_low_pfn;
#ifdef CONFIG_HIGHMEM
	max_zone_pfns[ZONE_HIGHMEM] = highend_pfn;

	if (cpu_has_dc_aliases && max_low_pfn != highend_pfn) {
		printk(KERN_WARNING "This processor doesn't support highmem."
		       " %ldk highmem ignored\n",
		       (highend_pfn - max_low_pfn) << (PAGE_SHIFT - 10));
		max_zone_pfns[ZONE_HIGHMEM] = max_low_pfn;
	}
#endif

	free_area_init_nodes(max_zone_pfns);
}

430 431 432 433
#ifdef CONFIG_64BIT
/* kcore list entry that mem_init() registers for the CKSEG0 region. */
static struct kcore_list kcore_kseg0;
#endif

434
/*
 * Walk the page frames from highstart_pfn up to (not including)
 * highend_pfn: frames that are RAM are freed as highmem pages, all others
 * are marked reserved.  Nothing is done on CPUs with dcache aliases, and
 * the body is empty without CONFIG_HIGHMEM.
 */
static inline void mem_init_free_highmem(void)
{
#ifdef CONFIG_HIGHMEM
	unsigned long pfn;

	if (cpu_has_dc_aliases)
		return;

	for (pfn = highstart_pfn; pfn < highend_pfn; pfn++) {
		struct page *page = pfn_to_page(pfn);

		if (page_is_ram(pfn))
			free_highmem_page(page);
		else
			SetPageReserved(page);
	}
#endif
}

/*
 * Set max_mapnr and high_memory, then run, in this order: maar_init(),
 * free_all_bootmem(), setup_zero_pages(), mem_init_free_highmem() and
 * mem_init_print_info().  On 64-bit kernels whose text lies above CKSEG0,
 * the CKSEG0 region is also added to the kcore list.
 */
void __init mem_init(void)
{
#ifdef CONFIG_HIGHMEM
#ifdef CONFIG_DISCONTIGMEM
#error "CONFIG_HIGHMEM and CONFIG_DISCONTIGMEM dont work together yet"
#endif
	if (highend_pfn)
		max_mapnr = highend_pfn;
	else
		max_mapnr = max_low_pfn;
#else
	max_mapnr = max_low_pfn;
#endif
	high_memory = (void *) __va(max_low_pfn << PAGE_SHIFT);

	maar_init();
	free_all_bootmem();
	/* Setup zeroed pages. */
	setup_zero_pages();
	mem_init_free_highmem();
	mem_init_print_info(NULL);

#ifdef CONFIG_64BIT
	if ((unsigned long) &_text > (unsigned long) CKSEG0) {
		/*
		 * The -4 is a hack so that user tools don't have to handle
		 * the overflow.
		 */
		kclist_add(&kcore_kseg0, (void *) CKSEG0,
				0x80000000 - 4, KCORE_TEXT);
	}
#endif
}
479
#endif /* !CONFIG_NEED_MULTIPLE_NODES */
L
Linus Torvalds 已提交
480

481
void free_init_pages(const char *what, unsigned long begin, unsigned long end)
482
{
483
	unsigned long pfn;
484

485 486 487 488 489
	for (pfn = PFN_UP(begin); pfn < PFN_DOWN(end); pfn++) {
		struct page *page = pfn_to_page(pfn);
		void *addr = phys_to_virt(PFN_PHYS(pfn));

		memset(addr, POISON_FREE_INITMEM, PAGE_SIZE);
490
		free_reserved_page(page);
491 492 493 494
	}
	printk(KERN_INFO "Freeing %s: %ldk freed\n", what, (end - begin) >> 10);
}

L
Linus Torvalds 已提交
495 496 497
#ifdef CONFIG_BLK_DEV_INITRD
/*
 * Release the initrd range [@start, @end) through free_reserved_area(),
 * poisoning it with POISON_FREE_INITMEM and labelling it "initrd".
 */
void free_initrd_mem(unsigned long start, unsigned long end)
{
	void *first = (void *)start;
	void *last = (void *)end;

	free_reserved_area(first, last, POISON_FREE_INITMEM, "initrd");
}
#endif

503 504
/*
 * Optional hook for freeing the init section.  When non-NULL, free_initmem()
 * calls it with the bounds of the init section instead of using
 * free_initmem_default().
 */
void (*free_init_pages_eva)(void *begin, void *end) = NULL;

505
/*
 * Release PROM memory via prom_free_prom_memory(), then free the init
 * section, either through the free_init_pages_eva hook when it is set or
 * through free_initmem_default() otherwise.
 */
void __ref free_initmem(void)
{
	prom_free_prom_memory();

	if (!free_init_pages_eva) {
		free_initmem_default(POISON_FREE_INITMEM);
		return;
	}

	/*
	 * Let the platform define a specific function to free the
	 * init section since EVA may have used any possible mapping
	 * between virtual and physical addresses.
	 */
	free_init_pages_eva((void *)&__init_begin, (void *)&__init_end);
}
518

519
#ifndef CONFIG_MIPS_PGD_C0_CONTEXT
520
unsigned long pgd_current[NR_CPUS];
521
#endif
R
Ralf Baechle 已提交
522 523 524 525 526

/*
 * gcc 3.3 and older have trouble determining that PTRS_PER_PGD and PGD_ORDER
 * are constants.  So we use the variants from asm-offsets.h until that gcc
 * will officially be retired.
 *
 * Align swapper_pg_dir to 64K; this allows its address to be loaded
 * with a single LUI instruction in the TLB handlers.  If we used
 * __aligned(64K), its size would get rounded up to the alignment
 * size, and waste space.  So we place it in its own section and align
 * it in the linker script.
 */
534
pgd_t swapper_pg_dir[_PTRS_PER_PGD] __section(.bss..swapper_pg_dir);
535 536 537
#ifndef __PAGETABLE_PUD_FOLDED
pud_t invalid_pud_table[PTRS_PER_PUD] __page_aligned_bss;
#endif
538
#ifndef __PAGETABLE_PMD_FOLDED
539
pmd_t invalid_pmd_table[PTRS_PER_PMD] __page_aligned_bss;
540
EXPORT_SYMBOL_GPL(invalid_pmd_table);
541
#endif
542
pte_t invalid_pte_table[PTRS_PER_PTE] __page_aligned_bss;
543
EXPORT_SYMBOL(invalid_pte_table);