init.c 13.4 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10
/*
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file "COPYING" in the main directory of this archive
 * for more details.
 *
 * Copyright (C) 1994 - 2000 Ralf Baechle
 * Copyright (C) 1999, 2000 Silicon Graphics, Inc.
 * Kevin D. Kissell, kevink@mips.com and Carsten Langgaard, carstenl@mips.com
 * Copyright (C) 2000 MIPS Technologies, Inc.  All rights reserved.
 */
11
#include <linux/bug.h>
L
Linus Torvalds 已提交
12
#include <linux/init.h>
13
#include <linux/export.h>
L
Linus Torvalds 已提交
14 15
#include <linux/signal.h>
#include <linux/sched.h>
16
#include <linux/smp.h>
L
Linus Torvalds 已提交
17 18 19 20 21 22 23 24 25 26 27
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/string.h>
#include <linux/types.h>
#include <linux/pagemap.h>
#include <linux/ptrace.h>
#include <linux/mman.h>
#include <linux/mm.h>
#include <linux/bootmem.h>
#include <linux/highmem.h>
#include <linux/swap.h>
28
#include <linux/proc_fs.h>
D
Dave Hansen 已提交
29
#include <linux/pfn.h>
30
#include <linux/hardirq.h>
31
#include <linux/gfp.h>
32
#include <linux/kcore.h>
33
#include <linux/export.h>
L
Linus Torvalds 已提交
34

R
Ralf Baechle 已提交
35
#include <asm/asm-offsets.h>
L
Linus Torvalds 已提交
36 37 38 39
#include <asm/bootinfo.h>
#include <asm/cachectl.h>
#include <asm/cpu.h>
#include <asm/dma.h>
40
#include <asm/kmap_types.h>
41
#include <asm/maar.h>
L
Linus Torvalds 已提交
42 43 44 45 46
#include <asm/mmu_context.h>
#include <asm/sections.h>
#include <asm/pgtable.h>
#include <asm/pgalloc.h>
#include <asm/tlb.h>
47
#include <asm/fixmap.h>
48
#include <asm/maar.h>
49

L
Linus Torvalds 已提交
50 51
/*
 * Up to 8 empty zeroed pages are kept so that one of the right colour can be
 * mapped when needed.  This is necessary only on R4000 / R4400 SC and MC
 * versions, where VCED / VCEI exceptions have to be avoided at any price for
 * good performance.  Since the page is never written to after initialization,
 * aliases on other CPUs are not a concern.
 */
unsigned long empty_zero_page;
unsigned long zero_page_mask;
EXPORT_SYMBOL_GPL(empty_zero_page);
EXPORT_SYMBOL(zero_page_mask);
L
Linus Torvalds 已提交
60 61 62 63

/*
 * Not static inline because used by IP27 special magic initialization code
 */
64
void setup_zero_pages(void)
L
Linus Torvalds 已提交
65
{
66
	unsigned int order, i;
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74 75 76 77
	struct page *page;

	if (cpu_has_vce)
		order = 3;
	else
		order = 0;

	empty_zero_page = __get_free_pages(GFP_KERNEL | __GFP_ZERO, order);
	if (!empty_zero_page)
		panic("Oh boy, that early out of memory?");

78
	page = virt_to_page((void *)empty_zero_page);
N
Nick Piggin 已提交
79
	split_page(page, order);
80 81
	for (i = 0; i < (1 << order); i++, page++)
		mark_page_reserved(page);
L
Linus Torvalds 已提交
82

83
	zero_page_mask = ((PAGE_SIZE << order) - 1) & PAGE_MASK;
L
Linus Torvalds 已提交
84 85
}

86
/*
 * Map @page with protection @prot through an extra wired TLB entry and return
 * the virtual address of the mapping.
 *
 * The address is a fixmap slot selected from the low page-number bits of
 * @addr; a second set of slots is used when called in interrupt context.
 * Preemption and page faults are disabled here and are still disabled on
 * return; kunmap_coherent() re-enables them.  The page must not be marked
 * dcache-dirty (BUG otherwise).
 */
static void *__kmap_pgprot(struct page *page, unsigned long addr, pgprot_t prot)
{
	enum fixed_addresses idx;
	unsigned long vaddr, irqflags, entrylo;
	unsigned long saved_entryhi;
	pte_t pte;
	int wired;

	BUG_ON(Page_dcache_dirty(page));

	preempt_disable();
	pagefault_disable();

	/* Choose the fixmap slot matching the colour of the target address. */
	idx = (addr >> PAGE_SHIFT) & (FIX_N_COLOURS - 1);
	if (in_interrupt())
		idx += FIX_N_COLOURS;
	vaddr = __fix_to_virt(FIX_CMAP_END - idx);

	/* Build the EntryLo value for this page/protection pair. */
	pte = mk_pte(page, prot);
#if defined(CONFIG_XPA)
	entrylo = pte_to_entrylo(pte.pte_high);
#elif defined(CONFIG_PHYS_ADDR_T_64BIT) && defined(CONFIG_CPU_MIPS32)
	entrylo = pte.pte_high;
#else
	entrylo = pte_to_entrylo(pte_val(pte));
#endif

	local_irq_save(irqflags);
	saved_entryhi = read_c0_entryhi();
	write_c0_entryhi(vaddr & (PAGE_MASK << 1));
	/* The same EntryLo value goes into both halves of the TLB entry. */
	write_c0_entrylo0(entrylo);
	write_c0_entrylo1(entrylo);
#ifdef CONFIG_XPA
	if (cpu_has_xpa) {
		entrylo = (pte.pte_low & _PFNX_MASK);
		writex_c0_entrylo0(entrylo);
		writex_c0_entrylo1(entrylo);
	}
#endif
	/* Grow the wired region by one and write the entry into the new slot. */
	wired = num_wired_entries();
	write_c0_wired(wired + 1);
	write_c0_index(wired);
	mtc0_tlbw_hazard();
	tlb_write_indexed();
	tlbw_use_hazard();
	write_c0_entryhi(saved_entryhi);
	local_irq_restore(irqflags);

	return (void *)vaddr;
}

134 135 136 137 138 139 140 141 142 143
/*
 * Map @page at an address chosen from @addr using the PAGE_KERNEL protection.
 * Thin wrapper around __kmap_pgprot(); undo with kunmap_coherent().
 */
void *kmap_coherent(struct page *page, unsigned long addr)
{
	void *mapping = __kmap_pgprot(page, addr, PAGE_KERNEL);

	return mapping;
}

/*
 * Map @page at an address chosen from @addr using the PAGE_KERNEL_NC
 * protection.  Thin wrapper around __kmap_pgprot().
 */
void *kmap_noncoherent(struct page *page, unsigned long addr)
{
	void *mapping = __kmap_pgprot(page, addr, PAGE_KERNEL_NC);

	return mapping;
}

144
/*
 * Tear down the most recently added wired TLB entry: shrink the wired count
 * by one, overwrite that slot with UNIQUE_ENTRYHI() and zeroed EntryLo values,
 * then re-enable page faults and preemption.
 */
void kunmap_coherent(void)
{
	unsigned int slot;
	unsigned long irqflags, saved_entryhi;

	local_irq_save(irqflags);
	saved_entryhi = read_c0_entryhi();

	/* The entry being dropped is the last one in the wired region. */
	slot = num_wired_entries() - 1;
	write_c0_wired(slot);
	write_c0_index(slot);
	write_c0_entryhi(UNIQUE_ENTRYHI(slot));
	write_c0_entrylo0(0);
	write_c0_entrylo1(0);
	mtc0_tlbw_hazard();
	tlb_write_indexed();
	tlbw_use_hazard();

	write_c0_entryhi(saved_entryhi);
	local_irq_restore(irqflags);

	pagefault_enable();
	preempt_enable();
}

166 167 168 169 170
void copy_user_highpage(struct page *to, struct page *from,
	unsigned long vaddr, struct vm_area_struct *vma)
{
	void *vfrom, *vto;

171
	vto = kmap_atomic(to);
172
	if (cpu_has_dc_aliases &&
173
	    page_mapcount(from) && !Page_dcache_dirty(from)) {
174 175
		vfrom = kmap_coherent(from, vaddr);
		copy_page(vto, vfrom);
176
		kunmap_coherent();
177
	} else {
178
		vfrom = kmap_atomic(from);
179
		copy_page(vto, vfrom);
180
		kunmap_atomic(vfrom);
181
	}
182
	if ((!cpu_has_ic_fills_f_dc) ||
183 184
	    pages_do_alias((unsigned long)vto, vaddr & PAGE_MASK))
		flush_data_cache_page((unsigned long)vto);
185
	kunmap_atomic(vto);
186 187 188 189
	/* Make sure this page is cleared on other CPU's too before using it */
	smp_wmb();
}

190 191 192 193
void copy_to_user_page(struct vm_area_struct *vma,
	struct page *page, unsigned long vaddr, void *dst, const void *src,
	unsigned long len)
{
194
	if (cpu_has_dc_aliases &&
195
	    page_mapcount(page) && !Page_dcache_dirty(page)) {
196 197
		void *vto = kmap_coherent(page, vaddr) + (vaddr & ~PAGE_MASK);
		memcpy(vto, src, len);
198
		kunmap_coherent();
199
	} else {
200
		memcpy(dst, src, len);
201 202 203
		if (cpu_has_dc_aliases)
			SetPageDcacheDirty(page);
	}
204
	if (vma->vm_flags & VM_EXEC)
205 206 207 208 209 210 211
		flush_cache_page(vma, vaddr, page_to_pfn(page));
}

void copy_from_user_page(struct vm_area_struct *vma,
	struct page *page, unsigned long vaddr, void *dst, const void *src,
	unsigned long len)
{
212
	if (cpu_has_dc_aliases &&
213
	    page_mapcount(page) && !Page_dcache_dirty(page)) {
214
		void *vfrom = kmap_coherent(page, vaddr) + (vaddr & ~PAGE_MASK);
215
		memcpy(dst, vfrom, len);
216
		kunmap_coherent();
217
	} else {
218
		memcpy(dst, src, len);
219 220 221
		if (cpu_has_dc_aliases)
			SetPageDcacheDirty(page);
	}
222
}
223
EXPORT_SYMBOL_GPL(copy_from_user_page);
224

225
/*
 * Make sure a PTE table exists for every PMD entry covering [@start, @end)
 * in the page tables rooted at @pgd_base.  Empty PMD entries get a freshly
 * allocated low bootmem page.  The body is compiled only with CONFIG_HIGHMEM;
 * otherwise this function does nothing.
 */
void __init fixrange_init(unsigned long start, unsigned long end,
	pgd_t *pgd_base)
{
#ifdef CONFIG_HIGHMEM
	unsigned long vaddr = start;
	int pgd_idx = __pgd_offset(vaddr);
	int pud_idx = __pud_offset(vaddr);
	int pmd_idx = __pmd_offset(vaddr);
	pgd_t *pgd = pgd_base + pgd_idx;
	pud_t *pud;
	pmd_t *pmd;
	pte_t *pte;

	while (pgd_idx < PTRS_PER_PGD && vaddr < end) {
		pud = (pud_t *)pgd;
		while (pud_idx < PTRS_PER_PUD && vaddr < end) {
			pmd = (pmd_t *)pud;
			while (pmd_idx < PTRS_PER_PMD && vaddr < end) {
				if (pmd_none(*pmd)) {
					pte = (pte_t *) alloc_bootmem_low_pages(PAGE_SIZE);
					set_pmd(pmd, __pmd((unsigned long)pte));
					BUG_ON(pte != pte_offset_kernel(pmd, 0));
				}
				vaddr += PMD_SIZE;
				pmd++;
				pmd_idx++;
			}
			/* Later PUD entries are walked from their first PMD slot. */
			pmd_idx = 0;
			pud++;
			pud_idx++;
		}
		/* Later PGD entries are walked from their first PUD slot. */
		pud_idx = 0;
		pgd++;
		pgd_idx++;
	}
#endif
}

261 262 263 264 265 266 267 268 269 270 271 272 273 274
/*
 * Default (weak) MAAR setup: build one maar_config per RAM region of
 * boot_mem_map, shrunk inwards to 64KiB boundaries and flagged MIPS_MAAR_S,
 * and hand the list to maar_config().
 *
 * @num_pairs: number of MAAR pairs available.
 *
 * Returns the value returned by maar_config(); a warning is logged when that
 * is smaller than the number of regions built.
 */
unsigned __weak platform_maar_init(unsigned num_pairs)
{
	struct maar_config cfg[BOOT_MEM_MAP_MAX];
	unsigned idx, num_configured, num_cfg = 0;

	for (idx = 0; idx < boot_mem_map.nr_map; idx++) {
		struct maar_config *entry;

		/* Only RAM-type regions get a MAAR entry. */
		if (boot_mem_map.map[idx].type != BOOT_MEM_RAM &&
		    boot_mem_map.map[idx].type != BOOT_MEM_INIT_RAM)
			continue;

		entry = &cfg[num_cfg];

		/* Round lower up */
		entry->lower = boot_mem_map.map[idx].addr;
		entry->lower = (entry->lower + 0xffff) & ~0xffff;

		/* Round upper down */
		entry->upper = boot_mem_map.map[idx].addr +
					boot_mem_map.map[idx].size;
		entry->upper = (entry->upper & ~0xffff) - 1;

		entry->attrs = MIPS_MAAR_S;
		num_cfg++;
	}

	num_configured = maar_config(cfg, num_cfg, num_pairs);
	if (num_configured < num_cfg)
		pr_warn("Not enough MAAR pairs (%u) for all bootmem regions (%u)\n",
			num_pairs, num_cfg);

	return num_configured;
}

296
void maar_init(void)
297 298
{
	unsigned num_maars, used, i;
299
	phys_addr_t lower, upper, attr;
300 301 302 303
	static struct {
		struct maar_config cfgs[3];
		unsigned used;
	} recorded = { { { 0 } }, 0 };
304 305 306 307 308 309 310 311 312 313 314 315

	if (!cpu_has_maar)
		return;

	/* Detect the number of MAARs */
	write_c0_maari(~0);
	back_to_back_c0_hazard();
	num_maars = read_c0_maari() + 1;

	/* MAARs should be in pairs */
	WARN_ON(num_maars % 2);

316 317 318 319 320 321 322 323
	/* Set MAARs using values we recorded already */
	if (recorded.used) {
		used = maar_config(recorded.cfgs, recorded.used, num_maars / 2);
		BUG_ON(used != recorded.used);
	} else {
		/* Configure the required MAARs */
		used = platform_maar_init(num_maars / 2);
	}
324 325 326 327 328 329 330 331

	/* Disable any further MAARs */
	for (i = (used * 2); i < num_maars; i++) {
		write_c0_maari(i);
		back_to_back_c0_hazard();
		write_c0_maar(0);
		back_to_back_c0_hazard();
	}
332

333 334 335
	if (recorded.used)
		return;

336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361
	pr_info("MAAR configuration:\n");
	for (i = 0; i < num_maars; i += 2) {
		write_c0_maari(i);
		back_to_back_c0_hazard();
		upper = read_c0_maar();

		write_c0_maari(i + 1);
		back_to_back_c0_hazard();
		lower = read_c0_maar();

		attr = lower & upper;
		lower = (lower & MIPS_MAAR_ADDR) << 4;
		upper = ((upper & MIPS_MAAR_ADDR) << 4) | 0xffff;

		pr_info("  [%d]: ", i / 2);
		if (!(attr & MIPS_MAAR_V)) {
			pr_cont("disabled\n");
			continue;
		}

		pr_cont("%pa-%pa", &lower, &upper);

		if (attr & MIPS_MAAR_S)
			pr_cont(" speculate");

		pr_cont("\n");
362 363 364 365 366 367 368 369

		/* Record the setup for use on secondary CPUs */
		if (used <= ARRAY_SIZE(recorded.cfgs)) {
			recorded.cfgs[recorded.used].lower = lower;
			recorded.cfgs[recorded.used].upper = upper;
			recorded.cfgs[recorded.used].attrs = attr;
			recorded.used++;
		}
370
	}
371 372
}

373
#ifndef CONFIG_NEED_MULTIPLE_NODES
374
int page_is_ram(unsigned long pagenr)
375 376 377 378 379 380
{
	int i;

	for (i = 0; i < boot_mem_map.nr_map; i++) {
		unsigned long addr, end;

381 382 383 384 385
		switch (boot_mem_map.map[i].type) {
		case BOOT_MEM_RAM:
		case BOOT_MEM_INIT_RAM:
			break;
		default:
386 387
			/* not usable memory */
			continue;
388
		}
389 390 391 392 393 394 395 396 397 398 399 400

		addr = PFN_UP(boot_mem_map.map[i].addr);
		end = PFN_DOWN(boot_mem_map.map[i].addr +
			       boot_mem_map.map[i].size);

		if (pagenr >= addr && pagenr < end)
			return 1;
	}

	return 0;
}

L
Linus Torvalds 已提交
401 402
/*
 * Initialise the page tables, fill in the upper PFN limit of every configured
 * zone and pass the limits to free_area_init_nodes().
 *
 * With CONFIG_HIGHMEM on a CPU with dcache aliases, highmem is not used: a
 * warning is printed and the highmem zone limit is clamped to max_low_pfn.
 */
void __init paging_init(void)
{
	unsigned long zone_limit[MAX_NR_ZONES];
	unsigned long lastpfn __maybe_unused;

	pagetable_init();

#ifdef CONFIG_HIGHMEM
	kmap_init();
#endif
#ifdef CONFIG_ZONE_DMA
	zone_limit[ZONE_DMA] = MAX_DMA_PFN;
#endif
#ifdef CONFIG_ZONE_DMA32
	zone_limit[ZONE_DMA32] = MAX_DMA32_PFN;
#endif
	zone_limit[ZONE_NORMAL] = max_low_pfn;
	lastpfn = max_low_pfn;
#ifdef CONFIG_HIGHMEM
	if (cpu_has_dc_aliases && max_low_pfn != highend_pfn) {
		/* lastpfn stays at max_low_pfn: the highmem range is dropped. */
		printk(KERN_WARNING "This processor doesn't support highmem."
		       " %ldk highmem ignored\n",
		       (highend_pfn - max_low_pfn) << (PAGE_SHIFT - 10));
	} else {
		lastpfn = highend_pfn;
	}
	zone_limit[ZONE_HIGHMEM] = lastpfn;
#endif

	free_area_init_nodes(zone_limit);
}

435 436 437 438
/* kcore list entry that mem_init() registers for the CKSEG0 range (64-bit only). */
#ifdef CONFIG_64BIT
static struct kcore_list kcore_kseg0;
#endif

439
/*
 * Release every highmem page frame in [highstart_pfn, highend_pfn) that is
 * RAM and mark the rest reserved.  Does nothing without CONFIG_HIGHMEM or
 * when the CPU has dcache aliases.
 */
static inline void mem_init_free_highmem(void)
{
#ifdef CONFIG_HIGHMEM
	unsigned long pfn;

	if (cpu_has_dc_aliases)
		return;

	for (pfn = highstart_pfn; pfn < highend_pfn; pfn++) {
		struct page *page = pfn_to_page(pfn);

		if (page_is_ram(pfn))
			free_highmem_page(page);
		else
			SetPageReserved(page);
	}
#endif
}

/*
 * Memory initialisation for the single-node configuration: set max_mapnr and
 * high_memory, program the MAARs, release bootmem, set up the zero pages,
 * free highmem and print the memory summary.  On 64-bit kernels whose text
 * lies above CKSEG0, the CKSEG0 range is also added to the kcore list.
 */
void __init mem_init(void)
{
#ifdef CONFIG_HIGHMEM
#ifdef CONFIG_DISCONTIGMEM
#error "CONFIG_HIGHMEM and CONFIG_DISCONTIGMEM dont work together yet"
#endif
	if (highend_pfn)
		max_mapnr = highend_pfn;
	else
		max_mapnr = max_low_pfn;
#else
	max_mapnr = max_low_pfn;
#endif
	high_memory = (void *) __va(max_low_pfn << PAGE_SHIFT);

	maar_init();
	free_all_bootmem();
	/* Setup zeroed pages. */
	setup_zero_pages();
	mem_init_free_highmem();
	mem_init_print_info(NULL);

#ifdef CONFIG_64BIT
	if ((unsigned long) &_text > (unsigned long) CKSEG0) {
		/*
		 * The -4 is a hack so that user tools don't have to handle
		 * the overflow.
		 */
		kclist_add(&kcore_kseg0, (void *) CKSEG0,
				0x80000000 - 4, KCORE_TEXT);
	}
#endif
}
484
#endif /* !CONFIG_NEED_MULTIPLE_NODES */
L
Linus Torvalds 已提交
485

486
void free_init_pages(const char *what, unsigned long begin, unsigned long end)
487
{
488
	unsigned long pfn;
489

490 491 492 493 494
	for (pfn = PFN_UP(begin); pfn < PFN_DOWN(end); pfn++) {
		struct page *page = pfn_to_page(pfn);
		void *addr = phys_to_virt(PFN_PHYS(pfn));

		memset(addr, POISON_FREE_INITMEM, PAGE_SIZE);
495
		free_reserved_page(page);
496 497 498 499
	}
	printk(KERN_INFO "Freeing %s: %ldk freed\n", what, (end - begin) >> 10);
}

L
Linus Torvalds 已提交
500 501 502
#ifdef CONFIG_BLK_DEV_INITRD
/*
 * Release the initrd range [@start, @end) through free_reserved_area(),
 * poisoning it with POISON_FREE_INITMEM and labelling it "initrd".
 */
void free_initrd_mem(unsigned long start, unsigned long end)
{
	void *first = (void *)start;
	void *limit = (void *)end;

	free_reserved_area(first, limit, POISON_FREE_INITMEM, "initrd");
}
#endif

508 509
/*
 * Optional hook for freeing the init section; NULL unless something assigns
 * it.  free_initmem() calls it, when set, instead of free_initmem_default().
 */
void (*free_init_pages_eva)(void *begin, void *end) = NULL;

510
/*
 * Free PROM memory and then the kernel's init section.
 */
void __ref free_initmem(void)
{
	prom_free_prom_memory();

	/*
	 * A platform may install its own routine for freeing the init
	 * section, since EVA may have used any possible mapping between
	 * virtual and physical addresses.  Without one, use the default.
	 */
	if (!free_init_pages_eva) {
		free_initmem_default(POISON_FREE_INITMEM);
		return;
	}

	free_init_pages_eva((void *)&__init_begin, (void *)&__init_end);
}
523

524
#ifndef CONFIG_MIPS_PGD_C0_CONTEXT
525
unsigned long pgd_current[NR_CPUS];
526
#endif
R
Ralf Baechle 已提交
527 528 529 530 531

/*
 * gcc 3.3 and older have trouble determining that PTRS_PER_PGD and PGD_ORDER
 * are constants.  So we use the variants from asm-offset.h until that gcc
 * will officially be retired.
532 533 534 535 536 537
 *
 * Align swapper_pg_dir in to 64K, allows its address to be loaded
 * with a single LUI instruction in the TLB handlers.  If we used
 * __aligned(64K), its size would get rounded up to the alignment
 * size, and waste space.  So we place it in its own section and align
 * it in the linker script.
R
Ralf Baechle 已提交
538
 */
539
pgd_t swapper_pg_dir[_PTRS_PER_PGD] __section(.bss..swapper_pg_dir);
540 541 542
#ifndef __PAGETABLE_PUD_FOLDED
pud_t invalid_pud_table[PTRS_PER_PUD] __page_aligned_bss;
#endif
543
#ifndef __PAGETABLE_PMD_FOLDED
544
pmd_t invalid_pmd_table[PTRS_PER_PMD] __page_aligned_bss;
545
EXPORT_SYMBOL_GPL(invalid_pmd_table);
546
#endif
547
pte_t invalid_pte_table[PTRS_PER_PTE] __page_aligned_bss;
548
EXPORT_SYMBOL(invalid_pte_table);