lpar.c 14.1 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
/*
 * pSeries_lpar.c
 * Copyright (C) 2001 Todd Inglett, IBM Corporation
 *
 * pSeries LPAR support.
 * 
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 * 
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 * 
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 */

/* Define DEBUG_LOW instead of undefining it to route DBG_LOW() to udbg_printf(). */
#undef DEBUG_LOW

#include <linux/kernel.h>
#include <linux/dma-mapping.h>
#include <linux/console.h>
#include <asm/processor.h>
#include <asm/mmu.h>
#include <asm/page.h>
#include <asm/pgtable.h>
#include <asm/machdep.h>
#include <asm/abs_addr.h>
#include <asm/mmu_context.h>
#include <asm/iommu.h>
#include <asm/tlbflush.h>
#include <asm/tlb.h>
#include <asm/prom.h>
#include <asm/cputable.h>
#include <asm/udbg.h>
#include <asm/smp.h>

#include "plpar_wrappers.h"

/*
 * Low-level trace helper: forwards its arguments to udbg_printf() when
 * DEBUG_LOW is defined, and expands to an empty statement otherwise.
 */
#ifdef DEBUG_LOW
#define DBG_LOW(fmt...) do { udbg_printf(fmt); } while (0)
#else
#define DBG_LOW(fmt...) do { } while (0)
#endif

/* The hypervisor call entry points exported here live in hvCall.S. */
EXPORT_SYMBOL(plpar_hcall);
EXPORT_SYMBOL(plpar_hcall9);
EXPORT_SYMBOL(plpar_hcall_norets);

extern void pSeries_find_serial_port(void);


/* Virtual terminal number used by the udbg console routines in this file. */
int vtermno;

/* Force alignment of a local object to the size of a long. */
#define __ALIGNED__ __attribute__((__aligned__(sizeof(long))))
62
static void udbg_hvsi_putc(char c)
L
Linus Torvalds 已提交
63 64 65 66 67 68 69 70 71 72
{
	/* packet's seqno isn't used anyways */
	uint8_t packet[] __ALIGNED__ = { 0xff, 5, 0, 0, c };
	int rc;

	if (c == '\n')
		udbg_hvsi_putc('\r');

	do {
		rc = plpar_put_term_char(vtermno, sizeof(packet), packet);
73
	} while (rc == H_BUSY);
L
Linus Torvalds 已提交
74 75 76 77 78 79 80 81 82 83 84 85
}

static long hvsi_udbg_buf_len;
static uint8_t hvsi_udbg_buf[256];

static int udbg_hvsi_getc_poll(void)
{
	unsigned char ch;
	int rc, i;

	if (hvsi_udbg_buf_len == 0) {
		rc = plpar_get_term_char(vtermno, &hvsi_udbg_buf_len, hvsi_udbg_buf);
86
		if (rc != H_SUCCESS || hvsi_udbg_buf[0] != 0xff) {
L
Linus Torvalds 已提交
87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112
			/* bad read or non-data packet */
			hvsi_udbg_buf_len = 0;
		} else {
			/* remove the packet header */
			for (i = 4; i < hvsi_udbg_buf_len; i++)
				hvsi_udbg_buf[i-4] = hvsi_udbg_buf[i];
			hvsi_udbg_buf_len -= 4;
		}
	}

	if (hvsi_udbg_buf_len <= 0 || hvsi_udbg_buf_len > 256) {
		/* no data ready */
		hvsi_udbg_buf_len = 0;
		return -1;
	}

	ch = hvsi_udbg_buf[0];
	/* shift remaining data down */
	for (i = 1; i < hvsi_udbg_buf_len; i++) {
		hvsi_udbg_buf[i-1] = hvsi_udbg_buf[i];
	}
	hvsi_udbg_buf_len--;

	return ch;
}

/*
 * Blocking read: poll udbg_hvsi_getc_poll() until it yields a character,
 * spinning through a fixed-length delay loop after every empty poll.
 */
static int udbg_hvsi_getc(void)
{
	int ch;

	while ((ch = udbg_hvsi_getc_poll()) == -1) {
		/* This shouldn't be needed...but... */
		volatile unsigned long delay;

		for (delay = 0; delay < 2000000; delay++)
			;
	}

	return ch;
}

129
static void udbg_putcLP(char c)
L
Linus Torvalds 已提交
130 131 132 133 134 135 136 137 138 139
{
	char buf[16];
	unsigned long rc;

	if (c == '\n')
		udbg_putcLP('\r');

	buf[0] = c;
	do {
		rc = plpar_put_term_char(vtermno, 1, buf);
140
	} while(rc == H_BUSY);
L
Linus Torvalds 已提交
141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158
}

/* Buffered chars getc */
static long inbuflen;
static long inbuf[2];	/* must be 2 longs */

static int udbg_getc_pollLP(void)
{
	/* The interface is tricky because it may return up to 16 chars.
	 * We save them statically for future calls to udbg_getc().
	 */
	char ch, *buf = (char *)inbuf;
	int i;
	long rc;
	if (inbuflen == 0) {
		/* get some more chars. */
		inbuflen = 0;
		rc = plpar_get_term_char(vtermno, &inbuflen, buf);
159
		if (rc != H_SUCCESS)
L
Linus Torvalds 已提交
160 161 162 163 164 165 166 167 168 169 170 171 172 173
			inbuflen = 0;	/* otherwise inbuflen is garbage */
	}
	if (inbuflen <= 0 || inbuflen > 16) {
		/* Catch error case as well as other oddities (corruption) */
		inbuflen = 0;
		return -1;
	}
	ch = buf[0];
	for (i = 1; i < inbuflen; i++)	/* shuffle them down. */
		buf[i-1] = buf[i];
	inbuflen--;
	return ch;
}

/*
 * Blocking read: poll udbg_getc_pollLP() until it yields a character,
 * spinning through a fixed-length delay loop after every empty poll.
 */
static int udbg_getcLP(void)
{
	int ch;

	while ((ch = udbg_getc_pollLP()) == -1) {
		/* This shouldn't be needed...but... */
		volatile unsigned long delay;

		for (delay = 0; delay < 2000000; delay++)
			;
	}

	return ch;
}

/* call this from early_init() for a working debug console on
 * vterm capable LPAR machines
 */
193
void __init udbg_init_debug_lpar(void)
L
Linus Torvalds 已提交
194 195
{
	vtermno = 0;
196 197 198
	udbg_putc = udbg_putcLP;
	udbg_getc = udbg_getcLP;
	udbg_getc_poll = udbg_getc_pollLP;
L
Linus Torvalds 已提交
199 200 201
}

/* returns 0 if couldn't find or use /chosen/stdout as console */
202
void __init find_udbg_vterm(void)
L
Linus Torvalds 已提交
203 204
{
	struct device_node *stdout_node;
205 206
	const u32 *termno;
	const char *name;
207
	int add_console;
L
Linus Torvalds 已提交
208 209 210

	/* find the boot console from /chosen/stdout */
	if (!of_chosen)
211
		return;
212
	name = get_property(of_chosen, "linux,stdout-path", NULL);
L
Linus Torvalds 已提交
213
	if (name == NULL)
214
		return;
L
Linus Torvalds 已提交
215 216
	stdout_node = of_find_node_by_path(name);
	if (!stdout_node)
217
		return;
218
	name = get_property(stdout_node, "name", NULL);
L
Linus Torvalds 已提交
219 220 221 222
	if (!name) {
		printk(KERN_WARNING "stdout node missing 'name' property!\n");
		goto out;
	}
223 224
	/* The user has requested a console so this is already set up. */
	add_console = !strstr(cmd_line, "console=");
L
Linus Torvalds 已提交
225

226 227 228
	/* Check if it's a virtual terminal */
	if (strncmp(name, "vty", 3) != 0)
		goto out;
229
	termno = get_property(stdout_node, "reg", NULL);
230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246
	if (termno == NULL)
		goto out;
	vtermno = termno[0];

	if (device_is_compatible(stdout_node, "hvterm1")) {
		udbg_putc = udbg_putcLP;
		udbg_getc = udbg_getcLP;
		udbg_getc_poll = udbg_getc_pollLP;
		if (add_console)
			add_preferred_console("hvc", termno[0] & 0xff, NULL);
	} else if (device_is_compatible(stdout_node, "hvterm-protocol")) {
		vtermno = termno[0];
		udbg_putc = udbg_hvsi_putc;
		udbg_getc = udbg_hvsi_getc;
		udbg_getc_poll = udbg_hvsi_getc_poll;
		if (add_console)
			add_preferred_console("hvsi", termno[0] & 0xff, NULL);
L
Linus Torvalds 已提交
247 248 249 250 251 252 253 254
	}
out:
	of_node_put(stdout_node);
}

void vpa_init(int cpu)
{
	int hwcpu = get_hard_smp_processor_id(cpu);
255
	unsigned long addr;
L
Linus Torvalds 已提交
256
	long ret;
257 258

	if (cpu_has_feature(CPU_FTR_ALTIVEC))
259
		lppaca[cpu].vmxregs_in_use = 1;
260

261 262
	addr = __pa(&lppaca[cpu]);
	ret = register_vpa(hwcpu, addr);
L
Linus Torvalds 已提交
263

264
	if (ret) {
L
Linus Torvalds 已提交
265 266
		printk(KERN_ERR "WARNING: vpa_init: VPA registration for "
				"cpu %d (hw %d) of area %lx returns %ld\n",
267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282
				cpu, hwcpu, addr, ret);
		return;
	}
	/*
	 * PAPR says this feature is SLB-Buffer but firmware never
	 * reports that.  All SPLPAR support SLB shadow buffer.
	 */
	addr = __pa(&slb_shadow[cpu]);
	if (firmware_has_feature(FW_FEATURE_SPLPAR)) {
		ret = register_slb_shadow(hwcpu, addr);
		if (ret)
			printk(KERN_ERR
			       "WARNING: vpa_init: SLB shadow buffer "
			       "registration for cpu %d (hw %d) of area %lx "
			       "returns %ld\n", cpu, hwcpu, addr, ret);
	}
L
Linus Torvalds 已提交
283 284
}

285
static long pSeries_lpar_hpte_insert(unsigned long hpte_group,
286 287 288
 			      unsigned long va, unsigned long pa,
 			      unsigned long rflags, unsigned long vflags,
 			      int psize)
L
Linus Torvalds 已提交
289 290 291 292
{
	unsigned long lpar_rc;
	unsigned long flags;
	unsigned long slot;
293
	unsigned long hpte_v, hpte_r;
L
Linus Torvalds 已提交
294

295 296 297 298 299 300 301 302 303 304 305
	if (!(vflags & HPTE_V_BOLTED))
		DBG_LOW("hpte_insert(group=%lx, va=%016lx, pa=%016lx, "
			"rflags=%lx, vflags=%lx, psize=%d)\n",
		hpte_group, va, pa, rflags, vflags, psize);

 	hpte_v = hpte_encode_v(va, psize) | vflags | HPTE_V_VALID;
	hpte_r = hpte_encode_r(pa, psize) | rflags;

	if (!(vflags & HPTE_V_BOLTED))
		DBG_LOW(" hpte_v=%016lx, hpte_r=%016lx\n", hpte_v, hpte_r);

L
Linus Torvalds 已提交
306 307 308 309 310 311 312 313
	/* Now fill in the actual HPTE */
	/* Set CEC cookie to 0         */
	/* Zero page = 0               */
	/* I-cache Invalidate = 0      */
	/* I-cache synchronize = 0     */
	/* Exact = 0                   */
	flags = 0;

314
	/* Make pHyp happy */
315 316
	if (rflags & (_PAGE_GUARDED|_PAGE_NO_CACHE))
		hpte_r &= ~_PAGE_COHERENT;
L
Linus Torvalds 已提交
317

318
	lpar_rc = plpar_pte_enter(flags, hpte_group, hpte_v, hpte_r, &slot);
319
	if (unlikely(lpar_rc == H_PTEG_FULL)) {
320 321
		if (!(vflags & HPTE_V_BOLTED))
			DBG_LOW(" full\n");
L
Linus Torvalds 已提交
322
		return -1;
323
	}
L
Linus Torvalds 已提交
324 325 326 327 328 329

	/*
	 * Since we try and ioremap PHBs we don't own, the pte insert
	 * will fail. However we must catch the failure in hash_page
	 * or we will loop forever, so return -2 in this case.
	 */
330
	if (unlikely(lpar_rc != H_SUCCESS)) {
331 332
		if (!(vflags & HPTE_V_BOLTED))
			DBG_LOW(" lpar err %d\n", lpar_rc);
L
Linus Torvalds 已提交
333
		return -2;
334 335 336
	}
	if (!(vflags & HPTE_V_BOLTED))
		DBG_LOW(" -> slot: %d\n", slot & 7);
L
Linus Torvalds 已提交
337 338 339 340

	/* Because of iSeries, we have to pass down the secondary
	 * bucket bit here as well
	 */
341
	return (slot & 7) | (!!(vflags & HPTE_V_SECONDARY) << 3);
L
Linus Torvalds 已提交
342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360
}

/*
 * Held (with interrupts disabled) around the bulk flush in
 * pSeries_lpar_flush_hash_range() on CPUs without CPU_FTR_LOCKLESS_TLBIE.
 */
static DEFINE_SPINLOCK(pSeries_lpar_tlbie_lock);

static long pSeries_lpar_hpte_remove(unsigned long hpte_group)
{
	unsigned long slot_offset;
	unsigned long lpar_rc;
	int i;
	unsigned long dummy1, dummy2;

	/* pick a random slot to start at */
	slot_offset = mftb() & 0x7;

	for (i = 0; i < HPTES_PER_GROUP; i++) {

		/* don't remove a bolted entry */
		lpar_rc = plpar_pte_remove(H_ANDCOND, hpte_group + slot_offset,
					   (0x1UL << 4), &dummy1, &dummy2);
361
		if (lpar_rc == H_SUCCESS)
L
Linus Torvalds 已提交
362
			return i;
363
		BUG_ON(lpar_rc != H_NOT_FOUND);
L
Linus Torvalds 已提交
364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389

		slot_offset++;
		slot_offset &= 0x7;
	}

	return -1;
}

/*
 * Ask the hypervisor to remove every entry of the hash page table, one
 * slot at a time.  The table holds (1 << ppc64_pft_size) bytes and each
 * entry is counted as 16 bytes.  Return codes of the individual removals
 * are ignored.
 */
static void pSeries_lpar_hptab_clear(void)
{
	unsigned long size_bytes = 1UL << ppc64_pft_size;
	unsigned long hpte_count = size_bytes >> 4;
	unsigned long dummy1, dummy2;
	/* same width as hpte_count so large tables cannot overflow the index */
	unsigned long i;

	/* TODO: Use bulk call */
	for (i = 0; i < hpte_count; i++)
		plpar_pte_remove(0, i, 0, &dummy1, &dummy2);
}

/*
 * NOTE: for updatepp ops we are fortunate that the linux "newpp" bits and
 * the low 3 bits of flags happen to line up.  So no transform is needed.
 * We can probably optimize here and assume the high bits of newpp are
 * already zero.  For now I am paranoid.
 */
390 391 392 393
static long pSeries_lpar_hpte_updatepp(unsigned long slot,
				       unsigned long newpp,
				       unsigned long va,
				       int psize, int local)
L
Linus Torvalds 已提交
394 395 396
{
	unsigned long lpar_rc;
	unsigned long flags = (newpp & 7) | H_AVPN;
397
	unsigned long want_v;
L
Linus Torvalds 已提交
398

399
	want_v = hpte_encode_v(va, psize);
L
Linus Torvalds 已提交
400

401 402
	DBG_LOW("    update: avpnv=%016lx, hash=%016lx, f=%x, psize: %d ... ",
		want_v & HPTE_V_AVPN, slot, flags, psize);
L
Linus Torvalds 已提交
403

404 405
	lpar_rc = plpar_pte_protect(flags, slot, want_v & HPTE_V_AVPN);

406
	if (lpar_rc == H_NOT_FOUND) {
407
		DBG_LOW("not found !\n");
L
Linus Torvalds 已提交
408
		return -1;
409 410 411
	}

	DBG_LOW("ok\n");
L
Linus Torvalds 已提交
412

413
	BUG_ON(lpar_rc != H_SUCCESS);
L
Linus Torvalds 已提交
414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431

	return 0;
}

static unsigned long pSeries_lpar_hpte_getword0(unsigned long slot)
{
	unsigned long dword0;
	unsigned long lpar_rc;
	unsigned long dummy_word1;
	unsigned long flags;

	/* Read 1 pte at a time                        */
	/* Do not need RPN to logical page translation */
	/* No cross CEC PFT access                     */
	flags = 0;

	lpar_rc = plpar_pte_read(flags, slot, &dword0, &dummy_word1);

432
	BUG_ON(lpar_rc != H_SUCCESS);
L
Linus Torvalds 已提交
433 434 435 436

	return dword0;
}

437
static long pSeries_lpar_hpte_find(unsigned long va, int psize)
L
Linus Torvalds 已提交
438 439 440 441
{
	unsigned long hash;
	unsigned long i, j;
	long slot;
442
	unsigned long want_v, hpte_v;
L
Linus Torvalds 已提交
443

444 445
	hash = hpt_hash(va, mmu_psize_defs[psize].shift);
	want_v = hpte_encode_v(va, psize);
L
Linus Torvalds 已提交
446 447 448 449

	for (j = 0; j < 2; j++) {
		slot = (hash & htab_hash_mask) * HPTES_PER_GROUP;
		for (i = 0; i < HPTES_PER_GROUP; i++) {
450
			hpte_v = pSeries_lpar_hpte_getword0(slot);
L
Linus Torvalds 已提交
451

452
			if (HPTE_V_COMPARE(hpte_v, want_v)
453 454
			    && (hpte_v & HPTE_V_VALID)
			    && (!!(hpte_v & HPTE_V_SECONDARY) == j)) {
L
Linus Torvalds 已提交
455 456 457 458 459 460 461 462 463 464 465 466 467 468
				/* HPTE matches */
				if (j)
					slot = -slot;
				return slot;
			}
			++slot;
		}
		hash = ~hash;
	}

	return -1;
} 

static void pSeries_lpar_hpte_updateboltedpp(unsigned long newpp,
469 470
					     unsigned long ea,
					     int psize)
L
Linus Torvalds 已提交
471
{
472
	unsigned long lpar_rc, slot, vsid, va, flags;
L
Linus Torvalds 已提交
473 474 475 476

	vsid = get_kernel_vsid(ea);
	va = (vsid << 28) | (ea & 0x0fffffff);

477
	slot = pSeries_lpar_hpte_find(va, psize);
L
Linus Torvalds 已提交
478 479 480 481 482
	BUG_ON(slot == -1);

	flags = newpp & 7;
	lpar_rc = plpar_pte_protect(flags, slot, 0);

483
	BUG_ON(lpar_rc != H_SUCCESS);
L
Linus Torvalds 已提交
484 485 486
}

static void pSeries_lpar_hpte_invalidate(unsigned long slot, unsigned long va,
487
					 int psize, int local)
L
Linus Torvalds 已提交
488
{
489
	unsigned long want_v;
L
Linus Torvalds 已提交
490 491 492
	unsigned long lpar_rc;
	unsigned long dummy1, dummy2;

493 494
	DBG_LOW("    inval : slot=%lx, va=%016lx, psize: %d, local: %d",
		slot, va, psize, local);
L
Linus Torvalds 已提交
495

496 497 498
	want_v = hpte_encode_v(va, psize);
	lpar_rc = plpar_pte_remove(H_AVPN, slot, want_v & HPTE_V_AVPN,
				   &dummy1, &dummy2);
499
	if (lpar_rc == H_NOT_FOUND)
L
Linus Torvalds 已提交
500 501
		return;

502
	BUG_ON(lpar_rc != H_SUCCESS);
L
Linus Torvalds 已提交
503 504
}

/*
 * Flag bits for H_BULK_REMOVE, OR-ed into the first word of each
 * request pair.
 */
#define HBR_REQUEST	0x4000000000000000UL
#define HBR_RESPONSE	0x8000000000000000UL
#define HBR_END		0xc000000000000000UL
#define HBR_AVPN	0x0200000000000000UL
#define HBR_ANDCOND	0x0100000000000000UL

L
Linus Torvalds 已提交
512 513 514 515
/*
 * Take a spinlock around flushes to avoid bouncing the hypervisor tlbie
 * lock.
 */
516
static void pSeries_lpar_flush_hash_range(unsigned long number, int local)
L
Linus Torvalds 已提交
517
{
518 519
	unsigned long i, pix, rc;
	unsigned long flags;
L
Linus Torvalds 已提交
520 521
	struct ppc64_tlb_batch *batch = &__get_cpu_var(ppc64_tlb_batch);
	int lock_tlbie = !cpu_has_feature(CPU_FTR_LOCKLESS_TLBIE);
522 523 524 525 526
	unsigned long param[9];
	unsigned long va;
	unsigned long hash, index, shift, hidx, slot;
	real_pte_t pte;
	int psize;
L
Linus Torvalds 已提交
527 528 529 530

	if (lock_tlbie)
		spin_lock_irqsave(&pSeries_lpar_tlbie_lock, flags);

531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562
	psize = batch->psize;
	pix = 0;
	for (i = 0; i < number; i++) {
		va = batch->vaddr[i];
		pte = batch->pte[i];
		pte_iterate_hashed_subpages(pte, psize, va, index, shift) {
			hash = hpt_hash(va, shift);
			hidx = __rpte_to_hidx(pte, index);
			if (hidx & _PTEIDX_SECONDARY)
				hash = ~hash;
			slot = (hash & htab_hash_mask) * HPTES_PER_GROUP;
			slot += hidx & _PTEIDX_GROUP_IX;
			param[pix] = HBR_REQUEST | HBR_AVPN | slot;
			param[pix+1] = hpte_encode_v(va, psize) & HPTE_V_AVPN;
			pix += 2;
			if (pix == 8) {
				rc = plpar_hcall9(H_BULK_REMOVE, param,
						param[0], param[1], param[2],
						param[3], param[4], param[5],
						param[6], param[7]);
				BUG_ON(rc != H_SUCCESS);
				pix = 0;
			}
		} pte_iterate_hashed_end();
	}
	if (pix) {
		param[pix] = HBR_END;
		rc = plpar_hcall9(H_BULK_REMOVE, param, param[0], param[1],
				  param[2], param[3], param[4], param[5],
				  param[6], param[7]);
		BUG_ON(rc != H_SUCCESS);
	}
L
Linus Torvalds 已提交
563 564 565 566 567

	if (lock_tlbie)
		spin_unlock_irqrestore(&pSeries_lpar_tlbie_lock, flags);
}

568
void __init hpte_init_lpar(void)
L
Linus Torvalds 已提交
569 570 571 572 573 574 575 576 577
{
	ppc_md.hpte_invalidate	= pSeries_lpar_hpte_invalidate;
	ppc_md.hpte_updatepp	= pSeries_lpar_hpte_updatepp;
	ppc_md.hpte_updateboltedpp = pSeries_lpar_hpte_updateboltedpp;
	ppc_md.hpte_insert	= pSeries_lpar_hpte_insert;
	ppc_md.hpte_remove	= pSeries_lpar_hpte_remove;
	ppc_md.flush_hash_range	= pSeries_lpar_flush_hash_range;
	ppc_md.hpte_clear_all   = pSeries_lpar_hptab_clear;
}