idle_book3s.S 25.9 KB
Newer Older
1
/*
2 3
 *  This file contains idle entry/exit functions for POWER7,
 *  POWER8 and POWER9 CPUs.
4 5 6 7 8 9 10 11 12 13 14 15 16 17 18
 *
 *  This program is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU General Public License
 *  as published by the Free Software Foundation; either version
 *  2 of the License, or (at your option) any later version.
 */

#include <linux/threads.h>
#include <asm/processor.h>
#include <asm/page.h>
#include <asm/cputable.h>
#include <asm/thread_info.h>
#include <asm/ppc_asm.h>
#include <asm/asm-offsets.h>
#include <asm/ppc-opcode.h>
19
#include <asm/hw_irq.h>
20
#include <asm/kvm_book3s_asm.h>
21
#include <asm/opal.h>
22
#include <asm/cpuidle.h>
23
#include <asm/exception-64s.h>
24
#include <asm/book3s/64/mmu-hash.h>
25
#include <asm/mmu.h>
26 27 28

#undef DEBUG

29 30 31 32
/*
 * Use unused space in the interrupt stack to save and restore
 * registers for winkle support.
 */
33
#define _MMCR0	GPR0
34
#define _SDR1	GPR3
35
#define _PTCR	GPR3
36 37 38 39 40 41 42 43
#define _RPR	GPR4
#define _SPURR	GPR5
#define _PURR	GPR6
#define _TSCR	GPR7
#define _DSCR	GPR8
#define _AMOR	GPR9
#define _WORT	GPR10
#define _WORC	GPR11
44
#define _LPCR	GPR12
45

46
#define PSSCR_EC_ESL_MASK_SHIFTED          (PSSCR_EC | PSSCR_ESL) >> 16
47

48 49
	.text

50 51 52 53 54 55 56 57 58
/*
 * Used by threads before entering deep idle states. Saves SPRs
 * in interrupt stack frame
 */
save_sprs_to_stack:
	/*
	 * Note all register i.e per-core, per-subcore or per-thread is saved
	 * here since any thread in the core might wake up first
	 */
59 60 61 62 63
BEGIN_FTR_SECTION
	/*
	 * Note - SDR1 is dropped in Power ISA v3. Hence not restoring
	 * SDR1 here
	 */
64 65 66 67
	mfspr	r3,SPRN_PTCR
	std	r3,_PTCR(r1)
	mfspr	r3,SPRN_LPCR
	std	r3,_LPCR(r1)
68
FTR_SECTION_ELSE
69 70
	mfspr	r3,SPRN_SDR1
	std	r3,_SDR1(r1)
71
ALT_FTR_SECTION_END_IFSET(CPU_FTR_ARCH_300)
72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87
	mfspr	r3,SPRN_RPR
	std	r3,_RPR(r1)
	mfspr	r3,SPRN_SPURR
	std	r3,_SPURR(r1)
	mfspr	r3,SPRN_PURR
	std	r3,_PURR(r1)
	mfspr	r3,SPRN_TSCR
	std	r3,_TSCR(r1)
	mfspr	r3,SPRN_DSCR
	std	r3,_DSCR(r1)
	mfspr	r3,SPRN_AMOR
	std	r3,_AMOR(r1)
	mfspr	r3,SPRN_WORT
	std	r3,_WORT(r1)
	mfspr	r3,SPRN_WORC
	std	r3,_WORC(r1)
88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107
/*
 * On POWER9, there are idle states such as stop4, invoked via cpuidle,
 * that lose hypervisor resources. In such cases, we need to save
 * additional SPRs before entering those idle states so that they can
 * be restored to their older values on wakeup from the idle state.
 *
 * On POWER8, the only such deep idle state is winkle which is used
 * only in the context of CPU-Hotplug, where these additional SPRs are
 * reinitiazed to a sane value. Hence there is no need to save/restore
 * these SPRs.
 */
BEGIN_FTR_SECTION
	blr
END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)

power9_save_additional_sprs:
	mfspr	r3, SPRN_PID
	mfspr	r4, SPRN_LDBAR
	std	r3, STOP_PID(r13)
	std	r4, STOP_LDBAR(r13)
108

109 110 111 112 113 114
	mfspr	r3, SPRN_FSCR
	mfspr	r4, SPRN_HFSCR
	std	r3, STOP_FSCR(r13)
	std	r4, STOP_HFSCR(r13)

	mfspr	r3, SPRN_MMCRA
115
	mfspr	r4, SPRN_MMCR0
116
	std	r3, STOP_MMCRA(r13)
117
	std	r4, _MMCR0(r1)
118

119 120 121 122
	mfspr	r3, SPRN_MMCR1
	mfspr	r4, SPRN_MMCR2
	std	r3, STOP_MMCR1(r13)
	std	r4, STOP_MMCR2(r13)
123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139
	blr

power9_restore_additional_sprs:
	ld	r3,_LPCR(r1)
	ld	r4, STOP_PID(r13)
	mtspr	SPRN_LPCR,r3
	mtspr	SPRN_PID, r4

	ld	r3, STOP_LDBAR(r13)
	ld	r4, STOP_FSCR(r13)
	mtspr	SPRN_LDBAR, r3
	mtspr	SPRN_FSCR, r4

	ld	r3, STOP_HFSCR(r13)
	ld	r4, STOP_MMCRA(r13)
	mtspr	SPRN_HFSCR, r3
	mtspr	SPRN_MMCRA, r4
140 141 142 143 144 145 146 147

	ld	r3, _MMCR0(r1)
	ld	r4, STOP_MMCR1(r13)
	mtspr	SPRN_MMCR0, r3
	mtspr	SPRN_MMCR1, r4

	ld	r3, STOP_MMCR2(r13)
	mtspr	SPRN_MMCR2, r3
148 149
	blr

150 151 152 153 154
/*
 * Used by threads when the lock bit of core_idle_state is set.
 * Threads will spin in HMT_LOW until the lock bit is cleared.
 * r14 - pointer to core_idle_state
 * r15 - used to load contents of core_idle_state
155
 * r9  - used as a temporary variable
156 157 158 159 160
 */

core_idle_lock_held:
	HMT_LOW
3:	lwz	r15,0(r14)
161
	andis.	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
162 163 164
	bne	3b
	HMT_MEDIUM
	lwarx	r15,0,r14
165 166
	andis.	r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
	bne-	core_idle_lock_held
167 168
	blr

169 170
/*
 * Pass requested state in r3:
171
 *	r3 - PNV_THREAD_NAP/SLEEP/WINKLE in POWER8
172
 *	   - Requested PSSCR value in POWER9
173
 *
174
 * Address of idle handler to branch to in realmode in r4
175
 */
176
pnv_powersave_common:
177
	/* Use r3 to pass state nap/sleep/winkle */
178 179 180 181 182 183
	/* NAP is a state loss, we create a regs frame on the
	 * stack, fill it up with the state we care about and
	 * stick a pointer to it in PACAR1. We really only
	 * need to save PC, some CR bits and the NV GPRs,
	 * but for now an interrupt frame will do.
	 */
184 185
	mtctr	r4

186 187 188 189 190 191
	mflr	r0
	std	r0,16(r1)
	stdu	r1,-INT_FRAME_SIZE(r1)
	std	r0,_LINK(r1)
	std	r0,_NIP(r1)

192
	/* We haven't lost state ... yet */
193
	li	r0,0
194
	stb	r0,PACA_NAPSTATELOST(r13)
195 196 197 198

	/* Continue saving state */
	SAVE_GPR(2, r1)
	SAVE_NVGPRS(r1)
199 200
	mfcr	r5
	std	r5,_CCR(r1)
201 202
	std	r1,PACAR1(r13)

203 204 205 206 207 208 209 210
BEGIN_FTR_SECTION
	/*
	 * POWER9 does not require real mode to stop, and presently does not
	 * set hwthread_state for KVM (threads don't share MMU context), so
	 * we can remain in virtual mode for this.
	 */
	bctr
END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
211
	/*
212
	 * POWER8
213 214 215 216 217
	 * Go to real mode to do the nap, as required by the architecture.
	 * Also, we need to be in real mode before setting hwthread_state,
	 * because as soon as we do that, another thread can switch
	 * the MMU context to the guest.
	 */
218
	LOAD_REG_IMMEDIATE(r7, MSR_IDLE)
219 220
	mtmsrd	r7,0
	bctr
221

222 223 224 225
/*
 * This is the sequence required to execute idle instructions, as
 * specified in ISA v2.07 (and earlier). MSR[IR] and MSR[DR] must be 0.
 */
226
#define IDLE_STATE_ENTER_SEQ_NORET(IDLE_INST)			\
227 228 229 230 231 232 233 234 235
	/* Magic NAP/SLEEP/WINKLE mode enter sequence */	\
	std	r0,0(r1);					\
	ptesync;						\
	ld	r0,0(r1);					\
236:	cmpd	cr0,r0,r0;					\
	bne	236b;						\
	IDLE_INST;


236 237
	.globl pnv_enter_arch207_idle_mode
pnv_enter_arch207_idle_mode:
238 239 240 241 242 243 244 245
#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
	/* Tell KVM we're entering idle */
	li	r4,KVM_HWTHREAD_IN_IDLE
	/******************************************************/
	/*  N O T E   W E L L    ! ! !    N O T E   W E L L   */
	/* The following store to HSTATE_HWTHREAD_STATE(r13)  */
	/* MUST occur in real mode, i.e. with the MMU off,    */
	/* and the MMU must stay off until we clear this flag */
246 247
	/* and test HSTATE_HWTHREAD_REQ(r13) in               */
	/* pnv_powersave_wakeup in this file.                 */
248 249 250 251 252 253 254 255 256 257
	/* The reason is that another thread can switch the   */
	/* MMU to a guest context whenever this flag is set   */
	/* to KVM_HWTHREAD_IN_IDLE, and if the MMU was on,    */
	/* that would potentially cause this thread to start  */
	/* executing instructions from guest memory in        */
	/* hypervisor mode, leading to a host crash or data   */
	/* corruption, or worse.                              */
	/******************************************************/
	stb	r4,HSTATE_HWTHREAD_STATE(r13)
#endif
258
	stb	r3,PACA_THREAD_IDLE_STATE(r13)
259 260
	cmpwi	cr3,r3,PNV_THREAD_SLEEP
	bge	cr3,2f
261
	IDLE_STATE_ENTER_SEQ_NORET(PPC_NAP)
262
	/* No return */
263 264 265 266
2:
	/* Sleep or winkle */
	lbz	r7,PACA_THREAD_MASK(r13)
	ld	r14,PACA_CORE_IDLE_STATE_PTR(r13)
267 268 269 270
	li	r5,0
	beq	cr3,3f
	lis	r5,PNV_CORE_IDLE_WINKLE_COUNT@h
3:
271 272
lwarx_loop1:
	lwarx	r15,0,r14
273

274 275
	andis.	r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
	bnel-	core_idle_lock_held
276

277
	add	r15,r15,r5			/* Add if winkle */
278 279
	andc	r15,r15,r7			/* Clear thread bit */

280
	andi.	r9,r15,PNV_CORE_IDLE_THREAD_BITS
281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297

/*
 * If cr0 = 0, then current thread is the last thread of the core entering
 * sleep. Last thread needs to execute the hardware bug workaround code if
 * required by the platform.
 * Make the workaround call unconditionally here. The below branch call is
 * patched out when the idle states are discovered if the platform does not
 * require it.
 */
.global pnv_fastsleep_workaround_at_entry
pnv_fastsleep_workaround_at_entry:
	beq	fastsleep_workaround_at_entry

	stwcx.	r15,0,r14
	bne-	lwarx_loop1
	isync

298 299
common_enter: /* common code for all the threads entering sleep or winkle */
	bgt	cr3,enter_winkle
300
	IDLE_STATE_ENTER_SEQ_NORET(PPC_SLEEP)
301 302

fastsleep_workaround_at_entry:
303
	oris	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
304 305 306 307 308 309 310
	stwcx.	r15,0,r14
	bne-	lwarx_loop1
	isync

	/* Fast sleep workaround */
	li	r3,1
	li	r4,1
311
	bl	opal_config_cpu_idle_state
312

313 314
	/* Unlock */
	xoris	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
315
	lwsync
316
	stw	r15,0(r14)
317 318
	b	common_enter

319
enter_winkle:
320 321
	bl	save_sprs_to_stack

322
	IDLE_STATE_ENTER_SEQ_NORET(PPC_WINKLE)
323

324
/*
325
 * r3 - PSSCR value corresponding to the requested stop state.
326
 */
327 328 329 330 331
power_enter_stop:
/*
 * Check if we are executing the lite variant with ESL=EC=0
 */
	andis.   r4,r3,PSSCR_EC_ESL_MASK_SHIFTED
332
	clrldi   r3,r3,60 /* r3 = Bits[60:63] = Requested Level (RL) */
333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352
	bne	 .Lhandle_esl_ec_set
	PPC_STOP
	li	r3,0  /* Since we didn't lose state, return 0 */
	std	r3, PACA_REQ_PSSCR(r13)

	/*
	 * pnv_wakeup_noloss() expects r12 to contain the SRR1 value so
	 * it can determine if the wakeup reason is an HMI in
	 * CHECK_HMI_INTERRUPT.
	 *
	 * However, when we wakeup with ESL=0, SRR1 will not contain the wakeup
	 * reason, so there is no point setting r12 to SRR1.
	 *
	 * Further, we clear r12 here, so that we don't accidentally enter the
	 * HMI in pnv_wakeup_noloss() if the value of r12[42:45] == WAKE_HMI.
	 */
	li	r12, 0
	b 	pnv_wakeup_noloss

.Lhandle_esl_ec_set:
353
BEGIN_FTR_SECTION
354
	/*
355 356
	 * POWER9 DD2.0 or earlier can incorrectly set PMAO when waking up after
	 * a state-loss idle. Saving and restoring MMCR0 over idle is a
357 358 359 360
	 * workaround.
	 */
	mfspr	r4,SPRN_MMCR0
	std	r4,_MMCR0(r1)
361
END_FTR_SECTION_IFCLR(CPU_FTR_POWER9_DD2_1)
362

363 364 365
/*
 * Check if the requested state is a deep idle state.
 */
366
	LOAD_REG_ADDRBASE(r5,pnv_first_deep_stop_state)
367 368
	ld	r4,ADDROFF(pnv_first_deep_stop_state)(r5)
	cmpd	r3,r4
369
	bge	.Lhandle_deep_stop
370 371
	PPC_STOP	/* Does not return (system reset interrupt) */

372
.Lhandle_deep_stop:
373 374 375 376 377 378 379 380 381 382
/*
 * Entering deep idle state.
 * Clear thread bit in PACA_CORE_IDLE_STATE, save SPRs to
 * stack and enter stop
 */
	lbz     r7,PACA_THREAD_MASK(r13)
	ld      r14,PACA_CORE_IDLE_STATE_PTR(r13)

lwarx_loop_stop:
	lwarx   r15,0,r14
383 384
	andis.	r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
	bnel-	core_idle_lock_held
385 386 387 388 389 390 391 392
	andc    r15,r15,r7                      /* Clear thread bit */

	stwcx.  r15,0,r14
	bne-    lwarx_loop_stop
	isync

	bl	save_sprs_to_stack

393
	PPC_STOP	/* Does not return (system reset interrupt) */
394

395 396 397 398 399
/*
 * Entered with MSR[EE]=0 and no soft-masked interrupts pending.
 * r3 contains desired idle state (PNV_THREAD_NAP/SLEEP/WINKLE).
 */
_GLOBAL(power7_idle_insn)
400
	/* Now check if user or arch enabled NAP mode */
401
	LOAD_REG_ADDR(r4, pnv_enter_arch207_idle_mode)
402
	b	pnv_powersave_common
403

404 405
#define CHECK_HMI_INTERRUPT						\
BEGIN_FTR_SECTION_NESTED(66);						\
406
	rlwinm	r0,r12,45-31,0xf;  /* extract wake reason field (P8) */	\
407
FTR_SECTION_ELSE_NESTED(66);						\
408
	rlwinm	r0,r12,45-31,0xe;  /* P7 wake reason field is 3 bits */	\
409 410
ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_ARCH_207S, 66);		\
	cmpwi	r0,0xa;			/* Hypervisor maintenance ? */	\
411
	bne+	20f;							\
412 413 414 415
	/* Invoke opal call to handle hmi */				\
	ld	r2,PACATOC(r13);					\
	ld	r1,PACAR1(r13);						\
	std	r3,ORIG_GPR3(r1);	/* Save original r3 */		\
416 417 418
	li	r3,0;			/* NULL argument */		\
	bl	hmi_exception_realmode;					\
	nop;								\
419 420 421
	ld	r3,ORIG_GPR3(r1);	/* Restore original r3 */	\
20:	nop;

422 423 424
/*
 * Entered with MSR[EE]=0 and no soft-masked interrupts pending.
 * r3 contains desired PSSCR register value.
425 426 427
 *
 * Offline (CPU unplug) case also must notify KVM that the CPU is
 * idle.
428 429 430
 */
_GLOBAL(power9_offline_stop)
#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
431 432 433 434 435 436 437
	/*
	 * Tell KVM we're entering idle.
	 * This does not have to be done in real mode because the P9 MMU
	 * is independent per-thread. Some steppings share radix/hash mode
	 * between threads, but in that case KVM has a barrier sync in real
	 * mode before and after switching between radix and hash.
	 */
438 439 440
	li	r4,KVM_HWTHREAD_IN_IDLE
	stb	r4,HSTATE_HWTHREAD_STATE(r13)
#endif
441
	/* fall through */
442

443
_GLOBAL(power9_idle_stop)
444
	std	r3, PACA_REQ_PSSCR(r13)
445 446
#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
BEGIN_FTR_SECTION
447 448 449
	sync
	lwz	r5, PACA_DONT_STOP(r13)
	cmpwi	r5, 0
450
	bne	1f
451
END_FTR_SECTION_IFSET(CPU_FTR_P9_TM_XER_SO_BUG)
452
#endif
453 454
	mtspr 	SPRN_PSSCR,r3
	LOAD_REG_ADDR(r4,power_enter_stop)
455 456
	b	pnv_powersave_common
	/* No return */
457
#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
458
1:
459 460 461 462 463 464 465 466
	/*
	 * We get here when TM / thread reconfiguration bug workaround
	 * code wants to get the CPU into SMT4 mode, and therefore
	 * we are being asked not to stop.
	 */
	li	r3, 0
	std	r3, PACA_REQ_PSSCR(r13)
	blr		/* return 0 for wakeup cause / SRR1 value */
467
#endif
468

469
/*
470 471 472 473 474 475 476 477 478 479 480
 * On waking up from stop 0,1,2 with ESL=1 on POWER9 DD1,
 * HSPRG0 will be set to the HSPRG0 value of one of the
 * threads in this core. Thus the value we have in r13
 * may not be this thread's paca pointer.
 *
 * Fortunately, the TIR remains invariant. Since this thread's
 * paca pointer is recorded in all its sibling's paca, we can
 * correctly recover this thread's paca pointer if we
 * know the index of this thread in the core.
 *
 * This index can be obtained from the TIR.
481
 *
482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502
 * i.e, thread's position in the core = TIR.
 * If this value is i, then this thread's paca is
 * paca->thread_sibling_pacas[i].
 */
power9_dd1_recover_paca:
	mfspr	r4, SPRN_TIR
	/*
	 * Since each entry in thread_sibling_pacas is 8 bytes
	 * we need to left-shift by 3 bits. Thus r4 = i * 8
	 */
	sldi	r4, r4, 3
	/* Get &paca->thread_sibling_pacas[0] in r5 */
	ld	r5, PACA_SIBLING_PACA_PTRS(r13)
	/* Load paca->thread_sibling_pacas[i] into r13 */
	ldx	r13, r4, r5
	SET_PACA(r13)
	/*
	 * Indicate that we have lost NVGPR state
	 * which needs to be restored from the stack.
	 */
	li	r3, 1
503
	stb	r3,PACA_NAPSTATELOST(r13)
504 505
	blr

506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522
/*
 * Called from machine check handler for powersave wakeups.
 * Low level machine check processing has already been done. Now just
 * go through the wake up path to get everything in order.
 *
 * r3 - The original SRR1 value.
 * Original SRR[01] have been clobbered.
 * MSR_RI is clear.
 */
.global pnv_powersave_wakeup_mce
pnv_powersave_wakeup_mce:
	/* Set cr3 for pnv_powersave_wakeup */
	rlwinm	r11,r3,47-31,30,31
	cmpwi	cr3,r11,2

	/*
	 * Now put the original SRR1 with SRR1_WAKEMCE_RESVD as the wake
523
	 * reason into r12, which allows reuse of the system reset wakeup
524 525
	 * code without being mistaken for another type of wakeup.
	 */
526
	oris	r12,r3,SRR1_WAKEMCE_RESVD@h
527 528 529

	b	pnv_powersave_wakeup

530 531
/*
 * Called from reset vector for powersave wakeups.
532
 * cr3 - set to gt if waking up with partial/complete hypervisor state loss
533
 * r12 - SRR1
534
 */
535 536
.global pnv_powersave_wakeup
pnv_powersave_wakeup:
537 538
	ld	r2, PACATOC(r13)

539
BEGIN_FTR_SECTION
540 541 542
BEGIN_FTR_SECTION_NESTED(70)
	bl	power9_dd1_recover_paca
END_FTR_SECTION_NESTED_IFSET(CPU_FTR_POWER9_DD1, 70)
543 544 545 546
	bl	pnv_restore_hyp_resource_arch300
FTR_SECTION_ELSE
	bl	pnv_restore_hyp_resource_arch207
ALT_FTR_SECTION_END_IFSET(CPU_FTR_ARCH_300)
547 548 549 550

	li	r0,PNV_THREAD_RUNNING
	stb	r0,PACA_THREAD_IDLE_STATE(r13)	/* Clear thread state */

551 552
	mr	r3,r12

553
#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
554 555
	lbz	r0,HSTATE_HWTHREAD_STATE(r13)
	cmpwi	r0,KVM_HWTHREAD_IN_KERNEL
556
	beq	0f
557 558 559 560
	li	r0,KVM_HWTHREAD_IN_KERNEL
	stb	r0,HSTATE_HWTHREAD_STATE(r13)
	/* Order setting hwthread_state vs. testing hwthread_req */
	sync
561
0:	lbz	r0,HSTATE_HWTHREAD_REQ(r13)
562 563 564 565
	cmpwi	r0,0
	beq	1f
	b	kvm_start_guest
1:
566 567 568 569 570 571
#endif

	/* Return SRR1 from power7_nap() */
	blt	cr3,pnv_wakeup_noloss
	b	pnv_wakeup_loss

572
/*
573 574
 * Check whether we have woken up with hypervisor state loss.
 * If yes, restore hypervisor state and return back to link.
575 576 577
 *
 * cr3 - set to gt if waking up with partial/complete hypervisor state loss
 */
578
pnv_restore_hyp_resource_arch300:
579 580
	/*
	 * Workaround for POWER9, if we lost resources, the ERAT
581
	 * might have been mixed up and needs flushing. We also need
582 583
	 * to reload MMCR0 (see comment above). We also need to set
	 * then clear bit 60 in MMCRA to ensure the PMU starts running.
584 585
	 */
	blt	cr3,1f
586
BEGIN_FTR_SECTION
587
	PPC_INVALIDATE_ERAT
588
	ld	r1,PACAR1(r13)
589 590
	ld	r4,_MMCR0(r1)
	mtspr	SPRN_MMCR0,r4
591
END_FTR_SECTION_IFCLR(CPU_FTR_POWER9_DD2_1)
592 593 594 595 596
	mfspr	r4,SPRN_MMCRA
	ori	r4,r4,(1 << (63-60))
	mtspr	SPRN_MMCRA,r4
	xori	r4,r4,(1 << (63-60))
	mtspr	SPRN_MMCRA,r4
597
1:
598 599 600 601 602 603 604
	/*
	 * POWER ISA 3. Use PSSCR to determine if we
	 * are waking up from deep idle state
	 */
	LOAD_REG_ADDRBASE(r5,pnv_first_deep_stop_state)
	ld	r4,ADDROFF(pnv_first_deep_stop_state)(r5)

605 606 607 608 609 610 611 612 613
BEGIN_FTR_SECTION_NESTED(71)
	/*
	 * Assume that we are waking up from the state
	 * same as the Requested Level (RL) in the PSSCR
	 * which are Bits 60-63
	 */
	ld	r5,PACA_REQ_PSSCR(r13)
	rldicl  r5,r5,0,60
FTR_SECTION_ELSE_NESTED(71)
614
	/*
615 616 617
	 * 0-3 bits correspond to Power-Saving Level Status
	 * which indicates the idle state we are waking up from
	 */
618
	mfspr	r5, SPRN_PSSCR
619
	rldicl  r5,r5,4,60
620
ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_POWER9_DD1, 71)
621 622
	li	r0, 0		/* clear requested_psscr to say we're awake */
	std	r0, PACA_REQ_PSSCR(r13)
623
	cmpd	cr4,r5,r4
624
	bge	cr4,pnv_wakeup_tb_loss /* returns to caller */
625

626
	blr	/* Waking up without hypervisor state loss. */
627

628 629
/* Same calling convention as arch300 */
pnv_restore_hyp_resource_arch207:
630 631
	/*
	 * POWER ISA 2.07 or less.
632
	 * Check if we slept with sleep or winkle.
633
	 */
634 635 636
	lbz	r4,PACA_THREAD_IDLE_STATE(r13)
	cmpwi	cr2,r4,PNV_THREAD_NAP
	bgt	cr2,pnv_wakeup_tb_loss	/* Either sleep or Winkle */
637 638 639 640 641 642 643 644

	/*
	 * We fall through here if PACA_THREAD_IDLE_STATE shows we are waking
	 * up from nap. At this stage CR3 shouldn't contains 'gt' since that
	 * indicates we are waking with hypervisor state loss from nap.
	 */
	bgt	cr3,.

645
	blr	/* Waking up without hypervisor state loss */
646

647 648 649 650 651 652 653 654
/*
 * Called if waking up from idle state which can cause either partial or
 * complete hyp state loss.
 * In POWER8, called if waking up from fastsleep or winkle
 * In POWER9, called if waking up from stop state >= pnv_first_deep_stop_state
 *
 * r13 - PACA
 * cr3 - gt if waking up with partial/complete hypervisor state loss
655 656
 *
 * If ISA300:
657
 * cr4 - gt or eq if waking up from complete hypervisor state loss.
658 659 660
 *
 * If ISA207:
 * r4 - PACA_THREAD_IDLE_STATE
661
 */
662
pnv_wakeup_tb_loss:
663
	ld	r1,PACAR1(r13)
664
	/*
665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681
	 * Before entering any idle state, the NVGPRs are saved in the stack.
	 * If there was a state loss, or PACA_NAPSTATELOST was set, then the
	 * NVGPRs are restored. If we are here, it is likely that state is lost,
	 * but not guaranteed -- neither ISA207 nor ISA300 tests to reach
	 * here are the same as the test to restore NVGPRS:
	 * PACA_THREAD_IDLE_STATE test for ISA207, PSSCR test for ISA300,
	 * and SRR1 test for restoring NVGPRs.
	 *
	 * We are about to clobber NVGPRs now, so set NAPSTATELOST to
	 * guarantee they will always be restored. This might be tightened
	 * with careful reading of specs (particularly for ISA300) but this
	 * is already a slow wakeup path and it's simpler to be safe.
	 */
	li	r0,1
	stb	r0,PACA_NAPSTATELOST(r13)

	/*
682
	 *
683
	 * Save SRR1 and LR in NVGPRs as they might be clobbered in
684
	 * opal_call() (called in CHECK_HMI_INTERRUPT). SRR1 is required
685 686 687
	 * to determine the wakeup reason if we branch to kvm_start_guest. LR
	 * is required to return back to reset vector after hypervisor state
	 * restore is complete.
688
	 */
689
	mr	r19,r12
690
	mr	r18,r4
691
	mflr	r17
692 693 694
BEGIN_FTR_SECTION
	CHECK_HMI_INTERRUPT
END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
695 696

	ld	r14,PACA_CORE_IDLE_STATE_PTR(r13)
697 698
	lbz	r7,PACA_THREAD_MASK(r13)

699
	/*
700 701
	 * Take the core lock to synchronize against other threads.
	 *
702 703 704 705 706 707 708
	 * Lock bit is set in one of the 2 cases-
	 * a. In the sleep/winkle enter path, the last thread is executing
	 * fastsleep workaround code.
	 * b. In the wake up path, another thread is executing fastsleep
	 * workaround undo code or resyncing timebase or restoring context
	 * In either case loop until the lock bit is cleared.
	 */
709 710 711
1:
	lwarx	r15,0,r14
	andis.	r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
712
	bnel-	core_idle_lock_held
713 714 715 716
	oris	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
	stwcx.	r15,0,r14
	bne-	1b
	isync
717

718 719
	andi.	r9,r15,PNV_CORE_IDLE_THREAD_BITS
	cmpwi	cr2,r9,0
720 721 722

	/*
	 * At this stage
723 724
	 * cr2 - eq if first thread to wakeup in core
	 * cr3-  gt if waking up with partial/complete hypervisor state loss
725
	 * ISA300:
726
	 * cr4 - gt or eq if waking up from complete hypervisor state loss.
727 728
	 */

729
BEGIN_FTR_SECTION
730 731 732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795
	/*
	 * Were we in winkle?
	 * If yes, check if all threads were in winkle, decrement our
	 * winkle count, set all thread winkle bits if all were in winkle.
	 * Check if our thread has a winkle bit set, and set cr4 accordingly
	 * (to match ISA300, above). Pseudo-code for core idle state
	 * transitions for ISA207 is as follows (everything happens atomically
	 * due to store conditional and/or lock bit):
	 *
	 * nap_idle() { }
	 * nap_wake() { }
	 *
	 * sleep_idle()
	 * {
	 *	core_idle_state &= ~thread_in_core
	 * }
	 *
	 * sleep_wake()
	 * {
	 *     bool first_in_core, first_in_subcore;
	 *
	 *     first_in_core = (core_idle_state & IDLE_THREAD_BITS) == 0;
	 *     first_in_subcore = (core_idle_state & SUBCORE_SIBLING_MASK) == 0;
	 *
	 *     core_idle_state |= thread_in_core;
	 * }
	 *
	 * winkle_idle()
	 * {
	 *	core_idle_state &= ~thread_in_core;
	 *	core_idle_state += 1 << WINKLE_COUNT_SHIFT;
	 * }
	 *
	 * winkle_wake()
	 * {
	 *     bool first_in_core, first_in_subcore, winkle_state_lost;
	 *
	 *     first_in_core = (core_idle_state & IDLE_THREAD_BITS) == 0;
	 *     first_in_subcore = (core_idle_state & SUBCORE_SIBLING_MASK) == 0;
	 *
	 *     core_idle_state |= thread_in_core;
	 *
	 *     if ((core_idle_state & WINKLE_MASK) == (8 << WINKLE_COUNT_SIHFT))
	 *         core_idle_state |= THREAD_WINKLE_BITS;
	 *     core_idle_state -= 1 << WINKLE_COUNT_SHIFT;
	 *
	 *     winkle_state_lost = core_idle_state &
	 *				(thread_in_core << WINKLE_THREAD_SHIFT);
	 *     core_idle_state &= ~(thread_in_core << WINKLE_THREAD_SHIFT);
	 * }
	 *
	 */
	cmpwi	r18,PNV_THREAD_WINKLE
	bne	2f
	andis.	r9,r15,PNV_CORE_IDLE_WINKLE_COUNT_ALL_BIT@h
	subis	r15,r15,PNV_CORE_IDLE_WINKLE_COUNT@h
	beq	2f
	ori	r15,r15,PNV_CORE_IDLE_THREAD_WINKLE_BITS /* all were winkle */
2:
	/* Shift thread bit to winkle mask, then test if this thread is set,
	 * and remove it from the winkle bits */
	slwi	r8,r7,8
	and	r8,r8,r15
	andc	r15,r15,r8
	cmpwi	cr4,r8,1 /* cr4 will be gt if our bit is set, lt if not */

796 797 798 799 800 801 802 803 804 805 806 807 808 809 810
	lbz	r4,PACA_SUBCORE_SIBLING_MASK(r13)
	and	r4,r4,r15
	cmpwi	r4,0	/* Check if first in subcore */

	or	r15,r15,r7		/* Set thread bit */
	beq	first_thread_in_subcore
END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)

	or	r15,r15,r7		/* Set thread bit */
	beq	cr2,first_thread_in_core

	/* Not first thread in core or subcore to wake up */
	b	clear_lock

first_thread_in_subcore:
811 812 813 814
	/*
	 * If waking up from sleep, subcore state is not lost. Hence
	 * skip subcore state restore
	 */
815
	blt	cr4,subcore_state_restored
816 817 818 819

	/* Restore per-subcore state */
	ld      r4,_SDR1(r1)
	mtspr   SPRN_SDR1,r4
820

821 822 823 824 825 826 827 828 829 830 831 832 833 834
	ld      r4,_RPR(r1)
	mtspr   SPRN_RPR,r4
	ld	r4,_AMOR(r1)
	mtspr	SPRN_AMOR,r4

subcore_state_restored:
	/*
	 * Check if the thread is also the first thread in the core. If not,
	 * skip to clear_lock.
	 */
	bne	cr2,clear_lock

first_thread_in_core:

835
	/*
836 837
	 * First thread in the core waking up from any state which can cause
	 * partial or complete hypervisor state loss. It needs to
838 839
	 * call the fastsleep workaround code if the platform requires it.
	 * Call it unconditionally here. The below branch instruction will
840 841 842
	 * be patched out if the platform does not have fastsleep or does not
	 * require the workaround. Patching will be performed during the
	 * discovery of idle-states.
843 844 845 846 847 848
	 */
.global pnv_fastsleep_workaround_at_exit
pnv_fastsleep_workaround_at_exit:
	b	fastsleep_workaround_at_exit

timebase_resync:
849 850 851 852
	/*
	 * Use cr3 which indicates that we are waking up with atleast partial
	 * hypervisor state loss to determine if TIMEBASE RESYNC is needed.
	 */
853
	ble	cr3,.Ltb_resynced
854
	/* Time base re-sync */
855
	bl	opal_resync_timebase;
856
	/*
857 858
	 * If waking up from sleep (POWER8), per core state
	 * is not lost, skip to clear_lock.
859
	 */
860
.Ltb_resynced:
861
	blt	cr4,clear_lock
862

863 864 865 866 867 868 869 870 871 872
	/*
	 * First thread in the core to wake up and its waking up with
	 * complete hypervisor state loss. Restore per core hypervisor
	 * state.
	 */
BEGIN_FTR_SECTION
	ld	r4,_PTCR(r1)
	mtspr	SPRN_PTCR,r4
	ld	r4,_RPR(r1)
	mtspr	SPRN_RPR,r4
873 874
	ld	r4,_AMOR(r1)
	mtspr	SPRN_AMOR,r4
875 876
END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)

877 878 879 880 881
	ld	r4,_TSCR(r1)
	mtspr	SPRN_TSCR,r4
	ld	r4,_WORC(r1)
	mtspr	SPRN_WORC,r4

882
clear_lock:
883
	xoris	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
884 885 886 887
	lwsync
	stw	r15,0(r14)

common_exit:
888 889 890 891 892 893
	/*
	 * Common to all threads.
	 *
	 * If waking up from sleep, hypervisor state is not lost. Hence
	 * skip hypervisor state restore.
	 */
894
	blt	cr4,hypervisor_state_restored
895 896 897

	/* Waking up from winkle */

898 899
BEGIN_MMU_FTR_SECTION
	b	no_segments
900
END_MMU_FTR_SECTION_IFSET(MMU_FTR_TYPE_RADIX)
901 902 903 904 905 906 907 908 909 910 911 912 913
	/* Restore SLB  from PACA */
	ld	r8,PACA_SLBSHADOWPTR(r13)

	.rept	SLB_NUM_BOLTED
	li	r3, SLBSHADOW_SAVEAREA
	LDX_BE	r5, r8, r3
	addi	r3, r3, 8
	LDX_BE	r6, r8, r3
	andis.	r7,r5,SLB_ESID_V@h
	beq	1f
	slbmte	r6,r5
1:	addi	r8,r8,16
	.endr
914 915 916
no_segments:

	/* Restore per thread state */
917 918 919 920 921 922 923 924 925 926

	ld	r4,_SPURR(r1)
	mtspr	SPRN_SPURR,r4
	ld	r4,_PURR(r1)
	mtspr	SPRN_PURR,r4
	ld	r4,_DSCR(r1)
	mtspr	SPRN_DSCR,r4
	ld	r4,_WORT(r1)
	mtspr	SPRN_WORT,r4

927 928 929 930 931 932 933 934 935 936
	/* Call cur_cpu_spec->cpu_restore() */
	LOAD_REG_ADDR(r4, cur_cpu_spec)
	ld	r4,0(r4)
	ld	r12,CPU_SPEC_RESTORE(r4)
#ifdef PPC64_ELF_ABI_v1
	ld	r12,0(r12)
#endif
	mtctr	r12
	bctrl

937 938 939 940 941 942 943 944
/*
 * On POWER9, we can come here on wakeup from a cpuidle stop state.
 * Hence restore the additional SPRs to the saved value.
 *
 * On POWER8, we come here only on winkle. Since winkle is used
 * only in the case of CPU-Hotplug, we don't need to restore
 * the additional SPRs.
 */
945
BEGIN_FTR_SECTION
946
	bl 	power9_restore_additional_sprs
947
END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
948 949
hypervisor_state_restored:

950
	mr	r12,r19
951
	mtlr	r17
952
	blr		/* return to pnv_powersave_wakeup */
953

954 955 956
fastsleep_workaround_at_exit:
	li	r3,1
	li	r4,0
957
	bl	opal_config_cpu_idle_state
958 959
	b	timebase_resync

960 961 962
/*
 * R3 here contains the value that will be returned to the caller
 * of power7_nap.
963
 * R12 contains SRR1 for CHECK_HMI_INTERRUPT.
964
 */
965 966
.global pnv_wakeup_loss
pnv_wakeup_loss:
967
	ld	r1,PACAR1(r13)
968 969 970
BEGIN_FTR_SECTION
	CHECK_HMI_INTERRUPT
END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
971 972
	REST_NVGPRS(r1)
	REST_GPR(2, r1)
973 974
	ld	r4,PACAKMSR(r13)
	ld	r5,_LINK(r1)
975
	ld	r6,_CCR(r1)
976
	addi	r1,r1,INT_FRAME_SIZE
977
	mtlr	r5
978
	mtcr	r6
979 980
	mtmsrd	r4
	blr
981

982 983 984
/*
 * R3 here contains the value that will be returned to the caller
 * of power7_nap.
985
 * R12 contains SRR1 for CHECK_HMI_INTERRUPT.
986
 */
987
pnv_wakeup_noloss:
988 989
	lbz	r0,PACA_NAPSTATELOST(r13)
	cmpwi	r0,0
990
	bne	pnv_wakeup_loss
991
	ld	r1,PACAR1(r13)
992 993 994
BEGIN_FTR_SECTION
	CHECK_HMI_INTERRUPT
END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
995
	ld	r4,PACAKMSR(r13)
996
	ld	r5,_NIP(r1)
997
	ld	r6,_CCR(r1)
998
	addi	r1,r1,INT_FRAME_SIZE
999
	mtlr	r5
1000
	mtcr	r6
1001 1002
	mtmsrd	r4
	blr