Linux Audio

Check our new training course

Loading...
v4.17
   1/*
   2 *  This file contains idle entry/exit functions for POWER7,
   3 *  POWER8 and POWER9 CPUs.
   4 *
   5 *  This program is free software; you can redistribute it and/or
   6 *  modify it under the terms of the GNU General Public License
   7 *  as published by the Free Software Foundation; either version
   8 *  2 of the License, or (at your option) any later version.
   9 */
  10
  11#include <linux/threads.h>
  12#include <asm/processor.h>
  13#include <asm/page.h>
  14#include <asm/cputable.h>
  15#include <asm/thread_info.h>
  16#include <asm/ppc_asm.h>
  17#include <asm/asm-offsets.h>
  18#include <asm/ppc-opcode.h>
  19#include <asm/hw_irq.h>
  20#include <asm/kvm_book3s_asm.h>
  21#include <asm/opal.h>
  22#include <asm/cpuidle.h>
  23#include <asm/exception-64s.h>
  24#include <asm/book3s/64/mmu-hash.h>
  25#include <asm/mmu.h>
  26
  27#undef DEBUG
  28
  29/*
  30 * Use unused space in the interrupt stack to save and restore
  31 * registers for winkle support.
     *
     * Each name below aliases one GPR slot of the stack frame addressed off
     * r1. _SDR1 and _PTCR deliberately share the GPR3 slot: save_sprs_to_stack
     * stores only one of the two, selected by CPU_FTR_ARCH_300.
  32 */
  33#define _MMCR0	GPR0
  34#define _SDR1	GPR3
  35#define _PTCR	GPR3
  36#define _RPR	GPR4
  37#define _SPURR	GPR5
  38#define _PURR	GPR6
  39#define _TSCR	GPR7
  40#define _DSCR	GPR8
  41#define _AMOR	GPR9
  42#define _WORT	GPR10
  43#define _WORC	GPR11
  44#define _LPCR	GPR12
  45
  46#define PSSCR_EC_ESL_MASK_SHIFTED          ((PSSCR_EC | PSSCR_ESL) >> 16)
    /*
     * PSSCR_EC_ESL_MASK_SHIFTED is the EC|ESL mask shifted down by 16 so that
     * it fits the 16-bit immediate of andis. (see power_enter_stop). The
     * expansion is fully parenthesized so that it stays a single term
     * wherever it is substituted.
     */
 
 
  47
  48	.text
  49
  50/*
  51 * Used by threads before entering deep idle states. Saves SPRs
  52 * in interrupt stack frame
     *
     * In:       r1 - stack frame that receives the values (the _XXX slots)
     * Clobbers: r3 here; the POWER9 tail it falls through into also uses r4
     * Called with bl. When CPU_FTR_ARCH_300 is clear it returns through the
     * blr at the end of this block; otherwise it falls through into
     * power9_save_additional_sprs, which does the blr.
  53 */
  54save_sprs_to_stack:
  55	/*
  56	 * Note: every register, i.e. per-core, per-subcore or per-thread, is
  57	 * saved here since any thread in the core might wake up first
  58	 */
  59BEGIN_FTR_SECTION
 
 
  60	/*
  61	 * Note - SDR1 is dropped in Power ISA v3. Hence SDR1 is not saved
  62	 * here; PTCR and LPCR are saved instead.
  63	 */
  64	mfspr	r3,SPRN_PTCR
  65	std	r3,_PTCR(r1)
  66	mfspr	r3,SPRN_LPCR
  67	std	r3,_LPCR(r1)
  68FTR_SECTION_ELSE
  69	mfspr	r3,SPRN_SDR1
  70	std	r3,_SDR1(r1)
  71ALT_FTR_SECTION_END_IFSET(CPU_FTR_ARCH_300)
  72	mfspr	r3,SPRN_RPR
  73	std	r3,_RPR(r1)
  74	mfspr	r3,SPRN_SPURR
  75	std	r3,_SPURR(r1)
  76	mfspr	r3,SPRN_PURR
  77	std	r3,_PURR(r1)
  78	mfspr	r3,SPRN_TSCR
  79	std	r3,_TSCR(r1)
  80	mfspr	r3,SPRN_DSCR
  81	std	r3,_DSCR(r1)
  82	mfspr	r3,SPRN_AMOR
  83	std	r3,_AMOR(r1)
  84	mfspr	r3,SPRN_WORT
  85	std	r3,_WORT(r1)
  86	mfspr	r3,SPRN_WORC
  87	std	r3,_WORC(r1)
  88/*
  89 * On POWER9, there are idle states such as stop4, invoked via cpuidle,
  90 * that lose hypervisor resources. In such cases, we need to save
  91 * additional SPRs before entering those idle states so that they can
  92 * be restored to their older values on wakeup from the idle state.
  93 *
  94 * On POWER8, the only such deep idle state is winkle which is used
  95 * only in the context of CPU-Hotplug, where these additional SPRs are
  96 * reinitialized to a sane value. Hence there is no need to save/restore
  97 * these SPRs.
  98 */
  99BEGIN_FTR_SECTION
 100	blr
 101END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
 102
 103power9_save_additional_sprs:
    	/*
    	 * Save the extra POWER9 SPRs: PID, LDBAR, FSCR, HFSCR, MMCRA, MMCR1
    	 * and MMCR2 go to the STOP_* slots addressed off r13; MMCR0 goes to
    	 * the _MMCR0 slot of the frame at r1. Entered by fall-through from
    	 * save_sprs_to_stack; power9_restore_additional_sprs reloads the
    	 * same slots. Clobbers r3 and r4.
    	 */
 104	mfspr	r3, SPRN_PID
 105	mfspr	r4, SPRN_LDBAR
 106	std	r3, STOP_PID(r13)
 107	std	r4, STOP_LDBAR(r13)
 108
 109	mfspr	r3, SPRN_FSCR
 110	mfspr	r4, SPRN_HFSCR
 111	std	r3, STOP_FSCR(r13)
 112	std	r4, STOP_HFSCR(r13)
 113
 114	mfspr	r3, SPRN_MMCRA
 115	mfspr	r4, SPRN_MMCR0
 116	std	r3, STOP_MMCRA(r13)
 117	std	r4, _MMCR0(r1)
 118
 119	mfspr	r3, SPRN_MMCR1
 120	mfspr	r4, SPRN_MMCR2
 121	std	r3, STOP_MMCR1(r13)
 122	std	r4, STOP_MMCR2(r13)
 123	blr
 124
 125power9_restore_additional_sprs:
    	/*
    	 * Reload the SPRs saved on the POWER9 save path: LPCR and MMCR0 come
    	 * from the _LPCR/_MMCR0 slots of the frame at r1; PID, LDBAR, FSCR,
    	 * HFSCR, MMCRA, MMCR1 and MMCR2 come from the STOP_* slots addressed
    	 * off r13. Called with bl from common_exit inside a
    	 * CPU_FTR_ARCH_300 feature section. Clobbers r3 and r4.
    	 */
 126	ld	r3,_LPCR(r1)
 127	ld	r4, STOP_PID(r13)
 128	mtspr	SPRN_LPCR,r3
 129	mtspr	SPRN_PID, r4
 130
 131	ld	r3, STOP_LDBAR(r13)
 132	ld	r4, STOP_FSCR(r13)
 133	mtspr	SPRN_LDBAR, r3
 134	mtspr	SPRN_FSCR, r4
 135
 136	ld	r3, STOP_HFSCR(r13)
 137	ld	r4, STOP_MMCRA(r13)
 138	mtspr	SPRN_HFSCR, r3
 139	mtspr	SPRN_MMCRA, r4
 140
 141	ld	r3, _MMCR0(r1)
 142	ld	r4, STOP_MMCR1(r13)
 143	mtspr	SPRN_MMCR0, r3
 144	mtspr	SPRN_MMCR1, r4
 145
 146	ld	r3, STOP_MMCR2(r13)
 147	mtspr	SPRN_MMCR2, r3
 148	blr
 149
 150/*
 151 * Used by threads when the lock bit of core_idle_state is set.
 152 * Threads will spin in HMT_LOW until the lock bit is cleared.
 153 * r14 - pointer to core_idle_state
 154 * r15 - used to load contents of core_idle_state
 155 * r9  - used as a temporary variable
     *
     * Callers in this file reach this routine with bnel right after their
     * own lwarx, so the blr resumes them just after that branch. On return
     * r15 holds the value obtained by the lwarx below (lock bit observed
     * clear), ready for the caller's stwcx. Clobbers cr0.
 156 */
 157
 158core_idle_lock_held:
 159	HMT_LOW
 1603:	lwz	r15,0(r14)
 161	andis.	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
 162	bne	3b
 163	HMT_MEDIUM
    	/* Re-take the reservation; start over if the lock was grabbed again */
 164	lwarx	r15,0,r14
 165	andis.	r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
 166	bne-	core_idle_lock_held
 167	blr
 168
 169/*
 170 * Pass requested state in r3:
 171 *	r3 - PNV_THREAD_NAP/SLEEP/WINKLE in POWER8
 172 *	   - Requested PSSCR value in POWER9
 173 *
 174 * Address of idle handler to branch to in realmode in r4
     *
     * Builds an INT_FRAME_SIZE frame below r1, records the frame pointer in
     * PACAR1 and jumps to the handler through CTR (no return to this code).
     * The caller's LR is stored as both _LINK and _NIP: pnv_wakeup_loss
     * returns through _LINK and pnv_wakeup_noloss through _NIP.
     * Clobbers r0, r5, r7 (r7 only on the non-ARCH_300 path) and CTR.
 175 */
 176pnv_powersave_common:
 177	/* Use r3 to pass state nap/sleep/winkle */
 178	/* NAP is a state loss, we create a regs frame on the
 179	 * stack, fill it up with the state we care about and
 180	 * stick a pointer to it in PACAR1. We really only
 181	 * need to save PC, some CR bits and the NV GPRs,
 182	 * but for now an interrupt frame will do.
 183	 */
 184	mtctr	r4
 185
 186	mflr	r0
 187	std	r0,16(r1)
 188	stdu	r1,-INT_FRAME_SIZE(r1)
 189	std	r0,_LINK(r1)
 190	std	r0,_NIP(r1)
 191
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 192	/* We haven't lost state ... yet */
 193	li	r0,0
 194	stb	r0,PACA_NAPSTATELOST(r13)
 195
 196	/* Continue saving state */
 197	SAVE_GPR(2, r1)
 198	SAVE_NVGPRS(r1)
 199	mfcr	r5
 200	std	r5,_CCR(r1)
 
 201	std	r1,PACAR1(r13)
 202
 203BEGIN_FTR_SECTION
 204	/*
 205	 * POWER9 does not require real mode to stop, and presently does not
 206	 * set hwthread_state for KVM (threads don't share MMU context), so
 207	 * we can remain in virtual mode for this.
 208	 */
 209	bctr
 210END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
 211	/*
 212	 * POWER8
 213	 * Go to real mode to do the nap, as required by the architecture.
 214	 * Also, we need to be in real mode before setting hwthread_state,
 215	 * because as soon as we do that, another thread can switch
 216	 * the MMU context to the guest.
 217	 */
 218	LOAD_REG_IMMEDIATE(r7, MSR_IDLE)
 219	mtmsrd	r7,0
 220	bctr
 221
 222/*
 223 * This is the sequence required to execute idle instructions, as
 224 * specified in ISA v2.07 (and earlier). MSR[IR] and MSR[DR] must be 0.
     *
     * IDLE_INST is the idle instruction to emit last (this file passes
     * PPC_NAP, PPC_SLEEP and PPC_WINKLE). The preamble stores r0 to 0(r1),
     * issues ptesync, reloads r0 from the same doubleword and compares it
     * with itself before IDLE_INST; it uses cr0 and the local label 236.
 225 */
 226#define IDLE_STATE_ENTER_SEQ_NORET(IDLE_INST)			\
 227	/* Magic NAP/SLEEP/WINKLE mode enter sequence */	\
 228	std	r0,0(r1);					\
 229	ptesync;						\
 230	ld	r0,0(r1);					\
 231236:	cmpd	cr0,r0,r0;					\
 232	bne	236b;						\
 233	IDLE_INST;
 234
 235
 236	.globl pnv_enter_arch207_idle_mode
 237pnv_enter_arch207_idle_mode:
    	/*
    	 * ISA 2.07 idle entry, reached through CTR from pnv_powersave_common.
    	 * r3  - requested state (PNV_THREAD_NAP/SLEEP/WINKLE)
    	 * r13 - PACA
    	 * cr3 is set from comparing r3 with PNV_THREAD_SLEEP and steers the
    	 * rest of this path: lt = nap, eq = sleep, gt = winkle.
    	 * For sleep/winkle the thread's bit is cleared in core_idle_state
    	 * (r14 = pointer, r15 = value, r7 = thread mask, r5 = winkle count
    	 * increment or 0) with a lwarx/stwcx. loop before entering idle.
    	 */
 238#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
 239	/* Tell KVM we're entering idle */
 240	li	r4,KVM_HWTHREAD_IN_IDLE
 241	/******************************************************/
 242	/*  N O T E   W E L L    ! ! !    N O T E   W E L L   */
 243	/* The following store to HSTATE_HWTHREAD_STATE(r13)  */
 244	/* MUST occur in real mode, i.e. with the MMU off,    */
 245	/* and the MMU must stay off until we clear this flag */
 246	/* and test HSTATE_HWTHREAD_REQ(r13) in               */
 247	/* pnv_powersave_wakeup in this file.                 */
 248	/* The reason is that another thread can switch the   */
 249	/* MMU to a guest context whenever this flag is set   */
 250	/* to KVM_HWTHREAD_IN_IDLE, and if the MMU was on,    */
 251	/* that would potentially cause this thread to start  */
 252	/* executing instructions from guest memory in        */
 253	/* hypervisor mode, leading to a host crash or data   */
 254	/* corruption, or worse.                              */
 255	/******************************************************/
 256	stb	r4,HSTATE_HWTHREAD_STATE(r13)
 257#endif
 258	stb	r3,PACA_THREAD_IDLE_STATE(r13)
 259	cmpwi	cr3,r3,PNV_THREAD_SLEEP
 260	bge	cr3,2f
 261	IDLE_STATE_ENTER_SEQ_NORET(PPC_NAP)
 262	/* No return */
 2632:
 264	/* Sleep or winkle */
 265	lbz	r7,PACA_THREAD_MASK(r13)
 266	ld	r14,PACA_CORE_IDLE_STATE_PTR(r13)
 267	li	r5,0
 268	beq	cr3,3f
 269	lis	r5,PNV_CORE_IDLE_WINKLE_COUNT@h
 2703:
 271lwarx_loop1:
 272	lwarx	r15,0,r14
 273
 274	andis.	r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
 275	bnel-	core_idle_lock_held
 276
 277	add	r15,r15,r5			/* Add if winkle */
 278	andc	r15,r15,r7			/* Clear thread bit */
 279
 280	andi.	r9,r15,PNV_CORE_IDLE_THREAD_BITS
 281
 282/*
 283 * If cr0 = 0, then current thread is the last thread of the core entering
 284 * sleep. Last thread needs to execute the hardware bug workaround code if
 285 * required by the platform.
 286 * Make the workaround call unconditionally here. The below branch call is
 287 * patched out when the idle states are discovered if the platform does not
 288 * require it.
 289 */
 290.global pnv_fastsleep_workaround_at_entry
 291pnv_fastsleep_workaround_at_entry:
 292	beq	fastsleep_workaround_at_entry
 293
 294	stwcx.	r15,0,r14
 295	bne-	lwarx_loop1
 296	isync
 297
 298common_enter: /* common code for all the threads entering sleep or winkle */
 299	bgt	cr3,enter_winkle
 300	IDLE_STATE_ENTER_SEQ_NORET(PPC_SLEEP)
 301
 302fastsleep_workaround_at_entry:
    	/*
    	 * Taken by the last thread of the core to enter sleep/winkle (see the
    	 * branch at pnv_fastsleep_workaround_at_entry). Publishes the updated
    	 * core_idle_state with the lock bit set, calls
    	 * opal_config_cpu_idle_state with r3 = 1, r4 = 1, then drops the lock
    	 * and rejoins common_enter. r14/r15 are live across the call: the
    	 * unlock below reuses the r15 value that was stored with the lock set.
    	 */
 303	oris	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
 304	stwcx.	r15,0,r14
 305	bne-	lwarx_loop1
 306	isync
 307
 308	/* Fast sleep workaround */
 309	li	r3,1
 310	li	r4,1
 311	bl	opal_config_cpu_idle_state
 312
 313	/* Unlock: xoris flips the lock bit set above back to 0 */
 314	xoris	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
 315	lwsync
 316	stw	r15,0(r14)
 317	b	common_enter
 318
 319enter_winkle:
    	/*
    	 * Winkle entry (cr3 gt at common_enter): save the SPRs into the stack
    	 * frame first, then execute the winkle entry sequence.
    	 */
 320	bl	save_sprs_to_stack
 321
 322	IDLE_STATE_ENTER_SEQ_NORET(PPC_WINKLE)
 323
 324/*
 325 * r3 - PSSCR value corresponding to the requested stop state.
     *
     * Reached through CTR from pnv_powersave_common (power9_idle_stop loads
     * this address into r4). If neither EC nor ESL is set in r3, stop is
     * executed inline and execution continues after it; otherwise control
     * goes to .Lhandle_esl_ec_set with r3 reduced to the Requested Level.
 326 */
 327power_enter_stop:
 328/*
 329 * Check if we are executing the lite variant with ESL=EC=0
 330 */
 331	andis.   r4,r3,PSSCR_EC_ESL_MASK_SHIFTED
 332	clrldi   r3,r3,60 /* r3 = Bits[60:63] = Requested Level (RL) */
 333	bne	 .Lhandle_esl_ec_set
 334	PPC_STOP
 335	li	r3,0  /* Since we didn't lose state, return 0 */
 336	std	r3, PACA_REQ_PSSCR(r13)
 337
 338	/*
 339	 * pnv_wakeup_noloss() expects r12 to contain the SRR1 value so
 340	 * it can determine if the wakeup reason is an HMI in
 341	 * CHECK_HMI_INTERRUPT.
 342	 *
 343	 * However, when we wakeup with ESL=0, SRR1 will not contain the wakeup
 344	 * reason, so there is no point setting r12 to SRR1.
 345	 *
 346	 * Further, we clear r12 here, so that we don't accidentally enter the
 347	 * HMI in pnv_wakeup_noloss() if the value of r12[42:45] == WAKE_HMI.
 348	 */
 349	li	r12, 0
 350	b 	pnv_wakeup_noloss
 351
 352.Lhandle_esl_ec_set:
    	/*
    	 * ESL and/or EC requested. r3 holds the Requested Level (low 4 bits
    	 * of the PSSCR value, isolated by power_enter_stop). Levels below
    	 * pnv_first_deep_stop_state stop right here; the others continue at
    	 * .Lhandle_deep_stop. Uses r4 and r5 as scratch.
    	 */
 353BEGIN_FTR_SECTION
 354	/*
 355	 * POWER9 DD2.0 or earlier can incorrectly set PMAO when waking up after
 356	 * a state-loss idle. Saving and restoring MMCR0 over idle is a
 357	 * workaround.
 358	 */
 359	mfspr	r4,SPRN_MMCR0
 360	std	r4,_MMCR0(r1)
 361END_FTR_SECTION_IFCLR(CPU_FTR_POWER9_DD2_1)
 362
 363/*
 364 * Check if the requested state is a deep idle state.
 365 */
 366	LOAD_REG_ADDRBASE(r5,pnv_first_deep_stop_state)
 367	ld	r4,ADDROFF(pnv_first_deep_stop_state)(r5)
 368	cmpd	r3,r4
 369	bge	.Lhandle_deep_stop
 370	PPC_STOP	/* Does not return (system reset interrupt) */
 371
 372.Lhandle_deep_stop:
 373/*
 374 * Entering deep idle state.
 375 * Clear thread bit in PACA_CORE_IDLE_STATE, save SPRs to
 376 * stack and enter stop
     *
     * r7 = this thread's mask, r14 = pointer to core_idle_state,
     * r15 = value being updated, r9 = scratch for the lock-bit test.
     * If the lock bit is set, core_idle_lock_held spins and hands back a
     * fresh reservation in r15 before the update is attempted.
 377 */
 378	lbz     r7,PACA_THREAD_MASK(r13)
 379	ld      r14,PACA_CORE_IDLE_STATE_PTR(r13)
 380
 381lwarx_loop_stop:
 382	lwarx   r15,0,r14
 383	andis.	r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
 384	bnel-	core_idle_lock_held
 385	andc    r15,r15,r7                      /* Clear thread bit */
 386
 387	stwcx.  r15,0,r14
 388	bne-    lwarx_loop_stop
 389	isync
 390
 391	bl	save_sprs_to_stack
 392
 393	PPC_STOP	/* Does not return (system reset interrupt) */
 394
 395/*
 396 * Entered with MSR[EE]=0 and no soft-masked interrupts pending.
 397 * r3 contains desired idle state (PNV_THREAD_NAP/SLEEP/WINKLE).
     *
     * Thin entry point: passes r3 through unchanged and selects
     * pnv_enter_arch207_idle_mode as the handler (in r4) for
     * pnv_powersave_common.
 398 */
 399_GLOBAL(power7_idle_insn)
 400	/* Handler address for pnv_powersave_common goes in r4 */
 401	LOAD_REG_ADDR(r4, pnv_enter_arch207_idle_mode)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 402	b	pnv_powersave_common
 
 
 
 
 
 
 
 
 403
    /*
     * CHECK_HMI_INTERRUPT
     *
     * Expects r12 = SRR1 and r13 = PACA. Extracts the wake reason field of
     * r12 into r0 (a different mask is used depending on CPU_FTR_ARCH_207S)
     * and compares it with 0xa. On a match it reloads r2 from PACATOC and r1
     * from PACAR1, then calls hmi_exception_realmode with r3 = 0; the
     * original r3 is parked in the ORIG_GPR3 slot of that frame around the
     * call. Clobbers r0 and cr0 always; on the HMI path also r1, r2, LR and
     * whatever the callee clobbers. Uses local label 20 and nested feature
     * section id 66.
     */
 404#define CHECK_HMI_INTERRUPT						\
 
 405BEGIN_FTR_SECTION_NESTED(66);						\
 406	rlwinm	r0,r12,45-31,0xf;  /* extract wake reason field (P8) */	\
 407FTR_SECTION_ELSE_NESTED(66);						\
 408	rlwinm	r0,r12,45-31,0xe;  /* P7 wake reason field is 3 bits */	\
 409ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_ARCH_207S, 66);		\
 410	cmpwi	r0,0xa;			/* Hypervisor maintenance ? */	\
 411	bne+	20f;							\
 412	/* Invoke opal call to handle hmi */				\
 413	ld	r2,PACATOC(r13);					\
 414	ld	r1,PACAR1(r13);						\
 415	std	r3,ORIG_GPR3(r1);	/* Save original r3 */		\
 416	li	r3,0;			/* NULL argument */		\
 417	bl	hmi_exception_realmode;					\
 418	nop;								\
 419	ld	r3,ORIG_GPR3(r1);	/* Restore original r3 */	\
 42020:	nop;
 421
 
 422/*
 423 * Entered with MSR[EE]=0 and no soft-masked interrupts pending.
 424 * r3 contains desired PSSCR register value.
 425 *
 426 * Offline (CPU unplug) case also must notify KVM that the CPU is
 427 * idle.
     *
     * There is no branch or return at the end of this routine: after the
     * optional KVM notification (which clobbers r4) it falls straight into
     * power9_idle_stop, which must therefore stay immediately below.
 428 */
 429_GLOBAL(power9_offline_stop)
 430#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
 431	/*
 432	 * Tell KVM we're entering idle.
 433	 * This does not have to be done in real mode because the P9 MMU
 434	 * is independent per-thread. Some steppings share radix/hash mode
 435	 * between threads, but in that case KVM has a barrier sync in real
 436	 * mode before and after switching between radix and hash.
 437	 */
 438	li	r4,KVM_HWTHREAD_IN_IDLE
 439	stb	r4,HSTATE_HWTHREAD_STATE(r13)
 440#endif
 441	/* fall through */
 442
 443_GLOBAL(power9_idle_stop)
    	/*
    	 * r3 - requested PSSCR value. It is recorded in PACA_REQ_PSSCR,
    	 * written to SPRN_PSSCR, and power_enter_stop is handed to
    	 * pnv_powersave_common as the handler (r4). With
    	 * CONFIG_KVM_BOOK3S_HV_POSSIBLE and CPU_FTR_P9_TM_XER_SO_BUG, a
    	 * non-zero PACA_DONT_STOP aborts the stop: PACA_REQ_PSSCR is cleared
    	 * and 0 is returned in r3. Clobbers r4 and r5.
    	 */
 444	std	r3, PACA_REQ_PSSCR(r13)
 445#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
 446BEGIN_FTR_SECTION
 447	sync
 448	lwz	r5, PACA_DONT_STOP(r13)
 449	cmpwi	r5, 0
 450	bne	1f
 451END_FTR_SECTION_IFSET(CPU_FTR_P9_TM_XER_SO_BUG)
 452#endif
 453	mtspr 	SPRN_PSSCR,r3
 454	LOAD_REG_ADDR(r4,power_enter_stop)
 455	b	pnv_powersave_common
 456	/* No return */
 457#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
 4581:
 459	/*
 460	 * We get here when TM / thread reconfiguration bug workaround
 461	 * code wants to get the CPU into SMT4 mode, and therefore
 462	 * we are being asked not to stop.
 463	 */
 464	li	r3, 0
 465	std	r3, PACA_REQ_PSSCR(r13)
 466	blr		/* return 0 for wakeup cause / SRR1 value */
 467#endif
 468
 469/*
 470 * On waking up from stop 0,1,2 with ESL=1 on POWER9 DD1,
 471 * HSPRG0 will be set to the HSPRG0 value of one of the
 472 * threads in this core. Thus the value we have in r13
 473 * may not be this thread's paca pointer.
 474 *
 475 * Fortunately, the TIR remains invariant. Since this thread's
 476 * paca pointer is recorded in all its sibling's paca, we can
 477 * correctly recover this thread's paca pointer if we
 478 * know the index of this thread in the core.
 479 *
 480 * This index can be obtained from the TIR.
 481 *
 482 * i.e, thread's position in the core = TIR.
 483 * If this value is i, then this thread's paca is
 484 * paca->thread_sibling_pacas[i].
     *
     * In:  r13 - paca of some thread in this core
     * Out: r13 - this thread's paca (also installed with SET_PACA), with
     *            PACA_NAPSTATELOST set to 1
     * Clobbers r3, r4, r5. Called with bl from pnv_powersave_wakeup.
 485 */
 486power9_dd1_recover_paca:
 487	mfspr	r4, SPRN_TIR
 488	/*
 489	 * Since each entry in thread_sibling_pacas is 8 bytes
 490	 * we need to left-shift by 3 bits. Thus r4 = i * 8
 491	 */
 492	sldi	r4, r4, 3
 493	/* Get &paca->thread_sibling_pacas[0] in r5 */
 494	ld	r5, PACA_SIBLING_PACA_PTRS(r13)
 495	/* Load paca->thread_sibling_pacas[i] into r13 */
 496	ldx	r13, r4, r5
 497	SET_PACA(r13)
 498	/*
 499	 * Indicate that we have lost NVGPR state
 500	 * which needs to be restored from the stack.
 501	 */
 502	li	r3, 1
 503	stb	r3,PACA_NAPSTATELOST(r13)
 504	blr
 505
 506/*
 507 * Called from machine check handler for powersave wakeups.
 508 * Low level machine check processing has already been done. Now just
 509 * go through the wake up path to get everything in order.
 510 *
 511 * r3 - The original SRR1 value.
 512 * Original SRR[01] have been clobbered.
 513 * MSR_RI is clear.
     *
     * Sets up cr3 and r12 the way pnv_powersave_wakeup expects them and
     * branches there. Clobbers r11.
 514 */
 515.global pnv_powersave_wakeup_mce
 516pnv_powersave_wakeup_mce:
 517	/*
    	 * Set cr3 for pnv_powersave_wakeup: rotate r3 left by 47-31 and keep
    	 * the low two bits, then compare that 2-bit value with 2 (so cr3 is
    	 * gt only when both bits are set, lt when the value is 0 or 1).
    	 */
 518	rlwinm	r11,r3,47-31,30,31
 519	cmpwi	cr3,r11,2
 520
 521	/*
 522	 * Now put the original SRR1 with SRR1_WAKEMCE_RESVD as the wake
 523	 * reason into r12, which allows reuse of the system reset wakeup
 524	 * code without being mistaken for another type of wakeup.
 525	 */
 526	oris	r12,r3,SRR1_WAKEMCE_RESVD@h
 527
 528	b	pnv_powersave_wakeup
 529
 530/*
 531 * Called from reset vector for powersave wakeups.
 532 * cr3 - set to gt if waking up with partial/complete hypervisor state loss
 533 * r12 - SRR1
     *
     * Steps: reload the TOC pointer, run the ISA-specific
     * pnv_restore_hyp_resource_* helper (after power9_dd1_recover_paca on
     * POWER9 DD1), mark the thread PNV_THREAD_RUNNING, copy SRR1 into r3 as
     * the return value, perform the KVM hwthread handshake when configured,
     * and finish through pnv_wakeup_noloss (cr3 lt) or pnv_wakeup_loss
     * (cr3 eq or gt).
 534 */
 535.global pnv_powersave_wakeup
 536pnv_powersave_wakeup:
 537	ld	r2, PACATOC(r13)
 538
 539BEGIN_FTR_SECTION
 540BEGIN_FTR_SECTION_NESTED(70)
 541	bl	power9_dd1_recover_paca
 542END_FTR_SECTION_NESTED_IFSET(CPU_FTR_POWER9_DD1, 70)
 543	bl	pnv_restore_hyp_resource_arch300
 544FTR_SECTION_ELSE
 545	bl	pnv_restore_hyp_resource_arch207
 546ALT_FTR_SECTION_END_IFSET(CPU_FTR_ARCH_300)
 547
 548	li	r0,PNV_THREAD_RUNNING
 549	stb	r0,PACA_THREAD_IDLE_STATE(r13)	/* Clear thread state */
 550
 551	mr	r3,r12
 552
 553#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
 554	lbz	r0,HSTATE_HWTHREAD_STATE(r13)
 555	cmpwi	r0,KVM_HWTHREAD_IN_KERNEL
 556	beq	0f
 557	li	r0,KVM_HWTHREAD_IN_KERNEL
 558	stb	r0,HSTATE_HWTHREAD_STATE(r13)
 559	/* Order setting hwthread_state vs. testing hwthread_req */
 560	sync
 5610:	lbz	r0,HSTATE_HWTHREAD_REQ(r13)
 562	cmpwi	r0,0
 563	beq	1f
 564	b	kvm_start_guest
 5651:
 566#endif
 567
 568	/* Return SRR1 (now in r3) to the caller of the idle entry function */
 569	blt	cr3,pnv_wakeup_noloss
 570	b	pnv_wakeup_loss
 571
 572/*
 573 * Check whether we have woken up with hypervisor state loss.
 574 * If yes, restore hypervisor state and return back to link.
 575 *
 576 * cr3 - set to gt if waking up with partial/complete hypervisor state loss
     *
     * Also sets cr4 from comparing the stop level we woke from (r5) with
     * pnv_first_deep_stop_state (r4), and clears PACA_REQ_PSSCR. When
     * cr4 is gt or eq, control moves to pnv_wakeup_tb_loss with LR
     * untouched, so that routine returns to our caller. Clobbers r0, r4, r5
     * (and r1 inside the pre-DD2.1 workaround section).
 577 */
 578pnv_restore_hyp_resource_arch300:
 579	/*
 580	 * Workaround for POWER9, if we lost resources, the ERAT
 581	 * might have been mixed up and needs flushing. We also need
 582	 * to reload MMCR0 (see comment above). We also need to set
 583	 * then clear bit 60 in MMCRA to ensure the PMU starts running.
 584	 */
 585	blt	cr3,1f
 586BEGIN_FTR_SECTION
 587	PPC_INVALIDATE_ERAT
 588	ld	r1,PACAR1(r13)
 589	ld	r4,_MMCR0(r1)
 590	mtspr	SPRN_MMCR0,r4
 591END_FTR_SECTION_IFCLR(CPU_FTR_POWER9_DD2_1)
 592	mfspr	r4,SPRN_MMCRA
 593	ori	r4,r4,(1 << (63-60))
 594	mtspr	SPRN_MMCRA,r4
 595	xori	r4,r4,(1 << (63-60))
 596	mtspr	SPRN_MMCRA,r4
 5971:
 598	/*
 599	 * POWER ISA 3. Use PSSCR to determine if we
 600	 * are waking up from deep idle state
 601	 */
 602	LOAD_REG_ADDRBASE(r5,pnv_first_deep_stop_state)
 603	ld	r4,ADDROFF(pnv_first_deep_stop_state)(r5)
 604
 605BEGIN_FTR_SECTION_NESTED(71)
 606	/*
 607	 * Assume that we are waking up from the state
 608	 * same as the Requested Level (RL) in the PSSCR
 609	 * which are Bits 60-63
 610	 */
 611	ld	r5,PACA_REQ_PSSCR(r13)
 612	rldicl  r5,r5,0,60
 613FTR_SECTION_ELSE_NESTED(71)
 614	/*
 615	 * 0-3 bits correspond to Power-Saving Level Status
 616	 * which indicates the idle state we are waking up from
 617	 */
 618	mfspr	r5, SPRN_PSSCR
 619	rldicl  r5,r5,4,60
 620ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_POWER9_DD1, 71)
 621	li	r0, 0		/* clear requested_psscr to say we're awake */
 622	std	r0, PACA_REQ_PSSCR(r13)
 623	cmpd	cr4,r5,r4
 624	bge	cr4,pnv_wakeup_tb_loss /* returns to caller */
 
 
 
 
 
 625
 626	blr	/* Waking up without hypervisor state loss. */
 627
 628/*
     * Same calling convention as arch300.
     *
     * Leaves the saved PACA_THREAD_IDLE_STATE in r4 (pnv_wakeup_tb_loss
     * consumes it) and sets cr2 from comparing it with PNV_THREAD_NAP.
     */
 629pnv_restore_hyp_resource_arch207:
 630	/*
 631	 * POWER ISA 2.07 or less.
 632	 * Check if we slept with sleep or winkle.
 633	 */
 634	lbz	r4,PACA_THREAD_IDLE_STATE(r13)
 635	cmpwi	cr2,r4,PNV_THREAD_NAP
 636	bgt	cr2,pnv_wakeup_tb_loss	/* Either sleep or Winkle */
 
 
 
 
 
 
 
 
 637
 638	/*
 639	 * We fall through here if PACA_THREAD_IDLE_STATE shows we are waking
 640	 * up from nap. At this stage CR3 shouldn't contain 'gt' since that
 641	 * indicates we are waking with hypervisor state loss from nap.
    	 * The branch-to-self below spins forever if that ever happens.
 642	 */
 643	bgt	cr3,.
 644
 645	blr	/* Waking up without hypervisor state loss */
 
 646
 647/*
 648 * Called if waking up from idle state which can cause either partial or
 649 * complete hyp state loss.
 650 * In POWER8, called if waking up from fastsleep or winkle
 651 * In POWER9, called if waking up from stop state >= pnv_first_deep_stop_state
 652 *
 653 * r13 - PACA
 654 * cr3 - gt if waking up with partial/complete hypervisor state loss
 655 *
 656 * If ISA300:
 657 * cr4 - gt or eq if waking up from complete hypervisor state loss.
 658 *
 659 * If ISA207:
 660 * r4 - PACA_THREAD_IDLE_STATE
     *
     * Register use established below and relied on by the labels that follow:
     * r1  - frame pointer reloaded from PACAR1
     * r7  - this thread's mask (PACA_THREAD_MASK)
     * r14 - pointer to core_idle_state, r15 - its working value
     * r17 - caller's LR, r18 - copy of r4, r19 - copy of r12 (SRR1)
     * cr2 - eq if this is the first thread of the core to wake up
 661 */
 662pnv_wakeup_tb_loss:
 663	ld	r1,PACAR1(r13)
 664	/*
 665	 * Before entering any idle state, the NVGPRs are saved in the stack.
 666	 * If there was a state loss, or PACA_NAPSTATELOST was set, then the
 667	 * NVGPRs are restored. If we are here, it is likely that state is lost,
 668	 * but not guaranteed -- neither ISA207 nor ISA300 tests to reach
 669	 * here are the same as the test to restore NVGPRS:
 670	 * PACA_THREAD_IDLE_STATE test for ISA207, PSSCR test for ISA300,
 671	 * and SRR1 test for restoring NVGPRs.
 672	 *
 673	 * We are about to clobber NVGPRs now, so set NAPSTATELOST to
 674	 * guarantee they will always be restored. This might be tightened
 675	 * with careful reading of specs (particularly for ISA300) but this
 676	 * is already a slow wakeup path and it's simpler to be safe.
 677	 */
 678	li	r0,1
 679	stb	r0,PACA_NAPSTATELOST(r13)
 680
 681	/*
 682	 *
 683	 * Save SRR1 and LR in NVGPRs as they might be clobbered in
 684	 * opal_call() (called in CHECK_HMI_INTERRUPT). SRR1 is required
 685	 * to determine the wakeup reason if we branch to kvm_start_guest. LR
 686	 * is required to return back to reset vector after hypervisor state
 687	 * restore is complete. r4 is kept in r18 as well.
 688	 */
 689	mr	r19,r12
 690	mr	r18,r4
 691	mflr	r17
 
 692BEGIN_FTR_SECTION
 693	CHECK_HMI_INTERRUPT
 694END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
 695
 696	ld	r14,PACA_CORE_IDLE_STATE_PTR(r13)
 697	lbz	r7,PACA_THREAD_MASK(r13)
 698
 
 
 
 699	/*
 700	 * Take the core lock to synchronize against other threads.
 701	 *
 702	 * Lock bit is set in one of the 2 cases-
 703	 * a. In the sleep/winkle enter path, the last thread is executing
 704	 * fastsleep workaround code.
 705	 * b. In the wake up path, another thread is executing fastsleep
 706	 * workaround undo code or resyncing timebase or restoring context
 707	 * In either case loop until the lock bit is cleared.
 708	 */
 7091:
 710	lwarx	r15,0,r14
 711	andis.	r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
 712	bnel-	core_idle_lock_held
 713	oris	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
 714	stwcx.	r15,0,r14
 715	bne-	1b
 716	isync
 717
 718	andi.	r9,r15,PNV_CORE_IDLE_THREAD_BITS
 719	cmpwi	cr2,r9,0
 720
 721	/*
 722	 * At this stage
 723	 * cr2 - eq if first thread to wakeup in core
 724	 * cr3-  gt if waking up with partial/complete hypervisor state loss
 725	 * ISA300:
 726	 * cr4 - gt or eq if waking up from complete hypervisor state loss.
 727	 */
 728
 729BEGIN_FTR_SECTION
 730	/*
 731	 * Were we in winkle?
 732	 * If yes, check if all threads were in winkle, decrement our
 733	 * winkle count, set all thread winkle bits if all were in winkle.
 734	 * Check if our thread has a winkle bit set, and set cr4 accordingly
 735	 * (to match ISA300, above). Pseudo-code for core idle state
 736	 * transitions for ISA207 is as follows (everything happens atomically
 737	 * due to store conditional and/or lock bit):
 738	 *
 739	 * nap_idle() { }
 740	 * nap_wake() { }
 741	 *
 742	 * sleep_idle()
 743	 * {
 744	 *	core_idle_state &= ~thread_in_core
 745	 * }
 746	 *
 747	 * sleep_wake()
 748	 * {
 749	 *     bool first_in_core, first_in_subcore;
 750	 *
 751	 *     first_in_core = (core_idle_state & IDLE_THREAD_BITS) == 0;
 752	 *     first_in_subcore = (core_idle_state & SUBCORE_SIBLING_MASK) == 0;
 753	 *
 754	 *     core_idle_state |= thread_in_core;
 755	 * }
 756	 *
 757	 * winkle_idle()
 758	 * {
 759	 *	core_idle_state &= ~thread_in_core;
 760	 *	core_idle_state += 1 << WINKLE_COUNT_SHIFT;
 761	 * }
 762	 *
 763	 * winkle_wake()
 764	 * {
 765	 *     bool first_in_core, first_in_subcore, winkle_state_lost;
 766	 *
 767	 *     first_in_core = (core_idle_state & IDLE_THREAD_BITS) == 0;
 768	 *     first_in_subcore = (core_idle_state & SUBCORE_SIBLING_MASK) == 0;
 769	 *
 770	 *     core_idle_state |= thread_in_core;
 771	 *
 772	 *     if ((core_idle_state & WINKLE_MASK) == (8 << WINKLE_COUNT_SHIFT))
 773	 *         core_idle_state |= THREAD_WINKLE_BITS;
 774	 *     core_idle_state -= 1 << WINKLE_COUNT_SHIFT;
 775	 *
 776	 *     winkle_state_lost = core_idle_state &
 777	 *				(thread_in_core << WINKLE_THREAD_SHIFT);
 778	 *     core_idle_state &= ~(thread_in_core << WINKLE_THREAD_SHIFT);
 779	 * }
 780	 *
 781	 */
 782	cmpwi	r18,PNV_THREAD_WINKLE
 783	bne	2f
 784	andis.	r9,r15,PNV_CORE_IDLE_WINKLE_COUNT_ALL_BIT@h
 785	subis	r15,r15,PNV_CORE_IDLE_WINKLE_COUNT@h
 786	beq	2f
 787	ori	r15,r15,PNV_CORE_IDLE_THREAD_WINKLE_BITS /* all were winkle */
 7882:
 789	/* Shift thread bit to winkle mask, then test if this thread is set,
 790	 * and remove it from the winkle bits */
 791	slwi	r8,r7,8
 792	and	r8,r8,r15
 793	andc	r15,r15,r8
 794	cmpwi	cr4,r8,1 /* cr4 will be gt if our bit is set, lt if not */
 795
 
 796	lbz	r4,PACA_SUBCORE_SIBLING_MASK(r13)
 797	and	r4,r4,r15
 798	cmpwi	r4,0	/* Check if first in subcore */
 799
 800	or	r15,r15,r7		/* Set thread bit */
 801	beq	first_thread_in_subcore
 802END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
 803
 804	or	r15,r15,r7		/* Set thread bit */
 805	beq	cr2,first_thread_in_core
 806
 807	/* Not first thread in core or subcore to wake up */
 808	b	clear_lock
 809
 810first_thread_in_subcore:
 811	/*
 812	 * If waking up from sleep, subcore state is not lost. Hence
 813	 * skip subcore state restore
    	 * (cr4 lt means this thread's winkle bit was not set).
 814	 */
 815	blt	cr4,subcore_state_restored
 816
 817	/* Restore per-subcore state (SDR1, RPR, AMOR) from the frame at r1 */
 818	ld      r4,_SDR1(r1)
 819	mtspr   SPRN_SDR1,r4
 820
 821	ld      r4,_RPR(r1)
 822	mtspr   SPRN_RPR,r4
 823	ld	r4,_AMOR(r1)
 824	mtspr	SPRN_AMOR,r4
 825
 826subcore_state_restored:
 827	/*
 828	 * Check if the thread is also the first thread in the core. If not,
 829	 * skip to clear_lock.
 830	 */
 831	bne	cr2,clear_lock
 832
 833first_thread_in_core:
 834
 835	/*
 836	 * First thread in the core waking up from any state which can cause
 837	 * partial or complete hypervisor state loss. It needs to
 838	 * call the fastsleep workaround code if the platform requires it.
 839	 * Call it unconditionally here. The below branch instruction will
 840	 * be patched out if the platform does not have fastsleep or does not
 841	 * require the workaround. Patching will be performed during the
 842	 * discovery of idle-states.
    	 *
    	 * When the branch is patched out, execution simply continues into
    	 * timebase_resync, which is also where fastsleep_workaround_at_exit
    	 * branches back to.
 843	 */
 844.global pnv_fastsleep_workaround_at_exit
 845pnv_fastsleep_workaround_at_exit:
 846	b	fastsleep_workaround_at_exit
 847
 848timebase_resync:
 849	/*
 850	 * Use cr3 which indicates that we are waking up with at least partial
 851	 * hypervisor state loss to determine if TIMEBASE RESYNC is needed.
 852	 */
 853	ble	cr3,.Ltb_resynced
 854	/* Time base re-sync */
 855	bl	opal_resync_timebase;
 856	/*
 857	 * If waking up from sleep (POWER8), per core state
 858	 * is not lost, skip to clear_lock.
 859	 */
 860.Ltb_resynced:
 861	blt	cr4,clear_lock
 862
 863	/*
 864	 * First thread in the core to wake up and it's waking up with
 865	 * complete hypervisor state loss. Restore per core hypervisor
 866	 * state.
    	 * PTCR, RPR and AMOR are reloaded only under CPU_FTR_ARCH_300;
    	 * TSCR and WORC are reloaded on every CPU that gets here.
 867	 */
 868BEGIN_FTR_SECTION
 869	ld	r4,_PTCR(r1)
 870	mtspr	SPRN_PTCR,r4
 871	ld	r4,_RPR(r1)
 872	mtspr	SPRN_RPR,r4
 873	ld	r4,_AMOR(r1)
 874	mtspr	SPRN_AMOR,r4
 875END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
 876
 877	ld	r4,_TSCR(r1)
 878	mtspr	SPRN_TSCR,r4
 879	ld	r4,_WORC(r1)
 880	mtspr	SPRN_WORC,r4
 881
 882clear_lock:
    	/*
    	 * Release the core lock: r15 still carries the lock bit set when the
    	 * lock was taken in pnv_wakeup_tb_loss, so xoris flips it back to 0.
    	 * lwsync orders the preceding restores before the unlocking store.
    	 * Execution then continues into common_exit.
    	 */
 883	xoris	r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
 884	lwsync
 885	stw	r15,0(r14)
 886
 887common_exit:
 888	/*
 889	 * Common to all threads.
 890	 *
 891	 * If waking up from sleep, hypervisor state is not lost. Hence
 892	 * skip hypervisor state restore.
 893	 */
 894	blt	cr4,hypervisor_state_restored
 895
 896	/* Waking up from winkle */
 897
 898BEGIN_MMU_FTR_SECTION
 899	b	no_segments
 900END_MMU_FTR_SECTION_IFSET(MMU_FTR_TYPE_RADIX)
 901	/* Restore SLB  from PACA */
 902	ld	r8,PACA_SLBSHADOWPTR(r13)
 903
    	/*
    	 * One unrolled copy per bolted entry: load the two doublewords at
    	 * SLBSHADOW_SAVEAREA and SLBSHADOW_SAVEAREA + 8 relative to r8,
    	 * install them with slbmte only if SLB_ESID_V is set in the first,
    	 * then advance r8 by 16 to the next entry. Clobbers r3, r5, r6, r7.
    	 */
 904	.rept	SLB_NUM_BOLTED
 905	li	r3, SLBSHADOW_SAVEAREA
 906	LDX_BE	r5, r8, r3
 907	addi	r3, r3, 8
 908	LDX_BE	r6, r8, r3
 909	andis.	r7,r5,SLB_ESID_V@h
 910	beq	1f
 911	slbmte	r6,r5
 9121:	addi	r8,r8,16
 913	.endr
 914no_segments:
 915
 916	/* Restore per thread state */
 917
 918	ld	r4,_SPURR(r1)
 919	mtspr	SPRN_SPURR,r4
 920	ld	r4,_PURR(r1)
 921	mtspr	SPRN_PURR,r4
 922	ld	r4,_DSCR(r1)
 923	mtspr	SPRN_DSCR,r4
 924	ld	r4,_WORT(r1)
 925	mtspr	SPRN_WORT,r4
 926
 927	/* Call cur_cpu_spec->cpu_restore() */
 928	LOAD_REG_ADDR(r4, cur_cpu_spec)
 929	ld	r4,0(r4)
 930	ld	r12,CPU_SPEC_RESTORE(r4)
 931#ifdef PPC64_ELF_ABI_v1
 932	ld	r12,0(r12)
 933#endif
 934	mtctr	r12
 935	bctrl
 936
 937/*
 938 * On POWER9, we can come here on wakeup from a cpuidle stop state.
 939 * Hence restore the additional SPRs to the saved value.
 940 *
 941 * On POWER8, we come here only on winkle. Since winkle is used
 942 * only in the case of CPU-Hotplug, we don't need to restore
 943 * the additional SPRs.
 944 */
 945BEGIN_FTR_SECTION
 946	bl 	power9_restore_additional_sprs
 947END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
 948hypervisor_state_restored:
 949
    	/* Hand back SRR1 in r12 and return through the LR saved in r17 */
 950	mr	r12,r19
 951	mtlr	r17
 952	blr		/* return to pnv_powersave_wakeup */
 
 953
 954fastsleep_workaround_at_exit:
    	/*
    	 * Wake-up counterpart of fastsleep_workaround_at_entry: calls
    	 * opal_config_cpu_idle_state with r3 = 1, r4 = 0 and rejoins the
    	 * wake-up path at timebase_resync. Reached only from the patchable
    	 * branch at pnv_fastsleep_workaround_at_exit.
    	 */
 955	li	r3,1
 956	li	r4,0
 957	bl	opal_config_cpu_idle_state
 958	b	timebase_resync
 959
 960/*
 961 * R3 here contains the value that will be returned to the caller
 962 * of power7_nap.
 963 * R12 contains SRR1 for CHECK_HMI_INTERRUPT.
     *
     * State-loss return path: reloads r1 from PACAR1, restores the
     * non-volatile GPRs and r2 from that frame, pops the frame, restores LR
     * (from _LINK) and CR (from _CCR), switches the MSR to PACAKMSR and
     * returns. Clobbers r4, r5, r6.
 964 */
 965.global pnv_wakeup_loss
 966pnv_wakeup_loss:
 967	ld	r1,PACAR1(r13)
 968BEGIN_FTR_SECTION
 969	CHECK_HMI_INTERRUPT
 970END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
 971	REST_NVGPRS(r1)
 972	REST_GPR(2, r1)
 973	ld	r4,PACAKMSR(r13)
 974	ld	r5,_LINK(r1)
 975	ld	r6,_CCR(r1)
 
 
 976	addi	r1,r1,INT_FRAME_SIZE
 977	mtlr	r5
 978	mtcr	r6
 979	mtmsrd	r4
 980	blr
 
 981
 982/*
 983 * R3 here contains the value that will be returned to the caller
 984 * of power7_nap.
 985 * R12 contains SRR1 for CHECK_HMI_INTERRUPT.
     *
     * No-state-loss return path. If PACA_NAPSTATELOST is non-zero it defers
     * to pnv_wakeup_loss. Otherwise it reloads r1 from PACAR1, pops the
     * frame, restores LR (from _NIP) and CR (from _CCR), switches the MSR
     * to PACAKMSR and returns; the GPRs saved in the frame are not reloaded.
     * Clobbers r0, r4, r5, r6.
 986 */
 987pnv_wakeup_noloss:
 988	lbz	r0,PACA_NAPSTATELOST(r13)
 989	cmpwi	r0,0
 990	bne	pnv_wakeup_loss
 991	ld	r1,PACAR1(r13)
 992BEGIN_FTR_SECTION
 993	CHECK_HMI_INTERRUPT
 994END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
 995	ld	r4,PACAKMSR(r13)
 996	ld	r5,_NIP(r1)
 997	ld	r6,_CCR(r1)
 
 
 998	addi	r1,r1,INT_FRAME_SIZE
 999	mtlr	r5
1000	mtcr	r6
1001	mtmsrd	r4
1002	blr
 
v4.10.11
  1/*
  2 *  This file contains idle entry/exit functions for POWER7,
  3 *  POWER8 and POWER9 CPUs.
  4 *
  5 *  This program is free software; you can redistribute it and/or
  6 *  modify it under the terms of the GNU General Public License
  7 *  as published by the Free Software Foundation; either version
  8 *  2 of the License, or (at your option) any later version.
  9 */
 10
 11#include <linux/threads.h>
 12#include <asm/processor.h>
 13#include <asm/page.h>
 14#include <asm/cputable.h>
 15#include <asm/thread_info.h>
 16#include <asm/ppc_asm.h>
 17#include <asm/asm-offsets.h>
 18#include <asm/ppc-opcode.h>
 19#include <asm/hw_irq.h>
 20#include <asm/kvm_book3s_asm.h>
 21#include <asm/opal.h>
 22#include <asm/cpuidle.h>
 
 23#include <asm/book3s/64/mmu-hash.h>
 24#include <asm/mmu.h>
 25
 26#undef DEBUG
 27
 28/*
 29 * Use unused space in the interrupt stack to save and restore
 30 * registers for winkle support.
    *
    * Each name below aliases one GPR slot of the stack frame addressed off
    * r1; save_sprs_to_stack fills them. In this version _PTCR has its own
    * slot (GPR12) and does not overlap _SDR1.
 31 */
 
 32#define _SDR1	GPR3
 
 33#define _RPR	GPR4
 34#define _SPURR	GPR5
 35#define _PURR	GPR6
 36#define _TSCR	GPR7
 37#define _DSCR	GPR8
 38#define _AMOR	GPR9
 39#define _WORT	GPR10
 40#define _WORC	GPR11
 41#define _PTCR	GPR12
 42
 43#define PSSCR_HV_TEMPLATE	(PSSCR_ESL | PSSCR_EC | \
 44				PSSCR_PSLL_MASK | PSSCR_TR_MASK | \
 45				PSSCR_MTL_MASK)
   /*
    * PSSCR_HV_TEMPLATE is the OR of the PSSCR ESL and EC bits with the PSLL,
    * TR and MTL field masks. The expansion is parenthesized so that it stays
    * a single term wherever it is substituted.
    */
 46
 47	.text
 48
 49/*
 50 * Used by threads before entering deep idle states. Saves SPRs
 51 * in interrupt stack frame
 *
 * r1 - frame whose _XXX slots receive the SPR values
 * Clobbers r3. Returns with blr, so LR must still hold the return
 * address set up by the caller's bl.
 52 */
 53save_sprs_to_stack:
 54	/*
 55	 * Note that all registers, i.e. per-core, per-subcore and per-thread,
 56	 * are saved here since any thread in the core might wake up first
 57	 */
 58BEGIN_FTR_SECTION
 59	mfspr	r3,SPRN_PTCR
 60	std	r3,_PTCR(r1)
 61	/*
 62	 * Note - SDR1 is dropped in Power ISA v3. Hence not saving
 63	 * SDR1 here
 64	 */
 
 
 
 
 65FTR_SECTION_ELSE
 66	mfspr	r3,SPRN_SDR1
 67	std	r3,_SDR1(r1)
 68ALT_FTR_SECTION_END_IFSET(CPU_FTR_ARCH_300)
	/* The remaining SPRs are saved regardless of CPU_FTR_ARCH_300 */
 69	mfspr	r3,SPRN_RPR
 70	std	r3,_RPR(r1)
 71	mfspr	r3,SPRN_SPURR
 72	std	r3,_SPURR(r1)
 73	mfspr	r3,SPRN_PURR
 74	std	r3,_PURR(r1)
 75	mfspr	r3,SPRN_TSCR
 76	std	r3,_TSCR(r1)
 77	mfspr	r3,SPRN_DSCR
 78	std	r3,_DSCR(r1)
 79	mfspr	r3,SPRN_AMOR
 80	std	r3,_AMOR(r1)
 81	mfspr	r3,SPRN_WORT
 82	std	r3,_WORT(r1)
 83	mfspr	r3,SPRN_WORC
 84	std	r3,_WORC(r1)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 85
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 86	blr
 87
 88/*
 89 * Used by threads when the lock bit of core_idle_state is set.
 90 * Threads will spin in HMT_LOW until the lock bit is cleared.
 91 * r14 - pointer to core_idle_state
 92 * r15 - used to load contents of core_idle_state
 93 * r9  - used as a temporary variable
 *
 * Callers in this file reach it with bnel, so LR is overwritten.
 * On return r15 holds the value loaded by the final lwarx, whose lock
 * bit was seen clear, and cr0 is eq.
 94 */
 95
 96core_idle_lock_held:
 97	HMT_LOW
	/* Poll with plain loads until the lock bit reads as clear */
 983:	lwz	r15,0(r14)
 99	andi.   r15,r15,PNV_CORE_IDLE_LOCK_BIT
100	bne	3b
101	HMT_MEDIUM
	/* Reload with lwarx and re-check; start over if the lock was retaken */
102	lwarx	r15,0,r14
103	andi.	r9,r15,PNV_CORE_IDLE_LOCK_BIT
104	bne	core_idle_lock_held
105	blr
106
107/*
108 * Pass requested state in r3:
109 *	r3 - PNV_THREAD_NAP/SLEEP/WINKLE in POWER8
110 *	   - Requested STOP state in POWER9
111 *
112 * To check IRQ_HAPPENED in r4
113 * 	0 - don't check
114 * 	1 - check
115 *
116 * Address to 'rfid' to is passed in r5
 *
 * Returns 0 in r3 to the caller, without entering idle, when r4 is
 * non-zero and PACAIRQHAPPENED has a bit other than PACA_IRQ_HARD_DIS
 * set. The MSR change made by the mtmsrd below is not undone on that
 * path.
117 */
118_GLOBAL(pnv_powersave_common)
119	/* Use r3 to pass state nap/sleep/winkle */
120	/* NAP is a state loss, we create a regs frame on the
121	 * stack, fill it up with the state we care about and
122	 * stick a pointer to it in PACAR1. We really only
123	 * need to save PC, some CR bits and the NV GPRs,
124	 * but for now an interrupt frame will do.
125	 */
 
 
126	mflr	r0
127	std	r0,16(r1)
128	stdu	r1,-INT_FRAME_SIZE(r1)
	/*
	 * The caller's return address is stored as both _LINK and _NIP;
	 * pnv_wakeup_loss and pnv_wakeup_noloss resume at _NIP.
	 */
129	std	r0,_LINK(r1)
130	std	r0,_NIP(r1)
131
132	/* Hard disable interrupts */
133	mfmsr	r9
	/*
	 * Rotate left by 48 so that MSR bit 0x8000 lands in the top bit,
	 * mask that bit off, then rotate by 16 to undo the rotation.
	 */
134	rldicl	r9,r9,48,1
135	rotldi	r9,r9,16
136	mtmsrd	r9,1			/* hard-disable interrupts */
137
138	/* Check if something happened while soft-disabled */
139	lbz	r0,PACAIRQHAPPENED(r13)
140	andi.	r0,r0,~PACA_IRQ_HARD_DIS@l
141	beq	1f
142	cmpwi	cr0,r4,0
143	beq	1f
	/* Something is pending and the caller asked to check: pop and bail */
144	addi	r1,r1,INT_FRAME_SIZE
145	ld	r0,16(r1)
146	li	r3,0			/* Return 0 (no nap) */
147	mtlr	r0
148	blr
149
1501:	/* We mark irqs hard disabled as this is the state we'll
151	 * be in when returning and we need to tell arch_local_irq_restore()
152	 * about it
153	 */
154	li	r0,PACA_IRQ_HARD_DIS
155	stb	r0,PACAIRQHAPPENED(r13)
156
157	/* We haven't lost state ... yet */
158	li	r0,0
159	stb	r0,PACA_NAPSTATELOST(r13)
160
161	/* Continue saving state */
162	SAVE_GPR(2, r1)
163	SAVE_NVGPRS(r1)
164	mfcr	r4
165	std	r4,_CCR(r1)
	/* r9 is the MSR value written by the mtmsrd above */
166	std	r9,_MSR(r1)
167	std	r1,PACAR1(r13)
168
 
 
 
 
 
 
 
 
169	/*
 
170	 * Go to real mode to do the nap, as required by the architecture.
171	 * Also, we need to be in real mode before setting hwthread_state,
172	 * because as soon as we do that, another thread can switch
173	 * the MMU context to the guest.
174	 */
175	LOAD_REG_IMMEDIATE(r7, MSR_IDLE)
176	li	r6, MSR_RI
177	andc	r6, r9, r6
178	mtmsrd	r6, 1		/* clear RI before setting SRR0/1 */
	/* rfid continues at the address in r5 with MSR = MSR_IDLE */
179	mtspr	SPRN_SRR0, r5
180	mtspr	SPRN_SRR1, r7
181	rfid
 
 
 
 
 
 
 
 
 
 
182
/*
 * Entered through the rfid at the end of pnv_powersave_common;
 * power7_nap, power7_sleep and power7_winkle pass this address in r5.
 *
 * r3 - PNV_THREAD_NAP/SLEEP/WINKLE
 *
 * cr3 is set from r3 against PNV_THREAD_SLEEP and is read again at
 * common_enter to choose between sleep and winkle.
 */
183	.globl pnv_enter_arch207_idle_mode
184pnv_enter_arch207_idle_mode:
185#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
186	/* Tell KVM we're entering idle */
187	li	r4,KVM_HWTHREAD_IN_IDLE
188	/******************************************************/
189	/*  N O T E   W E L L    ! ! !    N O T E   W E L L   */
190	/* The following store to HSTATE_HWTHREAD_STATE(r13)  */
191	/* MUST occur in real mode, i.e. with the MMU off,    */
192	/* and the MMU must stay off until we clear this flag */
193	/* and test HSTATE_HWTHREAD_REQ(r13) in the system    */
194	/* reset interrupt vector in exceptions-64s.S.        */
195	/* The reason is that another thread can switch the   */
196	/* MMU to a guest context whenever this flag is set   */
197	/* to KVM_HWTHREAD_IN_IDLE, and if the MMU was on,    */
198	/* that would potentially cause this thread to start  */
199	/* executing instructions from guest memory in        */
200	/* hypervisor mode, leading to a host crash or data   */
201	/* corruption, or worse.                              */
202	/******************************************************/
203	stb	r4,HSTATE_HWTHREAD_STATE(r13)
204#endif
205	stb	r3,PACA_THREAD_IDLE_STATE(r13)
206	cmpwi	cr3,r3,PNV_THREAD_SLEEP
207	bge	cr3,2f
208	IDLE_STATE_ENTER_SEQ(PPC_NAP)
209	/* No return */
2102:
211	/* Sleep or winkle */
212	lbz	r7,PACA_THREAD_MASK(r13)
213	ld	r14,PACA_CORE_IDLE_STATE_PTR(r13)
 
 
 
 
214lwarx_loop1:
215	lwarx	r15,0,r14
216
217	andi.   r9,r15,PNV_CORE_IDLE_LOCK_BIT
218	bnel	core_idle_lock_held
219
 
220	andc	r15,r15,r7			/* Clear thread bit */
221
	/* Keep only the thread bits; cr0 is eq when none remain set */
222	andi.	r15,r15,PNV_CORE_IDLE_THREAD_BITS
223
224/*
225 * If cr0 is eq, then current thread is the last thread of the core entering
226 * sleep. Last thread needs to execute the hardware bug workaround code if
227 * required by the platform.
228 * Make the workaround call unconditionally here. The below branch call is
229 * patched out when the idle states are discovered if the platform does not
230 * require it.
231 */
232.global pnv_fastsleep_workaround_at_entry
233pnv_fastsleep_workaround_at_entry:
234	beq	fastsleep_workaround_at_entry
235
236	stwcx.	r15,0,r14
237	bne-	lwarx_loop1
238	isync
239
240common_enter: /* common code for all the threads entering sleep or winkle */
241	bgt	cr3,enter_winkle
242	IDLE_STATE_ENTER_SEQ(PPC_SLEEP)
243
244fastsleep_workaround_at_entry:
	/* Publish the new thread bits together with the lock bit */
245	ori	r15,r15,PNV_CORE_IDLE_LOCK_BIT
246	stwcx.	r15,0,r14
247	bne-	lwarx_loop1
248	isync
249
250	/* Fast sleep workaround */
251	li	r3,1
252	li	r4,1
253	bl	opal_rm_config_cpu_idle_state
254
255	/* Clear Lock bit */
	/*
	 * The thread bits in r15 were all zero on this path, so storing 0
	 * leaves the word as it was apart from the lock bit.
	 */
256	li	r0,0
257	lwsync
258	stw	r0,0(r14)
259	b	common_enter
260
261enter_winkle:
262	bl	save_sprs_to_stack
263
264	IDLE_STATE_ENTER_SEQ(PPC_WINKLE)
265
266/*
267 * r3 - requested stop state
 *
 * Entered through the rfid at the end of pnv_powersave_common;
 * power9_idle_stop passes this address in r5.
 * States below pnv_first_deep_stop_state execute the stop sequence
 * straight away. Deeper states first clear this thread's bit in the
 * core idle state word and save SPRs to the stack.
268 */
269power_enter_stop:
270#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
271	/* Tell KVM we're entering idle */
272	li	r4,KVM_HWTHREAD_IN_IDLE
273	/* DO THIS IN REAL MODE!  See comment above. */
274	stb	r4,HSTATE_HWTHREAD_STATE(r13)
275#endif
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
276/*
277 * Check if the requested state is a deep idle state.
278 */
279	LOAD_REG_ADDRBASE(r5,pnv_first_deep_stop_state)
280	ld	r4,ADDROFF(pnv_first_deep_stop_state)(r5)
281	cmpd	r3,r4
282	bge	2f
283	IDLE_STATE_ENTER_SEQ(PPC_STOP)
2842:
 
285/*
286 * Entering deep idle state.
287 * Clear thread bit in PACA_CORE_IDLE_STATE, save SPRs to
288 * stack and enter stop
289 */
290	lbz     r7,PACA_THREAD_MASK(r13)
291	ld      r14,PACA_CORE_IDLE_STATE_PTR(r13)
292
293lwarx_loop_stop:
294	lwarx   r15,0,r14
295	andi.   r9,r15,PNV_CORE_IDLE_LOCK_BIT
	/* Lock bit set: wait in core_idle_lock_held, which reloads r15 */
296	bnel    core_idle_lock_held
297	andc    r15,r15,r7                      /* Clear thread bit */
298
299	stwcx.  r15,0,r14
300	bne-    lwarx_loop_stop
301	isync
302
303	bl	save_sprs_to_stack
304
305	IDLE_STATE_ENTER_SEQ(PPC_STOP)
306
/*
 * power7_idle: returns at once (beqlr) when powersave_nap is zero,
 * otherwise falls through into power7_nap with r3 = 1.
 */
307_GLOBAL(power7_idle)
 
 
 
 
308	/* Now check if user or arch enabled NAP mode */
309	LOAD_REG_ADDRBASE(r3,powersave_nap)
310	lwz	r4,ADDROFF(powersave_nap)(r3)
311	cmpwi	0,r4,0
312	beqlr
313	li	r3, 1
314	/* fall through */
315

/*
 * power7_nap: r3 on entry becomes r4, the "check IRQ_HAPPENED" flag
 * of pnv_powersave_common; r3 is then set to the requested state.
 */
316_GLOBAL(power7_nap)
317	mr	r4,r3
318	li	r3,PNV_THREAD_NAP
319	LOAD_REG_ADDR(r5, pnv_enter_arch207_idle_mode)
320	b	pnv_powersave_common
321	/* No return */
322
/*
 * Request PNV_THREAD_SLEEP through pnv_powersave_common, with the
 * IRQ_HAPPENED check enabled (r4 = 1) and
 * pnv_enter_arch207_idle_mode as the rfid target (r5).
 */
323_GLOBAL(power7_sleep)
324	li	r3,PNV_THREAD_SLEEP
325	li	r4,1
326	LOAD_REG_ADDR(r5, pnv_enter_arch207_idle_mode)
327	b	pnv_powersave_common
328	/* No return */
329
/*
 * Request PNV_THREAD_WINKLE through pnv_powersave_common, with the
 * IRQ_HAPPENED check enabled (r4 = 1) and
 * pnv_enter_arch207_idle_mode as the rfid target (r5).
 */
330_GLOBAL(power7_winkle)
331	li	r3,PNV_THREAD_WINKLE
332	li	r4,1
333	LOAD_REG_ADDR(r5, pnv_enter_arch207_idle_mode)
334	b	pnv_powersave_common
335	/* No return */
336
/*
 * CHECK_HMI_INTERRUPT: read SRR1, extract the wake reason field and,
 * when it equals 0xa, call hmi_exception_realmode with r3 = 0.
 *
 * r0 is always clobbered. On the HMI path r2 is reloaded from PACATOC,
 * r1 from PACAR1, and LR is overwritten by the bl. r3 is preserved
 * across the call through the ORIG_GPR3 slot of the frame at r1.
 * Uses local label 20.
 */
337#define CHECK_HMI_INTERRUPT						\
338	mfspr	r0,SPRN_SRR1;						\
339BEGIN_FTR_SECTION_NESTED(66);						\
340	rlwinm	r0,r0,45-31,0xf;  /* extract wake reason field (P8) */	\
341FTR_SECTION_ELSE_NESTED(66);						\
342	rlwinm	r0,r0,45-31,0xe;  /* P7 wake reason field is 3 bits */	\
343ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_ARCH_207S, 66);		\
344	cmpwi	r0,0xa;			/* Hypervisor maintenance ? */	\
345	bne	20f;							\
346	/* Invoke opal call to handle hmi */				\
347	ld	r2,PACATOC(r13);					\
348	ld	r1,PACAR1(r13);						\
349	std	r3,ORIG_GPR3(r1);	/* Save original r3 */		\
350	li	r3,0;			/* NULL argument */		\
351	bl	hmi_exception_realmode;					\
352	nop;								\
353	ld	r3,ORIG_GPR3(r1);	/* Restore original r3 */	\
35420:	nop;
355
356
357/*
358 * r3 - requested stop state
 
 
 
 
 *
 * Writes PSSCR_HV_TEMPLATE ORed with r3 to SPRN_PSSCR, then enters
 * pnv_powersave_common with the IRQ_HAPPENED check enabled (r4 = 1)
 * and power_enter_stop as the rfid target (r5). r3 is passed on
 * unchanged.
359 */
 
 
 
 
 
 
 
 
 
 
 
 
 
 
360_GLOBAL(power9_idle_stop)
361	LOAD_REG_IMMEDIATE(r4, PSSCR_HV_TEMPLATE)
362	or	r4,r4,r3
363	mtspr	SPRN_PSSCR, r4
364	li	r4, 1
365	LOAD_REG_ADDR(r5,power_enter_stop)
 
 
 
 
 
 
366	b	pnv_powersave_common
367	/* No return */
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
368/*
369 * Called from reset vector. Check whether we have woken up with
370 * hypervisor state loss. If yes, restore hypervisor state and return
371 * back to reset vector.
372 *
373 * r13 - Contents of HSPRG0
374 * cr3 - set to gt if waking up with partial/complete hypervisor state loss
 *
 * cr4 is set here and read later by pnv_wakeup_tb_loss: on ISA 3.0
 * from the PSSCR status field compared with pnv_first_deep_stop_state,
 * otherwise from the low bit of r13 compared with 1.
375 */
376_GLOBAL(pnv_restore_hyp_resource)
 
 
 
 
 
 
 
377BEGIN_FTR_SECTION
378	ld	r2,PACATOC(r13);
 
 
 
 
 
 
 
 
 
 
379	/*
380	 * POWER ISA 3. Use PSSCR to determine if we
381	 * are waking up from deep idle state
382	 */
383	LOAD_REG_ADDRBASE(r5,pnv_first_deep_stop_state)
384	ld	r4,ADDROFF(pnv_first_deep_stop_state)(r5)
385
386	mfspr	r5,SPRN_PSSCR
 
 
 
 
 
 
 
 
387	/*
388	 * 0-3 bits correspond to Power-Saving Level Status
389	 * which indicates the idle state we are waking up from
390	 */
 
	/* Rotate left by 4 and keep the low 4 bits: r5 = top 4 bits of PSSCR */
391	rldicl  r5,r5,4,60
 
 
 
392	cmpd	cr4,r5,r4
393	bge	cr4,pnv_wakeup_tb_loss
394	/*
395	 * Waking up without hypervisor state loss. Return to
396	 * reset vector
397	 */
398	blr
399
400END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
401
 
 
402	/*
403	 * POWER ISA 2.07 or less.
404	 * Check if last bit of HSPRG0 is set. This indicates whether we are
405	 * waking up from winkle.
406	 */
	/* r5 = lowest bit of r13; that bit is then cleared in r13 */
407	clrldi	r5,r13,63
408	clrrdi	r13,r13,1
409
410	/* Now that we are sure r13 is corrected, load TOC */
411	ld	r2,PACATOC(r13);
412	cmpwi	cr4,r5,1
413	mtspr	SPRN_HSPRG0,r13
414
415	lbz	r0,PACA_THREAD_IDLE_STATE(r13)
416	cmpwi   cr2,r0,PNV_THREAD_NAP
417	bgt     cr2,pnv_wakeup_tb_loss	/* Either sleep or Winkle */
418
419	/*
420	 * We fall through here if PACA_THREAD_IDLE_STATE shows we are waking
421	 * up from nap. At this stage CR3 shouldn't contain 'gt' since that
422	 * indicates we are waking with hypervisor state loss from nap.
423	 */
	/* Branch-to-self: spins here forever if cr3 is gt */
424	bgt	cr3,.
425
426	blr	/* Return back to System Reset vector from where
427		   pnv_restore_hyp_resource was invoked */
428
429/*
430 * Called if waking up from idle state which can cause either partial or
431 * complete hyp state loss.
432 * In POWER8, called if waking up from fastsleep or winkle
433 * In POWER9, called if waking up from stop state >= pnv_first_deep_stop_state
434 *
435 * r13 - PACA
436 * cr3 - gt if waking up with partial/complete hypervisor state loss
 
 
437 * cr4 - gt or eq if waking up from complete hypervisor state loss.
 
 
 
 *
 * Registers set up here and used until the final blr:
 * r14 - pointer to the core idle state word
 * r15 - value of that word, with the lock bit and this thread's bit set
 * r16 - SRR1 at entry, r17 - LR at entry
438 */
439_GLOBAL(pnv_wakeup_tb_loss)
440	ld	r1,PACAR1(r13)
441	/*
442	 * Before entering any idle state, the NVGPRs are saved in the stack.
443	 * If there was a state loss, or PACA_NAPSTATELOST was set, then the
444	 * NVGPRs are restored. If we are here, it is likely that state is lost,
445	 * but not guaranteed -- neither ISA207 nor ISA300 tests to reach
446	 * here are the same as the test to restore NVGPRS:
447	 * PACA_THREAD_IDLE_STATE test for ISA207, PSSCR test for ISA300,
448	 * and SRR1 test for restoring NVGPRs.
449	 *
450	 * We are about to clobber NVGPRs now, so set NAPSTATELOST to
451	 * guarantee they will always be restored. This might be tightened
452	 * with careful reading of specs (particularly for ISA300) but this
453	 * is already a slow wakeup path and it's simpler to be safe.
454	 */
455	li	r0,1
456	stb	r0,PACA_NAPSTATELOST(r13)
457
458	/*
459	 *
460	 * Save SRR1 and LR in NVGPRs as they might be clobbered in
461	 * opal_call() (called in CHECK_HMI_INTERRUPT). SRR1 is required
462	 * to determine the wakeup reason if we branch to kvm_start_guest. LR
463	 * is required to return back to reset vector after hypervisor state
464	 * restore is complete.
465	 */
 
 
	/* LR is also overwritten by the bnel/bl instructions further down */
466	mflr	r17
467	mfspr	r16,SPRN_SRR1
468BEGIN_FTR_SECTION
469	CHECK_HMI_INTERRUPT
470END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
471
 
472	lbz	r7,PACA_THREAD_MASK(r13)
473	ld	r14,PACA_CORE_IDLE_STATE_PTR(r13)
474lwarx_loop2:
475	lwarx	r15,0,r14
476	andi.	r9,r15,PNV_CORE_IDLE_LOCK_BIT
477	/*
 
 
478	 * Lock bit is set in one of the 2 cases-
479	 * a. In the sleep/winkle enter path, the last thread is executing
480	 * fastsleep workaround code.
481	 * b. In the wake up path, another thread is executing fastsleep
482	 * workaround undo code or resyncing timebase or restoring context
483	 * In either case loop until the lock bit is cleared.
484	 */
485	bnel	core_idle_lock_held
 
 
 
 
 
 
 
486
	/* r15 == 0 here means no thread bit (and no lock bit) is set */
487	cmpwi	cr2,r15,0
 
488
489	/*
490	 * At this stage
491	 * cr2 - eq if first thread to wakeup in core
492	 * cr3-  gt if waking up with partial/complete hypervisor state loss
 
493	 * cr4 - gt or eq if waking up from complete hypervisor state loss.
494	 */
495
	/* Take the lock: store the word back with the lock bit set */
496	ori	r15,r15,PNV_CORE_IDLE_LOCK_BIT
497	stwcx.	r15,0,r14
498	bne-	lwarx_loop2
499	isync
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
500
501BEGIN_FTR_SECTION
502	lbz	r4,PACA_SUBCORE_SIBLING_MASK(r13)
503	and	r4,r4,r15
504	cmpwi	r4,0	/* Check if first in subcore */
505
	/* The or below does not touch cr0, so the beq still tests the cmpwi */
506	or	r15,r15,r7		/* Set thread bit */
507	beq	first_thread_in_subcore
508END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
509
510	or	r15,r15,r7		/* Set thread bit */
511	beq	cr2,first_thread_in_core
512
513	/* Not first thread in core or subcore to wake up */
514	b	clear_lock
515
/*
 * Reached from pnv_wakeup_tb_loss with the core idle lock held.
 * Reloads SDR1, RPR and AMOR from the frame at r1 unless cr4 is lt,
 * then continues to first_thread_in_core if cr2 is eq, or to
 * clear_lock otherwise. Clobbers r4.
 */
516first_thread_in_subcore:
517	/*
518	 * If waking up from sleep, subcore state is not lost. Hence
519	 * skip subcore state restore
520	 */
521	blt	cr4,subcore_state_restored
522
523	/* Restore per-subcore state */
524	ld      r4,_SDR1(r1)
525	mtspr   SPRN_SDR1,r4
526
527	ld      r4,_RPR(r1)
528	mtspr   SPRN_RPR,r4
529	ld	r4,_AMOR(r1)
530	mtspr	SPRN_AMOR,r4
531
532subcore_state_restored:
533	/*
534	 * Check if the thread is also the first thread in the core. If not,
535	 * skip to clear_lock.
536	 */
537	bne	cr2,clear_lock
538
539first_thread_in_core:
540
541	/*
542	 * First thread in the core waking up from any state which can cause
543	 * partial or complete hypervisor state loss. It needs to
544	 * call the fastsleep workaround code if the platform requires it.
545	 * Call it unconditionally here. The below branch instruction will
546	 * be patched out if the platform does not have fastsleep or does not
547	 * require the workaround. Patching will be performed during the
548	 * discovery of idle-states.
549	 */
550.global pnv_fastsleep_workaround_at_exit
551pnv_fastsleep_workaround_at_exit:
552	b	fastsleep_workaround_at_exit
553
	/* fastsleep_workaround_at_exit branches back to this label */
554timebase_resync:
555	/*
556	 * Use cr3 which indicates that we are waking up with at least partial
557	 * hypervisor state loss to determine if TIMEBASE RESYNC is needed.
558	 */
559	ble	cr3,clear_lock
560	/* Time base re-sync */
561	bl	opal_rm_resync_timebase;
562	/*
563	 * If waking up from sleep, per core state is not lost, skip to
564	 * clear_lock.
565	 */
 
566	blt	cr4,clear_lock
567
568	/*
569	 * First thread in the core to wake up and it's waking up with
570	 * complete hypervisor state loss. Restore per core hypervisor
571	 * state.
572	 */
573BEGIN_FTR_SECTION
574	ld	r4,_PTCR(r1)
575	mtspr	SPRN_PTCR,r4
576	ld	r4,_RPR(r1)
577	mtspr	SPRN_RPR,r4
 
 
578END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
579
580	ld	r4,_TSCR(r1)
581	mtspr	SPRN_TSCR,r4
582	ld	r4,_WORC(r1)
583	mtspr	SPRN_WORC,r4
584
/*
 * Release the core idle lock: keep only the thread bits of r15 (this
 * drops the lock bit set in lwarx_loop2) and store the result to the
 * word at r14. The lwsync is placed ahead of the releasing store.
 */
585clear_lock:
586	andi.	r15,r15,PNV_CORE_IDLE_THREAD_BITS
587	lwsync
588	stw	r15,0(r14)
589
590common_exit:
591	/*
592	 * Common to all threads.
593	 *
594	 * If waking up from sleep, hypervisor state is not lost. Hence
595	 * skip hypervisor state restore.
596	 */
597	blt	cr4,hypervisor_state_restored
598
599	/* Waking up from winkle */
600
601BEGIN_MMU_FTR_SECTION
602	b	no_segments
603END_MMU_FTR_SECTION_IFSET(MMU_FTR_TYPE_RADIX)
604	/* Restore SLB  from PACA */
605	ld	r8,PACA_SLBSHADOWPTR(r13)
606
	/*
	 * One copy per bolted entry: load the doubleword pair at offsets
	 * SLBSHADOW_SAVEAREA and SLBSHADOW_SAVEAREA + 8 from r8, install
	 * it with slbmte only if SLB_ESID_V is set in the first one, then
	 * advance r8 by 16. Clobbers r3, r5, r6, r7 and r8.
	 */
607	.rept	SLB_NUM_BOLTED
608	li	r3, SLBSHADOW_SAVEAREA
609	LDX_BE	r5, r8, r3
610	addi	r3, r3, 8
611	LDX_BE	r6, r8, r3
612	andis.	r7,r5,SLB_ESID_V@h
613	beq	1f
614	slbmte	r6,r5
6151:	addi	r8,r8,16
616	.endr
617no_segments:
618
619	/* Restore per thread state */
620
621	ld	r4,_SPURR(r1)
622	mtspr	SPRN_SPURR,r4
623	ld	r4,_PURR(r1)
624	mtspr	SPRN_PURR,r4
625	ld	r4,_DSCR(r1)
626	mtspr	SPRN_DSCR,r4
627	ld	r4,_WORT(r1)
628	mtspr	SPRN_WORT,r4
629
630	/* Call cur_cpu_spec->cpu_restore() */
631	LOAD_REG_ADDR(r4, cur_cpu_spec)
632	ld	r4,0(r4)
633	ld	r12,CPU_SPEC_RESTORE(r4)
634#ifdef PPC64_ELF_ABI_v1
	/* One more load through r12 to reach the address passed to mtctr */
635	ld	r12,0(r12)
636#endif
637	mtctr	r12
638	bctrl
639
 
 
 
 
 
 
 
 
 
 
 
640hypervisor_state_restored:
641
	/* Put back the SRR1 and LR captured at pnv_wakeup_tb_loss entry */
642	mtspr	SPRN_SRR1,r16
643	mtlr	r17
644	blr	/* Return back to System Reset vector from where
645		   pnv_restore_hyp_resource was invoked */
646
/*
 * Exit-side counterpart of fastsleep_workaround_at_entry: the same
 * call with r3 = 1, but r4 = 0 where the entry path passes 1.
 * Reached from pnv_fastsleep_workaround_at_exit; continues at
 * timebase_resync.
 */
647fastsleep_workaround_at_exit:
648	li	r3,1
649	li	r4,0
650	bl	opal_rm_config_cpu_idle_state
651	b	timebase_resync
652
653/*
654 * R3 here contains the value that will be returned to the caller
655 * of power7_nap.
 
 *
 * Full-restore wakeup: reloads NVGPRs, r2 and CR from the frame that
 * pnv_powersave_common saved, pops the frame, and uses rfid to resume
 * at the saved _NIP with the saved _MSR.
656 */
657_GLOBAL(pnv_wakeup_loss)
 
658	ld	r1,PACAR1(r13)
659BEGIN_FTR_SECTION
660	CHECK_HMI_INTERRUPT
661END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
662	REST_NVGPRS(r1)
663	REST_GPR(2, r1)
 
 
	/* Load everything needed from the frame before it is popped */
664	ld	r6,_CCR(r1)
665	ld	r4,_MSR(r1)
666	ld	r5,_NIP(r1)
667	addi	r1,r1,INT_FRAME_SIZE
 
668	mtcr	r6
669	mtspr	SPRN_SRR1,r4
670	mtspr	SPRN_SRR0,r5
671	rfid
672
673/*
674 * R3 here contains the value that will be returned to the caller
675 * of power7_nap.
 
 *
 * Wakeup without state loss: if PACA_NAPSTATELOST is non-zero the
 * full restore in pnv_wakeup_loss is used instead. Otherwise only CR
 * is reloaded before the rfid to the saved _NIP/_MSR; NVGPRs and r2
 * are not reloaded here.
676 */
677_GLOBAL(pnv_wakeup_noloss)
678	lbz	r0,PACA_NAPSTATELOST(r13)
679	cmpwi	r0,0
680	bne	pnv_wakeup_loss
 
681BEGIN_FTR_SECTION
682	CHECK_HMI_INTERRUPT
683END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
	/* r1 is only loaded after the macro, which loads its own r1 */
684	ld	r1,PACAR1(r13)
 
685	ld	r6,_CCR(r1)
686	ld	r4,_MSR(r1)
687	ld	r5,_NIP(r1)
688	addi	r1,r1,INT_FRAME_SIZE
 
689	mtcr	r6
690	mtspr	SPRN_SRR1,r4
691	mtspr	SPRN_SRR0,r5
692	rfid