Loading...
1/*
2 * This file contains idle entry/exit functions for POWER7,
3 * POWER8 and POWER9 CPUs.
4 *
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License
7 * as published by the Free Software Foundation; either version
8 * 2 of the License, or (at your option) any later version.
9 */
10
11#include <linux/threads.h>
12#include <asm/processor.h>
13#include <asm/page.h>
14#include <asm/cputable.h>
15#include <asm/thread_info.h>
16#include <asm/ppc_asm.h>
17#include <asm/asm-offsets.h>
18#include <asm/ppc-opcode.h>
19#include <asm/hw_irq.h>
20#include <asm/kvm_book3s_asm.h>
21#include <asm/opal.h>
22#include <asm/cpuidle.h>
23#include <asm/exception-64s.h>
24#include <asm/book3s/64/mmu-hash.h>
25#include <asm/mmu.h>
26
27#undef DEBUG
28
29/*
30 * Use unused space in the interrupt stack to save and restore
31 * registers for winkle support.
 *
 * Each name below is an alias for one GPRn save-slot offset and is used
 * as a displacement from r1 by the save/restore code in this file.
 * _SDR1 and _PTCR share the GPR3 slot; save_sprs_to_stack stores only
 * one of the two, selected by CPU_FTR_ARCH_300.
32 */
33#define _MMCR0 GPR0
34#define _SDR1 GPR3
35#define _PTCR GPR3
36#define _RPR GPR4
37#define _SPURR GPR5
38#define _PURR GPR6
39#define _TSCR GPR7
40#define _DSCR GPR8
41#define _AMOR GPR9
42#define _WORT GPR10
43#define _WORC GPR11
44#define _LPCR GPR12
45
/*
 * PSSCR EC and ESL bits shifted down by 16 so that the mask can be used as
 * the immediate operand of andis. (see power_enter_stop). The expansion is
 * fully parenthesised so that it remains a single term wherever the macro
 * is used inside a larger expression.
 */
46#define PSSCR_EC_ESL_MASK_SHIFTED ((PSSCR_EC | PSSCR_ESL) >> 16)
47
48 .text
49
50/*
51 * Used by threads before entering deep idle states. Saves SPRs
52 * in interrupt stack frame
 *
 * In:       r1 - frame that provides the _XXX save slots
 * Clobbers: r3
 *
 * When CPU_FTR_ARCH_300 is clear this returns with blr once the common
 * SPRs are stored. When it is set, the blr is patched out and execution
 * falls through into power9_save_additional_sprs, which does the return.
53 */
54save_sprs_to_stack:
55 /*
56 * Note: all registers (per-core, per-subcore and per-thread) are saved
57 * here since any thread in the core might wake up first
58 */
59BEGIN_FTR_SECTION
60 /*
61 * Note - SDR1 is dropped in Power ISA v3. Hence not saving
62 * SDR1 here; PTCR and LPCR are saved instead.
63 */
64 mfspr r3,SPRN_PTCR
65 std r3,_PTCR(r1)
66 mfspr r3,SPRN_LPCR
67 std r3,_LPCR(r1)
68FTR_SECTION_ELSE
69 mfspr r3,SPRN_SDR1
70 std r3,_SDR1(r1)
71ALT_FTR_SECTION_END_IFSET(CPU_FTR_ARCH_300)
72 mfspr r3,SPRN_RPR
73 std r3,_RPR(r1)
74 mfspr r3,SPRN_SPURR
75 std r3,_SPURR(r1)
76 mfspr r3,SPRN_PURR
77 std r3,_PURR(r1)
78 mfspr r3,SPRN_TSCR
79 std r3,_TSCR(r1)
80 mfspr r3,SPRN_DSCR
81 std r3,_DSCR(r1)
82 mfspr r3,SPRN_AMOR
83 std r3,_AMOR(r1)
84 mfspr r3,SPRN_WORT
85 std r3,_WORT(r1)
86 mfspr r3,SPRN_WORC
87 std r3,_WORC(r1)
88/*
89 * On POWER9, there are idle states such as stop4, invoked via cpuidle,
90 * that lose hypervisor resources. In such cases, we need to save
91 * additional SPRs before entering those idle states so that they can
92 * be restored to their older values on wakeup from the idle state.
93 *
94 * On POWER8, the only such deep idle state is winkle which is used
95 * only in the context of CPU-Hotplug, where these additional SPRs are
96 * reinitialized to a sane value. Hence there is no need to save/restore
97 * these SPRs.
98 */
99BEGIN_FTR_SECTION
100 blr
101END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
102
/*
 * Save the additional POWER9 SPRs: PID, LDBAR, FSCR, HFSCR, MMCRA, MMCR1
 * and MMCR2 go to the STOP_* fields addressed off r13; MMCR0 goes to the
 * _MMCR0 slot addressed off r1.
 *
 * Reached by fall-through from save_sprs_to_stack when CPU_FTR_ARCH_300
 * is set. Clobbers r3 and r4, returns with blr.
 */
103power9_save_additional_sprs:
104 mfspr r3, SPRN_PID
105 mfspr r4, SPRN_LDBAR
106 std r3, STOP_PID(r13)
107 std r4, STOP_LDBAR(r13)
108
109 mfspr r3, SPRN_FSCR
110 mfspr r4, SPRN_HFSCR
111 std r3, STOP_FSCR(r13)
112 std r4, STOP_HFSCR(r13)
113
114 mfspr r3, SPRN_MMCRA
115 mfspr r4, SPRN_MMCR0
116 std r3, STOP_MMCRA(r13)
117 std r4, _MMCR0(r1) /* MMCR0 lives in the stack slot, not the PACA */
118
119 mfspr r3, SPRN_MMCR1
120 mfspr r4, SPRN_MMCR2
121 std r3, STOP_MMCR1(r13)
122 std r4, STOP_MMCR2(r13)
123 blr
124
/*
 * Counterpart of power9_save_additional_sprs: reload PID, LDBAR, FSCR,
 * HFSCR, MMCRA, MMCR1 and MMCR2 from the STOP_* fields addressed off r13,
 * and MMCR0 from the _MMCR0 slot addressed off r1.
 *
 * LPCR is also reloaded here, from the _LPCR slot written by
 * save_sprs_to_stack. Clobbers r3 and r4, returns with blr.
 */
125power9_restore_additional_sprs:
126 ld r3,_LPCR(r1)
127 ld r4, STOP_PID(r13)
128 mtspr SPRN_LPCR,r3
129 mtspr SPRN_PID, r4
130
131 ld r3, STOP_LDBAR(r13)
132 ld r4, STOP_FSCR(r13)
133 mtspr SPRN_LDBAR, r3
134 mtspr SPRN_FSCR, r4
135
136 ld r3, STOP_HFSCR(r13)
137 ld r4, STOP_MMCRA(r13)
138 mtspr SPRN_HFSCR, r3
139 mtspr SPRN_MMCRA, r4
140
141 ld r3, _MMCR0(r1)
142 ld r4, STOP_MMCR1(r13)
143 mtspr SPRN_MMCR0, r3
144 mtspr SPRN_MMCR1, r4
145
146 ld r3, STOP_MMCR2(r13)
147 mtspr SPRN_MMCR2, r3
148 blr
149
150/*
151 * Used by threads when the lock bit of core_idle_state is set.
152 * Threads will spin in HMT_LOW until the lock bit is cleared.
153 * r14 - pointer to core_idle_state
154 * r15 - used to load contents of core_idle_state
155 * r9 - used as a temporary variable
 *
 * Callers in this file reach this with "bnel-", so blr resumes at the
 * instruction after their lock-bit test. On return r15 holds the value
 * just loaded by lwarx (lock bit clear), which lets the caller continue
 * straight to its own stwcx. on 0(r14). cr0 is clobbered.
156 */
157
158core_idle_lock_held:
159 HMT_LOW
/* Plain-load spin: wait until the lock bit reads as clear */
1603: lwz r15,0(r14)
161 andis. r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
162 bne 3b
163 HMT_MEDIUM
/* Redo the caller's lwarx; start over if the lock was taken again */
164 lwarx r15,0,r14
165 andis. r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
166 bne- core_idle_lock_held
167 blr
168
169/*
170 * Pass requested state in r3:
171 * r3 - PNV_THREAD_NAP/SLEEP/WINKLE in POWER8
172 * - Requested PSSCR value in POWER9
173 *
174 * Address of idle handler to branch to in realmode in r4
 *
 * Allocates an INT_FRAME_SIZE frame, saves LR (to both _LINK and _NIP),
 * r2, the non-volatile GPRs and CR into it, records the frame pointer in
 * PACAR1 and then branches to the handler through CTR. This code does
 * not return to its caller itself; the wakeup paths (pnv_wakeup_loss /
 * pnv_wakeup_noloss) unwind the frame.
175 */
176pnv_powersave_common:
177 /* Use r3 to pass state nap/sleep/winkle */
178 /* NAP is a state loss, we create a regs frame on the
179 * stack, fill it up with the state we care about and
180 * stick a pointer to it in PACAR1. We really only
181 * need to save PC, some CR bits and the NV GPRs,
182 * but for now an interrupt frame will do.
183 */
184 mtctr r4
185
186 mflr r0
187 std r0,16(r1)
188 stdu r1,-INT_FRAME_SIZE(r1)
189 std r0,_LINK(r1)
190 std r0,_NIP(r1)
191
192 /* We haven't lost state ... yet */
193 li r0,0
194 stb r0,PACA_NAPSTATELOST(r13)
195
196 /* Continue saving state */
197 SAVE_GPR(2, r1)
198 SAVE_NVGPRS(r1)
199 mfcr r5
200 std r5,_CCR(r1)
201 std r1,PACAR1(r13)
202
203BEGIN_FTR_SECTION
204 /*
205 * POWER9 does not require real mode to stop, and presently does not
206 * set hwthread_state for KVM (threads don't share MMU context), so
207 * we can remain in virtual mode for this.
208 */
209 bctr
210END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
211 /*
212 * POWER8
213 * Go to real mode to do the nap, as required by the architecture.
214 * Also, we need to be in real mode before setting hwthread_state,
215 * because as soon as we do that, another thread can switch
216 * the MMU context to the guest.
217 */
218 LOAD_REG_IMMEDIATE(r7, MSR_IDLE)
219 mtmsrd r7,0
220 bctr
221
222/*
223 * This is the sequence required to execute idle instructions, as
224 * specified in ISA v2.07 (and earlier). MSR[IR] and MSR[DR] must be 0.
 *
 * The macro stores r0 to 0(r1), executes ptesync, reloads r0 from the
 * same location and compares it with itself (the bne back to 236 is
 * never taken; it only makes the following code depend on the load)
 * before issuing IDLE_INST. The doubleword at 0(r1) is overwritten.
 * Nothing follows IDLE_INST in the macro.
225 */
226#define IDLE_STATE_ENTER_SEQ_NORET(IDLE_INST) \
227 /* Magic NAP/SLEEP/WINKLE mode enter sequence */ \
228 std r0,0(r1); \
229 ptesync; \
230 ld r0,0(r1); \
231236: cmpd cr0,r0,r0; \
232 bne 236b; \
233 IDLE_INST;
234
235
/*
 * ISA 2.07 idle entry, reached through CTR from pnv_powersave_common.
 *
 * In: r3  - PNV_THREAD_NAP/SLEEP/WINKLE
 *     r13 - PACA
 *
 * cr3 holds the comparison of r3 against PNV_THREAD_SLEEP for the whole
 * routine: lt takes the nap path, eq the sleep path, gt the winkle path.
 * For sleep and winkle the thread's bit is cleared in core_idle_state
 * (r14 = pointer, r15 = value, r7 = thread mask) with a lwarx/stwcx.
 * loop before the idle instruction is issued.
 */
236 .globl pnv_enter_arch207_idle_mode
237pnv_enter_arch207_idle_mode:
238#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
239 /* Tell KVM we're entering idle */
240 li r4,KVM_HWTHREAD_IN_IDLE
241 /******************************************************/
242 /* N O T E W E L L ! ! ! N O T E W E L L */
243 /* The following store to HSTATE_HWTHREAD_STATE(r13) */
244 /* MUST occur in real mode, i.e. with the MMU off, */
245 /* and the MMU must stay off until we clear this flag */
246 /* and test HSTATE_HWTHREAD_REQ(r13) in */
247 /* pnv_powersave_wakeup in this file. */
248 /* The reason is that another thread can switch the */
249 /* MMU to a guest context whenever this flag is set */
250 /* to KVM_HWTHREAD_IN_IDLE, and if the MMU was on, */
251 /* that would potentially cause this thread to start */
252 /* executing instructions from guest memory in */
253 /* hypervisor mode, leading to a host crash or data */
254 /* corruption, or worse. */
255 /******************************************************/
256 stb r4,HSTATE_HWTHREAD_STATE(r13)
257#endif
258 stb r3,PACA_THREAD_IDLE_STATE(r13)
259 cmpwi cr3,r3,PNV_THREAD_SLEEP
260 bge cr3,2f
261 IDLE_STATE_ENTER_SEQ_NORET(PPC_NAP)
262 /* No return */
2632:
264 /* Sleep or winkle */
265 lbz r7,PACA_THREAD_MASK(r13)
266 ld r14,PACA_CORE_IDLE_STATE_PTR(r13)
267 li r5,0
268 beq cr3,3f
269 lis r5,PNV_CORE_IDLE_WINKLE_COUNT@h
2703:
271lwarx_loop1:
272 lwarx r15,0,r14
273
274 andis. r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
275 bnel- core_idle_lock_held
276
277 add r15,r15,r5 /* Add if winkle */
278 andc r15,r15,r7 /* Clear thread bit */
279
280 andi. r9,r15,PNV_CORE_IDLE_THREAD_BITS
281
282/*
283 * If cr0 is eq (no thread bits left set), then current thread is the last
284 * thread of the core entering sleep. Last thread needs to execute the
285 * hardware bug workaround code if required by the platform.
286 * Make the workaround call unconditionally here. The below branch call is
287 * patched out when the idle states are discovered if the platform does not
288 * require it.
289 */
290.global pnv_fastsleep_workaround_at_entry
291pnv_fastsleep_workaround_at_entry:
292 beq fastsleep_workaround_at_entry
293
294 stwcx. r15,0,r14
295 bne- lwarx_loop1
296 isync
297
298common_enter: /* common code for all the threads entering sleep or winkle */
299 bgt cr3,enter_winkle
300 IDLE_STATE_ENTER_SEQ_NORET(PPC_SLEEP)
301
302fastsleep_workaround_at_entry:
 /* Publish the cleared thread bit together with the lock bit */
303 oris r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
304 stwcx. r15,0,r14
305 bne- lwarx_loop1
306 isync
307
308 /* Fast sleep workaround */
309 li r3,1
310 li r4,1
311 bl opal_config_cpu_idle_state
312
313 /* Unlock: r15 still has the lock bit set, so xoris clears it */
314 xoris r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
315 lwsync
316 stw r15,0(r14)
317 b common_enter
318
319enter_winkle:
320 bl save_sprs_to_stack
321
322 IDLE_STATE_ENTER_SEQ_NORET(PPC_WINKLE)
323
324/*
325 * r3 - PSSCR value corresponding to the requested stop state.
 *
 * Three paths, chosen from r3:
 *  - EC and ESL both clear: execute stop, then continue after it, clear
 *    PACA_REQ_PSSCR and branch to pnv_wakeup_noloss with r3 = r12 = 0.
 *  - EC/ESL set, RL below pnv_first_deep_stop_state: execute stop.
 *  - EC/ESL set, RL at or above pnv_first_deep_stop_state: clear this
 *    thread's bit in core_idle_state, save SPRs, then execute stop.
326 */
327power_enter_stop:
328/*
329 * Check if we are executing the lite variant with ESL=EC=0
330 */
331 andis. r4,r3,PSSCR_EC_ESL_MASK_SHIFTED
332 clrldi r3,r3,60 /* r3 = Bits[60:63] = Requested Level (RL) */
333 bne .Lhandle_esl_ec_set
334 PPC_STOP
335 li r3,0 /* Since we didn't lose state, return 0 */
336 std r3, PACA_REQ_PSSCR(r13)
337
338 /*
339 * pnv_wakeup_noloss() expects r12 to contain the SRR1 value so
340 * it can determine if the wakeup reason is an HMI in
341 * CHECK_HMI_INTERRUPT.
342 *
343 * However, when we wakeup with ESL=0, SRR1 will not contain the wakeup
344 * reason, so there is no point setting r12 to SRR1.
345 *
346 * Further, we clear r12 here, so that we don't accidentally enter the
347 * HMI in pnv_wakeup_noloss() if the value of r12[42:45] == WAKE_HMI.
348 */
349 li r12, 0
350 b pnv_wakeup_noloss
351
352.Lhandle_esl_ec_set:
353BEGIN_FTR_SECTION
354 /*
355 * POWER9 DD2.0 or earlier can incorrectly set PMAO when waking up after
356 * a state-loss idle. Saving and restoring MMCR0 over idle is a
357 * workaround.
358 */
359 mfspr r4,SPRN_MMCR0
360 std r4,_MMCR0(r1)
361END_FTR_SECTION_IFCLR(CPU_FTR_POWER9_DD2_1)
362
363/*
364 * Check if the requested state is a deep idle state.
365 */
366 LOAD_REG_ADDRBASE(r5,pnv_first_deep_stop_state)
367 ld r4,ADDROFF(pnv_first_deep_stop_state)(r5)
368 cmpd r3,r4
369 bge .Lhandle_deep_stop
370 PPC_STOP /* Does not return (system reset interrupt) */
371
372.Lhandle_deep_stop:
373/*
374 * Entering deep idle state.
375 * Clear thread bit in PACA_CORE_IDLE_STATE, save SPRs to
376 * stack and enter stop
377 */
378 lbz r7,PACA_THREAD_MASK(r13)
379 ld r14,PACA_CORE_IDLE_STATE_PTR(r13)
380
381lwarx_loop_stop:
382 lwarx r15,0,r14
383 andis. r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
384 bnel- core_idle_lock_held
385 andc r15,r15,r7 /* Clear thread bit */
386
387 stwcx. r15,0,r14
388 bne- lwarx_loop_stop
389 isync
390
391 bl save_sprs_to_stack
392
393 PPC_STOP /* Does not return (system reset interrupt) */
394
395/*
396 * Entered with MSR[EE]=0 and no soft-masked interrupts pending.
397 * r3 contains desired idle state (PNV_THREAD_NAP/SLEEP/WINKLE).
398 */
399_GLOBAL(power7_idle_insn)
400 /* Hand the ISA 2.07 idle handler to the common entry code in r4 */
401 LOAD_REG_ADDR(r4, pnv_enter_arch207_idle_mode)
402 b pnv_powersave_common
403
/*
 * Test the wake reason field of the SRR1 value in r12 and, if it equals
 * 0xa (hypervisor maintenance), call hmi_exception_realmode with r3 = 0.
 *
 * In:       r12 - SRR1, r13 - PACA
 * Clobbers: r0 and cr0 always. On the HMI path r2 is reloaded from
 *           PACATOC, r1 from PACAR1, and the bl overwrites LR; r3 is
 *           preserved through ORIG_GPR3(r1).
 * Uses numeric local label 20 and nested feature-section id 66.
 */
404#define CHECK_HMI_INTERRUPT \
405BEGIN_FTR_SECTION_NESTED(66); \
406 rlwinm r0,r12,45-31,0xf; /* extract wake reason field (P8) */ \
407FTR_SECTION_ELSE_NESTED(66); \
408 rlwinm r0,r12,45-31,0xe; /* P7 wake reason field is 3 bits */ \
409ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_ARCH_207S, 66); \
410 cmpwi r0,0xa; /* Hypervisor maintenance ? */ \
411 bne+ 20f; \
412 /* Invoke opal call to handle hmi */ \
413 ld r2,PACATOC(r13); \
414 ld r1,PACAR1(r13); \
415 std r3,ORIG_GPR3(r1); /* Save original r3 */ \
416 li r3,0; /* NULL argument */ \
417 bl hmi_exception_realmode; \
418 nop; \
419 ld r3,ORIG_GPR3(r1); /* Restore original r3 */ \
42020: nop;
421
422/*
423 * Entered with MSR[EE]=0 and no soft-masked interrupts pending.
424 * r3 contains desired PSSCR register value.
425 *
426 * Offline (CPU unplug) case also must notify KVM that the CPU is
427 * idle.
 *
 * power9_offline_stop only adds the KVM notification and then falls
 * through into power9_idle_stop.
428 */
429_GLOBAL(power9_offline_stop)
430#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
431 /*
432 * Tell KVM we're entering idle.
433 * This does not have to be done in real mode because the P9 MMU
434 * is independent per-thread. Some steppings share radix/hash mode
435 * between threads, but in that case KVM has a barrier sync in real
436 * mode before and after switching between radix and hash.
437 */
438 li r4,KVM_HWTHREAD_IN_IDLE
439 stb r4,HSTATE_HWTHREAD_STATE(r13)
440#endif
441 /* fall through */
442
/*
 * Record the requested PSSCR in PACA_REQ_PSSCR, write it to the PSSCR
 * and enter power_enter_stop through pnv_powersave_common. With
 * CPU_FTR_P9_TM_XER_SO_BUG set, a non-zero PACA_DONT_STOP makes this
 * return 0 immediately instead of stopping.
 */
443_GLOBAL(power9_idle_stop)
444 std r3, PACA_REQ_PSSCR(r13)
445#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
446BEGIN_FTR_SECTION
447 sync
448 lwz r5, PACA_DONT_STOP(r13)
449 cmpwi r5, 0
450 bne 1f
451END_FTR_SECTION_IFSET(CPU_FTR_P9_TM_XER_SO_BUG)
452#endif
453 mtspr SPRN_PSSCR,r3
454 LOAD_REG_ADDR(r4,power_enter_stop)
455 b pnv_powersave_common
456 /* No return */
457#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
4581:
459 /*
460 * We get here when TM / thread reconfiguration bug workaround
461 * code wants to get the CPU into SMT4 mode, and therefore
462 * we are being asked not to stop.
463 */
464 li r3, 0
465 std r3, PACA_REQ_PSSCR(r13)
466 blr /* return 0 for wakeup cause / SRR1 value */
467#endif
468
469/*
470 * On waking up from stop 0,1,2 with ESL=1 on POWER9 DD1,
471 * HSPRG0 will be set to the HSPRG0 value of one of the
472 * threads in this core. Thus the value we have in r13
473 * may not be this thread's paca pointer.
474 *
475 * Fortunately, the TIR remains invariant. Since this thread's
476 * paca pointer is recorded in all its sibling's paca, we can
477 * correctly recover this thread's paca pointer if we
478 * know the index of this thread in the core.
479 *
480 * This index can be obtained from the TIR.
481 *
482 * i.e, thread's position in the core = TIR.
483 * If this value is i, then this thread's paca is
484 * paca->thread_sibling_pacas[i].
 *
 * Out:      r13 - recovered paca pointer (also installed via SET_PACA)
 * Clobbers: r3, r4, r5
 * Side effect: PACA_NAPSTATELOST is set to 1 in the recovered paca.
485 */
486power9_dd1_recover_paca:
487 mfspr r4, SPRN_TIR
488 /*
489 * Since each entry in thread_sibling_pacas is 8 bytes
490 * we need to left-shift by 3 bits. Thus r4 = i * 8
491 */
492 sldi r4, r4, 3
493 /* Get &paca->thread_sibling_pacas[0] in r5 */
494 ld r5, PACA_SIBLING_PACA_PTRS(r13)
495 /* Load paca->thread_sibling_pacas[i] into r13 */
496 ldx r13, r4, r5
497 SET_PACA(r13)
498 /*
499 * Indicate that we have lost NVGPR state
500 * which needs to be restored from the stack.
501 */
502 li r3, 1
503 stb r3,PACA_NAPSTATELOST(r13)
504 blr
505
506/*
507 * Called from machine check handler for powersave wakeups.
508 * Low level machine check processing has already been done. Now just
509 * go through the wake up path to get everything in order.
510 *
511 * r3 - The original SRR1 value.
512 * Original SRR[01] have been clobbered.
513 * MSR_RI is clear.
 *
 * Clobbers r11, sets cr3 and r12 as pnv_powersave_wakeup expects them,
 * then branches there (no return to the caller from here).
514 */
515.global pnv_powersave_wakeup_mce
516pnv_powersave_wakeup_mce:
517 /* Set cr3 for pnv_powersave_wakeup */
 /* r11 = two-bit field rotated out of SRR1; cr3 = compare with 2 */
518 rlwinm r11,r3,47-31,30,31
519 cmpwi cr3,r11,2
520
521 /*
522 * Now put the original SRR1 with SRR1_WAKEMCE_RESVD as the wake
523 * reason into r12, which allows reuse of the system reset wakeup
524 * code without being mistaken for another type of wakeup.
525 */
526 oris r12,r3,SRR1_WAKEMCE_RESVD@h
527
528 b pnv_powersave_wakeup
529
530/*
531 * Called from reset vector for powersave wakeups.
532 * cr3 - set to gt if waking up with partial/complete hypervisor state loss
533 * r12 - SRR1
 *
 * Restores hypervisor resources through the arch300 or arch207 helper,
 * marks the thread PNV_THREAD_RUNNING, copies r12 to r3 as the return
 * value, hands over to kvm_start_guest when HSTATE_HWTHREAD_REQ is
 * non-zero, and otherwise finishes in pnv_wakeup_noloss (cr3 lt) or
 * pnv_wakeup_loss (cr3 eq or gt).
534 */
535.global pnv_powersave_wakeup
536pnv_powersave_wakeup:
537 ld r2, PACATOC(r13)
538
539BEGIN_FTR_SECTION
540BEGIN_FTR_SECTION_NESTED(70)
541 bl power9_dd1_recover_paca
542END_FTR_SECTION_NESTED_IFSET(CPU_FTR_POWER9_DD1, 70)
543 bl pnv_restore_hyp_resource_arch300
544FTR_SECTION_ELSE
545 bl pnv_restore_hyp_resource_arch207
546ALT_FTR_SECTION_END_IFSET(CPU_FTR_ARCH_300)
547
548 li r0,PNV_THREAD_RUNNING
549 stb r0,PACA_THREAD_IDLE_STATE(r13) /* Clear thread state */
550
551 mr r3,r12
552
553#ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
554 lbz r0,HSTATE_HWTHREAD_STATE(r13)
555 cmpwi r0,KVM_HWTHREAD_IN_KERNEL
556 beq 0f
557 li r0,KVM_HWTHREAD_IN_KERNEL
558 stb r0,HSTATE_HWTHREAD_STATE(r13)
559 /* Order setting hwthread_state vs. testing hwthread_req */
560 sync
5610: lbz r0,HSTATE_HWTHREAD_REQ(r13)
562 cmpwi r0,0
563 beq 1f
564 b kvm_start_guest
5651:
566#endif
567
568 /* Return SRR1 from power7_nap() */
569 blt cr3,pnv_wakeup_noloss
570 b pnv_wakeup_loss
571
572/*
573 * Check whether we have woken up with hypervisor state loss.
574 * If yes, restore hypervisor state and return back to link.
575 *
576 * cr3 - set to gt if waking up with partial/complete hypervisor state loss
 *
 * Clobbers r0, r4, r5 and cr4 (and r1 when CPU_FTR_POWER9_DD2_1 is
 * clear). Clears PACA_REQ_PSSCR. Returns with blr directly when the
 * level woken from is below pnv_first_deep_stop_state; otherwise it
 * branches to pnv_wakeup_tb_loss, which performs the return.
577 */
578pnv_restore_hyp_resource_arch300:
579 /*
580 * Workaround for POWER9, if we lost resources, the ERAT
581 * might have been mixed up and needs flushing. We also need
582 * to reload MMCR0 (see comment above). We also need to set
583 * then clear bit 60 in MMCRA to ensure the PMU starts running.
584 */
585 blt cr3,1f
586BEGIN_FTR_SECTION
587 PPC_INVALIDATE_ERAT
588 ld r1,PACAR1(r13)
589 ld r4,_MMCR0(r1)
590 mtspr SPRN_MMCR0,r4
591END_FTR_SECTION_IFCLR(CPU_FTR_POWER9_DD2_1)
592 mfspr r4,SPRN_MMCRA
593 ori r4,r4,(1 << (63-60))
594 mtspr SPRN_MMCRA,r4
595 xori r4,r4,(1 << (63-60))
596 mtspr SPRN_MMCRA,r4
5971:
598 /*
599 * POWER ISA 3. Use PSSCR to determine if we
600 * are waking up from deep idle state
601 */
602 LOAD_REG_ADDRBASE(r5,pnv_first_deep_stop_state)
603 ld r4,ADDROFF(pnv_first_deep_stop_state)(r5)
604
605BEGIN_FTR_SECTION_NESTED(71)
606 /*
607 * Assume that we are waking up from the state
608 * same as the Requested Level (RL) in the PSSCR
609 * which are Bits 60-63
610 */
611 ld r5,PACA_REQ_PSSCR(r13)
612 rldicl r5,r5,0,60
613FTR_SECTION_ELSE_NESTED(71)
614 /*
615 * 0-3 bits correspond to Power-Saving Level Status
616 * which indicates the idle state we are waking up from
617 */
618 mfspr r5, SPRN_PSSCR
619 rldicl r5,r5,4,60
620ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_POWER9_DD1, 71)
621 li r0, 0 /* clear requested_psscr to say we're awake */
622 std r0, PACA_REQ_PSSCR(r13)
623 cmpd cr4,r5,r4
624 bge cr4,pnv_wakeup_tb_loss /* returns to caller */
625
626 blr /* Waking up without hypervisor state loss. */
627
628/* Same calling convention as arch300 */
/*
 * Loads PACA_THREAD_IDLE_STATE into r4 and sets cr2 from its comparison
 * with PNV_THREAD_NAP. Anything greater goes to pnv_wakeup_tb_loss with
 * r4 still holding the idle state; nap returns with blr.
 */
629pnv_restore_hyp_resource_arch207:
630 /*
631 * POWER ISA 2.07 or less.
632 * Check if we slept with sleep or winkle.
633 */
634 lbz r4,PACA_THREAD_IDLE_STATE(r13)
635 cmpwi cr2,r4,PNV_THREAD_NAP
636 bgt cr2,pnv_wakeup_tb_loss /* Either sleep or Winkle */
637
638 /*
639 * We fall through here if PACA_THREAD_IDLE_STATE shows we are waking
640 * up from nap. At this stage CR3 shouldn't contain 'gt' since that
641 * indicates we are waking with hypervisor state loss from nap.
 * If it does, spin here forever (branch to self).
642 */
643 bgt cr3,.
644
645 blr /* Waking up without hypervisor state loss */
646
647/*
648 * Called if waking up from idle state which can cause either partial or
649 * complete hyp state loss.
650 * In POWER8, called if waking up from fastsleep or winkle
651 * In POWER9, called if waking up from stop state >= pnv_first_deep_stop_state
652 *
653 * r13 - PACA
654 * cr3 - gt if waking up with partial/complete hypervisor state loss
655 *
656 * If ISA300:
657 * cr4 - gt or eq if waking up from complete hypervisor state loss.
658 *
659 * If ISA207:
660 * r4 - PACA_THREAD_IDLE_STATE
 *
 * Register use from here to hypervisor_state_restored:
 * r14 - pointer to core_idle_state, r15 - its working value
 * r7  - this thread's PACA_THREAD_MASK
 * r17 - saved LR, r18 - saved r4, r19 - saved r12 (SRR1)
 * cr2 - eq if this is the first thread in the core to wake up
661 */
662pnv_wakeup_tb_loss:
663 ld r1,PACAR1(r13)
664 /*
665 * Before entering any idle state, the NVGPRs are saved in the stack.
666 * If there was a state loss, or PACA_NAPSTATELOST was set, then the
667 * NVGPRs are restored. If we are here, it is likely that state is lost,
668 * but not guaranteed -- neither ISA207 nor ISA300 tests to reach
669 * here are the same as the test to restore NVGPRS:
670 * PACA_THREAD_IDLE_STATE test for ISA207, PSSCR test for ISA300,
671 * and SRR1 test for restoring NVGPRs.
672 *
673 * We are about to clobber NVGPRs now, so set NAPSTATELOST to
674 * guarantee they will always be restored. This might be tightened
675 * with careful reading of specs (particularly for ISA300) but this
676 * is already a slow wakeup path and it's simpler to be safe.
677 */
678 li r0,1
679 stb r0,PACA_NAPSTATELOST(r13)
680
681 /*
682 *
683 * Save SRR1 and LR in NVGPRs as they might be clobbered in
684 * opal_call() (called in CHECK_HMI_INTERRUPT). SRR1 is required
685 * to determine the wakeup reason if we branch to kvm_start_guest. LR
686 * is required to return back to reset vector after hypervisor state
687 * restore is complete.
 * r4 is kept in r18 as well; the ISA207 winkle test below reads it.
688 */
689 mr r19,r12
690 mr r18,r4
691 mflr r17
692BEGIN_FTR_SECTION
693 CHECK_HMI_INTERRUPT
694END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
695
696 ld r14,PACA_CORE_IDLE_STATE_PTR(r13)
697 lbz r7,PACA_THREAD_MASK(r13)
698
699 /*
700 * Take the core lock to synchronize against other threads.
701 *
702 * Lock bit is set in one of the 2 cases-
703 * a. In the sleep/winkle enter path, the last thread is executing
704 * fastsleep workaround code.
705 * b. In the wake up path, another thread is executing fastsleep
706 * workaround undo code or resyncing timebase or restoring context
707 * In either case loop until the lock bit is cleared.
708 */
7091:
710 lwarx r15,0,r14
711 andis. r9,r15,PNV_CORE_IDLE_LOCK_BIT@h
712 bnel- core_idle_lock_held
713 oris r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
714 stwcx. r15,0,r14
715 bne- 1b
716 isync
717
718 andi. r9,r15,PNV_CORE_IDLE_THREAD_BITS
719 cmpwi cr2,r9,0
720
721 /*
722 * At this stage
723 * cr2 - eq if first thread to wakeup in core
724 * cr3- gt if waking up with partial/complete hypervisor state loss
725 * ISA300:
726 * cr4 - gt or eq if waking up from complete hypervisor state loss.
727 */
728
729BEGIN_FTR_SECTION
730 /*
731 * Were we in winkle?
732 * If yes, check if all threads were in winkle, decrement our
733 * winkle count, set all thread winkle bits if all were in winkle.
734 * Check if our thread has a winkle bit set, and set cr4 accordingly
735 * (to match ISA300, above). Pseudo-code for core idle state
736 * transitions for ISA207 is as follows (everything happens atomically
737 * due to store conditional and/or lock bit):
738 *
739 * nap_idle() { }
740 * nap_wake() { }
741 *
742 * sleep_idle()
743 * {
744 * core_idle_state &= ~thread_in_core
745 * }
746 *
747 * sleep_wake()
748 * {
749 * bool first_in_core, first_in_subcore;
750 *
751 * first_in_core = (core_idle_state & IDLE_THREAD_BITS) == 0;
752 * first_in_subcore = (core_idle_state & SUBCORE_SIBLING_MASK) == 0;
753 *
754 * core_idle_state |= thread_in_core;
755 * }
756 *
757 * winkle_idle()
758 * {
759 * core_idle_state &= ~thread_in_core;
760 * core_idle_state += 1 << WINKLE_COUNT_SHIFT;
761 * }
762 *
763 * winkle_wake()
764 * {
765 * bool first_in_core, first_in_subcore, winkle_state_lost;
766 *
767 * first_in_core = (core_idle_state & IDLE_THREAD_BITS) == 0;
768 * first_in_subcore = (core_idle_state & SUBCORE_SIBLING_MASK) == 0;
769 *
770 * core_idle_state |= thread_in_core;
771 *
772 * if ((core_idle_state & WINKLE_MASK) == (8 << WINKLE_COUNT_SHIFT))
773 * core_idle_state |= THREAD_WINKLE_BITS;
774 * core_idle_state -= 1 << WINKLE_COUNT_SHIFT;
775 *
776 * winkle_state_lost = core_idle_state &
777 * (thread_in_core << WINKLE_THREAD_SHIFT);
778 * core_idle_state &= ~(thread_in_core << WINKLE_THREAD_SHIFT);
779 * }
780 *
781 */
782 cmpwi r18,PNV_THREAD_WINKLE
783 bne 2f
784 andis. r9,r15,PNV_CORE_IDLE_WINKLE_COUNT_ALL_BIT@h
785 subis r15,r15,PNV_CORE_IDLE_WINKLE_COUNT@h
786 beq 2f
787 ori r15,r15,PNV_CORE_IDLE_THREAD_WINKLE_BITS /* all were winkle */
7882:
789 /* Shift thread bit to winkle mask, then test if this thread is set,
790 * and remove it from the winkle bits */
791 slwi r8,r7,8
792 and r8,r8,r15
793 andc r15,r15,r8
794 cmpwi cr4,r8,1 /* cr4 will be gt if our bit is set, lt if not */
795
796 lbz r4,PACA_SUBCORE_SIBLING_MASK(r13)
797 and r4,r4,r15
798 cmpwi r4,0 /* Check if first in subcore */
799
800 or r15,r15,r7 /* Set thread bit */
 /* "or" leaves cr0 alone, so beq still tests the cmpwi r4,0 above */
801 beq first_thread_in_subcore
802END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
803
804 or r15,r15,r7 /* Set thread bit */
805 beq cr2,first_thread_in_core
806
807 /* Not first thread in core or subcore to wake up */
808 b clear_lock
809
/*
 * Part of pnv_wakeup_tb_loss. Branched to only from inside the
 * feature section that is active when CPU_FTR_ARCH_300 is clear.
 * Expects r1 = saved frame, cr4 and cr2 as set up by pnv_wakeup_tb_loss.
 * Clobbers r4.
 */
810first_thread_in_subcore:
811 /*
812 * If waking up from sleep, subcore state is not lost. Hence
813 * skip subcore state restore
814 */
815 blt cr4,subcore_state_restored
816
817 /* Restore per-subcore state */
818 ld r4,_SDR1(r1)
819 mtspr SPRN_SDR1,r4
820
821 ld r4,_RPR(r1)
822 mtspr SPRN_RPR,r4
823 ld r4,_AMOR(r1)
824 mtspr SPRN_AMOR,r4
825
826subcore_state_restored:
827 /*
828 * Check if the thread is also the first thread in the core. If not,
829 * skip to clear_lock.
830 */
831 bne cr2,clear_lock
832
833first_thread_in_core:
834
835 /*
836 * First thread in the core waking up from any state which can cause
837 * partial or complete hypervisor state loss. It needs to
838 * call the fastsleep workaround code if the platform requires it.
839 * Call it unconditionally here. The below branch instruction will
840 * be patched out if the platform does not have fastsleep or does not
841 * require the workaround. Patching will be performed during the
842 * discovery of idle-states.
 *
 * When the branch is patched out, execution falls through into
 * timebase_resync; when it is taken, fastsleep_workaround_at_exit
 * branches to timebase_resync itself.
843 */
844.global pnv_fastsleep_workaround_at_exit
845pnv_fastsleep_workaround_at_exit:
846 b fastsleep_workaround_at_exit
847
/*
 * Part of pnv_wakeup_tb_loss, executed by the first thread of the core
 * to wake up while it holds the core idle lock. Resyncs the timebase if
 * cr3 is gt, then restores per-core SPRs from the frame at r1 unless
 * cr4 is lt. Falls through into clear_lock.
 */
848timebase_resync:
849 /*
850 * Use cr3 which indicates that we are waking up with at least partial
851 * hypervisor state loss to determine if TIMEBASE RESYNC is needed.
852 */
853 ble cr3,.Ltb_resynced
854 /* Time base re-sync */
855 bl opal_resync_timebase;
856 /*
857 * If waking up from sleep (POWER8), per core state
858 * is not lost, skip to clear_lock.
859 */
860.Ltb_resynced:
861 blt cr4,clear_lock
862
863 /*
864 * First thread in the core to wake up and it's waking up with
865 * complete hypervisor state loss. Restore per core hypervisor
866 * state.
867 */
868BEGIN_FTR_SECTION
869 ld r4,_PTCR(r1)
870 mtspr SPRN_PTCR,r4
871 ld r4,_RPR(r1)
872 mtspr SPRN_RPR,r4
873 ld r4,_AMOR(r1)
874 mtspr SPRN_AMOR,r4
875END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
876
877 ld r4,_TSCR(r1)
878 mtspr SPRN_TSCR,r4
879 ld r4,_WORC(r1)
880 mtspr SPRN_WORC,r4
881
/*
 * Tail of pnv_wakeup_tb_loss. clear_lock stores r15 (with the lock bit
 * toggled off and this thread's bit set) back to core_idle_state.
 * common_exit then restores the SLB (unless radix), per-thread SPRs,
 * calls cur_cpu_spec->cpu_restore and, on ISA 3.0, the additional
 * POWER9 SPRs -- all skipped when cr4 is lt. Finally r12 and LR are
 * reloaded from r19 and r17 and control returns with blr.
 */
882clear_lock:
 /* r15 has the lock bit set (taken in pnv_wakeup_tb_loss); xoris clears it */
883 xoris r15,r15,PNV_CORE_IDLE_LOCK_BIT@h
884 lwsync
885 stw r15,0(r14)
886
887common_exit:
888 /*
889 * Common to all threads.
890 *
891 * If waking up from sleep, hypervisor state is not lost. Hence
892 * skip hypervisor state restore.
893 */
894 blt cr4,hypervisor_state_restored
895
896 /* Waking up from winkle */
897
898BEGIN_MMU_FTR_SECTION
899 b no_segments
900END_MMU_FTR_SECTION_IFSET(MMU_FTR_TYPE_RADIX)
901 /* Restore SLB from PACA */
902 ld r8,PACA_SLBSHADOWPTR(r13)
903
 /*
 * One iteration per bolted entry: r5/r6 are the two doublewords of the
 * shadow entry at r8; slbmte is skipped when SLB_ESID_V is clear in r5.
 * r3 and r7 are used as scratch here.
 */
904 .rept SLB_NUM_BOLTED
905 li r3, SLBSHADOW_SAVEAREA
906 LDX_BE r5, r8, r3
907 addi r3, r3, 8
908 LDX_BE r6, r8, r3
909 andis. r7,r5,SLB_ESID_V@h
910 beq 1f
911 slbmte r6,r5
9121: addi r8,r8,16
913 .endr
914no_segments:
915
916 /* Restore per thread state */
917
918 ld r4,_SPURR(r1)
919 mtspr SPRN_SPURR,r4
920 ld r4,_PURR(r1)
921 mtspr SPRN_PURR,r4
922 ld r4,_DSCR(r1)
923 mtspr SPRN_DSCR,r4
924 ld r4,_WORT(r1)
925 mtspr SPRN_WORT,r4
926
927 /* Call cur_cpu_spec->cpu_restore() */
928 LOAD_REG_ADDR(r4, cur_cpu_spec)
929 ld r4,0(r4)
930 ld r12,CPU_SPEC_RESTORE(r4)
931#ifdef PPC64_ELF_ABI_v1
 /* ELF ABI v1 only: one more load through the pointer just fetched */
932 ld r12,0(r12)
933#endif
934 mtctr r12
935 bctrl
936
937/*
938 * On POWER9, we can come here on wakeup from a cpuidle stop state.
939 * Hence restore the additional SPRs to the saved value.
940 *
941 * On POWER8, we come here only on winkle. Since winkle is used
942 * only in the case of CPU-Hotplug, we don't need to restore
943 * the additional SPRs.
944 */
945BEGIN_FTR_SECTION
946 bl power9_restore_additional_sprs
947END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
948hypervisor_state_restored:
949
 /* Put back SRR1 and LR saved at the top of pnv_wakeup_tb_loss */
950 mr r12,r19
951 mtlr r17
952 blr /* return to pnv_powersave_wakeup */
953
/*
 * Wake-side counterpart of fastsleep_workaround_at_entry: calls
 * opal_config_cpu_idle_state with r3 = 1, r4 = 0 (the entry side passes
 * r4 = 1), then continues at timebase_resync.
 */
954fastsleep_workaround_at_exit:
955 li r3,1
956 li r4,0
957 bl opal_config_cpu_idle_state
958 b timebase_resync
959
960/*
961 * R3 here contains the value that will be returned to the caller
962 * of power7_nap.
963 * R12 contains SRR1 for CHECK_HMI_INTERRUPT.
 *
 * Reloads the frame pointer from PACAR1, restores the non-volatile GPRs,
 * r2, LR (from _LINK) and CR from that frame, pops it, loads MSR from
 * PACAKMSR and returns to the saved LR.
964 */
965.global pnv_wakeup_loss
966pnv_wakeup_loss:
967 ld r1,PACAR1(r13)
968BEGIN_FTR_SECTION
969 CHECK_HMI_INTERRUPT
970END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
971 REST_NVGPRS(r1)
972 REST_GPR(2, r1)
973 ld r4,PACAKMSR(r13)
974 ld r5,_LINK(r1)
975 ld r6,_CCR(r1)
976 addi r1,r1,INT_FRAME_SIZE
977 mtlr r5
978 mtcr r6
979 mtmsrd r4
980 blr
981
982/*
983 * R3 here contains the value that will be returned to the caller
984 * of power7_nap.
985 * R12 contains SRR1 for CHECK_HMI_INTERRUPT.
 *
 * If PACA_NAPSTATELOST is non-zero this defers to pnv_wakeup_loss.
 * Otherwise the GPRs are not reloaded: only LR (from _NIP) and CR come
 * back from the frame before it is popped, MSR is loaded from PACAKMSR
 * and control returns to the saved LR.
986 */
987pnv_wakeup_noloss:
988 lbz r0,PACA_NAPSTATELOST(r13)
989 cmpwi r0,0
990 bne pnv_wakeup_loss
991 ld r1,PACAR1(r13)
992BEGIN_FTR_SECTION
993 CHECK_HMI_INTERRUPT
994END_FTR_SECTION_IFSET(CPU_FTR_HVMODE)
995 ld r4,PACAKMSR(r13)
996 ld r5,_NIP(r1)
997 ld r6,_CCR(r1)
998 addi r1,r1,INT_FRAME_SIZE
999 mtlr r5
1000 mtcr r6
1001 mtmsrd r4
1002 blr
1/* SPDX-License-Identifier: GPL-2.0-or-later */
2/*
3 * Copyright 2018, IBM Corporation.
4 *
5 * This file contains general idle entry/exit functions to save
6 * and restore stack and NVGPRs which allows C code to call idle
7 * states that lose GPRs, and it will return transparently with
8 * SRR1 wakeup reason return value.
9 *
10 * The platform / CPU caller must ensure SPRs and any other non-GPR
11 * state is saved and restored correctly, handle KVM, interrupts, etc.
12 */
13
14#include <asm/ppc_asm.h>
15#include <asm/asm-offsets.h>
16#include <asm/ppc-opcode.h>
17#include <asm/cpuidle.h>
18#include <asm/thread_info.h> /* TLF_NAPPING */
19
20#ifdef CONFIG_PPC_P7_NAP
21/*
22 * Desired PSSCR in r3
23 *
24 * No state will be lost regardless of wakeup mechanism (interrupt or NIA).
25 *
26 * An EC=0 type wakeup will return with a value of 0. SRESET wakeup (which can
27 * happen with xscom SRESET and possibly MCE) may clobber volatiles except LR,
28 * and must blr, to return to caller with r3 set according to caller's expected
29 * return code (for Book3S/64 that is SRR1).
 *
 * Nothing is saved here: the routine writes r3 to the PSSCR, executes
 * stop, and on the fall-through wakeup returns 0 in r3.
30 */
31_GLOBAL(isa300_idle_stop_noloss)
32 mtspr SPRN_PSSCR,r3
33 PPC_STOP
34 li r3,0
35 blr
36
37/*
38 * Desired PSSCR in r3
39 *
40 * GPRs may be lost, so they are saved here. Wakeup is by interrupt only.
41 * The SRESET wakeup returns to this function's caller by calling
42 * idle_return_gpr_loss with r3 set to desired return value.
43 *
44 * A wakeup without GPR loss may alternatively be handled as in
45 * isa300_idle_stop_noloss and blr directly, as an optimisation.
46 *
47 * The caller is responsible for saving/restoring SPRs, MSR, timebase,
48 * etc.
 *
 * Save layout below r1 (must match idle_return_gpr_loss):
 * -8*1 r2, -8*2 .. -8*19 r14..r31, -8*20 LR, -8*21 CR.
 * r1 itself is recorded in PACAR1. Clobbers r4 and r5.
49 */
50_GLOBAL(isa300_idle_stop_mayloss)
51 mtspr SPRN_PSSCR,r3
52 std r1,PACAR1(r13)
53 mflr r4
54 mfcr r5
55 /*
56 * Use the stack red zone rather than a new frame for saving regs since
57 * in the case of no GPR loss the wakeup code branches directly back to
58 * the caller without deallocating the stack frame first.
59 */
60 std r2,-8*1(r1)
61 std r14,-8*2(r1)
62 std r15,-8*3(r1)
63 std r16,-8*4(r1)
64 std r17,-8*5(r1)
65 std r18,-8*6(r1)
66 std r19,-8*7(r1)
67 std r20,-8*8(r1)
68 std r21,-8*9(r1)
69 std r22,-8*10(r1)
70 std r23,-8*11(r1)
71 std r24,-8*12(r1)
72 std r25,-8*13(r1)
73 std r26,-8*14(r1)
74 std r27,-8*15(r1)
75 std r28,-8*16(r1)
76 std r29,-8*17(r1)
77 std r30,-8*18(r1)
78 std r31,-8*19(r1)
79 std r4,-8*20(r1)
80 std r5,-8*21(r1)
81 /* 168 bytes */
82 PPC_STOP
83 b . /* catch bugs */
84
85/*
86 * Desired return value in r3
87 *
88 * The idle wakeup SRESET interrupt handler can branch here to return
89 * to the caller of the idle sleep function with r3 as the return code.
90 *
91 * This must not be used if idle was entered via a _noloss function (use
92 * a simple blr instead).
 *
 * Reloads r1 from PACAR1 and then LR, CR, r2 and r14-r31 from the slots
 * below r1 written by the *_mayloss entry functions. Clobbers r4 and r5;
 * r3 is left untouched.
93 */
94_GLOBAL(idle_return_gpr_loss)
95 ld r1,PACAR1(r13)
96 ld r4,-8*20(r1)
97 ld r5,-8*21(r1)
98 mtlr r4
99 mtcr r5
100 /*
101 * KVM nap requires r2 to be saved, rather than just restoring it
102 * from PACATOC. This could be avoided for that less common case
103 * if KVM saved its r2.
104 */
105 ld r2,-8*1(r1)
106 ld r14,-8*2(r1)
107 ld r15,-8*3(r1)
108 ld r16,-8*4(r1)
109 ld r17,-8*5(r1)
110 ld r18,-8*6(r1)
111 ld r19,-8*7(r1)
112 ld r20,-8*8(r1)
113 ld r21,-8*9(r1)
114 ld r22,-8*10(r1)
115 ld r23,-8*11(r1)
116 ld r24,-8*12(r1)
117 ld r25,-8*13(r1)
118 ld r26,-8*14(r1)
119 ld r27,-8*15(r1)
120 ld r28,-8*16(r1)
121 ld r29,-8*17(r1)
122 ld r30,-8*18(r1)
123 ld r31,-8*19(r1)
124 blr
125
126/*
127 * This is the sequence required to execute idle instructions, as
128 * specified in ISA v2.07 (and earlier). MSR[IR] and MSR[DR] must be 0.
129 * We have to store a GPR somewhere, ptesync, then reload it, and create
130 * a false dependency on the result of the load. It doesn't matter which
131 * GPR we store, or where we store it. We have already stored r2 to the
132 * stack at -8(r1) in isa206_idle_insn_mayloss, so use that.
 *
 * The "bne 236b" after comparing r2 with itself is never taken; it is
 * the false dependency. The trailing "b ." spins in place if IDLE_INST
 * ever falls through.
133 */
134#define IDLE_STATE_ENTER_SEQ_NORET(IDLE_INST) \
135 /* Magic NAP/SLEEP/WINKLE mode enter sequence */ \
136 std r2,-8(r1); \
137 ptesync; \
138 ld r2,-8(r1); \
139236: cmpd cr0,r2,r2; \
140 bne 236b; \
141 IDLE_INST; \
142 b . /* catch bugs */
143
144/*
145 * Desired instruction type in r3
146 *
147 * GPRs may be lost, so they are saved here. Wakeup is by interrupt only.
148 * The SRESET wakeup returns to this function's caller by calling
149 * idle_return_gpr_loss with r3 set to desired return value.
150 *
151 * A wakeup without GPR loss may alternatively be handled as in
152 * isa300_idle_stop_noloss and blr directly, as an optimisation.
153 *
154 * The caller is responsible for saving/restoring SPRs, MSR, timebase,
155 * etc.
156 *
157 * This must be called in real-mode (MSR_IDLE).
 *
 * Save layout below r1 is the same as in isa300_idle_stop_mayloss:
 * -8*1 r2, -8*2 .. -8*19 r14..r31, -8*20 LR, -8*21 CR.
 * r3 == PNV_THREAD_NAP selects nap, PNV_THREAD_SLEEP selects sleep and
 * any other value falls through to winkle. Clobbers r4, r5 and cr0.
158 */
159_GLOBAL(isa206_idle_insn_mayloss)
160 std r1,PACAR1(r13)
161 mflr r4
162 mfcr r5
163 /*
164 * Use the stack red zone rather than a new frame for saving regs since
165 * in the case of no GPR loss the wakeup code branches directly back to
166 * the caller without deallocating the stack frame first.
167 */
168 std r2,-8*1(r1)
169 std r14,-8*2(r1)
170 std r15,-8*3(r1)
171 std r16,-8*4(r1)
172 std r17,-8*5(r1)
173 std r18,-8*6(r1)
174 std r19,-8*7(r1)
175 std r20,-8*8(r1)
176 std r21,-8*9(r1)
177 std r22,-8*10(r1)
178 std r23,-8*11(r1)
179 std r24,-8*12(r1)
180 std r25,-8*13(r1)
181 std r26,-8*14(r1)
182 std r27,-8*15(r1)
183 std r28,-8*16(r1)
184 std r29,-8*17(r1)
185 std r30,-8*18(r1)
186 std r31,-8*19(r1)
187 std r4,-8*20(r1)
188 std r5,-8*21(r1)
189 cmpwi r3,PNV_THREAD_NAP
190 bne 1f
191 IDLE_STATE_ENTER_SEQ_NORET(PPC_NAP)
1921: cmpwi r3,PNV_THREAD_SLEEP
193 bne 2f
194 IDLE_STATE_ENTER_SEQ_NORET(PPC_SLEEP)
1952: IDLE_STATE_ENTER_SEQ_NORET(PPC_WINKLE)
196#endif
197
198#ifdef CONFIG_PPC_970_NAP
/*
 * Sets _TLF_NAPPING in the local flags of the thread_info found through
 * PACA_THREAD_INFO, then loops writing MSR_KERNEL|MSR_EE|MSR_POW to the
 * MSR. The loop has no exit of its own; per the comment below, an
 * exception is redirected to power4_idle_nap_return, whose blr returns
 * to this function's caller. Clobbers r7, r8 and r9.
 */
199_GLOBAL(power4_idle_nap)
200 LOAD_REG_IMMEDIATE(r7, MSR_KERNEL|MSR_EE|MSR_POW)
201 ld r9,PACA_THREAD_INFO(r13)
202 ld r8,TI_LOCAL_FLAGS(r9)
203 ori r8,r8,_TLF_NAPPING
204 std r8,TI_LOCAL_FLAGS(r9)
205 /*
206 * NAPPING bit is set, from this point onward power4_fixup_nap
207 * will cause exceptions to return to power4_idle_nap_return.
208 */
2091: sync
210 isync
211 mtmsrd r7
212 isync
213 b 1b
214
215 .globl power4_idle_nap_return
216power4_idle_nap_return:
217 blr
218#endif