powerpc/64s: Stop using bit in HSPRG0 to test winkle
The POWER8 idle code has a neat trick of programming the power on engine to restore a low bit into HSPRG0, so idle wakeup code can test and see if it has been programmed this way and therefore lost all state. Restore time can be reduced if winkle has not been reached. However this messes with our r13 PACA pointer, and requires HSPRG0 to be written to. It also optimizes the slowest and most uncommon case at the expense of another SPR write in the common nap state wakeup. Remove this complexity and assume winkle sleeps always require a state restore. This speedup could be made entirely contained within the winkle idle code by counting per-core winkles and setting a thread bitmap when all have gone to winkle. Reviewed-by: Gautham R. Shenoy <ego@linux.vnet.ibm.com> Signed-off-by: Nicholas Piggin <npiggin@gmail.com> Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
This commit is contained in:
parent
bf0153c143
commit
544686cae8
|
@ -167,17 +167,14 @@ BEGIN_FTR_SECTION_NESTED(943) \
|
|||
std ra,offset(r13); \
|
||||
END_FTR_SECTION_NESTED(ftr,ftr,943)
|
||||
|
||||
#define EXCEPTION_PROLOG_0_PACA(area) \
|
||||
#define EXCEPTION_PROLOG_0(area) \
|
||||
GET_PACA(r13); \
|
||||
std r9,area+EX_R9(r13); /* save r9 */ \
|
||||
OPT_GET_SPR(r9, SPRN_PPR, CPU_FTR_HAS_PPR); \
|
||||
HMT_MEDIUM; \
|
||||
std r10,area+EX_R10(r13); /* save r10 - r12 */ \
|
||||
OPT_GET_SPR(r10, SPRN_CFAR, CPU_FTR_CFAR)
|
||||
|
||||
#define EXCEPTION_PROLOG_0(area) \
|
||||
GET_PACA(r13); \
|
||||
EXCEPTION_PROLOG_0_PACA(area)
|
||||
|
||||
#define __EXCEPTION_PROLOG_1(area, extra, vec) \
|
||||
OPT_SAVE_REG_TO_PACA(area+EX_PPR, r9, CPU_FTR_HAS_PPR); \
|
||||
OPT_SAVE_REG_TO_PACA(area+EX_CFAR, r10, CPU_FTR_CFAR); \
|
||||
|
@ -208,12 +205,6 @@ END_FTR_SECTION_NESTED(ftr,ftr,943)
|
|||
EXCEPTION_PROLOG_1(area, extra, vec); \
|
||||
EXCEPTION_PROLOG_PSERIES_1(label, h);
|
||||
|
||||
/* Have the PACA in r13 already */
|
||||
#define EXCEPTION_PROLOG_PSERIES_PACA(area, label, h, extra, vec) \
|
||||
EXCEPTION_PROLOG_0_PACA(area); \
|
||||
EXCEPTION_PROLOG_1(area, extra, vec); \
|
||||
EXCEPTION_PROLOG_PSERIES_1(label, h);
|
||||
|
||||
#define __KVMTEST(h, n) \
|
||||
lbz r10,HSTATE_IN_GUEST(r13); \
|
||||
cmpwi r10,0; \
|
||||
|
|
|
@ -116,9 +116,7 @@ EXC_VIRT_NONE(0x4000, 0x100)
|
|||
|
||||
EXC_REAL_BEGIN(system_reset, 0x100, 0x100)
|
||||
SET_SCRATCH0(r13)
|
||||
GET_PACA(r13)
|
||||
clrrdi r13,r13,1 /* Last bit of HSPRG0 is set if waking from winkle */
|
||||
EXCEPTION_PROLOG_PSERIES_PACA(PACA_EXGEN, system_reset_common, EXC_STD,
|
||||
EXCEPTION_PROLOG_PSERIES(PACA_EXGEN, system_reset_common, EXC_STD,
|
||||
IDLETEST, 0x100)
|
||||
|
||||
EXC_REAL_END(system_reset, 0x100, 0x100)
|
||||
|
@ -148,14 +146,6 @@ EXC_REAL_BEGIN(machine_check, 0x200, 0x100)
|
|||
* vector
|
||||
*/
|
||||
SET_SCRATCH0(r13) /* save r13 */
|
||||
/*
|
||||
* Running native on arch 2.06 or later, we may wakeup from winkle
|
||||
* inside machine check. If yes, then last bit of HSPRG0 would be set
|
||||
* to 1. Hence clear it unconditionally.
|
||||
*/
|
||||
GET_PACA(r13)
|
||||
clrrdi r13,r13,1
|
||||
SET_PACA(r13)
|
||||
EXCEPTION_PROLOG_0(PACA_EXMC)
|
||||
BEGIN_FTR_SECTION
|
||||
b machine_check_powernv_early
|
||||
|
@ -339,7 +329,7 @@ EXC_COMMON_BEGIN(machine_check_handle_early)
|
|||
* Go back to nap/sleep/winkle mode again if (b) is true.
|
||||
*/
|
||||
rlwinm. r11,r12,47-31,30,31 /* Was it in power saving mode? */
|
||||
beq 4f /* No, it wasn;t */
|
||||
beq 4f /* No, it wasn't */
|
||||
/* Thread was in power saving mode. Go back to nap again. */
|
||||
cmpwi r11,2
|
||||
blt 3f
|
||||
|
@ -369,13 +359,8 @@ EXC_COMMON_BEGIN(machine_check_handle_early)
|
|||
/*
|
||||
* Go back to winkle. Please note that this thread was woken up in
|
||||
* machine check from winkle and have not restored the per-subcore
|
||||
* state. Hence before going back to winkle, set last bit of HSPRG0
|
||||
* to 1. This will make sure that if this thread gets woken up
|
||||
* again at reset vector 0x100 then it will get chance to restore
|
||||
* the subcore state.
|
||||
* state.
|
||||
*/
|
||||
ori r13,r13,1
|
||||
SET_PACA(r13)
|
||||
IDLE_STATE_ENTER_SEQ_NORET(PPC_WINKLE)
|
||||
/* No return */
|
||||
4:
|
||||
|
|
|
@ -415,11 +415,12 @@ power9_dd1_recover_paca:
|
|||
stb r0,PACA_NAPSTATELOST(r13)
|
||||
blr
|
||||
|
||||
/*
|
||||
* Called from reset vector for powersave wakeups.
|
||||
* cr3 - set to gt if waking up with partial/complete hypervisor state loss
|
||||
*/
|
||||
.global pnv_powersave_wakeup
|
||||
pnv_powersave_wakeup:
|
||||
BEGIN_FTR_SECTION
|
||||
GET_PACA(r13) /* Restore HSPRG0 to get the winkle bit in r13 */
|
||||
END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
|
||||
bl pnv_restore_hyp_resource
|
||||
|
||||
li r0,PNV_THREAD_RUNNING
|
||||
|
@ -446,18 +447,18 @@ END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
|
|||
* Check whether we have woken up with hypervisor state loss.
|
||||
* If yes, restore hypervisor state and return back to link.
|
||||
*
|
||||
* r13 - Contents of HSPRG0
|
||||
* cr3 - set to gt if waking up with partial/complete hypervisor state loss
|
||||
*/
|
||||
pnv_restore_hyp_resource:
|
||||
BEGIN_FTR_SECTION
|
||||
BEGIN_FTR_SECTION_NESTED(70)
|
||||
mflr r6
|
||||
bl power9_dd1_recover_paca
|
||||
mtlr r6
|
||||
FTR_SECTION_ELSE_NESTED(70)
|
||||
FTR_SECTION_ELSE
|
||||
ld r2, PACATOC(r13)
|
||||
ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_POWER9_DD1, 70)
|
||||
ALT_FTR_SECTION_END_IFSET(CPU_FTR_POWER9_DD1)
|
||||
|
||||
BEGIN_FTR_SECTION
|
||||
/*
|
||||
* POWER ISA 3. Use PSSCR to determine if we
|
||||
* are waking up from deep idle state
|
||||
|
@ -480,19 +481,11 @@ END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
|
|||
|
||||
/*
|
||||
* POWER ISA 2.07 or less.
|
||||
* Check if last bit of HSPGR0 is set. This indicates whether we are
|
||||
* waking up from winkle.
|
||||
* Check if we slept with winkle.
|
||||
*/
|
||||
clrldi r5,r13,63
|
||||
clrrdi r13,r13,1
|
||||
|
||||
/* Now that we are sure r13 is corrected, load TOC */
|
||||
ld r2,PACATOC(r13);
|
||||
cmpwi cr4,r5,1
|
||||
mtspr SPRN_HSPRG0,r13
|
||||
|
||||
lbz r0,PACA_THREAD_IDLE_STATE(r13)
|
||||
cmpwi cr2,r0,PNV_THREAD_NAP
|
||||
cmpwi cr4,r0,PNV_THREAD_WINKLE
|
||||
bgt cr2,pnv_wakeup_tb_loss /* Either sleep or Winkle */
|
||||
|
||||
/*
|
||||
|
|
|
@ -53,19 +53,6 @@ static int pnv_save_sprs_for_deep_states(void)
|
|||
uint64_t pir = get_hard_smp_processor_id(cpu);
|
||||
uint64_t hsprg0_val = (uint64_t)&paca[cpu];
|
||||
|
||||
if (!cpu_has_feature(CPU_FTR_ARCH_300)) {
|
||||
/*
|
||||
* HSPRG0 is used to store the cpu's pointer to paca.
|
||||
* Hence last 3 bits are guaranteed to be 0. Program
|
||||
* slw to restore HSPRG0 with 63rd bit set, so that
|
||||
* when a thread wakes up at 0x100 we can use this bit
|
||||
* to distinguish between fastsleep and deep winkle.
|
||||
* This is not necessary with stop/psscr since PLS
|
||||
* field of psscr indicates which state we are waking
|
||||
* up from.
|
||||
*/
|
||||
hsprg0_val |= 1;
|
||||
}
|
||||
rc = opal_slw_set_reg(pir, SPRN_HSPRG0, hsprg0_val);
|
||||
if (rc != 0)
|
||||
return rc;
|
||||
|
|
Loading…
Reference in New Issue