powerpc/64s: Stop using bit in HSPRG0 to test winkle
author Nicholas Piggin <npiggin@gmail.com>
Wed, 19 Apr 2017 13:05:45 +0000 (23:05 +1000)
committer Michael Ellerman <mpe@ellerman.id.au>
Sun, 23 Apr 2017 10:31:39 +0000 (20:31 +1000)
The POWER8 idle code has a neat trick of programming the power on engine
to restore a low bit into HSPRG0, so idle wakeup code can test and see
if it has been programmed this way and therefore lost all state. Restore
time can be reduced if winkle has not been reached.

However this messes with our r13 PACA pointer, and requires HSPRG0 to be
written to. It also optimizes the slowest and most uncommon case at the
expense of another SPR write in the common nap state wakeup.

Remove this complexity and assume winkle sleeps always require a state
restore. The speedup could be reintroduced later, contained entirely within
the winkle idle code, by counting per-core winkles and setting a thread
bitmap when all threads in a core have gone to winkle.

Reviewed-by: Gautham R. Shenoy <ego@linux.vnet.ibm.com>
Signed-off-by: Nicholas Piggin <npiggin@gmail.com>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
arch/powerpc/include/asm/exception-64s.h
arch/powerpc/kernel/exceptions-64s.S
arch/powerpc/kernel/idle_book3s.S
arch/powerpc/platforms/powernv/idle.c

index 437550175b4dbab6647863e77fcc1f1b592767f6..89259817f5eff7518523144dbb6dffbfccf79a0e 100644 (file)
@@ -167,17 +167,14 @@ BEGIN_FTR_SECTION_NESTED(943)                                             \
        std     ra,offset(r13);                                         \
 END_FTR_SECTION_NESTED(ftr,ftr,943)
 
-#define EXCEPTION_PROLOG_0_PACA(area)                                  \
+#define EXCEPTION_PROLOG_0(area)                                       \
+       GET_PACA(r13);                                                  \
        std     r9,area+EX_R9(r13);     /* save r9 */                   \
        OPT_GET_SPR(r9, SPRN_PPR, CPU_FTR_HAS_PPR);                     \
        HMT_MEDIUM;                                                     \
        std     r10,area+EX_R10(r13);   /* save r10 - r12 */            \
        OPT_GET_SPR(r10, SPRN_CFAR, CPU_FTR_CFAR)
 
-#define EXCEPTION_PROLOG_0(area)                                       \
-       GET_PACA(r13);                                                  \
-       EXCEPTION_PROLOG_0_PACA(area)
-
 #define __EXCEPTION_PROLOG_1(area, extra, vec)                         \
        OPT_SAVE_REG_TO_PACA(area+EX_PPR, r9, CPU_FTR_HAS_PPR);         \
        OPT_SAVE_REG_TO_PACA(area+EX_CFAR, r10, CPU_FTR_CFAR);          \
@@ -208,12 +205,6 @@ END_FTR_SECTION_NESTED(ftr,ftr,943)
        EXCEPTION_PROLOG_1(area, extra, vec);                           \
        EXCEPTION_PROLOG_PSERIES_1(label, h);
 
-/* Have the PACA in r13 already */
-#define EXCEPTION_PROLOG_PSERIES_PACA(area, label, h, extra, vec)      \
-       EXCEPTION_PROLOG_0_PACA(area);                                  \
-       EXCEPTION_PROLOG_1(area, extra, vec);                           \
-       EXCEPTION_PROLOG_PSERIES_1(label, h);
-
 #define __KVMTEST(h, n)                                                        \
        lbz     r10,HSTATE_IN_GUEST(r13);                               \
        cmpwi   r10,0;                                                  \
index 2f837a4a78a2bdf681786e885d984436ee78837b..e390fcd04bcb86bcb48a16565f7937b23231c1a4 100644 (file)
@@ -116,9 +116,7 @@ EXC_VIRT_NONE(0x4000, 0x100)
 
 EXC_REAL_BEGIN(system_reset, 0x100, 0x100)
        SET_SCRATCH0(r13)
-       GET_PACA(r13)
-       clrrdi  r13,r13,1 /* Last bit of HSPRG0 is set if waking from winkle */
-       EXCEPTION_PROLOG_PSERIES_PACA(PACA_EXGEN, system_reset_common, EXC_STD,
+       EXCEPTION_PROLOG_PSERIES(PACA_EXGEN, system_reset_common, EXC_STD,
                                 IDLETEST, 0x100)
 
 EXC_REAL_END(system_reset, 0x100, 0x100)
@@ -148,14 +146,6 @@ EXC_REAL_BEGIN(machine_check, 0x200, 0x100)
         * vector
         */
        SET_SCRATCH0(r13)               /* save r13 */
-       /*
-        * Running native on arch 2.06 or later, we may wakeup from winkle
-        * inside machine check. If yes, then last bit of HSPRG0 would be set
-        * to 1. Hence clear it unconditionally.
-        */
-       GET_PACA(r13)
-       clrrdi  r13,r13,1
-       SET_PACA(r13)
        EXCEPTION_PROLOG_0(PACA_EXMC)
 BEGIN_FTR_SECTION
        b       machine_check_powernv_early
@@ -339,7 +329,7 @@ EXC_COMMON_BEGIN(machine_check_handle_early)
         * Go back to nap/sleep/winkle mode again if (b) is true.
         */
        rlwinm. r11,r12,47-31,30,31     /* Was it in power saving mode? */
-       beq     4f                      /* No, it wasn;t */
+       beq     4f                      /* No, it wasn't */
        /* Thread was in power saving mode. Go back to nap again. */
        cmpwi   r11,2
        blt     3f
@@ -369,13 +359,8 @@ EXC_COMMON_BEGIN(machine_check_handle_early)
        /*
         * Go back to winkle. Please note that this thread was woken up in
         * machine check from winkle and have not restored the per-subcore
-        * state. Hence before going back to winkle, set last bit of HSPRG0
-        * to 1. This will make sure that if this thread gets woken up
-        * again at reset vector 0x100 then it will get chance to restore
-        * the subcore state.
+        * state.
         */
-       ori     r13,r13,1
-       SET_PACA(r13)
        IDLE_STATE_ENTER_SEQ_NORET(PPC_WINKLE)
        /* No return */
 4:
index 99de9de7efe7a88802886ac8022de8aa33efe1c5..a80d76f9e961aef497783641ae02f13e7ebb2cfc 100644 (file)
@@ -415,11 +415,12 @@ power9_dd1_recover_paca:
        stb     r0,PACA_NAPSTATELOST(r13)
        blr
 
+/*
+ * Called from reset vector for powersave wakeups.
+ * cr3 - set to gt if waking up with partial/complete hypervisor state loss
+ */
 .global pnv_powersave_wakeup
 pnv_powersave_wakeup:
-BEGIN_FTR_SECTION
-       GET_PACA(r13) /* Restore HSPRG0 to get the winkle bit in r13 */
-END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
        bl      pnv_restore_hyp_resource
 
        li      r0,PNV_THREAD_RUNNING
@@ -446,18 +447,18 @@ END_FTR_SECTION_IFCLR(CPU_FTR_ARCH_300)
  * Check whether we have woken up with hypervisor state loss.
  * If yes, restore hypervisor state and return back to link.
  *
- * r13 - Contents of HSPRG0
  * cr3 - set to gt if waking up with partial/complete hypervisor state loss
  */
 pnv_restore_hyp_resource:
 BEGIN_FTR_SECTION
-BEGIN_FTR_SECTION_NESTED(70)
        mflr    r6
        bl      power9_dd1_recover_paca
        mtlr    r6
-FTR_SECTION_ELSE_NESTED(70)
+FTR_SECTION_ELSE
        ld      r2, PACATOC(r13)
-ALT_FTR_SECTION_END_NESTED_IFSET(CPU_FTR_POWER9_DD1, 70)
+ALT_FTR_SECTION_END_IFSET(CPU_FTR_POWER9_DD1)
+
+BEGIN_FTR_SECTION
        /*
         * POWER ISA 3. Use PSSCR to determine if we
         * are waking up from deep idle state
@@ -480,19 +481,11 @@ END_FTR_SECTION_IFSET(CPU_FTR_ARCH_300)
 
        /*
         * POWER ISA 2.07 or less.
-        * Check if last bit of HSPGR0 is set. This indicates whether we are
-        * waking up from winkle.
+        * Check if we slept with winkle.
         */
-       clrldi  r5,r13,63
-       clrrdi  r13,r13,1
-
-       /* Now that we are sure r13 is corrected, load TOC */
-       ld      r2,PACATOC(r13);
-       cmpwi   cr4,r5,1
-       mtspr   SPRN_HSPRG0,r13
-
        lbz     r0,PACA_THREAD_IDLE_STATE(r13)
        cmpwi   cr2,r0,PNV_THREAD_NAP
+       cmpwi   cr4,r0,PNV_THREAD_WINKLE
        bgt     cr2,pnv_wakeup_tb_loss  /* Either sleep or Winkle */
 
        /*
index b369e39aa39278a320ee57ca8ab1e37fd916c244..445f30a2c5ef280a71a1b23a1b3736b454c07645 100644 (file)
@@ -53,19 +53,6 @@ static int pnv_save_sprs_for_deep_states(void)
                uint64_t pir = get_hard_smp_processor_id(cpu);
                uint64_t hsprg0_val = (uint64_t)&paca[cpu];
 
-               if (!cpu_has_feature(CPU_FTR_ARCH_300)) {
-                       /*
-                        * HSPRG0 is used to store the cpu's pointer to paca.
-                        * Hence last 3 bits are guaranteed to be 0. Program
-                        * slw to restore HSPRG0 with 63rd bit set, so that
-                        * when a thread wakes up at 0x100 we can use this bit
-                        * to distinguish between fastsleep and deep winkle.
-                        * This is not necessary with stop/psscr since PLS
-                        * field of psscr indicates which state we are waking
-                        * up from.
-                        */
-                       hsprg0_val |= 1;
-               }
                rc = opal_slw_set_reg(pir, SPRN_HSPRG0, hsprg0_val);
                if (rc != 0)
                        return rc;