On Wed, 2017-09-13 at 02:05 +1000, Nicholas Piggin wrote:
> This implements a way to raise system reset interrupts on other
> cores. This has not yet been tested on DD2 or with deeper sleep
> states.

Reminds me, we need to workaround a bug with XSCOMs on P9

PSCOMs to core in the range 20010A80-20010Ab8 (list below) can fail
occasionally with an error of 4 (PCB_ADDRESS_ERROR). We need to
(silently) retry up to 32 times.

> 0000000020010A80 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SCOMC
> 0000000020010A81 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SCOMD
> 0000000020010A82 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.OCC_SCOMC
> 0000000020010A83 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.OCC_SCOMD
> 0000000020010A84 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SPR_MODE
> 0000000020010A85 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.CTRL
> 0000000020010A86 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SCR0
> 0000000020010A87 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SCR1
> 0000000020010A88 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SCR2
> 0000000020010A89 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SCR3
> 0000000020010A8E EXP.EC.CC.PCC0.COMMON.SPR_COMMON.V0_HMER
> 0000000020010A92 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.V0_HMER
> 0000000020010A8F EXP.EC.CC.PCC0.COMMON.SPR_COMMON.V1_HMER
> 0000000020010A93 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.V1_HMER
> 0000000020010A90 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.V2_HMER
> 0000000020010A94 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.V2_HMER
> 0000000020010A91 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.V3_HMER
> 0000000020010A95 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.V3_HMER
> 0000000020010A96 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.HMEER
> 0000000020010A97 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SPATTN
> 0000000020010A98 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SPATTN
> 0000000020010A99 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SPATTN
> 0000000020010A9A EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SPATTN_MASK
> 0000000020010A9B EXP.EC.CC.PCC0.PMC.THREAD_INFO
> 0000000020010A9C EXP.EC.CC.PCC0.PMC.DIRECT_CONTROLS
> 0000000020010A9D ECP.PC.PMU.SPR_CORE.RAS_MODEREG
> 0000000020010A9E EXP.EC.CC.PCC0.COMMON.POW.THROTTLE_CONTROL
> 0000000020010A9F EXP.EC.CC.PCC0.TFDP.TFP.SPURR_FREQ_DETECT_CYC_CNT
> 0000000020010AA0 EXP.EC.CC.PCC0.TFDP.TFP.SPURR_FREQ_SCALE
> 0000000020010AA1 EXP.EC.CC.PCC0.TFDP.TFP.SPURR_FREQ_REF
> 0000000020010AA2 EXP.EC.CC.PCC0.TFDP.TFP.PWM_EVENTS
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_READ
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_SYNC000
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_SYNC001
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_SYNC010
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_SYNC011
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_SYNC100
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_SYNC101
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_SYNC110
> 0000000020010AA3 EXP.EC.CC.PCC0.TOD_SYNC111
> 0000000020010AA4 EXP.EC.CC.PCC0.COMMON.TFC.TOD_STEP_CHECK
> 0000000020010AA5 ECP.PC.PMU.SPR_CORE.SHID0
> 0000000020010AA6 ECP.PC.PMU.SPR_CORE.HV_STATE
> 0000000020010AA7 ECP.PC.PMU.SPR_CORE.CORE_FUSES
> 0000000020010AA8 ECP.PC.IMA.IMA_EVENT_MASK
> 0000000020010AA9 ECP.PC.IMA.IMA_TRACE
> 0000000020010AAA ECP.PC.T0_PMU_SCOM
> 0000000020010AAB ECP.PC.T1_PMU_SCOM
> 0000000020010AAC ECP.PC.T2_PMU_SCOM
> 0000000020010AAD ECP.PC.T3_PMU_SCOM
> 0000000020010AAE ECP.PC.PMU.PMUC.SIER_MASK
> 0000000020010AAF ECP.PC.PMU.PMUC.SRC_MASK
> 0000000020010AB0 ECP.PC.PMU.SPR_CORE.PMU_SCOMC
> 0000000020010AB2 ECP.PC.PMU.SPR_CORE.PMU_SCOMC_EN
> 0000000020010AB3 EXP.EC.CC.PCC0.PMC.CORE_THREAD_STATE
> 0000000020010AB4 ECP.PC.PMU.SPR_CORE.INV_ERATE
> 0000000020010AB5 ECP.PC.PMU.SPR_CORE.SPR_CORE_HOLD_OUT
> 0000000020010AB6 ECP.PC.PMU.SPR_CORE.PMU_HOLD_OUT
> 0000000020010AB7 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.TFAC_HOLD_OUT
> 0000000020010AB8 EXP.EC.CC.PCC0.COMMON.SPR_COMMON.SPR_COMMON_HOLD_OUT 
> ---
>  core/Makefile.inc       |   1 +
>  core/sreset.c           | 237 
> ++++++++++++++++++++++++++++++++++++++++++++++++
>  hw/xscom.c              |   2 +
>  include/skiboot.h       |   3 +
>  platforms/mambo/mambo.c |   3 +-
>  5 files changed, 245 insertions(+), 1 deletion(-)
>  create mode 100644 core/sreset.c
> 
> diff --git a/core/Makefile.inc b/core/Makefile.inc
> index f2de2f64..16204978 100644
> --- a/core/Makefile.inc
> +++ b/core/Makefile.inc
> @@ -9,6 +9,7 @@ CORE_OBJS += vpd.o hostservices.o platform.o nvram.o 
> nvram-format.o hmi.o
>  CORE_OBJS += console-log.o ipmi.o time-utils.o pel.o pool.o errorlog.o
>  CORE_OBJS += timer.o i2c.o rtc.o flash.o sensor.o ipmi-opal.o
>  CORE_OBJS += flash-subpartition.o bitmap.o buddy.o pci-quirk.o powercap.o 
> psr.o
> +CORE_OBJS += sreset.o
>  
>  ifeq ($(SKIBOOT_GCOV),1)
>  CORE_OBJS += gcov-profiling.o
> diff --git a/core/sreset.c b/core/sreset.c
> new file mode 100644
> index 00000000..ff20fe71
> --- /dev/null
> +++ b/core/sreset.c
> @@ -0,0 +1,237 @@
> +/* Copyright 2017 IBM Corp.
> + *
> + * Licensed under the Apache License, Version 2.0 (the "License");
> + * you may not use this file except in compliance with the License.
> + * You may obtain a copy of the License at
> + *
> + *   http://www.apache.org/licenses/LICENSE-2.0
> + *
> + * Unless required by applicable law or agreed to in writing, software
> + * distributed under the License is distributed on an "AS IS" BASIS,
> + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
> + * implied.
> + * See the License for the specific language governing permissions and
> + * limitations under the License.
> + */
> +
> +#include <skiboot.h>
> +#include <cpu.h>
> +#include <fsp.h>
> +#include <psi.h>
> +#include <opal.h>
> +#include <xscom.h>
> +#include <interrupts.h>
> +#include <cec.h>
> +#include <timebase.h>
> +#include <pci.h>
> +#include <chip.h>
> +#include <chiptod.h>
> +#include <ipmi.h>
> +
> +#define P9_RAS_STATUS                        0x10a02
> +#define P9_RSTAT_QUIESCED(t)         PPC_BITMASK(0 + 8*(t), 3 + 8*(t))
> +#define P9_RAS_MODEREG                       0x10a9d
> +#define P9_DIRECT_CONTROLS           0x10a9c
> +#define P9_DCTL_STOP(t)                      PPC_BIT(7 + 8*(t))
> +#define P9_DCTL_CONT(t)                      PPC_BIT(6 + 8*(t))
> +#define P9_DCTL_SRESET(t)            PPC_BIT(4 + 8*(t))
> +#define P9_DCTL_PWR(t)                       PPC_BIT(32 + 8*(t))
> +
> +#define P9_CORE_THREAD_STATE         0x10ab3
> +#define P9_CTS_STOP(t)                       PPC_BIT(56 + (t))
> +
> +#define PPM_GPMMR                    0xf0100
> +#define PPM_SPWKUP_OTR                       0xf010a
> +#define SPECIAL_WKUP_DONE            PPC_BIT(1)
> +
> +
> +static int core_set_special_wakeup(struct cpu_thread *cpu)
> +{
> +     uint32_t chip_id = pir_to_chip_id(cpu->pir);
> +     uint32_t core_id = pir_to_core_id(cpu->pir);
> +     uint32_t swake_addr;
> +     uint32_t gpmmr_addr;
> +     uint64_t val;
> +     int i;
> +
> +     swake_addr = XSCOM_ADDR_P9_EC(core_id, PPM_SPWKUP_OTR);
> +     gpmmr_addr = XSCOM_ADDR_P9_EC(core_id, PPM_GPMMR);
> +
> +     xscom_read(chip_id, swake_addr, &val);
> +     if (xscom_write(chip_id, swake_addr, PPC_BIT(0))) {
> +             prlog(PR_WARNING, "SRESET: Unable to write SPWKUP_OTR 
> register\n");
> +             return OPAL_HARDWARE;
> +     }
> +     xscom_read(chip_id, swake_addr, &val);
> +
> +     for (i = 0; i < 100; i++) {
> +             if (xscom_read(chip_id, gpmmr_addr, &val)) {
> +                     prlog(PR_WARNING, "SRESET: Unable to read GPMMR 
> register\n");
> +                     return OPAL_HARDWARE;
> +             }
> +             if (val & SPECIAL_WKUP_DONE)
> +                     return 0;
> +
> +             time_wait_us(1);
> +     }
> +
> +     xscom_read(chip_id, swake_addr, &val);
> +     xscom_write(chip_id, swake_addr, 0);
> +     xscom_read(chip_id, swake_addr, &val);
> +
> +     prlog(PR_WARNING, "SRESET: Special wakeup mode could not be set.\n");
> +     return OPAL_HARDWARE;
> +}
> +
> +static void core_clear_special_wakeup(struct cpu_thread *cpu)
> +{
> +     uint32_t chip_id = pir_to_chip_id(cpu->pir);
> +     uint32_t core_id = pir_to_core_id(cpu->pir);
> +     uint32_t swake_addr;
> +     uint64_t val;
> +
> +     swake_addr = XSCOM_ADDR_P9_EC(core_id, PPM_SPWKUP_OTR);
> +
> +     /* De-assert special wakeup bit */
> +     xscom_read(chip_id, swake_addr, &val);
> +     xscom_write(chip_id, swake_addr, 0);
> +     xscom_read(chip_id, swake_addr, &val);
> +}
> +
> +static int thread_quiesced(struct cpu_thread *cpu)
> +{
> +     uint32_t chip_id = pir_to_chip_id(cpu->pir);
> +     uint32_t core_id = pir_to_core_id(cpu->pir);
> +     uint32_t thread_id = pir_to_thread_id(cpu->pir);
> +     uint32_t ras_addr;
> +     uint64_t ras_status;
> +
> +     ras_addr = XSCOM_ADDR_P9_EC(core_id, P9_RAS_STATUS);
> +     if (xscom_read(chip_id, ras_addr, &ras_status)) {
> +             prlog(PR_WARNING, "SRESET: Unable to read status register\n");
> +             return OPAL_HARDWARE;
> +     }
> +
> +     if ((ras_status & P9_RSTAT_QUIESCED(thread_id))
> +                     == P9_RSTAT_QUIESCED(thread_id))
> +             return 1;
> +
> +     return 0;
> +}
> +
> +static int stop_thread(struct cpu_thread *cpu)
> +{
> +     uint32_t chip_id = pir_to_chip_id(cpu->pir);
> +     uint32_t core_id = pir_to_core_id(cpu->pir);
> +     uint32_t thread_id = pir_to_thread_id(cpu->pir);
> +     uint32_t dctl_addr;
> +     int i;
> +
> +     dctl_addr = XSCOM_ADDR_P9_EC(core_id, P9_DIRECT_CONTROLS);
> +
> +     xscom_write(chip_id, dctl_addr, P9_DCTL_STOP(thread_id));
> +
> +     for (i = 0; i < 100; i++) {
> +             int rc = thread_quiesced(cpu);
> +             if (rc < 0)
> +                     break;
> +             if (rc)
> +                     return 0;
> +     }
> +
> +     xscom_write(chip_id, dctl_addr, P9_DCTL_CONT(thread_id));
> +     prlog(PR_WARNING, "SRESET: Could not quiesce thread\n");
> +     return OPAL_HARDWARE;
> +}
> +
> +static int sreset_thread(struct cpu_thread *cpu)
> +{
> +     uint32_t chip_id = pir_to_chip_id(cpu->pir);
> +     uint32_t core_id = pir_to_core_id(cpu->pir);
> +     uint32_t thread_id = pir_to_thread_id(cpu->pir);
> +     uint32_t dctl_addr;
> +     uint32_t cts_addr;
> +     uint64_t cts_val;
> +
> +     dctl_addr = XSCOM_ADDR_P9_EC(core_id, P9_DIRECT_CONTROLS);
> +     cts_addr = XSCOM_ADDR_P9_EC(core_id, P9_CORE_THREAD_STATE);
> +
> +     if (xscom_read(chip_id, cts_addr, &cts_val)) {
> +             prlog(PR_WARNING, "SRESET: Unable to read CORE_THREAD_STATE 
> register\n");
> +             return OPAL_HARDWARE;
> +     }
> +     if (!(cts_val & P9_CTS_STOP(thread_id))) {
> +             /* Clear SRR1[46:47] */
> +             if (xscom_write(chip_id, dctl_addr, P9_DCTL_PWR(thread_id))) {
> +                     prlog(PR_WARNING, "SRESET: Unable to set power saving 
> mode\n");
> +                     return OPAL_HARDWARE;
> +             }
> +     }
> +
> +     if (xscom_write(chip_id, dctl_addr, P9_DCTL_SRESET(thread_id))) {
> +             prlog(PR_WARNING, "SRESET: Unable to write DIRECT_CONTROLS 
> register\n");
> +             return OPAL_HARDWARE;
> +     }
> +
> +     return 0;
> +}
> +
> +// static struct lock sreset_lock = LOCK_UNLOCKED;
> +
> +static int64_t sreset_cpu(struct cpu_thread *cpu)
> +{
> +     int rc;
> +
> +     if (this_cpu() == cpu) {
> +             prlog(PR_WARNING, "SRESET: Unable to reset self\n");
> +             return OPAL_UNSUPPORTED;
> +     }
> +     if (this_cpu()->primary == cpu->primary) {
> +             prlog(PR_WARNING, "SRESET: Unable to reset threads on same 
> core\n");
> +             return OPAL_PARTIAL;
> +     }
> +
> +     rc = thread_quiesced(cpu);
> +     if (rc < 0)
> +             return rc;
> +     if (rc) {
> +             prlog(PR_WARNING, "SRESET: Thread is quiesced already\n");
> +             return OPAL_WRONG_STATE;
> +     }
> +
> +     rc = core_set_special_wakeup(cpu);
> +     if (rc)
> +             return rc;
> +
> +     rc = stop_thread(cpu);
> +     if (rc) {
> +             core_clear_special_wakeup(cpu);
> +             return rc;
> +     }
> +
> +     rc = sreset_thread(cpu);
> +
> +     core_clear_special_wakeup(cpu);
> +
> +     return 0;
> +}
> +
> +int64_t signal_system_reset(int cpu_nr)
> +{
> +     struct cpu_thread *cpu;
> +
> +     if (proc_gen != proc_gen_p9)
> +             return OPAL_UNSUPPORTED;
> +
> +     /* Reset a single CPU */
> +     if (cpu_nr >= 0) {
> +             cpu = find_cpu_by_server(cpu_nr);
> +             if (!cpu) {
> +                     printf("SRESET: could not find cpu by server %d\n", 
> cpu_nr);
> +                     return OPAL_PARAMETER;
> +             }
> +             return sreset_cpu(cpu);
> +     }
> +     printf("SRESET: unsupported %d\n", cpu_nr);
> +     return OPAL_PARTIAL;
> +}
> diff --git a/hw/xscom.c b/hw/xscom.c
> index 7bd78bf9..f3e04291 100644
> --- a/hw/xscom.c
> +++ b/hw/xscom.c
> @@ -705,6 +705,8 @@ static void xscom_init_chip_info(struct proc_chip *chip)
>               printf("P9 DD%i.%i%d detected\n", 0xf & (chip->ec_level >> 4),
>                      chip->ec_level & 0xf, rev);
>               chip->ec_rev = rev;
> +
> +             opal_register(OPAL_SIGNAL_SYSTEM_RESET, signal_system_reset, 1);
>       }
>  }
>  
> diff --git a/include/skiboot.h b/include/skiboot.h
> index 4b7d5197..37fd774f 100644
> --- a/include/skiboot.h
> +++ b/include/skiboot.h
> @@ -198,6 +198,9 @@ extern char __sym_map_end[];
>  extern unsigned long get_symbol(unsigned long addr,
>                               char **sym, char **sym_end);
>  
> +/* System reset */
> +extern int64_t signal_system_reset(int cpu_nr);
> +
>  /* Fast reboot support */
>  extern void disable_fast_reboot(const char *reason);
>  extern void fast_reboot(void);
> diff --git a/platforms/mambo/mambo.c b/platforms/mambo/mambo.c
> index cb6e103c..e306ba5c 100644
> --- a/platforms/mambo/mambo.c
> +++ b/platforms/mambo/mambo.c
> @@ -259,7 +259,8 @@ static int64_t mambo_signal_system_reset(int32_t cpu_nr)
>  
>  static void mambo_sreset_init(void)
>  {
> -     opal_register(OPAL_SIGNAL_SYSTEM_RESET, mambo_signal_system_reset, 1);
> +     if (0)
> +             opal_register(OPAL_SIGNAL_SYSTEM_RESET, 
> mambo_signal_system_reset, 1);
>  }
>  
>  static void mambo_platform_init(void)

Reply via email to