[Skiboot] [PATCH 13/14] opal/hmi: check thread 0 tfmr to validate latched tfmr errors.
Mahesh J Salgaonkar
mahesh at linux.vnet.ibm.com
Wed Mar 14 21:08:43 AEDT 2018
From: Mahesh Salgaonkar <mahesh at linux.vnet.ibm.com>
Due to P9 errata, HDEC parity and TB residue errors are latched for
non-zero threads 1-3 even if they are cleared. But these are not
latched on thread 0. Hence, use xscom SCOMC/SCOMD to read thread 0 tfmr
value and ignore them on non-zero threads if they are not present on
thread 0.
Signed-off-by: Mahesh Salgaonkar <mahesh at linux.vnet.ibm.com>
---
core/hmi.c | 61 ++++++++++++++++++++++++++++++++---------------
include/xscom-p9-regs.h | 8 ++++++
2 files changed, 50 insertions(+), 19 deletions(-)
diff --git a/core/hmi.c b/core/hmi.c
index 2e0fa0773..ef9c9c169 100644
--- a/core/hmi.c
+++ b/core/hmi.c
@@ -22,6 +22,7 @@
#include <processor.h>
#include <chiptod.h>
#include <xscom.h>
+#include <xscom-p9-regs.h>
#include <pci.h>
#include <cpu.h>
#include <chip.h>
@@ -1012,6 +1013,45 @@ error_out:
return recover;
}
+static uint64_t read_tfmr_t0(void)
+{
+ uint64_t tfmr_t0;
+ uint32_t chip_id = this_cpu()->chip_id;
+ uint32_t core_id = pir_to_core_id(this_cpu()->pir);
+
+ lock(&hmi_lock);
+
+ xscom_write(chip_id, XSCOM_ADDR_P9_EC(core_id, P9_SCOM_SPRC),
+ SETFIELD(P9_SCOMC_SPR_SELECT, 0, P9_SCOMC_TFMR_T0));
+ xscom_read(chip_id, XSCOM_ADDR_P9_EC(core_id, P9_SCOM_SPRD),
+ &tfmr_t0);
+ unlock(&hmi_lock);
+ return tfmr_t0;
+}
+
+/* P9 errata: In theory, an HDEC error is sent to all threads. However,
+ * due to an errata on P9 where TFMR bit 26 (HDEC parity) cannot be
+ * cleared on thread 1..3, I am not confident we can do a rendez-vous
+ * in all cases.
+ *
+ * Our current approach is to ignore that error unless it is present
+ * on thread 0 TFMR. Also, ignore TB residue error due to a similar
+ * errata as above.
+ */
+static void validate_latched_errors(uint64_t *tfmr)
+{
+ if ((*tfmr & (SPR_TFMR_HDEC_PARITY_ERROR | SPR_TFMR_TB_RESIDUE_ERR))
+ && this_cpu()->is_secondary) {
+ uint64_t tfmr_t0 = read_tfmr_t0();
+
+ if (!(tfmr_t0 & SPR_TFMR_HDEC_PARITY_ERROR))
+ *tfmr &= ~SPR_TFMR_HDEC_PARITY_ERROR;
+
+ if (!(tfmr_t0 & SPR_TFMR_TB_RESIDUE_ERR))
+ *tfmr &= ~SPR_TFMR_TB_RESIDUE_ERR;
+ }
+}
+
static int handle_tfac_errors(struct OpalHMIEvent *hmi_evt, uint64_t *out_flags)
{
int recover = -1;
@@ -1028,25 +1068,8 @@ static int handle_tfac_errors(struct OpalHMIEvent *hmi_evt, uint64_t *out_flags)
this_cpu()->tb_invalid = !(tfmr & SPR_TFMR_TB_VALID);
- /* P9 errata: In theory, an HDEC error is sent to all threads. However,
- * due to an errata on P9 where TFMR bit 26 (HDEC parity) cannot be
- * cleared on thread 1..3, I am not confident we can do a rendez-vous
- * in all cases.
- *
- * Our current approach is to ignore that error unless no other TFAC
- * error is present in the TFMR. The error will be re-detected and
- * re-reported if necessary.
- */
- if (proc_gen == proc_gen_p9 && (tfmr & SPR_TFMR_HDEC_PARITY_ERROR)) {
- if (this_cpu()->tb_invalid || (tfmr & SPR_TFMR_OTHER_ERRORS))
- tfmr &= ~SPR_TFMR_HDEC_PARITY_ERROR;
- }
-
- /* The TB residue error is ignored if TB is valid due to a similar
- * errata as above
- */
- if ((tfmr & SPR_TFMR_TB_RESIDUE_ERR) && !this_cpu()->tb_invalid)
- tfmr &= ~SPR_TFMR_TB_RESIDUE_ERR;
+ if (proc_gen == proc_gen_p9)
+ validate_latched_errors(&tfmr);
/* First, handle thread local errors */
if (tfmr & SPR_TFMR_THREAD_ERRORS) {
diff --git a/include/xscom-p9-regs.h b/include/xscom-p9-regs.h
index 4738e812c..c3322499f 100644
--- a/include/xscom-p9-regs.h
+++ b/include/xscom-p9-regs.h
@@ -21,4 +21,12 @@
#define P9_GPIO_DATA_OUT_ENABLE 0x00000000000B0054ull
#define P9_GPIO_DATA_OUT 0x00000000000B0051ull
+/* xscom address for SCOM Control and data Register */
+/* bits 54:60 of SCOM SPRC register is used for core specific SPR selection. */
+#define P9_SCOM_SPRC 0x20010A80
+#define P9_SCOMC_SPR_SELECT PPC_BITMASK(54, 60)
+#define P9_SCOMC_TFMR_T0 0x8 /* 0b0001000 TFMR */
+
+#define P9_SCOM_SPRD 0x20010A81
+
#endif /* __XSCOM_P9_REGS_H__ */
More information about the Skiboot
mailing list