summaryrefslogtreecommitdiffstats
path: root/hw
diff options
context:
space:
mode:
authorRussell Currey <ruscur@russell.cc>2016-01-18 16:59:41 +1100
committerStewart Smith <stewart@linux.vnet.ibm.com>2016-01-21 11:59:47 +1100
commit526a1705aba57ac151f43245ae0628beb0a791ac (patch)
tree44fb2f1ec118fc86ab6fdc99a9f5db2cd629b54a /hw
parent04b200ce1eaaedaf425a49cc5369941fd837331d (diff)
downloadtalos-skiboot-526a1705aba57ac151f43245ae0628beb0a791ac.tar.gz
talos-skiboot-526a1705aba57ac151f43245ae0628beb0a791ac.zip
nvlink: Add freeze and fence error injection
Enable NPU freeze and fence injection through debugfs.

For example, if an NPU is PCI bus 8, a freeze on PE 1 can be injected with:

    echo 1:0:0:0:0 >> /sys/kernel/debug/powerpc/PCI0008/err_injct

or a fence on PE 2 on PCI bus 9 with:

    echo 2:1:0:0:0 >> /sys/kernel/debug/powerpc/PCI0009/err_injct

These will cause the appropriate EEH event to occur upon a DMA to the NVLink.

PE number was added to the npu_dev struct to enable this.

Signed-off-by: Russell Currey <ruscur@russell.cc>
Acked-By: Alistair Popple <alistair@popple.id.au>
Signed-off-by: Stewart Smith <stewart@linux.vnet.ibm.com>
Diffstat (limited to 'hw')
-rw-r--r--hw/npu.c44
1 files changed, 43 insertions, 1 deletions
diff --git a/hw/npu.c b/hw/npu.c
index 3c2c0b8f..23facaf2 100644
--- a/hw/npu.c
+++ b/hw/npu.c
@@ -954,6 +954,7 @@ static int64_t npu_set_pe(struct phb *phb,
return OPAL_PARAMETER;
link_idx = dev->index;
+ dev->pe_num = pe_num;
/* Separate links will be mapped to different PEs */
if (bcompare != OpalPciBusAll ||
@@ -1020,6 +1021,47 @@ static int64_t npu_freeze_status(struct phb *phb,
return OPAL_SUCCESS;
}
+/*
+ * Sets the NPU to trigger an error when a DMA occurs.
+ *
+ * phb    - PHB backing the NPU; converted with phb_to_npu().
+ * pe_num - PE whose device should take the error. Must be below
+ *          NPU_NUM_OF_PES and match the pe_num recorded on one of
+ *          the NPU's devices.
+ * type   - 0 injects a freeze, 1 injects a fence; anything else is
+ *          rejected.
+ * func, addr, mask - accepted for the err_inject callback signature
+ *          but currently ignored.
+ *
+ * Returns OPAL_SUCCESS once the error has been armed, or
+ * OPAL_PARAMETER if the PE number is out of range, no device is
+ * mapped to that PE, or the injection type is not supported.
+ */
+static int64_t npu_err_inject(struct phb *phb, uint32_t pe_num,
+			      uint32_t type, uint32_t func __unused,
+			      uint64_t addr __unused, uint64_t mask __unused)
+{
+	struct npu *p = phb_to_npu(phb);
+	struct npu_dev *dev = NULL;
+	int i;
+
+	/* Valid PE numbers are 0 .. NPU_NUM_OF_PES - 1 */
+	if (pe_num >= NPU_NUM_OF_PES) {
+		prlog(PR_ERR, "NPU: error injection failed, bad PE given\n");
+		return OPAL_PARAMETER;
+	}
+
+	/* Find the first device that has been assigned to this PE */
+	for (i = 0; i < p->total_devices; i++) {
+		if (p->devices[i].pe_num == pe_num) {
+			dev = &p->devices[i];
+			break;
+		}
+	}
+
+	if (!dev) {
+		prlog(PR_ERR, "NPU: couldn't find device with PE %x\n", pe_num);
+		return OPAL_PARAMETER;
+	}
+
+	/* TODO: extend this to conform to OPAL injection standards */
+	if (type > 1) {
+		prlog(PR_ERR, "NPU: invalid error injection type\n");
+		return OPAL_PARAMETER;
+	} else if (type == 1) {
+		/* Emulate fence mode: the flag applies to the whole NPU. */
+		p->fenced = true;
+	} else {
+		/*
+		 * Cause a freeze with an invalid MMIO read of the
+		 * device's BAR; the value read is deliberately discarded.
+		 */
+		in_be64((void *)dev->bar.base);
+	}
+
+	return OPAL_SUCCESS;
+}
+
static const struct phb_ops npu_ops = {
.lock = npu_lock,
.unlock = npu_unlock,
@@ -1059,7 +1101,7 @@ static const struct phb_ops npu_ops = {
.eeh_freeze_clear = NULL,
.eeh_freeze_set = NULL,
.next_error = NULL,
- .err_inject = NULL,
+ .err_inject = npu_err_inject,
.get_diag_data = NULL,
.get_diag_data2 = NULL,
.set_capi_mode = NULL,
OpenPOWER on IntegriCloud