diff options
author | Caleb Palmer <cnpalmer@us.ibm.com> | 2017-10-17 08:52:00 -0500 |
---|---|---|
committer | Zane C. Shelley <zshelle@us.ibm.com> | 2017-10-19 10:58:01 -0400 |
commit | c32b7f744b357f2b65dbcdeb624333032899912a (patch) | |
tree | ca7f2769c7be04a8cce3f07869ec722d5ae9305a /src/usr/diag/prdf/common | |
parent | 4b0e1b579ebe1f7df2b4c88e2cef7212d9e8032f (diff) | |
download | talos-hostboot-c32b7f744b357f2b65dbcdeb624333032899912a.tar.gz talos-hostboot-c32b7f744b357f2b65dbcdeb624333032899912a.zip |
PRD: Missing errl for IUEs because of port fail
Change-Id: I0c3af0033a2898b0fc655b2b1774ab03d1a7430c
CQ: SW391845
Reviewed-on: http://ralgit01.raleigh.ibm.com/gerrit1/48496
Tested-by: Jenkins Server <pfd-jenkins+hostboot@us.ibm.com>
Reviewed-by: Benjamin J. Weisenbeck <bweisenb@us.ibm.com>
Reviewed-by: Zane C. Shelley <zshelle@us.ibm.com>
Reviewed-on: http://ralgit01.raleigh.ibm.com/gerrit1/48584
Tested-by: Jenkins OP Build CI <op-jenkins+hostboot@us.ibm.com>
Tested-by: Jenkins OP HW <op-hw-jenkins+hostboot@us.ibm.com>
Tested-by: FSP CI Jenkins <fsp-CI-jenkins+hostboot@us.ibm.com>
Diffstat (limited to 'src/usr/diag/prdf/common')
-rw-r--r-- | src/usr/diag/prdf/common/plat/mem/prdfMemEccAnalysis.C | 39 |
-rw-r--r-- | src/usr/diag/prdf/common/plat/mem/prdfP9McaDataBundle.H | 3 |
2 files changed, 42 insertions, 0 deletions
diff --git a/src/usr/diag/prdf/common/plat/mem/prdfMemEccAnalysis.C b/src/usr/diag/prdf/common/plat/mem/prdfMemEccAnalysis.C index 9fd6324b6..18cc52c6d 100644 --- a/src/usr/diag/prdf/common/plat/mem/prdfMemEccAnalysis.C +++ b/src/usr/diag/prdf/common/plat/mem/prdfMemEccAnalysis.C @@ -173,6 +173,24 @@ uint32_t maskMemPort<TYPE_MCA>( ExtensibleChip * i_chip ) c->setAllBits(); d->setAllBits(); e->setAllBits(); + // We don't want to mask the IUE bits in the MCAECCFIR if they are on + // so if we trigger a port fail that causes a checkstop we have + // something to blame it on. + SCAN_COMM_REGISTER_CLASS * mcaeccfir = i_chip->getRegister("MCAECCFIR"); + + o_rc = mcaeccfir->Read(); + if ( SUCCESS != o_rc ) + { + PRDF_ERR( PRDF_FUNC "Read() Failed on MCAECCFIR: i_chip=0x%08x", + i_chip->getHuid() ); + break; + } + + if ( mcaeccfir->IsBitSet(17) ) + e->ClearBit(17); + if ( mcaeccfir->IsBitSet(37) ) + e->ClearBit(37); + o_rc = c->Write() | d->Write() | e->Write(); if ( SUCCESS != o_rc ) { @@ -256,6 +274,9 @@ uint32_t iuePortFail<TYPE_MCA>( ExtensibleChip * i_chip, { resetTh.second.reset(); } + + db->iv_iuePortFail = true; + break; } } @@ -751,6 +772,24 @@ uint32_t handleMemIue( ExtensibleChip * i_chip, const MemRank & i_rank, // Get the data bundle from chip. D db = static_cast<D>( i_chip->getDataBundle() ); + // If we have already caused a port fail, mask the IUE bits. + if ( true == db->iv_iuePortFail ) + { + SCAN_COMM_REGISTER_CLASS * mask_or = + i_chip->getRegister("MCAECCFIR_MASK_OR"); + + mask_or->SetBit(17); + mask_or->SetBit(37); + + o_rc = mask_or->Write(); + if ( SUCCESS != o_rc ) + { + PRDF_ERR( PRDF_FUNC "Write() failed on 0x%08x", + i_chip->getHuid() ); + break; + } + } + // Get the DIMM select. 
uint8_t ds = i_rank.getDimmSlct(); diff --git a/src/usr/diag/prdf/common/plat/mem/prdfP9McaDataBundle.H b/src/usr/diag/prdf/common/plat/mem/prdfP9McaDataBundle.H index a43486fdf..4d3c4fa02 100644 --- a/src/usr/diag/prdf/common/plat/mem/prdfP9McaDataBundle.H +++ b/src/usr/diag/prdf/common/plat/mem/prdfP9McaDataBundle.H @@ -190,6 +190,9 @@ class McaDataBundle : public DataBundle /** Threshold table for IUEs. Threshold per DIMM */ std::map<uint8_t, TimeBasedThreshold> iv_iueTh; + /** Bool to indicate if we've triggered a port fail because of IUEs. */ + bool iv_iuePortFail = false; + #endif #ifdef __HOSTBOOT_RUNTIME |