summaryrefslogtreecommitdiffstats
path: root/src/usr/diag/prdf/common
diff options
context:
space:
mode:
authorChris Phan <cphan@us.ibm.com>2014-03-20 12:06:50 -0500
committerA. Patrick Williams III <iawillia@us.ibm.com>2014-04-02 16:00:22 -0500
commit61e5b3d46d89eb026c45e3ac00398ff62069214b (patch)
tree48768612a6267dd1857634fcdb8a69bf5bbc6614 /src/usr/diag/prdf/common
parentcec376b563bafb0c9f7fe4babacdeaa6aed31986 (diff)
downloadtalos-hostboot-61e5b3d46d89eb026c45e3ac00398ff62069214b.tar.gz
talos-hostboot-61e5b3d46d89eb026c45e3ac00398ff62069214b.zip
PRD: add support for PCB Slave internal parity error
Change-Id: Ied0350878079c39e496d9d3713d9221ba9f0fd7f CQ: SW251980 Backport: release-fips810 Reviewed-on: http://gfw160.aus.stglabs.ibm.com:8080/gerrit/9803 Tested-by: Jenkins Server Reviewed-by: Bilicon Patil <bilpatil@in.ibm.com> Reviewed-by: Sachin Gupta <sgupta2m@in.ibm.com> Reviewed-by: Prem Shanker Jha <premjha2@in.ibm.com> Reviewed-by: A. Patrick Williams III <iawillia@us.ibm.com> Reviewed-by: Zane Shelley <zshelle@us.ibm.com> Reviewed-on: http://gfw160.aus.stglabs.ibm.com:8080/gerrit/9972
Diffstat (limited to 'src/usr/diag/prdf/common')
-rwxr-xr-xsrc/usr/diag/prdf/common/plat/pegasus/Proc_acts_TP.rule19
-rwxr-xr-xsrc/usr/diag/prdf/common/plat/pegasus/prdfP8Pll.C382
2 files changed, 346 insertions, 55 deletions
diff --git a/src/usr/diag/prdf/common/plat/pegasus/Proc_acts_TP.rule b/src/usr/diag/prdf/common/plat/pegasus/Proc_acts_TP.rule
index 9389f711f..1f1aaa5dd 100755
--- a/src/usr/diag/prdf/common/plat/pegasus/Proc_acts_TP.rule
+++ b/src/usr/diag/prdf/common/plat/pegasus/Proc_acts_TP.rule
@@ -262,12 +262,12 @@ group gTpLFir filter singlebit
(TpLFir, bit(18)) ? TodReportByPHYP;
/** TP_LFIR[19]
- * Processor PLL error
+ * PCB Slave Internal Parity Error
*
- * These should never trigger directly themselves.
- * Should be handled by global PRD PLL code.
+ * This bit is also shared with the PLL Lock error.
+ * PLL error should already be handled by global PRD PLL code.
*/
- (TpLFir, bit(19)) ? PllError;
+ (TpLFir, bit(19)) ? PcbSlaveInternalParity;
/** TP_LFIR[20]
* Sbe indicated error_event0to4 enabled by mask bit 5 to 9
@@ -1158,12 +1158,17 @@ actionclass analyzeMcs31
analyze(connected(TYPE_MCS, 7));
};
-/** PLL error action */
-actionclass PllError
+# still need to capture PLL FIRs for debugging
+/** PCB Slave Internal parity error action */
+actionclass PcbSlaveInternalParity
{
capture(PllFIRs);
+ calloutSelfHigh;
+ threshold5pday;
+ funccall("AnalyzeParityErr");
funccall("capturePllFfdc");
- threshold32pday;
+ funccall("NoClearFirBits"); # Must be called last so return
+ # code can be passed on to rule code.
};
# TOD Actions:
diff --git a/src/usr/diag/prdf/common/plat/pegasus/prdfP8Pll.C b/src/usr/diag/prdf/common/plat/pegasus/prdfP8Pll.C
index 69e5c8cb6..60946ce03 100755
--- a/src/usr/diag/prdf/common/plat/pegasus/prdfP8Pll.C
+++ b/src/usr/diag/prdf/common/plat/pegasus/prdfP8Pll.C
@@ -59,6 +59,9 @@ enum
PLL_ERROR_BIT = 25,
PB_DMI_RIGHT_PLL_ERROR = 25, // Venice only
PB_DMI_LEFT_PLL_ERROR = 26, // Venice and Murano
+ // PCB Slave internal parity error
+ PARITY_ERROR_MASK = 8,
+ PARITY_ERROR_BIT = 4,
};
/**
@@ -363,78 +366,85 @@ PRDF_PLUGIN_DEFINE( Proc, ClearPll );
/**
* @brief Mask the PLL error for P8 Plugin
* @param i_chip P8 chip
- * @param Output Unused.
+ * @param i_sc The step code data struct
* @returns Failure or Success of query.
* @note
*/
-int32_t MaskPll( ExtensibleChip * i_chip,void * unused)
+int32_t MaskPll( ExtensibleChip * i_chip,
+ STEP_CODE_DATA_STRUCT & i_sc )
{
#define PRDF_FUNC "[Proc::MaskPll] "
int32_t rc = SUCCESS;
- MODEL procModel = getProcModel( i_chip->GetChipHandle() );
- // fence off proc osc error reg bits
- P8DataBundle * procdb = getDataBundle( i_chip );
- P8DataBundle::ProcPllErrRegList & procPllErrRegList =
- procdb->getProcPllErrRegList();
- if( procPllErrRegList.empty() )
- {
- GetProcPllErrRegList( i_chip, procPllErrRegList );
- }
- P8DataBundle::ProcPllErrRegListIter itr = procPllErrRegList.begin();
- for( ; itr != procPllErrRegList.end(); ++itr)
+ if (CHECK_STOP != i_sc.service_data->GetAttentionType())
{
- // Error is already fenced
- if( (*itr).configReg->IsBitSet(PLL_ERROR_MASK) )
+ MODEL procModel = getProcModel( i_chip->GetChipHandle() );
+ // fence off proc osc error reg bits
+ P8DataBundle * procdb = getDataBundle( i_chip );
+ P8DataBundle::ProcPllErrRegList & procPllErrRegList =
+ procdb->getProcPllErrRegList();
+ if( procPllErrRegList.empty() )
{
- continue;
+ GetProcPllErrRegList( i_chip, procPllErrRegList );
}
- bool needMask = false;
- if( P8DataBundle::PB == (*itr).type )
+ P8DataBundle::ProcPllErrRegListIter itr =
+ procPllErrRegList.begin();
+ for( ; itr != procPllErrRegList.end(); ++itr)
{
- if( ((*itr).errReg->IsBitSet(PB_DMI_LEFT_PLL_ERROR)) ||
- (( MODEL_VENICE == procModel) &&
- ( (*itr).errReg->IsBitSet(PB_DMI_RIGHT_PLL_ERROR))) )
+ // Error is already fenced
+ if( (*itr).configReg->IsBitSet(PLL_ERROR_MASK) )
+ {
+ continue;
+ }
+
+ bool needMask = false;
+ if( P8DataBundle::PB == (*itr).type )
+ {
+ if( ((*itr).errReg->IsBitSet(PB_DMI_LEFT_PLL_ERROR)) ||
+ (( MODEL_VENICE == procModel) &&
+ ( (*itr).errReg->IsBitSet(PB_DMI_RIGHT_PLL_ERROR))) )
+ {
+ (*itr).configReg->SetBit(PLL_ERROR_MASK);
+ needMask = true;
+ }
+ }
+ else if( (*itr).errReg->IsBitSet(PLL_ERROR_BIT) )
{
(*itr).configReg->SetBit(PLL_ERROR_MASK);
needMask = true;
}
- }
- else if( (*itr).errReg->IsBitSet(PLL_ERROR_BIT) )
- {
- (*itr).configReg->SetBit(PLL_ERROR_MASK);
- needMask = true;
+
+ if( needMask )
+ {
+ rc |= (*itr).configReg->Write();
+ }
}
- if( needMask )
+ // fence off pci osc error reg bit
+ SCAN_COMM_REGISTER_CLASS * pciErrReg =
+ i_chip->getRegister("PCI_ERROR_REG");
+ SCAN_COMM_REGISTER_CLASS * pciConfigReg =
+ i_chip->getRegister("PCI_CONFIG_REG");
+
+ if(pciErrReg->IsBitSet(PLL_ERROR_BIT) &&
+ !pciConfigReg->IsBitSet(PLL_ERROR_MASK))
{
- rc |= (*itr).configReg->Write();
+ pciConfigReg->SetBit(PLL_ERROR_MASK);
+ rc |= pciConfigReg->Write();
}
- }
- // fence off pci osc error reg bit
- SCAN_COMM_REGISTER_CLASS * pciErrReg =
- i_chip->getRegister("PCI_ERROR_REG");
- SCAN_COMM_REGISTER_CLASS * pciConfigReg =
- i_chip->getRegister("PCI_CONFIG_REG");
+ // Need to clear the PLL Err Reg list so it can
+ // be populated with fresh data on the next analysis
+ // can do this in error case to save some space
+ procPllErrRegList.clear();
- if(pciErrReg->IsBitSet(PLL_ERROR_BIT) &&
- !pciConfigReg->IsBitSet(PLL_ERROR_MASK))
- {
- pciConfigReg->SetBit(PLL_ERROR_MASK);
- rc |= pciConfigReg->Write();
- }
+ // Since TP_LFIR bit is the collection of all of the
+ // pll error reg bits, we can't mask it or we will not
+ // see any PLL errors reported from the error regs
- // Need to clear the PLL Err Reg list so it can
- // be populated with fresh data on the next analysis
- // can do this in error case to save some space
- procPllErrRegList.clear();
-
- // Since TP_LFIR bit is the collection of all of the
- // pll error reg bits, we can't mask it or we will not
- // see any PLL errors reported from the error regs
+ } // if not checkstop
if( rc != SUCCESS )
{
@@ -510,6 +520,282 @@ int32_t capturePllFfdc( ExtensibleChip * i_chip,
}
PRDF_PLUGIN_DEFINE( Proc, capturePllFfdc );
+/**
+ * @brief Check PCB Slave internal parity errors
+ * @param i_chip P8 chip
+ * @param o_parityErr true for parity error, false otherwise
+ * @param io_sc service data collector
+ * @returns FAIL or SUCCESS
+ */
+int32_t CheckParityErr( ExtensibleChip * i_chip,
+ bool & o_parityErr,
+ STEP_CODE_DATA_STRUCT & io_sc )
+{
+ #define PRDF_FUNC "[Proc::CheckParityErr] "
+
+ int32_t rc = SUCCESS;
+ o_parityErr = false;
+ P8DataBundle * procdb = getDataBundle( i_chip );
+ P8DataBundle::ProcPllErrRegList & procPllErrRegList =
+ procdb->getProcPllErrRegList();
+
+ do
+ {
+ // First check PCI chiplet
+ SCAN_COMM_REGISTER_CLASS * pciErrReg =
+ i_chip->getRegister("PCI_ERROR_REG");
+ SCAN_COMM_REGISTER_CLASS * pciConfigReg =
+ i_chip->getRegister("PCI_CONFIG_REG");
+
+ rc = pciErrReg->Read();
+ if (rc != SUCCESS) break;
+
+ rc = pciConfigReg->Read();
+ if (rc != SUCCESS) break;
+
+ if(pciErrReg->IsBitSet(PARITY_ERROR_BIT) &&
+ !pciConfigReg->IsBitSet(PARITY_ERROR_MASK))
+ {
+ o_parityErr = true;
+ break;
+ }
+
+ // Next check other chiplets
+
+ // Always get a list here since this is the entry point
+ GetProcPllErrRegList( i_chip, procPllErrRegList );
+
+ P8DataBundle::ProcPllErrRegListIter itr = procPllErrRegList.begin();
+ for( ; itr != procPllErrRegList.end(); ++itr)
+ {
+ rc = (*itr).errReg->Read();
+ if (rc != SUCCESS) break;
+
+ rc = (*itr).configReg->Read();
+ if (rc != SUCCESS) break;
+
+ if((*itr).errReg->IsBitSet(PARITY_ERROR_BIT) &&
+ !(*itr).configReg->IsBitSet(PARITY_ERROR_MASK))
+ {
+ o_parityErr = true;
+ break;
+ }
+ }
+
+ } while(0);
+
+ if( ! o_parityErr )
+ {
+ PRDF_ERR(PRDF_FUNC"no parity error found for proc: 0x%.8X",
+ i_chip->GetId());
+ }
+
+ if( rc != SUCCESS )
+ {
+ PRDF_ERR(PRDF_FUNC"failed for proc: 0x%.8X", i_chip->GetId());
+ }
+
+ return rc;
+
+ #undef PRDF_FUNC
+}
+
+
+/**
+ * @brief Mask the PCB Slave internal parity error
+ * @param i_chip P8 chip
+ * @param i_sc The step code data struct
+ * @returns Failure or Success
+ */
+int32_t MaskParityErr( ExtensibleChip * i_chip,
+ STEP_CODE_DATA_STRUCT & i_sc)
+{
+ #define PRDF_FUNC "[Proc::MaskParityErr] "
+
+ int32_t rc = SUCCESS;
+
+ if (CHECK_STOP != i_sc.service_data->GetAttentionType())
+ {
+ // fence off proc osc error reg bits
+ P8DataBundle * procdb = getDataBundle( i_chip );
+ P8DataBundle::ProcPllErrRegList & procPllErrRegList =
+ procdb->getProcPllErrRegList();
+
+ if( procPllErrRegList.empty() )
+ {
+ GetProcPllErrRegList( i_chip, procPllErrRegList );
+ }
+
+ P8DataBundle::ProcPllErrRegListIter itr =
+ procPllErrRegList.begin();
+ for( ; itr != procPllErrRegList.end(); ++itr)
+ {
+ // Error is already fenced
+ if( (*itr).configReg->IsBitSet(PARITY_ERROR_MASK) )
+ {
+ continue;
+ }
+
+ if( (*itr).errReg->IsBitSet(PARITY_ERROR_BIT) )
+ {
+ (*itr).configReg->SetBit(PARITY_ERROR_MASK);
+ rc |= (*itr).configReg->Write();
+ }
+ }
+
+ // fence off pci parity error
+ SCAN_COMM_REGISTER_CLASS * pciErrReg =
+ i_chip->getRegister("PCI_ERROR_REG");
+ SCAN_COMM_REGISTER_CLASS * pciConfigReg =
+ i_chip->getRegister("PCI_CONFIG_REG");
+
+ if(pciErrReg->IsBitSet(PARITY_ERROR_BIT) &&
+ !pciConfigReg->IsBitSet(PARITY_ERROR_MASK))
+ {
+ pciConfigReg->SetBit(PARITY_ERROR_MASK);
+ rc |= pciConfigReg->Write();
+ }
+
+ // Since TP_LFIR bit is the collection of all of the
+ // pll error reg bits, we can't mask it or we will not
+ // see any PLL errors reported from the error regs
+
+ } // if not checkstop
+
+ if( rc != SUCCESS )
+ {
+ PRDF_ERR(PRDF_FUNC"failed for proc: 0x%.8X",
+ i_chip->GetId());
+ }
+
+ return rc;
+
+#undef PRDF_FUNC
+}
+
+/**
+ * @brief Clear the Parity errors
+ * @param i_chip P8 chip
+ * @param i_sc The step code data struct
+ * @returns Failure or Success
+ */
+int32_t ClearParityErr( ExtensibleChip * i_chip,
+ STEP_CODE_DATA_STRUCT & i_sc)
+{
+ #define PRDF_FUNC "[Proc::ClearParityErr] "
+
+ int32_t rc = SUCCESS;
+
+ if (CHECK_STOP != i_sc.service_data->GetAttentionType())
+ {
+ // Clear proc osc error reg bits
+ P8DataBundle * procdb = getDataBundle( i_chip );
+ P8DataBundle::ProcPllErrRegList & procPllErrRegList =
+ procdb->getProcPllErrRegList();
+ if( procPllErrRegList.empty() )
+ {
+ GetProcPllErrRegList( i_chip, procPllErrRegList );
+ }
+
+ P8DataBundle::ProcPllErrRegListIter itr = procPllErrRegList.begin();
+ for( ; itr != procPllErrRegList.end(); ++itr)
+ {
+ (*itr).errReg->ClearBit(PARITY_ERROR_BIT);
+ rc |= (*itr).errReg->Write();
+ }
+
+ // Clear pci parity error
+ SCAN_COMM_REGISTER_CLASS * pciErrReg =
+ i_chip->getRegister("PCI_ERROR_REG");
+ pciErrReg->ClearBit(PARITY_ERROR_BIT);
+ rc |= pciErrReg->Write();
+
+ // Clear TP_LFIR
+ SCAN_COMM_REGISTER_CLASS * TP_LFIR =
+ i_chip->getRegister("TP_LFIR_AND");
+ TP_LFIR->setAllBits();
+ // Parity error also feeds into this LFIR
+ TP_LFIR->ClearBit(PLL_DETECT_P8);
+ rc |= TP_LFIR->Write();
+ }
+
+ if( rc != SUCCESS )
+ {
+ PRDF_ERR(PRDF_FUNC"failed for proc: 0x%.8X",
+ i_chip->GetId());
+ }
+
+ return rc;
+
+ #undef PRDF_FUNC
+}
+
+
+/**
+ * @brief analyze PCB Slave internal parity errors
+ * @param i_chip P8 chip
+ * @param io_sc service data collector
+ * @returns Failure or Success
+ */
+int32_t AnalyzeParityErr( ExtensibleChip * i_chip,
+ STEP_CODE_DATA_STRUCT & io_sc )
+{
+ #define PRDF_FUNC "[Proc::AnalyzeParityErr] "
+
+ int32_t rc = SUCCESS;
+ bool found = false;
+
+ do
+ {
+ rc = CheckParityErr(i_chip, found, io_sc);
+ if (rc != SUCCESS) break;
+
+ if(found)
+ {
+ if(io_sc.service_data->IsAtThreshold())
+ {
+ MaskParityErr( i_chip, io_sc );
+ }
+
+ ClearParityErr( i_chip, io_sc );
+ }
+
+ } while(0);
+
+ // clear the PLL Err Reg list
+ P8DataBundle * procdb = getDataBundle( i_chip );
+ P8DataBundle::ProcPllErrRegList & procPllErrRegList =
+ procdb->getProcPllErrRegList();
+ procPllErrRegList.clear();
+
+ if( rc != SUCCESS )
+ {
+ PRDF_ERR(PRDF_FUNC"failed for proc: 0x%.8X", i_chip->GetId());
+ }
+
+ return rc;
+
+ #undef PRDF_FUNC
+}
+PRDF_PLUGIN_DEFINE( Proc, AnalyzeParityErr );
+
+/**
+ * @brief There are some FIR bits that will be cleared manually and must not be
+ * cleared by the framework code. The plugin forces the rule code to
+ * analyze a special copy of the FIR which will not automatically clear
+ * the FIR bits at attention.
+ * @param i_chip P8 chip.
+ * @param i_sc The step code data struct.
+ * @return PRD_NO_CLEAR_FIR_BITS always.
+ */
+int32_t NoClearFirBits( ExtensibleChip * i_chip,
+ STEP_CODE_DATA_STRUCT & i_sc )
+{
+ return PRD_NO_CLEAR_FIR_BITS;
+}
+PRDF_PLUGIN_DEFINE( Proc, NoClearFirBits );
+
+
} // end namespace Proc
} // end namespace PRDF
OpenPOWER on IntegriCloud