Skip to content

Commit

Permalink
PRD: rule updates from RAS XML v91
Browse files Browse the repository at this point in the history
Change-Id: I598ed4a6cd6f4d79008e535e2fad41b647ddb2eb
RTC: 175907
Reviewed-on: http://ralgit01.raleigh.ibm.com/gerrit1/41995
Tested-by: Jenkins Server <pfd-jenkins+hostboot@us.ibm.com>
Reviewed-by: Brian J. Stegmiller <bjs@us.ibm.com>
Reviewed-by: Caleb N. Palmer <cnpalmer@us.ibm.com>
Reviewed-by: Benjamin J. Weisenbeck <bweisenb@us.ibm.com>
Reviewed-by: Zane C. Shelley <zshelle@us.ibm.com>
Reviewed-on: http://ralgit01.raleigh.ibm.com/gerrit1/42208
Tested-by: Jenkins OP Build CI <op-jenkins+hostboot@us.ibm.com>
Tested-by: FSP CI Jenkins <fsp-CI-jenkins+hostboot@us.ibm.com>
  • Loading branch information
zane131 committed Jun 22, 2017
1 parent 7d4cab0 commit 6a1bf63
Show file tree
Hide file tree
Showing 9 changed files with 1,982 additions and 1,959 deletions.
20 changes: 10 additions & 10 deletions src/usr/diag/prdf/common/plat/p9/p9_capp.rule
Expand Up @@ -194,7 +194,7 @@ group gCXAFIR filter singlebit, cs_root_cause
/** CXAFIR[4]
* CXA Timer expired recoverable error
*/
(rCXAFIR, bit(4)) ? level2_th_1; # NIMBUS_10
(rCXAFIR, bit(4)) ? level2_th_1;

/** CXAFIR[5]
* Recovery sequencer hang detection
Expand All @@ -204,12 +204,12 @@ group gCXAFIR filter singlebit, cs_root_cause
/** CXAFIR[6]
* XPT saw UE on PB data
*/
(rCXAFIR, bit(6)) ? level2_th_1; # NIMBUS_10
(rCXAFIR, bit(6)) ? level2_th_1;

/** CXAFIR[7]
* XPT saw SUE on PB data
*/
(rCXAFIR, bit(7)) ? level2_th_1; # NIMBUS_10
(rCXAFIR, bit(7)) ? level2_th_1_SUE;

/** CXAFIR[8]
* Correctable error on Snooper array.
Expand Down Expand Up @@ -239,7 +239,7 @@ group gCXAFIR filter singlebit, cs_root_cause
/** CXAFIR[13]
* Recoverable errors detected in Master
*/
(rCXAFIR, bit(13)) ? level2_th_1; # NIMBUS_10
(rCXAFIR, bit(13)) ? level2_th_1;

/** CXAFIR[14]
* spare
Expand Down Expand Up @@ -317,19 +317,19 @@ group gCXAFIR filter singlebit, cs_root_cause
(rCXAFIR, bit(28)) ? defaultMaskedError;

/** CXAFIR[29]
* CXA: PB Addr Error detected by APC on load
* CXA: PB Addr Error detected by APC : ld
*/
(rCXAFIR, bit(29)) ? level2_th_1;

/** CXAFIR[30]
* CXA PB Addr Error detected by APC on store
* CXA PB Addr Err detected by APC : st
*/
(rCXAFIR, bit(30)) ? level2_th_1;

/** CXAFIR[31]
* CXA: PHB0 or PHB1 in linkdown
*/
(rCXAFIR, bit(31)) ? level2_th_1; # NIMBUS_10
(rCXAFIR, bit(31)) ? level2_th_1;

/** CXAFIR[32]
* APC ack_dead or ack_ed_dead
Expand Down Expand Up @@ -359,7 +359,7 @@ group gCXAFIR filter singlebit, cs_root_cause
/** CXAFIR[37]
* CXA: TLBI Timeout error.
*/
(rCXAFIR, bit(37)) ? level2_th_1; # NIMBUS_10
(rCXAFIR, bit(37)) ? level2_th_1;

/** CXAFIR[38]
* CXA: TLBI seq_err.
Expand Down Expand Up @@ -399,12 +399,12 @@ group gCXAFIR filter singlebit, cs_root_cause
/** CXAFIR[45]
* Command_queue_UE
*/
(rCXAFIR, bit(45)) ? self_th_1; # NIMBUS_10
(rCXAFIR, bit(45)) ? self_th_1;

/** CXAFIR[46]
* PSL credit timeout error
*/
(rCXAFIR, bit(46)) ? level2_th_1; # NIMBUS_10
(rCXAFIR, bit(46)) ? level2_th_1;

/** CXAFIR[47]
* spare
Expand Down
19 changes: 13 additions & 6 deletions src/usr/diag/prdf/common/plat/p9/p9_common_actions.rule
Expand Up @@ -108,11 +108,11 @@ actionclass threshold_and_mask
# Special Flags #
################################################################################

/** Set SUE generation point */
actionclass SUEGenerationPoint
{
flag(UERE);
};
/** SUE source: sets the UERE flag, marking this error as the point where the
 *  SUE was generated. */
actionclass SueSource { flag(UERE); };

/** SUE seen: sets the SUE flag, indicating the SUE originated from somewhere
 *  else and was only observed here. */
actionclass SueSeen { flag(SUE); };

################################################################################
# Simple Callouts #
Expand Down Expand Up @@ -143,7 +143,6 @@ actionclass calloutSelfLowNoGard
# Callouts with thresholds #
################################################################################


actionclass self_th_1
{
calloutSelfMed;
Expand Down Expand Up @@ -208,6 +207,14 @@ actionclass level2_M_proc_L_th_1
threshold1;
};

################################################################################
# Callouts with flags #
################################################################################

/** level2_th_1 combined with SueSeen (sets the SUE flag). */
actionclass level2_th_1_SUE { level2_th_1; SueSeen; };
/** self_th_1 combined with SueSeen (sets the SUE flag). */
actionclass self_th_1_SUE { self_th_1; SueSeen; };
/** self_th_1 combined with SueSource (sets the UERE flag). */
actionclass self_th_1_UERE { self_th_1; SueSource; };

################################################################################
# Dump Types #
################################################################################
Expand Down
6 changes: 3 additions & 3 deletions src/usr/diag/prdf/common/plat/p9/p9_ec.rule
Expand Up @@ -559,7 +559,7 @@ group gCOREFIR filter singlebit, cs_root_cause
/** COREFIR[14]
* Machine check and ME = 0 Err
*/
(rCOREFIR, bit(14)) ? self_th_1;
(rCOREFIR, bit(14)) ? self_th_1_SUE;

/** COREFIR[15]
* LSU or IFU detected UE from L2
Expand Down Expand Up @@ -754,12 +754,12 @@ group gCOREFIR filter singlebit, cs_root_cause
/** COREFIR[57]
* Other Core Core Checkstop
*/
(rCOREFIR, bit(57)) ? self_th_1;
(rCOREFIR, bit(57)) ? defaultMaskedError;

/** COREFIR[58]
* Other Core System Checkstop
*/
(rCOREFIR, bit(58)) ? self_th_1;
(rCOREFIR, bit(58)) ? defaultMaskedError;

/** COREFIR[59]
* SCOM error handling
Expand Down
2 changes: 1 addition & 1 deletion src/usr/diag/prdf/common/plat/p9/p9_ex.rule
Expand Up @@ -555,7 +555,7 @@ group gNCUFIR filter singlebit, cs_root_cause( 8 )
/** NCUFIR[8]
* NCU Store Queue Data Parity Err
*/
(rNCUFIR, bit(8)) ? self_th_1;
(rNCUFIR, bit(8)) ? self_th_1_UERE;

/** NCUFIR[9]
* store timed out on pb
Expand Down
8 changes: 4 additions & 4 deletions src/usr/diag/prdf/common/plat/p9/p9_mca.rule
Expand Up @@ -302,7 +302,7 @@ group gMCACALFIR filter priority( 13 ), cs_root_cause( 4, 13, 14 )
/** MCACALFIR[13]
* Persistent RCD error, port failed
*/
(rMCACALFIR, bit(13)) ? mem_port_failure;
(rMCACALFIR, bit(13)) ? mem_port_failure_UERE;

/** MCACALFIR[14]
* RCD during periodic cal
Expand Down Expand Up @@ -413,7 +413,7 @@ group gMCAECCFIR filter priority( 14, 17, 37 ), # ensure UEs handled before NCEs
/** MCAECCFIR[14]
* Mainline read UE
*/
(rMCAECCFIR, bit(14)) ? mainline_ue_handling;
(rMCAECCFIR, bit(14)) ? mainline_ue_handling_UERE;

/** MCAECCFIR[15]
* Mainline read RCD
Expand All @@ -428,7 +428,7 @@ group gMCAECCFIR filter priority( 14, 17, 37 ), # ensure UEs handled before NCEs
/** MCAECCFIR[17]
* Mainline read IUE
*/
(rMCAECCFIR, bit(17)) ? mainline_iue_handling;
(rMCAECCFIR, bit(17)) ? mainline_iue_handling_UERE;

/** MCAECCFIR[18]
* Mainline read IRCD
Expand Down Expand Up @@ -493,7 +493,7 @@ group gMCAECCFIR filter priority( 14, 17, 37 ), # ensure UEs handled before NCEs
/** MCAECCFIR[37]
* Maintenance IUE
*/
(rMCAECCFIR, bit(37)) ? maintenance_iue_handling;
(rMCAECCFIR, bit(37)) ? maintenance_iue_handling_UERE;

/** MCAECCFIR[38]
* Maintenance IRCD
Expand Down
15 changes: 8 additions & 7 deletions src/usr/diag/prdf/common/plat/p9/p9_mca_actions.rule
Expand Up @@ -40,18 +40,19 @@ actionclass mainline_nce_handling { funccall("AnalyzeFetchNce"); };
actionclass mainline_tce_handling { funccall("AnalyzeFetchTce"); };

/** Mainline UE handling */
actionclass mainline_ue_handling
actionclass mainline_ue_handling_UERE
{
SUEGenerationPoint;
SueSource;
threshold( field(33 / 30 min ) ); # To prevent flooding. Will be unmasked
# when background scrubbing resumes after
# targeted diagnostics is complete.
funccall("AnalyzeFetchUe");
};

/** Memory Port Failure */
actionclass mem_port_failure
actionclass mem_port_failure_UERE
{
SueSource;
callout(connected(TYPE_DIMM,0), MRU_HIGH); # DIMM 0 HIGH
callout(connected(TYPE_DIMM,1), MRU_HIGH); # DIMM 1 HIGH
calloutSelfLow; # Self LOW
Expand All @@ -70,17 +71,17 @@ actionclass rcd_parity_error
};

/** Handle Mainline IUEs */
actionclass mainline_iue_handling
actionclass mainline_iue_handling_UERE
{
SUEGenerationPoint;
SueSource;
# Thresholding done in the plugin
funccall("AnalyzeMainlineIue");
};

/** Handle Maintenance IUEs */
actionclass maintenance_iue_handling
actionclass maintenance_iue_handling_UERE
{
SUEGenerationPoint;
SueSource;
# Thresholding done in the plugin
funccall("AnalyzeMaintIue");
};
Expand Down

0 comments on commit 6a1bf63

Please sign in to comment.