1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
|
/* IBM_PROLOG_BEGIN_TAG */
/* This is an automatically generated prolog. */
/* */
/* $Source: src/usr/diag/prdf/common/plat/pegasus/prdfCenMembuf.C $ */
/* */
/* IBM CONFIDENTIAL */
/* */
/* COPYRIGHT International Business Machines Corp. 2012,2013 */
/* */
/* p1 */
/* */
/* Object Code Only (OCO) source materials */
/* Licensed Internal Code Source Materials */
/* IBM HostBoot Licensed Internal Code */
/* */
/* The source code for this program is not published or otherwise */
/* divested of its trade secrets, irrespective of what has been */
/* deposited with the U.S. Copyright Office. */
/* */
/* Origin: 30 */
/* */
/* IBM_PROLOG_END_TAG */
/** @file prdfCenMembuf.C
* @brief Contains all the plugin code for the PRD Centaur Membuf
*/
#include <iipServiceDataCollector.h>
#include <prdfCalloutUtil.H>
#include <prdfExtensibleChip.H>
#include <prdfPlatServices.H>
#include <prdfPluginMap.H>
#include <prdfGlobal.H>
#include <iipSystem.h>
#include <prdfLaneRepair.H>
#include <UtilHash.H>
using namespace TARGETING;
#include <prdfCenMembufDataBundle.H>
namespace PRDF
{
namespace Membuf
{
//##############################################################################
//
// Special plugins
//
//##############################################################################
/**
 * @brief  Plugin that creates the P8 Centaur Membuf data bundle and stores it
 *         in the chip's data bundle slot.
 * @param  i_mbaChip A Centaur Membuf chip.
 * @return SUCCESS (unconditionally).
 */
int32_t Initialize( ExtensibleChip * i_mbaChip )
{
    // Allocate the bundle for this chip, then hand the pointer to the chip
    // through the reference returned by getDataBundle().
    CenMembufDataBundle * newBundle = new CenMembufDataBundle( i_mbaChip );
    i_mbaChip->getDataBundle() = newBundle;

    return SUCCESS;
}
PRDF_PLUGIN_DEFINE( Membuf, Initialize );
//------------------------------------------------------------------------------
/**
 * @fn CheckForRecovered
 * @brief Used when the chip has a CHECK_STOP attention to check for the
 *        presence of recovered errors.
 *
 * Reads GLOBAL_RE_FIR and reports whether the field selected by
 * GetBitFieldJustified(1,3) is non-zero.
 *
 * @param i_chip         The Centaur chip.
 * @param o_hasRecovered TRUE if a recoverable attention exists in the Centaur.
 *                       Left FALSE when the register cannot be read.
 *
 * @return SUCCESS. A register read failure is traced but is not propagated to
 *         the caller.
 */
int32_t CheckForRecovered(ExtensibleChip * i_chip,
                          bool & o_hasRecovered)
{
    // Default answer, also used when the register read fails.
    o_hasRecovered = false;

    SCAN_COMM_REGISTER_CLASS * l_grer = i_chip->getRegister("GLOBAL_RE_FIR");
    int32_t l_rc = l_grer->Read();

    if ( SUCCESS != l_rc )
    {
        // The two literals are concatenated by the compiler, so the separating
        // space must be part of one of them.
        PRDF_ERR("[CheckForRecovered] GLOBAL_RE_FIR read failed "
                 "for 0x%08x", i_chip->GetId());
    }
    else if ( 0 != l_grer->GetBitFieldJustified(1,3) )
    {
        // NOTE(review): arguments are presumably (start bit, length) - confirm
        // against the SCAN_COMM_REGISTER_CLASS interface.
        o_hasRecovered = true;
    }

    // Best effort by design: the documented contract is to always return
    // SUCCESS.
    return SUCCESS;
}
PRDF_PLUGIN_DEFINE( Membuf, CheckForRecovered );
//------------------------------------------------------------------------------
/**
 * @brief  MBA0 is always analyzed before MBA1 in the rule code. This plugin
 *         alternates priority between the two so MBA1 is not starved.
 *
 * The data bundle flag iv_analyzeMba1Starvation records whose turn it is. When
 * it is MBA1's turn and the mem chiplet register for the current attention
 * type shows an MBA1 bit, the flag is cleared and MBA1 is analyzed. When it is
 * not MBA1's turn, the flag is set so MBA1 is considered on the next call.
 *
 * @param  i_membChip The Centaur Membuf chip.
 * @param  i_sc       The step code data struct.
 * @return The result of analyzing MBA1, or FAIL if MBA1 is not analyzed.
 */
int32_t MBA1_Starvation( ExtensibleChip * i_membChip,
                         STEP_CODE_DATA_STRUCT & i_sc )
{
    CenMembufDataBundle * bundle = getMembufDataBundle(i_membChip);

    // Without an MBA1 chip there is nothing to analyze.
    ExtensibleChip * mba1 = bundle->getMbaChip(1);
    if ( NULL == mba1 ) return FAIL;

    // Not MBA1's turn this time: give it priority on the next call.
    if ( !bundle->iv_analyzeMba1Starvation )
    {
        bundle->iv_analyzeMba1Starvation = true;
        return FAIL;
    }

    // Select the mem chiplet register and the mask of MBA1 bits that belong
    // to the attention type currently being analyzed.
    SCAN_COMM_REGISTER_CLASS * chipletReg = NULL;
    uint32_t mba1Mask = 0;

    switch ( i_sc.service_data->GetCauseAttentionType() )
    {
        case CHECK_STOP:  // mba1 CS: bits 6, 8, 10, 13
            chipletReg = i_membChip->getRegister("MEM_CHIPLET_CS_FIR");
            mba1Mask   = 0x02A40000;
            break;

        case RECOVERABLE: // mba1 RE: bits 4, 6, 8, 11
            chipletReg = i_membChip->getRegister("MEM_CHIPLET_RE_FIR");
            mba1Mask   = 0x0A900000;
            break;

        case SPECIAL:     // mba1 SA: bit 1
            chipletReg = i_membChip->getRegister("MEM_CHIPLET_SPA");
            mba1Mask   = 0x40000000;
            break;

        default:          // Any other attention type: no register selected.
            break;
    }

    if ( NULL == chipletReg ) return FAIL;

    // Check if MBA1 from Mem Chiplet is reporting an attention.
    if ( SUCCESS != chipletReg->Read() )
    {
        PRDF_ERR("[MBA1_Starvation] SCOM fail on 0x%08x",
                 i_membChip->GetId());
        return FAIL;
    }

    uint32_t regValue = chipletReg->GetBitFieldJustified(0,32);
    if ( 0 == ( regValue & mba1Mask ) ) return FAIL; // No MBA1 attentions

    // MBA1 is being serviced now, so MBA0 takes priority next.
    bundle->iv_analyzeMba1Starvation = false;

    return mba1->Analyze( i_sc,
                          i_sc.service_data->GetCauseAttentionType() );
}
PRDF_PLUGIN_DEFINE( Membuf, MBA1_Starvation );
//------------------------------------------------------------------------------
/**
 * @brief  Analysis code that is called before the main analyze() function.
 *
 * Adds the "FirRegs" and "CerrRegs" register groups of the connected MCS chip
 * and of each available MBA chip to the capture data, then checks MCIFIR[31]
 * on the MCS for a Centaur checkstop. If that bit is set, the UNIT_CS flag and
 * cause attention type are set on the service data.
 *
 * @param  i_mbChip   A MEMBUF chip.
 * @param  i_sc       Step Code Data structure
 * @param  o_analyzed Always set to FALSE by this plugin.
 * @return SUCCESS, FAIL if no MCS chip is available, or the non-SUCCESS return
 *         code from reading MCIFIR.
 */
int32_t PreAnalysis( ExtensibleChip * i_mbChip, STEP_CODE_DATA_STRUCT & i_sc,
                     bool & o_analyzed )
{
    #define PRDF_FUNC "[Membuf::PreAnalysis] "

    o_analyzed = false;

    // Get memory capture data.
    CaptureData & captureData = i_sc.service_data->GetCaptureData();

    CenMembufDataBundle * bundle = getMembufDataBundle( i_mbChip );
    ExtensibleChip * mcs = bundle->getMcsChip();

    // Register capture only happens when the MCS chip is available.
    if ( NULL != mcs )
    {
        mcs->CaptureErrorData( captureData, Util::hashString("FirRegs") );
        mcs->CaptureErrorData( captureData, Util::hashString("CerrRegs") );

        for ( uint32_t mbaPos = 0; mbaPos < MAX_MBA_PER_MEMBUF; mbaPos++ )
        {
            ExtensibleChip * mba = bundle->getMbaChip(mbaPos);
            if ( NULL == mba ) continue;

            mba->CaptureErrorData( captureData, Util::hashString("FirRegs") );
            mba->CaptureErrorData( captureData, Util::hashString("CerrRegs") );
        }
    }

    // Check for a Centaur Checkstop.

    // Skip if we're already analyzing a unit checkstop.
    if ( i_sc.service_data->GetFlag(ServiceDataCollector::UNIT_CS) )
        return SUCCESS;

    if ( NULL == mcs )
    {
        PRDF_ERR( PRDF_FUNC"CenMembufDataBundle::getMcsChip() failed" );
        return FAIL;
    }

    // Check MCIFIR[31] for presence of Centaur checkstop.
    SCAN_COMM_REGISTER_CLASS * mciFir = mcs->getRegister("MCIFIR");
    int32_t readRc = mciFir->Read();
    if ( SUCCESS != readRc )
    {
        PRDF_ERR( PRDF_FUNC"Failed to read MCIFIR on 0x%08x",
                  mcs->GetId() );
        return readRc;
    }

    if ( mciFir->IsBitSet(31) )
    {
        // Set Unit checkstop flag.
        i_sc.service_data->SetFlag(ServiceDataCollector::UNIT_CS);
        i_sc.service_data->SetThresholdMaskId(0);

        // Set the cause attention type.
        i_sc.service_data->SetCauseAttentionType(UNIT_CS);
    }

    return SUCCESS;

    #undef PRDF_FUNC
}
PRDF_PLUGIN_DEFINE( Membuf, PreAnalysis );
//------------------------------------------------------------------------------
/**
 * @brief  Plugin function called after analysis is complete but before PRD
 *         exits.
 *
 * When built with __HOSTBOOT_MODULE defined, this writes MCIFIR_AND on the
 * connected MCS chip with every bit set except bits 12, 15, 16 and 17.
 * Otherwise it does nothing.
 *
 * @param  i_mbChip A Centaur chip.
 * @param  i_sc     The step code data struct (not used by this plugin).
 * @note   This is especially useful for any analysis that still needs to be
 *         done after the framework clears the FIR bits that were at attention.
 * @return SUCCESS. Failures are traced but are not returned to the caller.
 */
int32_t PostAnalysis( ExtensibleChip * i_mbChip, STEP_CODE_DATA_STRUCT & i_sc )
{
    #define PRDF_FUNC "[Membuf::PostAnalysis] "

    #ifdef __HOSTBOOT_MODULE

    // In hostboot, we need to clear associated bits in the MCIFIR bits.
    ExtensibleChip * mcs = getMembufDataBundle(i_mbChip)->getMcsChip();
    if ( NULL != mcs )
    {
        // Clear the associated MCIFIR bits for all attention types.
        // NOTE: If there are any active attentions left in the Centaur the
        //       associated MCIFIR bit will be redriven with the next packet on
        //       the bus.
        static const uint32_t bitsToClear[] =
        {
            12, // CS
            15, // RE
            16, // SPA
            17, // maintenance command complete
        };

        SCAN_COMM_REGISTER_CLASS * andReg = mcs->getRegister("MCIFIR_AND");

        // Start from all ones and clear only the listed bit positions.
        andReg->setAllBits();
        for ( uint32_t idx = 0;
              idx < sizeof(bitsToClear) / sizeof(bitsToClear[0]); idx++ )
        {
            andReg->ClearBit( bitsToClear[idx] );
        }

        if ( SUCCESS != andReg->Write() )
        {
            PRDF_ERR( PRDF_FUNC"MCIFIR_AND write failed" );
        }
    }
    else
    {
        PRDF_ERR( PRDF_FUNC"CenMembufDataBundle::getMcsChip() failed" );
    }

    #endif // __HOSTBOOT_MODULE

    return SUCCESS;

    #undef PRDF_FUNC
}
PRDF_PLUGIN_DEFINE( Membuf, PostAnalysis );
/**
 * @brief  Handle DMI Bus 0 spare deployed.
 *
 * Forwards to LaneRepair::handleLaneRepairEvent() for a TYPE_MEMBUF target,
 * bus position 0, with the final argument set to true.
 *
 * @param  i_chip Mem Buf chip
 * @param  i_sc   The step code data struct
 * @return The return code from LaneRepair::handleLaneRepairEvent().
 */
int32_t dmiBus0SpareDeployed( ExtensibleChip * i_chip,
                              STEP_CODE_DATA_STRUCT & i_sc )
{
    // NOTE(review): the last argument presumably marks a spare-deployed
    // event - confirm against LaneRepair::handleLaneRepairEvent().
    const bool spareDeployed = true;

    int32_t rc = LaneRepair::handleLaneRepairEvent( i_chip, TYPE_MEMBUF, 0,
                                                    i_sc, spareDeployed );
    return rc;
}
PRDF_PLUGIN_DEFINE( Membuf, dmiBus0SpareDeployed );
/**
 * @brief  Handle DMI Bus 1 spare deployed.
 *
 * Forwards to LaneRepair::handleLaneRepairEvent() for a TYPE_MEMBUF target,
 * bus position 1, with the final argument set to true.
 *
 * @param  i_chip Mem Buf chip
 * @param  i_sc   The step code data struct
 * @return The return code from LaneRepair::handleLaneRepairEvent().
 */
int32_t dmiBus1SpareDeployed( ExtensibleChip * i_chip,
                              STEP_CODE_DATA_STRUCT & i_sc )
{
    // NOTE(review): the last argument presumably marks a spare-deployed
    // event - confirm against LaneRepair::handleLaneRepairEvent().
    const bool spareDeployed = true;

    int32_t rc = LaneRepair::handleLaneRepairEvent( i_chip, TYPE_MEMBUF, 1,
                                                    i_sc, spareDeployed );
    return rc;
}
PRDF_PLUGIN_DEFINE( Membuf, dmiBus1SpareDeployed );
/**
 * @brief  Handle DMI Bus 0 spares exceeded.
 *
 * Forwards to LaneRepair::handleLaneRepairEvent() for a TYPE_MEMBUF target,
 * bus position 0, with the final argument set to false.
 *
 * @param  i_chip Mem Buf chip
 * @param  i_sc   The step code data struct
 * @return The return code from LaneRepair::handleLaneRepairEvent().
 */
int32_t dmiBus0SparesExceeded( ExtensibleChip * i_chip,
                               STEP_CODE_DATA_STRUCT & i_sc )
{
    // NOTE(review): the last argument presumably marks a spare-deployed
    // event, which this is not - confirm against
    // LaneRepair::handleLaneRepairEvent().
    const bool spareDeployed = false;

    int32_t rc = LaneRepair::handleLaneRepairEvent( i_chip, TYPE_MEMBUF, 0,
                                                    i_sc, spareDeployed );
    return rc;
}
PRDF_PLUGIN_DEFINE( Membuf, dmiBus0SparesExceeded );
/**
 * @brief  Handle DMI Bus 1 spares exceeded.
 *
 * Forwards to LaneRepair::handleLaneRepairEvent() for a TYPE_MEMBUF target,
 * bus position 1, with the final argument set to false.
 *
 * @param  i_chip Mem Buf chip
 * @param  i_sc   The step code data struct
 * @return The return code from LaneRepair::handleLaneRepairEvent().
 */
int32_t dmiBus1SparesExceeded( ExtensibleChip * i_chip,
                               STEP_CODE_DATA_STRUCT & i_sc )
{
    // NOTE(review): the last argument presumably marks a spare-deployed
    // event, which this is not - confirm against
    // LaneRepair::handleLaneRepairEvent().
    const bool spareDeployed = false;

    int32_t rc = LaneRepair::handleLaneRepairEvent( i_chip, TYPE_MEMBUF, 1,
                                                    i_sc, spareDeployed );
    return rc;
}
PRDF_PLUGIN_DEFINE( Membuf, dmiBus1SparesExceeded );
/**
 * @brief  Handle DMI Bus 0 Too Many Bus Errors.
 *
 * Forwards to LaneRepair::handleLaneRepairEvent() for a TYPE_MEMBUF target,
 * bus position 0, with the final argument set to false.
 *
 * @param  i_chip Mem Buf chip
 * @param  i_sc   The step code data struct
 * @return The return code from LaneRepair::handleLaneRepairEvent().
 */
int32_t dmiBus0TooManyErrors( ExtensibleChip * i_chip,
                              STEP_CODE_DATA_STRUCT & i_sc )
{
    // NOTE(review): the last argument presumably marks a spare-deployed
    // event, which this is not - confirm against
    // LaneRepair::handleLaneRepairEvent().
    const bool spareDeployed = false;

    int32_t rc = LaneRepair::handleLaneRepairEvent( i_chip, TYPE_MEMBUF, 0,
                                                    i_sc, spareDeployed );
    return rc;
}
PRDF_PLUGIN_DEFINE( Membuf, dmiBus0TooManyErrors );
/**
 * @brief  Handle DMI Bus 1 Too Many Bus Errors.
 *
 * Forwards to LaneRepair::handleLaneRepairEvent() for a TYPE_MEMBUF target,
 * bus position 1, with the final argument set to false.
 *
 * @param  i_chip Mem Buf chip
 * @param  i_sc   The step code data struct
 * @return The return code from LaneRepair::handleLaneRepairEvent().
 */
int32_t dmiBus1TooManyErrors( ExtensibleChip * i_chip,
                              STEP_CODE_DATA_STRUCT & i_sc )
{
    // NOTE(review): the last argument presumably marks a spare-deployed
    // event, which this is not - confirm against
    // LaneRepair::handleLaneRepairEvent().
    const bool spareDeployed = false;

    int32_t rc = LaneRepair::handleLaneRepairEvent( i_chip, TYPE_MEMBUF, 1,
                                                    i_sc, spareDeployed );
    return rc;
}
PRDF_PLUGIN_DEFINE( Membuf, dmiBus1TooManyErrors );
} // end namespace Membuf
} // end namespace PRDF
|