summaryrefslogtreecommitdiffstats
path: root/src/import/chips/p9/procedures/hwp/cache/p9_hcd_cache_chiplet_reset.C
blob: 57413f0e9ae2c11e50fb8de8521edf5379643d90 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
/* IBM_PROLOG_BEGIN_TAG                                                   */
/* This is an automatically generated prolog.                             */
/*                                                                        */
/* $Source: src/import/chips/p9/procedures/hwp/cache/p9_hcd_cache_chiplet_reset.C $ */
/*                                                                        */
/* OpenPOWER sbe Project                                                  */
/*                                                                        */
/* Contributors Listed Below - COPYRIGHT 2015,2016                        */
/* [+] International Business Machines Corp.                              */
/*                                                                        */
/*                                                                        */
/* Licensed under the Apache License, Version 2.0 (the "License");        */
/* you may not use this file except in compliance with the License.       */
/* You may obtain a copy of the License at                                */
/*                                                                        */
/*     http://www.apache.org/licenses/LICENSE-2.0                         */
/*                                                                        */
/* Unless required by applicable law or agreed to in writing, software    */
/* distributed under the License is distributed on an "AS IS" BASIS,      */
/* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or        */
/* implied. See the License for the specific language governing           */
/* permissions and limitations under the License.                         */
/*                                                                        */
/* IBM_PROLOG_END_TAG                                                     */
///
/// @file  p9_hcd_cache_chiplet_reset.C
/// @brief Cache Chiplet Reset
///
/// Procedure Summary:
///   Reset quad chiplet logic
///   Clocking:
///    - setup cache sector buffer strength,
///      pulse mode and pulsed mode enable values
///      (attribute dependency Nimbus/Cumulus)
///    - Drop glsmux async reset
///   Scan0 flush entire cache chiplet

// *HWP HWP Owner          : David Du       <daviddu@us.ibm.com>
// *HWP Backup HWP Owner   : Greg Still     <stillgs@us.ibm.com>
// *HWP FW Owner           : Sangeetha T S  <sangeet2@in.ibm.com>
// *HWP Team               : PM
// *HWP Consumed by        : SBE:SGPE
// *HWP Level              : 2

//------------------------------------------------------------------------------
// Includes
//------------------------------------------------------------------------------

#include <p9_misc_scom_addresses.H>
#include <p9_quad_scom_addresses.H>
#include <p9_perv_sbe_cmn.H>
#include <p9_hcd_common.H>
#include "p9_hcd_cache_chiplet_reset.H"

#ifdef HW388878_DD1_VCS_POWER_ON_IN_CHIPLET_RESET_FIX
    #include <p9_common_poweronoff.H>
    #include <p9_common_poweronoff.C>
#endif

//------------------------------------------------------------------------------
// Constant Definitions
//------------------------------------------------------------------------------

enum P9_HCD_CACHE_CHIPLET_RESET_CONSTANTS
{
    // (1)PCB_EP_RESET
    // (2)CLK_ASYNC_RESET
    // (3)PLL_TEST_EN
    // (4)PLLRST
    // (5)PLLBYP
    // (11)EDIS
    // (12)VITL_MPW1
    // (13)VITL_MPW2
    // (14)VITL_MPW3
    // (16)VITL_THOLD
    // (18)FENCE_EN
    // (22)FUNC_CLKSEL
    // (25)PCB_FENCE
    // (26)LVLTRANS_FENCE
    Q_NET_CTRL0_INIT_VECTOR = (BITS64(1, 5) | BITS64(11, 4) | BIT64(16) |
                               BIT64(18) | BIT64(22) | BITS64(25, 2)),
    CACHE_GLSMUX_RESET_DELAY_REF_CYCLES = 40
};

/// @todo RTC 162433
/// This is going to break on Nimbus DD2.0 and Cumulus SoA testing.
/// need more discussion in HW/FW interlock on how to handle this.
enum HW388878_DD1_VCS_POWER_ON_IN_CHIPLET_RESET_FIX_CONSTATNS
{
    // Eq_fure + Ex_l2_fure(ex0) + Ex_l2_fure(ex1)
    DD1_EQ_FURE_RING_LENGTH = (46532 + 119192 + 119192)
};

//------------------------------------------------------------------------------
// Procedure: Cache Chiplet Reset
//------------------------------------------------------------------------------

fapi2::ReturnCode
p9_hcd_cache_chiplet_reset(
    const fapi2::Target<fapi2::TARGET_TYPE_EQ>& i_target)
{
    FAPI_INF(">>p9_hcd_cache_chiplet_reset");
    fapi2::buffer<uint64_t>                     l_data64;
    uint16_t                                    l_region_scan0;
    uint64_t                                    l_l2gmux_input       = 0;
    uint64_t                                    l_l2gmux_reset       = 0;
    uint8_t                                     l_attr_chip_unit_pos = 0;
#ifdef HW388878_DD1_VCS_POWER_ON_IN_CHIPLET_RESET_FIX
    fapi2::buffer<uint8_t>                      l_attr_dd1_vcs_workaround;
#endif
    fapi2::Target<fapi2::TARGET_TYPE_PROC_CHIP> l_chip =
        i_target.getParent<fapi2::TARGET_TYPE_PROC_CHIP>();
    fapi2::Target<fapi2::TARGET_TYPE_PERV>      l_perv =
        i_target.getParent<fapi2::TARGET_TYPE_PERV>();
    auto l_core_functional_vector =
        i_target.getChildren<fapi2::TARGET_TYPE_CORE>
        (fapi2::TARGET_STATE_FUNCTIONAL);

    FAPI_TRY(FAPI_ATTR_GET(fapi2::ATTR_CHIP_UNIT_POS, l_perv,
                           l_attr_chip_unit_pos));
    l_attr_chip_unit_pos = l_attr_chip_unit_pos - p9hcd::PERV_TO_EQ_POS_OFFSET;

    FAPI_TRY(getScom(l_chip, PU_OCB_OCI_QCSR_SCOM, l_data64));
    FAPI_DBG("Working on cache[%d], good EXs in QCSR[%016llX]",
             l_attr_chip_unit_pos, l_data64);

    l_region_scan0 = p9hcd::SCAN0_REGION_ALL_BUT_EX;

    if (l_data64 & BIT64(l_attr_chip_unit_pos << 1))
    {
        l_region_scan0 |= p9hcd::SCAN0_REGION_EX0_L2_L3_REFR;
        l_l2gmux_reset |= BIT64(32);
        l_l2gmux_input |= BIT64(34);
    }

    if (l_data64 & BIT64((l_attr_chip_unit_pos << 1) + 1))
    {
        l_region_scan0 |= p9hcd::SCAN0_REGION_EX1_L2_L3_REFR;
        l_l2gmux_reset |= BIT64(33);
        l_l2gmux_input |= BIT64(35);
    }

    //--------------------------
    // Reset cache chiplet logic
    //--------------------------
    // If there is an unused, powered-off cache chiplet which needs to be
    // configured in the following steps to setup the PCB endpoint.

    for(auto it : l_core_functional_vector)
    {
        FAPI_TRY(FAPI_ATTR_GET(fapi2::ATTR_CHIP_UNIT_POS,
                               it.getParent<fapi2::TARGET_TYPE_PERV>(),
                               l_attr_chip_unit_pos));
        FAPI_DBG("Assert core[%d] DCC reset via NET_CTRL0[2]",
                 (l_attr_chip_unit_pos - p9hcd::PERV_TO_CORE_POS_OFFSET));
        FAPI_TRY(putScom(l_chip, (C_NET_CTRL0_WOR + (0x1000000 *
                                  (l_attr_chip_unit_pos - p9hcd::PERV_TO_CORE_POS_OFFSET))),
                         MASK_SET(2)));
    }

    /// @todo needs to revisit this sim workaround
    FAPI_DBG("Init heartbeat hang counter via HANG_PULSE_6[2]");
    FAPI_TRY(putScom(i_target, EQ_HANG_PULSE_6_REG, MASK_SET(2)));

    FAPI_DBG("Init NET_CTRL0[1-5,11-14,16,18,22,25,26],step needed for hotplug");
    l_data64 = Q_NET_CTRL0_INIT_VECTOR;
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0, l_data64));

    FAPI_DBG("Assert progdly/DCC bypass,L2 DCC reset via NET_CTRL1[1,2,23,24]");
    l_data64.flush<0>().insertFromRight<1, 2>(0x3).insertFromRight<23, 2>(0x3);
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL1_WOR, l_data64));

    FAPI_DBG("Flip cache glsmux to DPLL input via PPM_CGCR[3]");
    FAPI_TRY(putScom(i_target, EQ_PPM_CGCR, MASK_OR(0, 4, 0x9)));

    FAPI_DBG("Flip L2 glsmux to DPLL input via QPPM_EXCGCR[34:35]");
    FAPI_TRY(putScom(i_target, EQ_QPPM_EXCGCR_OR, l_l2gmux_input));

    FAPI_DBG("Assert DPLL ff_bypass via QPPM_DPLL_CTRL[2]");
    FAPI_TRY(putScom(i_target, EQ_QPPM_DPLL_CTRL_OR, MASK_SET(2)));

    FAPI_DBG("Drop vital thold via NET_CTRL0[16]");
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0_WAND, MASK_UNSET(16)));

    /// @todo optional setup sector buffer strength, pulse mode and pulsed mode enable

    FAPI_DBG("Drop cache glsmux reset via PPM_CGCR[0]");
    FAPI_TRY(putScom(i_target, EQ_PPM_CGCR, MASK_SET(3)));

    FAPI_DBG("Drop L2 glsmux reset via QPPM_EXCGCR[32:33]");
    FAPI_TRY(putScom(i_target, EQ_QPPM_EXCGCR_CLEAR, l_l2gmux_reset));

    FAPI_TRY(fapi2::delay(
                 CACHE_GLSMUX_RESET_DELAY_REF_CYCLES * p9hcd::CLK_PERIOD_10NS,
                 CACHE_GLSMUX_RESET_DELAY_REF_CYCLES * p9hcd::SIM_CYCLE_200UD));

    FAPI_DBG("Assert chiplet enable via NET_CTRL0[0]");
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0_WOR, MASK_SET(0)));

    FAPI_DBG("Drop PCB endpoint reset via NET_CTRL0[1]");
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0_WAND, MASK_UNSET(1)));

    FAPI_DBG("Drop chiplet electrical fence via NET_CTRL0[26]");
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0_WAND, MASK_UNSET(26)));

    FAPI_DBG("Drop PCB fence via NET_CTRL0[25]");
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0_WAND, MASK_UNSET(25)));

    FAPI_DBG("Set scan ratio to 1:1 in bypass mode via OPCG_ALIGN[47-51]");
    FAPI_TRY(getScom(i_target, EQ_OPCG_ALIGN, l_data64));
    l_data64.insertFromRight<47, 5>(0x0);
    FAPI_TRY(putScom(i_target, EQ_OPCG_ALIGN, l_data64));

#ifndef P9_HCD_STOP_SKIP_FLUSH
    //--------------------------------------------
    // perform scan0 module for pervasive chiplet
    //--------------------------------------------
    // Each scan0 will rotate the ring 8191 latches (2**13 - 1) and the longest
    // ring is defined by P9_HCD_SCAN_FUNC_REPEAT. When the design ALWAYS has
    // all stumps less than 8191, the loop can be removed.

    // Putting in block to avoid c++ crosses initialization compile error
    {
        uint32_t l_loop;

        FAPI_DBG("Scan0 region:all_but_vital type:gptr_repr_time rings");

        for(l_loop = 0; l_loop < P9_HCD_SCAN_GPTR_REPEAT; l_loop++)
            FAPI_TRY(p9_perv_sbe_cmn_scan0_module(l_perv,
                                                  l_region_scan0,
                                                  p9hcd::SCAN0_TYPE_GPTR_REPR_TIME));

#ifdef HW388878_DD1_VCS_POWER_ON_IN_CHIPLET_RESET_FIX
        FAPI_TRY(FAPI_ATTR_GET(
                     fapi2::ATTR_CHIP_EC_FEATURE_HW388878,
                     l_chip, l_attr_dd1_vcs_workaround));

        if (l_attr_dd1_vcs_workaround)
        {
            FAPI_DBG("Enable DD1 VCS workaround");
            FAPI_TRY(p9_hcd_dd1_vcs_workaround(i_target));
        }

#endif

        FAPI_DBG("Scan0 region:all_but_vital type:all_but_gptr_repr_time rings");

        for(l_loop = 0; l_loop < P9_HCD_SCAN_FUNC_REPEAT; l_loop++)
            FAPI_TRY(p9_perv_sbe_cmn_scan0_module(l_perv,
                                                  l_region_scan0,
                                                  p9hcd::SCAN0_TYPE_ALL_BUT_GPTR_REPR_TIME));
    }
#endif

    /// @todo scan_with_setpulse_module(L3 DCC)
    //FAPI_DBG("Drop L3 DCC bypass via NET_CTRL1[1]");
    //FAPI_TRY(putScom(i_target, EQ_NET_CTRL1_WAND, MASK_UNSET(1)));
    /// @todo add VDM_ENABLE attribute control
    //FAPI_DBG("Assert vdm enable via CPPM_VDMCR[0]");
    //FAPI_TRY(putScom(i_target, EQ_PPM_VDMCR_OR, MASK_SET(0)));

fapi_try_exit:

    FAPI_INF("<<p9_hcd_cache_chiplet_reset");
    return fapi2::current_err;
}

#ifdef HW388878_DD1_VCS_POWER_ON_IN_CHIPLET_RESET_FIX
fapi2::ReturnCode
p9_hcd_dd1_vcs_workaround(
    const fapi2::Target<fapi2::TARGET_TYPE_EQ>& i_target)
{
    FAPI_INF(">>p9_hcd_dd1_vcs_workaround");
    fapi2::buffer<uint64_t>                     l_data64;
    uint64_t                                    l_regions;
    uint32_t                                    l_timeout;
    uint32_t                                    l_loop;

    l_regions = p9hcd::CLK_REGION_PERV   |
                p9hcd::CLK_REGION_EX0_L2 |
                p9hcd::CLK_REGION_EX1_L2;

    // ----------------------------------------------------
    // Scan1 initialize region:Perv/L20/L21 type:Fure rings
    // Note: must also scan partial good "bad" L2 rings,
    // and clock start&stop their latches, as well
    // ----------------------------------------------------

    FAPI_DBG("Assert Vital clock regional fence via CPLT_CTRL1[3]");
    FAPI_TRY(putScom(i_target, EQ_CPLT_CTRL1_OR, MASK_SET(3)));

    FAPI_DBG("Assert regional fences of scanned regions via CPLT_CTRL1[4,8,9]");
    FAPI_TRY(putScom(i_target, EQ_CPLT_CTRL1_OR, l_regions));

    FAPI_DBG("Clear clock region register via CLK_REGION");
    FAPI_TRY(putScom(i_target, EQ_CLK_REGION, MASK_ZERO));

    FAPI_DBG("Setup scan select register via SCAN_REGION_TYPE[4,8,9,48,51]");
    FAPI_TRY(putScom(i_target, EQ_SCAN_REGION_TYPE,
                     (l_regions | p9hcd::SCAN_TYPE_FUNC | p9hcd::SCAN_TYPE_REGF)));

    FAPI_DBG("Write scan data register via 0x1003E040");

    for (l_loop = 0; l_loop <= DD1_EQ_FURE_RING_LENGTH / 64; l_loop++)
    {
        FAPI_DBG("Loop Count: %d", l_loop);
        FAPI_TRY(putScom(i_target, 0x1003E040, MASK_ALL));
    }

    // -------------------------------
    // Start Perv/L20/L21 clocks
    // -------------------------------

    FAPI_DBG("Clear all SCAN_REGION_TYPE bits");
    FAPI_TRY(putScom(i_target, EQ_SCAN_REGION_TYPE, MASK_ZERO));

    FAPI_DBG("Start cache clocks(perv/l20/l21) via CLK_REGION");
    l_data64 = (p9hcd::CLK_START_CMD | l_regions | p9hcd::CLK_THOLD_ARY);
    FAPI_TRY(putScom(i_target, EQ_CLK_REGION, l_data64));

    FAPI_DBG("Poll for perv/l20/l21 clocks running via CPLT_STAT0[8]");
    l_timeout = (p9hcd::CYCLES_PER_MS / p9hcd::INSTS_PER_POLL_LOOP);

    do
    {
        FAPI_TRY(getScom(i_target, EQ_CPLT_STAT0, l_data64));
    }
    while((l_data64.getBit<8>() != 1) && ((--l_timeout) != 0));

    FAPI_ASSERT((l_timeout != 0),
                fapi2::PMPROC_CACHECLKSTART_TIMEOUT().set_EQCPLTSTAT(l_data64),
                "perv/l20/l21 Clock Start Timeout");

    FAPI_DBG("Check perv/l20/l21 clocks running");
    FAPI_TRY(getScom(i_target, EQ_CLOCK_STAT_ARY, l_data64));

    FAPI_ASSERT(((l_data64 & l_regions) == 0),
                fapi2::PMPROC_CACHECLKSTART_FAILED().set_EQCLKSTAT(l_data64),
                "perv/l20/l21 Clock Start Failed");
    FAPI_DBG("perv/l20/l21 clocks running now");

    // -------------------------------
    // Turn on power headers for VCS
    // -------------------------------

    FAPI_TRY(p9_common_poweronoff<fapi2::TARGET_TYPE_EQ>(i_target, p9power::POWER_ON_VCS));

    // Because common module raises those fences, we need to lower them here.
    FAPI_DBG("Drop vital thold via NET_CTRL0[16]");
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0_WAND, MASK_UNSET(16)));

    FAPI_DBG("Drop chiplet electrical fence via NET_CTRL0[26]");
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0_WAND, MASK_UNSET(26)));

    FAPI_DBG("Drop PCB fence via NET_CTRL0[25]");
    FAPI_TRY(putScom(i_target, EQ_NET_CTRL0_WAND, MASK_UNSET(25)));

    // -------------------------------
    // Stop Perv/L20/L21 clocks
    // -------------------------------

    FAPI_DBG("Clear all SCAN_REGION_TYPE bits");
    FAPI_TRY(putScom(i_target, EQ_SCAN_REGION_TYPE, MASK_ZERO));

    FAPI_DBG("Stop perv/l20/l21 clocks via CLK_REGION");
    l_data64 = (p9hcd::CLK_STOP_CMD | l_regions | p9hcd::CLK_THOLD_ARY);
    FAPI_TRY(putScom(i_target, EQ_CLK_REGION, l_data64));

    FAPI_DBG("Poll for perv/l20/l21 clocks stopped via CPLT_STAT0[8]");
    l_timeout = (p9hcd::CYCLES_PER_MS / p9hcd::INSTS_PER_POLL_LOOP);

    do
    {
        FAPI_TRY(getScom(i_target, EQ_CPLT_STAT0, l_data64));
    }
    while((l_data64.getBit<8>() != 1) && ((--l_timeout) != 0));

    FAPI_ASSERT((l_timeout != 0),
                fapi2::PMPROC_CACHECLKSTOP_TIMEOUT()
                .set_EQ_TARGET(i_target)
                .set_EQCPLTSTAT(l_data64),
                "perv/l20/l21 Clock Stop Timeout");

    FAPI_DBG("Check perv/l20/l21 clocks stopped");
    FAPI_TRY(getScom(i_target, EQ_CLOCK_STAT_ARY, l_data64));

    FAPI_ASSERT((((~l_data64) & l_regions) == 0),
                fapi2::PMPROC_CACHECLKSTOP_FAILED()
                .set_EQ_TARGET(i_target)
                .set_EQCLKSTAT(l_data64),
                "perv/l20/l21 Clock Stop Failed");
    FAPI_DBG("perv/l20/l21 clocks stopped now");

    // -------------------------------
    // Clean up
    // -------------------------------

    FAPI_DBG("Drop Vital clock regional fence via CPLT_CTRL1[3]");
    FAPI_TRY(putScom(i_target, EQ_CPLT_CTRL1_CLEAR, MASK_SET(3)));

    FAPI_DBG("Drop Perv/L20/L21 regional fences via CPLT_CTRL1[4,8,9]");
    FAPI_TRY(putScom(i_target, EQ_CPLT_CTRL1_CLEAR, l_regions));

fapi_try_exit:

    FAPI_INF("<<p9_hcd_dd1_vcs_workaround");
    return fapi2::current_err;
}

#endif
OpenPOWER on IntegriCloud