| // SPDX-License-Identifier: Apache-2.0 OR GPL-2.0-or-later |
| /* |
| * NPU2 (POWER9) Hardware Procedures |
| * |
| * Copyright 2013-2019 IBM Corp. |
| */ |
| |
| #include <skiboot.h> |
| #include <io.h> |
| #include <timebase.h> |
| #include <pci.h> |
| #include <pci-virt.h> |
| #include <interrupts.h> |
| #include <npu2.h> |
| #include <npu2-regs.h> |
| #include <xscom.h> |
| |
| /* Set in npu2.c if there is an nvram override for the zcal settings on this |
| * machine */ |
| int nv_zcal_nominal = -1; |
| |
| /* PHY Registers. The documentation for the PHY training is written in |
| * terms of bits within an actual register so we use that |
| * representation here. */ |
| struct npu2_phy_reg { |
| uint64_t offset; |
| uint64_t start; |
| uint64_t len; |
| }; |
| |
| /* |
| * Currently unused, but documented here: |
| static struct npu2_phy_reg NPU2_PHY_RX_DATA_DAC_SPARE_MODE = {0x000, 63, 64}; |
| static struct npu2_phy_reg NPU2_PHY_RX_DAC_CNTL6 = {0x00c, 63, 64}; |
| static struct npu2_phy_reg NPU2_PHY_RX_DAC_CNTL5 = {0x028, 63, 64}; |
| static struct npu2_phy_reg NPU2_PHY_RX_DAC_CNTL9 = {0x030, 63, 64}; |
| static struct npu2_phy_reg NPU2_PHY_RX_DAC_CNTL5_EO = {0x00a, 63, 64}; |
| static struct npu2_phy_reg NPU2_PHY_RX_DAC_CNTL4 = {0x026, 63, 64}; |
| */ |
| static struct npu2_phy_reg NPU2_PHY_RX_RUN_LANE = {0x0c8, 48, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_IORESET = {0x096, 63, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_IORESET = {0x113, 48, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_PR_RESET = {0x096, 62, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_LANE_ANA_PDWN = {0x002, 54, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_LANE_DIG_PDWN = {0x088, 48, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_PR_IQ_RES_SEL = {0x004, 59, 3}; |
| static struct npu2_phy_reg NPU2_PHY_RX_PR_PHASE_STEP = {0x08a, 60, 4}; |
| static struct npu2_phy_reg NPU2_PHY_TX_LANE_PDWN = {0x101, 48, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_RUN_DCCAL = {0x0c8, 49, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_DCCAL_DONE = {0x0ca, 49, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_LANE_BUSY = {0x0ca, 50, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_B_BANK_CONTROLS = {0x002, 58, 6}; |
| static struct npu2_phy_reg NPU2_PHY_TX_UNLOAD_CLK_DISABLE = {0x103, 56, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_FIFO_INIT = {0x105, 53, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_RXCAL = {0x103, 57, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_INIT_DONE = {0x0ca, 48, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_PR_EDGE_TRACK_CNTL = {0x092, 48, 2}; |
| static struct npu2_phy_reg NPU2_PHY_RX_PR_BUMP_SL_1UI = {0x092, 57, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_PR_FW_OFF = {0x08a, 56, 1}; |
| static struct npu2_phy_reg NPU2_PHY_RX_PR_FW_INERTIA_AMT = {0x08a, 57, 3}; |
| static struct npu2_phy_reg NPU2_PHY_RX_CFG_LTE_MC = {0x000, 60, 4}; |
| static struct npu2_phy_reg NPU2_PHY_RX_A_INTEG_COARSE_GAIN = {0x00a, 48, 4}; |
| static struct npu2_phy_reg NPU2_PHY_RX_A_CTLE_COARSE = {0x00c, 48, 5}; |
| static struct npu2_phy_reg NPU2_PHY_RX_A_CTLE_GAIN = {0x00c, 53, 4}; |
| static struct npu2_phy_reg NPU2_PHY_RX_B_INTEG_COARSE_GAIN = {0x026, 48, 4}; |
| static struct npu2_phy_reg NPU2_PHY_RX_B_CTLE_COARSE = {0x028, 48, 5}; |
| static struct npu2_phy_reg NPU2_PHY_RX_B_CTLE_GAIN = {0x028, 53, 4}; |
| static struct npu2_phy_reg NPU2_PHY_RX_E_INTEG_COARSE_GAIN = {0x030, 48, 4}; |
| static struct npu2_phy_reg NPU2_PHY_RX_E_CTLE_COARSE = {0x032, 48, 5}; |
| static struct npu2_phy_reg NPU2_PHY_RX_E_CTLE_GAIN = {0x032, 53, 4}; |
| |
| /* These registers are per-PHY, not per lane */ |
| static struct npu2_phy_reg NPU2_PHY_RX_SPEED_SELECT = {0x262, 51, 2}; |
| static struct npu2_phy_reg NPU2_PHY_RX_AC_COUPLED = {0x262, 53, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_ZCAL_SWO_EN = {0x3c9, 48, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_ZCAL_REQ = {0x3c1, 49, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_ZCAL_DONE = {0x3c1, 50, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_ZCAL_ERROR = {0x3c1, 51, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_ZCAL_N = {0x3c3, 48, 9}; |
| static struct npu2_phy_reg NPU2_PHY_TX_ZCAL_P = {0x3c5, 48, 9}; |
| static struct npu2_phy_reg NPU2_PHY_TX_FFE_BOOST_EN = {0x34b, 59, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_PSEG_PRE_EN = {0x34d, 51, 5}; |
| static struct npu2_phy_reg NPU2_PHY_TX_PSEG_PRE_SELECT = {0x34d, 56, 5}; |
| static struct npu2_phy_reg NPU2_PHY_TX_NSEG_PRE_EN = {0x34f, 51, 5}; |
| static struct npu2_phy_reg NPU2_PHY_TX_NSEG_PRE_SELECT = {0x34f, 56, 5}; |
| static struct npu2_phy_reg NPU2_PHY_TX_PSEG_POST_EN = {0x361, 49, 7}; |
| static struct npu2_phy_reg NPU2_PHY_TX_PSEG_POST_SELECT = {0x361, 56, 7}; |
| static struct npu2_phy_reg NPU2_PHY_TX_NSEG_POST_EN = {0x363, 49, 7}; |
| static struct npu2_phy_reg NPU2_PHY_TX_NSEG_POST_SELECT = {0x363, 56, 7}; |
| static struct npu2_phy_reg NPU2_PHY_TX_PSEG_MARGINPU_EN = {0x351, 48, 8}; |
| static struct npu2_phy_reg NPU2_PHY_TX_NSEG_MARGINPU_EN = {0x353, 48, 8}; |
| static struct npu2_phy_reg NPU2_PHY_TX_PSEG_MARGINPD_EN = {0x351, 56, 8}; |
| static struct npu2_phy_reg NPU2_PHY_TX_NSEG_MARGINPD_EN = {0x353, 56, 8}; |
| static struct npu2_phy_reg NPU2_PHY_TX_MARGINPU_SELECT = {0x355, 48, 8}; |
| static struct npu2_phy_reg NPU2_PHY_TX_MARGINPD_SELECT = {0x355, 56, 8}; |
| static struct npu2_phy_reg NPU2_PHY_TX_PSEG_MAIN_EN = {0x357, 51, 7}; |
| static struct npu2_phy_reg NPU2_PHY_TX_NSEG_MAIN_EN = {0x359, 51, 7}; |
| /* Currently unused, but documented here |
| static struct npu2_phy_reg NPU2_PHY_RX_HIST_MIN_EYE_WIDTH = {0x24e, 54, 8}; |
| static struct npu2_phy_reg NPU2_PHY_RX_HIST_MIN_EYE_WIDTH_LANE = {0x24e, 49, 5}; |
| static struct npu2_phy_reg NPU2_PHY_RX_HIST_MIN_EYE_WIDTH_VALID= {0x24e, 48, 1}; |
| */ |
| static struct npu2_phy_reg NPU2_PHY_RX_RC_ENABLE_AUTO_RECAL = {0x25c, 51, 1}; |
| |
| static struct npu2_phy_reg NPU2_PHY_RX_CLKDIST_PDWN = {0x204, 48, 3}; |
| static struct npu2_phy_reg NPU2_PHY_RX_IREF_PDWN = {0x230, 54, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_CLKDIST_PDWN = {0x305, 48, 3}; |
| static struct npu2_phy_reg NPU2_PHY_RX_CTL_DATASM_CLKDIST_PDWN = {0x2e0, 60, 1}; |
| static struct npu2_phy_reg NPU2_PHY_TX_DRV_DATA_PATTERN_GCRMSG = {0x309, 50, 4}; |
| |
| #define NPU2_PHY_REG(scom_base, reg, lane) \ |
| SETFIELD(PPC_BITMASK(27, 31), ((reg)->offset << 42) | scom_base, lane) |
| |
| #define NPU2_MAX_PHY_LANE 23 |
| |
| /* This is a bit of a gross hack but it does the job */ |
| #define FOR_EACH_LANE(ndev, lane) \ |
| for (lane = 0; lane <= NPU2_MAX_PHY_LANE; lane++) \ |
| if (!(ndev->lane_mask & (1 << (NPU2_MAX_PHY_LANE - lane)))) \ |
| continue; \ |
| else |
| |
| typedef uint32_t (*step)(struct npu2_dev *); |
| |
| struct procedure { |
| const char *name; |
| step steps[]; |
| }; |
| |
| #define DEFINE_PROCEDURE(NAME, STEPS...) \ |
| static struct procedure procedure_##NAME = \ |
| {.name = #NAME, .steps = {NAME, ##STEPS}} |
| |
| #define PROCEDURE_INPROGRESS (1 << 31) |
| #define PROCEDURE_COMPLETE (1 << 30) |
| #define PROCEDURE_NEXT (1 << 29) |
| #define PROCEDURE_FAILED 2 |
| #define PROCEDURE_ABORTED 3 |
| #define PROCEDURE_UNSUPPORTED 4 |
| |
| /* Mask defining which status bits we want to expose */ |
| #define PROCEDURE_STATUS_MASK 0xc000000f |
| |
| static void phy_write_lane(struct npu2_dev *ndev, struct npu2_phy_reg *reg, int lane, uint64_t val) |
| { |
| uint64_t old_val, reg_addr; |
| int rc; |
| uint64_t mask = PPC_BITMASK(reg->start, reg->start + reg->len - 1); |
| |
| /* Check to make sure we're not trying to specify a lane to a |
| * non-per-lane register */ |
| if (lane >= 0) |
| assert(reg->offset < 0x200); |
| else |
| assert(reg->offset >= 0x200); |
| |
| reg_addr = NPU2_PHY_REG(ndev->pl_xscom_base, reg, lane); |
| rc = xscom_read(ndev->npu->chip_id, reg_addr, &old_val); |
| if (rc) |
| NPU2DEVERR(ndev, "error %d reading scom 0x%llx\n", rc, reg_addr); |
| val = SETFIELD(mask, old_val, val); |
| rc = xscom_write(ndev->npu->chip_id, reg_addr, val); |
| if (rc) |
| NPU2DEVERR(ndev, "error %d writing scom 0x%llx\n", rc, reg_addr); |
| } |
| |
| static uint64_t phy_read_lane(struct npu2_dev *ndev, struct npu2_phy_reg *reg, int lane) |
| { |
| uint64_t val, reg_addr; |
| int rc; |
| uint64_t mask = PPC_BITMASK(reg->start, reg->start + reg->len - 1); |
| |
| /* Check to make sure we're not trying to specify a lane to a |
| * non-per-lane register */ |
| if (lane >= 0) |
| assert(reg->offset < 0x200); |
| else |
| assert(reg->offset >= 0x200); |
| |
| reg_addr = NPU2_PHY_REG(ndev->pl_xscom_base, reg, lane); |
| rc = xscom_read(ndev->npu->chip_id, reg_addr, &val); |
| if (rc) |
| NPU2DEVERR(ndev, "error %d reading scom 0x%llx\n", rc, reg_addr); |
| |
| return GETFIELD(mask, val); |
| } |
| |
| #define phy_write(ndev, reg, val) phy_write_lane(ndev, reg, -1, val) |
| #define phy_read(ndev, reg) phy_read_lane(ndev, reg, -1) |
| |
| static uint32_t stop(struct npu2_dev *npu_dev __unused) |
| { |
| return PROCEDURE_COMPLETE | PROCEDURE_ABORTED; |
| } |
| DEFINE_PROCEDURE(stop); |
| |
| static uint32_t nop(struct npu2_dev *npu_dev __unused) |
| { |
| return PROCEDURE_COMPLETE; |
| } |
| DEFINE_PROCEDURE(nop); |
| |
| /* |
| * Return the obus (0 or 1) of a device |
| * |
| * Using the brick index is dangerous, because it varies for a link |
| * depending on the mode (opencapi or nvlink) |
| */ |
| static int obus_index(struct npu2_dev *ndev) |
| { |
| if ((ndev->pl_xscom_base & 0x3F000000) == 0x09000000) |
| return 0; |
| else |
| return 1; |
| } |
| |
| /* |
| * Return the brick number (0-2) within an obus chiplet. |
| * Only valid for nvlink devices |
| */ |
| static int obus_brick_index(struct npu2_dev *ndev) |
| { |
| int index = ndev->brick_index % 3; |
| |
| assert(ndev->type != NPU2_DEV_TYPE_OPENCAPI); |
| /* On the second obus chiplet, index is reversed */ |
| if ((ndev->pl_xscom_base & 0x3F000000) != 0x09000000) |
| return 2 - index; |
| |
| return index; |
| } |
| |
| static void set_iovalid(struct npu2_dev *ndev, bool raise) |
| { |
| uint64_t addr, val, mask; |
| int rc; |
| |
| if (ndev->type == NPU2_DEV_TYPE_OPENCAPI) |
| return; |
| |
| addr = (ndev->pl_xscom_base & 0x3F000000) | 0x9; |
| mask = PPC_BIT(6 + obus_brick_index(ndev)); |
| val = raise ? mask : 0; |
| |
| rc = xscom_write_mask(ndev->npu->chip_id, addr, val, mask); |
| if (rc) |
| NPU2DEVERR(ndev, "error %d writing scom 0x%llx\n", rc, addr); |
| } |
| |
| static bool poll_fence_status(struct npu2_dev *ndev, uint64_t val) |
| { |
| uint64_t fs; |
| int i; |
| |
| for (i = 0; i < 4096; i++) { |
| fs = npu2_read(ndev->npu, NPU2_NTL_CQ_FENCE_STATUS(ndev)); |
| if ((fs & 0xc000000000000000UL) == val) |
| return true; |
| } |
| |
| NPU2DEVERR(ndev, "NPU2_NTL_CQ_FENCE_STATUS timeout (0x%llx)\n", val); |
| return false; |
| } |
| |
| /* Procedure 1.2.1 - Reset NPU/NDL */ |
| uint32_t reset_ntl(struct npu2_dev *ndev) |
| { |
| uint64_t val, check; |
| int lane, i; |
| |
| set_iovalid(ndev, true); |
| |
| /* Power on clocks */ |
| phy_write(ndev, &NPU2_PHY_RX_CLKDIST_PDWN, 0); |
| phy_write(ndev, &NPU2_PHY_RX_IREF_PDWN, 1); |
| phy_write(ndev, &NPU2_PHY_TX_CLKDIST_PDWN, 0); |
| phy_write(ndev, &NPU2_PHY_RX_CTL_DATASM_CLKDIST_PDWN, 0); |
| |
| FOR_EACH_LANE(ndev, lane) { |
| phy_write_lane(ndev, &NPU2_PHY_RX_LANE_ANA_PDWN, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_RX_LANE_DIG_PDWN, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_TX_LANE_PDWN, lane, 0); |
| } |
| |
| /* Clear fence state for the brick */ |
| val = npu2_read(ndev->npu, NPU2_MISC_FENCE_STATE); |
| if (val) { |
| NPU2DEVINF(ndev, "Clearing all bricks fence\n"); |
| npu2_write(ndev->npu, NPU2_MISC_FENCE_STATE, val); |
| for (i = 0, check = 0; i < 4096; i++) { |
| check = npu2_read(ndev->npu, NPU2_NTL_CQ_FENCE_STATUS(ndev)); |
| if (!check) |
| break; |
| } |
| if (check) |
| NPU2DEVERR(ndev, "Clearing NPU2_MISC_FENCE_STATE=0x%llx timeout, current=0x%llx\n", |
| val, check); |
| } |
| |
| /* Write PRI */ |
| val = SETFIELD(PPC_BITMASK(0,1), 0ull, obus_brick_index(ndev)); |
| npu2_write_mask(ndev->npu, NPU2_NTL_PRI_CFG(ndev), val, -1ULL); |
| |
| val = NPU2_NTL_MISC_CFG2_NDL_RX_PARITY_ENA; |
| npu2_write_mask(ndev->npu, NPU2_NTL_MISC_CFG2(ndev), 0ull, val); |
| |
| /* NTL Reset */ |
| val = npu2_read(ndev->npu, NPU2_NTL_MISC_CFG1(ndev)); |
| val |= PPC_BIT(8) | PPC_BIT(9); |
| npu2_write(ndev->npu, NPU2_NTL_MISC_CFG1(ndev), val); |
| |
| if (!poll_fence_status(ndev, 0xc000000000000000UL)) |
| return PROCEDURE_COMPLETE | PROCEDURE_FAILED; |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| static uint32_t reset_ndl(struct npu2_dev *ndev) |
| { |
| uint64_t val; |
| |
| val = npu2_read_4b(ndev->npu, NPU2_NTL_DL_CONTROL(ndev)); |
| val |= PPC_BIT32(0) | PPC_BIT32(1); |
| npu2_write_4b(ndev->npu, NPU2_NTL_DL_CONTROL(ndev), val); |
| |
| val = npu2_read_4b(ndev->npu, NPU2_NTL_DL_CONTROL(ndev)); |
| val &= ~(PPC_BIT32(0) | PPC_BIT32(1)); |
| npu2_write_4b(ndev->npu, NPU2_NTL_DL_CONTROL(ndev), val); |
| |
| val = PPC_BIT32(0); |
| npu2_write_4b(ndev->npu, NPU2_NTL_DL_CONFIG(ndev), val); |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| static uint32_t reset_ntl_release(struct npu2_dev *ndev) |
| { |
| uint64_t val; |
| uint64_t npu2_fir; |
| uint64_t npu2_fir_addr; |
| int i; |
| |
| /* Clear FIR bits */ |
| npu2_fir_addr = NPU2_FIR_REGISTER_0; |
| npu2_fir = 0; |
| |
| for (i = 0; i < NPU2_TOTAL_FIR_REGISTERS; i++) { |
| xscom_write(ndev->npu->chip_id, npu2_fir_addr, npu2_fir); |
| npu2_fir_addr += NPU2_FIR_OFFSET; |
| |
| } |
| |
| val = npu2_read(ndev->npu, NPU2_NTL_MISC_CFG1(ndev)); |
| val &= 0xFFBFFFFFFFFFFFFFUL; |
| npu2_write(ndev->npu, NPU2_NTL_MISC_CFG1(ndev), val); |
| |
| if (!poll_fence_status(ndev, 0x8000000000000000UL)) |
| return PROCEDURE_COMPLETE | PROCEDURE_FAILED; |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| static uint32_t reset_ntl_finish(struct npu2_dev *ndev) |
| { |
| /* Credit Setup */ |
| npu2_write(ndev->npu, NPU2_NTL_CRED_HDR_CREDIT_TX(ndev), 0x0200000000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_PRB_HDR_CREDIT_TX(ndev), 0x0200000000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_ATR_HDR_CREDIT_TX(ndev), 0x0200000000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_RSP_HDR_CREDIT_TX(ndev), 0x0200000000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_CRED_DATA_CREDIT_TX(ndev), 0x1000000000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_RSP_DATA_CREDIT_TX(ndev), 0x1000000000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_CRED_HDR_CREDIT_RX(ndev), 0x0000BE0000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_DBD_HDR_CREDIT_RX(ndev), 0x0000640000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_ATSD_HDR_CREDIT_RX(ndev), 0x0000200000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_RSP_HDR_CREDIT_RX(ndev), 0x0000BE0000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_CRED_DATA_CREDIT_RX(ndev), 0x0001000000000000UL); |
| npu2_write(ndev->npu, NPU2_NTL_RSP_DATA_CREDIT_RX(ndev), 0x0001000000000000UL); |
| |
| npu2_set_link_flag(ndev, NPU2_DEV_DL_RESET); |
| |
| return PROCEDURE_COMPLETE; |
| } |
| DEFINE_PROCEDURE(reset_ntl, reset_ndl, reset_ntl_release, reset_ntl_finish); |
| |
| /* Procedure 1.2.2 - Reset I/O PHY Lanes */ |
| static uint32_t phy_reset(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| set_iovalid(ndev, false); |
| |
| /* Power on clocks */ |
| phy_write(ndev, &NPU2_PHY_RX_CLKDIST_PDWN, 0); |
| phy_write(ndev, &NPU2_PHY_RX_IREF_PDWN, 1); |
| phy_write(ndev, &NPU2_PHY_TX_CLKDIST_PDWN, 0); |
| phy_write(ndev, &NPU2_PHY_RX_CTL_DATASM_CLKDIST_PDWN, 0); |
| |
| FOR_EACH_LANE(ndev, lane) |
| phy_write_lane(ndev, &NPU2_PHY_RX_RUN_LANE, lane, 0); |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| static uint32_t phy_reset_wait(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| /* Wait for all lanes to become inactive */ |
| FOR_EACH_LANE(ndev, lane) |
| if (phy_read_lane(ndev, &NPU2_PHY_RX_LANE_BUSY, lane)) |
| return PROCEDURE_INPROGRESS; |
| |
| FOR_EACH_LANE(ndev, lane) { |
| /* Set lane in reset */ |
| phy_write_lane(ndev, &NPU2_PHY_RX_IORESET, lane, 1); |
| phy_write_lane(ndev, &NPU2_PHY_TX_IORESET, lane, 1); |
| |
| /* Release lane from reset */ |
| phy_write_lane(ndev, &NPU2_PHY_RX_IORESET, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_TX_IORESET, lane, 0); |
| |
| /* Reset the phase rotator */ |
| phy_write_lane(ndev, &NPU2_PHY_RX_PR_RESET, lane, 1); |
| phy_write_lane(ndev, &NPU2_PHY_RX_PR_RESET, lane, 0); |
| } |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| /* Procedure 1.2.3 - Initialise I/O PHY Registers */ |
| static uint32_t phy_reset_complete(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| FOR_EACH_LANE(ndev, lane) { |
| phy_write_lane(ndev, &NPU2_PHY_RX_LANE_ANA_PDWN, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_RX_LANE_DIG_PDWN, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_RX_PR_IQ_RES_SEL, lane, 0x7); |
| phy_write_lane(ndev, &NPU2_PHY_RX_PR_PHASE_STEP, lane, 0xc); |
| phy_write_lane(ndev, &NPU2_PHY_TX_LANE_PDWN, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_RX_PR_FW_INERTIA_AMT, lane, 4); |
| phy_write_lane(ndev, &NPU2_PHY_RX_CFG_LTE_MC, lane, 3); |
| phy_write_lane(ndev, &NPU2_PHY_RX_A_INTEG_COARSE_GAIN, lane, 11); |
| phy_write_lane(ndev, &NPU2_PHY_RX_B_INTEG_COARSE_GAIN, lane, 11); |
| phy_write_lane(ndev, &NPU2_PHY_RX_E_INTEG_COARSE_GAIN, lane, 11); |
| |
| if (ndev->type == NPU2_DEV_TYPE_OPENCAPI) { |
| phy_write_lane(ndev, &NPU2_PHY_RX_A_CTLE_GAIN, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_RX_B_CTLE_GAIN, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_RX_E_CTLE_GAIN, lane, 0); |
| |
| phy_write_lane(ndev, &NPU2_PHY_RX_A_CTLE_COARSE, lane, 20); |
| phy_write_lane(ndev, &NPU2_PHY_RX_B_CTLE_COARSE, lane, 20); |
| phy_write_lane(ndev, &NPU2_PHY_RX_E_CTLE_COARSE, lane, 20); |
| } |
| } |
| |
| set_iovalid(ndev, true); |
| |
| return PROCEDURE_COMPLETE; |
| } |
| DEFINE_PROCEDURE(phy_reset, phy_reset_wait, phy_reset_complete); |
| |
| /* Procedure 1.2.6 - I/O PHY Tx Impedance Calibration */ |
| static uint32_t phy_tx_zcal(struct npu2_dev *ndev) |
| { |
| if (ndev->npu->tx_zcal_complete[obus_index(ndev)]) |
| return PROCEDURE_COMPLETE; |
| |
| /* Turn off SW enable and enable zcal state machine */ |
| phy_write(ndev, &NPU2_PHY_TX_ZCAL_SWO_EN, 0); |
| |
| /* Start impedance calibration state machine */ |
| phy_write(ndev, &NPU2_PHY_TX_ZCAL_REQ, 1); |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| static uint32_t phy_tx_zcal_wait(struct npu2_dev *ndev) |
| { |
| int done, error; |
| |
| done = phy_read(ndev, &NPU2_PHY_TX_ZCAL_DONE); |
| error = phy_read(ndev, &NPU2_PHY_TX_ZCAL_ERROR); |
| |
| /* We have never seen this in the field and it is not expected. |
| * Therefore it's best to error out which will complain loudly. Nominal |
| * vaules may be set in nvram to ignore this error. */ |
| if (error && nv_zcal_nominal < 0) { |
| NPU2DEVERR(ndev, "ZCAL failed. Nominal values may be used by" |
| " setting nvram variable nv_zcal_override = 50\n"); |
| NPU2DEVERR(ndev, "However this may impact link performance\n"); |
| return PROCEDURE_COMPLETE | PROCEDURE_FAILED; |
| } |
| |
| if (!done) |
| return PROCEDURE_INPROGRESS; |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| #define MARGIN_RATIO (0) |
| #define FFE_PRE_COEFF (0) |
| #define FFE_POST_COEFF (0) |
| |
| #define PRE_WIDTH (5) |
| #define POST_WIDTH (7) |
| #define MAIN_WIDTH (7) |
| #define ZCAL_MIN (16 * 2) |
| #define ZCAL_MAX (33 * 2) |
| #define PRECURSOR_X2_MAX (4 * 2 + 1) |
| #define POSTCURSOR_X2_MAX (6 * 2 + 1) |
| #define MARGIN_X2_MAX (8 * 2) |
| #define MAIN_X2_MAX ((6 * 2) + 1) |
| #define TOTAL_X2_MAX (PRECURSOR_X2_MAX + POSTCURSOR_X2_MAX + 2*MARGIN_X2_MAX + MAIN_X2_MAX) |
| |
| static uint32_t therm(uint32_t dec) |
| { |
| return ((0x1 << dec) - 1); |
| } |
| |
| static uint32_t therm_with_half(uint32_t dec, uint8_t width) |
| { |
| /* If the LSB of the 2r equivalent is on, then we need to set the 2r bit (MSB) */ |
| uint32_t half_on = ( dec & 0x1 ) << ( width - 1 ); |
| |
| /* Shift the 2r equivalent to a 1r value and convert to a thermometer code. */ |
| uint32_t x1_equiv = ((1 << (dec >> 1 )) - 1); |
| |
| /* Combine 1r equivalent thermometer code + the 2r MSB value. */ |
| return half_on | x1_equiv; |
| } |
| |
| static uint32_t phy_tx_zcal_calculate(struct npu2_dev *ndev) |
| { |
| int p_value, n_value; |
| int ffe_pre_coeff = FFE_PRE_COEFF; |
| int ffe_post_coeff = FFE_POST_COEFF; |
| uint32_t zcal_n; |
| uint32_t zcal_p; |
| uint32_t p_main_enable = MAIN_X2_MAX; |
| uint32_t p_margin_pu_enable = MARGIN_X2_MAX; |
| uint32_t p_margin_pd_enable = MARGIN_X2_MAX; |
| uint32_t p_precursor_select; |
| uint32_t p_postcursor_select; |
| uint32_t margin_pu_select; |
| uint32_t n_main_enable = MAIN_X2_MAX; |
| uint32_t n_margin_pu_enable = MARGIN_X2_MAX; |
| uint32_t n_margin_pd_enable = MARGIN_X2_MAX; |
| uint32_t n_precursor_select; |
| uint32_t n_postcursor_select; |
| uint32_t margin_pd_select; |
| uint32_t margin_select; |
| |
| if (nv_zcal_nominal < 0) { |
| /* Convert the value from 8R to 2R by / 4 */ |
| zcal_n = phy_read(ndev, &NPU2_PHY_TX_ZCAL_N) / 4; |
| zcal_p = phy_read(ndev, &NPU2_PHY_TX_ZCAL_P) / 4; |
| } else { |
| zcal_n = zcal_p = nv_zcal_nominal; |
| NPU2DEVINF(ndev, "Using nominal values for zcal, performance may be impacted\n"); |
| } |
| |
| /* Again, if the hardware detects an unexpected condition it's |
| * better just to fail loudly. */ |
| if ((zcal_n < ZCAL_MIN) || (zcal_n > ZCAL_MAX) || |
| (zcal_p < ZCAL_MIN) || (zcal_p > ZCAL_MAX)) |
| return PROCEDURE_COMPLETE | PROCEDURE_FAILED; |
| |
| if (ndev->type == NPU2_DEV_TYPE_OPENCAPI && |
| platform.ocapi->phy_setup) { |
| ffe_pre_coeff = platform.ocapi->phy_setup->tx_ffe_pre_coeff; |
| ffe_post_coeff = platform.ocapi->phy_setup->tx_ffe_post_coeff; |
| } |
| |
| p_value = zcal_p - TOTAL_X2_MAX; |
| p_precursor_select = (p_value * ffe_pre_coeff)/128; |
| p_postcursor_select = (p_value * ffe_post_coeff)/128; |
| margin_pu_select = (p_value * MARGIN_RATIO)/256; |
| |
| if (p_value % 2) { |
| p_main_enable--; |
| p_value++; |
| } |
| |
| while (p_value < 0) { |
| if (p_main_enable > 1) { |
| p_main_enable -= 2; |
| } else if ((p_margin_pu_enable + p_margin_pd_enable) > 0) { |
| if (p_margin_pu_enable == p_margin_pd_enable) |
| p_margin_pd_enable -= 2; |
| else |
| p_margin_pu_enable -= 2; |
| } |
| p_value += 2; |
| } |
| |
| n_value = zcal_n - TOTAL_X2_MAX; |
| n_precursor_select = (n_value * ffe_pre_coeff)/128; |
| n_postcursor_select = (n_value * ffe_post_coeff)/128; |
| margin_pd_select = (p_value * MARGIN_RATIO)/256; |
| |
| if (n_value % 2) { |
| n_main_enable--; |
| n_value++; |
| } |
| |
| while (n_value < 0) { |
| if (n_main_enable > 1) { |
| n_main_enable -= 2; |
| } else if ((n_margin_pu_enable + n_margin_pd_enable) > 0) { |
| if (n_margin_pu_enable == n_margin_pd_enable) |
| n_margin_pd_enable -= 2; |
| else |
| n_margin_pu_enable -= 2; |
| } |
| n_value += 2; |
| } |
| |
| margin_select = therm((margin_pu_select + 1)/2) & |
| therm((margin_pd_select + 1)/2) & |
| therm((p_margin_pu_enable + 1)/2) & |
| therm((p_margin_pd_enable + 1)/2) & |
| therm((n_margin_pu_enable + 1)/2) & |
| therm((n_margin_pd_enable + 1)/2); |
| |
| phy_write(ndev, &NPU2_PHY_TX_PSEG_PRE_EN, therm_with_half(PRECURSOR_X2_MAX, PRE_WIDTH)); |
| phy_write(ndev, &NPU2_PHY_TX_PSEG_PRE_SELECT, therm_with_half(p_precursor_select, PRE_WIDTH)); |
| phy_write(ndev, &NPU2_PHY_TX_PSEG_POST_EN, therm_with_half(POSTCURSOR_X2_MAX, POST_WIDTH)); |
| phy_write(ndev, &NPU2_PHY_TX_PSEG_POST_SELECT, therm_with_half(p_postcursor_select, POST_WIDTH)); |
| phy_write(ndev, &NPU2_PHY_TX_PSEG_MARGINPU_EN, therm((p_margin_pu_enable + 1)/2)); |
| phy_write(ndev, &NPU2_PHY_TX_PSEG_MARGINPD_EN, therm((p_margin_pd_enable + 1)/2)); |
| phy_write(ndev, &NPU2_PHY_TX_PSEG_MAIN_EN, therm_with_half(p_main_enable, MAIN_WIDTH)); |
| |
| phy_write(ndev, &NPU2_PHY_TX_NSEG_PRE_EN, therm_with_half(PRECURSOR_X2_MAX, PRE_WIDTH)); |
| phy_write(ndev, &NPU2_PHY_TX_NSEG_PRE_SELECT, therm_with_half(n_precursor_select, PRE_WIDTH)); |
| phy_write(ndev, &NPU2_PHY_TX_NSEG_POST_EN, therm_with_half(POSTCURSOR_X2_MAX, POST_WIDTH)); |
| phy_write(ndev, &NPU2_PHY_TX_NSEG_POST_SELECT, therm_with_half(n_postcursor_select, POST_WIDTH)); |
| phy_write(ndev, &NPU2_PHY_TX_NSEG_MARGINPU_EN, therm((n_margin_pu_enable + 1)/2)); |
| phy_write(ndev, &NPU2_PHY_TX_NSEG_MARGINPD_EN, therm((n_margin_pd_enable + 1)/2)); |
| phy_write(ndev, &NPU2_PHY_TX_NSEG_MAIN_EN, therm_with_half(n_main_enable, MAIN_WIDTH)); |
| |
| phy_write(ndev, &NPU2_PHY_TX_MARGINPU_SELECT, therm(margin_select + 1)/2); |
| phy_write(ndev, &NPU2_PHY_TX_MARGINPD_SELECT, therm(margin_select + 1)/2); |
| |
| ndev->npu->tx_zcal_complete[obus_index(ndev)] = 1; |
| return PROCEDURE_COMPLETE; |
| } |
| DEFINE_PROCEDURE(phy_tx_zcal, phy_tx_zcal_wait, phy_tx_zcal_calculate); |
| |
| /* Procedure 1.2.8 - Enable Downstream Link Training */ |
| static uint32_t phy_enable_tx_rxcal(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| FOR_EACH_LANE(ndev, lane) |
| phy_write_lane(ndev, &NPU2_PHY_TX_RXCAL, lane, 1); |
| |
| return PROCEDURE_COMPLETE; |
| } |
| DEFINE_PROCEDURE(phy_enable_tx_rxcal); |
| |
| /* Procedure 1.2.9 - Disable Downstream Link Training */ |
| static uint32_t phy_disable_tx_rxcal(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| FOR_EACH_LANE(ndev, lane) |
| phy_write_lane(ndev, &NPU2_PHY_TX_RXCAL, lane, 0); |
| |
| return PROCEDURE_COMPLETE; |
| } |
| DEFINE_PROCEDURE(phy_disable_tx_rxcal); |
| |
| /* Procedure 1.2.4 - I/O PHY DC Calibration */ |
| static uint32_t phy_rx_dccal(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| set_iovalid(ndev, false); |
| |
| FOR_EACH_LANE(ndev, lane) |
| phy_write_lane(ndev, &NPU2_PHY_RX_PR_FW_OFF, lane, 1); |
| |
| FOR_EACH_LANE(ndev, lane) |
| phy_write_lane(ndev, &NPU2_PHY_RX_RUN_DCCAL, lane, 1); |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| static uint32_t phy_rx_dccal_complete(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| FOR_EACH_LANE(ndev, lane) |
| if (!phy_read_lane(ndev, &NPU2_PHY_RX_DCCAL_DONE, lane)) |
| return PROCEDURE_INPROGRESS; |
| |
| FOR_EACH_LANE(ndev, lane) |
| phy_write_lane(ndev, &NPU2_PHY_RX_RUN_DCCAL, lane, 0); |
| |
| FOR_EACH_LANE(ndev, lane) { |
| phy_write_lane(ndev, &NPU2_PHY_RX_B_BANK_CONTROLS, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_RX_PR_EDGE_TRACK_CNTL, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_RX_PR_FW_OFF, lane, 0); |
| } |
| |
| set_iovalid(ndev, true); |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| static uint32_t phy_rx_clock_sel(struct npu2_dev *ndev) |
| { |
| if (ndev->type != NPU2_DEV_TYPE_OPENCAPI) { |
| /* |
| * Change the RX clk mux control to be done by |
| * software instead of HW. This avoids glitches caused |
| * by changing the mux setting. |
| * |
| * Work around a known DL bug by doing these writes |
| * twice. |
| */ |
| npu2_write_mask_4b(ndev->npu, NPU2_NTL_DL_CLK_CTRL(ndev), |
| 0x80000002, 0x80000003); |
| npu2_write_mask_4b(ndev->npu, NPU2_NTL_DL_CLK_CTRL(ndev), |
| 0x80000002, 0x80000003); |
| |
| npu2_write_mask_4b(ndev->npu, NPU2_NTL_DL_CLK_CTRL(ndev), |
| 0x80000000, 0x80000003); |
| npu2_write_mask_4b(ndev->npu, NPU2_NTL_DL_CLK_CTRL(ndev), |
| 0x80000000, 0x80000003); |
| } |
| return PROCEDURE_NEXT; |
| } |
| |
| /* Procedure 1.2.5 - IO PHY Tx FIFO Init */ |
| static uint32_t phy_tx_fifo_init(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| FOR_EACH_LANE(ndev, lane) { |
| phy_write_lane(ndev, &NPU2_PHY_TX_UNLOAD_CLK_DISABLE, lane, 0); |
| phy_write_lane(ndev, &NPU2_PHY_TX_FIFO_INIT, lane, 1); |
| phy_write_lane(ndev, &NPU2_PHY_TX_UNLOAD_CLK_DISABLE, lane, 1); |
| } |
| |
| return PROCEDURE_COMPLETE; |
| } |
| |
| /* We group TX FIFO init in here mainly because that's what was done |
| * on NVLink1 */ |
| DEFINE_PROCEDURE(phy_rx_dccal, phy_rx_dccal_complete, phy_rx_clock_sel, |
| phy_tx_fifo_init); |
| |
| /* Procedure 1.2.7 - I/O PHY Upstream Link Training */ |
| static uint32_t phy_rx_training(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| FOR_EACH_LANE(ndev, lane) |
| phy_write_lane(ndev, &NPU2_PHY_RX_RUN_LANE, lane, 1); |
| |
| return PROCEDURE_NEXT; |
| } |
| |
| static uint32_t phy_rx_training_wait(struct npu2_dev *ndev) |
| { |
| int lane; |
| |
| FOR_EACH_LANE(ndev, lane) |
| if (!phy_read_lane(ndev, &NPU2_PHY_RX_INIT_DONE, lane)) |
| return PROCEDURE_INPROGRESS; |
| |
| return PROCEDURE_COMPLETE; |
| } |
| DEFINE_PROCEDURE(phy_rx_training, phy_rx_training_wait); |
| |
| static uint32_t check_credit(struct npu2_dev *ndev, uint64_t reg, |
| const char *reg_name, uint64_t expected) |
| { |
| uint64_t val; |
| |
| val = npu2_read(ndev->npu, reg); |
| if (val == expected) |
| return 0; |
| |
| NPU2DEVERR(ndev, "%s: expected 0x%llx, read 0x%llx\n", |
| reg_name, expected, val); |
| |
| return 1; |
| } |
| |
| #define CHECK_CREDIT(ndev, reg, expected) \ |
| check_credit(ndev, reg(ndev), #reg, expected); |
| |
| static uint32_t check_credits(struct npu2_dev *ndev) |
| { |
| uint64_t val; |
| |
| CHECK_CREDIT(ndev, NPU2_NTL_CRED_HDR_CREDIT_RX, 0x0BE0BE0000000000ULL); |
| CHECK_CREDIT(ndev, NPU2_NTL_RSP_HDR_CREDIT_RX, 0x0BE0BE0000000000ULL); |
| CHECK_CREDIT(ndev, NPU2_NTL_CRED_DATA_CREDIT_RX, 0x1001000000000000ULL); |
| CHECK_CREDIT(ndev, NPU2_NTL_RSP_DATA_CREDIT_RX, 0x1001000000000000ULL); |
| CHECK_CREDIT(ndev, NPU2_NTL_DBD_HDR_CREDIT_RX, 0x0640640000000000ULL); |
| CHECK_CREDIT(ndev, NPU2_NTL_ATSD_HDR_CREDIT_RX, 0x0200200000000000ULL); |
| |
| val = npu2_read(ndev->npu, NPU2_NTL_MISC_CFG1(ndev)); |
| val &= 0xFF3FFFFFFFFFFFFFUL; |
| npu2_write(ndev->npu, NPU2_NTL_MISC_CFG1(ndev), val); |
| |
| if (!poll_fence_status(ndev, 0x0)) |
| return PROCEDURE_COMPLETE | PROCEDURE_FAILED; |
| |
| val = NPU2_NTL_MISC_CFG2_NDL_RX_PARITY_ENA; |
| npu2_write_mask(ndev->npu, NPU2_NTL_MISC_CFG2(ndev), val, val); |
| |
| return PROCEDURE_COMPLETE; |
| } |
| DEFINE_PROCEDURE(check_credits); |
| |
| static struct procedure *npu_procedures[] = { |
| &procedure_stop, |
| &procedure_nop, |
| NULL, |
| NULL, |
| &procedure_phy_reset, |
| &procedure_phy_tx_zcal, |
| &procedure_phy_rx_dccal, |
| &procedure_phy_enable_tx_rxcal, |
| &procedure_phy_disable_tx_rxcal, |
| &procedure_phy_rx_training, |
| &procedure_reset_ntl, |
| |
| /* Place holders for pre-terminate and terminate procedures */ |
| &procedure_nop, |
| &procedure_nop, |
| &procedure_check_credits |
| }; |
| |
| /* Run a procedure step(s) and return status */ |
| static uint32_t get_procedure_status(struct npu2_dev *dev) |
| { |
| uint32_t result; |
| uint16_t procedure = dev->procedure_number; |
| uint16_t step = dev->procedure_step; |
| const char *name = npu_procedures[procedure]->name; |
| |
| do { |
| result = npu_procedures[procedure]->steps[step](dev); |
| |
| if (result & PROCEDURE_NEXT) { |
| step++; |
| NPU2DEVINF(dev, "Running procedure %s step %d\n", name, step); |
| } |
| } while (result & PROCEDURE_NEXT); |
| |
| dev->procedure_step = step; |
| |
| if (result & PROCEDURE_COMPLETE) |
| NPU2DEVINF(dev, "Procedure %s complete\n", name); |
| else if (mftb() > dev->procedure_tb + msecs_to_tb(1000)) { |
| NPU2DEVINF(dev, "Procedure %s timed out\n", name); |
| result = PROCEDURE_COMPLETE | PROCEDURE_FAILED; |
| } |
| |
| /* Mask off internal state bits */ |
| dev->procedure_status = result & PROCEDURE_STATUS_MASK; |
| |
| return dev->procedure_status; |
| } |
| |
| static int64_t npu_dev_procedure_read(struct npu2_dev *dev, uint32_t offset, |
| uint32_t size, uint32_t *data) |
| { |
| int64_t rc = OPAL_SUCCESS; |
| |
| if (size != 4) { |
| /* Short config reads are not supported */ |
| prlog(PR_ERR, "NPU%d: Short read of procedure register\n", npu2_dev_to_phb(dev)->opal_id); |
| return OPAL_PARAMETER; |
| } |
| |
| *data = 0; |
| |
| switch (offset) { |
| case 0: |
| /* Only run the procedure if not already complete */ |
| if (dev->procedure_status & PROCEDURE_COMPLETE) |
| *data = dev->procedure_status; |
| else |
| *data = get_procedure_status(dev); |
| |
| break; |
| |
| case 4: |
| *data = dev->procedure_number; |
| break; |
| |
| default: |
| prlog(PR_ERR, "NPU%d: Invalid vendor specific offset 0x%08x\n", |
| npu2_dev_to_phb(dev)->opal_id, offset); |
| rc = OPAL_PARAMETER; |
| } |
| |
| return rc; |
| } |
| |
| static int64_t npu_dev_procedure_write(struct npu2_dev *dev, uint32_t offset, |
| uint32_t size, uint32_t data) |
| { |
| const char *name; |
| int64_t rc = OPAL_SUCCESS; |
| |
| if (size != 4) { |
| /* Short config writes are not supported */ |
| prlog(PR_ERR, "NPU%d: Short read of procedure register\n", |
| npu2_dev_to_phb(dev)->opal_id); |
| return OPAL_PARAMETER; |
| } |
| |
| switch (offset) { |
| case 0: |
| /* We ignore writes to the status register */ |
| NPU2DEVINF(dev, "Ignoring writes to status register\n"); |
| break; |
| |
| case 4: |
| if (data >= ARRAY_SIZE(npu_procedures) || |
| !npu_procedures[data]) { |
| NPU2DEVINF(dev, "Unsupported procedure number %d\n", data); |
| dev->procedure_status = PROCEDURE_COMPLETE |
| | PROCEDURE_UNSUPPORTED; |
| break; |
| } |
| |
| name = npu_procedures[data]->name; |
| if (dev->procedure_number == data |
| && !(dev->procedure_status & PROCEDURE_COMPLETE)) |
| NPU2DEVINF(dev, "Restarting procedure %s\n", name); |
| else |
| NPU2DEVINF(dev, "Starting procedure %s\n", name); |
| |
| dev->procedure_status = PROCEDURE_INPROGRESS; |
| dev->procedure_number = data; |
| dev->procedure_step = 0; |
| dev->procedure_tb = mftb(); |
| break; |
| |
| default: |
| NPU2DEVINF(dev, "Invalid vendor specific offset 0x%08x\n", offset); |
| rc = OPAL_PARAMETER; |
| } |
| |
| return rc; |
| } |
| |
| int64_t npu2_dev_procedure(void *dev, struct pci_cfg_reg_filter *pcrf, |
| uint32_t offset, uint32_t len, uint32_t *data, |
| bool write) |
| { |
| struct pci_virt_device *pvd = dev; |
| struct npu2_dev *ndev = pvd->data; |
| |
| if (write) |
| return npu_dev_procedure_write(ndev, offset - pcrf->start, |
| len, *data); |
| |
| return npu_dev_procedure_read(ndev, offset - pcrf->start, len, data); |
| } |
| |
| void npu2_dev_procedure_reset(struct npu2_dev *dev) |
| { |
| uint64_t val; |
| |
| /* Fence the brick */ |
| val = npu2_read(dev->npu, NPU2_NTL_MISC_CFG1(dev)); |
| val |= PPC_BIT(8) | PPC_BIT(9); |
| npu2_write(dev->npu, NPU2_NTL_MISC_CFG1(dev), val); |
| |
| npu2_clear_link_flag(dev, NPU2_DEV_DL_RESET); |
| } |
| |
| static uint32_t run_procedure(struct npu2_dev *dev, uint16_t procedure_number) |
| { |
| struct procedure *proc; |
| const char *name; |
| uint32_t result; |
| |
| assert(procedure_number <= ARRAY_SIZE(npu_procedures)); |
| proc = npu_procedures[procedure_number]; |
| assert(proc); |
| |
| name = proc->name; |
| NPU2DEVINF(dev, "Running procedure %s\n", name); |
| dev->procedure_status = PROCEDURE_INPROGRESS; |
| dev->procedure_number = procedure_number; |
| dev->procedure_step = 0; |
| dev->procedure_tb = mftb(); |
| |
| result = get_procedure_status(dev); |
| while (!(result & PROCEDURE_COMPLETE)) { |
| time_wait_ms(1); |
| result = get_procedure_status(dev); |
| } |
| return result; |
| } |
| |
| void npu2_opencapi_bump_ui_lane(struct npu2_dev *dev) |
| { |
| uint64_t reg; |
| uint64_t status_xscom; |
| int lane, bit = 7; |
| |
| status_xscom = OB_ODL_TRAINING_STATUS(dev->brick_index); |
| xscom_read(dev->npu->chip_id, status_xscom, ®); |
| reg = GETFIELD(OB_ODL_TRAINING_STATUS_STS_RX_PATTERN_B, reg); |
| |
| FOR_EACH_LANE(dev, lane) { |
| if (reg & (1 << bit--)) |
| continue; |
| prlog(PR_TRACE, "OCAPI: bumpui bumping lane %d\n", lane); |
| for (int i = 0; i < 4; i++) { |
| phy_write_lane(dev, &NPU2_PHY_RX_PR_BUMP_SL_1UI, lane, 1); |
| phy_write_lane(dev, &NPU2_PHY_RX_PR_BUMP_SL_1UI, lane, 0); |
| } |
| } |
| } |
| |
| void npu2_opencapi_phy_init(struct npu2_dev *dev) |
| { |
| if (platform.ocapi->phy_setup) { |
| OCAPIINF(dev, "Enabling platform-specific PHY setup\n"); |
| phy_write(dev, &NPU2_PHY_TX_FFE_BOOST_EN, |
| platform.ocapi->phy_setup->tx_ffe_boost_en); |
| } |
| |
| run_procedure(dev, 5); /* procedure_phy_tx_zcal */ |
| /* |
| * This is only required for OpenCAPI - Hostboot tries to set this |
| * on systems where it can tell a link is OpenCAPI, but for |
| * Witherspoon it needs to be done in skiboot after device detection. |
| */ |
| phy_write(dev, &NPU2_PHY_RX_RC_ENABLE_AUTO_RECAL, 0x1); |
| phy_write(dev, &NPU2_PHY_RX_AC_COUPLED, 1); |
| |
| switch (dev->link_speed) { |
| case 20000000000UL: |
| OCAPIINF(dev, "Link speed set at 20Gb/s\n"); |
| phy_write(dev, &NPU2_PHY_RX_SPEED_SELECT, 1); |
| break; |
| case 25000000000UL: |
| case 25781250000UL: |
| OCAPIINF(dev, "Link speed set at 25.xGb/s\n"); |
| phy_write(dev, &NPU2_PHY_RX_SPEED_SELECT, 0); |
| break; |
| default: |
| OCAPIERR(dev, "Invalid link speed!\n"); |
| assert(false); |
| } |
| } |
| |
| int npu2_opencapi_phy_reset(struct npu2_dev *dev) |
| { |
| int rc; |
| |
| rc = run_procedure(dev, 4); /* procedure_phy_reset */ |
| if (rc != PROCEDURE_COMPLETE) |
| return -1; |
| rc = run_procedure(dev, 6); /* procedure_phy_rx_dccal */ |
| if (rc != PROCEDURE_COMPLETE) |
| return -1; |
| return 0; |
| } |
| |
| void npu2_opencapi_phy_prbs31(struct npu2_dev *dev) |
| { |
| phy_write(dev, &NPU2_PHY_TX_DRV_DATA_PATTERN_GCRMSG, 0xD); |
| } |