platforms/astbmc/witherspoon.c - skiboot - Git at Google

 // SPDX-License-Identifier: Apache-2.0 OR GPL-2.0-or-later
 /* Copyright 2017-2019 IBM Corp. */

 #include <skiboot.h>
 #include <device.h>
 #include <console.h>
 #include <chip.h>
 #include <ipmi.h>
 #include <psi.h>
 #include <npu-regs.h>
 #include <xscom.h>
 #include <xscom-p9-regs.h>
 #include <timebase.h>
 #include <pci.h>
 #include <pci-slot.h>
 #include <phb4.h>
 #include <npu2.h>
 #include <occ.h>
 #include <i2c.h>
 #include <secvar.h>

 #include "astbmc.h"
 #include "ast.h"

 /*
  * Witherspoon planar variant. Set by witherspoon_probe() from the highest
  * "ibm,npu-group-id" found on the "ibm,npu-link" nodes, then consulted by
  * the NPU2 device detection and the NVLink device-tree code in this file.
  */
 static enum {
 	WITHERSPOON_TYPE_UNKNOWN,	/* any other group id; NVLink peer wiring is skipped */
 	WITHERSPOON_TYPE_SEQUOIA,	/* highest group id 2; treated as the 6-GPU planar */
 	WITHERSPOON_TYPE_REDBUD		/* highest group id 1; treated as the 4-GPU planar */
 } witherspoon_type;

 /*
  * HACK: Hostboot doesn't export the correct data for the system VPD EEPROM
  *       on this system, so the node is patched by hand: its "compatible"
  *       and "label" properties are replaced with known-good values.
  *       Nothing happens when the EEPROM node is absent.
  */
 static void vpd_dt_fixup(void)
 {
 	static const char eeprom_path[] =
 		"/xscom@603fc00000000/i2cm@a2000/i2c-bus@0/eeprom@50";
 	struct dt_node *eeprom = dt_find_by_path(dt_root, eeprom_path);

 	if (!eeprom)
 		return;

 	/* Drop whatever Hostboot provided before adding the fixed value */
 	dt_check_del_prop(eeprom, "compatible");
 	dt_add_property_string(eeprom, "compatible", "atmel,24c512");

 	dt_check_del_prop(eeprom, "label");
 	dt_add_property_string(eeprom, "label", "system-vpd");
 }

 /*
  * Make sure every "ibm,xscom" node has an i2c-bus@4 child below its
  * i2cm@a1000 engine (the bus used for the OCAPI reset, per the log
  * message). Chips without that engine are reported and skipped; a bus
  * node that already exists is left untouched.
  */
 static void witherspoon_create_ocapi_i2c_bus(void)
 {
 	struct dt_node *chip_node, *engine, *bus;

 	prlog(PR_DEBUG, "OCAPI: Adding I2C bus device node for OCAPI reset\n");

 	dt_for_each_compatible(dt_root, chip_node, "ibm,xscom") {
 		engine = dt_find_by_name(chip_node, "i2cm@a1000");
 		if (!engine) {
 			prlog(PR_ERR, "OCAPI: Failed to add I2C bus device node\n");
 			continue;
 		}

 		/* Only create the port when it is not there yet */
 		if (!dt_find_by_name(engine, "i2c-bus@4")) {
 			bus = dt_new_addr(engine, "i2c-bus", 4);
 			dt_add_property_cells(bus, "reg", 4);
 			/* 0x61a80 == 400000 */
 			dt_add_property_cells(bus, "bus-frequency", 0x61a80);
 			dt_add_property_strings(bus, "compatible",
 						"ibm,opal-i2c",
 						"ibm,power8-i2c-port",
 						"ibm,power9-i2c-port");
 		}
 	}
 }

 /*
  * Platform probe hook.
  *
  * Returns false unless the device-tree root is compatible with
  * "ibm,witherspoon". Otherwise runs the early BMC/UART setup and the
  * device-tree fixups, derives witherspoon_type from the highest
  * "ibm,npu-group-id" seen on the "ibm,npu-link" nodes, and returns true.
  */
 static bool witherspoon_probe(void)
 {
 	struct dt_node *link;
 	int max_group = 0;
 	int group;

 	if (!dt_node_is_compatible(dt_root, "ibm,witherspoon"))
 		return false;

 	/* Lot of common early inits here */
 	astbmc_early_init();

 	/* Setup UART for use by OPAL (Linux hvc) */
 	uart_set_console_policy(UART_CONSOLE_OPAL);

 	vpd_dt_fixup();

 	witherspoon_create_ocapi_i2c_bus();

 	/* The largest GPU group id tells the planar variants apart */
 	dt_for_each_compatible(dt_root, link, "ibm,npu-link") {
 		group = dt_prop_get_u32(link, "ibm,npu-group-id");
 		if (group > max_group)
 			max_group = group;
 	}

 	if (max_group == 1) {
 		witherspoon_type = WITHERSPOON_TYPE_REDBUD;
 	} else if (max_group == 2) {
 		witherspoon_type = WITHERSPOON_TYPE_SEQUOIA;
 	} else {
 		witherspoon_type = WITHERSPOON_TYPE_UNKNOWN;
 		prlog(PR_NOTICE, "PLAT: Unknown Witherspoon variant detected\n");
 	}

 	return true;
 }

 static void phb4_activate_shared_slot_witherspoon(struct proc_chip *chip)
 {
 	uint64_t val;

 	/*
 	 * Shared slot activation is done by raising a GPIO line on the
 	 * chip with the secondary slot. It will somehow activate the
 	 * sideband signals between the slots.
 	 * Need to wait 100us for stability.
 	 */
 	xscom_read(chip->id, P9_GPIO_DATA_OUT_ENABLE, &val);
 	val |= PPC_BIT(2);
 	xscom_write(chip->id, P9_GPIO_DATA_OUT_ENABLE, val);

 	xscom_read(chip->id, P9_GPIO_DATA_OUT, &val);
 	val |= PPC_BIT(2);
 	xscom_write(chip->id, P9_GPIO_DATA_OUT, val);
 	time_wait_us(100);
 	prlog(PR_INFO, "Shared PCI slot activated\n");
 }

 /*
  * pre_pci_fixup hook: detect a x16 card on the shared slot and, if one is
  * found, activate the slot and link the two pci_slot halves as peers.
  */
 static void witherspoon_shared_slot_fixup(void)
 {
 	struct proc_chip *first_chip, *second_chip;
 	struct pci_slot *primary, *secondary;
 	uint8_t primary_present = 0, secondary_present = 0;

 	/*
 	 * The shared slot, a.k.a "Slot 2" in the documentation, is
 	 * connected to PEC2 phb index 3 on both chips. From skiboot,
 	 * it looks like two x8 slots, each with its own presence bit.
 	 *
 	 * Possible presence combinations:
 	 *
 	 * slot0 presence     slot1 presence
 	 *    0                  0               => no card
 	 *    1                  0               => x8 or less card detected
 	 *    1                  1               => x16 card detected
 	 *    0                  1               => invalid combination
 	 *
 	 * Only the x16 case ('1 1') triggers any action.
 	 *
 	 * We cannot tell a shared-slot-compatible card (such as
 	 * Mellanox CX5) from a 'normal' x16 PCI card, so the shared slot
 	 * is activated for both, as it doesn't seem to hurt.
 	 *
 	 * With a normal x16 card the link won't train on the second slot
 	 * (nothing to do with the shared slot activation) and the
 	 * procedure times out, which delays the boot. The recommendation
 	 * is therefore not to use a normal x16 card on the shared slot of
 	 * a witherspoon.
 	 *
 	 * A x8 or less adapter on the shared slot should work like on any
 	 * other physical slot.
 	 */
 	first_chip = next_chip(NULL);
 	second_chip = next_chip(first_chip);
 	if (!second_chip || next_chip(second_chip)) {
 		prlog(PR_WARNING,
 		      "PLAT: Can't find second chip, "
 		      "skipping PCIe shared slot detection\n");
 		return;
 	}

 	/* the shared slot is connected to PHB3 on both chips */
 	primary = pci_slot_find(phb4_get_opal_id(first_chip->id, 3));
 	secondary = pci_slot_find(phb4_get_opal_id(second_chip->id, 3));
 	if (!primary || !secondary)
 		return;

 	/* A slot without a presence callback counts as empty */
 	if (primary->ops.get_presence_state)
 		primary->ops.get_presence_state(primary, &primary_present);
 	if (secondary->ops.get_presence_state)
 		secondary->ops.get_presence_state(secondary,
 						  &secondary_present);

 	if (primary_present != 1 || secondary_present != 1)
 		return;

 	phb4_activate_shared_slot_witherspoon(second_chip);
 	primary->peer_slot = secondary;
 	secondary->peer_slot = primary;
 }

 /*
  * pci_walk_dev() callback: returns 1 when @dev is one of the listed
  * Mellanox ConnectX adapters (vendor 0x15b3), 0 otherwise. @phb and
  * @userdata are unused.
  *
  * The device-id table is static const so it is not rebuilt on the stack
  * for every device visited by the walk.
  */
 static int check_mlx_cards(struct phb *phb __unused, struct pci_device *dev,
 			   void *userdata __unused)
 {
 	static const uint16_t mlx_cards[] = {
 		0x1017, /* ConnectX-5 */
 		0x1019, /* ConnectX-5 Ex */
 		0x101b, /* ConnectX-6 */
 		0x101d, /* ConnectX-6 Dx */
 		0x101f, /* ConnectX-6 Lx */
 		0x1021, /* ConnectX-7 */
 	};
 	size_t i;

 	if (PCI_VENDOR_ID(dev->vdid) != 0x15b3) /* Mellanox */
 		return 0;

 	for (i = 0; i < ARRAY_SIZE(mlx_cards); i++) {
 		if (mlx_cards[i] == PCI_DEVICE_ID(dev->vdid))
 			return 1;
 	}
 	return 0;
 }

 /*
  * pci_probe_complete hook.
  *
  * Reallocate dma engines between stacks in PEC2 if a Mellanox card is
  * found on the shared slot, as it is required to get good GPU direct
  * performance.
  */
 static void witherspoon_pci_probe_complete(void)
 {
 	struct phb *phb;

 	for_each_phb(phb) {
 		struct phb4 *p;

 		/* Only real PHB4s qualify; the virtual PHBs are skipped */
 		if (phb->phb_type == phb_type_pcie_v4) {
 			p = phb_to_phb4(phb);
 			/* Keep only the first PHB on PEC2 */
 			if (p->index == 3 &&
 			    pci_walk_dev(phb, NULL, check_mlx_cards, NULL))
 				phb4_pec2_dma_engine_realloc(p);
 		}
 	}
 }

 /*
  * Set the brick index and device type of the NPU device whose link_index
  * equals @link_index. Logs an error and changes nothing when @npu has no
  * such device.
  */
 static void set_link_details(struct npu2 *npu, uint32_t link_index,
 			     uint32_t brick_index, enum npu2_dev_type type)
 {
 	struct npu2_dev *dev = NULL;

 	for (int i = 0; i < npu->total_devices; i++) {
 		if (npu->devices[i].link_index == link_index) {
 			dev = &npu->devices[i];
 			break;
 		}
 	}
 	if (!dev) {
 		/* link_index is unsigned: %u, not %d */
 		prlog(PR_ERR, "PLAT: Could not find NPU link index %u\n",
 		      link_index);
 		return;
 	}
 	dev->brick_index = brick_index;
 	dev->type = type;
 }

 /*
  * npu2_device_detect hook: decide what each link of @npu is used for.
  *
  * On anything but Redbud every device is simply marked NVLink. On Redbud
  * the GPU presence reported by occ_get_gpu_presence() is combined with one
  * byte read from the I2C device at platform.ocapi->i2c_presence_addr:
  * bit 0 selects OpenCAPI for GPU#0, bit 1 for GPU#1. The links of a slot
  * without a GPU are left untouched, as is everything on an I2C error.
  */
 static void witherspoon_npu2_device_detect(struct npu2 *npu)
 {
 	struct proc_chip *chip;
 	struct dt_node *port;
 	uint64_t port_id = 0;
 	char wanted[17];
 	uint8_t pins;
 	bool has_gpu0, has_gpu1;
 	int rc;

 	if (witherspoon_type != WITHERSPOON_TYPE_REDBUD) {
 		prlog(PR_DEBUG, "PLAT: Setting all NPU links to NVLink, OpenCAPI only supported on Redbud\n");
 		for (int i = 0; i < npu->total_devices; i++)
 			npu->devices[i].type = NPU2_DEV_TYPE_NVLINK;
 		return;
 	}
 	assert(npu->total_devices == 6);

 	chip = get_chip(npu->chip_id);

 	/* Find the OPAL id of the I2C port whose name matches this chip */
 	snprintf(wanted, sizeof(wanted), "p8_%08x_e%dp%d",
 		 chip->id, platform.ocapi->i2c_engine,
 		 platform.ocapi->i2c_port);
 	dt_for_each_compatible(dt_root, port, "ibm,power9-i2c-port") {
 		if (!streq(wanted, dt_prop_get(port, "ibm,port-name")))
 			continue;
 		port_id = dt_prop_get_u32(port, "ibm,opal-id");
 		break;
 	}

 	if (!port_id) {
 		prlog(PR_ERR, "PLAT: Could not find NPU presence I2C port\n");
 		return;
 	}

 	has_gpu0 = occ_get_gpu_presence(chip, 0);
 	if (has_gpu0)
 		prlog(PR_DEBUG, "PLAT: Chip %d GPU#0 slot present\n", chip->id);

 	has_gpu1 = occ_get_gpu_presence(chip, 1);
 	if (has_gpu1)
 		prlog(PR_DEBUG, "PLAT: Chip %d GPU#1 slot present\n", chip->id);

 	/*
 	 * The following I2C ops generate errors if no device is
 	 * present on any SXM2 slot. Since it's useless, let's skip it
 	 */
 	if (!(has_gpu0 || has_gpu1))
 		return;

 	/* Set pins to input, then read the presence value back */
 	pins = 0xff;
 	rc = i2c_request_send(port_id,
 			      platform.ocapi->i2c_presence_addr, SMBUS_WRITE, 3,
 			      1, &pins, 1, 120);
 	if (!rc) {
 		pins = 0x00;
 		rc = i2c_request_send(port_id,
 				      platform.ocapi->i2c_presence_addr,
 				      SMBUS_READ, 0,
 				      1, &pins, 1, 120);
 	}
 	if (rc) {
 		prlog(PR_ERR, "PLAT: NPU device type detection failed, rc=%d\n", rc);
 		return;
 	}

 	if (has_gpu0) {
 		if (!(pins & (1 << 0))) {
 			prlog(PR_DEBUG, "PLAT: Chip %d GPU#0 is NVLink\n",
 			      chip->id);
 			set_link_details(npu, 0, 0, NPU2_DEV_TYPE_NVLINK);
 			set_link_details(npu, 1, 1, NPU2_DEV_TYPE_NVLINK);
 			set_link_details(npu, 2, 2, NPU2_DEV_TYPE_NVLINK);
 		} else {
 			prlog(PR_DEBUG, "PLAT: Chip %d GPU#0 is OpenCAPI\n",
 			      chip->id);
 			/*
 			 * On witherspoon, bricks 2 and 3 are connected to
 			 * the lanes matching links 0 and 1 in OpenCAPI mode.
 			 */
 			set_link_details(npu, 1, 3, NPU2_DEV_TYPE_OPENCAPI);
 			/* We currently don't support using the second link */
 			set_link_details(npu, 0, 2, NPU2_DEV_TYPE_UNKNOWN);
 		}
 	}

 	if (has_gpu1) {
 		if (!(pins & (1 << 1))) {
 			prlog(PR_DEBUG, "PLAT: Chip %d GPU#1 is NVLink\n",
 			      chip->id);
 			set_link_details(npu, 3, 3, NPU2_DEV_TYPE_NVLINK);
 			set_link_details(npu, 4, 4, NPU2_DEV_TYPE_NVLINK);
 			set_link_details(npu, 5, 5, NPU2_DEV_TYPE_NVLINK);
 		} else {
 			prlog(PR_DEBUG, "PLAT: Chip %d GPU#1 is OpenCAPI\n",
 			      chip->id);
 			set_link_details(npu, 4, 4, NPU2_DEV_TYPE_OPENCAPI);
 			/* We currently don't support using the second link */
 			set_link_details(npu, 5, 5, NPU2_DEV_TYPE_UNKNOWN);
 		}
 	}
 }

 /*
  * Map a (chip, brick) pair to its OpenCAPI slot label.
  *
  * Only bricks 3 and 4 have labels: "OPENCAPI-GPU0"/"OPENCAPI-GPU1" on
  * chip 0 and "OPENCAPI-GPU3"/"OPENCAPI-GPU4" on any other chip. Returns
  * NULL for every other brick index.
  */
 static const char *witherspoon_ocapi_slot_label(uint32_t chip_id,
 						uint32_t brick_index)
 {
 	const bool first_chip = (chip_id == 0);

 	switch (brick_index) {
 	case 3:
 		return first_chip ? "OPENCAPI-GPU0" : "OPENCAPI-GPU3";
 	case 4:
 		return first_chip ? "OPENCAPI-GPU1" : "OPENCAPI-GPU4";
 	default:
 		return NULL;
 	}
 }

 /*
  * OpenCAPI platform description, hooked up through the .ocapi member of
  * the platform declaration. i2c_engine/i2c_port select the I2C port that
  * witherspoon_npu2_device_detect() looks up by name, and
  * i2c_presence_addr is the I2C device it reads the presence byte from.
  * NOTE(review): the reset fields are not used in this file; presumably
  * the generic OpenCAPI code consumes them - confirm.
  */
 static const struct platform_ocapi witherspoon_ocapi = {
        .i2c_engine          = 1,
        .i2c_port            = 4,
        .odl_phy_swap        = false,
        .i2c_reset_addr      = 0x20,
        /*
 	* Witherspoon uses SXM2 connectors, carrying 2 OCAPI links
 	* over a single connector - hence each pair of bricks shares
 	* the same pin for resets (bit 0 for bricks 2/3, bit 1 for
 	* bricks 4/5). We currently only support using bricks 3 and 4,
 	* among other reasons because we can't handle a reset on one
 	* link causing the other link to reset as well.
 	*/
        .i2c_reset_brick2    = 1 << 0,
        .i2c_reset_brick3    = 1 << 0,
        .i2c_reset_brick4    = 1 << 1,
        .i2c_reset_brick5    = 1 << 1,
        .i2c_presence_addr   = 0x20,
        /* unused, we do this in custom presence detect */
        .i2c_presence_brick2 = 0,
        .i2c_presence_brick3 = 0,
        .i2c_presence_brick4 = 0,
        .i2c_presence_brick5 = 0,
        .ocapi_slot_label    = witherspoon_ocapi_slot_label,
 };

 /*
  * Parse a slot label of the exact form "GPU<decimal digits>".
  *
  * Returns the GPU number, or -1 when @slot is NULL, does not start with
  * "GPU", has no digits, has trailing characters, or does not fit an int.
  */
 static int gpu_slot_to_num(const char *slot)
 {
 	const char *digits;
 	char *end = NULL;
 	long num;

 	if (!slot)
 		return -1;

 	/* strncmp() stops at the NUL, so short labels are never over-read */
 	if (strncmp(slot, "GPU", 3))
 		return -1;

 	/*
 	 * strtol() silently accepts leading blanks and a sign; insist on a
 	 * digit so that labels such as "GPU-3" or "GPU 1" are rejected
 	 * instead of producing a negative or unexpected index.
 	 */
 	digits = slot + 3;
 	if (*digits < '0' || *digits > '9')
 		return -1;

 	num = strtol(digits, &end, 10);
 	/* Reject trailing junk and values that would be truncated by int */
 	if (*end || num > 0x7fffffffL)
 		return -1;

 	return (int)num;
 }

 /*
  * Add "ibm,nvlink-peers" properties to the GPU nodes behind @npuphb.
  *
  * GPU device nodes are gathered in g[], indexed by their "GPUn" slot
  * number relative to the lowest one seen on this NPU; NVLink bridge nodes
  * are gathered in n[], indexed by brick index. The phandles are then
  * written out following the per-variant wiring tables. Nothing is done
  * for an unknown Witherspoon variant.
  *
  * A device only contributes to g[] when its label parses as "GPUn", its
  * relative index fits g[], and a GPU PCI device is bound to it; this
  * keeps a stray label or an unbound link from writing outside g[] or
  * dereferencing a NULL pointer.
  */
 static void npu2_phb_nvlink_dt(struct phb *npuphb)
 {
 	struct dt_node *g[3] = { NULL }; /* Current maximum 3 GPUs per 1 NPU */
 	struct dt_node *n[6] = { NULL };
 	int max_gpus, i, gpuid, first, last;
 	struct npu2 *npu2_phb = phb_to_npu2_nvlink(npuphb);
 	struct pci_device *npd;

 	switch (witherspoon_type) {
 	case WITHERSPOON_TYPE_REDBUD:
 		max_gpus = 4;
 		break;
 	case WITHERSPOON_TYPE_SEQUOIA:
 		max_gpus = 6;
 		break;
 	default:
 		/* witherspoon_probe() already reported missing support */
 		return;
 	}

 	/* Find the indexes of GPUs connected to this NPU */
 	for (i = 0, first = max_gpus, last = 0; i < npu2_phb->total_devices;
 			++i) {
 		gpuid = gpu_slot_to_num(npu2_phb->devices[i].nvlink.slot_label);
 		if (gpuid < 0)
 			continue;
 		if (gpuid > last)
 			last = gpuid;
 		if (gpuid < first)
 			first = gpuid;
 	}

 	/* Either no "GPUx" slots found or they are not consecutive, abort */
 	if (!last || last + 1 - first > max_gpus)
 		return;

 	/* Collect GPU device nodes, sorted by an index from "GPUn" */
 	for (i = 0; i < npu2_phb->total_devices; ++i) {
 		gpuid = gpu_slot_to_num(npu2_phb->devices[i].nvlink.slot_label);

 		/*
 		 * gpuid >= first also rejects the -1 "no GPU label" result,
 		 * since first is never negative at this point.
 		 */
 		if (gpuid >= first &&
 		    gpuid - first < (int)ARRAY_SIZE(g) &&
 		    npu2_phb->devices[i].nvlink.pd)
 			g[gpuid - first] = npu2_phb->devices[i].nvlink.pd->dn;

 		/* Collect NVLink bridge nodes too, for their phandles */
 		list_for_each(&npuphb->devices, npd, link) {
 			if (npd->bdfn == npu2_phb->devices[i].bdfn) {
 				assert(npu2_phb->devices[i].brick_index <
 						ARRAY_SIZE(n));
 				n[npu2_phb->devices[i].brick_index] = npd->dn;
 			}
 		}
 	}

 	/*
 	 * Store interconnect phandles in the device tree.
 	 * The mapping is from Witherspoon_Design_Workbook_v1.7_19June2018.pdf,
 	 * pages 39 (Sequoia), 40 (Redbud):
 	 *   Figure 16: NVLink wiring diagram for planar with 6 GPUs
 	 *   Figure 17: NVLink wiring diagram for planar with 4 GPUs
 	 */
 #define PEERPH(g) 	((g)?(g)->phandle:0)
 	switch (witherspoon_type) {
 	case WITHERSPOON_TYPE_REDBUD:
 		if (g[0])
 			dt_add_property_cells(g[0], "ibm,nvlink-peers",
 					PEERPH(g[1]), PEERPH(n[0]),
 					PEERPH(g[1]), PEERPH(n[1]),
 					PEERPH(g[1]), PEERPH(n[2]));
 		if (g[1])
 			dt_add_property_cells(g[1], "ibm,nvlink-peers",
 					PEERPH(g[0]), PEERPH(n[3]),
 					PEERPH(g[0]), PEERPH(n[4]),
 					PEERPH(g[0]), PEERPH(n[5]));
 		break;
 	case WITHERSPOON_TYPE_SEQUOIA:
 		if (g[0])
 			dt_add_property_cells(g[0], "ibm,nvlink-peers",
 					PEERPH(g[1]), PEERPH(n[0]),
 					PEERPH(g[2]), PEERPH(g[2]),
 					PEERPH(g[1]), PEERPH(n[1]));
 		if (g[1])
 			dt_add_property_cells(g[1], "ibm,nvlink-peers",
 					PEERPH(g[0]), PEERPH(n[2]),
 					PEERPH(g[2]), PEERPH(g[2]),
 					PEERPH(g[0]), PEERPH(n[3]));
 		if (g[2])
 			dt_add_property_cells(g[2], "ibm,nvlink-peers",
 					PEERPH(g[1]), PEERPH(g[0]),
 					PEERPH(g[1]), PEERPH(n[4]),
 					PEERPH(g[0]), PEERPH(n[5]));
 		break;
 	default:
 		break;
 	}
 #undef PEERPH
 }

 /*
  * finalise_dt hook; does nothing when @is_reboot is set.
  *
  * First adds the NVLink peer properties for every NPU2 PHB, then disables
  * the i2cm@a1000/i2c-bus@4 port of each chip on which none of GPU slots
  * 0..2 is reported present.
  */
 static void witherspoon_finalise_dt(bool is_reboot)
 {
 	struct dt_node *node;
 	struct proc_chip *chip;

 	if (is_reboot)
 		return;

 	dt_for_each_compatible(dt_root, node, "ibm,power9-npu-pciex") {
 		u32 phb_id = dt_prop_get_cell(node, "ibm,opal-phbid", 1);
 		struct phb *npu_phb = pci_get_phb(phb_id);

 		if (npu_phb && npu_phb->phb_type == phb_type_npu_v2)
 			npu2_phb_nvlink_dt(npu_phb);
 	}

 	/*
 	 * The I2C bus used to talk to the GPUs has a 750K pullup
 	 * which is way too big. If there are no GPUs connected to the
 	 * chip, all I2C transactions fail with an Arb loss error since
 	 * SCL/SDA don't return to the idle state fast enough. Disable
 	 * the port to squash the errors.
 	 */
 	for (chip = next_chip(NULL); chip; chip = next_chip(chip)) {
 		bool gpu_found = false;
 		int slot;

 		node = dt_find_by_path(chip->devnode, "i2cm@a1000/i2c-bus@4");
 		if (!node)
 			continue;

 		/* All three slots are always queried, as before */
 		for (slot = 0; slot < 3; slot++) {
 			if (occ_get_gpu_presence(chip, slot))
 				gpu_found = true;
 		}
 		if (gpu_found)
 			continue;

 		dt_check_del_prop(node, "status");
 		dt_add_property_string(node, "status", "disabled");
 	}
 }

 /*
  * secvar_init hook: start secure variable support with the
  * secboot_tpm_driver storage driver and the edk2_compatible_v1 backend,
  * returning whatever secvar_main() reports.
  */
 static int witherspoon_secvar_init(void)
 {
 	int rc = secvar_main(secboot_tpm_driver, edk2_compatible_v1);

 	return rc;
 }

 /*
  * Platform descriptor for Witherspoon. The witherspoon_* hooks are defined
  * in this file; every other hook and object referenced here is defined
  * elsewhere.
  *
  * NOTE(review): the previous comment here read "The only difference
  * between these is the PCI slot handling", but only one platform is
  * declared in this file - presumably a leftover; confirm.
  */

 DECLARE_PLATFORM(witherspoon) = {
 	.name			= "Witherspoon",
 	.probe			= witherspoon_probe,
 	.init			= astbmc_init,
 	.pre_pci_fixup		= witherspoon_shared_slot_fixup,
 	.pci_probe_complete	= witherspoon_pci_probe_complete,
 	.start_preload_resource	= flash_start_preload_resource,
 	.resource_loaded	= flash_resource_loaded,
 	.bmc			= &bmc_plat_ast2500_openbmc,
 	.cec_power_down         = astbmc_ipmi_power_down,
 	.cec_reboot             = astbmc_ipmi_reboot,
 	.elog_commit		= ipmi_elog_commit,
 	.finalise_dt		= witherspoon_finalise_dt,
 	.exit			= astbmc_exit,
 	.terminate		= ipmi_terminate,

 	/* PCI slots come from the device tree; NPU2/OpenCAPI use the hooks above */
 	.pci_get_slot_info	= dt_slot_get_slot_info,
 	.ocapi                  = &witherspoon_ocapi,
 	.npu2_device_detect	= witherspoon_npu2_device_detect,
 	.op_display		= op_display_lpc,
 	.secvar_init		= witherspoon_secvar_init,
 };
	// SPDX-License-Identifier: Apache-2.0 OR GPL-2.0-or-later
	/* Copyright 2017-2019 IBM Corp. */

	#include <skiboot.h>
	#include <device.h>
	#include <console.h>
	#include <chip.h>
	#include <ipmi.h>
	#include <psi.h>
	#include <npu-regs.h>
	#include <xscom.h>
	#include <xscom-p9-regs.h>
	#include <timebase.h>
	#include <pci.h>
	#include <pci-slot.h>
	#include <phb4.h>
	#include <npu2.h>
	#include <occ.h>
	#include <i2c.h>
	#include <secvar.h>

	#include "astbmc.h"
	#include "ast.h"

	/*
	 * Witherspoon planar variant. Set by witherspoon_probe() from the highest
	 * "ibm,npu-group-id" found on the "ibm,npu-link" nodes, then consulted by
	 * the NPU2 device detection and the NVLink device-tree code in this file.
	 */
	static enum {
	WITHERSPOON_TYPE_UNKNOWN,	/* any other group id; NVLink peer wiring is skipped */
	WITHERSPOON_TYPE_SEQUOIA,	/* highest group id 2; treated as the 6-GPU planar */
	WITHERSPOON_TYPE_REDBUD		/* highest group id 1; treated as the 4-GPU planar */
	} witherspoon_type;

	/*
	 * HACK: Hostboot doesn't export the correct data for the system VPD EEPROM
	 *       on this system, so the node is patched by hand: its "compatible"
	 *       and "label" properties are replaced with known-good values.
	 *       Nothing happens when the EEPROM node is absent.
	 */
	static void vpd_dt_fixup(void)
	{
		static const char eeprom_path[] =
			"/xscom@603fc00000000/i2cm@a2000/i2c-bus@0/eeprom@50";
		struct dt_node *eeprom = dt_find_by_path(dt_root, eeprom_path);

		if (!eeprom)
			return;

		/* Drop whatever Hostboot provided before adding the fixed value */
		dt_check_del_prop(eeprom, "compatible");
		dt_add_property_string(eeprom, "compatible", "atmel,24c512");

		dt_check_del_prop(eeprom, "label");
		dt_add_property_string(eeprom, "label", "system-vpd");
	}

	/*
	 * Make sure every "ibm,xscom" node has an i2c-bus@4 child below its
	 * i2cm@a1000 engine (the bus used for the OCAPI reset, per the log
	 * message). Chips without that engine are reported and skipped; a bus
	 * node that already exists is left untouched.
	 */
	static void witherspoon_create_ocapi_i2c_bus(void)
	{
		/* All three are node pointers; they are assigned from lookups */
		struct dt_node *xscom, *i2cm, *i2c_bus;

		prlog(PR_DEBUG, "OCAPI: Adding I2C bus device node for OCAPI reset\n");
		dt_for_each_compatible(dt_root, xscom, "ibm,xscom") {
			i2cm = dt_find_by_name(xscom, "i2cm@a1000");
			if (!i2cm) {
				prlog(PR_ERR, "OCAPI: Failed to add I2C bus device node\n");
				continue;
			}

			/* Nothing to do when the port already exists */
			if (dt_find_by_name(i2cm, "i2c-bus@4"))
				continue;

			i2c_bus = dt_new_addr(i2cm, "i2c-bus", 4);
			dt_add_property_cells(i2c_bus, "reg", 4);
			/* 0x61a80 == 400000 */
			dt_add_property_cells(i2c_bus, "bus-frequency", 0x61a80);
			dt_add_property_strings(i2c_bus, "compatible",
						"ibm,opal-i2c", "ibm,power8-i2c-port",
						"ibm,power9-i2c-port");
		}
	}

	/*
	 * Platform probe hook.
	 *
	 * Returns false unless the device-tree root is compatible with
	 * "ibm,witherspoon". Otherwise runs the early BMC/UART setup and the
	 * device-tree fixups, derives witherspoon_type from the highest
	 * "ibm,npu-group-id" seen on the "ibm,npu-link" nodes, and returns true.
	 */
	static bool witherspoon_probe(void)
	{
		struct dt_node *link;
		int max_group = 0;
		int group;

		if (!dt_node_is_compatible(dt_root, "ibm,witherspoon"))
			return false;

		/* Lot of common early inits here */
		astbmc_early_init();

		/* Setup UART for use by OPAL (Linux hvc) */
		uart_set_console_policy(UART_CONSOLE_OPAL);

		vpd_dt_fixup();

		witherspoon_create_ocapi_i2c_bus();

		/* The largest GPU group id tells the planar variants apart */
		dt_for_each_compatible(dt_root, link, "ibm,npu-link") {
			group = dt_prop_get_u32(link, "ibm,npu-group-id");
			if (group > max_group)
				max_group = group;
		}

		if (max_group == 1) {
			witherspoon_type = WITHERSPOON_TYPE_REDBUD;
		} else if (max_group == 2) {
			witherspoon_type = WITHERSPOON_TYPE_SEQUOIA;
		} else {
			witherspoon_type = WITHERSPOON_TYPE_UNKNOWN;
			prlog(PR_NOTICE, "PLAT: Unknown Witherspoon variant detected\n");
		}

		return true;
	}

	static void phb4_activate_shared_slot_witherspoon(struct proc_chip *chip)
	{
	uint64_t val;

	/*
	* Shared slot activation is done by raising a GPIO line on the
	* chip with the secondary slot. It will somehow activate the
	* sideband signals between the slots.
	* Need to wait 100us for stability.
	*/
	xscom_read(chip->id, P9_GPIO_DATA_OUT_ENABLE, &val);
	val \|= PPC_BIT(2);
	xscom_write(chip->id, P9_GPIO_DATA_OUT_ENABLE, val);

	xscom_read(chip->id, P9_GPIO_DATA_OUT, &val);
	val \|= PPC_BIT(2);
	xscom_write(chip->id, P9_GPIO_DATA_OUT, val);
	time_wait_us(100);
	prlog(PR_INFO, "Shared PCI slot activated\n");
	}

	static void witherspoon_shared_slot_fixup(void)
	{
	struct pci_slot slot0, slot1;
	struct proc_chip chip0, chip1;
	uint8_t p0 = 0, p1 = 0;

	/*
	* Detect if a x16 card is present on the shared slot and
	* do some extra configuration if it is.
	*
	* The shared slot, a.k.a "Slot 2" in the documentation, is
	* connected to PEC2 phb index 3 on both chips. From skiboot,
	* it looks like two x8 slots, each with its own presence bit.
	*
	* Here is the matrix of possibilities for the presence bits:
	*
	* slot0 presence slot1 presence
	* 0 0 => no card
	* 1 0 => x8 or less card detected
	* 1 1 => x16 card detected
	* 0 1 => invalid combination
	*
	* We only act if a x16 card is detected ('1 1' combination above).
	*
	* One issue is that we don't really know if it is a
	* shared-slot-compatible card (such as Mellanox CX5) or
	* a 'normal' x16 PCI card. We activate the shared slot in both cases,
	* as it doesn't seem to hurt.
	*
	* If the card is a normal x16 PCI card, the link won't train on the
	* second slot (nothing to do with the shared slot activation), the
	* procedure will timeout, thus adding some delay to the boot time.
	* Therefore the recommendation is that we shouldn't use a normal
	* x16 card on the shared slot of a witherspoon.
	*
	* Plugging a x8 or less adapter on the shared slot should work
	* like any other physical slot.
	*/
	chip0 = next_chip(NULL);
	chip1 = next_chip(chip0);
	if (!chip1 \|\| next_chip(chip1)) {
	prlog(PR_WARNING,
	"PLAT: Can't find second chip, "
	"skipping PCIe shared slot detection\n");
	return;
	}

	/* the shared slot is connected to PHB3 on both chips */
	slot0 = pci_slot_find(phb4_get_opal_id(chip0->id, 3));
	slot1 = pci_slot_find(phb4_get_opal_id(chip1->id, 3));
	if (slot0 && slot1) {
	if (slot0->ops.get_presence_state)
	slot0->ops.get_presence_state(slot0, &p0);
	if (slot1->ops.get_presence_state)
	slot1->ops.get_presence_state(slot1, &p1);
	if (p0 == 1 && p1 == 1) {
	phb4_activate_shared_slot_witherspoon(chip1);
	slot0->peer_slot = slot1;
	slot1->peer_slot = slot0;
	}
	}
	}

	/*
	 * pci_walk_dev() callback: returns 1 when @dev is one of the listed
	 * Mellanox ConnectX adapters (vendor 0x15b3), 0 otherwise. @phb and
	 * @userdata are unused.
	 *
	 * Both @phb and @dev are pointers (dev is dereferenced with ->). The
	 * device-id table is static const so it is not rebuilt on the stack for
	 * every device visited by the walk.
	 */
	static int check_mlx_cards(struct phb *phb __unused, struct pci_device *dev,
				   void *userdata __unused)
	{
		static const uint16_t mlx_cards[] = {
			0x1017, /* ConnectX-5 */
			0x1019, /* ConnectX-5 Ex */
			0x101b, /* ConnectX-6 */
			0x101d, /* ConnectX-6 Dx */
			0x101f, /* ConnectX-6 Lx */
			0x1021, /* ConnectX-7 */
		};
		size_t i;

		if (PCI_VENDOR_ID(dev->vdid) != 0x15b3) /* Mellanox */
			return 0;

		for (i = 0; i < ARRAY_SIZE(mlx_cards); i++) {
			if (mlx_cards[i] == PCI_DEVICE_ID(dev->vdid))
				return 1;
		}
		return 0;
	}

	/*
	 * pci_probe_complete hook.
	 *
	 * Reallocate dma engines between stacks in PEC2 if a Mellanox card is
	 * found on the shared slot, as it is required to get good GPU direct
	 * performance.
	 */
	static void witherspoon_pci_probe_complete(void)
	{
		struct phb *phb;

		for_each_phb(phb) {
			struct phb4 *p;

			/* Only real PHB4s qualify; the virtual PHBs are skipped */
			if (phb->phb_type == phb_type_pcie_v4) {
				p = phb_to_phb4(phb);
				/* Keep only the first PHB on PEC2 */
				if (p->index == 3 &&
				    pci_walk_dev(phb, NULL, check_mlx_cards, NULL))
					phb4_pec2_dma_engine_realloc(p);
			}
		}
	}

	/*
	 * Set the brick index and device type of the NPU device whose link_index
	 * equals @link_index. Logs an error and changes nothing when @npu has no
	 * such device.
	 */
	static void set_link_details(struct npu2 *npu, uint32_t link_index,
				     uint32_t brick_index, enum npu2_dev_type type)
	{
		struct npu2_dev *dev = NULL;

		for (int i = 0; i < npu->total_devices; i++) {
			if (npu->devices[i].link_index == link_index) {
				dev = &npu->devices[i];
				break;
			}
		}
		if (!dev) {
			/* link_index is unsigned: %u, not %d */
			prlog(PR_ERR, "PLAT: Could not find NPU link index %u\n",
			      link_index);
			return;
		}
		dev->brick_index = brick_index;
		dev->type = type;
	}

	/*
	 * npu2_device_detect hook: decide what each link of @npu is used for.
	 *
	 * On anything but Redbud every device is simply marked NVLink. On Redbud
	 * the GPU presence reported by occ_get_gpu_presence() is combined with one
	 * byte read from the I2C device at platform.ocapi->i2c_presence_addr:
	 * bit 0 selects OpenCAPI for GPU#0, bit 1 for GPU#1. The links of a slot
	 * without a GPU are left untouched, as is everything on an I2C error.
	 */
	static void witherspoon_npu2_device_detect(struct npu2 *npu)
	{
		struct proc_chip *chip;
		struct dt_node *port;
		uint64_t port_id = 0;
		char wanted[17];
		uint8_t pins;
		bool has_gpu0, has_gpu1;
		int rc;

		if (witherspoon_type != WITHERSPOON_TYPE_REDBUD) {
			prlog(PR_DEBUG, "PLAT: Setting all NPU links to NVLink, OpenCAPI only supported on Redbud\n");
			for (int i = 0; i < npu->total_devices; i++)
				npu->devices[i].type = NPU2_DEV_TYPE_NVLINK;
			return;
		}
		assert(npu->total_devices == 6);

		chip = get_chip(npu->chip_id);

		/* Find the OPAL id of the I2C port whose name matches this chip */
		snprintf(wanted, sizeof(wanted), "p8_%08x_e%dp%d",
			 chip->id, platform.ocapi->i2c_engine,
			 platform.ocapi->i2c_port);
		dt_for_each_compatible(dt_root, port, "ibm,power9-i2c-port") {
			if (!streq(wanted, dt_prop_get(port, "ibm,port-name")))
				continue;
			port_id = dt_prop_get_u32(port, "ibm,opal-id");
			break;
		}

		if (!port_id) {
			prlog(PR_ERR, "PLAT: Could not find NPU presence I2C port\n");
			return;
		}

		has_gpu0 = occ_get_gpu_presence(chip, 0);
		if (has_gpu0)
			prlog(PR_DEBUG, "PLAT: Chip %d GPU#0 slot present\n", chip->id);

		has_gpu1 = occ_get_gpu_presence(chip, 1);
		if (has_gpu1)
			prlog(PR_DEBUG, "PLAT: Chip %d GPU#1 slot present\n", chip->id);

		/*
		 * The following I2C ops generate errors if no device is
		 * present on any SXM2 slot. Since it's useless, let's skip it
		 */
		if (!(has_gpu0 || has_gpu1))
			return;

		/* Set pins to input, then read the presence value back */
		pins = 0xff;
		rc = i2c_request_send(port_id,
				      platform.ocapi->i2c_presence_addr, SMBUS_WRITE, 3,
				      1, &pins, 1, 120);
		if (!rc) {
			pins = 0x00;
			rc = i2c_request_send(port_id,
					      platform.ocapi->i2c_presence_addr,
					      SMBUS_READ, 0,
					      1, &pins, 1, 120);
		}
		if (rc) {
			prlog(PR_ERR, "PLAT: NPU device type detection failed, rc=%d\n", rc);
			return;
		}

		if (has_gpu0) {
			if (!(pins & (1 << 0))) {
				prlog(PR_DEBUG, "PLAT: Chip %d GPU#0 is NVLink\n",
				      chip->id);
				set_link_details(npu, 0, 0, NPU2_DEV_TYPE_NVLINK);
				set_link_details(npu, 1, 1, NPU2_DEV_TYPE_NVLINK);
				set_link_details(npu, 2, 2, NPU2_DEV_TYPE_NVLINK);
			} else {
				prlog(PR_DEBUG, "PLAT: Chip %d GPU#0 is OpenCAPI\n",
				      chip->id);
				/*
				 * On witherspoon, bricks 2 and 3 are connected to
				 * the lanes matching links 0 and 1 in OpenCAPI mode.
				 */
				set_link_details(npu, 1, 3, NPU2_DEV_TYPE_OPENCAPI);
				/* We currently don't support using the second link */
				set_link_details(npu, 0, 2, NPU2_DEV_TYPE_UNKNOWN);
			}
		}

		if (has_gpu1) {
			if (!(pins & (1 << 1))) {
				prlog(PR_DEBUG, "PLAT: Chip %d GPU#1 is NVLink\n",
				      chip->id);
				set_link_details(npu, 3, 3, NPU2_DEV_TYPE_NVLINK);
				set_link_details(npu, 4, 4, NPU2_DEV_TYPE_NVLINK);
				set_link_details(npu, 5, 5, NPU2_DEV_TYPE_NVLINK);
			} else {
				prlog(PR_DEBUG, "PLAT: Chip %d GPU#1 is OpenCAPI\n",
				      chip->id);
				set_link_details(npu, 4, 4, NPU2_DEV_TYPE_OPENCAPI);
				/* We currently don't support using the second link */
				set_link_details(npu, 5, 5, NPU2_DEV_TYPE_UNKNOWN);
			}
		}
	}

	/*
	 * Map a (chip, brick) pair to its OpenCAPI slot label.
	 *
	 * Only bricks 3 and 4 have labels: "OPENCAPI-GPU0"/"OPENCAPI-GPU1" on
	 * chip 0 and "OPENCAPI-GPU3"/"OPENCAPI-GPU4" on any other chip. Returns
	 * NULL for every other brick index.
	 */
	static const char *witherspoon_ocapi_slot_label(uint32_t chip_id,
							uint32_t brick_index)
	{
		const bool first_chip = (chip_id == 0);

		switch (brick_index) {
		case 3:
			return first_chip ? "OPENCAPI-GPU0" : "OPENCAPI-GPU3";
		case 4:
			return first_chip ? "OPENCAPI-GPU1" : "OPENCAPI-GPU4";
		default:
			return NULL;
		}
	}

	/*
	 * OpenCAPI platform description, hooked up through the .ocapi member of
	 * the platform declaration. i2c_engine/i2c_port select the I2C port that
	 * witherspoon_npu2_device_detect() looks up by name, and
	 * i2c_presence_addr is the I2C device it reads the presence byte from.
	 * NOTE(review): the reset fields are not used in this file; presumably
	 * the generic OpenCAPI code consumes them - confirm.
	 */
	static const struct platform_ocapi witherspoon_ocapi = {
	.i2c_engine = 1,
	.i2c_port = 4,
	.odl_phy_swap = false,
	.i2c_reset_addr = 0x20,
	/*
	 * Witherspoon uses SXM2 connectors, carrying 2 OCAPI links
	 * over a single connector - hence each pair of bricks shares
	 * the same pin for resets (bit 0 for bricks 2/3, bit 1 for
	 * bricks 4/5). We currently only support using bricks 3 and 4,
	 * among other reasons because we can't handle a reset on one
	 * link causing the other link to reset as well.
	 */
	.i2c_reset_brick2 = 1 << 0,
	.i2c_reset_brick3 = 1 << 0,
	.i2c_reset_brick4 = 1 << 1,
	.i2c_reset_brick5 = 1 << 1,
	.i2c_presence_addr = 0x20,
	/* unused, we do this in custom presence detect */
	.i2c_presence_brick2 = 0,
	.i2c_presence_brick3 = 0,
	.i2c_presence_brick4 = 0,
	.i2c_presence_brick5 = 0,
	.ocapi_slot_label = witherspoon_ocapi_slot_label,
	};

	/*
	 * Parse a slot label of the exact form "GPU<decimal digits>".
	 *
	 * Returns the GPU number, or -1 when @slot is NULL, does not start with
	 * "GPU", has no digits, has trailing characters, or does not fit an int.
	 */
	static int gpu_slot_to_num(const char *slot)
	{
		const char *digits;
		char *end = NULL;
		long num;

		if (!slot)
			return -1;

		/* strncmp() stops at the NUL, so short labels are never over-read */
		if (strncmp(slot, "GPU", 3))
			return -1;

		/*
		 * strtol() silently accepts leading blanks and a sign; insist on a
		 * digit so that labels such as "GPU-3" or "GPU 1" are rejected
		 * instead of producing a negative or unexpected index.
		 */
		digits = slot + 3;
		if (*digits < '0' || *digits > '9')
			return -1;

		num = strtol(digits, &end, 10);
		/* Reject trailing junk and values that would be truncated by int */
		if (*end || num > 0x7fffffffL)
			return -1;

		return (int)num;
	}

	static void npu2_phb_nvlink_dt(struct phb *npuphb)
	{
	struct dt_node g[3] = { NULL }; / Current maximum 3 GPUs per 1 NPU */
	struct dt_node *n[6] = { NULL };
	int max_gpus, i, gpuid, first, last;
	struct npu2 *npu2_phb = phb_to_npu2_nvlink(npuphb);
	struct pci_device *npd;

	switch (witherspoon_type) {
	case WITHERSPOON_TYPE_REDBUD:
	max_gpus = 4;
	break;
	case WITHERSPOON_TYPE_SEQUOIA:
	max_gpus = 6;
	break;
	default:
	/* witherspoon_probe() already reported missing support */
	return;
	}

	/* Find the indexes of GPUs connected to this NPU */
	for (i = 0, first = max_gpus, last = 0; i < npu2_phb->total_devices;
	++i) {
	gpuid = gpu_slot_to_num(npu2_phb->devices[i].nvlink.slot_label);
	if (gpuid < 0)
	continue;
	if (gpuid > last)
	last = gpuid;
	if (gpuid < first)
	first = gpuid;
	}

	/* Either no "GPUx" slots found or they are not consecutive, abort */
	if (!last \|\| last + 1 - first > max_gpus)
	return;

	/* Collect GPU device nodes, sorted by an index from "GPUn" */
	for (i = 0; i < npu2_phb->total_devices; ++i) {
	gpuid = gpu_slot_to_num(npu2_phb->devices[i].nvlink.slot_label);
	g[gpuid - first] = npu2_phb->devices[i].nvlink.pd->dn;

	/* Collect NVLink bridge nodes too, for their phandles */
	list_for_each(&npuphb->devices, npd, link) {
	if (npd->bdfn == npu2_phb->devices[i].bdfn) {
	assert(npu2_phb->devices[i].brick_index <
	ARRAY_SIZE(n));
	n[npu2_phb->devices[i].brick_index] = npd->dn;
	}
	}
	}

	/*
	* Store interconnect phandles in the device tree.
	* The mapping is from Witherspoon_Design_Workbook_v1.7_19June2018.pdf,
	* pages 39 (Sequoia), 40 (Redbud):
	* Figure 16: NVLink wiring diagram for planar with 6 GPUs
	* Figure 17: NVLink wiring diagram for planar with 4 GPUs
	*/
	#define PEERPH(g) ((g)?(g)->phandle:0)
	switch (witherspoon_type) {
	case WITHERSPOON_TYPE_REDBUD:
	if (g[0])
	dt_add_property_cells(g[0], "ibm,nvlink-peers",
	PEERPH(g[1]), PEERPH(n[0]),
	PEERPH(g[1]), PEERPH(n[1]),
	PEERPH(g[1]), PEERPH(n[2]));
	if (g[1])
	dt_add_property_cells(g[1], "ibm,nvlink-peers",
	PEERPH(g[0]), PEERPH(n[3]),
	PEERPH(g[0]), PEERPH(n[4]),
	PEERPH(g[0]), PEERPH(n[5]));
	break;
	case WITHERSPOON_TYPE_SEQUOIA:
	if (g[0])
	dt_add_property_cells(g[0], "ibm,nvlink-peers",
	PEERPH(g[1]), PEERPH(n[0]),
	PEERPH(g[2]), PEERPH(g[2]),
	PEERPH(g[1]), PEERPH(n[1]));
	if (g[1])
	dt_add_property_cells(g[1], "ibm,nvlink-peers",
	PEERPH(g[0]), PEERPH(n[2]),
	PEERPH(g[2]), PEERPH(g[2]),
	PEERPH(g[0]), PEERPH(n[3]));
	if (g[2])
	dt_add_property_cells(g[2], "ibm,nvlink-peers",
	PEERPH(g[1]), PEERPH(g[0]),
	PEERPH(g[1]), PEERPH(n[4]),
	PEERPH(g[0]), PEERPH(n[5]));
	break;
	default:
	break;
	}
	}

	/*
	 * finalise_dt hook; does nothing when @is_reboot is set.
	 *
	 * First adds the NVLink peer properties for every NPU2 PHB, then disables
	 * the i2cm@a1000/i2c-bus@4 port of each chip on which none of GPU slots
	 * 0..2 is reported present.
	 */
	static void witherspoon_finalise_dt(bool is_reboot)
	{
		struct dt_node *np;
		struct proc_chip *c;

		if (is_reboot)
			return;

		dt_for_each_compatible(dt_root, np, "ibm,power9-npu-pciex") {
			u32 opal_id = dt_prop_get_cell(np, "ibm,opal-phbid", 1);
			struct phb *npphb = pci_get_phb(opal_id);

			if (!npphb)
				continue;
			if (npphb->phb_type != phb_type_npu_v2)
				continue;
			npu2_phb_nvlink_dt(npphb);
		}

		/*
		 * The I2C bus used to talk to the GPUs has a 750K pullup
		 * which is way too big. If there are no GPUs connected to the
		 * chip, all I2C transactions fail with an Arb loss error since
		 * SCL/SDA don't return to the idle state fast enough. Disable
		 * the port to squash the errors.
		 */
		for (c = next_chip(NULL); c; c = next_chip(c)) {
			bool detected = false;
			int i;

			np = dt_find_by_path(c->devnode, "i2cm@a1000/i2c-bus@4");
			if (!np)
				continue;

			/* Accumulate presence over all three GPU slots */
			for (i = 0; i < 3; i++)
				detected |= occ_get_gpu_presence(c, i);

			if (!detected) {
				dt_check_del_prop(np, "status");
				dt_add_property_string(np, "status", "disabled");
			}
		}
	}

	/*
	 * secvar_init hook: start secure variable support with the
	 * secboot_tpm_driver storage driver and the edk2_compatible_v1 backend,
	 * returning whatever secvar_main() reports.
	 */
	static int witherspoon_secvar_init(void)
	{
		int rc = secvar_main(secboot_tpm_driver, edk2_compatible_v1);

		return rc;
	}

	/*
	 * Platform descriptor for Witherspoon. The witherspoon_* hooks are defined
	 * in this file; every other hook and object referenced here is defined
	 * elsewhere.
	 *
	 * NOTE(review): the previous comment here read "The only difference
	 * between these is the PCI slot handling", but only one platform is
	 * declared in this file - presumably a leftover; confirm.
	 */

	DECLARE_PLATFORM(witherspoon) = {
	.name = "Witherspoon",
	.probe = witherspoon_probe,
	.init = astbmc_init,
	.pre_pci_fixup = witherspoon_shared_slot_fixup,
	.pci_probe_complete = witherspoon_pci_probe_complete,
	.start_preload_resource = flash_start_preload_resource,
	.resource_loaded = flash_resource_loaded,
	.bmc = &bmc_plat_ast2500_openbmc,
	.cec_power_down = astbmc_ipmi_power_down,
	.cec_reboot = astbmc_ipmi_reboot,
	.elog_commit = ipmi_elog_commit,
	.finalise_dt = witherspoon_finalise_dt,
	.exit = astbmc_exit,
	.terminate = ipmi_terminate,

	/* PCI slots come from the device tree; NPU2/OpenCAPI use the hooks above */
	.pci_get_slot_info = dt_slot_get_slot_info,
	.ocapi = &witherspoon_ocapi,
	.npu2_device_detect = witherspoon_npu2_device_detect,
	.op_display = op_display_lpc,
	.secvar_init = witherspoon_secvar_init,
	};