1e65e175bSOded Gabbay // SPDX-License-Identifier: GPL-2.0 2e65e175bSOded Gabbay 3e65e175bSOded Gabbay /* 4e65e175bSOded Gabbay * Copyright 2016-2022 HabanaLabs, Ltd. 5e65e175bSOded Gabbay * All Rights Reserved. 6e65e175bSOded Gabbay */ 7e65e175bSOded Gabbay 8e65e175bSOded Gabbay #include "habanalabs.h" 9e65e175bSOded Gabbay #include "../include/common/hl_boot_if.h" 10e65e175bSOded Gabbay 11e65e175bSOded Gabbay #include <linux/firmware.h> 12e65e175bSOded Gabbay #include <linux/crc32.h> 13e65e175bSOded Gabbay #include <linux/slab.h> 14e65e175bSOded Gabbay #include <linux/ctype.h> 15e65e175bSOded Gabbay #include <linux/vmalloc.h> 16e65e175bSOded Gabbay 17e65e175bSOded Gabbay #include <trace/events/habanalabs.h> 18e65e175bSOded Gabbay 19e65e175bSOded Gabbay #define FW_FILE_MAX_SIZE 0x1400000 /* maximum size of 20MB */ 20e65e175bSOded Gabbay 21e65e175bSOded Gabbay static char *comms_cmd_str_arr[COMMS_INVLD_LAST] = { 22e65e175bSOded Gabbay [COMMS_NOOP] = __stringify(COMMS_NOOP), 23e65e175bSOded Gabbay [COMMS_CLR_STS] = __stringify(COMMS_CLR_STS), 24e65e175bSOded Gabbay [COMMS_RST_STATE] = __stringify(COMMS_RST_STATE), 25e65e175bSOded Gabbay [COMMS_PREP_DESC] = __stringify(COMMS_PREP_DESC), 26e65e175bSOded Gabbay [COMMS_DATA_RDY] = __stringify(COMMS_DATA_RDY), 27e65e175bSOded Gabbay [COMMS_EXEC] = __stringify(COMMS_EXEC), 28e65e175bSOded Gabbay [COMMS_RST_DEV] = __stringify(COMMS_RST_DEV), 29e65e175bSOded Gabbay [COMMS_GOTO_WFE] = __stringify(COMMS_GOTO_WFE), 30e65e175bSOded Gabbay [COMMS_SKIP_BMC] = __stringify(COMMS_SKIP_BMC), 31e65e175bSOded Gabbay [COMMS_PREP_DESC_ELBI] = __stringify(COMMS_PREP_DESC_ELBI), 32e65e175bSOded Gabbay }; 33e65e175bSOded Gabbay 34e65e175bSOded Gabbay static char *comms_sts_str_arr[COMMS_STS_INVLD_LAST] = { 35e65e175bSOded Gabbay [COMMS_STS_NOOP] = __stringify(COMMS_STS_NOOP), 36e65e175bSOded Gabbay [COMMS_STS_ACK] = __stringify(COMMS_STS_ACK), 37e65e175bSOded Gabbay [COMMS_STS_OK] = __stringify(COMMS_STS_OK), 38e65e175bSOded Gabbay [COMMS_STS_ERR] = __stringify(COMMS_STS_ERR), 39e65e175bSOded Gabbay [COMMS_STS_VALID_ERR] = __stringify(COMMS_STS_VALID_ERR), 40e65e175bSOded Gabbay [COMMS_STS_TIMEOUT_ERR] = __stringify(COMMS_STS_TIMEOUT_ERR), 41e65e175bSOded Gabbay }; 42e65e175bSOded Gabbay 43e65e175bSOded Gabbay static char *extract_fw_ver_from_str(const char *fw_str) 44e65e175bSOded Gabbay { 45e65e175bSOded Gabbay char *str, *fw_ver, *whitespace; 46e65e175bSOded Gabbay u32 ver_offset; 47e65e175bSOded Gabbay 48e65e175bSOded Gabbay fw_ver = kmalloc(VERSION_MAX_LEN, GFP_KERNEL); 49e65e175bSOded Gabbay if (!fw_ver) 50e65e175bSOded Gabbay return NULL; 51e65e175bSOded Gabbay 52e65e175bSOded Gabbay str = strnstr(fw_str, "fw-", VERSION_MAX_LEN); 53e65e175bSOded Gabbay if (!str) 54e65e175bSOded Gabbay goto free_fw_ver; 55e65e175bSOded Gabbay 56e65e175bSOded Gabbay /* Skip the fw- part */ 57e65e175bSOded Gabbay str += 3; 58e65e175bSOded Gabbay ver_offset = str - fw_str; 59e65e175bSOded Gabbay 60e65e175bSOded Gabbay /* Copy until the next whitespace */ 61e65e175bSOded Gabbay whitespace = strnstr(str, " ", VERSION_MAX_LEN - ver_offset); 62e65e175bSOded Gabbay if (!whitespace) 63e65e175bSOded Gabbay goto free_fw_ver; 64e65e175bSOded Gabbay 65e65e175bSOded Gabbay strscpy(fw_ver, str, whitespace - str + 1); 66e65e175bSOded Gabbay 67e65e175bSOded Gabbay return fw_ver; 68e65e175bSOded Gabbay 69e65e175bSOded Gabbay free_fw_ver: 70e65e175bSOded Gabbay kfree(fw_ver); 71e65e175bSOded Gabbay return NULL; 72e65e175bSOded Gabbay } 73e65e175bSOded Gabbay 74*12f77011SDafna Hirschfeld static int hl_get_preboot_major_minor(struct hl_device *hdev, char *preboot_ver) 75e65e175bSOded Gabbay { 76e65e175bSOded Gabbay char major[8], minor[8], *first_dot, *second_dot; 77e65e175bSOded Gabbay int rc; 78e65e175bSOded Gabbay 79e65e175bSOded Gabbay first_dot = strnstr(preboot_ver, ".", 10); 80e65e175bSOded Gabbay if (first_dot) { 81e65e175bSOded Gabbay strscpy(major, preboot_ver, first_dot - preboot_ver + 1); 82e65e175bSOded Gabbay rc = kstrtou32(major, 10, &hdev->fw_major_version); 83e65e175bSOded Gabbay } else { 84e65e175bSOded Gabbay rc = -EINVAL; 85e65e175bSOded Gabbay } 86e65e175bSOded Gabbay 87e65e175bSOded Gabbay if (rc) { 88e65e175bSOded Gabbay dev_err(hdev->dev, "Error %d parsing preboot major version\n", rc); 89*12f77011SDafna Hirschfeld return rc; 90e65e175bSOded Gabbay } 91e65e175bSOded Gabbay 92e65e175bSOded Gabbay /* skip the first dot */ 93e65e175bSOded Gabbay first_dot++; 94e65e175bSOded Gabbay 95e65e175bSOded Gabbay second_dot = strnstr(first_dot, ".", 10); 96e65e175bSOded Gabbay if (second_dot) { 97e65e175bSOded Gabbay strscpy(minor, first_dot, second_dot - first_dot + 1); 98e65e175bSOded Gabbay rc = kstrtou32(minor, 10, &hdev->fw_minor_version); 99e65e175bSOded Gabbay } else { 100e65e175bSOded Gabbay rc = -EINVAL; 101e65e175bSOded Gabbay } 102e65e175bSOded Gabbay 103e65e175bSOded Gabbay if (rc) 104e65e175bSOded Gabbay dev_err(hdev->dev, "Error %d parsing preboot minor version\n", rc); 105e65e175bSOded Gabbay return rc; 106e65e175bSOded Gabbay } 107e65e175bSOded Gabbay 108e65e175bSOded Gabbay static int hl_request_fw(struct hl_device *hdev, 109e65e175bSOded Gabbay const struct firmware **firmware_p, 110e65e175bSOded Gabbay const char *fw_name) 111e65e175bSOded Gabbay { 112e65e175bSOded Gabbay size_t fw_size; 113e65e175bSOded Gabbay int rc; 114e65e175bSOded Gabbay 115e65e175bSOded Gabbay rc = request_firmware(firmware_p, fw_name, hdev->dev); 116e65e175bSOded Gabbay if (rc) { 117e65e175bSOded Gabbay dev_err(hdev->dev, "Firmware file %s is not found! (error %d)\n", 118e65e175bSOded Gabbay fw_name, rc); 119e65e175bSOded Gabbay goto out; 120e65e175bSOded Gabbay } 121e65e175bSOded Gabbay 122e65e175bSOded Gabbay fw_size = (*firmware_p)->size; 123e65e175bSOded Gabbay if ((fw_size % 4) != 0) { 124e65e175bSOded Gabbay dev_err(hdev->dev, "Illegal %s firmware size %zu\n", 125e65e175bSOded Gabbay fw_name, fw_size); 126e65e175bSOded Gabbay rc = -EINVAL; 127e65e175bSOded Gabbay goto release_fw; 128e65e175bSOded Gabbay } 129e65e175bSOded Gabbay 130e65e175bSOded Gabbay dev_dbg(hdev->dev, "%s firmware size == %zu\n", fw_name, fw_size); 131e65e175bSOded Gabbay 132e65e175bSOded Gabbay if (fw_size > FW_FILE_MAX_SIZE) { 133e65e175bSOded Gabbay dev_err(hdev->dev, 134e65e175bSOded Gabbay "FW file size %zu exceeds maximum of %u bytes\n", 135e65e175bSOded Gabbay fw_size, FW_FILE_MAX_SIZE); 136e65e175bSOded Gabbay rc = -EINVAL; 137e65e175bSOded Gabbay goto release_fw; 138e65e175bSOded Gabbay } 139e65e175bSOded Gabbay 140e65e175bSOded Gabbay return 0; 141e65e175bSOded Gabbay 142e65e175bSOded Gabbay release_fw: 143e65e175bSOded Gabbay release_firmware(*firmware_p); 144e65e175bSOded Gabbay out: 145e65e175bSOded Gabbay return rc; 146e65e175bSOded Gabbay } 147e65e175bSOded Gabbay 148e65e175bSOded Gabbay /** 149e65e175bSOded Gabbay * hl_release_firmware() - release FW 150e65e175bSOded Gabbay * 151e65e175bSOded Gabbay * @fw: fw descriptor 152e65e175bSOded Gabbay * 153e65e175bSOded Gabbay * note: this inline function added to serve as a comprehensive mirror for the 154e65e175bSOded Gabbay * hl_request_fw function. 155e65e175bSOded Gabbay */ 156e65e175bSOded Gabbay static inline void hl_release_firmware(const struct firmware *fw) 157e65e175bSOded Gabbay { 158e65e175bSOded Gabbay release_firmware(fw); 159e65e175bSOded Gabbay } 160e65e175bSOded Gabbay 161e65e175bSOded Gabbay /** 162e65e175bSOded Gabbay * hl_fw_copy_fw_to_device() - copy FW to device 163e65e175bSOded Gabbay * 164e65e175bSOded Gabbay * @hdev: pointer to hl_device structure. 165e65e175bSOded Gabbay * @fw: fw descriptor 166e65e175bSOded Gabbay * @dst: IO memory mapped address space to copy firmware to 167e65e175bSOded Gabbay * @src_offset: offset in src FW to copy from 168e65e175bSOded Gabbay * @size: amount of bytes to copy (0 to copy the whole binary) 169e65e175bSOded Gabbay * 170e65e175bSOded Gabbay * actual copy of FW binary data to device, shared by static and dynamic loaders 171e65e175bSOded Gabbay */ 172e65e175bSOded Gabbay static int hl_fw_copy_fw_to_device(struct hl_device *hdev, 173e65e175bSOded Gabbay const struct firmware *fw, void __iomem *dst, 174e65e175bSOded Gabbay u32 src_offset, u32 size) 175e65e175bSOded Gabbay { 176e65e175bSOded Gabbay const void *fw_data; 177e65e175bSOded Gabbay 178e65e175bSOded Gabbay /* size 0 indicates to copy the whole file */ 179e65e175bSOded Gabbay if (!size) 180e65e175bSOded Gabbay size = fw->size; 181e65e175bSOded Gabbay 182e65e175bSOded Gabbay if (src_offset + size > fw->size) { 183e65e175bSOded Gabbay dev_err(hdev->dev, 184e65e175bSOded Gabbay "size to copy(%u) and offset(%u) are invalid\n", 185e65e175bSOded Gabbay size, src_offset); 186e65e175bSOded Gabbay return -EINVAL; 187e65e175bSOded Gabbay } 188e65e175bSOded Gabbay 189e65e175bSOded Gabbay fw_data = (const void *) fw->data; 190e65e175bSOded Gabbay 191e65e175bSOded Gabbay memcpy_toio(dst, fw_data + src_offset, size); 192e65e175bSOded Gabbay return 0; 193e65e175bSOded Gabbay } 194e65e175bSOded Gabbay 195e65e175bSOded Gabbay /** 196e65e175bSOded Gabbay * hl_fw_copy_msg_to_device() - copy message to device 197e65e175bSOded Gabbay * 198e65e175bSOded Gabbay * @hdev: pointer to hl_device structure. 199e65e175bSOded Gabbay * @msg: message 200e65e175bSOded Gabbay * @dst: IO memory mapped address space to copy firmware to 201e65e175bSOded Gabbay * @src_offset: offset in src message to copy from 202e65e175bSOded Gabbay * @size: amount of bytes to copy (0 to copy the whole binary) 203e65e175bSOded Gabbay * 204e65e175bSOded Gabbay * actual copy of message data to device. 205e65e175bSOded Gabbay */ 206e65e175bSOded Gabbay static int hl_fw_copy_msg_to_device(struct hl_device *hdev, 207e65e175bSOded Gabbay struct lkd_msg_comms *msg, void __iomem *dst, 208e65e175bSOded Gabbay u32 src_offset, u32 size) 209e65e175bSOded Gabbay { 210e65e175bSOded Gabbay void *msg_data; 211e65e175bSOded Gabbay 212e65e175bSOded Gabbay /* size 0 indicates to copy the whole file */ 213e65e175bSOded Gabbay if (!size) 214e65e175bSOded Gabbay size = sizeof(struct lkd_msg_comms); 215e65e175bSOded Gabbay 216e65e175bSOded Gabbay if (src_offset + size > sizeof(struct lkd_msg_comms)) { 217e65e175bSOded Gabbay dev_err(hdev->dev, 218e65e175bSOded Gabbay "size to copy(%u) and offset(%u) are invalid\n", 219e65e175bSOded Gabbay size, src_offset); 220e65e175bSOded Gabbay return -EINVAL; 221e65e175bSOded Gabbay } 222e65e175bSOded Gabbay 223e65e175bSOded Gabbay msg_data = (void *) msg; 224e65e175bSOded Gabbay 225e65e175bSOded Gabbay memcpy_toio(dst, msg_data + src_offset, size); 226e65e175bSOded Gabbay 227e65e175bSOded Gabbay return 0; 228e65e175bSOded Gabbay } 229e65e175bSOded Gabbay 230e65e175bSOded Gabbay /** 231e65e175bSOded Gabbay * hl_fw_load_fw_to_device() - Load F/W code to device's memory. 232e65e175bSOded Gabbay * 233e65e175bSOded Gabbay * @hdev: pointer to hl_device structure. 234e65e175bSOded Gabbay * @fw_name: the firmware image name 235e65e175bSOded Gabbay * @dst: IO memory mapped address space to copy firmware to 236e65e175bSOded Gabbay * @src_offset: offset in src FW to copy from 237e65e175bSOded Gabbay * @size: amount of bytes to copy (0 to copy the whole binary) 238e65e175bSOded Gabbay * 239e65e175bSOded Gabbay * Copy fw code from firmware file to device memory. 240e65e175bSOded Gabbay * 241e65e175bSOded Gabbay * Return: 0 on success, non-zero for failure. 242e65e175bSOded Gabbay */ 243e65e175bSOded Gabbay int hl_fw_load_fw_to_device(struct hl_device *hdev, const char *fw_name, 244e65e175bSOded Gabbay void __iomem *dst, u32 src_offset, u32 size) 245e65e175bSOded Gabbay { 246e65e175bSOded Gabbay const struct firmware *fw; 247e65e175bSOded Gabbay int rc; 248e65e175bSOded Gabbay 249e65e175bSOded Gabbay rc = hl_request_fw(hdev, &fw, fw_name); 250e65e175bSOded Gabbay if (rc) 251e65e175bSOded Gabbay return rc; 252e65e175bSOded Gabbay 253e65e175bSOded Gabbay rc = hl_fw_copy_fw_to_device(hdev, fw, dst, src_offset, size); 254e65e175bSOded Gabbay 255e65e175bSOded Gabbay hl_release_firmware(fw); 256e65e175bSOded Gabbay return rc; 257e65e175bSOded Gabbay } 258e65e175bSOded Gabbay 259e65e175bSOded Gabbay int hl_fw_send_pci_access_msg(struct hl_device *hdev, u32 opcode, u64 value) 260e65e175bSOded Gabbay { 261e65e175bSOded Gabbay struct cpucp_packet pkt = {}; 262e65e175bSOded Gabbay 263e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(opcode << CPUCP_PKT_CTL_OPCODE_SHIFT); 264e65e175bSOded Gabbay pkt.value = cpu_to_le64(value); 265e65e175bSOded Gabbay 266e65e175bSOded Gabbay return hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 0, NULL); 267e65e175bSOded Gabbay } 268e65e175bSOded Gabbay 269e65e175bSOded Gabbay int hl_fw_send_cpu_message(struct hl_device *hdev, u32 hw_queue_id, u32 *msg, 270e65e175bSOded Gabbay u16 len, u32 timeout, u64 *result) 271e65e175bSOded Gabbay { 272e65e175bSOded Gabbay struct hl_hw_queue *queue = &hdev->kernel_queues[hw_queue_id]; 273e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 274e65e175bSOded Gabbay struct cpucp_packet *pkt; 275e65e175bSOded Gabbay dma_addr_t pkt_dma_addr; 276e65e175bSOded Gabbay struct hl_bd *sent_bd; 277e65e175bSOded Gabbay u32 tmp, expected_ack_val, pi, opcode; 278e65e175bSOded Gabbay int rc; 279e65e175bSOded Gabbay 280e65e175bSOded Gabbay pkt = hl_cpu_accessible_dma_pool_alloc(hdev, len, &pkt_dma_addr); 281e65e175bSOded Gabbay if (!pkt) { 282e65e175bSOded Gabbay dev_err(hdev->dev, 283e65e175bSOded Gabbay "Failed to allocate DMA memory for packet to CPU\n"); 284e65e175bSOded Gabbay return -ENOMEM; 285e65e175bSOded Gabbay } 286e65e175bSOded Gabbay 287e65e175bSOded Gabbay memcpy(pkt, msg, len); 288e65e175bSOded Gabbay 289e65e175bSOded Gabbay mutex_lock(&hdev->send_cpu_message_lock); 290e65e175bSOded Gabbay 291e65e175bSOded Gabbay /* CPU-CP messages can be sent during soft-reset */ 292e65e175bSOded Gabbay if (hdev->disabled && !hdev->reset_info.in_compute_reset) { 293e65e175bSOded Gabbay rc = 0; 294e65e175bSOded Gabbay goto out; 295e65e175bSOded Gabbay } 296e65e175bSOded Gabbay 297e65e175bSOded Gabbay if (hdev->device_cpu_disabled) { 298e65e175bSOded Gabbay rc = -EIO; 299e65e175bSOded Gabbay goto out; 300e65e175bSOded Gabbay } 301e65e175bSOded Gabbay 302e65e175bSOded Gabbay /* set fence to a non valid value */ 303e65e175bSOded Gabbay pkt->fence = cpu_to_le32(UINT_MAX); 304e65e175bSOded Gabbay pi = queue->pi; 305e65e175bSOded Gabbay 306e65e175bSOded Gabbay /* 307e65e175bSOded Gabbay * The CPU queue is a synchronous queue with an effective depth of 308e65e175bSOded Gabbay * a single entry (although it is allocated with room for multiple 309e65e175bSOded Gabbay * entries). We lock on it using 'send_cpu_message_lock' which 310e65e175bSOded Gabbay * serializes accesses to the CPU queue. 311e65e175bSOded Gabbay * Which means that we don't need to lock the access to the entire H/W 312e65e175bSOded Gabbay * queues module when submitting a JOB to the CPU queue. 313e65e175bSOded Gabbay */ 314e65e175bSOded Gabbay hl_hw_queue_submit_bd(hdev, queue, hl_queue_inc_ptr(queue->pi), len, pkt_dma_addr); 315e65e175bSOded Gabbay 316e65e175bSOded Gabbay if (prop->fw_app_cpu_boot_dev_sts0 & CPU_BOOT_DEV_STS0_PKT_PI_ACK_EN) 317e65e175bSOded Gabbay expected_ack_val = queue->pi; 318e65e175bSOded Gabbay else 319e65e175bSOded Gabbay expected_ack_val = CPUCP_PACKET_FENCE_VAL; 320e65e175bSOded Gabbay 321e65e175bSOded Gabbay rc = hl_poll_timeout_memory(hdev, &pkt->fence, tmp, 322e65e175bSOded Gabbay (tmp == expected_ack_val), 1000, 323e65e175bSOded Gabbay timeout, true); 324e65e175bSOded Gabbay 325e65e175bSOded Gabbay hl_hw_queue_inc_ci_kernel(hdev, hw_queue_id); 326e65e175bSOded Gabbay 327e65e175bSOded Gabbay if (rc == -ETIMEDOUT) { 328e65e175bSOded Gabbay /* If FW performed reset just before sending it a packet, we will get a timeout. 329e65e175bSOded Gabbay * This is expected behavior, hence no need for error message. 330e65e175bSOded Gabbay */ 331e65e175bSOded Gabbay if (!hl_device_operational(hdev, NULL) && !hdev->reset_info.in_compute_reset) 332e65e175bSOded Gabbay dev_dbg(hdev->dev, "Device CPU packet timeout (0x%x) due to FW reset\n", 333e65e175bSOded Gabbay tmp); 334e65e175bSOded Gabbay else 335eba773d3SMoti Haimovski dev_err(hdev->dev, "Device CPU packet timeout (status = 0x%x)\n", tmp); 336e65e175bSOded Gabbay hdev->device_cpu_disabled = true; 337e65e175bSOded Gabbay goto out; 338e65e175bSOded Gabbay } 339e65e175bSOded Gabbay 340e65e175bSOded Gabbay tmp = le32_to_cpu(pkt->ctl); 341e65e175bSOded Gabbay 342e65e175bSOded Gabbay rc = (tmp & CPUCP_PKT_CTL_RC_MASK) >> CPUCP_PKT_CTL_RC_SHIFT; 343e65e175bSOded Gabbay if (rc) { 344e65e175bSOded Gabbay opcode = (tmp & CPUCP_PKT_CTL_OPCODE_MASK) >> CPUCP_PKT_CTL_OPCODE_SHIFT; 345e65e175bSOded Gabbay 346e65e175bSOded Gabbay if (!prop->supports_advanced_cpucp_rc) { 347e65e175bSOded Gabbay dev_dbg(hdev->dev, "F/W ERROR %d for CPU packet %d\n", rc, opcode); 348e65e175bSOded Gabbay rc = -EIO; 349e65e175bSOded Gabbay goto scrub_descriptor; 350e65e175bSOded Gabbay } 351e65e175bSOded Gabbay 352e65e175bSOded Gabbay switch (rc) { 353e65e175bSOded Gabbay case cpucp_packet_invalid: 354e65e175bSOded Gabbay dev_err(hdev->dev, 355e65e175bSOded Gabbay "CPU packet %d is not supported by F/W\n", opcode); 356e65e175bSOded Gabbay break; 357e65e175bSOded Gabbay case cpucp_packet_fault: 358e65e175bSOded Gabbay dev_err(hdev->dev, 359e65e175bSOded Gabbay "F/W failed processing CPU packet %d\n", opcode); 360e65e175bSOded Gabbay break; 361e65e175bSOded Gabbay case cpucp_packet_invalid_pkt: 362e65e175bSOded Gabbay dev_dbg(hdev->dev, 363e65e175bSOded Gabbay "CPU packet %d is not supported by F/W\n", opcode); 364e65e175bSOded Gabbay break; 365e65e175bSOded Gabbay case cpucp_packet_invalid_params: 366e65e175bSOded Gabbay dev_err(hdev->dev, 367e65e175bSOded Gabbay "F/W reports invalid parameters for CPU packet %d\n", opcode); 368e65e175bSOded Gabbay break; 369e65e175bSOded Gabbay 370e65e175bSOded Gabbay default: 371e65e175bSOded Gabbay dev_err(hdev->dev, 372e65e175bSOded Gabbay "Unknown F/W ERROR %d for CPU packet %d\n", rc, opcode); 373e65e175bSOded Gabbay } 374e65e175bSOded Gabbay 375e65e175bSOded Gabbay /* propagate the return code from the f/w to the callers who want to check it */ 376e65e175bSOded Gabbay if (result) 377e65e175bSOded Gabbay *result = rc; 378e65e175bSOded Gabbay 379e65e175bSOded Gabbay rc = -EIO; 380e65e175bSOded Gabbay 381e65e175bSOded Gabbay } else if (result) { 382e65e175bSOded Gabbay *result = le64_to_cpu(pkt->result); 383e65e175bSOded Gabbay } 384e65e175bSOded Gabbay 385e65e175bSOded Gabbay scrub_descriptor: 386e65e175bSOded Gabbay /* Scrub previous buffer descriptor 'ctl' field which contains the 387e65e175bSOded Gabbay * previous PI value written during packet submission. 388e65e175bSOded Gabbay * We must do this or else F/W can read an old value upon queue wraparound. 389e65e175bSOded Gabbay */ 390e65e175bSOded Gabbay sent_bd = queue->kernel_address; 391e65e175bSOded Gabbay sent_bd += hl_pi_2_offset(pi); 392e65e175bSOded Gabbay sent_bd->ctl = cpu_to_le32(UINT_MAX); 393e65e175bSOded Gabbay 394e65e175bSOded Gabbay out: 395e65e175bSOded Gabbay mutex_unlock(&hdev->send_cpu_message_lock); 396e65e175bSOded Gabbay 397e65e175bSOded Gabbay hl_cpu_accessible_dma_pool_free(hdev, len, pkt); 398e65e175bSOded Gabbay 399e65e175bSOded Gabbay return rc; 400e65e175bSOded Gabbay } 401e65e175bSOded Gabbay 402e65e175bSOded Gabbay int hl_fw_unmask_irq(struct hl_device *hdev, u16 event_type) 403e65e175bSOded Gabbay { 404e65e175bSOded Gabbay struct cpucp_packet pkt; 405e65e175bSOded Gabbay u64 result; 406e65e175bSOded Gabbay int rc; 407e65e175bSOded Gabbay 408e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 409e65e175bSOded Gabbay 410e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_UNMASK_RAZWI_IRQ << 411e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 412e65e175bSOded Gabbay pkt.value = cpu_to_le64(event_type); 413e65e175bSOded Gabbay 414e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 415e65e175bSOded Gabbay 0, &result); 416e65e175bSOded Gabbay 417e65e175bSOded Gabbay if (rc) 418e65e175bSOded Gabbay dev_err(hdev->dev, "failed to unmask RAZWI IRQ %d", event_type); 419e65e175bSOded Gabbay 420e65e175bSOded Gabbay return rc; 421e65e175bSOded Gabbay } 422e65e175bSOded Gabbay 423e65e175bSOded Gabbay int hl_fw_unmask_irq_arr(struct hl_device *hdev, const u32 *irq_arr, 424e65e175bSOded Gabbay size_t irq_arr_size) 425e65e175bSOded Gabbay { 426e65e175bSOded Gabbay struct cpucp_unmask_irq_arr_packet *pkt; 427e65e175bSOded Gabbay size_t total_pkt_size; 428e65e175bSOded Gabbay u64 result; 429e65e175bSOded Gabbay int rc; 430e65e175bSOded Gabbay 431e65e175bSOded Gabbay total_pkt_size = sizeof(struct cpucp_unmask_irq_arr_packet) + 432e65e175bSOded Gabbay irq_arr_size; 433e65e175bSOded Gabbay 434e65e175bSOded Gabbay /* data should be aligned to 8 bytes in order to CPU-CP to copy it */ 435e65e175bSOded Gabbay total_pkt_size = (total_pkt_size + 0x7) & ~0x7; 436e65e175bSOded Gabbay 437e65e175bSOded Gabbay /* total_pkt_size is casted to u16 later on */ 438e65e175bSOded Gabbay if (total_pkt_size > USHRT_MAX) { 439e65e175bSOded Gabbay dev_err(hdev->dev, "too many elements in IRQ array\n"); 440e65e175bSOded Gabbay return -EINVAL; 441e65e175bSOded Gabbay } 442e65e175bSOded Gabbay 443e65e175bSOded Gabbay pkt = kzalloc(total_pkt_size, GFP_KERNEL); 444e65e175bSOded Gabbay if (!pkt) 445e65e175bSOded Gabbay return -ENOMEM; 446e65e175bSOded Gabbay 447e65e175bSOded Gabbay pkt->length = cpu_to_le32(irq_arr_size / sizeof(irq_arr[0])); 448e65e175bSOded Gabbay memcpy(&pkt->irqs, irq_arr, irq_arr_size); 449e65e175bSOded Gabbay 450e65e175bSOded Gabbay pkt->cpucp_pkt.ctl = cpu_to_le32(CPUCP_PACKET_UNMASK_RAZWI_IRQ_ARRAY << 451e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 452e65e175bSOded Gabbay 453e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) pkt, 454e65e175bSOded Gabbay total_pkt_size, 0, &result); 455e65e175bSOded Gabbay 456e65e175bSOded Gabbay if (rc) 457e65e175bSOded Gabbay dev_err(hdev->dev, "failed to unmask IRQ array\n"); 458e65e175bSOded Gabbay 459e65e175bSOded Gabbay kfree(pkt); 460e65e175bSOded Gabbay 461e65e175bSOded Gabbay return rc; 462e65e175bSOded Gabbay } 463e65e175bSOded Gabbay 464e65e175bSOded Gabbay int hl_fw_test_cpu_queue(struct hl_device *hdev) 465e65e175bSOded Gabbay { 466e65e175bSOded Gabbay struct cpucp_packet test_pkt = {}; 467e65e175bSOded Gabbay u64 result; 468e65e175bSOded Gabbay int rc; 469e65e175bSOded Gabbay 470e65e175bSOded Gabbay test_pkt.ctl = cpu_to_le32(CPUCP_PACKET_TEST << 471e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 472e65e175bSOded Gabbay test_pkt.value = cpu_to_le64(CPUCP_PACKET_FENCE_VAL); 473e65e175bSOded Gabbay 474e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &test_pkt, 475e65e175bSOded Gabbay sizeof(test_pkt), 0, &result); 476e65e175bSOded Gabbay 477e65e175bSOded Gabbay if (!rc) { 478e65e175bSOded Gabbay if (result != CPUCP_PACKET_FENCE_VAL) 479e65e175bSOded Gabbay dev_err(hdev->dev, 480e65e175bSOded Gabbay "CPU queue test failed (%#08llx)\n", result); 481e65e175bSOded Gabbay } else { 482e65e175bSOded Gabbay dev_err(hdev->dev, "CPU queue test failed, error %d\n", rc); 483e65e175bSOded Gabbay } 484e65e175bSOded Gabbay 485e65e175bSOded Gabbay return rc; 486e65e175bSOded Gabbay } 487e65e175bSOded Gabbay 488e65e175bSOded Gabbay void *hl_fw_cpu_accessible_dma_pool_alloc(struct hl_device *hdev, size_t size, 489e65e175bSOded Gabbay dma_addr_t *dma_handle) 490e65e175bSOded Gabbay { 491e65e175bSOded Gabbay u64 kernel_addr; 492e65e175bSOded Gabbay 493e65e175bSOded Gabbay kernel_addr = gen_pool_alloc(hdev->cpu_accessible_dma_pool, size); 494e65e175bSOded Gabbay 495e65e175bSOded Gabbay *dma_handle = hdev->cpu_accessible_dma_address + 496e65e175bSOded Gabbay (kernel_addr - (u64) (uintptr_t) hdev->cpu_accessible_dma_mem); 497e65e175bSOded Gabbay 498e65e175bSOded Gabbay return (void *) (uintptr_t) kernel_addr; 499e65e175bSOded Gabbay } 500e65e175bSOded Gabbay 501e65e175bSOded Gabbay void hl_fw_cpu_accessible_dma_pool_free(struct hl_device *hdev, size_t size, 502e65e175bSOded Gabbay void *vaddr) 503e65e175bSOded Gabbay { 504e65e175bSOded Gabbay gen_pool_free(hdev->cpu_accessible_dma_pool, (u64) (uintptr_t) vaddr, 505e65e175bSOded Gabbay size); 506e65e175bSOded Gabbay } 507e65e175bSOded Gabbay 508e65e175bSOded Gabbay int hl_fw_send_device_activity(struct hl_device *hdev, bool open) 509e65e175bSOded Gabbay { 510e65e175bSOded Gabbay struct cpucp_packet pkt; 511e65e175bSOded Gabbay int rc; 512e65e175bSOded Gabbay 513e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 514e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_ACTIVE_STATUS_SET << CPUCP_PKT_CTL_OPCODE_SHIFT); 515e65e175bSOded Gabbay pkt.value = cpu_to_le64(open); 516e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 0, NULL); 517e65e175bSOded Gabbay if (rc) 518e65e175bSOded Gabbay dev_err(hdev->dev, "failed to send device activity msg(%u)\n", open); 519e65e175bSOded Gabbay 520e65e175bSOded Gabbay return rc; 521e65e175bSOded Gabbay } 522e65e175bSOded Gabbay 523e65e175bSOded Gabbay int hl_fw_send_heartbeat(struct hl_device *hdev) 524e65e175bSOded Gabbay { 525e65e175bSOded Gabbay struct cpucp_packet hb_pkt; 526e65e175bSOded Gabbay u64 result; 527e65e175bSOded Gabbay int rc; 528e65e175bSOded Gabbay 529e65e175bSOded Gabbay memset(&hb_pkt, 0, sizeof(hb_pkt)); 530e65e175bSOded Gabbay hb_pkt.ctl = cpu_to_le32(CPUCP_PACKET_TEST << 531e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 532e65e175bSOded Gabbay hb_pkt.value = cpu_to_le64(CPUCP_PACKET_FENCE_VAL); 533e65e175bSOded Gabbay 534e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &hb_pkt, 535e65e175bSOded Gabbay sizeof(hb_pkt), 0, &result); 536e65e175bSOded Gabbay 537e65e175bSOded Gabbay if ((rc) || (result != CPUCP_PACKET_FENCE_VAL)) 538e65e175bSOded Gabbay return -EIO; 539e65e175bSOded Gabbay 540e65e175bSOded Gabbay if (le32_to_cpu(hb_pkt.status_mask) & 541e65e175bSOded Gabbay CPUCP_PKT_HB_STATUS_EQ_FAULT_MASK) { 542e65e175bSOded Gabbay dev_warn(hdev->dev, "FW reported EQ fault during heartbeat\n"); 543e65e175bSOded Gabbay rc = -EIO; 544e65e175bSOded Gabbay } 545e65e175bSOded Gabbay 546e65e175bSOded Gabbay return rc; 547e65e175bSOded Gabbay } 548e65e175bSOded Gabbay 549e65e175bSOded Gabbay static bool fw_report_boot_dev0(struct hl_device *hdev, u32 err_val, 550e65e175bSOded Gabbay u32 sts_val) 551e65e175bSOded Gabbay { 552e65e175bSOded Gabbay bool err_exists = false; 553e65e175bSOded Gabbay 554e65e175bSOded Gabbay if (!(err_val & CPU_BOOT_ERR0_ENABLED)) 555e65e175bSOded Gabbay return false; 556e65e175bSOded Gabbay 557e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_DRAM_INIT_FAIL) { 558e65e175bSOded Gabbay dev_err(hdev->dev, 559e65e175bSOded Gabbay "Device boot error - DRAM initialization failed\n"); 560e65e175bSOded Gabbay err_exists = true; 561e65e175bSOded Gabbay } 562e65e175bSOded Gabbay 563e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_FIT_CORRUPTED) { 564e65e175bSOded Gabbay dev_err(hdev->dev, "Device boot error - FIT image corrupted\n"); 565e65e175bSOded Gabbay err_exists = true; 566e65e175bSOded Gabbay } 567e65e175bSOded Gabbay 568e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_TS_INIT_FAIL) { 569e65e175bSOded Gabbay dev_err(hdev->dev, 570e65e175bSOded Gabbay "Device boot error - Thermal Sensor initialization failed\n"); 571e65e175bSOded Gabbay err_exists = true; 572e65e175bSOded Gabbay } 573e65e175bSOded Gabbay 574e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_BMC_WAIT_SKIPPED) { 575e65e175bSOded Gabbay if (hdev->bmc_enable) { 576e65e175bSOded Gabbay dev_err(hdev->dev, 577e65e175bSOded Gabbay "Device boot error - Skipped waiting for BMC\n"); 578e65e175bSOded Gabbay err_exists = true; 579e65e175bSOded Gabbay } else { 580e65e175bSOded Gabbay dev_info(hdev->dev, 581e65e175bSOded Gabbay "Device boot message - Skipped waiting for BMC\n"); 582e65e175bSOded Gabbay /* This is an info so we don't want it to disable the 583e65e175bSOded Gabbay * device 584e65e175bSOded Gabbay */ 585e65e175bSOded Gabbay err_val &= ~CPU_BOOT_ERR0_BMC_WAIT_SKIPPED; 586e65e175bSOded Gabbay } 587e65e175bSOded Gabbay } 588e65e175bSOded Gabbay 589e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_NIC_DATA_NOT_RDY) { 590e65e175bSOded Gabbay dev_err(hdev->dev, 591e65e175bSOded Gabbay "Device boot error - Serdes data from BMC not available\n"); 592e65e175bSOded Gabbay err_exists = true; 593e65e175bSOded Gabbay } 594e65e175bSOded Gabbay 595e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_NIC_FW_FAIL) { 596e65e175bSOded Gabbay dev_err(hdev->dev, 597e65e175bSOded Gabbay "Device boot error - NIC F/W initialization failed\n"); 598e65e175bSOded Gabbay err_exists = true; 599e65e175bSOded Gabbay } 600e65e175bSOded Gabbay 601e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_SECURITY_NOT_RDY) { 602e65e175bSOded Gabbay dev_err(hdev->dev, 603e65e175bSOded Gabbay "Device boot warning - security not ready\n"); 604e65e175bSOded Gabbay err_exists = true; 605e65e175bSOded Gabbay } 606e65e175bSOded Gabbay 607e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_SECURITY_FAIL) { 608e65e175bSOded Gabbay dev_err(hdev->dev, "Device boot error - security failure\n"); 609e65e175bSOded Gabbay err_exists = true; 610e65e175bSOded Gabbay } 611e65e175bSOded Gabbay 612e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_EFUSE_FAIL) { 613e65e175bSOded Gabbay dev_err(hdev->dev, "Device boot error - eFuse failure\n"); 614e65e175bSOded Gabbay err_exists = true; 615e65e175bSOded Gabbay } 616e65e175bSOded Gabbay 617e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_SEC_IMG_VER_FAIL) { 618e65e175bSOded Gabbay dev_err(hdev->dev, "Device boot error - Failed to load preboot secondary image\n"); 619e65e175bSOded Gabbay err_exists = true; 620e65e175bSOded Gabbay } 621e65e175bSOded Gabbay 622e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_PLL_FAIL) { 623e65e175bSOded Gabbay dev_err(hdev->dev, "Device boot error - PLL failure\n"); 624e65e175bSOded Gabbay err_exists = true; 625e65e175bSOded Gabbay } 626e65e175bSOded Gabbay 627e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_DEVICE_UNUSABLE_FAIL) { 628e65e175bSOded Gabbay /* Ignore this bit, don't prevent driver loading */ 629e65e175bSOded Gabbay dev_dbg(hdev->dev, "device unusable status is set\n"); 630e65e175bSOded Gabbay err_val &= ~CPU_BOOT_ERR0_DEVICE_UNUSABLE_FAIL; 631e65e175bSOded Gabbay } 632e65e175bSOded Gabbay 633e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_BINNING_FAIL) { 634e65e175bSOded Gabbay dev_err(hdev->dev, "Device boot error - binning failure\n"); 635e65e175bSOded Gabbay err_exists = true; 636e65e175bSOded Gabbay } 637e65e175bSOded Gabbay 638e65e175bSOded Gabbay if (sts_val & CPU_BOOT_DEV_STS0_ENABLED) 639e65e175bSOded Gabbay dev_dbg(hdev->dev, "Device status0 %#x\n", sts_val); 640e65e175bSOded Gabbay 641e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_EEPROM_FAIL) { 642e65e175bSOded Gabbay dev_err(hdev->dev, "Device boot error - EEPROM failure detected\n"); 643e65e175bSOded Gabbay err_exists = true; 644e65e175bSOded Gabbay } 645e65e175bSOded Gabbay 646e65e175bSOded Gabbay /* All warnings should go here in order not to reach the unknown error validation */ 647e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_DRAM_SKIPPED) { 648e65e175bSOded Gabbay dev_warn(hdev->dev, 649e65e175bSOded Gabbay "Device boot warning - Skipped DRAM initialization\n"); 650e65e175bSOded Gabbay /* This is a warning so we don't want it to disable the 651e65e175bSOded Gabbay * device 652e65e175bSOded Gabbay */ 653e65e175bSOded Gabbay err_val &= ~CPU_BOOT_ERR0_DRAM_SKIPPED; 654e65e175bSOded Gabbay } 655e65e175bSOded Gabbay 656e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_PRI_IMG_VER_FAIL) { 657e65e175bSOded Gabbay dev_warn(hdev->dev, 658e65e175bSOded Gabbay "Device boot warning - Failed to load preboot primary image\n"); 659e65e175bSOded Gabbay /* This is a warning so we don't want it to disable the 660e65e175bSOded Gabbay * device as we have a secondary preboot image 661e65e175bSOded Gabbay */ 662e65e175bSOded Gabbay err_val &= ~CPU_BOOT_ERR0_PRI_IMG_VER_FAIL; 663e65e175bSOded Gabbay } 664e65e175bSOded Gabbay 665e65e175bSOded Gabbay if (err_val & CPU_BOOT_ERR0_TPM_FAIL) { 666e65e175bSOded Gabbay dev_warn(hdev->dev, 667e65e175bSOded Gabbay "Device boot warning - TPM failure\n"); 668e65e175bSOded Gabbay /* This is a warning so we don't want it to disable the 669e65e175bSOded Gabbay * device 670e65e175bSOded Gabbay */ 671e65e175bSOded Gabbay err_val &= ~CPU_BOOT_ERR0_TPM_FAIL; 672e65e175bSOded Gabbay } 673e65e175bSOded Gabbay 674e65e175bSOded Gabbay if (!err_exists && (err_val & ~CPU_BOOT_ERR0_ENABLED)) { 675e65e175bSOded Gabbay dev_err(hdev->dev, 676e65e175bSOded Gabbay "Device boot error - unknown ERR0 error 0x%08x\n", err_val); 677e65e175bSOded Gabbay err_exists = true; 678e65e175bSOded Gabbay } 679e65e175bSOded Gabbay 680e65e175bSOded Gabbay /* return error only if it's in the predefined mask */ 681e65e175bSOded Gabbay if (err_exists && ((err_val & ~CPU_BOOT_ERR0_ENABLED) & 682e65e175bSOded Gabbay lower_32_bits(hdev->boot_error_status_mask))) 683e65e175bSOded Gabbay return true; 684e65e175bSOded Gabbay 685e65e175bSOded Gabbay return false; 686e65e175bSOded Gabbay } 687e65e175bSOded Gabbay 688e65e175bSOded Gabbay /* placeholder for ERR1 as no errors defined there yet */ 689e65e175bSOded Gabbay static bool fw_report_boot_dev1(struct hl_device *hdev, u32 err_val, 690e65e175bSOded Gabbay u32 sts_val) 691e65e175bSOded Gabbay { 692e65e175bSOded Gabbay /* 693e65e175bSOded Gabbay * keep this variable to preserve the logic of the function. 694e65e175bSOded Gabbay * this way it would require less modifications when error will be 695e65e175bSOded Gabbay * added to DEV_ERR1 696e65e175bSOded Gabbay */ 697e65e175bSOded Gabbay bool err_exists = false; 698e65e175bSOded Gabbay 699e65e175bSOded Gabbay if (!(err_val & CPU_BOOT_ERR1_ENABLED)) 700e65e175bSOded Gabbay return false; 701e65e175bSOded Gabbay 702e65e175bSOded Gabbay if (sts_val & CPU_BOOT_DEV_STS1_ENABLED) 703e65e175bSOded Gabbay dev_dbg(hdev->dev, "Device status1 %#x\n", sts_val); 704e65e175bSOded Gabbay 705e65e175bSOded Gabbay if (!err_exists && (err_val & ~CPU_BOOT_ERR1_ENABLED)) { 706e65e175bSOded Gabbay dev_err(hdev->dev, 707e65e175bSOded Gabbay "Device boot error - unknown ERR1 error 0x%08x\n", 708e65e175bSOded Gabbay err_val); 709e65e175bSOded Gabbay err_exists = true; 710e65e175bSOded Gabbay } 711e65e175bSOded Gabbay 712e65e175bSOded Gabbay /* return error only if it's in the predefined mask */ 713e65e175bSOded Gabbay if (err_exists && ((err_val & ~CPU_BOOT_ERR1_ENABLED) & 714e65e175bSOded Gabbay upper_32_bits(hdev->boot_error_status_mask))) 715e65e175bSOded Gabbay return true; 716e65e175bSOded Gabbay 717e65e175bSOded Gabbay return false; 718e65e175bSOded Gabbay } 719e65e175bSOded Gabbay 720e65e175bSOded Gabbay static int fw_read_errors(struct hl_device *hdev, u32 boot_err0_reg, 721e65e175bSOded Gabbay u32 boot_err1_reg, u32 cpu_boot_dev_status0_reg, 722e65e175bSOded Gabbay u32 cpu_boot_dev_status1_reg) 723e65e175bSOded Gabbay { 724e65e175bSOded Gabbay u32 err_val, status_val; 725e65e175bSOded Gabbay bool err_exists = false; 726e65e175bSOded Gabbay 727e65e175bSOded Gabbay /* Some of the firmware status codes are deprecated in newer f/w 728e65e175bSOded Gabbay * versions. In those versions, the errors are reported 729e65e175bSOded Gabbay * in different registers. Therefore, we need to check those 730e65e175bSOded Gabbay * registers and print the exact errors. Moreover, there 731e65e175bSOded Gabbay * may be multiple errors, so we need to report on each error 732e65e175bSOded Gabbay * separately. Some of the error codes might indicate a state 733e65e175bSOded Gabbay * that is not an error per-se, but it is an error in production 734e65e175bSOded Gabbay * environment 735e65e175bSOded Gabbay */ 736e65e175bSOded Gabbay err_val = RREG32(boot_err0_reg); 737e65e175bSOded Gabbay status_val = RREG32(cpu_boot_dev_status0_reg); 738e65e175bSOded Gabbay err_exists = fw_report_boot_dev0(hdev, err_val, status_val); 739e65e175bSOded Gabbay 740e65e175bSOded Gabbay err_val = RREG32(boot_err1_reg); 741e65e175bSOded Gabbay status_val = RREG32(cpu_boot_dev_status1_reg); 742e65e175bSOded Gabbay err_exists |= fw_report_boot_dev1(hdev, err_val, status_val); 743e65e175bSOded Gabbay 744e65e175bSOded Gabbay if (err_exists) 745e65e175bSOded Gabbay return -EIO; 746e65e175bSOded Gabbay 747e65e175bSOded Gabbay return 0; 748e65e175bSOded Gabbay } 749e65e175bSOded Gabbay 750e65e175bSOded Gabbay int hl_fw_cpucp_info_get(struct hl_device *hdev, 751e65e175bSOded Gabbay u32 sts_boot_dev_sts0_reg, 752e65e175bSOded Gabbay u32 sts_boot_dev_sts1_reg, u32 boot_err0_reg, 753e65e175bSOded Gabbay u32 boot_err1_reg) 754e65e175bSOded Gabbay { 755e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 756e65e175bSOded Gabbay struct cpucp_packet pkt = {}; 757e65e175bSOded Gabbay dma_addr_t cpucp_info_dma_addr; 758e65e175bSOded Gabbay void *cpucp_info_cpu_addr; 759e65e175bSOded Gabbay char *kernel_ver; 760e65e175bSOded Gabbay u64 result; 761e65e175bSOded Gabbay int rc; 762e65e175bSOded Gabbay 763e65e175bSOded Gabbay cpucp_info_cpu_addr = hl_cpu_accessible_dma_pool_alloc(hdev, sizeof(struct cpucp_info), 764e65e175bSOded Gabbay &cpucp_info_dma_addr); 765e65e175bSOded Gabbay if (!cpucp_info_cpu_addr) { 766e65e175bSOded Gabbay dev_err(hdev->dev, 767e65e175bSOded Gabbay "Failed to allocate DMA memory for CPU-CP info packet\n"); 768e65e175bSOded Gabbay return -ENOMEM; 769e65e175bSOded Gabbay } 770e65e175bSOded Gabbay 771e65e175bSOded Gabbay memset(cpucp_info_cpu_addr, 0, sizeof(struct cpucp_info)); 772e65e175bSOded Gabbay 773e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_INFO_GET << 774e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 775e65e175bSOded Gabbay pkt.addr = cpu_to_le64(cpucp_info_dma_addr); 776e65e175bSOded Gabbay pkt.data_max_size = cpu_to_le32(sizeof(struct cpucp_info)); 777e65e175bSOded Gabbay 778e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 779e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 780e65e175bSOded Gabbay if (rc) { 781e65e175bSOded Gabbay dev_err(hdev->dev, 782e65e175bSOded Gabbay "Failed to handle CPU-CP info pkt, error %d\n", rc); 783e65e175bSOded Gabbay goto out; 784e65e175bSOded Gabbay } 785e65e175bSOded Gabbay 786e65e175bSOded Gabbay rc = fw_read_errors(hdev, boot_err0_reg, boot_err1_reg, 787e65e175bSOded Gabbay sts_boot_dev_sts0_reg, sts_boot_dev_sts1_reg); 788e65e175bSOded Gabbay if (rc) { 789e65e175bSOded Gabbay dev_err(hdev->dev, "Errors in device boot\n"); 790e65e175bSOded Gabbay goto out; 791e65e175bSOded Gabbay } 792e65e175bSOded Gabbay 793e65e175bSOded Gabbay memcpy(&prop->cpucp_info, cpucp_info_cpu_addr, 794e65e175bSOded Gabbay sizeof(prop->cpucp_info)); 795e65e175bSOded Gabbay 796e65e175bSOded Gabbay rc = hl_build_hwmon_channel_info(hdev, prop->cpucp_info.sensors); 797e65e175bSOded Gabbay if (rc) { 798e65e175bSOded Gabbay dev_err(hdev->dev, 799e65e175bSOded Gabbay "Failed to build hwmon channel info, error %d\n", rc); 800e65e175bSOded Gabbay rc = -EFAULT; 801e65e175bSOded Gabbay goto out; 802e65e175bSOded Gabbay } 803e65e175bSOded Gabbay 804e65e175bSOded Gabbay kernel_ver = extract_fw_ver_from_str(prop->cpucp_info.kernel_version); 805e65e175bSOded Gabbay if (kernel_ver) { 806e65e175bSOded Gabbay dev_info(hdev->dev, "Linux version %s", kernel_ver); 807e65e175bSOded Gabbay kfree(kernel_ver); 808e65e175bSOded Gabbay } 809e65e175bSOded Gabbay 810e65e175bSOded Gabbay /* assume EQ code doesn't need to check eqe index */ 811e65e175bSOded Gabbay hdev->event_queue.check_eqe_index = false; 812e65e175bSOded Gabbay 813e65e175bSOded Gabbay /* Read FW application security bits again */ 814e65e175bSOded Gabbay if (prop->fw_cpu_boot_dev_sts0_valid) { 815e65e175bSOded Gabbay prop->fw_app_cpu_boot_dev_sts0 = RREG32(sts_boot_dev_sts0_reg); 816e65e175bSOded Gabbay if (prop->fw_app_cpu_boot_dev_sts0 & 817e65e175bSOded Gabbay CPU_BOOT_DEV_STS0_EQ_INDEX_EN) 818e65e175bSOded Gabbay hdev->event_queue.check_eqe_index = true; 819e65e175bSOded Gabbay } 820e65e175bSOded Gabbay 821e65e175bSOded Gabbay if (prop->fw_cpu_boot_dev_sts1_valid) 822e65e175bSOded Gabbay prop->fw_app_cpu_boot_dev_sts1 = RREG32(sts_boot_dev_sts1_reg); 823e65e175bSOded Gabbay 824e65e175bSOded Gabbay out: 825e65e175bSOded Gabbay hl_cpu_accessible_dma_pool_free(hdev, sizeof(struct cpucp_info), cpucp_info_cpu_addr); 826e65e175bSOded Gabbay 827e65e175bSOded Gabbay return rc; 828e65e175bSOded Gabbay } 829e65e175bSOded Gabbay 830e65e175bSOded Gabbay static int hl_fw_send_msi_info_msg(struct hl_device *hdev) 831e65e175bSOded Gabbay { 832e65e175bSOded Gabbay struct cpucp_array_data_packet *pkt; 833e65e175bSOded Gabbay size_t total_pkt_size, data_size; 834e65e175bSOded Gabbay u64 result; 835e65e175bSOded Gabbay int rc; 836e65e175bSOded Gabbay 837e65e175bSOded Gabbay /* skip sending this info for unsupported ASICs */ 838e65e175bSOded Gabbay if (!hdev->asic_funcs->get_msi_info) 839e65e175bSOded Gabbay return 0; 840e65e175bSOded Gabbay 841e65e175bSOded Gabbay data_size = CPUCP_NUM_OF_MSI_TYPES * sizeof(u32); 842e65e175bSOded Gabbay total_pkt_size = sizeof(struct cpucp_array_data_packet) + data_size; 843e65e175bSOded Gabbay 844e65e175bSOded Gabbay /* data should be aligned to 8 bytes in order to CPU-CP to copy it */ 845e65e175bSOded Gabbay total_pkt_size = (total_pkt_size + 0x7) & ~0x7; 846e65e175bSOded Gabbay 847e65e175bSOded Gabbay /* total_pkt_size is casted to u16 later on */ 848e65e175bSOded Gabbay if (total_pkt_size > USHRT_MAX) { 849e65e175bSOded Gabbay dev_err(hdev->dev, "CPUCP array data is too big\n"); 850e65e175bSOded Gabbay return -EINVAL; 851e65e175bSOded Gabbay } 852e65e175bSOded Gabbay 853e65e175bSOded Gabbay pkt = kzalloc(total_pkt_size, GFP_KERNEL); 854e65e175bSOded Gabbay if (!pkt) 855e65e175bSOded Gabbay return -ENOMEM; 856e65e175bSOded Gabbay 857e65e175bSOded Gabbay pkt->length = cpu_to_le32(CPUCP_NUM_OF_MSI_TYPES); 858e65e175bSOded Gabbay 859e65e175bSOded Gabbay memset((void *) &pkt->data, 0xFF, data_size); 860e65e175bSOded Gabbay hdev->asic_funcs->get_msi_info(pkt->data); 861e65e175bSOded Gabbay 862e65e175bSOded Gabbay pkt->cpucp_pkt.ctl = cpu_to_le32(CPUCP_PACKET_MSI_INFO_SET << 863e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 864e65e175bSOded Gabbay 865e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *)pkt, 866e65e175bSOded Gabbay total_pkt_size, 0, &result); 867e65e175bSOded Gabbay 868e65e175bSOded Gabbay /* 869e65e175bSOded Gabbay * in case packet result is invalid it means that FW does not support 870e65e175bSOded Gabbay * this feature and will use default/hard coded MSI values. no reason 871e65e175bSOded Gabbay * to stop the boot 872e65e175bSOded Gabbay */ 873e65e175bSOded Gabbay if (rc && result == cpucp_packet_invalid) 874e65e175bSOded Gabbay rc = 0; 875e65e175bSOded Gabbay 876e65e175bSOded Gabbay if (rc) 877e65e175bSOded Gabbay dev_err(hdev->dev, "failed to send CPUCP array data\n"); 878e65e175bSOded Gabbay 879e65e175bSOded Gabbay kfree(pkt); 880e65e175bSOded Gabbay 881e65e175bSOded Gabbay return rc; 882e65e175bSOded Gabbay } 883e65e175bSOded Gabbay 884e65e175bSOded Gabbay int hl_fw_cpucp_handshake(struct hl_device *hdev, 885e65e175bSOded Gabbay u32 sts_boot_dev_sts0_reg, 886e65e175bSOded Gabbay u32 sts_boot_dev_sts1_reg, u32 boot_err0_reg, 887e65e175bSOded Gabbay u32 boot_err1_reg) 888e65e175bSOded Gabbay { 889e65e175bSOded Gabbay int rc; 890e65e175bSOded Gabbay 891e65e175bSOded Gabbay rc = hl_fw_cpucp_info_get(hdev, sts_boot_dev_sts0_reg, 892e65e175bSOded Gabbay sts_boot_dev_sts1_reg, boot_err0_reg, 893e65e175bSOded Gabbay boot_err1_reg); 894e65e175bSOded Gabbay if (rc) 895e65e175bSOded Gabbay return rc; 896e65e175bSOded Gabbay 897e65e175bSOded Gabbay return hl_fw_send_msi_info_msg(hdev); 898e65e175bSOded Gabbay } 899e65e175bSOded Gabbay 900e65e175bSOded Gabbay int hl_fw_get_eeprom_data(struct hl_device *hdev, void *data, size_t max_size) 901e65e175bSOded Gabbay { 902e65e175bSOded Gabbay struct cpucp_packet pkt = {}; 903e65e175bSOded Gabbay void *eeprom_info_cpu_addr; 904e65e175bSOded Gabbay dma_addr_t eeprom_info_dma_addr; 905e65e175bSOded Gabbay u64 result; 906e65e175bSOded Gabbay int rc; 907e65e175bSOded Gabbay 908e65e175bSOded Gabbay eeprom_info_cpu_addr = hl_cpu_accessible_dma_pool_alloc(hdev, max_size, 909e65e175bSOded Gabbay &eeprom_info_dma_addr); 910e65e175bSOded Gabbay if (!eeprom_info_cpu_addr) { 911e65e175bSOded Gabbay dev_err(hdev->dev, 912e65e175bSOded Gabbay "Failed to allocate DMA memory for CPU-CP EEPROM packet\n"); 913e65e175bSOded Gabbay return -ENOMEM; 914e65e175bSOded Gabbay } 915e65e175bSOded Gabbay 916e65e175bSOded Gabbay memset(eeprom_info_cpu_addr, 0, max_size); 917e65e175bSOded Gabbay 918e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_EEPROM_DATA_GET << 919e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 920e65e175bSOded Gabbay pkt.addr = cpu_to_le64(eeprom_info_dma_addr); 921e65e175bSOded Gabbay pkt.data_max_size = cpu_to_le32(max_size); 922e65e175bSOded Gabbay 923e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 924e65e175bSOded Gabbay HL_CPUCP_EEPROM_TIMEOUT_USEC, &result); 925e65e175bSOded Gabbay 926e65e175bSOded Gabbay if (rc) { 927e65e175bSOded Gabbay dev_err(hdev->dev, 928e65e175bSOded Gabbay "Failed to handle CPU-CP EEPROM packet, error %d\n", 929e65e175bSOded Gabbay rc); 930e65e175bSOded Gabbay goto out; 931e65e175bSOded Gabbay } 932e65e175bSOded Gabbay 933e65e175bSOded Gabbay /* result contains the actual size */ 934e65e175bSOded Gabbay memcpy(data, eeprom_info_cpu_addr, min((size_t)result, max_size)); 935e65e175bSOded Gabbay 936e65e175bSOded Gabbay out: 937e65e175bSOded Gabbay hl_cpu_accessible_dma_pool_free(hdev, max_size, eeprom_info_cpu_addr); 938e65e175bSOded Gabbay 939e65e175bSOded Gabbay return rc; 940e65e175bSOded Gabbay } 941e65e175bSOded Gabbay 942e65e175bSOded Gabbay int hl_fw_get_monitor_dump(struct hl_device *hdev, void *data) 943e65e175bSOded Gabbay { 944e65e175bSOded Gabbay struct cpucp_monitor_dump *mon_dump_cpu_addr; 945e65e175bSOded Gabbay dma_addr_t mon_dump_dma_addr; 946e65e175bSOded Gabbay struct cpucp_packet pkt = {}; 947e65e175bSOded Gabbay size_t data_size; 948e65e175bSOded Gabbay __le32 *src_ptr; 949e65e175bSOded Gabbay u32 *dst_ptr; 950e65e175bSOded Gabbay u64 result; 951e65e175bSOded Gabbay int i, rc; 952e65e175bSOded Gabbay 953e65e175bSOded Gabbay data_size = sizeof(struct cpucp_monitor_dump); 954e65e175bSOded Gabbay mon_dump_cpu_addr = hl_cpu_accessible_dma_pool_alloc(hdev, data_size, &mon_dump_dma_addr); 955e65e175bSOded Gabbay if (!mon_dump_cpu_addr) { 956e65e175bSOded Gabbay dev_err(hdev->dev, 957e65e175bSOded Gabbay "Failed to allocate DMA memory for CPU-CP monitor-dump packet\n"); 958e65e175bSOded Gabbay return -ENOMEM; 959e65e175bSOded Gabbay } 960e65e175bSOded Gabbay 961e65e175bSOded Gabbay memset(mon_dump_cpu_addr, 0, data_size); 962e65e175bSOded Gabbay 963e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_MONITOR_DUMP_GET << CPUCP_PKT_CTL_OPCODE_SHIFT); 964e65e175bSOded Gabbay pkt.addr = cpu_to_le64(mon_dump_dma_addr); 965e65e175bSOded Gabbay pkt.data_max_size = cpu_to_le32(data_size); 966e65e175bSOded Gabbay 967e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 968e65e175bSOded Gabbay HL_CPUCP_MON_DUMP_TIMEOUT_USEC, &result); 969e65e175bSOded Gabbay if (rc) { 970e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to handle CPU-CP monitor-dump packet, error %d\n", rc); 971e65e175bSOded Gabbay goto out; 972e65e175bSOded Gabbay } 973e65e175bSOded Gabbay 974e65e175bSOded Gabbay /* result contains the actual size */ 975e65e175bSOded Gabbay src_ptr = (__le32 *) mon_dump_cpu_addr; 976e65e175bSOded Gabbay dst_ptr = data; 977e65e175bSOded Gabbay for (i = 0; i < (data_size / sizeof(u32)); i++) { 978e65e175bSOded Gabbay *dst_ptr = le32_to_cpu(*src_ptr); 979e65e175bSOded Gabbay src_ptr++; 980e65e175bSOded Gabbay dst_ptr++; 981e65e175bSOded Gabbay } 982e65e175bSOded Gabbay 983e65e175bSOded Gabbay out: 984e65e175bSOded Gabbay hl_cpu_accessible_dma_pool_free(hdev, data_size, mon_dump_cpu_addr); 985e65e175bSOded Gabbay 986e65e175bSOded Gabbay return rc; 987e65e175bSOded Gabbay } 988e65e175bSOded Gabbay 989e65e175bSOded Gabbay int hl_fw_cpucp_pci_counters_get(struct hl_device *hdev, 990e65e175bSOded Gabbay struct hl_info_pci_counters *counters) 991e65e175bSOded Gabbay { 992e65e175bSOded Gabbay struct cpucp_packet pkt = {}; 993e65e175bSOded Gabbay u64 result; 994e65e175bSOded Gabbay int rc; 995e65e175bSOded Gabbay 996e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_PCIE_THROUGHPUT_GET << 997e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 998e65e175bSOded Gabbay 999e65e175bSOded Gabbay /* Fetch PCI rx counter */ 1000e65e175bSOded Gabbay pkt.index = cpu_to_le32(cpucp_pcie_throughput_rx); 1001e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 1002e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 1003e65e175bSOded Gabbay if (rc) { 1004e65e175bSOded Gabbay dev_err(hdev->dev, 1005e65e175bSOded Gabbay "Failed to handle CPU-CP PCI info pkt, error %d\n", rc); 1006e65e175bSOded Gabbay return rc; 1007e65e175bSOded Gabbay } 1008e65e175bSOded Gabbay counters->rx_throughput = result; 1009e65e175bSOded Gabbay 1010e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 1011e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_PCIE_THROUGHPUT_GET << 1012e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 1013e65e175bSOded Gabbay 1014e65e175bSOded Gabbay /* Fetch PCI tx counter */ 1015e65e175bSOded Gabbay pkt.index = cpu_to_le32(cpucp_pcie_throughput_tx); 1016e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 1017e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 1018e65e175bSOded Gabbay if (rc) { 1019e65e175bSOded Gabbay dev_err(hdev->dev, 1020e65e175bSOded Gabbay "Failed to handle CPU-CP PCI info pkt, error %d\n", rc); 1021e65e175bSOded Gabbay return rc; 1022e65e175bSOded Gabbay } 1023e65e175bSOded Gabbay counters->tx_throughput = result; 1024e65e175bSOded Gabbay 1025e65e175bSOded Gabbay /* Fetch PCI replay counter */ 1026e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 1027e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_PCIE_REPLAY_CNT_GET << 1028e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 1029e65e175bSOded Gabbay 1030e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 1031e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 1032e65e175bSOded Gabbay if (rc) { 1033e65e175bSOded Gabbay dev_err(hdev->dev, 1034e65e175bSOded Gabbay "Failed to handle CPU-CP PCI info pkt, error %d\n", rc); 1035e65e175bSOded Gabbay return rc; 1036e65e175bSOded Gabbay } 1037e65e175bSOded Gabbay counters->replay_cnt = (u32) result; 1038e65e175bSOded Gabbay 1039e65e175bSOded Gabbay return rc; 1040e65e175bSOded Gabbay } 1041e65e175bSOded Gabbay 1042e65e175bSOded Gabbay int hl_fw_cpucp_total_energy_get(struct hl_device *hdev, u64 *total_energy) 1043e65e175bSOded Gabbay { 1044e65e175bSOded Gabbay struct cpucp_packet pkt = {}; 1045e65e175bSOded Gabbay u64 result; 1046e65e175bSOded Gabbay int rc; 1047e65e175bSOded Gabbay 1048e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_TOTAL_ENERGY_GET << 1049e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 1050e65e175bSOded Gabbay 1051e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 1052e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 1053e65e175bSOded Gabbay if (rc) { 1054e65e175bSOded Gabbay dev_err(hdev->dev, 1055e65e175bSOded Gabbay "Failed to handle CpuCP total energy pkt, error %d\n", 1056e65e175bSOded Gabbay rc); 1057e65e175bSOded Gabbay return rc; 1058e65e175bSOded Gabbay } 1059e65e175bSOded Gabbay 1060e65e175bSOded Gabbay *total_energy = result; 1061e65e175bSOded Gabbay 1062e65e175bSOded Gabbay return rc; 1063e65e175bSOded Gabbay } 1064e65e175bSOded Gabbay 1065e65e175bSOded Gabbay int get_used_pll_index(struct hl_device *hdev, u32 input_pll_index, 1066e65e175bSOded Gabbay enum pll_index *pll_index) 1067e65e175bSOded Gabbay { 1068e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 1069e65e175bSOded Gabbay u8 pll_byte, pll_bit_off; 1070e65e175bSOded Gabbay bool dynamic_pll; 1071e65e175bSOded Gabbay int fw_pll_idx; 1072e65e175bSOded Gabbay 1073e65e175bSOded Gabbay dynamic_pll = !!(prop->fw_app_cpu_boot_dev_sts0 & 1074e65e175bSOded Gabbay CPU_BOOT_DEV_STS0_DYN_PLL_EN); 1075e65e175bSOded Gabbay 1076e65e175bSOded Gabbay if (!dynamic_pll) { 1077e65e175bSOded Gabbay /* 1078e65e175bSOded Gabbay * in case we are working with legacy FW (each asic has unique 1079e65e175bSOded Gabbay * PLL numbering) use the driver based index as they are 1080e65e175bSOded Gabbay * aligned with fw legacy numbering 1081e65e175bSOded Gabbay */ 1082e65e175bSOded Gabbay *pll_index = input_pll_index; 1083e65e175bSOded Gabbay return 0; 1084e65e175bSOded Gabbay } 1085e65e175bSOded Gabbay 1086e65e175bSOded Gabbay /* retrieve a FW compatible PLL index based on 1087e65e175bSOded Gabbay * ASIC specific user request 1088e65e175bSOded Gabbay */ 1089e65e175bSOded Gabbay fw_pll_idx = hdev->asic_funcs->map_pll_idx_to_fw_idx(input_pll_index); 1090e65e175bSOded Gabbay if (fw_pll_idx < 0) { 1091e65e175bSOded Gabbay dev_err(hdev->dev, "Invalid PLL index (%u) error %d\n", 1092e65e175bSOded Gabbay input_pll_index, fw_pll_idx); 1093e65e175bSOded Gabbay return -EINVAL; 1094e65e175bSOded Gabbay } 1095e65e175bSOded Gabbay 1096e65e175bSOded Gabbay /* PLL map is a u8 array */ 1097e65e175bSOded Gabbay pll_byte = prop->cpucp_info.pll_map[fw_pll_idx >> 3]; 1098e65e175bSOded Gabbay pll_bit_off = fw_pll_idx & 0x7; 1099e65e175bSOded Gabbay 1100e65e175bSOded Gabbay if (!(pll_byte & BIT(pll_bit_off))) { 1101e65e175bSOded Gabbay dev_err(hdev->dev, "PLL index %d is not supported\n", 1102e65e175bSOded Gabbay fw_pll_idx); 1103e65e175bSOded Gabbay return -EINVAL; 1104e65e175bSOded Gabbay } 1105e65e175bSOded Gabbay 1106e65e175bSOded Gabbay *pll_index = fw_pll_idx; 1107e65e175bSOded Gabbay 1108e65e175bSOded Gabbay return 0; 1109e65e175bSOded Gabbay } 1110e65e175bSOded Gabbay 1111e65e175bSOded Gabbay int hl_fw_cpucp_pll_info_get(struct hl_device *hdev, u32 pll_index, 1112e65e175bSOded Gabbay u16 *pll_freq_arr) 1113e65e175bSOded Gabbay { 1114e65e175bSOded Gabbay struct cpucp_packet pkt; 1115e65e175bSOded Gabbay enum pll_index used_pll_idx; 1116e65e175bSOded Gabbay u64 result; 1117e65e175bSOded Gabbay int rc; 1118e65e175bSOded Gabbay 1119e65e175bSOded Gabbay rc = get_used_pll_index(hdev, pll_index, &used_pll_idx); 1120e65e175bSOded Gabbay if (rc) 1121e65e175bSOded Gabbay return rc; 1122e65e175bSOded Gabbay 1123e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 1124e65e175bSOded Gabbay 1125e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_PLL_INFO_GET << 1126e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 1127e65e175bSOded Gabbay pkt.pll_type = __cpu_to_le16((u16)used_pll_idx); 1128e65e175bSOded Gabbay 1129e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 1130e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 1131e65e175bSOded Gabbay if (rc) { 1132e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to read PLL info, error %d\n", rc); 1133e65e175bSOded Gabbay return rc; 1134e65e175bSOded Gabbay } 1135e65e175bSOded Gabbay 1136e65e175bSOded Gabbay pll_freq_arr[0] = FIELD_GET(CPUCP_PKT_RES_PLL_OUT0_MASK, result); 1137e65e175bSOded Gabbay pll_freq_arr[1] = FIELD_GET(CPUCP_PKT_RES_PLL_OUT1_MASK, result); 1138e65e175bSOded Gabbay pll_freq_arr[2] = FIELD_GET(CPUCP_PKT_RES_PLL_OUT2_MASK, result); 1139e65e175bSOded Gabbay pll_freq_arr[3] = FIELD_GET(CPUCP_PKT_RES_PLL_OUT3_MASK, result); 1140e65e175bSOded Gabbay 1141e65e175bSOded Gabbay return 0; 1142e65e175bSOded Gabbay } 1143e65e175bSOded Gabbay 1144e65e175bSOded Gabbay int hl_fw_cpucp_power_get(struct hl_device *hdev, u64 *power) 1145e65e175bSOded Gabbay { 1146e65e175bSOded Gabbay struct cpucp_packet pkt; 1147e65e175bSOded Gabbay u64 result; 1148e65e175bSOded Gabbay int rc; 1149e65e175bSOded Gabbay 1150e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 1151e65e175bSOded Gabbay 1152e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_POWER_GET << 1153e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 1154e65e175bSOded Gabbay pkt.type = cpu_to_le16(CPUCP_POWER_INPUT); 1155e65e175bSOded Gabbay 1156e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 1157e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 1158e65e175bSOded Gabbay if (rc) { 1159e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to read power, error %d\n", rc); 1160e65e175bSOded Gabbay return rc; 1161e65e175bSOded Gabbay } 1162e65e175bSOded Gabbay 1163e65e175bSOded Gabbay *power = result; 1164e65e175bSOded Gabbay 1165e65e175bSOded Gabbay return rc; 1166e65e175bSOded Gabbay } 1167e65e175bSOded Gabbay 1168e65e175bSOded Gabbay int hl_fw_dram_replaced_row_get(struct hl_device *hdev, 1169e65e175bSOded Gabbay struct cpucp_hbm_row_info *info) 1170e65e175bSOded Gabbay { 1171e65e175bSOded Gabbay struct cpucp_hbm_row_info *cpucp_repl_rows_info_cpu_addr; 1172e65e175bSOded Gabbay dma_addr_t cpucp_repl_rows_info_dma_addr; 1173e65e175bSOded Gabbay struct cpucp_packet pkt = {}; 1174e65e175bSOded Gabbay u64 result; 1175e65e175bSOded Gabbay int rc; 1176e65e175bSOded Gabbay 1177e65e175bSOded Gabbay cpucp_repl_rows_info_cpu_addr = hl_cpu_accessible_dma_pool_alloc(hdev, 1178e65e175bSOded Gabbay sizeof(struct cpucp_hbm_row_info), 1179e65e175bSOded Gabbay &cpucp_repl_rows_info_dma_addr); 1180e65e175bSOded Gabbay if (!cpucp_repl_rows_info_cpu_addr) { 1181e65e175bSOded Gabbay dev_err(hdev->dev, 1182e65e175bSOded Gabbay "Failed to allocate DMA memory for CPU-CP replaced rows info packet\n"); 1183e65e175bSOded Gabbay return -ENOMEM; 1184e65e175bSOded Gabbay } 1185e65e175bSOded Gabbay 1186e65e175bSOded Gabbay memset(cpucp_repl_rows_info_cpu_addr, 0, sizeof(struct cpucp_hbm_row_info)); 1187e65e175bSOded Gabbay 1188e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_HBM_REPLACED_ROWS_INFO_GET << 1189e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 1190e65e175bSOded Gabbay pkt.addr = cpu_to_le64(cpucp_repl_rows_info_dma_addr); 1191e65e175bSOded Gabbay pkt.data_max_size = cpu_to_le32(sizeof(struct cpucp_hbm_row_info)); 1192e65e175bSOded Gabbay 1193e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 1194e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 1195e65e175bSOded Gabbay if (rc) { 1196e65e175bSOded Gabbay dev_err(hdev->dev, 1197e65e175bSOded Gabbay "Failed to handle CPU-CP replaced rows info pkt, error %d\n", rc); 1198e65e175bSOded Gabbay goto out; 1199e65e175bSOded Gabbay } 1200e65e175bSOded Gabbay 1201e65e175bSOded Gabbay memcpy(info, cpucp_repl_rows_info_cpu_addr, sizeof(*info)); 1202e65e175bSOded Gabbay 1203e65e175bSOded Gabbay out: 1204e65e175bSOded Gabbay hl_cpu_accessible_dma_pool_free(hdev, sizeof(struct cpucp_hbm_row_info), 1205e65e175bSOded Gabbay cpucp_repl_rows_info_cpu_addr); 1206e65e175bSOded Gabbay 1207e65e175bSOded Gabbay return rc; 1208e65e175bSOded Gabbay } 1209e65e175bSOded Gabbay 1210e65e175bSOded Gabbay int hl_fw_dram_pending_row_get(struct hl_device *hdev, u32 *pend_rows_num) 1211e65e175bSOded Gabbay { 1212e65e175bSOded Gabbay struct cpucp_packet pkt; 1213e65e175bSOded Gabbay u64 result; 1214e65e175bSOded Gabbay int rc; 1215e65e175bSOded Gabbay 1216e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 1217e65e175bSOded Gabbay 1218e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_HBM_PENDING_ROWS_STATUS << CPUCP_PKT_CTL_OPCODE_SHIFT); 1219e65e175bSOded Gabbay 1220e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 0, &result); 1221e65e175bSOded Gabbay if (rc) { 1222e65e175bSOded Gabbay dev_err(hdev->dev, 1223e65e175bSOded Gabbay "Failed to handle CPU-CP pending rows info pkt, error %d\n", rc); 1224e65e175bSOded Gabbay goto out; 1225e65e175bSOded Gabbay } 1226e65e175bSOded Gabbay 1227e65e175bSOded Gabbay *pend_rows_num = (u32) result; 1228e65e175bSOded Gabbay out: 1229e65e175bSOded Gabbay return rc; 1230e65e175bSOded Gabbay } 1231e65e175bSOded Gabbay 1232e65e175bSOded Gabbay int hl_fw_cpucp_engine_core_asid_set(struct hl_device *hdev, u32 asid) 1233e65e175bSOded Gabbay { 1234e65e175bSOded Gabbay struct cpucp_packet pkt; 1235e65e175bSOded Gabbay int rc; 1236e65e175bSOded Gabbay 1237e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 1238e65e175bSOded Gabbay 1239e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_ENGINE_CORE_ASID_SET << CPUCP_PKT_CTL_OPCODE_SHIFT); 1240e65e175bSOded Gabbay pkt.value = cpu_to_le64(asid); 1241e65e175bSOded Gabbay 1242e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 1243e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, NULL); 1244e65e175bSOded Gabbay if (rc) 1245e65e175bSOded Gabbay dev_err(hdev->dev, 1246e65e175bSOded Gabbay "Failed on ASID configuration request for engine core, error %d\n", 1247e65e175bSOded Gabbay rc); 1248e65e175bSOded Gabbay 1249e65e175bSOded Gabbay return rc; 1250e65e175bSOded Gabbay } 1251e65e175bSOded Gabbay 1252e65e175bSOded Gabbay void hl_fw_ask_hard_reset_without_linux(struct hl_device *hdev) 1253e65e175bSOded Gabbay { 1254e65e175bSOded Gabbay struct static_fw_load_mgr *static_loader = 1255e65e175bSOded Gabbay &hdev->fw_loader.static_loader; 1256e65e175bSOded Gabbay int rc; 1257e65e175bSOded Gabbay 1258e65e175bSOded Gabbay if (hdev->asic_prop.dynamic_fw_load) { 1259e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, &hdev->fw_loader, 1260e65e175bSOded Gabbay COMMS_RST_DEV, 0, false, 1261e65e175bSOded Gabbay hdev->fw_loader.cpu_timeout); 1262e65e175bSOded Gabbay if (rc) 12639d7fef7cSKoby Elbaz dev_err(hdev->dev, "Failed sending COMMS_RST_DEV\n"); 1264e65e175bSOded Gabbay } else { 1265e65e175bSOded Gabbay WREG32(static_loader->kmd_msg_to_cpu_reg, KMD_MSG_RST_DEV); 1266e65e175bSOded Gabbay } 1267e65e175bSOded Gabbay } 1268e65e175bSOded Gabbay 1269e65e175bSOded Gabbay void hl_fw_ask_halt_machine_without_linux(struct hl_device *hdev) 1270e65e175bSOded Gabbay { 1271e65e175bSOded Gabbay struct static_fw_load_mgr *static_loader = 1272e65e175bSOded Gabbay &hdev->fw_loader.static_loader; 1273e65e175bSOded Gabbay int rc; 1274e65e175bSOded Gabbay 1275e65e175bSOded Gabbay if (hdev->device_cpu_is_halted) 1276e65e175bSOded Gabbay return; 1277e65e175bSOded Gabbay 1278e65e175bSOded Gabbay /* Stop device CPU to make sure nothing bad happens */ 1279e65e175bSOded Gabbay if (hdev->asic_prop.dynamic_fw_load) { 1280e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, &hdev->fw_loader, 1281e65e175bSOded Gabbay COMMS_GOTO_WFE, 0, true, 1282e65e175bSOded Gabbay hdev->fw_loader.cpu_timeout); 1283e65e175bSOded Gabbay if (rc) 12849d7fef7cSKoby Elbaz dev_err(hdev->dev, "Failed sending COMMS_GOTO_WFE\n"); 1285e65e175bSOded Gabbay } else { 1286e65e175bSOded Gabbay WREG32(static_loader->kmd_msg_to_cpu_reg, KMD_MSG_GOTO_WFE); 1287e65e175bSOded Gabbay msleep(static_loader->cpu_reset_wait_msec); 1288e65e175bSOded Gabbay 1289e65e175bSOded Gabbay /* Must clear this register in order to prevent preboot 1290e65e175bSOded Gabbay * from reading WFE after reboot 1291e65e175bSOded Gabbay */ 1292e65e175bSOded Gabbay WREG32(static_loader->kmd_msg_to_cpu_reg, KMD_MSG_NA); 1293e65e175bSOded Gabbay } 1294e65e175bSOded Gabbay 1295e65e175bSOded Gabbay hdev->device_cpu_is_halted = true; 1296e65e175bSOded Gabbay } 1297e65e175bSOded Gabbay 1298e65e175bSOded Gabbay static void detect_cpu_boot_status(struct hl_device *hdev, u32 status) 1299e65e175bSOded Gabbay { 1300e65e175bSOded Gabbay /* Some of the status codes below are deprecated in newer f/w 1301e65e175bSOded Gabbay * versions but we keep them here for backward compatibility 1302e65e175bSOded Gabbay */ 1303e65e175bSOded Gabbay switch (status) { 1304e65e175bSOded Gabbay case CPU_BOOT_STATUS_NA: 1305e65e175bSOded Gabbay dev_err(hdev->dev, 1306e65e175bSOded Gabbay "Device boot progress - BTL/ROM did NOT run\n"); 1307e65e175bSOded Gabbay break; 1308e65e175bSOded Gabbay case CPU_BOOT_STATUS_IN_WFE: 1309e65e175bSOded Gabbay dev_err(hdev->dev, 1310e65e175bSOded Gabbay "Device boot progress - Stuck inside WFE loop\n"); 1311e65e175bSOded Gabbay break; 1312e65e175bSOded Gabbay case CPU_BOOT_STATUS_IN_BTL: 1313e65e175bSOded Gabbay dev_err(hdev->dev, 1314e65e175bSOded Gabbay "Device boot progress - Stuck in BTL\n"); 1315e65e175bSOded Gabbay break; 1316e65e175bSOded Gabbay case CPU_BOOT_STATUS_IN_PREBOOT: 1317e65e175bSOded Gabbay dev_err(hdev->dev, 1318e65e175bSOded Gabbay "Device boot progress - Stuck in Preboot\n"); 1319e65e175bSOded Gabbay break; 1320e65e175bSOded Gabbay case CPU_BOOT_STATUS_IN_SPL: 1321e65e175bSOded Gabbay dev_err(hdev->dev, 1322e65e175bSOded Gabbay "Device boot progress - Stuck in SPL\n"); 1323e65e175bSOded Gabbay break; 1324e65e175bSOded Gabbay case CPU_BOOT_STATUS_IN_UBOOT: 1325e65e175bSOded Gabbay dev_err(hdev->dev, 1326e65e175bSOded Gabbay "Device boot progress - Stuck in u-boot\n"); 1327e65e175bSOded Gabbay break; 1328e65e175bSOded Gabbay case CPU_BOOT_STATUS_DRAM_INIT_FAIL: 1329e65e175bSOded Gabbay dev_err(hdev->dev, 1330e65e175bSOded Gabbay "Device boot progress - DRAM initialization failed\n"); 1331e65e175bSOded Gabbay break; 1332e65e175bSOded Gabbay case CPU_BOOT_STATUS_UBOOT_NOT_READY: 1333e65e175bSOded Gabbay dev_err(hdev->dev, 1334e65e175bSOded Gabbay "Device boot progress - Cannot boot\n"); 1335e65e175bSOded Gabbay break; 1336e65e175bSOded Gabbay case CPU_BOOT_STATUS_TS_INIT_FAIL: 1337e65e175bSOded Gabbay dev_err(hdev->dev, 1338e65e175bSOded Gabbay "Device boot progress - Thermal Sensor initialization failed\n"); 1339e65e175bSOded Gabbay break; 1340e65e175bSOded Gabbay case CPU_BOOT_STATUS_SECURITY_READY: 1341e65e175bSOded Gabbay dev_err(hdev->dev, 1342e65e175bSOded Gabbay "Device boot progress - Stuck in preboot after security initialization\n"); 1343e65e175bSOded Gabbay break; 1344e65e175bSOded Gabbay default: 1345e65e175bSOded Gabbay dev_err(hdev->dev, 1346eba773d3SMoti Haimovski "Device boot progress - Invalid or unexpected status code %d\n", status); 1347e65e175bSOded Gabbay break; 1348e65e175bSOded Gabbay } 1349e65e175bSOded Gabbay } 1350e65e175bSOded Gabbay 1351e65e175bSOded Gabbay int hl_fw_wait_preboot_ready(struct hl_device *hdev) 1352e65e175bSOded Gabbay { 1353e65e175bSOded Gabbay struct pre_fw_load_props *pre_fw_load = &hdev->fw_loader.pre_fw_load; 1354e65e175bSOded Gabbay u32 status; 1355e65e175bSOded Gabbay int rc; 1356e65e175bSOded Gabbay 1357e65e175bSOded Gabbay /* Need to check two possible scenarios: 1358e65e175bSOded Gabbay * 1359e65e175bSOded Gabbay * CPU_BOOT_STATUS_WAITING_FOR_BOOT_FIT - for newer firmwares where 1360e65e175bSOded Gabbay * the preboot is waiting for the boot fit 1361e65e175bSOded Gabbay * 1362e65e175bSOded Gabbay * All other status values - for older firmwares where the uboot was 1363e65e175bSOded Gabbay * loaded from the FLASH 1364e65e175bSOded Gabbay */ 1365e65e175bSOded Gabbay rc = hl_poll_timeout( 1366e65e175bSOded Gabbay hdev, 1367e65e175bSOded Gabbay pre_fw_load->cpu_boot_status_reg, 1368e65e175bSOded Gabbay status, 1369e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_NIC_FW_RDY) || 1370e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_READY_TO_BOOT) || 1371e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_WAITING_FOR_BOOT_FIT), 1372e65e175bSOded Gabbay hdev->fw_poll_interval_usec, 1373e65e175bSOded Gabbay pre_fw_load->wait_for_preboot_timeout); 1374e65e175bSOded Gabbay 1375e65e175bSOded Gabbay if (rc) { 1376e65e175bSOded Gabbay detect_cpu_boot_status(hdev, status); 1377eba773d3SMoti Haimovski dev_err(hdev->dev, "CPU boot ready timeout (status = %d)\n", status); 1378e65e175bSOded Gabbay 1379e65e175bSOded Gabbay /* If we read all FF, then something is totally wrong, no point 1380e65e175bSOded Gabbay * of reading specific errors 1381e65e175bSOded Gabbay */ 1382e65e175bSOded Gabbay if (status != -1) 1383e65e175bSOded Gabbay fw_read_errors(hdev, pre_fw_load->boot_err0_reg, 1384e65e175bSOded Gabbay pre_fw_load->boot_err1_reg, 1385e65e175bSOded Gabbay pre_fw_load->sts_boot_dev_sts0_reg, 1386e65e175bSOded Gabbay pre_fw_load->sts_boot_dev_sts1_reg); 1387e65e175bSOded Gabbay return -EIO; 1388e65e175bSOded Gabbay } 1389e65e175bSOded Gabbay 1390e65e175bSOded Gabbay hdev->fw_loader.fw_comp_loaded |= FW_TYPE_PREBOOT_CPU; 1391e65e175bSOded Gabbay 1392e65e175bSOded Gabbay return 0; 1393e65e175bSOded Gabbay } 1394e65e175bSOded Gabbay 1395e65e175bSOded Gabbay static int hl_fw_read_preboot_caps(struct hl_device *hdev) 1396e65e175bSOded Gabbay { 1397e65e175bSOded Gabbay struct pre_fw_load_props *pre_fw_load; 1398e65e175bSOded Gabbay struct asic_fixed_properties *prop; 1399e65e175bSOded Gabbay u32 reg_val; 1400e65e175bSOded Gabbay int rc; 1401e65e175bSOded Gabbay 1402e65e175bSOded Gabbay prop = &hdev->asic_prop; 1403e65e175bSOded Gabbay pre_fw_load = &hdev->fw_loader.pre_fw_load; 1404e65e175bSOded Gabbay 1405e65e175bSOded Gabbay rc = hl_fw_wait_preboot_ready(hdev); 1406e65e175bSOded Gabbay if (rc) 1407e65e175bSOded Gabbay return rc; 1408e65e175bSOded Gabbay 1409e65e175bSOded Gabbay /* 1410e65e175bSOded Gabbay * the registers DEV_STS* contain FW capabilities/features. 1411e65e175bSOded Gabbay * We can rely on this registers only if bit CPU_BOOT_DEV_STS*_ENABLED 1412e65e175bSOded Gabbay * is set. 1413e65e175bSOded Gabbay * In the first read of this register we store the value of this 1414e65e175bSOded Gabbay * register ONLY if the register is enabled (which will be propagated 1415e65e175bSOded Gabbay * to next stages) and also mark the register as valid. 1416e65e175bSOded Gabbay * In case it is not enabled the stored value will be left 0- all 1417e65e175bSOded Gabbay * caps/features are off 1418e65e175bSOded Gabbay */ 1419e65e175bSOded Gabbay reg_val = RREG32(pre_fw_load->sts_boot_dev_sts0_reg); 1420e65e175bSOded Gabbay if (reg_val & CPU_BOOT_DEV_STS0_ENABLED) { 1421e65e175bSOded Gabbay prop->fw_cpu_boot_dev_sts0_valid = true; 1422e65e175bSOded Gabbay prop->fw_preboot_cpu_boot_dev_sts0 = reg_val; 1423e65e175bSOded Gabbay } 1424e65e175bSOded Gabbay 1425e65e175bSOded Gabbay reg_val = RREG32(pre_fw_load->sts_boot_dev_sts1_reg); 1426e65e175bSOded Gabbay if (reg_val & CPU_BOOT_DEV_STS1_ENABLED) { 1427e65e175bSOded Gabbay prop->fw_cpu_boot_dev_sts1_valid = true; 1428e65e175bSOded Gabbay prop->fw_preboot_cpu_boot_dev_sts1 = reg_val; 1429e65e175bSOded Gabbay } 1430e65e175bSOded Gabbay 1431e65e175bSOded Gabbay prop->dynamic_fw_load = !!(prop->fw_preboot_cpu_boot_dev_sts0 & 1432e65e175bSOded Gabbay CPU_BOOT_DEV_STS0_FW_LD_COM_EN); 1433e65e175bSOded Gabbay 1434e65e175bSOded Gabbay /* initialize FW loader once we know what load protocol is used */ 1435e65e175bSOded Gabbay hdev->asic_funcs->init_firmware_loader(hdev); 1436e65e175bSOded Gabbay 1437e65e175bSOded Gabbay dev_dbg(hdev->dev, "Attempting %s FW load\n", 1438e65e175bSOded Gabbay prop->dynamic_fw_load ? "dynamic" : "legacy"); 1439e65e175bSOded Gabbay return 0; 1440e65e175bSOded Gabbay } 1441e65e175bSOded Gabbay 1442e65e175bSOded Gabbay static int hl_fw_static_read_device_fw_version(struct hl_device *hdev, 1443e65e175bSOded Gabbay enum hl_fw_component fwc) 1444e65e175bSOded Gabbay { 1445e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 1446e65e175bSOded Gabbay struct fw_load_mgr *fw_loader = &hdev->fw_loader; 1447e65e175bSOded Gabbay struct static_fw_load_mgr *static_loader; 1448e65e175bSOded Gabbay char *dest, *boot_ver, *preboot_ver; 1449e65e175bSOded Gabbay u32 ver_off, limit; 1450e65e175bSOded Gabbay const char *name; 1451e65e175bSOded Gabbay char btl_ver[32]; 1452e65e175bSOded Gabbay 1453e65e175bSOded Gabbay static_loader = &hdev->fw_loader.static_loader; 1454e65e175bSOded Gabbay 1455e65e175bSOded Gabbay switch (fwc) { 1456e65e175bSOded Gabbay case FW_COMP_BOOT_FIT: 1457e65e175bSOded Gabbay ver_off = RREG32(static_loader->boot_fit_version_offset_reg); 1458e65e175bSOded Gabbay dest = prop->uboot_ver; 1459e65e175bSOded Gabbay name = "Boot-fit"; 1460e65e175bSOded Gabbay limit = static_loader->boot_fit_version_max_off; 1461e65e175bSOded Gabbay break; 1462e65e175bSOded Gabbay case FW_COMP_PREBOOT: 1463e65e175bSOded Gabbay ver_off = RREG32(static_loader->preboot_version_offset_reg); 1464e65e175bSOded Gabbay dest = prop->preboot_ver; 1465e65e175bSOded Gabbay name = "Preboot"; 1466e65e175bSOded Gabbay limit = static_loader->preboot_version_max_off; 1467e65e175bSOded Gabbay break; 1468e65e175bSOded Gabbay default: 1469e65e175bSOded Gabbay dev_warn(hdev->dev, "Undefined FW component: %d\n", fwc); 1470e65e175bSOded Gabbay return -EIO; 1471e65e175bSOded Gabbay } 1472e65e175bSOded Gabbay 1473e65e175bSOded Gabbay ver_off &= static_loader->sram_offset_mask; 1474e65e175bSOded Gabbay 1475e65e175bSOded Gabbay if (ver_off < limit) { 1476e65e175bSOded Gabbay memcpy_fromio(dest, 1477e65e175bSOded Gabbay hdev->pcie_bar[fw_loader->sram_bar_id] + ver_off, 1478e65e175bSOded Gabbay VERSION_MAX_LEN); 1479e65e175bSOded Gabbay } else { 1480e65e175bSOded Gabbay dev_err(hdev->dev, "%s version offset (0x%x) is above SRAM\n", 1481e65e175bSOded Gabbay name, ver_off); 1482e65e175bSOded Gabbay strscpy(dest, "unavailable", VERSION_MAX_LEN); 1483e65e175bSOded Gabbay return -EIO; 1484e65e175bSOded Gabbay } 1485e65e175bSOded Gabbay 1486e65e175bSOded Gabbay if (fwc == FW_COMP_BOOT_FIT) { 1487e65e175bSOded Gabbay boot_ver = extract_fw_ver_from_str(prop->uboot_ver); 1488e65e175bSOded Gabbay if (boot_ver) { 1489e65e175bSOded Gabbay dev_info(hdev->dev, "boot-fit version %s\n", boot_ver); 1490e65e175bSOded Gabbay kfree(boot_ver); 1491e65e175bSOded Gabbay } 1492e65e175bSOded Gabbay } else if (fwc == FW_COMP_PREBOOT) { 1493e65e175bSOded Gabbay preboot_ver = strnstr(prop->preboot_ver, "Preboot", 1494e65e175bSOded Gabbay VERSION_MAX_LEN); 1495e65e175bSOded Gabbay if (preboot_ver && preboot_ver != prop->preboot_ver) { 1496e65e175bSOded Gabbay strscpy(btl_ver, prop->preboot_ver, 1497e65e175bSOded Gabbay min((int) (preboot_ver - prop->preboot_ver), 1498e65e175bSOded Gabbay 31)); 1499e65e175bSOded Gabbay dev_info(hdev->dev, "%s\n", btl_ver); 1500e65e175bSOded Gabbay } 1501e65e175bSOded Gabbay 1502e65e175bSOded Gabbay preboot_ver = extract_fw_ver_from_str(prop->preboot_ver); 1503e65e175bSOded Gabbay if (preboot_ver) { 1504e65e175bSOded Gabbay dev_info(hdev->dev, "preboot version %s\n", 1505e65e175bSOded Gabbay preboot_ver); 1506e65e175bSOded Gabbay kfree(preboot_ver); 1507e65e175bSOded Gabbay } 1508e65e175bSOded Gabbay } 1509e65e175bSOded Gabbay 1510e65e175bSOded Gabbay return 0; 1511e65e175bSOded Gabbay } 1512e65e175bSOded Gabbay 1513e65e175bSOded Gabbay /** 1514e65e175bSOded Gabbay * hl_fw_preboot_update_state - update internal data structures during 1515e65e175bSOded Gabbay * handshake with preboot 1516e65e175bSOded Gabbay * 1517e65e175bSOded Gabbay * 1518e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1519e65e175bSOded Gabbay * 1520e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 1521e65e175bSOded Gabbay */ 1522e65e175bSOded Gabbay static void hl_fw_preboot_update_state(struct hl_device *hdev) 1523e65e175bSOded Gabbay { 1524e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 1525e65e175bSOded Gabbay u32 cpu_boot_dev_sts0, cpu_boot_dev_sts1; 1526e65e175bSOded Gabbay 1527e65e175bSOded Gabbay cpu_boot_dev_sts0 = prop->fw_preboot_cpu_boot_dev_sts0; 1528e65e175bSOded Gabbay cpu_boot_dev_sts1 = prop->fw_preboot_cpu_boot_dev_sts1; 1529e65e175bSOded Gabbay 1530e65e175bSOded Gabbay /* We read boot_dev_sts registers multiple times during boot: 1531e65e175bSOded Gabbay * 1. preboot - a. Check whether the security status bits are valid 1532e65e175bSOded Gabbay * b. Check whether fw security is enabled 1533e65e175bSOded Gabbay * c. Check whether hard reset is done by preboot 1534e65e175bSOded Gabbay * 2. boot cpu - a. Fetch boot cpu security status 1535e65e175bSOded Gabbay * b. Check whether hard reset is done by boot cpu 1536e65e175bSOded Gabbay * 3. FW application - a. Fetch fw application security status 1537e65e175bSOded Gabbay * b. Check whether hard reset is done by fw app 1538e65e175bSOded Gabbay */ 1539e65e175bSOded Gabbay prop->hard_reset_done_by_fw = !!(cpu_boot_dev_sts0 & CPU_BOOT_DEV_STS0_FW_HARD_RST_EN); 1540e65e175bSOded Gabbay 1541e65e175bSOded Gabbay prop->fw_security_enabled = !!(cpu_boot_dev_sts0 & CPU_BOOT_DEV_STS0_SECURITY_EN); 1542e65e175bSOded Gabbay 1543e65e175bSOded Gabbay dev_dbg(hdev->dev, "Firmware preboot boot device status0 %#x\n", 1544e65e175bSOded Gabbay cpu_boot_dev_sts0); 1545e65e175bSOded Gabbay 1546e65e175bSOded Gabbay dev_dbg(hdev->dev, "Firmware preboot boot device status1 %#x\n", 1547e65e175bSOded Gabbay cpu_boot_dev_sts1); 1548e65e175bSOded Gabbay 1549e65e175bSOded Gabbay dev_dbg(hdev->dev, "Firmware preboot hard-reset is %s\n", 1550e65e175bSOded Gabbay prop->hard_reset_done_by_fw ? "enabled" : "disabled"); 1551e65e175bSOded Gabbay 1552e65e175bSOded Gabbay dev_dbg(hdev->dev, "firmware-level security is %s\n", 1553e65e175bSOded Gabbay prop->fw_security_enabled ? "enabled" : "disabled"); 1554e65e175bSOded Gabbay 1555e65e175bSOded Gabbay dev_dbg(hdev->dev, "GIC controller is %s\n", 1556e65e175bSOded Gabbay prop->gic_interrupts_enable ? "enabled" : "disabled"); 1557e65e175bSOded Gabbay } 1558e65e175bSOded Gabbay 1559e65e175bSOded Gabbay static int hl_fw_static_read_preboot_status(struct hl_device *hdev) 1560e65e175bSOded Gabbay { 1561e65e175bSOded Gabbay int rc; 1562e65e175bSOded Gabbay 1563e65e175bSOded Gabbay rc = hl_fw_static_read_device_fw_version(hdev, FW_COMP_PREBOOT); 1564e65e175bSOded Gabbay if (rc) 1565e65e175bSOded Gabbay return rc; 1566e65e175bSOded Gabbay 1567e65e175bSOded Gabbay return 0; 1568e65e175bSOded Gabbay } 1569e65e175bSOded Gabbay 1570e65e175bSOded Gabbay int hl_fw_read_preboot_status(struct hl_device *hdev) 1571e65e175bSOded Gabbay { 1572e65e175bSOded Gabbay int rc; 1573e65e175bSOded Gabbay 1574e65e175bSOded Gabbay if (!(hdev->fw_components & FW_TYPE_PREBOOT_CPU)) 1575e65e175bSOded Gabbay return 0; 1576e65e175bSOded Gabbay 1577e65e175bSOded Gabbay /* get FW pre-load parameters */ 1578e65e175bSOded Gabbay hdev->asic_funcs->init_firmware_preload_params(hdev); 1579e65e175bSOded Gabbay 1580e65e175bSOded Gabbay /* 1581e65e175bSOded Gabbay * In order to determine boot method (static VS dynamic) we need to 1582e65e175bSOded Gabbay * read the boot caps register 1583e65e175bSOded Gabbay */ 1584e65e175bSOded Gabbay rc = hl_fw_read_preboot_caps(hdev); 1585e65e175bSOded Gabbay if (rc) 1586e65e175bSOded Gabbay return rc; 1587e65e175bSOded Gabbay 1588e65e175bSOded Gabbay hl_fw_preboot_update_state(hdev); 1589e65e175bSOded Gabbay 1590e65e175bSOded Gabbay /* no need to read preboot status in dynamic load */ 1591e65e175bSOded Gabbay if (hdev->asic_prop.dynamic_fw_load) 1592e65e175bSOded Gabbay return 0; 1593e65e175bSOded Gabbay 1594e65e175bSOded Gabbay return hl_fw_static_read_preboot_status(hdev); 1595e65e175bSOded Gabbay } 1596e65e175bSOded Gabbay 1597e65e175bSOded Gabbay /* associate string with COMM status */ 1598e65e175bSOded Gabbay static char *hl_dynamic_fw_status_str[COMMS_STS_INVLD_LAST] = { 1599e65e175bSOded Gabbay [COMMS_STS_NOOP] = "NOOP", 1600e65e175bSOded Gabbay [COMMS_STS_ACK] = "ACK", 1601e65e175bSOded Gabbay [COMMS_STS_OK] = "OK", 1602e65e175bSOded Gabbay [COMMS_STS_ERR] = "ERR", 1603e65e175bSOded Gabbay [COMMS_STS_VALID_ERR] = "VALID_ERR", 1604e65e175bSOded Gabbay [COMMS_STS_TIMEOUT_ERR] = "TIMEOUT_ERR", 1605e65e175bSOded Gabbay }; 1606e65e175bSOded Gabbay 1607e65e175bSOded Gabbay /** 1608e65e175bSOded Gabbay * hl_fw_dynamic_report_error_status - report error status 1609e65e175bSOded Gabbay * 1610e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1611e65e175bSOded Gabbay * @status: value of FW status register 1612e65e175bSOded Gabbay * @expected_status: the expected status 1613e65e175bSOded Gabbay */ 1614e65e175bSOded Gabbay static void hl_fw_dynamic_report_error_status(struct hl_device *hdev, 1615e65e175bSOded Gabbay u32 status, 1616e65e175bSOded Gabbay enum comms_sts expected_status) 1617e65e175bSOded Gabbay { 1618e65e175bSOded Gabbay enum comms_sts comm_status = 1619e65e175bSOded Gabbay FIELD_GET(COMMS_STATUS_STATUS_MASK, status); 1620e65e175bSOded Gabbay 1621e65e175bSOded Gabbay if (comm_status < COMMS_STS_INVLD_LAST) 1622e65e175bSOded Gabbay dev_err(hdev->dev, "Device status %s, expected status: %s\n", 1623e65e175bSOded Gabbay hl_dynamic_fw_status_str[comm_status], 1624e65e175bSOded Gabbay hl_dynamic_fw_status_str[expected_status]); 1625e65e175bSOded Gabbay else 1626e65e175bSOded Gabbay dev_err(hdev->dev, "Device status unknown %d, expected status: %s\n", 1627e65e175bSOded Gabbay comm_status, 1628e65e175bSOded Gabbay hl_dynamic_fw_status_str[expected_status]); 1629e65e175bSOded Gabbay } 1630e65e175bSOded Gabbay 1631e65e175bSOded Gabbay /** 1632e65e175bSOded Gabbay * hl_fw_dynamic_send_cmd - send LKD to FW cmd 1633e65e175bSOded Gabbay * 1634e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1635e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 1636e65e175bSOded Gabbay * @cmd: LKD to FW cmd code 1637e65e175bSOded Gabbay * @size: size of next FW component to be loaded (0 if not necessary) 1638e65e175bSOded Gabbay * 1639e65e175bSOded Gabbay * LDK to FW exact command layout is defined at struct comms_command. 1640e65e175bSOded Gabbay * note: the size argument is used only when the next FW component should be 1641e65e175bSOded Gabbay * loaded, otherwise it shall be 0. the size is used by the FW in later 1642e65e175bSOded Gabbay * protocol stages and when sending only indicating the amount of memory 1643e65e175bSOded Gabbay * to be allocated by the FW to receive the next boot component. 1644e65e175bSOded Gabbay */ 1645e65e175bSOded Gabbay static void hl_fw_dynamic_send_cmd(struct hl_device *hdev, 1646e65e175bSOded Gabbay struct fw_load_mgr *fw_loader, 1647e65e175bSOded Gabbay enum comms_cmd cmd, unsigned int size) 1648e65e175bSOded Gabbay { 1649e65e175bSOded Gabbay struct cpu_dyn_regs *dyn_regs; 1650e65e175bSOded Gabbay u32 val; 1651e65e175bSOded Gabbay 1652e65e175bSOded Gabbay dyn_regs = &fw_loader->dynamic_loader.comm_desc.cpu_dyn_regs; 1653e65e175bSOded Gabbay 1654e65e175bSOded Gabbay val = FIELD_PREP(COMMS_COMMAND_CMD_MASK, cmd); 1655e65e175bSOded Gabbay val |= FIELD_PREP(COMMS_COMMAND_SIZE_MASK, size); 1656e65e175bSOded Gabbay 1657e65e175bSOded Gabbay trace_habanalabs_comms_send_cmd(hdev->dev, comms_cmd_str_arr[cmd]); 1658e65e175bSOded Gabbay WREG32(le32_to_cpu(dyn_regs->kmd_msg_to_cpu), val); 1659e65e175bSOded Gabbay } 1660e65e175bSOded Gabbay 1661e65e175bSOded Gabbay /** 1662e65e175bSOded Gabbay * hl_fw_dynamic_extract_fw_response - update the FW response 1663e65e175bSOded Gabbay * 1664e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1665e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 1666e65e175bSOded Gabbay * @response: FW response 1667e65e175bSOded Gabbay * @status: the status read from CPU status register 1668e65e175bSOded Gabbay * 1669e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 1670e65e175bSOded Gabbay */ 1671e65e175bSOded Gabbay static int hl_fw_dynamic_extract_fw_response(struct hl_device *hdev, 1672e65e175bSOded Gabbay struct fw_load_mgr *fw_loader, 1673e65e175bSOded Gabbay struct fw_response *response, 1674e65e175bSOded Gabbay u32 status) 1675e65e175bSOded Gabbay { 1676e65e175bSOded Gabbay response->status = FIELD_GET(COMMS_STATUS_STATUS_MASK, status); 1677e65e175bSOded Gabbay response->ram_offset = FIELD_GET(COMMS_STATUS_OFFSET_MASK, status) << 1678e65e175bSOded Gabbay COMMS_STATUS_OFFSET_ALIGN_SHIFT; 1679e65e175bSOded Gabbay response->ram_type = FIELD_GET(COMMS_STATUS_RAM_TYPE_MASK, status); 1680e65e175bSOded Gabbay 1681e65e175bSOded Gabbay if ((response->ram_type != COMMS_SRAM) && 1682e65e175bSOded Gabbay (response->ram_type != COMMS_DRAM)) { 1683e65e175bSOded Gabbay dev_err(hdev->dev, "FW status: invalid RAM type %u\n", 1684e65e175bSOded Gabbay response->ram_type); 1685e65e175bSOded Gabbay return -EIO; 1686e65e175bSOded Gabbay } 1687e65e175bSOded Gabbay 1688e65e175bSOded Gabbay return 0; 1689e65e175bSOded Gabbay } 1690e65e175bSOded Gabbay 1691e65e175bSOded Gabbay /** 1692e65e175bSOded Gabbay * hl_fw_dynamic_wait_for_status - wait for status in dynamic FW load 1693e65e175bSOded Gabbay * 1694e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1695e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 1696e65e175bSOded Gabbay * @expected_status: expected status to wait for 1697e65e175bSOded Gabbay * @timeout: timeout for status wait 1698e65e175bSOded Gabbay * 1699e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 1700e65e175bSOded Gabbay * 1701e65e175bSOded Gabbay * waiting for status from FW include polling the FW status register until 1702e65e175bSOded Gabbay * expected status is received or timeout occurs (whatever occurs first). 1703e65e175bSOded Gabbay */ 1704e65e175bSOded Gabbay static int hl_fw_dynamic_wait_for_status(struct hl_device *hdev, 1705e65e175bSOded Gabbay struct fw_load_mgr *fw_loader, 1706e65e175bSOded Gabbay enum comms_sts expected_status, 1707e65e175bSOded Gabbay u32 timeout) 1708e65e175bSOded Gabbay { 1709e65e175bSOded Gabbay struct cpu_dyn_regs *dyn_regs; 1710e65e175bSOded Gabbay u32 status; 1711e65e175bSOded Gabbay int rc; 1712e65e175bSOded Gabbay 1713e65e175bSOded Gabbay dyn_regs = &fw_loader->dynamic_loader.comm_desc.cpu_dyn_regs; 1714e65e175bSOded Gabbay 1715e65e175bSOded Gabbay trace_habanalabs_comms_wait_status(hdev->dev, comms_sts_str_arr[expected_status]); 1716e65e175bSOded Gabbay 1717e65e175bSOded Gabbay /* Wait for expected status */ 1718e65e175bSOded Gabbay rc = hl_poll_timeout( 1719e65e175bSOded Gabbay hdev, 1720e65e175bSOded Gabbay le32_to_cpu(dyn_regs->cpu_cmd_status_to_host), 1721e65e175bSOded Gabbay status, 1722e65e175bSOded Gabbay FIELD_GET(COMMS_STATUS_STATUS_MASK, status) == expected_status, 1723e65e175bSOded Gabbay hdev->fw_comms_poll_interval_usec, 1724e65e175bSOded Gabbay timeout); 1725e65e175bSOded Gabbay 1726e65e175bSOded Gabbay if (rc) { 1727e65e175bSOded Gabbay hl_fw_dynamic_report_error_status(hdev, status, 1728e65e175bSOded Gabbay expected_status); 1729e65e175bSOded Gabbay return -EIO; 1730e65e175bSOded Gabbay } 1731e65e175bSOded Gabbay 1732e65e175bSOded Gabbay trace_habanalabs_comms_wait_status_done(hdev->dev, comms_sts_str_arr[expected_status]); 1733e65e175bSOded Gabbay 1734e65e175bSOded Gabbay /* 1735e65e175bSOded Gabbay * skip storing FW response for NOOP to preserve the actual desired 1736e65e175bSOded Gabbay * FW status 1737e65e175bSOded Gabbay */ 1738e65e175bSOded Gabbay if (expected_status == COMMS_STS_NOOP) 1739e65e175bSOded Gabbay return 0; 1740e65e175bSOded Gabbay 1741e65e175bSOded Gabbay rc = hl_fw_dynamic_extract_fw_response(hdev, fw_loader, 1742e65e175bSOded Gabbay &fw_loader->dynamic_loader.response, 1743e65e175bSOded Gabbay status); 1744e65e175bSOded Gabbay return rc; 1745e65e175bSOded Gabbay } 1746e65e175bSOded Gabbay 1747e65e175bSOded Gabbay /** 1748e65e175bSOded Gabbay * hl_fw_dynamic_send_clear_cmd - send clear command to FW 1749e65e175bSOded Gabbay * 1750e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1751e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 1752e65e175bSOded Gabbay * 1753e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 1754e65e175bSOded Gabbay * 1755e65e175bSOded Gabbay * after command cycle between LKD to FW CPU (i.e. LKD got an expected status 1756e65e175bSOded Gabbay * from FW) we need to clear the CPU status register in order to avoid garbage 1757e65e175bSOded Gabbay * between command cycles. 1758e65e175bSOded Gabbay * This is done by sending clear command and polling the CPU to LKD status 1759e65e175bSOded Gabbay * register to hold the status NOOP 1760e65e175bSOded Gabbay */ 1761e65e175bSOded Gabbay static int hl_fw_dynamic_send_clear_cmd(struct hl_device *hdev, 1762e65e175bSOded Gabbay struct fw_load_mgr *fw_loader) 1763e65e175bSOded Gabbay { 1764e65e175bSOded Gabbay hl_fw_dynamic_send_cmd(hdev, fw_loader, COMMS_CLR_STS, 0); 1765e65e175bSOded Gabbay 1766e65e175bSOded Gabbay return hl_fw_dynamic_wait_for_status(hdev, fw_loader, COMMS_STS_NOOP, 1767e65e175bSOded Gabbay fw_loader->cpu_timeout); 1768e65e175bSOded Gabbay } 1769e65e175bSOded Gabbay 1770e65e175bSOded Gabbay /** 1771e65e175bSOded Gabbay * hl_fw_dynamic_send_protocol_cmd - send LKD to FW cmd and wait for ACK 1772e65e175bSOded Gabbay * 1773e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1774e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 1775e65e175bSOded Gabbay * @cmd: LKD to FW cmd code 1776e65e175bSOded Gabbay * @size: size of next FW component to be loaded (0 if not necessary) 1777e65e175bSOded Gabbay * @wait_ok: if true also wait for OK response from FW 1778e65e175bSOded Gabbay * @timeout: timeout for status wait 1779e65e175bSOded Gabbay * 1780e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 1781e65e175bSOded Gabbay * 1782e65e175bSOded Gabbay * brief: 1783e65e175bSOded Gabbay * when sending protocol command we have the following steps: 1784e65e175bSOded Gabbay * - send clear (clear command and verify clear status register) 1785e65e175bSOded Gabbay * - send the actual protocol command 1786e65e175bSOded Gabbay * - wait for ACK on the protocol command 1787e65e175bSOded Gabbay * - send clear 1788e65e175bSOded Gabbay * - send NOOP 1789e65e175bSOded Gabbay * if, in addition, the specific protocol command should wait for OK then: 1790e65e175bSOded Gabbay * - wait for OK 1791e65e175bSOded Gabbay * - send clear 1792e65e175bSOded Gabbay * - send NOOP 1793e65e175bSOded Gabbay * 1794e65e175bSOded Gabbay * NOTES: 1795e65e175bSOded Gabbay * send clear: this is necessary in order to clear the status register to avoid 1796e65e175bSOded Gabbay * leftovers between command 1797e65e175bSOded Gabbay * NOOP command: necessary to avoid loop on the clear command by the FW 1798e65e175bSOded Gabbay */ 1799e65e175bSOded Gabbay int hl_fw_dynamic_send_protocol_cmd(struct hl_device *hdev, 1800e65e175bSOded Gabbay struct fw_load_mgr *fw_loader, 1801e65e175bSOded Gabbay enum comms_cmd cmd, unsigned int size, 1802e65e175bSOded Gabbay bool wait_ok, u32 timeout) 1803e65e175bSOded Gabbay { 1804e65e175bSOded Gabbay int rc; 1805e65e175bSOded Gabbay 1806e65e175bSOded Gabbay trace_habanalabs_comms_protocol_cmd(hdev->dev, comms_cmd_str_arr[cmd]); 1807e65e175bSOded Gabbay 1808e65e175bSOded Gabbay /* first send clear command to clean former commands */ 1809e65e175bSOded Gabbay rc = hl_fw_dynamic_send_clear_cmd(hdev, fw_loader); 1810e65e175bSOded Gabbay if (rc) 1811e65e175bSOded Gabbay return rc; 1812e65e175bSOded Gabbay 1813e65e175bSOded Gabbay /* send the actual command */ 1814e65e175bSOded Gabbay hl_fw_dynamic_send_cmd(hdev, fw_loader, cmd, size); 1815e65e175bSOded Gabbay 1816e65e175bSOded Gabbay /* wait for ACK for the command */ 1817e65e175bSOded Gabbay rc = hl_fw_dynamic_wait_for_status(hdev, fw_loader, COMMS_STS_ACK, 1818e65e175bSOded Gabbay timeout); 1819e65e175bSOded Gabbay if (rc) 1820e65e175bSOded Gabbay return rc; 1821e65e175bSOded Gabbay 1822e65e175bSOded Gabbay /* clear command to prepare for NOOP command */ 1823e65e175bSOded Gabbay rc = hl_fw_dynamic_send_clear_cmd(hdev, fw_loader); 1824e65e175bSOded Gabbay if (rc) 1825e65e175bSOded Gabbay return rc; 1826e65e175bSOded Gabbay 1827e65e175bSOded Gabbay /* send the actual NOOP command */ 1828e65e175bSOded Gabbay hl_fw_dynamic_send_cmd(hdev, fw_loader, COMMS_NOOP, 0); 1829e65e175bSOded Gabbay 1830e65e175bSOded Gabbay if (!wait_ok) 1831e65e175bSOded Gabbay return 0; 1832e65e175bSOded Gabbay 1833e65e175bSOded Gabbay rc = hl_fw_dynamic_wait_for_status(hdev, fw_loader, COMMS_STS_OK, 1834e65e175bSOded Gabbay timeout); 1835e65e175bSOded Gabbay if (rc) 1836e65e175bSOded Gabbay return rc; 1837e65e175bSOded Gabbay 1838e65e175bSOded Gabbay /* clear command to prepare for NOOP command */ 1839e65e175bSOded Gabbay rc = hl_fw_dynamic_send_clear_cmd(hdev, fw_loader); 1840e65e175bSOded Gabbay if (rc) 1841e65e175bSOded Gabbay return rc; 1842e65e175bSOded Gabbay 1843e65e175bSOded Gabbay /* send the actual NOOP command */ 1844e65e175bSOded Gabbay hl_fw_dynamic_send_cmd(hdev, fw_loader, COMMS_NOOP, 0); 1845e65e175bSOded Gabbay 1846e65e175bSOded Gabbay return 0; 1847e65e175bSOded Gabbay } 1848e65e175bSOded Gabbay 1849e65e175bSOded Gabbay /** 1850e65e175bSOded Gabbay * hl_fw_compat_crc32 - CRC compatible with FW 1851e65e175bSOded Gabbay * 1852e65e175bSOded Gabbay * @data: pointer to the data 1853e65e175bSOded Gabbay * @size: size of the data 1854e65e175bSOded Gabbay * 1855e65e175bSOded Gabbay * @return the CRC32 result 1856e65e175bSOded Gabbay * 1857e65e175bSOded Gabbay * NOTE: kernel's CRC32 differs from standard CRC32 calculation. 1858e65e175bSOded Gabbay * in order to be aligned we need to flip the bits of both the input 1859e65e175bSOded Gabbay * initial CRC and kernel's CRC32 result. 1860e65e175bSOded Gabbay * in addition both sides use initial CRC of 0, 1861e65e175bSOded Gabbay */ 1862e65e175bSOded Gabbay static u32 hl_fw_compat_crc32(u8 *data, size_t size) 1863e65e175bSOded Gabbay { 1864e65e175bSOded Gabbay return ~crc32_le(~((u32)0), data, size); 1865e65e175bSOded Gabbay } 1866e65e175bSOded Gabbay 1867e65e175bSOded Gabbay /** 1868e65e175bSOded Gabbay * hl_fw_dynamic_validate_memory_bound - validate memory bounds for memory 1869e65e175bSOded Gabbay * transfer (image or descriptor) between 1870e65e175bSOded Gabbay * host and FW 1871e65e175bSOded Gabbay * 1872e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1873e65e175bSOded Gabbay * @addr: device address of memory transfer 1874e65e175bSOded Gabbay * @size: memory transfer size 1875e65e175bSOded Gabbay * @region: PCI memory region 1876e65e175bSOded Gabbay * 1877e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 1878e65e175bSOded Gabbay */ 1879e65e175bSOded Gabbay static int hl_fw_dynamic_validate_memory_bound(struct hl_device *hdev, 1880e65e175bSOded Gabbay u64 addr, size_t size, 1881e65e175bSOded Gabbay struct pci_mem_region *region) 1882e65e175bSOded Gabbay { 1883e65e175bSOded Gabbay u64 end_addr; 1884e65e175bSOded Gabbay 1885e65e175bSOded Gabbay /* now make sure that the memory transfer is within region's bounds */ 1886e65e175bSOded Gabbay end_addr = addr + size; 1887e65e175bSOded Gabbay if (end_addr >= region->region_base + region->region_size) { 1888e65e175bSOded Gabbay dev_err(hdev->dev, 1889e65e175bSOded Gabbay "dynamic FW load: memory transfer end address out of memory region bounds. addr: %llx\n", 1890e65e175bSOded Gabbay end_addr); 1891e65e175bSOded Gabbay return -EIO; 1892e65e175bSOded Gabbay } 1893e65e175bSOded Gabbay 1894e65e175bSOded Gabbay /* 1895e65e175bSOded Gabbay * now make sure memory transfer is within predefined BAR bounds. 1896e65e175bSOded Gabbay * this is to make sure we do not need to set the bar (e.g. for DRAM 1897e65e175bSOded Gabbay * memory transfers) 1898e65e175bSOded Gabbay */ 1899e65e175bSOded Gabbay if (end_addr >= region->region_base - region->offset_in_bar + 1900e65e175bSOded Gabbay region->bar_size) { 1901e65e175bSOded Gabbay dev_err(hdev->dev, 1902e65e175bSOded Gabbay "FW image beyond PCI BAR bounds\n"); 1903e65e175bSOded Gabbay return -EIO; 1904e65e175bSOded Gabbay } 1905e65e175bSOded Gabbay 1906e65e175bSOded Gabbay return 0; 1907e65e175bSOded Gabbay } 1908e65e175bSOded Gabbay 1909e65e175bSOded Gabbay /** 1910e65e175bSOded Gabbay * hl_fw_dynamic_validate_descriptor - validate FW descriptor 1911e65e175bSOded Gabbay * 1912e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 1913e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 1914e65e175bSOded Gabbay * @fw_desc: the descriptor from FW 1915e65e175bSOded Gabbay * 1916e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 1917e65e175bSOded Gabbay */ 1918e65e175bSOded Gabbay static int hl_fw_dynamic_validate_descriptor(struct hl_device *hdev, 1919e65e175bSOded Gabbay struct fw_load_mgr *fw_loader, 1920e65e175bSOded Gabbay struct lkd_fw_comms_desc *fw_desc) 1921e65e175bSOded Gabbay { 1922e65e175bSOded Gabbay struct pci_mem_region *region; 1923e65e175bSOded Gabbay enum pci_region region_id; 1924e65e175bSOded Gabbay size_t data_size; 1925e65e175bSOded Gabbay u32 data_crc32; 1926e65e175bSOded Gabbay u8 *data_ptr; 1927e65e175bSOded Gabbay u64 addr; 1928e65e175bSOded Gabbay int rc; 1929e65e175bSOded Gabbay 1930e65e175bSOded Gabbay if (le32_to_cpu(fw_desc->header.magic) != HL_COMMS_DESC_MAGIC) 1931e65e175bSOded Gabbay dev_dbg(hdev->dev, "Invalid magic for dynamic FW descriptor (%x)\n", 1932e65e175bSOded Gabbay fw_desc->header.magic); 1933e65e175bSOded Gabbay 1934e65e175bSOded Gabbay if (fw_desc->header.version != HL_COMMS_DESC_VER) 1935e65e175bSOded Gabbay dev_dbg(hdev->dev, "Invalid version for dynamic FW descriptor (%x)\n", 1936e65e175bSOded Gabbay fw_desc->header.version); 1937e65e175bSOded Gabbay 1938e65e175bSOded Gabbay /* 1939e65e175bSOded Gabbay * Calc CRC32 of data without header. use the size of the descriptor 1940e65e175bSOded Gabbay * reported by firmware, without calculating it ourself, to allow adding 1941e65e175bSOded Gabbay * more fields to the lkd_fw_comms_desc structure. 1942e65e175bSOded Gabbay * note that no alignment/stride address issues here as all structures 1943e65e175bSOded Gabbay * are 64 bit padded. 1944e65e175bSOded Gabbay */ 1945e65e175bSOded Gabbay data_ptr = (u8 *)fw_desc + sizeof(struct comms_desc_header); 1946e65e175bSOded Gabbay data_size = le16_to_cpu(fw_desc->header.size); 1947e65e175bSOded Gabbay 1948e65e175bSOded Gabbay data_crc32 = hl_fw_compat_crc32(data_ptr, data_size); 1949e65e175bSOded Gabbay if (data_crc32 != le32_to_cpu(fw_desc->header.crc32)) { 1950e65e175bSOded Gabbay dev_err(hdev->dev, "CRC32 mismatch for dynamic FW descriptor (%x:%x)\n", 1951e65e175bSOded Gabbay data_crc32, fw_desc->header.crc32); 1952e65e175bSOded Gabbay return -EIO; 1953e65e175bSOded Gabbay } 1954e65e175bSOded Gabbay 1955e65e175bSOded Gabbay /* find memory region to which to copy the image */ 1956e65e175bSOded Gabbay addr = le64_to_cpu(fw_desc->img_addr); 1957e65e175bSOded Gabbay region_id = hl_get_pci_memory_region(hdev, addr); 1958e65e175bSOded Gabbay if ((region_id != PCI_REGION_SRAM) && ((region_id != PCI_REGION_DRAM))) { 1959e65e175bSOded Gabbay dev_err(hdev->dev, "Invalid region to copy FW image address=%llx\n", addr); 1960e65e175bSOded Gabbay return -EIO; 1961e65e175bSOded Gabbay } 1962e65e175bSOded Gabbay 1963e65e175bSOded Gabbay region = &hdev->pci_mem_region[region_id]; 1964e65e175bSOded Gabbay 1965e65e175bSOded Gabbay /* store the region for the copy stage */ 1966e65e175bSOded Gabbay fw_loader->dynamic_loader.image_region = region; 1967e65e175bSOded Gabbay 1968e65e175bSOded Gabbay /* 1969e65e175bSOded Gabbay * here we know that the start address is valid, now make sure that the 1970e65e175bSOded Gabbay * image is within region's bounds 1971e65e175bSOded Gabbay */ 1972e65e175bSOded Gabbay rc = hl_fw_dynamic_validate_memory_bound(hdev, addr, 1973e65e175bSOded Gabbay fw_loader->dynamic_loader.fw_image_size, 1974e65e175bSOded Gabbay region); 1975e65e175bSOded Gabbay if (rc) { 1976e65e175bSOded Gabbay dev_err(hdev->dev, "invalid mem transfer request for FW image\n"); 1977e65e175bSOded Gabbay return rc; 1978e65e175bSOded Gabbay } 1979e65e175bSOded Gabbay 1980e65e175bSOded Gabbay /* here we can mark the descriptor as valid as the content has been validated */ 1981e65e175bSOded Gabbay fw_loader->dynamic_loader.fw_desc_valid = true; 1982e65e175bSOded Gabbay 1983e65e175bSOded Gabbay return 0; 1984e65e175bSOded Gabbay } 1985e65e175bSOded Gabbay 1986e65e175bSOded Gabbay static int hl_fw_dynamic_validate_response(struct hl_device *hdev, 1987e65e175bSOded Gabbay struct fw_response *response, 1988e65e175bSOded Gabbay struct pci_mem_region *region) 1989e65e175bSOded Gabbay { 1990e65e175bSOded Gabbay u64 device_addr; 1991e65e175bSOded Gabbay int rc; 1992e65e175bSOded Gabbay 1993e65e175bSOded Gabbay device_addr = region->region_base + response->ram_offset; 1994e65e175bSOded Gabbay 1995e65e175bSOded Gabbay /* 1996e65e175bSOded Gabbay * validate that the descriptor is within region's bounds 1997e65e175bSOded Gabbay * Note that as the start address was supplied according to the RAM 1998e65e175bSOded Gabbay * type- testing only the end address is enough 1999e65e175bSOded Gabbay */ 2000e65e175bSOded Gabbay rc = hl_fw_dynamic_validate_memory_bound(hdev, device_addr, 2001e65e175bSOded Gabbay sizeof(struct lkd_fw_comms_desc), 2002e65e175bSOded Gabbay region); 2003e65e175bSOded Gabbay return rc; 2004e65e175bSOded Gabbay } 2005e65e175bSOded Gabbay 2006e65e175bSOded Gabbay /* 2007e65e175bSOded Gabbay * hl_fw_dynamic_read_descriptor_msg - read and show the ascii msg that sent by fw 2008e65e175bSOded Gabbay * 2009e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2010e65e175bSOded Gabbay * @fw_desc: the descriptor from FW 2011e65e175bSOded Gabbay */ 2012e65e175bSOded Gabbay static void hl_fw_dynamic_read_descriptor_msg(struct hl_device *hdev, 2013e65e175bSOded Gabbay struct lkd_fw_comms_desc *fw_desc) 2014e65e175bSOded Gabbay { 2015e65e175bSOded Gabbay int i; 2016e65e175bSOded Gabbay char *msg; 2017e65e175bSOded Gabbay 2018e65e175bSOded Gabbay for (i = 0 ; i < LKD_FW_ASCII_MSG_MAX ; i++) { 2019e65e175bSOded Gabbay if (!fw_desc->ascii_msg[i].valid) 2020e65e175bSOded Gabbay return; 2021e65e175bSOded Gabbay 2022e65e175bSOded Gabbay /* force NULL termination */ 2023e65e175bSOded Gabbay msg = fw_desc->ascii_msg[i].msg; 2024e65e175bSOded Gabbay msg[LKD_FW_ASCII_MSG_MAX_LEN - 1] = '\0'; 2025e65e175bSOded Gabbay 2026e65e175bSOded Gabbay switch (fw_desc->ascii_msg[i].msg_lvl) { 2027e65e175bSOded Gabbay case LKD_FW_ASCII_MSG_ERR: 2028e65e175bSOded Gabbay dev_err(hdev->dev, "fw: %s", fw_desc->ascii_msg[i].msg); 2029e65e175bSOded Gabbay break; 2030e65e175bSOded Gabbay case LKD_FW_ASCII_MSG_WRN: 2031e65e175bSOded Gabbay dev_warn(hdev->dev, "fw: %s", fw_desc->ascii_msg[i].msg); 2032e65e175bSOded Gabbay break; 2033e65e175bSOded Gabbay case LKD_FW_ASCII_MSG_INF: 2034e65e175bSOded Gabbay dev_info(hdev->dev, "fw: %s", fw_desc->ascii_msg[i].msg); 2035e65e175bSOded Gabbay break; 2036e65e175bSOded Gabbay default: 2037e65e175bSOded Gabbay dev_dbg(hdev->dev, "fw: %s", fw_desc->ascii_msg[i].msg); 2038e65e175bSOded Gabbay break; 2039e65e175bSOded Gabbay } 2040e65e175bSOded Gabbay } 2041e65e175bSOded Gabbay } 2042e65e175bSOded Gabbay 2043e65e175bSOded Gabbay /** 2044e65e175bSOded Gabbay * hl_fw_dynamic_read_and_validate_descriptor - read and validate FW descriptor 2045e65e175bSOded Gabbay * 2046e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2047e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 2048e65e175bSOded Gabbay * 2049e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2050e65e175bSOded Gabbay */ 2051e65e175bSOded Gabbay static int hl_fw_dynamic_read_and_validate_descriptor(struct hl_device *hdev, 2052e65e175bSOded Gabbay struct fw_load_mgr *fw_loader) 2053e65e175bSOded Gabbay { 2054e65e175bSOded Gabbay struct lkd_fw_comms_desc *fw_desc; 2055e65e175bSOded Gabbay struct pci_mem_region *region; 2056e65e175bSOded Gabbay struct fw_response *response; 2057e65e175bSOded Gabbay void *temp_fw_desc; 2058e65e175bSOded Gabbay void __iomem *src; 2059e65e175bSOded Gabbay u16 fw_data_size; 2060e65e175bSOded Gabbay enum pci_region region_id; 2061e65e175bSOded Gabbay int rc; 2062e65e175bSOded Gabbay 2063e65e175bSOded Gabbay fw_desc = &fw_loader->dynamic_loader.comm_desc; 2064e65e175bSOded Gabbay response = &fw_loader->dynamic_loader.response; 2065e65e175bSOded Gabbay 2066e65e175bSOded Gabbay region_id = (response->ram_type == COMMS_SRAM) ? 2067e65e175bSOded Gabbay PCI_REGION_SRAM : PCI_REGION_DRAM; 2068e65e175bSOded Gabbay 2069e65e175bSOded Gabbay region = &hdev->pci_mem_region[region_id]; 2070e65e175bSOded Gabbay 2071e65e175bSOded Gabbay rc = hl_fw_dynamic_validate_response(hdev, response, region); 2072e65e175bSOded Gabbay if (rc) { 2073e65e175bSOded Gabbay dev_err(hdev->dev, 2074e65e175bSOded Gabbay "invalid mem transfer request for FW descriptor\n"); 2075e65e175bSOded Gabbay return rc; 2076e65e175bSOded Gabbay } 2077e65e175bSOded Gabbay 2078e65e175bSOded Gabbay /* 2079e65e175bSOded Gabbay * extract address to copy the descriptor from 2080e65e175bSOded Gabbay * in addition, as the descriptor value is going to be over-ridden by new data- we mark it 2081e65e175bSOded Gabbay * as invalid. 2082e65e175bSOded Gabbay * it will be marked again as valid once validated 2083e65e175bSOded Gabbay */ 2084e65e175bSOded Gabbay fw_loader->dynamic_loader.fw_desc_valid = false; 2085e65e175bSOded Gabbay src = hdev->pcie_bar[region->bar_id] + region->offset_in_bar + 2086e65e175bSOded Gabbay response->ram_offset; 2087e65e175bSOded Gabbay 2088e65e175bSOded Gabbay /* 2089e65e175bSOded Gabbay * We do the copy of the fw descriptor in 2 phases: 2090e65e175bSOded Gabbay * 1. copy the header + data info according to our lkd_fw_comms_desc definition. 2091e65e175bSOded Gabbay * then we're able to read the actual data size provided by fw. 2092e65e175bSOded Gabbay * this is needed for cases where data in descriptor was changed(add/remove) 2093e65e175bSOded Gabbay * in embedded specs header file before updating lkd copy of the header file 2094e65e175bSOded Gabbay * 2. copy descriptor to temporary buffer with aligned size and send it to validation 2095e65e175bSOded Gabbay */ 2096e65e175bSOded Gabbay memcpy_fromio(fw_desc, src, sizeof(struct lkd_fw_comms_desc)); 2097e65e175bSOded Gabbay fw_data_size = le16_to_cpu(fw_desc->header.size); 2098e65e175bSOded Gabbay 2099e65e175bSOded Gabbay temp_fw_desc = vzalloc(sizeof(struct comms_desc_header) + fw_data_size); 2100e65e175bSOded Gabbay if (!temp_fw_desc) 2101e65e175bSOded Gabbay return -ENOMEM; 2102e65e175bSOded Gabbay 2103e65e175bSOded Gabbay memcpy_fromio(temp_fw_desc, src, sizeof(struct comms_desc_header) + fw_data_size); 2104e65e175bSOded Gabbay 2105e65e175bSOded Gabbay rc = hl_fw_dynamic_validate_descriptor(hdev, fw_loader, 2106e65e175bSOded Gabbay (struct lkd_fw_comms_desc *) temp_fw_desc); 2107e65e175bSOded Gabbay 2108e65e175bSOded Gabbay if (!rc) 2109e65e175bSOded Gabbay hl_fw_dynamic_read_descriptor_msg(hdev, temp_fw_desc); 2110e65e175bSOded Gabbay 2111e65e175bSOded Gabbay vfree(temp_fw_desc); 2112e65e175bSOded Gabbay 2113e65e175bSOded Gabbay return rc; 2114e65e175bSOded Gabbay } 2115e65e175bSOded Gabbay 2116e65e175bSOded Gabbay /** 2117e65e175bSOded Gabbay * hl_fw_dynamic_request_descriptor - handshake with CPU to get FW descriptor 2118e65e175bSOded Gabbay * 2119e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2120e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 2121e65e175bSOded Gabbay * @next_image_size: size to allocate for next FW component 2122e65e175bSOded Gabbay * 2123e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2124e65e175bSOded Gabbay */ 2125e65e175bSOded Gabbay static int hl_fw_dynamic_request_descriptor(struct hl_device *hdev, 2126e65e175bSOded Gabbay struct fw_load_mgr *fw_loader, 2127e65e175bSOded Gabbay size_t next_image_size) 2128e65e175bSOded Gabbay { 2129e65e175bSOded Gabbay int rc; 2130e65e175bSOded Gabbay 2131e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, fw_loader, COMMS_PREP_DESC, 2132e65e175bSOded Gabbay next_image_size, true, 2133e65e175bSOded Gabbay fw_loader->cpu_timeout); 2134e65e175bSOded Gabbay if (rc) 2135e65e175bSOded Gabbay return rc; 2136e65e175bSOded Gabbay 2137e65e175bSOded Gabbay return hl_fw_dynamic_read_and_validate_descriptor(hdev, fw_loader); 2138e65e175bSOded Gabbay } 2139e65e175bSOded Gabbay 2140e65e175bSOded Gabbay /** 2141e65e175bSOded Gabbay * hl_fw_dynamic_read_device_fw_version - read FW version to exposed properties 2142e65e175bSOded Gabbay * 2143e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2144e65e175bSOded Gabbay * @fwc: the firmware component 2145e65e175bSOded Gabbay * @fw_version: fw component's version string 2146e65e175bSOded Gabbay */ 2147e65e175bSOded Gabbay static int hl_fw_dynamic_read_device_fw_version(struct hl_device *hdev, 2148e65e175bSOded Gabbay enum hl_fw_component fwc, 2149e65e175bSOded Gabbay const char *fw_version) 2150e65e175bSOded Gabbay { 2151e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 2152e65e175bSOded Gabbay char *preboot_ver, *boot_ver; 2153e65e175bSOded Gabbay char btl_ver[32]; 2154e65e175bSOded Gabbay 2155e65e175bSOded Gabbay switch (fwc) { 2156e65e175bSOded Gabbay case FW_COMP_BOOT_FIT: 2157e65e175bSOded Gabbay strscpy(prop->uboot_ver, fw_version, VERSION_MAX_LEN); 2158e65e175bSOded Gabbay boot_ver = extract_fw_ver_from_str(prop->uboot_ver); 2159e65e175bSOded Gabbay if (boot_ver) { 2160e65e175bSOded Gabbay dev_info(hdev->dev, "boot-fit version %s\n", boot_ver); 2161e65e175bSOded Gabbay kfree(boot_ver); 2162e65e175bSOded Gabbay } 2163e65e175bSOded Gabbay 2164e65e175bSOded Gabbay break; 2165e65e175bSOded Gabbay case FW_COMP_PREBOOT: 2166e65e175bSOded Gabbay strscpy(prop->preboot_ver, fw_version, VERSION_MAX_LEN); 2167e65e175bSOded Gabbay preboot_ver = strnstr(prop->preboot_ver, "Preboot", 2168e65e175bSOded Gabbay VERSION_MAX_LEN); 2169e65e175bSOded Gabbay if (preboot_ver && preboot_ver != prop->preboot_ver) { 2170e65e175bSOded Gabbay strscpy(btl_ver, prop->preboot_ver, 2171e65e175bSOded Gabbay min((int) (preboot_ver - prop->preboot_ver), 31)); 2172e65e175bSOded Gabbay dev_info(hdev->dev, "%s\n", btl_ver); 2173e65e175bSOded Gabbay } 2174e65e175bSOded Gabbay 2175e65e175bSOded Gabbay preboot_ver = extract_fw_ver_from_str(prop->preboot_ver); 2176e65e175bSOded Gabbay if (preboot_ver) { 2177e65e175bSOded Gabbay int rc; 2178e65e175bSOded Gabbay 2179e65e175bSOded Gabbay dev_info(hdev->dev, "preboot version %s\n", preboot_ver); 2180e65e175bSOded Gabbay 2181*12f77011SDafna Hirschfeld rc = hl_get_preboot_major_minor(hdev, preboot_ver); 2182*12f77011SDafna Hirschfeld kfree(preboot_ver); 2183e65e175bSOded Gabbay if (rc) 2184e65e175bSOded Gabbay return rc; 2185e65e175bSOded Gabbay } 2186e65e175bSOded Gabbay 2187e65e175bSOded Gabbay break; 2188e65e175bSOded Gabbay default: 2189e65e175bSOded Gabbay dev_warn(hdev->dev, "Undefined FW component: %d\n", fwc); 2190e65e175bSOded Gabbay return -EINVAL; 2191e65e175bSOded Gabbay } 2192e65e175bSOded Gabbay 2193e65e175bSOded Gabbay return 0; 2194e65e175bSOded Gabbay } 2195e65e175bSOded Gabbay 2196e65e175bSOded Gabbay /** 2197e65e175bSOded Gabbay * hl_fw_dynamic_copy_image - copy image to memory allocated by the FW 2198e65e175bSOded Gabbay * 2199e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2200e65e175bSOded Gabbay * @fw: fw descriptor 2201e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 2202e65e175bSOded Gabbay */ 2203e65e175bSOded Gabbay static int hl_fw_dynamic_copy_image(struct hl_device *hdev, 2204e65e175bSOded Gabbay const struct firmware *fw, 2205e65e175bSOded Gabbay struct fw_load_mgr *fw_loader) 2206e65e175bSOded Gabbay { 2207e65e175bSOded Gabbay struct lkd_fw_comms_desc *fw_desc; 2208e65e175bSOded Gabbay struct pci_mem_region *region; 2209e65e175bSOded Gabbay void __iomem *dest; 2210e65e175bSOded Gabbay u64 addr; 2211e65e175bSOded Gabbay int rc; 2212e65e175bSOded Gabbay 2213e65e175bSOded Gabbay fw_desc = &fw_loader->dynamic_loader.comm_desc; 2214e65e175bSOded Gabbay addr = le64_to_cpu(fw_desc->img_addr); 2215e65e175bSOded Gabbay 2216e65e175bSOded Gabbay /* find memory region to which to copy the image */ 2217e65e175bSOded Gabbay region = fw_loader->dynamic_loader.image_region; 2218e65e175bSOded Gabbay 2219e65e175bSOded Gabbay dest = hdev->pcie_bar[region->bar_id] + region->offset_in_bar + 2220e65e175bSOded Gabbay (addr - region->region_base); 2221e65e175bSOded Gabbay 2222e65e175bSOded Gabbay rc = hl_fw_copy_fw_to_device(hdev, fw, dest, 2223e65e175bSOded Gabbay fw_loader->boot_fit_img.src_off, 2224e65e175bSOded Gabbay fw_loader->boot_fit_img.copy_size); 2225e65e175bSOded Gabbay 2226e65e175bSOded Gabbay return rc; 2227e65e175bSOded Gabbay } 2228e65e175bSOded Gabbay 2229e65e175bSOded Gabbay /** 2230e65e175bSOded Gabbay * hl_fw_dynamic_copy_msg - copy msg to memory allocated by the FW 2231e65e175bSOded Gabbay * 2232e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2233e65e175bSOded Gabbay * @msg: message 2234e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 2235e65e175bSOded Gabbay */ 2236e65e175bSOded Gabbay static int hl_fw_dynamic_copy_msg(struct hl_device *hdev, 2237e65e175bSOded Gabbay struct lkd_msg_comms *msg, struct fw_load_mgr *fw_loader) 2238e65e175bSOded Gabbay { 2239e65e175bSOded Gabbay struct lkd_fw_comms_desc *fw_desc; 2240e65e175bSOded Gabbay struct pci_mem_region *region; 2241e65e175bSOded Gabbay void __iomem *dest; 2242e65e175bSOded Gabbay u64 addr; 2243e65e175bSOded Gabbay int rc; 2244e65e175bSOded Gabbay 2245e65e175bSOded Gabbay fw_desc = &fw_loader->dynamic_loader.comm_desc; 2246e65e175bSOded Gabbay addr = le64_to_cpu(fw_desc->img_addr); 2247e65e175bSOded Gabbay 2248e65e175bSOded Gabbay /* find memory region to which to copy the image */ 2249e65e175bSOded Gabbay region = fw_loader->dynamic_loader.image_region; 2250e65e175bSOded Gabbay 2251e65e175bSOded Gabbay dest = hdev->pcie_bar[region->bar_id] + region->offset_in_bar + 2252e65e175bSOded Gabbay (addr - region->region_base); 2253e65e175bSOded Gabbay 2254e65e175bSOded Gabbay rc = hl_fw_copy_msg_to_device(hdev, msg, dest, 0, 0); 2255e65e175bSOded Gabbay 2256e65e175bSOded Gabbay return rc; 2257e65e175bSOded Gabbay } 2258e65e175bSOded Gabbay 2259e65e175bSOded Gabbay /** 2260e65e175bSOded Gabbay * hl_fw_boot_fit_update_state - update internal data structures after boot-fit 2261e65e175bSOded Gabbay * is loaded 2262e65e175bSOded Gabbay * 2263e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2264e65e175bSOded Gabbay * @cpu_boot_dev_sts0_reg: register holding CPU boot dev status 0 2265e65e175bSOded Gabbay * @cpu_boot_dev_sts1_reg: register holding CPU boot dev status 1 2266e65e175bSOded Gabbay * 2267e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2268e65e175bSOded Gabbay */ 2269e65e175bSOded Gabbay static void hl_fw_boot_fit_update_state(struct hl_device *hdev, 2270e65e175bSOded Gabbay u32 cpu_boot_dev_sts0_reg, 2271e65e175bSOded Gabbay u32 cpu_boot_dev_sts1_reg) 2272e65e175bSOded Gabbay { 2273e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 2274e65e175bSOded Gabbay 2275e65e175bSOded Gabbay hdev->fw_loader.fw_comp_loaded |= FW_TYPE_BOOT_CPU; 2276e65e175bSOded Gabbay 2277e65e175bSOded Gabbay /* Read boot_cpu status bits */ 2278e65e175bSOded Gabbay if (prop->fw_preboot_cpu_boot_dev_sts0 & CPU_BOOT_DEV_STS0_ENABLED) { 2279e65e175bSOded Gabbay prop->fw_bootfit_cpu_boot_dev_sts0 = 2280e65e175bSOded Gabbay RREG32(cpu_boot_dev_sts0_reg); 2281e65e175bSOded Gabbay 2282e65e175bSOded Gabbay prop->hard_reset_done_by_fw = !!(prop->fw_bootfit_cpu_boot_dev_sts0 & 2283e65e175bSOded Gabbay CPU_BOOT_DEV_STS0_FW_HARD_RST_EN); 2284e65e175bSOded Gabbay 2285e65e175bSOded Gabbay dev_dbg(hdev->dev, "Firmware boot CPU status0 %#x\n", 2286e65e175bSOded Gabbay prop->fw_bootfit_cpu_boot_dev_sts0); 2287e65e175bSOded Gabbay } 2288e65e175bSOded Gabbay 2289e65e175bSOded Gabbay if (prop->fw_cpu_boot_dev_sts1_valid) { 2290e65e175bSOded Gabbay prop->fw_bootfit_cpu_boot_dev_sts1 = 2291e65e175bSOded Gabbay RREG32(cpu_boot_dev_sts1_reg); 2292e65e175bSOded Gabbay 2293e65e175bSOded Gabbay dev_dbg(hdev->dev, "Firmware boot CPU status1 %#x\n", 2294e65e175bSOded Gabbay prop->fw_bootfit_cpu_boot_dev_sts1); 2295e65e175bSOded Gabbay } 2296e65e175bSOded Gabbay 2297e65e175bSOded Gabbay dev_dbg(hdev->dev, "Firmware boot CPU hard-reset is %s\n", 2298e65e175bSOded Gabbay prop->hard_reset_done_by_fw ? "enabled" : "disabled"); 2299e65e175bSOded Gabbay } 2300e65e175bSOded Gabbay 2301e65e175bSOded Gabbay static void hl_fw_dynamic_update_linux_interrupt_if(struct hl_device *hdev) 2302e65e175bSOded Gabbay { 2303e65e175bSOded Gabbay struct cpu_dyn_regs *dyn_regs = 2304e65e175bSOded Gabbay &hdev->fw_loader.dynamic_loader.comm_desc.cpu_dyn_regs; 2305e65e175bSOded Gabbay 2306e65e175bSOded Gabbay /* Check whether all 3 interrupt interfaces are set, if not use a 2307e65e175bSOded Gabbay * single interface 2308e65e175bSOded Gabbay */ 2309e65e175bSOded Gabbay if (!hdev->asic_prop.gic_interrupts_enable && 2310e65e175bSOded Gabbay !(hdev->asic_prop.fw_app_cpu_boot_dev_sts0 & 2311e65e175bSOded Gabbay CPU_BOOT_DEV_STS0_MULTI_IRQ_POLL_EN)) { 2312e65e175bSOded Gabbay dyn_regs->gic_host_halt_irq = dyn_regs->gic_host_pi_upd_irq; 2313e65e175bSOded Gabbay dyn_regs->gic_host_ints_irq = dyn_regs->gic_host_pi_upd_irq; 2314e65e175bSOded Gabbay 2315e65e175bSOded Gabbay dev_warn(hdev->dev, 2316e65e175bSOded Gabbay "Using a single interrupt interface towards cpucp"); 2317e65e175bSOded Gabbay } 2318e65e175bSOded Gabbay } 2319e65e175bSOded Gabbay /** 2320e65e175bSOded Gabbay * hl_fw_dynamic_load_image - load FW image using dynamic protocol 2321e65e175bSOded Gabbay * 2322e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2323e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 2324e65e175bSOded Gabbay * @load_fwc: the FW component to be loaded 2325e65e175bSOded Gabbay * @img_ld_timeout: image load timeout 2326e65e175bSOded Gabbay * 2327e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2328e65e175bSOded Gabbay */ 2329e65e175bSOded Gabbay static int hl_fw_dynamic_load_image(struct hl_device *hdev, 2330e65e175bSOded Gabbay struct fw_load_mgr *fw_loader, 2331e65e175bSOded Gabbay enum hl_fw_component load_fwc, 2332e65e175bSOded Gabbay u32 img_ld_timeout) 2333e65e175bSOded Gabbay { 2334e65e175bSOded Gabbay enum hl_fw_component cur_fwc; 2335e65e175bSOded Gabbay const struct firmware *fw; 2336e65e175bSOded Gabbay char *fw_name; 2337e65e175bSOded Gabbay int rc = 0; 2338e65e175bSOded Gabbay 2339e65e175bSOded Gabbay /* 2340e65e175bSOded Gabbay * when loading image we have one of 2 scenarios: 2341e65e175bSOded Gabbay * 1. current FW component is preboot and we want to load boot-fit 2342e65e175bSOded Gabbay * 2. current FW component is boot-fit and we want to load linux 2343e65e175bSOded Gabbay */ 2344e65e175bSOded Gabbay if (load_fwc == FW_COMP_BOOT_FIT) { 2345e65e175bSOded Gabbay cur_fwc = FW_COMP_PREBOOT; 2346e65e175bSOded Gabbay fw_name = fw_loader->boot_fit_img.image_name; 2347e65e175bSOded Gabbay } else { 2348e65e175bSOded Gabbay cur_fwc = FW_COMP_BOOT_FIT; 2349e65e175bSOded Gabbay fw_name = fw_loader->linux_img.image_name; 2350e65e175bSOded Gabbay } 2351e65e175bSOded Gabbay 2352e65e175bSOded Gabbay /* request FW in order to communicate to FW the size to be allocated */ 2353e65e175bSOded Gabbay rc = hl_request_fw(hdev, &fw, fw_name); 2354e65e175bSOded Gabbay if (rc) 2355e65e175bSOded Gabbay return rc; 2356e65e175bSOded Gabbay 2357e65e175bSOded Gabbay /* store the image size for future validation */ 2358e65e175bSOded Gabbay fw_loader->dynamic_loader.fw_image_size = fw->size; 2359e65e175bSOded Gabbay 2360e65e175bSOded Gabbay rc = hl_fw_dynamic_request_descriptor(hdev, fw_loader, fw->size); 2361e65e175bSOded Gabbay if (rc) 2362e65e175bSOded Gabbay goto release_fw; 2363e65e175bSOded Gabbay 2364e65e175bSOded Gabbay /* read preboot version */ 2365e65e175bSOded Gabbay rc = hl_fw_dynamic_read_device_fw_version(hdev, cur_fwc, 2366e65e175bSOded Gabbay fw_loader->dynamic_loader.comm_desc.cur_fw_ver); 2367e65e175bSOded Gabbay if (rc) 2368e65e175bSOded Gabbay goto release_fw; 2369e65e175bSOded Gabbay 2370e65e175bSOded Gabbay /* update state according to boot stage */ 2371e65e175bSOded Gabbay if (cur_fwc == FW_COMP_BOOT_FIT) { 2372e65e175bSOded Gabbay struct cpu_dyn_regs *dyn_regs; 2373e65e175bSOded Gabbay 2374e65e175bSOded Gabbay dyn_regs = &fw_loader->dynamic_loader.comm_desc.cpu_dyn_regs; 2375e65e175bSOded Gabbay hl_fw_boot_fit_update_state(hdev, 2376e65e175bSOded Gabbay le32_to_cpu(dyn_regs->cpu_boot_dev_sts0), 2377e65e175bSOded Gabbay le32_to_cpu(dyn_regs->cpu_boot_dev_sts1)); 2378e65e175bSOded Gabbay } 2379e65e175bSOded Gabbay 2380e65e175bSOded Gabbay /* copy boot fit to space allocated by FW */ 2381e65e175bSOded Gabbay rc = hl_fw_dynamic_copy_image(hdev, fw, fw_loader); 2382e65e175bSOded Gabbay if (rc) 2383e65e175bSOded Gabbay goto release_fw; 2384e65e175bSOded Gabbay 2385e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, fw_loader, COMMS_DATA_RDY, 2386e65e175bSOded Gabbay 0, true, 2387e65e175bSOded Gabbay fw_loader->cpu_timeout); 2388e65e175bSOded Gabbay if (rc) 2389e65e175bSOded Gabbay goto release_fw; 2390e65e175bSOded Gabbay 2391e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, fw_loader, COMMS_EXEC, 2392e65e175bSOded Gabbay 0, false, 2393e65e175bSOded Gabbay img_ld_timeout); 2394e65e175bSOded Gabbay 2395e65e175bSOded Gabbay release_fw: 2396e65e175bSOded Gabbay hl_release_firmware(fw); 2397e65e175bSOded Gabbay return rc; 2398e65e175bSOded Gabbay } 2399e65e175bSOded Gabbay 2400e65e175bSOded Gabbay static int hl_fw_dynamic_wait_for_boot_fit_active(struct hl_device *hdev, 2401e65e175bSOded Gabbay struct fw_load_mgr *fw_loader) 2402e65e175bSOded Gabbay { 2403e65e175bSOded Gabbay struct dynamic_fw_load_mgr *dyn_loader; 2404e65e175bSOded Gabbay u32 status; 2405e65e175bSOded Gabbay int rc; 2406e65e175bSOded Gabbay 2407e65e175bSOded Gabbay dyn_loader = &fw_loader->dynamic_loader; 2408e65e175bSOded Gabbay 2409e65e175bSOded Gabbay /* 2410e65e175bSOded Gabbay * Make sure CPU boot-loader is running 2411e65e175bSOded Gabbay * Note that the CPU_BOOT_STATUS_SRAM_AVAIL is generally set by Linux 2412e65e175bSOded Gabbay * yet there is a debug scenario in which we loading uboot (without Linux) 2413e65e175bSOded Gabbay * which at later stage is relocated to DRAM. In this case we expect 2414e65e175bSOded Gabbay * uboot to set the CPU_BOOT_STATUS_SRAM_AVAIL and so we add it to the 2415e65e175bSOded Gabbay * poll flags 2416e65e175bSOded Gabbay */ 2417e65e175bSOded Gabbay rc = hl_poll_timeout( 2418e65e175bSOded Gabbay hdev, 2419e65e175bSOded Gabbay le32_to_cpu(dyn_loader->comm_desc.cpu_dyn_regs.cpu_boot_status), 2420e65e175bSOded Gabbay status, 2421e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_READY_TO_BOOT) || 2422e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_SRAM_AVAIL), 2423e65e175bSOded Gabbay hdev->fw_poll_interval_usec, 2424e65e175bSOded Gabbay dyn_loader->wait_for_bl_timeout); 2425e65e175bSOded Gabbay if (rc) { 2426eba773d3SMoti Haimovski dev_err(hdev->dev, "failed to wait for boot (status = %d)\n", status); 2427e65e175bSOded Gabbay return rc; 2428e65e175bSOded Gabbay } 2429e65e175bSOded Gabbay 2430e65e175bSOded Gabbay dev_dbg(hdev->dev, "uboot status = %d\n", status); 2431e65e175bSOded Gabbay return 0; 2432e65e175bSOded Gabbay } 2433e65e175bSOded Gabbay 2434e65e175bSOded Gabbay static int hl_fw_dynamic_wait_for_linux_active(struct hl_device *hdev, 2435e65e175bSOded Gabbay struct fw_load_mgr *fw_loader) 2436e65e175bSOded Gabbay { 2437e65e175bSOded Gabbay struct dynamic_fw_load_mgr *dyn_loader; 2438e65e175bSOded Gabbay u32 status; 2439e65e175bSOded Gabbay int rc; 2440e65e175bSOded Gabbay 2441e65e175bSOded Gabbay dyn_loader = &fw_loader->dynamic_loader; 2442e65e175bSOded Gabbay 2443e65e175bSOded Gabbay /* Make sure CPU linux is running */ 2444e65e175bSOded Gabbay 2445e65e175bSOded Gabbay rc = hl_poll_timeout( 2446e65e175bSOded Gabbay hdev, 2447e65e175bSOded Gabbay le32_to_cpu(dyn_loader->comm_desc.cpu_dyn_regs.cpu_boot_status), 2448e65e175bSOded Gabbay status, 2449e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_SRAM_AVAIL), 2450e65e175bSOded Gabbay hdev->fw_poll_interval_usec, 2451e65e175bSOded Gabbay fw_loader->cpu_timeout); 2452e65e175bSOded Gabbay if (rc) { 2453eba773d3SMoti Haimovski dev_err(hdev->dev, "failed to wait for Linux (status = %d)\n", status); 2454e65e175bSOded Gabbay return rc; 2455e65e175bSOded Gabbay } 2456e65e175bSOded Gabbay 2457e65e175bSOded Gabbay dev_dbg(hdev->dev, "Boot status = %d\n", status); 2458e65e175bSOded Gabbay return 0; 2459e65e175bSOded Gabbay } 2460e65e175bSOded Gabbay 2461e65e175bSOded Gabbay /** 2462e65e175bSOded Gabbay * hl_fw_linux_update_state - update internal data structures after Linux 2463e65e175bSOded Gabbay * is loaded. 2464e65e175bSOded Gabbay * Note: Linux initialization is comprised mainly 2465e65e175bSOded Gabbay * of two stages - loading kernel (SRAM_AVAIL) 2466e65e175bSOded Gabbay * & loading ARMCP. 2467e65e175bSOded Gabbay * Therefore reading boot device status in any of 2468e65e175bSOded Gabbay * these stages might result in different values. 2469e65e175bSOded Gabbay * 2470e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2471e65e175bSOded Gabbay * @cpu_boot_dev_sts0_reg: register holding CPU boot dev status 0 2472e65e175bSOded Gabbay * @cpu_boot_dev_sts1_reg: register holding CPU boot dev status 1 2473e65e175bSOded Gabbay * 2474e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2475e65e175bSOded Gabbay */ 2476e65e175bSOded Gabbay static void hl_fw_linux_update_state(struct hl_device *hdev, 2477e65e175bSOded Gabbay u32 cpu_boot_dev_sts0_reg, 2478e65e175bSOded Gabbay u32 cpu_boot_dev_sts1_reg) 2479e65e175bSOded Gabbay { 2480e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 2481e65e175bSOded Gabbay 2482e65e175bSOded Gabbay hdev->fw_loader.fw_comp_loaded |= FW_TYPE_LINUX; 2483e65e175bSOded Gabbay 2484e65e175bSOded Gabbay /* Read FW application security bits */ 2485e65e175bSOded Gabbay if (prop->fw_cpu_boot_dev_sts0_valid) { 2486e65e175bSOded Gabbay prop->fw_app_cpu_boot_dev_sts0 = RREG32(cpu_boot_dev_sts0_reg); 2487e65e175bSOded Gabbay 2488e65e175bSOded Gabbay prop->hard_reset_done_by_fw = !!(prop->fw_app_cpu_boot_dev_sts0 & 2489e65e175bSOded Gabbay CPU_BOOT_DEV_STS0_FW_HARD_RST_EN); 2490e65e175bSOded Gabbay 2491e65e175bSOded Gabbay if (prop->fw_app_cpu_boot_dev_sts0 & 2492e65e175bSOded Gabbay CPU_BOOT_DEV_STS0_GIC_PRIVILEGED_EN) 2493e65e175bSOded Gabbay prop->gic_interrupts_enable = false; 2494e65e175bSOded Gabbay 2495e65e175bSOded Gabbay dev_dbg(hdev->dev, 2496e65e175bSOded Gabbay "Firmware application CPU status0 %#x\n", 2497e65e175bSOded Gabbay prop->fw_app_cpu_boot_dev_sts0); 2498e65e175bSOded Gabbay 2499e65e175bSOded Gabbay dev_dbg(hdev->dev, "GIC controller is %s\n", 2500e65e175bSOded Gabbay prop->gic_interrupts_enable ? 2501e65e175bSOded Gabbay "enabled" : "disabled"); 2502e65e175bSOded Gabbay } 2503e65e175bSOded Gabbay 2504e65e175bSOded Gabbay if (prop->fw_cpu_boot_dev_sts1_valid) { 2505e65e175bSOded Gabbay prop->fw_app_cpu_boot_dev_sts1 = RREG32(cpu_boot_dev_sts1_reg); 2506e65e175bSOded Gabbay 2507e65e175bSOded Gabbay dev_dbg(hdev->dev, 2508e65e175bSOded Gabbay "Firmware application CPU status1 %#x\n", 2509e65e175bSOded Gabbay prop->fw_app_cpu_boot_dev_sts1); 2510e65e175bSOded Gabbay } 2511e65e175bSOded Gabbay 2512e65e175bSOded Gabbay dev_dbg(hdev->dev, "Firmware application CPU hard-reset is %s\n", 2513e65e175bSOded Gabbay prop->hard_reset_done_by_fw ? "enabled" : "disabled"); 2514e65e175bSOded Gabbay 2515e65e175bSOded Gabbay dev_info(hdev->dev, "Successfully loaded firmware to device\n"); 2516e65e175bSOded Gabbay } 2517e65e175bSOded Gabbay 2518e65e175bSOded Gabbay /** 2519e65e175bSOded Gabbay * hl_fw_dynamic_send_msg - send a COMMS message with attached data 2520e65e175bSOded Gabbay * 2521e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2522e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 2523e65e175bSOded Gabbay * @msg_type: message type 2524e65e175bSOded Gabbay * @data: data to be sent 2525e65e175bSOded Gabbay * 2526e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2527e65e175bSOded Gabbay */ 2528e65e175bSOded Gabbay static int hl_fw_dynamic_send_msg(struct hl_device *hdev, 2529e65e175bSOded Gabbay struct fw_load_mgr *fw_loader, u8 msg_type, void *data) 2530e65e175bSOded Gabbay { 2531e65e175bSOded Gabbay struct lkd_msg_comms *msg; 2532e65e175bSOded Gabbay int rc; 2533e65e175bSOded Gabbay 2534e65e175bSOded Gabbay msg = kzalloc(sizeof(*msg), GFP_KERNEL); 2535e65e175bSOded Gabbay if (!msg) 2536e65e175bSOded Gabbay return -ENOMEM; 2537e65e175bSOded Gabbay 2538e65e175bSOded Gabbay /* create message to be sent */ 2539e65e175bSOded Gabbay msg->header.type = msg_type; 2540e65e175bSOded Gabbay msg->header.size = cpu_to_le16(sizeof(struct comms_msg_header)); 2541e65e175bSOded Gabbay msg->header.magic = cpu_to_le32(HL_COMMS_MSG_MAGIC); 2542e65e175bSOded Gabbay 2543e65e175bSOded Gabbay switch (msg_type) { 2544e65e175bSOded Gabbay case HL_COMMS_RESET_CAUSE_TYPE: 2545e65e175bSOded Gabbay msg->reset_cause = *(__u8 *) data; 2546e65e175bSOded Gabbay break; 2547e65e175bSOded Gabbay 2548e65e175bSOded Gabbay default: 2549e65e175bSOded Gabbay dev_err(hdev->dev, 2550e65e175bSOded Gabbay "Send COMMS message - invalid message type %u\n", 2551e65e175bSOded Gabbay msg_type); 2552e65e175bSOded Gabbay rc = -EINVAL; 2553e65e175bSOded Gabbay goto out; 2554e65e175bSOded Gabbay } 2555e65e175bSOded Gabbay 2556e65e175bSOded Gabbay rc = hl_fw_dynamic_request_descriptor(hdev, fw_loader, 2557e65e175bSOded Gabbay sizeof(struct lkd_msg_comms)); 2558e65e175bSOded Gabbay if (rc) 2559e65e175bSOded Gabbay goto out; 2560e65e175bSOded Gabbay 2561e65e175bSOded Gabbay /* copy message to space allocated by FW */ 2562e65e175bSOded Gabbay rc = hl_fw_dynamic_copy_msg(hdev, msg, fw_loader); 2563e65e175bSOded Gabbay if (rc) 2564e65e175bSOded Gabbay goto out; 2565e65e175bSOded Gabbay 2566e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, fw_loader, COMMS_DATA_RDY, 2567e65e175bSOded Gabbay 0, true, 2568e65e175bSOded Gabbay fw_loader->cpu_timeout); 2569e65e175bSOded Gabbay if (rc) 2570e65e175bSOded Gabbay goto out; 2571e65e175bSOded Gabbay 2572e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, fw_loader, COMMS_EXEC, 2573e65e175bSOded Gabbay 0, true, 2574e65e175bSOded Gabbay fw_loader->cpu_timeout); 2575e65e175bSOded Gabbay 2576e65e175bSOded Gabbay out: 2577e65e175bSOded Gabbay kfree(msg); 2578e65e175bSOded Gabbay return rc; 2579e65e175bSOded Gabbay } 2580e65e175bSOded Gabbay 2581e65e175bSOded Gabbay /** 2582e65e175bSOded Gabbay * hl_fw_dynamic_init_cpu - initialize the device CPU using dynamic protocol 2583e65e175bSOded Gabbay * 2584e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2585e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 2586e65e175bSOded Gabbay * 2587e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2588e65e175bSOded Gabbay * 2589e65e175bSOded Gabbay * brief: the dynamic protocol is master (LKD) slave (FW CPU) protocol. 2590e65e175bSOded Gabbay * the communication is done using registers: 2591e65e175bSOded Gabbay * - LKD command register 2592e65e175bSOded Gabbay * - FW status register 2593e65e175bSOded Gabbay * the protocol is race free. this goal is achieved by splitting the requests 2594e65e175bSOded Gabbay * and response to known synchronization points between the LKD and the FW. 2595e65e175bSOded Gabbay * each response to LKD request is known and bound to a predefined timeout. 2596e65e175bSOded Gabbay * in case of timeout expiration without the desired status from FW- the 2597e65e175bSOded Gabbay * protocol (and hence the boot) will fail. 2598e65e175bSOded Gabbay */ 2599e65e175bSOded Gabbay static int hl_fw_dynamic_init_cpu(struct hl_device *hdev, 2600e65e175bSOded Gabbay struct fw_load_mgr *fw_loader) 2601e65e175bSOded Gabbay { 2602e65e175bSOded Gabbay struct cpu_dyn_regs *dyn_regs; 2603e65e175bSOded Gabbay int rc, fw_error_rc; 2604e65e175bSOded Gabbay 2605e65e175bSOded Gabbay dev_info(hdev->dev, 2606e65e175bSOded Gabbay "Loading %sfirmware to device, may take some time...\n", 2607e65e175bSOded Gabbay hdev->asic_prop.fw_security_enabled ? "secured " : ""); 2608e65e175bSOded Gabbay 2609e65e175bSOded Gabbay /* initialize FW descriptor as invalid */ 2610e65e175bSOded Gabbay fw_loader->dynamic_loader.fw_desc_valid = false; 2611e65e175bSOded Gabbay 2612e65e175bSOded Gabbay /* 2613e65e175bSOded Gabbay * In this stage, "cpu_dyn_regs" contains only LKD's hard coded values! 2614e65e175bSOded Gabbay * It will be updated from FW after hl_fw_dynamic_request_descriptor(). 2615e65e175bSOded Gabbay */ 2616e65e175bSOded Gabbay dyn_regs = &fw_loader->dynamic_loader.comm_desc.cpu_dyn_regs; 2617e65e175bSOded Gabbay 2618e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, fw_loader, COMMS_RST_STATE, 2619e65e175bSOded Gabbay 0, true, 2620e65e175bSOded Gabbay fw_loader->cpu_timeout); 2621e65e175bSOded Gabbay if (rc) 2622e65e175bSOded Gabbay goto protocol_err; 2623e65e175bSOded Gabbay 2624e65e175bSOded Gabbay if (hdev->reset_info.curr_reset_cause) { 2625e65e175bSOded Gabbay rc = hl_fw_dynamic_send_msg(hdev, fw_loader, 2626e65e175bSOded Gabbay HL_COMMS_RESET_CAUSE_TYPE, &hdev->reset_info.curr_reset_cause); 2627e65e175bSOded Gabbay if (rc) 2628e65e175bSOded Gabbay goto protocol_err; 2629e65e175bSOded Gabbay 2630e65e175bSOded Gabbay /* Clear current reset cause */ 2631e65e175bSOded Gabbay hdev->reset_info.curr_reset_cause = HL_RESET_CAUSE_UNKNOWN; 2632e65e175bSOded Gabbay } 2633e65e175bSOded Gabbay 2634e65e175bSOded Gabbay if (!(hdev->fw_components & FW_TYPE_BOOT_CPU)) { 2635e65e175bSOded Gabbay struct lkd_fw_binning_info *binning_info; 2636e65e175bSOded Gabbay 2637e65e175bSOded Gabbay rc = hl_fw_dynamic_request_descriptor(hdev, fw_loader, 0); 2638e65e175bSOded Gabbay if (rc) 2639e65e175bSOded Gabbay goto protocol_err; 2640e65e175bSOded Gabbay 2641e65e175bSOded Gabbay /* read preboot version */ 2642e65e175bSOded Gabbay rc = hl_fw_dynamic_read_device_fw_version(hdev, FW_COMP_PREBOOT, 2643e65e175bSOded Gabbay fw_loader->dynamic_loader.comm_desc.cur_fw_ver); 2644e65e175bSOded Gabbay 2645e65e175bSOded Gabbay if (rc) 2646ab509d81SOhad Sharabi return rc; 2647e65e175bSOded Gabbay 2648e65e175bSOded Gabbay /* read binning info from preboot */ 2649e65e175bSOded Gabbay if (hdev->support_preboot_binning) { 2650e65e175bSOded Gabbay binning_info = &fw_loader->dynamic_loader.comm_desc.binning_info; 2651e65e175bSOded Gabbay hdev->tpc_binning = le64_to_cpu(binning_info->tpc_mask_l); 2652e65e175bSOded Gabbay hdev->dram_binning = le32_to_cpu(binning_info->dram_mask); 2653e65e175bSOded Gabbay hdev->edma_binning = le32_to_cpu(binning_info->edma_mask); 2654e65e175bSOded Gabbay hdev->decoder_binning = le32_to_cpu(binning_info->dec_mask); 2655e65e175bSOded Gabbay hdev->rotator_binning = le32_to_cpu(binning_info->rot_mask); 2656e65e175bSOded Gabbay 2657e65e175bSOded Gabbay rc = hdev->asic_funcs->set_dram_properties(hdev); 2658e65e175bSOded Gabbay if (rc) 2659ab509d81SOhad Sharabi return rc; 2660ab509d81SOhad Sharabi 2661ab509d81SOhad Sharabi rc = hdev->asic_funcs->set_binning_masks(hdev); 2662ab509d81SOhad Sharabi if (rc) 2663ab509d81SOhad Sharabi return rc; 2664e65e175bSOded Gabbay 2665e65e175bSOded Gabbay dev_dbg(hdev->dev, 2666e65e175bSOded Gabbay "Read binning masks: tpc: 0x%llx, dram: 0x%llx, edma: 0x%x, dec: 0x%x, rot:0x%x\n", 2667e65e175bSOded Gabbay hdev->tpc_binning, hdev->dram_binning, hdev->edma_binning, 2668e65e175bSOded Gabbay hdev->decoder_binning, hdev->rotator_binning); 2669e65e175bSOded Gabbay } 2670ab509d81SOhad Sharabi 2671ab509d81SOhad Sharabi return 0; 2672e65e175bSOded Gabbay } 2673e65e175bSOded Gabbay 2674e65e175bSOded Gabbay /* load boot fit to FW */ 2675e65e175bSOded Gabbay rc = hl_fw_dynamic_load_image(hdev, fw_loader, FW_COMP_BOOT_FIT, 2676e65e175bSOded Gabbay fw_loader->boot_fit_timeout); 2677e65e175bSOded Gabbay if (rc) { 2678e65e175bSOded Gabbay dev_err(hdev->dev, "failed to load boot fit\n"); 2679e65e175bSOded Gabbay goto protocol_err; 2680e65e175bSOded Gabbay } 2681e65e175bSOded Gabbay 2682e65e175bSOded Gabbay /* 2683e65e175bSOded Gabbay * when testing FW load (without Linux) on PLDM we don't want to 2684e65e175bSOded Gabbay * wait until boot fit is active as it may take several hours. 2685e65e175bSOded Gabbay * instead, we load the bootfit and let it do all initialization in 2686e65e175bSOded Gabbay * the background. 2687e65e175bSOded Gabbay */ 2688e65e175bSOded Gabbay if (hdev->pldm && !(hdev->fw_components & FW_TYPE_LINUX)) 2689e65e175bSOded Gabbay return 0; 2690e65e175bSOded Gabbay 2691e65e175bSOded Gabbay rc = hl_fw_dynamic_wait_for_boot_fit_active(hdev, fw_loader); 2692e65e175bSOded Gabbay if (rc) 2693e65e175bSOded Gabbay goto protocol_err; 2694e65e175bSOded Gabbay 2695e65e175bSOded Gabbay /* Enable DRAM scrambling before Linux boot and after successful 2696e65e175bSOded Gabbay * UBoot 2697e65e175bSOded Gabbay */ 2698e65e175bSOded Gabbay hdev->asic_funcs->init_cpu_scrambler_dram(hdev); 2699e65e175bSOded Gabbay 2700e65e175bSOded Gabbay if (!(hdev->fw_components & FW_TYPE_LINUX)) { 2701e65e175bSOded Gabbay dev_info(hdev->dev, "Skip loading Linux F/W\n"); 2702e65e175bSOded Gabbay return 0; 2703e65e175bSOded Gabbay } 2704e65e175bSOded Gabbay 2705e65e175bSOded Gabbay if (fw_loader->skip_bmc) { 2706e65e175bSOded Gabbay rc = hl_fw_dynamic_send_protocol_cmd(hdev, fw_loader, 2707e65e175bSOded Gabbay COMMS_SKIP_BMC, 0, 2708e65e175bSOded Gabbay true, 2709e65e175bSOded Gabbay fw_loader->cpu_timeout); 2710e65e175bSOded Gabbay if (rc) { 2711e65e175bSOded Gabbay dev_err(hdev->dev, "failed to load boot fit\n"); 2712e65e175bSOded Gabbay goto protocol_err; 2713e65e175bSOded Gabbay } 2714e65e175bSOded Gabbay } 2715e65e175bSOded Gabbay 2716e65e175bSOded Gabbay /* load Linux image to FW */ 2717e65e175bSOded Gabbay rc = hl_fw_dynamic_load_image(hdev, fw_loader, FW_COMP_LINUX, 2718e65e175bSOded Gabbay fw_loader->cpu_timeout); 2719e65e175bSOded Gabbay if (rc) { 2720e65e175bSOded Gabbay dev_err(hdev->dev, "failed to load Linux\n"); 2721e65e175bSOded Gabbay goto protocol_err; 2722e65e175bSOded Gabbay } 2723e65e175bSOded Gabbay 2724e65e175bSOded Gabbay rc = hl_fw_dynamic_wait_for_linux_active(hdev, fw_loader); 2725e65e175bSOded Gabbay if (rc) 2726e65e175bSOded Gabbay goto protocol_err; 2727e65e175bSOded Gabbay 2728e65e175bSOded Gabbay hl_fw_linux_update_state(hdev, le32_to_cpu(dyn_regs->cpu_boot_dev_sts0), 2729e65e175bSOded Gabbay le32_to_cpu(dyn_regs->cpu_boot_dev_sts1)); 2730e65e175bSOded Gabbay 2731e65e175bSOded Gabbay hl_fw_dynamic_update_linux_interrupt_if(hdev); 2732e65e175bSOded Gabbay 2733e65e175bSOded Gabbay protocol_err: 2734e65e175bSOded Gabbay if (fw_loader->dynamic_loader.fw_desc_valid) { 2735e65e175bSOded Gabbay fw_error_rc = fw_read_errors(hdev, le32_to_cpu(dyn_regs->cpu_boot_err0), 2736e65e175bSOded Gabbay le32_to_cpu(dyn_regs->cpu_boot_err1), 2737e65e175bSOded Gabbay le32_to_cpu(dyn_regs->cpu_boot_dev_sts0), 2738e65e175bSOded Gabbay le32_to_cpu(dyn_regs->cpu_boot_dev_sts1)); 2739e65e175bSOded Gabbay 2740e65e175bSOded Gabbay if (fw_error_rc) 2741e65e175bSOded Gabbay return fw_error_rc; 2742e65e175bSOded Gabbay } 2743e65e175bSOded Gabbay 2744e65e175bSOded Gabbay return rc; 2745e65e175bSOded Gabbay } 2746e65e175bSOded Gabbay 2747e65e175bSOded Gabbay /** 2748e65e175bSOded Gabbay * hl_fw_static_init_cpu - initialize the device CPU using static protocol 2749e65e175bSOded Gabbay * 2750e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2751e65e175bSOded Gabbay * @fw_loader: managing structure for loading device's FW 2752e65e175bSOded Gabbay * 2753e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2754e65e175bSOded Gabbay */ 2755e65e175bSOded Gabbay static int hl_fw_static_init_cpu(struct hl_device *hdev, 2756e65e175bSOded Gabbay struct fw_load_mgr *fw_loader) 2757e65e175bSOded Gabbay { 2758e65e175bSOded Gabbay u32 cpu_msg_status_reg, cpu_timeout, msg_to_cpu_reg, status; 2759e65e175bSOded Gabbay u32 cpu_boot_dev_status0_reg, cpu_boot_dev_status1_reg; 2760e65e175bSOded Gabbay struct static_fw_load_mgr *static_loader; 2761e65e175bSOded Gabbay u32 cpu_boot_status_reg; 2762e65e175bSOded Gabbay int rc; 2763e65e175bSOded Gabbay 2764e65e175bSOded Gabbay if (!(hdev->fw_components & FW_TYPE_BOOT_CPU)) 2765e65e175bSOded Gabbay return 0; 2766e65e175bSOded Gabbay 2767e65e175bSOded Gabbay /* init common loader parameters */ 2768e65e175bSOded Gabbay cpu_timeout = fw_loader->cpu_timeout; 2769e65e175bSOded Gabbay 2770e65e175bSOded Gabbay /* init static loader parameters */ 2771e65e175bSOded Gabbay static_loader = &fw_loader->static_loader; 2772e65e175bSOded Gabbay cpu_msg_status_reg = static_loader->cpu_cmd_status_to_host_reg; 2773e65e175bSOded Gabbay msg_to_cpu_reg = static_loader->kmd_msg_to_cpu_reg; 2774e65e175bSOded Gabbay cpu_boot_dev_status0_reg = static_loader->cpu_boot_dev_status0_reg; 2775e65e175bSOded Gabbay cpu_boot_dev_status1_reg = static_loader->cpu_boot_dev_status1_reg; 2776e65e175bSOded Gabbay cpu_boot_status_reg = static_loader->cpu_boot_status_reg; 2777e65e175bSOded Gabbay 2778e65e175bSOded Gabbay dev_info(hdev->dev, "Going to wait for device boot (up to %lds)\n", 2779e65e175bSOded Gabbay cpu_timeout / USEC_PER_SEC); 2780e65e175bSOded Gabbay 2781e65e175bSOded Gabbay /* Wait for boot FIT request */ 2782e65e175bSOded Gabbay rc = hl_poll_timeout( 2783e65e175bSOded Gabbay hdev, 2784e65e175bSOded Gabbay cpu_boot_status_reg, 2785e65e175bSOded Gabbay status, 2786e65e175bSOded Gabbay status == CPU_BOOT_STATUS_WAITING_FOR_BOOT_FIT, 2787e65e175bSOded Gabbay hdev->fw_poll_interval_usec, 2788e65e175bSOded Gabbay fw_loader->boot_fit_timeout); 2789e65e175bSOded Gabbay 2790e65e175bSOded Gabbay if (rc) { 2791e65e175bSOded Gabbay dev_dbg(hdev->dev, 2792eba773d3SMoti Haimovski "No boot fit request received (status = %d), resuming boot\n", status); 2793e65e175bSOded Gabbay } else { 2794e65e175bSOded Gabbay rc = hdev->asic_funcs->load_boot_fit_to_device(hdev); 2795e65e175bSOded Gabbay if (rc) 2796e65e175bSOded Gabbay goto out; 2797e65e175bSOded Gabbay 2798e65e175bSOded Gabbay /* Clear device CPU message status */ 2799e65e175bSOded Gabbay WREG32(cpu_msg_status_reg, CPU_MSG_CLR); 2800e65e175bSOded Gabbay 2801e65e175bSOded Gabbay /* Signal device CPU that boot loader is ready */ 2802e65e175bSOded Gabbay WREG32(msg_to_cpu_reg, KMD_MSG_FIT_RDY); 2803e65e175bSOded Gabbay 2804e65e175bSOded Gabbay /* Poll for CPU device ack */ 2805e65e175bSOded Gabbay rc = hl_poll_timeout( 2806e65e175bSOded Gabbay hdev, 2807e65e175bSOded Gabbay cpu_msg_status_reg, 2808e65e175bSOded Gabbay status, 2809e65e175bSOded Gabbay status == CPU_MSG_OK, 2810e65e175bSOded Gabbay hdev->fw_poll_interval_usec, 2811e65e175bSOded Gabbay fw_loader->boot_fit_timeout); 2812e65e175bSOded Gabbay 2813e65e175bSOded Gabbay if (rc) { 2814e65e175bSOded Gabbay dev_err(hdev->dev, 2815eba773d3SMoti Haimovski "Timeout waiting for boot fit load ack (status = %d)\n", status); 2816e65e175bSOded Gabbay goto out; 2817e65e175bSOded Gabbay } 2818e65e175bSOded Gabbay 2819e65e175bSOded Gabbay /* Clear message */ 2820e65e175bSOded Gabbay WREG32(msg_to_cpu_reg, KMD_MSG_NA); 2821e65e175bSOded Gabbay } 2822e65e175bSOded Gabbay 2823e65e175bSOded Gabbay /* 2824e65e175bSOded Gabbay * Make sure CPU boot-loader is running 2825e65e175bSOded Gabbay * Note that the CPU_BOOT_STATUS_SRAM_AVAIL is generally set by Linux 2826e65e175bSOded Gabbay * yet there is a debug scenario in which we loading uboot (without Linux) 2827e65e175bSOded Gabbay * which at later stage is relocated to DRAM. In this case we expect 2828e65e175bSOded Gabbay * uboot to set the CPU_BOOT_STATUS_SRAM_AVAIL and so we add it to the 2829e65e175bSOded Gabbay * poll flags 2830e65e175bSOded Gabbay */ 2831e65e175bSOded Gabbay rc = hl_poll_timeout( 2832e65e175bSOded Gabbay hdev, 2833e65e175bSOded Gabbay cpu_boot_status_reg, 2834e65e175bSOded Gabbay status, 2835e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_DRAM_RDY) || 2836e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_NIC_FW_RDY) || 2837e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_READY_TO_BOOT) || 2838e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_SRAM_AVAIL), 2839e65e175bSOded Gabbay hdev->fw_poll_interval_usec, 2840e65e175bSOded Gabbay cpu_timeout); 2841e65e175bSOded Gabbay 2842e65e175bSOded Gabbay dev_dbg(hdev->dev, "uboot status = %d\n", status); 2843e65e175bSOded Gabbay 2844e65e175bSOded Gabbay /* Read U-Boot version now in case we will later fail */ 2845e65e175bSOded Gabbay hl_fw_static_read_device_fw_version(hdev, FW_COMP_BOOT_FIT); 2846e65e175bSOded Gabbay 2847e65e175bSOded Gabbay /* update state according to boot stage */ 2848e65e175bSOded Gabbay hl_fw_boot_fit_update_state(hdev, cpu_boot_dev_status0_reg, 2849e65e175bSOded Gabbay cpu_boot_dev_status1_reg); 2850e65e175bSOded Gabbay 2851e65e175bSOded Gabbay if (rc) { 2852e65e175bSOded Gabbay detect_cpu_boot_status(hdev, status); 2853e65e175bSOded Gabbay rc = -EIO; 2854e65e175bSOded Gabbay goto out; 2855e65e175bSOded Gabbay } 2856e65e175bSOded Gabbay 2857e65e175bSOded Gabbay /* Enable DRAM scrambling before Linux boot and after successful 2858e65e175bSOded Gabbay * UBoot 2859e65e175bSOded Gabbay */ 2860e65e175bSOded Gabbay hdev->asic_funcs->init_cpu_scrambler_dram(hdev); 2861e65e175bSOded Gabbay 2862e65e175bSOded Gabbay if (!(hdev->fw_components & FW_TYPE_LINUX)) { 2863e65e175bSOded Gabbay dev_info(hdev->dev, "Skip loading Linux F/W\n"); 2864e65e175bSOded Gabbay rc = 0; 2865e65e175bSOded Gabbay goto out; 2866e65e175bSOded Gabbay } 2867e65e175bSOded Gabbay 2868e65e175bSOded Gabbay if (status == CPU_BOOT_STATUS_SRAM_AVAIL) { 2869e65e175bSOded Gabbay rc = 0; 2870e65e175bSOded Gabbay goto out; 2871e65e175bSOded Gabbay } 2872e65e175bSOded Gabbay 2873e65e175bSOded Gabbay dev_info(hdev->dev, 2874e65e175bSOded Gabbay "Loading firmware to device, may take some time...\n"); 2875e65e175bSOded Gabbay 2876e65e175bSOded Gabbay rc = hdev->asic_funcs->load_firmware_to_device(hdev); 2877e65e175bSOded Gabbay if (rc) 2878e65e175bSOded Gabbay goto out; 2879e65e175bSOded Gabbay 2880e65e175bSOded Gabbay if (fw_loader->skip_bmc) { 2881e65e175bSOded Gabbay WREG32(msg_to_cpu_reg, KMD_MSG_SKIP_BMC); 2882e65e175bSOded Gabbay 2883e65e175bSOded Gabbay rc = hl_poll_timeout( 2884e65e175bSOded Gabbay hdev, 2885e65e175bSOded Gabbay cpu_boot_status_reg, 2886e65e175bSOded Gabbay status, 2887e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_BMC_WAITING_SKIPPED), 2888e65e175bSOded Gabbay hdev->fw_poll_interval_usec, 2889e65e175bSOded Gabbay cpu_timeout); 2890e65e175bSOded Gabbay 2891e65e175bSOded Gabbay if (rc) { 2892e65e175bSOded Gabbay dev_err(hdev->dev, 2893eba773d3SMoti Haimovski "Failed to get ACK on skipping BMC (status = %d)\n", 2894e65e175bSOded Gabbay status); 2895e65e175bSOded Gabbay WREG32(msg_to_cpu_reg, KMD_MSG_NA); 2896e65e175bSOded Gabbay rc = -EIO; 2897e65e175bSOded Gabbay goto out; 2898e65e175bSOded Gabbay } 2899e65e175bSOded Gabbay } 2900e65e175bSOded Gabbay 2901e65e175bSOded Gabbay WREG32(msg_to_cpu_reg, KMD_MSG_FIT_RDY); 2902e65e175bSOded Gabbay 2903e65e175bSOded Gabbay rc = hl_poll_timeout( 2904e65e175bSOded Gabbay hdev, 2905e65e175bSOded Gabbay cpu_boot_status_reg, 2906e65e175bSOded Gabbay status, 2907e65e175bSOded Gabbay (status == CPU_BOOT_STATUS_SRAM_AVAIL), 2908e65e175bSOded Gabbay hdev->fw_poll_interval_usec, 2909e65e175bSOded Gabbay cpu_timeout); 2910e65e175bSOded Gabbay 2911e65e175bSOded Gabbay /* Clear message */ 2912e65e175bSOded Gabbay WREG32(msg_to_cpu_reg, KMD_MSG_NA); 2913e65e175bSOded Gabbay 2914e65e175bSOded Gabbay if (rc) { 2915e65e175bSOded Gabbay if (status == CPU_BOOT_STATUS_FIT_CORRUPTED) 2916e65e175bSOded Gabbay dev_err(hdev->dev, 2917e65e175bSOded Gabbay "Device reports FIT image is corrupted\n"); 2918e65e175bSOded Gabbay else 2919e65e175bSOded Gabbay dev_err(hdev->dev, 2920eba773d3SMoti Haimovski "Failed to load firmware to device (status = %d)\n", 2921e65e175bSOded Gabbay status); 2922e65e175bSOded Gabbay 2923e65e175bSOded Gabbay rc = -EIO; 2924e65e175bSOded Gabbay goto out; 2925e65e175bSOded Gabbay } 2926e65e175bSOded Gabbay 2927e65e175bSOded Gabbay rc = fw_read_errors(hdev, fw_loader->static_loader.boot_err0_reg, 2928e65e175bSOded Gabbay fw_loader->static_loader.boot_err1_reg, 2929e65e175bSOded Gabbay cpu_boot_dev_status0_reg, 2930e65e175bSOded Gabbay cpu_boot_dev_status1_reg); 2931e65e175bSOded Gabbay if (rc) 2932e65e175bSOded Gabbay return rc; 2933e65e175bSOded Gabbay 2934e65e175bSOded Gabbay hl_fw_linux_update_state(hdev, cpu_boot_dev_status0_reg, 2935e65e175bSOded Gabbay cpu_boot_dev_status1_reg); 2936e65e175bSOded Gabbay 2937e65e175bSOded Gabbay return 0; 2938e65e175bSOded Gabbay 2939e65e175bSOded Gabbay out: 2940e65e175bSOded Gabbay fw_read_errors(hdev, fw_loader->static_loader.boot_err0_reg, 2941e65e175bSOded Gabbay fw_loader->static_loader.boot_err1_reg, 2942e65e175bSOded Gabbay cpu_boot_dev_status0_reg, 2943e65e175bSOded Gabbay cpu_boot_dev_status1_reg); 2944e65e175bSOded Gabbay 2945e65e175bSOded Gabbay return rc; 2946e65e175bSOded Gabbay } 2947e65e175bSOded Gabbay 2948e65e175bSOded Gabbay /** 2949e65e175bSOded Gabbay * hl_fw_init_cpu - initialize the device CPU 2950e65e175bSOded Gabbay * 2951e65e175bSOded Gabbay * @hdev: pointer to the habanalabs device structure 2952e65e175bSOded Gabbay * 2953e65e175bSOded Gabbay * @return 0 on success, otherwise non-zero error code 2954e65e175bSOded Gabbay * 2955e65e175bSOded Gabbay * perform necessary initializations for device's CPU. takes into account if 2956e65e175bSOded Gabbay * init protocol is static or dynamic. 2957e65e175bSOded Gabbay */ 2958e65e175bSOded Gabbay int hl_fw_init_cpu(struct hl_device *hdev) 2959e65e175bSOded Gabbay { 2960e65e175bSOded Gabbay struct asic_fixed_properties *prop = &hdev->asic_prop; 2961e65e175bSOded Gabbay struct fw_load_mgr *fw_loader = &hdev->fw_loader; 2962e65e175bSOded Gabbay 2963e65e175bSOded Gabbay return prop->dynamic_fw_load ? 2964e65e175bSOded Gabbay hl_fw_dynamic_init_cpu(hdev, fw_loader) : 2965e65e175bSOded Gabbay hl_fw_static_init_cpu(hdev, fw_loader); 2966e65e175bSOded Gabbay } 2967e65e175bSOded Gabbay 2968e65e175bSOded Gabbay void hl_fw_set_pll_profile(struct hl_device *hdev) 2969e65e175bSOded Gabbay { 2970e65e175bSOded Gabbay hl_fw_set_frequency(hdev, hdev->asic_prop.clk_pll_index, 2971e65e175bSOded Gabbay hdev->asic_prop.max_freq_value); 2972e65e175bSOded Gabbay } 2973e65e175bSOded Gabbay 2974e65e175bSOded Gabbay int hl_fw_get_clk_rate(struct hl_device *hdev, u32 *cur_clk, u32 *max_clk) 2975e65e175bSOded Gabbay { 2976e65e175bSOded Gabbay long value; 2977e65e175bSOded Gabbay 2978e65e175bSOded Gabbay if (!hl_device_operational(hdev, NULL)) 2979e65e175bSOded Gabbay return -ENODEV; 2980e65e175bSOded Gabbay 2981e65e175bSOded Gabbay if (!hdev->pdev) { 2982e65e175bSOded Gabbay *cur_clk = 0; 2983e65e175bSOded Gabbay *max_clk = 0; 2984e65e175bSOded Gabbay return 0; 2985e65e175bSOded Gabbay } 2986e65e175bSOded Gabbay 2987e65e175bSOded Gabbay value = hl_fw_get_frequency(hdev, hdev->asic_prop.clk_pll_index, false); 2988e65e175bSOded Gabbay 2989e65e175bSOded Gabbay if (value < 0) { 2990e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to retrieve device max clock %ld\n", value); 2991e65e175bSOded Gabbay return value; 2992e65e175bSOded Gabbay } 2993e65e175bSOded Gabbay 2994e65e175bSOded Gabbay *max_clk = (value / 1000 / 1000); 2995e65e175bSOded Gabbay 2996e65e175bSOded Gabbay value = hl_fw_get_frequency(hdev, hdev->asic_prop.clk_pll_index, true); 2997e65e175bSOded Gabbay 2998e65e175bSOded Gabbay if (value < 0) { 2999e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to retrieve device current clock %ld\n", value); 3000e65e175bSOded Gabbay return value; 3001e65e175bSOded Gabbay } 3002e65e175bSOded Gabbay 3003e65e175bSOded Gabbay *cur_clk = (value / 1000 / 1000); 3004e65e175bSOded Gabbay 3005e65e175bSOded Gabbay return 0; 3006e65e175bSOded Gabbay } 3007e65e175bSOded Gabbay 3008e65e175bSOded Gabbay long hl_fw_get_frequency(struct hl_device *hdev, u32 pll_index, bool curr) 3009e65e175bSOded Gabbay { 3010e65e175bSOded Gabbay struct cpucp_packet pkt; 3011e65e175bSOded Gabbay u32 used_pll_idx; 3012e65e175bSOded Gabbay u64 result; 3013e65e175bSOded Gabbay int rc; 3014e65e175bSOded Gabbay 3015e65e175bSOded Gabbay rc = get_used_pll_index(hdev, pll_index, &used_pll_idx); 3016e65e175bSOded Gabbay if (rc) 3017e65e175bSOded Gabbay return rc; 3018e65e175bSOded Gabbay 3019e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 3020e65e175bSOded Gabbay 3021e65e175bSOded Gabbay if (curr) 3022e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_FREQUENCY_CURR_GET << 3023e65e175bSOded Gabbay CPUCP_PKT_CTL_OPCODE_SHIFT); 3024e65e175bSOded Gabbay else 3025e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_FREQUENCY_GET << CPUCP_PKT_CTL_OPCODE_SHIFT); 3026e65e175bSOded Gabbay 3027e65e175bSOded Gabbay pkt.pll_index = cpu_to_le32((u32)used_pll_idx); 3028e65e175bSOded Gabbay 3029e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 0, &result); 3030e65e175bSOded Gabbay 3031e65e175bSOded Gabbay if (rc) { 3032e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to get frequency of PLL %d, error %d\n", 3033e65e175bSOded Gabbay used_pll_idx, rc); 3034e65e175bSOded Gabbay return rc; 3035e65e175bSOded Gabbay } 3036e65e175bSOded Gabbay 3037e65e175bSOded Gabbay return (long) result; 3038e65e175bSOded Gabbay } 3039e65e175bSOded Gabbay 3040e65e175bSOded Gabbay void hl_fw_set_frequency(struct hl_device *hdev, u32 pll_index, u64 freq) 3041e65e175bSOded Gabbay { 3042e65e175bSOded Gabbay struct cpucp_packet pkt; 3043e65e175bSOded Gabbay u32 used_pll_idx; 3044e65e175bSOded Gabbay int rc; 3045e65e175bSOded Gabbay 3046e65e175bSOded Gabbay rc = get_used_pll_index(hdev, pll_index, &used_pll_idx); 3047e65e175bSOded Gabbay if (rc) 3048e65e175bSOded Gabbay return; 3049e65e175bSOded Gabbay 3050e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 3051e65e175bSOded Gabbay 3052e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_FREQUENCY_SET << CPUCP_PKT_CTL_OPCODE_SHIFT); 3053e65e175bSOded Gabbay pkt.pll_index = cpu_to_le32((u32)used_pll_idx); 3054e65e175bSOded Gabbay pkt.value = cpu_to_le64(freq); 3055e65e175bSOded Gabbay 3056e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 0, NULL); 3057e65e175bSOded Gabbay 3058e65e175bSOded Gabbay if (rc) 3059e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to set frequency to PLL %d, error %d\n", 3060e65e175bSOded Gabbay used_pll_idx, rc); 3061e65e175bSOded Gabbay } 3062e65e175bSOded Gabbay 3063e65e175bSOded Gabbay long hl_fw_get_max_power(struct hl_device *hdev) 3064e65e175bSOded Gabbay { 3065e65e175bSOded Gabbay struct cpucp_packet pkt; 3066e65e175bSOded Gabbay u64 result; 3067e65e175bSOded Gabbay int rc; 3068e65e175bSOded Gabbay 3069e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 3070e65e175bSOded Gabbay 3071e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_MAX_POWER_GET << CPUCP_PKT_CTL_OPCODE_SHIFT); 3072e65e175bSOded Gabbay 3073e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 0, &result); 3074e65e175bSOded Gabbay 3075e65e175bSOded Gabbay if (rc) { 3076e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to get max power, error %d\n", rc); 3077e65e175bSOded Gabbay return rc; 3078e65e175bSOded Gabbay } 3079e65e175bSOded Gabbay 3080e65e175bSOded Gabbay return result; 3081e65e175bSOded Gabbay } 3082e65e175bSOded Gabbay 3083e65e175bSOded Gabbay void hl_fw_set_max_power(struct hl_device *hdev) 3084e65e175bSOded Gabbay { 3085e65e175bSOded Gabbay struct cpucp_packet pkt; 3086e65e175bSOded Gabbay int rc; 3087e65e175bSOded Gabbay 3088e65e175bSOded Gabbay /* TODO: remove this after simulator supports this packet */ 3089e65e175bSOded Gabbay if (!hdev->pdev) 3090e65e175bSOded Gabbay return; 3091e65e175bSOded Gabbay 3092e65e175bSOded Gabbay memset(&pkt, 0, sizeof(pkt)); 3093e65e175bSOded Gabbay 3094e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_MAX_POWER_SET << CPUCP_PKT_CTL_OPCODE_SHIFT); 3095e65e175bSOded Gabbay pkt.value = cpu_to_le64(hdev->max_power); 3096e65e175bSOded Gabbay 3097e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 0, NULL); 3098e65e175bSOded Gabbay 3099e65e175bSOded Gabbay if (rc) 3100e65e175bSOded Gabbay dev_err(hdev->dev, "Failed to set max power, error %d\n", rc); 3101e65e175bSOded Gabbay } 3102e65e175bSOded Gabbay 3103e65e175bSOded Gabbay static int hl_fw_get_sec_attest_data(struct hl_device *hdev, u32 packet_id, void *data, u32 size, 3104e65e175bSOded Gabbay u32 nonce, u32 timeout) 3105e65e175bSOded Gabbay { 3106e65e175bSOded Gabbay struct cpucp_packet pkt = {}; 3107e65e175bSOded Gabbay dma_addr_t req_dma_addr; 3108e65e175bSOded Gabbay void *req_cpu_addr; 3109e65e175bSOded Gabbay int rc; 3110e65e175bSOded Gabbay 3111e65e175bSOded Gabbay req_cpu_addr = hl_cpu_accessible_dma_pool_alloc(hdev, size, &req_dma_addr); 3112e65e175bSOded Gabbay if (!req_cpu_addr) { 3113e65e175bSOded Gabbay dev_err(hdev->dev, 3114e65e175bSOded Gabbay "Failed to allocate DMA memory for CPU-CP packet %u\n", packet_id); 3115e65e175bSOded Gabbay return -ENOMEM; 3116e65e175bSOded Gabbay } 3117e65e175bSOded Gabbay 3118e65e175bSOded Gabbay memset(data, 0, size); 3119e65e175bSOded Gabbay 3120e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(packet_id << CPUCP_PKT_CTL_OPCODE_SHIFT); 3121e65e175bSOded Gabbay pkt.addr = cpu_to_le64(req_dma_addr); 3122e65e175bSOded Gabbay pkt.data_max_size = cpu_to_le32(size); 3123e65e175bSOded Gabbay pkt.nonce = cpu_to_le32(nonce); 3124e65e175bSOded Gabbay 3125e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *) &pkt, sizeof(pkt), 3126e65e175bSOded Gabbay timeout, NULL); 3127e65e175bSOded Gabbay if (rc) { 3128e65e175bSOded Gabbay dev_err(hdev->dev, 3129e65e175bSOded Gabbay "Failed to handle CPU-CP pkt %u, error %d\n", packet_id, rc); 3130e65e175bSOded Gabbay goto out; 3131e65e175bSOded Gabbay } 3132e65e175bSOded Gabbay 3133e65e175bSOded Gabbay memcpy(data, req_cpu_addr, size); 3134e65e175bSOded Gabbay 3135e65e175bSOded Gabbay out: 3136e65e175bSOded Gabbay hl_cpu_accessible_dma_pool_free(hdev, size, req_cpu_addr); 3137e65e175bSOded Gabbay 3138e65e175bSOded Gabbay return rc; 3139e65e175bSOded Gabbay } 3140e65e175bSOded Gabbay 3141e65e175bSOded Gabbay int hl_fw_get_sec_attest_info(struct hl_device *hdev, struct cpucp_sec_attest_info *sec_attest_info, 3142e65e175bSOded Gabbay u32 nonce) 3143e65e175bSOded Gabbay { 3144e65e175bSOded Gabbay return hl_fw_get_sec_attest_data(hdev, CPUCP_PACKET_SEC_ATTEST_GET, sec_attest_info, 3145e65e175bSOded Gabbay sizeof(struct cpucp_sec_attest_info), nonce, 3146e65e175bSOded Gabbay HL_CPUCP_SEC_ATTEST_INFO_TINEOUT_USEC); 3147e65e175bSOded Gabbay } 3148e65e175bSOded Gabbay 3149e65e175bSOded Gabbay int hl_fw_send_generic_request(struct hl_device *hdev, enum hl_passthrough_type sub_opcode, 3150e65e175bSOded Gabbay dma_addr_t buff, u32 *size) 3151e65e175bSOded Gabbay { 31527cd6b562STomer Tayar struct cpucp_packet pkt = {}; 3153e65e175bSOded Gabbay u64 result; 3154e65e175bSOded Gabbay int rc = 0; 3155e65e175bSOded Gabbay 3156e65e175bSOded Gabbay pkt.ctl = cpu_to_le32(CPUCP_PACKET_GENERIC_PASSTHROUGH << CPUCP_PKT_CTL_OPCODE_SHIFT); 3157e65e175bSOded Gabbay pkt.addr = cpu_to_le64(buff); 3158e65e175bSOded Gabbay pkt.data_max_size = cpu_to_le32(*size); 3159e65e175bSOded Gabbay pkt.pkt_subidx = cpu_to_le32(sub_opcode); 3160e65e175bSOded Gabbay 3161e65e175bSOded Gabbay rc = hdev->asic_funcs->send_cpu_message(hdev, (u32 *)&pkt, sizeof(pkt), 3162e65e175bSOded Gabbay HL_CPUCP_INFO_TIMEOUT_USEC, &result); 3163e65e175bSOded Gabbay if (rc) 3164e65e175bSOded Gabbay dev_err(hdev->dev, "failed to send CPUCP data of generic fw pkt\n"); 3165e65e175bSOded Gabbay else 3166e65e175bSOded Gabbay dev_dbg(hdev->dev, "generic pkt was successful, result: 0x%llx\n", result); 3167e65e175bSOded Gabbay 3168e65e175bSOded Gabbay *size = (u32)result; 3169e65e175bSOded Gabbay 3170e65e175bSOded Gabbay return rc; 3171e65e175bSOded Gabbay } 3172