| 1 | /* SPDX-License-Identifier: GPL-2.0 |
| 2 | * |
| 3 | * Copyright 2016-2022 HabanaLabs, Ltd. |
| 4 | * All Rights Reserved. |
| 5 | * |
| 6 | */ |
| 7 | |
| 8 | #ifndef GOYAP_H_ |
| 9 | #define GOYAP_H_ |
| 10 | |
| 11 | #include <uapi/drm/habanalabs_accel.h> |
| 12 | #include <linux/habanalabs/hl_boot_if.h> |
| 13 | #include "../common/habanalabs.h" |
| 14 | #include "../include/goya/goya_packets.h" |
| 15 | #include "../include/goya/goya.h" |
| 16 | #include "../include/goya/goya_async_events.h" |
| 17 | #include "../include/goya/goya_fw_if.h" |
| 18 | |
| 19 | #define NUMBER_OF_CMPLT_QUEUES 5 |
| 20 | #define NUMBER_OF_EXT_HW_QUEUES 5 |
| 21 | #define NUMBER_OF_CPU_HW_QUEUES 1 |
| 22 | #define NUMBER_OF_INT_HW_QUEUES 9 |
| 23 | #define NUMBER_OF_HW_QUEUES (NUMBER_OF_EXT_HW_QUEUES + \ |
| 24 | NUMBER_OF_CPU_HW_QUEUES + \ |
| 25 | NUMBER_OF_INT_HW_QUEUES) |
| 26 | |
| 27 | /* |
| 28 | * Number of MSIX interrupts IDS: |
| 29 | * Each completion queue has 1 ID |
| 30 | * The event queue has 1 ID |
| 31 | */ |
| 32 | #define NUMBER_OF_INTERRUPTS (NUMBER_OF_CMPLT_QUEUES + 1) |
| 33 | |
| 34 | #if (NUMBER_OF_INTERRUPTS > GOYA_MSIX_ENTRIES) |
| 35 | #error "Number of MSIX interrupts must be smaller or equal to GOYA_MSIX_ENTRIES" |
| 36 | #endif |
| 37 | |
| 38 | #define QMAN_FENCE_TIMEOUT_USEC 10000 /* 10 ms */ |
| 39 | |
| 40 | #define QMAN_STOP_TIMEOUT_USEC 100000 /* 100 ms */ |
| 41 | |
| 42 | #define CORESIGHT_TIMEOUT_USEC 100000 /* 100 ms */ |
| 43 | |
| 44 | #define GOYA_CPU_TIMEOUT_USEC 15000000 /* 15s */ |
| 45 | |
| 46 | #define TPC_ENABLED_MASK 0xFF |
| 47 | |
| 48 | #define PLL_HIGH_DEFAULT 1575000000 /* 1.575 GHz */ |
| 49 | |
| 50 | #define MAX_POWER_DEFAULT 200000 /* 200W */ |
| 51 | |
| 52 | #define DC_POWER_DEFAULT 20000 /* 20W */ |
| 53 | |
| 54 | #define DRAM_PHYS_DEFAULT_SIZE 0x100000000ull /* 4GB */ |
| 55 | |
| 56 | #define GOYA_DEFAULT_CARD_NAME "HL1000" |
| 57 | |
| 58 | #define GOYA_MAX_PENDING_CS 64 |
| 59 | |
| 60 | #if !IS_MAX_PENDING_CS_VALID(GOYA_MAX_PENDING_CS) |
| 61 | #error "GOYA_MAX_PENDING_CS must be power of 2 and greater than 1" |
| 62 | #endif |
| 63 | |
| 64 | /* DRAM Memory Map */ |
| 65 | |
| 66 | #define CPU_FW_IMAGE_SIZE 0x10000000 /* 256MB */ |
| 67 | #define MMU_PAGE_TABLES_SIZE 0x0FC00000 /* 252MB */ |
| 68 | #define MMU_DRAM_DEFAULT_PAGE_SIZE 0x00200000 /* 2MB */ |
| 69 | #define MMU_CACHE_MNG_SIZE 0x00001000 /* 4KB */ |
| 70 | |
| 71 | #define CPU_FW_IMAGE_ADDR DRAM_PHYS_BASE |
| 72 | #define MMU_PAGE_TABLES_ADDR (CPU_FW_IMAGE_ADDR + CPU_FW_IMAGE_SIZE) |
| 73 | #define MMU_DRAM_DEFAULT_PAGE_ADDR (MMU_PAGE_TABLES_ADDR + \ |
| 74 | MMU_PAGE_TABLES_SIZE) |
| 75 | #define MMU_CACHE_MNG_ADDR (MMU_DRAM_DEFAULT_PAGE_ADDR + \ |
| 76 | MMU_DRAM_DEFAULT_PAGE_SIZE) |
| 77 | #define DRAM_DRIVER_END_ADDR (MMU_CACHE_MNG_ADDR + \ |
| 78 | MMU_CACHE_MNG_SIZE) |
| 79 | |
| 80 | #define DRAM_BASE_ADDR_USER 0x20000000 |
| 81 | |
| 82 | #if (DRAM_DRIVER_END_ADDR > DRAM_BASE_ADDR_USER) |
| 83 | #error "Driver must reserve no more than 512MB" |
| 84 | #endif |
| 85 | |
| 86 | /* |
| 87 | * SRAM Memory Map for Driver |
| 88 | * |
| 89 | * Driver occupies DRIVER_SRAM_SIZE bytes from the start of SRAM. It is used for |
| 90 | * MME/TPC QMANs |
| 91 | * |
| 92 | */ |
| 93 | |
| 94 | #define MME_QMAN_BASE_OFFSET 0x000000 /* Must be 0 */ |
| 95 | #define MME_QMAN_LENGTH 64 |
| 96 | #define TPC_QMAN_LENGTH 64 |
| 97 | |
| 98 | #define TPC0_QMAN_BASE_OFFSET (MME_QMAN_BASE_OFFSET + \ |
| 99 | (MME_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 100 | #define TPC1_QMAN_BASE_OFFSET (TPC0_QMAN_BASE_OFFSET + \ |
| 101 | (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 102 | #define TPC2_QMAN_BASE_OFFSET (TPC1_QMAN_BASE_OFFSET + \ |
| 103 | (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 104 | #define TPC3_QMAN_BASE_OFFSET (TPC2_QMAN_BASE_OFFSET + \ |
| 105 | (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 106 | #define TPC4_QMAN_BASE_OFFSET (TPC3_QMAN_BASE_OFFSET + \ |
| 107 | (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 108 | #define TPC5_QMAN_BASE_OFFSET (TPC4_QMAN_BASE_OFFSET + \ |
| 109 | (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 110 | #define TPC6_QMAN_BASE_OFFSET (TPC5_QMAN_BASE_OFFSET + \ |
| 111 | (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 112 | #define TPC7_QMAN_BASE_OFFSET (TPC6_QMAN_BASE_OFFSET + \ |
| 113 | (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 114 | |
| 115 | #define SRAM_DRIVER_RES_OFFSET (TPC7_QMAN_BASE_OFFSET + \ |
| 116 | (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) |
| 117 | |
| 118 | #if (SRAM_DRIVER_RES_OFFSET >= GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START) |
| 119 | #error "MME/TPC QMANs SRAM space exceeds limit" |
| 120 | #endif |
| 121 | |
| 122 | #define SRAM_USER_BASE_OFFSET GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START |
| 123 | |
| 124 | /* Virtual address space */ |
| 125 | #define VA_HOST_SPACE_START 0x1000000000000ull /* 256TB */ |
| 126 | #define VA_HOST_SPACE_END 0x3FF8000000000ull /* 1PB - 1TB */ |
| 127 | #define VA_HOST_SPACE_SIZE (VA_HOST_SPACE_END - \ |
| 128 | VA_HOST_SPACE_START) /* 767TB */ |
| 129 | |
| 130 | #define VA_DDR_SPACE_START 0x800000000ull /* 32GB */ |
| 131 | #define VA_DDR_SPACE_END 0x2000000000ull /* 128GB */ |
| 132 | #define VA_DDR_SPACE_SIZE (VA_DDR_SPACE_END - \ |
| 133 | VA_DDR_SPACE_START) /* 128GB */ |
| 134 | |
| 135 | #if (HL_CPU_ACCESSIBLE_MEM_SIZE != SZ_2M) |
| 136 | #error "HL_CPU_ACCESSIBLE_MEM_SIZE must be exactly 2MB to enable MMU mapping" |
| 137 | #endif |
| 138 | |
| 139 | #define VA_CPU_ACCESSIBLE_MEM_ADDR 0x8000000000ull |
| 140 | |
| 141 | #define DMA_MAX_TRANSFER_SIZE U32_MAX |
| 142 | |
| 143 | #define HW_CAP_PLL 0x00000001 |
| 144 | #define HW_CAP_DDR_0 0x00000002 |
| 145 | #define HW_CAP_DDR_1 0x00000004 |
| 146 | #define HW_CAP_MME 0x00000008 |
| 147 | #define HW_CAP_CPU 0x00000010 |
| 148 | #define HW_CAP_DMA 0x00000020 |
| 149 | #define HW_CAP_MSIX 0x00000040 |
| 150 | #define HW_CAP_CPU_Q 0x00000080 |
| 151 | #define HW_CAP_MMU 0x00000100 |
| 152 | #define HW_CAP_TPC_MBIST 0x00000200 |
| 153 | #define HW_CAP_GOLDEN 0x00000400 |
| 154 | #define HW_CAP_TPC 0x00000800 |
| 155 | |
| 156 | struct goya_work_freq { |
| 157 | struct hl_device *hdev; |
| 158 | struct delayed_work work_freq; |
| 159 | }; |
| 160 | |
| 161 | struct goya_device { |
| 162 | /* TODO: remove hw_queues_lock after moving to scheduler code */ |
| 163 | spinlock_t hw_queues_lock; |
| 164 | struct goya_work_freq *goya_work; |
| 165 | |
| 166 | u64 mme_clk; |
| 167 | u64 tpc_clk; |
| 168 | u64 ic_clk; |
| 169 | |
| 170 | u64 ddr_bar_cur_addr; |
| 171 | u32 events_stat[GOYA_ASYNC_EVENT_ID_SIZE]; |
| 172 | u32 events_stat_aggregate[GOYA_ASYNC_EVENT_ID_SIZE]; |
| 173 | u32 hw_cap_initialized; |
| 174 | u8 device_cpu_mmu_mappings_done; |
| 175 | |
| 176 | enum hl_pll_frequency curr_pll_profile; |
| 177 | enum hl_pm_mng_profile pm_mng_profile; |
| 178 | }; |
| 179 | |
| 180 | int goya_set_fixed_properties(struct hl_device *hdev); |
| 181 | int goya_mmu_init(struct hl_device *hdev); |
| 182 | void goya_init_dma_qmans(struct hl_device *hdev); |
| 183 | void goya_init_mme_qmans(struct hl_device *hdev); |
| 184 | void goya_init_tpc_qmans(struct hl_device *hdev); |
| 185 | int goya_init_cpu_queues(struct hl_device *hdev); |
| 186 | void goya_init_security(struct hl_device *hdev); |
| 187 | void goya_ack_protection_bits_errors(struct hl_device *hdev); |
| 188 | int goya_late_init(struct hl_device *hdev); |
| 189 | void goya_late_fini(struct hl_device *hdev); |
| 190 | |
| 191 | void goya_ring_doorbell(struct hl_device *hdev, u32 hw_queue_id, u32 pi); |
| 192 | void goya_pqe_write(struct hl_device *hdev, __le64 *pqe, struct hl_bd *bd); |
| 193 | void goya_update_eq_ci(struct hl_device *hdev, u32 val); |
| 194 | void goya_restore_phase_topology(struct hl_device *hdev); |
| 195 | int goya_context_switch(struct hl_device *hdev, u32 asid); |
| 196 | |
| 197 | int goya_debugfs_i2c_read(struct hl_device *hdev, u8 i2c_bus, |
| 198 | u8 i2c_addr, u8 i2c_reg, u32 *val); |
| 199 | int goya_debugfs_i2c_write(struct hl_device *hdev, u8 i2c_bus, |
| 200 | u8 i2c_addr, u8 i2c_reg, u32 val); |
| 201 | void goya_debugfs_led_set(struct hl_device *hdev, u8 led, u8 state); |
| 202 | |
| 203 | int goya_test_queue(struct hl_device *hdev, u32 hw_queue_id); |
| 204 | int goya_test_queues(struct hl_device *hdev); |
| 205 | int goya_test_cpu_queue(struct hl_device *hdev); |
| 206 | int goya_send_cpu_message(struct hl_device *hdev, u32 *msg, u16 len, |
| 207 | u32 timeout, u64 *result); |
| 208 | |
| 209 | long goya_get_temperature(struct hl_device *hdev, int sensor_index, u32 attr); |
| 210 | long goya_get_voltage(struct hl_device *hdev, int sensor_index, u32 attr); |
| 211 | long goya_get_current(struct hl_device *hdev, int sensor_index, u32 attr); |
| 212 | long goya_get_fan_speed(struct hl_device *hdev, int sensor_index, u32 attr); |
| 213 | long goya_get_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr); |
| 214 | void goya_set_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr, |
| 215 | long value); |
| 216 | u64 goya_get_max_power(struct hl_device *hdev); |
| 217 | void goya_set_max_power(struct hl_device *hdev, u64 value); |
| 218 | |
| 219 | void goya_set_pll_profile(struct hl_device *hdev, enum hl_pll_frequency freq); |
| 220 | void goya_add_device_attr(struct hl_device *hdev, struct attribute_group *dev_clk_attr_grp, |
| 221 | struct attribute_group *dev_vrm_attr_grp); |
| 222 | int goya_cpucp_info_get(struct hl_device *hdev); |
| 223 | int goya_debug_coresight(struct hl_device *hdev, struct hl_ctx *ctx, void *data); |
| 224 | void goya_halt_coresight(struct hl_device *hdev, struct hl_ctx *ctx); |
| 225 | |
| 226 | int goya_suspend(struct hl_device *hdev); |
| 227 | int goya_resume(struct hl_device *hdev); |
| 228 | |
| 229 | void goya_handle_eqe(struct hl_device *hdev, struct hl_eq_entry *eq_entry); |
| 230 | void *goya_get_events_stat(struct hl_device *hdev, bool aggregate, u32 *size); |
| 231 | |
| 232 | void goya_add_end_of_cb_packets(struct hl_device *hdev, void *kernel_address, |
| 233 | u32 len, u32 original_len, u64 cq_addr, u32 cq_val, |
| 234 | u32 msix_vec, bool eb); |
| 235 | int goya_cs_parser(struct hl_device *hdev, struct hl_cs_parser *parser); |
| 236 | int goya_scrub_device_mem(struct hl_device *hdev); |
| 237 | void *goya_get_int_queue_base(struct hl_device *hdev, u32 queue_id, |
| 238 | dma_addr_t *dma_handle, u16 *queue_len); |
| 239 | u32 goya_get_dma_desc_list_size(struct hl_device *hdev, struct sg_table *sgt); |
| 240 | int goya_send_heartbeat(struct hl_device *hdev); |
| 241 | void *goya_cpu_accessible_dma_pool_alloc(struct hl_device *hdev, size_t size, |
| 242 | dma_addr_t *dma_handle); |
| 243 | void goya_cpu_accessible_dma_pool_free(struct hl_device *hdev, size_t size, |
| 244 | void *vaddr); |
| 245 | void goya_mmu_remove_device_cpu_mappings(struct hl_device *hdev); |
| 246 | |
| 247 | u32 goya_get_queue_id_for_cq(struct hl_device *hdev, u32 cq_idx); |
| 248 | u64 goya_get_device_time(struct hl_device *hdev); |
| 249 | int goya_set_frequency(struct hl_device *hdev, enum hl_pll_frequency freq); |
| 250 | |
| 251 | #endif /* GOYAP_H_ */ |
| 252 | |