1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0 2*4882a593Smuzhiyun * 3*4882a593Smuzhiyun * Copyright 2016-2019 HabanaLabs, Ltd. 4*4882a593Smuzhiyun * All Rights Reserved. 5*4882a593Smuzhiyun * 6*4882a593Smuzhiyun */ 7*4882a593Smuzhiyun 8*4882a593Smuzhiyun #ifndef GOYAP_H_ 9*4882a593Smuzhiyun #define GOYAP_H_ 10*4882a593Smuzhiyun 11*4882a593Smuzhiyun #include <uapi/misc/habanalabs.h> 12*4882a593Smuzhiyun #include "../common/habanalabs.h" 13*4882a593Smuzhiyun #include "../include/common/hl_boot_if.h" 14*4882a593Smuzhiyun #include "../include/goya/goya_packets.h" 15*4882a593Smuzhiyun #include "../include/goya/goya.h" 16*4882a593Smuzhiyun #include "../include/goya/goya_async_events.h" 17*4882a593Smuzhiyun #include "../include/goya/goya_fw_if.h" 18*4882a593Smuzhiyun 19*4882a593Smuzhiyun #define NUMBER_OF_CMPLT_QUEUES 5 20*4882a593Smuzhiyun #define NUMBER_OF_EXT_HW_QUEUES 5 21*4882a593Smuzhiyun #define NUMBER_OF_CPU_HW_QUEUES 1 22*4882a593Smuzhiyun #define NUMBER_OF_INT_HW_QUEUES 9 23*4882a593Smuzhiyun #define NUMBER_OF_HW_QUEUES (NUMBER_OF_EXT_HW_QUEUES + \ 24*4882a593Smuzhiyun NUMBER_OF_CPU_HW_QUEUES + \ 25*4882a593Smuzhiyun NUMBER_OF_INT_HW_QUEUES) 26*4882a593Smuzhiyun 27*4882a593Smuzhiyun /* 28*4882a593Smuzhiyun * Number of MSIX interrupts IDS: 29*4882a593Smuzhiyun * Each completion queue has 1 ID 30*4882a593Smuzhiyun * The event queue has 1 ID 31*4882a593Smuzhiyun */ 32*4882a593Smuzhiyun #define NUMBER_OF_INTERRUPTS (NUMBER_OF_CMPLT_QUEUES + 1) 33*4882a593Smuzhiyun 34*4882a593Smuzhiyun #if (NUMBER_OF_INTERRUPTS > GOYA_MSIX_ENTRIES) 35*4882a593Smuzhiyun #error "Number of MSIX interrupts must be smaller or equal to GOYA_MSIX_ENTRIES" 36*4882a593Smuzhiyun #endif 37*4882a593Smuzhiyun 38*4882a593Smuzhiyun #define QMAN_FENCE_TIMEOUT_USEC 10000 /* 10 ms */ 39*4882a593Smuzhiyun 40*4882a593Smuzhiyun #define QMAN_STOP_TIMEOUT_USEC 100000 /* 100 ms */ 41*4882a593Smuzhiyun 42*4882a593Smuzhiyun #define CORESIGHT_TIMEOUT_USEC 100000 /* 100 ms */ 43*4882a593Smuzhiyun 44*4882a593Smuzhiyun #define GOYA_CPU_TIMEOUT_USEC 15000000 /* 15s */ 45*4882a593Smuzhiyun 46*4882a593Smuzhiyun #define TPC_ENABLED_MASK 0xFF 47*4882a593Smuzhiyun 48*4882a593Smuzhiyun #define PLL_HIGH_DEFAULT 1575000000 /* 1.575 GHz */ 49*4882a593Smuzhiyun 50*4882a593Smuzhiyun #define MAX_POWER_DEFAULT 200000 /* 200W */ 51*4882a593Smuzhiyun 52*4882a593Smuzhiyun #define DRAM_PHYS_DEFAULT_SIZE 0x100000000ull /* 4GB */ 53*4882a593Smuzhiyun 54*4882a593Smuzhiyun #define GOYA_DEFAULT_CARD_NAME "HL1000" 55*4882a593Smuzhiyun 56*4882a593Smuzhiyun #define GOYA_MAX_PENDING_CS 64 57*4882a593Smuzhiyun 58*4882a593Smuzhiyun #if !IS_MAX_PENDING_CS_VALID(GOYA_MAX_PENDING_CS) 59*4882a593Smuzhiyun #error "GOYA_MAX_PENDING_CS must be power of 2 and greater than 1" 60*4882a593Smuzhiyun #endif 61*4882a593Smuzhiyun 62*4882a593Smuzhiyun /* DRAM Memory Map */ 63*4882a593Smuzhiyun 64*4882a593Smuzhiyun #define CPU_FW_IMAGE_SIZE 0x10000000 /* 256MB */ 65*4882a593Smuzhiyun #define MMU_PAGE_TABLES_SIZE 0x0FC00000 /* 252MB */ 66*4882a593Smuzhiyun #define MMU_DRAM_DEFAULT_PAGE_SIZE 0x00200000 /* 2MB */ 67*4882a593Smuzhiyun #define MMU_CACHE_MNG_SIZE 0x00001000 /* 4KB */ 68*4882a593Smuzhiyun 69*4882a593Smuzhiyun #define CPU_FW_IMAGE_ADDR DRAM_PHYS_BASE 70*4882a593Smuzhiyun #define MMU_PAGE_TABLES_ADDR (CPU_FW_IMAGE_ADDR + CPU_FW_IMAGE_SIZE) 71*4882a593Smuzhiyun #define MMU_DRAM_DEFAULT_PAGE_ADDR (MMU_PAGE_TABLES_ADDR + \ 72*4882a593Smuzhiyun MMU_PAGE_TABLES_SIZE) 73*4882a593Smuzhiyun #define MMU_CACHE_MNG_ADDR (MMU_DRAM_DEFAULT_PAGE_ADDR + \ 74*4882a593Smuzhiyun MMU_DRAM_DEFAULT_PAGE_SIZE) 75*4882a593Smuzhiyun #define DRAM_DRIVER_END_ADDR (MMU_CACHE_MNG_ADDR + \ 76*4882a593Smuzhiyun MMU_CACHE_MNG_SIZE) 77*4882a593Smuzhiyun 78*4882a593Smuzhiyun #define DRAM_BASE_ADDR_USER 0x20000000 79*4882a593Smuzhiyun 80*4882a593Smuzhiyun #if (DRAM_DRIVER_END_ADDR > DRAM_BASE_ADDR_USER) 81*4882a593Smuzhiyun #error "Driver must reserve no more than 512MB" 82*4882a593Smuzhiyun #endif 83*4882a593Smuzhiyun 84*4882a593Smuzhiyun /* 85*4882a593Smuzhiyun * SRAM Memory Map for Driver 86*4882a593Smuzhiyun * 87*4882a593Smuzhiyun * Driver occupies DRIVER_SRAM_SIZE bytes from the start of SRAM. It is used for 88*4882a593Smuzhiyun * MME/TPC QMANs 89*4882a593Smuzhiyun * 90*4882a593Smuzhiyun */ 91*4882a593Smuzhiyun 92*4882a593Smuzhiyun #define MME_QMAN_BASE_OFFSET 0x000000 /* Must be 0 */ 93*4882a593Smuzhiyun #define MME_QMAN_LENGTH 64 94*4882a593Smuzhiyun #define TPC_QMAN_LENGTH 64 95*4882a593Smuzhiyun 96*4882a593Smuzhiyun #define TPC0_QMAN_BASE_OFFSET (MME_QMAN_BASE_OFFSET + \ 97*4882a593Smuzhiyun (MME_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 98*4882a593Smuzhiyun #define TPC1_QMAN_BASE_OFFSET (TPC0_QMAN_BASE_OFFSET + \ 99*4882a593Smuzhiyun (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 100*4882a593Smuzhiyun #define TPC2_QMAN_BASE_OFFSET (TPC1_QMAN_BASE_OFFSET + \ 101*4882a593Smuzhiyun (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 102*4882a593Smuzhiyun #define TPC3_QMAN_BASE_OFFSET (TPC2_QMAN_BASE_OFFSET + \ 103*4882a593Smuzhiyun (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 104*4882a593Smuzhiyun #define TPC4_QMAN_BASE_OFFSET (TPC3_QMAN_BASE_OFFSET + \ 105*4882a593Smuzhiyun (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 106*4882a593Smuzhiyun #define TPC5_QMAN_BASE_OFFSET (TPC4_QMAN_BASE_OFFSET + \ 107*4882a593Smuzhiyun (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 108*4882a593Smuzhiyun #define TPC6_QMAN_BASE_OFFSET (TPC5_QMAN_BASE_OFFSET + \ 109*4882a593Smuzhiyun (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 110*4882a593Smuzhiyun #define TPC7_QMAN_BASE_OFFSET (TPC6_QMAN_BASE_OFFSET + \ 111*4882a593Smuzhiyun (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 112*4882a593Smuzhiyun 113*4882a593Smuzhiyun #define SRAM_DRIVER_RES_OFFSET (TPC7_QMAN_BASE_OFFSET + \ 114*4882a593Smuzhiyun (TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE)) 115*4882a593Smuzhiyun 116*4882a593Smuzhiyun #if (SRAM_DRIVER_RES_OFFSET >= GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START) 117*4882a593Smuzhiyun #error "MME/TPC QMANs SRAM space exceeds limit" 118*4882a593Smuzhiyun #endif 119*4882a593Smuzhiyun 120*4882a593Smuzhiyun #define SRAM_USER_BASE_OFFSET GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START 121*4882a593Smuzhiyun 122*4882a593Smuzhiyun /* Virtual address space */ 123*4882a593Smuzhiyun #define VA_HOST_SPACE_START 0x1000000000000ull /* 256TB */ 124*4882a593Smuzhiyun #define VA_HOST_SPACE_END 0x3FF8000000000ull /* 1PB - 1TB */ 125*4882a593Smuzhiyun #define VA_HOST_SPACE_SIZE (VA_HOST_SPACE_END - \ 126*4882a593Smuzhiyun VA_HOST_SPACE_START) /* 767TB */ 127*4882a593Smuzhiyun 128*4882a593Smuzhiyun #define VA_DDR_SPACE_START 0x800000000ull /* 32GB */ 129*4882a593Smuzhiyun #define VA_DDR_SPACE_END 0x2000000000ull /* 128GB */ 130*4882a593Smuzhiyun #define VA_DDR_SPACE_SIZE (VA_DDR_SPACE_END - \ 131*4882a593Smuzhiyun VA_DDR_SPACE_START) /* 128GB */ 132*4882a593Smuzhiyun 133*4882a593Smuzhiyun #if (HL_CPU_ACCESSIBLE_MEM_SIZE != SZ_2M) 134*4882a593Smuzhiyun #error "HL_CPU_ACCESSIBLE_MEM_SIZE must be exactly 2MB to enable MMU mapping" 135*4882a593Smuzhiyun #endif 136*4882a593Smuzhiyun 137*4882a593Smuzhiyun #define VA_CPU_ACCESSIBLE_MEM_ADDR 0x8000000000ull 138*4882a593Smuzhiyun 139*4882a593Smuzhiyun #define DMA_MAX_TRANSFER_SIZE U32_MAX 140*4882a593Smuzhiyun 141*4882a593Smuzhiyun #define HW_CAP_PLL 0x00000001 142*4882a593Smuzhiyun #define HW_CAP_DDR_0 0x00000002 143*4882a593Smuzhiyun #define HW_CAP_DDR_1 0x00000004 144*4882a593Smuzhiyun #define HW_CAP_MME 0x00000008 145*4882a593Smuzhiyun #define HW_CAP_CPU 0x00000010 146*4882a593Smuzhiyun #define HW_CAP_DMA 0x00000020 147*4882a593Smuzhiyun #define HW_CAP_MSIX 0x00000040 148*4882a593Smuzhiyun #define HW_CAP_CPU_Q 0x00000080 149*4882a593Smuzhiyun #define HW_CAP_MMU 0x00000100 150*4882a593Smuzhiyun #define HW_CAP_TPC_MBIST 0x00000200 151*4882a593Smuzhiyun #define HW_CAP_GOLDEN 0x00000400 152*4882a593Smuzhiyun #define HW_CAP_TPC 0x00000800 153*4882a593Smuzhiyun 154*4882a593Smuzhiyun struct goya_device { 155*4882a593Smuzhiyun /* TODO: remove hw_queues_lock after moving to scheduler code */ 156*4882a593Smuzhiyun spinlock_t hw_queues_lock; 157*4882a593Smuzhiyun 158*4882a593Smuzhiyun u64 mme_clk; 159*4882a593Smuzhiyun u64 tpc_clk; 160*4882a593Smuzhiyun u64 ic_clk; 161*4882a593Smuzhiyun 162*4882a593Smuzhiyun u64 ddr_bar_cur_addr; 163*4882a593Smuzhiyun u32 events_stat[GOYA_ASYNC_EVENT_ID_SIZE]; 164*4882a593Smuzhiyun u32 events_stat_aggregate[GOYA_ASYNC_EVENT_ID_SIZE]; 165*4882a593Smuzhiyun u32 hw_cap_initialized; 166*4882a593Smuzhiyun u8 device_cpu_mmu_mappings_done; 167*4882a593Smuzhiyun }; 168*4882a593Smuzhiyun 169*4882a593Smuzhiyun int goya_get_fixed_properties(struct hl_device *hdev); 170*4882a593Smuzhiyun int goya_mmu_init(struct hl_device *hdev); 171*4882a593Smuzhiyun void goya_init_dma_qmans(struct hl_device *hdev); 172*4882a593Smuzhiyun void goya_init_mme_qmans(struct hl_device *hdev); 173*4882a593Smuzhiyun void goya_init_tpc_qmans(struct hl_device *hdev); 174*4882a593Smuzhiyun int goya_init_cpu_queues(struct hl_device *hdev); 175*4882a593Smuzhiyun void goya_init_security(struct hl_device *hdev); 176*4882a593Smuzhiyun int goya_late_init(struct hl_device *hdev); 177*4882a593Smuzhiyun void goya_late_fini(struct hl_device *hdev); 178*4882a593Smuzhiyun 179*4882a593Smuzhiyun void goya_ring_doorbell(struct hl_device *hdev, u32 hw_queue_id, u32 pi); 180*4882a593Smuzhiyun void goya_pqe_write(struct hl_device *hdev, __le64 *pqe, struct hl_bd *bd); 181*4882a593Smuzhiyun void goya_update_eq_ci(struct hl_device *hdev, u32 val); 182*4882a593Smuzhiyun void goya_restore_phase_topology(struct hl_device *hdev); 183*4882a593Smuzhiyun int goya_context_switch(struct hl_device *hdev, u32 asid); 184*4882a593Smuzhiyun 185*4882a593Smuzhiyun int goya_debugfs_i2c_read(struct hl_device *hdev, u8 i2c_bus, 186*4882a593Smuzhiyun u8 i2c_addr, u8 i2c_reg, u32 *val); 187*4882a593Smuzhiyun int goya_debugfs_i2c_write(struct hl_device *hdev, u8 i2c_bus, 188*4882a593Smuzhiyun u8 i2c_addr, u8 i2c_reg, u32 val); 189*4882a593Smuzhiyun void goya_debugfs_led_set(struct hl_device *hdev, u8 led, u8 state); 190*4882a593Smuzhiyun 191*4882a593Smuzhiyun int goya_test_queue(struct hl_device *hdev, u32 hw_queue_id); 192*4882a593Smuzhiyun int goya_test_queues(struct hl_device *hdev); 193*4882a593Smuzhiyun int goya_test_cpu_queue(struct hl_device *hdev); 194*4882a593Smuzhiyun int goya_send_cpu_message(struct hl_device *hdev, u32 *msg, u16 len, 195*4882a593Smuzhiyun u32 timeout, long *result); 196*4882a593Smuzhiyun 197*4882a593Smuzhiyun long goya_get_temperature(struct hl_device *hdev, int sensor_index, u32 attr); 198*4882a593Smuzhiyun long goya_get_voltage(struct hl_device *hdev, int sensor_index, u32 attr); 199*4882a593Smuzhiyun long goya_get_current(struct hl_device *hdev, int sensor_index, u32 attr); 200*4882a593Smuzhiyun long goya_get_fan_speed(struct hl_device *hdev, int sensor_index, u32 attr); 201*4882a593Smuzhiyun long goya_get_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr); 202*4882a593Smuzhiyun void goya_set_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr, 203*4882a593Smuzhiyun long value); 204*4882a593Smuzhiyun u64 goya_get_max_power(struct hl_device *hdev); 205*4882a593Smuzhiyun void goya_set_max_power(struct hl_device *hdev, u64 value); 206*4882a593Smuzhiyun 207*4882a593Smuzhiyun void goya_set_pll_profile(struct hl_device *hdev, enum hl_pll_frequency freq); 208*4882a593Smuzhiyun void goya_add_device_attr(struct hl_device *hdev, 209*4882a593Smuzhiyun struct attribute_group *dev_attr_grp); 210*4882a593Smuzhiyun int goya_cpucp_info_get(struct hl_device *hdev); 211*4882a593Smuzhiyun int goya_debug_coresight(struct hl_device *hdev, void *data); 212*4882a593Smuzhiyun void goya_halt_coresight(struct hl_device *hdev); 213*4882a593Smuzhiyun 214*4882a593Smuzhiyun int goya_suspend(struct hl_device *hdev); 215*4882a593Smuzhiyun int goya_resume(struct hl_device *hdev); 216*4882a593Smuzhiyun 217*4882a593Smuzhiyun void goya_handle_eqe(struct hl_device *hdev, struct hl_eq_entry *eq_entry); 218*4882a593Smuzhiyun void *goya_get_events_stat(struct hl_device *hdev, bool aggregate, u32 *size); 219*4882a593Smuzhiyun 220*4882a593Smuzhiyun void goya_add_end_of_cb_packets(struct hl_device *hdev, void *kernel_address, 221*4882a593Smuzhiyun u32 len, u64 cq_addr, u32 cq_val, u32 msix_vec, 222*4882a593Smuzhiyun bool eb); 223*4882a593Smuzhiyun int goya_cs_parser(struct hl_device *hdev, struct hl_cs_parser *parser); 224*4882a593Smuzhiyun void *goya_get_int_queue_base(struct hl_device *hdev, u32 queue_id, 225*4882a593Smuzhiyun dma_addr_t *dma_handle, u16 *queue_len); 226*4882a593Smuzhiyun u32 goya_get_dma_desc_list_size(struct hl_device *hdev, struct sg_table *sgt); 227*4882a593Smuzhiyun int goya_send_heartbeat(struct hl_device *hdev); 228*4882a593Smuzhiyun void *goya_cpu_accessible_dma_pool_alloc(struct hl_device *hdev, size_t size, 229*4882a593Smuzhiyun dma_addr_t *dma_handle); 230*4882a593Smuzhiyun void goya_cpu_accessible_dma_pool_free(struct hl_device *hdev, size_t size, 231*4882a593Smuzhiyun void *vaddr); 232*4882a593Smuzhiyun void goya_mmu_remove_device_cpu_mappings(struct hl_device *hdev); 233*4882a593Smuzhiyun 234*4882a593Smuzhiyun int goya_get_clk_rate(struct hl_device *hdev, u32 *cur_clk, u32 *max_clk); 235*4882a593Smuzhiyun u32 goya_get_queue_id_for_cq(struct hl_device *hdev, u32 cq_idx); 236*4882a593Smuzhiyun u64 goya_get_device_time(struct hl_device *hdev); 237*4882a593Smuzhiyun 238*4882a593Smuzhiyun #endif /* GOYAP_H_ */ 239