xref: /OK3568_Linux_fs/kernel/drivers/misc/habanalabs/goya/goyaP.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun  *
3*4882a593Smuzhiyun  * Copyright 2016-2019 HabanaLabs, Ltd.
4*4882a593Smuzhiyun  * All Rights Reserved.
5*4882a593Smuzhiyun  *
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #ifndef GOYAP_H_
9*4882a593Smuzhiyun #define GOYAP_H_
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <uapi/misc/habanalabs.h>
12*4882a593Smuzhiyun #include "../common/habanalabs.h"
13*4882a593Smuzhiyun #include "../include/common/hl_boot_if.h"
14*4882a593Smuzhiyun #include "../include/goya/goya_packets.h"
15*4882a593Smuzhiyun #include "../include/goya/goya.h"
16*4882a593Smuzhiyun #include "../include/goya/goya_async_events.h"
17*4882a593Smuzhiyun #include "../include/goya/goya_fw_if.h"
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #define NUMBER_OF_CMPLT_QUEUES		5
20*4882a593Smuzhiyun #define NUMBER_OF_EXT_HW_QUEUES		5
21*4882a593Smuzhiyun #define NUMBER_OF_CPU_HW_QUEUES		1
22*4882a593Smuzhiyun #define NUMBER_OF_INT_HW_QUEUES		9
23*4882a593Smuzhiyun #define NUMBER_OF_HW_QUEUES		(NUMBER_OF_EXT_HW_QUEUES + \
24*4882a593Smuzhiyun 					NUMBER_OF_CPU_HW_QUEUES + \
25*4882a593Smuzhiyun 					NUMBER_OF_INT_HW_QUEUES)
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun /*
28*4882a593Smuzhiyun  * Number of MSIX interrupts IDS:
29*4882a593Smuzhiyun  * Each completion queue has 1 ID
30*4882a593Smuzhiyun  * The event queue has 1 ID
31*4882a593Smuzhiyun  */
32*4882a593Smuzhiyun #define NUMBER_OF_INTERRUPTS		(NUMBER_OF_CMPLT_QUEUES + 1)
33*4882a593Smuzhiyun 
34*4882a593Smuzhiyun #if (NUMBER_OF_INTERRUPTS > GOYA_MSIX_ENTRIES)
35*4882a593Smuzhiyun #error "Number of MSIX interrupts must be smaller or equal to GOYA_MSIX_ENTRIES"
36*4882a593Smuzhiyun #endif
37*4882a593Smuzhiyun 
38*4882a593Smuzhiyun #define QMAN_FENCE_TIMEOUT_USEC		10000		/* 10 ms */
39*4882a593Smuzhiyun 
40*4882a593Smuzhiyun #define QMAN_STOP_TIMEOUT_USEC		100000		/* 100 ms */
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun #define CORESIGHT_TIMEOUT_USEC		100000		/* 100 ms */
43*4882a593Smuzhiyun 
44*4882a593Smuzhiyun #define GOYA_CPU_TIMEOUT_USEC		15000000	/* 15s */
45*4882a593Smuzhiyun 
46*4882a593Smuzhiyun #define TPC_ENABLED_MASK		0xFF
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun #define PLL_HIGH_DEFAULT		1575000000	/* 1.575 GHz */
49*4882a593Smuzhiyun 
50*4882a593Smuzhiyun #define MAX_POWER_DEFAULT		200000		/* 200W */
51*4882a593Smuzhiyun 
52*4882a593Smuzhiyun #define DRAM_PHYS_DEFAULT_SIZE		0x100000000ull	/* 4GB */
53*4882a593Smuzhiyun 
54*4882a593Smuzhiyun #define GOYA_DEFAULT_CARD_NAME		"HL1000"
55*4882a593Smuzhiyun 
56*4882a593Smuzhiyun #define GOYA_MAX_PENDING_CS		64
57*4882a593Smuzhiyun 
58*4882a593Smuzhiyun #if !IS_MAX_PENDING_CS_VALID(GOYA_MAX_PENDING_CS)
59*4882a593Smuzhiyun #error "GOYA_MAX_PENDING_CS must be power of 2 and greater than 1"
60*4882a593Smuzhiyun #endif
61*4882a593Smuzhiyun 
62*4882a593Smuzhiyun /* DRAM Memory Map */
63*4882a593Smuzhiyun 
64*4882a593Smuzhiyun #define CPU_FW_IMAGE_SIZE		0x10000000	/* 256MB */
65*4882a593Smuzhiyun #define MMU_PAGE_TABLES_SIZE		0x0FC00000	/* 252MB */
66*4882a593Smuzhiyun #define MMU_DRAM_DEFAULT_PAGE_SIZE	0x00200000	/* 2MB */
67*4882a593Smuzhiyun #define MMU_CACHE_MNG_SIZE		0x00001000	/* 4KB */
68*4882a593Smuzhiyun 
69*4882a593Smuzhiyun #define CPU_FW_IMAGE_ADDR		DRAM_PHYS_BASE
70*4882a593Smuzhiyun #define MMU_PAGE_TABLES_ADDR		(CPU_FW_IMAGE_ADDR + CPU_FW_IMAGE_SIZE)
71*4882a593Smuzhiyun #define MMU_DRAM_DEFAULT_PAGE_ADDR	(MMU_PAGE_TABLES_ADDR + \
72*4882a593Smuzhiyun 						MMU_PAGE_TABLES_SIZE)
73*4882a593Smuzhiyun #define MMU_CACHE_MNG_ADDR		(MMU_DRAM_DEFAULT_PAGE_ADDR + \
74*4882a593Smuzhiyun 					MMU_DRAM_DEFAULT_PAGE_SIZE)
75*4882a593Smuzhiyun #define DRAM_DRIVER_END_ADDR		(MMU_CACHE_MNG_ADDR + \
76*4882a593Smuzhiyun 						MMU_CACHE_MNG_SIZE)
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun #define DRAM_BASE_ADDR_USER		0x20000000
79*4882a593Smuzhiyun 
80*4882a593Smuzhiyun #if (DRAM_DRIVER_END_ADDR > DRAM_BASE_ADDR_USER)
81*4882a593Smuzhiyun #error "Driver must reserve no more than 512MB"
82*4882a593Smuzhiyun #endif
83*4882a593Smuzhiyun 
84*4882a593Smuzhiyun /*
85*4882a593Smuzhiyun  * SRAM Memory Map for Driver
86*4882a593Smuzhiyun  *
87*4882a593Smuzhiyun  * Driver occupies DRIVER_SRAM_SIZE bytes from the start of SRAM. It is used for
88*4882a593Smuzhiyun  * MME/TPC QMANs
89*4882a593Smuzhiyun  *
90*4882a593Smuzhiyun  */
91*4882a593Smuzhiyun 
92*4882a593Smuzhiyun #define MME_QMAN_BASE_OFFSET	0x000000	/* Must be 0 */
93*4882a593Smuzhiyun #define MME_QMAN_LENGTH		64
94*4882a593Smuzhiyun #define TPC_QMAN_LENGTH		64
95*4882a593Smuzhiyun 
96*4882a593Smuzhiyun #define TPC0_QMAN_BASE_OFFSET	(MME_QMAN_BASE_OFFSET + \
97*4882a593Smuzhiyun 				(MME_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
98*4882a593Smuzhiyun #define TPC1_QMAN_BASE_OFFSET	(TPC0_QMAN_BASE_OFFSET + \
99*4882a593Smuzhiyun 				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
100*4882a593Smuzhiyun #define TPC2_QMAN_BASE_OFFSET	(TPC1_QMAN_BASE_OFFSET + \
101*4882a593Smuzhiyun 				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
102*4882a593Smuzhiyun #define TPC3_QMAN_BASE_OFFSET	(TPC2_QMAN_BASE_OFFSET + \
103*4882a593Smuzhiyun 				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
104*4882a593Smuzhiyun #define TPC4_QMAN_BASE_OFFSET	(TPC3_QMAN_BASE_OFFSET + \
105*4882a593Smuzhiyun 				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
106*4882a593Smuzhiyun #define TPC5_QMAN_BASE_OFFSET	(TPC4_QMAN_BASE_OFFSET + \
107*4882a593Smuzhiyun 				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
108*4882a593Smuzhiyun #define TPC6_QMAN_BASE_OFFSET	(TPC5_QMAN_BASE_OFFSET + \
109*4882a593Smuzhiyun 				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
110*4882a593Smuzhiyun #define TPC7_QMAN_BASE_OFFSET	(TPC6_QMAN_BASE_OFFSET + \
111*4882a593Smuzhiyun 				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
112*4882a593Smuzhiyun 
113*4882a593Smuzhiyun #define SRAM_DRIVER_RES_OFFSET	(TPC7_QMAN_BASE_OFFSET + \
114*4882a593Smuzhiyun 				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
115*4882a593Smuzhiyun 
116*4882a593Smuzhiyun #if (SRAM_DRIVER_RES_OFFSET >= GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START)
117*4882a593Smuzhiyun #error "MME/TPC QMANs SRAM space exceeds limit"
118*4882a593Smuzhiyun #endif
119*4882a593Smuzhiyun 
120*4882a593Smuzhiyun #define SRAM_USER_BASE_OFFSET	GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START
121*4882a593Smuzhiyun 
122*4882a593Smuzhiyun /* Virtual address space */
123*4882a593Smuzhiyun #define VA_HOST_SPACE_START	0x1000000000000ull	/* 256TB */
124*4882a593Smuzhiyun #define VA_HOST_SPACE_END	0x3FF8000000000ull	/* 1PB - 1TB */
125*4882a593Smuzhiyun #define VA_HOST_SPACE_SIZE	(VA_HOST_SPACE_END - \
126*4882a593Smuzhiyun 					VA_HOST_SPACE_START) /* 767TB */
127*4882a593Smuzhiyun 
128*4882a593Smuzhiyun #define VA_DDR_SPACE_START	0x800000000ull		/* 32GB */
129*4882a593Smuzhiyun #define VA_DDR_SPACE_END	0x2000000000ull		/* 128GB */
130*4882a593Smuzhiyun #define VA_DDR_SPACE_SIZE	(VA_DDR_SPACE_END - \
131*4882a593Smuzhiyun 					VA_DDR_SPACE_START)	/* 128GB */
132*4882a593Smuzhiyun 
133*4882a593Smuzhiyun #if (HL_CPU_ACCESSIBLE_MEM_SIZE != SZ_2M)
134*4882a593Smuzhiyun #error "HL_CPU_ACCESSIBLE_MEM_SIZE must be exactly 2MB to enable MMU mapping"
135*4882a593Smuzhiyun #endif
136*4882a593Smuzhiyun 
137*4882a593Smuzhiyun #define VA_CPU_ACCESSIBLE_MEM_ADDR	0x8000000000ull
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun #define DMA_MAX_TRANSFER_SIZE	U32_MAX
140*4882a593Smuzhiyun 
141*4882a593Smuzhiyun #define HW_CAP_PLL		0x00000001
142*4882a593Smuzhiyun #define HW_CAP_DDR_0		0x00000002
143*4882a593Smuzhiyun #define HW_CAP_DDR_1		0x00000004
144*4882a593Smuzhiyun #define HW_CAP_MME		0x00000008
145*4882a593Smuzhiyun #define HW_CAP_CPU		0x00000010
146*4882a593Smuzhiyun #define HW_CAP_DMA		0x00000020
147*4882a593Smuzhiyun #define HW_CAP_MSIX		0x00000040
148*4882a593Smuzhiyun #define HW_CAP_CPU_Q		0x00000080
149*4882a593Smuzhiyun #define HW_CAP_MMU		0x00000100
150*4882a593Smuzhiyun #define HW_CAP_TPC_MBIST	0x00000200
151*4882a593Smuzhiyun #define HW_CAP_GOLDEN		0x00000400
152*4882a593Smuzhiyun #define HW_CAP_TPC		0x00000800
153*4882a593Smuzhiyun 
154*4882a593Smuzhiyun struct goya_device {
155*4882a593Smuzhiyun 	/* TODO: remove hw_queues_lock after moving to scheduler code */
156*4882a593Smuzhiyun 	spinlock_t	hw_queues_lock;
157*4882a593Smuzhiyun 
158*4882a593Smuzhiyun 	u64		mme_clk;
159*4882a593Smuzhiyun 	u64		tpc_clk;
160*4882a593Smuzhiyun 	u64		ic_clk;
161*4882a593Smuzhiyun 
162*4882a593Smuzhiyun 	u64		ddr_bar_cur_addr;
163*4882a593Smuzhiyun 	u32		events_stat[GOYA_ASYNC_EVENT_ID_SIZE];
164*4882a593Smuzhiyun 	u32		events_stat_aggregate[GOYA_ASYNC_EVENT_ID_SIZE];
165*4882a593Smuzhiyun 	u32		hw_cap_initialized;
166*4882a593Smuzhiyun 	u8		device_cpu_mmu_mappings_done;
167*4882a593Smuzhiyun };
168*4882a593Smuzhiyun 
169*4882a593Smuzhiyun int goya_get_fixed_properties(struct hl_device *hdev);
170*4882a593Smuzhiyun int goya_mmu_init(struct hl_device *hdev);
171*4882a593Smuzhiyun void goya_init_dma_qmans(struct hl_device *hdev);
172*4882a593Smuzhiyun void goya_init_mme_qmans(struct hl_device *hdev);
173*4882a593Smuzhiyun void goya_init_tpc_qmans(struct hl_device *hdev);
174*4882a593Smuzhiyun int goya_init_cpu_queues(struct hl_device *hdev);
175*4882a593Smuzhiyun void goya_init_security(struct hl_device *hdev);
176*4882a593Smuzhiyun int goya_late_init(struct hl_device *hdev);
177*4882a593Smuzhiyun void goya_late_fini(struct hl_device *hdev);
178*4882a593Smuzhiyun 
179*4882a593Smuzhiyun void goya_ring_doorbell(struct hl_device *hdev, u32 hw_queue_id, u32 pi);
180*4882a593Smuzhiyun void goya_pqe_write(struct hl_device *hdev, __le64 *pqe, struct hl_bd *bd);
181*4882a593Smuzhiyun void goya_update_eq_ci(struct hl_device *hdev, u32 val);
182*4882a593Smuzhiyun void goya_restore_phase_topology(struct hl_device *hdev);
183*4882a593Smuzhiyun int goya_context_switch(struct hl_device *hdev, u32 asid);
184*4882a593Smuzhiyun 
185*4882a593Smuzhiyun int goya_debugfs_i2c_read(struct hl_device *hdev, u8 i2c_bus,
186*4882a593Smuzhiyun 			u8 i2c_addr, u8 i2c_reg, u32 *val);
187*4882a593Smuzhiyun int goya_debugfs_i2c_write(struct hl_device *hdev, u8 i2c_bus,
188*4882a593Smuzhiyun 			u8 i2c_addr, u8 i2c_reg, u32 val);
189*4882a593Smuzhiyun void goya_debugfs_led_set(struct hl_device *hdev, u8 led, u8 state);
190*4882a593Smuzhiyun 
191*4882a593Smuzhiyun int goya_test_queue(struct hl_device *hdev, u32 hw_queue_id);
192*4882a593Smuzhiyun int goya_test_queues(struct hl_device *hdev);
193*4882a593Smuzhiyun int goya_test_cpu_queue(struct hl_device *hdev);
194*4882a593Smuzhiyun int goya_send_cpu_message(struct hl_device *hdev, u32 *msg, u16 len,
195*4882a593Smuzhiyun 				u32 timeout, long *result);
196*4882a593Smuzhiyun 
197*4882a593Smuzhiyun long goya_get_temperature(struct hl_device *hdev, int sensor_index, u32 attr);
198*4882a593Smuzhiyun long goya_get_voltage(struct hl_device *hdev, int sensor_index, u32 attr);
199*4882a593Smuzhiyun long goya_get_current(struct hl_device *hdev, int sensor_index, u32 attr);
200*4882a593Smuzhiyun long goya_get_fan_speed(struct hl_device *hdev, int sensor_index, u32 attr);
201*4882a593Smuzhiyun long goya_get_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr);
202*4882a593Smuzhiyun void goya_set_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr,
203*4882a593Smuzhiyun 			long value);
204*4882a593Smuzhiyun u64 goya_get_max_power(struct hl_device *hdev);
205*4882a593Smuzhiyun void goya_set_max_power(struct hl_device *hdev, u64 value);
206*4882a593Smuzhiyun 
207*4882a593Smuzhiyun void goya_set_pll_profile(struct hl_device *hdev, enum hl_pll_frequency freq);
208*4882a593Smuzhiyun void goya_add_device_attr(struct hl_device *hdev,
209*4882a593Smuzhiyun 			struct attribute_group *dev_attr_grp);
210*4882a593Smuzhiyun int goya_cpucp_info_get(struct hl_device *hdev);
211*4882a593Smuzhiyun int goya_debug_coresight(struct hl_device *hdev, void *data);
212*4882a593Smuzhiyun void goya_halt_coresight(struct hl_device *hdev);
213*4882a593Smuzhiyun 
214*4882a593Smuzhiyun int goya_suspend(struct hl_device *hdev);
215*4882a593Smuzhiyun int goya_resume(struct hl_device *hdev);
216*4882a593Smuzhiyun 
217*4882a593Smuzhiyun void goya_handle_eqe(struct hl_device *hdev, struct hl_eq_entry *eq_entry);
218*4882a593Smuzhiyun void *goya_get_events_stat(struct hl_device *hdev, bool aggregate, u32 *size);
219*4882a593Smuzhiyun 
220*4882a593Smuzhiyun void goya_add_end_of_cb_packets(struct hl_device *hdev, void *kernel_address,
221*4882a593Smuzhiyun 				u32 len, u64 cq_addr, u32 cq_val, u32 msix_vec,
222*4882a593Smuzhiyun 				bool eb);
223*4882a593Smuzhiyun int goya_cs_parser(struct hl_device *hdev, struct hl_cs_parser *parser);
224*4882a593Smuzhiyun void *goya_get_int_queue_base(struct hl_device *hdev, u32 queue_id,
225*4882a593Smuzhiyun 				dma_addr_t *dma_handle,	u16 *queue_len);
226*4882a593Smuzhiyun u32 goya_get_dma_desc_list_size(struct hl_device *hdev, struct sg_table *sgt);
227*4882a593Smuzhiyun int goya_send_heartbeat(struct hl_device *hdev);
228*4882a593Smuzhiyun void *goya_cpu_accessible_dma_pool_alloc(struct hl_device *hdev, size_t size,
229*4882a593Smuzhiyun 					dma_addr_t *dma_handle);
230*4882a593Smuzhiyun void goya_cpu_accessible_dma_pool_free(struct hl_device *hdev, size_t size,
231*4882a593Smuzhiyun 					void *vaddr);
232*4882a593Smuzhiyun void goya_mmu_remove_device_cpu_mappings(struct hl_device *hdev);
233*4882a593Smuzhiyun 
234*4882a593Smuzhiyun int goya_get_clk_rate(struct hl_device *hdev, u32 *cur_clk, u32 *max_clk);
235*4882a593Smuzhiyun u32 goya_get_queue_id_for_cq(struct hl_device *hdev, u32 cq_idx);
236*4882a593Smuzhiyun u64 goya_get_device_time(struct hl_device *hdev);
237*4882a593Smuzhiyun 
238*4882a593Smuzhiyun #endif /* GOYAP_H_ */
239