xref: /OK3568_Linux_fs/kernel/drivers/gpu/drm/amd/amdgpu/amdgpu_discovery.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Copyright 2018 Advanced Micro Devices, Inc.
3*4882a593Smuzhiyun  *
4*4882a593Smuzhiyun  * Permission is hereby granted, free of charge, to any person obtaining a
5*4882a593Smuzhiyun  * copy of this software and associated documentation files (the "Software"),
6*4882a593Smuzhiyun  * to deal in the Software without restriction, including without limitation
7*4882a593Smuzhiyun  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8*4882a593Smuzhiyun  * and/or sell copies of the Software, and to permit persons to whom the
9*4882a593Smuzhiyun  * Software is furnished to do so, subject to the following conditions:
10*4882a593Smuzhiyun  *
11*4882a593Smuzhiyun  * The above copyright notice and this permission notice shall be included in
12*4882a593Smuzhiyun  * all copies or substantial portions of the Software.
13*4882a593Smuzhiyun  *
14*4882a593Smuzhiyun  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15*4882a593Smuzhiyun  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16*4882a593Smuzhiyun  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17*4882a593Smuzhiyun  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18*4882a593Smuzhiyun  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19*4882a593Smuzhiyun  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20*4882a593Smuzhiyun  * OTHER DEALINGS IN THE SOFTWARE.
21*4882a593Smuzhiyun  *
22*4882a593Smuzhiyun  */
23*4882a593Smuzhiyun 
24*4882a593Smuzhiyun #include "amdgpu.h"
25*4882a593Smuzhiyun #include "amdgpu_discovery.h"
26*4882a593Smuzhiyun #include "soc15_hw_ip.h"
27*4882a593Smuzhiyun #include "discovery.h"
28*4882a593Smuzhiyun 
29*4882a593Smuzhiyun #define mmRCC_CONFIG_MEMSIZE	0xde3
30*4882a593Smuzhiyun #define mmMM_INDEX		0x0
31*4882a593Smuzhiyun #define mmMM_INDEX_HI		0x6
32*4882a593Smuzhiyun #define mmMM_DATA		0x1
33*4882a593Smuzhiyun #define HW_ID_MAX		300
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun static const char *hw_id_names[HW_ID_MAX] = {
36*4882a593Smuzhiyun 	[MP1_HWID]		= "MP1",
37*4882a593Smuzhiyun 	[MP2_HWID]		= "MP2",
38*4882a593Smuzhiyun 	[THM_HWID]		= "THM",
39*4882a593Smuzhiyun 	[SMUIO_HWID]		= "SMUIO",
40*4882a593Smuzhiyun 	[FUSE_HWID]		= "FUSE",
41*4882a593Smuzhiyun 	[CLKA_HWID]		= "CLKA",
42*4882a593Smuzhiyun 	[PWR_HWID]		= "PWR",
43*4882a593Smuzhiyun 	[GC_HWID]		= "GC",
44*4882a593Smuzhiyun 	[UVD_HWID]		= "UVD",
45*4882a593Smuzhiyun 	[AUDIO_AZ_HWID]		= "AUDIO_AZ",
46*4882a593Smuzhiyun 	[ACP_HWID]		= "ACP",
47*4882a593Smuzhiyun 	[DCI_HWID]		= "DCI",
48*4882a593Smuzhiyun 	[DMU_HWID]		= "DMU",
49*4882a593Smuzhiyun 	[DCO_HWID]		= "DCO",
50*4882a593Smuzhiyun 	[DIO_HWID]		= "DIO",
51*4882a593Smuzhiyun 	[XDMA_HWID]		= "XDMA",
52*4882a593Smuzhiyun 	[DCEAZ_HWID]		= "DCEAZ",
53*4882a593Smuzhiyun 	[DAZ_HWID]		= "DAZ",
54*4882a593Smuzhiyun 	[SDPMUX_HWID]		= "SDPMUX",
55*4882a593Smuzhiyun 	[NTB_HWID]		= "NTB",
56*4882a593Smuzhiyun 	[IOHC_HWID]		= "IOHC",
57*4882a593Smuzhiyun 	[L2IMU_HWID]		= "L2IMU",
58*4882a593Smuzhiyun 	[VCE_HWID]		= "VCE",
59*4882a593Smuzhiyun 	[MMHUB_HWID]		= "MMHUB",
60*4882a593Smuzhiyun 	[ATHUB_HWID]		= "ATHUB",
61*4882a593Smuzhiyun 	[DBGU_NBIO_HWID]	= "DBGU_NBIO",
62*4882a593Smuzhiyun 	[DFX_HWID]		= "DFX",
63*4882a593Smuzhiyun 	[DBGU0_HWID]		= "DBGU0",
64*4882a593Smuzhiyun 	[DBGU1_HWID]		= "DBGU1",
65*4882a593Smuzhiyun 	[OSSSYS_HWID]		= "OSSSYS",
66*4882a593Smuzhiyun 	[HDP_HWID]		= "HDP",
67*4882a593Smuzhiyun 	[SDMA0_HWID]		= "SDMA0",
68*4882a593Smuzhiyun 	[SDMA1_HWID]		= "SDMA1",
69*4882a593Smuzhiyun 	[ISP_HWID]		= "ISP",
70*4882a593Smuzhiyun 	[DBGU_IO_HWID]		= "DBGU_IO",
71*4882a593Smuzhiyun 	[DF_HWID]		= "DF",
72*4882a593Smuzhiyun 	[CLKB_HWID]		= "CLKB",
73*4882a593Smuzhiyun 	[FCH_HWID]		= "FCH",
74*4882a593Smuzhiyun 	[DFX_DAP_HWID]		= "DFX_DAP",
75*4882a593Smuzhiyun 	[L1IMU_PCIE_HWID]	= "L1IMU_PCIE",
76*4882a593Smuzhiyun 	[L1IMU_NBIF_HWID]	= "L1IMU_NBIF",
77*4882a593Smuzhiyun 	[L1IMU_IOAGR_HWID]	= "L1IMU_IOAGR",
78*4882a593Smuzhiyun 	[L1IMU3_HWID]		= "L1IMU3",
79*4882a593Smuzhiyun 	[L1IMU4_HWID]		= "L1IMU4",
80*4882a593Smuzhiyun 	[L1IMU5_HWID]		= "L1IMU5",
81*4882a593Smuzhiyun 	[L1IMU6_HWID]		= "L1IMU6",
82*4882a593Smuzhiyun 	[L1IMU7_HWID]		= "L1IMU7",
83*4882a593Smuzhiyun 	[L1IMU8_HWID]		= "L1IMU8",
84*4882a593Smuzhiyun 	[L1IMU9_HWID]		= "L1IMU9",
85*4882a593Smuzhiyun 	[L1IMU10_HWID]		= "L1IMU10",
86*4882a593Smuzhiyun 	[L1IMU11_HWID]		= "L1IMU11",
87*4882a593Smuzhiyun 	[L1IMU12_HWID]		= "L1IMU12",
88*4882a593Smuzhiyun 	[L1IMU13_HWID]		= "L1IMU13",
89*4882a593Smuzhiyun 	[L1IMU14_HWID]		= "L1IMU14",
90*4882a593Smuzhiyun 	[L1IMU15_HWID]		= "L1IMU15",
91*4882a593Smuzhiyun 	[WAFLC_HWID]		= "WAFLC",
92*4882a593Smuzhiyun 	[FCH_USB_PD_HWID]	= "FCH_USB_PD",
93*4882a593Smuzhiyun 	[PCIE_HWID]		= "PCIE",
94*4882a593Smuzhiyun 	[PCS_HWID]		= "PCS",
95*4882a593Smuzhiyun 	[DDCL_HWID]		= "DDCL",
96*4882a593Smuzhiyun 	[SST_HWID]		= "SST",
97*4882a593Smuzhiyun 	[IOAGR_HWID]		= "IOAGR",
98*4882a593Smuzhiyun 	[NBIF_HWID]		= "NBIF",
99*4882a593Smuzhiyun 	[IOAPIC_HWID]		= "IOAPIC",
100*4882a593Smuzhiyun 	[SYSTEMHUB_HWID]	= "SYSTEMHUB",
101*4882a593Smuzhiyun 	[NTBCCP_HWID]		= "NTBCCP",
102*4882a593Smuzhiyun 	[UMC_HWID]		= "UMC",
103*4882a593Smuzhiyun 	[SATA_HWID]		= "SATA",
104*4882a593Smuzhiyun 	[USB_HWID]		= "USB",
105*4882a593Smuzhiyun 	[CCXSEC_HWID]		= "CCXSEC",
106*4882a593Smuzhiyun 	[XGMI_HWID]		= "XGMI",
107*4882a593Smuzhiyun 	[XGBE_HWID]		= "XGBE",
108*4882a593Smuzhiyun 	[MP0_HWID]		= "MP0",
109*4882a593Smuzhiyun };
110*4882a593Smuzhiyun 
111*4882a593Smuzhiyun static int hw_id_map[MAX_HWIP] = {
112*4882a593Smuzhiyun 	[GC_HWIP]	= GC_HWID,
113*4882a593Smuzhiyun 	[HDP_HWIP]	= HDP_HWID,
114*4882a593Smuzhiyun 	[SDMA0_HWIP]	= SDMA0_HWID,
115*4882a593Smuzhiyun 	[SDMA1_HWIP]	= SDMA1_HWID,
116*4882a593Smuzhiyun 	[MMHUB_HWIP]	= MMHUB_HWID,
117*4882a593Smuzhiyun 	[ATHUB_HWIP]	= ATHUB_HWID,
118*4882a593Smuzhiyun 	[NBIO_HWIP]	= NBIF_HWID,
119*4882a593Smuzhiyun 	[MP0_HWIP]	= MP0_HWID,
120*4882a593Smuzhiyun 	[MP1_HWIP]	= MP1_HWID,
121*4882a593Smuzhiyun 	[UVD_HWIP]	= UVD_HWID,
122*4882a593Smuzhiyun 	[VCE_HWIP]	= VCE_HWID,
123*4882a593Smuzhiyun 	[DF_HWIP]	= DF_HWID,
124*4882a593Smuzhiyun 	[DCE_HWIP]	= DMU_HWID,
125*4882a593Smuzhiyun 	[OSSSYS_HWIP]	= OSSSYS_HWID,
126*4882a593Smuzhiyun 	[SMUIO_HWIP]	= SMUIO_HWID,
127*4882a593Smuzhiyun 	[PWR_HWIP]	= PWR_HWID,
128*4882a593Smuzhiyun 	[NBIF_HWIP]	= NBIF_HWID,
129*4882a593Smuzhiyun 	[THM_HWIP]	= THM_HWID,
130*4882a593Smuzhiyun 	[CLK_HWIP]	= CLKA_HWID,
131*4882a593Smuzhiyun };
132*4882a593Smuzhiyun 
amdgpu_discovery_read_binary(struct amdgpu_device * adev,uint8_t * binary)133*4882a593Smuzhiyun static int amdgpu_discovery_read_binary(struct amdgpu_device *adev, uint8_t *binary)
134*4882a593Smuzhiyun {
135*4882a593Smuzhiyun 	uint64_t vram_size = (uint64_t)RREG32(mmRCC_CONFIG_MEMSIZE) << 20;
136*4882a593Smuzhiyun 	uint64_t pos = vram_size - DISCOVERY_TMR_OFFSET;
137*4882a593Smuzhiyun 
138*4882a593Smuzhiyun 	amdgpu_device_vram_access(adev, pos, (uint32_t *)binary,
139*4882a593Smuzhiyun 				  adev->mman.discovery_tmr_size, false);
140*4882a593Smuzhiyun 	return 0;
141*4882a593Smuzhiyun }
142*4882a593Smuzhiyun 
amdgpu_discovery_calculate_checksum(uint8_t * data,uint32_t size)143*4882a593Smuzhiyun static uint16_t amdgpu_discovery_calculate_checksum(uint8_t *data, uint32_t size)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun 	uint16_t checksum = 0;
146*4882a593Smuzhiyun 	int i;
147*4882a593Smuzhiyun 
148*4882a593Smuzhiyun 	for (i = 0; i < size; i++)
149*4882a593Smuzhiyun 		checksum += data[i];
150*4882a593Smuzhiyun 
151*4882a593Smuzhiyun 	return checksum;
152*4882a593Smuzhiyun }
153*4882a593Smuzhiyun 
amdgpu_discovery_verify_checksum(uint8_t * data,uint32_t size,uint16_t expected)154*4882a593Smuzhiyun static inline bool amdgpu_discovery_verify_checksum(uint8_t *data, uint32_t size,
155*4882a593Smuzhiyun 						    uint16_t expected)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun 	return !!(amdgpu_discovery_calculate_checksum(data, size) == expected);
158*4882a593Smuzhiyun }
159*4882a593Smuzhiyun 
amdgpu_discovery_init(struct amdgpu_device * adev)160*4882a593Smuzhiyun static int amdgpu_discovery_init(struct amdgpu_device *adev)
161*4882a593Smuzhiyun {
162*4882a593Smuzhiyun 	struct table_info *info;
163*4882a593Smuzhiyun 	struct binary_header *bhdr;
164*4882a593Smuzhiyun 	struct ip_discovery_header *ihdr;
165*4882a593Smuzhiyun 	struct gpu_info_header *ghdr;
166*4882a593Smuzhiyun 	uint16_t offset;
167*4882a593Smuzhiyun 	uint16_t size;
168*4882a593Smuzhiyun 	uint16_t checksum;
169*4882a593Smuzhiyun 	int r;
170*4882a593Smuzhiyun 
171*4882a593Smuzhiyun 	adev->mman.discovery_tmr_size = DISCOVERY_TMR_SIZE;
172*4882a593Smuzhiyun 	adev->mman.discovery_bin = kzalloc(adev->mman.discovery_tmr_size, GFP_KERNEL);
173*4882a593Smuzhiyun 	if (!adev->mman.discovery_bin)
174*4882a593Smuzhiyun 		return -ENOMEM;
175*4882a593Smuzhiyun 
176*4882a593Smuzhiyun 	r = amdgpu_discovery_read_binary(adev, adev->mman.discovery_bin);
177*4882a593Smuzhiyun 	if (r) {
178*4882a593Smuzhiyun 		DRM_ERROR("failed to read ip discovery binary\n");
179*4882a593Smuzhiyun 		goto out;
180*4882a593Smuzhiyun 	}
181*4882a593Smuzhiyun 
182*4882a593Smuzhiyun 	bhdr = (struct binary_header *)adev->mman.discovery_bin;
183*4882a593Smuzhiyun 
184*4882a593Smuzhiyun 	if (le32_to_cpu(bhdr->binary_signature) != BINARY_SIGNATURE) {
185*4882a593Smuzhiyun 		DRM_ERROR("invalid ip discovery binary signature\n");
186*4882a593Smuzhiyun 		r = -EINVAL;
187*4882a593Smuzhiyun 		goto out;
188*4882a593Smuzhiyun 	}
189*4882a593Smuzhiyun 
190*4882a593Smuzhiyun 	offset = offsetof(struct binary_header, binary_checksum) +
191*4882a593Smuzhiyun 		sizeof(bhdr->binary_checksum);
192*4882a593Smuzhiyun 	size = bhdr->binary_size - offset;
193*4882a593Smuzhiyun 	checksum = bhdr->binary_checksum;
194*4882a593Smuzhiyun 
195*4882a593Smuzhiyun 	if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
196*4882a593Smuzhiyun 					      size, checksum)) {
197*4882a593Smuzhiyun 		DRM_ERROR("invalid ip discovery binary checksum\n");
198*4882a593Smuzhiyun 		r = -EINVAL;
199*4882a593Smuzhiyun 		goto out;
200*4882a593Smuzhiyun 	}
201*4882a593Smuzhiyun 
202*4882a593Smuzhiyun 	info = &bhdr->table_list[IP_DISCOVERY];
203*4882a593Smuzhiyun 	offset = le16_to_cpu(info->offset);
204*4882a593Smuzhiyun 	checksum = le16_to_cpu(info->checksum);
205*4882a593Smuzhiyun 	ihdr = (struct ip_discovery_header *)(adev->mman.discovery_bin + offset);
206*4882a593Smuzhiyun 
207*4882a593Smuzhiyun 	if (le32_to_cpu(ihdr->signature) != DISCOVERY_TABLE_SIGNATURE) {
208*4882a593Smuzhiyun 		DRM_ERROR("invalid ip discovery data table signature\n");
209*4882a593Smuzhiyun 		r = -EINVAL;
210*4882a593Smuzhiyun 		goto out;
211*4882a593Smuzhiyun 	}
212*4882a593Smuzhiyun 
213*4882a593Smuzhiyun 	if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
214*4882a593Smuzhiyun 					      ihdr->size, checksum)) {
215*4882a593Smuzhiyun 		DRM_ERROR("invalid ip discovery data table checksum\n");
216*4882a593Smuzhiyun 		r = -EINVAL;
217*4882a593Smuzhiyun 		goto out;
218*4882a593Smuzhiyun 	}
219*4882a593Smuzhiyun 
220*4882a593Smuzhiyun 	info = &bhdr->table_list[GC];
221*4882a593Smuzhiyun 	offset = le16_to_cpu(info->offset);
222*4882a593Smuzhiyun 	checksum = le16_to_cpu(info->checksum);
223*4882a593Smuzhiyun 	ghdr = (struct gpu_info_header *)(adev->mman.discovery_bin + offset);
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun 	if (!amdgpu_discovery_verify_checksum(adev->mman.discovery_bin + offset,
226*4882a593Smuzhiyun 				              ghdr->size, checksum)) {
227*4882a593Smuzhiyun 		DRM_ERROR("invalid gc data table checksum\n");
228*4882a593Smuzhiyun 		r = -EINVAL;
229*4882a593Smuzhiyun 		goto out;
230*4882a593Smuzhiyun 	}
231*4882a593Smuzhiyun 
232*4882a593Smuzhiyun 	return 0;
233*4882a593Smuzhiyun 
234*4882a593Smuzhiyun out:
235*4882a593Smuzhiyun 	kfree(adev->mman.discovery_bin);
236*4882a593Smuzhiyun 	adev->mman.discovery_bin = NULL;
237*4882a593Smuzhiyun 
238*4882a593Smuzhiyun 	return r;
239*4882a593Smuzhiyun }
240*4882a593Smuzhiyun 
amdgpu_discovery_fini(struct amdgpu_device * adev)241*4882a593Smuzhiyun void amdgpu_discovery_fini(struct amdgpu_device *adev)
242*4882a593Smuzhiyun {
243*4882a593Smuzhiyun 	kfree(adev->mman.discovery_bin);
244*4882a593Smuzhiyun 	adev->mman.discovery_bin = NULL;
245*4882a593Smuzhiyun }
246*4882a593Smuzhiyun 
amdgpu_discovery_reg_base_init(struct amdgpu_device * adev)247*4882a593Smuzhiyun int amdgpu_discovery_reg_base_init(struct amdgpu_device *adev)
248*4882a593Smuzhiyun {
249*4882a593Smuzhiyun 	struct binary_header *bhdr;
250*4882a593Smuzhiyun 	struct ip_discovery_header *ihdr;
251*4882a593Smuzhiyun 	struct die_header *dhdr;
252*4882a593Smuzhiyun 	struct ip *ip;
253*4882a593Smuzhiyun 	uint16_t die_offset;
254*4882a593Smuzhiyun 	uint16_t ip_offset;
255*4882a593Smuzhiyun 	uint16_t num_dies;
256*4882a593Smuzhiyun 	uint16_t num_ips;
257*4882a593Smuzhiyun 	uint8_t num_base_address;
258*4882a593Smuzhiyun 	int hw_ip;
259*4882a593Smuzhiyun 	int i, j, k;
260*4882a593Smuzhiyun 	int r;
261*4882a593Smuzhiyun 
262*4882a593Smuzhiyun 	r = amdgpu_discovery_init(adev);
263*4882a593Smuzhiyun 	if (r) {
264*4882a593Smuzhiyun 		DRM_ERROR("amdgpu_discovery_init failed\n");
265*4882a593Smuzhiyun 		return r;
266*4882a593Smuzhiyun 	}
267*4882a593Smuzhiyun 
268*4882a593Smuzhiyun 	bhdr = (struct binary_header *)adev->mman.discovery_bin;
269*4882a593Smuzhiyun 	ihdr = (struct ip_discovery_header *)(adev->mman.discovery_bin +
270*4882a593Smuzhiyun 			le16_to_cpu(bhdr->table_list[IP_DISCOVERY].offset));
271*4882a593Smuzhiyun 	num_dies = le16_to_cpu(ihdr->num_dies);
272*4882a593Smuzhiyun 
273*4882a593Smuzhiyun 	DRM_DEBUG("number of dies: %d\n", num_dies);
274*4882a593Smuzhiyun 
275*4882a593Smuzhiyun 	for (i = 0; i < num_dies; i++) {
276*4882a593Smuzhiyun 		die_offset = le16_to_cpu(ihdr->die_info[i].die_offset);
277*4882a593Smuzhiyun 		dhdr = (struct die_header *)(adev->mman.discovery_bin + die_offset);
278*4882a593Smuzhiyun 		num_ips = le16_to_cpu(dhdr->num_ips);
279*4882a593Smuzhiyun 		ip_offset = die_offset + sizeof(*dhdr);
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 		if (le16_to_cpu(dhdr->die_id) != i) {
282*4882a593Smuzhiyun 			DRM_ERROR("invalid die id %d, expected %d\n",
283*4882a593Smuzhiyun 					le16_to_cpu(dhdr->die_id), i);
284*4882a593Smuzhiyun 			return -EINVAL;
285*4882a593Smuzhiyun 		}
286*4882a593Smuzhiyun 
287*4882a593Smuzhiyun 		DRM_DEBUG("number of hardware IPs on die%d: %d\n",
288*4882a593Smuzhiyun 				le16_to_cpu(dhdr->die_id), num_ips);
289*4882a593Smuzhiyun 
290*4882a593Smuzhiyun 		for (j = 0; j < num_ips; j++) {
291*4882a593Smuzhiyun 			ip = (struct ip *)(adev->mman.discovery_bin + ip_offset);
292*4882a593Smuzhiyun 			num_base_address = ip->num_base_address;
293*4882a593Smuzhiyun 
294*4882a593Smuzhiyun 			DRM_DEBUG("%s(%d) #%d v%d.%d.%d:\n",
295*4882a593Smuzhiyun 				  hw_id_names[le16_to_cpu(ip->hw_id)],
296*4882a593Smuzhiyun 				  le16_to_cpu(ip->hw_id),
297*4882a593Smuzhiyun 				  ip->number_instance,
298*4882a593Smuzhiyun 				  ip->major, ip->minor,
299*4882a593Smuzhiyun 				  ip->revision);
300*4882a593Smuzhiyun 
301*4882a593Smuzhiyun 			for (k = 0; k < num_base_address; k++) {
302*4882a593Smuzhiyun 				/*
303*4882a593Smuzhiyun 				 * convert the endianness of base addresses in place,
304*4882a593Smuzhiyun 				 * so that we don't need to convert them when accessing adev->reg_offset.
305*4882a593Smuzhiyun 				 */
306*4882a593Smuzhiyun 				ip->base_address[k] = le32_to_cpu(ip->base_address[k]);
307*4882a593Smuzhiyun 				DRM_DEBUG("\t0x%08x\n", ip->base_address[k]);
308*4882a593Smuzhiyun 			}
309*4882a593Smuzhiyun 
310*4882a593Smuzhiyun 			for (hw_ip = 0; hw_ip < MAX_HWIP; hw_ip++) {
311*4882a593Smuzhiyun 				if (hw_id_map[hw_ip] == le16_to_cpu(ip->hw_id)) {
312*4882a593Smuzhiyun 					DRM_DEBUG("set register base offset for %s\n",
313*4882a593Smuzhiyun 							hw_id_names[le16_to_cpu(ip->hw_id)]);
314*4882a593Smuzhiyun 					adev->reg_offset[hw_ip][ip->number_instance] =
315*4882a593Smuzhiyun 						ip->base_address;
316*4882a593Smuzhiyun 				}
317*4882a593Smuzhiyun 
318*4882a593Smuzhiyun 			}
319*4882a593Smuzhiyun 
320*4882a593Smuzhiyun 			ip_offset += sizeof(*ip) + 4 * (ip->num_base_address - 1);
321*4882a593Smuzhiyun 		}
322*4882a593Smuzhiyun 	}
323*4882a593Smuzhiyun 
324*4882a593Smuzhiyun 	return 0;
325*4882a593Smuzhiyun }
326*4882a593Smuzhiyun 
amdgpu_discovery_get_ip_version(struct amdgpu_device * adev,int hw_id,int * major,int * minor,int * revision)327*4882a593Smuzhiyun int amdgpu_discovery_get_ip_version(struct amdgpu_device *adev, int hw_id,
328*4882a593Smuzhiyun 				    int *major, int *minor, int *revision)
329*4882a593Smuzhiyun {
330*4882a593Smuzhiyun 	struct binary_header *bhdr;
331*4882a593Smuzhiyun 	struct ip_discovery_header *ihdr;
332*4882a593Smuzhiyun 	struct die_header *dhdr;
333*4882a593Smuzhiyun 	struct ip *ip;
334*4882a593Smuzhiyun 	uint16_t die_offset;
335*4882a593Smuzhiyun 	uint16_t ip_offset;
336*4882a593Smuzhiyun 	uint16_t num_dies;
337*4882a593Smuzhiyun 	uint16_t num_ips;
338*4882a593Smuzhiyun 	int i, j;
339*4882a593Smuzhiyun 
340*4882a593Smuzhiyun 	if (!adev->mman.discovery_bin) {
341*4882a593Smuzhiyun 		DRM_ERROR("ip discovery uninitialized\n");
342*4882a593Smuzhiyun 		return -EINVAL;
343*4882a593Smuzhiyun 	}
344*4882a593Smuzhiyun 
345*4882a593Smuzhiyun 	bhdr = (struct binary_header *)adev->mman.discovery_bin;
346*4882a593Smuzhiyun 	ihdr = (struct ip_discovery_header *)(adev->mman.discovery_bin +
347*4882a593Smuzhiyun 			le16_to_cpu(bhdr->table_list[IP_DISCOVERY].offset));
348*4882a593Smuzhiyun 	num_dies = le16_to_cpu(ihdr->num_dies);
349*4882a593Smuzhiyun 
350*4882a593Smuzhiyun 	for (i = 0; i < num_dies; i++) {
351*4882a593Smuzhiyun 		die_offset = le16_to_cpu(ihdr->die_info[i].die_offset);
352*4882a593Smuzhiyun 		dhdr = (struct die_header *)(adev->mman.discovery_bin + die_offset);
353*4882a593Smuzhiyun 		num_ips = le16_to_cpu(dhdr->num_ips);
354*4882a593Smuzhiyun 		ip_offset = die_offset + sizeof(*dhdr);
355*4882a593Smuzhiyun 
356*4882a593Smuzhiyun 		for (j = 0; j < num_ips; j++) {
357*4882a593Smuzhiyun 			ip = (struct ip *)(adev->mman.discovery_bin + ip_offset);
358*4882a593Smuzhiyun 
359*4882a593Smuzhiyun 			if (le16_to_cpu(ip->hw_id) == hw_id) {
360*4882a593Smuzhiyun 				if (major)
361*4882a593Smuzhiyun 					*major = ip->major;
362*4882a593Smuzhiyun 				if (minor)
363*4882a593Smuzhiyun 					*minor = ip->minor;
364*4882a593Smuzhiyun 				if (revision)
365*4882a593Smuzhiyun 					*revision = ip->revision;
366*4882a593Smuzhiyun 				return 0;
367*4882a593Smuzhiyun 			}
368*4882a593Smuzhiyun 			ip_offset += sizeof(*ip) + 4 * (ip->num_base_address - 1);
369*4882a593Smuzhiyun 		}
370*4882a593Smuzhiyun 	}
371*4882a593Smuzhiyun 
372*4882a593Smuzhiyun 	return -EINVAL;
373*4882a593Smuzhiyun }
374*4882a593Smuzhiyun 
375*4882a593Smuzhiyun union gc_info {
376*4882a593Smuzhiyun 	struct gc_info_v1_0 v1;
377*4882a593Smuzhiyun 	struct gc_info_v2_0 v2;
378*4882a593Smuzhiyun };
379*4882a593Smuzhiyun 
amdgpu_discovery_get_gfx_info(struct amdgpu_device * adev)380*4882a593Smuzhiyun int amdgpu_discovery_get_gfx_info(struct amdgpu_device *adev)
381*4882a593Smuzhiyun {
382*4882a593Smuzhiyun 	struct binary_header *bhdr;
383*4882a593Smuzhiyun 	union gc_info *gc_info;
384*4882a593Smuzhiyun 
385*4882a593Smuzhiyun 	if (!adev->mman.discovery_bin) {
386*4882a593Smuzhiyun 		DRM_ERROR("ip discovery uninitialized\n");
387*4882a593Smuzhiyun 		return -EINVAL;
388*4882a593Smuzhiyun 	}
389*4882a593Smuzhiyun 
390*4882a593Smuzhiyun 	bhdr = (struct binary_header *)adev->mman.discovery_bin;
391*4882a593Smuzhiyun 	gc_info = (union gc_info *)(adev->mman.discovery_bin +
392*4882a593Smuzhiyun 			le16_to_cpu(bhdr->table_list[GC].offset));
393*4882a593Smuzhiyun 	switch (gc_info->v1.header.version_major) {
394*4882a593Smuzhiyun 	case 1:
395*4882a593Smuzhiyun 		adev->gfx.config.max_shader_engines = le32_to_cpu(gc_info->v1.gc_num_se);
396*4882a593Smuzhiyun 		adev->gfx.config.max_cu_per_sh = 2 * (le32_to_cpu(gc_info->v1.gc_num_wgp0_per_sa) +
397*4882a593Smuzhiyun 						      le32_to_cpu(gc_info->v1.gc_num_wgp1_per_sa));
398*4882a593Smuzhiyun 		adev->gfx.config.max_sh_per_se = le32_to_cpu(gc_info->v1.gc_num_sa_per_se);
399*4882a593Smuzhiyun 		adev->gfx.config.max_backends_per_se = le32_to_cpu(gc_info->v1.gc_num_rb_per_se);
400*4882a593Smuzhiyun 		adev->gfx.config.max_texture_channel_caches = le32_to_cpu(gc_info->v1.gc_num_gl2c);
401*4882a593Smuzhiyun 		adev->gfx.config.max_gprs = le32_to_cpu(gc_info->v1.gc_num_gprs);
402*4882a593Smuzhiyun 		adev->gfx.config.max_gs_threads = le32_to_cpu(gc_info->v1.gc_num_max_gs_thds);
403*4882a593Smuzhiyun 		adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gc_info->v1.gc_gs_table_depth);
404*4882a593Smuzhiyun 		adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gc_info->v1.gc_gsprim_buff_depth);
405*4882a593Smuzhiyun 		adev->gfx.config.double_offchip_lds_buf = le32_to_cpu(gc_info->v1.gc_double_offchip_lds_buffer);
406*4882a593Smuzhiyun 		adev->gfx.cu_info.wave_front_size = le32_to_cpu(gc_info->v1.gc_wave_size);
407*4882a593Smuzhiyun 		adev->gfx.cu_info.max_waves_per_simd = le32_to_cpu(gc_info->v1.gc_max_waves_per_simd);
408*4882a593Smuzhiyun 		adev->gfx.cu_info.max_scratch_slots_per_cu = le32_to_cpu(gc_info->v1.gc_max_scratch_slots_per_cu);
409*4882a593Smuzhiyun 		adev->gfx.cu_info.lds_size = le32_to_cpu(gc_info->v1.gc_lds_size);
410*4882a593Smuzhiyun 		adev->gfx.config.num_sc_per_sh = le32_to_cpu(gc_info->v1.gc_num_sc_per_se) /
411*4882a593Smuzhiyun 			le32_to_cpu(gc_info->v1.gc_num_sa_per_se);
412*4882a593Smuzhiyun 		adev->gfx.config.num_packer_per_sc = le32_to_cpu(gc_info->v1.gc_num_packer_per_sc);
413*4882a593Smuzhiyun 		break;
414*4882a593Smuzhiyun 	case 2:
415*4882a593Smuzhiyun 		adev->gfx.config.max_shader_engines = le32_to_cpu(gc_info->v2.gc_num_se);
416*4882a593Smuzhiyun 		adev->gfx.config.max_cu_per_sh = le32_to_cpu(gc_info->v2.gc_num_cu_per_sh);
417*4882a593Smuzhiyun 		adev->gfx.config.max_sh_per_se = le32_to_cpu(gc_info->v2.gc_num_sh_per_se);
418*4882a593Smuzhiyun 		adev->gfx.config.max_backends_per_se = le32_to_cpu(gc_info->v2.gc_num_rb_per_se);
419*4882a593Smuzhiyun 		adev->gfx.config.max_texture_channel_caches = le32_to_cpu(gc_info->v2.gc_num_tccs);
420*4882a593Smuzhiyun 		adev->gfx.config.max_gprs = le32_to_cpu(gc_info->v2.gc_num_gprs);
421*4882a593Smuzhiyun 		adev->gfx.config.max_gs_threads = le32_to_cpu(gc_info->v2.gc_num_max_gs_thds);
422*4882a593Smuzhiyun 		adev->gfx.config.gs_vgt_table_depth = le32_to_cpu(gc_info->v2.gc_gs_table_depth);
423*4882a593Smuzhiyun 		adev->gfx.config.gs_prim_buffer_depth = le32_to_cpu(gc_info->v2.gc_gsprim_buff_depth);
424*4882a593Smuzhiyun 		adev->gfx.config.double_offchip_lds_buf = le32_to_cpu(gc_info->v2.gc_double_offchip_lds_buffer);
425*4882a593Smuzhiyun 		adev->gfx.cu_info.wave_front_size = le32_to_cpu(gc_info->v2.gc_wave_size);
426*4882a593Smuzhiyun 		adev->gfx.cu_info.max_waves_per_simd = le32_to_cpu(gc_info->v2.gc_max_waves_per_simd);
427*4882a593Smuzhiyun 		adev->gfx.cu_info.max_scratch_slots_per_cu = le32_to_cpu(gc_info->v2.gc_max_scratch_slots_per_cu);
428*4882a593Smuzhiyun 		adev->gfx.cu_info.lds_size = le32_to_cpu(gc_info->v2.gc_lds_size);
429*4882a593Smuzhiyun 		adev->gfx.config.num_sc_per_sh = le32_to_cpu(gc_info->v2.gc_num_sc_per_se) /
430*4882a593Smuzhiyun 			le32_to_cpu(gc_info->v2.gc_num_sh_per_se);
431*4882a593Smuzhiyun 		adev->gfx.config.num_packer_per_sc = le32_to_cpu(gc_info->v2.gc_num_packer_per_sc);
432*4882a593Smuzhiyun 		break;
433*4882a593Smuzhiyun 	default:
434*4882a593Smuzhiyun 		dev_err(adev->dev,
435*4882a593Smuzhiyun 			"Unhandled GC info table %d.%d\n",
436*4882a593Smuzhiyun 			gc_info->v1.header.version_major,
437*4882a593Smuzhiyun 			gc_info->v1.header.version_minor);
438*4882a593Smuzhiyun 		return -EINVAL;
439*4882a593Smuzhiyun 	}
440*4882a593Smuzhiyun 	return 0;
441*4882a593Smuzhiyun }
442