xref: /OK3568_Linux_fs/kernel/drivers/iommu/intel/dmar.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Copyright (c) 2006, Intel Corporation.
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * Copyright (C) 2006-2008 Intel Corporation
6*4882a593Smuzhiyun  * Author: Ashok Raj <ashok.raj@intel.com>
7*4882a593Smuzhiyun  * Author: Shaohua Li <shaohua.li@intel.com>
8*4882a593Smuzhiyun  * Author: Anil S Keshavamurthy <anil.s.keshavamurthy@intel.com>
9*4882a593Smuzhiyun  *
10*4882a593Smuzhiyun  * This file implements early detection/parsing of Remapping Devices
11*4882a593Smuzhiyun  * reported to OS through BIOS via DMA remapping reporting (DMAR) ACPI
12*4882a593Smuzhiyun  * tables.
13*4882a593Smuzhiyun  *
14*4882a593Smuzhiyun  * These routines are used by both DMA-remapping and Interrupt-remapping
15*4882a593Smuzhiyun  */
16*4882a593Smuzhiyun 
17*4882a593Smuzhiyun #define pr_fmt(fmt)     "DMAR: " fmt
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #include <linux/pci.h>
20*4882a593Smuzhiyun #include <linux/dmar.h>
21*4882a593Smuzhiyun #include <linux/iova.h>
22*4882a593Smuzhiyun #include <linux/intel-iommu.h>
23*4882a593Smuzhiyun #include <linux/timer.h>
24*4882a593Smuzhiyun #include <linux/irq.h>
25*4882a593Smuzhiyun #include <linux/interrupt.h>
26*4882a593Smuzhiyun #include <linux/tboot.h>
27*4882a593Smuzhiyun #include <linux/dmi.h>
28*4882a593Smuzhiyun #include <linux/slab.h>
29*4882a593Smuzhiyun #include <linux/iommu.h>
30*4882a593Smuzhiyun #include <linux/numa.h>
31*4882a593Smuzhiyun #include <linux/limits.h>
32*4882a593Smuzhiyun #include <asm/irq_remapping.h>
33*4882a593Smuzhiyun #include <asm/iommu_table.h>
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun #include "../irq_remapping.h"
36*4882a593Smuzhiyun 
37*4882a593Smuzhiyun typedef int (*dmar_res_handler_t)(struct acpi_dmar_header *, void *);
38*4882a593Smuzhiyun struct dmar_res_callback {
39*4882a593Smuzhiyun 	dmar_res_handler_t	cb[ACPI_DMAR_TYPE_RESERVED];
40*4882a593Smuzhiyun 	void			*arg[ACPI_DMAR_TYPE_RESERVED];
41*4882a593Smuzhiyun 	bool			ignore_unhandled;
42*4882a593Smuzhiyun 	bool			print_entry;
43*4882a593Smuzhiyun };
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun /*
46*4882a593Smuzhiyun  * Assumptions:
47*4882a593Smuzhiyun  * 1) The hotplug framework guarentees that DMAR unit will be hot-added
48*4882a593Smuzhiyun  *    before IO devices managed by that unit.
49*4882a593Smuzhiyun  * 2) The hotplug framework guarantees that DMAR unit will be hot-removed
50*4882a593Smuzhiyun  *    after IO devices managed by that unit.
51*4882a593Smuzhiyun  * 3) Hotplug events are rare.
52*4882a593Smuzhiyun  *
53*4882a593Smuzhiyun  * Locking rules for DMA and interrupt remapping related global data structures:
54*4882a593Smuzhiyun  * 1) Use dmar_global_lock in process context
55*4882a593Smuzhiyun  * 2) Use RCU in interrupt context
56*4882a593Smuzhiyun  */
57*4882a593Smuzhiyun DECLARE_RWSEM(dmar_global_lock);
58*4882a593Smuzhiyun LIST_HEAD(dmar_drhd_units);
59*4882a593Smuzhiyun 
60*4882a593Smuzhiyun struct acpi_table_header * __initdata dmar_tbl;
61*4882a593Smuzhiyun static int dmar_dev_scope_status = 1;
62*4882a593Smuzhiyun static unsigned long dmar_seq_ids[BITS_TO_LONGS(DMAR_UNITS_SUPPORTED)];
63*4882a593Smuzhiyun 
64*4882a593Smuzhiyun static int alloc_iommu(struct dmar_drhd_unit *drhd);
65*4882a593Smuzhiyun static void free_iommu(struct intel_iommu *iommu);
66*4882a593Smuzhiyun 
67*4882a593Smuzhiyun extern const struct iommu_ops intel_iommu_ops;
68*4882a593Smuzhiyun 
dmar_register_drhd_unit(struct dmar_drhd_unit * drhd)69*4882a593Smuzhiyun static void dmar_register_drhd_unit(struct dmar_drhd_unit *drhd)
70*4882a593Smuzhiyun {
71*4882a593Smuzhiyun 	/*
72*4882a593Smuzhiyun 	 * add INCLUDE_ALL at the tail, so scan the list will find it at
73*4882a593Smuzhiyun 	 * the very end.
74*4882a593Smuzhiyun 	 */
75*4882a593Smuzhiyun 	if (drhd->include_all)
76*4882a593Smuzhiyun 		list_add_tail_rcu(&drhd->list, &dmar_drhd_units);
77*4882a593Smuzhiyun 	else
78*4882a593Smuzhiyun 		list_add_rcu(&drhd->list, &dmar_drhd_units);
79*4882a593Smuzhiyun }
80*4882a593Smuzhiyun 
dmar_alloc_dev_scope(void * start,void * end,int * cnt)81*4882a593Smuzhiyun void *dmar_alloc_dev_scope(void *start, void *end, int *cnt)
82*4882a593Smuzhiyun {
83*4882a593Smuzhiyun 	struct acpi_dmar_device_scope *scope;
84*4882a593Smuzhiyun 
85*4882a593Smuzhiyun 	*cnt = 0;
86*4882a593Smuzhiyun 	while (start < end) {
87*4882a593Smuzhiyun 		scope = start;
88*4882a593Smuzhiyun 		if (scope->entry_type == ACPI_DMAR_SCOPE_TYPE_NAMESPACE ||
89*4882a593Smuzhiyun 		    scope->entry_type == ACPI_DMAR_SCOPE_TYPE_ENDPOINT ||
90*4882a593Smuzhiyun 		    scope->entry_type == ACPI_DMAR_SCOPE_TYPE_BRIDGE)
91*4882a593Smuzhiyun 			(*cnt)++;
92*4882a593Smuzhiyun 		else if (scope->entry_type != ACPI_DMAR_SCOPE_TYPE_IOAPIC &&
93*4882a593Smuzhiyun 			scope->entry_type != ACPI_DMAR_SCOPE_TYPE_HPET) {
94*4882a593Smuzhiyun 			pr_warn("Unsupported device scope\n");
95*4882a593Smuzhiyun 		}
96*4882a593Smuzhiyun 		start += scope->length;
97*4882a593Smuzhiyun 	}
98*4882a593Smuzhiyun 	if (*cnt == 0)
99*4882a593Smuzhiyun 		return NULL;
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun 	return kcalloc(*cnt, sizeof(struct dmar_dev_scope), GFP_KERNEL);
102*4882a593Smuzhiyun }
103*4882a593Smuzhiyun 
dmar_free_dev_scope(struct dmar_dev_scope ** devices,int * cnt)104*4882a593Smuzhiyun void dmar_free_dev_scope(struct dmar_dev_scope **devices, int *cnt)
105*4882a593Smuzhiyun {
106*4882a593Smuzhiyun 	int i;
107*4882a593Smuzhiyun 	struct device *tmp_dev;
108*4882a593Smuzhiyun 
109*4882a593Smuzhiyun 	if (*devices && *cnt) {
110*4882a593Smuzhiyun 		for_each_active_dev_scope(*devices, *cnt, i, tmp_dev)
111*4882a593Smuzhiyun 			put_device(tmp_dev);
112*4882a593Smuzhiyun 		kfree(*devices);
113*4882a593Smuzhiyun 	}
114*4882a593Smuzhiyun 
115*4882a593Smuzhiyun 	*devices = NULL;
116*4882a593Smuzhiyun 	*cnt = 0;
117*4882a593Smuzhiyun }
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun /* Optimize out kzalloc()/kfree() for normal cases */
120*4882a593Smuzhiyun static char dmar_pci_notify_info_buf[64];
121*4882a593Smuzhiyun 
122*4882a593Smuzhiyun static struct dmar_pci_notify_info *
dmar_alloc_pci_notify_info(struct pci_dev * dev,unsigned long event)123*4882a593Smuzhiyun dmar_alloc_pci_notify_info(struct pci_dev *dev, unsigned long event)
124*4882a593Smuzhiyun {
125*4882a593Smuzhiyun 	int level = 0;
126*4882a593Smuzhiyun 	size_t size;
127*4882a593Smuzhiyun 	struct pci_dev *tmp;
128*4882a593Smuzhiyun 	struct dmar_pci_notify_info *info;
129*4882a593Smuzhiyun 
130*4882a593Smuzhiyun 	BUG_ON(dev->is_virtfn);
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun 	/*
133*4882a593Smuzhiyun 	 * Ignore devices that have a domain number higher than what can
134*4882a593Smuzhiyun 	 * be looked up in DMAR, e.g. VMD subdevices with domain 0x10000
135*4882a593Smuzhiyun 	 */
136*4882a593Smuzhiyun 	if (pci_domain_nr(dev->bus) > U16_MAX)
137*4882a593Smuzhiyun 		return NULL;
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun 	/* Only generate path[] for device addition event */
140*4882a593Smuzhiyun 	if (event == BUS_NOTIFY_ADD_DEVICE)
141*4882a593Smuzhiyun 		for (tmp = dev; tmp; tmp = tmp->bus->self)
142*4882a593Smuzhiyun 			level++;
143*4882a593Smuzhiyun 
144*4882a593Smuzhiyun 	size = struct_size(info, path, level);
145*4882a593Smuzhiyun 	if (size <= sizeof(dmar_pci_notify_info_buf)) {
146*4882a593Smuzhiyun 		info = (struct dmar_pci_notify_info *)dmar_pci_notify_info_buf;
147*4882a593Smuzhiyun 	} else {
148*4882a593Smuzhiyun 		info = kzalloc(size, GFP_KERNEL);
149*4882a593Smuzhiyun 		if (!info) {
150*4882a593Smuzhiyun 			pr_warn("Out of memory when allocating notify_info "
151*4882a593Smuzhiyun 				"for %s.\n", pci_name(dev));
152*4882a593Smuzhiyun 			if (dmar_dev_scope_status == 0)
153*4882a593Smuzhiyun 				dmar_dev_scope_status = -ENOMEM;
154*4882a593Smuzhiyun 			return NULL;
155*4882a593Smuzhiyun 		}
156*4882a593Smuzhiyun 	}
157*4882a593Smuzhiyun 
158*4882a593Smuzhiyun 	info->event = event;
159*4882a593Smuzhiyun 	info->dev = dev;
160*4882a593Smuzhiyun 	info->seg = pci_domain_nr(dev->bus);
161*4882a593Smuzhiyun 	info->level = level;
162*4882a593Smuzhiyun 	if (event == BUS_NOTIFY_ADD_DEVICE) {
163*4882a593Smuzhiyun 		for (tmp = dev; tmp; tmp = tmp->bus->self) {
164*4882a593Smuzhiyun 			level--;
165*4882a593Smuzhiyun 			info->path[level].bus = tmp->bus->number;
166*4882a593Smuzhiyun 			info->path[level].device = PCI_SLOT(tmp->devfn);
167*4882a593Smuzhiyun 			info->path[level].function = PCI_FUNC(tmp->devfn);
168*4882a593Smuzhiyun 			if (pci_is_root_bus(tmp->bus))
169*4882a593Smuzhiyun 				info->bus = tmp->bus->number;
170*4882a593Smuzhiyun 		}
171*4882a593Smuzhiyun 	}
172*4882a593Smuzhiyun 
173*4882a593Smuzhiyun 	return info;
174*4882a593Smuzhiyun }
175*4882a593Smuzhiyun 
dmar_free_pci_notify_info(struct dmar_pci_notify_info * info)176*4882a593Smuzhiyun static inline void dmar_free_pci_notify_info(struct dmar_pci_notify_info *info)
177*4882a593Smuzhiyun {
178*4882a593Smuzhiyun 	if ((void *)info != dmar_pci_notify_info_buf)
179*4882a593Smuzhiyun 		kfree(info);
180*4882a593Smuzhiyun }
181*4882a593Smuzhiyun 
dmar_match_pci_path(struct dmar_pci_notify_info * info,int bus,struct acpi_dmar_pci_path * path,int count)182*4882a593Smuzhiyun static bool dmar_match_pci_path(struct dmar_pci_notify_info *info, int bus,
183*4882a593Smuzhiyun 				struct acpi_dmar_pci_path *path, int count)
184*4882a593Smuzhiyun {
185*4882a593Smuzhiyun 	int i;
186*4882a593Smuzhiyun 
187*4882a593Smuzhiyun 	if (info->bus != bus)
188*4882a593Smuzhiyun 		goto fallback;
189*4882a593Smuzhiyun 	if (info->level != count)
190*4882a593Smuzhiyun 		goto fallback;
191*4882a593Smuzhiyun 
192*4882a593Smuzhiyun 	for (i = 0; i < count; i++) {
193*4882a593Smuzhiyun 		if (path[i].device != info->path[i].device ||
194*4882a593Smuzhiyun 		    path[i].function != info->path[i].function)
195*4882a593Smuzhiyun 			goto fallback;
196*4882a593Smuzhiyun 	}
197*4882a593Smuzhiyun 
198*4882a593Smuzhiyun 	return true;
199*4882a593Smuzhiyun 
200*4882a593Smuzhiyun fallback:
201*4882a593Smuzhiyun 
202*4882a593Smuzhiyun 	if (count != 1)
203*4882a593Smuzhiyun 		return false;
204*4882a593Smuzhiyun 
205*4882a593Smuzhiyun 	i = info->level - 1;
206*4882a593Smuzhiyun 	if (bus              == info->path[i].bus &&
207*4882a593Smuzhiyun 	    path[0].device   == info->path[i].device &&
208*4882a593Smuzhiyun 	    path[0].function == info->path[i].function) {
209*4882a593Smuzhiyun 		pr_info(FW_BUG "RMRR entry for device %02x:%02x.%x is broken - applying workaround\n",
210*4882a593Smuzhiyun 			bus, path[0].device, path[0].function);
211*4882a593Smuzhiyun 		return true;
212*4882a593Smuzhiyun 	}
213*4882a593Smuzhiyun 
214*4882a593Smuzhiyun 	return false;
215*4882a593Smuzhiyun }
216*4882a593Smuzhiyun 
217*4882a593Smuzhiyun /* Return: > 0 if match found, 0 if no match found, < 0 if error happens */
dmar_insert_dev_scope(struct dmar_pci_notify_info * info,void * start,void * end,u16 segment,struct dmar_dev_scope * devices,int devices_cnt)218*4882a593Smuzhiyun int dmar_insert_dev_scope(struct dmar_pci_notify_info *info,
219*4882a593Smuzhiyun 			  void *start, void*end, u16 segment,
220*4882a593Smuzhiyun 			  struct dmar_dev_scope *devices,
221*4882a593Smuzhiyun 			  int devices_cnt)
222*4882a593Smuzhiyun {
223*4882a593Smuzhiyun 	int i, level;
224*4882a593Smuzhiyun 	struct device *tmp, *dev = &info->dev->dev;
225*4882a593Smuzhiyun 	struct acpi_dmar_device_scope *scope;
226*4882a593Smuzhiyun 	struct acpi_dmar_pci_path *path;
227*4882a593Smuzhiyun 
228*4882a593Smuzhiyun 	if (segment != info->seg)
229*4882a593Smuzhiyun 		return 0;
230*4882a593Smuzhiyun 
231*4882a593Smuzhiyun 	for (; start < end; start += scope->length) {
232*4882a593Smuzhiyun 		scope = start;
233*4882a593Smuzhiyun 		if (scope->entry_type != ACPI_DMAR_SCOPE_TYPE_ENDPOINT &&
234*4882a593Smuzhiyun 		    scope->entry_type != ACPI_DMAR_SCOPE_TYPE_BRIDGE)
235*4882a593Smuzhiyun 			continue;
236*4882a593Smuzhiyun 
237*4882a593Smuzhiyun 		path = (struct acpi_dmar_pci_path *)(scope + 1);
238*4882a593Smuzhiyun 		level = (scope->length - sizeof(*scope)) / sizeof(*path);
239*4882a593Smuzhiyun 		if (!dmar_match_pci_path(info, scope->bus, path, level))
240*4882a593Smuzhiyun 			continue;
241*4882a593Smuzhiyun 
242*4882a593Smuzhiyun 		/*
243*4882a593Smuzhiyun 		 * We expect devices with endpoint scope to have normal PCI
244*4882a593Smuzhiyun 		 * headers, and devices with bridge scope to have bridge PCI
245*4882a593Smuzhiyun 		 * headers.  However PCI NTB devices may be listed in the
246*4882a593Smuzhiyun 		 * DMAR table with bridge scope, even though they have a
247*4882a593Smuzhiyun 		 * normal PCI header.  NTB devices are identified by class
248*4882a593Smuzhiyun 		 * "BRIDGE_OTHER" (0680h) - we don't declare a socpe mismatch
249*4882a593Smuzhiyun 		 * for this special case.
250*4882a593Smuzhiyun 		 */
251*4882a593Smuzhiyun 		if ((scope->entry_type == ACPI_DMAR_SCOPE_TYPE_ENDPOINT &&
252*4882a593Smuzhiyun 		     info->dev->hdr_type != PCI_HEADER_TYPE_NORMAL) ||
253*4882a593Smuzhiyun 		    (scope->entry_type == ACPI_DMAR_SCOPE_TYPE_BRIDGE &&
254*4882a593Smuzhiyun 		     (info->dev->hdr_type == PCI_HEADER_TYPE_NORMAL &&
255*4882a593Smuzhiyun 		      info->dev->class >> 16 != PCI_BASE_CLASS_BRIDGE))) {
256*4882a593Smuzhiyun 			pr_warn("Device scope type does not match for %s\n",
257*4882a593Smuzhiyun 				pci_name(info->dev));
258*4882a593Smuzhiyun 			return -EINVAL;
259*4882a593Smuzhiyun 		}
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun 		for_each_dev_scope(devices, devices_cnt, i, tmp)
262*4882a593Smuzhiyun 			if (tmp == NULL) {
263*4882a593Smuzhiyun 				devices[i].bus = info->dev->bus->number;
264*4882a593Smuzhiyun 				devices[i].devfn = info->dev->devfn;
265*4882a593Smuzhiyun 				rcu_assign_pointer(devices[i].dev,
266*4882a593Smuzhiyun 						   get_device(dev));
267*4882a593Smuzhiyun 				return 1;
268*4882a593Smuzhiyun 			}
269*4882a593Smuzhiyun 		BUG_ON(i >= devices_cnt);
270*4882a593Smuzhiyun 	}
271*4882a593Smuzhiyun 
272*4882a593Smuzhiyun 	return 0;
273*4882a593Smuzhiyun }
274*4882a593Smuzhiyun 
dmar_remove_dev_scope(struct dmar_pci_notify_info * info,u16 segment,struct dmar_dev_scope * devices,int count)275*4882a593Smuzhiyun int dmar_remove_dev_scope(struct dmar_pci_notify_info *info, u16 segment,
276*4882a593Smuzhiyun 			  struct dmar_dev_scope *devices, int count)
277*4882a593Smuzhiyun {
278*4882a593Smuzhiyun 	int index;
279*4882a593Smuzhiyun 	struct device *tmp;
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 	if (info->seg != segment)
282*4882a593Smuzhiyun 		return 0;
283*4882a593Smuzhiyun 
284*4882a593Smuzhiyun 	for_each_active_dev_scope(devices, count, index, tmp)
285*4882a593Smuzhiyun 		if (tmp == &info->dev->dev) {
286*4882a593Smuzhiyun 			RCU_INIT_POINTER(devices[index].dev, NULL);
287*4882a593Smuzhiyun 			synchronize_rcu();
288*4882a593Smuzhiyun 			put_device(tmp);
289*4882a593Smuzhiyun 			return 1;
290*4882a593Smuzhiyun 		}
291*4882a593Smuzhiyun 
292*4882a593Smuzhiyun 	return 0;
293*4882a593Smuzhiyun }
294*4882a593Smuzhiyun 
dmar_pci_bus_add_dev(struct dmar_pci_notify_info * info)295*4882a593Smuzhiyun static int dmar_pci_bus_add_dev(struct dmar_pci_notify_info *info)
296*4882a593Smuzhiyun {
297*4882a593Smuzhiyun 	int ret = 0;
298*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
299*4882a593Smuzhiyun 	struct acpi_dmar_hardware_unit *drhd;
300*4882a593Smuzhiyun 
301*4882a593Smuzhiyun 	for_each_drhd_unit(dmaru) {
302*4882a593Smuzhiyun 		if (dmaru->include_all)
303*4882a593Smuzhiyun 			continue;
304*4882a593Smuzhiyun 
305*4882a593Smuzhiyun 		drhd = container_of(dmaru->hdr,
306*4882a593Smuzhiyun 				    struct acpi_dmar_hardware_unit, header);
307*4882a593Smuzhiyun 		ret = dmar_insert_dev_scope(info, (void *)(drhd + 1),
308*4882a593Smuzhiyun 				((void *)drhd) + drhd->header.length,
309*4882a593Smuzhiyun 				dmaru->segment,
310*4882a593Smuzhiyun 				dmaru->devices, dmaru->devices_cnt);
311*4882a593Smuzhiyun 		if (ret)
312*4882a593Smuzhiyun 			break;
313*4882a593Smuzhiyun 	}
314*4882a593Smuzhiyun 	if (ret >= 0)
315*4882a593Smuzhiyun 		ret = dmar_iommu_notify_scope_dev(info);
316*4882a593Smuzhiyun 	if (ret < 0 && dmar_dev_scope_status == 0)
317*4882a593Smuzhiyun 		dmar_dev_scope_status = ret;
318*4882a593Smuzhiyun 
319*4882a593Smuzhiyun 	if (ret >= 0)
320*4882a593Smuzhiyun 		intel_irq_remap_add_device(info);
321*4882a593Smuzhiyun 
322*4882a593Smuzhiyun 	return ret;
323*4882a593Smuzhiyun }
324*4882a593Smuzhiyun 
dmar_pci_bus_del_dev(struct dmar_pci_notify_info * info)325*4882a593Smuzhiyun static void  dmar_pci_bus_del_dev(struct dmar_pci_notify_info *info)
326*4882a593Smuzhiyun {
327*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
328*4882a593Smuzhiyun 
329*4882a593Smuzhiyun 	for_each_drhd_unit(dmaru)
330*4882a593Smuzhiyun 		if (dmar_remove_dev_scope(info, dmaru->segment,
331*4882a593Smuzhiyun 			dmaru->devices, dmaru->devices_cnt))
332*4882a593Smuzhiyun 			break;
333*4882a593Smuzhiyun 	dmar_iommu_notify_scope_dev(info);
334*4882a593Smuzhiyun }
335*4882a593Smuzhiyun 
vf_inherit_msi_domain(struct pci_dev * pdev)336*4882a593Smuzhiyun static inline void vf_inherit_msi_domain(struct pci_dev *pdev)
337*4882a593Smuzhiyun {
338*4882a593Smuzhiyun 	struct pci_dev *physfn = pci_physfn(pdev);
339*4882a593Smuzhiyun 
340*4882a593Smuzhiyun 	dev_set_msi_domain(&pdev->dev, dev_get_msi_domain(&physfn->dev));
341*4882a593Smuzhiyun }
342*4882a593Smuzhiyun 
dmar_pci_bus_notifier(struct notifier_block * nb,unsigned long action,void * data)343*4882a593Smuzhiyun static int dmar_pci_bus_notifier(struct notifier_block *nb,
344*4882a593Smuzhiyun 				 unsigned long action, void *data)
345*4882a593Smuzhiyun {
346*4882a593Smuzhiyun 	struct pci_dev *pdev = to_pci_dev(data);
347*4882a593Smuzhiyun 	struct dmar_pci_notify_info *info;
348*4882a593Smuzhiyun 
349*4882a593Smuzhiyun 	/* Only care about add/remove events for physical functions.
350*4882a593Smuzhiyun 	 * For VFs we actually do the lookup based on the corresponding
351*4882a593Smuzhiyun 	 * PF in device_to_iommu() anyway. */
352*4882a593Smuzhiyun 	if (pdev->is_virtfn) {
353*4882a593Smuzhiyun 		/*
354*4882a593Smuzhiyun 		 * Ensure that the VF device inherits the irq domain of the
355*4882a593Smuzhiyun 		 * PF device. Ideally the device would inherit the domain
356*4882a593Smuzhiyun 		 * from the bus, but DMAR can have multiple units per bus
357*4882a593Smuzhiyun 		 * which makes this impossible. The VF 'bus' could inherit
358*4882a593Smuzhiyun 		 * from the PF device, but that's yet another x86'sism to
359*4882a593Smuzhiyun 		 * inflict on everybody else.
360*4882a593Smuzhiyun 		 */
361*4882a593Smuzhiyun 		if (action == BUS_NOTIFY_ADD_DEVICE)
362*4882a593Smuzhiyun 			vf_inherit_msi_domain(pdev);
363*4882a593Smuzhiyun 		return NOTIFY_DONE;
364*4882a593Smuzhiyun 	}
365*4882a593Smuzhiyun 
366*4882a593Smuzhiyun 	if (action != BUS_NOTIFY_ADD_DEVICE &&
367*4882a593Smuzhiyun 	    action != BUS_NOTIFY_REMOVED_DEVICE)
368*4882a593Smuzhiyun 		return NOTIFY_DONE;
369*4882a593Smuzhiyun 
370*4882a593Smuzhiyun 	info = dmar_alloc_pci_notify_info(pdev, action);
371*4882a593Smuzhiyun 	if (!info)
372*4882a593Smuzhiyun 		return NOTIFY_DONE;
373*4882a593Smuzhiyun 
374*4882a593Smuzhiyun 	down_write(&dmar_global_lock);
375*4882a593Smuzhiyun 	if (action == BUS_NOTIFY_ADD_DEVICE)
376*4882a593Smuzhiyun 		dmar_pci_bus_add_dev(info);
377*4882a593Smuzhiyun 	else if (action == BUS_NOTIFY_REMOVED_DEVICE)
378*4882a593Smuzhiyun 		dmar_pci_bus_del_dev(info);
379*4882a593Smuzhiyun 	up_write(&dmar_global_lock);
380*4882a593Smuzhiyun 
381*4882a593Smuzhiyun 	dmar_free_pci_notify_info(info);
382*4882a593Smuzhiyun 
383*4882a593Smuzhiyun 	return NOTIFY_OK;
384*4882a593Smuzhiyun }
385*4882a593Smuzhiyun 
386*4882a593Smuzhiyun static struct notifier_block dmar_pci_bus_nb = {
387*4882a593Smuzhiyun 	.notifier_call = dmar_pci_bus_notifier,
388*4882a593Smuzhiyun 	.priority = 1,
389*4882a593Smuzhiyun };
390*4882a593Smuzhiyun 
391*4882a593Smuzhiyun static struct dmar_drhd_unit *
dmar_find_dmaru(struct acpi_dmar_hardware_unit * drhd)392*4882a593Smuzhiyun dmar_find_dmaru(struct acpi_dmar_hardware_unit *drhd)
393*4882a593Smuzhiyun {
394*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
395*4882a593Smuzhiyun 
396*4882a593Smuzhiyun 	list_for_each_entry_rcu(dmaru, &dmar_drhd_units, list,
397*4882a593Smuzhiyun 				dmar_rcu_check())
398*4882a593Smuzhiyun 		if (dmaru->segment == drhd->segment &&
399*4882a593Smuzhiyun 		    dmaru->reg_base_addr == drhd->address)
400*4882a593Smuzhiyun 			return dmaru;
401*4882a593Smuzhiyun 
402*4882a593Smuzhiyun 	return NULL;
403*4882a593Smuzhiyun }
404*4882a593Smuzhiyun 
405*4882a593Smuzhiyun /*
406*4882a593Smuzhiyun  * dmar_parse_one_drhd - parses exactly one DMA remapping hardware definition
407*4882a593Smuzhiyun  * structure which uniquely represent one DMA remapping hardware unit
408*4882a593Smuzhiyun  * present in the platform
409*4882a593Smuzhiyun  */
dmar_parse_one_drhd(struct acpi_dmar_header * header,void * arg)410*4882a593Smuzhiyun static int dmar_parse_one_drhd(struct acpi_dmar_header *header, void *arg)
411*4882a593Smuzhiyun {
412*4882a593Smuzhiyun 	struct acpi_dmar_hardware_unit *drhd;
413*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
414*4882a593Smuzhiyun 	int ret;
415*4882a593Smuzhiyun 
416*4882a593Smuzhiyun 	drhd = (struct acpi_dmar_hardware_unit *)header;
417*4882a593Smuzhiyun 	dmaru = dmar_find_dmaru(drhd);
418*4882a593Smuzhiyun 	if (dmaru)
419*4882a593Smuzhiyun 		goto out;
420*4882a593Smuzhiyun 
421*4882a593Smuzhiyun 	dmaru = kzalloc(sizeof(*dmaru) + header->length, GFP_KERNEL);
422*4882a593Smuzhiyun 	if (!dmaru)
423*4882a593Smuzhiyun 		return -ENOMEM;
424*4882a593Smuzhiyun 
425*4882a593Smuzhiyun 	/*
426*4882a593Smuzhiyun 	 * If header is allocated from slab by ACPI _DSM method, we need to
427*4882a593Smuzhiyun 	 * copy the content because the memory buffer will be freed on return.
428*4882a593Smuzhiyun 	 */
429*4882a593Smuzhiyun 	dmaru->hdr = (void *)(dmaru + 1);
430*4882a593Smuzhiyun 	memcpy(dmaru->hdr, header, header->length);
431*4882a593Smuzhiyun 	dmaru->reg_base_addr = drhd->address;
432*4882a593Smuzhiyun 	dmaru->segment = drhd->segment;
433*4882a593Smuzhiyun 	dmaru->include_all = drhd->flags & 0x1; /* BIT0: INCLUDE_ALL */
434*4882a593Smuzhiyun 	dmaru->devices = dmar_alloc_dev_scope((void *)(drhd + 1),
435*4882a593Smuzhiyun 					      ((void *)drhd) + drhd->header.length,
436*4882a593Smuzhiyun 					      &dmaru->devices_cnt);
437*4882a593Smuzhiyun 	if (dmaru->devices_cnt && dmaru->devices == NULL) {
438*4882a593Smuzhiyun 		kfree(dmaru);
439*4882a593Smuzhiyun 		return -ENOMEM;
440*4882a593Smuzhiyun 	}
441*4882a593Smuzhiyun 
442*4882a593Smuzhiyun 	ret = alloc_iommu(dmaru);
443*4882a593Smuzhiyun 	if (ret) {
444*4882a593Smuzhiyun 		dmar_free_dev_scope(&dmaru->devices,
445*4882a593Smuzhiyun 				    &dmaru->devices_cnt);
446*4882a593Smuzhiyun 		kfree(dmaru);
447*4882a593Smuzhiyun 		return ret;
448*4882a593Smuzhiyun 	}
449*4882a593Smuzhiyun 	dmar_register_drhd_unit(dmaru);
450*4882a593Smuzhiyun 
451*4882a593Smuzhiyun out:
452*4882a593Smuzhiyun 	if (arg)
453*4882a593Smuzhiyun 		(*(int *)arg)++;
454*4882a593Smuzhiyun 
455*4882a593Smuzhiyun 	return 0;
456*4882a593Smuzhiyun }
457*4882a593Smuzhiyun 
dmar_free_drhd(struct dmar_drhd_unit * dmaru)458*4882a593Smuzhiyun static void dmar_free_drhd(struct dmar_drhd_unit *dmaru)
459*4882a593Smuzhiyun {
460*4882a593Smuzhiyun 	if (dmaru->devices && dmaru->devices_cnt)
461*4882a593Smuzhiyun 		dmar_free_dev_scope(&dmaru->devices, &dmaru->devices_cnt);
462*4882a593Smuzhiyun 	if (dmaru->iommu)
463*4882a593Smuzhiyun 		free_iommu(dmaru->iommu);
464*4882a593Smuzhiyun 	kfree(dmaru);
465*4882a593Smuzhiyun }
466*4882a593Smuzhiyun 
dmar_parse_one_andd(struct acpi_dmar_header * header,void * arg)467*4882a593Smuzhiyun static int __init dmar_parse_one_andd(struct acpi_dmar_header *header,
468*4882a593Smuzhiyun 				      void *arg)
469*4882a593Smuzhiyun {
470*4882a593Smuzhiyun 	struct acpi_dmar_andd *andd = (void *)header;
471*4882a593Smuzhiyun 
472*4882a593Smuzhiyun 	/* Check for NUL termination within the designated length */
473*4882a593Smuzhiyun 	if (strnlen(andd->device_name, header->length - 8) == header->length - 8) {
474*4882a593Smuzhiyun 		pr_warn(FW_BUG
475*4882a593Smuzhiyun 			   "Your BIOS is broken; ANDD object name is not NUL-terminated\n"
476*4882a593Smuzhiyun 			   "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
477*4882a593Smuzhiyun 			   dmi_get_system_info(DMI_BIOS_VENDOR),
478*4882a593Smuzhiyun 			   dmi_get_system_info(DMI_BIOS_VERSION),
479*4882a593Smuzhiyun 			   dmi_get_system_info(DMI_PRODUCT_VERSION));
480*4882a593Smuzhiyun 		add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK);
481*4882a593Smuzhiyun 		return -EINVAL;
482*4882a593Smuzhiyun 	}
483*4882a593Smuzhiyun 	pr_info("ANDD device: %x name: %s\n", andd->device_number,
484*4882a593Smuzhiyun 		andd->device_name);
485*4882a593Smuzhiyun 
486*4882a593Smuzhiyun 	return 0;
487*4882a593Smuzhiyun }
488*4882a593Smuzhiyun 
489*4882a593Smuzhiyun #ifdef CONFIG_ACPI_NUMA
dmar_parse_one_rhsa(struct acpi_dmar_header * header,void * arg)490*4882a593Smuzhiyun static int dmar_parse_one_rhsa(struct acpi_dmar_header *header, void *arg)
491*4882a593Smuzhiyun {
492*4882a593Smuzhiyun 	struct acpi_dmar_rhsa *rhsa;
493*4882a593Smuzhiyun 	struct dmar_drhd_unit *drhd;
494*4882a593Smuzhiyun 
495*4882a593Smuzhiyun 	rhsa = (struct acpi_dmar_rhsa *)header;
496*4882a593Smuzhiyun 	for_each_drhd_unit(drhd) {
497*4882a593Smuzhiyun 		if (drhd->reg_base_addr == rhsa->base_address) {
498*4882a593Smuzhiyun 			int node = pxm_to_node(rhsa->proximity_domain);
499*4882a593Smuzhiyun 
500*4882a593Smuzhiyun 			if (node != NUMA_NO_NODE && !node_online(node))
501*4882a593Smuzhiyun 				node = NUMA_NO_NODE;
502*4882a593Smuzhiyun 			drhd->iommu->node = node;
503*4882a593Smuzhiyun 			return 0;
504*4882a593Smuzhiyun 		}
505*4882a593Smuzhiyun 	}
506*4882a593Smuzhiyun 	pr_warn(FW_BUG
507*4882a593Smuzhiyun 		"Your BIOS is broken; RHSA refers to non-existent DMAR unit at %llx\n"
508*4882a593Smuzhiyun 		"BIOS vendor: %s; Ver: %s; Product Version: %s\n",
509*4882a593Smuzhiyun 		rhsa->base_address,
510*4882a593Smuzhiyun 		dmi_get_system_info(DMI_BIOS_VENDOR),
511*4882a593Smuzhiyun 		dmi_get_system_info(DMI_BIOS_VERSION),
512*4882a593Smuzhiyun 		dmi_get_system_info(DMI_PRODUCT_VERSION));
513*4882a593Smuzhiyun 	add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK);
514*4882a593Smuzhiyun 
515*4882a593Smuzhiyun 	return 0;
516*4882a593Smuzhiyun }
517*4882a593Smuzhiyun #else
518*4882a593Smuzhiyun #define	dmar_parse_one_rhsa		dmar_res_noop
519*4882a593Smuzhiyun #endif
520*4882a593Smuzhiyun 
521*4882a593Smuzhiyun static void
dmar_table_print_dmar_entry(struct acpi_dmar_header * header)522*4882a593Smuzhiyun dmar_table_print_dmar_entry(struct acpi_dmar_header *header)
523*4882a593Smuzhiyun {
524*4882a593Smuzhiyun 	struct acpi_dmar_hardware_unit *drhd;
525*4882a593Smuzhiyun 	struct acpi_dmar_reserved_memory *rmrr;
526*4882a593Smuzhiyun 	struct acpi_dmar_atsr *atsr;
527*4882a593Smuzhiyun 	struct acpi_dmar_rhsa *rhsa;
528*4882a593Smuzhiyun 
529*4882a593Smuzhiyun 	switch (header->type) {
530*4882a593Smuzhiyun 	case ACPI_DMAR_TYPE_HARDWARE_UNIT:
531*4882a593Smuzhiyun 		drhd = container_of(header, struct acpi_dmar_hardware_unit,
532*4882a593Smuzhiyun 				    header);
533*4882a593Smuzhiyun 		pr_info("DRHD base: %#016Lx flags: %#x\n",
534*4882a593Smuzhiyun 			(unsigned long long)drhd->address, drhd->flags);
535*4882a593Smuzhiyun 		break;
536*4882a593Smuzhiyun 	case ACPI_DMAR_TYPE_RESERVED_MEMORY:
537*4882a593Smuzhiyun 		rmrr = container_of(header, struct acpi_dmar_reserved_memory,
538*4882a593Smuzhiyun 				    header);
539*4882a593Smuzhiyun 		pr_info("RMRR base: %#016Lx end: %#016Lx\n",
540*4882a593Smuzhiyun 			(unsigned long long)rmrr->base_address,
541*4882a593Smuzhiyun 			(unsigned long long)rmrr->end_address);
542*4882a593Smuzhiyun 		break;
543*4882a593Smuzhiyun 	case ACPI_DMAR_TYPE_ROOT_ATS:
544*4882a593Smuzhiyun 		atsr = container_of(header, struct acpi_dmar_atsr, header);
545*4882a593Smuzhiyun 		pr_info("ATSR flags: %#x\n", atsr->flags);
546*4882a593Smuzhiyun 		break;
547*4882a593Smuzhiyun 	case ACPI_DMAR_TYPE_HARDWARE_AFFINITY:
548*4882a593Smuzhiyun 		rhsa = container_of(header, struct acpi_dmar_rhsa, header);
549*4882a593Smuzhiyun 		pr_info("RHSA base: %#016Lx proximity domain: %#x\n",
550*4882a593Smuzhiyun 		       (unsigned long long)rhsa->base_address,
551*4882a593Smuzhiyun 		       rhsa->proximity_domain);
552*4882a593Smuzhiyun 		break;
553*4882a593Smuzhiyun 	case ACPI_DMAR_TYPE_NAMESPACE:
554*4882a593Smuzhiyun 		/* We don't print this here because we need to sanity-check
555*4882a593Smuzhiyun 		   it first. So print it in dmar_parse_one_andd() instead. */
556*4882a593Smuzhiyun 		break;
557*4882a593Smuzhiyun 	}
558*4882a593Smuzhiyun }
559*4882a593Smuzhiyun 
560*4882a593Smuzhiyun /**
561*4882a593Smuzhiyun  * dmar_table_detect - checks to see if the platform supports DMAR devices
562*4882a593Smuzhiyun  */
dmar_table_detect(void)563*4882a593Smuzhiyun static int __init dmar_table_detect(void)
564*4882a593Smuzhiyun {
565*4882a593Smuzhiyun 	acpi_status status = AE_OK;
566*4882a593Smuzhiyun 
567*4882a593Smuzhiyun 	/* if we could find DMAR table, then there are DMAR devices */
568*4882a593Smuzhiyun 	status = acpi_get_table(ACPI_SIG_DMAR, 0, &dmar_tbl);
569*4882a593Smuzhiyun 
570*4882a593Smuzhiyun 	if (ACPI_SUCCESS(status) && !dmar_tbl) {
571*4882a593Smuzhiyun 		pr_warn("Unable to map DMAR\n");
572*4882a593Smuzhiyun 		status = AE_NOT_FOUND;
573*4882a593Smuzhiyun 	}
574*4882a593Smuzhiyun 
575*4882a593Smuzhiyun 	return ACPI_SUCCESS(status) ? 0 : -ENOENT;
576*4882a593Smuzhiyun }
577*4882a593Smuzhiyun 
dmar_walk_remapping_entries(struct acpi_dmar_header * start,size_t len,struct dmar_res_callback * cb)578*4882a593Smuzhiyun static int dmar_walk_remapping_entries(struct acpi_dmar_header *start,
579*4882a593Smuzhiyun 				       size_t len, struct dmar_res_callback *cb)
580*4882a593Smuzhiyun {
581*4882a593Smuzhiyun 	struct acpi_dmar_header *iter, *next;
582*4882a593Smuzhiyun 	struct acpi_dmar_header *end = ((void *)start) + len;
583*4882a593Smuzhiyun 
584*4882a593Smuzhiyun 	for (iter = start; iter < end; iter = next) {
585*4882a593Smuzhiyun 		next = (void *)iter + iter->length;
586*4882a593Smuzhiyun 		if (iter->length == 0) {
587*4882a593Smuzhiyun 			/* Avoid looping forever on bad ACPI tables */
588*4882a593Smuzhiyun 			pr_debug(FW_BUG "Invalid 0-length structure\n");
589*4882a593Smuzhiyun 			break;
590*4882a593Smuzhiyun 		} else if (next > end) {
591*4882a593Smuzhiyun 			/* Avoid passing table end */
592*4882a593Smuzhiyun 			pr_warn(FW_BUG "Record passes table end\n");
593*4882a593Smuzhiyun 			return -EINVAL;
594*4882a593Smuzhiyun 		}
595*4882a593Smuzhiyun 
596*4882a593Smuzhiyun 		if (cb->print_entry)
597*4882a593Smuzhiyun 			dmar_table_print_dmar_entry(iter);
598*4882a593Smuzhiyun 
599*4882a593Smuzhiyun 		if (iter->type >= ACPI_DMAR_TYPE_RESERVED) {
600*4882a593Smuzhiyun 			/* continue for forward compatibility */
601*4882a593Smuzhiyun 			pr_debug("Unknown DMAR structure type %d\n",
602*4882a593Smuzhiyun 				 iter->type);
603*4882a593Smuzhiyun 		} else if (cb->cb[iter->type]) {
604*4882a593Smuzhiyun 			int ret;
605*4882a593Smuzhiyun 
606*4882a593Smuzhiyun 			ret = cb->cb[iter->type](iter, cb->arg[iter->type]);
607*4882a593Smuzhiyun 			if (ret)
608*4882a593Smuzhiyun 				return ret;
609*4882a593Smuzhiyun 		} else if (!cb->ignore_unhandled) {
610*4882a593Smuzhiyun 			pr_warn("No handler for DMAR structure type %d\n",
611*4882a593Smuzhiyun 				iter->type);
612*4882a593Smuzhiyun 			return -EINVAL;
613*4882a593Smuzhiyun 		}
614*4882a593Smuzhiyun 	}
615*4882a593Smuzhiyun 
616*4882a593Smuzhiyun 	return 0;
617*4882a593Smuzhiyun }
618*4882a593Smuzhiyun 
dmar_walk_dmar_table(struct acpi_table_dmar * dmar,struct dmar_res_callback * cb)619*4882a593Smuzhiyun static inline int dmar_walk_dmar_table(struct acpi_table_dmar *dmar,
620*4882a593Smuzhiyun 				       struct dmar_res_callback *cb)
621*4882a593Smuzhiyun {
622*4882a593Smuzhiyun 	return dmar_walk_remapping_entries((void *)(dmar + 1),
623*4882a593Smuzhiyun 			dmar->header.length - sizeof(*dmar), cb);
624*4882a593Smuzhiyun }
625*4882a593Smuzhiyun 
626*4882a593Smuzhiyun /**
627*4882a593Smuzhiyun  * parse_dmar_table - parses the DMA reporting table
628*4882a593Smuzhiyun  */
629*4882a593Smuzhiyun static int __init
parse_dmar_table(void)630*4882a593Smuzhiyun parse_dmar_table(void)
631*4882a593Smuzhiyun {
632*4882a593Smuzhiyun 	struct acpi_table_dmar *dmar;
633*4882a593Smuzhiyun 	int drhd_count = 0;
634*4882a593Smuzhiyun 	int ret;
635*4882a593Smuzhiyun 	struct dmar_res_callback cb = {
636*4882a593Smuzhiyun 		.print_entry = true,
637*4882a593Smuzhiyun 		.ignore_unhandled = true,
638*4882a593Smuzhiyun 		.arg[ACPI_DMAR_TYPE_HARDWARE_UNIT] = &drhd_count,
639*4882a593Smuzhiyun 		.cb[ACPI_DMAR_TYPE_HARDWARE_UNIT] = &dmar_parse_one_drhd,
640*4882a593Smuzhiyun 		.cb[ACPI_DMAR_TYPE_RESERVED_MEMORY] = &dmar_parse_one_rmrr,
641*4882a593Smuzhiyun 		.cb[ACPI_DMAR_TYPE_ROOT_ATS] = &dmar_parse_one_atsr,
642*4882a593Smuzhiyun 		.cb[ACPI_DMAR_TYPE_HARDWARE_AFFINITY] = &dmar_parse_one_rhsa,
643*4882a593Smuzhiyun 		.cb[ACPI_DMAR_TYPE_NAMESPACE] = &dmar_parse_one_andd,
644*4882a593Smuzhiyun 	};
645*4882a593Smuzhiyun 
646*4882a593Smuzhiyun 	/*
647*4882a593Smuzhiyun 	 * Do it again, earlier dmar_tbl mapping could be mapped with
648*4882a593Smuzhiyun 	 * fixed map.
649*4882a593Smuzhiyun 	 */
650*4882a593Smuzhiyun 	dmar_table_detect();
651*4882a593Smuzhiyun 
652*4882a593Smuzhiyun 	/*
653*4882a593Smuzhiyun 	 * ACPI tables may not be DMA protected by tboot, so use DMAR copy
654*4882a593Smuzhiyun 	 * SINIT saved in SinitMleData in TXT heap (which is DMA protected)
655*4882a593Smuzhiyun 	 */
656*4882a593Smuzhiyun 	dmar_tbl = tboot_get_dmar_table(dmar_tbl);
657*4882a593Smuzhiyun 
658*4882a593Smuzhiyun 	dmar = (struct acpi_table_dmar *)dmar_tbl;
659*4882a593Smuzhiyun 	if (!dmar)
660*4882a593Smuzhiyun 		return -ENODEV;
661*4882a593Smuzhiyun 
662*4882a593Smuzhiyun 	if (dmar->width < PAGE_SHIFT - 1) {
663*4882a593Smuzhiyun 		pr_warn("Invalid DMAR haw\n");
664*4882a593Smuzhiyun 		return -EINVAL;
665*4882a593Smuzhiyun 	}
666*4882a593Smuzhiyun 
667*4882a593Smuzhiyun 	pr_info("Host address width %d\n", dmar->width + 1);
668*4882a593Smuzhiyun 	ret = dmar_walk_dmar_table(dmar, &cb);
669*4882a593Smuzhiyun 	if (ret == 0 && drhd_count == 0)
670*4882a593Smuzhiyun 		pr_warn(FW_BUG "No DRHD structure found in DMAR table\n");
671*4882a593Smuzhiyun 
672*4882a593Smuzhiyun 	return ret;
673*4882a593Smuzhiyun }
674*4882a593Smuzhiyun 
dmar_pci_device_match(struct dmar_dev_scope devices[],int cnt,struct pci_dev * dev)675*4882a593Smuzhiyun static int dmar_pci_device_match(struct dmar_dev_scope devices[],
676*4882a593Smuzhiyun 				 int cnt, struct pci_dev *dev)
677*4882a593Smuzhiyun {
678*4882a593Smuzhiyun 	int index;
679*4882a593Smuzhiyun 	struct device *tmp;
680*4882a593Smuzhiyun 
681*4882a593Smuzhiyun 	while (dev) {
682*4882a593Smuzhiyun 		for_each_active_dev_scope(devices, cnt, index, tmp)
683*4882a593Smuzhiyun 			if (dev_is_pci(tmp) && dev == to_pci_dev(tmp))
684*4882a593Smuzhiyun 				return 1;
685*4882a593Smuzhiyun 
686*4882a593Smuzhiyun 		/* Check our parent */
687*4882a593Smuzhiyun 		dev = dev->bus->self;
688*4882a593Smuzhiyun 	}
689*4882a593Smuzhiyun 
690*4882a593Smuzhiyun 	return 0;
691*4882a593Smuzhiyun }
692*4882a593Smuzhiyun 
693*4882a593Smuzhiyun struct dmar_drhd_unit *
dmar_find_matched_drhd_unit(struct pci_dev * dev)694*4882a593Smuzhiyun dmar_find_matched_drhd_unit(struct pci_dev *dev)
695*4882a593Smuzhiyun {
696*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
697*4882a593Smuzhiyun 	struct acpi_dmar_hardware_unit *drhd;
698*4882a593Smuzhiyun 
699*4882a593Smuzhiyun 	dev = pci_physfn(dev);
700*4882a593Smuzhiyun 
701*4882a593Smuzhiyun 	rcu_read_lock();
702*4882a593Smuzhiyun 	for_each_drhd_unit(dmaru) {
703*4882a593Smuzhiyun 		drhd = container_of(dmaru->hdr,
704*4882a593Smuzhiyun 				    struct acpi_dmar_hardware_unit,
705*4882a593Smuzhiyun 				    header);
706*4882a593Smuzhiyun 
707*4882a593Smuzhiyun 		if (dmaru->include_all &&
708*4882a593Smuzhiyun 		    drhd->segment == pci_domain_nr(dev->bus))
709*4882a593Smuzhiyun 			goto out;
710*4882a593Smuzhiyun 
711*4882a593Smuzhiyun 		if (dmar_pci_device_match(dmaru->devices,
712*4882a593Smuzhiyun 					  dmaru->devices_cnt, dev))
713*4882a593Smuzhiyun 			goto out;
714*4882a593Smuzhiyun 	}
715*4882a593Smuzhiyun 	dmaru = NULL;
716*4882a593Smuzhiyun out:
717*4882a593Smuzhiyun 	rcu_read_unlock();
718*4882a593Smuzhiyun 
719*4882a593Smuzhiyun 	return dmaru;
720*4882a593Smuzhiyun }
721*4882a593Smuzhiyun 
dmar_acpi_insert_dev_scope(u8 device_number,struct acpi_device * adev)722*4882a593Smuzhiyun static void __init dmar_acpi_insert_dev_scope(u8 device_number,
723*4882a593Smuzhiyun 					      struct acpi_device *adev)
724*4882a593Smuzhiyun {
725*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
726*4882a593Smuzhiyun 	struct acpi_dmar_hardware_unit *drhd;
727*4882a593Smuzhiyun 	struct acpi_dmar_device_scope *scope;
728*4882a593Smuzhiyun 	struct device *tmp;
729*4882a593Smuzhiyun 	int i;
730*4882a593Smuzhiyun 	struct acpi_dmar_pci_path *path;
731*4882a593Smuzhiyun 
732*4882a593Smuzhiyun 	for_each_drhd_unit(dmaru) {
733*4882a593Smuzhiyun 		drhd = container_of(dmaru->hdr,
734*4882a593Smuzhiyun 				    struct acpi_dmar_hardware_unit,
735*4882a593Smuzhiyun 				    header);
736*4882a593Smuzhiyun 
737*4882a593Smuzhiyun 		for (scope = (void *)(drhd + 1);
738*4882a593Smuzhiyun 		     (unsigned long)scope < ((unsigned long)drhd) + drhd->header.length;
739*4882a593Smuzhiyun 		     scope = ((void *)scope) + scope->length) {
740*4882a593Smuzhiyun 			if (scope->entry_type != ACPI_DMAR_SCOPE_TYPE_NAMESPACE)
741*4882a593Smuzhiyun 				continue;
742*4882a593Smuzhiyun 			if (scope->enumeration_id != device_number)
743*4882a593Smuzhiyun 				continue;
744*4882a593Smuzhiyun 
745*4882a593Smuzhiyun 			path = (void *)(scope + 1);
746*4882a593Smuzhiyun 			pr_info("ACPI device \"%s\" under DMAR at %llx as %02x:%02x.%d\n",
747*4882a593Smuzhiyun 				dev_name(&adev->dev), dmaru->reg_base_addr,
748*4882a593Smuzhiyun 				scope->bus, path->device, path->function);
749*4882a593Smuzhiyun 			for_each_dev_scope(dmaru->devices, dmaru->devices_cnt, i, tmp)
750*4882a593Smuzhiyun 				if (tmp == NULL) {
751*4882a593Smuzhiyun 					dmaru->devices[i].bus = scope->bus;
752*4882a593Smuzhiyun 					dmaru->devices[i].devfn = PCI_DEVFN(path->device,
753*4882a593Smuzhiyun 									    path->function);
754*4882a593Smuzhiyun 					rcu_assign_pointer(dmaru->devices[i].dev,
755*4882a593Smuzhiyun 							   get_device(&adev->dev));
756*4882a593Smuzhiyun 					return;
757*4882a593Smuzhiyun 				}
758*4882a593Smuzhiyun 			BUG_ON(i >= dmaru->devices_cnt);
759*4882a593Smuzhiyun 		}
760*4882a593Smuzhiyun 	}
761*4882a593Smuzhiyun 	pr_warn("No IOMMU scope found for ANDD enumeration ID %d (%s)\n",
762*4882a593Smuzhiyun 		device_number, dev_name(&adev->dev));
763*4882a593Smuzhiyun }
764*4882a593Smuzhiyun 
dmar_acpi_dev_scope_init(void)765*4882a593Smuzhiyun static int __init dmar_acpi_dev_scope_init(void)
766*4882a593Smuzhiyun {
767*4882a593Smuzhiyun 	struct acpi_dmar_andd *andd;
768*4882a593Smuzhiyun 
769*4882a593Smuzhiyun 	if (dmar_tbl == NULL)
770*4882a593Smuzhiyun 		return -ENODEV;
771*4882a593Smuzhiyun 
772*4882a593Smuzhiyun 	for (andd = (void *)dmar_tbl + sizeof(struct acpi_table_dmar);
773*4882a593Smuzhiyun 	     ((unsigned long)andd) < ((unsigned long)dmar_tbl) + dmar_tbl->length;
774*4882a593Smuzhiyun 	     andd = ((void *)andd) + andd->header.length) {
775*4882a593Smuzhiyun 		if (andd->header.type == ACPI_DMAR_TYPE_NAMESPACE) {
776*4882a593Smuzhiyun 			acpi_handle h;
777*4882a593Smuzhiyun 			struct acpi_device *adev;
778*4882a593Smuzhiyun 
779*4882a593Smuzhiyun 			if (!ACPI_SUCCESS(acpi_get_handle(ACPI_ROOT_OBJECT,
780*4882a593Smuzhiyun 							  andd->device_name,
781*4882a593Smuzhiyun 							  &h))) {
782*4882a593Smuzhiyun 				pr_err("Failed to find handle for ACPI object %s\n",
783*4882a593Smuzhiyun 				       andd->device_name);
784*4882a593Smuzhiyun 				continue;
785*4882a593Smuzhiyun 			}
786*4882a593Smuzhiyun 			if (acpi_bus_get_device(h, &adev)) {
787*4882a593Smuzhiyun 				pr_err("Failed to get device for ACPI object %s\n",
788*4882a593Smuzhiyun 				       andd->device_name);
789*4882a593Smuzhiyun 				continue;
790*4882a593Smuzhiyun 			}
791*4882a593Smuzhiyun 			dmar_acpi_insert_dev_scope(andd->device_number, adev);
792*4882a593Smuzhiyun 		}
793*4882a593Smuzhiyun 	}
794*4882a593Smuzhiyun 	return 0;
795*4882a593Smuzhiyun }
796*4882a593Smuzhiyun 
dmar_dev_scope_init(void)797*4882a593Smuzhiyun int __init dmar_dev_scope_init(void)
798*4882a593Smuzhiyun {
799*4882a593Smuzhiyun 	struct pci_dev *dev = NULL;
800*4882a593Smuzhiyun 	struct dmar_pci_notify_info *info;
801*4882a593Smuzhiyun 
802*4882a593Smuzhiyun 	if (dmar_dev_scope_status != 1)
803*4882a593Smuzhiyun 		return dmar_dev_scope_status;
804*4882a593Smuzhiyun 
805*4882a593Smuzhiyun 	if (list_empty(&dmar_drhd_units)) {
806*4882a593Smuzhiyun 		dmar_dev_scope_status = -ENODEV;
807*4882a593Smuzhiyun 	} else {
808*4882a593Smuzhiyun 		dmar_dev_scope_status = 0;
809*4882a593Smuzhiyun 
810*4882a593Smuzhiyun 		dmar_acpi_dev_scope_init();
811*4882a593Smuzhiyun 
812*4882a593Smuzhiyun 		for_each_pci_dev(dev) {
813*4882a593Smuzhiyun 			if (dev->is_virtfn)
814*4882a593Smuzhiyun 				continue;
815*4882a593Smuzhiyun 
816*4882a593Smuzhiyun 			info = dmar_alloc_pci_notify_info(dev,
817*4882a593Smuzhiyun 					BUS_NOTIFY_ADD_DEVICE);
818*4882a593Smuzhiyun 			if (!info) {
819*4882a593Smuzhiyun 				pci_dev_put(dev);
820*4882a593Smuzhiyun 				return dmar_dev_scope_status;
821*4882a593Smuzhiyun 			} else {
822*4882a593Smuzhiyun 				dmar_pci_bus_add_dev(info);
823*4882a593Smuzhiyun 				dmar_free_pci_notify_info(info);
824*4882a593Smuzhiyun 			}
825*4882a593Smuzhiyun 		}
826*4882a593Smuzhiyun 	}
827*4882a593Smuzhiyun 
828*4882a593Smuzhiyun 	return dmar_dev_scope_status;
829*4882a593Smuzhiyun }
830*4882a593Smuzhiyun 
dmar_register_bus_notifier(void)831*4882a593Smuzhiyun void __init dmar_register_bus_notifier(void)
832*4882a593Smuzhiyun {
833*4882a593Smuzhiyun 	bus_register_notifier(&pci_bus_type, &dmar_pci_bus_nb);
834*4882a593Smuzhiyun }
835*4882a593Smuzhiyun 
836*4882a593Smuzhiyun 
dmar_table_init(void)837*4882a593Smuzhiyun int __init dmar_table_init(void)
838*4882a593Smuzhiyun {
839*4882a593Smuzhiyun 	static int dmar_table_initialized;
840*4882a593Smuzhiyun 	int ret;
841*4882a593Smuzhiyun 
842*4882a593Smuzhiyun 	if (dmar_table_initialized == 0) {
843*4882a593Smuzhiyun 		ret = parse_dmar_table();
844*4882a593Smuzhiyun 		if (ret < 0) {
845*4882a593Smuzhiyun 			if (ret != -ENODEV)
846*4882a593Smuzhiyun 				pr_info("Parse DMAR table failure.\n");
847*4882a593Smuzhiyun 		} else  if (list_empty(&dmar_drhd_units)) {
848*4882a593Smuzhiyun 			pr_info("No DMAR devices found\n");
849*4882a593Smuzhiyun 			ret = -ENODEV;
850*4882a593Smuzhiyun 		}
851*4882a593Smuzhiyun 
852*4882a593Smuzhiyun 		if (ret < 0)
853*4882a593Smuzhiyun 			dmar_table_initialized = ret;
854*4882a593Smuzhiyun 		else
855*4882a593Smuzhiyun 			dmar_table_initialized = 1;
856*4882a593Smuzhiyun 	}
857*4882a593Smuzhiyun 
858*4882a593Smuzhiyun 	return dmar_table_initialized < 0 ? dmar_table_initialized : 0;
859*4882a593Smuzhiyun }
860*4882a593Smuzhiyun 
warn_invalid_dmar(u64 addr,const char * message)861*4882a593Smuzhiyun static void warn_invalid_dmar(u64 addr, const char *message)
862*4882a593Smuzhiyun {
863*4882a593Smuzhiyun 	pr_warn_once(FW_BUG
864*4882a593Smuzhiyun 		"Your BIOS is broken; DMAR reported at address %llx%s!\n"
865*4882a593Smuzhiyun 		"BIOS vendor: %s; Ver: %s; Product Version: %s\n",
866*4882a593Smuzhiyun 		addr, message,
867*4882a593Smuzhiyun 		dmi_get_system_info(DMI_BIOS_VENDOR),
868*4882a593Smuzhiyun 		dmi_get_system_info(DMI_BIOS_VERSION),
869*4882a593Smuzhiyun 		dmi_get_system_info(DMI_PRODUCT_VERSION));
870*4882a593Smuzhiyun 	add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK);
871*4882a593Smuzhiyun }
872*4882a593Smuzhiyun 
873*4882a593Smuzhiyun static int __ref
dmar_validate_one_drhd(struct acpi_dmar_header * entry,void * arg)874*4882a593Smuzhiyun dmar_validate_one_drhd(struct acpi_dmar_header *entry, void *arg)
875*4882a593Smuzhiyun {
876*4882a593Smuzhiyun 	struct acpi_dmar_hardware_unit *drhd;
877*4882a593Smuzhiyun 	void __iomem *addr;
878*4882a593Smuzhiyun 	u64 cap, ecap;
879*4882a593Smuzhiyun 
880*4882a593Smuzhiyun 	drhd = (void *)entry;
881*4882a593Smuzhiyun 	if (!drhd->address) {
882*4882a593Smuzhiyun 		warn_invalid_dmar(0, "");
883*4882a593Smuzhiyun 		return -EINVAL;
884*4882a593Smuzhiyun 	}
885*4882a593Smuzhiyun 
886*4882a593Smuzhiyun 	if (arg)
887*4882a593Smuzhiyun 		addr = ioremap(drhd->address, VTD_PAGE_SIZE);
888*4882a593Smuzhiyun 	else
889*4882a593Smuzhiyun 		addr = early_ioremap(drhd->address, VTD_PAGE_SIZE);
890*4882a593Smuzhiyun 	if (!addr) {
891*4882a593Smuzhiyun 		pr_warn("Can't validate DRHD address: %llx\n", drhd->address);
892*4882a593Smuzhiyun 		return -EINVAL;
893*4882a593Smuzhiyun 	}
894*4882a593Smuzhiyun 
895*4882a593Smuzhiyun 	cap = dmar_readq(addr + DMAR_CAP_REG);
896*4882a593Smuzhiyun 	ecap = dmar_readq(addr + DMAR_ECAP_REG);
897*4882a593Smuzhiyun 
898*4882a593Smuzhiyun 	if (arg)
899*4882a593Smuzhiyun 		iounmap(addr);
900*4882a593Smuzhiyun 	else
901*4882a593Smuzhiyun 		early_iounmap(addr, VTD_PAGE_SIZE);
902*4882a593Smuzhiyun 
903*4882a593Smuzhiyun 	if (cap == (uint64_t)-1 && ecap == (uint64_t)-1) {
904*4882a593Smuzhiyun 		warn_invalid_dmar(drhd->address, " returns all ones");
905*4882a593Smuzhiyun 		return -EINVAL;
906*4882a593Smuzhiyun 	}
907*4882a593Smuzhiyun 
908*4882a593Smuzhiyun 	return 0;
909*4882a593Smuzhiyun }
910*4882a593Smuzhiyun 
detect_intel_iommu(void)911*4882a593Smuzhiyun int __init detect_intel_iommu(void)
912*4882a593Smuzhiyun {
913*4882a593Smuzhiyun 	int ret;
914*4882a593Smuzhiyun 	struct dmar_res_callback validate_drhd_cb = {
915*4882a593Smuzhiyun 		.cb[ACPI_DMAR_TYPE_HARDWARE_UNIT] = &dmar_validate_one_drhd,
916*4882a593Smuzhiyun 		.ignore_unhandled = true,
917*4882a593Smuzhiyun 	};
918*4882a593Smuzhiyun 
919*4882a593Smuzhiyun 	down_write(&dmar_global_lock);
920*4882a593Smuzhiyun 	ret = dmar_table_detect();
921*4882a593Smuzhiyun 	if (!ret)
922*4882a593Smuzhiyun 		ret = dmar_walk_dmar_table((struct acpi_table_dmar *)dmar_tbl,
923*4882a593Smuzhiyun 					   &validate_drhd_cb);
924*4882a593Smuzhiyun 	if (!ret && !no_iommu && !iommu_detected &&
925*4882a593Smuzhiyun 	    (!dmar_disabled || dmar_platform_optin())) {
926*4882a593Smuzhiyun 		iommu_detected = 1;
927*4882a593Smuzhiyun 		/* Make sure ACS will be enabled */
928*4882a593Smuzhiyun 		pci_request_acs();
929*4882a593Smuzhiyun 	}
930*4882a593Smuzhiyun 
931*4882a593Smuzhiyun #ifdef CONFIG_X86
932*4882a593Smuzhiyun 	if (!ret) {
933*4882a593Smuzhiyun 		x86_init.iommu.iommu_init = intel_iommu_init;
934*4882a593Smuzhiyun 		x86_platform.iommu_shutdown = intel_iommu_shutdown;
935*4882a593Smuzhiyun 	}
936*4882a593Smuzhiyun 
937*4882a593Smuzhiyun #endif
938*4882a593Smuzhiyun 
939*4882a593Smuzhiyun 	if (dmar_tbl) {
940*4882a593Smuzhiyun 		acpi_put_table(dmar_tbl);
941*4882a593Smuzhiyun 		dmar_tbl = NULL;
942*4882a593Smuzhiyun 	}
943*4882a593Smuzhiyun 	up_write(&dmar_global_lock);
944*4882a593Smuzhiyun 
945*4882a593Smuzhiyun 	return ret ? ret : 1;
946*4882a593Smuzhiyun }
947*4882a593Smuzhiyun 
unmap_iommu(struct intel_iommu * iommu)948*4882a593Smuzhiyun static void unmap_iommu(struct intel_iommu *iommu)
949*4882a593Smuzhiyun {
950*4882a593Smuzhiyun 	iounmap(iommu->reg);
951*4882a593Smuzhiyun 	release_mem_region(iommu->reg_phys, iommu->reg_size);
952*4882a593Smuzhiyun }
953*4882a593Smuzhiyun 
954*4882a593Smuzhiyun /**
955*4882a593Smuzhiyun  * map_iommu: map the iommu's registers
956*4882a593Smuzhiyun  * @iommu: the iommu to map
957*4882a593Smuzhiyun  * @phys_addr: the physical address of the base resgister
958*4882a593Smuzhiyun  *
959*4882a593Smuzhiyun  * Memory map the iommu's registers.  Start w/ a single page, and
960*4882a593Smuzhiyun  * possibly expand if that turns out to be insufficent.
961*4882a593Smuzhiyun  */
map_iommu(struct intel_iommu * iommu,u64 phys_addr)962*4882a593Smuzhiyun static int map_iommu(struct intel_iommu *iommu, u64 phys_addr)
963*4882a593Smuzhiyun {
964*4882a593Smuzhiyun 	int map_size, err=0;
965*4882a593Smuzhiyun 
966*4882a593Smuzhiyun 	iommu->reg_phys = phys_addr;
967*4882a593Smuzhiyun 	iommu->reg_size = VTD_PAGE_SIZE;
968*4882a593Smuzhiyun 
969*4882a593Smuzhiyun 	if (!request_mem_region(iommu->reg_phys, iommu->reg_size, iommu->name)) {
970*4882a593Smuzhiyun 		pr_err("Can't reserve memory\n");
971*4882a593Smuzhiyun 		err = -EBUSY;
972*4882a593Smuzhiyun 		goto out;
973*4882a593Smuzhiyun 	}
974*4882a593Smuzhiyun 
975*4882a593Smuzhiyun 	iommu->reg = ioremap(iommu->reg_phys, iommu->reg_size);
976*4882a593Smuzhiyun 	if (!iommu->reg) {
977*4882a593Smuzhiyun 		pr_err("Can't map the region\n");
978*4882a593Smuzhiyun 		err = -ENOMEM;
979*4882a593Smuzhiyun 		goto release;
980*4882a593Smuzhiyun 	}
981*4882a593Smuzhiyun 
982*4882a593Smuzhiyun 	iommu->cap = dmar_readq(iommu->reg + DMAR_CAP_REG);
983*4882a593Smuzhiyun 	iommu->ecap = dmar_readq(iommu->reg + DMAR_ECAP_REG);
984*4882a593Smuzhiyun 
985*4882a593Smuzhiyun 	if (iommu->cap == (uint64_t)-1 && iommu->ecap == (uint64_t)-1) {
986*4882a593Smuzhiyun 		err = -EINVAL;
987*4882a593Smuzhiyun 		warn_invalid_dmar(phys_addr, " returns all ones");
988*4882a593Smuzhiyun 		goto unmap;
989*4882a593Smuzhiyun 	}
990*4882a593Smuzhiyun 	if (ecap_vcs(iommu->ecap))
991*4882a593Smuzhiyun 		iommu->vccap = dmar_readq(iommu->reg + DMAR_VCCAP_REG);
992*4882a593Smuzhiyun 
993*4882a593Smuzhiyun 	/* the registers might be more than one page */
994*4882a593Smuzhiyun 	map_size = max_t(int, ecap_max_iotlb_offset(iommu->ecap),
995*4882a593Smuzhiyun 			 cap_max_fault_reg_offset(iommu->cap));
996*4882a593Smuzhiyun 	map_size = VTD_PAGE_ALIGN(map_size);
997*4882a593Smuzhiyun 	if (map_size > iommu->reg_size) {
998*4882a593Smuzhiyun 		iounmap(iommu->reg);
999*4882a593Smuzhiyun 		release_mem_region(iommu->reg_phys, iommu->reg_size);
1000*4882a593Smuzhiyun 		iommu->reg_size = map_size;
1001*4882a593Smuzhiyun 		if (!request_mem_region(iommu->reg_phys, iommu->reg_size,
1002*4882a593Smuzhiyun 					iommu->name)) {
1003*4882a593Smuzhiyun 			pr_err("Can't reserve memory\n");
1004*4882a593Smuzhiyun 			err = -EBUSY;
1005*4882a593Smuzhiyun 			goto out;
1006*4882a593Smuzhiyun 		}
1007*4882a593Smuzhiyun 		iommu->reg = ioremap(iommu->reg_phys, iommu->reg_size);
1008*4882a593Smuzhiyun 		if (!iommu->reg) {
1009*4882a593Smuzhiyun 			pr_err("Can't map the region\n");
1010*4882a593Smuzhiyun 			err = -ENOMEM;
1011*4882a593Smuzhiyun 			goto release;
1012*4882a593Smuzhiyun 		}
1013*4882a593Smuzhiyun 	}
1014*4882a593Smuzhiyun 	err = 0;
1015*4882a593Smuzhiyun 	goto out;
1016*4882a593Smuzhiyun 
1017*4882a593Smuzhiyun unmap:
1018*4882a593Smuzhiyun 	iounmap(iommu->reg);
1019*4882a593Smuzhiyun release:
1020*4882a593Smuzhiyun 	release_mem_region(iommu->reg_phys, iommu->reg_size);
1021*4882a593Smuzhiyun out:
1022*4882a593Smuzhiyun 	return err;
1023*4882a593Smuzhiyun }
1024*4882a593Smuzhiyun 
dmar_alloc_seq_id(struct intel_iommu * iommu)1025*4882a593Smuzhiyun static int dmar_alloc_seq_id(struct intel_iommu *iommu)
1026*4882a593Smuzhiyun {
1027*4882a593Smuzhiyun 	iommu->seq_id = find_first_zero_bit(dmar_seq_ids,
1028*4882a593Smuzhiyun 					    DMAR_UNITS_SUPPORTED);
1029*4882a593Smuzhiyun 	if (iommu->seq_id >= DMAR_UNITS_SUPPORTED) {
1030*4882a593Smuzhiyun 		iommu->seq_id = -1;
1031*4882a593Smuzhiyun 	} else {
1032*4882a593Smuzhiyun 		set_bit(iommu->seq_id, dmar_seq_ids);
1033*4882a593Smuzhiyun 		sprintf(iommu->name, "dmar%d", iommu->seq_id);
1034*4882a593Smuzhiyun 	}
1035*4882a593Smuzhiyun 
1036*4882a593Smuzhiyun 	return iommu->seq_id;
1037*4882a593Smuzhiyun }
1038*4882a593Smuzhiyun 
dmar_free_seq_id(struct intel_iommu * iommu)1039*4882a593Smuzhiyun static void dmar_free_seq_id(struct intel_iommu *iommu)
1040*4882a593Smuzhiyun {
1041*4882a593Smuzhiyun 	if (iommu->seq_id >= 0) {
1042*4882a593Smuzhiyun 		clear_bit(iommu->seq_id, dmar_seq_ids);
1043*4882a593Smuzhiyun 		iommu->seq_id = -1;
1044*4882a593Smuzhiyun 	}
1045*4882a593Smuzhiyun }
1046*4882a593Smuzhiyun 
alloc_iommu(struct dmar_drhd_unit * drhd)1047*4882a593Smuzhiyun static int alloc_iommu(struct dmar_drhd_unit *drhd)
1048*4882a593Smuzhiyun {
1049*4882a593Smuzhiyun 	struct intel_iommu *iommu;
1050*4882a593Smuzhiyun 	u32 ver, sts;
1051*4882a593Smuzhiyun 	int agaw = -1;
1052*4882a593Smuzhiyun 	int msagaw = -1;
1053*4882a593Smuzhiyun 	int err;
1054*4882a593Smuzhiyun 
1055*4882a593Smuzhiyun 	if (!drhd->reg_base_addr) {
1056*4882a593Smuzhiyun 		warn_invalid_dmar(0, "");
1057*4882a593Smuzhiyun 		return -EINVAL;
1058*4882a593Smuzhiyun 	}
1059*4882a593Smuzhiyun 
1060*4882a593Smuzhiyun 	iommu = kzalloc(sizeof(*iommu), GFP_KERNEL);
1061*4882a593Smuzhiyun 	if (!iommu)
1062*4882a593Smuzhiyun 		return -ENOMEM;
1063*4882a593Smuzhiyun 
1064*4882a593Smuzhiyun 	if (dmar_alloc_seq_id(iommu) < 0) {
1065*4882a593Smuzhiyun 		pr_err("Failed to allocate seq_id\n");
1066*4882a593Smuzhiyun 		err = -ENOSPC;
1067*4882a593Smuzhiyun 		goto error;
1068*4882a593Smuzhiyun 	}
1069*4882a593Smuzhiyun 
1070*4882a593Smuzhiyun 	err = map_iommu(iommu, drhd->reg_base_addr);
1071*4882a593Smuzhiyun 	if (err) {
1072*4882a593Smuzhiyun 		pr_err("Failed to map %s\n", iommu->name);
1073*4882a593Smuzhiyun 		goto error_free_seq_id;
1074*4882a593Smuzhiyun 	}
1075*4882a593Smuzhiyun 
1076*4882a593Smuzhiyun 	err = -EINVAL;
1077*4882a593Smuzhiyun 	if (cap_sagaw(iommu->cap) == 0) {
1078*4882a593Smuzhiyun 		pr_info("%s: No supported address widths. Not attempting DMA translation.\n",
1079*4882a593Smuzhiyun 			iommu->name);
1080*4882a593Smuzhiyun 		drhd->ignored = 1;
1081*4882a593Smuzhiyun 	}
1082*4882a593Smuzhiyun 
1083*4882a593Smuzhiyun 	if (!drhd->ignored) {
1084*4882a593Smuzhiyun 		agaw = iommu_calculate_agaw(iommu);
1085*4882a593Smuzhiyun 		if (agaw < 0) {
1086*4882a593Smuzhiyun 			pr_err("Cannot get a valid agaw for iommu (seq_id = %d)\n",
1087*4882a593Smuzhiyun 			       iommu->seq_id);
1088*4882a593Smuzhiyun 			drhd->ignored = 1;
1089*4882a593Smuzhiyun 		}
1090*4882a593Smuzhiyun 	}
1091*4882a593Smuzhiyun 	if (!drhd->ignored) {
1092*4882a593Smuzhiyun 		msagaw = iommu_calculate_max_sagaw(iommu);
1093*4882a593Smuzhiyun 		if (msagaw < 0) {
1094*4882a593Smuzhiyun 			pr_err("Cannot get a valid max agaw for iommu (seq_id = %d)\n",
1095*4882a593Smuzhiyun 			       iommu->seq_id);
1096*4882a593Smuzhiyun 			drhd->ignored = 1;
1097*4882a593Smuzhiyun 			agaw = -1;
1098*4882a593Smuzhiyun 		}
1099*4882a593Smuzhiyun 	}
1100*4882a593Smuzhiyun 	iommu->agaw = agaw;
1101*4882a593Smuzhiyun 	iommu->msagaw = msagaw;
1102*4882a593Smuzhiyun 	iommu->segment = drhd->segment;
1103*4882a593Smuzhiyun 
1104*4882a593Smuzhiyun 	iommu->node = NUMA_NO_NODE;
1105*4882a593Smuzhiyun 
1106*4882a593Smuzhiyun 	ver = readl(iommu->reg + DMAR_VER_REG);
1107*4882a593Smuzhiyun 	pr_info("%s: reg_base_addr %llx ver %d:%d cap %llx ecap %llx\n",
1108*4882a593Smuzhiyun 		iommu->name,
1109*4882a593Smuzhiyun 		(unsigned long long)drhd->reg_base_addr,
1110*4882a593Smuzhiyun 		DMAR_VER_MAJOR(ver), DMAR_VER_MINOR(ver),
1111*4882a593Smuzhiyun 		(unsigned long long)iommu->cap,
1112*4882a593Smuzhiyun 		(unsigned long long)iommu->ecap);
1113*4882a593Smuzhiyun 
1114*4882a593Smuzhiyun 	/* Reflect status in gcmd */
1115*4882a593Smuzhiyun 	sts = readl(iommu->reg + DMAR_GSTS_REG);
1116*4882a593Smuzhiyun 	if (sts & DMA_GSTS_IRES)
1117*4882a593Smuzhiyun 		iommu->gcmd |= DMA_GCMD_IRE;
1118*4882a593Smuzhiyun 	if (sts & DMA_GSTS_TES)
1119*4882a593Smuzhiyun 		iommu->gcmd |= DMA_GCMD_TE;
1120*4882a593Smuzhiyun 	if (sts & DMA_GSTS_QIES)
1121*4882a593Smuzhiyun 		iommu->gcmd |= DMA_GCMD_QIE;
1122*4882a593Smuzhiyun 
1123*4882a593Smuzhiyun 	raw_spin_lock_init(&iommu->register_lock);
1124*4882a593Smuzhiyun 
1125*4882a593Smuzhiyun 	/*
1126*4882a593Smuzhiyun 	 * This is only for hotplug; at boot time intel_iommu_enabled won't
1127*4882a593Smuzhiyun 	 * be set yet. When intel_iommu_init() runs, it registers the units
1128*4882a593Smuzhiyun 	 * present at boot time, then sets intel_iommu_enabled.
1129*4882a593Smuzhiyun 	 */
1130*4882a593Smuzhiyun 	if (intel_iommu_enabled && !drhd->ignored) {
1131*4882a593Smuzhiyun 		err = iommu_device_sysfs_add(&iommu->iommu, NULL,
1132*4882a593Smuzhiyun 					     intel_iommu_groups,
1133*4882a593Smuzhiyun 					     "%s", iommu->name);
1134*4882a593Smuzhiyun 		if (err)
1135*4882a593Smuzhiyun 			goto err_unmap;
1136*4882a593Smuzhiyun 
1137*4882a593Smuzhiyun 		iommu_device_set_ops(&iommu->iommu, &intel_iommu_ops);
1138*4882a593Smuzhiyun 
1139*4882a593Smuzhiyun 		err = iommu_device_register(&iommu->iommu);
1140*4882a593Smuzhiyun 		if (err)
1141*4882a593Smuzhiyun 			goto err_sysfs;
1142*4882a593Smuzhiyun 	}
1143*4882a593Smuzhiyun 
1144*4882a593Smuzhiyun 	drhd->iommu = iommu;
1145*4882a593Smuzhiyun 	iommu->drhd = drhd;
1146*4882a593Smuzhiyun 
1147*4882a593Smuzhiyun 	return 0;
1148*4882a593Smuzhiyun 
1149*4882a593Smuzhiyun err_sysfs:
1150*4882a593Smuzhiyun 	iommu_device_sysfs_remove(&iommu->iommu);
1151*4882a593Smuzhiyun err_unmap:
1152*4882a593Smuzhiyun 	unmap_iommu(iommu);
1153*4882a593Smuzhiyun error_free_seq_id:
1154*4882a593Smuzhiyun 	dmar_free_seq_id(iommu);
1155*4882a593Smuzhiyun error:
1156*4882a593Smuzhiyun 	kfree(iommu);
1157*4882a593Smuzhiyun 	return err;
1158*4882a593Smuzhiyun }
1159*4882a593Smuzhiyun 
free_iommu(struct intel_iommu * iommu)1160*4882a593Smuzhiyun static void free_iommu(struct intel_iommu *iommu)
1161*4882a593Smuzhiyun {
1162*4882a593Smuzhiyun 	if (intel_iommu_enabled && !iommu->drhd->ignored) {
1163*4882a593Smuzhiyun 		iommu_device_unregister(&iommu->iommu);
1164*4882a593Smuzhiyun 		iommu_device_sysfs_remove(&iommu->iommu);
1165*4882a593Smuzhiyun 	}
1166*4882a593Smuzhiyun 
1167*4882a593Smuzhiyun 	if (iommu->irq) {
1168*4882a593Smuzhiyun 		if (iommu->pr_irq) {
1169*4882a593Smuzhiyun 			free_irq(iommu->pr_irq, iommu);
1170*4882a593Smuzhiyun 			dmar_free_hwirq(iommu->pr_irq);
1171*4882a593Smuzhiyun 			iommu->pr_irq = 0;
1172*4882a593Smuzhiyun 		}
1173*4882a593Smuzhiyun 		free_irq(iommu->irq, iommu);
1174*4882a593Smuzhiyun 		dmar_free_hwirq(iommu->irq);
1175*4882a593Smuzhiyun 		iommu->irq = 0;
1176*4882a593Smuzhiyun 	}
1177*4882a593Smuzhiyun 
1178*4882a593Smuzhiyun 	if (iommu->qi) {
1179*4882a593Smuzhiyun 		free_page((unsigned long)iommu->qi->desc);
1180*4882a593Smuzhiyun 		kfree(iommu->qi->desc_status);
1181*4882a593Smuzhiyun 		kfree(iommu->qi);
1182*4882a593Smuzhiyun 	}
1183*4882a593Smuzhiyun 
1184*4882a593Smuzhiyun 	if (iommu->reg)
1185*4882a593Smuzhiyun 		unmap_iommu(iommu);
1186*4882a593Smuzhiyun 
1187*4882a593Smuzhiyun 	dmar_free_seq_id(iommu);
1188*4882a593Smuzhiyun 	kfree(iommu);
1189*4882a593Smuzhiyun }
1190*4882a593Smuzhiyun 
1191*4882a593Smuzhiyun /*
1192*4882a593Smuzhiyun  * Reclaim all the submitted descriptors which have completed its work.
1193*4882a593Smuzhiyun  */
reclaim_free_desc(struct q_inval * qi)1194*4882a593Smuzhiyun static inline void reclaim_free_desc(struct q_inval *qi)
1195*4882a593Smuzhiyun {
1196*4882a593Smuzhiyun 	while (qi->desc_status[qi->free_tail] == QI_DONE ||
1197*4882a593Smuzhiyun 	       qi->desc_status[qi->free_tail] == QI_ABORT) {
1198*4882a593Smuzhiyun 		qi->desc_status[qi->free_tail] = QI_FREE;
1199*4882a593Smuzhiyun 		qi->free_tail = (qi->free_tail + 1) % QI_LENGTH;
1200*4882a593Smuzhiyun 		qi->free_cnt++;
1201*4882a593Smuzhiyun 	}
1202*4882a593Smuzhiyun }
1203*4882a593Smuzhiyun 
qi_check_fault(struct intel_iommu * iommu,int index,int wait_index)1204*4882a593Smuzhiyun static int qi_check_fault(struct intel_iommu *iommu, int index, int wait_index)
1205*4882a593Smuzhiyun {
1206*4882a593Smuzhiyun 	u32 fault;
1207*4882a593Smuzhiyun 	int head, tail;
1208*4882a593Smuzhiyun 	struct q_inval *qi = iommu->qi;
1209*4882a593Smuzhiyun 	int shift = qi_shift(iommu);
1210*4882a593Smuzhiyun 
1211*4882a593Smuzhiyun 	if (qi->desc_status[wait_index] == QI_ABORT)
1212*4882a593Smuzhiyun 		return -EAGAIN;
1213*4882a593Smuzhiyun 
1214*4882a593Smuzhiyun 	fault = readl(iommu->reg + DMAR_FSTS_REG);
1215*4882a593Smuzhiyun 
1216*4882a593Smuzhiyun 	/*
1217*4882a593Smuzhiyun 	 * If IQE happens, the head points to the descriptor associated
1218*4882a593Smuzhiyun 	 * with the error. No new descriptors are fetched until the IQE
1219*4882a593Smuzhiyun 	 * is cleared.
1220*4882a593Smuzhiyun 	 */
1221*4882a593Smuzhiyun 	if (fault & DMA_FSTS_IQE) {
1222*4882a593Smuzhiyun 		head = readl(iommu->reg + DMAR_IQH_REG);
1223*4882a593Smuzhiyun 		if ((head >> shift) == index) {
1224*4882a593Smuzhiyun 			struct qi_desc *desc = qi->desc + head;
1225*4882a593Smuzhiyun 
1226*4882a593Smuzhiyun 			/*
1227*4882a593Smuzhiyun 			 * desc->qw2 and desc->qw3 are either reserved or
1228*4882a593Smuzhiyun 			 * used by software as private data. We won't print
1229*4882a593Smuzhiyun 			 * out these two qw's for security consideration.
1230*4882a593Smuzhiyun 			 */
1231*4882a593Smuzhiyun 			pr_err("VT-d detected invalid descriptor: qw0 = %llx, qw1 = %llx\n",
1232*4882a593Smuzhiyun 			       (unsigned long long)desc->qw0,
1233*4882a593Smuzhiyun 			       (unsigned long long)desc->qw1);
1234*4882a593Smuzhiyun 			memcpy(desc, qi->desc + (wait_index << shift),
1235*4882a593Smuzhiyun 			       1 << shift);
1236*4882a593Smuzhiyun 			writel(DMA_FSTS_IQE, iommu->reg + DMAR_FSTS_REG);
1237*4882a593Smuzhiyun 			return -EINVAL;
1238*4882a593Smuzhiyun 		}
1239*4882a593Smuzhiyun 	}
1240*4882a593Smuzhiyun 
1241*4882a593Smuzhiyun 	/*
1242*4882a593Smuzhiyun 	 * If ITE happens, all pending wait_desc commands are aborted.
1243*4882a593Smuzhiyun 	 * No new descriptors are fetched until the ITE is cleared.
1244*4882a593Smuzhiyun 	 */
1245*4882a593Smuzhiyun 	if (fault & DMA_FSTS_ITE) {
1246*4882a593Smuzhiyun 		head = readl(iommu->reg + DMAR_IQH_REG);
1247*4882a593Smuzhiyun 		head = ((head >> shift) - 1 + QI_LENGTH) % QI_LENGTH;
1248*4882a593Smuzhiyun 		head |= 1;
1249*4882a593Smuzhiyun 		tail = readl(iommu->reg + DMAR_IQT_REG);
1250*4882a593Smuzhiyun 		tail = ((tail >> shift) - 1 + QI_LENGTH) % QI_LENGTH;
1251*4882a593Smuzhiyun 
1252*4882a593Smuzhiyun 		writel(DMA_FSTS_ITE, iommu->reg + DMAR_FSTS_REG);
1253*4882a593Smuzhiyun 
1254*4882a593Smuzhiyun 		do {
1255*4882a593Smuzhiyun 			if (qi->desc_status[head] == QI_IN_USE)
1256*4882a593Smuzhiyun 				qi->desc_status[head] = QI_ABORT;
1257*4882a593Smuzhiyun 			head = (head - 2 + QI_LENGTH) % QI_LENGTH;
1258*4882a593Smuzhiyun 		} while (head != tail);
1259*4882a593Smuzhiyun 
1260*4882a593Smuzhiyun 		if (qi->desc_status[wait_index] == QI_ABORT)
1261*4882a593Smuzhiyun 			return -EAGAIN;
1262*4882a593Smuzhiyun 	}
1263*4882a593Smuzhiyun 
1264*4882a593Smuzhiyun 	if (fault & DMA_FSTS_ICE)
1265*4882a593Smuzhiyun 		writel(DMA_FSTS_ICE, iommu->reg + DMAR_FSTS_REG);
1266*4882a593Smuzhiyun 
1267*4882a593Smuzhiyun 	return 0;
1268*4882a593Smuzhiyun }
1269*4882a593Smuzhiyun 
1270*4882a593Smuzhiyun /*
1271*4882a593Smuzhiyun  * Function to submit invalidation descriptors of all types to the queued
1272*4882a593Smuzhiyun  * invalidation interface(QI). Multiple descriptors can be submitted at a
1273*4882a593Smuzhiyun  * time, a wait descriptor will be appended to each submission to ensure
1274*4882a593Smuzhiyun  * hardware has completed the invalidation before return. Wait descriptors
1275*4882a593Smuzhiyun  * can be part of the submission but it will not be polled for completion.
1276*4882a593Smuzhiyun  */
qi_submit_sync(struct intel_iommu * iommu,struct qi_desc * desc,unsigned int count,unsigned long options)1277*4882a593Smuzhiyun int qi_submit_sync(struct intel_iommu *iommu, struct qi_desc *desc,
1278*4882a593Smuzhiyun 		   unsigned int count, unsigned long options)
1279*4882a593Smuzhiyun {
1280*4882a593Smuzhiyun 	struct q_inval *qi = iommu->qi;
1281*4882a593Smuzhiyun 	struct qi_desc wait_desc;
1282*4882a593Smuzhiyun 	int wait_index, index;
1283*4882a593Smuzhiyun 	unsigned long flags;
1284*4882a593Smuzhiyun 	int offset, shift;
1285*4882a593Smuzhiyun 	int rc, i;
1286*4882a593Smuzhiyun 
1287*4882a593Smuzhiyun 	if (!qi)
1288*4882a593Smuzhiyun 		return 0;
1289*4882a593Smuzhiyun 
1290*4882a593Smuzhiyun restart:
1291*4882a593Smuzhiyun 	rc = 0;
1292*4882a593Smuzhiyun 
1293*4882a593Smuzhiyun 	raw_spin_lock_irqsave(&qi->q_lock, flags);
1294*4882a593Smuzhiyun 	/*
1295*4882a593Smuzhiyun 	 * Check if we have enough empty slots in the queue to submit,
1296*4882a593Smuzhiyun 	 * the calculation is based on:
1297*4882a593Smuzhiyun 	 * # of desc + 1 wait desc + 1 space between head and tail
1298*4882a593Smuzhiyun 	 */
1299*4882a593Smuzhiyun 	while (qi->free_cnt < count + 2) {
1300*4882a593Smuzhiyun 		raw_spin_unlock_irqrestore(&qi->q_lock, flags);
1301*4882a593Smuzhiyun 		cpu_relax();
1302*4882a593Smuzhiyun 		raw_spin_lock_irqsave(&qi->q_lock, flags);
1303*4882a593Smuzhiyun 	}
1304*4882a593Smuzhiyun 
1305*4882a593Smuzhiyun 	index = qi->free_head;
1306*4882a593Smuzhiyun 	wait_index = (index + count) % QI_LENGTH;
1307*4882a593Smuzhiyun 	shift = qi_shift(iommu);
1308*4882a593Smuzhiyun 
1309*4882a593Smuzhiyun 	for (i = 0; i < count; i++) {
1310*4882a593Smuzhiyun 		offset = ((index + i) % QI_LENGTH) << shift;
1311*4882a593Smuzhiyun 		memcpy(qi->desc + offset, &desc[i], 1 << shift);
1312*4882a593Smuzhiyun 		qi->desc_status[(index + i) % QI_LENGTH] = QI_IN_USE;
1313*4882a593Smuzhiyun 	}
1314*4882a593Smuzhiyun 	qi->desc_status[wait_index] = QI_IN_USE;
1315*4882a593Smuzhiyun 
1316*4882a593Smuzhiyun 	wait_desc.qw0 = QI_IWD_STATUS_DATA(QI_DONE) |
1317*4882a593Smuzhiyun 			QI_IWD_STATUS_WRITE | QI_IWD_TYPE;
1318*4882a593Smuzhiyun 	if (options & QI_OPT_WAIT_DRAIN)
1319*4882a593Smuzhiyun 		wait_desc.qw0 |= QI_IWD_PRQ_DRAIN;
1320*4882a593Smuzhiyun 	wait_desc.qw1 = virt_to_phys(&qi->desc_status[wait_index]);
1321*4882a593Smuzhiyun 	wait_desc.qw2 = 0;
1322*4882a593Smuzhiyun 	wait_desc.qw3 = 0;
1323*4882a593Smuzhiyun 
1324*4882a593Smuzhiyun 	offset = wait_index << shift;
1325*4882a593Smuzhiyun 	memcpy(qi->desc + offset, &wait_desc, 1 << shift);
1326*4882a593Smuzhiyun 
1327*4882a593Smuzhiyun 	qi->free_head = (qi->free_head + count + 1) % QI_LENGTH;
1328*4882a593Smuzhiyun 	qi->free_cnt -= count + 1;
1329*4882a593Smuzhiyun 
1330*4882a593Smuzhiyun 	/*
1331*4882a593Smuzhiyun 	 * update the HW tail register indicating the presence of
1332*4882a593Smuzhiyun 	 * new descriptors.
1333*4882a593Smuzhiyun 	 */
1334*4882a593Smuzhiyun 	writel(qi->free_head << shift, iommu->reg + DMAR_IQT_REG);
1335*4882a593Smuzhiyun 
1336*4882a593Smuzhiyun 	while (qi->desc_status[wait_index] != QI_DONE) {
1337*4882a593Smuzhiyun 		/*
1338*4882a593Smuzhiyun 		 * We will leave the interrupts disabled, to prevent interrupt
1339*4882a593Smuzhiyun 		 * context to queue another cmd while a cmd is already submitted
1340*4882a593Smuzhiyun 		 * and waiting for completion on this cpu. This is to avoid
1341*4882a593Smuzhiyun 		 * a deadlock where the interrupt context can wait indefinitely
1342*4882a593Smuzhiyun 		 * for free slots in the queue.
1343*4882a593Smuzhiyun 		 */
1344*4882a593Smuzhiyun 		rc = qi_check_fault(iommu, index, wait_index);
1345*4882a593Smuzhiyun 		if (rc)
1346*4882a593Smuzhiyun 			break;
1347*4882a593Smuzhiyun 
1348*4882a593Smuzhiyun 		raw_spin_unlock(&qi->q_lock);
1349*4882a593Smuzhiyun 		cpu_relax();
1350*4882a593Smuzhiyun 		raw_spin_lock(&qi->q_lock);
1351*4882a593Smuzhiyun 	}
1352*4882a593Smuzhiyun 
1353*4882a593Smuzhiyun 	for (i = 0; i < count; i++)
1354*4882a593Smuzhiyun 		qi->desc_status[(index + i) % QI_LENGTH] = QI_DONE;
1355*4882a593Smuzhiyun 
1356*4882a593Smuzhiyun 	reclaim_free_desc(qi);
1357*4882a593Smuzhiyun 	raw_spin_unlock_irqrestore(&qi->q_lock, flags);
1358*4882a593Smuzhiyun 
1359*4882a593Smuzhiyun 	if (rc == -EAGAIN)
1360*4882a593Smuzhiyun 		goto restart;
1361*4882a593Smuzhiyun 
1362*4882a593Smuzhiyun 	return rc;
1363*4882a593Smuzhiyun }
1364*4882a593Smuzhiyun 
1365*4882a593Smuzhiyun /*
1366*4882a593Smuzhiyun  * Flush the global interrupt entry cache.
1367*4882a593Smuzhiyun  */
qi_global_iec(struct intel_iommu * iommu)1368*4882a593Smuzhiyun void qi_global_iec(struct intel_iommu *iommu)
1369*4882a593Smuzhiyun {
1370*4882a593Smuzhiyun 	struct qi_desc desc;
1371*4882a593Smuzhiyun 
1372*4882a593Smuzhiyun 	desc.qw0 = QI_IEC_TYPE;
1373*4882a593Smuzhiyun 	desc.qw1 = 0;
1374*4882a593Smuzhiyun 	desc.qw2 = 0;
1375*4882a593Smuzhiyun 	desc.qw3 = 0;
1376*4882a593Smuzhiyun 
1377*4882a593Smuzhiyun 	/* should never fail */
1378*4882a593Smuzhiyun 	qi_submit_sync(iommu, &desc, 1, 0);
1379*4882a593Smuzhiyun }
1380*4882a593Smuzhiyun 
qi_flush_context(struct intel_iommu * iommu,u16 did,u16 sid,u8 fm,u64 type)1381*4882a593Smuzhiyun void qi_flush_context(struct intel_iommu *iommu, u16 did, u16 sid, u8 fm,
1382*4882a593Smuzhiyun 		      u64 type)
1383*4882a593Smuzhiyun {
1384*4882a593Smuzhiyun 	struct qi_desc desc;
1385*4882a593Smuzhiyun 
1386*4882a593Smuzhiyun 	desc.qw0 = QI_CC_FM(fm) | QI_CC_SID(sid) | QI_CC_DID(did)
1387*4882a593Smuzhiyun 			| QI_CC_GRAN(type) | QI_CC_TYPE;
1388*4882a593Smuzhiyun 	desc.qw1 = 0;
1389*4882a593Smuzhiyun 	desc.qw2 = 0;
1390*4882a593Smuzhiyun 	desc.qw3 = 0;
1391*4882a593Smuzhiyun 
1392*4882a593Smuzhiyun 	qi_submit_sync(iommu, &desc, 1, 0);
1393*4882a593Smuzhiyun }
1394*4882a593Smuzhiyun 
qi_flush_iotlb(struct intel_iommu * iommu,u16 did,u64 addr,unsigned int size_order,u64 type)1395*4882a593Smuzhiyun void qi_flush_iotlb(struct intel_iommu *iommu, u16 did, u64 addr,
1396*4882a593Smuzhiyun 		    unsigned int size_order, u64 type)
1397*4882a593Smuzhiyun {
1398*4882a593Smuzhiyun 	u8 dw = 0, dr = 0;
1399*4882a593Smuzhiyun 
1400*4882a593Smuzhiyun 	struct qi_desc desc;
1401*4882a593Smuzhiyun 	int ih = 0;
1402*4882a593Smuzhiyun 
1403*4882a593Smuzhiyun 	if (cap_write_drain(iommu->cap))
1404*4882a593Smuzhiyun 		dw = 1;
1405*4882a593Smuzhiyun 
1406*4882a593Smuzhiyun 	if (cap_read_drain(iommu->cap))
1407*4882a593Smuzhiyun 		dr = 1;
1408*4882a593Smuzhiyun 
1409*4882a593Smuzhiyun 	desc.qw0 = QI_IOTLB_DID(did) | QI_IOTLB_DR(dr) | QI_IOTLB_DW(dw)
1410*4882a593Smuzhiyun 		| QI_IOTLB_GRAN(type) | QI_IOTLB_TYPE;
1411*4882a593Smuzhiyun 	desc.qw1 = QI_IOTLB_ADDR(addr) | QI_IOTLB_IH(ih)
1412*4882a593Smuzhiyun 		| QI_IOTLB_AM(size_order);
1413*4882a593Smuzhiyun 	desc.qw2 = 0;
1414*4882a593Smuzhiyun 	desc.qw3 = 0;
1415*4882a593Smuzhiyun 
1416*4882a593Smuzhiyun 	qi_submit_sync(iommu, &desc, 1, 0);
1417*4882a593Smuzhiyun }
1418*4882a593Smuzhiyun 
qi_flush_dev_iotlb(struct intel_iommu * iommu,u16 sid,u16 pfsid,u16 qdep,u64 addr,unsigned mask)1419*4882a593Smuzhiyun void qi_flush_dev_iotlb(struct intel_iommu *iommu, u16 sid, u16 pfsid,
1420*4882a593Smuzhiyun 			u16 qdep, u64 addr, unsigned mask)
1421*4882a593Smuzhiyun {
1422*4882a593Smuzhiyun 	struct qi_desc desc;
1423*4882a593Smuzhiyun 
1424*4882a593Smuzhiyun 	if (mask) {
1425*4882a593Smuzhiyun 		addr |= (1ULL << (VTD_PAGE_SHIFT + mask - 1)) - 1;
1426*4882a593Smuzhiyun 		desc.qw1 = QI_DEV_IOTLB_ADDR(addr) | QI_DEV_IOTLB_SIZE;
1427*4882a593Smuzhiyun 	} else
1428*4882a593Smuzhiyun 		desc.qw1 = QI_DEV_IOTLB_ADDR(addr);
1429*4882a593Smuzhiyun 
1430*4882a593Smuzhiyun 	if (qdep >= QI_DEV_IOTLB_MAX_INVS)
1431*4882a593Smuzhiyun 		qdep = 0;
1432*4882a593Smuzhiyun 
1433*4882a593Smuzhiyun 	desc.qw0 = QI_DEV_IOTLB_SID(sid) | QI_DEV_IOTLB_QDEP(qdep) |
1434*4882a593Smuzhiyun 		   QI_DIOTLB_TYPE | QI_DEV_IOTLB_PFSID(pfsid);
1435*4882a593Smuzhiyun 	desc.qw2 = 0;
1436*4882a593Smuzhiyun 	desc.qw3 = 0;
1437*4882a593Smuzhiyun 
1438*4882a593Smuzhiyun 	qi_submit_sync(iommu, &desc, 1, 0);
1439*4882a593Smuzhiyun }
1440*4882a593Smuzhiyun 
1441*4882a593Smuzhiyun /* PASID-based IOTLB invalidation */
qi_flush_piotlb(struct intel_iommu * iommu,u16 did,u32 pasid,u64 addr,unsigned long npages,bool ih)1442*4882a593Smuzhiyun void qi_flush_piotlb(struct intel_iommu *iommu, u16 did, u32 pasid, u64 addr,
1443*4882a593Smuzhiyun 		     unsigned long npages, bool ih)
1444*4882a593Smuzhiyun {
1445*4882a593Smuzhiyun 	struct qi_desc desc = {.qw2 = 0, .qw3 = 0};
1446*4882a593Smuzhiyun 
1447*4882a593Smuzhiyun 	/*
1448*4882a593Smuzhiyun 	 * npages == -1 means a PASID-selective invalidation, otherwise,
1449*4882a593Smuzhiyun 	 * a positive value for Page-selective-within-PASID invalidation.
1450*4882a593Smuzhiyun 	 * 0 is not a valid input.
1451*4882a593Smuzhiyun 	 */
1452*4882a593Smuzhiyun 	if (WARN_ON(!npages)) {
1453*4882a593Smuzhiyun 		pr_err("Invalid input npages = %ld\n", npages);
1454*4882a593Smuzhiyun 		return;
1455*4882a593Smuzhiyun 	}
1456*4882a593Smuzhiyun 
1457*4882a593Smuzhiyun 	if (npages == -1) {
1458*4882a593Smuzhiyun 		desc.qw0 = QI_EIOTLB_PASID(pasid) |
1459*4882a593Smuzhiyun 				QI_EIOTLB_DID(did) |
1460*4882a593Smuzhiyun 				QI_EIOTLB_GRAN(QI_GRAN_NONG_PASID) |
1461*4882a593Smuzhiyun 				QI_EIOTLB_TYPE;
1462*4882a593Smuzhiyun 		desc.qw1 = 0;
1463*4882a593Smuzhiyun 	} else {
1464*4882a593Smuzhiyun 		int mask = ilog2(__roundup_pow_of_two(npages));
1465*4882a593Smuzhiyun 		unsigned long align = (1ULL << (VTD_PAGE_SHIFT + mask));
1466*4882a593Smuzhiyun 
1467*4882a593Smuzhiyun 		if (WARN_ON_ONCE(!IS_ALIGNED(addr, align)))
1468*4882a593Smuzhiyun 			addr = ALIGN_DOWN(addr, align);
1469*4882a593Smuzhiyun 
1470*4882a593Smuzhiyun 		desc.qw0 = QI_EIOTLB_PASID(pasid) |
1471*4882a593Smuzhiyun 				QI_EIOTLB_DID(did) |
1472*4882a593Smuzhiyun 				QI_EIOTLB_GRAN(QI_GRAN_PSI_PASID) |
1473*4882a593Smuzhiyun 				QI_EIOTLB_TYPE;
1474*4882a593Smuzhiyun 		desc.qw1 = QI_EIOTLB_ADDR(addr) |
1475*4882a593Smuzhiyun 				QI_EIOTLB_IH(ih) |
1476*4882a593Smuzhiyun 				QI_EIOTLB_AM(mask);
1477*4882a593Smuzhiyun 	}
1478*4882a593Smuzhiyun 
1479*4882a593Smuzhiyun 	qi_submit_sync(iommu, &desc, 1, 0);
1480*4882a593Smuzhiyun }
1481*4882a593Smuzhiyun 
1482*4882a593Smuzhiyun /* PASID-based device IOTLB Invalidate */
qi_flush_dev_iotlb_pasid(struct intel_iommu * iommu,u16 sid,u16 pfsid,u32 pasid,u16 qdep,u64 addr,unsigned int size_order)1483*4882a593Smuzhiyun void qi_flush_dev_iotlb_pasid(struct intel_iommu *iommu, u16 sid, u16 pfsid,
1484*4882a593Smuzhiyun 			      u32 pasid,  u16 qdep, u64 addr, unsigned int size_order)
1485*4882a593Smuzhiyun {
1486*4882a593Smuzhiyun 	unsigned long mask = 1UL << (VTD_PAGE_SHIFT + size_order - 1);
1487*4882a593Smuzhiyun 	struct qi_desc desc = {.qw1 = 0, .qw2 = 0, .qw3 = 0};
1488*4882a593Smuzhiyun 
1489*4882a593Smuzhiyun 	desc.qw0 = QI_DEV_EIOTLB_PASID(pasid) | QI_DEV_EIOTLB_SID(sid) |
1490*4882a593Smuzhiyun 		QI_DEV_EIOTLB_QDEP(qdep) | QI_DEIOTLB_TYPE |
1491*4882a593Smuzhiyun 		QI_DEV_IOTLB_PFSID(pfsid);
1492*4882a593Smuzhiyun 
1493*4882a593Smuzhiyun 	/*
1494*4882a593Smuzhiyun 	 * If S bit is 0, we only flush a single page. If S bit is set,
1495*4882a593Smuzhiyun 	 * The least significant zero bit indicates the invalidation address
1496*4882a593Smuzhiyun 	 * range. VT-d spec 6.5.2.6.
1497*4882a593Smuzhiyun 	 * e.g. address bit 12[0] indicates 8KB, 13[0] indicates 16KB.
1498*4882a593Smuzhiyun 	 * size order = 0 is PAGE_SIZE 4KB
1499*4882a593Smuzhiyun 	 * Max Invs Pending (MIP) is set to 0 for now until we have DIT in
1500*4882a593Smuzhiyun 	 * ECAP.
1501*4882a593Smuzhiyun 	 */
1502*4882a593Smuzhiyun 	if (!IS_ALIGNED(addr, VTD_PAGE_SIZE << size_order))
1503*4882a593Smuzhiyun 		pr_warn_ratelimited("Invalidate non-aligned address %llx, order %d\n",
1504*4882a593Smuzhiyun 				    addr, size_order);
1505*4882a593Smuzhiyun 
1506*4882a593Smuzhiyun 	/* Take page address */
1507*4882a593Smuzhiyun 	desc.qw1 = QI_DEV_EIOTLB_ADDR(addr);
1508*4882a593Smuzhiyun 
1509*4882a593Smuzhiyun 	if (size_order) {
1510*4882a593Smuzhiyun 		/*
1511*4882a593Smuzhiyun 		 * Existing 0s in address below size_order may be the least
1512*4882a593Smuzhiyun 		 * significant bit, we must set them to 1s to avoid having
1513*4882a593Smuzhiyun 		 * smaller size than desired.
1514*4882a593Smuzhiyun 		 */
1515*4882a593Smuzhiyun 		desc.qw1 |= GENMASK_ULL(size_order + VTD_PAGE_SHIFT - 1,
1516*4882a593Smuzhiyun 					VTD_PAGE_SHIFT);
1517*4882a593Smuzhiyun 		/* Clear size_order bit to indicate size */
1518*4882a593Smuzhiyun 		desc.qw1 &= ~mask;
1519*4882a593Smuzhiyun 		/* Set the S bit to indicate flushing more than 1 page */
1520*4882a593Smuzhiyun 		desc.qw1 |= QI_DEV_EIOTLB_SIZE;
1521*4882a593Smuzhiyun 	}
1522*4882a593Smuzhiyun 
1523*4882a593Smuzhiyun 	qi_submit_sync(iommu, &desc, 1, 0);
1524*4882a593Smuzhiyun }
1525*4882a593Smuzhiyun 
qi_flush_pasid_cache(struct intel_iommu * iommu,u16 did,u64 granu,u32 pasid)1526*4882a593Smuzhiyun void qi_flush_pasid_cache(struct intel_iommu *iommu, u16 did,
1527*4882a593Smuzhiyun 			  u64 granu, u32 pasid)
1528*4882a593Smuzhiyun {
1529*4882a593Smuzhiyun 	struct qi_desc desc = {.qw1 = 0, .qw2 = 0, .qw3 = 0};
1530*4882a593Smuzhiyun 
1531*4882a593Smuzhiyun 	desc.qw0 = QI_PC_PASID(pasid) | QI_PC_DID(did) |
1532*4882a593Smuzhiyun 			QI_PC_GRAN(granu) | QI_PC_TYPE;
1533*4882a593Smuzhiyun 	qi_submit_sync(iommu, &desc, 1, 0);
1534*4882a593Smuzhiyun }
1535*4882a593Smuzhiyun 
1536*4882a593Smuzhiyun /*
1537*4882a593Smuzhiyun  * Disable Queued Invalidation interface.
1538*4882a593Smuzhiyun  */
dmar_disable_qi(struct intel_iommu * iommu)1539*4882a593Smuzhiyun void dmar_disable_qi(struct intel_iommu *iommu)
1540*4882a593Smuzhiyun {
1541*4882a593Smuzhiyun 	unsigned long flags;
1542*4882a593Smuzhiyun 	u32 sts;
1543*4882a593Smuzhiyun 	cycles_t start_time = get_cycles();
1544*4882a593Smuzhiyun 
1545*4882a593Smuzhiyun 	if (!ecap_qis(iommu->ecap))
1546*4882a593Smuzhiyun 		return;
1547*4882a593Smuzhiyun 
1548*4882a593Smuzhiyun 	raw_spin_lock_irqsave(&iommu->register_lock, flags);
1549*4882a593Smuzhiyun 
1550*4882a593Smuzhiyun 	sts =  readl(iommu->reg + DMAR_GSTS_REG);
1551*4882a593Smuzhiyun 	if (!(sts & DMA_GSTS_QIES))
1552*4882a593Smuzhiyun 		goto end;
1553*4882a593Smuzhiyun 
1554*4882a593Smuzhiyun 	/*
1555*4882a593Smuzhiyun 	 * Give a chance to HW to complete the pending invalidation requests.
1556*4882a593Smuzhiyun 	 */
1557*4882a593Smuzhiyun 	while ((readl(iommu->reg + DMAR_IQT_REG) !=
1558*4882a593Smuzhiyun 		readl(iommu->reg + DMAR_IQH_REG)) &&
1559*4882a593Smuzhiyun 		(DMAR_OPERATION_TIMEOUT > (get_cycles() - start_time)))
1560*4882a593Smuzhiyun 		cpu_relax();
1561*4882a593Smuzhiyun 
1562*4882a593Smuzhiyun 	iommu->gcmd &= ~DMA_GCMD_QIE;
1563*4882a593Smuzhiyun 	writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG);
1564*4882a593Smuzhiyun 
1565*4882a593Smuzhiyun 	IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG, readl,
1566*4882a593Smuzhiyun 		      !(sts & DMA_GSTS_QIES), sts);
1567*4882a593Smuzhiyun end:
1568*4882a593Smuzhiyun 	raw_spin_unlock_irqrestore(&iommu->register_lock, flags);
1569*4882a593Smuzhiyun }
1570*4882a593Smuzhiyun 
1571*4882a593Smuzhiyun /*
1572*4882a593Smuzhiyun  * Enable queued invalidation.
1573*4882a593Smuzhiyun  */
__dmar_enable_qi(struct intel_iommu * iommu)1574*4882a593Smuzhiyun static void __dmar_enable_qi(struct intel_iommu *iommu)
1575*4882a593Smuzhiyun {
1576*4882a593Smuzhiyun 	u32 sts;
1577*4882a593Smuzhiyun 	unsigned long flags;
1578*4882a593Smuzhiyun 	struct q_inval *qi = iommu->qi;
1579*4882a593Smuzhiyun 	u64 val = virt_to_phys(qi->desc);
1580*4882a593Smuzhiyun 
1581*4882a593Smuzhiyun 	qi->free_head = qi->free_tail = 0;
1582*4882a593Smuzhiyun 	qi->free_cnt = QI_LENGTH;
1583*4882a593Smuzhiyun 
1584*4882a593Smuzhiyun 	/*
1585*4882a593Smuzhiyun 	 * Set DW=1 and QS=1 in IQA_REG when Scalable Mode capability
1586*4882a593Smuzhiyun 	 * is present.
1587*4882a593Smuzhiyun 	 */
1588*4882a593Smuzhiyun 	if (ecap_smts(iommu->ecap))
1589*4882a593Smuzhiyun 		val |= (1 << 11) | 1;
1590*4882a593Smuzhiyun 
1591*4882a593Smuzhiyun 	raw_spin_lock_irqsave(&iommu->register_lock, flags);
1592*4882a593Smuzhiyun 
1593*4882a593Smuzhiyun 	/* write zero to the tail reg */
1594*4882a593Smuzhiyun 	writel(0, iommu->reg + DMAR_IQT_REG);
1595*4882a593Smuzhiyun 
1596*4882a593Smuzhiyun 	dmar_writeq(iommu->reg + DMAR_IQA_REG, val);
1597*4882a593Smuzhiyun 
1598*4882a593Smuzhiyun 	iommu->gcmd |= DMA_GCMD_QIE;
1599*4882a593Smuzhiyun 	writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG);
1600*4882a593Smuzhiyun 
1601*4882a593Smuzhiyun 	/* Make sure hardware complete it */
1602*4882a593Smuzhiyun 	IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG, readl, (sts & DMA_GSTS_QIES), sts);
1603*4882a593Smuzhiyun 
1604*4882a593Smuzhiyun 	raw_spin_unlock_irqrestore(&iommu->register_lock, flags);
1605*4882a593Smuzhiyun }
1606*4882a593Smuzhiyun 
1607*4882a593Smuzhiyun /*
1608*4882a593Smuzhiyun  * Enable Queued Invalidation interface. This is a must to support
1609*4882a593Smuzhiyun  * interrupt-remapping. Also used by DMA-remapping, which replaces
1610*4882a593Smuzhiyun  * register based IOTLB invalidation.
1611*4882a593Smuzhiyun  */
dmar_enable_qi(struct intel_iommu * iommu)1612*4882a593Smuzhiyun int dmar_enable_qi(struct intel_iommu *iommu)
1613*4882a593Smuzhiyun {
1614*4882a593Smuzhiyun 	struct q_inval *qi;
1615*4882a593Smuzhiyun 	struct page *desc_page;
1616*4882a593Smuzhiyun 
1617*4882a593Smuzhiyun 	if (!ecap_qis(iommu->ecap))
1618*4882a593Smuzhiyun 		return -ENOENT;
1619*4882a593Smuzhiyun 
1620*4882a593Smuzhiyun 	/*
1621*4882a593Smuzhiyun 	 * queued invalidation is already setup and enabled.
1622*4882a593Smuzhiyun 	 */
1623*4882a593Smuzhiyun 	if (iommu->qi)
1624*4882a593Smuzhiyun 		return 0;
1625*4882a593Smuzhiyun 
1626*4882a593Smuzhiyun 	iommu->qi = kmalloc(sizeof(*qi), GFP_ATOMIC);
1627*4882a593Smuzhiyun 	if (!iommu->qi)
1628*4882a593Smuzhiyun 		return -ENOMEM;
1629*4882a593Smuzhiyun 
1630*4882a593Smuzhiyun 	qi = iommu->qi;
1631*4882a593Smuzhiyun 
1632*4882a593Smuzhiyun 	/*
1633*4882a593Smuzhiyun 	 * Need two pages to accommodate 256 descriptors of 256 bits each
1634*4882a593Smuzhiyun 	 * if the remapping hardware supports scalable mode translation.
1635*4882a593Smuzhiyun 	 */
1636*4882a593Smuzhiyun 	desc_page = alloc_pages_node(iommu->node, GFP_ATOMIC | __GFP_ZERO,
1637*4882a593Smuzhiyun 				     !!ecap_smts(iommu->ecap));
1638*4882a593Smuzhiyun 	if (!desc_page) {
1639*4882a593Smuzhiyun 		kfree(qi);
1640*4882a593Smuzhiyun 		iommu->qi = NULL;
1641*4882a593Smuzhiyun 		return -ENOMEM;
1642*4882a593Smuzhiyun 	}
1643*4882a593Smuzhiyun 
1644*4882a593Smuzhiyun 	qi->desc = page_address(desc_page);
1645*4882a593Smuzhiyun 
1646*4882a593Smuzhiyun 	qi->desc_status = kcalloc(QI_LENGTH, sizeof(int), GFP_ATOMIC);
1647*4882a593Smuzhiyun 	if (!qi->desc_status) {
1648*4882a593Smuzhiyun 		free_page((unsigned long) qi->desc);
1649*4882a593Smuzhiyun 		kfree(qi);
1650*4882a593Smuzhiyun 		iommu->qi = NULL;
1651*4882a593Smuzhiyun 		return -ENOMEM;
1652*4882a593Smuzhiyun 	}
1653*4882a593Smuzhiyun 
1654*4882a593Smuzhiyun 	raw_spin_lock_init(&qi->q_lock);
1655*4882a593Smuzhiyun 
1656*4882a593Smuzhiyun 	__dmar_enable_qi(iommu);
1657*4882a593Smuzhiyun 
1658*4882a593Smuzhiyun 	return 0;
1659*4882a593Smuzhiyun }
1660*4882a593Smuzhiyun 
1661*4882a593Smuzhiyun /* iommu interrupt handling. Most stuff are MSI-like. */
1662*4882a593Smuzhiyun 
1663*4882a593Smuzhiyun enum faulttype {
1664*4882a593Smuzhiyun 	DMA_REMAP,
1665*4882a593Smuzhiyun 	INTR_REMAP,
1666*4882a593Smuzhiyun 	UNKNOWN,
1667*4882a593Smuzhiyun };
1668*4882a593Smuzhiyun 
1669*4882a593Smuzhiyun static const char *dma_remap_fault_reasons[] =
1670*4882a593Smuzhiyun {
1671*4882a593Smuzhiyun 	"Software",
1672*4882a593Smuzhiyun 	"Present bit in root entry is clear",
1673*4882a593Smuzhiyun 	"Present bit in context entry is clear",
1674*4882a593Smuzhiyun 	"Invalid context entry",
1675*4882a593Smuzhiyun 	"Access beyond MGAW",
1676*4882a593Smuzhiyun 	"PTE Write access is not set",
1677*4882a593Smuzhiyun 	"PTE Read access is not set",
1678*4882a593Smuzhiyun 	"Next page table ptr is invalid",
1679*4882a593Smuzhiyun 	"Root table address invalid",
1680*4882a593Smuzhiyun 	"Context table ptr is invalid",
1681*4882a593Smuzhiyun 	"non-zero reserved fields in RTP",
1682*4882a593Smuzhiyun 	"non-zero reserved fields in CTP",
1683*4882a593Smuzhiyun 	"non-zero reserved fields in PTE",
1684*4882a593Smuzhiyun 	"PCE for translation request specifies blocking",
1685*4882a593Smuzhiyun };
1686*4882a593Smuzhiyun 
1687*4882a593Smuzhiyun static const char * const dma_remap_sm_fault_reasons[] = {
1688*4882a593Smuzhiyun 	"SM: Invalid Root Table Address",
1689*4882a593Smuzhiyun 	"SM: TTM 0 for request with PASID",
1690*4882a593Smuzhiyun 	"SM: TTM 0 for page group request",
1691*4882a593Smuzhiyun 	"Unknown", "Unknown", "Unknown", "Unknown", "Unknown", /* 0x33-0x37 */
1692*4882a593Smuzhiyun 	"SM: Error attempting to access Root Entry",
1693*4882a593Smuzhiyun 	"SM: Present bit in Root Entry is clear",
1694*4882a593Smuzhiyun 	"SM: Non-zero reserved field set in Root Entry",
1695*4882a593Smuzhiyun 	"Unknown", "Unknown", "Unknown", "Unknown", "Unknown", /* 0x3B-0x3F */
1696*4882a593Smuzhiyun 	"SM: Error attempting to access Context Entry",
1697*4882a593Smuzhiyun 	"SM: Present bit in Context Entry is clear",
1698*4882a593Smuzhiyun 	"SM: Non-zero reserved field set in the Context Entry",
1699*4882a593Smuzhiyun 	"SM: Invalid Context Entry",
1700*4882a593Smuzhiyun 	"SM: DTE field in Context Entry is clear",
1701*4882a593Smuzhiyun 	"SM: PASID Enable field in Context Entry is clear",
1702*4882a593Smuzhiyun 	"SM: PASID is larger than the max in Context Entry",
1703*4882a593Smuzhiyun 	"SM: PRE field in Context-Entry is clear",
1704*4882a593Smuzhiyun 	"SM: RID_PASID field error in Context-Entry",
1705*4882a593Smuzhiyun 	"Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", /* 0x49-0x4F */
1706*4882a593Smuzhiyun 	"SM: Error attempting to access the PASID Directory Entry",
1707*4882a593Smuzhiyun 	"SM: Present bit in Directory Entry is clear",
1708*4882a593Smuzhiyun 	"SM: Non-zero reserved field set in PASID Directory Entry",
1709*4882a593Smuzhiyun 	"Unknown", "Unknown", "Unknown", "Unknown", "Unknown", /* 0x53-0x57 */
1710*4882a593Smuzhiyun 	"SM: Error attempting to access PASID Table Entry",
1711*4882a593Smuzhiyun 	"SM: Present bit in PASID Table Entry is clear",
1712*4882a593Smuzhiyun 	"SM: Non-zero reserved field set in PASID Table Entry",
1713*4882a593Smuzhiyun 	"SM: Invalid Scalable-Mode PASID Table Entry",
1714*4882a593Smuzhiyun 	"SM: ERE field is clear in PASID Table Entry",
1715*4882a593Smuzhiyun 	"SM: SRE field is clear in PASID Table Entry",
1716*4882a593Smuzhiyun 	"Unknown", "Unknown",/* 0x5E-0x5F */
1717*4882a593Smuzhiyun 	"Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", /* 0x60-0x67 */
1718*4882a593Smuzhiyun 	"Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", /* 0x68-0x6F */
1719*4882a593Smuzhiyun 	"SM: Error attempting to access first-level paging entry",
1720*4882a593Smuzhiyun 	"SM: Present bit in first-level paging entry is clear",
1721*4882a593Smuzhiyun 	"SM: Non-zero reserved field set in first-level paging entry",
1722*4882a593Smuzhiyun 	"SM: Error attempting to access FL-PML4 entry",
1723*4882a593Smuzhiyun 	"SM: First-level entry address beyond MGAW in Nested translation",
1724*4882a593Smuzhiyun 	"SM: Read permission error in FL-PML4 entry in Nested translation",
1725*4882a593Smuzhiyun 	"SM: Read permission error in first-level paging entry in Nested translation",
1726*4882a593Smuzhiyun 	"SM: Write permission error in first-level paging entry in Nested translation",
1727*4882a593Smuzhiyun 	"SM: Error attempting to access second-level paging entry",
1728*4882a593Smuzhiyun 	"SM: Read/Write permission error in second-level paging entry",
1729*4882a593Smuzhiyun 	"SM: Non-zero reserved field set in second-level paging entry",
1730*4882a593Smuzhiyun 	"SM: Invalid second-level page table pointer",
1731*4882a593Smuzhiyun 	"SM: A/D bit update needed in second-level entry when set up in no snoop",
1732*4882a593Smuzhiyun 	"Unknown", "Unknown", "Unknown", /* 0x7D-0x7F */
1733*4882a593Smuzhiyun 	"SM: Address in first-level translation is not canonical",
1734*4882a593Smuzhiyun 	"SM: U/S set 0 for first-level translation with user privilege",
1735*4882a593Smuzhiyun 	"SM: No execute permission for request with PASID and ER=1",
1736*4882a593Smuzhiyun 	"SM: Address beyond the DMA hardware max",
1737*4882a593Smuzhiyun 	"SM: Second-level entry address beyond the max",
1738*4882a593Smuzhiyun 	"SM: No write permission for Write/AtomicOp request",
1739*4882a593Smuzhiyun 	"SM: No read permission for Read/AtomicOp request",
1740*4882a593Smuzhiyun 	"SM: Invalid address-interrupt address",
1741*4882a593Smuzhiyun 	"Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", "Unknown", /* 0x88-0x8F */
1742*4882a593Smuzhiyun 	"SM: A/D bit update needed in first-level entry when set up in no snoop",
1743*4882a593Smuzhiyun };
1744*4882a593Smuzhiyun 
1745*4882a593Smuzhiyun static const char *irq_remap_fault_reasons[] =
1746*4882a593Smuzhiyun {
1747*4882a593Smuzhiyun 	"Detected reserved fields in the decoded interrupt-remapped request",
1748*4882a593Smuzhiyun 	"Interrupt index exceeded the interrupt-remapping table size",
1749*4882a593Smuzhiyun 	"Present field in the IRTE entry is clear",
1750*4882a593Smuzhiyun 	"Error accessing interrupt-remapping table pointed by IRTA_REG",
1751*4882a593Smuzhiyun 	"Detected reserved fields in the IRTE entry",
1752*4882a593Smuzhiyun 	"Blocked a compatibility format interrupt request",
1753*4882a593Smuzhiyun 	"Blocked an interrupt request due to source-id verification failure",
1754*4882a593Smuzhiyun };
1755*4882a593Smuzhiyun 
dmar_get_fault_reason(u8 fault_reason,int * fault_type)1756*4882a593Smuzhiyun static const char *dmar_get_fault_reason(u8 fault_reason, int *fault_type)
1757*4882a593Smuzhiyun {
1758*4882a593Smuzhiyun 	if (fault_reason >= 0x20 && (fault_reason - 0x20 <
1759*4882a593Smuzhiyun 					ARRAY_SIZE(irq_remap_fault_reasons))) {
1760*4882a593Smuzhiyun 		*fault_type = INTR_REMAP;
1761*4882a593Smuzhiyun 		return irq_remap_fault_reasons[fault_reason - 0x20];
1762*4882a593Smuzhiyun 	} else if (fault_reason >= 0x30 && (fault_reason - 0x30 <
1763*4882a593Smuzhiyun 			ARRAY_SIZE(dma_remap_sm_fault_reasons))) {
1764*4882a593Smuzhiyun 		*fault_type = DMA_REMAP;
1765*4882a593Smuzhiyun 		return dma_remap_sm_fault_reasons[fault_reason - 0x30];
1766*4882a593Smuzhiyun 	} else if (fault_reason < ARRAY_SIZE(dma_remap_fault_reasons)) {
1767*4882a593Smuzhiyun 		*fault_type = DMA_REMAP;
1768*4882a593Smuzhiyun 		return dma_remap_fault_reasons[fault_reason];
1769*4882a593Smuzhiyun 	} else {
1770*4882a593Smuzhiyun 		*fault_type = UNKNOWN;
1771*4882a593Smuzhiyun 		return "Unknown";
1772*4882a593Smuzhiyun 	}
1773*4882a593Smuzhiyun }
1774*4882a593Smuzhiyun 
1775*4882a593Smuzhiyun 
dmar_msi_reg(struct intel_iommu * iommu,int irq)1776*4882a593Smuzhiyun static inline int dmar_msi_reg(struct intel_iommu *iommu, int irq)
1777*4882a593Smuzhiyun {
1778*4882a593Smuzhiyun 	if (iommu->irq == irq)
1779*4882a593Smuzhiyun 		return DMAR_FECTL_REG;
1780*4882a593Smuzhiyun 	else if (iommu->pr_irq == irq)
1781*4882a593Smuzhiyun 		return DMAR_PECTL_REG;
1782*4882a593Smuzhiyun 	else
1783*4882a593Smuzhiyun 		BUG();
1784*4882a593Smuzhiyun }
1785*4882a593Smuzhiyun 
dmar_msi_unmask(struct irq_data * data)1786*4882a593Smuzhiyun void dmar_msi_unmask(struct irq_data *data)
1787*4882a593Smuzhiyun {
1788*4882a593Smuzhiyun 	struct intel_iommu *iommu = irq_data_get_irq_handler_data(data);
1789*4882a593Smuzhiyun 	int reg = dmar_msi_reg(iommu, data->irq);
1790*4882a593Smuzhiyun 	unsigned long flag;
1791*4882a593Smuzhiyun 
1792*4882a593Smuzhiyun 	/* unmask it */
1793*4882a593Smuzhiyun 	raw_spin_lock_irqsave(&iommu->register_lock, flag);
1794*4882a593Smuzhiyun 	writel(0, iommu->reg + reg);
1795*4882a593Smuzhiyun 	/* Read a reg to force flush the post write */
1796*4882a593Smuzhiyun 	readl(iommu->reg + reg);
1797*4882a593Smuzhiyun 	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
1798*4882a593Smuzhiyun }
1799*4882a593Smuzhiyun 
dmar_msi_mask(struct irq_data * data)1800*4882a593Smuzhiyun void dmar_msi_mask(struct irq_data *data)
1801*4882a593Smuzhiyun {
1802*4882a593Smuzhiyun 	struct intel_iommu *iommu = irq_data_get_irq_handler_data(data);
1803*4882a593Smuzhiyun 	int reg = dmar_msi_reg(iommu, data->irq);
1804*4882a593Smuzhiyun 	unsigned long flag;
1805*4882a593Smuzhiyun 
1806*4882a593Smuzhiyun 	/* mask it */
1807*4882a593Smuzhiyun 	raw_spin_lock_irqsave(&iommu->register_lock, flag);
1808*4882a593Smuzhiyun 	writel(DMA_FECTL_IM, iommu->reg + reg);
1809*4882a593Smuzhiyun 	/* Read a reg to force flush the post write */
1810*4882a593Smuzhiyun 	readl(iommu->reg + reg);
1811*4882a593Smuzhiyun 	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
1812*4882a593Smuzhiyun }
1813*4882a593Smuzhiyun 
dmar_msi_write(int irq,struct msi_msg * msg)1814*4882a593Smuzhiyun void dmar_msi_write(int irq, struct msi_msg *msg)
1815*4882a593Smuzhiyun {
1816*4882a593Smuzhiyun 	struct intel_iommu *iommu = irq_get_handler_data(irq);
1817*4882a593Smuzhiyun 	int reg = dmar_msi_reg(iommu, irq);
1818*4882a593Smuzhiyun 	unsigned long flag;
1819*4882a593Smuzhiyun 
1820*4882a593Smuzhiyun 	raw_spin_lock_irqsave(&iommu->register_lock, flag);
1821*4882a593Smuzhiyun 	writel(msg->data, iommu->reg + reg + 4);
1822*4882a593Smuzhiyun 	writel(msg->address_lo, iommu->reg + reg + 8);
1823*4882a593Smuzhiyun 	writel(msg->address_hi, iommu->reg + reg + 12);
1824*4882a593Smuzhiyun 	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
1825*4882a593Smuzhiyun }
1826*4882a593Smuzhiyun 
dmar_msi_read(int irq,struct msi_msg * msg)1827*4882a593Smuzhiyun void dmar_msi_read(int irq, struct msi_msg *msg)
1828*4882a593Smuzhiyun {
1829*4882a593Smuzhiyun 	struct intel_iommu *iommu = irq_get_handler_data(irq);
1830*4882a593Smuzhiyun 	int reg = dmar_msi_reg(iommu, irq);
1831*4882a593Smuzhiyun 	unsigned long flag;
1832*4882a593Smuzhiyun 
1833*4882a593Smuzhiyun 	raw_spin_lock_irqsave(&iommu->register_lock, flag);
1834*4882a593Smuzhiyun 	msg->data = readl(iommu->reg + reg + 4);
1835*4882a593Smuzhiyun 	msg->address_lo = readl(iommu->reg + reg + 8);
1836*4882a593Smuzhiyun 	msg->address_hi = readl(iommu->reg + reg + 12);
1837*4882a593Smuzhiyun 	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
1838*4882a593Smuzhiyun }
1839*4882a593Smuzhiyun 
dmar_fault_do_one(struct intel_iommu * iommu,int type,u8 fault_reason,u32 pasid,u16 source_id,unsigned long long addr)1840*4882a593Smuzhiyun static int dmar_fault_do_one(struct intel_iommu *iommu, int type,
1841*4882a593Smuzhiyun 		u8 fault_reason, u32 pasid, u16 source_id,
1842*4882a593Smuzhiyun 		unsigned long long addr)
1843*4882a593Smuzhiyun {
1844*4882a593Smuzhiyun 	const char *reason;
1845*4882a593Smuzhiyun 	int fault_type;
1846*4882a593Smuzhiyun 
1847*4882a593Smuzhiyun 	reason = dmar_get_fault_reason(fault_reason, &fault_type);
1848*4882a593Smuzhiyun 
1849*4882a593Smuzhiyun 	if (fault_type == INTR_REMAP)
1850*4882a593Smuzhiyun 		pr_err("[INTR-REMAP] Request device [%02x:%02x.%d] fault index %llx [fault reason %02d] %s\n",
1851*4882a593Smuzhiyun 			source_id >> 8, PCI_SLOT(source_id & 0xFF),
1852*4882a593Smuzhiyun 			PCI_FUNC(source_id & 0xFF), addr >> 48,
1853*4882a593Smuzhiyun 			fault_reason, reason);
1854*4882a593Smuzhiyun 	else
1855*4882a593Smuzhiyun 		pr_err("[%s] Request device [%02x:%02x.%d] PASID %x fault addr %llx [fault reason %02d] %s\n",
1856*4882a593Smuzhiyun 		       type ? "DMA Read" : "DMA Write",
1857*4882a593Smuzhiyun 		       source_id >> 8, PCI_SLOT(source_id & 0xFF),
1858*4882a593Smuzhiyun 		       PCI_FUNC(source_id & 0xFF), pasid, addr,
1859*4882a593Smuzhiyun 		       fault_reason, reason);
1860*4882a593Smuzhiyun 	return 0;
1861*4882a593Smuzhiyun }
1862*4882a593Smuzhiyun 
1863*4882a593Smuzhiyun #define PRIMARY_FAULT_REG_LEN (16)
dmar_fault(int irq,void * dev_id)1864*4882a593Smuzhiyun irqreturn_t dmar_fault(int irq, void *dev_id)
1865*4882a593Smuzhiyun {
1866*4882a593Smuzhiyun 	struct intel_iommu *iommu = dev_id;
1867*4882a593Smuzhiyun 	int reg, fault_index;
1868*4882a593Smuzhiyun 	u32 fault_status;
1869*4882a593Smuzhiyun 	unsigned long flag;
1870*4882a593Smuzhiyun 	static DEFINE_RATELIMIT_STATE(rs,
1871*4882a593Smuzhiyun 				      DEFAULT_RATELIMIT_INTERVAL,
1872*4882a593Smuzhiyun 				      DEFAULT_RATELIMIT_BURST);
1873*4882a593Smuzhiyun 
1874*4882a593Smuzhiyun 	raw_spin_lock_irqsave(&iommu->register_lock, flag);
1875*4882a593Smuzhiyun 	fault_status = readl(iommu->reg + DMAR_FSTS_REG);
1876*4882a593Smuzhiyun 	if (fault_status && __ratelimit(&rs))
1877*4882a593Smuzhiyun 		pr_err("DRHD: handling fault status reg %x\n", fault_status);
1878*4882a593Smuzhiyun 
1879*4882a593Smuzhiyun 	/* TBD: ignore advanced fault log currently */
1880*4882a593Smuzhiyun 	if (!(fault_status & DMA_FSTS_PPF))
1881*4882a593Smuzhiyun 		goto unlock_exit;
1882*4882a593Smuzhiyun 
1883*4882a593Smuzhiyun 	fault_index = dma_fsts_fault_record_index(fault_status);
1884*4882a593Smuzhiyun 	reg = cap_fault_reg_offset(iommu->cap);
1885*4882a593Smuzhiyun 	while (1) {
1886*4882a593Smuzhiyun 		/* Disable printing, simply clear the fault when ratelimited */
1887*4882a593Smuzhiyun 		bool ratelimited = !__ratelimit(&rs);
1888*4882a593Smuzhiyun 		u8 fault_reason;
1889*4882a593Smuzhiyun 		u16 source_id;
1890*4882a593Smuzhiyun 		u64 guest_addr;
1891*4882a593Smuzhiyun 		u32 pasid;
1892*4882a593Smuzhiyun 		int type;
1893*4882a593Smuzhiyun 		u32 data;
1894*4882a593Smuzhiyun 		bool pasid_present;
1895*4882a593Smuzhiyun 
1896*4882a593Smuzhiyun 		/* highest 32 bits */
1897*4882a593Smuzhiyun 		data = readl(iommu->reg + reg +
1898*4882a593Smuzhiyun 				fault_index * PRIMARY_FAULT_REG_LEN + 12);
1899*4882a593Smuzhiyun 		if (!(data & DMA_FRCD_F))
1900*4882a593Smuzhiyun 			break;
1901*4882a593Smuzhiyun 
1902*4882a593Smuzhiyun 		if (!ratelimited) {
1903*4882a593Smuzhiyun 			fault_reason = dma_frcd_fault_reason(data);
1904*4882a593Smuzhiyun 			type = dma_frcd_type(data);
1905*4882a593Smuzhiyun 
1906*4882a593Smuzhiyun 			pasid = dma_frcd_pasid_value(data);
1907*4882a593Smuzhiyun 			data = readl(iommu->reg + reg +
1908*4882a593Smuzhiyun 				     fault_index * PRIMARY_FAULT_REG_LEN + 8);
1909*4882a593Smuzhiyun 			source_id = dma_frcd_source_id(data);
1910*4882a593Smuzhiyun 
1911*4882a593Smuzhiyun 			pasid_present = dma_frcd_pasid_present(data);
1912*4882a593Smuzhiyun 			guest_addr = dmar_readq(iommu->reg + reg +
1913*4882a593Smuzhiyun 					fault_index * PRIMARY_FAULT_REG_LEN);
1914*4882a593Smuzhiyun 			guest_addr = dma_frcd_page_addr(guest_addr);
1915*4882a593Smuzhiyun 		}
1916*4882a593Smuzhiyun 
1917*4882a593Smuzhiyun 		/* clear the fault */
1918*4882a593Smuzhiyun 		writel(DMA_FRCD_F, iommu->reg + reg +
1919*4882a593Smuzhiyun 			fault_index * PRIMARY_FAULT_REG_LEN + 12);
1920*4882a593Smuzhiyun 
1921*4882a593Smuzhiyun 		raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
1922*4882a593Smuzhiyun 
1923*4882a593Smuzhiyun 		if (!ratelimited)
1924*4882a593Smuzhiyun 			/* Using pasid -1 if pasid is not present */
1925*4882a593Smuzhiyun 			dmar_fault_do_one(iommu, type, fault_reason,
1926*4882a593Smuzhiyun 					  pasid_present ? pasid : -1,
1927*4882a593Smuzhiyun 					  source_id, guest_addr);
1928*4882a593Smuzhiyun 
1929*4882a593Smuzhiyun 		fault_index++;
1930*4882a593Smuzhiyun 		if (fault_index >= cap_num_fault_regs(iommu->cap))
1931*4882a593Smuzhiyun 			fault_index = 0;
1932*4882a593Smuzhiyun 		raw_spin_lock_irqsave(&iommu->register_lock, flag);
1933*4882a593Smuzhiyun 	}
1934*4882a593Smuzhiyun 
1935*4882a593Smuzhiyun 	writel(DMA_FSTS_PFO | DMA_FSTS_PPF | DMA_FSTS_PRO,
1936*4882a593Smuzhiyun 	       iommu->reg + DMAR_FSTS_REG);
1937*4882a593Smuzhiyun 
1938*4882a593Smuzhiyun unlock_exit:
1939*4882a593Smuzhiyun 	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
1940*4882a593Smuzhiyun 	return IRQ_HANDLED;
1941*4882a593Smuzhiyun }
1942*4882a593Smuzhiyun 
dmar_set_interrupt(struct intel_iommu * iommu)1943*4882a593Smuzhiyun int dmar_set_interrupt(struct intel_iommu *iommu)
1944*4882a593Smuzhiyun {
1945*4882a593Smuzhiyun 	int irq, ret;
1946*4882a593Smuzhiyun 
1947*4882a593Smuzhiyun 	/*
1948*4882a593Smuzhiyun 	 * Check if the fault interrupt is already initialized.
1949*4882a593Smuzhiyun 	 */
1950*4882a593Smuzhiyun 	if (iommu->irq)
1951*4882a593Smuzhiyun 		return 0;
1952*4882a593Smuzhiyun 
1953*4882a593Smuzhiyun 	irq = dmar_alloc_hwirq(iommu->seq_id, iommu->node, iommu);
1954*4882a593Smuzhiyun 	if (irq > 0) {
1955*4882a593Smuzhiyun 		iommu->irq = irq;
1956*4882a593Smuzhiyun 	} else {
1957*4882a593Smuzhiyun 		pr_err("No free IRQ vectors\n");
1958*4882a593Smuzhiyun 		return -EINVAL;
1959*4882a593Smuzhiyun 	}
1960*4882a593Smuzhiyun 
1961*4882a593Smuzhiyun 	ret = request_irq(irq, dmar_fault, IRQF_NO_THREAD, iommu->name, iommu);
1962*4882a593Smuzhiyun 	if (ret)
1963*4882a593Smuzhiyun 		pr_err("Can't request irq\n");
1964*4882a593Smuzhiyun 	return ret;
1965*4882a593Smuzhiyun }
1966*4882a593Smuzhiyun 
enable_drhd_fault_handling(void)1967*4882a593Smuzhiyun int __init enable_drhd_fault_handling(void)
1968*4882a593Smuzhiyun {
1969*4882a593Smuzhiyun 	struct dmar_drhd_unit *drhd;
1970*4882a593Smuzhiyun 	struct intel_iommu *iommu;
1971*4882a593Smuzhiyun 
1972*4882a593Smuzhiyun 	/*
1973*4882a593Smuzhiyun 	 * Enable fault control interrupt.
1974*4882a593Smuzhiyun 	 */
1975*4882a593Smuzhiyun 	for_each_iommu(iommu, drhd) {
1976*4882a593Smuzhiyun 		u32 fault_status;
1977*4882a593Smuzhiyun 		int ret = dmar_set_interrupt(iommu);
1978*4882a593Smuzhiyun 
1979*4882a593Smuzhiyun 		if (ret) {
1980*4882a593Smuzhiyun 			pr_err("DRHD %Lx: failed to enable fault, interrupt, ret %d\n",
1981*4882a593Smuzhiyun 			       (unsigned long long)drhd->reg_base_addr, ret);
1982*4882a593Smuzhiyun 			return -1;
1983*4882a593Smuzhiyun 		}
1984*4882a593Smuzhiyun 
1985*4882a593Smuzhiyun 		/*
1986*4882a593Smuzhiyun 		 * Clear any previous faults.
1987*4882a593Smuzhiyun 		 */
1988*4882a593Smuzhiyun 		dmar_fault(iommu->irq, iommu);
1989*4882a593Smuzhiyun 		fault_status = readl(iommu->reg + DMAR_FSTS_REG);
1990*4882a593Smuzhiyun 		writel(fault_status, iommu->reg + DMAR_FSTS_REG);
1991*4882a593Smuzhiyun 	}
1992*4882a593Smuzhiyun 
1993*4882a593Smuzhiyun 	return 0;
1994*4882a593Smuzhiyun }
1995*4882a593Smuzhiyun 
1996*4882a593Smuzhiyun /*
1997*4882a593Smuzhiyun  * Re-enable Queued Invalidation interface.
1998*4882a593Smuzhiyun  */
dmar_reenable_qi(struct intel_iommu * iommu)1999*4882a593Smuzhiyun int dmar_reenable_qi(struct intel_iommu *iommu)
2000*4882a593Smuzhiyun {
2001*4882a593Smuzhiyun 	if (!ecap_qis(iommu->ecap))
2002*4882a593Smuzhiyun 		return -ENOENT;
2003*4882a593Smuzhiyun 
2004*4882a593Smuzhiyun 	if (!iommu->qi)
2005*4882a593Smuzhiyun 		return -ENOENT;
2006*4882a593Smuzhiyun 
2007*4882a593Smuzhiyun 	/*
2008*4882a593Smuzhiyun 	 * First disable queued invalidation.
2009*4882a593Smuzhiyun 	 */
2010*4882a593Smuzhiyun 	dmar_disable_qi(iommu);
2011*4882a593Smuzhiyun 	/*
2012*4882a593Smuzhiyun 	 * Then enable queued invalidation again. Since there is no pending
2013*4882a593Smuzhiyun 	 * invalidation requests now, it's safe to re-enable queued
2014*4882a593Smuzhiyun 	 * invalidation.
2015*4882a593Smuzhiyun 	 */
2016*4882a593Smuzhiyun 	__dmar_enable_qi(iommu);
2017*4882a593Smuzhiyun 
2018*4882a593Smuzhiyun 	return 0;
2019*4882a593Smuzhiyun }
2020*4882a593Smuzhiyun 
2021*4882a593Smuzhiyun /*
2022*4882a593Smuzhiyun  * Check interrupt remapping support in DMAR table description.
2023*4882a593Smuzhiyun  */
dmar_ir_support(void)2024*4882a593Smuzhiyun int __init dmar_ir_support(void)
2025*4882a593Smuzhiyun {
2026*4882a593Smuzhiyun 	struct acpi_table_dmar *dmar;
2027*4882a593Smuzhiyun 	dmar = (struct acpi_table_dmar *)dmar_tbl;
2028*4882a593Smuzhiyun 	if (!dmar)
2029*4882a593Smuzhiyun 		return 0;
2030*4882a593Smuzhiyun 	return dmar->flags & 0x1;
2031*4882a593Smuzhiyun }
2032*4882a593Smuzhiyun 
2033*4882a593Smuzhiyun /* Check whether DMAR units are in use */
dmar_in_use(void)2034*4882a593Smuzhiyun static inline bool dmar_in_use(void)
2035*4882a593Smuzhiyun {
2036*4882a593Smuzhiyun 	return irq_remapping_enabled || intel_iommu_enabled;
2037*4882a593Smuzhiyun }
2038*4882a593Smuzhiyun 
dmar_free_unused_resources(void)2039*4882a593Smuzhiyun static int __init dmar_free_unused_resources(void)
2040*4882a593Smuzhiyun {
2041*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru, *dmaru_n;
2042*4882a593Smuzhiyun 
2043*4882a593Smuzhiyun 	if (dmar_in_use())
2044*4882a593Smuzhiyun 		return 0;
2045*4882a593Smuzhiyun 
2046*4882a593Smuzhiyun 	if (dmar_dev_scope_status != 1 && !list_empty(&dmar_drhd_units))
2047*4882a593Smuzhiyun 		bus_unregister_notifier(&pci_bus_type, &dmar_pci_bus_nb);
2048*4882a593Smuzhiyun 
2049*4882a593Smuzhiyun 	down_write(&dmar_global_lock);
2050*4882a593Smuzhiyun 	list_for_each_entry_safe(dmaru, dmaru_n, &dmar_drhd_units, list) {
2051*4882a593Smuzhiyun 		list_del(&dmaru->list);
2052*4882a593Smuzhiyun 		dmar_free_drhd(dmaru);
2053*4882a593Smuzhiyun 	}
2054*4882a593Smuzhiyun 	up_write(&dmar_global_lock);
2055*4882a593Smuzhiyun 
2056*4882a593Smuzhiyun 	return 0;
2057*4882a593Smuzhiyun }
2058*4882a593Smuzhiyun 
2059*4882a593Smuzhiyun late_initcall(dmar_free_unused_resources);
2060*4882a593Smuzhiyun IOMMU_INIT_POST(detect_intel_iommu);
2061*4882a593Smuzhiyun 
2062*4882a593Smuzhiyun /*
2063*4882a593Smuzhiyun  * DMAR Hotplug Support
2064*4882a593Smuzhiyun  * For more details, please refer to Intel(R) Virtualization Technology
2065*4882a593Smuzhiyun  * for Directed-IO Architecture Specifiction, Rev 2.2, Section 8.8
2066*4882a593Smuzhiyun  * "Remapping Hardware Unit Hot Plug".
2067*4882a593Smuzhiyun  */
2068*4882a593Smuzhiyun static guid_t dmar_hp_guid =
2069*4882a593Smuzhiyun 	GUID_INIT(0xD8C1A3A6, 0xBE9B, 0x4C9B,
2070*4882a593Smuzhiyun 		  0x91, 0xBF, 0xC3, 0xCB, 0x81, 0xFC, 0x5D, 0xAF);
2071*4882a593Smuzhiyun 
2072*4882a593Smuzhiyun /*
2073*4882a593Smuzhiyun  * Currently there's only one revision and BIOS will not check the revision id,
2074*4882a593Smuzhiyun  * so use 0 for safety.
2075*4882a593Smuzhiyun  */
2076*4882a593Smuzhiyun #define	DMAR_DSM_REV_ID			0
2077*4882a593Smuzhiyun #define	DMAR_DSM_FUNC_DRHD		1
2078*4882a593Smuzhiyun #define	DMAR_DSM_FUNC_ATSR		2
2079*4882a593Smuzhiyun #define	DMAR_DSM_FUNC_RHSA		3
2080*4882a593Smuzhiyun 
dmar_detect_dsm(acpi_handle handle,int func)2081*4882a593Smuzhiyun static inline bool dmar_detect_dsm(acpi_handle handle, int func)
2082*4882a593Smuzhiyun {
2083*4882a593Smuzhiyun 	return acpi_check_dsm(handle, &dmar_hp_guid, DMAR_DSM_REV_ID, 1 << func);
2084*4882a593Smuzhiyun }
2085*4882a593Smuzhiyun 
dmar_walk_dsm_resource(acpi_handle handle,int func,dmar_res_handler_t handler,void * arg)2086*4882a593Smuzhiyun static int dmar_walk_dsm_resource(acpi_handle handle, int func,
2087*4882a593Smuzhiyun 				  dmar_res_handler_t handler, void *arg)
2088*4882a593Smuzhiyun {
2089*4882a593Smuzhiyun 	int ret = -ENODEV;
2090*4882a593Smuzhiyun 	union acpi_object *obj;
2091*4882a593Smuzhiyun 	struct acpi_dmar_header *start;
2092*4882a593Smuzhiyun 	struct dmar_res_callback callback;
2093*4882a593Smuzhiyun 	static int res_type[] = {
2094*4882a593Smuzhiyun 		[DMAR_DSM_FUNC_DRHD] = ACPI_DMAR_TYPE_HARDWARE_UNIT,
2095*4882a593Smuzhiyun 		[DMAR_DSM_FUNC_ATSR] = ACPI_DMAR_TYPE_ROOT_ATS,
2096*4882a593Smuzhiyun 		[DMAR_DSM_FUNC_RHSA] = ACPI_DMAR_TYPE_HARDWARE_AFFINITY,
2097*4882a593Smuzhiyun 	};
2098*4882a593Smuzhiyun 
2099*4882a593Smuzhiyun 	if (!dmar_detect_dsm(handle, func))
2100*4882a593Smuzhiyun 		return 0;
2101*4882a593Smuzhiyun 
2102*4882a593Smuzhiyun 	obj = acpi_evaluate_dsm_typed(handle, &dmar_hp_guid, DMAR_DSM_REV_ID,
2103*4882a593Smuzhiyun 				      func, NULL, ACPI_TYPE_BUFFER);
2104*4882a593Smuzhiyun 	if (!obj)
2105*4882a593Smuzhiyun 		return -ENODEV;
2106*4882a593Smuzhiyun 
2107*4882a593Smuzhiyun 	memset(&callback, 0, sizeof(callback));
2108*4882a593Smuzhiyun 	callback.cb[res_type[func]] = handler;
2109*4882a593Smuzhiyun 	callback.arg[res_type[func]] = arg;
2110*4882a593Smuzhiyun 	start = (struct acpi_dmar_header *)obj->buffer.pointer;
2111*4882a593Smuzhiyun 	ret = dmar_walk_remapping_entries(start, obj->buffer.length, &callback);
2112*4882a593Smuzhiyun 
2113*4882a593Smuzhiyun 	ACPI_FREE(obj);
2114*4882a593Smuzhiyun 
2115*4882a593Smuzhiyun 	return ret;
2116*4882a593Smuzhiyun }
2117*4882a593Smuzhiyun 
dmar_hp_add_drhd(struct acpi_dmar_header * header,void * arg)2118*4882a593Smuzhiyun static int dmar_hp_add_drhd(struct acpi_dmar_header *header, void *arg)
2119*4882a593Smuzhiyun {
2120*4882a593Smuzhiyun 	int ret;
2121*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
2122*4882a593Smuzhiyun 
2123*4882a593Smuzhiyun 	dmaru = dmar_find_dmaru((struct acpi_dmar_hardware_unit *)header);
2124*4882a593Smuzhiyun 	if (!dmaru)
2125*4882a593Smuzhiyun 		return -ENODEV;
2126*4882a593Smuzhiyun 
2127*4882a593Smuzhiyun 	ret = dmar_ir_hotplug(dmaru, true);
2128*4882a593Smuzhiyun 	if (ret == 0)
2129*4882a593Smuzhiyun 		ret = dmar_iommu_hotplug(dmaru, true);
2130*4882a593Smuzhiyun 
2131*4882a593Smuzhiyun 	return ret;
2132*4882a593Smuzhiyun }
2133*4882a593Smuzhiyun 
dmar_hp_remove_drhd(struct acpi_dmar_header * header,void * arg)2134*4882a593Smuzhiyun static int dmar_hp_remove_drhd(struct acpi_dmar_header *header, void *arg)
2135*4882a593Smuzhiyun {
2136*4882a593Smuzhiyun 	int i, ret;
2137*4882a593Smuzhiyun 	struct device *dev;
2138*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
2139*4882a593Smuzhiyun 
2140*4882a593Smuzhiyun 	dmaru = dmar_find_dmaru((struct acpi_dmar_hardware_unit *)header);
2141*4882a593Smuzhiyun 	if (!dmaru)
2142*4882a593Smuzhiyun 		return 0;
2143*4882a593Smuzhiyun 
2144*4882a593Smuzhiyun 	/*
2145*4882a593Smuzhiyun 	 * All PCI devices managed by this unit should have been destroyed.
2146*4882a593Smuzhiyun 	 */
2147*4882a593Smuzhiyun 	if (!dmaru->include_all && dmaru->devices && dmaru->devices_cnt) {
2148*4882a593Smuzhiyun 		for_each_active_dev_scope(dmaru->devices,
2149*4882a593Smuzhiyun 					  dmaru->devices_cnt, i, dev)
2150*4882a593Smuzhiyun 			return -EBUSY;
2151*4882a593Smuzhiyun 	}
2152*4882a593Smuzhiyun 
2153*4882a593Smuzhiyun 	ret = dmar_ir_hotplug(dmaru, false);
2154*4882a593Smuzhiyun 	if (ret == 0)
2155*4882a593Smuzhiyun 		ret = dmar_iommu_hotplug(dmaru, false);
2156*4882a593Smuzhiyun 
2157*4882a593Smuzhiyun 	return ret;
2158*4882a593Smuzhiyun }
2159*4882a593Smuzhiyun 
dmar_hp_release_drhd(struct acpi_dmar_header * header,void * arg)2160*4882a593Smuzhiyun static int dmar_hp_release_drhd(struct acpi_dmar_header *header, void *arg)
2161*4882a593Smuzhiyun {
2162*4882a593Smuzhiyun 	struct dmar_drhd_unit *dmaru;
2163*4882a593Smuzhiyun 
2164*4882a593Smuzhiyun 	dmaru = dmar_find_dmaru((struct acpi_dmar_hardware_unit *)header);
2165*4882a593Smuzhiyun 	if (dmaru) {
2166*4882a593Smuzhiyun 		list_del_rcu(&dmaru->list);
2167*4882a593Smuzhiyun 		synchronize_rcu();
2168*4882a593Smuzhiyun 		dmar_free_drhd(dmaru);
2169*4882a593Smuzhiyun 	}
2170*4882a593Smuzhiyun 
2171*4882a593Smuzhiyun 	return 0;
2172*4882a593Smuzhiyun }
2173*4882a593Smuzhiyun 
dmar_hotplug_insert(acpi_handle handle)2174*4882a593Smuzhiyun static int dmar_hotplug_insert(acpi_handle handle)
2175*4882a593Smuzhiyun {
2176*4882a593Smuzhiyun 	int ret;
2177*4882a593Smuzhiyun 	int drhd_count = 0;
2178*4882a593Smuzhiyun 
2179*4882a593Smuzhiyun 	ret = dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_DRHD,
2180*4882a593Smuzhiyun 				     &dmar_validate_one_drhd, (void *)1);
2181*4882a593Smuzhiyun 	if (ret)
2182*4882a593Smuzhiyun 		goto out;
2183*4882a593Smuzhiyun 
2184*4882a593Smuzhiyun 	ret = dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_DRHD,
2185*4882a593Smuzhiyun 				     &dmar_parse_one_drhd, (void *)&drhd_count);
2186*4882a593Smuzhiyun 	if (ret == 0 && drhd_count == 0) {
2187*4882a593Smuzhiyun 		pr_warn(FW_BUG "No DRHD structures in buffer returned by _DSM method\n");
2188*4882a593Smuzhiyun 		goto out;
2189*4882a593Smuzhiyun 	} else if (ret) {
2190*4882a593Smuzhiyun 		goto release_drhd;
2191*4882a593Smuzhiyun 	}
2192*4882a593Smuzhiyun 
2193*4882a593Smuzhiyun 	ret = dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_RHSA,
2194*4882a593Smuzhiyun 				     &dmar_parse_one_rhsa, NULL);
2195*4882a593Smuzhiyun 	if (ret)
2196*4882a593Smuzhiyun 		goto release_drhd;
2197*4882a593Smuzhiyun 
2198*4882a593Smuzhiyun 	ret = dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_ATSR,
2199*4882a593Smuzhiyun 				     &dmar_parse_one_atsr, NULL);
2200*4882a593Smuzhiyun 	if (ret)
2201*4882a593Smuzhiyun 		goto release_atsr;
2202*4882a593Smuzhiyun 
2203*4882a593Smuzhiyun 	ret = dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_DRHD,
2204*4882a593Smuzhiyun 				     &dmar_hp_add_drhd, NULL);
2205*4882a593Smuzhiyun 	if (!ret)
2206*4882a593Smuzhiyun 		return 0;
2207*4882a593Smuzhiyun 
2208*4882a593Smuzhiyun 	dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_DRHD,
2209*4882a593Smuzhiyun 			       &dmar_hp_remove_drhd, NULL);
2210*4882a593Smuzhiyun release_atsr:
2211*4882a593Smuzhiyun 	dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_ATSR,
2212*4882a593Smuzhiyun 			       &dmar_release_one_atsr, NULL);
2213*4882a593Smuzhiyun release_drhd:
2214*4882a593Smuzhiyun 	dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_DRHD,
2215*4882a593Smuzhiyun 			       &dmar_hp_release_drhd, NULL);
2216*4882a593Smuzhiyun out:
2217*4882a593Smuzhiyun 	return ret;
2218*4882a593Smuzhiyun }
2219*4882a593Smuzhiyun 
dmar_hotplug_remove(acpi_handle handle)2220*4882a593Smuzhiyun static int dmar_hotplug_remove(acpi_handle handle)
2221*4882a593Smuzhiyun {
2222*4882a593Smuzhiyun 	int ret;
2223*4882a593Smuzhiyun 
2224*4882a593Smuzhiyun 	ret = dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_ATSR,
2225*4882a593Smuzhiyun 				     &dmar_check_one_atsr, NULL);
2226*4882a593Smuzhiyun 	if (ret)
2227*4882a593Smuzhiyun 		return ret;
2228*4882a593Smuzhiyun 
2229*4882a593Smuzhiyun 	ret = dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_DRHD,
2230*4882a593Smuzhiyun 				     &dmar_hp_remove_drhd, NULL);
2231*4882a593Smuzhiyun 	if (ret == 0) {
2232*4882a593Smuzhiyun 		WARN_ON(dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_ATSR,
2233*4882a593Smuzhiyun 					       &dmar_release_one_atsr, NULL));
2234*4882a593Smuzhiyun 		WARN_ON(dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_DRHD,
2235*4882a593Smuzhiyun 					       &dmar_hp_release_drhd, NULL));
2236*4882a593Smuzhiyun 	} else {
2237*4882a593Smuzhiyun 		dmar_walk_dsm_resource(handle, DMAR_DSM_FUNC_DRHD,
2238*4882a593Smuzhiyun 				       &dmar_hp_add_drhd, NULL);
2239*4882a593Smuzhiyun 	}
2240*4882a593Smuzhiyun 
2241*4882a593Smuzhiyun 	return ret;
2242*4882a593Smuzhiyun }
2243*4882a593Smuzhiyun 
dmar_get_dsm_handle(acpi_handle handle,u32 lvl,void * context,void ** retval)2244*4882a593Smuzhiyun static acpi_status dmar_get_dsm_handle(acpi_handle handle, u32 lvl,
2245*4882a593Smuzhiyun 				       void *context, void **retval)
2246*4882a593Smuzhiyun {
2247*4882a593Smuzhiyun 	acpi_handle *phdl = retval;
2248*4882a593Smuzhiyun 
2249*4882a593Smuzhiyun 	if (dmar_detect_dsm(handle, DMAR_DSM_FUNC_DRHD)) {
2250*4882a593Smuzhiyun 		*phdl = handle;
2251*4882a593Smuzhiyun 		return AE_CTRL_TERMINATE;
2252*4882a593Smuzhiyun 	}
2253*4882a593Smuzhiyun 
2254*4882a593Smuzhiyun 	return AE_OK;
2255*4882a593Smuzhiyun }
2256*4882a593Smuzhiyun 
dmar_device_hotplug(acpi_handle handle,bool insert)2257*4882a593Smuzhiyun static int dmar_device_hotplug(acpi_handle handle, bool insert)
2258*4882a593Smuzhiyun {
2259*4882a593Smuzhiyun 	int ret;
2260*4882a593Smuzhiyun 	acpi_handle tmp = NULL;
2261*4882a593Smuzhiyun 	acpi_status status;
2262*4882a593Smuzhiyun 
2263*4882a593Smuzhiyun 	if (!dmar_in_use())
2264*4882a593Smuzhiyun 		return 0;
2265*4882a593Smuzhiyun 
2266*4882a593Smuzhiyun 	if (dmar_detect_dsm(handle, DMAR_DSM_FUNC_DRHD)) {
2267*4882a593Smuzhiyun 		tmp = handle;
2268*4882a593Smuzhiyun 	} else {
2269*4882a593Smuzhiyun 		status = acpi_walk_namespace(ACPI_TYPE_DEVICE, handle,
2270*4882a593Smuzhiyun 					     ACPI_UINT32_MAX,
2271*4882a593Smuzhiyun 					     dmar_get_dsm_handle,
2272*4882a593Smuzhiyun 					     NULL, NULL, &tmp);
2273*4882a593Smuzhiyun 		if (ACPI_FAILURE(status)) {
2274*4882a593Smuzhiyun 			pr_warn("Failed to locate _DSM method.\n");
2275*4882a593Smuzhiyun 			return -ENXIO;
2276*4882a593Smuzhiyun 		}
2277*4882a593Smuzhiyun 	}
2278*4882a593Smuzhiyun 	if (tmp == NULL)
2279*4882a593Smuzhiyun 		return 0;
2280*4882a593Smuzhiyun 
2281*4882a593Smuzhiyun 	down_write(&dmar_global_lock);
2282*4882a593Smuzhiyun 	if (insert)
2283*4882a593Smuzhiyun 		ret = dmar_hotplug_insert(tmp);
2284*4882a593Smuzhiyun 	else
2285*4882a593Smuzhiyun 		ret = dmar_hotplug_remove(tmp);
2286*4882a593Smuzhiyun 	up_write(&dmar_global_lock);
2287*4882a593Smuzhiyun 
2288*4882a593Smuzhiyun 	return ret;
2289*4882a593Smuzhiyun }
2290*4882a593Smuzhiyun 
dmar_device_add(acpi_handle handle)2291*4882a593Smuzhiyun int dmar_device_add(acpi_handle handle)
2292*4882a593Smuzhiyun {
2293*4882a593Smuzhiyun 	return dmar_device_hotplug(handle, true);
2294*4882a593Smuzhiyun }
2295*4882a593Smuzhiyun 
dmar_device_remove(acpi_handle handle)2296*4882a593Smuzhiyun int dmar_device_remove(acpi_handle handle)
2297*4882a593Smuzhiyun {
2298*4882a593Smuzhiyun 	return dmar_device_hotplug(handle, false);
2299*4882a593Smuzhiyun }
2300*4882a593Smuzhiyun 
2301*4882a593Smuzhiyun /*
2302*4882a593Smuzhiyun  * dmar_platform_optin - Is %DMA_CTRL_PLATFORM_OPT_IN_FLAG set in DMAR table
2303*4882a593Smuzhiyun  *
2304*4882a593Smuzhiyun  * Returns true if the platform has %DMA_CTRL_PLATFORM_OPT_IN_FLAG set in
2305*4882a593Smuzhiyun  * the ACPI DMAR table. This means that the platform boot firmware has made
2306*4882a593Smuzhiyun  * sure no device can issue DMA outside of RMRR regions.
2307*4882a593Smuzhiyun  */
dmar_platform_optin(void)2308*4882a593Smuzhiyun bool dmar_platform_optin(void)
2309*4882a593Smuzhiyun {
2310*4882a593Smuzhiyun 	struct acpi_table_dmar *dmar;
2311*4882a593Smuzhiyun 	acpi_status status;
2312*4882a593Smuzhiyun 	bool ret;
2313*4882a593Smuzhiyun 
2314*4882a593Smuzhiyun 	status = acpi_get_table(ACPI_SIG_DMAR, 0,
2315*4882a593Smuzhiyun 				(struct acpi_table_header **)&dmar);
2316*4882a593Smuzhiyun 	if (ACPI_FAILURE(status))
2317*4882a593Smuzhiyun 		return false;
2318*4882a593Smuzhiyun 
2319*4882a593Smuzhiyun 	ret = !!(dmar->flags & DMAR_PLATFORM_OPT_IN);
2320*4882a593Smuzhiyun 	acpi_put_table((struct acpi_table_header *)dmar);
2321*4882a593Smuzhiyun 
2322*4882a593Smuzhiyun 	return ret;
2323*4882a593Smuzhiyun }
2324*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(dmar_platform_optin);
2325