/*
 * Copyright © 2006-2014 Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * Authors: David Woodhouse <dwmw2@infradead.org>,
 *          Ashok Raj <ashok.raj@intel.com>,
 *          Shaohua Li <shaohua.li@intel.com>,
 *          Anil S Keshavamurthy <anil.s.keshavamurthy@intel.com>,
 *          Fenghua Yu <fenghua.yu@intel.com>
 *          Joerg Roedel <jroedel@suse.de>
 */

#define pr_fmt(fmt)	"DMAR: " fmt
#define dev_fmt(fmt)	pr_fmt(fmt)

#include <linux/init.h>
#include <linux/bitmap.h>
#include <linux/debugfs.h>
#include <linux/export.h>
#include <linux/slab.h>
#include <linux/irq.h>
#include <linux/interrupt.h>
#include <linux/spinlock.h>
#include <linux/pci.h>
#include <linux/dmar.h>
#include <linux/dma-mapping.h>
#include <linux/mempool.h>
#include <linux/memory.h>
#include <linux/cpu.h>
#include <linux/timer.h>
#include <linux/io.h>
#include <linux/iova.h>
#include <linux/iommu.h>
#include <linux/intel-iommu.h>
#include <linux/syscore_ops.h>
#include <linux/tboot.h>
#include <linux/dmi.h>
#include <linux/pci-ats.h>
#include <linux/memblock.h>
#include <linux/dma-contiguous.h>
#include <linux/dma-direct.h>
#include <linux/crash_dump.h>
#include <linux/numa.h>
#include <asm/irq_remapping.h>
#include <asm/cacheflush.h>
#include <asm/iommu.h>

#include "irq_remapping.h"
#include "intel-pasid.h"

#define ROOT_SIZE		VTD_PAGE_SIZE
#define CONTEXT_SIZE		VTD_PAGE_SIZE

#define IS_GFX_DEVICE(pdev) ((pdev->class >> 16) == PCI_BASE_CLASS_DISPLAY)
#define IS_USB_DEVICE(pdev) ((pdev->class >> 8) == PCI_CLASS_SERIAL_USB)
#define IS_ISA_DEVICE(pdev) ((pdev->class >> 8) == PCI_CLASS_BRIDGE_ISA)
#define IS_AZALIA(pdev) ((pdev)->vendor == 0x8086 && (pdev)->device == 0x3a3e)

#define IOAPIC_RANGE_START	(0xfee00000)
#define IOAPIC_RANGE_END	(0xfeefffff)
#define IOVA_START_ADDR		(0x1000)

#define DEFAULT_DOMAIN_ADDRESS_WIDTH 57

#define MAX_AGAW_WIDTH 64
#define MAX_AGAW_PFN_WIDTH	(MAX_AGAW_WIDTH - VTD_PAGE_SHIFT)

#define __DOMAIN_MAX_PFN(gaw)  ((((uint64_t)1) << (gaw-VTD_PAGE_SHIFT)) - 1)
#define __DOMAIN_MAX_ADDR(gaw) ((((uint64_t)1) << gaw) - 1)

/* We limit DOMAIN_MAX_PFN to fit in an unsigned long, and DOMAIN_MAX_ADDR
   to match. That way, we can use 'unsigned long' for PFNs with impunity. */
#define DOMAIN_MAX_PFN(gaw)	((unsigned long) min_t(uint64_t, \
				__DOMAIN_MAX_PFN(gaw), (unsigned long)-1))
#define DOMAIN_MAX_ADDR(gaw)	(((uint64_t)__DOMAIN_MAX_PFN(gaw)) << VTD_PAGE_SHIFT)

/* IO virtual address start page frame number */
#define IOVA_START_PFN		(1)

#define IOVA_PFN(addr)		((addr) >> PAGE_SHIFT)

/* page table handling */
#define LEVEL_STRIDE		(9)
#define LEVEL_MASK		(((u64)1 << LEVEL_STRIDE) - 1)

/*
 * This bitmap is used to advertise the page sizes our hardware supports
 * to the IOMMU core, which will then use this information to split
 * physically contiguous memory regions it is mapping into page sizes
 * that we support.
 *
 * Traditionally the IOMMU core just handed us the mappings directly,
 * after making sure the size is a power-of-two multiple of 4KiB and
 * that the mapping has natural alignment.
 *
 * To retain this behavior, we currently advertise that we support
 * all page sizes that are a power-of-two multiple of 4KiB.
 *
 * If at some point we'd like to utilize the IOMMU core's new behavior,
 * we could change this to advertise the real page sizes we support.
 */
#define INTEL_IOMMU_PGSIZES	(~0xFFFUL)

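/*
 * AGAW (adjusted guest address width) encodes the depth of the second-level
 * page table: agaw 1/2/3 select 3/4/5-level tables covering 39/48/57 bits
 * of IOVA space, i.e. width = 30 + 9 * agaw (capped at MAX_AGAW_WIDTH) and
 * level = agaw + 2, as implemented by the helpers below.
 */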
static inline int agaw_to_level(int agaw)
{
	return agaw + 2;
}

static inline int agaw_to_width(int agaw)
{
	return min_t(int, 30 + agaw * LEVEL_STRIDE, MAX_AGAW_WIDTH);
}

static inline int width_to_agaw(int width)
{
	return DIV_ROUND_UP(width - 30, LEVEL_STRIDE);
}

static inline unsigned int level_to_offset_bits(int level)
{
	return (level - 1) * LEVEL_STRIDE;
}

static inline int pfn_level_offset(unsigned long pfn, int level)
{
	return (pfn >> level_to_offset_bits(level)) & LEVEL_MASK;
}

static inline unsigned long level_mask(int level)
{
	return -1UL << level_to_offset_bits(level);
}

static inline unsigned long level_size(int level)
{
	return 1UL << level_to_offset_bits(level);
}

static inline unsigned long align_to_level(unsigned long pfn, int level)
{
	return (pfn + level_size(level) - 1) & level_mask(level);
}

static inline unsigned long lvl_to_nr_pages(unsigned int lvl)
{
	return 1 << min_t(int, (lvl - 1) * LEVEL_STRIDE, MAX_AGAW_PFN_WIDTH);
}

/* VT-d pages must always be _smaller_ than MM pages. Otherwise things
   are never going to work. */
static inline unsigned long dma_to_mm_pfn(unsigned long dma_pfn)
{
	return dma_pfn >> (PAGE_SHIFT - VTD_PAGE_SHIFT);
}

static inline unsigned long mm_to_dma_pfn(unsigned long mm_pfn)
{
	return mm_pfn << (PAGE_SHIFT - VTD_PAGE_SHIFT);
}

static inline unsigned long page_to_dma_pfn(struct page *pg)
{
	return mm_to_dma_pfn(page_to_pfn(pg));
}

static inline unsigned long virt_to_dma_pfn(void *p)
{
	return page_to_dma_pfn(virt_to_page(p));
}

/* global iommu list, set NULL for ignored DMAR units */
static struct intel_iommu **g_iommus;

static void __init check_tylersburg_isoch(void);
static int rwbf_quirk;

/*
 * Set to 1 to panic the kernel if VT-d cannot be enabled successfully
 * (used when the kernel is launched with TXT).
 */
static int force_on = 0;
int intel_iommu_tboot_noforce;
static int no_platform_optin;

#define ROOT_ENTRY_NR (VTD_PAGE_SIZE/sizeof(struct root_entry))

/*
 * Take a root_entry and return the Lower Context Table Pointer (LCTP)
 * if marked present.
 */
static phys_addr_t root_entry_lctp(struct root_entry *re)
{
	if (!(re->lo & 1))
		return 0;

	return re->lo & VTD_PAGE_MASK;
}

/*
 * Take a root_entry and return the Upper Context Table Pointer (UCTP)
 * if marked present.
 */
static phys_addr_t root_entry_uctp(struct root_entry *re)
{
	if (!(re->hi & 1))
		return 0;

	return re->hi & VTD_PAGE_MASK;
}

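/*
 * Context-entry bit helpers. Bit 11 of the low word was the PASID-enable
 * bit of the older extended-context format; bit 3 of the high word is a
 * software-only flag marking entries copied from a previous kernel (kdump),
 * which context_present() below treats as not present so that such entries
 * get re-programmed before use.
 */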
static inline void context_clear_pasid_enable(struct context_entry *context)
{
	context->lo &= ~(1ULL << 11);
}

static inline bool context_pasid_enabled(struct context_entry *context)
{
	return !!(context->lo & (1ULL << 11));
}

static inline void context_set_copied(struct context_entry *context)
{
	context->hi |= (1ull << 3);
}

static inline bool context_copied(struct context_entry *context)
{
	return !!(context->hi & (1ULL << 3));
}

static inline bool __context_present(struct context_entry *context)
{
	return (context->lo & 1);
}

bool context_present(struct context_entry *context)
{
	return context_pasid_enabled(context) ?
	     __context_present(context) :
	     __context_present(context) && !context_copied(context);
}

static inline void context_set_present(struct context_entry *context)
{
	context->lo |= 1;
}

static inline void context_set_fault_enable(struct context_entry *context)
{
	context->lo &= (((u64)-1) << 2) | 1;
}

static inline void context_set_translation_type(struct context_entry *context,
						unsigned long value)
{
	context->lo &= (((u64)-1) << 4) | 3;
	context->lo |= (value & 3) << 2;
}

static inline void context_set_address_root(struct context_entry *context,
					    unsigned long value)
{
	context->lo &= ~VTD_PAGE_MASK;
	context->lo |= value & VTD_PAGE_MASK;
}

static inline void context_set_address_width(struct context_entry *context,
					     unsigned long value)
{
	context->hi |= value & 7;
}

static inline void context_set_domain_id(struct context_entry *context,
					 unsigned long value)
{
	context->hi |= (value & ((1 << 16) - 1)) << 8;
}

static inline int context_domain_id(struct context_entry *c)
{
	return((c->hi >> 8) & 0xffff);
}

static inline void context_clear_entry(struct context_entry *context)
{
	context->lo = 0;
	context->hi = 0;
}

/*
 * This domain is a statically identity mapping domain.
 *	1. This domain creates a static 1:1 mapping of all usable memory.
 *	2. It maps to each iommu if successful.
 *	3. Each iommu maps to this domain if successful.
 */
static struct dmar_domain *si_domain;
static int hw_pass_through = 1;

/*
 * A domain of this type represents a virtual machine; more than one
 * device across iommus may be owned by one domain, e.g. a kvm guest.
 */
#define DOMAIN_FLAG_VIRTUAL_MACHINE	(1 << 0)

/* si_domain contains multiple devices */
#define DOMAIN_FLAG_STATIC_IDENTITY	(1 << 1)

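/*
 * Iterate over the indexes of the IOMMUs that currently hold a reference
 * on @domain (i.e. domain->iommu_refcnt[idx] is non-zero).
 */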
#define for_each_domain_iommu(idx, domain)			\
	for (idx = 0; idx < g_num_of_iommus; idx++)		\
		if (domain->iommu_refcnt[idx])

struct dmar_rmrr_unit {
	struct list_head list;		/* list of rmrr units */
	struct acpi_dmar_header *hdr;	/* ACPI header */
	u64	base_address;		/* reserved base address */
	u64	end_address;		/* reserved end address */
	struct dmar_dev_scope *devices;	/* target devices */
	int	devices_cnt;		/* target device count */
	struct iommu_resv_region *resv;	/* reserved region handle */
};

struct dmar_atsr_unit {
	struct list_head list;		/* list of ATSR units */
	struct acpi_dmar_header *hdr;	/* ACPI header */
	struct dmar_dev_scope *devices;	/* target devices */
	int devices_cnt;		/* target device count */
	u8 include_all:1;		/* include all ports */
};

static LIST_HEAD(dmar_atsr_units);
static LIST_HEAD(dmar_rmrr_units);

#define for_each_rmrr_units(rmrr) \
	list_for_each_entry(rmrr, &dmar_rmrr_units, list)

/* bitmap for indexing intel_iommus */
static int g_num_of_iommus;

static void domain_exit(struct dmar_domain *domain);
static void domain_remove_dev_info(struct dmar_domain *domain);
static void dmar_remove_one_dev_info(struct device *dev);
static void __dmar_remove_one_dev_info(struct device_domain_info *info);
static void domain_context_clear(struct intel_iommu *iommu,
				 struct device *dev);
static int domain_detach_iommu(struct dmar_domain *domain,
			       struct intel_iommu *iommu);

#ifdef CONFIG_INTEL_IOMMU_DEFAULT_ON
int dmar_disabled = 0;
#else
int dmar_disabled = 1;
#endif /* CONFIG_INTEL_IOMMU_DEFAULT_ON */

int intel_iommu_enabled = 0;
EXPORT_SYMBOL_GPL(intel_iommu_enabled);

static int dmar_map_gfx = 1;
static int dmar_forcedac;
static int intel_iommu_strict;
static int intel_iommu_superpage = 1;
static int intel_iommu_sm;
static int iommu_identity_mapping;

#define IDENTMAP_ALL		1
#define IDENTMAP_GFX		2
#define IDENTMAP_AZALIA		4

#define sm_supported(iommu)	(intel_iommu_sm && ecap_smts((iommu)->ecap))
#define pasid_supported(iommu)	(sm_supported(iommu) &&			\
				 ecap_pasid((iommu)->ecap))

int intel_iommu_gfx_mapped;
EXPORT_SYMBOL_GPL(intel_iommu_gfx_mapped);

#define DUMMY_DEVICE_DOMAIN_INFO ((struct device_domain_info *)(-1))
static DEFINE_SPINLOCK(device_domain_lock);
static LIST_HEAD(device_domain_list);

/*
 * Iterate over elements in device_domain_list and call the specified
 * callback @fn against each element.
 */
int for_each_device_domain(int (*fn)(struct device_domain_info *info,
				     void *data), void *data)
{
	int ret = 0;
	unsigned long flags;
	struct device_domain_info *info;

	spin_lock_irqsave(&device_domain_lock, flags);
	list_for_each_entry(info, &device_domain_list, global) {
		ret = fn(info, data);
		if (ret) {
			spin_unlock_irqrestore(&device_domain_lock, flags);
			return ret;
		}
	}
	spin_unlock_irqrestore(&device_domain_lock, flags);

	return 0;
}

const struct iommu_ops intel_iommu_ops;

static bool translation_pre_enabled(struct intel_iommu *iommu)
{
	return (iommu->flags & VTD_FLAG_TRANS_PRE_ENABLED);
}

static void clear_translation_pre_enabled(struct intel_iommu *iommu)
{
	iommu->flags &= ~VTD_FLAG_TRANS_PRE_ENABLED;
}

static void init_translation_status(struct intel_iommu *iommu)
{
	u32 gsts;

	gsts = readl(iommu->reg + DMAR_GSTS_REG);
	if (gsts & DMA_GSTS_TES)
		iommu->flags |= VTD_FLAG_TRANS_PRE_ENABLED;
}

/* Convert a generic 'struct iommu_domain' to the private 'struct dmar_domain' */
static struct dmar_domain *to_dmar_domain(struct iommu_domain *dom)
{
	return container_of(dom, struct dmar_domain, domain);
}

static int __init intel_iommu_setup(char *str)
{
	if (!str)
		return -EINVAL;
	while (*str) {
		if (!strncmp(str, "on", 2)) {
			dmar_disabled = 0;
			pr_info("IOMMU enabled\n");
		} else if (!strncmp(str, "off", 3)) {
			dmar_disabled = 1;
			no_platform_optin = 1;
			pr_info("IOMMU disabled\n");
		} else if (!strncmp(str, "igfx_off", 8)) {
			dmar_map_gfx = 0;
			pr_info("Disable GFX device mapping\n");
		} else if (!strncmp(str, "forcedac", 8)) {
			pr_info("Forcing DAC for PCI devices\n");
			dmar_forcedac = 1;
		} else if (!strncmp(str, "strict", 6)) {
			pr_info("Disable batched IOTLB flush\n");
			intel_iommu_strict = 1;
		} else if (!strncmp(str, "sp_off", 6)) {
			pr_info("Disable supported super page\n");
			intel_iommu_superpage = 0;
		} else if (!strncmp(str, "sm_on", 5)) {
			pr_info("Intel-IOMMU: scalable mode supported\n");
			intel_iommu_sm = 1;
		} else if (!strncmp(str, "tboot_noforce", 13)) {
			printk(KERN_INFO
				"Intel-IOMMU: not forcing on after tboot. This could expose security risk for tboot\n");
			intel_iommu_tboot_noforce = 1;
		}

		str += strcspn(str, ",");
		while (*str == ',')
			str++;
	}
	return 0;
}
__setup("intel_iommu=", intel_iommu_setup);

static struct kmem_cache *iommu_domain_cache;
static struct kmem_cache *iommu_devinfo_cache;

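/*
 * The per-IOMMU mapping from domain ID to dmar_domain is a two-level table:
 * iommu->domains[did >> 8] points to a 256-entry array that is allocated on
 * demand, and [did & 0xff] selects the domain within it.
 */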
static struct dmar_domain *get_iommu_domain(struct intel_iommu *iommu, u16 did)
{
	struct dmar_domain **domains;
	int idx = did >> 8;

	domains = iommu->domains[idx];
	if (!domains)
		return NULL;

	return domains[did & 0xff];
}

static void set_iommu_domain(struct intel_iommu *iommu, u16 did,
			     struct dmar_domain *domain)
{
	struct dmar_domain **domains;
	int idx = did >> 8;

	if (!iommu->domains[idx]) {
		size_t size = 256 * sizeof(struct dmar_domain *);
		iommu->domains[idx] = kzalloc(size, GFP_ATOMIC);
	}

	domains = iommu->domains[idx];
	if (WARN_ON(!domains))
		return;
	else
		domains[did & 0xff] = domain;
}

void *alloc_pgtable_page(int node)
{
	struct page *page;
	void *vaddr = NULL;

	page = alloc_pages_node(node, GFP_ATOMIC | __GFP_ZERO, 0);
	if (page)
		vaddr = page_address(page);
	return vaddr;
}

void free_pgtable_page(void *vaddr)
{
	free_page((unsigned long)vaddr);
}

static inline void *alloc_domain_mem(void)
{
	return kmem_cache_alloc(iommu_domain_cache, GFP_ATOMIC);
}

static void free_domain_mem(void *vaddr)
{
	kmem_cache_free(iommu_domain_cache, vaddr);
}

static inline void *alloc_devinfo_mem(void)
{
	return kmem_cache_alloc(iommu_devinfo_cache, GFP_ATOMIC);
}

static inline void free_devinfo_mem(void *vaddr)
{
	kmem_cache_free(iommu_devinfo_cache, vaddr);
}

static inline int domain_type_is_vm(struct dmar_domain *domain)
{
	return domain->flags & DOMAIN_FLAG_VIRTUAL_MACHINE;
}

static inline int domain_type_is_si(struct dmar_domain *domain)
{
	return domain->flags & DOMAIN_FLAG_STATIC_IDENTITY;
}

static inline int domain_type_is_vm_or_si(struct dmar_domain *domain)
{
	return domain->flags & (DOMAIN_FLAG_VIRTUAL_MACHINE |
				DOMAIN_FLAG_STATIC_IDENTITY);
}

static inline int domain_pfn_supported(struct dmar_domain *domain,
					unsigned long pfn)
{
	int addr_width = agaw_to_width(domain->agaw) - VTD_PAGE_SHIFT;

	return !(addr_width < BITS_PER_LONG && pfn >> addr_width);
}

static int __iommu_calculate_agaw(struct intel_iommu *iommu, int max_gaw)
{
	unsigned long sagaw;
	int agaw = -1;

	sagaw = cap_sagaw(iommu->cap);
	for (agaw = width_to_agaw(max_gaw);
	     agaw >= 0; agaw--) {
		if (test_bit(agaw, &sagaw))
			break;
	}

	return agaw;
}

/*
 * Calculate max SAGAW for each iommu.
 */
int iommu_calculate_max_sagaw(struct intel_iommu *iommu)
{
	return __iommu_calculate_agaw(iommu, MAX_AGAW_WIDTH);
}

/*
 * Calculate agaw for each iommu.
 * "SAGAW" may be different across iommus, so use a default agaw and fall
 * back to a smaller supported agaw for iommus that don't support the
 * default one.
 */
int iommu_calculate_agaw(struct intel_iommu *iommu)
{
	return __iommu_calculate_agaw(iommu, DEFAULT_DOMAIN_ADDRESS_WIDTH);
}

/* This function only returns the single iommu in a domain */
struct intel_iommu *domain_get_iommu(struct dmar_domain *domain)
{
	int iommu_id;

	/* si_domain and vm domain should not get here. */
	BUG_ON(domain_type_is_vm_or_si(domain));
	for_each_domain_iommu(iommu_id, domain)
		break;

	if (iommu_id < 0 || iommu_id >= g_num_of_iommus)
		return NULL;

	return g_iommus[iommu_id];
}

static void domain_update_iommu_coherency(struct dmar_domain *domain)
{
	struct dmar_drhd_unit *drhd;
	struct intel_iommu *iommu;
	bool found = false;
	int i;

	domain->iommu_coherency = 1;

	for_each_domain_iommu(i, domain) {
		found = true;
		if (!ecap_coherent(g_iommus[i]->ecap)) {
			domain->iommu_coherency = 0;
			break;
		}
	}
	if (found)
		return;

	/* No hardware attached; use lowest common denominator */
	rcu_read_lock();
	for_each_active_iommu(iommu, drhd) {
		if (!ecap_coherent(iommu->ecap)) {
			domain->iommu_coherency = 0;
			break;
		}
	}
	rcu_read_unlock();
}

static int domain_update_iommu_snooping(struct intel_iommu *skip)
{
	struct dmar_drhd_unit *drhd;
	struct intel_iommu *iommu;
	int ret = 1;

	rcu_read_lock();
	for_each_active_iommu(iommu, drhd) {
		if (iommu != skip) {
			if (!ecap_sc_support(iommu->ecap)) {
				ret = 0;
				break;
			}
		}
	}
	rcu_read_unlock();

	return ret;
}

static int domain_update_iommu_superpage(struct intel_iommu *skip)
{
	struct dmar_drhd_unit *drhd;
	struct intel_iommu *iommu;
	int mask = 0xf;

	if (!intel_iommu_superpage) {
		return 0;
	}

	/* set iommu_superpage to the smallest common denominator */
	rcu_read_lock();
	for_each_active_iommu(iommu, drhd) {
		if (iommu != skip) {
			mask &= cap_super_page_val(iommu->cap);
			if (!mask)
				break;
		}
	}
	rcu_read_unlock();

	return fls(mask);
}

/* Some capabilities may be different across iommus */
static void domain_update_iommu_cap(struct dmar_domain *domain)
{
	domain_update_iommu_coherency(domain);
	domain->iommu_snooping = domain_update_iommu_snooping(NULL);
	domain->iommu_superpage = domain_update_iommu_superpage(NULL);
}

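/*
 * Return the context entry for (bus, devfn), optionally allocating the
 * context table on first use. In scalable mode the root entry is split:
 * the low half covers devfn 0-127 and the high half covers devfn 128-255,
 * hence the devfn adjustment and doubling below.
 */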
struct context_entry *iommu_context_addr(struct intel_iommu *iommu, u8 bus,
					 u8 devfn, int alloc)
{
	struct root_entry *root = &iommu->root_entry[bus];
	struct context_entry *context;
	u64 *entry;

	entry = &root->lo;
	if (sm_supported(iommu)) {
		if (devfn >= 0x80) {
			devfn -= 0x80;
			entry = &root->hi;
		}
		devfn *= 2;
	}
	if (*entry & 1)
		context = phys_to_virt(*entry & VTD_PAGE_MASK);
	else {
		unsigned long phy_addr;
		if (!alloc)
			return NULL;

		context = alloc_pgtable_page(iommu->node);
		if (!context)
			return NULL;

		__iommu_flush_cache(iommu, (void *)context, CONTEXT_SIZE);
		phy_addr = virt_to_phys((void *)context);
		*entry = phy_addr | 1;
		__iommu_flush_cache(iommu, entry, sizeof(*entry));
	}
	return &context[devfn];
}

static int iommu_dummy(struct device *dev)
{
	return dev->archdata.iommu == DUMMY_DEVICE_DOMAIN_INFO;
}

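/*
 * Walk the DRHD scope tables to find the IOMMU that covers @dev, and report
 * the (bus, devfn) to use when programming its context entry. For SR-IOV
 * virtual functions the lookup is done via the parent PF, but the VF's own
 * BDF is returned.
 */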
static struct intel_iommu *device_to_iommu(struct device *dev, u8 *bus, u8 *devfn)
{
	struct dmar_drhd_unit *drhd = NULL;
	struct intel_iommu *iommu;
	struct device *tmp;
	struct pci_dev *ptmp, *pdev = NULL;
	u16 segment = 0;
	int i;

	if (iommu_dummy(dev))
		return NULL;

	if (dev_is_pci(dev)) {
		struct pci_dev *pf_pdev;

		pdev = to_pci_dev(dev);

#ifdef CONFIG_X86
		/* VMD child devices currently cannot be handled individually */
		if (is_vmd(pdev->bus))
			return NULL;
#endif

		/* VFs aren't listed in scope tables; we need to look up
		 * the PF instead to find the IOMMU. */
		pf_pdev = pci_physfn(pdev);
		dev = &pf_pdev->dev;
		segment = pci_domain_nr(pdev->bus);
	} else if (has_acpi_companion(dev))
		dev = &ACPI_COMPANION(dev)->dev;

	rcu_read_lock();
	for_each_active_iommu(iommu, drhd) {
		if (pdev && segment != drhd->segment)
			continue;

		for_each_active_dev_scope(drhd->devices,
					  drhd->devices_cnt, i, tmp) {
			if (tmp == dev) {
				/* For a VF use its original BDF# not that of the PF
				 * which we used for the IOMMU lookup. Strictly speaking
				 * we could do this for all PCI devices; we only need to
				 * get the BDF# from the scope table for ACPI matches. */
				if (pdev && pdev->is_virtfn)
					goto got_pdev;

				*bus = drhd->devices[i].bus;
				*devfn = drhd->devices[i].devfn;
				goto out;
			}

			if (!pdev || !dev_is_pci(tmp))
				continue;

			ptmp = to_pci_dev(tmp);
			if (ptmp->subordinate &&
			    ptmp->subordinate->number <= pdev->bus->number &&
			    ptmp->subordinate->busn_res.end >= pdev->bus->number)
				goto got_pdev;
		}

		if (pdev && drhd->include_all) {
		got_pdev:
			*bus = pdev->bus->number;
			*devfn = pdev->devfn;
			goto out;
		}
	}
	iommu = NULL;
 out:
	rcu_read_unlock();

	return iommu;
}

static void domain_flush_cache(struct dmar_domain *domain,
			       void *addr, int size)
{
	if (!domain->iommu_coherency)
		clflush_cache_range(addr, size);
}

static int device_context_mapped(struct intel_iommu *iommu, u8 bus, u8 devfn)
{
	struct context_entry *context;
	int ret = 0;
	unsigned long flags;

	spin_lock_irqsave(&iommu->lock, flags);
	context = iommu_context_addr(iommu, bus, devfn, 0);
	if (context)
		ret = context_present(context);
	spin_unlock_irqrestore(&iommu->lock, flags);
	return ret;
}

static void free_context_table(struct intel_iommu *iommu)
{
	int i;
	unsigned long flags;
	struct context_entry *context;

	spin_lock_irqsave(&iommu->lock, flags);
	if (!iommu->root_entry) {
		goto out;
	}
	for (i = 0; i < ROOT_ENTRY_NR; i++) {
		context = iommu_context_addr(iommu, i, 0, 0);
		if (context)
			free_pgtable_page(context);

		if (!sm_supported(iommu))
			continue;

		context = iommu_context_addr(iommu, i, 0x80, 0);
		if (context)
			free_pgtable_page(context);
	}
	free_pgtable_page(iommu->root_entry);
	iommu->root_entry = NULL;
out:
	spin_unlock_irqrestore(&iommu->lock, flags);
}

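/*
 * Walk the page table for @pfn, allocating missing intermediate tables as
 * we go, and return the PTE at *target_level. If *target_level is 0, stop
 * at the first superpage or non-present entry instead and report the level
 * actually reached back through *target_level.
 */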
static struct dma_pte *pfn_to_dma_pte(struct dmar_domain *domain,
				      unsigned long pfn, int *target_level)
{
	struct dma_pte *parent, *pte;
	int level = agaw_to_level(domain->agaw);
	int offset;

	BUG_ON(!domain->pgd);

	if (!domain_pfn_supported(domain, pfn))
		/* Address beyond IOMMU's addressing capabilities. */
		return NULL;

	parent = domain->pgd;

	while (1) {
		void *tmp_page;

		offset = pfn_level_offset(pfn, level);
		pte = &parent[offset];
		if (!*target_level && (dma_pte_superpage(pte) || !dma_pte_present(pte)))
			break;
		if (level == *target_level)
			break;

		if (!dma_pte_present(pte)) {
			uint64_t pteval;

			tmp_page = alloc_pgtable_page(domain->nid);

			if (!tmp_page)
				return NULL;

			domain_flush_cache(domain, tmp_page, VTD_PAGE_SIZE);
			pteval = ((uint64_t)virt_to_dma_pfn(tmp_page) << VTD_PAGE_SHIFT) | DMA_PTE_READ | DMA_PTE_WRITE;
			if (cmpxchg64(&pte->val, 0ULL, pteval))
				/* Someone else set it while we were thinking; use theirs. */
				free_pgtable_page(tmp_page);
			else
				domain_flush_cache(domain, pte, sizeof(*pte));
		}
		if (level == 1)
			break;

		parent = phys_to_virt(dma_pte_addr(pte));
		level--;
	}

	if (!*target_level)
		*target_level = level;

	return pte;
}

/* return address's pte at specific level */
static struct dma_pte *dma_pfn_level_pte(struct dmar_domain *domain,
					 unsigned long pfn,
					 int level, int *large_page)
{
	struct dma_pte *parent, *pte;
	int total = agaw_to_level(domain->agaw);
	int offset;

	parent = domain->pgd;
	while (level <= total) {
		offset = pfn_level_offset(pfn, total);
		pte = &parent[offset];
		if (level == total)
			return pte;

		if (!dma_pte_present(pte)) {
			*large_page = total;
			break;
		}

		if (dma_pte_superpage(pte)) {
			*large_page = total;
			return pte;
		}

		parent = phys_to_virt(dma_pte_addr(pte));
		total--;
	}
	return NULL;
}

/* clear last level pte, a tlb flush should be followed */
static void dma_pte_clear_range(struct dmar_domain *domain,
				unsigned long start_pfn,
				unsigned long last_pfn)
{
	unsigned int large_page;
	struct dma_pte *first_pte, *pte;

	BUG_ON(!domain_pfn_supported(domain, start_pfn));
	BUG_ON(!domain_pfn_supported(domain, last_pfn));
	BUG_ON(start_pfn > last_pfn);

	/* we don't need lock here; nobody else touches the iova range */
	do {
		large_page = 1;
		first_pte = pte = dma_pfn_level_pte(domain, start_pfn, 1, &large_page);
		if (!pte) {
			start_pfn = align_to_level(start_pfn + 1, large_page + 1);
			continue;
		}
		do {
			dma_clear_pte(pte);
			start_pfn += lvl_to_nr_pages(large_page);
			pte++;
		} while (start_pfn <= last_pfn && !first_pte_in_page(pte));

		domain_flush_cache(domain, first_pte,
				   (void *)pte - (void *)first_pte);

	} while (start_pfn && start_pfn <= last_pfn);
}

static void dma_pte_free_level(struct dmar_domain *domain, int level,
			       int retain_level, struct dma_pte *pte,
			       unsigned long pfn, unsigned long start_pfn,
			       unsigned long last_pfn)
{
	pfn = max(start_pfn, pfn);
	pte = &pte[pfn_level_offset(pfn, level)];

	do {
		unsigned long level_pfn;
		struct dma_pte *level_pte;

		if (!dma_pte_present(pte) || dma_pte_superpage(pte))
			goto next;

		level_pfn = pfn & level_mask(level);
		level_pte = phys_to_virt(dma_pte_addr(pte));

		if (level > 2) {
			dma_pte_free_level(domain, level - 1, retain_level,
					   level_pte, level_pfn, start_pfn,
					   last_pfn);
		}

		/*
		 * Free the page table if we're below the level we want to
		 * retain and the range covers the entire table.
		 */
		if (level < retain_level && !(start_pfn > level_pfn ||
		      last_pfn < level_pfn + level_size(level) - 1)) {
			dma_clear_pte(pte);
			domain_flush_cache(domain, pte, sizeof(*pte));
			free_pgtable_page(level_pte);
		}
next:
		pfn += level_size(level);
	} while (!first_pte_in_page(++pte) && pfn <= last_pfn);
}

/*
 * clear last level (leaf) ptes and free page table pages below the
 * level we wish to keep intact.
 */
static void dma_pte_free_pagetable(struct dmar_domain *domain,
				   unsigned long start_pfn,
				   unsigned long last_pfn,
				   int retain_level)
{
	BUG_ON(!domain_pfn_supported(domain, start_pfn));
	BUG_ON(!domain_pfn_supported(domain, last_pfn));
	BUG_ON(start_pfn > last_pfn);

	dma_pte_clear_range(domain, start_pfn, last_pfn);

	/* We don't need lock here; nobody else touches the iova range */
	dma_pte_free_level(domain, agaw_to_level(domain->agaw), retain_level,
			   domain->pgd, 0, start_pfn, last_pfn);

	/* free pgd */
	if (start_pfn == 0 && last_pfn == DOMAIN_MAX_PFN(domain->gaw)) {
		free_pgtable_page(domain->pgd);
		domain->pgd = NULL;
	}
}

/* When a page at a given level is being unlinked from its parent, we don't
   need to *modify* it at all. All we need to do is make a list of all the
   pages which can be freed just as soon as we've flushed the IOTLB and we
   know the hardware page-walk will no longer touch them.
   The 'pte' argument is the *parent* PTE, pointing to the page that is to
   be freed. */
static struct page *dma_pte_list_pagetables(struct dmar_domain *domain,
					    int level, struct dma_pte *pte,
					    struct page *freelist)
{
	struct page *pg;

	pg = pfn_to_page(dma_pte_addr(pte) >> PAGE_SHIFT);
	pg->freelist = freelist;
	freelist = pg;

	if (level == 1)
		return freelist;

	pte = page_address(pg);
	do {
		if (dma_pte_present(pte) && !dma_pte_superpage(pte))
			freelist = dma_pte_list_pagetables(domain, level - 1,
							   pte, freelist);
		pte++;
	} while (!first_pte_in_page(pte));

	return freelist;
}

static struct page *dma_pte_clear_level(struct dmar_domain *domain, int level,
					struct dma_pte *pte, unsigned long pfn,
					unsigned long start_pfn,
					unsigned long last_pfn,
					struct page *freelist)
{
	struct dma_pte *first_pte = NULL, *last_pte = NULL;

	pfn = max(start_pfn, pfn);
	pte = &pte[pfn_level_offset(pfn, level)];

	do {
		unsigned long level_pfn;

		if (!dma_pte_present(pte))
			goto next;

		level_pfn = pfn & level_mask(level);

		/* If range covers entire pagetable, free it */
		if (start_pfn <= level_pfn &&
		    last_pfn >= level_pfn + level_size(level) - 1) {
			/* These subordinate page tables are going away entirely. Don't
			   bother to clear them; we're just going to *free* them. */
			if (level > 1 && !dma_pte_superpage(pte))
				freelist = dma_pte_list_pagetables(domain, level - 1, pte, freelist);

			dma_clear_pte(pte);
			if (!first_pte)
				first_pte = pte;
			last_pte = pte;
		} else if (level > 1) {
			/* Recurse down into a level that isn't *entirely* obsolete */
			freelist = dma_pte_clear_level(domain, level - 1,
						       phys_to_virt(dma_pte_addr(pte)),
						       level_pfn, start_pfn, last_pfn,
						       freelist);
		}
next:
		pfn += level_size(level);
	} while (!first_pte_in_page(++pte) && pfn <= last_pfn);

	if (first_pte)
		domain_flush_cache(domain, first_pte,
				   (void *)++last_pte - (void *)first_pte);

	return freelist;
}

/* We can't just free the pages because the IOMMU may still be walking
   the page tables, and may have cached the intermediate levels. The
   pages can only be freed after the IOTLB flush has been done. */
static struct page *domain_unmap(struct dmar_domain *domain,
				 unsigned long start_pfn,
				 unsigned long last_pfn)
{
	struct page *freelist;

	BUG_ON(!domain_pfn_supported(domain, start_pfn));
	BUG_ON(!domain_pfn_supported(domain, last_pfn));
	BUG_ON(start_pfn > last_pfn);

	/* we don't need lock here; nobody else touches the iova range */
	freelist = dma_pte_clear_level(domain, agaw_to_level(domain->agaw),
				       domain->pgd, 0, start_pfn, last_pfn, NULL);

	/* free pgd */
	if (start_pfn == 0 && last_pfn == DOMAIN_MAX_PFN(domain->gaw)) {
		struct page *pgd_page = virt_to_page(domain->pgd);
		pgd_page->freelist = freelist;
		freelist = pgd_page;

		domain->pgd = NULL;
	}

	return freelist;
}

static void dma_free_pagelist(struct page *freelist)
{
	struct page *pg;

	while ((pg = freelist)) {
		freelist = pg->freelist;
		free_pgtable_page(page_address(pg));
	}
}

static void iova_entry_free(unsigned long data)
{
	struct page *freelist = (struct page *)data;

	dma_free_pagelist(freelist);
}

/* iommu handling */
static int iommu_alloc_root_entry(struct intel_iommu *iommu)
{
	struct root_entry *root;
	unsigned long flags;

	root = (struct root_entry *)alloc_pgtable_page(iommu->node);
	if (!root) {
		pr_err("Allocating root entry for %s failed\n",
			iommu->name);
		return -ENOMEM;
	}

	__iommu_flush_cache(iommu, root, ROOT_SIZE);

	spin_lock_irqsave(&iommu->lock, flags);
	iommu->root_entry = root;
	spin_unlock_irqrestore(&iommu->lock, flags);

	return 0;
}

static void iommu_set_root_entry(struct intel_iommu *iommu)
{
	u64 addr;
	u32 sts;
	unsigned long flag;

	addr = virt_to_phys(iommu->root_entry);
	if (sm_supported(iommu))
		addr |= DMA_RTADDR_SMT;

	raw_spin_lock_irqsave(&iommu->register_lock, flag);
	dmar_writeq(iommu->reg + DMAR_RTADDR_REG, addr);

	writel(iommu->gcmd | DMA_GCMD_SRTP, iommu->reg + DMAR_GCMD_REG);

	/* Make sure hardware complete it */
	IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
		      readl, (sts & DMA_GSTS_RTPS), sts);

	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
}

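/*
 * Force the IOMMU to flush its internal write buffer so that updated
 * in-memory structures become visible to it. Only needed on hardware that
 * reports the RWBF capability (or is covered by the rwbf quirk).
 */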
void iommu_flush_write_buffer(struct intel_iommu *iommu)
{
	u32 val;
	unsigned long flag;

	if (!rwbf_quirk && !cap_rwbf(iommu->cap))
		return;

	raw_spin_lock_irqsave(&iommu->register_lock, flag);
	writel(iommu->gcmd | DMA_GCMD_WBF, iommu->reg + DMAR_GCMD_REG);

	/* Make sure hardware complete it */
	IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
		      readl, (!(val & DMA_GSTS_WBFS)), val);

	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
}

/* return value determines whether we need a write buffer flush */
static void __iommu_flush_context(struct intel_iommu *iommu,
				  u16 did, u16 source_id, u8 function_mask,
				  u64 type)
{
	u64 val = 0;
	unsigned long flag;

	switch (type) {
	case DMA_CCMD_GLOBAL_INVL:
		val = DMA_CCMD_GLOBAL_INVL;
		break;
	case DMA_CCMD_DOMAIN_INVL:
		val = DMA_CCMD_DOMAIN_INVL|DMA_CCMD_DID(did);
		break;
	case DMA_CCMD_DEVICE_INVL:
		val = DMA_CCMD_DEVICE_INVL|DMA_CCMD_DID(did)
			| DMA_CCMD_SID(source_id) | DMA_CCMD_FM(function_mask);
		break;
	default:
		BUG();
	}
	val |= DMA_CCMD_ICC;

	raw_spin_lock_irqsave(&iommu->register_lock, flag);
	dmar_writeq(iommu->reg + DMAR_CCMD_REG, val);

	/* Make sure hardware complete it */
	IOMMU_WAIT_OP(iommu, DMAR_CCMD_REG,
		      dmar_readq, (!(val & DMA_CCMD_ICC)), val);

	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
}

Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001270/* return value determine if we need a write buffer flush */
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01001271static void __iommu_flush_iotlb(struct intel_iommu *iommu, u16 did,
1272 u64 addr, unsigned int size_order, u64 type)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001273{
1274 int tlb_offset = ecap_iotlb_offset(iommu->ecap);
1275 u64 val = 0, val_iva = 0;
1276 unsigned long flag;
1277
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001278 switch (type) {
1279 case DMA_TLB_GLOBAL_FLUSH:
1280 /* global flush doesn't need set IVA_REG */
1281 val = DMA_TLB_GLOBAL_FLUSH|DMA_TLB_IVT;
1282 break;
1283 case DMA_TLB_DSI_FLUSH:
1284 val = DMA_TLB_DSI_FLUSH|DMA_TLB_IVT|DMA_TLB_DID(did);
1285 break;
1286 case DMA_TLB_PSI_FLUSH:
1287 val = DMA_TLB_PSI_FLUSH|DMA_TLB_IVT|DMA_TLB_DID(did);
David Woodhouseea8ea462014-03-05 17:09:32 +00001288 /* IH bit is passed in as part of address */
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001289 val_iva = size_order | addr;
1290 break;
1291 default:
1292 BUG();
1293 }
1294 /* Note: set drain read/write */
1295#if 0
1296 /*
1297 * This is probably to be super secure.. Looks like we can
1298 * ignore it without any impact.
1299 */
1300 if (cap_read_drain(iommu->cap))
1301 val |= DMA_TLB_READ_DRAIN;
1302#endif
1303 if (cap_write_drain(iommu->cap))
1304 val |= DMA_TLB_WRITE_DRAIN;
1305
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001306 raw_spin_lock_irqsave(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001307 /* Note: Only uses first TLB reg currently */
1308 if (val_iva)
1309 dmar_writeq(iommu->reg + tlb_offset, val_iva);
1310 dmar_writeq(iommu->reg + tlb_offset + 8, val);
1311
1312 /* Make sure hardware complete it */
1313 IOMMU_WAIT_OP(iommu, tlb_offset + 8,
1314 dmar_readq, (!(val & DMA_TLB_IVT)), val);
1315
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001316 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001317
1318 /* check IOTLB invalidation granularity */
1319 if (DMA_TLB_IAIG(val) == 0)
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001320 pr_err("Flush IOTLB failed\n");
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001321 if (DMA_TLB_IAIG(val) != DMA_TLB_IIRG(type))
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001322 pr_debug("TLB flush request %Lx, actual %Lx\n",
Fenghua Yu5b6985c2008-10-16 18:02:32 -07001323 (unsigned long long)DMA_TLB_IIRG(type),
1324 (unsigned long long)DMA_TLB_IAIG(val));
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001325}
1326
static struct device_domain_info *
iommu_support_dev_iotlb(struct dmar_domain *domain, struct intel_iommu *iommu,
			u8 bus, u8 devfn)
{
	struct device_domain_info *info;

	assert_spin_locked(&device_domain_lock);

	if (!iommu->qi)
		return NULL;

	list_for_each_entry(info, &domain->devices, link)
		if (info->iommu == iommu && info->bus == bus &&
		    info->devfn == devfn) {
			if (info->ats_supported && info->dev)
				return info;
			break;
		}

	return NULL;
}

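/*
 * Recompute domain->has_iotlb_device: true if any device attached to
 * the domain currently has ATS (device-IOTLB) enabled.
 */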
static void domain_update_iotlb(struct dmar_domain *domain)
{
	struct device_domain_info *info;
	bool has_iotlb_device = false;

	assert_spin_locked(&device_domain_lock);

	list_for_each_entry(info, &domain->devices, link) {
		struct pci_dev *pdev;

		if (!info->dev || !dev_is_pci(info->dev))
			continue;

		pdev = to_pci_dev(info->dev);
		if (pdev->ats_enabled) {
			has_iotlb_device = true;
			break;
		}
	}

	domain->has_iotlb_device = has_iotlb_device;
}

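/*
 * Enable the per-device DMA features (PASID, PRI, ATS) for a PCI
 * device where supported and permitted, and record the PFSID used for
 * device-IOTLB invalidation throttling.
 */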
static void iommu_enable_dev_iotlb(struct device_domain_info *info)
{
	struct pci_dev *pdev;

	assert_spin_locked(&device_domain_lock);

	if (!info || !dev_is_pci(info->dev))
		return;

	pdev = to_pci_dev(info->dev);
	/* For IOMMU that supports device IOTLB throttling (DIT), we assign
	 * PFSID to the invalidation desc of a VF such that IOMMU HW can gauge
	 * queue depth at PF level. If DIT is not set, PFSID will be treated as
	 * reserved, which should be set to 0.
	 */
	if (!ecap_dit(info->iommu->ecap))
		info->pfsid = 0;
	else {
		struct pci_dev *pf_pdev;

		/* pdev will be returned if device is not a vf */
		pf_pdev = pci_physfn(pdev);
		info->pfsid = PCI_DEVID(pf_pdev->bus->number, pf_pdev->devfn);
	}

#ifdef CONFIG_INTEL_IOMMU_SVM
	/* The PCIe spec, in its wisdom, declares that the behaviour of
	   the device if you enable PASID support after ATS support is
	   undefined. So always enable PASID support on devices which
	   have it, even if we can't yet know if we're ever going to
	   use it. */
	if (info->pasid_supported && !pci_enable_pasid(pdev, info->pasid_supported & ~1))
		info->pasid_enabled = 1;

	if (info->pri_supported &&
	    (info->pasid_enabled ? pci_prg_resp_pasid_required(pdev) : 1) &&
	    !pci_reset_pri(pdev) && !pci_enable_pri(pdev, 32))
		info->pri_enabled = 1;
#endif
	if (!pdev->untrusted && info->ats_supported &&
	    pci_ats_page_aligned(pdev) &&
	    !pci_enable_ats(pdev, VTD_PAGE_SHIFT)) {
		info->ats_enabled = 1;
		domain_update_iotlb(info->domain);
		info->ats_qdep = pci_ats_queue_depth(pdev);
	}
}

static void iommu_disable_dev_iotlb(struct device_domain_info *info)
{
	struct pci_dev *pdev;

	assert_spin_locked(&device_domain_lock);

	if (!dev_is_pci(info->dev))
		return;

	pdev = to_pci_dev(info->dev);

	if (info->ats_enabled) {
		pci_disable_ats(pdev);
		info->ats_enabled = 0;
		domain_update_iotlb(info->domain);
	}
#ifdef CONFIG_INTEL_IOMMU_SVM
	if (info->pri_enabled) {
		pci_disable_pri(pdev);
		info->pri_enabled = 0;
	}
	if (info->pasid_enabled) {
		pci_disable_pasid(pdev);
		info->pasid_enabled = 0;
	}
#endif
}

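/*
 * Issue device-IOTLB (ATS) invalidations, covering the given
 * address/mask range, for every ATS-enabled device in the domain.
 */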
static void iommu_flush_dev_iotlb(struct dmar_domain *domain,
				  u64 addr, unsigned mask)
{
	u16 sid, qdep;
	unsigned long flags;
	struct device_domain_info *info;

	if (!domain->has_iotlb_device)
		return;

	spin_lock_irqsave(&device_domain_lock, flags);
	list_for_each_entry(info, &domain->devices, link) {
		if (!info->ats_enabled)
			continue;

		sid = info->bus << 8 | info->devfn;
		qdep = info->ats_qdep;
		qi_flush_dev_iotlb(info->iommu, sid, info->pfsid,
				   qdep, addr, mask);
	}
	spin_unlock_irqrestore(&device_domain_lock, flags);
}

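/*
 * Flush the IOTLB for a range of pages in a domain, using a
 * page-selective invalidation when the hardware supports one of the
 * requested size, and falling back to a domain-selective flush
 * otherwise.
 */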
static void iommu_flush_iotlb_psi(struct intel_iommu *iommu,
				  struct dmar_domain *domain,
				  unsigned long pfn, unsigned int pages,
				  int ih, int map)
{
	unsigned int mask = ilog2(__roundup_pow_of_two(pages));
	uint64_t addr = (uint64_t)pfn << VTD_PAGE_SHIFT;
	u16 did = domain->iommu_did[iommu->seq_id];

	BUG_ON(pages == 0);

	if (ih)
		ih = 1 << 6;
	/*
	 * Fallback to domain selective flush if no PSI support or the size is
	 * too big.
	 * PSI requires page size to be 2 ^ x, and the base address is naturally
	 * aligned to the size
	 */
	if (!cap_pgsel_inv(iommu->cap) || mask > cap_max_amask_val(iommu->cap))
		iommu->flush.flush_iotlb(iommu, did, 0, 0,
					 DMA_TLB_DSI_FLUSH);
	else
		iommu->flush.flush_iotlb(iommu, did, addr | ih, mask,
					 DMA_TLB_PSI_FLUSH);

	/*
	 * In caching mode, changes of pages from non-present to present require
	 * flush. However, device IOTLB doesn't need to be flushed in this case.
	 */
	if (!cap_caching_mode(iommu->cap) || !map)
		iommu_flush_dev_iotlb(domain, addr, mask);
}

/* Notification for newly created mappings */
static inline void __mapping_notify_one(struct intel_iommu *iommu,
					struct dmar_domain *domain,
					unsigned long pfn, unsigned int pages)
{
	/* It's a non-present to present mapping. Only flush if caching mode */
	if (cap_caching_mode(iommu->cap))
		iommu_flush_iotlb_psi(iommu, domain, pfn, pages, 0, 1);
	else
		iommu_flush_write_buffer(iommu);
}

static void iommu_flush_iova(struct iova_domain *iovad)
{
	struct dmar_domain *domain;
	int idx;

	domain = container_of(iovad, struct dmar_domain, iovad);

	for_each_domain_iommu(idx, domain) {
		struct intel_iommu *iommu = g_iommus[idx];
		u16 did = domain->iommu_did[iommu->seq_id];

		iommu->flush.flush_iotlb(iommu, did, 0, 0, DMA_TLB_DSI_FLUSH);

		if (!cap_caching_mode(iommu->cap))
			iommu_flush_dev_iotlb(get_iommu_domain(iommu, did),
					      0, MAX_AGAW_PFN_WIDTH);
	}
}

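/*
 * Clear the Enable Protected Memory bit so DMA to the protected
 * low/high memory regions is no longer blocked, and wait for the
 * protected region status to clear.
 */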
static void iommu_disable_protect_mem_regions(struct intel_iommu *iommu)
{
	u32 pmen;
	unsigned long flags;

	raw_spin_lock_irqsave(&iommu->register_lock, flags);
	pmen = readl(iommu->reg + DMAR_PMEN_REG);
	pmen &= ~DMA_PMEN_EPM;
	writel(pmen, iommu->reg + DMAR_PMEN_REG);

	/* wait for the protected region status bit to clear */
	IOMMU_WAIT_OP(iommu, DMAR_PMEN_REG,
		      readl, !(pmen & DMA_PMEN_PRS), pmen);

	raw_spin_unlock_irqrestore(&iommu->register_lock, flags);
}

static void iommu_enable_translation(struct intel_iommu *iommu)
{
	u32 sts;
	unsigned long flags;

	raw_spin_lock_irqsave(&iommu->register_lock, flags);
	iommu->gcmd |= DMA_GCMD_TE;
	writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG);

	/* Make sure hardware complete it */
	IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
		      readl, (sts & DMA_GSTS_TES), sts);

	raw_spin_unlock_irqrestore(&iommu->register_lock, flags);
}

static void iommu_disable_translation(struct intel_iommu *iommu)
{
	u32 sts;
	unsigned long flag;

	raw_spin_lock_irqsave(&iommu->register_lock, flag);
	iommu->gcmd &= ~DMA_GCMD_TE;
	writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG);

	/* Make sure hardware complete it */
	IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
		      readl, (!(sts & DMA_GSTS_TES)), sts);

	raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
}

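/*
 * Allocate the per-IOMMU domain-id bitmap and the two-level array of
 * domain pointers, and reserve the domain ids that must never be
 * handed out to ordinary domains.
 */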
static int iommu_init_domains(struct intel_iommu *iommu)
{
	u32 ndomains, nlongs;
	size_t size;

	ndomains = cap_ndoms(iommu->cap);
	pr_debug("%s: Number of Domains supported <%d>\n",
		 iommu->name, ndomains);
	nlongs = BITS_TO_LONGS(ndomains);

	spin_lock_init(&iommu->lock);

	iommu->domain_ids = kcalloc(nlongs, sizeof(unsigned long), GFP_KERNEL);
	if (!iommu->domain_ids) {
		pr_err("%s: Allocating domain id array failed\n",
		       iommu->name);
		return -ENOMEM;
	}

	size = (ALIGN(ndomains, 256) >> 8) * sizeof(struct dmar_domain **);
	iommu->domains = kzalloc(size, GFP_KERNEL);

	if (iommu->domains) {
		size = 256 * sizeof(struct dmar_domain *);
		iommu->domains[0] = kzalloc(size, GFP_KERNEL);
	}

	if (!iommu->domains || !iommu->domains[0]) {
		pr_err("%s: Allocating domain array failed\n",
		       iommu->name);
		kfree(iommu->domain_ids);
		kfree(iommu->domains);
		iommu->domain_ids = NULL;
		iommu->domains = NULL;
		return -ENOMEM;
	}

	/*
	 * If Caching mode is set, then invalid translations are tagged
	 * with domain-id 0, hence we need to pre-allocate it. We also
	 * use domain-id 0 as a marker for non-allocated domain-id, so
	 * make sure it is not used for a real domain.
	 */
	set_bit(0, iommu->domain_ids);

	/*
	 * Vt-d spec rev3.0 (section 6.2.3.1) requires that each pasid
	 * entry for first-level or pass-through translation modes should
	 * be programmed with a domain id different from those used for
	 * second-level or nested translation. We reserve a domain id for
	 * this purpose.
	 */
	if (sm_supported(iommu))
		set_bit(FLPT_DEFAULT_DID, iommu->domain_ids);

	return 0;
}

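/*
 * Detach every device that reaches memory through this IOMMU and, if
 * translation is currently enabled, turn it off.
 */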
static void disable_dmar_iommu(struct intel_iommu *iommu)
{
	struct device_domain_info *info, *tmp;
	unsigned long flags;

	if (!iommu->domains || !iommu->domain_ids)
		return;

again:
	spin_lock_irqsave(&device_domain_lock, flags);
	list_for_each_entry_safe(info, tmp, &device_domain_list, global) {
		struct dmar_domain *domain;

		if (info->iommu != iommu)
			continue;

		if (!info->dev || !info->domain)
			continue;

		domain = info->domain;

		__dmar_remove_one_dev_info(info);

		if (!domain_type_is_vm_or_si(domain)) {
			/*
			 * The domain_exit() function can't be called under
			 * device_domain_lock, as it takes this lock itself.
			 * So release the lock here and re-run the loop
			 * afterwards.
			 */
			spin_unlock_irqrestore(&device_domain_lock, flags);
			domain_exit(domain);
			goto again;
		}
	}
	spin_unlock_irqrestore(&device_domain_lock, flags);

	if (iommu->gcmd & DMA_GCMD_TE)
		iommu_disable_translation(iommu);
}

static void free_dmar_iommu(struct intel_iommu *iommu)
{
	if ((iommu->domains) && (iommu->domain_ids)) {
		int elems = ALIGN(cap_ndoms(iommu->cap), 256) >> 8;
		int i;

		for (i = 0; i < elems; i++)
			kfree(iommu->domains[i]);
		kfree(iommu->domains);
		kfree(iommu->domain_ids);
		iommu->domains = NULL;
		iommu->domain_ids = NULL;
	}

	g_iommus[iommu->seq_id] = NULL;

	/* free context mapping */
	free_context_table(iommu);

#ifdef CONFIG_INTEL_IOMMU_SVM
	if (pasid_supported(iommu)) {
		if (ecap_prs(iommu->ecap))
			intel_svm_finish_prq(iommu);
	}
#endif
}

static struct dmar_domain *alloc_domain(int flags)
{
	struct dmar_domain *domain;

	domain = alloc_domain_mem();
	if (!domain)
		return NULL;

	memset(domain, 0, sizeof(*domain));
	domain->nid = NUMA_NO_NODE;
	domain->flags = flags;
	domain->has_iotlb_device = false;
	INIT_LIST_HEAD(&domain->devices);

	return domain;
}

/* Must be called with iommu->lock */
static int domain_attach_iommu(struct dmar_domain *domain,
			       struct intel_iommu *iommu)
{
	unsigned long ndomains;
	int num;

	assert_spin_locked(&device_domain_lock);
	assert_spin_locked(&iommu->lock);

	domain->iommu_refcnt[iommu->seq_id] += 1;
	domain->iommu_count += 1;
	if (domain->iommu_refcnt[iommu->seq_id] == 1) {
		ndomains = cap_ndoms(iommu->cap);
		num = find_first_zero_bit(iommu->domain_ids, ndomains);

		if (num >= ndomains) {
			pr_err("%s: No free domain ids\n", iommu->name);
			domain->iommu_refcnt[iommu->seq_id] -= 1;
			domain->iommu_count -= 1;
			return -ENOSPC;
		}

		set_bit(num, iommu->domain_ids);
		set_iommu_domain(iommu, num, domain);

		domain->iommu_did[iommu->seq_id] = num;
		domain->nid = iommu->node;

		domain_update_iommu_cap(domain);
	}

	return 0;
}

static int domain_detach_iommu(struct dmar_domain *domain,
			       struct intel_iommu *iommu)
{
	int num, count;

	assert_spin_locked(&device_domain_lock);
	assert_spin_locked(&iommu->lock);

	domain->iommu_refcnt[iommu->seq_id] -= 1;
	count = --domain->iommu_count;
	if (domain->iommu_refcnt[iommu->seq_id] == 0) {
		num = domain->iommu_did[iommu->seq_id];
		clear_bit(num, iommu->domain_ids);
		set_iommu_domain(iommu, num, NULL);

		domain_update_iommu_cap(domain);
		domain->iommu_did[iommu->seq_id] = 0;
	}

	return count;
}

static struct iova_domain reserved_iova_list;
static struct lock_class_key reserved_rbtree_key;

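/*
 * Reserve IOVA ranges that must never be handed out for DMA: the
 * IOAPIC MMIO window and every PCI MMIO resource, so that mappings
 * never alias device MMIO (peer-to-peer) addresses.
 */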
static int dmar_init_reserved_ranges(void)
{
	struct pci_dev *pdev = NULL;
	struct iova *iova;
	int i;

	init_iova_domain(&reserved_iova_list, VTD_PAGE_SIZE, IOVA_START_PFN);

	lockdep_set_class(&reserved_iova_list.iova_rbtree_lock,
			  &reserved_rbtree_key);

	/* IOAPIC ranges shouldn't be accessed by DMA */
	iova = reserve_iova(&reserved_iova_list, IOVA_PFN(IOAPIC_RANGE_START),
			    IOVA_PFN(IOAPIC_RANGE_END));
	if (!iova) {
		pr_err("Reserve IOAPIC range failed\n");
		return -ENODEV;
	}

	/* Reserve all PCI MMIO to avoid peer-to-peer access */
	for_each_pci_dev(pdev) {
		struct resource *r;

		for (i = 0; i < PCI_NUM_RESOURCES; i++) {
			r = &pdev->resource[i];
			if (!r->flags || !(r->flags & IORESOURCE_MEM))
				continue;
			iova = reserve_iova(&reserved_iova_list,
					    IOVA_PFN(r->start),
					    IOVA_PFN(r->end));
			if (!iova) {
				pci_err(pdev, "Reserve iova for %pR failed\n", r);
				return -ENODEV;
			}
		}
	}
	return 0;
}

static void domain_reserve_special_ranges(struct dmar_domain *domain)
{
	copy_reserved_iova(&reserved_iova_list, &domain->iovad);
}

static inline int guestwidth_to_adjustwidth(int gaw)
{
	int agaw;
	int r = (gaw - 12) % 9;

	if (r == 0)
		agaw = gaw;
	else
		agaw = gaw + 9 - r;
	if (agaw > 64)
		agaw = 64;
	return agaw;
}

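/*
 * Initialize a freshly allocated domain: set up its IOVA allocator and
 * flush queue, pick an AGAW the IOMMU supports, record
 * capability-derived attributes and allocate the top-level page table.
 */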
static int domain_init(struct dmar_domain *domain, struct intel_iommu *iommu,
		       int guest_width)
{
	int adjust_width, agaw;
	unsigned long sagaw;
	int err;

	init_iova_domain(&domain->iovad, VTD_PAGE_SIZE, IOVA_START_PFN);

	err = init_iova_flush_queue(&domain->iovad,
				    iommu_flush_iova, iova_entry_free);
	if (err)
		return err;

	domain_reserve_special_ranges(domain);

	/* calculate AGAW */
	if (guest_width > cap_mgaw(iommu->cap))
		guest_width = cap_mgaw(iommu->cap);
	domain->gaw = guest_width;
	adjust_width = guestwidth_to_adjustwidth(guest_width);
	agaw = width_to_agaw(adjust_width);
	sagaw = cap_sagaw(iommu->cap);
	if (!test_bit(agaw, &sagaw)) {
		/* hardware doesn't support it, choose a bigger one */
		pr_debug("Hardware doesn't support agaw %d\n", agaw);
		agaw = find_next_bit(&sagaw, 5, agaw);
		if (agaw >= 5)
			return -ENODEV;
	}
	domain->agaw = agaw;

	if (ecap_coherent(iommu->ecap))
		domain->iommu_coherency = 1;
	else
		domain->iommu_coherency = 0;

	if (ecap_sc_support(iommu->ecap))
		domain->iommu_snooping = 1;
	else
		domain->iommu_snooping = 0;

	if (intel_iommu_superpage)
		domain->iommu_superpage = fls(cap_super_page_val(iommu->cap));
	else
		domain->iommu_superpage = 0;

	domain->nid = iommu->node;

	/* always allocate the top pgd */
	domain->pgd = (struct dma_pte *)alloc_pgtable_page(domain->nid);
	if (!domain->pgd)
		return -ENOMEM;
	__iommu_flush_cache(iommu, domain->pgd, PAGE_SIZE);
	return 0;
}

static void domain_exit(struct dmar_domain *domain)
{
	struct page *freelist;

	/* Remove associated devices and clear attached or cached domains */
	rcu_read_lock();
	domain_remove_dev_info(domain);
	rcu_read_unlock();

	/* destroy iovas */
	put_iova_domain(&domain->iovad);

	freelist = domain_unmap(domain, 0, DOMAIN_MAX_PFN(domain->gaw));

	dma_free_pagelist(freelist);

	free_domain_mem(domain);
}

/*
 * Get the PASID directory size for scalable mode context entry.
 * Value of X in the PDTS field of a scalable mode context entry
 * indicates PASID directory with 2^(X + 7) entries.
 */
static inline unsigned long context_get_sm_pds(struct pasid_table *table)
{
	int pds, max_pde;

	max_pde = table->max_pasid >> PASID_PDE_SHIFT;
	pds = find_first_bit((unsigned long *)&max_pde, MAX_NR_PASID_BITS);
	if (pds < 7)
		return 0;

	return pds - 7;
}

/*
 * Set the RID_PASID field of a scalable mode context entry. The
 * IOMMU hardware will use the PASID value set in this field for
 * DMA translations of DMA requests without PASID.
 */
static inline void
context_set_sm_rid2pasid(struct context_entry *context, unsigned long pasid)
{
	context->hi |= pasid & ((1 << 20) - 1);
	context->hi |= (1 << 20);
}

/*
 * Set the DTE(Device-TLB Enable) field of a scalable mode context
 * entry.
 */
static inline void context_set_sm_dte(struct context_entry *context)
{
	context->lo |= (1 << 2);
}

/*
 * Set the PRE(Page Request Enable) field of a scalable mode context
 * entry.
 */
static inline void context_set_sm_pre(struct context_entry *context)
{
	context->lo |= (1 << 4);
}

/* Convert value to context PASID directory size field coding. */
#define context_pdts(pds)	(((pds) & 0x7) << 9)

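/*
 * Install the context entry for one (bus, devfn) and flush the caches
 * as required. In scalable mode the entry points at the PASID
 * directory; in legacy mode it points at the second-level page table
 * (or selects pass-through).
 */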
static int domain_context_mapping_one(struct dmar_domain *domain,
				      struct intel_iommu *iommu,
				      struct pasid_table *table,
				      u8 bus, u8 devfn)
{
	u16 did = domain->iommu_did[iommu->seq_id];
	int translation = CONTEXT_TT_MULTI_LEVEL;
	struct device_domain_info *info = NULL;
	struct context_entry *context;
	unsigned long flags;
	int ret;

	WARN_ON(did == 0);

	if (hw_pass_through && domain_type_is_si(domain))
		translation = CONTEXT_TT_PASS_THROUGH;

	pr_debug("Set context mapping for %02x:%02x.%d\n",
		 bus, PCI_SLOT(devfn), PCI_FUNC(devfn));

	BUG_ON(!domain->pgd);

	spin_lock_irqsave(&device_domain_lock, flags);
	spin_lock(&iommu->lock);

	ret = -ENOMEM;
	context = iommu_context_addr(iommu, bus, devfn, 1);
	if (!context)
		goto out_unlock;

	ret = 0;
	if (context_present(context))
		goto out_unlock;

	/*
	 * For kdump cases, old valid entries may be cached due to the
	 * in-flight DMA and copied pgtable, but there is no unmapping
	 * behaviour for them, thus we need an explicit cache flush for
	 * the newly-mapped device. For kdump, at this point, the device
	 * is supposed to finish reset at its driver probe stage, so no
	 * in-flight DMA will exist, and we don't need to worry anymore
	 * hereafter.
	 */
	if (context_copied(context)) {
		u16 did_old = context_domain_id(context);

		if (did_old < cap_ndoms(iommu->cap)) {
			iommu->flush.flush_context(iommu, did_old,
						   (((u16)bus) << 8) | devfn,
						   DMA_CCMD_MASK_NOBIT,
						   DMA_CCMD_DEVICE_INVL);
			iommu->flush.flush_iotlb(iommu, did_old, 0, 0,
						 DMA_TLB_DSI_FLUSH);
		}
	}

	context_clear_entry(context);

	if (sm_supported(iommu)) {
		unsigned long pds;

		WARN_ON(!table);

		/* Setup the PASID DIR pointer: */
		pds = context_get_sm_pds(table);
		context->lo = (u64)virt_to_phys(table->table) |
				context_pdts(pds);

		/* Setup the RID_PASID field: */
		context_set_sm_rid2pasid(context, PASID_RID2PASID);

		/*
		 * Setup the Device-TLB enable bit and Page request
		 * Enable bit:
		 */
		info = iommu_support_dev_iotlb(domain, iommu, bus, devfn);
		if (info && info->ats_supported)
			context_set_sm_dte(context);
		if (info && info->pri_supported)
			context_set_sm_pre(context);
	} else {
		struct dma_pte *pgd = domain->pgd;
		int agaw;

		context_set_domain_id(context, did);

		if (translation != CONTEXT_TT_PASS_THROUGH) {
			/*
			 * Skip top levels of page tables for iommu which has
			 * less agaw than default. Unnecessary for PT mode.
			 */
			for (agaw = domain->agaw; agaw > iommu->agaw; agaw--) {
				ret = -ENOMEM;
				pgd = phys_to_virt(dma_pte_addr(pgd));
				if (!dma_pte_present(pgd))
					goto out_unlock;
			}

			info = iommu_support_dev_iotlb(domain, iommu, bus, devfn);
			if (info && info->ats_supported)
				translation = CONTEXT_TT_DEV_IOTLB;
			else
				translation = CONTEXT_TT_MULTI_LEVEL;

			context_set_address_root(context, virt_to_phys(pgd));
			context_set_address_width(context, agaw);
		} else {
			/*
			 * In pass through mode, AW must be programmed to
			 * indicate the largest AGAW value supported by
			 * hardware. And ASR is ignored by hardware.
			 */
			context_set_address_width(context, iommu->msagaw);
		}

		context_set_translation_type(context, translation);
	}

	context_set_fault_enable(context);
	context_set_present(context);
	domain_flush_cache(domain, context, sizeof(*context));

	/*
	 * It's a non-present to present mapping. If hardware doesn't cache
	 * non-present entries we only need to flush the write-buffer. If it
	 * _does_ cache non-present entries, then it does so in the special
	 * domain #0, which we have to flush:
	 */
	if (cap_caching_mode(iommu->cap)) {
		iommu->flush.flush_context(iommu, 0,
					   (((u16)bus) << 8) | devfn,
					   DMA_CCMD_MASK_NOBIT,
					   DMA_CCMD_DEVICE_INVL);
		iommu->flush.flush_iotlb(iommu, did, 0, 0, DMA_TLB_DSI_FLUSH);
	} else {
		iommu_flush_write_buffer(iommu);
	}
	iommu_enable_dev_iotlb(info);

	ret = 0;

out_unlock:
	spin_unlock(&iommu->lock);
	spin_unlock_irqrestore(&device_domain_lock, flags);

	return ret;
}

struct domain_context_mapping_data {
	struct dmar_domain *domain;
	struct intel_iommu *iommu;
	struct pasid_table *table;
};

static int domain_context_mapping_cb(struct pci_dev *pdev,
				     u16 alias, void *opaque)
{
	struct domain_context_mapping_data *data = opaque;

	return domain_context_mapping_one(data->domain, data->iommu,
					  data->table, PCI_BUS_NUM(alias),
					  alias & 0xff);
}

static int
domain_context_mapping(struct dmar_domain *domain, struct device *dev)
{
	struct domain_context_mapping_data data;
	struct pasid_table *table;
	struct intel_iommu *iommu;
	u8 bus, devfn;

	iommu = device_to_iommu(dev, &bus, &devfn);
	if (!iommu)
		return -ENODEV;

	table = intel_pasid_get_table(dev);

	if (!dev_is_pci(dev))
		return domain_context_mapping_one(domain, iommu, table,
						  bus, devfn);

	data.domain = domain;
	data.iommu = iommu;
	data.table = table;

	return pci_for_each_dma_alias(to_pci_dev(dev),
				      &domain_context_mapping_cb, &data);
}

static int domain_context_mapped_cb(struct pci_dev *pdev,
				    u16 alias, void *opaque)
{
	struct intel_iommu *iommu = opaque;

	return !device_context_mapped(iommu, PCI_BUS_NUM(alias), alias & 0xff);
}

static int domain_context_mapped(struct device *dev)
{
	struct intel_iommu *iommu;
	u8 bus, devfn;

	iommu = device_to_iommu(dev, &bus, &devfn);
	if (!iommu)
		return -ENODEV;

	if (!dev_is_pci(dev))
		return device_context_mapped(iommu, bus, devfn);

	return !pci_for_each_dma_alias(to_pci_dev(dev),
				       domain_context_mapped_cb, iommu);
}

/* Returns a number of VTD pages, but aligned to MM page size */
static inline unsigned long aligned_nrpages(unsigned long host_addr,
					    size_t size)
{
	host_addr &= ~PAGE_MASK;
	return PAGE_ALIGN(host_addr + size) >> VTD_PAGE_SHIFT;
}

/* Return largest possible superpage level for a given mapping */
static inline int hardware_largepage_caps(struct dmar_domain *domain,
					  unsigned long iov_pfn,
					  unsigned long phy_pfn,
					  unsigned long pages)
{
	int support, level = 1;
	unsigned long pfnmerge;

	support = domain->iommu_superpage;

	/* To use a large page, the virtual *and* physical addresses
	   must be aligned to 2MiB/1GiB/etc. Lower bits set in either
	   of them will mean we have to use smaller pages. So just
	   merge them and check both at once. */
	pfnmerge = iov_pfn | phy_pfn;

	while (support && !(pfnmerge & ~VTD_STRIDE_MASK)) {
		pages >>= VTD_STRIDE_SHIFT;
		if (!pages)
			break;
		pfnmerge >>= VTD_STRIDE_SHIFT;
		level++;
		support--;
	}
	return level;
}

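/*
 * Write page-table entries for a run of pages described either by a
 * scatterlist or by a contiguous physical range, using superpages
 * where alignment and hardware capabilities allow, and flushing the
 * CPU cache over the PTEs that were written.
 */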
static int __domain_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
			    struct scatterlist *sg, unsigned long phys_pfn,
			    unsigned long nr_pages, int prot)
{
	struct dma_pte *first_pte = NULL, *pte = NULL;
	phys_addr_t uninitialized_var(pteval);
	unsigned long sg_res = 0;
	unsigned int largepage_lvl = 0;
	unsigned long lvl_pages = 0;

	BUG_ON(!domain_pfn_supported(domain, iov_pfn + nr_pages - 1));

	if ((prot & (DMA_PTE_READ|DMA_PTE_WRITE)) == 0)
		return -EINVAL;

	prot &= DMA_PTE_READ | DMA_PTE_WRITE | DMA_PTE_SNP;

	if (!sg) {
		sg_res = nr_pages;
		pteval = ((phys_addr_t)phys_pfn << VTD_PAGE_SHIFT) | prot;
	}

	while (nr_pages > 0) {
		uint64_t tmp;

		if (!sg_res) {
			unsigned int pgoff = sg->offset & ~PAGE_MASK;

			sg_res = aligned_nrpages(sg->offset, sg->length);
			sg->dma_address = ((dma_addr_t)iov_pfn << VTD_PAGE_SHIFT) + pgoff;
			sg->dma_length = sg->length;
			pteval = (sg_phys(sg) - pgoff) | prot;
			phys_pfn = pteval >> VTD_PAGE_SHIFT;
		}

		if (!pte) {
			largepage_lvl = hardware_largepage_caps(domain, iov_pfn, phys_pfn, sg_res);

			first_pte = pte = pfn_to_dma_pte(domain, iov_pfn, &largepage_lvl);
			if (!pte)
				return -ENOMEM;
			/* It is a large page */
			if (largepage_lvl > 1) {
				unsigned long nr_superpages, end_pfn;

				pteval |= DMA_PTE_LARGE_PAGE;
				lvl_pages = lvl_to_nr_pages(largepage_lvl);

				nr_superpages = sg_res / lvl_pages;
				end_pfn = iov_pfn + nr_superpages * lvl_pages - 1;

				/*
				 * Ensure that old small page tables are
				 * removed to make room for superpage(s).
				 * We're adding new large pages, so make sure
				 * we don't remove their parent tables.
				 */
				dma_pte_free_pagetable(domain, iov_pfn, end_pfn,
						       largepage_lvl + 1);
			} else {
				pteval &= ~(uint64_t)DMA_PTE_LARGE_PAGE;
			}

		}
		/* We don't need lock here, nobody else
		 * touches the iova range
		 */
		tmp = cmpxchg64_local(&pte->val, 0ULL, pteval);
		if (tmp) {
			static int dumps = 5;
			pr_crit("ERROR: DMA PTE for vPFN 0x%lx already set (to %llx not %llx)\n",
				iov_pfn, tmp, (unsigned long long)pteval);
			if (dumps) {
				dumps--;
				debug_dma_dump_mappings(NULL);
			}
			WARN_ON(1);
		}

		lvl_pages = lvl_to_nr_pages(largepage_lvl);

		BUG_ON(nr_pages < lvl_pages);
		BUG_ON(sg_res < lvl_pages);

		nr_pages -= lvl_pages;
		iov_pfn += lvl_pages;
		phys_pfn += lvl_pages;
		pteval += lvl_pages * VTD_PAGE_SIZE;
		sg_res -= lvl_pages;

		/* If the next PTE would be the first in a new page, then we
		   need to flush the cache on the entries we've just written.
		   And then we'll need to recalculate 'pte', so clear it and
		   let it get set again in the if (!pte) block above.

		   If we're done (!nr_pages) we need to flush the cache too.

		   Also if we've been setting superpages, we may need to
		   recalculate 'pte' and switch back to smaller pages for the
		   end of the mapping, if the trailing size is not enough to
		   use another superpage (i.e. sg_res < lvl_pages). */
		pte++;
		if (!nr_pages || first_pte_in_page(pte) ||
		    (largepage_lvl > 1 && sg_res < lvl_pages)) {
			domain_flush_cache(domain, first_pte,
					   (void *)pte - (void *)first_pte);
			pte = NULL;
		}

		if (!sg_res && nr_pages)
			sg = sg_next(sg);
	}
	return 0;
}

static int domain_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
			  struct scatterlist *sg, unsigned long phys_pfn,
			  unsigned long nr_pages, int prot)
{
	int ret;
	struct intel_iommu *iommu;

	/* Do the real mapping first */
	ret = __domain_mapping(domain, iov_pfn, sg, phys_pfn, nr_pages, prot);
	if (ret)
		return ret;

	/* Notify about the new mapping */
	if (domain_type_is_vm(domain)) {
		/* VM typed domains can have more than one IOMMU */
		int iommu_id;
		for_each_domain_iommu(iommu_id, domain) {
			iommu = g_iommus[iommu_id];
			__mapping_notify_one(iommu, domain, iov_pfn, nr_pages);
		}
	} else {
		/* General domains only have one IOMMU */
		iommu = domain_get_iommu(domain);
		__mapping_notify_one(iommu, domain, iov_pfn, nr_pages);
	}

	return 0;
}

static inline int domain_sg_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
				    struct scatterlist *sg, unsigned long nr_pages,
				    int prot)
{
	return domain_mapping(domain, iov_pfn, sg, 0, nr_pages, prot);
}

static inline int domain_pfn_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
				     unsigned long phys_pfn, unsigned long nr_pages,
				     int prot)
{
	return domain_mapping(domain, iov_pfn, NULL, phys_pfn, nr_pages, prot);
}

static void domain_context_clear_one(struct intel_iommu *iommu, u8 bus, u8 devfn)
{
	unsigned long flags;
	struct context_entry *context;
	u16 did_old;

	if (!iommu)
		return;

	spin_lock_irqsave(&iommu->lock, flags);
	context = iommu_context_addr(iommu, bus, devfn, 0);
	if (!context) {
		spin_unlock_irqrestore(&iommu->lock, flags);
		return;
	}
	did_old = context_domain_id(context);
	context_clear_entry(context);
	__iommu_flush_cache(iommu, context, sizeof(*context));
	spin_unlock_irqrestore(&iommu->lock, flags);
	iommu->flush.flush_context(iommu,
				   did_old,
				   (((u16)bus) << 8) | devfn,
				   DMA_CCMD_MASK_NOBIT,
				   DMA_CCMD_DEVICE_INVL);
	iommu->flush.flush_iotlb(iommu,
				 did_old,
				 0,
				 0,
				 DMA_TLB_DSI_FLUSH);
}

static inline void unlink_domain_info(struct device_domain_info *info)
{
	assert_spin_locked(&device_domain_lock);
	list_del(&info->link);
	list_del(&info->global);
	if (info->dev)
		info->dev->archdata.iommu = NULL;
}

static void domain_remove_dev_info(struct dmar_domain *domain)
{
	struct device_domain_info *info, *tmp;
	unsigned long flags;

	spin_lock_irqsave(&device_domain_lock, flags);
	list_for_each_entry_safe(info, tmp, &domain->devices, link)
		__dmar_remove_one_dev_info(info);
	spin_unlock_irqrestore(&device_domain_lock, flags);
}

/*
 * find_domain
 * Note: the domain info is stored in struct device->archdata.iommu
 */
static struct dmar_domain *find_domain(struct device *dev)
{
	struct device_domain_info *info;

	/* No lock here, assumes no domain exit in normal case */
	info = dev->archdata.iommu;
	if (likely(info))
		return info->domain;
	return NULL;
}

static inline struct device_domain_info *
dmar_search_domain_by_dev_info(int segment, int bus, int devfn)
{
	struct device_domain_info *info;

	list_for_each_entry(info, &device_domain_list, global)
		if (info->iommu->segment == segment && info->bus == bus &&
		    info->devfn == devfn)
			return info;

	return NULL;
}

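/*
 * Allocate and register the device_domain_info that links a device to
 * a domain, attach the domain to the IOMMU, and set up the PASID table
 * for PCI devices behind a scalable-mode IOMMU.
 */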
static struct dmar_domain *dmar_insert_one_dev_info(struct intel_iommu *iommu,
						    int bus, int devfn,
						    struct device *dev,
						    struct dmar_domain *domain)
{
	struct dmar_domain *found = NULL;
	struct device_domain_info *info;
	unsigned long flags;
	int ret;

	info = alloc_devinfo_mem();
	if (!info)
		return NULL;

	info->bus = bus;
	info->devfn = devfn;
	info->ats_supported = info->pasid_supported = info->pri_supported = 0;
	info->ats_enabled = info->pasid_enabled = info->pri_enabled = 0;
	info->ats_qdep = 0;
	info->dev = dev;
	info->domain = domain;
	info->iommu = iommu;
	info->pasid_table = NULL;

	if (dev && dev_is_pci(dev)) {
		struct pci_dev *pdev = to_pci_dev(info->dev);

		if (!pdev->untrusted &&
		    !pci_ats_disabled() &&
		    ecap_dev_iotlb_support(iommu->ecap) &&
		    pci_find_ext_capability(pdev, PCI_EXT_CAP_ID_ATS) &&
		    dmar_find_matched_atsr_unit(pdev))
			info->ats_supported = 1;

		if (sm_supported(iommu)) {
			if (pasid_supported(iommu)) {
				int features = pci_pasid_features(pdev);
				if (features >= 0)
					info->pasid_supported = features | 1;
			}

			if (info->ats_supported && ecap_prs(iommu->ecap) &&
			    pci_find_ext_capability(pdev, PCI_EXT_CAP_ID_PRI))
				info->pri_supported = 1;
		}
	}

	spin_lock_irqsave(&device_domain_lock, flags);
	if (dev)
		found = find_domain(dev);

	if (!found) {
		struct device_domain_info *info2;
		info2 = dmar_search_domain_by_dev_info(iommu->segment, bus, devfn);
		if (info2) {
			found = info2->domain;
			info2->dev = dev;
		}
	}

	if (found) {
		spin_unlock_irqrestore(&device_domain_lock, flags);
		free_devinfo_mem(info);
		/* Caller must free the original domain */
		return found;
	}

	spin_lock(&iommu->lock);
	ret = domain_attach_iommu(domain, iommu);
	spin_unlock(&iommu->lock);

	if (ret) {
		spin_unlock_irqrestore(&device_domain_lock, flags);
		free_devinfo_mem(info);
		return NULL;
	}

	list_add(&info->link, &domain->devices);
	list_add(&info->global, &device_domain_list);
	if (dev)
		dev->archdata.iommu = info;
	spin_unlock_irqrestore(&device_domain_lock, flags);

	/* PASID table is mandatory for a PCI device in scalable mode. */
	if (dev && dev_is_pci(dev) && sm_supported(iommu)) {
		ret = intel_pasid_alloc_table(dev);
		if (ret) {
			dev_err(dev, "PASID table allocation failed\n");
			dmar_remove_one_dev_info(dev);
			return NULL;
		}

		/* Setup the PASID entry for requests without PASID: */
		spin_lock(&iommu->lock);
		if (hw_pass_through && domain_type_is_si(domain))
			ret = intel_pasid_setup_pass_through(iommu, domain,
2558 dev, PASID_RID2PASID);
2559 else
2560 ret = intel_pasid_setup_second_level(iommu, domain,
2561 dev, PASID_RID2PASID);
2562 spin_unlock(&iommu->lock);
2563 if (ret) {
Bjorn Helgaas932a6522019-02-08 16:06:00 -06002564 dev_err(dev, "Setup RID2PASID failed\n");
Bjorn Helgaas71753232019-02-08 16:06:15 -06002565 dmar_remove_one_dev_info(dev);
Lu Baoluef848b72018-12-10 09:59:01 +08002566 return NULL;
Lu Baolua7fc93f2018-07-14 15:47:00 +08002567 }
2568 }
David Woodhouseb718cd32014-03-09 13:11:33 -07002569
Joerg Roedelcc4e2572015-07-22 10:04:36 +02002570 if (dev && domain_context_mapping(domain, dev)) {
Bjorn Helgaas932a6522019-02-08 16:06:00 -06002571 dev_err(dev, "Domain context map failed\n");
Bjorn Helgaas71753232019-02-08 16:06:15 -06002572 dmar_remove_one_dev_info(dev);
Joerg Roedelcc4e2572015-07-22 10:04:36 +02002573 return NULL;
2574 }
2575
David Woodhouseb718cd32014-03-09 13:11:33 -07002576 return domain;
Jiang Liu745f2582014-02-19 14:07:26 +08002577}
2578
Alex Williamson579305f2014-07-03 09:51:43 -06002579static int get_last_alias(struct pci_dev *pdev, u16 alias, void *opaque)
2580{
2581 *(u16 *)opaque = alias;
2582 return 0;
2583}
2584
Joerg Roedel76208352016-08-25 14:25:12 +02002585static struct dmar_domain *find_or_alloc_domain(struct device *dev, int gaw)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002586{
Bjorn Helgaase083ea5b2019-02-08 16:06:08 -06002587 struct device_domain_info *info;
Joerg Roedel76208352016-08-25 14:25:12 +02002588 struct dmar_domain *domain = NULL;
Alex Williamson579305f2014-07-03 09:51:43 -06002589 struct intel_iommu *iommu;
Lu Baolufcc35c62018-05-04 13:08:17 +08002590 u16 dma_alias;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002591 unsigned long flags;
Yijing Wangaa4d0662014-05-26 20:14:06 +08002592 u8 bus, devfn;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002593
David Woodhouse146922e2014-03-09 15:44:17 -07002594 iommu = device_to_iommu(dev, &bus, &devfn);
2595 if (!iommu)
Alex Williamson579305f2014-07-03 09:51:43 -06002596 return NULL;
2597
2598 if (dev_is_pci(dev)) {
2599 struct pci_dev *pdev = to_pci_dev(dev);
2600
2601 pci_for_each_dma_alias(pdev, get_last_alias, &dma_alias);
2602
2603 spin_lock_irqsave(&device_domain_lock, flags);
2604 info = dmar_search_domain_by_dev_info(pci_domain_nr(pdev->bus),
2605 PCI_BUS_NUM(dma_alias),
2606 dma_alias & 0xff);
2607 if (info) {
2608 iommu = info->iommu;
2609 domain = info->domain;
2610 }
2611 spin_unlock_irqrestore(&device_domain_lock, flags);
2612
Joerg Roedel76208352016-08-25 14:25:12 +02002613 /* DMA alias already has a domain, use it */
Alex Williamson579305f2014-07-03 09:51:43 -06002614 if (info)
Joerg Roedel76208352016-08-25 14:25:12 +02002615 goto out;
Alex Williamson579305f2014-07-03 09:51:43 -06002616 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002617
David Woodhouse146922e2014-03-09 15:44:17 -07002618 /* Allocate and initialize new domain for the device */
Jiang Liuab8dfe22014-07-11 14:19:27 +08002619 domain = alloc_domain(0);
Jiang Liu745f2582014-02-19 14:07:26 +08002620 if (!domain)
Alex Williamson579305f2014-07-03 09:51:43 -06002621 return NULL;
Joerg Roedeldc534b22015-07-22 12:44:02 +02002622 if (domain_init(domain, iommu, gaw)) {
Alex Williamson579305f2014-07-03 09:51:43 -06002623 domain_exit(domain);
2624 return NULL;
2625 }
2626
Joerg Roedel76208352016-08-25 14:25:12 +02002627out:
Alex Williamson579305f2014-07-03 09:51:43 -06002628
Joerg Roedel76208352016-08-25 14:25:12 +02002629 return domain;
2630}
2631
2632static struct dmar_domain *set_domain_for_dev(struct device *dev,
2633 struct dmar_domain *domain)
2634{
2635 struct intel_iommu *iommu;
2636 struct dmar_domain *tmp;
2637 u16 req_id, dma_alias;
2638 u8 bus, devfn;
2639
2640 iommu = device_to_iommu(dev, &bus, &devfn);
2641 if (!iommu)
2642 return NULL;
2643
2644 req_id = ((u16)bus << 8) | devfn;
2645
2646 if (dev_is_pci(dev)) {
2647 struct pci_dev *pdev = to_pci_dev(dev);
2648
2649 pci_for_each_dma_alias(pdev, get_last_alias, &dma_alias);
2650
2651 /* register PCI DMA alias device */
2652 if (req_id != dma_alias) {
2653 tmp = dmar_insert_one_dev_info(iommu, PCI_BUS_NUM(dma_alias),
2654 dma_alias & 0xff, NULL, domain);
2655
2656 if (!tmp || tmp != domain)
2657 return tmp;
Alex Williamson579305f2014-07-03 09:51:43 -06002658 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002659 }
2660
Joerg Roedel5db31562015-07-22 12:40:43 +02002661 tmp = dmar_insert_one_dev_info(iommu, bus, devfn, dev, domain);
Joerg Roedel76208352016-08-25 14:25:12 +02002662 if (!tmp || tmp != domain)
2663 return tmp;
Alex Williamson579305f2014-07-03 09:51:43 -06002664
Joerg Roedel76208352016-08-25 14:25:12 +02002665 return domain;
2666}
2667
2668static struct dmar_domain *get_domain_for_dev(struct device *dev, int gaw)
2669{
2670 struct dmar_domain *domain, *tmp;
2671
2672 domain = find_domain(dev);
2673 if (domain)
2674 goto out;
2675
2676 domain = find_or_alloc_domain(dev, gaw);
2677 if (!domain)
2678 goto out;
2679
2680 tmp = set_domain_for_dev(dev, domain);
2681 if (!tmp || domain != tmp) {
Alex Williamson579305f2014-07-03 09:51:43 -06002682 domain_exit(domain);
2683 domain = tmp;
2684 }
David Woodhouseb718cd32014-03-09 13:11:33 -07002685
Joerg Roedel76208352016-08-25 14:25:12 +02002686out:
2687
David Woodhouseb718cd32014-03-09 13:11:33 -07002688 return domain;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002689}
2690
David Woodhouseb2132032009-06-26 18:50:28 +01002691static int iommu_domain_identity_map(struct dmar_domain *domain,
2692 unsigned long long start,
2693 unsigned long long end)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002694{
David Woodhousec5395d52009-06-28 16:35:56 +01002695 unsigned long first_vpfn = start >> VTD_PAGE_SHIFT;
2696 unsigned long last_vpfn = end >> VTD_PAGE_SHIFT;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002697
David Woodhousec5395d52009-06-28 16:35:56 +01002698 if (!reserve_iova(&domain->iovad, dma_to_mm_pfn(first_vpfn),
2699 dma_to_mm_pfn(last_vpfn))) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002700 pr_err("Reserving iova failed\n");
David Woodhouseb2132032009-06-26 18:50:28 +01002701 return -ENOMEM;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002702 }
2703
Joerg Roedelaf1089c2015-07-21 15:45:19 +02002704 pr_debug("Mapping reserved region %llx-%llx\n", start, end);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002705 /*
 2706 * RMRR range might overlap with the physical memory range,
2707 * clear it first
2708 */
David Woodhousec5395d52009-06-28 16:35:56 +01002709 dma_pte_clear_range(domain, first_vpfn, last_vpfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002710
Peter Xu87684fd2018-05-04 10:34:53 +08002711 return __domain_mapping(domain, first_vpfn, NULL,
2712 first_vpfn, last_vpfn - first_vpfn + 1,
2713 DMA_PTE_READ|DMA_PTE_WRITE);
David Woodhouseb2132032009-06-26 18:50:28 +01002714}
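
/*
 * Illustrative note (added, not from the original source): for an RMRR
 * spanning 0xdf800000..0xdf80ffff the code above computes
 * first_vpfn = 0xdf800 and last_vpfn = 0xdf80f (VTD_PAGE_SHIFT is 12),
 * reserves those 16 pages in the domain's IOVA allocator so they are
 * never handed out for ordinary DMA, clears any stale PTEs and then
 * installs a 1:1 (IOVA == physical) read/write mapping for the range.
 */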
2715
Joerg Roedeld66ce542015-09-23 19:00:10 +02002716static int domain_prepare_identity_map(struct device *dev,
2717 struct dmar_domain *domain,
2718 unsigned long long start,
2719 unsigned long long end)
David Woodhouseb2132032009-06-26 18:50:28 +01002720{
David Woodhouse19943b02009-08-04 16:19:20 +01002721 /* For _hardware_ passthrough, don't bother. But for software
2722 passthrough, we do it anyway -- it may indicate a memory
 2723 range which is reserved in E820 and which therefore didn't get
 2724 set up to start with in si_domain */
2725 if (domain == si_domain && hw_pass_through) {
Bjorn Helgaas932a6522019-02-08 16:06:00 -06002726 dev_warn(dev, "Ignoring identity map for HW passthrough [0x%Lx - 0x%Lx]\n",
2727 start, end);
David Woodhouse19943b02009-08-04 16:19:20 +01002728 return 0;
2729 }
2730
Bjorn Helgaas932a6522019-02-08 16:06:00 -06002731 dev_info(dev, "Setting identity map [0x%Lx - 0x%Lx]\n", start, end);
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002732
David Woodhouse5595b522009-12-02 09:21:55 +00002733 if (end < start) {
2734 WARN(1, "Your BIOS is broken; RMRR ends before it starts!\n"
2735 "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
2736 dmi_get_system_info(DMI_BIOS_VENDOR),
2737 dmi_get_system_info(DMI_BIOS_VERSION),
2738 dmi_get_system_info(DMI_PRODUCT_VERSION));
Joerg Roedeld66ce542015-09-23 19:00:10 +02002739 return -EIO;
David Woodhouse5595b522009-12-02 09:21:55 +00002740 }
2741
David Woodhouse2ff729f2009-08-26 14:25:41 +01002742 if (end >> agaw_to_width(domain->agaw)) {
2743 WARN(1, "Your BIOS is broken; RMRR exceeds permitted address width (%d bits)\n"
2744 "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
2745 agaw_to_width(domain->agaw),
2746 dmi_get_system_info(DMI_BIOS_VENDOR),
2747 dmi_get_system_info(DMI_BIOS_VERSION),
2748 dmi_get_system_info(DMI_PRODUCT_VERSION));
Joerg Roedeld66ce542015-09-23 19:00:10 +02002749 return -EIO;
David Woodhouse2ff729f2009-08-26 14:25:41 +01002750 }
David Woodhouse19943b02009-08-04 16:19:20 +01002751
Joerg Roedeld66ce542015-09-23 19:00:10 +02002752 return iommu_domain_identity_map(domain, start, end);
2753}
2754
2755static int iommu_prepare_identity_map(struct device *dev,
2756 unsigned long long start,
2757 unsigned long long end)
2758{
2759 struct dmar_domain *domain;
2760 int ret;
2761
2762 domain = get_domain_for_dev(dev, DEFAULT_DOMAIN_ADDRESS_WIDTH);
2763 if (!domain)
2764 return -ENOMEM;
2765
2766 ret = domain_prepare_identity_map(dev, domain, start, end);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002767 if (ret)
Joerg Roedeld66ce542015-09-23 19:00:10 +02002768 domain_exit(domain);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002769
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002770 return ret;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002771}
2772
2773static inline int iommu_prepare_rmrr_dev(struct dmar_rmrr_unit *rmrr,
David Woodhouse0b9d9752014-03-09 15:48:15 -07002774 struct device *dev)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002775{
David Woodhouse0b9d9752014-03-09 15:48:15 -07002776 if (dev->archdata.iommu == DUMMY_DEVICE_DOMAIN_INFO)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002777 return 0;
David Woodhouse0b9d9752014-03-09 15:48:15 -07002778 return iommu_prepare_identity_map(dev, rmrr->base_address,
2779 rmrr->end_address);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002780}
2781
Suresh Siddhad3f13812011-08-23 17:05:25 -07002782#ifdef CONFIG_INTEL_IOMMU_FLOPPY_WA
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002783static inline void iommu_prepare_isa(void)
2784{
2785 struct pci_dev *pdev;
2786 int ret;
2787
2788 pdev = pci_get_class(PCI_CLASS_BRIDGE_ISA << 8, NULL);
2789 if (!pdev)
2790 return;
2791
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002792 pr_info("Prepare 0-16MiB unity mapping for LPC\n");
David Woodhouse0b9d9752014-03-09 15:48:15 -07002793 ret = iommu_prepare_identity_map(&pdev->dev, 0, 16*1024*1024 - 1);
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002794
2795 if (ret)
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002796 pr_err("Failed to create 0-16MiB identity map - floppy might not work\n");
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002797
Yijing Wang9b27e822014-05-20 20:37:52 +08002798 pci_dev_put(pdev);
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002799}
2800#else
2801static inline void iommu_prepare_isa(void)
2802{
2803 return;
2804}
Suresh Siddhad3f13812011-08-23 17:05:25 -07002805#endif /* !CONFIG_INTEL_IOMMU_FLOPPY_WA */
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002806
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002807static int md_domain_init(struct dmar_domain *domain, int guest_width);
David Woodhousec7ab48d2009-06-26 19:10:36 +01002808
Matt Kraai071e1372009-08-23 22:30:22 -07002809static int __init si_domain_init(int hw)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002810{
Bjorn Helgaase083ea5b2019-02-08 16:06:08 -06002811 int nid, ret;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002812
Jiang Liuab8dfe22014-07-11 14:19:27 +08002813 si_domain = alloc_domain(DOMAIN_FLAG_STATIC_IDENTITY);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002814 if (!si_domain)
2815 return -EFAULT;
2816
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002817 if (md_domain_init(si_domain, DEFAULT_DOMAIN_ADDRESS_WIDTH)) {
2818 domain_exit(si_domain);
2819 return -EFAULT;
2820 }
2821
Joerg Roedel0dc79712015-07-21 15:40:06 +02002822 pr_debug("Identity mapping domain allocated\n");
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002823
David Woodhouse19943b02009-08-04 16:19:20 +01002824 if (hw)
2825 return 0;
2826
David Woodhousec7ab48d2009-06-26 19:10:36 +01002827 for_each_online_node(nid) {
Tejun Heod4bbf7e2011-11-28 09:46:22 -08002828 unsigned long start_pfn, end_pfn;
2829 int i;
2830
2831 for_each_mem_pfn_range(i, nid, &start_pfn, &end_pfn, NULL) {
2832 ret = iommu_domain_identity_map(si_domain,
2833 PFN_PHYS(start_pfn), PFN_PHYS(end_pfn));
2834 if (ret)
2835 return ret;
2836 }
David Woodhousec7ab48d2009-06-26 19:10:36 +01002837 }
2838
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002839 return 0;
2840}
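
/*
 * Illustrative note (added, not from the original source): in the
 * hardware pass-through case (hw != 0) the function returns early and
 * builds no page tables, since translation is bypassed entirely.  In the
 * software case the loop above identity-maps every online node's usable
 * memory; for example a node whose RAM spans pfns 0x100000..0x180000
 * ends up 1:1 mapped for roughly physical 4 GiB..6 GiB in si_domain.
 */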
2841
David Woodhouse9b226622014-03-09 14:03:28 -07002842static int identity_mapping(struct device *dev)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002843{
2844 struct device_domain_info *info;
2845
2846 if (likely(!iommu_identity_mapping))
2847 return 0;
2848
David Woodhouse9b226622014-03-09 14:03:28 -07002849 info = dev->archdata.iommu;
Mike Traviscb452a42011-05-28 13:15:03 -05002850 if (info && info != DUMMY_DEVICE_DOMAIN_INFO)
2851 return (info->domain == si_domain);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002852
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002853 return 0;
2854}
2855
Joerg Roedel28ccce02015-07-21 14:45:31 +02002856static int domain_add_dev_info(struct dmar_domain *domain, struct device *dev)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002857{
David Woodhouse0ac72662014-03-09 13:19:22 -07002858 struct dmar_domain *ndomain;
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002859 struct intel_iommu *iommu;
David Woodhouse156baca2014-03-09 14:00:57 -07002860 u8 bus, devfn;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002861
David Woodhouse5913c9b2014-03-09 16:27:31 -07002862 iommu = device_to_iommu(dev, &bus, &devfn);
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002863 if (!iommu)
2864 return -ENODEV;
2865
Joerg Roedel5db31562015-07-22 12:40:43 +02002866 ndomain = dmar_insert_one_dev_info(iommu, bus, devfn, dev, domain);
David Woodhouse0ac72662014-03-09 13:19:22 -07002867 if (ndomain != domain)
2868 return -EBUSY;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002869
2870 return 0;
2871}
2872
David Woodhouse0b9d9752014-03-09 15:48:15 -07002873static bool device_has_rmrr(struct device *dev)
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002874{
2875 struct dmar_rmrr_unit *rmrr;
David Woodhouse832bd852014-03-07 15:08:36 +00002876 struct device *tmp;
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002877 int i;
2878
Jiang Liu0e2426122014-02-19 14:07:34 +08002879 rcu_read_lock();
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002880 for_each_rmrr_units(rmrr) {
Jiang Liub683b232014-02-19 14:07:32 +08002881 /*
2882 * Return TRUE if this RMRR contains the device that
2883 * is passed in.
2884 */
2885 for_each_active_dev_scope(rmrr->devices,
2886 rmrr->devices_cnt, i, tmp)
David Woodhouse0b9d9752014-03-09 15:48:15 -07002887 if (tmp == dev) {
Jiang Liu0e2426122014-02-19 14:07:34 +08002888 rcu_read_unlock();
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002889 return true;
Jiang Liub683b232014-02-19 14:07:32 +08002890 }
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002891 }
Jiang Liu0e2426122014-02-19 14:07:34 +08002892 rcu_read_unlock();
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002893 return false;
2894}
2895
Alex Williamsonc875d2c2014-07-03 09:57:02 -06002896/*
2897 * There are a couple cases where we need to restrict the functionality of
2898 * devices associated with RMRRs. The first is when evaluating a device for
2899 * identity mapping because problems exist when devices are moved in and out
2900 * of domains and their respective RMRR information is lost. This means that
2901 * a device with associated RMRRs will never be in a "passthrough" domain.
2902 * The second is use of the device through the IOMMU API. This interface
2903 * expects to have full control of the IOVA space for the device. We cannot
2904 * satisfy both the requirement that RMRR access is maintained and have an
2905 * unencumbered IOVA space. We also have no ability to quiesce the device's
2906 * use of the RMRR space or even inform the IOMMU API user of the restriction.
2907 * We therefore prevent devices associated with an RMRR from participating in
2908 * the IOMMU API, which eliminates them from device assignment.
2909 *
2910 * In both cases we assume that PCI USB devices with RMRRs have them largely
2911 * for historical reasons and that the RMRR space is not actively used post
2912 * boot. This exclusion may change if vendors begin to abuse it.
David Woodhouse18436af2015-03-25 15:05:47 +00002913 *
2914 * The same exception is made for graphics devices, with the requirement that
2915 * any use of the RMRR regions will be torn down before assigning the device
2916 * to a guest.
Alex Williamsonc875d2c2014-07-03 09:57:02 -06002917 */
2918static bool device_is_rmrr_locked(struct device *dev)
2919{
2920 if (!device_has_rmrr(dev))
2921 return false;
2922
2923 if (dev_is_pci(dev)) {
2924 struct pci_dev *pdev = to_pci_dev(dev);
2925
David Woodhouse18436af2015-03-25 15:05:47 +00002926 if (IS_USB_DEVICE(pdev) || IS_GFX_DEVICE(pdev))
Alex Williamsonc875d2c2014-07-03 09:57:02 -06002927 return false;
2928 }
2929
2930 return true;
2931}
2932
David Woodhouse3bdb2592014-03-09 16:03:08 -07002933static int iommu_should_identity_map(struct device *dev, int startup)
David Woodhouse6941af22009-07-04 18:24:27 +01002934{
David Woodhouse3bdb2592014-03-09 16:03:08 -07002935 if (dev_is_pci(dev)) {
2936 struct pci_dev *pdev = to_pci_dev(dev);
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002937
Alex Williamsonc875d2c2014-07-03 09:57:02 -06002938 if (device_is_rmrr_locked(dev))
David Woodhouse3bdb2592014-03-09 16:03:08 -07002939 return 0;
David Woodhousee0fc7e02009-09-30 09:12:17 -07002940
Lu Baolu89a60792018-10-23 15:45:01 +08002941 /*
2942 * Prevent any device marked as untrusted from getting
2943 * placed into the statically identity mapping domain.
2944 */
2945 if (pdev->untrusted)
2946 return 0;
2947
David Woodhouse3bdb2592014-03-09 16:03:08 -07002948 if ((iommu_identity_mapping & IDENTMAP_AZALIA) && IS_AZALIA(pdev))
2949 return 1;
David Woodhousee0fc7e02009-09-30 09:12:17 -07002950
David Woodhouse3bdb2592014-03-09 16:03:08 -07002951 if ((iommu_identity_mapping & IDENTMAP_GFX) && IS_GFX_DEVICE(pdev))
2952 return 1;
2953
2954 if (!(iommu_identity_mapping & IDENTMAP_ALL))
2955 return 0;
2956
2957 /*
2958 * We want to start off with all devices in the 1:1 domain, and
2959 * take them out later if we find they can't access all of memory.
2960 *
2961 * However, we can't do this for PCI devices behind bridges,
2962 * because all PCI devices behind the same bridge will end up
2963 * with the same source-id on their transactions.
2964 *
2965 * Practically speaking, we can't change things around for these
2966 * devices at run-time, because we can't be sure there'll be no
2967 * DMA transactions in flight for any of their siblings.
2968 *
2969 * So PCI devices (unless they're on the root bus) as well as
2970 * their parent PCI-PCI or PCIe-PCI bridges must be left _out_ of
2971 * the 1:1 domain, just in _case_ one of their siblings turns out
2972 * not to be able to map all of memory.
2973 */
2974 if (!pci_is_pcie(pdev)) {
2975 if (!pci_is_root_bus(pdev->bus))
2976 return 0;
2977 if (pdev->class >> 8 == PCI_CLASS_BRIDGE_PCI)
2978 return 0;
2979 } else if (pci_pcie_type(pdev) == PCI_EXP_TYPE_PCI_BRIDGE)
2980 return 0;
2981 } else {
2982 if (device_has_rmrr(dev))
2983 return 0;
2984 }
David Woodhouse6941af22009-07-04 18:24:27 +01002985
David Woodhouse3dfc8132009-07-04 19:11:08 +01002986 /*
David Woodhouse3dfc8132009-07-04 19:11:08 +01002987 * At boot time, we don't yet know if devices will be 64-bit capable.
David Woodhouse3bdb2592014-03-09 16:03:08 -07002988 * Assume that they will — if they turn out not to be, then we can
David Woodhouse3dfc8132009-07-04 19:11:08 +01002989 * take them out of the 1:1 domain later.
2990 */
Chris Wright8fcc5372011-05-28 13:15:02 -05002991 if (!startup) {
2992 /*
2993 * If the device's dma_mask is less than the system's memory
2994 * size then this is not a candidate for identity mapping.
2995 */
David Woodhouse3bdb2592014-03-09 16:03:08 -07002996 u64 dma_mask = *dev->dma_mask;
Chris Wright8fcc5372011-05-28 13:15:02 -05002997
David Woodhouse3bdb2592014-03-09 16:03:08 -07002998 if (dev->coherent_dma_mask &&
2999 dev->coherent_dma_mask < dma_mask)
3000 dma_mask = dev->coherent_dma_mask;
Chris Wright8fcc5372011-05-28 13:15:02 -05003001
David Woodhouse3bdb2592014-03-09 16:03:08 -07003002 return dma_mask >= dma_get_required_mask(dev);
Chris Wright8fcc5372011-05-28 13:15:02 -05003003 }
David Woodhouse6941af22009-07-04 18:24:27 +01003004
3005 return 1;
3006}
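
/*
 * Illustrative note (added, not from the original source): the
 * startup == 0 branch above compares the device's effective DMA mask
 * with the mask the platform actually needs.  On a box with 8 GiB of
 * RAM dma_get_required_mask() should report DMA_BIT_MASK(33); a device
 * with a 64-bit dma_mask then qualifies for (or stays in) the identity
 * domain, while one limited to DMA_BIT_MASK(32) returns 0 here and is
 * moved to a translated private domain so it can still reach all of
 * memory through remapping.
 */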
3007
David Woodhousecf04eee2014-03-21 16:49:04 +00003008static int __init dev_prepare_static_identity_mapping(struct device *dev, int hw)
3009{
3010 int ret;
3011
3012 if (!iommu_should_identity_map(dev, 1))
3013 return 0;
3014
Joerg Roedel28ccce02015-07-21 14:45:31 +02003015 ret = domain_add_dev_info(si_domain, dev);
David Woodhousecf04eee2014-03-21 16:49:04 +00003016 if (!ret)
Bjorn Helgaas932a6522019-02-08 16:06:00 -06003017 dev_info(dev, "%s identity mapping\n",
3018 hw ? "Hardware" : "Software");
David Woodhousecf04eee2014-03-21 16:49:04 +00003019 else if (ret == -ENODEV)
3020 /* device not associated with an iommu */
3021 ret = 0;
3022
3023 return ret;
3024}
3025
3026
Matt Kraai071e1372009-08-23 22:30:22 -07003027static int __init iommu_prepare_static_identity_mapping(int hw)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003028{
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003029 struct pci_dev *pdev = NULL;
David Woodhousecf04eee2014-03-21 16:49:04 +00003030 struct dmar_drhd_unit *drhd;
3031 struct intel_iommu *iommu;
3032 struct device *dev;
3033 int i;
3034 int ret = 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003035
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003036 for_each_pci_dev(pdev) {
David Woodhousecf04eee2014-03-21 16:49:04 +00003037 ret = dev_prepare_static_identity_mapping(&pdev->dev, hw);
3038 if (ret)
3039 return ret;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003040 }
3041
David Woodhousecf04eee2014-03-21 16:49:04 +00003042 for_each_active_iommu(iommu, drhd)
3043 for_each_active_dev_scope(drhd->devices, drhd->devices_cnt, i, dev) {
3044 struct acpi_device_physical_node *pn;
3045 struct acpi_device *adev;
3046
3047 if (dev->bus != &acpi_bus_type)
3048 continue;
Joerg Roedel86080cc2015-06-12 12:27:16 +02003049
David Woodhousecf04eee2014-03-21 16:49:04 +00003050 adev = to_acpi_device(dev);
3051 mutex_lock(&adev->physical_node_lock);
3052 list_for_each_entry(pn, &adev->physical_node_list, node) {
3053 ret = dev_prepare_static_identity_mapping(pn->dev, hw);
3054 if (ret)
3055 break;
3056 }
3057 mutex_unlock(&adev->physical_node_lock);
3058 if (ret)
3059 return ret;
3060 }
3061
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003062 return 0;
3063}
3064
Jiang Liuffebeb42014-11-09 22:48:02 +08003065static void intel_iommu_init_qi(struct intel_iommu *iommu)
3066{
3067 /*
3068 * Start from the sane iommu hardware state.
3069 * If the queued invalidation is already initialized by us
3070 * (for example, while enabling interrupt-remapping) then
3071 * we got the things already rolling from a sane state.
3072 */
3073 if (!iommu->qi) {
3074 /*
3075 * Clear any previous faults.
3076 */
3077 dmar_fault(-1, iommu);
3078 /*
3079 * Disable queued invalidation if supported and already enabled
3080 * before OS handover.
3081 */
3082 dmar_disable_qi(iommu);
3083 }
3084
3085 if (dmar_enable_qi(iommu)) {
3086 /*
3087 * Queued Invalidate not enabled, use Register Based Invalidate
3088 */
3089 iommu->flush.flush_context = __iommu_flush_context;
3090 iommu->flush.flush_iotlb = __iommu_flush_iotlb;
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003091 pr_info("%s: Using Register based invalidation\n",
Jiang Liuffebeb42014-11-09 22:48:02 +08003092 iommu->name);
3093 } else {
3094 iommu->flush.flush_context = qi_flush_context;
3095 iommu->flush.flush_iotlb = qi_flush_iotlb;
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003096 pr_info("%s: Using Queued invalidation\n", iommu->name);
Jiang Liuffebeb42014-11-09 22:48:02 +08003097 }
3098}
3099
Joerg Roedel091d42e2015-06-12 11:56:10 +02003100static int copy_context_table(struct intel_iommu *iommu,
Dan Williamsdfddb962015-10-09 18:16:46 -04003101 struct root_entry *old_re,
Joerg Roedel091d42e2015-06-12 11:56:10 +02003102 struct context_entry **tbl,
3103 int bus, bool ext)
3104{
Joerg Roedeldbcd8612015-06-12 12:02:09 +02003105 int tbl_idx, pos = 0, idx, devfn, ret = 0, did;
Joerg Roedel543c8dc2015-08-13 11:56:59 +02003106 struct context_entry *new_ce = NULL, ce;
Dan Williamsdfddb962015-10-09 18:16:46 -04003107 struct context_entry *old_ce = NULL;
Joerg Roedel543c8dc2015-08-13 11:56:59 +02003108 struct root_entry re;
Joerg Roedel091d42e2015-06-12 11:56:10 +02003109 phys_addr_t old_ce_phys;
3110
3111 tbl_idx = ext ? bus * 2 : bus;
Dan Williamsdfddb962015-10-09 18:16:46 -04003112 memcpy(&re, old_re, sizeof(re));
Joerg Roedel091d42e2015-06-12 11:56:10 +02003113
3114 for (devfn = 0; devfn < 256; devfn++) {
3115 /* First calculate the correct index */
3116 idx = (ext ? devfn * 2 : devfn) % 256;
3117
3118 if (idx == 0) {
3119 /* First save what we may have and clean up */
3120 if (new_ce) {
3121 tbl[tbl_idx] = new_ce;
3122 __iommu_flush_cache(iommu, new_ce,
3123 VTD_PAGE_SIZE);
3124 pos = 1;
3125 }
3126
3127 if (old_ce)
Pan Bian829383e2018-11-21 17:53:47 +08003128 memunmap(old_ce);
Joerg Roedel091d42e2015-06-12 11:56:10 +02003129
3130 ret = 0;
3131 if (devfn < 0x80)
Joerg Roedel543c8dc2015-08-13 11:56:59 +02003132 old_ce_phys = root_entry_lctp(&re);
Joerg Roedel091d42e2015-06-12 11:56:10 +02003133 else
Joerg Roedel543c8dc2015-08-13 11:56:59 +02003134 old_ce_phys = root_entry_uctp(&re);
Joerg Roedel091d42e2015-06-12 11:56:10 +02003135
3136 if (!old_ce_phys) {
3137 if (ext && devfn == 0) {
3138 /* No LCTP, try UCTP */
3139 devfn = 0x7f;
3140 continue;
3141 } else {
3142 goto out;
3143 }
3144 }
3145
3146 ret = -ENOMEM;
Dan Williamsdfddb962015-10-09 18:16:46 -04003147 old_ce = memremap(old_ce_phys, PAGE_SIZE,
3148 MEMREMAP_WB);
Joerg Roedel091d42e2015-06-12 11:56:10 +02003149 if (!old_ce)
3150 goto out;
3151
3152 new_ce = alloc_pgtable_page(iommu->node);
3153 if (!new_ce)
3154 goto out_unmap;
3155
3156 ret = 0;
3157 }
3158
3159 /* Now copy the context entry */
Dan Williamsdfddb962015-10-09 18:16:46 -04003160 memcpy(&ce, old_ce + idx, sizeof(ce));
Joerg Roedel091d42e2015-06-12 11:56:10 +02003161
Joerg Roedelcf484d02015-06-12 12:21:46 +02003162 if (!__context_present(&ce))
Joerg Roedel091d42e2015-06-12 11:56:10 +02003163 continue;
3164
Joerg Roedeldbcd8612015-06-12 12:02:09 +02003165 did = context_domain_id(&ce);
3166 if (did >= 0 && did < cap_ndoms(iommu->cap))
3167 set_bit(did, iommu->domain_ids);
3168
Joerg Roedelcf484d02015-06-12 12:21:46 +02003169 /*
3170 * We need a marker for copied context entries. This
3171 * marker needs to work for the old format as well as
3172 * for extended context entries.
3173 *
3174 * Bit 67 of the context entry is used. In the old
3175 * format this bit is available to software, in the
3176 * extended format it is the PGE bit, but PGE is ignored
3177 * by HW if PASIDs are disabled (and thus still
3178 * available).
3179 *
3180 * So disable PASIDs first and then mark the entry
3181 * copied. This means that we don't copy PASID
3182 * translations from the old kernel, but this is fine as
3183 * faults there are not fatal.
3184 */
3185 context_clear_pasid_enable(&ce);
3186 context_set_copied(&ce);
3187
Joerg Roedel091d42e2015-06-12 11:56:10 +02003188 new_ce[idx] = ce;
3189 }
3190
3191 tbl[tbl_idx + pos] = new_ce;
3192
3193 __iommu_flush_cache(iommu, new_ce, VTD_PAGE_SIZE);
3194
3195out_unmap:
Dan Williamsdfddb962015-10-09 18:16:46 -04003196 memunmap(old_ce);
Joerg Roedel091d42e2015-06-12 11:56:10 +02003197
3198out:
3199 return ret;
3200}
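
/*
 * Illustrative note (added, not from the original source): a sketch of
 * the index arithmetic above for the extended (ext == true) layout,
 * where each bus needs two context tables.  For bus 3, tbl_idx = 6:
 *
 *   devfn 0x00..0x7f: idx = (devfn * 2) % 256 = 0..254, stored in tbl[6]
 *   devfn 0x80..0xff: idx wraps back to 0..254, pos becomes 1, so these
 *                     entries land in tbl[6 + 1] = tbl[7]
 *
 * In the legacy layout (ext == false) bus 3 simply uses tbl[3] with
 * idx == devfn.
 */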
3201
3202static int copy_translation_tables(struct intel_iommu *iommu)
3203{
3204 struct context_entry **ctxt_tbls;
Dan Williamsdfddb962015-10-09 18:16:46 -04003205 struct root_entry *old_rt;
Joerg Roedel091d42e2015-06-12 11:56:10 +02003206 phys_addr_t old_rt_phys;
3207 int ctxt_table_entries;
3208 unsigned long flags;
3209 u64 rtaddr_reg;
3210 int bus, ret;
Joerg Roedelc3361f22015-06-12 12:39:25 +02003211 bool new_ext, ext;
Joerg Roedel091d42e2015-06-12 11:56:10 +02003212
3213 rtaddr_reg = dmar_readq(iommu->reg + DMAR_RTADDR_REG);
3214 ext = !!(rtaddr_reg & DMA_RTADDR_RTT);
Joerg Roedelc3361f22015-06-12 12:39:25 +02003215 new_ext = !!ecap_ecs(iommu->ecap);
3216
3217 /*
3218 * The RTT bit can only be changed when translation is disabled,
3219 * but disabling translation means to open a window for data
3220 * corruption. So bail out and don't copy anything if we would
3221 * have to change the bit.
3222 */
3223 if (new_ext != ext)
3224 return -EINVAL;
Joerg Roedel091d42e2015-06-12 11:56:10 +02003225
3226 old_rt_phys = rtaddr_reg & VTD_PAGE_MASK;
3227 if (!old_rt_phys)
3228 return -EINVAL;
3229
Dan Williamsdfddb962015-10-09 18:16:46 -04003230 old_rt = memremap(old_rt_phys, PAGE_SIZE, MEMREMAP_WB);
Joerg Roedel091d42e2015-06-12 11:56:10 +02003231 if (!old_rt)
3232 return -ENOMEM;
3233
3234 /* This is too big for the stack - allocate it from slab */
3235 ctxt_table_entries = ext ? 512 : 256;
3236 ret = -ENOMEM;
Kees Cook6396bb22018-06-12 14:03:40 -07003237 ctxt_tbls = kcalloc(ctxt_table_entries, sizeof(void *), GFP_KERNEL);
Joerg Roedel091d42e2015-06-12 11:56:10 +02003238 if (!ctxt_tbls)
3239 goto out_unmap;
3240
3241 for (bus = 0; bus < 256; bus++) {
3242 ret = copy_context_table(iommu, &old_rt[bus],
3243 ctxt_tbls, bus, ext);
3244 if (ret) {
3245 pr_err("%s: Failed to copy context table for bus %d\n",
3246 iommu->name, bus);
3247 continue;
3248 }
3249 }
3250
3251 spin_lock_irqsave(&iommu->lock, flags);
3252
3253 /* Context tables are copied, now write them to the root_entry table */
3254 for (bus = 0; bus < 256; bus++) {
3255 int idx = ext ? bus * 2 : bus;
3256 u64 val;
3257
3258 if (ctxt_tbls[idx]) {
3259 val = virt_to_phys(ctxt_tbls[idx]) | 1;
3260 iommu->root_entry[bus].lo = val;
3261 }
3262
3263 if (!ext || !ctxt_tbls[idx + 1])
3264 continue;
3265
3266 val = virt_to_phys(ctxt_tbls[idx + 1]) | 1;
3267 iommu->root_entry[bus].hi = val;
3268 }
3269
3270 spin_unlock_irqrestore(&iommu->lock, flags);
3271
3272 kfree(ctxt_tbls);
3273
3274 __iommu_flush_cache(iommu, iommu->root_entry, PAGE_SIZE);
3275
3276 ret = 0;
3277
3278out_unmap:
Dan Williamsdfddb962015-10-09 18:16:46 -04003279 memunmap(old_rt);
Joerg Roedel091d42e2015-06-12 11:56:10 +02003280
3281 return ret;
3282}
3283
Joseph Cihulab7792602011-05-03 00:08:37 -07003284static int __init init_dmars(void)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003285{
3286 struct dmar_drhd_unit *drhd;
3287 struct dmar_rmrr_unit *rmrr;
Joerg Roedela87f4912015-06-12 12:32:54 +02003288 bool copied_tables = false;
David Woodhouse832bd852014-03-07 15:08:36 +00003289 struct device *dev;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003290 struct intel_iommu *iommu;
Joerg Roedel13cf0172017-08-11 11:40:10 +02003291 int i, ret;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003292
3293 /*
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003294 * for each drhd
3295 * allocate root
3296 * initialize and program root entry to not present
3297 * endfor
3298 */
3299 for_each_drhd_unit(drhd) {
mark gross5e0d2a62008-03-04 15:22:08 -08003300 /*
3301 * lock not needed as this is only incremented in the single
 3302 * threaded kernel __init code path; all other accesses are
 3303 * read only
3304 */
Jiang Liu78d8e702014-11-09 22:47:57 +08003305 if (g_num_of_iommus < DMAR_UNITS_SUPPORTED) {
Mike Travis1b198bb2012-03-05 15:05:16 -08003306 g_num_of_iommus++;
3307 continue;
3308 }
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003309 pr_err_once("Exceeded %d IOMMUs\n", DMAR_UNITS_SUPPORTED);
mark gross5e0d2a62008-03-04 15:22:08 -08003310 }
3311
Jiang Liuffebeb42014-11-09 22:48:02 +08003312 /* Preallocate enough resources for IOMMU hot-addition */
3313 if (g_num_of_iommus < DMAR_UNITS_SUPPORTED)
3314 g_num_of_iommus = DMAR_UNITS_SUPPORTED;
3315
Weidong Hand9630fe2008-12-08 11:06:32 +08003316 g_iommus = kcalloc(g_num_of_iommus, sizeof(struct intel_iommu *),
3317 GFP_KERNEL);
3318 if (!g_iommus) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003319 pr_err("Allocating global iommu array failed\n");
Weidong Hand9630fe2008-12-08 11:06:32 +08003320 ret = -ENOMEM;
3321 goto error;
3322 }
3323
Jiang Liu7c919772014-01-06 14:18:18 +08003324 for_each_active_iommu(iommu, drhd) {
Lu Baolu56283172018-07-14 15:46:54 +08003325 /*
 3326 * Find the max pasid size of all IOMMUs in the system.
3327 * We need to ensure the system pasid table is no bigger
3328 * than the smallest supported.
3329 */
Lu Baolu765b6a92018-12-10 09:58:55 +08003330 if (pasid_supported(iommu)) {
Lu Baolu56283172018-07-14 15:46:54 +08003331 u32 temp = 2 << ecap_pss(iommu->ecap);
3332
3333 intel_pasid_max_id = min_t(u32, temp,
3334 intel_pasid_max_id);
3335 }
3336
Weidong Hand9630fe2008-12-08 11:06:32 +08003337 g_iommus[iommu->seq_id] = iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003338
Joerg Roedelb63d80d2015-06-12 09:14:34 +02003339 intel_iommu_init_qi(iommu);
3340
Suresh Siddhae61d98d2008-07-10 11:16:35 -07003341 ret = iommu_init_domains(iommu);
3342 if (ret)
Jiang Liu989d51f2014-02-19 14:07:21 +08003343 goto free_iommu;
Suresh Siddhae61d98d2008-07-10 11:16:35 -07003344
Joerg Roedel4158c2e2015-06-12 10:14:02 +02003345 init_translation_status(iommu);
3346
Joerg Roedel091d42e2015-06-12 11:56:10 +02003347 if (translation_pre_enabled(iommu) && !is_kdump_kernel()) {
3348 iommu_disable_translation(iommu);
3349 clear_translation_pre_enabled(iommu);
3350 pr_warn("Translation was enabled for %s but we are not in kdump mode\n",
3351 iommu->name);
3352 }
Joerg Roedel4158c2e2015-06-12 10:14:02 +02003353
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003354 /*
3355 * TBD:
3356 * we could share the same root & context tables
Lucas De Marchi25985ed2011-03-30 22:57:33 -03003357 * among all IOMMUs. Need to split it later.
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003358 */
3359 ret = iommu_alloc_root_entry(iommu);
Jiang Liuffebeb42014-11-09 22:48:02 +08003360 if (ret)
Jiang Liu989d51f2014-02-19 14:07:21 +08003361 goto free_iommu;
Joerg Roedel5f0a7f72015-06-12 09:18:53 +02003362
Joerg Roedel091d42e2015-06-12 11:56:10 +02003363 if (translation_pre_enabled(iommu)) {
3364 pr_info("Translation already enabled - trying to copy translation structures\n");
3365
3366 ret = copy_translation_tables(iommu);
3367 if (ret) {
3368 /*
3369 * We found the IOMMU with translation
3370 * enabled - but failed to copy over the
3371 * old root-entry table. Try to proceed
3372 * by disabling translation now and
3373 * allocating a clean root-entry table.
3374 * This might cause DMAR faults, but
3375 * probably the dump will still succeed.
3376 */
3377 pr_err("Failed to copy translation tables from previous kernel for %s\n",
3378 iommu->name);
3379 iommu_disable_translation(iommu);
3380 clear_translation_pre_enabled(iommu);
3381 } else {
3382 pr_info("Copied translation tables from previous kernel for %s\n",
3383 iommu->name);
Joerg Roedela87f4912015-06-12 12:32:54 +02003384 copied_tables = true;
Joerg Roedel091d42e2015-06-12 11:56:10 +02003385 }
3386 }
3387
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003388 if (!ecap_pass_through(iommu->ecap))
David Woodhouse19943b02009-08-04 16:19:20 +01003389 hw_pass_through = 0;
David Woodhouse8a94ade2015-03-24 14:54:56 +00003390#ifdef CONFIG_INTEL_IOMMU_SVM
Lu Baolu765b6a92018-12-10 09:58:55 +08003391 if (pasid_supported(iommu))
Lu Baolud9737952018-07-14 15:47:02 +08003392 intel_svm_init(iommu);
David Woodhouse8a94ade2015-03-24 14:54:56 +00003393#endif
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003394 }
3395
Joerg Roedela4c34ff2016-06-17 11:29:48 +02003396 /*
3397 * Now that qi is enabled on all iommus, set the root entry and flush
3398 * caches. This is required on some Intel X58 chipsets, otherwise the
3399 * flush_context function will loop forever and the boot hangs.
3400 */
3401 for_each_active_iommu(iommu, drhd) {
3402 iommu_flush_write_buffer(iommu);
3403 iommu_set_root_entry(iommu);
3404 iommu->flush.flush_context(iommu, 0, 0, 0, DMA_CCMD_GLOBAL_INVL);
3405 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
3406 }
3407
David Woodhouse19943b02009-08-04 16:19:20 +01003408 if (iommu_pass_through)
David Woodhousee0fc7e02009-09-30 09:12:17 -07003409 iommu_identity_mapping |= IDENTMAP_ALL;
3410
Suresh Siddhad3f13812011-08-23 17:05:25 -07003411#ifdef CONFIG_INTEL_IOMMU_BROKEN_GFX_WA
David Woodhousee0fc7e02009-09-30 09:12:17 -07003412 iommu_identity_mapping |= IDENTMAP_GFX;
David Woodhouse19943b02009-08-04 16:19:20 +01003413#endif
David Woodhousee0fc7e02009-09-30 09:12:17 -07003414
Ashok Raj21e722c2017-01-30 09:39:53 -08003415 check_tylersburg_isoch();
3416
Joerg Roedel86080cc2015-06-12 12:27:16 +02003417 if (iommu_identity_mapping) {
3418 ret = si_domain_init(hw_pass_through);
3419 if (ret)
3420 goto free_iommu;
3421 }
3422
David Woodhousee0fc7e02009-09-30 09:12:17 -07003423
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003424 /*
Joerg Roedela87f4912015-06-12 12:32:54 +02003425 * If we copied translations from a previous kernel in the kdump
3426 * case, we can not assign the devices to domains now, as that
3427 * would eliminate the old mappings. So skip this part and defer
3428 * the assignment to device driver initialization time.
3429 */
3430 if (copied_tables)
3431 goto domains_done;
3432
3433 /*
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003434 * If pass through is not set or not enabled, setup context entries for
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003435 * identity mappings for rmrr, gfx, and isa and may fall back to static
3436 * identity mapping if iommu_identity_mapping is set.
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003437 */
David Woodhouse19943b02009-08-04 16:19:20 +01003438 if (iommu_identity_mapping) {
3439 ret = iommu_prepare_static_identity_mapping(hw_pass_through);
3440 if (ret) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003441 pr_crit("Failed to setup IOMMU pass-through\n");
Jiang Liu989d51f2014-02-19 14:07:21 +08003442 goto free_iommu;
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003443 }
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003444 }
David Woodhouse19943b02009-08-04 16:19:20 +01003445 /*
3446 * For each rmrr
3447 * for each dev attached to rmrr
3448 * do
3449 * locate drhd for dev, alloc domain for dev
3450 * allocate free domain
3451 * allocate page table entries for rmrr
3452 * if context not allocated for bus
3453 * allocate and init context
3454 * set present in root table for this bus
3455 * init context with domain, translation etc
3456 * endfor
3457 * endfor
3458 */
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003459 pr_info("Setting RMRR:\n");
David Woodhouse19943b02009-08-04 16:19:20 +01003460 for_each_rmrr_units(rmrr) {
Jiang Liub683b232014-02-19 14:07:32 +08003461 /* some BIOSes list non-existent devices in the DMAR table. */
3462 for_each_active_dev_scope(rmrr->devices, rmrr->devices_cnt,
David Woodhouse832bd852014-03-07 15:08:36 +00003463 i, dev) {
David Woodhouse0b9d9752014-03-09 15:48:15 -07003464 ret = iommu_prepare_rmrr_dev(rmrr, dev);
David Woodhouse19943b02009-08-04 16:19:20 +01003465 if (ret)
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003466 pr_err("Mapping reserved region failed\n");
David Woodhouse19943b02009-08-04 16:19:20 +01003467 }
3468 }
3469
3470 iommu_prepare_isa();
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07003471
Joerg Roedela87f4912015-06-12 12:32:54 +02003472domains_done:
3473
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003474 /*
3475 * for each drhd
3476 * enable fault log
3477 * global invalidate context cache
3478 * global invalidate iotlb
3479 * enable translation
3480 */
Jiang Liu7c919772014-01-06 14:18:18 +08003481 for_each_iommu(iommu, drhd) {
Joseph Cihula51a63e62011-03-21 11:04:24 -07003482 if (drhd->ignored) {
3483 /*
3484 * we always have to disable PMRs or DMA may fail on
3485 * this device
3486 */
3487 if (force_on)
Jiang Liu7c919772014-01-06 14:18:18 +08003488 iommu_disable_protect_mem_regions(iommu);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003489 continue;
Joseph Cihula51a63e62011-03-21 11:04:24 -07003490 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003491
3492 iommu_flush_write_buffer(iommu);
3493
David Woodhousea222a7f2015-10-07 23:35:18 +01003494#ifdef CONFIG_INTEL_IOMMU_SVM
Lu Baolu765b6a92018-12-10 09:58:55 +08003495 if (pasid_supported(iommu) && ecap_prs(iommu->ecap)) {
David Woodhousea222a7f2015-10-07 23:35:18 +01003496 ret = intel_svm_enable_prq(iommu);
3497 if (ret)
3498 goto free_iommu;
3499 }
3500#endif
Keshavamurthy, Anil S3460a6d2007-10-21 16:41:54 -07003501 ret = dmar_set_interrupt(iommu);
3502 if (ret)
Jiang Liu989d51f2014-02-19 14:07:21 +08003503 goto free_iommu;
Keshavamurthy, Anil S3460a6d2007-10-21 16:41:54 -07003504
Joerg Roedel8939ddf2015-06-12 14:40:01 +02003505 if (!translation_pre_enabled(iommu))
3506 iommu_enable_translation(iommu);
3507
David Woodhouseb94996c2009-09-19 15:28:12 -07003508 iommu_disable_protect_mem_regions(iommu);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003509 }
3510
3511 return 0;
Jiang Liu989d51f2014-02-19 14:07:21 +08003512
3513free_iommu:
Jiang Liuffebeb42014-11-09 22:48:02 +08003514 for_each_active_iommu(iommu, drhd) {
3515 disable_dmar_iommu(iommu);
Jiang Liua868e6b2014-01-06 14:18:20 +08003516 free_dmar_iommu(iommu);
Jiang Liuffebeb42014-11-09 22:48:02 +08003517 }
Joerg Roedel13cf0172017-08-11 11:40:10 +02003518
Weidong Hand9630fe2008-12-08 11:06:32 +08003519 kfree(g_iommus);
Joerg Roedel13cf0172017-08-11 11:40:10 +02003520
Jiang Liu989d51f2014-02-19 14:07:21 +08003521error:
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003522 return ret;
3523}
3524
David Woodhouse5a5e02a2009-07-04 09:35:44 +01003525/* This takes a number of _MM_ pages, not VTD pages */
Omer Peleg2aac6302016-04-20 11:33:57 +03003526static unsigned long intel_alloc_iova(struct device *dev,
David Woodhouse875764d2009-06-28 21:20:51 +01003527 struct dmar_domain *domain,
3528 unsigned long nrpages, uint64_t dma_mask)
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003529{
Bjorn Helgaase083ea5b2019-02-08 16:06:08 -06003530 unsigned long iova_pfn;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003531
David Woodhouse875764d2009-06-28 21:20:51 +01003532 /* Restrict dma_mask to the width that the iommu can handle */
3533 dma_mask = min_t(uint64_t, DOMAIN_MAX_ADDR(domain->gaw), dma_mask);
Robin Murphy8f6429c2015-07-16 19:40:12 +01003534 /* Ensure we reserve the whole size-aligned region */
3535 nrpages = __roundup_pow_of_two(nrpages);
David Woodhouse875764d2009-06-28 21:20:51 +01003536
3537 if (!dmar_forcedac && dma_mask > DMA_BIT_MASK(32)) {
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003538 /*
3539 * First try to allocate an io virtual address in
Yang Hongyang284901a2009-04-06 19:01:15 -07003540 * DMA_BIT_MASK(32) and if that fails then try allocating
Joe Perches36098012007-12-17 11:40:11 -08003541 * from higher range
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003542 */
Omer Peleg22e2f9f2016-04-20 11:34:11 +03003543 iova_pfn = alloc_iova_fast(&domain->iovad, nrpages,
Tomasz Nowicki538d5b32017-09-20 10:52:02 +02003544 IOVA_PFN(DMA_BIT_MASK(32)), false);
Omer Peleg22e2f9f2016-04-20 11:34:11 +03003545 if (iova_pfn)
3546 return iova_pfn;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003547 }
Tomasz Nowicki538d5b32017-09-20 10:52:02 +02003548 iova_pfn = alloc_iova_fast(&domain->iovad, nrpages,
3549 IOVA_PFN(dma_mask), true);
Omer Peleg22e2f9f2016-04-20 11:34:11 +03003550 if (unlikely(!iova_pfn)) {
Bjorn Helgaas932a6522019-02-08 16:06:00 -06003551 dev_err(dev, "Allocating %ld-page iova failed\n", nrpages);
Omer Peleg2aac6302016-04-20 11:33:57 +03003552 return 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003553 }
3554
Omer Peleg22e2f9f2016-04-20 11:34:11 +03003555 return iova_pfn;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003556}
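
/*
 * Illustrative note (added, not from the original source): a request for
 * 3 pages from a device with a 48-bit dma_mask first has nrpages rounded
 * up to the power of two 4, so the whole size-aligned region is
 * reserved.  Unless dmar_forcedac was set on the command line, the
 * allocation is first attempted below 4 GiB (avoiding dual-address-cycle
 * addresses that some devices and bridges handle poorly) and only falls
 * back to the full 48-bit range when that window is exhausted.
 */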
3557
Lu Baolu9ddbfb42018-07-14 15:46:57 +08003558struct dmar_domain *get_valid_domain_for_dev(struct device *dev)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003559{
Joerg Roedel1c5ebba2016-08-25 13:52:51 +02003560 struct dmar_domain *domain, *tmp;
Joerg Roedelb1ce5b72015-09-23 19:16:01 +02003561 struct dmar_rmrr_unit *rmrr;
Joerg Roedelb1ce5b72015-09-23 19:16:01 +02003562 struct device *i_dev;
3563 int i, ret;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003564
Joerg Roedel1c5ebba2016-08-25 13:52:51 +02003565 domain = find_domain(dev);
3566 if (domain)
3567 goto out;
3568
3569 domain = find_or_alloc_domain(dev, DEFAULT_DOMAIN_ADDRESS_WIDTH);
3570 if (!domain)
3571 goto out;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003572
Joerg Roedelb1ce5b72015-09-23 19:16:01 +02003573 /* We have a new domain - setup possible RMRRs for the device */
3574 rcu_read_lock();
3575 for_each_rmrr_units(rmrr) {
3576 for_each_active_dev_scope(rmrr->devices, rmrr->devices_cnt,
3577 i, i_dev) {
3578 if (i_dev != dev)
3579 continue;
3580
3581 ret = domain_prepare_identity_map(dev, domain,
3582 rmrr->base_address,
3583 rmrr->end_address);
3584 if (ret)
3585 dev_err(dev, "Mapping reserved region failed\n");
3586 }
3587 }
3588 rcu_read_unlock();
3589
Joerg Roedel1c5ebba2016-08-25 13:52:51 +02003590 tmp = set_domain_for_dev(dev, domain);
3591 if (!tmp || domain != tmp) {
3592 domain_exit(domain);
3593 domain = tmp;
3594 }
3595
3596out:
3597
3598 if (!domain)
Bjorn Helgaas932a6522019-02-08 16:06:00 -06003599 dev_err(dev, "Allocating domain failed\n");
Joerg Roedel1c5ebba2016-08-25 13:52:51 +02003600
3601
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003602 return domain;
3603}
3604
David Woodhouseecb509e2014-03-09 16:29:55 -07003605/* Check if the dev needs to go through the non-identity map and unmap process. */
David Woodhouse73676832009-07-04 14:08:36 +01003606static int iommu_no_mapping(struct device *dev)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003607{
3608 int found;
3609
David Woodhouse3d891942014-03-06 15:59:26 +00003610 if (iommu_dummy(dev))
David Woodhouse1e4c64c2009-07-04 10:40:38 +01003611 return 1;
3612
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003613 if (!iommu_identity_mapping)
David Woodhouse1e4c64c2009-07-04 10:40:38 +01003614 return 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003615
David Woodhouse9b226622014-03-09 14:03:28 -07003616 found = identity_mapping(dev);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003617 if (found) {
David Woodhouseecb509e2014-03-09 16:29:55 -07003618 if (iommu_should_identity_map(dev, 0))
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003619 return 1;
3620 else {
3621 /*
 3622 * The 32 bit DMA device is removed from si_domain and falls back
3623 * to non-identity mapping.
3624 */
Bjorn Helgaas71753232019-02-08 16:06:15 -06003625 dmar_remove_one_dev_info(dev);
Bjorn Helgaas932a6522019-02-08 16:06:00 -06003626 dev_info(dev, "32bit DMA uses non-identity mapping\n");
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003627 return 0;
3628 }
3629 } else {
3630 /*
 3631 * In case a 64 bit DMA device is detached from a VM, the device
3632 * is put into si_domain for identity mapping.
3633 */
David Woodhouseecb509e2014-03-09 16:29:55 -07003634 if (iommu_should_identity_map(dev, 0)) {
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003635 int ret;
Joerg Roedel28ccce02015-07-21 14:45:31 +02003636 ret = domain_add_dev_info(si_domain, dev);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003637 if (!ret) {
Bjorn Helgaas932a6522019-02-08 16:06:00 -06003638 dev_info(dev, "64bit DMA uses identity mapping\n");
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003639 return 1;
3640 }
3641 }
3642 }
3643
David Woodhouse1e4c64c2009-07-04 10:40:38 +01003644 return 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003645}
3646
Logan Gunthorpe21d5d272019-01-22 14:30:45 -07003647static dma_addr_t __intel_map_single(struct device *dev, phys_addr_t paddr,
3648 size_t size, int dir, u64 dma_mask)
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003649{
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003650 struct dmar_domain *domain;
Fenghua Yu5b6985c2008-10-16 18:02:32 -07003651 phys_addr_t start_paddr;
Omer Peleg2aac6302016-04-20 11:33:57 +03003652 unsigned long iova_pfn;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003653 int prot = 0;
Ingo Molnar6865f0d2008-04-22 11:09:04 +02003654 int ret;
Weidong Han8c11e792008-12-08 15:29:22 +08003655 struct intel_iommu *iommu;
Fenghua Yu33041ec2009-08-04 15:10:59 -07003656 unsigned long paddr_pfn = paddr >> PAGE_SHIFT;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003657
3658 BUG_ON(dir == DMA_NONE);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003659
David Woodhouse5040a912014-03-09 16:14:00 -07003660 if (iommu_no_mapping(dev))
Ingo Molnar6865f0d2008-04-22 11:09:04 +02003661 return paddr;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003662
David Woodhouse5040a912014-03-09 16:14:00 -07003663 domain = get_valid_domain_for_dev(dev);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003664 if (!domain)
Christoph Hellwig524a6692018-11-21 19:34:10 +01003665 return DMA_MAPPING_ERROR;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003666
Weidong Han8c11e792008-12-08 15:29:22 +08003667 iommu = domain_get_iommu(domain);
David Woodhouse88cb6a72009-06-28 15:03:06 +01003668 size = aligned_nrpages(paddr, size);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003669
Omer Peleg2aac6302016-04-20 11:33:57 +03003670 iova_pfn = intel_alloc_iova(dev, domain, dma_to_mm_pfn(size), dma_mask);
3671 if (!iova_pfn)
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003672 goto error;
3673
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003674 /*
3675 * Check if DMAR supports zero-length reads on write only
3676 * mappings..
3677 */
3678 if (dir == DMA_TO_DEVICE || dir == DMA_BIDIRECTIONAL || \
Weidong Han8c11e792008-12-08 15:29:22 +08003679 !cap_zlr(iommu->cap))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003680 prot |= DMA_PTE_READ;
3681 if (dir == DMA_FROM_DEVICE || dir == DMA_BIDIRECTIONAL)
3682 prot |= DMA_PTE_WRITE;
3683 /*
Ingo Molnar6865f0d2008-04-22 11:09:04 +02003684 * paddr - (paddr + size) might be partial page, we should map the whole
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003685 * page. Note: if two parts of one page are separately mapped, we
Ingo Molnar6865f0d2008-04-22 11:09:04 +02003686 * might have two guest_addr mappings to the same host paddr, but this
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003687 * is not a big problem
3688 */
Omer Peleg2aac6302016-04-20 11:33:57 +03003689 ret = domain_pfn_mapping(domain, mm_to_dma_pfn(iova_pfn),
Fenghua Yu33041ec2009-08-04 15:10:59 -07003690 mm_to_dma_pfn(paddr_pfn), size, prot);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003691 if (ret)
3692 goto error;
3693
Omer Peleg2aac6302016-04-20 11:33:57 +03003694 start_paddr = (phys_addr_t)iova_pfn << PAGE_SHIFT;
David Woodhouse03d6a242009-06-28 15:33:46 +01003695 start_paddr += paddr & ~PAGE_MASK;
3696 return start_paddr;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003697
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003698error:
Omer Peleg2aac6302016-04-20 11:33:57 +03003699 if (iova_pfn)
Omer Peleg22e2f9f2016-04-20 11:34:11 +03003700 free_iova_fast(&domain->iovad, iova_pfn, dma_to_mm_pfn(size));
Bjorn Helgaas932a6522019-02-08 16:06:00 -06003701 dev_err(dev, "Device request: %zx@%llx dir %d --- failed\n",
3702 size, (unsigned long long)paddr, dir);
Christoph Hellwig524a6692018-11-21 19:34:10 +01003703 return DMA_MAPPING_ERROR;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003704}
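
/*
 * Illustrative note (added, not from the original source), assuming
 * aligned_nrpages() rounds the byte span up to whole 4 KiB VT-d pages:
 * mapping paddr = 0x12345678 with size = 0x2000 covers in-page offsets
 * 0x678..0x2677, i.e. 3 pages.  The low offset bits are re-applied after
 * the IOVA allocation, so the handle returned to the driver is
 * (iova_pfn << PAGE_SHIFT) + 0x678 and the device sees the same
 * intra-page offset as the CPU does.
 */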
3705
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09003706static dma_addr_t intel_map_page(struct device *dev, struct page *page,
3707 unsigned long offset, size_t size,
3708 enum dma_data_direction dir,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07003709 unsigned long attrs)
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09003710{
Logan Gunthorpe21d5d272019-01-22 14:30:45 -07003711 return __intel_map_single(dev, page_to_phys(page) + offset, size,
3712 dir, *dev->dma_mask);
3713}
3714
3715static dma_addr_t intel_map_resource(struct device *dev, phys_addr_t phys_addr,
3716 size_t size, enum dma_data_direction dir,
3717 unsigned long attrs)
3718{
3719 return __intel_map_single(dev, phys_addr, size, dir, *dev->dma_mask);
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09003720}
3721
Omer Peleg769530e2016-04-20 11:33:25 +03003722static void intel_unmap(struct device *dev, dma_addr_t dev_addr, size_t size)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003723{
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003724 struct dmar_domain *domain;
David Woodhoused794dc92009-06-28 00:27:49 +01003725 unsigned long start_pfn, last_pfn;
Omer Peleg769530e2016-04-20 11:33:25 +03003726 unsigned long nrpages;
Omer Peleg2aac6302016-04-20 11:33:57 +03003727 unsigned long iova_pfn;
Weidong Han8c11e792008-12-08 15:29:22 +08003728 struct intel_iommu *iommu;
David Woodhouseea8ea462014-03-05 17:09:32 +00003729 struct page *freelist;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003730
David Woodhouse73676832009-07-04 14:08:36 +01003731 if (iommu_no_mapping(dev))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003732 return;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003733
David Woodhouse1525a292014-03-06 16:19:30 +00003734 domain = find_domain(dev);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003735 BUG_ON(!domain);
3736
Weidong Han8c11e792008-12-08 15:29:22 +08003737 iommu = domain_get_iommu(domain);
3738
Omer Peleg2aac6302016-04-20 11:33:57 +03003739 iova_pfn = IOVA_PFN(dev_addr);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003740
Omer Peleg769530e2016-04-20 11:33:25 +03003741 nrpages = aligned_nrpages(dev_addr, size);
Omer Peleg2aac6302016-04-20 11:33:57 +03003742 start_pfn = mm_to_dma_pfn(iova_pfn);
Omer Peleg769530e2016-04-20 11:33:25 +03003743 last_pfn = start_pfn + nrpages - 1;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003744
Bjorn Helgaas932a6522019-02-08 16:06:00 -06003745 dev_dbg(dev, "Device unmapping: pfn %lx-%lx\n", start_pfn, last_pfn);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003746
David Woodhouseea8ea462014-03-05 17:09:32 +00003747 freelist = domain_unmap(domain, start_pfn, last_pfn);
David Woodhoused794dc92009-06-28 00:27:49 +01003748
mark gross5e0d2a62008-03-04 15:22:08 -08003749 if (intel_iommu_strict) {
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02003750 iommu_flush_iotlb_psi(iommu, domain, start_pfn,
Omer Peleg769530e2016-04-20 11:33:25 +03003751 nrpages, !freelist, 0);
mark gross5e0d2a62008-03-04 15:22:08 -08003752 /* free iova */
Omer Peleg22e2f9f2016-04-20 11:34:11 +03003753 free_iova_fast(&domain->iovad, iova_pfn, dma_to_mm_pfn(nrpages));
David Woodhouseea8ea462014-03-05 17:09:32 +00003754 dma_free_pagelist(freelist);
mark gross5e0d2a62008-03-04 15:22:08 -08003755 } else {
Joerg Roedel13cf0172017-08-11 11:40:10 +02003756 queue_iova(&domain->iovad, iova_pfn, nrpages,
3757 (unsigned long)freelist);
mark gross5e0d2a62008-03-04 15:22:08 -08003758 /*
3759	 * Queue up the release of the unmap to save the roughly 1/6th of the
3760	 * CPU time used up by the IOTLB flush operation.
3761 */
mark gross5e0d2a62008-03-04 15:22:08 -08003762 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003763}
3764
Jiang Liud41a4ad2014-07-11 14:19:34 +08003765static void intel_unmap_page(struct device *dev, dma_addr_t dev_addr,
3766 size_t size, enum dma_data_direction dir,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07003767 unsigned long attrs)
Jiang Liud41a4ad2014-07-11 14:19:34 +08003768{
Omer Peleg769530e2016-04-20 11:33:25 +03003769 intel_unmap(dev, dev_addr, size);
Jiang Liud41a4ad2014-07-11 14:19:34 +08003770}
3771
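/*
 * Allocate a coherent DMA buffer: try the contiguous (CMA) allocator when
 * blocking is allowed, fall back to alloc_pages(), zero the memory, and map
 * it bidirectionally with __intel_map_single() against the coherent mask.
 */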
David Woodhouse5040a912014-03-09 16:14:00 -07003772static void *intel_alloc_coherent(struct device *dev, size_t size,
Andrzej Pietrasiewiczbaa676f2012-03-27 14:28:18 +02003773 dma_addr_t *dma_handle, gfp_t flags,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07003774 unsigned long attrs)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003775{
Christoph Hellwig7ec916f2018-07-05 13:29:55 -06003776 struct page *page = NULL;
3777 int order;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003778
Christoph Hellwig7ec916f2018-07-05 13:29:55 -06003779 size = PAGE_ALIGN(size);
3780 order = get_order(size);
Alex Williamsone8bb9102009-11-04 15:59:34 -07003781
Christoph Hellwig7ec916f2018-07-05 13:29:55 -06003782 if (!iommu_no_mapping(dev))
3783 flags &= ~(GFP_DMA | GFP_DMA32);
3784 else if (dev->coherent_dma_mask < dma_get_required_mask(dev)) {
3785 if (dev->coherent_dma_mask < DMA_BIT_MASK(32))
3786 flags |= GFP_DMA;
3787 else
3788 flags |= GFP_DMA32;
3789 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003790
Christoph Hellwig7ec916f2018-07-05 13:29:55 -06003791 if (gfpflags_allow_blocking(flags)) {
3792 unsigned int count = size >> PAGE_SHIFT;
3793
Marek Szyprowskid834c5a2018-08-17 15:49:00 -07003794 page = dma_alloc_from_contiguous(dev, count, order,
3795 flags & __GFP_NOWARN);
Christoph Hellwig7ec916f2018-07-05 13:29:55 -06003796 if (page && iommu_no_mapping(dev) &&
3797 page_to_phys(page) + size > dev->coherent_dma_mask) {
3798 dma_release_from_contiguous(dev, page, count);
3799 page = NULL;
3800 }
3801 }
3802
3803 if (!page)
3804 page = alloc_pages(flags, order);
3805 if (!page)
3806 return NULL;
3807 memset(page_address(page), 0, size);
3808
Logan Gunthorpe21d5d272019-01-22 14:30:45 -07003809 *dma_handle = __intel_map_single(dev, page_to_phys(page), size,
3810 DMA_BIDIRECTIONAL,
3811 dev->coherent_dma_mask);
Christoph Hellwig524a6692018-11-21 19:34:10 +01003812 if (*dma_handle != DMA_MAPPING_ERROR)
Christoph Hellwig7ec916f2018-07-05 13:29:55 -06003813 return page_address(page);
3814 if (!dma_release_from_contiguous(dev, page, size >> PAGE_SHIFT))
3815 __free_pages(page, order);
3816
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003817 return NULL;
3818}
3819
David Woodhouse5040a912014-03-09 16:14:00 -07003820static void intel_free_coherent(struct device *dev, size_t size, void *vaddr,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07003821 dma_addr_t dma_handle, unsigned long attrs)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003822{
Christoph Hellwig7ec916f2018-07-05 13:29:55 -06003823 int order;
3824 struct page *page = virt_to_page(vaddr);
3825
3826 size = PAGE_ALIGN(size);
3827 order = get_order(size);
3828
3829 intel_unmap(dev, dma_handle, size);
3830 if (!dma_release_from_contiguous(dev, page, size >> PAGE_SHIFT))
3831 __free_pages(page, order);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003832}
3833
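/*
 * Unmap a scatterlist: the entries were mapped into one contiguous IOVA
 * range, so sum up the page counts and release the whole range in one call.
 */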
David Woodhouse5040a912014-03-09 16:14:00 -07003834static void intel_unmap_sg(struct device *dev, struct scatterlist *sglist,
FUJITA Tomonorid7ab5c42009-01-28 21:53:18 +09003835 int nelems, enum dma_data_direction dir,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07003836 unsigned long attrs)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003837{
Omer Peleg769530e2016-04-20 11:33:25 +03003838 dma_addr_t startaddr = sg_dma_address(sglist) & PAGE_MASK;
3839 unsigned long nrpages = 0;
3840 struct scatterlist *sg;
3841 int i;
3842
3843 for_each_sg(sglist, sg, nelems, i) {
3844 nrpages += aligned_nrpages(sg_dma_address(sg), sg_dma_len(sg));
3845 }
3846
3847 intel_unmap(dev, startaddr, nrpages << VTD_PAGE_SHIFT);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003848}
3849
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003850static int intel_nontranslate_map_sg(struct device *hddev,
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003851 struct scatterlist *sglist, int nelems, int dir)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003852{
3853 int i;
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003854 struct scatterlist *sg;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003855
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003856 for_each_sg(sglist, sg, nelems, i) {
FUJITA Tomonori12d4d402007-10-23 09:32:25 +02003857 BUG_ON(!sg_page(sg));
Robin Murphy29a90b72017-09-28 15:14:01 +01003858 sg->dma_address = sg_phys(sg);
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003859 sg->dma_length = sg->length;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003860 }
3861 return nelems;
3862}
3863
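/*
 * Map a scatterlist into a single contiguous IOVA range: allocate enough
 * IOVA space for all entries, then map them back to back with
 * domain_sg_mapping(); on failure the partial page tables and the IOVA are
 * torn down again.
 */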
David Woodhouse5040a912014-03-09 16:14:00 -07003864static int intel_map_sg(struct device *dev, struct scatterlist *sglist, int nelems,
Krzysztof Kozlowski00085f12016-08-03 13:46:00 -07003865 enum dma_data_direction dir, unsigned long attrs)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003866{
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003867 int i;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003868 struct dmar_domain *domain;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003869 size_t size = 0;
3870 int prot = 0;
Omer Peleg2aac6302016-04-20 11:33:57 +03003871 unsigned long iova_pfn;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003872 int ret;
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003873 struct scatterlist *sg;
David Woodhouseb536d242009-06-28 14:49:31 +01003874 unsigned long start_vpfn;
Weidong Han8c11e792008-12-08 15:29:22 +08003875 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003876
3877 BUG_ON(dir == DMA_NONE);
David Woodhouse5040a912014-03-09 16:14:00 -07003878 if (iommu_no_mapping(dev))
3879 return intel_nontranslate_map_sg(dev, sglist, nelems, dir);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003880
David Woodhouse5040a912014-03-09 16:14:00 -07003881 domain = get_valid_domain_for_dev(dev);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003882 if (!domain)
3883 return 0;
3884
Weidong Han8c11e792008-12-08 15:29:22 +08003885 iommu = domain_get_iommu(domain);
3886
David Woodhouseb536d242009-06-28 14:49:31 +01003887 for_each_sg(sglist, sg, nelems, i)
David Woodhouse88cb6a72009-06-28 15:03:06 +01003888 size += aligned_nrpages(sg->offset, sg->length);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003889
Omer Peleg2aac6302016-04-20 11:33:57 +03003890 iova_pfn = intel_alloc_iova(dev, domain, dma_to_mm_pfn(size),
David Woodhouse5040a912014-03-09 16:14:00 -07003891 *dev->dma_mask);
Omer Peleg2aac6302016-04-20 11:33:57 +03003892 if (!iova_pfn) {
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003893 sglist->dma_length = 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003894 return 0;
3895 }
3896
3897 /*
3898	 * Check if DMAR supports zero-length reads on write-only
3899	 * mappings.
3900 */
3901	if (dir == DMA_TO_DEVICE || dir == DMA_BIDIRECTIONAL ||
Weidong Han8c11e792008-12-08 15:29:22 +08003902 !cap_zlr(iommu->cap))
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003903 prot |= DMA_PTE_READ;
3904 if (dir == DMA_FROM_DEVICE || dir == DMA_BIDIRECTIONAL)
3905 prot |= DMA_PTE_WRITE;
3906
Omer Peleg2aac6302016-04-20 11:33:57 +03003907 start_vpfn = mm_to_dma_pfn(iova_pfn);
David Woodhousee1605492009-06-29 11:17:38 +01003908
Fenghua Yuf5329592009-08-04 15:09:37 -07003909 ret = domain_sg_mapping(domain, start_vpfn, sglist, size, prot);
David Woodhousee1605492009-06-29 11:17:38 +01003910 if (unlikely(ret)) {
David Woodhousee1605492009-06-29 11:17:38 +01003911 dma_pte_free_pagetable(domain, start_vpfn,
David Dillowbc24c572017-06-28 19:42:23 -07003912 start_vpfn + size - 1,
3913 agaw_to_level(domain->agaw) + 1);
Omer Peleg22e2f9f2016-04-20 11:34:11 +03003914 free_iova_fast(&domain->iovad, iova_pfn, dma_to_mm_pfn(size));
David Woodhousee1605492009-06-29 11:17:38 +01003915 return 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003916 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003917
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003918 return nelems;
3919}
3920
Christoph Hellwig02b4da52018-09-17 19:10:31 +02003921static const struct dma_map_ops intel_dma_ops = {
Andrzej Pietrasiewiczbaa676f2012-03-27 14:28:18 +02003922 .alloc = intel_alloc_coherent,
3923 .free = intel_free_coherent,
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003924 .map_sg = intel_map_sg,
3925 .unmap_sg = intel_unmap_sg,
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09003926 .map_page = intel_map_page,
3927 .unmap_page = intel_unmap_page,
Logan Gunthorpe21d5d272019-01-22 14:30:45 -07003928 .map_resource = intel_map_resource,
3929 .unmap_resource = intel_unmap_page,
Christoph Hellwigfec777c2018-03-19 11:38:15 +01003930 .dma_supported = dma_direct_supported,
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003931};
3932
3933static inline int iommu_domain_cache_init(void)
3934{
3935 int ret = 0;
3936
3937 iommu_domain_cache = kmem_cache_create("iommu_domain",
3938 sizeof(struct dmar_domain),
3939 0,
3940 SLAB_HWCACHE_ALIGN,
3941
3942 NULL);
3943 if (!iommu_domain_cache) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003944 pr_err("Couldn't create iommu_domain cache\n");
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003945 ret = -ENOMEM;
3946 }
3947
3948 return ret;
3949}
3950
3951static inline int iommu_devinfo_cache_init(void)
3952{
3953 int ret = 0;
3954
3955 iommu_devinfo_cache = kmem_cache_create("iommu_devinfo",
3956 sizeof(struct device_domain_info),
3957 0,
3958 SLAB_HWCACHE_ALIGN,
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003959 NULL);
3960 if (!iommu_devinfo_cache) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003961 pr_err("Couldn't create devinfo cache\n");
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003962 ret = -ENOMEM;
3963 }
3964
3965 return ret;
3966}
3967
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003968static int __init iommu_init_mempool(void)
3969{
3970 int ret;
Sakari Ailusae1ff3d2015-07-13 14:31:28 +03003971 ret = iova_cache_get();
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003972 if (ret)
3973 return ret;
3974
3975 ret = iommu_domain_cache_init();
3976 if (ret)
3977 goto domain_error;
3978
3979 ret = iommu_devinfo_cache_init();
3980 if (!ret)
3981 return ret;
3982
3983 kmem_cache_destroy(iommu_domain_cache);
3984domain_error:
Sakari Ailusae1ff3d2015-07-13 14:31:28 +03003985 iova_cache_put();
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003986
3987 return -ENOMEM;
3988}
3989
3990static void __init iommu_exit_mempool(void)
3991{
3992 kmem_cache_destroy(iommu_devinfo_cache);
3993 kmem_cache_destroy(iommu_domain_cache);
Sakari Ailusae1ff3d2015-07-13 14:31:28 +03003994 iova_cache_put();
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003995}
3996
Dan Williams556ab452010-07-23 15:47:56 -07003997static void quirk_ioat_snb_local_iommu(struct pci_dev *pdev)
3998{
3999 struct dmar_drhd_unit *drhd;
4000 u32 vtbar;
4001 int rc;
4002
4003 /* We know that this device on this chipset has its own IOMMU.
4004 * If we find it under a different IOMMU, then the BIOS is lying
4005 * to us. Hope that the IOMMU for this device is actually
4006 * disabled, and it needs no translation...
4007 */
4008 rc = pci_bus_read_config_dword(pdev->bus, PCI_DEVFN(0, 0), 0xb0, &vtbar);
4009 if (rc) {
4010 /* "can't" happen */
4011 dev_info(&pdev->dev, "failed to run vt-d quirk\n");
4012 return;
4013 }
4014 vtbar &= 0xffff0000;
4015
4016	/* we know that this IOMMU should be at offset 0xa000 from vtbar */
4017 drhd = dmar_find_matched_drhd_unit(pdev);
4018 if (WARN_TAINT_ONCE(!drhd || drhd->reg_base_addr - vtbar != 0xa000,
4019 TAINT_FIRMWARE_WORKAROUND,
4020 "BIOS assigned incorrect VT-d unit for Intel(R) QuickData Technology device\n"))
4021 pdev->dev.archdata.iommu = DUMMY_DEVICE_DOMAIN_INFO;
4022}
4023DECLARE_PCI_FIXUP_ENABLE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB, quirk_ioat_snb_local_iommu);
4024
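/*
 * Mark DMAR units that should be ignored: units whose device scope is empty,
 * and graphics-only units when dmar_map_gfx is disabled (their devices are
 * tagged with DUMMY_DEVICE_DOMAIN_INFO so they bypass translation).
 */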
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004025static void __init init_no_remapping_devices(void)
4026{
4027 struct dmar_drhd_unit *drhd;
David Woodhouse832bd852014-03-07 15:08:36 +00004028 struct device *dev;
Jiang Liub683b232014-02-19 14:07:32 +08004029 int i;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004030
4031 for_each_drhd_unit(drhd) {
4032 if (!drhd->include_all) {
Jiang Liub683b232014-02-19 14:07:32 +08004033 for_each_active_dev_scope(drhd->devices,
4034 drhd->devices_cnt, i, dev)
4035 break;
David Woodhouse832bd852014-03-07 15:08:36 +00004036 /* ignore DMAR unit if no devices exist */
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004037 if (i == drhd->devices_cnt)
4038 drhd->ignored = 1;
4039 }
4040 }
4041
Jiang Liu7c919772014-01-06 14:18:18 +08004042 for_each_active_drhd_unit(drhd) {
Jiang Liu7c919772014-01-06 14:18:18 +08004043 if (drhd->include_all)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004044 continue;
4045
Jiang Liub683b232014-02-19 14:07:32 +08004046 for_each_active_dev_scope(drhd->devices,
4047 drhd->devices_cnt, i, dev)
David Woodhouse832bd852014-03-07 15:08:36 +00004048 if (!dev_is_pci(dev) || !IS_GFX_DEVICE(to_pci_dev(dev)))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004049 break;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004050 if (i < drhd->devices_cnt)
4051 continue;
4052
David Woodhousec0771df2011-10-14 20:59:46 +01004053 /* This IOMMU has *only* gfx devices. Either bypass it or
4054 set the gfx_mapped flag, as appropriate */
4055 if (dmar_map_gfx) {
4056 intel_iommu_gfx_mapped = 1;
4057 } else {
4058 drhd->ignored = 1;
Jiang Liub683b232014-02-19 14:07:32 +08004059 for_each_active_dev_scope(drhd->devices,
4060 drhd->devices_cnt, i, dev)
David Woodhouse832bd852014-03-07 15:08:36 +00004061 dev->archdata.iommu = DUMMY_DEVICE_DOMAIN_INFO;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004062 }
4063 }
4064}
4065
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004066#ifdef CONFIG_SUSPEND
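/*
 * Reprogram the IOMMU hardware on resume: re-enable queued invalidation,
 * reinstall the root entry, issue global context and IOTLB invalidations,
 * and turn translation back on for every unit that is not ignored.
 */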
4067static int init_iommu_hw(void)
4068{
4069 struct dmar_drhd_unit *drhd;
4070 struct intel_iommu *iommu = NULL;
4071
4072 for_each_active_iommu(iommu, drhd)
4073 if (iommu->qi)
4074 dmar_reenable_qi(iommu);
4075
Joseph Cihulab7792602011-05-03 00:08:37 -07004076 for_each_iommu(iommu, drhd) {
4077 if (drhd->ignored) {
4078 /*
4079 * we always have to disable PMRs or DMA may fail on
4080 * this device
4081 */
4082 if (force_on)
4083 iommu_disable_protect_mem_regions(iommu);
4084 continue;
4085 }
4086
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004087 iommu_flush_write_buffer(iommu);
4088
4089 iommu_set_root_entry(iommu);
4090
4091 iommu->flush.flush_context(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01004092 DMA_CCMD_GLOBAL_INVL);
Jiang Liu2a41cce2014-07-11 14:19:33 +08004093 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
4094 iommu_enable_translation(iommu);
David Woodhouseb94996c2009-09-19 15:28:12 -07004095 iommu_disable_protect_mem_regions(iommu);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004096 }
4097
4098 return 0;
4099}
4100
4101static void iommu_flush_all(void)
4102{
4103 struct dmar_drhd_unit *drhd;
4104 struct intel_iommu *iommu;
4105
4106 for_each_active_iommu(iommu, drhd) {
4107 iommu->flush.flush_context(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01004108 DMA_CCMD_GLOBAL_INVL);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004109 iommu->flush.flush_iotlb(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01004110 DMA_TLB_GLOBAL_FLUSH);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004111 }
4112}
4113
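/*
 * Suspend path: flush all caches, disable translation, and save the
 * fault-event control/data/address registers of each active IOMMU so they
 * can be restored by iommu_resume().
 */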
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01004114static int iommu_suspend(void)
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004115{
4116 struct dmar_drhd_unit *drhd;
4117 struct intel_iommu *iommu = NULL;
4118 unsigned long flag;
4119
4120 for_each_active_iommu(iommu, drhd) {
Kees Cook6396bb22018-06-12 14:03:40 -07004121 iommu->iommu_state = kcalloc(MAX_SR_DMAR_REGS, sizeof(u32),
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004122 GFP_ATOMIC);
4123 if (!iommu->iommu_state)
4124 goto nomem;
4125 }
4126
4127 iommu_flush_all();
4128
4129 for_each_active_iommu(iommu, drhd) {
4130 iommu_disable_translation(iommu);
4131
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02004132 raw_spin_lock_irqsave(&iommu->register_lock, flag);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004133
4134 iommu->iommu_state[SR_DMAR_FECTL_REG] =
4135 readl(iommu->reg + DMAR_FECTL_REG);
4136 iommu->iommu_state[SR_DMAR_FEDATA_REG] =
4137 readl(iommu->reg + DMAR_FEDATA_REG);
4138 iommu->iommu_state[SR_DMAR_FEADDR_REG] =
4139 readl(iommu->reg + DMAR_FEADDR_REG);
4140 iommu->iommu_state[SR_DMAR_FEUADDR_REG] =
4141 readl(iommu->reg + DMAR_FEUADDR_REG);
4142
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02004143 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004144 }
4145 return 0;
4146
4147nomem:
4148 for_each_active_iommu(iommu, drhd)
4149 kfree(iommu->iommu_state);
4150
4151 return -ENOMEM;
4152}
4153
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01004154static void iommu_resume(void)
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004155{
4156 struct dmar_drhd_unit *drhd;
4157 struct intel_iommu *iommu = NULL;
4158 unsigned long flag;
4159
4160 if (init_iommu_hw()) {
Joseph Cihulab7792602011-05-03 00:08:37 -07004161 if (force_on)
4162 panic("tboot: IOMMU setup failed, DMAR can not resume!\n");
4163 else
4164 WARN(1, "IOMMU setup failed, DMAR can not resume!\n");
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01004165 return;
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004166 }
4167
4168 for_each_active_iommu(iommu, drhd) {
4169
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02004170 raw_spin_lock_irqsave(&iommu->register_lock, flag);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004171
4172 writel(iommu->iommu_state[SR_DMAR_FECTL_REG],
4173 iommu->reg + DMAR_FECTL_REG);
4174 writel(iommu->iommu_state[SR_DMAR_FEDATA_REG],
4175 iommu->reg + DMAR_FEDATA_REG);
4176 writel(iommu->iommu_state[SR_DMAR_FEADDR_REG],
4177 iommu->reg + DMAR_FEADDR_REG);
4178 writel(iommu->iommu_state[SR_DMAR_FEUADDR_REG],
4179 iommu->reg + DMAR_FEUADDR_REG);
4180
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02004181 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004182 }
4183
4184 for_each_active_iommu(iommu, drhd)
4185 kfree(iommu->iommu_state);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004186}
4187
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01004188static struct syscore_ops iommu_syscore_ops = {
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004189 .resume = iommu_resume,
4190 .suspend = iommu_suspend,
4191};
4192
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01004193static void __init init_iommu_pm_ops(void)
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004194{
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01004195 register_syscore_ops(&iommu_syscore_ops);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004196}
4197
4198#else
Rafael J. Wysocki99592ba2011-06-07 21:32:31 +02004199static inline void init_iommu_pm_ops(void) {}
Fenghua Yuf59c7b62009-03-27 14:22:42 -07004200#endif /* CONFIG_PM */
4201
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004202
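/*
 * Parse one RMRR entry of the DMAR table: record the reserved address range,
 * build the matching direct-mapped reserved region and device scope, and add
 * the unit to dmar_rmrr_units.
 */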
Jiang Liuc2a0b532014-11-09 22:47:56 +08004203int __init dmar_parse_one_rmrr(struct acpi_dmar_header *header, void *arg)
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004204{
4205 struct acpi_dmar_reserved_memory *rmrr;
Eric Auger0659b8d2017-01-19 20:57:53 +00004206 int prot = DMA_PTE_READ|DMA_PTE_WRITE;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004207 struct dmar_rmrr_unit *rmrru;
Eric Auger0659b8d2017-01-19 20:57:53 +00004208 size_t length;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004209
4210 rmrru = kzalloc(sizeof(*rmrru), GFP_KERNEL);
4211 if (!rmrru)
Eric Auger0659b8d2017-01-19 20:57:53 +00004212 goto out;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004213
4214 rmrru->hdr = header;
4215 rmrr = (struct acpi_dmar_reserved_memory *)header;
4216 rmrru->base_address = rmrr->base_address;
4217 rmrru->end_address = rmrr->end_address;
Eric Auger0659b8d2017-01-19 20:57:53 +00004218
4219 length = rmrr->end_address - rmrr->base_address + 1;
4220 rmrru->resv = iommu_alloc_resv_region(rmrr->base_address, length, prot,
4221 IOMMU_RESV_DIRECT);
4222 if (!rmrru->resv)
4223 goto free_rmrru;
4224
Jiang Liu2e455282014-02-19 14:07:36 +08004225 rmrru->devices = dmar_alloc_dev_scope((void *)(rmrr + 1),
4226 ((void *)rmrr) + rmrr->header.length,
4227 &rmrru->devices_cnt);
Eric Auger0659b8d2017-01-19 20:57:53 +00004228 if (rmrru->devices_cnt && rmrru->devices == NULL)
4229 goto free_all;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004230
Jiang Liu2e455282014-02-19 14:07:36 +08004231 list_add(&rmrru->list, &dmar_rmrr_units);
4232
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004233 return 0;
Eric Auger0659b8d2017-01-19 20:57:53 +00004234free_all:
4235 kfree(rmrru->resv);
4236free_rmrru:
4237 kfree(rmrru);
4238out:
4239 return -ENOMEM;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004240}
4241
Jiang Liu6b197242014-11-09 22:47:58 +08004242static struct dmar_atsr_unit *dmar_find_atsr(struct acpi_dmar_atsr *atsr)
4243{
4244 struct dmar_atsr_unit *atsru;
4245 struct acpi_dmar_atsr *tmp;
4246
4247 list_for_each_entry_rcu(atsru, &dmar_atsr_units, list) {
4248 tmp = (struct acpi_dmar_atsr *)atsru->hdr;
4249 if (atsr->segment != tmp->segment)
4250 continue;
4251 if (atsr->header.length != tmp->header.length)
4252 continue;
4253 if (memcmp(atsr, tmp, atsr->header.length) == 0)
4254 return atsru;
4255 }
4256
4257 return NULL;
4258}
4259
4260int dmar_parse_one_atsr(struct acpi_dmar_header *hdr, void *arg)
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004261{
4262 struct acpi_dmar_atsr *atsr;
4263 struct dmar_atsr_unit *atsru;
4264
Thomas Gleixnerb608fe32017-05-16 20:42:41 +02004265 if (system_state >= SYSTEM_RUNNING && !intel_iommu_enabled)
Jiang Liu6b197242014-11-09 22:47:58 +08004266 return 0;
4267
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004268 atsr = container_of(hdr, struct acpi_dmar_atsr, header);
Jiang Liu6b197242014-11-09 22:47:58 +08004269 atsru = dmar_find_atsr(atsr);
4270 if (atsru)
4271 return 0;
4272
4273 atsru = kzalloc(sizeof(*atsru) + hdr->length, GFP_KERNEL);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004274 if (!atsru)
4275 return -ENOMEM;
4276
Jiang Liu6b197242014-11-09 22:47:58 +08004277 /*
4278 * If memory is allocated from slab by ACPI _DSM method, we need to
4279 * copy the memory content because the memory buffer will be freed
4280 * on return.
4281 */
4282 atsru->hdr = (void *)(atsru + 1);
4283 memcpy(atsru->hdr, hdr, hdr->length);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004284 atsru->include_all = atsr->flags & 0x1;
Jiang Liu2e455282014-02-19 14:07:36 +08004285 if (!atsru->include_all) {
4286 atsru->devices = dmar_alloc_dev_scope((void *)(atsr + 1),
4287 (void *)atsr + atsr->header.length,
4288 &atsru->devices_cnt);
4289 if (atsru->devices_cnt && atsru->devices == NULL) {
4290 kfree(atsru);
4291 return -ENOMEM;
4292 }
4293 }
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004294
Jiang Liu0e2426122014-02-19 14:07:34 +08004295 list_add_rcu(&atsru->list, &dmar_atsr_units);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004296
4297 return 0;
4298}
4299
Jiang Liu9bdc5312014-01-06 14:18:27 +08004300static void intel_iommu_free_atsr(struct dmar_atsr_unit *atsru)
4301{
4302 dmar_free_dev_scope(&atsru->devices, &atsru->devices_cnt);
4303 kfree(atsru);
4304}
4305
Jiang Liu6b197242014-11-09 22:47:58 +08004306int dmar_release_one_atsr(struct acpi_dmar_header *hdr, void *arg)
4307{
4308 struct acpi_dmar_atsr *atsr;
4309 struct dmar_atsr_unit *atsru;
4310
4311 atsr = container_of(hdr, struct acpi_dmar_atsr, header);
4312 atsru = dmar_find_atsr(atsr);
4313 if (atsru) {
4314 list_del_rcu(&atsru->list);
4315 synchronize_rcu();
4316 intel_iommu_free_atsr(atsru);
4317 }
4318
4319 return 0;
4320}
4321
4322int dmar_check_one_atsr(struct acpi_dmar_header *hdr, void *arg)
4323{
4324 int i;
4325 struct device *dev;
4326 struct acpi_dmar_atsr *atsr;
4327 struct dmar_atsr_unit *atsru;
4328
4329 atsr = container_of(hdr, struct acpi_dmar_atsr, header);
4330 atsru = dmar_find_atsr(atsr);
4331 if (!atsru)
4332 return 0;
4333
Linus Torvalds194dc872016-07-27 20:03:31 -07004334 if (!atsru->include_all && atsru->devices && atsru->devices_cnt) {
Jiang Liu6b197242014-11-09 22:47:58 +08004335 for_each_active_dev_scope(atsru->devices, atsru->devices_cnt,
4336 i, dev)
4337 return -EBUSY;
Linus Torvalds194dc872016-07-27 20:03:31 -07004338 }
Jiang Liu6b197242014-11-09 22:47:58 +08004339
4340 return 0;
4341}
4342
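/*
 * Bring a hot-added DMAR unit online: verify it supports the features the
 * running configuration relies on (pass-through, snooping, superpages), set
 * up its domain IDs, root entry, queued invalidation and interrupt, then
 * enable translation unless the unit is ignored.
 */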
Jiang Liuffebeb42014-11-09 22:48:02 +08004343static int intel_iommu_add(struct dmar_drhd_unit *dmaru)
4344{
Bjorn Helgaase083ea5b2019-02-08 16:06:08 -06004345 int sp, ret;
Jiang Liuffebeb42014-11-09 22:48:02 +08004346 struct intel_iommu *iommu = dmaru->iommu;
4347
4348 if (g_iommus[iommu->seq_id])
4349 return 0;
4350
4351 if (hw_pass_through && !ecap_pass_through(iommu->ecap)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004352 pr_warn("%s: Doesn't support hardware pass through.\n",
Jiang Liuffebeb42014-11-09 22:48:02 +08004353 iommu->name);
4354 return -ENXIO;
4355 }
4356 if (!ecap_sc_support(iommu->ecap) &&
4357 domain_update_iommu_snooping(iommu)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004358 pr_warn("%s: Doesn't support snooping.\n",
Jiang Liuffebeb42014-11-09 22:48:02 +08004359 iommu->name);
4360 return -ENXIO;
4361 }
4362 sp = domain_update_iommu_superpage(iommu) - 1;
4363 if (sp >= 0 && !(cap_super_page_val(iommu->cap) & (1 << sp))) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004364 pr_warn("%s: Doesn't support large page.\n",
Jiang Liuffebeb42014-11-09 22:48:02 +08004365 iommu->name);
4366 return -ENXIO;
4367 }
4368
4369 /*
4370 * Disable translation if already enabled prior to OS handover.
4371 */
4372 if (iommu->gcmd & DMA_GCMD_TE)
4373 iommu_disable_translation(iommu);
4374
4375 g_iommus[iommu->seq_id] = iommu;
4376 ret = iommu_init_domains(iommu);
4377 if (ret == 0)
4378 ret = iommu_alloc_root_entry(iommu);
4379 if (ret)
4380 goto out;
4381
David Woodhouse8a94ade2015-03-24 14:54:56 +00004382#ifdef CONFIG_INTEL_IOMMU_SVM
Lu Baolu765b6a92018-12-10 09:58:55 +08004383 if (pasid_supported(iommu))
Lu Baolud9737952018-07-14 15:47:02 +08004384 intel_svm_init(iommu);
David Woodhouse8a94ade2015-03-24 14:54:56 +00004385#endif
4386
Jiang Liuffebeb42014-11-09 22:48:02 +08004387 if (dmaru->ignored) {
4388 /*
4389 * we always have to disable PMRs or DMA may fail on this device
4390 */
4391 if (force_on)
4392 iommu_disable_protect_mem_regions(iommu);
4393 return 0;
4394 }
4395
4396 intel_iommu_init_qi(iommu);
4397 iommu_flush_write_buffer(iommu);
David Woodhousea222a7f2015-10-07 23:35:18 +01004398
4399#ifdef CONFIG_INTEL_IOMMU_SVM
Lu Baolu765b6a92018-12-10 09:58:55 +08004400 if (pasid_supported(iommu) && ecap_prs(iommu->ecap)) {
David Woodhousea222a7f2015-10-07 23:35:18 +01004401 ret = intel_svm_enable_prq(iommu);
4402 if (ret)
4403 goto disable_iommu;
4404 }
4405#endif
Jiang Liuffebeb42014-11-09 22:48:02 +08004406 ret = dmar_set_interrupt(iommu);
4407 if (ret)
4408 goto disable_iommu;
4409
4410 iommu_set_root_entry(iommu);
4411 iommu->flush.flush_context(iommu, 0, 0, 0, DMA_CCMD_GLOBAL_INVL);
4412 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
4413 iommu_enable_translation(iommu);
4414
Jiang Liuffebeb42014-11-09 22:48:02 +08004415 iommu_disable_protect_mem_regions(iommu);
4416 return 0;
4417
4418disable_iommu:
4419 disable_dmar_iommu(iommu);
4420out:
4421 free_dmar_iommu(iommu);
4422 return ret;
4423}
4424
Jiang Liu6b197242014-11-09 22:47:58 +08004425int dmar_iommu_hotplug(struct dmar_drhd_unit *dmaru, bool insert)
4426{
Jiang Liuffebeb42014-11-09 22:48:02 +08004427 int ret = 0;
4428 struct intel_iommu *iommu = dmaru->iommu;
4429
4430 if (!intel_iommu_enabled)
4431 return 0;
4432 if (iommu == NULL)
4433 return -EINVAL;
4434
4435 if (insert) {
4436 ret = intel_iommu_add(dmaru);
4437 } else {
4438 disable_dmar_iommu(iommu);
4439 free_dmar_iommu(iommu);
4440 }
4441
4442 return ret;
Jiang Liu6b197242014-11-09 22:47:58 +08004443}
4444
Jiang Liu9bdc5312014-01-06 14:18:27 +08004445static void intel_iommu_free_dmars(void)
4446{
4447 struct dmar_rmrr_unit *rmrru, *rmrr_n;
4448 struct dmar_atsr_unit *atsru, *atsr_n;
4449
4450 list_for_each_entry_safe(rmrru, rmrr_n, &dmar_rmrr_units, list) {
4451 list_del(&rmrru->list);
4452 dmar_free_dev_scope(&rmrru->devices, &rmrru->devices_cnt);
Eric Auger0659b8d2017-01-19 20:57:53 +00004453 kfree(rmrru->resv);
Jiang Liu9bdc5312014-01-06 14:18:27 +08004454 kfree(rmrru);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004455 }
4456
Jiang Liu9bdc5312014-01-06 14:18:27 +08004457 list_for_each_entry_safe(atsru, atsr_n, &dmar_atsr_units, list) {
4458 list_del(&atsru->list);
4459 intel_iommu_free_atsr(atsru);
4460 }
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004461}
4462
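/*
 * Decide whether ATS may be used for a PCI device: walk up to its root port
 * (integrated devices are allowed unconditionally) and check whether that
 * port is covered by an ATSR unit for the segment, either explicitly or via
 * an include-all entry.
 */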
4463int dmar_find_matched_atsr_unit(struct pci_dev *dev)
4464{
Jiang Liub683b232014-02-19 14:07:32 +08004465 int i, ret = 1;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004466 struct pci_bus *bus;
David Woodhouse832bd852014-03-07 15:08:36 +00004467 struct pci_dev *bridge = NULL;
4468 struct device *tmp;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004469 struct acpi_dmar_atsr *atsr;
4470 struct dmar_atsr_unit *atsru;
4471
4472 dev = pci_physfn(dev);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004473 for (bus = dev->bus; bus; bus = bus->parent) {
Jiang Liub5f82dd2014-02-19 14:07:31 +08004474 bridge = bus->self;
David Woodhoused14053b32015-10-15 09:28:06 +01004475 /* If it's an integrated device, allow ATS */
4476 if (!bridge)
4477 return 1;
4478 /* Connected via non-PCIe: no ATS */
4479 if (!pci_is_pcie(bridge) ||
Yijing Wang62f87c02012-07-24 17:20:03 +08004480 pci_pcie_type(bridge) == PCI_EXP_TYPE_PCI_BRIDGE)
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004481 return 0;
David Woodhoused14053b32015-10-15 09:28:06 +01004482 /* If we found the root port, look it up in the ATSR */
Jiang Liub5f82dd2014-02-19 14:07:31 +08004483 if (pci_pcie_type(bridge) == PCI_EXP_TYPE_ROOT_PORT)
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004484 break;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004485 }
4486
Jiang Liu0e2426122014-02-19 14:07:34 +08004487 rcu_read_lock();
Jiang Liub5f82dd2014-02-19 14:07:31 +08004488 list_for_each_entry_rcu(atsru, &dmar_atsr_units, list) {
4489 atsr = container_of(atsru->hdr, struct acpi_dmar_atsr, header);
4490 if (atsr->segment != pci_domain_nr(dev->bus))
4491 continue;
4492
Jiang Liub683b232014-02-19 14:07:32 +08004493 for_each_dev_scope(atsru->devices, atsru->devices_cnt, i, tmp)
David Woodhouse832bd852014-03-07 15:08:36 +00004494 if (tmp == &bridge->dev)
Jiang Liub683b232014-02-19 14:07:32 +08004495 goto out;
Jiang Liub5f82dd2014-02-19 14:07:31 +08004496
4497 if (atsru->include_all)
Jiang Liub683b232014-02-19 14:07:32 +08004498 goto out;
Jiang Liub5f82dd2014-02-19 14:07:31 +08004499 }
Jiang Liub683b232014-02-19 14:07:32 +08004500 ret = 0;
4501out:
Jiang Liu0e2426122014-02-19 14:07:34 +08004502 rcu_read_unlock();
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004503
Jiang Liub683b232014-02-19 14:07:32 +08004504 return ret;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004505}
4506
Jiang Liu59ce0512014-02-19 14:07:35 +08004507int dmar_iommu_notify_scope_dev(struct dmar_pci_notify_info *info)
4508{
Bjorn Helgaase083ea5b2019-02-08 16:06:08 -06004509 int ret;
Jiang Liu59ce0512014-02-19 14:07:35 +08004510 struct dmar_rmrr_unit *rmrru;
4511 struct dmar_atsr_unit *atsru;
4512 struct acpi_dmar_atsr *atsr;
4513 struct acpi_dmar_reserved_memory *rmrr;
4514
Thomas Gleixnerb608fe32017-05-16 20:42:41 +02004515 if (!intel_iommu_enabled && system_state >= SYSTEM_RUNNING)
Jiang Liu59ce0512014-02-19 14:07:35 +08004516 return 0;
4517
4518 list_for_each_entry(rmrru, &dmar_rmrr_units, list) {
4519 rmrr = container_of(rmrru->hdr,
4520 struct acpi_dmar_reserved_memory, header);
4521 if (info->event == BUS_NOTIFY_ADD_DEVICE) {
4522 ret = dmar_insert_dev_scope(info, (void *)(rmrr + 1),
4523 ((void *)rmrr) + rmrr->header.length,
4524 rmrr->segment, rmrru->devices,
4525 rmrru->devices_cnt);
Bjorn Helgaase083ea5b2019-02-08 16:06:08 -06004526 if (ret < 0)
Jiang Liu59ce0512014-02-19 14:07:35 +08004527 return ret;
Joerg Roedele6a8c9b2016-02-29 23:49:47 +01004528 } else if (info->event == BUS_NOTIFY_REMOVED_DEVICE) {
Jiang Liu27e24952014-06-20 15:08:06 +08004529 dmar_remove_dev_scope(info, rmrr->segment,
4530 rmrru->devices, rmrru->devices_cnt);
Jiang Liu59ce0512014-02-19 14:07:35 +08004531 }
4532 }
4533
4534 list_for_each_entry(atsru, &dmar_atsr_units, list) {
4535 if (atsru->include_all)
4536 continue;
4537
4538 atsr = container_of(atsru->hdr, struct acpi_dmar_atsr, header);
4539 if (info->event == BUS_NOTIFY_ADD_DEVICE) {
4540 ret = dmar_insert_dev_scope(info, (void *)(atsr + 1),
4541 (void *)atsr + atsr->header.length,
4542 atsr->segment, atsru->devices,
4543 atsru->devices_cnt);
4544 if (ret > 0)
4545 break;
Bjorn Helgaase083ea5b2019-02-08 16:06:08 -06004546 else if (ret < 0)
Jiang Liu59ce0512014-02-19 14:07:35 +08004547 return ret;
Joerg Roedele6a8c9b2016-02-29 23:49:47 +01004548 } else if (info->event == BUS_NOTIFY_REMOVED_DEVICE) {
Jiang Liu59ce0512014-02-19 14:07:35 +08004549 if (dmar_remove_dev_scope(info, atsr->segment,
4550 atsru->devices, atsru->devices_cnt))
4551 break;
4552 }
4553 }
4554
4555 return 0;
4556}
4557
Fenghua Yu99dcade2009-11-11 07:23:06 -08004558/*
4559 * Here we only respond to the action of a device being unbound from its driver.
4560 *
4561 * A newly added device is not attached to its DMAR domain here yet. That will
4562 * happen when the device is first mapped to an IOVA.
4563 */
4564static int device_notifier(struct notifier_block *nb,
4565 unsigned long action, void *data)
4566{
4567 struct device *dev = data;
Fenghua Yu99dcade2009-11-11 07:23:06 -08004568 struct dmar_domain *domain;
4569
David Woodhouse3d891942014-03-06 15:59:26 +00004570 if (iommu_dummy(dev))
David Woodhouse44cd6132009-12-02 10:18:30 +00004571 return 0;
4572
Lu Baolu117266f2019-02-25 10:46:36 +08004573 if (action == BUS_NOTIFY_REMOVED_DEVICE) {
4574 domain = find_domain(dev);
4575 if (!domain)
4576 return 0;
Jiang Liu7e7dfab2014-02-19 14:07:23 +08004577
Lu Baolu117266f2019-02-25 10:46:36 +08004578 dmar_remove_one_dev_info(dev);
4579 if (!domain_type_is_vm_or_si(domain) &&
4580 list_empty(&domain->devices))
4581 domain_exit(domain);
4582 } else if (action == BUS_NOTIFY_ADD_DEVICE) {
4583 if (iommu_should_identity_map(dev, 1))
4584 domain_add_dev_info(si_domain, dev);
4585 }
Alex Williamsona97590e2011-03-04 14:52:16 -07004586
Fenghua Yu99dcade2009-11-11 07:23:06 -08004587 return 0;
4588}
4589
4590static struct notifier_block device_nb = {
4591 .notifier_call = device_notifier,
4592};
4593
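/*
 * Memory hotplug notifier for the static identity (si) domain: identity-map
 * ranges that come online, and unmap, flush and release the IOVAs of ranges
 * that go offline.
 */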
Jiang Liu75f05562014-02-19 14:07:37 +08004594static int intel_iommu_memory_notifier(struct notifier_block *nb,
4595 unsigned long val, void *v)
4596{
4597 struct memory_notify *mhp = v;
4598 unsigned long long start, end;
4599 unsigned long start_vpfn, last_vpfn;
4600
4601 switch (val) {
4602 case MEM_GOING_ONLINE:
4603 start = mhp->start_pfn << PAGE_SHIFT;
4604 end = ((mhp->start_pfn + mhp->nr_pages) << PAGE_SHIFT) - 1;
4605 if (iommu_domain_identity_map(si_domain, start, end)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004606 pr_warn("Failed to build identity map for [%llx-%llx]\n",
Jiang Liu75f05562014-02-19 14:07:37 +08004607 start, end);
4608 return NOTIFY_BAD;
4609 }
4610 break;
4611
4612 case MEM_OFFLINE:
4613 case MEM_CANCEL_ONLINE:
4614 start_vpfn = mm_to_dma_pfn(mhp->start_pfn);
4615 last_vpfn = mm_to_dma_pfn(mhp->start_pfn + mhp->nr_pages - 1);
4616 while (start_vpfn <= last_vpfn) {
4617 struct iova *iova;
4618 struct dmar_drhd_unit *drhd;
4619 struct intel_iommu *iommu;
David Woodhouseea8ea462014-03-05 17:09:32 +00004620 struct page *freelist;
Jiang Liu75f05562014-02-19 14:07:37 +08004621
4622 iova = find_iova(&si_domain->iovad, start_vpfn);
4623 if (iova == NULL) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004624 pr_debug("Failed get IOVA for PFN %lx\n",
Jiang Liu75f05562014-02-19 14:07:37 +08004625 start_vpfn);
4626 break;
4627 }
4628
4629 iova = split_and_remove_iova(&si_domain->iovad, iova,
4630 start_vpfn, last_vpfn);
4631 if (iova == NULL) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004632 pr_warn("Failed to split IOVA PFN [%lx-%lx]\n",
Jiang Liu75f05562014-02-19 14:07:37 +08004633 start_vpfn, last_vpfn);
4634 return NOTIFY_BAD;
4635 }
4636
David Woodhouseea8ea462014-03-05 17:09:32 +00004637 freelist = domain_unmap(si_domain, iova->pfn_lo,
4638 iova->pfn_hi);
4639
Jiang Liu75f05562014-02-19 14:07:37 +08004640 rcu_read_lock();
4641 for_each_active_iommu(iommu, drhd)
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02004642 iommu_flush_iotlb_psi(iommu, si_domain,
Jiang Liua156ef92014-07-11 14:19:36 +08004643 iova->pfn_lo, iova_size(iova),
David Woodhouseea8ea462014-03-05 17:09:32 +00004644 !freelist, 0);
Jiang Liu75f05562014-02-19 14:07:37 +08004645 rcu_read_unlock();
David Woodhouseea8ea462014-03-05 17:09:32 +00004646 dma_free_pagelist(freelist);
Jiang Liu75f05562014-02-19 14:07:37 +08004647
4648 start_vpfn = iova->pfn_hi + 1;
4649 free_iova_mem(iova);
4650 }
4651 break;
4652 }
4653
4654 return NOTIFY_OK;
4655}
4656
4657static struct notifier_block intel_iommu_memory_nb = {
4658 .notifier_call = intel_iommu_memory_notifier,
4659 .priority = 0
4660};
4661
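/*
 * Drain the per-CPU IOVA caches of every domain on every IOMMU when a CPU
 * goes offline, so the cached ranges become allocatable again.
 */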
Omer Peleg22e2f9f2016-04-20 11:34:11 +03004662static void free_all_cpu_cached_iovas(unsigned int cpu)
4663{
4664 int i;
4665
4666 for (i = 0; i < g_num_of_iommus; i++) {
4667 struct intel_iommu *iommu = g_iommus[i];
4668 struct dmar_domain *domain;
Aaron Campbell0caa7612016-07-02 21:23:24 -03004669 int did;
Omer Peleg22e2f9f2016-04-20 11:34:11 +03004670
4671 if (!iommu)
4672 continue;
4673
Jan Niehusmann3bd4f912016-06-06 14:20:11 +02004674 for (did = 0; did < cap_ndoms(iommu->cap); did++) {
Aaron Campbell0caa7612016-07-02 21:23:24 -03004675 domain = get_iommu_domain(iommu, (u16)did);
Omer Peleg22e2f9f2016-04-20 11:34:11 +03004676
4677 if (!domain)
4678 continue;
4679 free_cpu_cached_iovas(cpu, &domain->iovad);
4680 }
4681 }
4682}
4683
Anna-Maria Gleixner21647612016-11-27 00:13:41 +01004684static int intel_iommu_cpu_dead(unsigned int cpu)
Omer Pelegaa473242016-04-20 11:33:02 +03004685{
Anna-Maria Gleixner21647612016-11-27 00:13:41 +01004686 free_all_cpu_cached_iovas(cpu);
Anna-Maria Gleixner21647612016-11-27 00:13:41 +01004687 return 0;
Omer Pelegaa473242016-04-20 11:33:02 +03004688}
4689
Joerg Roedel161b28a2017-03-28 17:04:52 +02004690static void intel_disable_iommus(void)
4691{
4692 struct intel_iommu *iommu = NULL;
4693 struct dmar_drhd_unit *drhd;
4694
4695 for_each_iommu(iommu, drhd)
4696 iommu_disable_translation(iommu);
4697}
4698
Joerg Roedela7fdb6e2017-02-28 13:57:18 +01004699static inline struct intel_iommu *dev_to_intel_iommu(struct device *dev)
4700{
Joerg Roedel2926a2aa2017-08-14 17:19:26 +02004701 struct iommu_device *iommu_dev = dev_to_iommu_device(dev);
4702
4703 return container_of(iommu_dev, struct intel_iommu, iommu);
Joerg Roedela7fdb6e2017-02-28 13:57:18 +01004704}
4705
Alex Williamsona5459cf2014-06-12 16:12:31 -06004706static ssize_t intel_iommu_show_version(struct device *dev,
4707 struct device_attribute *attr,
4708 char *buf)
4709{
Joerg Roedela7fdb6e2017-02-28 13:57:18 +01004710 struct intel_iommu *iommu = dev_to_intel_iommu(dev);
Alex Williamsona5459cf2014-06-12 16:12:31 -06004711 u32 ver = readl(iommu->reg + DMAR_VER_REG);
4712 return sprintf(buf, "%d:%d\n",
4713 DMAR_VER_MAJOR(ver), DMAR_VER_MINOR(ver));
4714}
4715static DEVICE_ATTR(version, S_IRUGO, intel_iommu_show_version, NULL);
4716
4717static ssize_t intel_iommu_show_address(struct device *dev,
4718 struct device_attribute *attr,
4719 char *buf)
4720{
Joerg Roedela7fdb6e2017-02-28 13:57:18 +01004721 struct intel_iommu *iommu = dev_to_intel_iommu(dev);
Alex Williamsona5459cf2014-06-12 16:12:31 -06004722 return sprintf(buf, "%llx\n", iommu->reg_phys);
4723}
4724static DEVICE_ATTR(address, S_IRUGO, intel_iommu_show_address, NULL);
4725
4726static ssize_t intel_iommu_show_cap(struct device *dev,
4727 struct device_attribute *attr,
4728 char *buf)
4729{
Joerg Roedela7fdb6e2017-02-28 13:57:18 +01004730 struct intel_iommu *iommu = dev_to_intel_iommu(dev);
Alex Williamsona5459cf2014-06-12 16:12:31 -06004731 return sprintf(buf, "%llx\n", iommu->cap);
4732}
4733static DEVICE_ATTR(cap, S_IRUGO, intel_iommu_show_cap, NULL);
4734
4735static ssize_t intel_iommu_show_ecap(struct device *dev,
4736 struct device_attribute *attr,
4737 char *buf)
4738{
Joerg Roedela7fdb6e2017-02-28 13:57:18 +01004739 struct intel_iommu *iommu = dev_to_intel_iommu(dev);
Alex Williamsona5459cf2014-06-12 16:12:31 -06004740 return sprintf(buf, "%llx\n", iommu->ecap);
4741}
4742static DEVICE_ATTR(ecap, S_IRUGO, intel_iommu_show_ecap, NULL);
4743
Alex Williamson2238c082015-07-14 15:24:53 -06004744static ssize_t intel_iommu_show_ndoms(struct device *dev,
4745 struct device_attribute *attr,
4746 char *buf)
4747{
Joerg Roedela7fdb6e2017-02-28 13:57:18 +01004748 struct intel_iommu *iommu = dev_to_intel_iommu(dev);
Alex Williamson2238c082015-07-14 15:24:53 -06004749 return sprintf(buf, "%ld\n", cap_ndoms(iommu->cap));
4750}
4751static DEVICE_ATTR(domains_supported, S_IRUGO, intel_iommu_show_ndoms, NULL);
4752
4753static ssize_t intel_iommu_show_ndoms_used(struct device *dev,
4754 struct device_attribute *attr,
4755 char *buf)
4756{
Joerg Roedela7fdb6e2017-02-28 13:57:18 +01004757 struct intel_iommu *iommu = dev_to_intel_iommu(dev);
Alex Williamson2238c082015-07-14 15:24:53 -06004758 return sprintf(buf, "%d\n", bitmap_weight(iommu->domain_ids,
4759 cap_ndoms(iommu->cap)));
4760}
4761static DEVICE_ATTR(domains_used, S_IRUGO, intel_iommu_show_ndoms_used, NULL);
4762
Alex Williamsona5459cf2014-06-12 16:12:31 -06004763static struct attribute *intel_iommu_attrs[] = {
4764 &dev_attr_version.attr,
4765 &dev_attr_address.attr,
4766 &dev_attr_cap.attr,
4767 &dev_attr_ecap.attr,
Alex Williamson2238c082015-07-14 15:24:53 -06004768 &dev_attr_domains_supported.attr,
4769 &dev_attr_domains_used.attr,
Alex Williamsona5459cf2014-06-12 16:12:31 -06004770 NULL,
4771};
4772
4773static struct attribute_group intel_iommu_group = {
4774 .name = "intel-iommu",
4775 .attrs = intel_iommu_attrs,
4776};
4777
4778const struct attribute_group *intel_iommu_groups[] = {
4779 &intel_iommu_group,
4780 NULL,
4781};
4782
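/*
 * Honour the DMAR platform opt-in flag: if the firmware requests DMA
 * protection and an untrusted PCI device is present, force the IOMMU on even
 * if it was disabled on the command line, falling back to identity maps for
 * everything but the untrusted devices when the IOMMU had been disabled.
 */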
Lu Baolu89a60792018-10-23 15:45:01 +08004783static int __init platform_optin_force_iommu(void)
4784{
4785 struct pci_dev *pdev = NULL;
4786 bool has_untrusted_dev = false;
4787
4788 if (!dmar_platform_optin() || no_platform_optin)
4789 return 0;
4790
4791 for_each_pci_dev(pdev) {
4792 if (pdev->untrusted) {
4793 has_untrusted_dev = true;
4794 break;
4795 }
4796 }
4797
4798 if (!has_untrusted_dev)
4799 return 0;
4800
4801 if (no_iommu || dmar_disabled)
4802 pr_info("Intel-IOMMU force enabled due to platform opt in\n");
4803
4804 /*
4805	 * If the Intel IOMMU is disabled by default, we will apply the identity
4806	 * map to all devices except those marked as untrusted.
4807 */
4808 if (dmar_disabled)
4809 iommu_identity_mapping |= IDENTMAP_ALL;
4810
4811 dmar_disabled = 0;
4812#if defined(CONFIG_X86) && defined(CONFIG_SWIOTLB)
4813 swiotlb = 0;
4814#endif
4815 no_iommu = 0;
4816
4817 return 1;
4818}
4819
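/*
 * Main initialization entry point: parse the DMAR tables, initialize the
 * DMAR units and default domains via init_dmars(), install the Intel DMA
 * ops, and register the IOMMUs with sysfs, the IOMMU core, the bus notifier
 * and the CPU and memory hotplug hooks.
 */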
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004820int __init intel_iommu_init(void)
4821{
Jiang Liu9bdc5312014-01-06 14:18:27 +08004822 int ret = -ENODEV;
Takao Indoh3a93c842013-04-23 17:35:03 +09004823 struct dmar_drhd_unit *drhd;
Jiang Liu7c919772014-01-06 14:18:18 +08004824 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004825
Lu Baolu89a60792018-10-23 15:45:01 +08004826 /*
4827 * Intel IOMMU is required for a TXT/tboot launch or platform
4828 * opt in, so enforce that.
4829 */
4830 force_on = tboot_force_iommu() || platform_optin_force_iommu();
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004831
Jiang Liu3a5670e2014-02-19 14:07:33 +08004832 if (iommu_init_mempool()) {
4833 if (force_on)
4834 panic("tboot: Failed to initialize iommu memory\n");
4835 return -ENOMEM;
4836 }
4837
4838 down_write(&dmar_global_lock);
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004839 if (dmar_table_init()) {
4840 if (force_on)
4841 panic("tboot: Failed to initialize DMAR table\n");
Jiang Liu9bdc5312014-01-06 14:18:27 +08004842 goto out_free_dmar;
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004843 }
4844
Suresh Siddhac2c72862011-08-23 17:05:19 -07004845 if (dmar_dev_scope_init() < 0) {
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004846 if (force_on)
4847 panic("tboot: Failed to initialize DMAR device scope\n");
Jiang Liu9bdc5312014-01-06 14:18:27 +08004848 goto out_free_dmar;
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004849 }
Suresh Siddha1886e8a2008-07-10 11:16:37 -07004850
Joerg Roedelec154bf2017-10-06 15:00:53 +02004851 up_write(&dmar_global_lock);
4852
4853 /*
4854 * The bus notifier takes the dmar_global_lock, so lockdep will
4855 * complain later when we register it under the lock.
4856 */
4857 dmar_register_bus_notifier();
4858
4859 down_write(&dmar_global_lock);
4860
Joerg Roedel161b28a2017-03-28 17:04:52 +02004861 if (no_iommu || dmar_disabled) {
4862		 * We exit the function here to ensure the IOMMU's remapping and
Shaohua Libfd20f12017-04-26 09:18:35 -07004863		 * mempool aren't set up, which means that the IOMMU's PMRs
4864		 * won't be disabled via the call to init_dmars(). So disable
4865		 * them explicitly here. The PMRs were set up by tboot prior to
4866 * it explicitly here. The PMRs were setup by tboot prior to
4867 * calling SENTER, but the kernel is expected to reset/tear
4868 * down the PMRs.
4869 */
4870 if (intel_iommu_tboot_noforce) {
4871 for_each_iommu(iommu, drhd)
4872 iommu_disable_protect_mem_regions(iommu);
4873 }
4874
4875 /*
Joerg Roedel161b28a2017-03-28 17:04:52 +02004876 * Make sure the IOMMUs are switched off, even when we
4877 * boot into a kexec kernel and the previous kernel left
4878		 * them enabled.
4879 */
4880 intel_disable_iommus();
Jiang Liu9bdc5312014-01-06 14:18:27 +08004881 goto out_free_dmar;
Joerg Roedel161b28a2017-03-28 17:04:52 +02004882 }
Suresh Siddha2ae21012008-07-10 11:16:43 -07004883
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004884 if (list_empty(&dmar_rmrr_units))
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004885 pr_info("No RMRR found\n");
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004886
4887 if (list_empty(&dmar_atsr_units))
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004888 pr_info("No ATSR found\n");
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004889
Joseph Cihula51a63e62011-03-21 11:04:24 -07004890 if (dmar_init_reserved_ranges()) {
4891 if (force_on)
4892 panic("tboot: Failed to reserve iommu ranges\n");
Jiang Liu3a5670e2014-02-19 14:07:33 +08004893 goto out_free_reserved_range;
Joseph Cihula51a63e62011-03-21 11:04:24 -07004894 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004895
4896 init_no_remapping_devices();
4897
Joseph Cihulab7792602011-05-03 00:08:37 -07004898 ret = init_dmars();
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004899 if (ret) {
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004900 if (force_on)
4901 panic("tboot: Failed to initialize DMARs\n");
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004902 pr_err("Initialization failed\n");
Jiang Liu9bdc5312014-01-06 14:18:27 +08004903 goto out_free_reserved_range;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004904 }
Jiang Liu3a5670e2014-02-19 14:07:33 +08004905 up_write(&dmar_global_lock);
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004906 pr_info("Intel(R) Virtualization Technology for Directed I/O\n");
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004907
Christoph Hellwig4fac8072017-12-24 13:57:08 +01004908#if defined(CONFIG_X86) && defined(CONFIG_SWIOTLB)
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +09004909 swiotlb = 0;
4910#endif
David Woodhouse19943b02009-08-04 16:19:20 +01004911 dma_ops = &intel_dma_ops;
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07004912
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01004913 init_iommu_pm_ops();
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01004914
Joerg Roedel39ab9552017-02-01 16:56:46 +01004915 for_each_active_iommu(iommu, drhd) {
4916 iommu_device_sysfs_add(&iommu->iommu, NULL,
4917 intel_iommu_groups,
4918 "%s", iommu->name);
4919 iommu_device_set_ops(&iommu->iommu, &intel_iommu_ops);
4920 iommu_device_register(&iommu->iommu);
4921 }
Alex Williamsona5459cf2014-06-12 16:12:31 -06004922
Joerg Roedel4236d97d2011-09-06 17:56:07 +02004923 bus_set_iommu(&pci_bus_type, &intel_iommu_ops);
Fenghua Yu99dcade2009-11-11 07:23:06 -08004924 bus_register_notifier(&pci_bus_type, &device_nb);
Jiang Liu75f05562014-02-19 14:07:37 +08004925 if (si_domain && !hw_pass_through)
4926 register_memory_notifier(&intel_iommu_memory_nb);
Anna-Maria Gleixner21647612016-11-27 00:13:41 +01004927 cpuhp_setup_state(CPUHP_IOMMU_INTEL_DEAD, "iommu/intel:dead", NULL,
4928 intel_iommu_cpu_dead);
Eugeni Dodonov8bc1f852011-11-23 16:42:14 -02004929 intel_iommu_enabled = 1;
Sohil Mehtaee2636b2018-09-11 17:11:38 -07004930 intel_iommu_debugfs_init();
Eugeni Dodonov8bc1f852011-11-23 16:42:14 -02004931
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004932 return 0;
Jiang Liu9bdc5312014-01-06 14:18:27 +08004933
4934out_free_reserved_range:
4935 put_iova_domain(&reserved_iova_list);
Jiang Liu9bdc5312014-01-06 14:18:27 +08004936out_free_dmar:
4937 intel_iommu_free_dmars();
Jiang Liu3a5670e2014-02-19 14:07:33 +08004938 up_write(&dmar_global_lock);
4939 iommu_exit_mempool();
Jiang Liu9bdc5312014-01-06 14:18:27 +08004940 return ret;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07004941}
Keshavamurthy, Anil Se8204822007-10-21 16:41:55 -07004942
Joerg Roedel2452d9d2015-07-23 16:20:14 +02004943static int domain_context_clear_one_cb(struct pci_dev *pdev, u16 alias, void *opaque)
Alex Williamson579305f2014-07-03 09:51:43 -06004944{
4945 struct intel_iommu *iommu = opaque;
4946
Joerg Roedel2452d9d2015-07-23 16:20:14 +02004947 domain_context_clear_one(iommu, PCI_BUS_NUM(alias), alias & 0xff);
Alex Williamson579305f2014-07-03 09:51:43 -06004948 return 0;
4949}
4950
4951/*
4952 * NB - intel-iommu lacks any sort of reference counting for the users of
4953 * dependent devices. If multiple endpoints have intersecting dependent
4954 * devices, unbinding the driver from any one of them will possibly leave
4955 * the others unable to operate.
4956 */
Joerg Roedel2452d9d2015-07-23 16:20:14 +02004957static void domain_context_clear(struct intel_iommu *iommu, struct device *dev)
Han, Weidong3199aa62009-02-26 17:31:12 +08004958{
David Woodhouse0bcb3e22014-03-06 17:12:03 +00004959 if (!iommu || !dev || !dev_is_pci(dev))
Han, Weidong3199aa62009-02-26 17:31:12 +08004960 return;
4961
Joerg Roedel2452d9d2015-07-23 16:20:14 +02004962 pci_for_each_dma_alias(to_pci_dev(dev), &domain_context_clear_one_cb, iommu);
Han, Weidong3199aa62009-02-26 17:31:12 +08004963}
4964
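/*
 * Detach a device from its domain with device_domain_lock held: tear down
 * its PASID and context entries, disable its device IOTLB, unlink the
 * device_domain_info, and drop the domain's reference on the IOMMU.
 */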
Joerg Roedel127c7612015-07-23 17:44:46 +02004965static void __dmar_remove_one_dev_info(struct device_domain_info *info)
Weidong Hanc7151a82008-12-08 22:51:37 +08004966{
Weidong Hanc7151a82008-12-08 22:51:37 +08004967 struct intel_iommu *iommu;
4968 unsigned long flags;
Weidong Hanc7151a82008-12-08 22:51:37 +08004969
Joerg Roedel55d94042015-07-22 16:50:40 +02004970 assert_spin_locked(&device_domain_lock);
4971
Joerg Roedelb608ac32015-07-21 18:19:08 +02004972 if (WARN_ON(!info))
Weidong Hanc7151a82008-12-08 22:51:37 +08004973 return;
4974
Joerg Roedel127c7612015-07-23 17:44:46 +02004975 iommu = info->iommu;
4976
4977 if (info->dev) {
Lu Baoluef848b72018-12-10 09:59:01 +08004978 if (dev_is_pci(info->dev) && sm_supported(iommu))
4979 intel_pasid_tear_down_entry(iommu, info->dev,
4980 PASID_RID2PASID);
4981
Joerg Roedel127c7612015-07-23 17:44:46 +02004982 iommu_disable_dev_iotlb(info);
4983 domain_context_clear(iommu, info->dev);
Lu Baolua7fc93f2018-07-14 15:47:00 +08004984 intel_pasid_free_table(info->dev);
Joerg Roedel127c7612015-07-23 17:44:46 +02004985 }
4986
Joerg Roedelb608ac32015-07-21 18:19:08 +02004987 unlink_domain_info(info);
Roland Dreier3e7abe22011-07-20 06:22:21 -07004988
Joerg Roedeld160aca2015-07-22 11:52:53 +02004989 spin_lock_irqsave(&iommu->lock, flags);
Joerg Roedel127c7612015-07-23 17:44:46 +02004990 domain_detach_iommu(info->domain, iommu);
Joerg Roedeld160aca2015-07-22 11:52:53 +02004991 spin_unlock_irqrestore(&iommu->lock, flags);
Joerg Roedel127c7612015-07-23 17:44:46 +02004992
4993 free_devinfo_mem(info);
Weidong Hanc7151a82008-12-08 22:51:37 +08004994}
4995
Bjorn Helgaas71753232019-02-08 16:06:15 -06004996static void dmar_remove_one_dev_info(struct device *dev)
Joerg Roedel55d94042015-07-22 16:50:40 +02004997{
Joerg Roedel127c7612015-07-23 17:44:46 +02004998 struct device_domain_info *info;
Joerg Roedel55d94042015-07-22 16:50:40 +02004999 unsigned long flags;
5000
Weidong Hanc7151a82008-12-08 22:51:37 +08005001 spin_lock_irqsave(&device_domain_lock, flags);
Joerg Roedel127c7612015-07-23 17:44:46 +02005002 info = dev->archdata.iommu;
5003 __dmar_remove_one_dev_info(info);
Weidong Han5e98c4b2008-12-08 23:03:27 +08005004 spin_unlock_irqrestore(&device_domain_lock, flags);
Weidong Han5e98c4b2008-12-08 23:03:27 +08005005}
5006
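/*
 * Initialize a domain created through the IOMMU API: set up its IOVA
 * allocator and reserved ranges, derive the address width/AGAW from the
 * requested guest width, and allocate the top-level page directory.
 */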
5007static int md_domain_init(struct dmar_domain *domain, int guest_width)
5008{
5009 int adjust_width;
5010
Zhen Leiaa3ac942017-09-21 16:52:45 +01005011 init_iova_domain(&domain->iovad, VTD_PAGE_SIZE, IOVA_START_PFN);
Weidong Han5e98c4b2008-12-08 23:03:27 +08005012 domain_reserve_special_ranges(domain);
5013
5014 /* calculate AGAW */
5015 domain->gaw = guest_width;
5016 adjust_width = guestwidth_to_adjustwidth(guest_width);
5017 domain->agaw = width_to_agaw(adjust_width);
5018
Weidong Han5e98c4b2008-12-08 23:03:27 +08005019 domain->iommu_coherency = 0;
Sheng Yangc5b15252009-08-06 13:31:56 +08005020 domain->iommu_snooping = 0;
Youquan Song6dd9a7c2011-05-25 19:13:49 +01005021 domain->iommu_superpage = 0;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08005022 domain->max_addr = 0;
Weidong Han5e98c4b2008-12-08 23:03:27 +08005023
5024 /* always allocate the top pgd */
Suresh Siddha4c923d42009-10-02 11:01:24 -07005025 domain->pgd = (struct dma_pte *)alloc_pgtable_page(domain->nid);
Weidong Han5e98c4b2008-12-08 23:03:27 +08005026 if (!domain->pgd)
5027 return -ENOMEM;
5028 domain_flush_cache(domain, domain->pgd, PAGE_SIZE);
5029 return 0;
5030}
5031
static struct iommu_domain *intel_iommu_domain_alloc(unsigned type)
{
        struct dmar_domain *dmar_domain;
        struct iommu_domain *domain;

        if (type != IOMMU_DOMAIN_UNMANAGED)
                return NULL;

        dmar_domain = alloc_domain(DOMAIN_FLAG_VIRTUAL_MACHINE);
        if (!dmar_domain) {
                pr_err("Can't allocate dmar_domain\n");
                return NULL;
        }
        if (md_domain_init(dmar_domain, DEFAULT_DOMAIN_ADDRESS_WIDTH)) {
                pr_err("Domain initialization failed\n");
                domain_exit(dmar_domain);
                return NULL;
        }
        domain_update_iommu_cap(dmar_domain);

        domain = &dmar_domain->domain;
        domain->geometry.aperture_start = 0;
        domain->geometry.aperture_end   = __DOMAIN_MAX_ADDR(dmar_domain->gaw);
        domain->geometry.force_aperture = true;

        return domain;
}

static void intel_iommu_domain_free(struct iommu_domain *domain)
{
        domain_exit(to_dmar_domain(domain));
}

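/*
 * Attach @dev to @domain.  Devices locked down by an RMRR are refused;
 * any previous attachment is torn down first, and the domain is clamped
 * (dropping page-table levels if necessary) to the address width that
 * the IOMMU behind this device actually supports.
 */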
static int intel_iommu_attach_device(struct iommu_domain *domain,
                                     struct device *dev)
{
        struct dmar_domain *dmar_domain = to_dmar_domain(domain);
        struct intel_iommu *iommu;
        int addr_width;
        u8 bus, devfn;

        if (device_is_rmrr_locked(dev)) {
                dev_warn(dev, "Device is ineligible for IOMMU domain attach due to platform RMRR requirement. Contact your platform vendor.\n");
                return -EPERM;
        }

        /* normally dev is not mapped */
        if (unlikely(domain_context_mapped(dev))) {
                struct dmar_domain *old_domain;

                old_domain = find_domain(dev);
                if (old_domain) {
                        rcu_read_lock();
                        dmar_remove_one_dev_info(dev);
                        rcu_read_unlock();

                        if (!domain_type_is_vm_or_si(old_domain) &&
                            list_empty(&old_domain->devices))
                                domain_exit(old_domain);
                }
        }

        iommu = device_to_iommu(dev, &bus, &devfn);
        if (!iommu)
                return -ENODEV;

        /* check if this iommu agaw is sufficient for max mapped address */
        addr_width = agaw_to_width(iommu->agaw);
        if (addr_width > cap_mgaw(iommu->cap))
                addr_width = cap_mgaw(iommu->cap);

        if (dmar_domain->max_addr > (1LL << addr_width)) {
                dev_err(dev, "%s: iommu width (%d) is not sufficient for the mapped address (%llx)\n",
                        __func__, addr_width, dmar_domain->max_addr);
                return -EFAULT;
        }
        dmar_domain->gaw = addr_width;

        /*
         * Knock out extra levels of page tables if necessary
         */
        while (iommu->agaw < dmar_domain->agaw) {
                struct dma_pte *pte;

                pte = dmar_domain->pgd;
                if (dma_pte_present(pte)) {
                        dmar_domain->pgd = (struct dma_pte *)
                                phys_to_virt(dma_pte_addr(pte));
                        free_pgtable_page(pte);
                }
                dmar_domain->agaw--;
        }

        return domain_add_dev_info(dmar_domain, dev);
}

static void intel_iommu_detach_device(struct iommu_domain *domain,
                                      struct device *dev)
{
        dmar_remove_one_dev_info(dev);
}

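/*
 * Map @size bytes at IOVA @iova to physical address @hpa with the
 * requested protection bits, extending the domain's max_addr bookkeeping
 * and refusing mappings that fall outside the domain's guest address
 * width.
 *
 * Illustrative caller-side sketch (hypothetical driver code, not part of
 * this file) going through the generic IOMMU API, which lands here via
 * intel_iommu_ops.map:
 *
 *      if (iommu_map(dom, iova, phys, SZ_4K, IOMMU_READ | IOMMU_WRITE))
 *              pr_err("mapping failed\n");
 */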
static int intel_iommu_map(struct iommu_domain *domain,
                           unsigned long iova, phys_addr_t hpa,
                           size_t size, int iommu_prot)
{
        struct dmar_domain *dmar_domain = to_dmar_domain(domain);
        u64 max_addr;
        int prot = 0;
        int ret;

        if (iommu_prot & IOMMU_READ)
                prot |= DMA_PTE_READ;
        if (iommu_prot & IOMMU_WRITE)
                prot |= DMA_PTE_WRITE;
        if ((iommu_prot & IOMMU_CACHE) && dmar_domain->iommu_snooping)
                prot |= DMA_PTE_SNP;

        max_addr = iova + size;
        if (dmar_domain->max_addr < max_addr) {
                u64 end;

                /* check if minimum agaw is sufficient for mapped address */
                end = __DOMAIN_MAX_ADDR(dmar_domain->gaw) + 1;
                if (end < max_addr) {
                        pr_err("%s: iommu width (%d) is not sufficient for the mapped address (%llx)\n",
                               __func__, dmar_domain->gaw, max_addr);
                        return -EFAULT;
                }
                dmar_domain->max_addr = max_addr;
        }
        /* Round up size to next multiple of PAGE_SIZE, if it and
           the low bits of hpa would take us onto the next page */
        size = aligned_nrpages(hpa, size);
        ret = domain_pfn_mapping(dmar_domain, iova >> VTD_PAGE_SHIFT,
                                 hpa >> VTD_PAGE_SHIFT, size, prot);
        return ret;
}

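/*
 * Unmap the range starting at @iova.  If the IOVA sits inside a
 * large-page mapping, the whole large page is unmapped, so the returned
 * size may exceed the requested one.  Freed page-table pages are only
 * released after the IOTLB of every IOMMU serving this domain has been
 * flushed.
 */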
static size_t intel_iommu_unmap(struct iommu_domain *domain,
                                unsigned long iova, size_t size)
{
        struct dmar_domain *dmar_domain = to_dmar_domain(domain);
        struct page *freelist = NULL;
        unsigned long start_pfn, last_pfn;
        unsigned int npages;
        int iommu_id, level = 0;

        /* Cope with horrid API which requires us to unmap more than the
           size argument if it happens to be a large-page mapping. */
        BUG_ON(!pfn_to_dma_pte(dmar_domain, iova >> VTD_PAGE_SHIFT, &level));

        if (size < VTD_PAGE_SIZE << level_to_offset_bits(level))
                size = VTD_PAGE_SIZE << level_to_offset_bits(level);

        start_pfn = iova >> VTD_PAGE_SHIFT;
        last_pfn = (iova + size - 1) >> VTD_PAGE_SHIFT;

        freelist = domain_unmap(dmar_domain, start_pfn, last_pfn);

        npages = last_pfn - start_pfn + 1;

        for_each_domain_iommu(iommu_id, dmar_domain)
                iommu_flush_iotlb_psi(g_iommus[iommu_id], dmar_domain,
                                      start_pfn, npages, !freelist, 0);

        dma_free_pagelist(freelist);

        if (dmar_domain->max_addr == iova + size)
                dmar_domain->max_addr = iova;

        return size;
}

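/*
 * Walk the domain's page tables and return the physical address backing
 * @iova, or 0 if no translation is present.  Note that this returns the
 * (possibly large) page frame address; the low offset bits of @iova are
 * not added back in here.
 */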
static phys_addr_t intel_iommu_iova_to_phys(struct iommu_domain *domain,
                                            dma_addr_t iova)
{
        struct dmar_domain *dmar_domain = to_dmar_domain(domain);
        struct dma_pte *pte;
        int level = 0;
        u64 phys = 0;

        pte = pfn_to_dma_pte(dmar_domain, iova >> VTD_PAGE_SHIFT, &level);
        if (pte)
                phys = dma_pte_addr(pte);

        return phys;
}

static bool intel_iommu_capable(enum iommu_cap cap)
{
        if (cap == IOMMU_CAP_CACHE_COHERENCY)
                return domain_update_iommu_snooping(NULL) == 1;
        if (cap == IOMMU_CAP_INTR_REMAP)
                return irq_remapping_enabled == 1;

        return false;
}

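/*
 * Called by the IOMMU core when a device is added: link the device to
 * its IOMMU in sysfs and place it into an IOMMU group.
 */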
static int intel_iommu_add_device(struct device *dev)
{
        struct intel_iommu *iommu;
        struct iommu_group *group;
        u8 bus, devfn;

        iommu = device_to_iommu(dev, &bus, &devfn);
        if (!iommu)
                return -ENODEV;

        iommu_device_link(&iommu->iommu, dev);

        group = iommu_group_get_for_dev(dev);

        if (IS_ERR(group))
                return PTR_ERR(group);

        iommu_group_put(group);
        return 0;
}

static void intel_iommu_remove_device(struct device *dev)
{
        struct intel_iommu *iommu;
        u8 bus, devfn;

        iommu = device_to_iommu(dev, &bus, &devfn);
        if (!iommu)
                return;

        iommu_group_remove_device(dev);

        iommu_device_unlink(&iommu->iommu, dev);
}

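/*
 * Report the reserved regions for @device: every RMRR that names this
 * device, plus the IOAPIC/MSI window as an IOMMU_RESV_MSI region.
 */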
static void intel_iommu_get_resv_regions(struct device *device,
                                         struct list_head *head)
{
        struct iommu_resv_region *reg;
        struct dmar_rmrr_unit *rmrr;
        struct device *i_dev;
        int i;

        rcu_read_lock();
        for_each_rmrr_units(rmrr) {
                for_each_active_dev_scope(rmrr->devices, rmrr->devices_cnt,
                                          i, i_dev) {
                        if (i_dev != device)
                                continue;

                        list_add_tail(&rmrr->resv->list, head);
                }
        }
        rcu_read_unlock();

        reg = iommu_alloc_resv_region(IOAPIC_RANGE_START,
                                      IOAPIC_RANGE_END - IOAPIC_RANGE_START + 1,
                                      0, IOMMU_RESV_MSI);
        if (!reg)
                return;
        list_add_tail(&reg->list, head);
}

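/*
 * Release the list built by intel_iommu_get_resv_regions().  Only the
 * MSI region is allocated per call; the RMRR entries are shared and must
 * not be freed here.
 */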
static void intel_iommu_put_resv_regions(struct device *dev,
                                         struct list_head *head)
{
        struct iommu_resv_region *entry, *next;

        list_for_each_entry_safe(entry, next, head, list) {
                if (entry->type == IOMMU_RESV_MSI)
                        kfree(entry);
        }
}

#ifdef CONFIG_INTEL_IOMMU_SVM
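/*
 * Enable PASID (and hence SVM) use for @sdev's device: make sure the
 * context entry has the PASIDE bit set, flushing the context cache when
 * it is newly set, record the domain-id and source-id in @sdev, and turn
 * on the device's dev-IOTLB features if PASID wasn't already enabled.
 * Takes device_domain_lock and iommu->lock internally.
 */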
int intel_iommu_enable_pasid(struct intel_iommu *iommu, struct intel_svm_dev *sdev)
{
        struct device_domain_info *info;
        struct context_entry *context;
        struct dmar_domain *domain;
        unsigned long flags;
        u64 ctx_lo;
        int ret;

        domain = get_valid_domain_for_dev(sdev->dev);
        if (!domain)
                return -EINVAL;

        spin_lock_irqsave(&device_domain_lock, flags);
        spin_lock(&iommu->lock);

        ret = -EINVAL;
        info = sdev->dev->archdata.iommu;
        if (!info || !info->pasid_supported)
                goto out;

        context = iommu_context_addr(iommu, info->bus, info->devfn, 0);
        if (WARN_ON(!context))
                goto out;

        ctx_lo = context[0].lo;

        sdev->did = domain->iommu_did[iommu->seq_id];
        sdev->sid = PCI_DEVID(info->bus, info->devfn);

        if (!(ctx_lo & CONTEXT_PASIDE)) {
                ctx_lo |= CONTEXT_PASIDE;
                context[0].lo = ctx_lo;
                wmb();
                iommu->flush.flush_context(iommu, sdev->did, sdev->sid,
                                           DMA_CCMD_MASK_NOBIT,
                                           DMA_CCMD_DEVICE_INVL);
        }

        /* Enable PASID support in the device, if it wasn't already */
        if (!info->pasid_enabled)
                iommu_enable_dev_iotlb(info);

        if (info->ats_enabled) {
                sdev->dev_iotlb = 1;
                sdev->qdep = info->ats_qdep;
                if (sdev->qdep >= QI_DEV_EIOTLB_MAX_INVS)
                        sdev->qdep = 0;
        }
        ret = 0;

 out:
        spin_unlock(&iommu->lock);
        spin_unlock_irqrestore(&device_domain_lock, flags);

        return ret;
}

struct intel_iommu *intel_svm_device_to_iommu(struct device *dev)
{
        struct intel_iommu *iommu;
        u8 bus, devfn;

        if (iommu_dummy(dev)) {
                dev_warn(dev,
                         "No IOMMU translation for device; cannot enable SVM\n");
                return NULL;
        }

        iommu = device_to_iommu(dev, &bus, &devfn);
        if (!iommu) {
                dev_err(dev, "No IOMMU for device; cannot enable SVM\n");
                return NULL;
        }

        return iommu;
}
#endif /* CONFIG_INTEL_IOMMU_SVM */

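/*
 * Callbacks that hook this driver into the generic IOMMU core.
 */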
const struct iommu_ops intel_iommu_ops = {
        .capable           = intel_iommu_capable,
        .domain_alloc      = intel_iommu_domain_alloc,
        .domain_free       = intel_iommu_domain_free,
        .attach_dev        = intel_iommu_attach_device,
        .detach_dev        = intel_iommu_detach_device,
        .map               = intel_iommu_map,
        .unmap             = intel_iommu_unmap,
        .iova_to_phys      = intel_iommu_iova_to_phys,
        .add_device        = intel_iommu_add_device,
        .remove_device     = intel_iommu_remove_device,
        .get_resv_regions  = intel_iommu_get_resv_regions,
        .put_resv_regions  = intel_iommu_put_resv_regions,
        .device_group      = pci_device_group,
        .pgsize_bitmap     = INTEL_IOMMU_PGSIZES,
};

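/*
 * PCI quirks for chipsets whose VT-d support for graphics is known to be
 * broken or incomplete.
 */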
static void quirk_iommu_g4x_gfx(struct pci_dev *dev)
{
        /* G4x/GM45 integrated gfx dmar support is totally busted. */
        pci_info(dev, "Disabling IOMMU for graphics on this chipset\n");
        dmar_map_gfx = 0;
}

DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2a40, quirk_iommu_g4x_gfx);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e00, quirk_iommu_g4x_gfx);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e10, quirk_iommu_g4x_gfx);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e20, quirk_iommu_g4x_gfx);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e30, quirk_iommu_g4x_gfx);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e40, quirk_iommu_g4x_gfx);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e90, quirk_iommu_g4x_gfx);

static void quirk_iommu_rwbf(struct pci_dev *dev)
{
        /*
         * Mobile 4 Series Chipset neglects to set RWBF capability,
         * but needs it. Same seems to hold for the desktop versions.
         */
        pci_info(dev, "Forcing write-buffer flush capability\n");
        rwbf_quirk = 1;
}

DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2a40, quirk_iommu_rwbf);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e00, quirk_iommu_rwbf);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e10, quirk_iommu_rwbf);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e20, quirk_iommu_rwbf);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e30, quirk_iommu_rwbf);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e40, quirk_iommu_rwbf);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e90, quirk_iommu_rwbf);

#define GGC 0x52
#define GGC_MEMORY_SIZE_MASK    (0xf << 8)
#define GGC_MEMORY_SIZE_NONE    (0x0 << 8)
#define GGC_MEMORY_SIZE_1M      (0x1 << 8)
#define GGC_MEMORY_SIZE_2M      (0x3 << 8)
#define GGC_MEMORY_VT_ENABLED   (0x8 << 8)
#define GGC_MEMORY_SIZE_2M_VT   (0x9 << 8)
#define GGC_MEMORY_SIZE_3M_VT   (0xa << 8)
#define GGC_MEMORY_SIZE_4M_VT   (0xb << 8)

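/*
 * On Calpella/Ironlake integrated graphics, if the BIOS allocated no
 * shadow GTT the IOMMU cannot remap graphics DMA at all, so disable it;
 * otherwise force strict (unbatched) IOTLB flushing, since the gfx
 * device has to be idle before a flush on these chipsets.
 */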
static void quirk_calpella_no_shadow_gtt(struct pci_dev *dev)
{
        unsigned short ggc;

        if (pci_read_config_word(dev, GGC, &ggc))
                return;

        if (!(ggc & GGC_MEMORY_VT_ENABLED)) {
                pci_info(dev, "BIOS has allocated no shadow GTT; disabling IOMMU for graphics\n");
                dmar_map_gfx = 0;
        } else if (dmar_map_gfx) {
                /* we have to ensure the gfx device is idle before we flush */
                pci_info(dev, "Disabling batched IOTLB flush on Ironlake\n");
                intel_iommu_strict = 1;
        }
}
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x0040, quirk_calpella_no_shadow_gtt);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x0044, quirk_calpella_no_shadow_gtt);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x0062, quirk_calpella_no_shadow_gtt);
DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x006a, quirk_calpella_no_shadow_gtt);

/* On Tylersburg chipsets, some BIOSes have been known to enable the
   ISOCH DMAR unit for the Azalia sound device, but not give it any
   TLB entries, which causes it to deadlock. Check for that. We do
   this in a function called from init_dmars(), instead of in a PCI
   quirk, because we don't want to print the obnoxious "BIOS broken"
   message if VT-d is actually disabled.
*/
static void __init check_tylersburg_isoch(void)
{
        struct pci_dev *pdev;
        uint32_t vtisochctrl;

        /* If there's no Azalia in the system anyway, forget it. */
        pdev = pci_get_device(PCI_VENDOR_ID_INTEL, 0x3a3e, NULL);
        if (!pdev)
                return;
        pci_dev_put(pdev);

        /* System Management Registers. Might be hidden, in which case
           we can't do the sanity check. But that's OK, because the
           known-broken BIOSes _don't_ actually hide it, so far. */
        pdev = pci_get_device(PCI_VENDOR_ID_INTEL, 0x342e, NULL);
        if (!pdev)
                return;

        if (pci_read_config_dword(pdev, 0x188, &vtisochctrl)) {
                pci_dev_put(pdev);
                return;
        }

        pci_dev_put(pdev);

        /* If Azalia DMA is routed to the non-isoch DMAR unit, fine. */
        if (vtisochctrl & 1)
                return;

        /* Drop all bits other than the number of TLB entries */
        vtisochctrl &= 0x1c;

        /* If we have the recommended number of TLB entries (16), fine. */
        if (vtisochctrl == 0x10)
                return;

        /* Zero TLB entries? You get to ride the short bus to school. */
        if (!vtisochctrl) {
                WARN(1, "Your BIOS is broken; DMA routed to ISOCH DMAR unit but no TLB space.\n"
                     "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
                     dmi_get_system_info(DMI_BIOS_VENDOR),
                     dmi_get_system_info(DMI_BIOS_VERSION),
                     dmi_get_system_info(DMI_PRODUCT_VERSION));
                iommu_identity_mapping |= IDENTMAP_AZALIA;
                return;
        }

        pr_warn("Recommended TLB entries for ISOCH unit is 16; your BIOS set %d\n",
                vtisochctrl);
}