blob: a0ac7197ffddf55524583e86f6bc7980f1b5e7dc [file] [log] [blame]
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001/*
2 * Copyright (c) 2006, Intel Corporation.
3 *
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms and conditions of the GNU General Public License,
6 * version 2, as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope it will be useful, but WITHOUT
9 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
11 * more details.
12 *
13 * You should have received a copy of the GNU General Public License along with
14 * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
15 * Place - Suite 330, Boston, MA 02111-1307 USA.
16 *
mark gross98bcef52008-02-23 15:23:35 -080017 * Copyright (C) 2006-2008 Intel Corporation
18 * Author: Ashok Raj <ashok.raj@intel.com>
19 * Author: Shaohua Li <shaohua.li@intel.com>
20 * Author: Anil S Keshavamurthy <anil.s.keshavamurthy@intel.com>
Fenghua Yu5b6985c2008-10-16 18:02:32 -070021 * Author: Fenghua Yu <fenghua.yu@intel.com>
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -070022 */
23
24#include <linux/init.h>
25#include <linux/bitmap.h>
mark gross5e0d2a62008-03-04 15:22:08 -080026#include <linux/debugfs.h>
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -070027#include <linux/slab.h>
28#include <linux/irq.h>
29#include <linux/interrupt.h>
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -070030#include <linux/spinlock.h>
31#include <linux/pci.h>
32#include <linux/dmar.h>
33#include <linux/dma-mapping.h>
34#include <linux/mempool.h>
mark gross5e0d2a62008-03-04 15:22:08 -080035#include <linux/timer.h>
Kay, Allen M38717942008-09-09 18:37:29 +030036#include <linux/iova.h>
Joerg Roedel5d450802008-12-03 14:52:32 +010037#include <linux/iommu.h>
Kay, Allen M38717942008-09-09 18:37:29 +030038#include <linux/intel-iommu.h>
Fenghua Yuf59c7b62009-03-27 14:22:42 -070039#include <linux/sysdev.h>
Shane Wang69575d32009-09-01 18:25:07 -070040#include <linux/tboot.h>
Stephen Rothwelladb2fe02009-08-31 15:24:23 +100041#include <linux/dmi.h>
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -070042#include <asm/cacheflush.h>
FUJITA Tomonori46a7fa22008-07-11 10:23:42 +090043#include <asm/iommu.h>
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -070044#include "pci.h"
45
Fenghua Yu5b6985c2008-10-16 18:02:32 -070046#define ROOT_SIZE VTD_PAGE_SIZE
47#define CONTEXT_SIZE VTD_PAGE_SIZE
48
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -070049#define IS_GFX_DEVICE(pdev) ((pdev->class >> 16) == PCI_BASE_CLASS_DISPLAY)
50#define IS_ISA_DEVICE(pdev) ((pdev->class >> 8) == PCI_CLASS_BRIDGE_ISA)
David Woodhousee0fc7e02009-09-30 09:12:17 -070051#define IS_AZALIA(pdev) ((pdev)->vendor == 0x8086 && (pdev)->device == 0x3a3e)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -070052
53#define IOAPIC_RANGE_START (0xfee00000)
54#define IOAPIC_RANGE_END (0xfeefffff)
55#define IOVA_START_ADDR (0x1000)
56
57#define DEFAULT_DOMAIN_ADDRESS_WIDTH 48
58
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -070059#define MAX_AGAW_WIDTH 64
60
David Woodhouse2ebe3152009-09-19 07:34:04 -070061#define __DOMAIN_MAX_PFN(gaw) ((((uint64_t)1) << (gaw-VTD_PAGE_SHIFT)) - 1)
62#define __DOMAIN_MAX_ADDR(gaw) ((((uint64_t)1) << gaw) - 1)
63
64/* We limit DOMAIN_MAX_PFN to fit in an unsigned long, and DOMAIN_MAX_ADDR
65 to match. That way, we can use 'unsigned long' for PFNs with impunity. */
66#define DOMAIN_MAX_PFN(gaw) ((unsigned long) min_t(uint64_t, \
67 __DOMAIN_MAX_PFN(gaw), (unsigned long)-1))
68#define DOMAIN_MAX_ADDR(gaw) (((uint64_t)__DOMAIN_MAX_PFN(gaw)) << VTD_PAGE_SHIFT)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -070069
Mark McLoughlinf27be032008-11-20 15:49:43 +000070#define IOVA_PFN(addr) ((addr) >> PAGE_SHIFT)
Yang Hongyang284901a2009-04-06 19:01:15 -070071#define DMA_32BIT_PFN IOVA_PFN(DMA_BIT_MASK(32))
Yang Hongyang6a355282009-04-06 19:01:13 -070072#define DMA_64BIT_PFN IOVA_PFN(DMA_BIT_MASK(64))
mark gross5e0d2a62008-03-04 15:22:08 -080073
David Woodhousefd18de52009-05-10 23:57:41 +010074
David Woodhousedd4e8312009-06-27 16:21:20 +010075/* VT-d pages must always be _smaller_ than MM pages. Otherwise things
76 are never going to work. */
77static inline unsigned long dma_to_mm_pfn(unsigned long dma_pfn)
78{
79 return dma_pfn >> (PAGE_SHIFT - VTD_PAGE_SHIFT);
80}
81
82static inline unsigned long mm_to_dma_pfn(unsigned long mm_pfn)
83{
84 return mm_pfn << (PAGE_SHIFT - VTD_PAGE_SHIFT);
85}
86static inline unsigned long page_to_dma_pfn(struct page *pg)
87{
88 return mm_to_dma_pfn(page_to_pfn(pg));
89}
90static inline unsigned long virt_to_dma_pfn(void *p)
91{
92 return page_to_dma_pfn(virt_to_page(p));
93}
94
Weidong Hand9630fe2008-12-08 11:06:32 +080095/* global iommu list, set NULL for ignored DMAR units */
96static struct intel_iommu **g_iommus;
97
David Woodhousee0fc7e02009-09-30 09:12:17 -070098static void __init check_tylersburg_isoch(void);
David Woodhouse9af88142009-02-13 23:18:03 +000099static int rwbf_quirk;
100
Mark McLoughlin46b08e12008-11-20 15:49:44 +0000101/*
102 * 0: Present
103 * 1-11: Reserved
104 * 12-63: Context Ptr (12 - (haw-1))
105 * 64-127: Reserved
106 */
107struct root_entry {
108 u64 val;
109 u64 rsvd1;
110};
111#define ROOT_ENTRY_NR (VTD_PAGE_SIZE/sizeof(struct root_entry))
112static inline bool root_present(struct root_entry *root)
113{
114 return (root->val & 1);
115}
116static inline void set_root_present(struct root_entry *root)
117{
118 root->val |= 1;
119}
120static inline void set_root_value(struct root_entry *root, unsigned long value)
121{
122 root->val |= value & VTD_PAGE_MASK;
123}
124
125static inline struct context_entry *
126get_context_addr_from_root(struct root_entry *root)
127{
128 return (struct context_entry *)
129 (root_present(root)?phys_to_virt(
130 root->val & VTD_PAGE_MASK) :
131 NULL);
132}
133
Mark McLoughlin7a8fc252008-11-20 15:49:45 +0000134/*
135 * low 64 bits:
136 * 0: present
137 * 1: fault processing disable
138 * 2-3: translation type
139 * 12-63: address space root
140 * high 64 bits:
141 * 0-2: address width
142 * 3-6: aval
143 * 8-23: domain id
144 */
145struct context_entry {
146 u64 lo;
147 u64 hi;
148};
Mark McLoughlin7a8fc252008-11-20 15:49:45 +0000149
Mark McLoughlinc07e7d22008-11-21 16:54:46 +0000150static inline bool context_present(struct context_entry *context)
151{
152 return (context->lo & 1);
153}
154static inline void context_set_present(struct context_entry *context)
155{
156 context->lo |= 1;
157}
158
159static inline void context_set_fault_enable(struct context_entry *context)
160{
161 context->lo &= (((u64)-1) << 2) | 1;
162}
163
Mark McLoughlinc07e7d22008-11-21 16:54:46 +0000164static inline void context_set_translation_type(struct context_entry *context,
165 unsigned long value)
166{
167 context->lo &= (((u64)-1) << 4) | 3;
168 context->lo |= (value & 3) << 2;
169}
170
171static inline void context_set_address_root(struct context_entry *context,
172 unsigned long value)
173{
174 context->lo |= value & VTD_PAGE_MASK;
175}
176
177static inline void context_set_address_width(struct context_entry *context,
178 unsigned long value)
179{
180 context->hi |= value & 7;
181}
182
183static inline void context_set_domain_id(struct context_entry *context,
184 unsigned long value)
185{
186 context->hi |= (value & ((1 << 16) - 1)) << 8;
187}
188
189static inline void context_clear_entry(struct context_entry *context)
190{
191 context->lo = 0;
192 context->hi = 0;
193}
Mark McLoughlin7a8fc252008-11-20 15:49:45 +0000194
Mark McLoughlin622ba122008-11-20 15:49:46 +0000195/*
196 * 0: readable
197 * 1: writable
198 * 2-6: reserved
199 * 7: super page
Sheng Yang9cf06692009-03-18 15:33:07 +0800200 * 8-10: available
201 * 11: snoop behavior
Mark McLoughlin622ba122008-11-20 15:49:46 +0000202 * 12-63: Host physcial address
203 */
204struct dma_pte {
205 u64 val;
206};
Mark McLoughlin622ba122008-11-20 15:49:46 +0000207
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000208static inline void dma_clear_pte(struct dma_pte *pte)
209{
210 pte->val = 0;
211}
212
213static inline void dma_set_pte_readable(struct dma_pte *pte)
214{
215 pte->val |= DMA_PTE_READ;
216}
217
218static inline void dma_set_pte_writable(struct dma_pte *pte)
219{
220 pte->val |= DMA_PTE_WRITE;
221}
222
Sheng Yang9cf06692009-03-18 15:33:07 +0800223static inline void dma_set_pte_snp(struct dma_pte *pte)
224{
225 pte->val |= DMA_PTE_SNP;
226}
227
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000228static inline void dma_set_pte_prot(struct dma_pte *pte, unsigned long prot)
229{
230 pte->val = (pte->val & ~3) | (prot & 3);
231}
232
233static inline u64 dma_pte_addr(struct dma_pte *pte)
234{
David Woodhousec85994e2009-07-01 19:21:24 +0100235#ifdef CONFIG_64BIT
236 return pte->val & VTD_PAGE_MASK;
237#else
238 /* Must have a full atomic 64-bit read */
239 return __cmpxchg64(pte, 0ULL, 0ULL) & VTD_PAGE_MASK;
240#endif
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000241}
242
David Woodhousedd4e8312009-06-27 16:21:20 +0100243static inline void dma_set_pte_pfn(struct dma_pte *pte, unsigned long pfn)
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000244{
David Woodhousedd4e8312009-06-27 16:21:20 +0100245 pte->val |= (uint64_t)pfn << VTD_PAGE_SHIFT;
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000246}
247
248static inline bool dma_pte_present(struct dma_pte *pte)
249{
250 return (pte->val & 3) != 0;
251}
Mark McLoughlin622ba122008-11-20 15:49:46 +0000252
David Woodhouse75e6bf92009-07-02 11:21:16 +0100253static inline int first_pte_in_page(struct dma_pte *pte)
254{
255 return !((unsigned long)pte & ~VTD_PAGE_MASK);
256}
257
Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700258/*
259 * This domain is a statically identity mapping domain.
260 * 1. This domain creats a static 1:1 mapping to all usable memory.
261 * 2. It maps to each iommu if successful.
262 * 3. Each iommu mapps to this domain if successful.
263 */
David Woodhouse19943b02009-08-04 16:19:20 +0100264static struct dmar_domain *si_domain;
265static int hw_pass_through = 1;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700266
Weidong Han3b5410e2008-12-08 09:17:15 +0800267/* devices under the same p2p bridge are owned in one domain */
Mike Daycdc7b832008-12-12 17:16:30 +0100268#define DOMAIN_FLAG_P2P_MULTIPLE_DEVICES (1 << 0)
Weidong Han3b5410e2008-12-08 09:17:15 +0800269
Weidong Han1ce28fe2008-12-08 16:35:39 +0800270/* domain represents a virtual machine, more than one devices
271 * across iommus may be owned in one domain, e.g. kvm guest.
272 */
273#define DOMAIN_FLAG_VIRTUAL_MACHINE (1 << 1)
274
Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700275/* si_domain contains mulitple devices */
276#define DOMAIN_FLAG_STATIC_IDENTITY (1 << 2)
277
Mark McLoughlin99126f72008-11-20 15:49:47 +0000278struct dmar_domain {
279 int id; /* domain id */
Suresh Siddha4c923d42009-10-02 11:01:24 -0700280 int nid; /* node id */
Weidong Han8c11e792008-12-08 15:29:22 +0800281 unsigned long iommu_bmp; /* bitmap of iommus this domain uses*/
Mark McLoughlin99126f72008-11-20 15:49:47 +0000282
283 struct list_head devices; /* all devices' list */
284 struct iova_domain iovad; /* iova's that belong to this domain */
285
286 struct dma_pte *pgd; /* virtual address */
Mark McLoughlin99126f72008-11-20 15:49:47 +0000287 int gaw; /* max guest address width */
288
289 /* adjusted guest address width, 0 is level 2 30-bit */
290 int agaw;
291
Weidong Han3b5410e2008-12-08 09:17:15 +0800292 int flags; /* flags to find out type of domain */
Weidong Han8e6040972008-12-08 15:49:06 +0800293
294 int iommu_coherency;/* indicate coherency of iommu access */
Sheng Yang58c610b2009-03-18 15:33:05 +0800295 int iommu_snooping; /* indicate snooping control feature*/
Weidong Hanc7151a82008-12-08 22:51:37 +0800296 int iommu_count; /* reference count of iommu */
297 spinlock_t iommu_lock; /* protect iommu set in domain */
Weidong Hanfe40f1e2008-12-08 23:10:23 +0800298 u64 max_addr; /* maximum mapped address */
Mark McLoughlin99126f72008-11-20 15:49:47 +0000299};
300
Mark McLoughlina647dacb2008-11-20 15:49:48 +0000301/* PCI domain-device relationship */
302struct device_domain_info {
303 struct list_head link; /* link to domain siblings */
304 struct list_head global; /* link to global list */
David Woodhouse276dbf992009-04-04 01:45:37 +0100305 int segment; /* PCI domain */
306 u8 bus; /* PCI bus number */
Mark McLoughlina647dacb2008-11-20 15:49:48 +0000307 u8 devfn; /* PCI devfn number */
Stefan Assmann45e829e2009-12-03 06:49:24 -0500308 struct pci_dev *dev; /* it's NULL for PCIe-to-PCI bridge */
Yu Zhao93a23a72009-05-18 13:51:37 +0800309 struct intel_iommu *iommu; /* IOMMU used by this device */
Mark McLoughlina647dacb2008-11-20 15:49:48 +0000310 struct dmar_domain *domain; /* pointer to domain */
311};
312
mark gross5e0d2a62008-03-04 15:22:08 -0800313static void flush_unmaps_timeout(unsigned long data);
314
315DEFINE_TIMER(unmap_timer, flush_unmaps_timeout, 0, 0);
316
mark gross80b20dd2008-04-18 13:53:58 -0700317#define HIGH_WATER_MARK 250
318struct deferred_flush_tables {
319 int next;
320 struct iova *iova[HIGH_WATER_MARK];
321 struct dmar_domain *domain[HIGH_WATER_MARK];
322};
323
324static struct deferred_flush_tables *deferred_flush;
325
mark gross5e0d2a62008-03-04 15:22:08 -0800326/* bitmap for indexing intel_iommus */
mark gross5e0d2a62008-03-04 15:22:08 -0800327static int g_num_of_iommus;
328
329static DEFINE_SPINLOCK(async_umap_flush_lock);
330static LIST_HEAD(unmaps_to_do);
331
332static int timer_on;
333static long list_size;
mark gross5e0d2a62008-03-04 15:22:08 -0800334
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700335static void domain_remove_dev_info(struct dmar_domain *domain);
336
Kyle McMartin0cd5c3c2009-02-04 14:29:19 -0800337#ifdef CONFIG_DMAR_DEFAULT_ON
338int dmar_disabled = 0;
339#else
340int dmar_disabled = 1;
341#endif /*CONFIG_DMAR_DEFAULT_ON*/
342
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700343static int __initdata dmar_map_gfx = 1;
Keshavamurthy, Anil S7d3b03c2007-10-21 16:41:53 -0700344static int dmar_forcedac;
mark gross5e0d2a62008-03-04 15:22:08 -0800345static int intel_iommu_strict;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700346
347#define DUMMY_DEVICE_DOMAIN_INFO ((struct device_domain_info *)(-1))
348static DEFINE_SPINLOCK(device_domain_lock);
349static LIST_HEAD(device_domain_list);
350
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +0100351static struct iommu_ops intel_iommu_ops;
352
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700353static int __init intel_iommu_setup(char *str)
354{
355 if (!str)
356 return -EINVAL;
357 while (*str) {
Kyle McMartin0cd5c3c2009-02-04 14:29:19 -0800358 if (!strncmp(str, "on", 2)) {
359 dmar_disabled = 0;
360 printk(KERN_INFO "Intel-IOMMU: enabled\n");
361 } else if (!strncmp(str, "off", 3)) {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700362 dmar_disabled = 1;
Kyle McMartin0cd5c3c2009-02-04 14:29:19 -0800363 printk(KERN_INFO "Intel-IOMMU: disabled\n");
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700364 } else if (!strncmp(str, "igfx_off", 8)) {
365 dmar_map_gfx = 0;
366 printk(KERN_INFO
367 "Intel-IOMMU: disable GFX device mapping\n");
Keshavamurthy, Anil S7d3b03c2007-10-21 16:41:53 -0700368 } else if (!strncmp(str, "forcedac", 8)) {
mark gross5e0d2a62008-03-04 15:22:08 -0800369 printk(KERN_INFO
Keshavamurthy, Anil S7d3b03c2007-10-21 16:41:53 -0700370 "Intel-IOMMU: Forcing DAC for PCI devices\n");
371 dmar_forcedac = 1;
mark gross5e0d2a62008-03-04 15:22:08 -0800372 } else if (!strncmp(str, "strict", 6)) {
373 printk(KERN_INFO
374 "Intel-IOMMU: disable batched IOTLB flush\n");
375 intel_iommu_strict = 1;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700376 }
377
378 str += strcspn(str, ",");
379 while (*str == ',')
380 str++;
381 }
382 return 0;
383}
384__setup("intel_iommu=", intel_iommu_setup);
385
386static struct kmem_cache *iommu_domain_cache;
387static struct kmem_cache *iommu_devinfo_cache;
388static struct kmem_cache *iommu_iova_cache;
389
Suresh Siddha4c923d42009-10-02 11:01:24 -0700390static inline void *alloc_pgtable_page(int node)
Keshavamurthy, Anil Seb3fa7c2007-10-21 16:41:52 -0700391{
Suresh Siddha4c923d42009-10-02 11:01:24 -0700392 struct page *page;
393 void *vaddr = NULL;
Keshavamurthy, Anil Seb3fa7c2007-10-21 16:41:52 -0700394
Suresh Siddha4c923d42009-10-02 11:01:24 -0700395 page = alloc_pages_node(node, GFP_ATOMIC | __GFP_ZERO, 0);
396 if (page)
397 vaddr = page_address(page);
Keshavamurthy, Anil Seb3fa7c2007-10-21 16:41:52 -0700398 return vaddr;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700399}
400
401static inline void free_pgtable_page(void *vaddr)
402{
403 free_page((unsigned long)vaddr);
404}
405
406static inline void *alloc_domain_mem(void)
407{
KOSAKI Motohiro354bb652009-11-17 16:21:09 +0900408 return kmem_cache_alloc(iommu_domain_cache, GFP_ATOMIC);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700409}
410
Kay, Allen M38717942008-09-09 18:37:29 +0300411static void free_domain_mem(void *vaddr)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700412{
413 kmem_cache_free(iommu_domain_cache, vaddr);
414}
415
416static inline void * alloc_devinfo_mem(void)
417{
KOSAKI Motohiro354bb652009-11-17 16:21:09 +0900418 return kmem_cache_alloc(iommu_devinfo_cache, GFP_ATOMIC);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700419}
420
421static inline void free_devinfo_mem(void *vaddr)
422{
423 kmem_cache_free(iommu_devinfo_cache, vaddr);
424}
425
426struct iova *alloc_iova_mem(void)
427{
KOSAKI Motohiro354bb652009-11-17 16:21:09 +0900428 return kmem_cache_alloc(iommu_iova_cache, GFP_ATOMIC);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700429}
430
431void free_iova_mem(struct iova *iova)
432{
433 kmem_cache_free(iommu_iova_cache, iova);
434}
435
Weidong Han1b573682008-12-08 15:34:06 +0800436
437static inline int width_to_agaw(int width);
438
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700439static int __iommu_calculate_agaw(struct intel_iommu *iommu, int max_gaw)
Weidong Han1b573682008-12-08 15:34:06 +0800440{
441 unsigned long sagaw;
442 int agaw = -1;
443
444 sagaw = cap_sagaw(iommu->cap);
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700445 for (agaw = width_to_agaw(max_gaw);
Weidong Han1b573682008-12-08 15:34:06 +0800446 agaw >= 0; agaw--) {
447 if (test_bit(agaw, &sagaw))
448 break;
449 }
450
451 return agaw;
452}
453
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700454/*
455 * Calculate max SAGAW for each iommu.
456 */
457int iommu_calculate_max_sagaw(struct intel_iommu *iommu)
458{
459 return __iommu_calculate_agaw(iommu, MAX_AGAW_WIDTH);
460}
461
462/*
463 * calculate agaw for each iommu.
464 * "SAGAW" may be different across iommus, use a default agaw, and
465 * get a supported less agaw for iommus that don't support the default agaw.
466 */
467int iommu_calculate_agaw(struct intel_iommu *iommu)
468{
469 return __iommu_calculate_agaw(iommu, DEFAULT_DOMAIN_ADDRESS_WIDTH);
470}
471
Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700472/* This functionin only returns single iommu in a domain */
Weidong Han8c11e792008-12-08 15:29:22 +0800473static struct intel_iommu *domain_get_iommu(struct dmar_domain *domain)
474{
475 int iommu_id;
476
Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700477 /* si_domain and vm domain should not get here. */
Weidong Han1ce28fe2008-12-08 16:35:39 +0800478 BUG_ON(domain->flags & DOMAIN_FLAG_VIRTUAL_MACHINE);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700479 BUG_ON(domain->flags & DOMAIN_FLAG_STATIC_IDENTITY);
Weidong Han1ce28fe2008-12-08 16:35:39 +0800480
Weidong Han8c11e792008-12-08 15:29:22 +0800481 iommu_id = find_first_bit(&domain->iommu_bmp, g_num_of_iommus);
482 if (iommu_id < 0 || iommu_id >= g_num_of_iommus)
483 return NULL;
484
485 return g_iommus[iommu_id];
486}
487
Weidong Han8e6040972008-12-08 15:49:06 +0800488static void domain_update_iommu_coherency(struct dmar_domain *domain)
489{
490 int i;
491
492 domain->iommu_coherency = 1;
493
Akinobu Mitaa45946a2010-03-11 14:04:08 -0800494 for_each_set_bit(i, &domain->iommu_bmp, g_num_of_iommus) {
Weidong Han8e6040972008-12-08 15:49:06 +0800495 if (!ecap_coherent(g_iommus[i]->ecap)) {
496 domain->iommu_coherency = 0;
497 break;
498 }
Weidong Han8e6040972008-12-08 15:49:06 +0800499 }
500}
501
Sheng Yang58c610b2009-03-18 15:33:05 +0800502static void domain_update_iommu_snooping(struct dmar_domain *domain)
503{
504 int i;
505
506 domain->iommu_snooping = 1;
507
Akinobu Mitaa45946a2010-03-11 14:04:08 -0800508 for_each_set_bit(i, &domain->iommu_bmp, g_num_of_iommus) {
Sheng Yang58c610b2009-03-18 15:33:05 +0800509 if (!ecap_sc_support(g_iommus[i]->ecap)) {
510 domain->iommu_snooping = 0;
511 break;
512 }
Sheng Yang58c610b2009-03-18 15:33:05 +0800513 }
514}
515
516/* Some capabilities may be different across iommus */
517static void domain_update_iommu_cap(struct dmar_domain *domain)
518{
519 domain_update_iommu_coherency(domain);
520 domain_update_iommu_snooping(domain);
521}
522
David Woodhouse276dbf992009-04-04 01:45:37 +0100523static struct intel_iommu *device_to_iommu(int segment, u8 bus, u8 devfn)
Weidong Hanc7151a82008-12-08 22:51:37 +0800524{
525 struct dmar_drhd_unit *drhd = NULL;
526 int i;
527
528 for_each_drhd_unit(drhd) {
529 if (drhd->ignored)
530 continue;
David Woodhouse276dbf992009-04-04 01:45:37 +0100531 if (segment != drhd->segment)
532 continue;
Weidong Hanc7151a82008-12-08 22:51:37 +0800533
David Woodhouse924b6232009-04-04 00:39:25 +0100534 for (i = 0; i < drhd->devices_cnt; i++) {
Dirk Hohndel288e4872009-01-11 15:33:51 +0000535 if (drhd->devices[i] &&
536 drhd->devices[i]->bus->number == bus &&
Weidong Hanc7151a82008-12-08 22:51:37 +0800537 drhd->devices[i]->devfn == devfn)
538 return drhd->iommu;
David Woodhouse4958c5d2009-04-06 13:30:01 -0700539 if (drhd->devices[i] &&
540 drhd->devices[i]->subordinate &&
David Woodhouse924b6232009-04-04 00:39:25 +0100541 drhd->devices[i]->subordinate->number <= bus &&
542 drhd->devices[i]->subordinate->subordinate >= bus)
543 return drhd->iommu;
544 }
Weidong Hanc7151a82008-12-08 22:51:37 +0800545
546 if (drhd->include_all)
547 return drhd->iommu;
548 }
549
550 return NULL;
551}
552
Weidong Han5331fe62008-12-08 23:00:00 +0800553static void domain_flush_cache(struct dmar_domain *domain,
554 void *addr, int size)
555{
556 if (!domain->iommu_coherency)
557 clflush_cache_range(addr, size);
558}
559
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700560/* Gets context entry for a given bus and devfn */
561static struct context_entry * device_to_context_entry(struct intel_iommu *iommu,
562 u8 bus, u8 devfn)
563{
564 struct root_entry *root;
565 struct context_entry *context;
566 unsigned long phy_addr;
567 unsigned long flags;
568
569 spin_lock_irqsave(&iommu->lock, flags);
570 root = &iommu->root_entry[bus];
571 context = get_context_addr_from_root(root);
572 if (!context) {
Suresh Siddha4c923d42009-10-02 11:01:24 -0700573 context = (struct context_entry *)
574 alloc_pgtable_page(iommu->node);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700575 if (!context) {
576 spin_unlock_irqrestore(&iommu->lock, flags);
577 return NULL;
578 }
Fenghua Yu5b6985c2008-10-16 18:02:32 -0700579 __iommu_flush_cache(iommu, (void *)context, CONTEXT_SIZE);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700580 phy_addr = virt_to_phys((void *)context);
581 set_root_value(root, phy_addr);
582 set_root_present(root);
583 __iommu_flush_cache(iommu, root, sizeof(*root));
584 }
585 spin_unlock_irqrestore(&iommu->lock, flags);
586 return &context[devfn];
587}
588
589static int device_context_mapped(struct intel_iommu *iommu, u8 bus, u8 devfn)
590{
591 struct root_entry *root;
592 struct context_entry *context;
593 int ret;
594 unsigned long flags;
595
596 spin_lock_irqsave(&iommu->lock, flags);
597 root = &iommu->root_entry[bus];
598 context = get_context_addr_from_root(root);
599 if (!context) {
600 ret = 0;
601 goto out;
602 }
Mark McLoughlinc07e7d22008-11-21 16:54:46 +0000603 ret = context_present(&context[devfn]);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700604out:
605 spin_unlock_irqrestore(&iommu->lock, flags);
606 return ret;
607}
608
609static void clear_context_table(struct intel_iommu *iommu, u8 bus, u8 devfn)
610{
611 struct root_entry *root;
612 struct context_entry *context;
613 unsigned long flags;
614
615 spin_lock_irqsave(&iommu->lock, flags);
616 root = &iommu->root_entry[bus];
617 context = get_context_addr_from_root(root);
618 if (context) {
Mark McLoughlinc07e7d22008-11-21 16:54:46 +0000619 context_clear_entry(&context[devfn]);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700620 __iommu_flush_cache(iommu, &context[devfn], \
621 sizeof(*context));
622 }
623 spin_unlock_irqrestore(&iommu->lock, flags);
624}
625
626static void free_context_table(struct intel_iommu *iommu)
627{
628 struct root_entry *root;
629 int i;
630 unsigned long flags;
631 struct context_entry *context;
632
633 spin_lock_irqsave(&iommu->lock, flags);
634 if (!iommu->root_entry) {
635 goto out;
636 }
637 for (i = 0; i < ROOT_ENTRY_NR; i++) {
638 root = &iommu->root_entry[i];
639 context = get_context_addr_from_root(root);
640 if (context)
641 free_pgtable_page(context);
642 }
643 free_pgtable_page(iommu->root_entry);
644 iommu->root_entry = NULL;
645out:
646 spin_unlock_irqrestore(&iommu->lock, flags);
647}
648
649/* page table handling */
650#define LEVEL_STRIDE (9)
651#define LEVEL_MASK (((u64)1 << LEVEL_STRIDE) - 1)
652
653static inline int agaw_to_level(int agaw)
654{
655 return agaw + 2;
656}
657
658static inline int agaw_to_width(int agaw)
659{
660 return 30 + agaw * LEVEL_STRIDE;
661
662}
663
664static inline int width_to_agaw(int width)
665{
666 return (width - 30) / LEVEL_STRIDE;
667}
668
669static inline unsigned int level_to_offset_bits(int level)
670{
David Woodhouse6660c632009-06-27 22:41:00 +0100671 return (level - 1) * LEVEL_STRIDE;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700672}
673
David Woodhouse77dfa562009-06-27 16:40:08 +0100674static inline int pfn_level_offset(unsigned long pfn, int level)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700675{
David Woodhouse6660c632009-06-27 22:41:00 +0100676 return (pfn >> level_to_offset_bits(level)) & LEVEL_MASK;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700677}
678
David Woodhouse6660c632009-06-27 22:41:00 +0100679static inline unsigned long level_mask(int level)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700680{
David Woodhouse6660c632009-06-27 22:41:00 +0100681 return -1UL << level_to_offset_bits(level);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700682}
683
David Woodhouse6660c632009-06-27 22:41:00 +0100684static inline unsigned long level_size(int level)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700685{
David Woodhouse6660c632009-06-27 22:41:00 +0100686 return 1UL << level_to_offset_bits(level);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700687}
688
David Woodhouse6660c632009-06-27 22:41:00 +0100689static inline unsigned long align_to_level(unsigned long pfn, int level)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700690{
David Woodhouse6660c632009-06-27 22:41:00 +0100691 return (pfn + level_size(level) - 1) & level_mask(level);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700692}
693
David Woodhouseb026fd22009-06-28 10:37:25 +0100694static struct dma_pte *pfn_to_dma_pte(struct dmar_domain *domain,
695 unsigned long pfn)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700696{
David Woodhouseb026fd22009-06-28 10:37:25 +0100697 int addr_width = agaw_to_width(domain->agaw) - VTD_PAGE_SHIFT;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700698 struct dma_pte *parent, *pte = NULL;
699 int level = agaw_to_level(domain->agaw);
700 int offset;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700701
702 BUG_ON(!domain->pgd);
David Woodhouseb026fd22009-06-28 10:37:25 +0100703 BUG_ON(addr_width < BITS_PER_LONG && pfn >> addr_width);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700704 parent = domain->pgd;
705
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700706 while (level > 0) {
707 void *tmp_page;
708
David Woodhouseb026fd22009-06-28 10:37:25 +0100709 offset = pfn_level_offset(pfn, level);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700710 pte = &parent[offset];
711 if (level == 1)
712 break;
713
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000714 if (!dma_pte_present(pte)) {
David Woodhousec85994e2009-07-01 19:21:24 +0100715 uint64_t pteval;
716
Suresh Siddha4c923d42009-10-02 11:01:24 -0700717 tmp_page = alloc_pgtable_page(domain->nid);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700718
David Woodhouse206a73c2009-07-01 19:30:28 +0100719 if (!tmp_page)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700720 return NULL;
David Woodhouse206a73c2009-07-01 19:30:28 +0100721
David Woodhousec85994e2009-07-01 19:21:24 +0100722 domain_flush_cache(domain, tmp_page, VTD_PAGE_SIZE);
Benjamin LaHaise64de5af2009-09-16 21:05:55 -0400723 pteval = ((uint64_t)virt_to_dma_pfn(tmp_page) << VTD_PAGE_SHIFT) | DMA_PTE_READ | DMA_PTE_WRITE;
David Woodhousec85994e2009-07-01 19:21:24 +0100724 if (cmpxchg64(&pte->val, 0ULL, pteval)) {
725 /* Someone else set it while we were thinking; use theirs. */
726 free_pgtable_page(tmp_page);
727 } else {
728 dma_pte_addr(pte);
729 domain_flush_cache(domain, pte, sizeof(*pte));
730 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700731 }
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000732 parent = phys_to_virt(dma_pte_addr(pte));
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700733 level--;
734 }
735
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700736 return pte;
737}
738
739/* return address's pte at specific level */
David Woodhouse90dcfb52009-06-27 17:14:59 +0100740static struct dma_pte *dma_pfn_level_pte(struct dmar_domain *domain,
741 unsigned long pfn,
742 int level)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700743{
744 struct dma_pte *parent, *pte = NULL;
745 int total = agaw_to_level(domain->agaw);
746 int offset;
747
748 parent = domain->pgd;
749 while (level <= total) {
David Woodhouse90dcfb52009-06-27 17:14:59 +0100750 offset = pfn_level_offset(pfn, total);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700751 pte = &parent[offset];
752 if (level == total)
753 return pte;
754
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000755 if (!dma_pte_present(pte))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700756 break;
Mark McLoughlin19c239c2008-11-21 16:56:53 +0000757 parent = phys_to_virt(dma_pte_addr(pte));
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700758 total--;
759 }
760 return NULL;
761}
762
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700763/* clear last level pte, a tlb flush should be followed */
David Woodhouse595badf52009-06-27 22:09:11 +0100764static void dma_pte_clear_range(struct dmar_domain *domain,
765 unsigned long start_pfn,
766 unsigned long last_pfn)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700767{
David Woodhouse04b18e62009-06-27 19:15:01 +0100768 int addr_width = agaw_to_width(domain->agaw) - VTD_PAGE_SHIFT;
David Woodhouse310a5ab2009-06-28 18:52:20 +0100769 struct dma_pte *first_pte, *pte;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700770
David Woodhouse04b18e62009-06-27 19:15:01 +0100771 BUG_ON(addr_width < BITS_PER_LONG && start_pfn >> addr_width);
David Woodhouse595badf52009-06-27 22:09:11 +0100772 BUG_ON(addr_width < BITS_PER_LONG && last_pfn >> addr_width);
David Woodhouse59c36282009-09-19 07:36:28 -0700773 BUG_ON(start_pfn > last_pfn);
David Woodhouse66eae842009-06-27 19:00:32 +0100774
David Woodhouse04b18e62009-06-27 19:15:01 +0100775 /* we don't need lock here; nobody else touches the iova range */
David Woodhouse59c36282009-09-19 07:36:28 -0700776 do {
David Woodhouse310a5ab2009-06-28 18:52:20 +0100777 first_pte = pte = dma_pfn_level_pte(domain, start_pfn, 1);
778 if (!pte) {
779 start_pfn = align_to_level(start_pfn + 1, 2);
780 continue;
781 }
David Woodhouse75e6bf92009-07-02 11:21:16 +0100782 do {
David Woodhouse310a5ab2009-06-28 18:52:20 +0100783 dma_clear_pte(pte);
784 start_pfn++;
785 pte++;
David Woodhouse75e6bf92009-07-02 11:21:16 +0100786 } while (start_pfn <= last_pfn && !first_pte_in_page(pte));
787
David Woodhouse310a5ab2009-06-28 18:52:20 +0100788 domain_flush_cache(domain, first_pte,
789 (void *)pte - (void *)first_pte);
David Woodhouse59c36282009-09-19 07:36:28 -0700790
791 } while (start_pfn && start_pfn <= last_pfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700792}
793
794/* free page table pages. last level pte should already be cleared */
795static void dma_pte_free_pagetable(struct dmar_domain *domain,
David Woodhoused794dc92009-06-28 00:27:49 +0100796 unsigned long start_pfn,
797 unsigned long last_pfn)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700798{
David Woodhouse6660c632009-06-27 22:41:00 +0100799 int addr_width = agaw_to_width(domain->agaw) - VTD_PAGE_SHIFT;
David Woodhousef3a0a522009-06-30 03:40:07 +0100800 struct dma_pte *first_pte, *pte;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700801 int total = agaw_to_level(domain->agaw);
802 int level;
David Woodhouse6660c632009-06-27 22:41:00 +0100803 unsigned long tmp;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700804
David Woodhouse6660c632009-06-27 22:41:00 +0100805 BUG_ON(addr_width < BITS_PER_LONG && start_pfn >> addr_width);
806 BUG_ON(addr_width < BITS_PER_LONG && last_pfn >> addr_width);
David Woodhouse59c36282009-09-19 07:36:28 -0700807 BUG_ON(start_pfn > last_pfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700808
David Woodhousef3a0a522009-06-30 03:40:07 +0100809 /* We don't need lock here; nobody else touches the iova range */
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700810 level = 2;
811 while (level <= total) {
David Woodhouse6660c632009-06-27 22:41:00 +0100812 tmp = align_to_level(start_pfn, level);
813
David Woodhousef3a0a522009-06-30 03:40:07 +0100814 /* If we can't even clear one PTE at this level, we're done */
David Woodhouse6660c632009-06-27 22:41:00 +0100815 if (tmp + level_size(level) - 1 > last_pfn)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700816 return;
817
David Woodhouse59c36282009-09-19 07:36:28 -0700818 do {
David Woodhousef3a0a522009-06-30 03:40:07 +0100819 first_pte = pte = dma_pfn_level_pte(domain, tmp, level);
820 if (!pte) {
821 tmp = align_to_level(tmp + 1, level + 1);
822 continue;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700823 }
David Woodhouse75e6bf92009-07-02 11:21:16 +0100824 do {
David Woodhouse6a43e572009-07-02 12:02:34 +0100825 if (dma_pte_present(pte)) {
826 free_pgtable_page(phys_to_virt(dma_pte_addr(pte)));
827 dma_clear_pte(pte);
828 }
David Woodhousef3a0a522009-06-30 03:40:07 +0100829 pte++;
830 tmp += level_size(level);
David Woodhouse75e6bf92009-07-02 11:21:16 +0100831 } while (!first_pte_in_page(pte) &&
832 tmp + level_size(level) - 1 <= last_pfn);
833
David Woodhousef3a0a522009-06-30 03:40:07 +0100834 domain_flush_cache(domain, first_pte,
835 (void *)pte - (void *)first_pte);
836
David Woodhouse59c36282009-09-19 07:36:28 -0700837 } while (tmp && tmp + level_size(level) - 1 <= last_pfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700838 level++;
839 }
840 /* free pgd */
David Woodhoused794dc92009-06-28 00:27:49 +0100841 if (start_pfn == 0 && last_pfn == DOMAIN_MAX_PFN(domain->gaw)) {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700842 free_pgtable_page(domain->pgd);
843 domain->pgd = NULL;
844 }
845}
846
847/* iommu handling */
848static int iommu_alloc_root_entry(struct intel_iommu *iommu)
849{
850 struct root_entry *root;
851 unsigned long flags;
852
Suresh Siddha4c923d42009-10-02 11:01:24 -0700853 root = (struct root_entry *)alloc_pgtable_page(iommu->node);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700854 if (!root)
855 return -ENOMEM;
856
Fenghua Yu5b6985c2008-10-16 18:02:32 -0700857 __iommu_flush_cache(iommu, root, ROOT_SIZE);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700858
859 spin_lock_irqsave(&iommu->lock, flags);
860 iommu->root_entry = root;
861 spin_unlock_irqrestore(&iommu->lock, flags);
862
863 return 0;
864}
865
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700866static void iommu_set_root_entry(struct intel_iommu *iommu)
867{
868 void *addr;
David Woodhousec416daa2009-05-10 20:30:58 +0100869 u32 sts;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700870 unsigned long flag;
871
872 addr = iommu->root_entry;
873
874 spin_lock_irqsave(&iommu->register_lock, flag);
875 dmar_writeq(iommu->reg + DMAR_RTADDR_REG, virt_to_phys(addr));
876
David Woodhousec416daa2009-05-10 20:30:58 +0100877 writel(iommu->gcmd | DMA_GCMD_SRTP, iommu->reg + DMAR_GCMD_REG);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700878
879 /* Make sure hardware complete it */
880 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
David Woodhousec416daa2009-05-10 20:30:58 +0100881 readl, (sts & DMA_GSTS_RTPS), sts);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700882
883 spin_unlock_irqrestore(&iommu->register_lock, flag);
884}
885
886static void iommu_flush_write_buffer(struct intel_iommu *iommu)
887{
888 u32 val;
889 unsigned long flag;
890
David Woodhouse9af88142009-02-13 23:18:03 +0000891 if (!rwbf_quirk && !cap_rwbf(iommu->cap))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700892 return;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700893
894 spin_lock_irqsave(&iommu->register_lock, flag);
David Woodhouse462b60f2009-05-10 20:18:18 +0100895 writel(iommu->gcmd | DMA_GCMD_WBF, iommu->reg + DMAR_GCMD_REG);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700896
897 /* Make sure hardware complete it */
898 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
David Woodhousec416daa2009-05-10 20:30:58 +0100899 readl, (!(val & DMA_GSTS_WBFS)), val);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700900
901 spin_unlock_irqrestore(&iommu->register_lock, flag);
902}
903
904/* return value determine if we need a write buffer flush */
David Woodhouse4c25a2c2009-05-10 17:16:06 +0100905static void __iommu_flush_context(struct intel_iommu *iommu,
906 u16 did, u16 source_id, u8 function_mask,
907 u64 type)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700908{
909 u64 val = 0;
910 unsigned long flag;
911
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700912 switch (type) {
913 case DMA_CCMD_GLOBAL_INVL:
914 val = DMA_CCMD_GLOBAL_INVL;
915 break;
916 case DMA_CCMD_DOMAIN_INVL:
917 val = DMA_CCMD_DOMAIN_INVL|DMA_CCMD_DID(did);
918 break;
919 case DMA_CCMD_DEVICE_INVL:
920 val = DMA_CCMD_DEVICE_INVL|DMA_CCMD_DID(did)
921 | DMA_CCMD_SID(source_id) | DMA_CCMD_FM(function_mask);
922 break;
923 default:
924 BUG();
925 }
926 val |= DMA_CCMD_ICC;
927
928 spin_lock_irqsave(&iommu->register_lock, flag);
929 dmar_writeq(iommu->reg + DMAR_CCMD_REG, val);
930
931 /* Make sure hardware complete it */
932 IOMMU_WAIT_OP(iommu, DMAR_CCMD_REG,
933 dmar_readq, (!(val & DMA_CCMD_ICC)), val);
934
935 spin_unlock_irqrestore(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700936}
937
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700938/* return value determine if we need a write buffer flush */
David Woodhouse1f0ef2a2009-05-10 19:58:49 +0100939static void __iommu_flush_iotlb(struct intel_iommu *iommu, u16 did,
940 u64 addr, unsigned int size_order, u64 type)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700941{
942 int tlb_offset = ecap_iotlb_offset(iommu->ecap);
943 u64 val = 0, val_iva = 0;
944 unsigned long flag;
945
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700946 switch (type) {
947 case DMA_TLB_GLOBAL_FLUSH:
948 /* global flush doesn't need set IVA_REG */
949 val = DMA_TLB_GLOBAL_FLUSH|DMA_TLB_IVT;
950 break;
951 case DMA_TLB_DSI_FLUSH:
952 val = DMA_TLB_DSI_FLUSH|DMA_TLB_IVT|DMA_TLB_DID(did);
953 break;
954 case DMA_TLB_PSI_FLUSH:
955 val = DMA_TLB_PSI_FLUSH|DMA_TLB_IVT|DMA_TLB_DID(did);
956 /* Note: always flush non-leaf currently */
957 val_iva = size_order | addr;
958 break;
959 default:
960 BUG();
961 }
962 /* Note: set drain read/write */
963#if 0
964 /*
965 * This is probably to be super secure.. Looks like we can
966 * ignore it without any impact.
967 */
968 if (cap_read_drain(iommu->cap))
969 val |= DMA_TLB_READ_DRAIN;
970#endif
971 if (cap_write_drain(iommu->cap))
972 val |= DMA_TLB_WRITE_DRAIN;
973
974 spin_lock_irqsave(&iommu->register_lock, flag);
975 /* Note: Only uses first TLB reg currently */
976 if (val_iva)
977 dmar_writeq(iommu->reg + tlb_offset, val_iva);
978 dmar_writeq(iommu->reg + tlb_offset + 8, val);
979
980 /* Make sure hardware complete it */
981 IOMMU_WAIT_OP(iommu, tlb_offset + 8,
982 dmar_readq, (!(val & DMA_TLB_IVT)), val);
983
984 spin_unlock_irqrestore(&iommu->register_lock, flag);
985
986 /* check IOTLB invalidation granularity */
987 if (DMA_TLB_IAIG(val) == 0)
988 printk(KERN_ERR"IOMMU: flush IOTLB failed\n");
989 if (DMA_TLB_IAIG(val) != DMA_TLB_IIRG(type))
990 pr_debug("IOMMU: tlb flush request %Lx, actual %Lx\n",
Fenghua Yu5b6985c2008-10-16 18:02:32 -0700991 (unsigned long long)DMA_TLB_IIRG(type),
992 (unsigned long long)DMA_TLB_IAIG(val));
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700993}
994
Yu Zhao93a23a72009-05-18 13:51:37 +0800995static struct device_domain_info *iommu_support_dev_iotlb(
996 struct dmar_domain *domain, int segment, u8 bus, u8 devfn)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -0700997{
Yu Zhao93a23a72009-05-18 13:51:37 +0800998 int found = 0;
999 unsigned long flags;
1000 struct device_domain_info *info;
1001 struct intel_iommu *iommu = device_to_iommu(segment, bus, devfn);
1002
1003 if (!ecap_dev_iotlb_support(iommu->ecap))
1004 return NULL;
1005
1006 if (!iommu->qi)
1007 return NULL;
1008
1009 spin_lock_irqsave(&device_domain_lock, flags);
1010 list_for_each_entry(info, &domain->devices, link)
1011 if (info->bus == bus && info->devfn == devfn) {
1012 found = 1;
1013 break;
1014 }
1015 spin_unlock_irqrestore(&device_domain_lock, flags);
1016
1017 if (!found || !info->dev)
1018 return NULL;
1019
1020 if (!pci_find_ext_capability(info->dev, PCI_EXT_CAP_ID_ATS))
1021 return NULL;
1022
1023 if (!dmar_find_matched_atsr_unit(info->dev))
1024 return NULL;
1025
1026 info->iommu = iommu;
1027
1028 return info;
1029}
1030
1031static void iommu_enable_dev_iotlb(struct device_domain_info *info)
1032{
1033 if (!info)
1034 return;
1035
1036 pci_enable_ats(info->dev, VTD_PAGE_SHIFT);
1037}
1038
1039static void iommu_disable_dev_iotlb(struct device_domain_info *info)
1040{
1041 if (!info->dev || !pci_ats_enabled(info->dev))
1042 return;
1043
1044 pci_disable_ats(info->dev);
1045}
1046
1047static void iommu_flush_dev_iotlb(struct dmar_domain *domain,
1048 u64 addr, unsigned mask)
1049{
1050 u16 sid, qdep;
1051 unsigned long flags;
1052 struct device_domain_info *info;
1053
1054 spin_lock_irqsave(&device_domain_lock, flags);
1055 list_for_each_entry(info, &domain->devices, link) {
1056 if (!info->dev || !pci_ats_enabled(info->dev))
1057 continue;
1058
1059 sid = info->bus << 8 | info->devfn;
1060 qdep = pci_ats_queue_depth(info->dev);
1061 qi_flush_dev_iotlb(info->iommu, sid, qdep, addr, mask);
1062 }
1063 spin_unlock_irqrestore(&device_domain_lock, flags);
1064}
1065
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01001066static void iommu_flush_iotlb_psi(struct intel_iommu *iommu, u16 did,
David Woodhouse03d6a242009-06-28 15:33:46 +01001067 unsigned long pfn, unsigned int pages)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001068{
Yu Zhao9dd2fe82009-05-18 13:51:36 +08001069 unsigned int mask = ilog2(__roundup_pow_of_two(pages));
David Woodhouse03d6a242009-06-28 15:33:46 +01001070 uint64_t addr = (uint64_t)pfn << VTD_PAGE_SHIFT;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001071
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001072 BUG_ON(pages == 0);
1073
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001074 /*
Yu Zhao9dd2fe82009-05-18 13:51:36 +08001075 * Fallback to domain selective flush if no PSI support or the size is
1076 * too big.
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001077 * PSI requires page size to be 2 ^ x, and the base address is naturally
1078 * aligned to the size
1079 */
Yu Zhao9dd2fe82009-05-18 13:51:36 +08001080 if (!cap_pgsel_inv(iommu->cap) || mask > cap_max_amask_val(iommu->cap))
1081 iommu->flush.flush_iotlb(iommu, did, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01001082 DMA_TLB_DSI_FLUSH);
Yu Zhao9dd2fe82009-05-18 13:51:36 +08001083 else
1084 iommu->flush.flush_iotlb(iommu, did, addr, mask,
1085 DMA_TLB_PSI_FLUSH);
Yu Zhaobf92df32009-06-29 11:31:45 +08001086
1087 /*
1088 * In caching mode, domain ID 0 is reserved for non-present to present
1089 * mapping flush. Device IOTLB doesn't need to be flushed in this case.
1090 */
1091 if (!cap_caching_mode(iommu->cap) || did)
Yu Zhao93a23a72009-05-18 13:51:37 +08001092 iommu_flush_dev_iotlb(iommu->domains[did], addr, mask);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001093}
1094
mark grossf8bab732008-02-08 04:18:38 -08001095static void iommu_disable_protect_mem_regions(struct intel_iommu *iommu)
1096{
1097 u32 pmen;
1098 unsigned long flags;
1099
1100 spin_lock_irqsave(&iommu->register_lock, flags);
1101 pmen = readl(iommu->reg + DMAR_PMEN_REG);
1102 pmen &= ~DMA_PMEN_EPM;
1103 writel(pmen, iommu->reg + DMAR_PMEN_REG);
1104
1105 /* wait for the protected region status bit to clear */
1106 IOMMU_WAIT_OP(iommu, DMAR_PMEN_REG,
1107 readl, !(pmen & DMA_PMEN_PRS), pmen);
1108
1109 spin_unlock_irqrestore(&iommu->register_lock, flags);
1110}
1111
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001112static int iommu_enable_translation(struct intel_iommu *iommu)
1113{
1114 u32 sts;
1115 unsigned long flags;
1116
1117 spin_lock_irqsave(&iommu->register_lock, flags);
David Woodhousec416daa2009-05-10 20:30:58 +01001118 iommu->gcmd |= DMA_GCMD_TE;
1119 writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001120
1121 /* Make sure hardware complete it */
1122 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
David Woodhousec416daa2009-05-10 20:30:58 +01001123 readl, (sts & DMA_GSTS_TES), sts);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001124
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001125 spin_unlock_irqrestore(&iommu->register_lock, flags);
1126 return 0;
1127}
1128
1129static int iommu_disable_translation(struct intel_iommu *iommu)
1130{
1131 u32 sts;
1132 unsigned long flag;
1133
1134 spin_lock_irqsave(&iommu->register_lock, flag);
1135 iommu->gcmd &= ~DMA_GCMD_TE;
1136 writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG);
1137
1138 /* Make sure hardware complete it */
1139 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
David Woodhousec416daa2009-05-10 20:30:58 +01001140 readl, (!(sts & DMA_GSTS_TES)), sts);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001141
1142 spin_unlock_irqrestore(&iommu->register_lock, flag);
1143 return 0;
1144}
1145
Keshavamurthy, Anil S3460a6d2007-10-21 16:41:54 -07001146
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001147static int iommu_init_domains(struct intel_iommu *iommu)
1148{
1149 unsigned long ndomains;
1150 unsigned long nlongs;
1151
1152 ndomains = cap_ndoms(iommu->cap);
1153 pr_debug("Number of Domains supportd <%ld>\n", ndomains);
1154 nlongs = BITS_TO_LONGS(ndomains);
1155
Donald Dutile94a91b502009-08-20 16:51:34 -04001156 spin_lock_init(&iommu->lock);
1157
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001158 /* TBD: there might be 64K domains,
1159 * consider other allocation for future chip
1160 */
1161 iommu->domain_ids = kcalloc(nlongs, sizeof(unsigned long), GFP_KERNEL);
1162 if (!iommu->domain_ids) {
1163 printk(KERN_ERR "Allocating domain id array failed\n");
1164 return -ENOMEM;
1165 }
1166 iommu->domains = kcalloc(ndomains, sizeof(struct dmar_domain *),
1167 GFP_KERNEL);
1168 if (!iommu->domains) {
1169 printk(KERN_ERR "Allocating domain array failed\n");
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001170 return -ENOMEM;
1171 }
1172
1173 /*
1174 * if Caching mode is set, then invalid translations are tagged
1175 * with domainid 0. Hence we need to pre-allocate it.
1176 */
1177 if (cap_caching_mode(iommu->cap))
1178 set_bit(0, iommu->domain_ids);
1179 return 0;
1180}
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001181
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001182
1183static void domain_exit(struct dmar_domain *domain);
Weidong Han5e98c4b2008-12-08 23:03:27 +08001184static void vm_domain_exit(struct dmar_domain *domain);
Suresh Siddhae61d98d2008-07-10 11:16:35 -07001185
1186void free_dmar_iommu(struct intel_iommu *iommu)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001187{
1188 struct dmar_domain *domain;
1189 int i;
Weidong Hanc7151a82008-12-08 22:51:37 +08001190 unsigned long flags;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001191
Donald Dutile94a91b502009-08-20 16:51:34 -04001192 if ((iommu->domains) && (iommu->domain_ids)) {
Akinobu Mitaa45946a2010-03-11 14:04:08 -08001193 for_each_set_bit(i, iommu->domain_ids, cap_ndoms(iommu->cap)) {
Donald Dutile94a91b502009-08-20 16:51:34 -04001194 domain = iommu->domains[i];
1195 clear_bit(i, iommu->domain_ids);
Weidong Hanc7151a82008-12-08 22:51:37 +08001196
Donald Dutile94a91b502009-08-20 16:51:34 -04001197 spin_lock_irqsave(&domain->iommu_lock, flags);
1198 if (--domain->iommu_count == 0) {
1199 if (domain->flags & DOMAIN_FLAG_VIRTUAL_MACHINE)
1200 vm_domain_exit(domain);
1201 else
1202 domain_exit(domain);
1203 }
1204 spin_unlock_irqrestore(&domain->iommu_lock, flags);
Weidong Han5e98c4b2008-12-08 23:03:27 +08001205 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001206 }
1207
1208 if (iommu->gcmd & DMA_GCMD_TE)
1209 iommu_disable_translation(iommu);
1210
1211 if (iommu->irq) {
1212 set_irq_data(iommu->irq, NULL);
1213 /* This will mask the irq */
1214 free_irq(iommu->irq, iommu);
1215 destroy_irq(iommu->irq);
1216 }
1217
1218 kfree(iommu->domains);
1219 kfree(iommu->domain_ids);
1220
Weidong Hand9630fe2008-12-08 11:06:32 +08001221 g_iommus[iommu->seq_id] = NULL;
1222
1223 /* if all iommus are freed, free g_iommus */
1224 for (i = 0; i < g_num_of_iommus; i++) {
1225 if (g_iommus[i])
1226 break;
1227 }
1228
1229 if (i == g_num_of_iommus)
1230 kfree(g_iommus);
1231
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001232 /* free context mapping */
1233 free_context_table(iommu);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001234}
1235
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001236static struct dmar_domain *alloc_domain(void)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001237{
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001238 struct dmar_domain *domain;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001239
1240 domain = alloc_domain_mem();
1241 if (!domain)
1242 return NULL;
1243
Suresh Siddha4c923d42009-10-02 11:01:24 -07001244 domain->nid = -1;
Weidong Han8c11e792008-12-08 15:29:22 +08001245 memset(&domain->iommu_bmp, 0, sizeof(unsigned long));
Weidong Hand71a2f32008-12-07 21:13:41 +08001246 domain->flags = 0;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001247
1248 return domain;
1249}
1250
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001251static int iommu_attach_domain(struct dmar_domain *domain,
1252 struct intel_iommu *iommu)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001253{
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001254 int num;
1255 unsigned long ndomains;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001256 unsigned long flags;
1257
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001258 ndomains = cap_ndoms(iommu->cap);
Weidong Han8c11e792008-12-08 15:29:22 +08001259
1260 spin_lock_irqsave(&iommu->lock, flags);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001261
1262 num = find_first_zero_bit(iommu->domain_ids, ndomains);
1263 if (num >= ndomains) {
1264 spin_unlock_irqrestore(&iommu->lock, flags);
1265 printk(KERN_ERR "IOMMU: no free domain ids\n");
1266 return -ENOMEM;
1267 }
1268
1269 domain->id = num;
1270 set_bit(num, iommu->domain_ids);
1271 set_bit(iommu->seq_id, &domain->iommu_bmp);
1272 iommu->domains[num] = domain;
1273 spin_unlock_irqrestore(&iommu->lock, flags);
1274
1275 return 0;
1276}
1277
1278static void iommu_detach_domain(struct dmar_domain *domain,
1279 struct intel_iommu *iommu)
1280{
1281 unsigned long flags;
1282 int num, ndomains;
1283 int found = 0;
1284
1285 spin_lock_irqsave(&iommu->lock, flags);
1286 ndomains = cap_ndoms(iommu->cap);
Akinobu Mitaa45946a2010-03-11 14:04:08 -08001287 for_each_set_bit(num, iommu->domain_ids, ndomains) {
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001288 if (iommu->domains[num] == domain) {
1289 found = 1;
1290 break;
1291 }
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001292 }
1293
1294 if (found) {
1295 clear_bit(num, iommu->domain_ids);
1296 clear_bit(iommu->seq_id, &domain->iommu_bmp);
1297 iommu->domains[num] = NULL;
1298 }
Weidong Han8c11e792008-12-08 15:29:22 +08001299 spin_unlock_irqrestore(&iommu->lock, flags);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001300}
1301
1302static struct iova_domain reserved_iova_list;
Mark Gross8a443df2008-03-04 14:59:31 -08001303static struct lock_class_key reserved_rbtree_key;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001304
1305static void dmar_init_reserved_ranges(void)
1306{
1307 struct pci_dev *pdev = NULL;
1308 struct iova *iova;
1309 int i;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001310
David Millerf6611972008-02-06 01:36:23 -08001311 init_iova_domain(&reserved_iova_list, DMA_32BIT_PFN);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001312
Mark Gross8a443df2008-03-04 14:59:31 -08001313 lockdep_set_class(&reserved_iova_list.iova_rbtree_lock,
1314 &reserved_rbtree_key);
1315
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001316 /* IOAPIC ranges shouldn't be accessed by DMA */
1317 iova = reserve_iova(&reserved_iova_list, IOVA_PFN(IOAPIC_RANGE_START),
1318 IOVA_PFN(IOAPIC_RANGE_END));
1319 if (!iova)
1320 printk(KERN_ERR "Reserve IOAPIC range failed\n");
1321
1322 /* Reserve all PCI MMIO to avoid peer-to-peer access */
1323 for_each_pci_dev(pdev) {
1324 struct resource *r;
1325
1326 for (i = 0; i < PCI_NUM_RESOURCES; i++) {
1327 r = &pdev->resource[i];
1328 if (!r->flags || !(r->flags & IORESOURCE_MEM))
1329 continue;
David Woodhouse1a4a4552009-06-28 16:00:42 +01001330 iova = reserve_iova(&reserved_iova_list,
1331 IOVA_PFN(r->start),
1332 IOVA_PFN(r->end));
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001333 if (!iova)
1334 printk(KERN_ERR "Reserve iova failed\n");
1335 }
1336 }
1337
1338}
1339
1340static void domain_reserve_special_ranges(struct dmar_domain *domain)
1341{
1342 copy_reserved_iova(&reserved_iova_list, &domain->iovad);
1343}
1344
1345static inline int guestwidth_to_adjustwidth(int gaw)
1346{
1347 int agaw;
1348 int r = (gaw - 12) % 9;
1349
1350 if (r == 0)
1351 agaw = gaw;
1352 else
1353 agaw = gaw + 9 - r;
1354 if (agaw > 64)
1355 agaw = 64;
1356 return agaw;
1357}
1358
1359static int domain_init(struct dmar_domain *domain, int guest_width)
1360{
1361 struct intel_iommu *iommu;
1362 int adjust_width, agaw;
1363 unsigned long sagaw;
1364
David Millerf6611972008-02-06 01:36:23 -08001365 init_iova_domain(&domain->iovad, DMA_32BIT_PFN);
Weidong Hanc7151a82008-12-08 22:51:37 +08001366 spin_lock_init(&domain->iommu_lock);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001367
1368 domain_reserve_special_ranges(domain);
1369
1370 /* calculate AGAW */
Weidong Han8c11e792008-12-08 15:29:22 +08001371 iommu = domain_get_iommu(domain);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001372 if (guest_width > cap_mgaw(iommu->cap))
1373 guest_width = cap_mgaw(iommu->cap);
1374 domain->gaw = guest_width;
1375 adjust_width = guestwidth_to_adjustwidth(guest_width);
1376 agaw = width_to_agaw(adjust_width);
1377 sagaw = cap_sagaw(iommu->cap);
1378 if (!test_bit(agaw, &sagaw)) {
1379 /* hardware doesn't support it, choose a bigger one */
1380 pr_debug("IOMMU: hardware doesn't support agaw %d\n", agaw);
1381 agaw = find_next_bit(&sagaw, 5, agaw);
1382 if (agaw >= 5)
1383 return -ENODEV;
1384 }
1385 domain->agaw = agaw;
1386 INIT_LIST_HEAD(&domain->devices);
1387
Weidong Han8e6040972008-12-08 15:49:06 +08001388 if (ecap_coherent(iommu->ecap))
1389 domain->iommu_coherency = 1;
1390 else
1391 domain->iommu_coherency = 0;
1392
Sheng Yang58c610b2009-03-18 15:33:05 +08001393 if (ecap_sc_support(iommu->ecap))
1394 domain->iommu_snooping = 1;
1395 else
1396 domain->iommu_snooping = 0;
1397
Weidong Hanc7151a82008-12-08 22:51:37 +08001398 domain->iommu_count = 1;
Suresh Siddha4c923d42009-10-02 11:01:24 -07001399 domain->nid = iommu->node;
Weidong Hanc7151a82008-12-08 22:51:37 +08001400
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001401 /* always allocate the top pgd */
Suresh Siddha4c923d42009-10-02 11:01:24 -07001402 domain->pgd = (struct dma_pte *)alloc_pgtable_page(domain->nid);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001403 if (!domain->pgd)
1404 return -ENOMEM;
Fenghua Yu5b6985c2008-10-16 18:02:32 -07001405 __iommu_flush_cache(iommu, domain->pgd, PAGE_SIZE);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001406 return 0;
1407}
1408
1409static void domain_exit(struct dmar_domain *domain)
1410{
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001411 struct dmar_drhd_unit *drhd;
1412 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001413
1414 /* Domain 0 is reserved, so dont process it */
1415 if (!domain)
1416 return;
1417
1418 domain_remove_dev_info(domain);
1419 /* destroy iovas */
1420 put_iova_domain(&domain->iovad);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001421
1422 /* clear ptes */
David Woodhouse595badf52009-06-27 22:09:11 +01001423 dma_pte_clear_range(domain, 0, DOMAIN_MAX_PFN(domain->gaw));
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001424
1425 /* free page tables */
David Woodhoused794dc92009-06-28 00:27:49 +01001426 dma_pte_free_pagetable(domain, 0, DOMAIN_MAX_PFN(domain->gaw));
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001427
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001428 for_each_active_iommu(iommu, drhd)
1429 if (test_bit(iommu->seq_id, &domain->iommu_bmp))
1430 iommu_detach_domain(domain, iommu);
1431
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001432 free_domain_mem(domain);
1433}
1434
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001435static int domain_context_mapping_one(struct dmar_domain *domain, int segment,
1436 u8 bus, u8 devfn, int translation)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001437{
1438 struct context_entry *context;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001439 unsigned long flags;
Weidong Han5331fe62008-12-08 23:00:00 +08001440 struct intel_iommu *iommu;
Weidong Hanea6606b2008-12-08 23:08:15 +08001441 struct dma_pte *pgd;
1442 unsigned long num;
1443 unsigned long ndomains;
1444 int id;
1445 int agaw;
Yu Zhao93a23a72009-05-18 13:51:37 +08001446 struct device_domain_info *info = NULL;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001447
1448 pr_debug("Set context mapping for %02x:%02x.%d\n",
1449 bus, PCI_SLOT(devfn), PCI_FUNC(devfn));
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001450
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001451 BUG_ON(!domain->pgd);
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001452 BUG_ON(translation != CONTEXT_TT_PASS_THROUGH &&
1453 translation != CONTEXT_TT_MULTI_LEVEL);
Weidong Han5331fe62008-12-08 23:00:00 +08001454
David Woodhouse276dbf992009-04-04 01:45:37 +01001455 iommu = device_to_iommu(segment, bus, devfn);
Weidong Han5331fe62008-12-08 23:00:00 +08001456 if (!iommu)
1457 return -ENODEV;
1458
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001459 context = device_to_context_entry(iommu, bus, devfn);
1460 if (!context)
1461 return -ENOMEM;
1462 spin_lock_irqsave(&iommu->lock, flags);
Mark McLoughlinc07e7d22008-11-21 16:54:46 +00001463 if (context_present(context)) {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001464 spin_unlock_irqrestore(&iommu->lock, flags);
1465 return 0;
1466 }
1467
Weidong Hanea6606b2008-12-08 23:08:15 +08001468 id = domain->id;
1469 pgd = domain->pgd;
1470
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001471 if (domain->flags & DOMAIN_FLAG_VIRTUAL_MACHINE ||
1472 domain->flags & DOMAIN_FLAG_STATIC_IDENTITY) {
Weidong Hanea6606b2008-12-08 23:08:15 +08001473 int found = 0;
1474
1475 /* find an available domain id for this device in iommu */
1476 ndomains = cap_ndoms(iommu->cap);
Akinobu Mitaa45946a2010-03-11 14:04:08 -08001477 for_each_set_bit(num, iommu->domain_ids, ndomains) {
Weidong Hanea6606b2008-12-08 23:08:15 +08001478 if (iommu->domains[num] == domain) {
1479 id = num;
1480 found = 1;
1481 break;
1482 }
Weidong Hanea6606b2008-12-08 23:08:15 +08001483 }
1484
1485 if (found == 0) {
1486 num = find_first_zero_bit(iommu->domain_ids, ndomains);
1487 if (num >= ndomains) {
1488 spin_unlock_irqrestore(&iommu->lock, flags);
1489 printk(KERN_ERR "IOMMU: no free domain ids\n");
1490 return -EFAULT;
1491 }
1492
1493 set_bit(num, iommu->domain_ids);
1494 iommu->domains[num] = domain;
1495 id = num;
1496 }
1497
1498 /* Skip top levels of page tables for
1499 * iommu which has less agaw than default.
Chris Wright1672af12009-12-02 12:06:34 -08001500 * Unnecessary for PT mode.
Weidong Hanea6606b2008-12-08 23:08:15 +08001501 */
Chris Wright1672af12009-12-02 12:06:34 -08001502 if (translation != CONTEXT_TT_PASS_THROUGH) {
1503 for (agaw = domain->agaw; agaw != iommu->agaw; agaw--) {
1504 pgd = phys_to_virt(dma_pte_addr(pgd));
1505 if (!dma_pte_present(pgd)) {
1506 spin_unlock_irqrestore(&iommu->lock, flags);
1507 return -ENOMEM;
1508 }
Weidong Hanea6606b2008-12-08 23:08:15 +08001509 }
1510 }
1511 }
1512
1513 context_set_domain_id(context, id);
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001514
Yu Zhao93a23a72009-05-18 13:51:37 +08001515 if (translation != CONTEXT_TT_PASS_THROUGH) {
1516 info = iommu_support_dev_iotlb(domain, segment, bus, devfn);
1517 translation = info ? CONTEXT_TT_DEV_IOTLB :
1518 CONTEXT_TT_MULTI_LEVEL;
1519 }
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001520 /*
1521 * In pass through mode, AW must be programmed to indicate the largest
1522 * AGAW value supported by hardware. And ASR is ignored by hardware.
1523 */
Yu Zhao93a23a72009-05-18 13:51:37 +08001524 if (unlikely(translation == CONTEXT_TT_PASS_THROUGH))
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001525 context_set_address_width(context, iommu->msagaw);
Yu Zhao93a23a72009-05-18 13:51:37 +08001526 else {
1527 context_set_address_root(context, virt_to_phys(pgd));
1528 context_set_address_width(context, iommu->agaw);
1529 }
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001530
1531 context_set_translation_type(context, translation);
Mark McLoughlinc07e7d22008-11-21 16:54:46 +00001532 context_set_fault_enable(context);
1533 context_set_present(context);
Weidong Han5331fe62008-12-08 23:00:00 +08001534 domain_flush_cache(domain, context, sizeof(*context));
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001535
David Woodhouse4c25a2c2009-05-10 17:16:06 +01001536 /*
1537 * It's a non-present to present mapping. If hardware doesn't cache
1538 * non-present entry we only need to flush the write-buffer. If the
1539 * _does_ cache non-present entries, then it does so in the special
1540 * domain #0, which we have to flush:
1541 */
1542 if (cap_caching_mode(iommu->cap)) {
1543 iommu->flush.flush_context(iommu, 0,
1544 (((u16)bus) << 8) | devfn,
1545 DMA_CCMD_MASK_NOBIT,
1546 DMA_CCMD_DEVICE_INVL);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01001547 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_DSI_FLUSH);
David Woodhouse4c25a2c2009-05-10 17:16:06 +01001548 } else {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001549 iommu_flush_write_buffer(iommu);
David Woodhouse4c25a2c2009-05-10 17:16:06 +01001550 }
Yu Zhao93a23a72009-05-18 13:51:37 +08001551 iommu_enable_dev_iotlb(info);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001552 spin_unlock_irqrestore(&iommu->lock, flags);
Weidong Hanc7151a82008-12-08 22:51:37 +08001553
1554 spin_lock_irqsave(&domain->iommu_lock, flags);
1555 if (!test_and_set_bit(iommu->seq_id, &domain->iommu_bmp)) {
1556 domain->iommu_count++;
Suresh Siddha4c923d42009-10-02 11:01:24 -07001557 if (domain->iommu_count == 1)
1558 domain->nid = iommu->node;
Sheng Yang58c610b2009-03-18 15:33:05 +08001559 domain_update_iommu_cap(domain);
Weidong Hanc7151a82008-12-08 22:51:37 +08001560 }
1561 spin_unlock_irqrestore(&domain->iommu_lock, flags);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001562 return 0;
1563}
1564
1565static int
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001566domain_context_mapping(struct dmar_domain *domain, struct pci_dev *pdev,
1567 int translation)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001568{
1569 int ret;
1570 struct pci_dev *tmp, *parent;
1571
David Woodhouse276dbf992009-04-04 01:45:37 +01001572 ret = domain_context_mapping_one(domain, pci_domain_nr(pdev->bus),
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001573 pdev->bus->number, pdev->devfn,
1574 translation);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001575 if (ret)
1576 return ret;
1577
1578 /* dependent device mapping */
1579 tmp = pci_find_upstream_pcie_bridge(pdev);
1580 if (!tmp)
1581 return 0;
1582 /* Secondary interface's bus number and devfn 0 */
1583 parent = pdev->bus->self;
1584 while (parent != tmp) {
David Woodhouse276dbf992009-04-04 01:45:37 +01001585 ret = domain_context_mapping_one(domain,
1586 pci_domain_nr(parent->bus),
1587 parent->bus->number,
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001588 parent->devfn, translation);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001589 if (ret)
1590 return ret;
1591 parent = parent->bus->self;
1592 }
Stefan Assmann45e829e2009-12-03 06:49:24 -05001593 if (pci_is_pcie(tmp)) /* this is a PCIe-to-PCI bridge */
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001594 return domain_context_mapping_one(domain,
David Woodhouse276dbf992009-04-04 01:45:37 +01001595 pci_domain_nr(tmp->subordinate),
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001596 tmp->subordinate->number, 0,
1597 translation);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001598 else /* this is a legacy PCI bridge */
1599 return domain_context_mapping_one(domain,
David Woodhouse276dbf992009-04-04 01:45:37 +01001600 pci_domain_nr(tmp->bus),
1601 tmp->bus->number,
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001602 tmp->devfn,
1603 translation);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001604}
1605
Weidong Han5331fe62008-12-08 23:00:00 +08001606static int domain_context_mapped(struct pci_dev *pdev)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001607{
1608 int ret;
1609 struct pci_dev *tmp, *parent;
Weidong Han5331fe62008-12-08 23:00:00 +08001610 struct intel_iommu *iommu;
1611
David Woodhouse276dbf992009-04-04 01:45:37 +01001612 iommu = device_to_iommu(pci_domain_nr(pdev->bus), pdev->bus->number,
1613 pdev->devfn);
Weidong Han5331fe62008-12-08 23:00:00 +08001614 if (!iommu)
1615 return -ENODEV;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001616
David Woodhouse276dbf992009-04-04 01:45:37 +01001617 ret = device_context_mapped(iommu, pdev->bus->number, pdev->devfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001618 if (!ret)
1619 return ret;
1620 /* dependent device mapping */
1621 tmp = pci_find_upstream_pcie_bridge(pdev);
1622 if (!tmp)
1623 return ret;
1624 /* Secondary interface's bus number and devfn 0 */
1625 parent = pdev->bus->self;
1626 while (parent != tmp) {
Weidong Han8c11e792008-12-08 15:29:22 +08001627 ret = device_context_mapped(iommu, parent->bus->number,
David Woodhouse276dbf992009-04-04 01:45:37 +01001628 parent->devfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001629 if (!ret)
1630 return ret;
1631 parent = parent->bus->self;
1632 }
Kenji Kaneshige5f4d91a2009-11-11 14:36:17 +09001633 if (pci_is_pcie(tmp))
David Woodhouse276dbf992009-04-04 01:45:37 +01001634 return device_context_mapped(iommu, tmp->subordinate->number,
1635 0);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001636 else
David Woodhouse276dbf992009-04-04 01:45:37 +01001637 return device_context_mapped(iommu, tmp->bus->number,
1638 tmp->devfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001639}
1640
Fenghua Yuf5329592009-08-04 15:09:37 -07001641/* Returns a number of VTD pages, but aligned to MM page size */
1642static inline unsigned long aligned_nrpages(unsigned long host_addr,
1643 size_t size)
1644{
1645 host_addr &= ~PAGE_MASK;
1646 return PAGE_ALIGN(host_addr + size) >> VTD_PAGE_SHIFT;
1647}
1648
David Woodhouse9051aa02009-06-29 12:30:54 +01001649static int __domain_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
1650 struct scatterlist *sg, unsigned long phys_pfn,
1651 unsigned long nr_pages, int prot)
David Woodhousee1605492009-06-29 11:17:38 +01001652{
1653 struct dma_pte *first_pte = NULL, *pte = NULL;
David Woodhouse9051aa02009-06-29 12:30:54 +01001654 phys_addr_t uninitialized_var(pteval);
David Woodhousee1605492009-06-29 11:17:38 +01001655 int addr_width = agaw_to_width(domain->agaw) - VTD_PAGE_SHIFT;
David Woodhouse9051aa02009-06-29 12:30:54 +01001656 unsigned long sg_res;
David Woodhousee1605492009-06-29 11:17:38 +01001657
1658 BUG_ON(addr_width < BITS_PER_LONG && (iov_pfn + nr_pages - 1) >> addr_width);
1659
1660 if ((prot & (DMA_PTE_READ|DMA_PTE_WRITE)) == 0)
1661 return -EINVAL;
1662
1663 prot &= DMA_PTE_READ | DMA_PTE_WRITE | DMA_PTE_SNP;
1664
David Woodhouse9051aa02009-06-29 12:30:54 +01001665 if (sg)
1666 sg_res = 0;
1667 else {
1668 sg_res = nr_pages + 1;
1669 pteval = ((phys_addr_t)phys_pfn << VTD_PAGE_SHIFT) | prot;
1670 }
1671
David Woodhousee1605492009-06-29 11:17:38 +01001672 while (nr_pages--) {
David Woodhousec85994e2009-07-01 19:21:24 +01001673 uint64_t tmp;
1674
David Woodhousee1605492009-06-29 11:17:38 +01001675 if (!sg_res) {
Fenghua Yuf5329592009-08-04 15:09:37 -07001676 sg_res = aligned_nrpages(sg->offset, sg->length);
David Woodhousee1605492009-06-29 11:17:38 +01001677 sg->dma_address = ((dma_addr_t)iov_pfn << VTD_PAGE_SHIFT) + sg->offset;
1678 sg->dma_length = sg->length;
1679 pteval = page_to_phys(sg_page(sg)) | prot;
1680 }
1681 if (!pte) {
1682 first_pte = pte = pfn_to_dma_pte(domain, iov_pfn);
1683 if (!pte)
1684 return -ENOMEM;
1685 }
1686 /* We don't need lock here, nobody else
1687 * touches the iova range
1688 */
David Woodhouse7766a3f2009-07-01 20:27:03 +01001689 tmp = cmpxchg64_local(&pte->val, 0ULL, pteval);
David Woodhousec85994e2009-07-01 19:21:24 +01001690 if (tmp) {
David Woodhouse1bf20f02009-06-29 22:06:43 +01001691 static int dumps = 5;
David Woodhousec85994e2009-07-01 19:21:24 +01001692 printk(KERN_CRIT "ERROR: DMA PTE for vPFN 0x%lx already set (to %llx not %llx)\n",
1693 iov_pfn, tmp, (unsigned long long)pteval);
David Woodhouse1bf20f02009-06-29 22:06:43 +01001694 if (dumps) {
1695 dumps--;
1696 debug_dma_dump_mappings(NULL);
1697 }
1698 WARN_ON(1);
1699 }
David Woodhousee1605492009-06-29 11:17:38 +01001700 pte++;
David Woodhouse75e6bf92009-07-02 11:21:16 +01001701 if (!nr_pages || first_pte_in_page(pte)) {
David Woodhousee1605492009-06-29 11:17:38 +01001702 domain_flush_cache(domain, first_pte,
1703 (void *)pte - (void *)first_pte);
1704 pte = NULL;
1705 }
1706 iov_pfn++;
1707 pteval += VTD_PAGE_SIZE;
1708 sg_res--;
1709 if (!sg_res)
1710 sg = sg_next(sg);
1711 }
1712 return 0;
1713}
1714
David Woodhouse9051aa02009-06-29 12:30:54 +01001715static inline int domain_sg_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
1716 struct scatterlist *sg, unsigned long nr_pages,
1717 int prot)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001718{
David Woodhouse9051aa02009-06-29 12:30:54 +01001719 return __domain_mapping(domain, iov_pfn, sg, 0, nr_pages, prot);
1720}
Fenghua Yu5b6985c2008-10-16 18:02:32 -07001721
David Woodhouse9051aa02009-06-29 12:30:54 +01001722static inline int domain_pfn_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
1723 unsigned long phys_pfn, unsigned long nr_pages,
1724 int prot)
1725{
1726 return __domain_mapping(domain, iov_pfn, NULL, phys_pfn, nr_pages, prot);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001727}
1728
Weidong Hanc7151a82008-12-08 22:51:37 +08001729static void iommu_detach_dev(struct intel_iommu *iommu, u8 bus, u8 devfn)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001730{
Weidong Hanc7151a82008-12-08 22:51:37 +08001731 if (!iommu)
1732 return;
Weidong Han8c11e792008-12-08 15:29:22 +08001733
1734 clear_context_table(iommu, bus, devfn);
1735 iommu->flush.flush_context(iommu, 0, 0, 0,
David Woodhouse4c25a2c2009-05-10 17:16:06 +01001736 DMA_CCMD_GLOBAL_INVL);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01001737 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001738}
1739
1740static void domain_remove_dev_info(struct dmar_domain *domain)
1741{
1742 struct device_domain_info *info;
1743 unsigned long flags;
Weidong Hanc7151a82008-12-08 22:51:37 +08001744 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001745
1746 spin_lock_irqsave(&device_domain_lock, flags);
1747 while (!list_empty(&domain->devices)) {
1748 info = list_entry(domain->devices.next,
1749 struct device_domain_info, link);
1750 list_del(&info->link);
1751 list_del(&info->global);
1752 if (info->dev)
Keshavamurthy, Anil S358dd8a2007-10-21 16:41:59 -07001753 info->dev->dev.archdata.iommu = NULL;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001754 spin_unlock_irqrestore(&device_domain_lock, flags);
1755
Yu Zhao93a23a72009-05-18 13:51:37 +08001756 iommu_disable_dev_iotlb(info);
David Woodhouse276dbf992009-04-04 01:45:37 +01001757 iommu = device_to_iommu(info->segment, info->bus, info->devfn);
Weidong Hanc7151a82008-12-08 22:51:37 +08001758 iommu_detach_dev(iommu, info->bus, info->devfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001759 free_devinfo_mem(info);
1760
1761 spin_lock_irqsave(&device_domain_lock, flags);
1762 }
1763 spin_unlock_irqrestore(&device_domain_lock, flags);
1764}
1765
1766/*
1767 * find_domain
Keshavamurthy, Anil S358dd8a2007-10-21 16:41:59 -07001768 * Note: we use struct pci_dev->dev.archdata.iommu stores the info
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001769 */
Kay, Allen M38717942008-09-09 18:37:29 +03001770static struct dmar_domain *
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001771find_domain(struct pci_dev *pdev)
1772{
1773 struct device_domain_info *info;
1774
1775 /* No lock here, assumes no domain exit in normal case */
Keshavamurthy, Anil S358dd8a2007-10-21 16:41:59 -07001776 info = pdev->dev.archdata.iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001777 if (info)
1778 return info->domain;
1779 return NULL;
1780}
1781
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001782/* domain is initialized */
1783static struct dmar_domain *get_domain_for_dev(struct pci_dev *pdev, int gaw)
1784{
1785 struct dmar_domain *domain, *found = NULL;
1786 struct intel_iommu *iommu;
1787 struct dmar_drhd_unit *drhd;
1788 struct device_domain_info *info, *tmp;
1789 struct pci_dev *dev_tmp;
1790 unsigned long flags;
1791 int bus = 0, devfn = 0;
David Woodhouse276dbf992009-04-04 01:45:37 +01001792 int segment;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001793 int ret;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001794
1795 domain = find_domain(pdev);
1796 if (domain)
1797 return domain;
1798
David Woodhouse276dbf992009-04-04 01:45:37 +01001799 segment = pci_domain_nr(pdev->bus);
1800
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001801 dev_tmp = pci_find_upstream_pcie_bridge(pdev);
1802 if (dev_tmp) {
Kenji Kaneshige5f4d91a2009-11-11 14:36:17 +09001803 if (pci_is_pcie(dev_tmp)) {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001804 bus = dev_tmp->subordinate->number;
1805 devfn = 0;
1806 } else {
1807 bus = dev_tmp->bus->number;
1808 devfn = dev_tmp->devfn;
1809 }
1810 spin_lock_irqsave(&device_domain_lock, flags);
1811 list_for_each_entry(info, &device_domain_list, global) {
David Woodhouse276dbf992009-04-04 01:45:37 +01001812 if (info->segment == segment &&
1813 info->bus == bus && info->devfn == devfn) {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001814 found = info->domain;
1815 break;
1816 }
1817 }
1818 spin_unlock_irqrestore(&device_domain_lock, flags);
1819 /* pcie-pci bridge already has a domain, uses it */
1820 if (found) {
1821 domain = found;
1822 goto found_domain;
1823 }
1824 }
1825
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001826 domain = alloc_domain();
1827 if (!domain)
1828 goto error;
1829
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001830 /* Allocate new domain for the device */
1831 drhd = dmar_find_matched_drhd_unit(pdev);
1832 if (!drhd) {
1833 printk(KERN_ERR "IOMMU: can't find DMAR for device %s\n",
1834 pci_name(pdev));
1835 return NULL;
1836 }
1837 iommu = drhd->iommu;
1838
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001839 ret = iommu_attach_domain(domain, iommu);
1840 if (ret) {
1841 domain_exit(domain);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001842 goto error;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001843 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001844
1845 if (domain_init(domain, gaw)) {
1846 domain_exit(domain);
1847 goto error;
1848 }
1849
1850 /* register pcie-to-pci device */
1851 if (dev_tmp) {
1852 info = alloc_devinfo_mem();
1853 if (!info) {
1854 domain_exit(domain);
1855 goto error;
1856 }
David Woodhouse276dbf992009-04-04 01:45:37 +01001857 info->segment = segment;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001858 info->bus = bus;
1859 info->devfn = devfn;
1860 info->dev = NULL;
1861 info->domain = domain;
1862 /* This domain is shared by devices under p2p bridge */
Weidong Han3b5410e2008-12-08 09:17:15 +08001863 domain->flags |= DOMAIN_FLAG_P2P_MULTIPLE_DEVICES;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001864
1865 /* pcie-to-pci bridge already has a domain, uses it */
1866 found = NULL;
1867 spin_lock_irqsave(&device_domain_lock, flags);
1868 list_for_each_entry(tmp, &device_domain_list, global) {
David Woodhouse276dbf992009-04-04 01:45:37 +01001869 if (tmp->segment == segment &&
1870 tmp->bus == bus && tmp->devfn == devfn) {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001871 found = tmp->domain;
1872 break;
1873 }
1874 }
1875 if (found) {
1876 free_devinfo_mem(info);
1877 domain_exit(domain);
1878 domain = found;
1879 } else {
1880 list_add(&info->link, &domain->devices);
1881 list_add(&info->global, &device_domain_list);
1882 }
1883 spin_unlock_irqrestore(&device_domain_lock, flags);
1884 }
1885
1886found_domain:
1887 info = alloc_devinfo_mem();
1888 if (!info)
1889 goto error;
David Woodhouse276dbf992009-04-04 01:45:37 +01001890 info->segment = segment;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001891 info->bus = pdev->bus->number;
1892 info->devfn = pdev->devfn;
1893 info->dev = pdev;
1894 info->domain = domain;
1895 spin_lock_irqsave(&device_domain_lock, flags);
1896 /* somebody is fast */
1897 found = find_domain(pdev);
1898 if (found != NULL) {
1899 spin_unlock_irqrestore(&device_domain_lock, flags);
1900 if (found != domain) {
1901 domain_exit(domain);
1902 domain = found;
1903 }
1904 free_devinfo_mem(info);
1905 return domain;
1906 }
1907 list_add(&info->link, &domain->devices);
1908 list_add(&info->global, &device_domain_list);
Keshavamurthy, Anil S358dd8a2007-10-21 16:41:59 -07001909 pdev->dev.archdata.iommu = info;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001910 spin_unlock_irqrestore(&device_domain_lock, flags);
1911 return domain;
1912error:
1913 /* recheck it here, maybe others set it */
1914 return find_domain(pdev);
1915}
1916
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001917static int iommu_identity_mapping;
David Woodhousee0fc7e02009-09-30 09:12:17 -07001918#define IDENTMAP_ALL 1
1919#define IDENTMAP_GFX 2
1920#define IDENTMAP_AZALIA 4
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001921
David Woodhouseb2132032009-06-26 18:50:28 +01001922static int iommu_domain_identity_map(struct dmar_domain *domain,
1923 unsigned long long start,
1924 unsigned long long end)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001925{
David Woodhousec5395d52009-06-28 16:35:56 +01001926 unsigned long first_vpfn = start >> VTD_PAGE_SHIFT;
1927 unsigned long last_vpfn = end >> VTD_PAGE_SHIFT;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001928
David Woodhousec5395d52009-06-28 16:35:56 +01001929 if (!reserve_iova(&domain->iovad, dma_to_mm_pfn(first_vpfn),
1930 dma_to_mm_pfn(last_vpfn))) {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001931 printk(KERN_ERR "IOMMU: reserve iova failed\n");
David Woodhouseb2132032009-06-26 18:50:28 +01001932 return -ENOMEM;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001933 }
1934
David Woodhousec5395d52009-06-28 16:35:56 +01001935 pr_debug("Mapping reserved region %llx-%llx for domain %d\n",
1936 start, end, domain->id);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001937 /*
1938 * RMRR range might have overlap with physical memory range,
1939 * clear it first
1940 */
David Woodhousec5395d52009-06-28 16:35:56 +01001941 dma_pte_clear_range(domain, first_vpfn, last_vpfn);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001942
David Woodhousec5395d52009-06-28 16:35:56 +01001943 return domain_pfn_mapping(domain, first_vpfn, first_vpfn,
1944 last_vpfn - first_vpfn + 1,
David Woodhouse61df7442009-06-28 11:55:58 +01001945 DMA_PTE_READ|DMA_PTE_WRITE);
David Woodhouseb2132032009-06-26 18:50:28 +01001946}
1947
1948static int iommu_prepare_identity_map(struct pci_dev *pdev,
1949 unsigned long long start,
1950 unsigned long long end)
1951{
1952 struct dmar_domain *domain;
1953 int ret;
1954
David Woodhousec7ab48d2009-06-26 19:10:36 +01001955 domain = get_domain_for_dev(pdev, DEFAULT_DOMAIN_ADDRESS_WIDTH);
David Woodhouseb2132032009-06-26 18:50:28 +01001956 if (!domain)
1957 return -ENOMEM;
1958
David Woodhouse19943b02009-08-04 16:19:20 +01001959 /* For _hardware_ passthrough, don't bother. But for software
1960 passthrough, we do it anyway -- it may indicate a memory
1961 range which is reserved in E820, so which didn't get set
1962 up to start with in si_domain */
1963 if (domain == si_domain && hw_pass_through) {
1964 printk("Ignoring identity map for HW passthrough device %s [0x%Lx - 0x%Lx]\n",
1965 pci_name(pdev), start, end);
1966 return 0;
1967 }
1968
1969 printk(KERN_INFO
1970 "IOMMU: Setting identity map for device %s [0x%Lx - 0x%Lx]\n",
1971 pci_name(pdev), start, end);
David Woodhouse2ff729f2009-08-26 14:25:41 +01001972
David Woodhouse5595b522009-12-02 09:21:55 +00001973 if (end < start) {
1974 WARN(1, "Your BIOS is broken; RMRR ends before it starts!\n"
1975 "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
1976 dmi_get_system_info(DMI_BIOS_VENDOR),
1977 dmi_get_system_info(DMI_BIOS_VERSION),
1978 dmi_get_system_info(DMI_PRODUCT_VERSION));
1979 ret = -EIO;
1980 goto error;
1981 }
1982
David Woodhouse2ff729f2009-08-26 14:25:41 +01001983 if (end >> agaw_to_width(domain->agaw)) {
1984 WARN(1, "Your BIOS is broken; RMRR exceeds permitted address width (%d bits)\n"
1985 "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
1986 agaw_to_width(domain->agaw),
1987 dmi_get_system_info(DMI_BIOS_VENDOR),
1988 dmi_get_system_info(DMI_BIOS_VERSION),
1989 dmi_get_system_info(DMI_PRODUCT_VERSION));
1990 ret = -EIO;
1991 goto error;
1992 }
David Woodhouse19943b02009-08-04 16:19:20 +01001993
David Woodhouseb2132032009-06-26 18:50:28 +01001994 ret = iommu_domain_identity_map(domain, start, end);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07001995 if (ret)
1996 goto error;
1997
1998 /* context entry init */
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001999 ret = domain_context_mapping(domain, pdev, CONTEXT_TT_MULTI_LEVEL);
David Woodhouseb2132032009-06-26 18:50:28 +01002000 if (ret)
2001 goto error;
2002
2003 return 0;
2004
2005 error:
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002006 domain_exit(domain);
2007 return ret;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002008}
2009
2010static inline int iommu_prepare_rmrr_dev(struct dmar_rmrr_unit *rmrr,
2011 struct pci_dev *pdev)
2012{
Keshavamurthy, Anil S358dd8a2007-10-21 16:41:59 -07002013 if (pdev->dev.archdata.iommu == DUMMY_DEVICE_DOMAIN_INFO)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002014 return 0;
2015 return iommu_prepare_identity_map(pdev, rmrr->base_address,
2016 rmrr->end_address + 1);
2017}
2018
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002019#ifdef CONFIG_DMAR_FLOPPY_WA
2020static inline void iommu_prepare_isa(void)
2021{
2022 struct pci_dev *pdev;
2023 int ret;
2024
2025 pdev = pci_get_class(PCI_CLASS_BRIDGE_ISA << 8, NULL);
2026 if (!pdev)
2027 return;
2028
David Woodhousec7ab48d2009-06-26 19:10:36 +01002029 printk(KERN_INFO "IOMMU: Prepare 0-16MiB unity mapping for LPC\n");
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002030 ret = iommu_prepare_identity_map(pdev, 0, 16*1024*1024);
2031
2032 if (ret)
David Woodhousec7ab48d2009-06-26 19:10:36 +01002033 printk(KERN_ERR "IOMMU: Failed to create 0-16MiB identity map; "
2034 "floppy might not work\n");
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002035
2036}
2037#else
2038static inline void iommu_prepare_isa(void)
2039{
2040 return;
2041}
2042#endif /* !CONFIG_DMAR_FLPY_WA */
2043
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002044static int md_domain_init(struct dmar_domain *domain, int guest_width);
David Woodhousec7ab48d2009-06-26 19:10:36 +01002045
2046static int __init si_domain_work_fn(unsigned long start_pfn,
2047 unsigned long end_pfn, void *datax)
2048{
2049 int *ret = datax;
2050
2051 *ret = iommu_domain_identity_map(si_domain,
2052 (uint64_t)start_pfn << PAGE_SHIFT,
2053 (uint64_t)end_pfn << PAGE_SHIFT);
2054 return *ret;
2055
2056}
2057
Matt Kraai071e1372009-08-23 22:30:22 -07002058static int __init si_domain_init(int hw)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002059{
2060 struct dmar_drhd_unit *drhd;
2061 struct intel_iommu *iommu;
David Woodhousec7ab48d2009-06-26 19:10:36 +01002062 int nid, ret = 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002063
2064 si_domain = alloc_domain();
2065 if (!si_domain)
2066 return -EFAULT;
2067
David Woodhousec7ab48d2009-06-26 19:10:36 +01002068 pr_debug("Identity mapping domain is domain %d\n", si_domain->id);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002069
2070 for_each_active_iommu(iommu, drhd) {
2071 ret = iommu_attach_domain(si_domain, iommu);
2072 if (ret) {
2073 domain_exit(si_domain);
2074 return -EFAULT;
2075 }
2076 }
2077
2078 if (md_domain_init(si_domain, DEFAULT_DOMAIN_ADDRESS_WIDTH)) {
2079 domain_exit(si_domain);
2080 return -EFAULT;
2081 }
2082
2083 si_domain->flags = DOMAIN_FLAG_STATIC_IDENTITY;
2084
David Woodhouse19943b02009-08-04 16:19:20 +01002085 if (hw)
2086 return 0;
2087
David Woodhousec7ab48d2009-06-26 19:10:36 +01002088 for_each_online_node(nid) {
2089 work_with_active_regions(nid, si_domain_work_fn, &ret);
2090 if (ret)
2091 return ret;
2092 }
2093
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002094 return 0;
2095}
2096
2097static void domain_remove_one_dev_info(struct dmar_domain *domain,
2098 struct pci_dev *pdev);
2099static int identity_mapping(struct pci_dev *pdev)
2100{
2101 struct device_domain_info *info;
2102
2103 if (likely(!iommu_identity_mapping))
2104 return 0;
2105
2106
2107 list_for_each_entry(info, &si_domain->devices, link)
2108 if (info->dev == pdev)
2109 return 1;
2110 return 0;
2111}
2112
2113static int domain_add_dev_info(struct dmar_domain *domain,
David Woodhouse5fe60f42009-08-09 10:53:41 +01002114 struct pci_dev *pdev,
2115 int translation)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002116{
2117 struct device_domain_info *info;
2118 unsigned long flags;
David Woodhouse5fe60f42009-08-09 10:53:41 +01002119 int ret;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002120
2121 info = alloc_devinfo_mem();
2122 if (!info)
2123 return -ENOMEM;
2124
David Woodhouse5fe60f42009-08-09 10:53:41 +01002125 ret = domain_context_mapping(domain, pdev, translation);
2126 if (ret) {
2127 free_devinfo_mem(info);
2128 return ret;
2129 }
2130
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002131 info->segment = pci_domain_nr(pdev->bus);
2132 info->bus = pdev->bus->number;
2133 info->devfn = pdev->devfn;
2134 info->dev = pdev;
2135 info->domain = domain;
2136
2137 spin_lock_irqsave(&device_domain_lock, flags);
2138 list_add(&info->link, &domain->devices);
2139 list_add(&info->global, &device_domain_list);
2140 pdev->dev.archdata.iommu = info;
2141 spin_unlock_irqrestore(&device_domain_lock, flags);
2142
2143 return 0;
2144}
2145
David Woodhouse6941af22009-07-04 18:24:27 +01002146static int iommu_should_identity_map(struct pci_dev *pdev, int startup)
2147{
David Woodhousee0fc7e02009-09-30 09:12:17 -07002148 if ((iommu_identity_mapping & IDENTMAP_AZALIA) && IS_AZALIA(pdev))
2149 return 1;
2150
2151 if ((iommu_identity_mapping & IDENTMAP_GFX) && IS_GFX_DEVICE(pdev))
2152 return 1;
2153
2154 if (!(iommu_identity_mapping & IDENTMAP_ALL))
2155 return 0;
David Woodhouse6941af22009-07-04 18:24:27 +01002156
David Woodhouse3dfc8132009-07-04 19:11:08 +01002157 /*
2158 * We want to start off with all devices in the 1:1 domain, and
2159 * take them out later if we find they can't access all of memory.
2160 *
2161 * However, we can't do this for PCI devices behind bridges,
2162 * because all PCI devices behind the same bridge will end up
2163 * with the same source-id on their transactions.
2164 *
2165 * Practically speaking, we can't change things around for these
2166 * devices at run-time, because we can't be sure there'll be no
2167 * DMA transactions in flight for any of their siblings.
2168 *
2169 * So PCI devices (unless they're on the root bus) as well as
2170 * their parent PCI-PCI or PCIe-PCI bridges must be left _out_ of
2171 * the 1:1 domain, just in _case_ one of their siblings turns out
2172 * not to be able to map all of memory.
2173 */
Kenji Kaneshige5f4d91a2009-11-11 14:36:17 +09002174 if (!pci_is_pcie(pdev)) {
David Woodhouse3dfc8132009-07-04 19:11:08 +01002175 if (!pci_is_root_bus(pdev->bus))
2176 return 0;
2177 if (pdev->class >> 8 == PCI_CLASS_BRIDGE_PCI)
2178 return 0;
2179 } else if (pdev->pcie_type == PCI_EXP_TYPE_PCI_BRIDGE)
2180 return 0;
2181
2182 /*
2183 * At boot time, we don't yet know if devices will be 64-bit capable.
2184 * Assume that they will -- if they turn out not to be, then we can
2185 * take them out of the 1:1 domain later.
2186 */
David Woodhouse6941af22009-07-04 18:24:27 +01002187 if (!startup)
2188 return pdev->dma_mask > DMA_BIT_MASK(32);
2189
2190 return 1;
2191}
2192
Matt Kraai071e1372009-08-23 22:30:22 -07002193static int __init iommu_prepare_static_identity_mapping(int hw)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002194{
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002195 struct pci_dev *pdev = NULL;
2196 int ret;
2197
David Woodhouse19943b02009-08-04 16:19:20 +01002198 ret = si_domain_init(hw);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002199 if (ret)
2200 return -EFAULT;
2201
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002202 for_each_pci_dev(pdev) {
David Woodhouse6941af22009-07-04 18:24:27 +01002203 if (iommu_should_identity_map(pdev, 1)) {
David Woodhouse19943b02009-08-04 16:19:20 +01002204 printk(KERN_INFO "IOMMU: %s identity mapping for device %s\n",
2205 hw ? "hardware" : "software", pci_name(pdev));
David Woodhousec7ab48d2009-06-26 19:10:36 +01002206
David Woodhouse5fe60f42009-08-09 10:53:41 +01002207 ret = domain_add_dev_info(si_domain, pdev,
David Woodhouse19943b02009-08-04 16:19:20 +01002208 hw ? CONTEXT_TT_PASS_THROUGH :
David Woodhouse62edf5d2009-07-04 10:59:46 +01002209 CONTEXT_TT_MULTI_LEVEL);
2210 if (ret)
2211 return ret;
David Woodhouse62edf5d2009-07-04 10:59:46 +01002212 }
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002213 }
2214
2215 return 0;
2216}
2217
2218int __init init_dmars(void)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002219{
2220 struct dmar_drhd_unit *drhd;
2221 struct dmar_rmrr_unit *rmrr;
2222 struct pci_dev *pdev;
2223 struct intel_iommu *iommu;
Suresh Siddha9d783ba2009-03-16 17:04:55 -07002224 int i, ret;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002225
2226 /*
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002227 * for each drhd
2228 * allocate root
2229 * initialize and program root entry to not present
2230 * endfor
2231 */
2232 for_each_drhd_unit(drhd) {
mark gross5e0d2a62008-03-04 15:22:08 -08002233 g_num_of_iommus++;
2234 /*
2235 * lock not needed as this is only incremented in the single
2236 * threaded kernel __init code path all other access are read
2237 * only
2238 */
2239 }
2240
Weidong Hand9630fe2008-12-08 11:06:32 +08002241 g_iommus = kcalloc(g_num_of_iommus, sizeof(struct intel_iommu *),
2242 GFP_KERNEL);
2243 if (!g_iommus) {
2244 printk(KERN_ERR "Allocating global iommu array failed\n");
2245 ret = -ENOMEM;
2246 goto error;
2247 }
2248
mark gross80b20dd2008-04-18 13:53:58 -07002249 deferred_flush = kzalloc(g_num_of_iommus *
2250 sizeof(struct deferred_flush_tables), GFP_KERNEL);
2251 if (!deferred_flush) {
mark gross5e0d2a62008-03-04 15:22:08 -08002252 ret = -ENOMEM;
2253 goto error;
2254 }
2255
mark gross5e0d2a62008-03-04 15:22:08 -08002256 for_each_drhd_unit(drhd) {
2257 if (drhd->ignored)
2258 continue;
Suresh Siddha1886e8a2008-07-10 11:16:37 -07002259
2260 iommu = drhd->iommu;
Weidong Hand9630fe2008-12-08 11:06:32 +08002261 g_iommus[iommu->seq_id] = iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002262
Suresh Siddhae61d98d2008-07-10 11:16:35 -07002263 ret = iommu_init_domains(iommu);
2264 if (ret)
2265 goto error;
2266
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002267 /*
2268 * TBD:
2269 * we could share the same root & context tables
2270 * amoung all IOMMU's. Need to Split it later.
2271 */
2272 ret = iommu_alloc_root_entry(iommu);
2273 if (ret) {
2274 printk(KERN_ERR "IOMMU: allocate root entry failed\n");
2275 goto error;
2276 }
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07002277 if (!ecap_pass_through(iommu->ecap))
David Woodhouse19943b02009-08-04 16:19:20 +01002278 hw_pass_through = 0;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002279 }
2280
Suresh Siddha1531a6a2009-03-16 17:04:57 -07002281 /*
2282 * Start from the sane iommu hardware state.
2283 */
Youquan Songa77b67d2008-10-16 16:31:56 -07002284 for_each_drhd_unit(drhd) {
2285 if (drhd->ignored)
2286 continue;
2287
2288 iommu = drhd->iommu;
Suresh Siddha1531a6a2009-03-16 17:04:57 -07002289
2290 /*
2291 * If the queued invalidation is already initialized by us
2292 * (for example, while enabling interrupt-remapping) then
2293 * we got the things already rolling from a sane state.
2294 */
2295 if (iommu->qi)
2296 continue;
2297
2298 /*
2299 * Clear any previous faults.
2300 */
2301 dmar_fault(-1, iommu);
2302 /*
2303 * Disable queued invalidation if supported and already enabled
2304 * before OS handover.
2305 */
2306 dmar_disable_qi(iommu);
2307 }
2308
2309 for_each_drhd_unit(drhd) {
2310 if (drhd->ignored)
2311 continue;
2312
2313 iommu = drhd->iommu;
2314
Youquan Songa77b67d2008-10-16 16:31:56 -07002315 if (dmar_enable_qi(iommu)) {
2316 /*
2317 * Queued Invalidate not enabled, use Register Based
2318 * Invalidate
2319 */
2320 iommu->flush.flush_context = __iommu_flush_context;
2321 iommu->flush.flush_iotlb = __iommu_flush_iotlb;
2322 printk(KERN_INFO "IOMMU 0x%Lx: using Register based "
FUJITA Tomonorib4e0f9e2008-11-19 13:53:42 +09002323 "invalidation\n",
2324 (unsigned long long)drhd->reg_base_addr);
Youquan Songa77b67d2008-10-16 16:31:56 -07002325 } else {
2326 iommu->flush.flush_context = qi_flush_context;
2327 iommu->flush.flush_iotlb = qi_flush_iotlb;
2328 printk(KERN_INFO "IOMMU 0x%Lx: using Queued "
FUJITA Tomonorib4e0f9e2008-11-19 13:53:42 +09002329 "invalidation\n",
2330 (unsigned long long)drhd->reg_base_addr);
Youquan Songa77b67d2008-10-16 16:31:56 -07002331 }
2332 }
2333
David Woodhouse19943b02009-08-04 16:19:20 +01002334 if (iommu_pass_through)
David Woodhousee0fc7e02009-09-30 09:12:17 -07002335 iommu_identity_mapping |= IDENTMAP_ALL;
2336
David Woodhouse19943b02009-08-04 16:19:20 +01002337#ifdef CONFIG_DMAR_BROKEN_GFX_WA
David Woodhousee0fc7e02009-09-30 09:12:17 -07002338 iommu_identity_mapping |= IDENTMAP_GFX;
David Woodhouse19943b02009-08-04 16:19:20 +01002339#endif
David Woodhousee0fc7e02009-09-30 09:12:17 -07002340
2341 check_tylersburg_isoch();
2342
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07002343 /*
2344 * If pass through is not set or not enabled, setup context entries for
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002345 * identity mappings for rmrr, gfx, and isa and may fall back to static
2346 * identity mapping if iommu_identity_mapping is set.
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07002347 */
David Woodhouse19943b02009-08-04 16:19:20 +01002348 if (iommu_identity_mapping) {
2349 ret = iommu_prepare_static_identity_mapping(hw_pass_through);
2350 if (ret) {
2351 printk(KERN_CRIT "Failed to setup IOMMU pass-through\n");
2352 goto error;
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07002353 }
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07002354 }
David Woodhouse19943b02009-08-04 16:19:20 +01002355 /*
2356 * For each rmrr
2357 * for each dev attached to rmrr
2358 * do
2359 * locate drhd for dev, alloc domain for dev
2360 * allocate free domain
2361 * allocate page table entries for rmrr
2362 * if context not allocated for bus
2363 * allocate and init context
2364 * set present in root table for this bus
2365 * init context with domain, translation etc
2366 * endfor
2367 * endfor
2368 */
2369 printk(KERN_INFO "IOMMU: Setting RMRR:\n");
2370 for_each_rmrr_units(rmrr) {
2371 for (i = 0; i < rmrr->devices_cnt; i++) {
2372 pdev = rmrr->devices[i];
2373 /*
2374 * some BIOS lists non-exist devices in DMAR
2375 * table.
2376 */
2377 if (!pdev)
2378 continue;
2379 ret = iommu_prepare_rmrr_dev(rmrr, pdev);
2380 if (ret)
2381 printk(KERN_ERR
2382 "IOMMU: mapping reserved region failed\n");
2383 }
2384 }
2385
2386 iommu_prepare_isa();
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002387
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002388 /*
2389 * for each drhd
2390 * enable fault log
2391 * global invalidate context cache
2392 * global invalidate iotlb
2393 * enable translation
2394 */
2395 for_each_drhd_unit(drhd) {
2396 if (drhd->ignored)
2397 continue;
2398 iommu = drhd->iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002399
2400 iommu_flush_write_buffer(iommu);
2401
Keshavamurthy, Anil S3460a6d2007-10-21 16:41:54 -07002402 ret = dmar_set_interrupt(iommu);
2403 if (ret)
2404 goto error;
2405
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002406 iommu_set_root_entry(iommu);
2407
David Woodhouse4c25a2c2009-05-10 17:16:06 +01002408 iommu->flush.flush_context(iommu, 0, 0, 0, DMA_CCMD_GLOBAL_INVL);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01002409 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
mark grossf8bab732008-02-08 04:18:38 -08002410
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002411 ret = iommu_enable_translation(iommu);
2412 if (ret)
2413 goto error;
David Woodhouseb94996c2009-09-19 15:28:12 -07002414
2415 iommu_disable_protect_mem_regions(iommu);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002416 }
2417
2418 return 0;
2419error:
2420 for_each_drhd_unit(drhd) {
2421 if (drhd->ignored)
2422 continue;
2423 iommu = drhd->iommu;
2424 free_iommu(iommu);
2425 }
Weidong Hand9630fe2008-12-08 11:06:32 +08002426 kfree(g_iommus);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002427 return ret;
2428}
2429
David Woodhouse5a5e02a2009-07-04 09:35:44 +01002430/* This takes a number of _MM_ pages, not VTD pages */
David Woodhouse875764d2009-06-28 21:20:51 +01002431static struct iova *intel_alloc_iova(struct device *dev,
2432 struct dmar_domain *domain,
2433 unsigned long nrpages, uint64_t dma_mask)
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002434{
2435 struct pci_dev *pdev = to_pci_dev(dev);
2436 struct iova *iova = NULL;
2437
David Woodhouse875764d2009-06-28 21:20:51 +01002438 /* Restrict dma_mask to the width that the iommu can handle */
2439 dma_mask = min_t(uint64_t, DOMAIN_MAX_ADDR(domain->gaw), dma_mask);
2440
2441 if (!dmar_forcedac && dma_mask > DMA_BIT_MASK(32)) {
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002442 /*
2443 * First try to allocate an io virtual address in
Yang Hongyang284901a2009-04-06 19:01:15 -07002444 * DMA_BIT_MASK(32) and if that fails then try allocating
Joe Perches36098012007-12-17 11:40:11 -08002445 * from higher range
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002446 */
David Woodhouse875764d2009-06-28 21:20:51 +01002447 iova = alloc_iova(&domain->iovad, nrpages,
2448 IOVA_PFN(DMA_BIT_MASK(32)), 1);
2449 if (iova)
2450 return iova;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002451 }
David Woodhouse875764d2009-06-28 21:20:51 +01002452 iova = alloc_iova(&domain->iovad, nrpages, IOVA_PFN(dma_mask), 1);
2453 if (unlikely(!iova)) {
2454 printk(KERN_ERR "Allocating %ld-page iova for %s failed",
2455 nrpages, pci_name(pdev));
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002456 return NULL;
2457 }
2458
2459 return iova;
2460}
2461
David Woodhouse147202a2009-07-07 19:43:20 +01002462static struct dmar_domain *__get_valid_domain_for_dev(struct pci_dev *pdev)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002463{
2464 struct dmar_domain *domain;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002465 int ret;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002466
2467 domain = get_domain_for_dev(pdev,
2468 DEFAULT_DOMAIN_ADDRESS_WIDTH);
2469 if (!domain) {
2470 printk(KERN_ERR
2471 "Allocating domain for %s failed", pci_name(pdev));
Al Viro4fe05bb2007-10-29 04:51:16 +00002472 return NULL;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002473 }
2474
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002475 /* make sure context mapping is ok */
Weidong Han5331fe62008-12-08 23:00:00 +08002476 if (unlikely(!domain_context_mapped(pdev))) {
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07002477 ret = domain_context_mapping(domain, pdev,
2478 CONTEXT_TT_MULTI_LEVEL);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002479 if (ret) {
2480 printk(KERN_ERR
2481 "Domain context map for %s failed",
2482 pci_name(pdev));
Al Viro4fe05bb2007-10-29 04:51:16 +00002483 return NULL;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002484 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002485 }
2486
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002487 return domain;
2488}
2489
David Woodhouse147202a2009-07-07 19:43:20 +01002490static inline struct dmar_domain *get_valid_domain_for_dev(struct pci_dev *dev)
2491{
2492 struct device_domain_info *info;
2493
2494 /* No lock here, assumes no domain exit in normal case */
2495 info = dev->dev.archdata.iommu;
2496 if (likely(info))
2497 return info->domain;
2498
2499 return __get_valid_domain_for_dev(dev);
2500}
2501
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002502static int iommu_dummy(struct pci_dev *pdev)
2503{
2504 return pdev->dev.archdata.iommu == DUMMY_DEVICE_DOMAIN_INFO;
2505}
2506
2507/* Check if the pdev needs to go through non-identity map and unmap process.*/
David Woodhouse73676832009-07-04 14:08:36 +01002508static int iommu_no_mapping(struct device *dev)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002509{
David Woodhouse73676832009-07-04 14:08:36 +01002510 struct pci_dev *pdev;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002511 int found;
2512
David Woodhouse73676832009-07-04 14:08:36 +01002513 if (unlikely(dev->bus != &pci_bus_type))
2514 return 1;
2515
2516 pdev = to_pci_dev(dev);
David Woodhouse1e4c64c2009-07-04 10:40:38 +01002517 if (iommu_dummy(pdev))
2518 return 1;
2519
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002520 if (!iommu_identity_mapping)
David Woodhouse1e4c64c2009-07-04 10:40:38 +01002521 return 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002522
2523 found = identity_mapping(pdev);
2524 if (found) {
David Woodhouse6941af22009-07-04 18:24:27 +01002525 if (iommu_should_identity_map(pdev, 0))
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002526 return 1;
2527 else {
2528 /*
2529 * 32 bit DMA is removed from si_domain and fall back
2530 * to non-identity mapping.
2531 */
2532 domain_remove_one_dev_info(si_domain, pdev);
2533 printk(KERN_INFO "32bit %s uses non-identity mapping\n",
2534 pci_name(pdev));
2535 return 0;
2536 }
2537 } else {
2538 /*
2539 * In case of a detached 64 bit DMA device from vm, the device
2540 * is put into si_domain for identity mapping.
2541 */
David Woodhouse6941af22009-07-04 18:24:27 +01002542 if (iommu_should_identity_map(pdev, 0)) {
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002543 int ret;
David Woodhouse5fe60f42009-08-09 10:53:41 +01002544 ret = domain_add_dev_info(si_domain, pdev,
2545 hw_pass_through ?
2546 CONTEXT_TT_PASS_THROUGH :
2547 CONTEXT_TT_MULTI_LEVEL);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002548 if (!ret) {
2549 printk(KERN_INFO "64bit %s uses identity mapping\n",
2550 pci_name(pdev));
2551 return 1;
2552 }
2553 }
2554 }
2555
David Woodhouse1e4c64c2009-07-04 10:40:38 +01002556 return 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002557}
2558
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09002559static dma_addr_t __intel_map_single(struct device *hwdev, phys_addr_t paddr,
2560 size_t size, int dir, u64 dma_mask)
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002561{
2562 struct pci_dev *pdev = to_pci_dev(hwdev);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002563 struct dmar_domain *domain;
Fenghua Yu5b6985c2008-10-16 18:02:32 -07002564 phys_addr_t start_paddr;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002565 struct iova *iova;
2566 int prot = 0;
Ingo Molnar6865f0d2008-04-22 11:09:04 +02002567 int ret;
Weidong Han8c11e792008-12-08 15:29:22 +08002568 struct intel_iommu *iommu;
Fenghua Yu33041ec2009-08-04 15:10:59 -07002569 unsigned long paddr_pfn = paddr >> PAGE_SHIFT;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002570
2571 BUG_ON(dir == DMA_NONE);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002572
David Woodhouse73676832009-07-04 14:08:36 +01002573 if (iommu_no_mapping(hwdev))
Ingo Molnar6865f0d2008-04-22 11:09:04 +02002574 return paddr;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002575
2576 domain = get_valid_domain_for_dev(pdev);
2577 if (!domain)
2578 return 0;
2579
Weidong Han8c11e792008-12-08 15:29:22 +08002580 iommu = domain_get_iommu(domain);
David Woodhouse88cb6a72009-06-28 15:03:06 +01002581 size = aligned_nrpages(paddr, size);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002582
David Woodhouse5a5e02a2009-07-04 09:35:44 +01002583 iova = intel_alloc_iova(hwdev, domain, dma_to_mm_pfn(size),
2584 pdev->dma_mask);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002585 if (!iova)
2586 goto error;
2587
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002588 /*
2589 * Check if DMAR supports zero-length reads on write only
2590 * mappings..
2591 */
2592 if (dir == DMA_TO_DEVICE || dir == DMA_BIDIRECTIONAL || \
Weidong Han8c11e792008-12-08 15:29:22 +08002593 !cap_zlr(iommu->cap))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002594 prot |= DMA_PTE_READ;
2595 if (dir == DMA_FROM_DEVICE || dir == DMA_BIDIRECTIONAL)
2596 prot |= DMA_PTE_WRITE;
2597 /*
Ingo Molnar6865f0d2008-04-22 11:09:04 +02002598 * paddr - (paddr + size) might be partial page, we should map the whole
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002599 * page. Note: if two part of one page are separately mapped, we
Ingo Molnar6865f0d2008-04-22 11:09:04 +02002600 * might have two guest_addr mapping to the same host paddr, but this
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002601 * is not a big problem
2602 */
David Woodhouse0ab36de2009-06-28 14:01:43 +01002603 ret = domain_pfn_mapping(domain, mm_to_dma_pfn(iova->pfn_lo),
Fenghua Yu33041ec2009-08-04 15:10:59 -07002604 mm_to_dma_pfn(paddr_pfn), size, prot);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002605 if (ret)
2606 goto error;
2607
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01002608 /* it's a non-present to present mapping. Only flush if caching mode */
2609 if (cap_caching_mode(iommu->cap))
David Woodhouse03d6a242009-06-28 15:33:46 +01002610 iommu_flush_iotlb_psi(iommu, 0, mm_to_dma_pfn(iova->pfn_lo), size);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01002611 else
Weidong Han8c11e792008-12-08 15:29:22 +08002612 iommu_flush_write_buffer(iommu);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002613
David Woodhouse03d6a242009-06-28 15:33:46 +01002614 start_paddr = (phys_addr_t)iova->pfn_lo << PAGE_SHIFT;
2615 start_paddr += paddr & ~PAGE_MASK;
2616 return start_paddr;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002617
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002618error:
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002619 if (iova)
2620 __free_iova(&domain->iovad, iova);
David Woodhouse4cf2e752009-02-11 17:23:43 +00002621 printk(KERN_ERR"Device %s request: %zx@%llx dir %d --- failed\n",
Fenghua Yu5b6985c2008-10-16 18:02:32 -07002622 pci_name(pdev), size, (unsigned long long)paddr, dir);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002623 return 0;
2624}
2625
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09002626static dma_addr_t intel_map_page(struct device *dev, struct page *page,
2627 unsigned long offset, size_t size,
2628 enum dma_data_direction dir,
2629 struct dma_attrs *attrs)
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09002630{
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09002631 return __intel_map_single(dev, page_to_phys(page) + offset, size,
2632 dir, to_pci_dev(dev)->dma_mask);
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09002633}
2634
mark gross5e0d2a62008-03-04 15:22:08 -08002635static void flush_unmaps(void)
2636{
mark gross80b20dd2008-04-18 13:53:58 -07002637 int i, j;
mark gross5e0d2a62008-03-04 15:22:08 -08002638
mark gross5e0d2a62008-03-04 15:22:08 -08002639 timer_on = 0;
2640
2641 /* just flush them all */
2642 for (i = 0; i < g_num_of_iommus; i++) {
Weidong Hana2bb8452008-12-08 11:24:12 +08002643 struct intel_iommu *iommu = g_iommus[i];
2644 if (!iommu)
2645 continue;
Suresh Siddhac42d9f32008-07-10 11:16:36 -07002646
Yu Zhao9dd2fe82009-05-18 13:51:36 +08002647 if (!deferred_flush[i].next)
2648 continue;
2649
2650 iommu->flush.flush_iotlb(iommu, 0, 0, 0,
Yu Zhao93a23a72009-05-18 13:51:37 +08002651 DMA_TLB_GLOBAL_FLUSH);
Yu Zhao9dd2fe82009-05-18 13:51:36 +08002652 for (j = 0; j < deferred_flush[i].next; j++) {
Yu Zhao93a23a72009-05-18 13:51:37 +08002653 unsigned long mask;
2654 struct iova *iova = deferred_flush[i].iova[j];
2655
Benjamin LaHaise64de5af2009-09-16 21:05:55 -04002656 mask = ilog2(mm_to_dma_pfn(iova->pfn_hi - iova->pfn_lo + 1));
Yu Zhao93a23a72009-05-18 13:51:37 +08002657 iommu_flush_dev_iotlb(deferred_flush[i].domain[j],
Benjamin LaHaise64de5af2009-09-16 21:05:55 -04002658 (uint64_t)iova->pfn_lo << PAGE_SHIFT, mask);
Yu Zhao93a23a72009-05-18 13:51:37 +08002659 __free_iova(&deferred_flush[i].domain[j]->iovad, iova);
mark gross80b20dd2008-04-18 13:53:58 -07002660 }
Yu Zhao9dd2fe82009-05-18 13:51:36 +08002661 deferred_flush[i].next = 0;
mark gross5e0d2a62008-03-04 15:22:08 -08002662 }
2663
mark gross5e0d2a62008-03-04 15:22:08 -08002664 list_size = 0;
mark gross5e0d2a62008-03-04 15:22:08 -08002665}
2666
2667static void flush_unmaps_timeout(unsigned long data)
2668{
mark gross80b20dd2008-04-18 13:53:58 -07002669 unsigned long flags;
2670
2671 spin_lock_irqsave(&async_umap_flush_lock, flags);
mark gross5e0d2a62008-03-04 15:22:08 -08002672 flush_unmaps();
mark gross80b20dd2008-04-18 13:53:58 -07002673 spin_unlock_irqrestore(&async_umap_flush_lock, flags);
mark gross5e0d2a62008-03-04 15:22:08 -08002674}
2675
2676static void add_unmap(struct dmar_domain *dom, struct iova *iova)
2677{
2678 unsigned long flags;
mark gross80b20dd2008-04-18 13:53:58 -07002679 int next, iommu_id;
Weidong Han8c11e792008-12-08 15:29:22 +08002680 struct intel_iommu *iommu;
mark gross5e0d2a62008-03-04 15:22:08 -08002681
2682 spin_lock_irqsave(&async_umap_flush_lock, flags);
mark gross80b20dd2008-04-18 13:53:58 -07002683 if (list_size == HIGH_WATER_MARK)
2684 flush_unmaps();
2685
Weidong Han8c11e792008-12-08 15:29:22 +08002686 iommu = domain_get_iommu(dom);
2687 iommu_id = iommu->seq_id;
Suresh Siddhac42d9f32008-07-10 11:16:36 -07002688
mark gross80b20dd2008-04-18 13:53:58 -07002689 next = deferred_flush[iommu_id].next;
2690 deferred_flush[iommu_id].domain[next] = dom;
2691 deferred_flush[iommu_id].iova[next] = iova;
2692 deferred_flush[iommu_id].next++;
mark gross5e0d2a62008-03-04 15:22:08 -08002693
2694 if (!timer_on) {
2695 mod_timer(&unmap_timer, jiffies + msecs_to_jiffies(10));
2696 timer_on = 1;
2697 }
2698 list_size++;
2699 spin_unlock_irqrestore(&async_umap_flush_lock, flags);
2700}
2701
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09002702static void intel_unmap_page(struct device *dev, dma_addr_t dev_addr,
2703 size_t size, enum dma_data_direction dir,
2704 struct dma_attrs *attrs)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002705{
2706 struct pci_dev *pdev = to_pci_dev(dev);
2707 struct dmar_domain *domain;
David Woodhoused794dc92009-06-28 00:27:49 +01002708 unsigned long start_pfn, last_pfn;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002709 struct iova *iova;
Weidong Han8c11e792008-12-08 15:29:22 +08002710 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002711
David Woodhouse73676832009-07-04 14:08:36 +01002712 if (iommu_no_mapping(dev))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002713 return;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002714
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002715 domain = find_domain(pdev);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002716 BUG_ON(!domain);
2717
Weidong Han8c11e792008-12-08 15:29:22 +08002718 iommu = domain_get_iommu(domain);
2719
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002720 iova = find_iova(&domain->iovad, IOVA_PFN(dev_addr));
David Woodhouse85b98272009-07-01 19:27:53 +01002721 if (WARN_ONCE(!iova, "Driver unmaps unmatched page at PFN %llx\n",
2722 (unsigned long long)dev_addr))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002723 return;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002724
David Woodhoused794dc92009-06-28 00:27:49 +01002725 start_pfn = mm_to_dma_pfn(iova->pfn_lo);
2726 last_pfn = mm_to_dma_pfn(iova->pfn_hi + 1) - 1;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002727
David Woodhoused794dc92009-06-28 00:27:49 +01002728 pr_debug("Device %s unmapping: pfn %lx-%lx\n",
2729 pci_name(pdev), start_pfn, last_pfn);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002730
2731 /* clear the whole page */
David Woodhoused794dc92009-06-28 00:27:49 +01002732 dma_pte_clear_range(domain, start_pfn, last_pfn);
2733
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002734 /* free page tables */
David Woodhoused794dc92009-06-28 00:27:49 +01002735 dma_pte_free_pagetable(domain, start_pfn, last_pfn);
2736
mark gross5e0d2a62008-03-04 15:22:08 -08002737 if (intel_iommu_strict) {
David Woodhouse03d6a242009-06-28 15:33:46 +01002738 iommu_flush_iotlb_psi(iommu, domain->id, start_pfn,
David Woodhoused794dc92009-06-28 00:27:49 +01002739 last_pfn - start_pfn + 1);
mark gross5e0d2a62008-03-04 15:22:08 -08002740 /* free iova */
2741 __free_iova(&domain->iovad, iova);
2742 } else {
2743 add_unmap(domain, iova);
2744 /*
2745 * queue up the release of the unmap to save the 1/6th of the
2746 * cpu used up by the iotlb flush operation...
2747 */
mark gross5e0d2a62008-03-04 15:22:08 -08002748 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002749}
2750
FUJITA Tomonorid7ab5c42009-01-28 21:53:18 +09002751static void *intel_alloc_coherent(struct device *hwdev, size_t size,
2752 dma_addr_t *dma_handle, gfp_t flags)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002753{
2754 void *vaddr;
2755 int order;
2756
Fenghua Yu5b6985c2008-10-16 18:02:32 -07002757 size = PAGE_ALIGN(size);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002758 order = get_order(size);
Alex Williamsone8bb9102009-11-04 15:59:34 -07002759
2760 if (!iommu_no_mapping(hwdev))
2761 flags &= ~(GFP_DMA | GFP_DMA32);
2762 else if (hwdev->coherent_dma_mask < dma_get_required_mask(hwdev)) {
2763 if (hwdev->coherent_dma_mask < DMA_BIT_MASK(32))
2764 flags |= GFP_DMA;
2765 else
2766 flags |= GFP_DMA32;
2767 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002768
2769 vaddr = (void *)__get_free_pages(flags, order);
2770 if (!vaddr)
2771 return NULL;
2772 memset(vaddr, 0, size);
2773
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09002774 *dma_handle = __intel_map_single(hwdev, virt_to_bus(vaddr), size,
2775 DMA_BIDIRECTIONAL,
2776 hwdev->coherent_dma_mask);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002777 if (*dma_handle)
2778 return vaddr;
2779 free_pages((unsigned long)vaddr, order);
2780 return NULL;
2781}
2782
FUJITA Tomonorid7ab5c42009-01-28 21:53:18 +09002783static void intel_free_coherent(struct device *hwdev, size_t size, void *vaddr,
2784 dma_addr_t dma_handle)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002785{
2786 int order;
2787
Fenghua Yu5b6985c2008-10-16 18:02:32 -07002788 size = PAGE_ALIGN(size);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002789 order = get_order(size);
2790
David Woodhouse0db9b7a2009-07-14 02:01:57 +01002791 intel_unmap_page(hwdev, dma_handle, size, DMA_BIDIRECTIONAL, NULL);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002792 free_pages((unsigned long)vaddr, order);
2793}
2794
FUJITA Tomonorid7ab5c42009-01-28 21:53:18 +09002795static void intel_unmap_sg(struct device *hwdev, struct scatterlist *sglist,
2796 int nelems, enum dma_data_direction dir,
2797 struct dma_attrs *attrs)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002798{
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002799 struct pci_dev *pdev = to_pci_dev(hwdev);
2800 struct dmar_domain *domain;
David Woodhoused794dc92009-06-28 00:27:49 +01002801 unsigned long start_pfn, last_pfn;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002802 struct iova *iova;
Weidong Han8c11e792008-12-08 15:29:22 +08002803 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002804
David Woodhouse73676832009-07-04 14:08:36 +01002805 if (iommu_no_mapping(hwdev))
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002806 return;
2807
2808 domain = find_domain(pdev);
Weidong Han8c11e792008-12-08 15:29:22 +08002809 BUG_ON(!domain);
2810
2811 iommu = domain_get_iommu(domain);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002812
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07002813 iova = find_iova(&domain->iovad, IOVA_PFN(sglist[0].dma_address));
David Woodhouse85b98272009-07-01 19:27:53 +01002814 if (WARN_ONCE(!iova, "Driver unmaps unmatched sglist at PFN %llx\n",
2815 (unsigned long long)sglist[0].dma_address))
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002816 return;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002817
David Woodhoused794dc92009-06-28 00:27:49 +01002818 start_pfn = mm_to_dma_pfn(iova->pfn_lo);
2819 last_pfn = mm_to_dma_pfn(iova->pfn_hi + 1) - 1;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002820
2821 /* clear the whole page */
David Woodhoused794dc92009-06-28 00:27:49 +01002822 dma_pte_clear_range(domain, start_pfn, last_pfn);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002823
David Woodhoused794dc92009-06-28 00:27:49 +01002824 /* free page tables */
2825 dma_pte_free_pagetable(domain, start_pfn, last_pfn);
2826
David Woodhouseacea0012009-07-14 01:55:11 +01002827 if (intel_iommu_strict) {
2828 iommu_flush_iotlb_psi(iommu, domain->id, start_pfn,
2829 last_pfn - start_pfn + 1);
2830 /* free iova */
2831 __free_iova(&domain->iovad, iova);
2832 } else {
2833 add_unmap(domain, iova);
2834 /*
2835 * queue up the release of the unmap to save the 1/6th of the
2836 * cpu used up by the iotlb flush operation...
2837 */
2838 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002839}
2840
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002841static int intel_nontranslate_map_sg(struct device *hddev,
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07002842 struct scatterlist *sglist, int nelems, int dir)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002843{
2844 int i;
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07002845 struct scatterlist *sg;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002846
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07002847 for_each_sg(sglist, sg, nelems, i) {
FUJITA Tomonori12d4d402007-10-23 09:32:25 +02002848 BUG_ON(!sg_page(sg));
David Woodhouse4cf2e752009-02-11 17:23:43 +00002849 sg->dma_address = page_to_phys(sg_page(sg)) + sg->offset;
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07002850 sg->dma_length = sg->length;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002851 }
2852 return nelems;
2853}
2854
FUJITA Tomonorid7ab5c42009-01-28 21:53:18 +09002855static int intel_map_sg(struct device *hwdev, struct scatterlist *sglist, int nelems,
2856 enum dma_data_direction dir, struct dma_attrs *attrs)
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002857{
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002858 int i;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002859 struct pci_dev *pdev = to_pci_dev(hwdev);
2860 struct dmar_domain *domain;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002861 size_t size = 0;
2862 int prot = 0;
David Woodhouseb536d242009-06-28 14:49:31 +01002863 size_t offset_pfn = 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002864 struct iova *iova = NULL;
2865 int ret;
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07002866 struct scatterlist *sg;
David Woodhouseb536d242009-06-28 14:49:31 +01002867 unsigned long start_vpfn;
Weidong Han8c11e792008-12-08 15:29:22 +08002868 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002869
2870 BUG_ON(dir == DMA_NONE);
David Woodhouse73676832009-07-04 14:08:36 +01002871 if (iommu_no_mapping(hwdev))
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07002872 return intel_nontranslate_map_sg(hwdev, sglist, nelems, dir);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002873
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002874 domain = get_valid_domain_for_dev(pdev);
2875 if (!domain)
2876 return 0;
2877
Weidong Han8c11e792008-12-08 15:29:22 +08002878 iommu = domain_get_iommu(domain);
2879
David Woodhouseb536d242009-06-28 14:49:31 +01002880 for_each_sg(sglist, sg, nelems, i)
David Woodhouse88cb6a72009-06-28 15:03:06 +01002881 size += aligned_nrpages(sg->offset, sg->length);
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002882
David Woodhouse5a5e02a2009-07-04 09:35:44 +01002883 iova = intel_alloc_iova(hwdev, domain, dma_to_mm_pfn(size),
2884 pdev->dma_mask);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002885 if (!iova) {
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07002886 sglist->dma_length = 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002887 return 0;
2888 }
2889
2890 /*
2891 * Check if DMAR supports zero-length reads on write only
2892 * mappings..
2893 */
2894 if (dir == DMA_TO_DEVICE || dir == DMA_BIDIRECTIONAL || \
Weidong Han8c11e792008-12-08 15:29:22 +08002895 !cap_zlr(iommu->cap))
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002896 prot |= DMA_PTE_READ;
2897 if (dir == DMA_FROM_DEVICE || dir == DMA_BIDIRECTIONAL)
2898 prot |= DMA_PTE_WRITE;
2899
David Woodhouseb536d242009-06-28 14:49:31 +01002900 start_vpfn = mm_to_dma_pfn(iova->pfn_lo);
David Woodhousee1605492009-06-29 11:17:38 +01002901
Fenghua Yuf5329592009-08-04 15:09:37 -07002902 ret = domain_sg_mapping(domain, start_vpfn, sglist, size, prot);
David Woodhousee1605492009-06-29 11:17:38 +01002903 if (unlikely(ret)) {
2904 /* clear the page */
2905 dma_pte_clear_range(domain, start_vpfn,
2906 start_vpfn + size - 1);
2907 /* free page tables */
2908 dma_pte_free_pagetable(domain, start_vpfn,
2909 start_vpfn + size - 1);
2910 /* free iova */
2911 __free_iova(&domain->iovad, iova);
2912 return 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07002913 }
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002914
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01002915 /* it's a non-present to present mapping. Only flush if caching mode */
2916 if (cap_caching_mode(iommu->cap))
David Woodhouse03d6a242009-06-28 15:33:46 +01002917 iommu_flush_iotlb_psi(iommu, 0, start_vpfn, offset_pfn);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01002918 else
Weidong Han8c11e792008-12-08 15:29:22 +08002919 iommu_flush_write_buffer(iommu);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01002920
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002921 return nelems;
2922}
2923
FUJITA Tomonoridfb805e2009-01-28 21:53:17 +09002924static int intel_mapping_error(struct device *dev, dma_addr_t dma_addr)
2925{
2926 return !dma_addr;
2927}
2928
FUJITA Tomonori160c1d82009-01-05 23:59:02 +09002929struct dma_map_ops intel_dma_ops = {
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002930 .alloc_coherent = intel_alloc_coherent,
2931 .free_coherent = intel_free_coherent,
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002932 .map_sg = intel_map_sg,
2933 .unmap_sg = intel_unmap_sg,
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09002934 .map_page = intel_map_page,
2935 .unmap_page = intel_unmap_page,
FUJITA Tomonoridfb805e2009-01-28 21:53:17 +09002936 .mapping_error = intel_mapping_error,
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002937};
2938
2939static inline int iommu_domain_cache_init(void)
2940{
2941 int ret = 0;
2942
2943 iommu_domain_cache = kmem_cache_create("iommu_domain",
2944 sizeof(struct dmar_domain),
2945 0,
2946 SLAB_HWCACHE_ALIGN,
2947
2948 NULL);
2949 if (!iommu_domain_cache) {
2950 printk(KERN_ERR "Couldn't create iommu_domain cache\n");
2951 ret = -ENOMEM;
2952 }
2953
2954 return ret;
2955}
2956
2957static inline int iommu_devinfo_cache_init(void)
2958{
2959 int ret = 0;
2960
2961 iommu_devinfo_cache = kmem_cache_create("iommu_devinfo",
2962 sizeof(struct device_domain_info),
2963 0,
2964 SLAB_HWCACHE_ALIGN,
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002965 NULL);
2966 if (!iommu_devinfo_cache) {
2967 printk(KERN_ERR "Couldn't create devinfo cache\n");
2968 ret = -ENOMEM;
2969 }
2970
2971 return ret;
2972}
2973
2974static inline int iommu_iova_cache_init(void)
2975{
2976 int ret = 0;
2977
2978 iommu_iova_cache = kmem_cache_create("iommu_iova",
2979 sizeof(struct iova),
2980 0,
2981 SLAB_HWCACHE_ALIGN,
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07002982 NULL);
2983 if (!iommu_iova_cache) {
2984 printk(KERN_ERR "Couldn't create iova cache\n");
2985 ret = -ENOMEM;
2986 }
2987
2988 return ret;
2989}
2990
2991static int __init iommu_init_mempool(void)
2992{
2993 int ret;
2994 ret = iommu_iova_cache_init();
2995 if (ret)
2996 return ret;
2997
2998 ret = iommu_domain_cache_init();
2999 if (ret)
3000 goto domain_error;
3001
3002 ret = iommu_devinfo_cache_init();
3003 if (!ret)
3004 return ret;
3005
3006 kmem_cache_destroy(iommu_domain_cache);
3007domain_error:
3008 kmem_cache_destroy(iommu_iova_cache);
3009
3010 return -ENOMEM;
3011}
3012
3013static void __init iommu_exit_mempool(void)
3014{
3015 kmem_cache_destroy(iommu_devinfo_cache);
3016 kmem_cache_destroy(iommu_domain_cache);
3017 kmem_cache_destroy(iommu_iova_cache);
3018
3019}
3020
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003021static void __init init_no_remapping_devices(void)
3022{
3023 struct dmar_drhd_unit *drhd;
3024
3025 for_each_drhd_unit(drhd) {
3026 if (!drhd->include_all) {
3027 int i;
3028 for (i = 0; i < drhd->devices_cnt; i++)
3029 if (drhd->devices[i] != NULL)
3030 break;
3031 /* ignore DMAR unit if no pci devices exist */
3032 if (i == drhd->devices_cnt)
3033 drhd->ignored = 1;
3034 }
3035 }
3036
3037 if (dmar_map_gfx)
3038 return;
3039
3040 for_each_drhd_unit(drhd) {
3041 int i;
3042 if (drhd->ignored || drhd->include_all)
3043 continue;
3044
3045 for (i = 0; i < drhd->devices_cnt; i++)
3046 if (drhd->devices[i] &&
3047 !IS_GFX_DEVICE(drhd->devices[i]))
3048 break;
3049
3050 if (i < drhd->devices_cnt)
3051 continue;
3052
3053 /* bypass IOMMU if it is just for gfx devices */
3054 drhd->ignored = 1;
3055 for (i = 0; i < drhd->devices_cnt; i++) {
3056 if (!drhd->devices[i])
3057 continue;
Keshavamurthy, Anil S358dd8a2007-10-21 16:41:59 -07003058 drhd->devices[i]->dev.archdata.iommu = DUMMY_DEVICE_DOMAIN_INFO;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003059 }
3060 }
3061}
3062
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003063#ifdef CONFIG_SUSPEND
3064static int init_iommu_hw(void)
3065{
3066 struct dmar_drhd_unit *drhd;
3067 struct intel_iommu *iommu = NULL;
3068
3069 for_each_active_iommu(iommu, drhd)
3070 if (iommu->qi)
3071 dmar_reenable_qi(iommu);
3072
3073 for_each_active_iommu(iommu, drhd) {
3074 iommu_flush_write_buffer(iommu);
3075
3076 iommu_set_root_entry(iommu);
3077
3078 iommu->flush.flush_context(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003079 DMA_CCMD_GLOBAL_INVL);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003080 iommu->flush.flush_iotlb(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003081 DMA_TLB_GLOBAL_FLUSH);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003082 iommu_enable_translation(iommu);
David Woodhouseb94996c2009-09-19 15:28:12 -07003083 iommu_disable_protect_mem_regions(iommu);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003084 }
3085
3086 return 0;
3087}
3088
3089static void iommu_flush_all(void)
3090{
3091 struct dmar_drhd_unit *drhd;
3092 struct intel_iommu *iommu;
3093
3094 for_each_active_iommu(iommu, drhd) {
3095 iommu->flush.flush_context(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003096 DMA_CCMD_GLOBAL_INVL);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003097 iommu->flush.flush_iotlb(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003098 DMA_TLB_GLOBAL_FLUSH);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003099 }
3100}
3101
3102static int iommu_suspend(struct sys_device *dev, pm_message_t state)
3103{
3104 struct dmar_drhd_unit *drhd;
3105 struct intel_iommu *iommu = NULL;
3106 unsigned long flag;
3107
3108 for_each_active_iommu(iommu, drhd) {
3109 iommu->iommu_state = kzalloc(sizeof(u32) * MAX_SR_DMAR_REGS,
3110 GFP_ATOMIC);
3111 if (!iommu->iommu_state)
3112 goto nomem;
3113 }
3114
3115 iommu_flush_all();
3116
3117 for_each_active_iommu(iommu, drhd) {
3118 iommu_disable_translation(iommu);
3119
3120 spin_lock_irqsave(&iommu->register_lock, flag);
3121
3122 iommu->iommu_state[SR_DMAR_FECTL_REG] =
3123 readl(iommu->reg + DMAR_FECTL_REG);
3124 iommu->iommu_state[SR_DMAR_FEDATA_REG] =
3125 readl(iommu->reg + DMAR_FEDATA_REG);
3126 iommu->iommu_state[SR_DMAR_FEADDR_REG] =
3127 readl(iommu->reg + DMAR_FEADDR_REG);
3128 iommu->iommu_state[SR_DMAR_FEUADDR_REG] =
3129 readl(iommu->reg + DMAR_FEUADDR_REG);
3130
3131 spin_unlock_irqrestore(&iommu->register_lock, flag);
3132 }
3133 return 0;
3134
3135nomem:
3136 for_each_active_iommu(iommu, drhd)
3137 kfree(iommu->iommu_state);
3138
3139 return -ENOMEM;
3140}
3141
3142static int iommu_resume(struct sys_device *dev)
3143{
3144 struct dmar_drhd_unit *drhd;
3145 struct intel_iommu *iommu = NULL;
3146 unsigned long flag;
3147
3148 if (init_iommu_hw()) {
3149 WARN(1, "IOMMU setup failed, DMAR can not resume!\n");
3150 return -EIO;
3151 }
3152
3153 for_each_active_iommu(iommu, drhd) {
3154
3155 spin_lock_irqsave(&iommu->register_lock, flag);
3156
3157 writel(iommu->iommu_state[SR_DMAR_FECTL_REG],
3158 iommu->reg + DMAR_FECTL_REG);
3159 writel(iommu->iommu_state[SR_DMAR_FEDATA_REG],
3160 iommu->reg + DMAR_FEDATA_REG);
3161 writel(iommu->iommu_state[SR_DMAR_FEADDR_REG],
3162 iommu->reg + DMAR_FEADDR_REG);
3163 writel(iommu->iommu_state[SR_DMAR_FEUADDR_REG],
3164 iommu->reg + DMAR_FEUADDR_REG);
3165
3166 spin_unlock_irqrestore(&iommu->register_lock, flag);
3167 }
3168
3169 for_each_active_iommu(iommu, drhd)
3170 kfree(iommu->iommu_state);
3171
3172 return 0;
3173}
3174
3175static struct sysdev_class iommu_sysclass = {
3176 .name = "iommu",
3177 .resume = iommu_resume,
3178 .suspend = iommu_suspend,
3179};
3180
3181static struct sys_device device_iommu = {
3182 .cls = &iommu_sysclass,
3183};
3184
3185static int __init init_iommu_sysfs(void)
3186{
3187 int error;
3188
3189 error = sysdev_class_register(&iommu_sysclass);
3190 if (error)
3191 return error;
3192
3193 error = sysdev_register(&device_iommu);
3194 if (error)
3195 sysdev_class_unregister(&iommu_sysclass);
3196
3197 return error;
3198}
3199
3200#else
3201static int __init init_iommu_sysfs(void)
3202{
3203 return 0;
3204}
3205#endif /* CONFIG_PM */
3206
Fenghua Yu99dcade2009-11-11 07:23:06 -08003207/*
3208 * Here we only respond to action of unbound device from driver.
3209 *
3210 * Added device is not attached to its DMAR domain here yet. That will happen
3211 * when mapping the device to iova.
3212 */
3213static int device_notifier(struct notifier_block *nb,
3214 unsigned long action, void *data)
3215{
3216 struct device *dev = data;
3217 struct pci_dev *pdev = to_pci_dev(dev);
3218 struct dmar_domain *domain;
3219
David Woodhouse44cd6132009-12-02 10:18:30 +00003220 if (iommu_no_mapping(dev))
3221 return 0;
3222
Fenghua Yu99dcade2009-11-11 07:23:06 -08003223 domain = find_domain(pdev);
3224 if (!domain)
3225 return 0;
3226
3227 if (action == BUS_NOTIFY_UNBOUND_DRIVER && !iommu_pass_through)
3228 domain_remove_one_dev_info(domain, pdev);
3229
3230 return 0;
3231}
3232
3233static struct notifier_block device_nb = {
3234 .notifier_call = device_notifier,
3235};
3236
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003237int __init intel_iommu_init(void)
3238{
3239 int ret = 0;
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07003240 int force_on = 0;
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003241
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07003242 /* VT-d is required for a TXT/tboot launch, so enforce that */
3243 force_on = tboot_force_iommu();
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003244
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07003245 if (dmar_table_init()) {
3246 if (force_on)
3247 panic("tboot: Failed to initialize DMAR table\n");
Suresh Siddha1886e8a2008-07-10 11:16:37 -07003248 return -ENODEV;
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07003249 }
3250
3251 if (dmar_dev_scope_init()) {
3252 if (force_on)
3253 panic("tboot: Failed to initialize DMAR device scope\n");
3254 return -ENODEV;
3255 }
Suresh Siddha1886e8a2008-07-10 11:16:37 -07003256
Suresh Siddha2ae21012008-07-10 11:16:43 -07003257 /*
3258 * Check the need for DMA-remapping initialization now.
3259 * Above initialization will also be used by Interrupt-remapping.
3260 */
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +09003261 if (no_iommu || dmar_disabled)
Suresh Siddha2ae21012008-07-10 11:16:43 -07003262 return -ENODEV;
3263
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003264 iommu_init_mempool();
3265 dmar_init_reserved_ranges();
3266
3267 init_no_remapping_devices();
3268
3269 ret = init_dmars();
3270 if (ret) {
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07003271 if (force_on)
3272 panic("tboot: Failed to initialize DMARs\n");
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003273 printk(KERN_ERR "IOMMU: dmar init failed\n");
3274 put_iova_domain(&reserved_iova_list);
3275 iommu_exit_mempool();
3276 return ret;
3277 }
3278 printk(KERN_INFO
3279 "PCI-DMA: Intel(R) Virtualization Technology for Directed I/O\n");
3280
mark gross5e0d2a62008-03-04 15:22:08 -08003281 init_timer(&unmap_timer);
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +09003282#ifdef CONFIG_SWIOTLB
3283 swiotlb = 0;
3284#endif
David Woodhouse19943b02009-08-04 16:19:20 +01003285 dma_ops = &intel_dma_ops;
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003286
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003287 init_iommu_sysfs();
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01003288
3289 register_iommu(&intel_iommu_ops);
3290
Fenghua Yu99dcade2009-11-11 07:23:06 -08003291 bus_register_notifier(&pci_bus_type, &device_nb);
3292
Keshavamurthy, Anil Sba395922007-10-21 16:41:49 -07003293 return 0;
3294}
Keshavamurthy, Anil Se8204822007-10-21 16:41:55 -07003295
Han, Weidong3199aa62009-02-26 17:31:12 +08003296static void iommu_detach_dependent_devices(struct intel_iommu *iommu,
3297 struct pci_dev *pdev)
3298{
3299 struct pci_dev *tmp, *parent;
3300
3301 if (!iommu || !pdev)
3302 return;
3303
3304 /* dependent device detach */
3305 tmp = pci_find_upstream_pcie_bridge(pdev);
3306 /* Secondary interface's bus number and devfn 0 */
3307 if (tmp) {
3308 parent = pdev->bus->self;
3309 while (parent != tmp) {
3310 iommu_detach_dev(iommu, parent->bus->number,
David Woodhouse276dbf992009-04-04 01:45:37 +01003311 parent->devfn);
Han, Weidong3199aa62009-02-26 17:31:12 +08003312 parent = parent->bus->self;
3313 }
Stefan Assmann45e829e2009-12-03 06:49:24 -05003314 if (pci_is_pcie(tmp)) /* this is a PCIe-to-PCI bridge */
Han, Weidong3199aa62009-02-26 17:31:12 +08003315 iommu_detach_dev(iommu,
3316 tmp->subordinate->number, 0);
3317 else /* this is a legacy PCI bridge */
David Woodhouse276dbf992009-04-04 01:45:37 +01003318 iommu_detach_dev(iommu, tmp->bus->number,
3319 tmp->devfn);
Han, Weidong3199aa62009-02-26 17:31:12 +08003320 }
3321}
3322
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003323static void domain_remove_one_dev_info(struct dmar_domain *domain,
Weidong Hanc7151a82008-12-08 22:51:37 +08003324 struct pci_dev *pdev)
3325{
3326 struct device_domain_info *info;
3327 struct intel_iommu *iommu;
3328 unsigned long flags;
3329 int found = 0;
3330 struct list_head *entry, *tmp;
3331
David Woodhouse276dbf992009-04-04 01:45:37 +01003332 iommu = device_to_iommu(pci_domain_nr(pdev->bus), pdev->bus->number,
3333 pdev->devfn);
Weidong Hanc7151a82008-12-08 22:51:37 +08003334 if (!iommu)
3335 return;
3336
3337 spin_lock_irqsave(&device_domain_lock, flags);
3338 list_for_each_safe(entry, tmp, &domain->devices) {
3339 info = list_entry(entry, struct device_domain_info, link);
David Woodhouse276dbf992009-04-04 01:45:37 +01003340 /* No need to compare PCI domain; it has to be the same */
Weidong Hanc7151a82008-12-08 22:51:37 +08003341 if (info->bus == pdev->bus->number &&
3342 info->devfn == pdev->devfn) {
3343 list_del(&info->link);
3344 list_del(&info->global);
3345 if (info->dev)
3346 info->dev->dev.archdata.iommu = NULL;
3347 spin_unlock_irqrestore(&device_domain_lock, flags);
3348
Yu Zhao93a23a72009-05-18 13:51:37 +08003349 iommu_disable_dev_iotlb(info);
Weidong Hanc7151a82008-12-08 22:51:37 +08003350 iommu_detach_dev(iommu, info->bus, info->devfn);
Han, Weidong3199aa62009-02-26 17:31:12 +08003351 iommu_detach_dependent_devices(iommu, pdev);
Weidong Hanc7151a82008-12-08 22:51:37 +08003352 free_devinfo_mem(info);
3353
3354 spin_lock_irqsave(&device_domain_lock, flags);
3355
3356 if (found)
3357 break;
3358 else
3359 continue;
3360 }
3361
3362 /* if there is no other devices under the same iommu
3363 * owned by this domain, clear this iommu in iommu_bmp
3364 * update iommu count and coherency
3365 */
David Woodhouse276dbf992009-04-04 01:45:37 +01003366 if (iommu == device_to_iommu(info->segment, info->bus,
3367 info->devfn))
Weidong Hanc7151a82008-12-08 22:51:37 +08003368 found = 1;
3369 }
3370
3371 if (found == 0) {
3372 unsigned long tmp_flags;
3373 spin_lock_irqsave(&domain->iommu_lock, tmp_flags);
3374 clear_bit(iommu->seq_id, &domain->iommu_bmp);
3375 domain->iommu_count--;
Sheng Yang58c610b2009-03-18 15:33:05 +08003376 domain_update_iommu_cap(domain);
Weidong Hanc7151a82008-12-08 22:51:37 +08003377 spin_unlock_irqrestore(&domain->iommu_lock, tmp_flags);
3378 }
3379
3380 spin_unlock_irqrestore(&device_domain_lock, flags);
3381}
3382
3383static void vm_domain_remove_all_dev_info(struct dmar_domain *domain)
3384{
3385 struct device_domain_info *info;
3386 struct intel_iommu *iommu;
3387 unsigned long flags1, flags2;
3388
3389 spin_lock_irqsave(&device_domain_lock, flags1);
3390 while (!list_empty(&domain->devices)) {
3391 info = list_entry(domain->devices.next,
3392 struct device_domain_info, link);
3393 list_del(&info->link);
3394 list_del(&info->global);
3395 if (info->dev)
3396 info->dev->dev.archdata.iommu = NULL;
3397
3398 spin_unlock_irqrestore(&device_domain_lock, flags1);
3399
Yu Zhao93a23a72009-05-18 13:51:37 +08003400 iommu_disable_dev_iotlb(info);
David Woodhouse276dbf992009-04-04 01:45:37 +01003401 iommu = device_to_iommu(info->segment, info->bus, info->devfn);
Weidong Hanc7151a82008-12-08 22:51:37 +08003402 iommu_detach_dev(iommu, info->bus, info->devfn);
Han, Weidong3199aa62009-02-26 17:31:12 +08003403 iommu_detach_dependent_devices(iommu, info->dev);
Weidong Hanc7151a82008-12-08 22:51:37 +08003404
3405 /* clear this iommu in iommu_bmp, update iommu count
Sheng Yang58c610b2009-03-18 15:33:05 +08003406 * and capabilities
Weidong Hanc7151a82008-12-08 22:51:37 +08003407 */
3408 spin_lock_irqsave(&domain->iommu_lock, flags2);
3409 if (test_and_clear_bit(iommu->seq_id,
3410 &domain->iommu_bmp)) {
3411 domain->iommu_count--;
Sheng Yang58c610b2009-03-18 15:33:05 +08003412 domain_update_iommu_cap(domain);
Weidong Hanc7151a82008-12-08 22:51:37 +08003413 }
3414 spin_unlock_irqrestore(&domain->iommu_lock, flags2);
3415
3416 free_devinfo_mem(info);
3417 spin_lock_irqsave(&device_domain_lock, flags1);
3418 }
3419 spin_unlock_irqrestore(&device_domain_lock, flags1);
3420}
3421
Weidong Han5e98c4b2008-12-08 23:03:27 +08003422/* domain id for virtual machine, it won't be set in context */
3423static unsigned long vm_domid;
3424
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003425static int vm_domain_min_agaw(struct dmar_domain *domain)
3426{
3427 int i;
3428 int min_agaw = domain->agaw;
3429
Akinobu Mitaa45946a2010-03-11 14:04:08 -08003430 for_each_set_bit(i, &domain->iommu_bmp, g_num_of_iommus) {
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003431 if (min_agaw > g_iommus[i]->agaw)
3432 min_agaw = g_iommus[i]->agaw;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003433 }
3434
3435 return min_agaw;
3436}
3437
Weidong Han5e98c4b2008-12-08 23:03:27 +08003438static struct dmar_domain *iommu_alloc_vm_domain(void)
3439{
3440 struct dmar_domain *domain;
3441
3442 domain = alloc_domain_mem();
3443 if (!domain)
3444 return NULL;
3445
3446 domain->id = vm_domid++;
Suresh Siddha4c923d42009-10-02 11:01:24 -07003447 domain->nid = -1;
Weidong Han5e98c4b2008-12-08 23:03:27 +08003448 memset(&domain->iommu_bmp, 0, sizeof(unsigned long));
3449 domain->flags = DOMAIN_FLAG_VIRTUAL_MACHINE;
3450
3451 return domain;
3452}
3453
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003454static int md_domain_init(struct dmar_domain *domain, int guest_width)
Weidong Han5e98c4b2008-12-08 23:03:27 +08003455{
3456 int adjust_width;
3457
3458 init_iova_domain(&domain->iovad, DMA_32BIT_PFN);
Weidong Han5e98c4b2008-12-08 23:03:27 +08003459 spin_lock_init(&domain->iommu_lock);
3460
3461 domain_reserve_special_ranges(domain);
3462
3463 /* calculate AGAW */
3464 domain->gaw = guest_width;
3465 adjust_width = guestwidth_to_adjustwidth(guest_width);
3466 domain->agaw = width_to_agaw(adjust_width);
3467
3468 INIT_LIST_HEAD(&domain->devices);
3469
3470 domain->iommu_count = 0;
3471 domain->iommu_coherency = 0;
Sheng Yangc5b15252009-08-06 13:31:56 +08003472 domain->iommu_snooping = 0;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003473 domain->max_addr = 0;
Suresh Siddha4c923d42009-10-02 11:01:24 -07003474 domain->nid = -1;
Weidong Han5e98c4b2008-12-08 23:03:27 +08003475
3476 /* always allocate the top pgd */
Suresh Siddha4c923d42009-10-02 11:01:24 -07003477 domain->pgd = (struct dma_pte *)alloc_pgtable_page(domain->nid);
Weidong Han5e98c4b2008-12-08 23:03:27 +08003478 if (!domain->pgd)
3479 return -ENOMEM;
3480 domain_flush_cache(domain, domain->pgd, PAGE_SIZE);
3481 return 0;
3482}
3483
3484static void iommu_free_vm_domain(struct dmar_domain *domain)
3485{
3486 unsigned long flags;
3487 struct dmar_drhd_unit *drhd;
3488 struct intel_iommu *iommu;
3489 unsigned long i;
3490 unsigned long ndomains;
3491
3492 for_each_drhd_unit(drhd) {
3493 if (drhd->ignored)
3494 continue;
3495 iommu = drhd->iommu;
3496
3497 ndomains = cap_ndoms(iommu->cap);
Akinobu Mitaa45946a2010-03-11 14:04:08 -08003498 for_each_set_bit(i, iommu->domain_ids, ndomains) {
Weidong Han5e98c4b2008-12-08 23:03:27 +08003499 if (iommu->domains[i] == domain) {
3500 spin_lock_irqsave(&iommu->lock, flags);
3501 clear_bit(i, iommu->domain_ids);
3502 iommu->domains[i] = NULL;
3503 spin_unlock_irqrestore(&iommu->lock, flags);
3504 break;
3505 }
Weidong Han5e98c4b2008-12-08 23:03:27 +08003506 }
3507 }
3508}
3509
3510static void vm_domain_exit(struct dmar_domain *domain)
3511{
Weidong Han5e98c4b2008-12-08 23:03:27 +08003512 /* Domain 0 is reserved, so dont process it */
3513 if (!domain)
3514 return;
3515
3516 vm_domain_remove_all_dev_info(domain);
3517 /* destroy iovas */
3518 put_iova_domain(&domain->iovad);
Weidong Han5e98c4b2008-12-08 23:03:27 +08003519
3520 /* clear ptes */
David Woodhouse595badf52009-06-27 22:09:11 +01003521 dma_pte_clear_range(domain, 0, DOMAIN_MAX_PFN(domain->gaw));
Weidong Han5e98c4b2008-12-08 23:03:27 +08003522
3523 /* free page tables */
David Woodhoused794dc92009-06-28 00:27:49 +01003524 dma_pte_free_pagetable(domain, 0, DOMAIN_MAX_PFN(domain->gaw));
Weidong Han5e98c4b2008-12-08 23:03:27 +08003525
3526 iommu_free_vm_domain(domain);
3527 free_domain_mem(domain);
3528}
3529
Joerg Roedel5d450802008-12-03 14:52:32 +01003530static int intel_iommu_domain_init(struct iommu_domain *domain)
Kay, Allen M38717942008-09-09 18:37:29 +03003531{
Joerg Roedel5d450802008-12-03 14:52:32 +01003532 struct dmar_domain *dmar_domain;
Kay, Allen M38717942008-09-09 18:37:29 +03003533
Joerg Roedel5d450802008-12-03 14:52:32 +01003534 dmar_domain = iommu_alloc_vm_domain();
3535 if (!dmar_domain) {
Kay, Allen M38717942008-09-09 18:37:29 +03003536 printk(KERN_ERR
Joerg Roedel5d450802008-12-03 14:52:32 +01003537 "intel_iommu_domain_init: dmar_domain == NULL\n");
3538 return -ENOMEM;
Kay, Allen M38717942008-09-09 18:37:29 +03003539 }
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003540 if (md_domain_init(dmar_domain, DEFAULT_DOMAIN_ADDRESS_WIDTH)) {
Kay, Allen M38717942008-09-09 18:37:29 +03003541 printk(KERN_ERR
Joerg Roedel5d450802008-12-03 14:52:32 +01003542 "intel_iommu_domain_init() failed\n");
3543 vm_domain_exit(dmar_domain);
3544 return -ENOMEM;
Kay, Allen M38717942008-09-09 18:37:29 +03003545 }
Joerg Roedel5d450802008-12-03 14:52:32 +01003546 domain->priv = dmar_domain;
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003547
Joerg Roedel5d450802008-12-03 14:52:32 +01003548 return 0;
Kay, Allen M38717942008-09-09 18:37:29 +03003549}
Kay, Allen M38717942008-09-09 18:37:29 +03003550
Joerg Roedel5d450802008-12-03 14:52:32 +01003551static void intel_iommu_domain_destroy(struct iommu_domain *domain)
Kay, Allen M38717942008-09-09 18:37:29 +03003552{
Joerg Roedel5d450802008-12-03 14:52:32 +01003553 struct dmar_domain *dmar_domain = domain->priv;
3554
3555 domain->priv = NULL;
3556 vm_domain_exit(dmar_domain);
Kay, Allen M38717942008-09-09 18:37:29 +03003557}
Kay, Allen M38717942008-09-09 18:37:29 +03003558
Joerg Roedel4c5478c2008-12-03 14:58:24 +01003559static int intel_iommu_attach_device(struct iommu_domain *domain,
3560 struct device *dev)
Kay, Allen M38717942008-09-09 18:37:29 +03003561{
Joerg Roedel4c5478c2008-12-03 14:58:24 +01003562 struct dmar_domain *dmar_domain = domain->priv;
3563 struct pci_dev *pdev = to_pci_dev(dev);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003564 struct intel_iommu *iommu;
3565 int addr_width;
3566 u64 end;
Kay, Allen M38717942008-09-09 18:37:29 +03003567
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003568 /* normally pdev is not mapped */
3569 if (unlikely(domain_context_mapped(pdev))) {
3570 struct dmar_domain *old_domain;
3571
3572 old_domain = find_domain(pdev);
3573 if (old_domain) {
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003574 if (dmar_domain->flags & DOMAIN_FLAG_VIRTUAL_MACHINE ||
3575 dmar_domain->flags & DOMAIN_FLAG_STATIC_IDENTITY)
3576 domain_remove_one_dev_info(old_domain, pdev);
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003577 else
3578 domain_remove_dev_info(old_domain);
3579 }
3580 }
3581
David Woodhouse276dbf992009-04-04 01:45:37 +01003582 iommu = device_to_iommu(pci_domain_nr(pdev->bus), pdev->bus->number,
3583 pdev->devfn);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003584 if (!iommu)
3585 return -ENODEV;
3586
3587 /* check if this iommu agaw is sufficient for max mapped address */
3588 addr_width = agaw_to_width(iommu->agaw);
3589 end = DOMAIN_MAX_ADDR(addr_width);
3590 end = end & VTD_PAGE_MASK;
Joerg Roedel4c5478c2008-12-03 14:58:24 +01003591 if (end < dmar_domain->max_addr) {
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003592 printk(KERN_ERR "%s: iommu agaw (%d) is not "
3593 "sufficient for the mapped address (%llx)\n",
Joerg Roedel4c5478c2008-12-03 14:58:24 +01003594 __func__, iommu->agaw, dmar_domain->max_addr);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003595 return -EFAULT;
3596 }
3597
David Woodhouse5fe60f42009-08-09 10:53:41 +01003598 return domain_add_dev_info(dmar_domain, pdev, CONTEXT_TT_MULTI_LEVEL);
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003599}
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003600
Joerg Roedel4c5478c2008-12-03 14:58:24 +01003601static void intel_iommu_detach_device(struct iommu_domain *domain,
3602 struct device *dev)
Kay, Allen M38717942008-09-09 18:37:29 +03003603{
Joerg Roedel4c5478c2008-12-03 14:58:24 +01003604 struct dmar_domain *dmar_domain = domain->priv;
3605 struct pci_dev *pdev = to_pci_dev(dev);
3606
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003607 domain_remove_one_dev_info(dmar_domain, pdev);
Kay, Allen M38717942008-09-09 18:37:29 +03003608}
Kay, Allen M38717942008-09-09 18:37:29 +03003609
Joerg Roedeldde57a22008-12-03 15:04:09 +01003610static int intel_iommu_map_range(struct iommu_domain *domain,
3611 unsigned long iova, phys_addr_t hpa,
3612 size_t size, int iommu_prot)
Kay, Allen M38717942008-09-09 18:37:29 +03003613{
Joerg Roedeldde57a22008-12-03 15:04:09 +01003614 struct dmar_domain *dmar_domain = domain->priv;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003615 u64 max_addr;
3616 int addr_width;
Joerg Roedeldde57a22008-12-03 15:04:09 +01003617 int prot = 0;
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003618 int ret;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003619
Joerg Roedeldde57a22008-12-03 15:04:09 +01003620 if (iommu_prot & IOMMU_READ)
3621 prot |= DMA_PTE_READ;
3622 if (iommu_prot & IOMMU_WRITE)
3623 prot |= DMA_PTE_WRITE;
Sheng Yang9cf06692009-03-18 15:33:07 +08003624 if ((iommu_prot & IOMMU_CACHE) && dmar_domain->iommu_snooping)
3625 prot |= DMA_PTE_SNP;
Joerg Roedeldde57a22008-12-03 15:04:09 +01003626
David Woodhouse163cc522009-06-28 00:51:17 +01003627 max_addr = iova + size;
Joerg Roedeldde57a22008-12-03 15:04:09 +01003628 if (dmar_domain->max_addr < max_addr) {
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003629 int min_agaw;
3630 u64 end;
3631
3632 /* check if minimum agaw is sufficient for mapped address */
Joerg Roedeldde57a22008-12-03 15:04:09 +01003633 min_agaw = vm_domain_min_agaw(dmar_domain);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003634 addr_width = agaw_to_width(min_agaw);
3635 end = DOMAIN_MAX_ADDR(addr_width);
3636 end = end & VTD_PAGE_MASK;
3637 if (end < max_addr) {
3638 printk(KERN_ERR "%s: iommu agaw (%d) is not "
3639 "sufficient for the mapped address (%llx)\n",
3640 __func__, min_agaw, max_addr);
3641 return -EFAULT;
3642 }
Joerg Roedeldde57a22008-12-03 15:04:09 +01003643 dmar_domain->max_addr = max_addr;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003644 }
David Woodhousead051222009-06-28 14:22:28 +01003645 /* Round up size to next multiple of PAGE_SIZE, if it and
3646 the low bits of hpa would take us onto the next page */
David Woodhouse88cb6a72009-06-28 15:03:06 +01003647 size = aligned_nrpages(hpa, size);
David Woodhousead051222009-06-28 14:22:28 +01003648 ret = domain_pfn_mapping(dmar_domain, iova >> VTD_PAGE_SHIFT,
3649 hpa >> VTD_PAGE_SHIFT, size, prot);
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003650 return ret;
Kay, Allen M38717942008-09-09 18:37:29 +03003651}
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003652
Joerg Roedeldde57a22008-12-03 15:04:09 +01003653static void intel_iommu_unmap_range(struct iommu_domain *domain,
3654 unsigned long iova, size_t size)
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003655{
Joerg Roedeldde57a22008-12-03 15:04:09 +01003656 struct dmar_domain *dmar_domain = domain->priv;
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003657
Sheng Yang4b99d352009-07-08 11:52:52 +01003658 if (!size)
3659 return;
3660
David Woodhouse163cc522009-06-28 00:51:17 +01003661 dma_pte_clear_range(dmar_domain, iova >> VTD_PAGE_SHIFT,
3662 (iova + size - 1) >> VTD_PAGE_SHIFT);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08003663
David Woodhouse163cc522009-06-28 00:51:17 +01003664 if (dmar_domain->max_addr == iova + size)
3665 dmar_domain->max_addr = iova;
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003666}
Kay, Allen M38717942008-09-09 18:37:29 +03003667
Joerg Roedeld14d6572008-12-03 15:06:57 +01003668static phys_addr_t intel_iommu_iova_to_phys(struct iommu_domain *domain,
3669 unsigned long iova)
Kay, Allen M38717942008-09-09 18:37:29 +03003670{
Joerg Roedeld14d6572008-12-03 15:06:57 +01003671 struct dmar_domain *dmar_domain = domain->priv;
Kay, Allen M38717942008-09-09 18:37:29 +03003672 struct dma_pte *pte;
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003673 u64 phys = 0;
Kay, Allen M38717942008-09-09 18:37:29 +03003674
David Woodhouseb026fd22009-06-28 10:37:25 +01003675 pte = pfn_to_dma_pte(dmar_domain, iova >> VTD_PAGE_SHIFT);
Kay, Allen M38717942008-09-09 18:37:29 +03003676 if (pte)
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003677 phys = dma_pte_addr(pte);
Kay, Allen M38717942008-09-09 18:37:29 +03003678
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08003679 return phys;
Kay, Allen M38717942008-09-09 18:37:29 +03003680}
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01003681
Sheng Yangdbb9fd82009-03-18 15:33:06 +08003682static int intel_iommu_domain_has_cap(struct iommu_domain *domain,
3683 unsigned long cap)
3684{
3685 struct dmar_domain *dmar_domain = domain->priv;
3686
3687 if (cap == IOMMU_CAP_CACHE_COHERENCY)
3688 return dmar_domain->iommu_snooping;
3689
3690 return 0;
3691}
3692
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01003693static struct iommu_ops intel_iommu_ops = {
3694 .domain_init = intel_iommu_domain_init,
3695 .domain_destroy = intel_iommu_domain_destroy,
3696 .attach_dev = intel_iommu_attach_device,
3697 .detach_dev = intel_iommu_detach_device,
3698 .map = intel_iommu_map_range,
3699 .unmap = intel_iommu_unmap_range,
3700 .iova_to_phys = intel_iommu_iova_to_phys,
Sheng Yangdbb9fd82009-03-18 15:33:06 +08003701 .domain_has_cap = intel_iommu_domain_has_cap,
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01003702};
David Woodhouse9af88142009-02-13 23:18:03 +00003703
3704static void __devinit quirk_iommu_rwbf(struct pci_dev *dev)
3705{
3706 /*
3707 * Mobile 4 Series Chipset neglects to set RWBF capability,
3708 * but needs it:
3709 */
3710 printk(KERN_INFO "DMAR: Forcing write-buffer flush capability\n");
3711 rwbf_quirk = 1;
3712}
3713
3714DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2a40, quirk_iommu_rwbf);
David Woodhousee0fc7e02009-09-30 09:12:17 -07003715
3716/* On Tylersburg chipsets, some BIOSes have been known to enable the
3717 ISOCH DMAR unit for the Azalia sound device, but not give it any
3718 TLB entries, which causes it to deadlock. Check for that. We do
3719 this in a function called from init_dmars(), instead of in a PCI
3720 quirk, because we don't want to print the obnoxious "BIOS broken"
3721 message if VT-d is actually disabled.
3722*/
3723static void __init check_tylersburg_isoch(void)
3724{
3725 struct pci_dev *pdev;
3726 uint32_t vtisochctrl;
3727
3728 /* If there's no Azalia in the system anyway, forget it. */
3729 pdev = pci_get_device(PCI_VENDOR_ID_INTEL, 0x3a3e, NULL);
3730 if (!pdev)
3731 return;
3732 pci_dev_put(pdev);
3733
3734 /* System Management Registers. Might be hidden, in which case
3735 we can't do the sanity check. But that's OK, because the
3736 known-broken BIOSes _don't_ actually hide it, so far. */
3737 pdev = pci_get_device(PCI_VENDOR_ID_INTEL, 0x342e, NULL);
3738 if (!pdev)
3739 return;
3740
3741 if (pci_read_config_dword(pdev, 0x188, &vtisochctrl)) {
3742 pci_dev_put(pdev);
3743 return;
3744 }
3745
3746 pci_dev_put(pdev);
3747
3748 /* If Azalia DMA is routed to the non-isoch DMAR unit, fine. */
3749 if (vtisochctrl & 1)
3750 return;
3751
3752 /* Drop all bits other than the number of TLB entries */
3753 vtisochctrl &= 0x1c;
3754
3755 /* If we have the recommended number of TLB entries (16), fine. */
3756 if (vtisochctrl == 0x10)
3757 return;
3758
3759 /* Zero TLB entries? You get to ride the short bus to school. */
3760 if (!vtisochctrl) {
3761 WARN(1, "Your BIOS is broken; DMA routed to ISOCH DMAR unit but no TLB space.\n"
3762 "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
3763 dmi_get_system_info(DMI_BIOS_VENDOR),
3764 dmi_get_system_info(DMI_BIOS_VERSION),
3765 dmi_get_system_info(DMI_PRODUCT_VERSION));
3766 iommu_identity_mapping |= IDENTMAP_AZALIA;
3767 return;
3768 }
3769
3770 printk(KERN_WARNING "DMAR: Recommended TLB entries for ISOCH unit is 16; your BIOS set %d\n",
3771 vtisochctrl);
3772}