/*
 * Copyright © 2006-2014 Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * Authors: David Woodhouse <dwmw2@infradead.org>,
 *          Ashok Raj <ashok.raj@intel.com>,
 *          Shaohua Li <shaohua.li@intel.com>,
 *          Anil S Keshavamurthy <anil.s.keshavamurthy@intel.com>,
 *          Fenghua Yu <fenghua.yu@intel.com>
 *          Joerg Roedel <jroedel@suse.de>
 */

#define pr_fmt(fmt)     "DMAR: " fmt

#include <linux/init.h>
#include <linux/bitmap.h>
#include <linux/debugfs.h>
#include <linux/export.h>
#include <linux/slab.h>
#include <linux/irq.h>
#include <linux/interrupt.h>
#include <linux/spinlock.h>
#include <linux/pci.h>
#include <linux/dmar.h>
#include <linux/dma-mapping.h>
#include <linux/mempool.h>
#include <linux/memory.h>
#include <linux/timer.h>
#include <linux/iova.h>
#include <linux/iommu.h>
#include <linux/intel-iommu.h>
#include <linux/syscore_ops.h>
#include <linux/tboot.h>
#include <linux/dmi.h>
#include <linux/pci-ats.h>
#include <linux/memblock.h>
#include <linux/dma-contiguous.h>
#include <linux/crash_dump.h>
#include <asm/irq_remapping.h>
#include <asm/cacheflush.h>
#include <asm/iommu.h>

#include "irq_remapping.h"

#define ROOT_SIZE               VTD_PAGE_SIZE
#define CONTEXT_SIZE            VTD_PAGE_SIZE

#define IS_GFX_DEVICE(pdev) ((pdev->class >> 16) == PCI_BASE_CLASS_DISPLAY)
#define IS_USB_DEVICE(pdev) ((pdev->class >> 8) == PCI_CLASS_SERIAL_USB)
#define IS_ISA_DEVICE(pdev) ((pdev->class >> 8) == PCI_CLASS_BRIDGE_ISA)
#define IS_AZALIA(pdev) ((pdev)->vendor == 0x8086 && (pdev)->device == 0x3a3e)

#define IOAPIC_RANGE_START      (0xfee00000)
#define IOAPIC_RANGE_END        (0xfeefffff)
#define IOVA_START_ADDR         (0x1000)

#define DEFAULT_DOMAIN_ADDRESS_WIDTH 48

#define MAX_AGAW_WIDTH 64
#define MAX_AGAW_PFN_WIDTH      (MAX_AGAW_WIDTH - VTD_PAGE_SHIFT)

#define __DOMAIN_MAX_PFN(gaw)  ((((uint64_t)1) << (gaw-VTD_PAGE_SHIFT)) - 1)
#define __DOMAIN_MAX_ADDR(gaw) ((((uint64_t)1) << gaw) - 1)

/* We limit DOMAIN_MAX_PFN to fit in an unsigned long, and DOMAIN_MAX_ADDR
   to match. That way, we can use 'unsigned long' for PFNs with impunity. */
#define DOMAIN_MAX_PFN(gaw)     ((unsigned long) min_t(uint64_t, \
                                __DOMAIN_MAX_PFN(gaw), (unsigned long)-1))
#define DOMAIN_MAX_ADDR(gaw)    (((uint64_t)__DOMAIN_MAX_PFN(gaw)) << VTD_PAGE_SHIFT)

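/*
 * Worked example (illustrative, not part of the original source): with
 * the default 48-bit guest address width, __DOMAIN_MAX_PFN(48) is
 * (1ULL << 36) - 1 == 0xfffffffff. That fits in an unsigned long on
 * 64-bit builds, so DOMAIN_MAX_PFN(48) keeps the full value and
 * DOMAIN_MAX_ADDR(48) is 0xfffffffff000, the address of the last 4KiB
 * page. On 32-bit builds the min_t() clamps the PFN to ULONG_MAX.
 */
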
/* IO virtual address start page frame number */
#define IOVA_START_PFN          (1)

#define IOVA_PFN(addr)          ((addr) >> PAGE_SHIFT)
#define DMA_32BIT_PFN           IOVA_PFN(DMA_BIT_MASK(32))
#define DMA_64BIT_PFN           IOVA_PFN(DMA_BIT_MASK(64))

/* page table handling */
#define LEVEL_STRIDE            (9)
#define LEVEL_MASK              (((u64)1 << LEVEL_STRIDE) - 1)

/*
 * This bitmap is used to advertise the page sizes our hardware supports
 * to the IOMMU core, which will then use this information to split
 * physically contiguous memory regions it is mapping into page sizes
 * that we support.
 *
 * Traditionally the IOMMU core just handed us the mappings directly,
 * after making sure the size was an order (power of two) of 4KiB and
 * that the mapping had natural alignment.
 *
 * To retain this behavior, we currently advertise that we support
 * all page sizes that are an order of 4KiB.
 *
 * If at some point we'd like to utilize the IOMMU core's new behavior,
 * we could change this to advertise the real page sizes we support.
 */
#define INTEL_IOMMU_PGSIZES     (~0xFFFUL)

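/*
 * Illustrative note: ~0xFFFUL has every bit from 12 upwards set, so
 * the IOMMU core sees 4KiB, 8KiB, 16KiB, ... every power-of-two size
 * from 2^12 up as "supported" and can hand us any naturally aligned,
 * order-of-4KiB mapping unchanged, preserving the traditional
 * behavior described above.
 */
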
static inline int agaw_to_level(int agaw)
{
        return agaw + 2;
}

static inline int agaw_to_width(int agaw)
{
        return min_t(int, 30 + agaw * LEVEL_STRIDE, MAX_AGAW_WIDTH);
}

static inline int width_to_agaw(int width)
{
        return DIV_ROUND_UP(width - 30, LEVEL_STRIDE);
}

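/*
 * Worked example: AGAW 2 encodes a 4-level page table
 * (agaw_to_level(2) == 4) covering 30 + 2 * 9 == 48 bits of address
 * space, and width_to_agaw(48) == DIV_ROUND_UP(18, 9) == 2
 * round-trips back; each additional level adds LEVEL_STRIDE (9) bits.
 */
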
static inline unsigned int level_to_offset_bits(int level)
{
        return (level - 1) * LEVEL_STRIDE;
}

static inline int pfn_level_offset(unsigned long pfn, int level)
{
        return (pfn >> level_to_offset_bits(level)) & LEVEL_MASK;
}

static inline unsigned long level_mask(int level)
{
        return -1UL << level_to_offset_bits(level);
}

static inline unsigned long level_size(int level)
{
        return 1UL << level_to_offset_bits(level);
}

static inline unsigned long align_to_level(unsigned long pfn, int level)
{
        return (pfn + level_size(level) - 1) & level_mask(level);
}

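/*
 * Worked example: for level 2, level_to_offset_bits() is 9, so
 * pfn_level_offset(0x12345, 2) == (0x12345 >> 9) & 0x1ff == 0x91,
 * level_size(2) == 512 PFNs, and align_to_level(0x12345, 2) rounds
 * up to 0x12400, the next 512-page boundary.
 */
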
static inline unsigned long lvl_to_nr_pages(unsigned int lvl)
{
        return 1 << min_t(int, (lvl - 1) * LEVEL_STRIDE, MAX_AGAW_PFN_WIDTH);
}

/* VT-d pages must always be _smaller_ than MM pages. Otherwise things
   are never going to work. */
static inline unsigned long dma_to_mm_pfn(unsigned long dma_pfn)
{
        return dma_pfn >> (PAGE_SHIFT - VTD_PAGE_SHIFT);
}

static inline unsigned long mm_to_dma_pfn(unsigned long mm_pfn)
{
        return mm_pfn << (PAGE_SHIFT - VTD_PAGE_SHIFT);
}
static inline unsigned long page_to_dma_pfn(struct page *pg)
{
        return mm_to_dma_pfn(page_to_pfn(pg));
}
static inline unsigned long virt_to_dma_pfn(void *p)
{
        return page_to_dma_pfn(virt_to_page(p));
}

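/*
 * Illustrative note: with the usual 4KiB kernel pages, PAGE_SHIFT ==
 * VTD_PAGE_SHIFT == 12 and these conversions are identities. On a
 * hypothetical 64KiB-page kernel they would scale by 16, e.g.
 * mm_to_dma_pfn(3) == 48, since one MM page spans sixteen VT-d pages.
 */
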
/* global iommu list, set NULL for ignored DMAR units */
static struct intel_iommu **g_iommus;

static void __init check_tylersburg_isoch(void);
static int rwbf_quirk;

/*
 * set to 1 to panic the kernel if VT-d cannot be enabled successfully
 * (used when the kernel is launched w/ TXT)
 */
static int force_on = 0;

/*
 * 0: Present
 * 1-11: Reserved
 * 12-63: Context Ptr (12 - (haw-1))
 * 64-127: Reserved
 */
struct root_entry {
        u64     lo;
        u64     hi;
};
#define ROOT_ENTRY_NR (VTD_PAGE_SIZE/sizeof(struct root_entry))

/*
 * Take a root_entry and return the Lower Context Table Pointer (LCTP)
 * if marked present.
 */
static phys_addr_t root_entry_lctp(struct root_entry *re)
{
        if (!(re->lo & 1))
                return 0;

        return re->lo & VTD_PAGE_MASK;
}

/*
 * Take a root_entry and return the Upper Context Table Pointer (UCTP)
 * if marked present.
 */
static phys_addr_t root_entry_uctp(struct root_entry *re)
{
        if (!(re->hi & 1))
                return 0;

        return re->hi & VTD_PAGE_MASK;
}

/*
 * low 64 bits:
 * 0: present
 * 1: fault processing disable
 * 2-3: translation type
 * 12-63: address space root
 * high 64 bits:
 * 0-2: address width
 * 3-6: aval
 * 8-23: domain id
 */
struct context_entry {
        u64 lo;
        u64 hi;
};

static inline void context_clear_pasid_enable(struct context_entry *context)
{
        context->lo &= ~(1ULL << 11);
}

static inline bool context_pasid_enabled(struct context_entry *context)
{
        return !!(context->lo & (1ULL << 11));
}

static inline void context_set_copied(struct context_entry *context)
{
        context->hi |= (1ull << 3);
}

static inline bool context_copied(struct context_entry *context)
{
        return !!(context->hi & (1ULL << 3));
}

static inline bool __context_present(struct context_entry *context)
{
        return (context->lo & 1);
}

static inline bool context_present(struct context_entry *context)
{
        return context_pasid_enabled(context) ?
             __context_present(context) :
             __context_present(context) && !context_copied(context);
}

static inline void context_set_present(struct context_entry *context)
{
        context->lo |= 1;
}

static inline void context_set_fault_enable(struct context_entry *context)
{
        context->lo &= (((u64)-1) << 2) | 1;
}

static inline void context_set_translation_type(struct context_entry *context,
                                                unsigned long value)
{
        context->lo &= (((u64)-1) << 4) | 3;
        context->lo |= (value & 3) << 2;
}

static inline void context_set_address_root(struct context_entry *context,
                                            unsigned long value)
{
        context->lo &= ~VTD_PAGE_MASK;
        context->lo |= value & VTD_PAGE_MASK;
}

static inline void context_set_address_width(struct context_entry *context,
                                             unsigned long value)
{
        context->hi |= value & 7;
}

static inline void context_set_domain_id(struct context_entry *context,
                                         unsigned long value)
{
        context->hi |= (value & ((1 << 16) - 1)) << 8;
}

static inline int context_domain_id(struct context_entry *c)
{
        return((c->hi >> 8) & 0xffff);
}

static inline void context_clear_entry(struct context_entry *context)
{
        context->lo = 0;
        context->hi = 0;
}

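/*
 * Illustrative sketch (hypothetical values; the helpers are the ones
 * defined above): a context entry for a 4-level (AGAW 2) page table
 * rooted at pgd_phys, in domain 42, with multi-level translation
 * (type 0), could be composed as
 *
 *      struct context_entry ce = { 0, 0 };
 *
 *      context_set_address_root(&ce, pgd_phys);  // lo bits 12-63
 *      context_set_translation_type(&ce, 0);     // lo bits 2-3
 *      context_set_address_width(&ce, 2);        // hi bits 0-2
 *      context_set_domain_id(&ce, 42);           // hi bits 8-23
 *      context_set_fault_enable(&ce);            // clears lo bit 1
 *      context_set_present(&ce);                 // lo bit 0, set last
 *
 * mirroring the bit layout documented above struct context_entry.
 */
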
/*
 * 0: readable
 * 1: writable
 * 2-6: reserved
 * 7: super page
 * 8-10: available
 * 11: snoop behavior
 * 12-63: Host physical address
 */
struct dma_pte {
        u64 val;
};

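/*
 * Illustrative sketch (hypothetical 'phys', not driver code): a
 * present, read/write leaf PTE mapping physical address 'phys' is
 * simply
 *
 *      pte->val = (phys & VTD_PAGE_MASK) | DMA_PTE_READ | DMA_PTE_WRITE;
 *
 * which is how pfn_to_dma_pte() below composes pteval for newly
 * allocated page-table pages; OR-ing in DMA_PTE_LARGE_PAGE (bit 7)
 * would mark the entry as a superpage instead.
 */
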
static inline void dma_clear_pte(struct dma_pte *pte)
{
        pte->val = 0;
}

static inline u64 dma_pte_addr(struct dma_pte *pte)
{
#ifdef CONFIG_64BIT
        return pte->val & VTD_PAGE_MASK;
#else
        /* Must have a full atomic 64-bit read */
        return __cmpxchg64(&pte->val, 0ULL, 0ULL) & VTD_PAGE_MASK;
#endif
}

static inline bool dma_pte_present(struct dma_pte *pte)
{
        return (pte->val & 3) != 0;
}

static inline bool dma_pte_superpage(struct dma_pte *pte)
{
        return (pte->val & DMA_PTE_LARGE_PAGE);
}

static inline int first_pte_in_page(struct dma_pte *pte)
{
        return !((unsigned long)pte & ~VTD_PAGE_MASK);
}

/*
 * This domain is a statically identity mapping domain.
 *      1. This domain creates a static 1:1 mapping to all usable memory.
 *      2. It maps to each iommu if successful.
 *      3. Each iommu maps to this domain if successful.
 */
static struct dmar_domain *si_domain;
static int hw_pass_through = 1;

Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700366
Joerg Roedel28ccce02015-07-21 14:45:31 +0200367/*
368 * Domain represents a virtual machine, more than one devices
Weidong Han1ce28fe2008-12-08 16:35:39 +0800369 * across iommus may be owned in one domain, e.g. kvm guest.
370 */
Jiang Liuab8dfe22014-07-11 14:19:27 +0800371#define DOMAIN_FLAG_VIRTUAL_MACHINE (1 << 0)
Weidong Han1ce28fe2008-12-08 16:35:39 +0800372
Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700373/* si_domain contains mulitple devices */
Jiang Liuab8dfe22014-07-11 14:19:27 +0800374#define DOMAIN_FLAG_STATIC_IDENTITY (1 << 1)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -0700375
Joerg Roedel29a27712015-07-21 17:17:12 +0200376#define for_each_domain_iommu(idx, domain) \
377 for (idx = 0; idx < g_num_of_iommus; idx++) \
378 if (domain->iommu_refcnt[idx])
379
struct dmar_domain {
        int     nid;                    /* node id */

        unsigned        iommu_refcnt[DMAR_UNITS_SUPPORTED];
                                        /* Refcount of devices per iommu */

        u16             iommu_did[DMAR_UNITS_SUPPORTED];
                                        /* Domain ids per IOMMU. Use u16 since
                                         * domain ids are 16 bit wide according
                                         * to VT-d spec, section 9.3 */

        struct list_head devices;       /* all devices' list */
        struct iova_domain iovad;       /* iova's that belong to this domain */

        struct dma_pte  *pgd;           /* virtual address */
        int             gaw;            /* max guest address width */

        /* adjusted guest address width, 0 is level 2 30-bit */
        int             agaw;

        int             flags;          /* flags to find out type of domain */

        int             iommu_coherency;/* indicate coherency of iommu access */
        int             iommu_snooping; /* indicate snooping control feature */
        int             iommu_count;    /* reference count of iommu */
        int             iommu_superpage;/* Level of superpages supported:
                                           0 == 4KiB (no superpages), 1 == 2MiB,
                                           2 == 1GiB, 3 == 512GiB, 4 == 1TiB */
        u64             max_addr;       /* maximum mapped address */

        struct iommu_domain domain;     /* generic domain data structure for
                                           iommu core */
};

/* PCI domain-device relationship */
struct device_domain_info {
        struct list_head link;  /* link to domain siblings */
        struct list_head global; /* link to global list */
        u8 bus;                 /* PCI bus number */
        u8 devfn;               /* PCI devfn number */
        struct {
                u8 enabled:1;
                u8 qdep;
        } ats;                  /* ATS state */
        struct device *dev;     /* it's NULL for PCIe-to-PCI bridge */
        struct intel_iommu *iommu; /* IOMMU used by this device */
        struct dmar_domain *domain; /* pointer to domain */
};

struct dmar_rmrr_unit {
        struct list_head list;          /* list of rmrr units   */
        struct acpi_dmar_header *hdr;   /* ACPI header          */
        u64     base_address;           /* reserved base address*/
        u64     end_address;            /* reserved end address */
        struct dmar_dev_scope *devices; /* target devices */
        int     devices_cnt;            /* target device count */
};

struct dmar_atsr_unit {
        struct list_head list;          /* list of ATSR units */
        struct acpi_dmar_header *hdr;   /* ACPI header */
        struct dmar_dev_scope *devices; /* target devices */
        int devices_cnt;                /* target device count */
        u8 include_all:1;               /* include all ports */
};

static LIST_HEAD(dmar_atsr_units);
static LIST_HEAD(dmar_rmrr_units);

#define for_each_rmrr_units(rmrr) \
        list_for_each_entry(rmrr, &dmar_rmrr_units, list)

static void flush_unmaps_timeout(unsigned long data);

static DEFINE_TIMER(unmap_timer, flush_unmaps_timeout, 0, 0);

#define HIGH_WATER_MARK 250
struct deferred_flush_tables {
        int next;
        struct iova *iova[HIGH_WATER_MARK];
        struct dmar_domain *domain[HIGH_WATER_MARK];
        struct page *freelist[HIGH_WATER_MARK];
};

static struct deferred_flush_tables *deferred_flush;

/* number of registered intel_iommus; used for indexing g_iommus */
static int g_num_of_iommus;

static DEFINE_SPINLOCK(async_umap_flush_lock);
static LIST_HEAD(unmaps_to_do);

static int timer_on;
static long list_size;

static void domain_exit(struct dmar_domain *domain);
static void domain_remove_dev_info(struct dmar_domain *domain);
static void dmar_remove_one_dev_info(struct dmar_domain *domain,
                                     struct device *dev);
static void __dmar_remove_one_dev_info(struct device_domain_info *info);
static void domain_context_clear(struct intel_iommu *iommu,
                                 struct device *dev);
static int domain_detach_iommu(struct dmar_domain *domain,
                               struct intel_iommu *iommu);

#ifdef CONFIG_INTEL_IOMMU_DEFAULT_ON
int dmar_disabled = 0;
#else
int dmar_disabled = 1;
#endif /*CONFIG_INTEL_IOMMU_DEFAULT_ON*/

int intel_iommu_enabled = 0;
EXPORT_SYMBOL_GPL(intel_iommu_enabled);

static int dmar_map_gfx = 1;
static int dmar_forcedac;
static int intel_iommu_strict;
static int intel_iommu_superpage = 1;
static int intel_iommu_ecs = 1;

/* We only actually use ECS when PASID support (on the new bit 40)
 * is also advertised. Some early implementations (the ones with
 * PASID support on bit 28) have issues even when we *only* use
 * extended root/context tables. */
#define ecs_enabled(iommu) (intel_iommu_ecs && ecap_ecs(iommu->ecap) && \
                            ecap_pasid(iommu->ecap))

int intel_iommu_gfx_mapped;
EXPORT_SYMBOL_GPL(intel_iommu_gfx_mapped);

#define DUMMY_DEVICE_DOMAIN_INFO ((struct device_domain_info *)(-1))
static DEFINE_SPINLOCK(device_domain_lock);
static LIST_HEAD(device_domain_list);

static const struct iommu_ops intel_iommu_ops;

static bool translation_pre_enabled(struct intel_iommu *iommu)
{
        return (iommu->flags & VTD_FLAG_TRANS_PRE_ENABLED);
}

static void clear_translation_pre_enabled(struct intel_iommu *iommu)
{
        iommu->flags &= ~VTD_FLAG_TRANS_PRE_ENABLED;
}

static void init_translation_status(struct intel_iommu *iommu)
{
        u32 gsts;

        gsts = readl(iommu->reg + DMAR_GSTS_REG);
        if (gsts & DMA_GSTS_TES)
                iommu->flags |= VTD_FLAG_TRANS_PRE_ENABLED;
}

/* Convert a generic 'struct iommu_domain' to the private 'struct dmar_domain' */
static struct dmar_domain *to_dmar_domain(struct iommu_domain *dom)
{
        return container_of(dom, struct dmar_domain, domain);
}

static int __init intel_iommu_setup(char *str)
{
        if (!str)
                return -EINVAL;
        while (*str) {
                if (!strncmp(str, "on", 2)) {
                        dmar_disabled = 0;
                        pr_info("IOMMU enabled\n");
                } else if (!strncmp(str, "off", 3)) {
                        dmar_disabled = 1;
                        pr_info("IOMMU disabled\n");
                } else if (!strncmp(str, "igfx_off", 8)) {
                        dmar_map_gfx = 0;
                        pr_info("Disable GFX device mapping\n");
                } else if (!strncmp(str, "forcedac", 8)) {
                        pr_info("Forcing DAC for PCI devices\n");
                        dmar_forcedac = 1;
                } else if (!strncmp(str, "strict", 6)) {
                        pr_info("Disable batched IOTLB flush\n");
                        intel_iommu_strict = 1;
                } else if (!strncmp(str, "sp_off", 6)) {
                        pr_info("Disable supported super page\n");
                        intel_iommu_superpage = 0;
                } else if (!strncmp(str, "ecs_off", 7)) {
                        printk(KERN_INFO
                                "Intel-IOMMU: disable extended context table support\n");
                        intel_iommu_ecs = 0;
                }

                str += strcspn(str, ",");
                while (*str == ',')
                        str++;
        }
        return 0;
}
__setup("intel_iommu=", intel_iommu_setup);

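/*
 * Usage sketch (illustrative; the option names come from the parser
 * above): multiple options are comma-separated on the kernel command
 * line, e.g.
 *
 *      intel_iommu=on,strict,sp_off
 *
 * which enables DMA remapping, disables batched IOTLB flushing and
 * disables superpage use.
 */
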
static struct kmem_cache *iommu_domain_cache;
static struct kmem_cache *iommu_devinfo_cache;

static struct dmar_domain* get_iommu_domain(struct intel_iommu *iommu, u16 did)
{
        struct dmar_domain **domains;
        int idx = did >> 8;

        domains = iommu->domains[idx];
        if (!domains)
                return NULL;

        return domains[did & 0xff];
}

static void set_iommu_domain(struct intel_iommu *iommu, u16 did,
                             struct dmar_domain *domain)
{
        struct dmar_domain **domains;
        int idx = did >> 8;

        if (!iommu->domains[idx]) {
                size_t size = 256 * sizeof(struct dmar_domain *);
                iommu->domains[idx] = kzalloc(size, GFP_ATOMIC);
        }

        domains = iommu->domains[idx];
        if (WARN_ON(!domains))
                return;
        else
                domains[did & 0xff] = domain;
}

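/*
 * Illustrative note: iommu->domains is a two-level table keyed by
 * domain id. For did 0x1234 the top-level index is 0x12 and the slot
 * within that 256-entry second-level array is 0x34; set_iommu_domain()
 * above allocates the second-level arrays lazily, so the full 64K
 * domain-id space never has to be populated up front.
 */
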
static inline void *alloc_pgtable_page(int node)
{
        struct page *page;
        void *vaddr = NULL;

        page = alloc_pages_node(node, GFP_ATOMIC | __GFP_ZERO, 0);
        if (page)
                vaddr = page_address(page);
        return vaddr;
}

static inline void free_pgtable_page(void *vaddr)
{
        free_page((unsigned long)vaddr);
}

static inline void *alloc_domain_mem(void)
{
        return kmem_cache_alloc(iommu_domain_cache, GFP_ATOMIC);
}

static void free_domain_mem(void *vaddr)
{
        kmem_cache_free(iommu_domain_cache, vaddr);
}

static inline void *alloc_devinfo_mem(void)
{
        return kmem_cache_alloc(iommu_devinfo_cache, GFP_ATOMIC);
}

static inline void free_devinfo_mem(void *vaddr)
{
        kmem_cache_free(iommu_devinfo_cache, vaddr);
}

static inline int domain_type_is_vm(struct dmar_domain *domain)
{
        return domain->flags & DOMAIN_FLAG_VIRTUAL_MACHINE;
}

static inline int domain_type_is_si(struct dmar_domain *domain)
{
        return domain->flags & DOMAIN_FLAG_STATIC_IDENTITY;
}

static inline int domain_type_is_vm_or_si(struct dmar_domain *domain)
{
        return domain->flags & (DOMAIN_FLAG_VIRTUAL_MACHINE |
                                DOMAIN_FLAG_STATIC_IDENTITY);
}

static inline int domain_pfn_supported(struct dmar_domain *domain,
                                       unsigned long pfn)
{
        int addr_width = agaw_to_width(domain->agaw) - VTD_PAGE_SHIFT;

        return !(addr_width < BITS_PER_LONG && pfn >> addr_width);
}

static int __iommu_calculate_agaw(struct intel_iommu *iommu, int max_gaw)
{
        unsigned long sagaw;
        int agaw = -1;

        sagaw = cap_sagaw(iommu->cap);
        for (agaw = width_to_agaw(max_gaw);
             agaw >= 0; agaw--) {
                if (test_bit(agaw, &sagaw))
                        break;
        }

        return agaw;
}

/*
 * Calculate max SAGAW for each iommu.
 */
int iommu_calculate_max_sagaw(struct intel_iommu *iommu)
{
        return __iommu_calculate_agaw(iommu, MAX_AGAW_WIDTH);
}

/*
 * Calculate agaw for each iommu.
 * "SAGAW" may differ across iommus: use a default agaw, and fall back
 * to a smaller supported agaw for iommus that don't support the default.
 */
int iommu_calculate_agaw(struct intel_iommu *iommu)
{
        return __iommu_calculate_agaw(iommu, DEFAULT_DOMAIN_ADDRESS_WIDTH);
}

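/*
 * Worked example: with DEFAULT_DOMAIN_ADDRESS_WIDTH of 48,
 * __iommu_calculate_agaw() starts at width_to_agaw(48) == 2 and walks
 * down the SAGAW capability bits. Hardware advertising only 3-level
 * tables (sagaw bit 1) therefore yields agaw 1, i.e. a 39-bit address
 * width rather than the requested 48.
 */
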
/* This function only returns a single iommu in a domain */
static struct intel_iommu *domain_get_iommu(struct dmar_domain *domain)
{
        int iommu_id;

        /* si_domain and vm domain should not get here. */
        BUG_ON(domain_type_is_vm_or_si(domain));
        for_each_domain_iommu(iommu_id, domain)
                break;

        if (iommu_id < 0 || iommu_id >= g_num_of_iommus)
                return NULL;

        return g_iommus[iommu_id];
}

static void domain_update_iommu_coherency(struct dmar_domain *domain)
{
        struct dmar_drhd_unit *drhd;
        struct intel_iommu *iommu;
        bool found = false;
        int i;

        domain->iommu_coherency = 1;

        for_each_domain_iommu(i, domain) {
                found = true;
                if (!ecap_coherent(g_iommus[i]->ecap)) {
                        domain->iommu_coherency = 0;
                        break;
                }
        }
        if (found)
                return;

        /* No hardware attached; use lowest common denominator */
        rcu_read_lock();
        for_each_active_iommu(iommu, drhd) {
                if (!ecap_coherent(iommu->ecap)) {
                        domain->iommu_coherency = 0;
                        break;
                }
        }
        rcu_read_unlock();
}

static int domain_update_iommu_snooping(struct intel_iommu *skip)
{
        struct dmar_drhd_unit *drhd;
        struct intel_iommu *iommu;
        int ret = 1;

        rcu_read_lock();
        for_each_active_iommu(iommu, drhd) {
                if (iommu != skip) {
                        if (!ecap_sc_support(iommu->ecap)) {
                                ret = 0;
                                break;
                        }
                }
        }
        rcu_read_unlock();

        return ret;
}

static int domain_update_iommu_superpage(struct intel_iommu *skip)
{
        struct dmar_drhd_unit *drhd;
        struct intel_iommu *iommu;
        int mask = 0xf;

        if (!intel_iommu_superpage) {
                return 0;
        }

        /* set iommu_superpage to the smallest common denominator */
        rcu_read_lock();
        for_each_active_iommu(iommu, drhd) {
                if (iommu != skip) {
                        mask &= cap_super_page_val(iommu->cap);
                        if (!mask)
                                break;
                }
        }
        rcu_read_unlock();

        return fls(mask);
}

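/*
 * Worked example: if one IOMMU advertises 2MiB and 1GiB superpages
 * (cap_super_page_val() == 0x3) and another only 2MiB (0x1), the
 * running mask becomes 0x1 and fls(0x1) == 1, so the domain is
 * limited to level-1 (2MiB) superpages that every unit can handle.
 */
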
/* Some capabilities may be different across iommus */
static void domain_update_iommu_cap(struct dmar_domain *domain)
{
        domain_update_iommu_coherency(domain);
        domain->iommu_snooping = domain_update_iommu_snooping(NULL);
        domain->iommu_superpage = domain_update_iommu_superpage(NULL);
}

static inline struct context_entry *iommu_context_addr(struct intel_iommu *iommu,
                                                       u8 bus, u8 devfn, int alloc)
{
        struct root_entry *root = &iommu->root_entry[bus];
        struct context_entry *context;
        u64 *entry;

        entry = &root->lo;
        if (ecs_enabled(iommu)) {
                if (devfn >= 0x80) {
                        devfn -= 0x80;
                        entry = &root->hi;
                }
                devfn *= 2;
        }
        if (*entry & 1)
                context = phys_to_virt(*entry & VTD_PAGE_MASK);
        else {
                unsigned long phy_addr;
                if (!alloc)
                        return NULL;

                context = alloc_pgtable_page(iommu->node);
                if (!context)
                        return NULL;

                __iommu_flush_cache(iommu, (void *)context, CONTEXT_SIZE);
                phy_addr = virt_to_phys((void *)context);
                *entry = phy_addr | 1;
                __iommu_flush_cache(iommu, entry, sizeof(*entry));
        }
        return &context[devfn];
}

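/*
 * Illustrative note: in extended (ECS) mode each context entry is
 * twice as wide, so one 4KiB table holds only 128 of them. Devfn
 * 0x00-0x7f are reached through root->lo and devfn 0x80-0xff through
 * root->hi; e.g. devfn 0x82 becomes (0x82 - 0x80) * 2 == 4, the index
 * of its double-width entry in the upper context table.
 */
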
static int iommu_dummy(struct device *dev)
{
        return dev->archdata.iommu == DUMMY_DEVICE_DOMAIN_INFO;
}

static struct intel_iommu *device_to_iommu(struct device *dev, u8 *bus, u8 *devfn)
{
        struct dmar_drhd_unit *drhd = NULL;
        struct intel_iommu *iommu;
        struct device *tmp;
        struct pci_dev *ptmp, *pdev = NULL;
        u16 segment = 0;
        int i;

        if (iommu_dummy(dev))
                return NULL;

        if (dev_is_pci(dev)) {
                pdev = to_pci_dev(dev);
                segment = pci_domain_nr(pdev->bus);
        } else if (has_acpi_companion(dev))
                dev = &ACPI_COMPANION(dev)->dev;

        rcu_read_lock();
        for_each_active_iommu(iommu, drhd) {
                if (pdev && segment != drhd->segment)
                        continue;

                for_each_active_dev_scope(drhd->devices,
                                          drhd->devices_cnt, i, tmp) {
                        if (tmp == dev) {
                                *bus = drhd->devices[i].bus;
                                *devfn = drhd->devices[i].devfn;
                                goto out;
                        }

                        if (!pdev || !dev_is_pci(tmp))
                                continue;

                        ptmp = to_pci_dev(tmp);
                        if (ptmp->subordinate &&
                            ptmp->subordinate->number <= pdev->bus->number &&
                            ptmp->subordinate->busn_res.end >= pdev->bus->number)
                                goto got_pdev;
                }

                if (pdev && drhd->include_all) {
                got_pdev:
                        *bus = pdev->bus->number;
                        *devfn = pdev->devfn;
                        goto out;
                }
        }
        iommu = NULL;
 out:
        rcu_read_unlock();

        return iommu;
}

static void domain_flush_cache(struct dmar_domain *domain,
                               void *addr, int size)
{
        if (!domain->iommu_coherency)
                clflush_cache_range(addr, size);
}

static int device_context_mapped(struct intel_iommu *iommu, u8 bus, u8 devfn)
{
        struct context_entry *context;
        int ret = 0;
        unsigned long flags;

        spin_lock_irqsave(&iommu->lock, flags);
        context = iommu_context_addr(iommu, bus, devfn, 0);
        if (context)
                ret = context_present(context);
        spin_unlock_irqrestore(&iommu->lock, flags);
        return ret;
}

static void clear_context_table(struct intel_iommu *iommu, u8 bus, u8 devfn)
{
        struct context_entry *context;
        unsigned long flags;

        spin_lock_irqsave(&iommu->lock, flags);
        context = iommu_context_addr(iommu, bus, devfn, 0);
        if (context) {
                context_clear_entry(context);
                __iommu_flush_cache(iommu, context, sizeof(*context));
        }
        spin_unlock_irqrestore(&iommu->lock, flags);
}

static void free_context_table(struct intel_iommu *iommu)
{
        int i;
        unsigned long flags;
        struct context_entry *context;

        spin_lock_irqsave(&iommu->lock, flags);
        if (!iommu->root_entry) {
                goto out;
        }
        for (i = 0; i < ROOT_ENTRY_NR; i++) {
                context = iommu_context_addr(iommu, i, 0, 0);
                if (context)
                        free_pgtable_page(context);

                if (!ecs_enabled(iommu))
                        continue;

                context = iommu_context_addr(iommu, i, 0x80, 0);
                if (context)
                        free_pgtable_page(context);
        }
        free_pgtable_page(iommu->root_entry);
        iommu->root_entry = NULL;
out:
        spin_unlock_irqrestore(&iommu->lock, flags);
}

static struct dma_pte *pfn_to_dma_pte(struct dmar_domain *domain,
                                      unsigned long pfn, int *target_level)
{
        struct dma_pte *parent, *pte = NULL;
        int level = agaw_to_level(domain->agaw);
        int offset;

        BUG_ON(!domain->pgd);

        if (!domain_pfn_supported(domain, pfn))
                /* Address beyond IOMMU's addressing capabilities. */
                return NULL;

        parent = domain->pgd;

        while (1) {
                void *tmp_page;

                offset = pfn_level_offset(pfn, level);
                pte = &parent[offset];
                if (!*target_level && (dma_pte_superpage(pte) || !dma_pte_present(pte)))
                        break;
                if (level == *target_level)
                        break;

                if (!dma_pte_present(pte)) {
                        uint64_t pteval;

                        tmp_page = alloc_pgtable_page(domain->nid);
                        if (!tmp_page)
                                return NULL;

                        domain_flush_cache(domain, tmp_page, VTD_PAGE_SIZE);
                        pteval = ((uint64_t)virt_to_dma_pfn(tmp_page) << VTD_PAGE_SHIFT) | DMA_PTE_READ | DMA_PTE_WRITE;
                        if (cmpxchg64(&pte->val, 0ULL, pteval))
                                /* Someone else set it while we were thinking; use theirs. */
                                free_pgtable_page(tmp_page);
                        else
                                domain_flush_cache(domain, pte, sizeof(*pte));
                }
                if (level == 1)
                        break;

                parent = phys_to_virt(dma_pte_addr(pte));
                level--;
        }

        if (!*target_level)
                *target_level = level;

        return pte;
}

/* return the address's pte at a specific level */
static struct dma_pte *dma_pfn_level_pte(struct dmar_domain *domain,
                                         unsigned long pfn,
                                         int level, int *large_page)
{
        struct dma_pte *parent, *pte = NULL;
        int total = agaw_to_level(domain->agaw);
        int offset;

        parent = domain->pgd;
        while (level <= total) {
                offset = pfn_level_offset(pfn, total);
                pte = &parent[offset];
                if (level == total)
                        return pte;

                if (!dma_pte_present(pte)) {
                        *large_page = total;
                        break;
                }

                if (dma_pte_superpage(pte)) {
                        *large_page = total;
                        return pte;
                }

                parent = phys_to_virt(dma_pte_addr(pte));
                total--;
        }
        return NULL;
}

/* clear last level pte; an IOTLB flush should follow */
static void dma_pte_clear_range(struct dmar_domain *domain,
                                unsigned long start_pfn,
                                unsigned long last_pfn)
{
        unsigned int large_page = 1;
        struct dma_pte *first_pte, *pte;

        BUG_ON(!domain_pfn_supported(domain, start_pfn));
        BUG_ON(!domain_pfn_supported(domain, last_pfn));
        BUG_ON(start_pfn > last_pfn);

        /* we don't need lock here; nobody else touches the iova range */
        do {
                large_page = 1;
                first_pte = pte = dma_pfn_level_pte(domain, start_pfn, 1, &large_page);
                if (!pte) {
                        start_pfn = align_to_level(start_pfn + 1, large_page + 1);
                        continue;
                }
                do {
                        dma_clear_pte(pte);
                        start_pfn += lvl_to_nr_pages(large_page);
                        pte++;
                } while (start_pfn <= last_pfn && !first_pte_in_page(pte));

                domain_flush_cache(domain, first_pte,
                                   (void *)pte - (void *)first_pte);

        } while (start_pfn && start_pfn <= last_pfn);
}

static void dma_pte_free_level(struct dmar_domain *domain, int level,
                               struct dma_pte *pte, unsigned long pfn,
                               unsigned long start_pfn, unsigned long last_pfn)
{
        pfn = max(start_pfn, pfn);
        pte = &pte[pfn_level_offset(pfn, level)];

        do {
                unsigned long level_pfn;
                struct dma_pte *level_pte;

                if (!dma_pte_present(pte) || dma_pte_superpage(pte))
                        goto next;

                level_pfn = pfn & level_mask(level - 1);
                level_pte = phys_to_virt(dma_pte_addr(pte));

                if (level > 2)
                        dma_pte_free_level(domain, level - 1, level_pte,
                                           level_pfn, start_pfn, last_pfn);

                /* If range covers entire pagetable, free it */
                if (!(start_pfn > level_pfn ||
                      last_pfn < level_pfn + level_size(level) - 1)) {
                        dma_clear_pte(pte);
                        domain_flush_cache(domain, pte, sizeof(*pte));
                        free_pgtable_page(level_pte);
                }
next:
                pfn += level_size(level);
        } while (!first_pte_in_page(++pte) && pfn <= last_pfn);
}

/* free page table pages. last level pte should already be cleared */
static void dma_pte_free_pagetable(struct dmar_domain *domain,
                                   unsigned long start_pfn,
                                   unsigned long last_pfn)
{
        BUG_ON(!domain_pfn_supported(domain, start_pfn));
        BUG_ON(!domain_pfn_supported(domain, last_pfn));
        BUG_ON(start_pfn > last_pfn);

        dma_pte_clear_range(domain, start_pfn, last_pfn);

        /* We don't need lock here; nobody else touches the iova range */
        dma_pte_free_level(domain, agaw_to_level(domain->agaw),
                           domain->pgd, 0, start_pfn, last_pfn);

        /* free pgd */
        if (start_pfn == 0 && last_pfn == DOMAIN_MAX_PFN(domain->gaw)) {
                free_pgtable_page(domain->pgd);
                domain->pgd = NULL;
        }
}

/* When a page at a given level is being unlinked from its parent, we don't
   need to *modify* it at all. All we need to do is make a list of all the
   pages which can be freed just as soon as we've flushed the IOTLB and we
   know the hardware page-walk will no longer touch them.
   The 'pte' argument is the *parent* PTE, pointing to the page that is to
   be freed. */
static struct page *dma_pte_list_pagetables(struct dmar_domain *domain,
                                            int level, struct dma_pte *pte,
                                            struct page *freelist)
{
        struct page *pg;

        pg = pfn_to_page(dma_pte_addr(pte) >> PAGE_SHIFT);
        pg->freelist = freelist;
        freelist = pg;

        if (level == 1)
                return freelist;

        pte = page_address(pg);
        do {
                if (dma_pte_present(pte) && !dma_pte_superpage(pte))
                        freelist = dma_pte_list_pagetables(domain, level - 1,
                                                           pte, freelist);
                pte++;
        } while (!first_pte_in_page(pte));

        return freelist;
}

static struct page *dma_pte_clear_level(struct dmar_domain *domain, int level,
                                        struct dma_pte *pte, unsigned long pfn,
                                        unsigned long start_pfn,
                                        unsigned long last_pfn,
                                        struct page *freelist)
{
        struct dma_pte *first_pte = NULL, *last_pte = NULL;

        pfn = max(start_pfn, pfn);
        pte = &pte[pfn_level_offset(pfn, level)];

        do {
                unsigned long level_pfn;

                if (!dma_pte_present(pte))
                        goto next;

                level_pfn = pfn & level_mask(level);

                /* If range covers entire pagetable, free it */
                if (start_pfn <= level_pfn &&
                    last_pfn >= level_pfn + level_size(level) - 1) {
                        /* These subordinate page tables are going away entirely. Don't
                           bother to clear them; we're just going to *free* them. */
                        if (level > 1 && !dma_pte_superpage(pte))
                                freelist = dma_pte_list_pagetables(domain, level - 1, pte, freelist);

                        dma_clear_pte(pte);
                        if (!first_pte)
                                first_pte = pte;
                        last_pte = pte;
                } else if (level > 1) {
                        /* Recurse down into a level that isn't *entirely* obsolete */
                        freelist = dma_pte_clear_level(domain, level - 1,
                                                       phys_to_virt(dma_pte_addr(pte)),
                                                       level_pfn, start_pfn, last_pfn,
                                                       freelist);
                }
next:
                pfn += level_size(level);
        } while (!first_pte_in_page(++pte) && pfn <= last_pfn);

        if (first_pte)
                domain_flush_cache(domain, first_pte,
                                   (void *)++last_pte - (void *)first_pte);

        return freelist;
}

/* We can't just free the pages because the IOMMU may still be walking
   the page tables, and may have cached the intermediate levels. The
   pages can only be freed after the IOTLB flush has been done. */
static struct page *domain_unmap(struct dmar_domain *domain,
                                 unsigned long start_pfn,
                                 unsigned long last_pfn)
{
        struct page *freelist = NULL;

        BUG_ON(!domain_pfn_supported(domain, start_pfn));
        BUG_ON(!domain_pfn_supported(domain, last_pfn));
        BUG_ON(start_pfn > last_pfn);

        /* we don't need lock here; nobody else touches the iova range */
        freelist = dma_pte_clear_level(domain, agaw_to_level(domain->agaw),
                                       domain->pgd, 0, start_pfn, last_pfn, NULL);

        /* free pgd */
        if (start_pfn == 0 && last_pfn == DOMAIN_MAX_PFN(domain->gaw)) {
                struct page *pgd_page = virt_to_page(domain->pgd);
                pgd_page->freelist = freelist;
                freelist = pgd_page;

                domain->pgd = NULL;
        }

        return freelist;
}

static void dma_free_pagelist(struct page *freelist)
{
        struct page *pg;

        while ((pg = freelist)) {
                freelist = pg->freelist;
                free_pgtable_page(page_address(pg));
        }
}

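/*
 * Usage sketch (illustrative; the unmap paths later in this file
 * follow this pattern): the freelist from domain_unmap() must outlive
 * the IOTLB flush, so a full unmap is three ordered steps:
 *
 *      struct page *freelist;
 *
 *      freelist = domain_unmap(domain, start_pfn, last_pfn);
 *      // ... flush the IOTLB for the unmapped range here ...
 *      dma_free_pagelist(freelist);
 *
 * Freeing before the flush could let an in-flight hardware page walk
 * dereference a page-table page that has already been reused.
 */
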
/* iommu handling */
static int iommu_alloc_root_entry(struct intel_iommu *iommu)
{
        struct root_entry *root;
        unsigned long flags;

        root = (struct root_entry *)alloc_pgtable_page(iommu->node);
        if (!root) {
                pr_err("Allocating root entry for %s failed\n",
                       iommu->name);
                return -ENOMEM;
        }

        __iommu_flush_cache(iommu, root, ROOT_SIZE);

        spin_lock_irqsave(&iommu->lock, flags);
        iommu->root_entry = root;
        spin_unlock_irqrestore(&iommu->lock, flags);

        return 0;
}

static void iommu_set_root_entry(struct intel_iommu *iommu)
{
        u64 addr;
        u32 sts;
        unsigned long flag;

        addr = virt_to_phys(iommu->root_entry);
        if (ecs_enabled(iommu))
                addr |= DMA_RTADDR_RTT;

        raw_spin_lock_irqsave(&iommu->register_lock, flag);
        dmar_writeq(iommu->reg + DMAR_RTADDR_REG, addr);

        writel(iommu->gcmd | DMA_GCMD_SRTP, iommu->reg + DMAR_GCMD_REG);

        /* Make sure hardware completes it */
        IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
                      readl, (sts & DMA_GSTS_RTPS), sts);

        raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
}

1298{
1299 u32 val;
1300 unsigned long flag;
1301
David Woodhouse9af88142009-02-13 23:18:03 +00001302 if (!rwbf_quirk && !cap_rwbf(iommu->cap))
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001303 return;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001304
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001305 raw_spin_lock_irqsave(&iommu->register_lock, flag);
David Woodhouse462b60f2009-05-10 20:18:18 +01001306 writel(iommu->gcmd | DMA_GCMD_WBF, iommu->reg + DMAR_GCMD_REG);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001307
	/* Make sure hardware completes it */
1309 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
David Woodhousec416daa2009-05-10 20:30:58 +01001310 readl, (!(val & DMA_GSTS_WBFS)), val);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001311
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001312 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001313}
1314
/* Invalidate context-cache entries at the given granularity */
David Woodhouse4c25a2c2009-05-10 17:16:06 +01001316static void __iommu_flush_context(struct intel_iommu *iommu,
1317 u16 did, u16 source_id, u8 function_mask,
1318 u64 type)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001319{
1320 u64 val = 0;
1321 unsigned long flag;
1322
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001323 switch (type) {
1324 case DMA_CCMD_GLOBAL_INVL:
1325 val = DMA_CCMD_GLOBAL_INVL;
1326 break;
1327 case DMA_CCMD_DOMAIN_INVL:
1328 val = DMA_CCMD_DOMAIN_INVL|DMA_CCMD_DID(did);
1329 break;
1330 case DMA_CCMD_DEVICE_INVL:
1331 val = DMA_CCMD_DEVICE_INVL|DMA_CCMD_DID(did)
1332 | DMA_CCMD_SID(source_id) | DMA_CCMD_FM(function_mask);
1333 break;
1334 default:
1335 BUG();
1336 }
1337 val |= DMA_CCMD_ICC;
1338
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001339 raw_spin_lock_irqsave(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001340 dmar_writeq(iommu->reg + DMAR_CCMD_REG, val);
1341
	/* Make sure hardware completes it */
1343 IOMMU_WAIT_OP(iommu, DMAR_CCMD_REG,
1344 dmar_readq, (!(val & DMA_CCMD_ICC)), val);
1345
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001346 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001347}
1348
/* Invalidate IOTLB entries at the given granularity */
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01001350static void __iommu_flush_iotlb(struct intel_iommu *iommu, u16 did,
1351 u64 addr, unsigned int size_order, u64 type)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001352{
1353 int tlb_offset = ecap_iotlb_offset(iommu->ecap);
1354 u64 val = 0, val_iva = 0;
1355 unsigned long flag;
1356
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001357 switch (type) {
1358 case DMA_TLB_GLOBAL_FLUSH:
		/* a global flush doesn't need to set IVA_REG */
1360 val = DMA_TLB_GLOBAL_FLUSH|DMA_TLB_IVT;
1361 break;
1362 case DMA_TLB_DSI_FLUSH:
1363 val = DMA_TLB_DSI_FLUSH|DMA_TLB_IVT|DMA_TLB_DID(did);
1364 break;
1365 case DMA_TLB_PSI_FLUSH:
1366 val = DMA_TLB_PSI_FLUSH|DMA_TLB_IVT|DMA_TLB_DID(did);
David Woodhouseea8ea462014-03-05 17:09:32 +00001367 /* IH bit is passed in as part of address */
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001368 val_iva = size_order | addr;
1369 break;
1370 default:
1371 BUG();
1372 }
1373 /* Note: set drain read/write */
1374#if 0
1375 /*
	 * Read drain is probably only needed to be extra safe; it looks
	 * like we can skip it without any impact.
1378 */
1379 if (cap_read_drain(iommu->cap))
1380 val |= DMA_TLB_READ_DRAIN;
1381#endif
1382 if (cap_write_drain(iommu->cap))
1383 val |= DMA_TLB_WRITE_DRAIN;
1384
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001385 raw_spin_lock_irqsave(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001386 /* Note: Only uses first TLB reg currently */
1387 if (val_iva)
1388 dmar_writeq(iommu->reg + tlb_offset, val_iva);
1389 dmar_writeq(iommu->reg + tlb_offset + 8, val);
1390
	/* Make sure hardware completes it */
1392 IOMMU_WAIT_OP(iommu, tlb_offset + 8,
1393 dmar_readq, (!(val & DMA_TLB_IVT)), val);
1394
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001395 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001396
1397 /* check IOTLB invalidation granularity */
1398 if (DMA_TLB_IAIG(val) == 0)
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001399 pr_err("Flush IOTLB failed\n");
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001400 if (DMA_TLB_IAIG(val) != DMA_TLB_IIRG(type))
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001401 pr_debug("TLB flush request %Lx, actual %Lx\n",
Fenghua Yu5b6985c2008-10-16 18:02:32 -07001402 (unsigned long long)DMA_TLB_IIRG(type),
1403 (unsigned long long)DMA_TLB_IAIG(val));
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001404}
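
/*
 * Worked example of the PSI encoding above (values chosen for
 * illustration, 4KiB VT-d pages assumed): to invalidate 16 pages at
 * IOVA 0x10000, the caller passes size_order = 4 (2^4 pages) and a
 * naturally aligned address, so val_iva = 0x10000 | 4 with the
 * address-mask order in the low bits:
 *
 *	__iommu_flush_iotlb(iommu, did, 0x10000, 4, DMA_TLB_PSI_FLUSH);
 */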
1405
David Woodhouse64ae8922014-03-09 12:52:30 -07001406static struct device_domain_info *
iommu_support_dev_iotlb(struct dmar_domain *domain, struct intel_iommu *iommu,
			u8 bus, u8 devfn)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001409{
Quentin Lambert2f119c72015-02-06 10:59:53 +01001410 bool found = false;
Yu Zhao93a23a72009-05-18 13:51:37 +08001411 struct device_domain_info *info;
David Woodhouse0bcb3e22014-03-06 17:12:03 +00001412 struct pci_dev *pdev;
Yu Zhao93a23a72009-05-18 13:51:37 +08001413
Joerg Roedel55d94042015-07-22 16:50:40 +02001414 assert_spin_locked(&device_domain_lock);
1415
Yu Zhao93a23a72009-05-18 13:51:37 +08001416 if (!ecap_dev_iotlb_support(iommu->ecap))
1417 return NULL;
1418
1419 if (!iommu->qi)
1420 return NULL;
1421
Yu Zhao93a23a72009-05-18 13:51:37 +08001422 list_for_each_entry(info, &domain->devices, link)
Jiang Liuc3b497c2014-07-11 14:19:25 +08001423 if (info->iommu == iommu && info->bus == bus &&
1424 info->devfn == devfn) {
Quentin Lambert2f119c72015-02-06 10:59:53 +01001425 found = true;
Yu Zhao93a23a72009-05-18 13:51:37 +08001426 break;
1427 }
Yu Zhao93a23a72009-05-18 13:51:37 +08001428
David Woodhouse0bcb3e22014-03-06 17:12:03 +00001429 if (!found || !info->dev || !dev_is_pci(info->dev))
Yu Zhao93a23a72009-05-18 13:51:37 +08001430 return NULL;
1431
David Woodhouse0bcb3e22014-03-06 17:12:03 +00001432 pdev = to_pci_dev(info->dev);
1433
1434 if (!pci_find_ext_capability(pdev, PCI_EXT_CAP_ID_ATS))
Yu Zhao93a23a72009-05-18 13:51:37 +08001435 return NULL;
1436
David Woodhouse0bcb3e22014-03-06 17:12:03 +00001437 if (!dmar_find_matched_atsr_unit(pdev))
Yu Zhao93a23a72009-05-18 13:51:37 +08001438 return NULL;
1439
Yu Zhao93a23a72009-05-18 13:51:37 +08001440 return info;
1441}
1442
1443static void iommu_enable_dev_iotlb(struct device_domain_info *info)
1444{
Bjorn Helgaasfb0cc3a2015-07-20 09:10:36 -05001445 struct pci_dev *pdev;
1446
David Woodhouse0bcb3e22014-03-06 17:12:03 +00001447 if (!info || !dev_is_pci(info->dev))
Yu Zhao93a23a72009-05-18 13:51:37 +08001448 return;
1449
Bjorn Helgaasfb0cc3a2015-07-20 09:10:36 -05001450 pdev = to_pci_dev(info->dev);
1451 if (pci_enable_ats(pdev, VTD_PAGE_SHIFT))
1452 return;
1453
1454 info->ats.enabled = 1;
1455 info->ats.qdep = pci_ats_queue_depth(pdev);
Yu Zhao93a23a72009-05-18 13:51:37 +08001456}
1457
1458static void iommu_disable_dev_iotlb(struct device_domain_info *info)
1459{
Bjorn Helgaasfb0cc3a2015-07-20 09:10:36 -05001460 if (!info->ats.enabled)
Yu Zhao93a23a72009-05-18 13:51:37 +08001461 return;
1462
David Woodhouse0bcb3e22014-03-06 17:12:03 +00001463 pci_disable_ats(to_pci_dev(info->dev));
Bjorn Helgaasfb0cc3a2015-07-20 09:10:36 -05001464 info->ats.enabled = 0;
Yu Zhao93a23a72009-05-18 13:51:37 +08001465}
1466
1467static void iommu_flush_dev_iotlb(struct dmar_domain *domain,
1468 u64 addr, unsigned mask)
1469{
1470 u16 sid, qdep;
1471 unsigned long flags;
1472 struct device_domain_info *info;
1473
1474 spin_lock_irqsave(&device_domain_lock, flags);
1475 list_for_each_entry(info, &domain->devices, link) {
Bjorn Helgaasfb0cc3a2015-07-20 09:10:36 -05001476 if (!info->ats.enabled)
Yu Zhao93a23a72009-05-18 13:51:37 +08001477 continue;
1478
1479 sid = info->bus << 8 | info->devfn;
Bjorn Helgaasfb0cc3a2015-07-20 09:10:36 -05001480 qdep = info->ats.qdep;
Yu Zhao93a23a72009-05-18 13:51:37 +08001481 qi_flush_dev_iotlb(info->iommu, sid, qdep, addr, mask);
1482 }
1483 spin_unlock_irqrestore(&device_domain_lock, flags);
1484}
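
/*
 * Illustrative example: the source-id above is packed the same way as
 * the PCI_DEVID() helper. For a device at 3a:02.0, bus = 0x3a and
 * devfn = PCI_DEVFN(2, 0) = 0x10, so sid = 0x3a << 8 | 0x10 = 0x3a10.
 */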
1485
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02001486static void iommu_flush_iotlb_psi(struct intel_iommu *iommu,
1487 struct dmar_domain *domain,
1488 unsigned long pfn, unsigned int pages,
1489 int ih, int map)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001490{
Yu Zhao9dd2fe82009-05-18 13:51:36 +08001491 unsigned int mask = ilog2(__roundup_pow_of_two(pages));
David Woodhouse03d6a242009-06-28 15:33:46 +01001492 uint64_t addr = (uint64_t)pfn << VTD_PAGE_SHIFT;
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02001493 u16 did = domain->iommu_did[iommu->seq_id];
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001494
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001495 BUG_ON(pages == 0);
1496
David Woodhouseea8ea462014-03-05 17:09:32 +00001497 if (ih)
1498 ih = 1 << 6;
	/*
	 * Fall back to domain-selective flush if PSI is unsupported or the
	 * size is too big. PSI requires the page count to be a power of
	 * two, with the base address naturally aligned to that size.
	 */
Yu Zhao9dd2fe82009-05-18 13:51:36 +08001505 if (!cap_pgsel_inv(iommu->cap) || mask > cap_max_amask_val(iommu->cap))
1506 iommu->flush.flush_iotlb(iommu, did, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01001507 DMA_TLB_DSI_FLUSH);
Yu Zhao9dd2fe82009-05-18 13:51:36 +08001508 else
David Woodhouseea8ea462014-03-05 17:09:32 +00001509 iommu->flush.flush_iotlb(iommu, did, addr | ih, mask,
Yu Zhao9dd2fe82009-05-18 13:51:36 +08001510 DMA_TLB_PSI_FLUSH);
Yu Zhaobf92df32009-06-29 11:31:45 +08001511
1512 /*
	 * In caching mode, changing a page from non-present to present
	 * requires a flush. The device IOTLB, however, does not need to be
	 * flushed in this case.
Yu Zhaobf92df32009-06-29 11:31:45 +08001515 */
Nadav Amit82653632010-04-01 13:24:40 +03001516 if (!cap_caching_mode(iommu->cap) || !map)
Joerg Roedel9452d5b2015-07-21 10:00:56 +02001517 iommu_flush_dev_iotlb(get_iommu_domain(iommu, did),
1518 addr, mask);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001519}
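
/*
 * Worked example for the mask computation above: pages = 9 rounds up
 * to 16, so mask = ilog2(16) = 4 and the PSI covers a 16-page aligned
 * region; if 4 exceeded cap_max_amask_val(iommu->cap), the code would
 * fall back to the domain-selective flush instead.
 */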
1520
mark grossf8bab732008-02-08 04:18:38 -08001521static void iommu_disable_protect_mem_regions(struct intel_iommu *iommu)
1522{
1523 u32 pmen;
1524 unsigned long flags;
1525
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001526 raw_spin_lock_irqsave(&iommu->register_lock, flags);
mark grossf8bab732008-02-08 04:18:38 -08001527 pmen = readl(iommu->reg + DMAR_PMEN_REG);
1528 pmen &= ~DMA_PMEN_EPM;
1529 writel(pmen, iommu->reg + DMAR_PMEN_REG);
1530
1531 /* wait for the protected region status bit to clear */
1532 IOMMU_WAIT_OP(iommu, DMAR_PMEN_REG,
1533 readl, !(pmen & DMA_PMEN_PRS), pmen);
1534
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001535 raw_spin_unlock_irqrestore(&iommu->register_lock, flags);
mark grossf8bab732008-02-08 04:18:38 -08001536}
1537
Jiang Liu2a41cce2014-07-11 14:19:33 +08001538static void iommu_enable_translation(struct intel_iommu *iommu)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001539{
1540 u32 sts;
1541 unsigned long flags;
1542
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001543 raw_spin_lock_irqsave(&iommu->register_lock, flags);
David Woodhousec416daa2009-05-10 20:30:58 +01001544 iommu->gcmd |= DMA_GCMD_TE;
1545 writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001546
	/* Make sure hardware completes it */
1548 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
David Woodhousec416daa2009-05-10 20:30:58 +01001549 readl, (sts & DMA_GSTS_TES), sts);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001550
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001551 raw_spin_unlock_irqrestore(&iommu->register_lock, flags);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001552}
1553
Jiang Liu2a41cce2014-07-11 14:19:33 +08001554static void iommu_disable_translation(struct intel_iommu *iommu)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001555{
1556 u32 sts;
1557 unsigned long flag;
1558
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001559 raw_spin_lock_irqsave(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001560 iommu->gcmd &= ~DMA_GCMD_TE;
1561 writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG);
1562
	/* Make sure hardware completes it */
1564 IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG,
David Woodhousec416daa2009-05-10 20:30:58 +01001565 readl, (!(sts & DMA_GSTS_TES)), sts);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001566
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02001567 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001568}
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001571static int iommu_init_domains(struct intel_iommu *iommu)
1572{
Joerg Roedel8bf47812015-07-21 10:41:21 +02001573 u32 ndomains, nlongs;
1574 size_t size;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001575
1576 ndomains = cap_ndoms(iommu->cap);
Joerg Roedel8bf47812015-07-21 10:41:21 +02001577 pr_debug("%s: Number of Domains supported <%d>\n",
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001578 iommu->name, ndomains);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001579 nlongs = BITS_TO_LONGS(ndomains);
1580
Donald Dutile94a91b502009-08-20 16:51:34 -04001581 spin_lock_init(&iommu->lock);
1582
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001583 iommu->domain_ids = kcalloc(nlongs, sizeof(unsigned long), GFP_KERNEL);
1584 if (!iommu->domain_ids) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001585 pr_err("%s: Allocating domain id array failed\n",
1586 iommu->name);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001587 return -ENOMEM;
1588 }
Joerg Roedel8bf47812015-07-21 10:41:21 +02001589
1590 size = ((ndomains >> 8) + 1) * sizeof(struct dmar_domain **);
1591 iommu->domains = kzalloc(size, GFP_KERNEL);
1592
1593 if (iommu->domains) {
1594 size = 256 * sizeof(struct dmar_domain *);
1595 iommu->domains[0] = kzalloc(size, GFP_KERNEL);
1596 }
1597
1598 if (!iommu->domains || !iommu->domains[0]) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001599 pr_err("%s: Allocating domain array failed\n",
1600 iommu->name);
Jiang Liu852bdb02014-01-06 14:18:11 +08001601 kfree(iommu->domain_ids);
Joerg Roedel8bf47812015-07-21 10:41:21 +02001602 kfree(iommu->domains);
Jiang Liu852bdb02014-01-06 14:18:11 +08001603 iommu->domain_ids = NULL;
Joerg Roedel8bf47812015-07-21 10:41:21 +02001604 iommu->domains = NULL;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001605 return -ENOMEM;
1606 }
1607
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001610 /*
Joerg Roedelc0e8a6c2015-07-21 09:39:46 +02001611 * If Caching mode is set, then invalid translations are tagged
1612 * with domain-id 0, hence we need to pre-allocate it. We also
1613 * use domain-id 0 as a marker for non-allocated domain-id, so
1614 * make sure it is not used for a real domain.
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001615 */
Joerg Roedelc0e8a6c2015-07-21 09:39:46 +02001616 set_bit(0, iommu->domain_ids);
1617
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001618 return 0;
1619}
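
/*
 * Illustrative sketch of the two-level domain table sized above: the
 * set_iommu_domain()/get_iommu_domain() accessors elsewhere in this
 * file index it by splitting the domain-id, roughly:
 *
 *	struct dmar_domain **tbl = iommu->domains[did >> 8];
 *	domain = tbl ? tbl[did & 0xff] : NULL;
 *
 * so only the 256-entry chunks that are actually used get allocated.
 */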
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001620
Jiang Liuffebeb42014-11-09 22:48:02 +08001621static void disable_dmar_iommu(struct intel_iommu *iommu)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001622{
Joerg Roedel29a27712015-07-21 17:17:12 +02001623 struct device_domain_info *info, *tmp;
Joerg Roedel55d94042015-07-22 16:50:40 +02001624 unsigned long flags;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001625
Joerg Roedel29a27712015-07-21 17:17:12 +02001626 if (!iommu->domains || !iommu->domain_ids)
1627 return;
Jiang Liua4eaa862014-02-19 14:07:30 +08001628
Joerg Roedel55d94042015-07-22 16:50:40 +02001629 spin_lock_irqsave(&device_domain_lock, flags);
Joerg Roedel29a27712015-07-21 17:17:12 +02001630 list_for_each_entry_safe(info, tmp, &device_domain_list, global) {
1631 struct dmar_domain *domain;
1632
1633 if (info->iommu != iommu)
1634 continue;
1635
1636 if (!info->dev || !info->domain)
1637 continue;
1638
1639 domain = info->domain;
1640
Joerg Roedele6de0f82015-07-22 16:30:36 +02001641 dmar_remove_one_dev_info(domain, info->dev);
Joerg Roedel29a27712015-07-21 17:17:12 +02001642
1643 if (!domain_type_is_vm_or_si(domain))
1644 domain_exit(domain);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001645 }
Joerg Roedel55d94042015-07-22 16:50:40 +02001646 spin_unlock_irqrestore(&device_domain_lock, flags);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001647
1648 if (iommu->gcmd & DMA_GCMD_TE)
1649 iommu_disable_translation(iommu);
Jiang Liuffebeb42014-11-09 22:48:02 +08001650}
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001651
Jiang Liuffebeb42014-11-09 22:48:02 +08001652static void free_dmar_iommu(struct intel_iommu *iommu)
1653{
	if (iommu->domains && iommu->domain_ids) {
Joerg Roedel8bf47812015-07-21 10:41:21 +02001655 int elems = (cap_ndoms(iommu->cap) >> 8) + 1;
1656 int i;
1657
1658 for (i = 0; i < elems; i++)
1659 kfree(iommu->domains[i]);
Jiang Liuffebeb42014-11-09 22:48:02 +08001660 kfree(iommu->domains);
1661 kfree(iommu->domain_ids);
1662 iommu->domains = NULL;
1663 iommu->domain_ids = NULL;
1664 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001665
Weidong Hand9630fe2008-12-08 11:06:32 +08001666 g_iommus[iommu->seq_id] = NULL;
1667
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001668 /* free context mapping */
1669 free_context_table(iommu);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001670}
1671
Jiang Liuab8dfe22014-07-11 14:19:27 +08001672static struct dmar_domain *alloc_domain(int flags)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001673{
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001674 struct dmar_domain *domain;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001675
1676 domain = alloc_domain_mem();
1677 if (!domain)
1678 return NULL;
1679
Jiang Liuab8dfe22014-07-11 14:19:27 +08001680 memset(domain, 0, sizeof(*domain));
Suresh Siddha4c923d42009-10-02 11:01:24 -07001681 domain->nid = -1;
Jiang Liuab8dfe22014-07-11 14:19:27 +08001682 domain->flags = flags;
Jiang Liu92d03cc2014-02-19 14:07:28 +08001683 INIT_LIST_HEAD(&domain->devices);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001684
1685 return domain;
1686}
1687
Joerg Roedeld160aca2015-07-22 11:52:53 +02001688/* Must be called with iommu->lock */
1689static int domain_attach_iommu(struct dmar_domain *domain,
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001690 struct intel_iommu *iommu)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001691{
Jiang Liu44bde612014-07-11 14:19:29 +08001692 unsigned long ndomains;
Joerg Roedel55d94042015-07-22 16:50:40 +02001693 int num;
Jiang Liu44bde612014-07-11 14:19:29 +08001694
Joerg Roedel55d94042015-07-22 16:50:40 +02001695 assert_spin_locked(&device_domain_lock);
Joerg Roedeld160aca2015-07-22 11:52:53 +02001696 assert_spin_locked(&iommu->lock);
Jiang Liu44bde612014-07-11 14:19:29 +08001697
Joerg Roedel29a27712015-07-21 17:17:12 +02001698 domain->iommu_refcnt[iommu->seq_id] += 1;
1699 domain->iommu_count += 1;
1700 if (domain->iommu_refcnt[iommu->seq_id] == 1) {
Jiang Liufb170fb2014-07-11 14:19:28 +08001701 ndomains = cap_ndoms(iommu->cap);
Joerg Roedeld160aca2015-07-22 11:52:53 +02001702 num = find_first_zero_bit(iommu->domain_ids, ndomains);
1703
1704 if (num >= ndomains) {
1705 pr_err("%s: No free domain ids\n", iommu->name);
1706 domain->iommu_refcnt[iommu->seq_id] -= 1;
1707 domain->iommu_count -= 1;
Joerg Roedel55d94042015-07-22 16:50:40 +02001708 return -ENOSPC;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07001709 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001710
Joerg Roedeld160aca2015-07-22 11:52:53 +02001711 set_bit(num, iommu->domain_ids);
1712 set_iommu_domain(iommu, num, domain);
Jiang Liufb170fb2014-07-11 14:19:28 +08001713
Joerg Roedeld160aca2015-07-22 11:52:53 +02001714 domain->iommu_did[iommu->seq_id] = num;
1715 domain->nid = iommu->node;
1716
Jiang Liufb170fb2014-07-11 14:19:28 +08001717 domain_update_iommu_cap(domain);
1718 }
Joerg Roedeld160aca2015-07-22 11:52:53 +02001719
Joerg Roedel55d94042015-07-22 16:50:40 +02001720 return 0;
Jiang Liufb170fb2014-07-11 14:19:28 +08001721}
1722
1723static int domain_detach_iommu(struct dmar_domain *domain,
1724 struct intel_iommu *iommu)
1725{
Joerg Roedeld160aca2015-07-22 11:52:53 +02001726 int num, count = INT_MAX;
Jiang Liufb170fb2014-07-11 14:19:28 +08001727
Joerg Roedel55d94042015-07-22 16:50:40 +02001728 assert_spin_locked(&device_domain_lock);
Joerg Roedeld160aca2015-07-22 11:52:53 +02001729 assert_spin_locked(&iommu->lock);
Jiang Liufb170fb2014-07-11 14:19:28 +08001730
Joerg Roedel29a27712015-07-21 17:17:12 +02001731 domain->iommu_refcnt[iommu->seq_id] -= 1;
1732 count = --domain->iommu_count;
1733 if (domain->iommu_refcnt[iommu->seq_id] == 0) {
Joerg Roedeld160aca2015-07-22 11:52:53 +02001734 num = domain->iommu_did[iommu->seq_id];
1735 clear_bit(num, iommu->domain_ids);
1736 set_iommu_domain(iommu, num, NULL);
1737
Jiang Liufb170fb2014-07-11 14:19:28 +08001738 domain_update_iommu_cap(domain);
Joerg Roedelc0e8a6c2015-07-21 09:39:46 +02001739 domain->iommu_did[iommu->seq_id] = 0;
Jiang Liufb170fb2014-07-11 14:19:28 +08001740 }
Jiang Liufb170fb2014-07-11 14:19:28 +08001741
1742 return count;
1743}
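
/*
 * Usage sketch (for illustration): both helpers above expect the
 * caller to nest the locks the way dmar_insert_one_dev_info() does:
 *
 *	spin_lock_irqsave(&device_domain_lock, flags);
 *	spin_lock(&iommu->lock);
 *	ret = domain_attach_iommu(domain, iommu);
 *	spin_unlock(&iommu->lock);
 *	spin_unlock_irqrestore(&device_domain_lock, flags);
 */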
1744
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001745static struct iova_domain reserved_iova_list;
Mark Gross8a443df2008-03-04 14:59:31 -08001746static struct lock_class_key reserved_rbtree_key;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001747
Joseph Cihula51a63e62011-03-21 11:04:24 -07001748static int dmar_init_reserved_ranges(void)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001749{
1750 struct pci_dev *pdev = NULL;
1751 struct iova *iova;
1752 int i;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001753
Robin Murphy0fb5fe82015-01-12 17:51:16 +00001754 init_iova_domain(&reserved_iova_list, VTD_PAGE_SIZE, IOVA_START_PFN,
1755 DMA_32BIT_PFN);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001756
Mark Gross8a443df2008-03-04 14:59:31 -08001757 lockdep_set_class(&reserved_iova_list.iova_rbtree_lock,
1758 &reserved_rbtree_key);
1759
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001760 /* IOAPIC ranges shouldn't be accessed by DMA */
1761 iova = reserve_iova(&reserved_iova_list, IOVA_PFN(IOAPIC_RANGE_START),
1762 IOVA_PFN(IOAPIC_RANGE_END));
Joseph Cihula51a63e62011-03-21 11:04:24 -07001763 if (!iova) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001764 pr_err("Reserve IOAPIC range failed\n");
Joseph Cihula51a63e62011-03-21 11:04:24 -07001765 return -ENODEV;
1766 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001767
1768 /* Reserve all PCI MMIO to avoid peer-to-peer access */
1769 for_each_pci_dev(pdev) {
1770 struct resource *r;
1771
1772 for (i = 0; i < PCI_NUM_RESOURCES; i++) {
1773 r = &pdev->resource[i];
1774 if (!r->flags || !(r->flags & IORESOURCE_MEM))
1775 continue;
David Woodhouse1a4a4552009-06-28 16:00:42 +01001776 iova = reserve_iova(&reserved_iova_list,
1777 IOVA_PFN(r->start),
1778 IOVA_PFN(r->end));
Joseph Cihula51a63e62011-03-21 11:04:24 -07001779 if (!iova) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001780 pr_err("Reserve iova failed\n");
Joseph Cihula51a63e62011-03-21 11:04:24 -07001781 return -ENODEV;
1782 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001783 }
1784 }
Joseph Cihula51a63e62011-03-21 11:04:24 -07001785 return 0;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001786}
1787
1788static void domain_reserve_special_ranges(struct dmar_domain *domain)
1789{
1790 copy_reserved_iova(&reserved_iova_list, &domain->iovad);
1791}
1792
1793static inline int guestwidth_to_adjustwidth(int gaw)
1794{
1795 int agaw;
1796 int r = (gaw - 12) % 9;
1797
1798 if (r == 0)
1799 agaw = gaw;
1800 else
1801 agaw = gaw + 9 - r;
1802 if (agaw > 64)
1803 agaw = 64;
1804 return agaw;
1805}
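
/*
 * Worked examples for the rounding above (each page-table level
 * resolves 9 bits on top of the 12-bit page offset): gaw = 48 gives
 * r = (48 - 12) % 9 = 0 and agaw = 48; gaw = 40 gives r = 1 and
 * agaw = 40 + 9 - 1 = 48; anything above 64 is clamped to 64.
 */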
1806
Joerg Roedeldc534b22015-07-22 12:44:02 +02001807static int domain_init(struct dmar_domain *domain, struct intel_iommu *iommu,
1808 int guest_width)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001809{
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001810 int adjust_width, agaw;
1811 unsigned long sagaw;
1812
Robin Murphy0fb5fe82015-01-12 17:51:16 +00001813 init_iova_domain(&domain->iovad, VTD_PAGE_SIZE, IOVA_START_PFN,
1814 DMA_32BIT_PFN);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001815 domain_reserve_special_ranges(domain);
1816
1817 /* calculate AGAW */
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001818 if (guest_width > cap_mgaw(iommu->cap))
1819 guest_width = cap_mgaw(iommu->cap);
1820 domain->gaw = guest_width;
1821 adjust_width = guestwidth_to_adjustwidth(guest_width);
1822 agaw = width_to_agaw(adjust_width);
1823 sagaw = cap_sagaw(iommu->cap);
1824 if (!test_bit(agaw, &sagaw)) {
1825 /* hardware doesn't support it, choose a bigger one */
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02001826 pr_debug("Hardware doesn't support agaw %d\n", agaw);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001827 agaw = find_next_bit(&sagaw, 5, agaw);
1828 if (agaw >= 5)
1829 return -ENODEV;
1830 }
1831 domain->agaw = agaw;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001832
Weidong Han8e6040972008-12-08 15:49:06 +08001833 if (ecap_coherent(iommu->ecap))
1834 domain->iommu_coherency = 1;
1835 else
1836 domain->iommu_coherency = 0;
1837
Sheng Yang58c610b2009-03-18 15:33:05 +08001838 if (ecap_sc_support(iommu->ecap))
1839 domain->iommu_snooping = 1;
1840 else
1841 domain->iommu_snooping = 0;
1842
David Woodhouse214e39a2014-03-19 10:38:49 +00001843 if (intel_iommu_superpage)
1844 domain->iommu_superpage = fls(cap_super_page_val(iommu->cap));
1845 else
1846 domain->iommu_superpage = 0;
1847
Suresh Siddha4c923d42009-10-02 11:01:24 -07001848 domain->nid = iommu->node;
Weidong Hanc7151a82008-12-08 22:51:37 +08001849
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001850 /* always allocate the top pgd */
Suresh Siddha4c923d42009-10-02 11:01:24 -07001851 domain->pgd = (struct dma_pte *)alloc_pgtable_page(domain->nid);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001852 if (!domain->pgd)
1853 return -ENOMEM;
Fenghua Yu5b6985c2008-10-16 18:02:32 -07001854 __iommu_flush_cache(iommu, domain->pgd, PAGE_SIZE);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001855 return 0;
1856}
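
/*
 * Illustrative example of the AGAW selection in domain_init(): with
 * guest_width = 48, adjust_width is 48 and width_to_agaw(48) = 2, i.e.
 * a 4-level table; if bit 2 of cap_sagaw() were clear, the loop would
 * move up to the next supported width, e.g. agaw = 3 (57 bits).
 */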
1857
1858static void domain_exit(struct dmar_domain *domain)
1859{
David Woodhouseea8ea462014-03-05 17:09:32 +00001860 struct page *freelist = NULL;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001861
	/* Domain 0 is reserved, so don't process it */
1863 if (!domain)
1864 return;
1865
Alex Williamson7b668352011-05-24 12:02:41 +01001866 /* Flush any lazy unmaps that may reference this domain */
1867 if (!intel_iommu_strict)
1868 flush_unmaps_timeout(0);
1869
Joerg Roedeld160aca2015-07-22 11:52:53 +02001870 /* Remove associated devices and clear attached or cached domains */
1871 rcu_read_lock();
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001872 domain_remove_dev_info(domain);
Joerg Roedeld160aca2015-07-22 11:52:53 +02001873 rcu_read_unlock();
Jiang Liu92d03cc2014-02-19 14:07:28 +08001874
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001875 /* destroy iovas */
1876 put_iova_domain(&domain->iovad);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001877
David Woodhouseea8ea462014-03-05 17:09:32 +00001878 freelist = domain_unmap(domain, 0, DOMAIN_MAX_PFN(domain->gaw));
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001879
David Woodhouseea8ea462014-03-05 17:09:32 +00001880 dma_free_pagelist(freelist);
1881
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001882 free_domain_mem(domain);
1883}
1884
David Woodhouse64ae8922014-03-09 12:52:30 -07001885static int domain_context_mapping_one(struct dmar_domain *domain,
1886 struct intel_iommu *iommu,
Joerg Roedel28ccce02015-07-21 14:45:31 +02001887 u8 bus, u8 devfn)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001888{
Joerg Roedelc6c2ceb2015-07-22 13:11:53 +02001889 u16 did = domain->iommu_did[iommu->seq_id];
Joerg Roedel28ccce02015-07-21 14:45:31 +02001890 int translation = CONTEXT_TT_MULTI_LEVEL;
1891 struct device_domain_info *info = NULL;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001892 struct context_entry *context;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001893 unsigned long flags;
Weidong Hanea6606b2008-12-08 23:08:15 +08001894 struct dma_pte *pgd;
Joerg Roedel55d94042015-07-22 16:50:40 +02001895 int ret, agaw;
Joerg Roedel28ccce02015-07-21 14:45:31 +02001896
Joerg Roedelc6c2ceb2015-07-22 13:11:53 +02001897 WARN_ON(did == 0);
1898
Joerg Roedel28ccce02015-07-21 14:45:31 +02001899 if (hw_pass_through && domain_type_is_si(domain))
1900 translation = CONTEXT_TT_PASS_THROUGH;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001901
1902 pr_debug("Set context mapping for %02x:%02x.%d\n",
1903 bus, PCI_SLOT(devfn), PCI_FUNC(devfn));
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001904
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001905 BUG_ON(!domain->pgd);
Weidong Han5331fe62008-12-08 23:00:00 +08001906
Joerg Roedel55d94042015-07-22 16:50:40 +02001907 spin_lock_irqsave(&device_domain_lock, flags);
1908 spin_lock(&iommu->lock);
1909
1910 ret = -ENOMEM;
David Woodhouse03ecc322015-02-13 14:35:21 +00001911 context = iommu_context_addr(iommu, bus, devfn, 1);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001912 if (!context)
Joerg Roedel55d94042015-07-22 16:50:40 +02001913 goto out_unlock;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001914
Joerg Roedel55d94042015-07-22 16:50:40 +02001915 ret = 0;
1916 if (context_present(context))
1917 goto out_unlock;
Joerg Roedelcf484d02015-06-12 12:21:46 +02001918
Weidong Hanea6606b2008-12-08 23:08:15 +08001919 pgd = domain->pgd;
1920
Joerg Roedelde24e552015-07-21 14:53:04 +02001921 context_clear_entry(context);
Joerg Roedelc6c2ceb2015-07-22 13:11:53 +02001922 context_set_domain_id(context, did);
Weidong Hanea6606b2008-12-08 23:08:15 +08001923
Joerg Roedelde24e552015-07-21 14:53:04 +02001924 /*
	 * Skip the top levels of the page tables when the IOMMU's agaw is
	 * smaller than the domain's default. Unnecessary for PT mode.
1927 */
Yu Zhao93a23a72009-05-18 13:51:37 +08001928 if (translation != CONTEXT_TT_PASS_THROUGH) {
Joerg Roedelde24e552015-07-21 14:53:04 +02001929 for (agaw = domain->agaw; agaw != iommu->agaw; agaw--) {
Joerg Roedel55d94042015-07-22 16:50:40 +02001930 ret = -ENOMEM;
Joerg Roedelde24e552015-07-21 14:53:04 +02001931 pgd = phys_to_virt(dma_pte_addr(pgd));
Joerg Roedel55d94042015-07-22 16:50:40 +02001932 if (!dma_pte_present(pgd))
1933 goto out_unlock;
Joerg Roedelde24e552015-07-21 14:53:04 +02001934 }
1935
David Woodhouse64ae8922014-03-09 12:52:30 -07001936 info = iommu_support_dev_iotlb(domain, iommu, bus, devfn);
Yu Zhao93a23a72009-05-18 13:51:37 +08001937 translation = info ? CONTEXT_TT_DEV_IOTLB :
1938 CONTEXT_TT_MULTI_LEVEL;
Joerg Roedelde24e552015-07-21 14:53:04 +02001939
Yu Zhao93a23a72009-05-18 13:51:37 +08001940 context_set_address_root(context, virt_to_phys(pgd));
1941 context_set_address_width(context, iommu->agaw);
Joerg Roedelde24e552015-07-21 14:53:04 +02001942 } else {
1943 /*
1944 * In pass through mode, AW must be programmed to
1945 * indicate the largest AGAW value supported by
1946 * hardware. And ASR is ignored by hardware.
1947 */
1948 context_set_address_width(context, iommu->msagaw);
Yu Zhao93a23a72009-05-18 13:51:37 +08001949 }
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07001950
1951 context_set_translation_type(context, translation);
Mark McLoughlinc07e7d22008-11-21 16:54:46 +00001952 context_set_fault_enable(context);
1953 context_set_present(context);
Weidong Han5331fe62008-12-08 23:00:00 +08001954 domain_flush_cache(domain, context, sizeof(*context));
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001955
David Woodhouse4c25a2c2009-05-10 17:16:06 +01001956 /*
	 * It's a non-present to present mapping. If hardware doesn't cache
	 * non-present entries we only need to flush the write-buffer. If it
	 * _does_ cache non-present entries, then it does so in the special
1960 * domain #0, which we have to flush:
1961 */
1962 if (cap_caching_mode(iommu->cap)) {
1963 iommu->flush.flush_context(iommu, 0,
1964 (((u16)bus) << 8) | devfn,
1965 DMA_CCMD_MASK_NOBIT,
1966 DMA_CCMD_DEVICE_INVL);
Joerg Roedelc6c2ceb2015-07-22 13:11:53 +02001967 iommu->flush.flush_iotlb(iommu, did, 0, 0, DMA_TLB_DSI_FLUSH);
David Woodhouse4c25a2c2009-05-10 17:16:06 +01001968 } else {
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001969 iommu_flush_write_buffer(iommu);
David Woodhouse4c25a2c2009-05-10 17:16:06 +01001970 }
Yu Zhao93a23a72009-05-18 13:51:37 +08001971 iommu_enable_dev_iotlb(info);
Weidong Hanc7151a82008-12-08 22:51:37 +08001972
Joerg Roedel55d94042015-07-22 16:50:40 +02001973 ret = 0;
1974
1975out_unlock:
1976 spin_unlock(&iommu->lock);
1977 spin_unlock_irqrestore(&device_domain_lock, flags);
Jiang Liufb170fb2014-07-11 14:19:28 +08001978
	return ret;
1980}
1981
Alex Williamson579305f2014-07-03 09:51:43 -06001982struct domain_context_mapping_data {
1983 struct dmar_domain *domain;
1984 struct intel_iommu *iommu;
Alex Williamson579305f2014-07-03 09:51:43 -06001985};
1986
1987static int domain_context_mapping_cb(struct pci_dev *pdev,
1988 u16 alias, void *opaque)
1989{
1990 struct domain_context_mapping_data *data = opaque;
1991
1992 return domain_context_mapping_one(data->domain, data->iommu,
Joerg Roedel28ccce02015-07-21 14:45:31 +02001993 PCI_BUS_NUM(alias), alias & 0xff);
Alex Williamson579305f2014-07-03 09:51:43 -06001994}
1995
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001996static int
Joerg Roedel28ccce02015-07-21 14:45:31 +02001997domain_context_mapping(struct dmar_domain *domain, struct device *dev)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07001998{
David Woodhouse64ae8922014-03-09 12:52:30 -07001999 struct intel_iommu *iommu;
David Woodhouse156baca2014-03-09 14:00:57 -07002000 u8 bus, devfn;
Alex Williamson579305f2014-07-03 09:51:43 -06002001 struct domain_context_mapping_data data;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002002
David Woodhousee1f167f2014-03-09 15:24:46 -07002003 iommu = device_to_iommu(dev, &bus, &devfn);
David Woodhouse64ae8922014-03-09 12:52:30 -07002004 if (!iommu)
2005 return -ENODEV;
2006
Alex Williamson579305f2014-07-03 09:51:43 -06002007 if (!dev_is_pci(dev))
Joerg Roedel28ccce02015-07-21 14:45:31 +02002008 return domain_context_mapping_one(domain, iommu, bus, devfn);
Alex Williamson579305f2014-07-03 09:51:43 -06002009
2010 data.domain = domain;
2011 data.iommu = iommu;
Alex Williamson579305f2014-07-03 09:51:43 -06002012
2013 return pci_for_each_dma_alias(to_pci_dev(dev),
2014 &domain_context_mapping_cb, &data);
2015}
2016
2017static int domain_context_mapped_cb(struct pci_dev *pdev,
2018 u16 alias, void *opaque)
2019{
2020 struct intel_iommu *iommu = opaque;
2021
2022 return !device_context_mapped(iommu, PCI_BUS_NUM(alias), alias & 0xff);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002023}
2024
David Woodhousee1f167f2014-03-09 15:24:46 -07002025static int domain_context_mapped(struct device *dev)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002026{
Weidong Han5331fe62008-12-08 23:00:00 +08002027 struct intel_iommu *iommu;
David Woodhouse156baca2014-03-09 14:00:57 -07002028 u8 bus, devfn;
Weidong Han5331fe62008-12-08 23:00:00 +08002029
David Woodhousee1f167f2014-03-09 15:24:46 -07002030 iommu = device_to_iommu(dev, &bus, &devfn);
Weidong Han5331fe62008-12-08 23:00:00 +08002031 if (!iommu)
2032 return -ENODEV;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002033
Alex Williamson579305f2014-07-03 09:51:43 -06002034 if (!dev_is_pci(dev))
2035 return device_context_mapped(iommu, bus, devfn);
David Woodhousee1f167f2014-03-09 15:24:46 -07002036
Alex Williamson579305f2014-07-03 09:51:43 -06002037 return !pci_for_each_dma_alias(to_pci_dev(dev),
2038 domain_context_mapped_cb, iommu);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002039}
2040
/* Returns the number of VT-d pages, but aligned to the MM page size */
2042static inline unsigned long aligned_nrpages(unsigned long host_addr,
2043 size_t size)
2044{
2045 host_addr &= ~PAGE_MASK;
2046 return PAGE_ALIGN(host_addr + size) >> VTD_PAGE_SHIFT;
2047}
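
/*
 * Worked example (4KiB MM and VT-d pages assumed): for
 * host_addr = 0x1001 and size = 0x1000, the in-page offset is 0x001
 * and PAGE_ALIGN(0x001 + 0x1000) = 0x2000, so the buffer spans
 * 0x2000 >> VTD_PAGE_SHIFT = 2 VT-d pages even though it is only one
 * page long.
 */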
2048
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002049/* Return largest possible superpage level for a given mapping */
2050static inline int hardware_largepage_caps(struct dmar_domain *domain,
2051 unsigned long iov_pfn,
2052 unsigned long phy_pfn,
2053 unsigned long pages)
2054{
2055 int support, level = 1;
2056 unsigned long pfnmerge;
2057
2058 support = domain->iommu_superpage;
2059
2060 /* To use a large page, the virtual *and* physical addresses
2061 must be aligned to 2MiB/1GiB/etc. Lower bits set in either
2062 of them will mean we have to use smaller pages. So just
2063 merge them and check both at once. */
2064 pfnmerge = iov_pfn | phy_pfn;
2065
2066 while (support && !(pfnmerge & ~VTD_STRIDE_MASK)) {
2067 pages >>= VTD_STRIDE_SHIFT;
2068 if (!pages)
2069 break;
2070 pfnmerge >>= VTD_STRIDE_SHIFT;
2071 level++;
2072 support--;
2073 }
2074 return level;
2075}
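
/*
 * Worked example (values chosen for illustration): with
 * domain->iommu_superpage = 1, iov_pfn = 0x200, phy_pfn = 0x400 and
 * pages = 512, pfnmerge = 0x600 has its low nine bits clear and
 * 512 >> VTD_STRIDE_SHIFT = 1, so the loop returns level 2 and the
 * range can be mapped with a single 2MiB superpage.
 */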
2076
David Woodhouse9051aa02009-06-29 12:30:54 +01002077static int __domain_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
2078 struct scatterlist *sg, unsigned long phys_pfn,
2079 unsigned long nr_pages, int prot)
David Woodhousee1605492009-06-29 11:17:38 +01002080{
2081 struct dma_pte *first_pte = NULL, *pte = NULL;
David Woodhouse9051aa02009-06-29 12:30:54 +01002082 phys_addr_t uninitialized_var(pteval);
Jiang Liucc4f14a2014-11-26 09:42:10 +08002083 unsigned long sg_res = 0;
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002084 unsigned int largepage_lvl = 0;
2085 unsigned long lvl_pages = 0;
David Woodhousee1605492009-06-29 11:17:38 +01002086
Jiang Liu162d1b12014-07-11 14:19:35 +08002087 BUG_ON(!domain_pfn_supported(domain, iov_pfn + nr_pages - 1));
David Woodhousee1605492009-06-29 11:17:38 +01002088
2089 if ((prot & (DMA_PTE_READ|DMA_PTE_WRITE)) == 0)
2090 return -EINVAL;
2091
2092 prot &= DMA_PTE_READ | DMA_PTE_WRITE | DMA_PTE_SNP;
2093
Jiang Liucc4f14a2014-11-26 09:42:10 +08002094 if (!sg) {
2095 sg_res = nr_pages;
David Woodhouse9051aa02009-06-29 12:30:54 +01002096 pteval = ((phys_addr_t)phys_pfn << VTD_PAGE_SHIFT) | prot;
2097 }
2098
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002099 while (nr_pages > 0) {
David Woodhousec85994e2009-07-01 19:21:24 +01002100 uint64_t tmp;
2101
David Woodhousee1605492009-06-29 11:17:38 +01002102 if (!sg_res) {
Fenghua Yuf5329592009-08-04 15:09:37 -07002103 sg_res = aligned_nrpages(sg->offset, sg->length);
David Woodhousee1605492009-06-29 11:17:38 +01002104 sg->dma_address = ((dma_addr_t)iov_pfn << VTD_PAGE_SHIFT) + sg->offset;
2105 sg->dma_length = sg->length;
Dan Williamsdb0fa0c2015-08-17 08:13:26 -06002106 pteval = (sg_phys(sg) & PAGE_MASK) | prot;
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002107 phys_pfn = pteval >> VTD_PAGE_SHIFT;
David Woodhousee1605492009-06-29 11:17:38 +01002108 }
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002109
David Woodhousee1605492009-06-29 11:17:38 +01002110 if (!pte) {
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002111 largepage_lvl = hardware_largepage_caps(domain, iov_pfn, phys_pfn, sg_res);
2112
David Woodhouse5cf0a762014-03-19 16:07:49 +00002113 first_pte = pte = pfn_to_dma_pte(domain, iov_pfn, &largepage_lvl);
David Woodhousee1605492009-06-29 11:17:38 +01002114 if (!pte)
2115 return -ENOMEM;
			/* It is a large page */
Woodhouse, David6491d4d2012-12-19 13:25:35 +00002117 if (largepage_lvl > 1) {
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002118 pteval |= DMA_PTE_LARGE_PAGE;
Jiang Liud41a4ad2014-07-11 14:19:34 +08002119 lvl_pages = lvl_to_nr_pages(largepage_lvl);
2120 /*
2121 * Ensure that old small page tables are
2122 * removed to make room for superpage,
2123 * if they exist.
2124 */
Woodhouse, David6491d4d2012-12-19 13:25:35 +00002125 dma_pte_free_pagetable(domain, iov_pfn,
Jiang Liud41a4ad2014-07-11 14:19:34 +08002126 iov_pfn + lvl_pages - 1);
Woodhouse, David6491d4d2012-12-19 13:25:35 +00002127 } else {
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002128 pteval &= ~(uint64_t)DMA_PTE_LARGE_PAGE;
Woodhouse, David6491d4d2012-12-19 13:25:35 +00002129 }
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002130
David Woodhousee1605492009-06-29 11:17:38 +01002131 }
		/* We don't need a lock here; nobody else
		 * touches the iova range
2134 */
David Woodhouse7766a3f2009-07-01 20:27:03 +01002135 tmp = cmpxchg64_local(&pte->val, 0ULL, pteval);
David Woodhousec85994e2009-07-01 19:21:24 +01002136 if (tmp) {
David Woodhouse1bf20f02009-06-29 22:06:43 +01002137 static int dumps = 5;
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002138 pr_crit("ERROR: DMA PTE for vPFN 0x%lx already set (to %llx not %llx)\n",
2139 iov_pfn, tmp, (unsigned long long)pteval);
David Woodhouse1bf20f02009-06-29 22:06:43 +01002140 if (dumps) {
2141 dumps--;
2142 debug_dma_dump_mappings(NULL);
2143 }
2144 WARN_ON(1);
2145 }
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002146
2147 lvl_pages = lvl_to_nr_pages(largepage_lvl);
2148
2149 BUG_ON(nr_pages < lvl_pages);
2150 BUG_ON(sg_res < lvl_pages);
2151
2152 nr_pages -= lvl_pages;
2153 iov_pfn += lvl_pages;
2154 phys_pfn += lvl_pages;
2155 pteval += lvl_pages * VTD_PAGE_SIZE;
2156 sg_res -= lvl_pages;
2157
2158 /* If the next PTE would be the first in a new page, then we
2159 need to flush the cache on the entries we've just written.
2160 And then we'll need to recalculate 'pte', so clear it and
2161 let it get set again in the if (!pte) block above.
2162
2163 If we're done (!nr_pages) we need to flush the cache too.
2164
2165 Also if we've been setting superpages, we may need to
2166 recalculate 'pte' and switch back to smaller pages for the
2167 end of the mapping, if the trailing size is not enough to
2168 use another superpage (i.e. sg_res < lvl_pages). */
David Woodhousee1605492009-06-29 11:17:38 +01002169 pte++;
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002170 if (!nr_pages || first_pte_in_page(pte) ||
2171 (largepage_lvl > 1 && sg_res < lvl_pages)) {
David Woodhousee1605492009-06-29 11:17:38 +01002172 domain_flush_cache(domain, first_pte,
2173 (void *)pte - (void *)first_pte);
2174 pte = NULL;
2175 }
Youquan Song6dd9a7c2011-05-25 19:13:49 +01002176
2177 if (!sg_res && nr_pages)
David Woodhousee1605492009-06-29 11:17:38 +01002178 sg = sg_next(sg);
2179 }
2180 return 0;
2181}
2182
David Woodhouse9051aa02009-06-29 12:30:54 +01002183static inline int domain_sg_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
2184 struct scatterlist *sg, unsigned long nr_pages,
2185 int prot)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002186{
David Woodhouse9051aa02009-06-29 12:30:54 +01002187 return __domain_mapping(domain, iov_pfn, sg, 0, nr_pages, prot);
2188}
Fenghua Yu5b6985c2008-10-16 18:02:32 -07002189
David Woodhouse9051aa02009-06-29 12:30:54 +01002190static inline int domain_pfn_mapping(struct dmar_domain *domain, unsigned long iov_pfn,
2191 unsigned long phys_pfn, unsigned long nr_pages,
2192 int prot)
2193{
2194 return __domain_mapping(domain, iov_pfn, NULL, phys_pfn, nr_pages, prot);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002195}
2196
Joerg Roedel2452d9d2015-07-23 16:20:14 +02002197static void domain_context_clear_one(struct intel_iommu *iommu, u8 bus, u8 devfn)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002198{
Weidong Hanc7151a82008-12-08 22:51:37 +08002199 if (!iommu)
2200 return;
Weidong Han8c11e792008-12-08 15:29:22 +08002201
2202 clear_context_table(iommu, bus, devfn);
2203 iommu->flush.flush_context(iommu, 0, 0, 0,
David Woodhouse4c25a2c2009-05-10 17:16:06 +01002204 DMA_CCMD_GLOBAL_INVL);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01002205 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002206}
2207
David Woodhouse109b9b02012-05-25 17:43:02 +01002208static inline void unlink_domain_info(struct device_domain_info *info)
2209{
2210 assert_spin_locked(&device_domain_lock);
2211 list_del(&info->link);
2212 list_del(&info->global);
2213 if (info->dev)
David Woodhouse0bcb3e22014-03-06 17:12:03 +00002214 info->dev->archdata.iommu = NULL;
David Woodhouse109b9b02012-05-25 17:43:02 +01002215}
2216
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002217static void domain_remove_dev_info(struct dmar_domain *domain)
2218{
Yijing Wang3a74ca02014-05-20 20:37:47 +08002219 struct device_domain_info *info, *tmp;
Jiang Liufb170fb2014-07-11 14:19:28 +08002220 unsigned long flags;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002221
2222 spin_lock_irqsave(&device_domain_lock, flags);
Joerg Roedel76f45fe2015-07-21 18:25:11 +02002223 list_for_each_entry_safe(info, tmp, &domain->devices, link)
Joerg Roedel127c7612015-07-23 17:44:46 +02002224 __dmar_remove_one_dev_info(info);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002225 spin_unlock_irqrestore(&device_domain_lock, flags);
2226}
2227
2228/*
2229 * find_domain
 * Note: struct device->archdata.iommu stores the domain info
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002231 */
David Woodhouse1525a292014-03-06 16:19:30 +00002232static struct dmar_domain *find_domain(struct device *dev)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002233{
2234 struct device_domain_info *info;
2235
2236 /* No lock here, assumes no domain exit in normal case */
David Woodhouse1525a292014-03-06 16:19:30 +00002237 info = dev->archdata.iommu;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002238 if (info)
2239 return info->domain;
2240 return NULL;
2241}
2242
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002243static inline struct device_domain_info *
Jiang Liu745f2582014-02-19 14:07:26 +08002244dmar_search_domain_by_dev_info(int segment, int bus, int devfn)
2245{
2246 struct device_domain_info *info;
2247
2248 list_for_each_entry(info, &device_domain_list, global)
David Woodhouse41e80dca2014-03-09 13:55:54 -07002249 if (info->iommu->segment == segment && info->bus == bus &&
Jiang Liu745f2582014-02-19 14:07:26 +08002250 info->devfn == devfn)
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002251 return info;
Jiang Liu745f2582014-02-19 14:07:26 +08002252
2253 return NULL;
2254}
2255
Joerg Roedel5db31562015-07-22 12:40:43 +02002256static struct dmar_domain *dmar_insert_one_dev_info(struct intel_iommu *iommu,
2257 int bus, int devfn,
2258 struct device *dev,
2259 struct dmar_domain *domain)
Jiang Liu745f2582014-02-19 14:07:26 +08002260{
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002261 struct dmar_domain *found = NULL;
Jiang Liu745f2582014-02-19 14:07:26 +08002262 struct device_domain_info *info;
2263 unsigned long flags;
Joerg Roedeld160aca2015-07-22 11:52:53 +02002264 int ret;
Jiang Liu745f2582014-02-19 14:07:26 +08002265
2266 info = alloc_devinfo_mem();
2267 if (!info)
David Woodhouseb718cd32014-03-09 13:11:33 -07002268 return NULL;
Jiang Liu745f2582014-02-19 14:07:26 +08002269
Jiang Liu745f2582014-02-19 14:07:26 +08002270 info->bus = bus;
2271 info->devfn = devfn;
Bjorn Helgaasfb0cc3a2015-07-20 09:10:36 -05002272 info->ats.enabled = 0;
2273 info->ats.qdep = 0;
Jiang Liu745f2582014-02-19 14:07:26 +08002274 info->dev = dev;
2275 info->domain = domain;
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002276 info->iommu = iommu;
Jiang Liu745f2582014-02-19 14:07:26 +08002277
2278 spin_lock_irqsave(&device_domain_lock, flags);
2279 if (dev)
David Woodhouse0bcb3e22014-03-06 17:12:03 +00002280 found = find_domain(dev);
Joerg Roedelf303e502015-07-23 18:37:13 +02002281
2282 if (!found) {
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002283 struct device_domain_info *info2;
David Woodhouse41e80dca2014-03-09 13:55:54 -07002284 info2 = dmar_search_domain_by_dev_info(iommu->segment, bus, devfn);
Joerg Roedelf303e502015-07-23 18:37:13 +02002285 if (info2) {
2286 found = info2->domain;
2287 info2->dev = dev;
2288 }
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002289 }
Joerg Roedelf303e502015-07-23 18:37:13 +02002290
Jiang Liu745f2582014-02-19 14:07:26 +08002291 if (found) {
2292 spin_unlock_irqrestore(&device_domain_lock, flags);
2293 free_devinfo_mem(info);
David Woodhouseb718cd32014-03-09 13:11:33 -07002294 /* Caller must free the original domain */
2295 return found;
Jiang Liu745f2582014-02-19 14:07:26 +08002296 }
2297
Joerg Roedeld160aca2015-07-22 11:52:53 +02002298 spin_lock(&iommu->lock);
2299 ret = domain_attach_iommu(domain, iommu);
2300 spin_unlock(&iommu->lock);
2301
2302 if (ret) {
Joerg Roedelc6c2ceb2015-07-22 13:11:53 +02002303 spin_unlock_irqrestore(&device_domain_lock, flags);
Sudip Mukherjee499f3aa2015-09-18 16:27:07 +05302304 free_devinfo_mem(info);
Joerg Roedelc6c2ceb2015-07-22 13:11:53 +02002305 return NULL;
2306 }
Joerg Roedelc6c2ceb2015-07-22 13:11:53 +02002307
David Woodhouseb718cd32014-03-09 13:11:33 -07002308 list_add(&info->link, &domain->devices);
2309 list_add(&info->global, &device_domain_list);
2310 if (dev)
2311 dev->archdata.iommu = info;
2312 spin_unlock_irqrestore(&device_domain_lock, flags);
2313
Joerg Roedelcc4e2572015-07-22 10:04:36 +02002314 if (dev && domain_context_mapping(domain, dev)) {
2315 pr_err("Domain context map for %s failed\n", dev_name(dev));
Joerg Roedele6de0f82015-07-22 16:30:36 +02002316 dmar_remove_one_dev_info(domain, dev);
Joerg Roedelcc4e2572015-07-22 10:04:36 +02002317 return NULL;
2318 }
2319
David Woodhouseb718cd32014-03-09 13:11:33 -07002320 return domain;
Jiang Liu745f2582014-02-19 14:07:26 +08002321}
2322
Alex Williamson579305f2014-07-03 09:51:43 -06002323static int get_last_alias(struct pci_dev *pdev, u16 alias, void *opaque)
2324{
2325 *(u16 *)opaque = alias;
2326 return 0;
2327}
2328
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002329/* domain is initialized */
David Woodhouse146922e2014-03-09 15:44:17 -07002330static struct dmar_domain *get_domain_for_dev(struct device *dev, int gaw)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002331{
Joerg Roedelcc4e2572015-07-22 10:04:36 +02002332 struct device_domain_info *info = NULL;
Alex Williamson579305f2014-07-03 09:51:43 -06002333 struct dmar_domain *domain, *tmp;
2334 struct intel_iommu *iommu;
Joerg Roedel08a7f452015-07-23 18:09:11 +02002335 u16 req_id, dma_alias;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002336 unsigned long flags;
Yijing Wangaa4d0662014-05-26 20:14:06 +08002337 u8 bus, devfn;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002338
David Woodhouse146922e2014-03-09 15:44:17 -07002339 domain = find_domain(dev);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002340 if (domain)
2341 return domain;
2342
David Woodhouse146922e2014-03-09 15:44:17 -07002343 iommu = device_to_iommu(dev, &bus, &devfn);
2344 if (!iommu)
Alex Williamson579305f2014-07-03 09:51:43 -06002345 return NULL;
2346
Joerg Roedel08a7f452015-07-23 18:09:11 +02002347 req_id = ((u16)bus << 8) | devfn;
2348
Alex Williamson579305f2014-07-03 09:51:43 -06002349 if (dev_is_pci(dev)) {
2350 struct pci_dev *pdev = to_pci_dev(dev);
2351
2352 pci_for_each_dma_alias(pdev, get_last_alias, &dma_alias);
2353
2354 spin_lock_irqsave(&device_domain_lock, flags);
2355 info = dmar_search_domain_by_dev_info(pci_domain_nr(pdev->bus),
2356 PCI_BUS_NUM(dma_alias),
2357 dma_alias & 0xff);
2358 if (info) {
2359 iommu = info->iommu;
2360 domain = info->domain;
2361 }
2362 spin_unlock_irqrestore(&device_domain_lock, flags);
2363
		/* DMA alias already has a domain, use it */
2365 if (info)
2366 goto found_domain;
2367 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002368
David Woodhouse146922e2014-03-09 15:44:17 -07002369 /* Allocate and initialize new domain for the device */
Jiang Liuab8dfe22014-07-11 14:19:27 +08002370 domain = alloc_domain(0);
Jiang Liu745f2582014-02-19 14:07:26 +08002371 if (!domain)
Alex Williamson579305f2014-07-03 09:51:43 -06002372 return NULL;
Joerg Roedeldc534b22015-07-22 12:44:02 +02002373 if (domain_init(domain, iommu, gaw)) {
Alex Williamson579305f2014-07-03 09:51:43 -06002374 domain_exit(domain);
2375 return NULL;
2376 }
2377
2378 /* register PCI DMA alias device */
	if (dev_is_pci(dev) && req_id != dma_alias) {
Joerg Roedel5db31562015-07-22 12:40:43 +02002380 tmp = dmar_insert_one_dev_info(iommu, PCI_BUS_NUM(dma_alias),
2381 dma_alias & 0xff, NULL, domain);
Alex Williamson579305f2014-07-03 09:51:43 -06002382
2383 if (!tmp || tmp != domain) {
2384 domain_exit(domain);
2385 domain = tmp;
2386 }
2387
David Woodhouseb718cd32014-03-09 13:11:33 -07002388 if (!domain)
Alex Williamson579305f2014-07-03 09:51:43 -06002389 return NULL;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002390 }
2391
2392found_domain:
Joerg Roedel5db31562015-07-22 12:40:43 +02002393 tmp = dmar_insert_one_dev_info(iommu, bus, devfn, dev, domain);
Alex Williamson579305f2014-07-03 09:51:43 -06002394
2395 if (!tmp || tmp != domain) {
2396 domain_exit(domain);
2397 domain = tmp;
2398 }
David Woodhouseb718cd32014-03-09 13:11:33 -07002399
2400 return domain;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002401}
2402
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002403static int iommu_identity_mapping;
David Woodhousee0fc7e02009-09-30 09:12:17 -07002404#define IDENTMAP_ALL 1
2405#define IDENTMAP_GFX 2
2406#define IDENTMAP_AZALIA 4
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002407
David Woodhouseb2132032009-06-26 18:50:28 +01002408static int iommu_domain_identity_map(struct dmar_domain *domain,
2409 unsigned long long start,
2410 unsigned long long end)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002411{
David Woodhousec5395d52009-06-28 16:35:56 +01002412 unsigned long first_vpfn = start >> VTD_PAGE_SHIFT;
2413 unsigned long last_vpfn = end >> VTD_PAGE_SHIFT;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002414
David Woodhousec5395d52009-06-28 16:35:56 +01002415 if (!reserve_iova(&domain->iovad, dma_to_mm_pfn(first_vpfn),
2416 dma_to_mm_pfn(last_vpfn))) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002417 pr_err("Reserving iova failed\n");
David Woodhouseb2132032009-06-26 18:50:28 +01002418 return -ENOMEM;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002419 }
2420
Joerg Roedelaf1089c2015-07-21 15:45:19 +02002421 pr_debug("Mapping reserved region %llx-%llx\n", start, end);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002422 /*
2423 * RMRR range might have overlap with physical memory range,
2424 * clear it first
2425 */
David Woodhousec5395d52009-06-28 16:35:56 +01002426 dma_pte_clear_range(domain, first_vpfn, last_vpfn);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002427
David Woodhousec5395d52009-06-28 16:35:56 +01002428 return domain_pfn_mapping(domain, first_vpfn, first_vpfn,
2429 last_vpfn - first_vpfn + 1,
David Woodhouse61df7442009-06-28 11:55:58 +01002430 DMA_PTE_READ|DMA_PTE_WRITE);
David Woodhouseb2132032009-06-26 18:50:28 +01002431}
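
/*
 * Illustrative example: an RMRR covering 0xa0000-0xbffff would give
 * first_vpfn = 0xa0 and last_vpfn = 0xbf above, so 32 pages are
 * reserved in the iova allocator, cleared, and then identity-mapped
 * 1:1 with read/write permission.
 */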
2432
David Woodhouse0b9d9752014-03-09 15:48:15 -07002433static int iommu_prepare_identity_map(struct device *dev,
David Woodhouseb2132032009-06-26 18:50:28 +01002434 unsigned long long start,
2435 unsigned long long end)
2436{
2437 struct dmar_domain *domain;
2438 int ret;
2439
David Woodhouse0b9d9752014-03-09 15:48:15 -07002440 domain = get_domain_for_dev(dev, DEFAULT_DOMAIN_ADDRESS_WIDTH);
David Woodhouseb2132032009-06-26 18:50:28 +01002441 if (!domain)
2442 return -ENOMEM;
2443
	/* For _hardware_ passthrough, don't bother. But for software
	   passthrough, we do it anyway -- it may indicate a memory
	   range which is reserved in E820, and so didn't get set
	   up to start with in si_domain */
2448 if (domain == si_domain && hw_pass_through) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002449 pr_warn("Ignoring identity map for HW passthrough device %s [0x%Lx - 0x%Lx]\n",
2450 dev_name(dev), start, end);
David Woodhouse19943b02009-08-04 16:19:20 +01002451 return 0;
2452 }
2453
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002454 pr_info("Setting identity map for device %s [0x%Lx - 0x%Lx]\n",
2455 dev_name(dev), start, end);
2456
David Woodhouse5595b522009-12-02 09:21:55 +00002457 if (end < start) {
2458 WARN(1, "Your BIOS is broken; RMRR ends before it starts!\n"
2459 "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
2460 dmi_get_system_info(DMI_BIOS_VENDOR),
2461 dmi_get_system_info(DMI_BIOS_VERSION),
2462 dmi_get_system_info(DMI_PRODUCT_VERSION));
2463 ret = -EIO;
2464 goto error;
2465 }
2466
David Woodhouse2ff729f2009-08-26 14:25:41 +01002467 if (end >> agaw_to_width(domain->agaw)) {
2468 WARN(1, "Your BIOS is broken; RMRR exceeds permitted address width (%d bits)\n"
2469 "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
2470 agaw_to_width(domain->agaw),
2471 dmi_get_system_info(DMI_BIOS_VENDOR),
2472 dmi_get_system_info(DMI_BIOS_VERSION),
2473 dmi_get_system_info(DMI_PRODUCT_VERSION));
2474 ret = -EIO;
2475 goto error;
2476 }
David Woodhouse19943b02009-08-04 16:19:20 +01002477
David Woodhouseb2132032009-06-26 18:50:28 +01002478 ret = iommu_domain_identity_map(domain, start, end);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002479 if (ret)
2480 goto error;
2481
David Woodhouseb2132032009-06-26 18:50:28 +01002482 return 0;
2483
2484 error:
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002485 domain_exit(domain);
2486 return ret;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002487}
2488
2489static inline int iommu_prepare_rmrr_dev(struct dmar_rmrr_unit *rmrr,
David Woodhouse0b9d9752014-03-09 15:48:15 -07002490 struct device *dev)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002491{
David Woodhouse0b9d9752014-03-09 15:48:15 -07002492 if (dev->archdata.iommu == DUMMY_DEVICE_DOMAIN_INFO)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002493 return 0;
David Woodhouse0b9d9752014-03-09 15:48:15 -07002494 return iommu_prepare_identity_map(dev, rmrr->base_address,
2495 rmrr->end_address);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002496}
2497
Suresh Siddhad3f13812011-08-23 17:05:25 -07002498#ifdef CONFIG_INTEL_IOMMU_FLOPPY_WA
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002499static inline void iommu_prepare_isa(void)
2500{
2501 struct pci_dev *pdev;
2502 int ret;
2503
2504 pdev = pci_get_class(PCI_CLASS_BRIDGE_ISA << 8, NULL);
2505 if (!pdev)
2506 return;
2507
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002508 pr_info("Prepare 0-16MiB unity mapping for LPC\n");
David Woodhouse0b9d9752014-03-09 15:48:15 -07002509 ret = iommu_prepare_identity_map(&pdev->dev, 0, 16*1024*1024 - 1);
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002510
2511 if (ret)
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002512 pr_err("Failed to create 0-16MiB identity map - floppy might not work\n");
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002513
Yijing Wang9b27e822014-05-20 20:37:52 +08002514 pci_dev_put(pdev);
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002515}
2516#else
2517static inline void iommu_prepare_isa(void)
2518{
2519 return;
2520}
Suresh Siddhad3f13812011-08-23 17:05:25 -07002521#endif /* !CONFIG_INTEL_IOMMU_FLOPPY_WA */
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07002522
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002523static int md_domain_init(struct dmar_domain *domain, int guest_width);
David Woodhousec7ab48d2009-06-26 19:10:36 +01002524
Matt Kraai071e1372009-08-23 22:30:22 -07002525static int __init si_domain_init(int hw)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002526{
David Woodhousec7ab48d2009-06-26 19:10:36 +01002527 int nid, ret = 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002528
Jiang Liuab8dfe22014-07-11 14:19:27 +08002529 si_domain = alloc_domain(DOMAIN_FLAG_STATIC_IDENTITY);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002530 if (!si_domain)
2531 return -EFAULT;
2532
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002533 if (md_domain_init(si_domain, DEFAULT_DOMAIN_ADDRESS_WIDTH)) {
2534 domain_exit(si_domain);
2535 return -EFAULT;
2536 }
2537
Joerg Roedel0dc79712015-07-21 15:40:06 +02002538 pr_debug("Identity mapping domain allocated\n");
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002539
David Woodhouse19943b02009-08-04 16:19:20 +01002540 if (hw)
2541 return 0;
2542
David Woodhousec7ab48d2009-06-26 19:10:36 +01002543 for_each_online_node(nid) {
Tejun Heod4bbf7e2011-11-28 09:46:22 -08002544 unsigned long start_pfn, end_pfn;
2545 int i;
2546
2547 for_each_mem_pfn_range(i, nid, &start_pfn, &end_pfn, NULL) {
2548 ret = iommu_domain_identity_map(si_domain,
2549 PFN_PHYS(start_pfn), PFN_PHYS(end_pfn));
2550 if (ret)
2551 return ret;
2552 }
David Woodhousec7ab48d2009-06-26 19:10:36 +01002553 }
2554
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002555 return 0;
2556}
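
/*
 * Sketch of what the loop above produces, assuming a single node whose only
 * memblock range covers PFNs 0x0-0x7ffff (2GiB of RAM): the call becomes
 * iommu_domain_identity_map(si_domain, 0x0, 0x80000000), i.e. all of
 * physical memory ends up mapped 1:1 in the static identity domain.
 */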
2557
David Woodhouse9b226622014-03-09 14:03:28 -07002558static int identity_mapping(struct device *dev)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002559{
2560 struct device_domain_info *info;
2561
2562 if (likely(!iommu_identity_mapping))
2563 return 0;
2564
David Woodhouse9b226622014-03-09 14:03:28 -07002565 info = dev->archdata.iommu;
Mike Traviscb452a42011-05-28 13:15:03 -05002566 if (info && info != DUMMY_DEVICE_DOMAIN_INFO)
2567 return (info->domain == si_domain);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002568
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002569 return 0;
2570}
2571
Joerg Roedel28ccce02015-07-21 14:45:31 +02002572static int domain_add_dev_info(struct dmar_domain *domain, struct device *dev)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002573{
David Woodhouse0ac72662014-03-09 13:19:22 -07002574 struct dmar_domain *ndomain;
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002575 struct intel_iommu *iommu;
David Woodhouse156baca2014-03-09 14:00:57 -07002576 u8 bus, devfn;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002577
David Woodhouse5913c9b2014-03-09 16:27:31 -07002578 iommu = device_to_iommu(dev, &bus, &devfn);
David Woodhouse5a8f40e2014-03-09 13:31:18 -07002579 if (!iommu)
2580 return -ENODEV;
2581
Joerg Roedel5db31562015-07-22 12:40:43 +02002582 ndomain = dmar_insert_one_dev_info(iommu, bus, devfn, dev, domain);
David Woodhouse0ac72662014-03-09 13:19:22 -07002583 if (ndomain != domain)
2584 return -EBUSY;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002585
2586 return 0;
2587}
2588
David Woodhouse0b9d9752014-03-09 15:48:15 -07002589static bool device_has_rmrr(struct device *dev)
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002590{
2591 struct dmar_rmrr_unit *rmrr;
David Woodhouse832bd852014-03-07 15:08:36 +00002592 struct device *tmp;
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002593 int i;
2594
Jiang Liu0e2426122014-02-19 14:07:34 +08002595 rcu_read_lock();
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002596 for_each_rmrr_units(rmrr) {
Jiang Liub683b232014-02-19 14:07:32 +08002597 /*
2598 * Return TRUE if this RMRR contains the device that
2599 * is passed in.
2600 */
2601 for_each_active_dev_scope(rmrr->devices,
2602 rmrr->devices_cnt, i, tmp)
David Woodhouse0b9d9752014-03-09 15:48:15 -07002603 if (tmp == dev) {
Jiang Liu0e2426122014-02-19 14:07:34 +08002604 rcu_read_unlock();
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002605 return true;
Jiang Liub683b232014-02-19 14:07:32 +08002606 }
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002607 }
Jiang Liu0e2426122014-02-19 14:07:34 +08002608 rcu_read_unlock();
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002609 return false;
2610}
2611
Alex Williamsonc875d2c2014-07-03 09:57:02 -06002612/*
2613 * There are a couple cases where we need to restrict the functionality of
2614 * devices associated with RMRRs. The first is when evaluating a device for
2615 * identity mapping because problems exist when devices are moved in and out
2616 * of domains and their respective RMRR information is lost. This means that
2617 * a device with associated RMRRs will never be in a "passthrough" domain.
2618 * The second is use of the device through the IOMMU API. This interface
2619 * expects to have full control of the IOVA space for the device. We cannot
2620 * satisfy both the requirement that RMRR access is maintained and have an
2621 * unencumbered IOVA space. We also have no ability to quiesce the device's
2622 * use of the RMRR space or even inform the IOMMU API user of the restriction.
2623 * We therefore prevent devices associated with an RMRR from participating in
2624 * the IOMMU API, which eliminates them from device assignment.
2625 *
2626 * In both cases we assume that PCI USB devices with RMRRs have them largely
2627 * for historical reasons and that the RMRR space is not actively used post
2628 * boot. This exclusion may change if vendors begin to abuse it.
David Woodhouse18436af2015-03-25 15:05:47 +00002629 *
2630 * The same exception is made for graphics devices, with the requirement that
2631 * any use of the RMRR regions will be torn down before assigning the device
2632 * to a guest.
Alex Williamsonc875d2c2014-07-03 09:57:02 -06002633 */
2634static bool device_is_rmrr_locked(struct device *dev)
2635{
2636 if (!device_has_rmrr(dev))
2637 return false;
2638
2639 if (dev_is_pci(dev)) {
2640 struct pci_dev *pdev = to_pci_dev(dev);
2641
David Woodhouse18436af2015-03-25 15:05:47 +00002642 if (IS_USB_DEVICE(pdev) || IS_GFX_DEVICE(pdev))
Alex Williamsonc875d2c2014-07-03 09:57:02 -06002643 return false;
2644 }
2645
2646 return true;
2647}
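
/*
 * Usage sketch: the IOMMU API attach path is expected to reject RMRR-locked
 * devices along these lines (hedged illustration; the exact message wording
 * is an assumption, not a quote):
 *
 *	if (device_is_rmrr_locked(dev)) {
 *		dev_warn(dev, "Device is ineligible for IOMMU domain attach due to platform RMRR requirement\n");
 *		return -EPERM;
 *	}
 */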
2648
David Woodhouse3bdb2592014-03-09 16:03:08 -07002649static int iommu_should_identity_map(struct device *dev, int startup)
David Woodhouse6941af22009-07-04 18:24:27 +01002650{
David Woodhouse3bdb2592014-03-09 16:03:08 -07002652 if (dev_is_pci(dev)) {
2653 struct pci_dev *pdev = to_pci_dev(dev);
Tom Mingarelliea2447f72012-11-20 19:43:17 +00002654
Alex Williamsonc875d2c2014-07-03 09:57:02 -06002655 if (device_is_rmrr_locked(dev))
David Woodhouse3bdb2592014-03-09 16:03:08 -07002656 return 0;
David Woodhousee0fc7e02009-09-30 09:12:17 -07002657
David Woodhouse3bdb2592014-03-09 16:03:08 -07002658 if ((iommu_identity_mapping & IDENTMAP_AZALIA) && IS_AZALIA(pdev))
2659 return 1;
David Woodhousee0fc7e02009-09-30 09:12:17 -07002660
David Woodhouse3bdb2592014-03-09 16:03:08 -07002661 if ((iommu_identity_mapping & IDENTMAP_GFX) && IS_GFX_DEVICE(pdev))
2662 return 1;
2663
2664 if (!(iommu_identity_mapping & IDENTMAP_ALL))
2665 return 0;
2666
2667 /*
2668 * We want to start off with all devices in the 1:1 domain, and
2669 * take them out later if we find they can't access all of memory.
2670 *
2671 * However, we can't do this for PCI devices behind bridges,
2672 * because all PCI devices behind the same bridge will end up
2673 * with the same source-id on their transactions.
2674 *
2675 * Practically speaking, we can't change things around for these
2676 * devices at run-time, because we can't be sure there'll be no
2677 * DMA transactions in flight for any of their siblings.
2678 *
2679 * So PCI devices (unless they're on the root bus) as well as
2680 * their parent PCI-PCI or PCIe-PCI bridges must be left _out_ of
2681 * the 1:1 domain, just in _case_ one of their siblings turns out
2682 * not to be able to map all of memory.
2683 */
2684 if (!pci_is_pcie(pdev)) {
2685 if (!pci_is_root_bus(pdev->bus))
2686 return 0;
2687 if (pdev->class >> 8 == PCI_CLASS_BRIDGE_PCI)
2688 return 0;
2689 } else if (pci_pcie_type(pdev) == PCI_EXP_TYPE_PCI_BRIDGE)
2690 return 0;
2691 } else {
2692 if (device_has_rmrr(dev))
2693 return 0;
2694 }
David Woodhouse6941af22009-07-04 18:24:27 +01002695
David Woodhouse3dfc8132009-07-04 19:11:08 +01002696 /*
David Woodhouse3dfc8132009-07-04 19:11:08 +01002697 * At boot time, we don't yet know if devices will be 64-bit capable.
David Woodhouse3bdb2592014-03-09 16:03:08 -07002698	 * Assume that they will -- if they turn out not to be, then we can
David Woodhouse3dfc8132009-07-04 19:11:08 +01002699 * take them out of the 1:1 domain later.
2700 */
Chris Wright8fcc5372011-05-28 13:15:02 -05002701 if (!startup) {
2702 /*
2703 * If the device's dma_mask is less than the system's memory
2704 * size then this is not a candidate for identity mapping.
2705 */
David Woodhouse3bdb2592014-03-09 16:03:08 -07002706 u64 dma_mask = *dev->dma_mask;
Chris Wright8fcc5372011-05-28 13:15:02 -05002707
David Woodhouse3bdb2592014-03-09 16:03:08 -07002708 if (dev->coherent_dma_mask &&
2709 dev->coherent_dma_mask < dma_mask)
2710 dma_mask = dev->coherent_dma_mask;
Chris Wright8fcc5372011-05-28 13:15:02 -05002711
David Woodhouse3bdb2592014-03-09 16:03:08 -07002712 return dma_mask >= dma_get_required_mask(dev);
Chris Wright8fcc5372011-05-28 13:15:02 -05002713 }
David Woodhouse6941af22009-07-04 18:24:27 +01002714
2715 return 1;
2716}
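
/*
 * Worked example for the !startup path (illustrative numbers): on a host
 * with 8GiB of RAM, dma_get_required_mask() is about DMA_BIT_MASK(33). A
 * device advertising only a 32-bit dma_mask then fails the comparison
 * (0xffffffff < 0x1ffffffff), so it is kept out of -- or later dropped
 * from -- the 1:1 domain and gets a normal remapped domain instead.
 */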
2717
David Woodhousecf04eee2014-03-21 16:49:04 +00002718static int __init dev_prepare_static_identity_mapping(struct device *dev, int hw)
2719{
2720 int ret;
2721
2722 if (!iommu_should_identity_map(dev, 1))
2723 return 0;
2724
Joerg Roedel28ccce02015-07-21 14:45:31 +02002725 ret = domain_add_dev_info(si_domain, dev);
David Woodhousecf04eee2014-03-21 16:49:04 +00002726 if (!ret)
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002727 pr_info("%s identity mapping for device %s\n",
2728 hw ? "Hardware" : "Software", dev_name(dev));
David Woodhousecf04eee2014-03-21 16:49:04 +00002729 else if (ret == -ENODEV)
2730 /* device not associated with an iommu */
2731 ret = 0;
2732
2733 return ret;
2734}
2735
Matt Kraai071e1372009-08-23 22:30:22 -07002737static int __init iommu_prepare_static_identity_mapping(int hw)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002738{
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002739 struct pci_dev *pdev = NULL;
David Woodhousecf04eee2014-03-21 16:49:04 +00002740 struct dmar_drhd_unit *drhd;
2741 struct intel_iommu *iommu;
2742 struct device *dev;
2743 int i;
2744 int ret = 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002745
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002746 for_each_pci_dev(pdev) {
David Woodhousecf04eee2014-03-21 16:49:04 +00002747 ret = dev_prepare_static_identity_mapping(&pdev->dev, hw);
2748 if (ret)
2749 return ret;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002750 }
2751
David Woodhousecf04eee2014-03-21 16:49:04 +00002752 for_each_active_iommu(iommu, drhd)
2753 for_each_active_dev_scope(drhd->devices, drhd->devices_cnt, i, dev) {
2754 struct acpi_device_physical_node *pn;
2755 struct acpi_device *adev;
2756
2757 if (dev->bus != &acpi_bus_type)
2758 continue;
Joerg Roedel86080cc2015-06-12 12:27:16 +02002759
David Woodhousecf04eee2014-03-21 16:49:04 +00002760		adev = to_acpi_device(dev);
2761 mutex_lock(&adev->physical_node_lock);
2762 list_for_each_entry(pn, &adev->physical_node_list, node) {
2763 ret = dev_prepare_static_identity_mapping(pn->dev, hw);
2764 if (ret)
2765 break;
2766 }
2767 mutex_unlock(&adev->physical_node_lock);
2768 if (ret)
2769 return ret;
2770 }
2771
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07002772 return 0;
2773}
2774
Jiang Liuffebeb42014-11-09 22:48:02 +08002775static void intel_iommu_init_qi(struct intel_iommu *iommu)
2776{
2777 /*
2778 * Start from the sane iommu hardware state.
2779 * If the queued invalidation is already initialized by us
2780 * (for example, while enabling interrupt-remapping) then
 2781	 * things are already rolling from a sane state.
2782 */
2783 if (!iommu->qi) {
2784 /*
2785 * Clear any previous faults.
2786 */
2787 dmar_fault(-1, iommu);
2788 /*
2789 * Disable queued invalidation if supported and already enabled
2790 * before OS handover.
2791 */
2792 dmar_disable_qi(iommu);
2793 }
2794
2795 if (dmar_enable_qi(iommu)) {
2796 /*
2797 * Queued Invalidate not enabled, use Register Based Invalidate
2798 */
2799 iommu->flush.flush_context = __iommu_flush_context;
2800 iommu->flush.flush_iotlb = __iommu_flush_iotlb;
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002801 pr_info("%s: Using Register based invalidation\n",
Jiang Liuffebeb42014-11-09 22:48:02 +08002802 iommu->name);
2803 } else {
2804 iommu->flush.flush_context = qi_flush_context;
2805 iommu->flush.flush_iotlb = qi_flush_iotlb;
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02002806 pr_info("%s: Using Queued invalidation\n", iommu->name);
Jiang Liuffebeb42014-11-09 22:48:02 +08002807 }
2808}
2809
Joerg Roedel091d42e2015-06-12 11:56:10 +02002810static int copy_context_table(struct intel_iommu *iommu,
Joerg Roedel543c8dc2015-08-13 11:56:59 +02002811 struct root_entry __iomem *old_re,
Joerg Roedel091d42e2015-06-12 11:56:10 +02002812 struct context_entry **tbl,
2813 int bus, bool ext)
2814{
Joerg Roedeldbcd8612015-06-12 12:02:09 +02002815 int tbl_idx, pos = 0, idx, devfn, ret = 0, did;
Joerg Roedel543c8dc2015-08-13 11:56:59 +02002816 struct context_entry __iomem *old_ce = NULL;
2817 struct context_entry *new_ce = NULL, ce;
2818 struct root_entry re;
Joerg Roedel091d42e2015-06-12 11:56:10 +02002819 phys_addr_t old_ce_phys;
2820
2821 tbl_idx = ext ? bus * 2 : bus;
Joerg Roedel543c8dc2015-08-13 11:56:59 +02002822 memcpy_fromio(&re, old_re, sizeof(re));
Joerg Roedel091d42e2015-06-12 11:56:10 +02002823
2824 for (devfn = 0; devfn < 256; devfn++) {
2825 /* First calculate the correct index */
2826 idx = (ext ? devfn * 2 : devfn) % 256;
2827
2828 if (idx == 0) {
2829 /* First save what we may have and clean up */
2830 if (new_ce) {
2831 tbl[tbl_idx] = new_ce;
2832 __iommu_flush_cache(iommu, new_ce,
2833 VTD_PAGE_SIZE);
2834 pos = 1;
2835 }
2836
2837 if (old_ce)
2838 iounmap(old_ce);
2839
2840 ret = 0;
2841 if (devfn < 0x80)
Joerg Roedel543c8dc2015-08-13 11:56:59 +02002842 old_ce_phys = root_entry_lctp(&re);
Joerg Roedel091d42e2015-06-12 11:56:10 +02002843 else
Joerg Roedel543c8dc2015-08-13 11:56:59 +02002844 old_ce_phys = root_entry_uctp(&re);
Joerg Roedel091d42e2015-06-12 11:56:10 +02002845
2846 if (!old_ce_phys) {
2847 if (ext && devfn == 0) {
2848 /* No LCTP, try UCTP */
2849 devfn = 0x7f;
2850 continue;
2851 } else {
2852 goto out;
2853 }
2854 }
2855
2856 ret = -ENOMEM;
2857 old_ce = ioremap_cache(old_ce_phys, PAGE_SIZE);
2858 if (!old_ce)
2859 goto out;
2860
2861 new_ce = alloc_pgtable_page(iommu->node);
2862 if (!new_ce)
2863 goto out_unmap;
2864
2865 ret = 0;
2866 }
2867
2868 /* Now copy the context entry */
Joerg Roedel543c8dc2015-08-13 11:56:59 +02002869 memcpy_fromio(&ce, old_ce + idx, sizeof(ce));
Joerg Roedel091d42e2015-06-12 11:56:10 +02002870
Joerg Roedelcf484d02015-06-12 12:21:46 +02002871 if (!__context_present(&ce))
Joerg Roedel091d42e2015-06-12 11:56:10 +02002872 continue;
2873
Joerg Roedeldbcd8612015-06-12 12:02:09 +02002874 did = context_domain_id(&ce);
2875 if (did >= 0 && did < cap_ndoms(iommu->cap))
2876 set_bit(did, iommu->domain_ids);
2877
Joerg Roedelcf484d02015-06-12 12:21:46 +02002878 /*
2879 * We need a marker for copied context entries. This
2880 * marker needs to work for the old format as well as
2881 * for extended context entries.
2882 *
2883 * Bit 67 of the context entry is used. In the old
2884 * format this bit is available to software, in the
2885 * extended format it is the PGE bit, but PGE is ignored
2886 * by HW if PASIDs are disabled (and thus still
2887 * available).
2888 *
2889 * So disable PASIDs first and then mark the entry
2890 * copied. This means that we don't copy PASID
2891 * translations from the old kernel, but this is fine as
2892 * faults there are not fatal.
2893 */
2894 context_clear_pasid_enable(&ce);
2895 context_set_copied(&ce);
2896
Joerg Roedel091d42e2015-06-12 11:56:10 +02002897 new_ce[idx] = ce;
2898 }
2899
2900 tbl[tbl_idx + pos] = new_ce;
2901
2902 __iommu_flush_cache(iommu, new_ce, VTD_PAGE_SIZE);
2903
2904out_unmap:
2905 iounmap(old_ce);
2906
2907out:
2908 return ret;
2909}
2910
2911static int copy_translation_tables(struct intel_iommu *iommu)
2912{
Joerg Roedel543c8dc2015-08-13 11:56:59 +02002913 struct root_entry __iomem *old_rt;
Joerg Roedel091d42e2015-06-12 11:56:10 +02002914 struct context_entry **ctxt_tbls;
Joerg Roedel091d42e2015-06-12 11:56:10 +02002915 phys_addr_t old_rt_phys;
2916 int ctxt_table_entries;
2917 unsigned long flags;
2918 u64 rtaddr_reg;
2919 int bus, ret;
Joerg Roedelc3361f22015-06-12 12:39:25 +02002920 bool new_ext, ext;
Joerg Roedel091d42e2015-06-12 11:56:10 +02002921
2922 rtaddr_reg = dmar_readq(iommu->reg + DMAR_RTADDR_REG);
2923 ext = !!(rtaddr_reg & DMA_RTADDR_RTT);
Joerg Roedelc3361f22015-06-12 12:39:25 +02002924 new_ext = !!ecap_ecs(iommu->ecap);
2925
2926 /*
2927 * The RTT bit can only be changed when translation is disabled,
 2928	 * but disabling translation would open a window for data
2929 * corruption. So bail out and don't copy anything if we would
2930 * have to change the bit.
2931 */
2932 if (new_ext != ext)
2933 return -EINVAL;
Joerg Roedel091d42e2015-06-12 11:56:10 +02002934
2935 old_rt_phys = rtaddr_reg & VTD_PAGE_MASK;
2936 if (!old_rt_phys)
2937 return -EINVAL;
2938
2939 old_rt = ioremap_cache(old_rt_phys, PAGE_SIZE);
2940 if (!old_rt)
2941 return -ENOMEM;
2942
2943 /* This is too big for the stack - allocate it from slab */
2944 ctxt_table_entries = ext ? 512 : 256;
2945 ret = -ENOMEM;
2946 ctxt_tbls = kzalloc(ctxt_table_entries * sizeof(void *), GFP_KERNEL);
2947 if (!ctxt_tbls)
2948 goto out_unmap;
2949
2950 for (bus = 0; bus < 256; bus++) {
2951 ret = copy_context_table(iommu, &old_rt[bus],
2952 ctxt_tbls, bus, ext);
2953 if (ret) {
2954 pr_err("%s: Failed to copy context table for bus %d\n",
2955 iommu->name, bus);
2956 continue;
2957 }
2958 }
2959
2960 spin_lock_irqsave(&iommu->lock, flags);
2961
2962 /* Context tables are copied, now write them to the root_entry table */
2963 for (bus = 0; bus < 256; bus++) {
2964 int idx = ext ? bus * 2 : bus;
2965 u64 val;
2966
2967 if (ctxt_tbls[idx]) {
2968 val = virt_to_phys(ctxt_tbls[idx]) | 1;
2969 iommu->root_entry[bus].lo = val;
2970 }
2971
2972 if (!ext || !ctxt_tbls[idx + 1])
2973 continue;
2974
2975 val = virt_to_phys(ctxt_tbls[idx + 1]) | 1;
2976 iommu->root_entry[bus].hi = val;
2977 }
2978
2979 spin_unlock_irqrestore(&iommu->lock, flags);
2980
2981 kfree(ctxt_tbls);
2982
2983 __iommu_flush_cache(iommu, iommu->root_entry, PAGE_SIZE);
2984
2985 ret = 0;
2986
2987out_unmap:
2988 iounmap(old_rt);
2989
2990 return ret;
2991}
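
/*
 * Layout sketch for the copy above, in extended mode: bus N uses
 * ctxt_tbls[2*N] for devfn 0x00-0x7f (written to root_entry[N].lo) and
 * ctxt_tbls[2*N + 1] for devfn 0x80-0xff (written to root_entry[N].hi);
 * the "| 1" sets the present bit on each table address. In legacy mode
 * only the .lo slot is used.
 */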
2992
Joseph Cihulab7792602011-05-03 00:08:37 -07002993static int __init init_dmars(void)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002994{
2995 struct dmar_drhd_unit *drhd;
2996 struct dmar_rmrr_unit *rmrr;
Joerg Roedela87f4912015-06-12 12:32:54 +02002997 bool copied_tables = false;
David Woodhouse832bd852014-03-07 15:08:36 +00002998 struct device *dev;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07002999 struct intel_iommu *iommu;
Suresh Siddha9d783ba2009-03-16 17:04:55 -07003000 int i, ret;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003001
3002 /*
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003003 * for each drhd
3004 * allocate root
3005 * initialize and program root entry to not present
3006 * endfor
3007 */
3008 for_each_drhd_unit(drhd) {
mark gross5e0d2a62008-03-04 15:22:08 -08003009 /*
3010 * lock not needed as this is only incremented in the single
 3011		 * threaded kernel __init code path; all other accesses are
 3012		 * read-only
3013 */
Jiang Liu78d8e702014-11-09 22:47:57 +08003014 if (g_num_of_iommus < DMAR_UNITS_SUPPORTED) {
Mike Travis1b198bb2012-03-05 15:05:16 -08003015 g_num_of_iommus++;
3016 continue;
3017 }
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003018 pr_err_once("Exceeded %d IOMMUs\n", DMAR_UNITS_SUPPORTED);
mark gross5e0d2a62008-03-04 15:22:08 -08003019 }
3020
Jiang Liuffebeb42014-11-09 22:48:02 +08003021 /* Preallocate enough resources for IOMMU hot-addition */
3022 if (g_num_of_iommus < DMAR_UNITS_SUPPORTED)
3023 g_num_of_iommus = DMAR_UNITS_SUPPORTED;
3024
Weidong Hand9630fe2008-12-08 11:06:32 +08003025 g_iommus = kcalloc(g_num_of_iommus, sizeof(struct intel_iommu *),
3026 GFP_KERNEL);
3027 if (!g_iommus) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003028 pr_err("Allocating global iommu array failed\n");
Weidong Hand9630fe2008-12-08 11:06:32 +08003029 ret = -ENOMEM;
3030 goto error;
3031 }
3032
mark gross80b20dd2008-04-18 13:53:58 -07003033 deferred_flush = kzalloc(g_num_of_iommus *
3034 sizeof(struct deferred_flush_tables), GFP_KERNEL);
3035 if (!deferred_flush) {
mark gross5e0d2a62008-03-04 15:22:08 -08003036 ret = -ENOMEM;
Jiang Liu989d51f2014-02-19 14:07:21 +08003037 goto free_g_iommus;
mark gross5e0d2a62008-03-04 15:22:08 -08003038 }
3039
Jiang Liu7c919772014-01-06 14:18:18 +08003040 for_each_active_iommu(iommu, drhd) {
Weidong Hand9630fe2008-12-08 11:06:32 +08003041 g_iommus[iommu->seq_id] = iommu;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003042
Joerg Roedelb63d80d2015-06-12 09:14:34 +02003043 intel_iommu_init_qi(iommu);
3044
Suresh Siddhae61d98d2008-07-10 11:16:35 -07003045 ret = iommu_init_domains(iommu);
3046 if (ret)
Jiang Liu989d51f2014-02-19 14:07:21 +08003047 goto free_iommu;
Suresh Siddhae61d98d2008-07-10 11:16:35 -07003048
Joerg Roedel4158c2e2015-06-12 10:14:02 +02003049 init_translation_status(iommu);
3050
Joerg Roedel091d42e2015-06-12 11:56:10 +02003051 if (translation_pre_enabled(iommu) && !is_kdump_kernel()) {
3052 iommu_disable_translation(iommu);
3053 clear_translation_pre_enabled(iommu);
3054 pr_warn("Translation was enabled for %s but we are not in kdump mode\n",
3055 iommu->name);
3056 }
Joerg Roedel4158c2e2015-06-12 10:14:02 +02003057
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003058 /*
3059 * TBD:
3060 * we could share the same root & context tables
Lucas De Marchi25985ed2011-03-30 22:57:33 -03003061	 * among all IOMMUs. Needs to be split later.
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003062 */
3063 ret = iommu_alloc_root_entry(iommu);
Jiang Liuffebeb42014-11-09 22:48:02 +08003064 if (ret)
Jiang Liu989d51f2014-02-19 14:07:21 +08003065 goto free_iommu;
Joerg Roedel5f0a7f72015-06-12 09:18:53 +02003066
Joerg Roedel091d42e2015-06-12 11:56:10 +02003067 if (translation_pre_enabled(iommu)) {
3068 pr_info("Translation already enabled - trying to copy translation structures\n");
3069
3070 ret = copy_translation_tables(iommu);
3071 if (ret) {
3072 /*
3073 * We found the IOMMU with translation
3074 * enabled - but failed to copy over the
3075 * old root-entry table. Try to proceed
3076 * by disabling translation now and
3077 * allocating a clean root-entry table.
3078 * This might cause DMAR faults, but
3079 * probably the dump will still succeed.
3080 */
3081 pr_err("Failed to copy translation tables from previous kernel for %s\n",
3082 iommu->name);
3083 iommu_disable_translation(iommu);
3084 clear_translation_pre_enabled(iommu);
3085 } else {
3086 pr_info("Copied translation tables from previous kernel for %s\n",
3087 iommu->name);
Joerg Roedela87f4912015-06-12 12:32:54 +02003088 copied_tables = true;
Joerg Roedel091d42e2015-06-12 11:56:10 +02003089 }
3090 }
3091
Joerg Roedel5f0a7f72015-06-12 09:18:53 +02003092 iommu_flush_write_buffer(iommu);
3093 iommu_set_root_entry(iommu);
3094 iommu->flush.flush_context(iommu, 0, 0, 0, DMA_CCMD_GLOBAL_INVL);
3095 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
3096
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003097 if (!ecap_pass_through(iommu->ecap))
David Woodhouse19943b02009-08-04 16:19:20 +01003098 hw_pass_through = 0;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003099 }
3100
David Woodhouse19943b02009-08-04 16:19:20 +01003101 if (iommu_pass_through)
David Woodhousee0fc7e02009-09-30 09:12:17 -07003102 iommu_identity_mapping |= IDENTMAP_ALL;
3103
Suresh Siddhad3f13812011-08-23 17:05:25 -07003104#ifdef CONFIG_INTEL_IOMMU_BROKEN_GFX_WA
David Woodhousee0fc7e02009-09-30 09:12:17 -07003105 iommu_identity_mapping |= IDENTMAP_GFX;
David Woodhouse19943b02009-08-04 16:19:20 +01003106#endif
David Woodhousee0fc7e02009-09-30 09:12:17 -07003107
Joerg Roedel86080cc2015-06-12 12:27:16 +02003108 if (iommu_identity_mapping) {
3109 ret = si_domain_init(hw_pass_through);
3110 if (ret)
3111 goto free_iommu;
3112 }
3113
David Woodhousee0fc7e02009-09-30 09:12:17 -07003114 check_tylersburg_isoch();
3115
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003116 /*
Joerg Roedela87f4912015-06-12 12:32:54 +02003117 * If we copied translations from a previous kernel in the kdump
 3118	 * case, we cannot assign the devices to domains now, as that
3119 * would eliminate the old mappings. So skip this part and defer
3120 * the assignment to device driver initialization time.
3121 */
3122 if (copied_tables)
3123 goto domains_done;
3124
3125 /*
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003126 * If pass through is not set or not enabled, setup context entries for
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003127 * identity mappings for rmrr, gfx, and isa and may fall back to static
3128 * identity mapping if iommu_identity_mapping is set.
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003129 */
David Woodhouse19943b02009-08-04 16:19:20 +01003130 if (iommu_identity_mapping) {
3131 ret = iommu_prepare_static_identity_mapping(hw_pass_through);
3132 if (ret) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003133 pr_crit("Failed to setup IOMMU pass-through\n");
Jiang Liu989d51f2014-02-19 14:07:21 +08003134 goto free_iommu;
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003135 }
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07003136 }
David Woodhouse19943b02009-08-04 16:19:20 +01003137 /*
3138 * For each rmrr
3139 * for each dev attached to rmrr
3140 * do
3141 * locate drhd for dev, alloc domain for dev
3142 * allocate free domain
3143 * allocate page table entries for rmrr
3144 * if context not allocated for bus
3145 * allocate and init context
3146 * set present in root table for this bus
3147 * init context with domain, translation etc
3148 * endfor
3149 * endfor
3150 */
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003151 pr_info("Setting RMRR:\n");
David Woodhouse19943b02009-08-04 16:19:20 +01003152 for_each_rmrr_units(rmrr) {
Jiang Liub683b232014-02-19 14:07:32 +08003153		/* some BIOSes list non-existent devices in the DMAR table. */
3154 for_each_active_dev_scope(rmrr->devices, rmrr->devices_cnt,
David Woodhouse832bd852014-03-07 15:08:36 +00003155 i, dev) {
David Woodhouse0b9d9752014-03-09 15:48:15 -07003156 ret = iommu_prepare_rmrr_dev(rmrr, dev);
David Woodhouse19943b02009-08-04 16:19:20 +01003157 if (ret)
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003158 pr_err("Mapping reserved region failed\n");
David Woodhouse19943b02009-08-04 16:19:20 +01003159 }
3160 }
3161
3162 iommu_prepare_isa();
Keshavamurthy, Anil S49a04292007-10-21 16:41:57 -07003163
Joerg Roedela87f4912015-06-12 12:32:54 +02003164domains_done:
3165
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003166 /*
3167 * for each drhd
3168 * enable fault log
3169 * global invalidate context cache
3170 * global invalidate iotlb
3171 * enable translation
3172 */
Jiang Liu7c919772014-01-06 14:18:18 +08003173 for_each_iommu(iommu, drhd) {
Joseph Cihula51a63e62011-03-21 11:04:24 -07003174 if (drhd->ignored) {
3175 /*
3176 * we always have to disable PMRs or DMA may fail on
3177 * this device
3178 */
3179 if (force_on)
Jiang Liu7c919772014-01-06 14:18:18 +08003180 iommu_disable_protect_mem_regions(iommu);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003181 continue;
Joseph Cihula51a63e62011-03-21 11:04:24 -07003182 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003183
3184 iommu_flush_write_buffer(iommu);
3185
Keshavamurthy, Anil S3460a6d2007-10-21 16:41:54 -07003186 ret = dmar_set_interrupt(iommu);
3187 if (ret)
Jiang Liu989d51f2014-02-19 14:07:21 +08003188 goto free_iommu;
Keshavamurthy, Anil S3460a6d2007-10-21 16:41:54 -07003189
Joerg Roedel8939ddf2015-06-12 14:40:01 +02003190 if (!translation_pre_enabled(iommu))
3191 iommu_enable_translation(iommu);
3192
David Woodhouseb94996c2009-09-19 15:28:12 -07003193 iommu_disable_protect_mem_regions(iommu);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003194 }
3195
3196 return 0;
Jiang Liu989d51f2014-02-19 14:07:21 +08003197
3198free_iommu:
Jiang Liuffebeb42014-11-09 22:48:02 +08003199 for_each_active_iommu(iommu, drhd) {
3200 disable_dmar_iommu(iommu);
Jiang Liua868e6b2014-01-06 14:18:20 +08003201 free_dmar_iommu(iommu);
Jiang Liuffebeb42014-11-09 22:48:02 +08003202 }
Jiang Liu9bdc5312014-01-06 14:18:27 +08003203 kfree(deferred_flush);
Jiang Liu989d51f2014-02-19 14:07:21 +08003204free_g_iommus:
Weidong Hand9630fe2008-12-08 11:06:32 +08003205 kfree(g_iommus);
Jiang Liu989d51f2014-02-19 14:07:21 +08003206error:
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003207 return ret;
3208}
3209
David Woodhouse5a5e02a2009-07-04 09:35:44 +01003210/* This takes a number of _MM_ pages, not VTD pages */
David Woodhouse875764d2009-06-28 21:20:51 +01003211static struct iova *intel_alloc_iova(struct device *dev,
3212 struct dmar_domain *domain,
3213 unsigned long nrpages, uint64_t dma_mask)
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003214{
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003215 struct iova *iova = NULL;
3216
David Woodhouse875764d2009-06-28 21:20:51 +01003217 /* Restrict dma_mask to the width that the iommu can handle */
3218 dma_mask = min_t(uint64_t, DOMAIN_MAX_ADDR(domain->gaw), dma_mask);
Robin Murphy8f6429c2015-07-16 19:40:12 +01003219 /* Ensure we reserve the whole size-aligned region */
3220 nrpages = __roundup_pow_of_two(nrpages);
David Woodhouse875764d2009-06-28 21:20:51 +01003221
3222 if (!dmar_forcedac && dma_mask > DMA_BIT_MASK(32)) {
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003223 /*
3224 * First try to allocate an io virtual address in
Yang Hongyang284901a2009-04-06 19:01:15 -07003225 * DMA_BIT_MASK(32) and if that fails then try allocating
Joe Perches36098012007-12-17 11:40:11 -08003226	 * from the higher range
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003227 */
David Woodhouse875764d2009-06-28 21:20:51 +01003228 iova = alloc_iova(&domain->iovad, nrpages,
3229 IOVA_PFN(DMA_BIT_MASK(32)), 1);
3230 if (iova)
3231 return iova;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003232 }
David Woodhouse875764d2009-06-28 21:20:51 +01003233 iova = alloc_iova(&domain->iovad, nrpages, IOVA_PFN(dma_mask), 1);
3234 if (unlikely(!iova)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003235		pr_err("Allocating %ld-page iova for %s failed\n",
David Woodhouse207e3592014-03-09 16:12:32 -07003236 nrpages, dev_name(dev));
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003237 return NULL;
3238 }
3239
3240 return iova;
3241}
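
/*
 * Worked example: a 3-page request is rounded up to 4 pages so the whole
 * size-aligned region gets reserved. For a device with a 64-bit dma_mask
 * and dmar_forcedac off, the allocator first tries below 4GiB and only
 * falls back to the full domain width once that range is exhausted.
 */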
3242
David Woodhoused4b709f2014-03-09 16:07:40 -07003243static struct dmar_domain *__get_valid_domain_for_dev(struct device *dev)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003244{
3245 struct dmar_domain *domain;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003246
David Woodhoused4b709f2014-03-09 16:07:40 -07003247 domain = get_domain_for_dev(dev, DEFAULT_DOMAIN_ADDRESS_WIDTH);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003248 if (!domain) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003249 pr_err("Allocating domain for %s failed\n",
David Woodhoused4b709f2014-03-09 16:07:40 -07003250 dev_name(dev));
Al Viro4fe05bb2007-10-29 04:51:16 +00003251 return NULL;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003252 }
3253
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003254 return domain;
3255}
3256
David Woodhoused4b709f2014-03-09 16:07:40 -07003257static inline struct dmar_domain *get_valid_domain_for_dev(struct device *dev)
David Woodhouse147202a2009-07-07 19:43:20 +01003258{
3259 struct device_domain_info *info;
3260
3261 /* No lock here, assumes no domain exit in normal case */
David Woodhoused4b709f2014-03-09 16:07:40 -07003262 info = dev->archdata.iommu;
David Woodhouse147202a2009-07-07 19:43:20 +01003263 if (likely(info))
3264 return info->domain;
3265
3266 return __get_valid_domain_for_dev(dev);
3267}
3268
David Woodhouseecb509e2014-03-09 16:29:55 -07003269/* Check if the dev needs to go through the non-identity map/unmap process. */
David Woodhouse73676832009-07-04 14:08:36 +01003270static int iommu_no_mapping(struct device *dev)
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003271{
3272 int found;
3273
David Woodhouse3d891942014-03-06 15:59:26 +00003274 if (iommu_dummy(dev))
David Woodhouse1e4c64c2009-07-04 10:40:38 +01003275 return 1;
3276
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003277 if (!iommu_identity_mapping)
David Woodhouse1e4c64c2009-07-04 10:40:38 +01003278 return 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003279
David Woodhouse9b226622014-03-09 14:03:28 -07003280 found = identity_mapping(dev);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003281 if (found) {
David Woodhouseecb509e2014-03-09 16:29:55 -07003282 if (iommu_should_identity_map(dev, 0))
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003283 return 1;
3284 else {
3285 /*
 3286			 * The 32 bit DMA device is removed from si_domain and falls
 3287			 * back to non-identity mapping.
3288 */
Joerg Roedele6de0f82015-07-22 16:30:36 +02003289 dmar_remove_one_dev_info(si_domain, dev);
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003290 pr_info("32bit %s uses non-identity mapping\n",
3291 dev_name(dev));
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003292 return 0;
3293 }
3294 } else {
3295 /*
 3296		 * When a 64 bit DMA device is detached from a VM, the device
3297 * is put into si_domain for identity mapping.
3298 */
David Woodhouseecb509e2014-03-09 16:29:55 -07003299 if (iommu_should_identity_map(dev, 0)) {
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003300 int ret;
Joerg Roedel28ccce02015-07-21 14:45:31 +02003301 ret = domain_add_dev_info(si_domain, dev);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003302 if (!ret) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003303 pr_info("64bit %s uses identity mapping\n",
3304 dev_name(dev));
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003305 return 1;
3306 }
3307 }
3308 }
3309
David Woodhouse1e4c64c2009-07-04 10:40:38 +01003310 return 0;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003311}
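
/*
 * Example flow (hypothetical device): a 32-bit-only NIC that booted in
 * si_domain makes its first mapping request; identity_mapping() returns 1,
 * iommu_should_identity_map(dev, 0) fails the dma_mask check, so the NIC
 * is dropped from si_domain right here and the mapping proceeds through
 * the normal remapped path.
 */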
3312
David Woodhouse5040a912014-03-09 16:14:00 -07003313static dma_addr_t __intel_map_single(struct device *dev, phys_addr_t paddr,
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09003314 size_t size, int dir, u64 dma_mask)
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003315{
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003316 struct dmar_domain *domain;
Fenghua Yu5b6985c2008-10-16 18:02:32 -07003317 phys_addr_t start_paddr;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003318 struct iova *iova;
3319 int prot = 0;
Ingo Molnar6865f0d2008-04-22 11:09:04 +02003320 int ret;
Weidong Han8c11e792008-12-08 15:29:22 +08003321 struct intel_iommu *iommu;
Fenghua Yu33041ec2009-08-04 15:10:59 -07003322 unsigned long paddr_pfn = paddr >> PAGE_SHIFT;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003323
3324 BUG_ON(dir == DMA_NONE);
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003325
David Woodhouse5040a912014-03-09 16:14:00 -07003326 if (iommu_no_mapping(dev))
Ingo Molnar6865f0d2008-04-22 11:09:04 +02003327 return paddr;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003328
David Woodhouse5040a912014-03-09 16:14:00 -07003329 domain = get_valid_domain_for_dev(dev);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003330 if (!domain)
3331 return 0;
3332
Weidong Han8c11e792008-12-08 15:29:22 +08003333 iommu = domain_get_iommu(domain);
David Woodhouse88cb6a72009-06-28 15:03:06 +01003334 size = aligned_nrpages(paddr, size);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003335
David Woodhouse5040a912014-03-09 16:14:00 -07003336 iova = intel_alloc_iova(dev, domain, dma_to_mm_pfn(size), dma_mask);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003337 if (!iova)
3338 goto error;
3339
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003340 /*
3341 * Check if DMAR supports zero-length reads on write only
3342 * mappings..
3343 */
3344 if (dir == DMA_TO_DEVICE || dir == DMA_BIDIRECTIONAL || \
Weidong Han8c11e792008-12-08 15:29:22 +08003345 !cap_zlr(iommu->cap))
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003346 prot |= DMA_PTE_READ;
3347 if (dir == DMA_FROM_DEVICE || dir == DMA_BIDIRECTIONAL)
3348 prot |= DMA_PTE_WRITE;
3349 /*
Ingo Molnar6865f0d2008-04-22 11:09:04 +02003350	 * [paddr, paddr + size) might span a partial page, so map the whole
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003351	 * page.  Note: if two parts of one page are separately mapped, we
Ingo Molnar6865f0d2008-04-22 11:09:04 +02003352	 * might have two guest_addr mappings to the same host paddr, but this
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003353 * is not a big problem
3354 */
David Woodhouse0ab36de2009-06-28 14:01:43 +01003355 ret = domain_pfn_mapping(domain, mm_to_dma_pfn(iova->pfn_lo),
Fenghua Yu33041ec2009-08-04 15:10:59 -07003356 mm_to_dma_pfn(paddr_pfn), size, prot);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003357 if (ret)
3358 goto error;
3359
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003360 /* it's a non-present to present mapping. Only flush if caching mode */
3361 if (cap_caching_mode(iommu->cap))
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02003362 iommu_flush_iotlb_psi(iommu, domain,
3363 mm_to_dma_pfn(iova->pfn_lo),
3364 size, 0, 1);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003365 else
Weidong Han8c11e792008-12-08 15:29:22 +08003366 iommu_flush_write_buffer(iommu);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003367
David Woodhouse03d6a242009-06-28 15:33:46 +01003368 start_paddr = (phys_addr_t)iova->pfn_lo << PAGE_SHIFT;
3369 start_paddr += paddr & ~PAGE_MASK;
3370 return start_paddr;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003371
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003372error:
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003373 if (iova)
3374 __free_iova(&domain->iovad, iova);
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003375 pr_err("Device %s request: %zx@%llx dir %d --- failed\n",
David Woodhouse5040a912014-03-09 16:14:00 -07003376 dev_name(dev), size, (unsigned long long)paddr, dir);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003377 return 0;
3378}
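
/*
 * Worked example (illustrative addresses): mapping paddr 0x1234567 with
 * size 0x100 stays within one 4KiB page, so aligned_nrpages() yields 1;
 * if the IOVA allocator hands back pfn_lo 0x80000, the returned handle is
 * (0x80000 << 12) + 0x567 = 0x80000567.
 */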
3379
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09003380static dma_addr_t intel_map_page(struct device *dev, struct page *page,
3381 unsigned long offset, size_t size,
3382 enum dma_data_direction dir,
3383 struct dma_attrs *attrs)
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09003384{
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09003385 return __intel_map_single(dev, page_to_phys(page) + offset, size,
David Woodhouse46333e32014-03-10 20:01:21 -07003386 dir, *dev->dma_mask);
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09003387}
3388
mark gross5e0d2a62008-03-04 15:22:08 -08003389static void flush_unmaps(void)
3390{
mark gross80b20dd2008-04-18 13:53:58 -07003391 int i, j;
mark gross5e0d2a62008-03-04 15:22:08 -08003392
mark gross5e0d2a62008-03-04 15:22:08 -08003393 timer_on = 0;
3394
3395 /* just flush them all */
3396 for (i = 0; i < g_num_of_iommus; i++) {
Weidong Hana2bb8452008-12-08 11:24:12 +08003397 struct intel_iommu *iommu = g_iommus[i];
3398 if (!iommu)
3399 continue;
Suresh Siddhac42d9f32008-07-10 11:16:36 -07003400
Yu Zhao9dd2fe82009-05-18 13:51:36 +08003401 if (!deferred_flush[i].next)
3402 continue;
3403
Nadav Amit78d5f0f2010-04-08 23:00:41 +03003404 /* In caching mode, global flushes turn emulation expensive */
3405 if (!cap_caching_mode(iommu->cap))
3406 iommu->flush.flush_iotlb(iommu, 0, 0, 0,
Yu Zhao93a23a72009-05-18 13:51:37 +08003407 DMA_TLB_GLOBAL_FLUSH);
Yu Zhao9dd2fe82009-05-18 13:51:36 +08003408 for (j = 0; j < deferred_flush[i].next; j++) {
Yu Zhao93a23a72009-05-18 13:51:37 +08003409 unsigned long mask;
3410 struct iova *iova = deferred_flush[i].iova[j];
Nadav Amit78d5f0f2010-04-08 23:00:41 +03003411 struct dmar_domain *domain = deferred_flush[i].domain[j];
Yu Zhao93a23a72009-05-18 13:51:37 +08003412
Nadav Amit78d5f0f2010-04-08 23:00:41 +03003413 /* On real hardware multiple invalidations are expensive */
3414 if (cap_caching_mode(iommu->cap))
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02003415 iommu_flush_iotlb_psi(iommu, domain,
Jiang Liua156ef92014-07-11 14:19:36 +08003416 iova->pfn_lo, iova_size(iova),
David Woodhouseea8ea462014-03-05 17:09:32 +00003417 !deferred_flush[i].freelist[j], 0);
Nadav Amit78d5f0f2010-04-08 23:00:41 +03003418 else {
Jiang Liua156ef92014-07-11 14:19:36 +08003419 mask = ilog2(mm_to_dma_pfn(iova_size(iova)));
Nadav Amit78d5f0f2010-04-08 23:00:41 +03003420 iommu_flush_dev_iotlb(deferred_flush[i].domain[j],
3421 (uint64_t)iova->pfn_lo << PAGE_SHIFT, mask);
3422 }
Yu Zhao93a23a72009-05-18 13:51:37 +08003423 __free_iova(&deferred_flush[i].domain[j]->iovad, iova);
David Woodhouseea8ea462014-03-05 17:09:32 +00003424 if (deferred_flush[i].freelist[j])
3425 dma_free_pagelist(deferred_flush[i].freelist[j]);
mark gross80b20dd2008-04-18 13:53:58 -07003426 }
Yu Zhao9dd2fe82009-05-18 13:51:36 +08003427 deferred_flush[i].next = 0;
mark gross5e0d2a62008-03-04 15:22:08 -08003428 }
3429
mark gross5e0d2a62008-03-04 15:22:08 -08003430 list_size = 0;
mark gross5e0d2a62008-03-04 15:22:08 -08003431}
3432
3433static void flush_unmaps_timeout(unsigned long data)
3434{
mark gross80b20dd2008-04-18 13:53:58 -07003435 unsigned long flags;
3436
3437 spin_lock_irqsave(&async_umap_flush_lock, flags);
mark gross5e0d2a62008-03-04 15:22:08 -08003438 flush_unmaps();
mark gross80b20dd2008-04-18 13:53:58 -07003439 spin_unlock_irqrestore(&async_umap_flush_lock, flags);
mark gross5e0d2a62008-03-04 15:22:08 -08003440}
3441
David Woodhouseea8ea462014-03-05 17:09:32 +00003442static void add_unmap(struct dmar_domain *dom, struct iova *iova, struct page *freelist)
mark gross5e0d2a62008-03-04 15:22:08 -08003443{
3444 unsigned long flags;
mark gross80b20dd2008-04-18 13:53:58 -07003445 int next, iommu_id;
Weidong Han8c11e792008-12-08 15:29:22 +08003446 struct intel_iommu *iommu;
mark gross5e0d2a62008-03-04 15:22:08 -08003447
3448 spin_lock_irqsave(&async_umap_flush_lock, flags);
mark gross80b20dd2008-04-18 13:53:58 -07003449 if (list_size == HIGH_WATER_MARK)
3450 flush_unmaps();
3451
Weidong Han8c11e792008-12-08 15:29:22 +08003452 iommu = domain_get_iommu(dom);
3453 iommu_id = iommu->seq_id;
Suresh Siddhac42d9f32008-07-10 11:16:36 -07003454
mark gross80b20dd2008-04-18 13:53:58 -07003455 next = deferred_flush[iommu_id].next;
3456 deferred_flush[iommu_id].domain[next] = dom;
3457 deferred_flush[iommu_id].iova[next] = iova;
David Woodhouseea8ea462014-03-05 17:09:32 +00003458 deferred_flush[iommu_id].freelist[next] = freelist;
mark gross80b20dd2008-04-18 13:53:58 -07003459 deferred_flush[iommu_id].next++;
mark gross5e0d2a62008-03-04 15:22:08 -08003460
3461 if (!timer_on) {
3462 mod_timer(&unmap_timer, jiffies + msecs_to_jiffies(10));
3463 timer_on = 1;
3464 }
3465 list_size++;
3466 spin_unlock_irqrestore(&async_umap_flush_lock, flags);
3467}
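
/*
 * Batching sketch: with intel_iommu_strict off, an unmap only queues its
 * IOVA here; the IOTLB flush happens once HIGH_WATER_MARK entries have
 * accumulated or the 10ms unmap_timer fires, amortizing the invalidation
 * cost over many unmaps.
 */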
3468
Jiang Liud41a4ad2014-07-11 14:19:34 +08003469static void intel_unmap(struct device *dev, dma_addr_t dev_addr)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003470{
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003471 struct dmar_domain *domain;
David Woodhoused794dc92009-06-28 00:27:49 +01003472 unsigned long start_pfn, last_pfn;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003473 struct iova *iova;
Weidong Han8c11e792008-12-08 15:29:22 +08003474 struct intel_iommu *iommu;
David Woodhouseea8ea462014-03-05 17:09:32 +00003475 struct page *freelist;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003476
David Woodhouse73676832009-07-04 14:08:36 +01003477 if (iommu_no_mapping(dev))
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003478 return;
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07003479
David Woodhouse1525a292014-03-06 16:19:30 +00003480 domain = find_domain(dev);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003481 BUG_ON(!domain);
3482
Weidong Han8c11e792008-12-08 15:29:22 +08003483 iommu = domain_get_iommu(domain);
3484
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003485 iova = find_iova(&domain->iovad, IOVA_PFN(dev_addr));
David Woodhouse85b98272009-07-01 19:27:53 +01003486 if (WARN_ONCE(!iova, "Driver unmaps unmatched page at PFN %llx\n",
3487 (unsigned long long)dev_addr))
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003488 return;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003489
David Woodhoused794dc92009-06-28 00:27:49 +01003490 start_pfn = mm_to_dma_pfn(iova->pfn_lo);
3491 last_pfn = mm_to_dma_pfn(iova->pfn_hi + 1) - 1;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003492
David Woodhoused794dc92009-06-28 00:27:49 +01003493 pr_debug("Device %s unmapping: pfn %lx-%lx\n",
David Woodhouse207e3592014-03-09 16:12:32 -07003494 dev_name(dev), start_pfn, last_pfn);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003495
David Woodhouseea8ea462014-03-05 17:09:32 +00003496 freelist = domain_unmap(domain, start_pfn, last_pfn);
David Woodhoused794dc92009-06-28 00:27:49 +01003497
mark gross5e0d2a62008-03-04 15:22:08 -08003498 if (intel_iommu_strict) {
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02003499 iommu_flush_iotlb_psi(iommu, domain, start_pfn,
David Woodhouseea8ea462014-03-05 17:09:32 +00003500 last_pfn - start_pfn + 1, !freelist, 0);
mark gross5e0d2a62008-03-04 15:22:08 -08003501 /* free iova */
3502 __free_iova(&domain->iovad, iova);
David Woodhouseea8ea462014-03-05 17:09:32 +00003503 dma_free_pagelist(freelist);
mark gross5e0d2a62008-03-04 15:22:08 -08003504 } else {
David Woodhouseea8ea462014-03-05 17:09:32 +00003505 add_unmap(domain, iova, freelist);
mark gross5e0d2a62008-03-04 15:22:08 -08003506 /*
 3507		 * queue up the release of the unmap to save roughly 1/6th of
 3508		 * the cpu time used up by the iotlb flush operation...
3509 */
mark gross5e0d2a62008-03-04 15:22:08 -08003510 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003511}
3512
Jiang Liud41a4ad2014-07-11 14:19:34 +08003513static void intel_unmap_page(struct device *dev, dma_addr_t dev_addr,
3514 size_t size, enum dma_data_direction dir,
3515 struct dma_attrs *attrs)
3516{
3517 intel_unmap(dev, dev_addr);
3518}
3519
David Woodhouse5040a912014-03-09 16:14:00 -07003520static void *intel_alloc_coherent(struct device *dev, size_t size,
Andrzej Pietrasiewiczbaa676f2012-03-27 14:28:18 +02003521 dma_addr_t *dma_handle, gfp_t flags,
3522 struct dma_attrs *attrs)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003523{
Akinobu Mita36746432014-06-04 16:06:51 -07003524 struct page *page = NULL;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003525 int order;
3526
Fenghua Yu5b6985c2008-10-16 18:02:32 -07003527 size = PAGE_ALIGN(size);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003528 order = get_order(size);
Alex Williamsone8bb9102009-11-04 15:59:34 -07003529
David Woodhouse5040a912014-03-09 16:14:00 -07003530 if (!iommu_no_mapping(dev))
Alex Williamsone8bb9102009-11-04 15:59:34 -07003531 flags &= ~(GFP_DMA | GFP_DMA32);
David Woodhouse5040a912014-03-09 16:14:00 -07003532 else if (dev->coherent_dma_mask < dma_get_required_mask(dev)) {
3533 if (dev->coherent_dma_mask < DMA_BIT_MASK(32))
Alex Williamsone8bb9102009-11-04 15:59:34 -07003534 flags |= GFP_DMA;
3535 else
3536 flags |= GFP_DMA32;
3537 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003538
Akinobu Mita36746432014-06-04 16:06:51 -07003539 if (flags & __GFP_WAIT) {
3540 unsigned int count = size >> PAGE_SHIFT;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003541
Akinobu Mita36746432014-06-04 16:06:51 -07003542 page = dma_alloc_from_contiguous(dev, count, order);
3543 if (page && iommu_no_mapping(dev) &&
3544 page_to_phys(page) + size > dev->coherent_dma_mask) {
3545 dma_release_from_contiguous(dev, page, count);
3546 page = NULL;
3547 }
3548 }
3549
3550 if (!page)
3551 page = alloc_pages(flags, order);
3552 if (!page)
3553 return NULL;
3554 memset(page_address(page), 0, size);
3555
3556 *dma_handle = __intel_map_single(dev, page_to_phys(page), size,
FUJITA Tomonoribb9e6d62008-10-15 16:08:28 +09003557 DMA_BIDIRECTIONAL,
David Woodhouse5040a912014-03-09 16:14:00 -07003558 dev->coherent_dma_mask);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003559 if (*dma_handle)
Akinobu Mita36746432014-06-04 16:06:51 -07003560 return page_address(page);
3561 if (!dma_release_from_contiguous(dev, page, size >> PAGE_SHIFT))
3562 __free_pages(page, order);
3563
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003564 return NULL;
3565}
3566
David Woodhouse5040a912014-03-09 16:14:00 -07003567static void intel_free_coherent(struct device *dev, size_t size, void *vaddr,
Andrzej Pietrasiewiczbaa676f2012-03-27 14:28:18 +02003568 dma_addr_t dma_handle, struct dma_attrs *attrs)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003569{
3570 int order;
Akinobu Mita36746432014-06-04 16:06:51 -07003571 struct page *page = virt_to_page(vaddr);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003572
Fenghua Yu5b6985c2008-10-16 18:02:32 -07003573 size = PAGE_ALIGN(size);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003574 order = get_order(size);
3575
Jiang Liud41a4ad2014-07-11 14:19:34 +08003576 intel_unmap(dev, dma_handle);
Akinobu Mita36746432014-06-04 16:06:51 -07003577 if (!dma_release_from_contiguous(dev, page, size >> PAGE_SHIFT))
3578 __free_pages(page, order);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003579}
3580
David Woodhouse5040a912014-03-09 16:14:00 -07003581static void intel_unmap_sg(struct device *dev, struct scatterlist *sglist,
FUJITA Tomonorid7ab5c42009-01-28 21:53:18 +09003582 int nelems, enum dma_data_direction dir,
3583 struct dma_attrs *attrs)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003584{
Jiang Liud41a4ad2014-07-11 14:19:34 +08003585 intel_unmap(dev, sglist[0].dma_address);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003586}
3587
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003588static int intel_nontranslate_map_sg(struct device *hddev,
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003589 struct scatterlist *sglist, int nelems, int dir)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003590{
3591 int i;
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003592 struct scatterlist *sg;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003593
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003594 for_each_sg(sglist, sg, nelems, i) {
FUJITA Tomonori12d4d402007-10-23 09:32:25 +02003595 BUG_ON(!sg_page(sg));
Dan Williamsdb0fa0c2015-08-17 08:13:26 -06003596 sg->dma_address = sg_phys(sg);
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003597 sg->dma_length = sg->length;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003598 }
3599 return nelems;
3600}
3601
David Woodhouse5040a912014-03-09 16:14:00 -07003602static int intel_map_sg(struct device *dev, struct scatterlist *sglist, int nelems,
FUJITA Tomonorid7ab5c42009-01-28 21:53:18 +09003603 enum dma_data_direction dir, struct dma_attrs *attrs)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003604{
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003605 int i;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003606 struct dmar_domain *domain;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003607 size_t size = 0;
3608 int prot = 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003609 struct iova *iova = NULL;
3610 int ret;
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003611 struct scatterlist *sg;
David Woodhouseb536d242009-06-28 14:49:31 +01003612 unsigned long start_vpfn;
Weidong Han8c11e792008-12-08 15:29:22 +08003613 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003614
3615 BUG_ON(dir == DMA_NONE);
David Woodhouse5040a912014-03-09 16:14:00 -07003616 if (iommu_no_mapping(dev))
3617 return intel_nontranslate_map_sg(dev, sglist, nelems, dir);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003618
David Woodhouse5040a912014-03-09 16:14:00 -07003619 domain = get_valid_domain_for_dev(dev);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003620 if (!domain)
3621 return 0;
3622
Weidong Han8c11e792008-12-08 15:29:22 +08003623 iommu = domain_get_iommu(domain);
3624
David Woodhouseb536d242009-06-28 14:49:31 +01003625 for_each_sg(sglist, sg, nelems, i)
David Woodhouse88cb6a72009-06-28 15:03:06 +01003626 size += aligned_nrpages(sg->offset, sg->length);
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003627
David Woodhouse5040a912014-03-09 16:14:00 -07003628 iova = intel_alloc_iova(dev, domain, dma_to_mm_pfn(size),
3629 *dev->dma_mask);
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003630 if (!iova) {
FUJITA Tomonoric03ab372007-10-21 16:42:00 -07003631 sglist->dma_length = 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003632 return 0;
3633 }
3634
3635 /*
3636 * Check if DMAR supports zero-length reads on write only
3637 * mappings..
3638 */
3639 if (dir == DMA_TO_DEVICE || dir == DMA_BIDIRECTIONAL || \
Weidong Han8c11e792008-12-08 15:29:22 +08003640 !cap_zlr(iommu->cap))
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003641 prot |= DMA_PTE_READ;
3642 if (dir == DMA_FROM_DEVICE || dir == DMA_BIDIRECTIONAL)
3643 prot |= DMA_PTE_WRITE;
3644
David Woodhouseb536d242009-06-28 14:49:31 +01003645 start_vpfn = mm_to_dma_pfn(iova->pfn_lo);
David Woodhousee1605492009-06-29 11:17:38 +01003646
Fenghua Yuf5329592009-08-04 15:09:37 -07003647 ret = domain_sg_mapping(domain, start_vpfn, sglist, size, prot);
David Woodhousee1605492009-06-29 11:17:38 +01003648 if (unlikely(ret)) {
David Woodhousee1605492009-06-29 11:17:38 +01003649 dma_pte_free_pagetable(domain, start_vpfn,
3650 start_vpfn + size - 1);
David Woodhousee1605492009-06-29 11:17:38 +01003651 __free_iova(&domain->iovad, iova);
3652 return 0;
Keshavamurthy, Anil Sf76aec72007-10-21 16:41:58 -07003653 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003654
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003655 /* it's a non-present to present mapping. Only flush if caching mode */
3656 if (cap_caching_mode(iommu->cap))
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02003657 iommu_flush_iotlb_psi(iommu, domain, start_vpfn, size, 0, 1);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003658 else
Weidong Han8c11e792008-12-08 15:29:22 +08003659 iommu_flush_write_buffer(iommu);
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003660
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003661 return nelems;
3662}
3663
FUJITA Tomonoridfb805e2009-01-28 21:53:17 +09003664static int intel_mapping_error(struct device *dev, dma_addr_t dma_addr)
3665{
3666 return !dma_addr;
3667}
3668
FUJITA Tomonori160c1d82009-01-05 23:59:02 +09003669struct dma_map_ops intel_dma_ops = {
Andrzej Pietrasiewiczbaa676f2012-03-27 14:28:18 +02003670 .alloc = intel_alloc_coherent,
3671 .free = intel_free_coherent,
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003672 .map_sg = intel_map_sg,
3673 .unmap_sg = intel_unmap_sg,
FUJITA Tomonoriffbbef52009-01-05 23:47:26 +09003674 .map_page = intel_map_page,
3675 .unmap_page = intel_unmap_page,
FUJITA Tomonoridfb805e2009-01-28 21:53:17 +09003676 .mapping_error = intel_mapping_error,
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003677};
3678
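/*
 * intel_iommu_init() installs this as the global dma_ops once DMA
 * remapping is up, so dma_map_page()/dma_map_sg() and friends dispatch
 * through the functions above unless a device carries its own dma_ops.
 */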
3679static inline int iommu_domain_cache_init(void)
3680{
3681 int ret = 0;
3682
3683 iommu_domain_cache = kmem_cache_create("iommu_domain",
3684 sizeof(struct dmar_domain),
3685 0,
3686 SLAB_HWCACHE_ALIGN,
3688 NULL);
3689 if (!iommu_domain_cache) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003690 pr_err("Couldn't create iommu_domain cache\n");
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003691 ret = -ENOMEM;
3692 }
3693
3694 return ret;
3695}
3696
3697static inline int iommu_devinfo_cache_init(void)
3698{
3699 int ret = 0;
3700
3701 iommu_devinfo_cache = kmem_cache_create("iommu_devinfo",
3702 sizeof(struct device_domain_info),
3703 0,
3704 SLAB_HWCACHE_ALIGN,
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003705 NULL);
3706 if (!iommu_devinfo_cache) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02003707 pr_err("Couldn't create devinfo cache\n");
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003708 ret = -ENOMEM;
3709 }
3710
3711 return ret;
3712}
3713
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003714static int __init iommu_init_mempool(void)
3715{
3716 int ret;
Sakari Ailusae1ff3d2015-07-13 14:31:28 +03003717 ret = iova_cache_get();
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003718 if (ret)
3719 return ret;
3720
3721 ret = iommu_domain_cache_init();
3722 if (ret)
3723 goto domain_error;
3724
3725 ret = iommu_devinfo_cache_init();
3726 if (!ret)
3727 return ret;
3728
3729 kmem_cache_destroy(iommu_domain_cache);
3730domain_error:
Sakari Ailusae1ff3d2015-07-13 14:31:28 +03003731 iova_cache_put();
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003732
3733 return -ENOMEM;
3734}
3735
3736static void __init iommu_exit_mempool(void)
3737{
3738 kmem_cache_destroy(iommu_devinfo_cache);
3739 kmem_cache_destroy(iommu_domain_cache);
Sakari Ailusae1ff3d2015-07-13 14:31:28 +03003740 iova_cache_put();
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003741}
3742
Dan Williams556ab452010-07-23 15:47:56 -07003743static void quirk_ioat_snb_local_iommu(struct pci_dev *pdev)
3744{
3745 struct dmar_drhd_unit *drhd;
3746 u32 vtbar;
3747 int rc;
3748
3749 /* We know that this device on this chipset has its own IOMMU.
3750 * If we find it under a different IOMMU, then the BIOS is lying
3751 * to us. Hope that the IOMMU for this device is actually
3752 * disabled, and it needs no translation...
3753 */
3754 rc = pci_bus_read_config_dword(pdev->bus, PCI_DEVFN(0, 0), 0xb0, &vtbar);
3755 if (rc) {
3756 /* "can't" happen */
3757 dev_info(&pdev->dev, "failed to run vt-d quirk\n");
3758 return;
3759 }
3760 vtbar &= 0xffff0000;
3761
3762	/* we know that this iommu should be at offset 0xa000 from vtbar */
3763 drhd = dmar_find_matched_drhd_unit(pdev);
3764 if (WARN_TAINT_ONCE(!drhd || drhd->reg_base_addr - vtbar != 0xa000,
3765 TAINT_FIRMWARE_WORKAROUND,
3766 "BIOS assigned incorrect VT-d unit for Intel(R) QuickData Technology device\n"))
3767 pdev->dev.archdata.iommu = DUMMY_DEVICE_DOMAIN_INFO;
3768}
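/*
 * DECLARE_PCI_FIXUP_ENABLE runs the quirk from pci_enable_device(),
 * early enough to mark the device with DUMMY_DEVICE_DOMAIN_INFO before
 * any DMA mapping is attempted.
 */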
3769DECLARE_PCI_FIXUP_ENABLE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_IOAT_SNB, quirk_ioat_snb_local_iommu);
3770
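/*
 * Two passes over the DRHD units: first, mark any non-INCLUDE_ALL unit
 * with an empty device scope as ignored; second, for units that cover
 * only graphics devices, either note that graphics is IOMMU-mapped
 * (when dmar_map_gfx is set) or ignore the unit and hand its devices
 * DUMMY_DEVICE_DOMAIN_INFO.
 */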
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003771static void __init init_no_remapping_devices(void)
3772{
3773 struct dmar_drhd_unit *drhd;
David Woodhouse832bd852014-03-07 15:08:36 +00003774 struct device *dev;
Jiang Liub683b232014-02-19 14:07:32 +08003775 int i;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003776
3777 for_each_drhd_unit(drhd) {
3778 if (!drhd->include_all) {
Jiang Liub683b232014-02-19 14:07:32 +08003779 for_each_active_dev_scope(drhd->devices,
3780 drhd->devices_cnt, i, dev)
3781 break;
David Woodhouse832bd852014-03-07 15:08:36 +00003782 /* ignore DMAR unit if no devices exist */
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003783 if (i == drhd->devices_cnt)
3784 drhd->ignored = 1;
3785 }
3786 }
3787
Jiang Liu7c919772014-01-06 14:18:18 +08003788 for_each_active_drhd_unit(drhd) {
Jiang Liu7c919772014-01-06 14:18:18 +08003789 if (drhd->include_all)
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003790 continue;
3791
Jiang Liub683b232014-02-19 14:07:32 +08003792 for_each_active_dev_scope(drhd->devices,
3793 drhd->devices_cnt, i, dev)
David Woodhouse832bd852014-03-07 15:08:36 +00003794 if (!dev_is_pci(dev) || !IS_GFX_DEVICE(to_pci_dev(dev)))
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003795 break;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003796 if (i < drhd->devices_cnt)
3797 continue;
3798
David Woodhousec0771df2011-10-14 20:59:46 +01003799 /* This IOMMU has *only* gfx devices. Either bypass it or
3800 set the gfx_mapped flag, as appropriate */
3801 if (dmar_map_gfx) {
3802 intel_iommu_gfx_mapped = 1;
3803 } else {
3804 drhd->ignored = 1;
Jiang Liub683b232014-02-19 14:07:32 +08003805 for_each_active_dev_scope(drhd->devices,
3806 drhd->devices_cnt, i, dev)
David Woodhouse832bd852014-03-07 15:08:36 +00003807 dev->archdata.iommu = DUMMY_DEVICE_DOMAIN_INFO;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07003808 }
3809 }
3810}
3811
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003812#ifdef CONFIG_SUSPEND
3813static int init_iommu_hw(void)
3814{
3815 struct dmar_drhd_unit *drhd;
3816 struct intel_iommu *iommu = NULL;
3817
3818 for_each_active_iommu(iommu, drhd)
3819 if (iommu->qi)
3820 dmar_reenable_qi(iommu);
3821
Joseph Cihulab7792602011-05-03 00:08:37 -07003822 for_each_iommu(iommu, drhd) {
3823 if (drhd->ignored) {
3824 /*
3825 * we always have to disable PMRs or DMA may fail on
3826 * this device
3827 */
3828 if (force_on)
3829 iommu_disable_protect_mem_regions(iommu);
3830 continue;
3831 }
3832
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003833 iommu_flush_write_buffer(iommu);
3834
3835 iommu_set_root_entry(iommu);
3836
3837 iommu->flush.flush_context(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003838 DMA_CCMD_GLOBAL_INVL);
Jiang Liu2a41cce2014-07-11 14:19:33 +08003839 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
3840 iommu_enable_translation(iommu);
David Woodhouseb94996c2009-09-19 15:28:12 -07003841 iommu_disable_protect_mem_regions(iommu);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003842 }
3843
3844 return 0;
3845}
3846
3847static void iommu_flush_all(void)
3848{
3849 struct dmar_drhd_unit *drhd;
3850 struct intel_iommu *iommu;
3851
3852 for_each_active_iommu(iommu, drhd) {
3853 iommu->flush.flush_context(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003854 DMA_CCMD_GLOBAL_INVL);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003855 iommu->flush.flush_iotlb(iommu, 0, 0, 0,
David Woodhouse1f0ef2a2009-05-10 19:58:49 +01003856 DMA_TLB_GLOBAL_FLUSH);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003857 }
3858}
3859
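/*
 * The IOMMU loses its programming across suspend, so iommu_suspend()
 * saves the four fault-event registers (FECTL, FEDATA, FEADDR, FEUADDR)
 * per unit after a global context/IOTLB flush, and iommu_resume()
 * re-runs init_iommu_hw() before writing them back.
 */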
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01003860static int iommu_suspend(void)
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003861{
3862 struct dmar_drhd_unit *drhd;
3863 struct intel_iommu *iommu = NULL;
3864 unsigned long flag;
3865
3866 for_each_active_iommu(iommu, drhd) {
3867 iommu->iommu_state = kzalloc(sizeof(u32) * MAX_SR_DMAR_REGS,
3868 GFP_ATOMIC);
3869 if (!iommu->iommu_state)
3870 goto nomem;
3871 }
3872
3873 iommu_flush_all();
3874
3875 for_each_active_iommu(iommu, drhd) {
3876 iommu_disable_translation(iommu);
3877
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02003878 raw_spin_lock_irqsave(&iommu->register_lock, flag);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003879
3880 iommu->iommu_state[SR_DMAR_FECTL_REG] =
3881 readl(iommu->reg + DMAR_FECTL_REG);
3882 iommu->iommu_state[SR_DMAR_FEDATA_REG] =
3883 readl(iommu->reg + DMAR_FEDATA_REG);
3884 iommu->iommu_state[SR_DMAR_FEADDR_REG] =
3885 readl(iommu->reg + DMAR_FEADDR_REG);
3886 iommu->iommu_state[SR_DMAR_FEUADDR_REG] =
3887 readl(iommu->reg + DMAR_FEUADDR_REG);
3888
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02003889 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003890 }
3891 return 0;
3892
3893nomem:
3894 for_each_active_iommu(iommu, drhd)
3895 kfree(iommu->iommu_state);
3896
3897 return -ENOMEM;
3898}
3899
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01003900static void iommu_resume(void)
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003901{
3902 struct dmar_drhd_unit *drhd;
3903 struct intel_iommu *iommu = NULL;
3904 unsigned long flag;
3905
3906 if (init_iommu_hw()) {
Joseph Cihulab7792602011-05-03 00:08:37 -07003907 if (force_on)
3908 panic("tboot: IOMMU setup failed, DMAR can not resume!\n");
3909 else
3910 WARN(1, "IOMMU setup failed, DMAR can not resume!\n");
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01003911 return;
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003912 }
3913
3914 for_each_active_iommu(iommu, drhd) {
3915
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02003916 raw_spin_lock_irqsave(&iommu->register_lock, flag);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003917
3918 writel(iommu->iommu_state[SR_DMAR_FECTL_REG],
3919 iommu->reg + DMAR_FECTL_REG);
3920 writel(iommu->iommu_state[SR_DMAR_FEDATA_REG],
3921 iommu->reg + DMAR_FEDATA_REG);
3922 writel(iommu->iommu_state[SR_DMAR_FEADDR_REG],
3923 iommu->reg + DMAR_FEADDR_REG);
3924 writel(iommu->iommu_state[SR_DMAR_FEUADDR_REG],
3925 iommu->reg + DMAR_FEUADDR_REG);
3926
Thomas Gleixner1f5b3c32011-07-19 16:19:51 +02003927 raw_spin_unlock_irqrestore(&iommu->register_lock, flag);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003928 }
3929
3930 for_each_active_iommu(iommu, drhd)
3931 kfree(iommu->iommu_state);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003932}
3933
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01003934static struct syscore_ops iommu_syscore_ops = {
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003935 .resume = iommu_resume,
3936 .suspend = iommu_suspend,
3937};
3938
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01003939static void __init init_iommu_pm_ops(void)
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003940{
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01003941 register_syscore_ops(&iommu_syscore_ops);
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003942}
3943
3944#else
Rafael J. Wysocki99592ba2011-06-07 21:32:31 +02003945static inline void init_iommu_pm_ops(void) {}
Fenghua Yuf59c7b62009-03-27 14:22:42 -07003946#endif /* CONFIG_SUSPEND */
3947
Suresh Siddha318fe7d2011-08-23 17:05:20 -07003948
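/*
 * RMRRs (Reserved Memory Region Reporting structures) declare ranges the
 * BIOS expects to remain identity-mapped for particular devices, such as
 * USB legacy-keyboard buffers or graphics stolen memory; they are parsed
 * into dmar_rmrr_units for later identity mapping.
 */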
Jiang Liuc2a0b532014-11-09 22:47:56 +08003949int __init dmar_parse_one_rmrr(struct acpi_dmar_header *header, void *arg)
Suresh Siddha318fe7d2011-08-23 17:05:20 -07003950{
3951 struct acpi_dmar_reserved_memory *rmrr;
3952 struct dmar_rmrr_unit *rmrru;
3953
3954 rmrru = kzalloc(sizeof(*rmrru), GFP_KERNEL);
3955 if (!rmrru)
3956 return -ENOMEM;
3957
3958 rmrru->hdr = header;
3959 rmrr = (struct acpi_dmar_reserved_memory *)header;
3960 rmrru->base_address = rmrr->base_address;
3961 rmrru->end_address = rmrr->end_address;
Jiang Liu2e455282014-02-19 14:07:36 +08003962 rmrru->devices = dmar_alloc_dev_scope((void *)(rmrr + 1),
3963 ((void *)rmrr) + rmrr->header.length,
3964 &rmrru->devices_cnt);
3965 if (rmrru->devices_cnt && rmrru->devices == NULL) {
3966 kfree(rmrru);
3967 return -ENOMEM;
3968 }
Suresh Siddha318fe7d2011-08-23 17:05:20 -07003969
Jiang Liu2e455282014-02-19 14:07:36 +08003970 list_add(&rmrru->list, &dmar_rmrr_units);
3971
Suresh Siddha318fe7d2011-08-23 17:05:20 -07003972 return 0;
3973}
3974
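/*
 * ATSRs name the PCIe root ports below which Address Translation
 * Services (device-side IOTLBs) may be used;
 * dmar_find_matched_atsr_unit() consults this list before ATS is
 * enabled for a device.
 */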
Jiang Liu6b197242014-11-09 22:47:58 +08003975static struct dmar_atsr_unit *dmar_find_atsr(struct acpi_dmar_atsr *atsr)
3976{
3977 struct dmar_atsr_unit *atsru;
3978 struct acpi_dmar_atsr *tmp;
3979
3980 list_for_each_entry_rcu(atsru, &dmar_atsr_units, list) {
3981 tmp = (struct acpi_dmar_atsr *)atsru->hdr;
3982 if (atsr->segment != tmp->segment)
3983 continue;
3984 if (atsr->header.length != tmp->header.length)
3985 continue;
3986 if (memcmp(atsr, tmp, atsr->header.length) == 0)
3987 return atsru;
3988 }
3989
3990 return NULL;
3991}
3992
3993int dmar_parse_one_atsr(struct acpi_dmar_header *hdr, void *arg)
Suresh Siddha318fe7d2011-08-23 17:05:20 -07003994{
3995 struct acpi_dmar_atsr *atsr;
3996 struct dmar_atsr_unit *atsru;
3997
Jiang Liu6b197242014-11-09 22:47:58 +08003998 if (system_state != SYSTEM_BOOTING && !intel_iommu_enabled)
3999 return 0;
4000
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004001 atsr = container_of(hdr, struct acpi_dmar_atsr, header);
Jiang Liu6b197242014-11-09 22:47:58 +08004002 atsru = dmar_find_atsr(atsr);
4003 if (atsru)
4004 return 0;
4005
4006 atsru = kzalloc(sizeof(*atsru) + hdr->length, GFP_KERNEL);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004007 if (!atsru)
4008 return -ENOMEM;
4009
Jiang Liu6b197242014-11-09 22:47:58 +08004010 /*
4011 * If memory is allocated from slab by ACPI _DSM method, we need to
4012 * copy the memory content because the memory buffer will be freed
4013 * on return.
4014 */
4015 atsru->hdr = (void *)(atsru + 1);
4016 memcpy(atsru->hdr, hdr, hdr->length);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004017 atsru->include_all = atsr->flags & 0x1;
Jiang Liu2e455282014-02-19 14:07:36 +08004018 if (!atsru->include_all) {
4019 atsru->devices = dmar_alloc_dev_scope((void *)(atsr + 1),
4020 (void *)atsr + atsr->header.length,
4021 &atsru->devices_cnt);
4022 if (atsru->devices_cnt && atsru->devices == NULL) {
4023 kfree(atsru);
4024 return -ENOMEM;
4025 }
4026 }
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004027
Jiang Liu0e2426122014-02-19 14:07:34 +08004028 list_add_rcu(&atsru->list, &dmar_atsr_units);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004029
4030 return 0;
4031}
4032
Jiang Liu9bdc5312014-01-06 14:18:27 +08004033static void intel_iommu_free_atsr(struct dmar_atsr_unit *atsru)
4034{
4035 dmar_free_dev_scope(&atsru->devices, &atsru->devices_cnt);
4036 kfree(atsru);
4037}
4038
Jiang Liu6b197242014-11-09 22:47:58 +08004039int dmar_release_one_atsr(struct acpi_dmar_header *hdr, void *arg)
4040{
4041 struct acpi_dmar_atsr *atsr;
4042 struct dmar_atsr_unit *atsru;
4043
4044 atsr = container_of(hdr, struct acpi_dmar_atsr, header);
4045 atsru = dmar_find_atsr(atsr);
4046 if (atsru) {
4047 list_del_rcu(&atsru->list);
4048 synchronize_rcu();
4049 intel_iommu_free_atsr(atsru);
4050 }
4051
4052 return 0;
4053}
4054
4055int dmar_check_one_atsr(struct acpi_dmar_header *hdr, void *arg)
4056{
4057 int i;
4058 struct device *dev;
4059 struct acpi_dmar_atsr *atsr;
4060 struct dmar_atsr_unit *atsru;
4061
4062 atsr = container_of(hdr, struct acpi_dmar_atsr, header);
4063 atsru = dmar_find_atsr(atsr);
4064 if (!atsru)
4065 return 0;
4066
4067 if (!atsru->include_all && atsru->devices && atsru->devices_cnt)
4068 for_each_active_dev_scope(atsru->devices, atsru->devices_cnt,
4069 i, dev)
4070 return -EBUSY;
4071
4072 return 0;
4073}
4074
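/*
 * Bring a hot-added DMAR unit online: check that it matches the
 * system-wide pass-through/snooping/superpage configuration, allocate
 * its domain IDs and root entry, start queued invalidation and the
 * fault interrupt, then enable translation.
 */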
Jiang Liuffebeb42014-11-09 22:48:02 +08004075static int intel_iommu_add(struct dmar_drhd_unit *dmaru)
4076{
4077 int sp, ret = 0;
4078 struct intel_iommu *iommu = dmaru->iommu;
4079
4080 if (g_iommus[iommu->seq_id])
4081 return 0;
4082
4083 if (hw_pass_through && !ecap_pass_through(iommu->ecap)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004084 pr_warn("%s: Doesn't support hardware pass through.\n",
Jiang Liuffebeb42014-11-09 22:48:02 +08004085 iommu->name);
4086 return -ENXIO;
4087 }
4088 if (!ecap_sc_support(iommu->ecap) &&
4089 domain_update_iommu_snooping(iommu)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004090 pr_warn("%s: Doesn't support snooping.\n",
Jiang Liuffebeb42014-11-09 22:48:02 +08004091 iommu->name);
4092 return -ENXIO;
4093 }
4094 sp = domain_update_iommu_superpage(iommu) - 1;
4095 if (sp >= 0 && !(cap_super_page_val(iommu->cap) & (1 << sp))) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004096 pr_warn("%s: Doesn't support large page.\n",
Jiang Liuffebeb42014-11-09 22:48:02 +08004097 iommu->name);
4098 return -ENXIO;
4099 }
4100
4101 /*
4102 * Disable translation if already enabled prior to OS handover.
4103 */
4104 if (iommu->gcmd & DMA_GCMD_TE)
4105 iommu_disable_translation(iommu);
4106
4107 g_iommus[iommu->seq_id] = iommu;
4108 ret = iommu_init_domains(iommu);
4109 if (ret == 0)
4110 ret = iommu_alloc_root_entry(iommu);
4111 if (ret)
4112 goto out;
4113
4114 if (dmaru->ignored) {
4115 /*
4116 * we always have to disable PMRs or DMA may fail on this device
4117 */
4118 if (force_on)
4119 iommu_disable_protect_mem_regions(iommu);
4120 return 0;
4121 }
4122
4123 intel_iommu_init_qi(iommu);
4124 iommu_flush_write_buffer(iommu);
4125 ret = dmar_set_interrupt(iommu);
4126 if (ret)
4127 goto disable_iommu;
4128
4129 iommu_set_root_entry(iommu);
4130 iommu->flush.flush_context(iommu, 0, 0, 0, DMA_CCMD_GLOBAL_INVL);
4131 iommu->flush.flush_iotlb(iommu, 0, 0, 0, DMA_TLB_GLOBAL_FLUSH);
4132 iommu_enable_translation(iommu);
4133
Jiang Liuffebeb42014-11-09 22:48:02 +08004134 iommu_disable_protect_mem_regions(iommu);
4135 return 0;
4136
4137disable_iommu:
4138 disable_dmar_iommu(iommu);
4139out:
4140 free_dmar_iommu(iommu);
4141 return ret;
4142}
4143
Jiang Liu6b197242014-11-09 22:47:58 +08004144int dmar_iommu_hotplug(struct dmar_drhd_unit *dmaru, bool insert)
4145{
Jiang Liuffebeb42014-11-09 22:48:02 +08004146 int ret = 0;
4147 struct intel_iommu *iommu = dmaru->iommu;
4148
4149 if (!intel_iommu_enabled)
4150 return 0;
4151 if (iommu == NULL)
4152 return -EINVAL;
4153
4154 if (insert) {
4155 ret = intel_iommu_add(dmaru);
4156 } else {
4157 disable_dmar_iommu(iommu);
4158 free_dmar_iommu(iommu);
4159 }
4160
4161 return ret;
Jiang Liu6b197242014-11-09 22:47:58 +08004162}
4163
Jiang Liu9bdc5312014-01-06 14:18:27 +08004164static void intel_iommu_free_dmars(void)
4165{
4166 struct dmar_rmrr_unit *rmrru, *rmrr_n;
4167 struct dmar_atsr_unit *atsru, *atsr_n;
4168
4169 list_for_each_entry_safe(rmrru, rmrr_n, &dmar_rmrr_units, list) {
4170 list_del(&rmrru->list);
4171 dmar_free_dev_scope(&rmrru->devices, &rmrru->devices_cnt);
4172 kfree(rmrru);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004173 }
4174
Jiang Liu9bdc5312014-01-06 14:18:27 +08004175 list_for_each_entry_safe(atsru, atsr_n, &dmar_atsr_units, list) {
4176 list_del(&atsru->list);
4177 intel_iommu_free_atsr(atsru);
4178 }
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004179}
4180
4181int dmar_find_matched_atsr_unit(struct pci_dev *dev)
4182{
Jiang Liub683b232014-02-19 14:07:32 +08004183 int i, ret = 1;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004184 struct pci_bus *bus;
David Woodhouse832bd852014-03-07 15:08:36 +00004185 struct pci_dev *bridge = NULL;
4186 struct device *tmp;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004187 struct acpi_dmar_atsr *atsr;
4188 struct dmar_atsr_unit *atsru;
4189
4190 dev = pci_physfn(dev);
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004191 for (bus = dev->bus; bus; bus = bus->parent) {
Jiang Liub5f82dd2014-02-19 14:07:31 +08004192 bridge = bus->self;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004193 if (!bridge || !pci_is_pcie(bridge) ||
Yijing Wang62f87c02012-07-24 17:20:03 +08004194 pci_pcie_type(bridge) == PCI_EXP_TYPE_PCI_BRIDGE)
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004195 return 0;
Jiang Liub5f82dd2014-02-19 14:07:31 +08004196 if (pci_pcie_type(bridge) == PCI_EXP_TYPE_ROOT_PORT)
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004197 break;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004198 }
Jiang Liub5f82dd2014-02-19 14:07:31 +08004199 if (!bridge)
4200 return 0;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004201
Jiang Liu0e2426122014-02-19 14:07:34 +08004202 rcu_read_lock();
Jiang Liub5f82dd2014-02-19 14:07:31 +08004203 list_for_each_entry_rcu(atsru, &dmar_atsr_units, list) {
4204 atsr = container_of(atsru->hdr, struct acpi_dmar_atsr, header);
4205 if (atsr->segment != pci_domain_nr(dev->bus))
4206 continue;
4207
Jiang Liub683b232014-02-19 14:07:32 +08004208 for_each_dev_scope(atsru->devices, atsru->devices_cnt, i, tmp)
David Woodhouse832bd852014-03-07 15:08:36 +00004209 if (tmp == &bridge->dev)
Jiang Liub683b232014-02-19 14:07:32 +08004210 goto out;
Jiang Liub5f82dd2014-02-19 14:07:31 +08004211
4212 if (atsru->include_all)
Jiang Liub683b232014-02-19 14:07:32 +08004213 goto out;
Jiang Liub5f82dd2014-02-19 14:07:31 +08004214 }
Jiang Liub683b232014-02-19 14:07:32 +08004215 ret = 0;
4216out:
Jiang Liu0e2426122014-02-19 14:07:34 +08004217 rcu_read_unlock();
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004218
Jiang Liub683b232014-02-19 14:07:32 +08004219 return ret;
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004220}
4221
Jiang Liu59ce0512014-02-19 14:07:35 +08004222int dmar_iommu_notify_scope_dev(struct dmar_pci_notify_info *info)
4223{
4224 int ret = 0;
4225 struct dmar_rmrr_unit *rmrru;
4226 struct dmar_atsr_unit *atsru;
4227 struct acpi_dmar_atsr *atsr;
4228 struct acpi_dmar_reserved_memory *rmrr;
4229
4230 if (!intel_iommu_enabled && system_state != SYSTEM_BOOTING)
4231 return 0;
4232
4233 list_for_each_entry(rmrru, &dmar_rmrr_units, list) {
4234 rmrr = container_of(rmrru->hdr,
4235 struct acpi_dmar_reserved_memory, header);
4236 if (info->event == BUS_NOTIFY_ADD_DEVICE) {
4237 ret = dmar_insert_dev_scope(info, (void *)(rmrr + 1),
4238 ((void *)rmrr) + rmrr->header.length,
4239 rmrr->segment, rmrru->devices,
4240 rmrru->devices_cnt);
Jiang Liu27e24952014-06-20 15:08:06 +08004241			if (ret < 0)
Jiang Liu59ce0512014-02-19 14:07:35 +08004242 return ret;
4243 } else if (info->event == BUS_NOTIFY_DEL_DEVICE) {
Jiang Liu27e24952014-06-20 15:08:06 +08004244 dmar_remove_dev_scope(info, rmrr->segment,
4245 rmrru->devices, rmrru->devices_cnt);
Jiang Liu59ce0512014-02-19 14:07:35 +08004246 }
4247 }
4248
4249 list_for_each_entry(atsru, &dmar_atsr_units, list) {
4250 if (atsru->include_all)
4251 continue;
4252
4253 atsr = container_of(atsru->hdr, struct acpi_dmar_atsr, header);
4254 if (info->event == BUS_NOTIFY_ADD_DEVICE) {
4255 ret = dmar_insert_dev_scope(info, (void *)(atsr + 1),
4256 (void *)atsr + atsr->header.length,
4257 atsr->segment, atsru->devices,
4258 atsru->devices_cnt);
4259 if (ret > 0)
4260 break;
4261			else if (ret < 0)
4262 return ret;
4263 } else if (info->event == BUS_NOTIFY_DEL_DEVICE) {
4264 if (dmar_remove_dev_scope(info, atsr->segment,
4265 atsru->devices, atsru->devices_cnt))
4266 break;
4267 }
4268 }
4269
4270 return 0;
4271}
4272
Fenghua Yu99dcade2009-11-11 07:23:06 -08004273/*
4274 * Here we only respond to a device being unbound from its driver.
4275 *
4276 * A newly added device is not attached to its DMAR domain here yet; that
4277 * happens when the device is first mapped to an IOVA.
4278 */
4279static int device_notifier(struct notifier_block *nb,
4280 unsigned long action, void *data)
4281{
4282 struct device *dev = data;
Fenghua Yu99dcade2009-11-11 07:23:06 -08004283 struct dmar_domain *domain;
4284
David Woodhouse3d891942014-03-06 15:59:26 +00004285 if (iommu_dummy(dev))
David Woodhouse44cd6132009-12-02 10:18:30 +00004286 return 0;
4287
Joerg Roedel1196c2f2014-09-30 13:02:03 +02004288 if (action != BUS_NOTIFY_REMOVED_DEVICE)
Jiang Liu7e7dfab2014-02-19 14:07:23 +08004289 return 0;
4290
David Woodhouse1525a292014-03-06 16:19:30 +00004291 domain = find_domain(dev);
Fenghua Yu99dcade2009-11-11 07:23:06 -08004292 if (!domain)
4293 return 0;
4294
Joerg Roedele6de0f82015-07-22 16:30:36 +02004295 dmar_remove_one_dev_info(domain, dev);
Jiang Liuab8dfe22014-07-11 14:19:27 +08004296 if (!domain_type_is_vm_or_si(domain) && list_empty(&domain->devices))
Jiang Liu7e7dfab2014-02-19 14:07:23 +08004297 domain_exit(domain);
Alex Williamsona97590e2011-03-04 14:52:16 -07004298
Fenghua Yu99dcade2009-11-11 07:23:06 -08004299 return 0;
4300}
4301
4302static struct notifier_block device_nb = {
4303 .notifier_call = device_notifier,
4304};
4305
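/*
 * Keep the static-identity (si) domain in sync with memory hotplug:
 * extend the identity map when a region goes online, and unmap it and
 * flush every IOMMU when the region goes offline again.
 */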
Jiang Liu75f05562014-02-19 14:07:37 +08004306static int intel_iommu_memory_notifier(struct notifier_block *nb,
4307 unsigned long val, void *v)
4308{
4309 struct memory_notify *mhp = v;
4310 unsigned long long start, end;
4311 unsigned long start_vpfn, last_vpfn;
4312
4313 switch (val) {
4314 case MEM_GOING_ONLINE:
4315 start = mhp->start_pfn << PAGE_SHIFT;
4316 end = ((mhp->start_pfn + mhp->nr_pages) << PAGE_SHIFT) - 1;
4317 if (iommu_domain_identity_map(si_domain, start, end)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004318 pr_warn("Failed to build identity map for [%llx-%llx]\n",
Jiang Liu75f05562014-02-19 14:07:37 +08004319 start, end);
4320 return NOTIFY_BAD;
4321 }
4322 break;
4323
4324 case MEM_OFFLINE:
4325 case MEM_CANCEL_ONLINE:
4326 start_vpfn = mm_to_dma_pfn(mhp->start_pfn);
4327 last_vpfn = mm_to_dma_pfn(mhp->start_pfn + mhp->nr_pages - 1);
4328 while (start_vpfn <= last_vpfn) {
4329 struct iova *iova;
4330 struct dmar_drhd_unit *drhd;
4331 struct intel_iommu *iommu;
David Woodhouseea8ea462014-03-05 17:09:32 +00004332 struct page *freelist;
Jiang Liu75f05562014-02-19 14:07:37 +08004333
4334 iova = find_iova(&si_domain->iovad, start_vpfn);
4335 if (iova == NULL) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004336 pr_debug("Failed get IOVA for PFN %lx\n",
Jiang Liu75f05562014-02-19 14:07:37 +08004337 start_vpfn);
4338 break;
4339 }
4340
4341 iova = split_and_remove_iova(&si_domain->iovad, iova,
4342 start_vpfn, last_vpfn);
4343 if (iova == NULL) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004344 pr_warn("Failed to split IOVA PFN [%lx-%lx]\n",
Jiang Liu75f05562014-02-19 14:07:37 +08004345 start_vpfn, last_vpfn);
4346 return NOTIFY_BAD;
4347 }
4348
David Woodhouseea8ea462014-03-05 17:09:32 +00004349 freelist = domain_unmap(si_domain, iova->pfn_lo,
4350 iova->pfn_hi);
4351
Jiang Liu75f05562014-02-19 14:07:37 +08004352 rcu_read_lock();
4353 for_each_active_iommu(iommu, drhd)
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02004354 iommu_flush_iotlb_psi(iommu, si_domain,
Jiang Liua156ef92014-07-11 14:19:36 +08004355 iova->pfn_lo, iova_size(iova),
David Woodhouseea8ea462014-03-05 17:09:32 +00004356 !freelist, 0);
Jiang Liu75f05562014-02-19 14:07:37 +08004357 rcu_read_unlock();
David Woodhouseea8ea462014-03-05 17:09:32 +00004358 dma_free_pagelist(freelist);
Jiang Liu75f05562014-02-19 14:07:37 +08004359
4360 start_vpfn = iova->pfn_hi + 1;
4361 free_iova_mem(iova);
4362 }
4363 break;
4364 }
4365
4366 return NOTIFY_OK;
4367}
4368
4369static struct notifier_block intel_iommu_memory_nb = {
4370 .notifier_call = intel_iommu_memory_notifier,
4371 .priority = 0
4372};
4373
Alex Williamsona5459cf2014-06-12 16:12:31 -06004374
4375static ssize_t intel_iommu_show_version(struct device *dev,
4376 struct device_attribute *attr,
4377 char *buf)
4378{
4379 struct intel_iommu *iommu = dev_get_drvdata(dev);
4380 u32 ver = readl(iommu->reg + DMAR_VER_REG);
4381 return sprintf(buf, "%d:%d\n",
4382 DMAR_VER_MAJOR(ver), DMAR_VER_MINOR(ver));
4383}
4384static DEVICE_ATTR(version, S_IRUGO, intel_iommu_show_version, NULL);
4385
4386static ssize_t intel_iommu_show_address(struct device *dev,
4387 struct device_attribute *attr,
4388 char *buf)
4389{
4390 struct intel_iommu *iommu = dev_get_drvdata(dev);
4391 return sprintf(buf, "%llx\n", iommu->reg_phys);
4392}
4393static DEVICE_ATTR(address, S_IRUGO, intel_iommu_show_address, NULL);
4394
4395static ssize_t intel_iommu_show_cap(struct device *dev,
4396 struct device_attribute *attr,
4397 char *buf)
4398{
4399 struct intel_iommu *iommu = dev_get_drvdata(dev);
4400 return sprintf(buf, "%llx\n", iommu->cap);
4401}
4402static DEVICE_ATTR(cap, S_IRUGO, intel_iommu_show_cap, NULL);
4403
4404static ssize_t intel_iommu_show_ecap(struct device *dev,
4405 struct device_attribute *attr,
4406 char *buf)
4407{
4408 struct intel_iommu *iommu = dev_get_drvdata(dev);
4409 return sprintf(buf, "%llx\n", iommu->ecap);
4410}
4411static DEVICE_ATTR(ecap, S_IRUGO, intel_iommu_show_ecap, NULL);
4412
Alex Williamson2238c082015-07-14 15:24:53 -06004413static ssize_t intel_iommu_show_ndoms(struct device *dev,
4414 struct device_attribute *attr,
4415 char *buf)
4416{
4417 struct intel_iommu *iommu = dev_get_drvdata(dev);
4418 return sprintf(buf, "%ld\n", cap_ndoms(iommu->cap));
4419}
4420static DEVICE_ATTR(domains_supported, S_IRUGO, intel_iommu_show_ndoms, NULL);
4421
4422static ssize_t intel_iommu_show_ndoms_used(struct device *dev,
4423 struct device_attribute *attr,
4424 char *buf)
4425{
4426 struct intel_iommu *iommu = dev_get_drvdata(dev);
4427 return sprintf(buf, "%d\n", bitmap_weight(iommu->domain_ids,
4428 cap_ndoms(iommu->cap)));
4429}
4430static DEVICE_ATTR(domains_used, S_IRUGO, intel_iommu_show_ndoms_used, NULL);
4431
Alex Williamsona5459cf2014-06-12 16:12:31 -06004432static struct attribute *intel_iommu_attrs[] = {
4433 &dev_attr_version.attr,
4434 &dev_attr_address.attr,
4435 &dev_attr_cap.attr,
4436 &dev_attr_ecap.attr,
Alex Williamson2238c082015-07-14 15:24:53 -06004437 &dev_attr_domains_supported.attr,
4438 &dev_attr_domains_used.attr,
Alex Williamsona5459cf2014-06-12 16:12:31 -06004439 NULL,
4440};
4441
4442static struct attribute_group intel_iommu_group = {
4443 .name = "intel-iommu",
4444 .attrs = intel_iommu_attrs,
4445};
4446
4447const struct attribute_group *intel_iommu_groups[] = {
4448 &intel_iommu_group,
4449 NULL,
4450};
4451
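/*
 * These attributes appear under sysfs once iommu_device_create() runs
 * in intel_iommu_init(). Assuming a unit named dmar0, something like
 *
 *	# cat /sys/class/iommu/dmar0/intel-iommu/cap
 *
 * dumps the raw capability register.
 */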
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004452int __init intel_iommu_init(void)
4453{
Jiang Liu9bdc5312014-01-06 14:18:27 +08004454 int ret = -ENODEV;
Takao Indoh3a93c842013-04-23 17:35:03 +09004455 struct dmar_drhd_unit *drhd;
Jiang Liu7c919772014-01-06 14:18:18 +08004456 struct intel_iommu *iommu;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004457
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004458 /* VT-d is required for a TXT/tboot launch, so enforce that */
4459 force_on = tboot_force_iommu();
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004460
Jiang Liu3a5670e2014-02-19 14:07:33 +08004461 if (iommu_init_mempool()) {
4462 if (force_on)
4463 panic("tboot: Failed to initialize iommu memory\n");
4464 return -ENOMEM;
4465 }
4466
4467 down_write(&dmar_global_lock);
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004468 if (dmar_table_init()) {
4469 if (force_on)
4470 panic("tboot: Failed to initialize DMAR table\n");
Jiang Liu9bdc5312014-01-06 14:18:27 +08004471 goto out_free_dmar;
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004472 }
4473
Suresh Siddhac2c72862011-08-23 17:05:19 -07004474 if (dmar_dev_scope_init() < 0) {
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004475 if (force_on)
4476 panic("tboot: Failed to initialize DMAR device scope\n");
Jiang Liu9bdc5312014-01-06 14:18:27 +08004477 goto out_free_dmar;
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004478 }
Suresh Siddha1886e8a2008-07-10 11:16:37 -07004479
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +09004480 if (no_iommu || dmar_disabled)
Jiang Liu9bdc5312014-01-06 14:18:27 +08004481 goto out_free_dmar;
Suresh Siddha2ae21012008-07-10 11:16:43 -07004482
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004483 if (list_empty(&dmar_rmrr_units))
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004484 pr_info("No RMRR found\n");
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004485
4486 if (list_empty(&dmar_atsr_units))
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004487 pr_info("No ATSR found\n");
Suresh Siddha318fe7d2011-08-23 17:05:20 -07004488
Joseph Cihula51a63e62011-03-21 11:04:24 -07004489 if (dmar_init_reserved_ranges()) {
4490 if (force_on)
4491 panic("tboot: Failed to reserve iommu ranges\n");
Jiang Liu3a5670e2014-02-19 14:07:33 +08004492 goto out_free_reserved_range;
Joseph Cihula51a63e62011-03-21 11:04:24 -07004493 }
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004494
4495 init_no_remapping_devices();
4496
Joseph Cihulab7792602011-05-03 00:08:37 -07004497 ret = init_dmars();
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004498 if (ret) {
Joseph Cihulaa59b50e2009-06-30 19:31:10 -07004499 if (force_on)
4500 panic("tboot: Failed to initialize DMARs\n");
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004501 pr_err("Initialization failed\n");
Jiang Liu9bdc5312014-01-06 14:18:27 +08004502 goto out_free_reserved_range;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004503 }
Jiang Liu3a5670e2014-02-19 14:07:33 +08004504 up_write(&dmar_global_lock);
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004505 pr_info("Intel(R) Virtualization Technology for Directed I/O\n");
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004506
mark gross5e0d2a62008-03-04 15:22:08 -08004507 init_timer(&unmap_timer);
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +09004508#ifdef CONFIG_SWIOTLB
4509 swiotlb = 0;
4510#endif
David Woodhouse19943b02009-08-04 16:19:20 +01004511 dma_ops = &intel_dma_ops;
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -07004512
Rafael J. Wysocki134fac32011-03-23 22:16:14 +01004513 init_iommu_pm_ops();
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01004514
Alex Williamsona5459cf2014-06-12 16:12:31 -06004515 for_each_active_iommu(iommu, drhd)
4516 iommu->iommu_dev = iommu_device_create(NULL, iommu,
4517 intel_iommu_groups,
Kees Cook2439d4a2015-07-24 16:27:57 -07004518 "%s", iommu->name);
Alex Williamsona5459cf2014-06-12 16:12:31 -06004519
Joerg Roedel4236d97d2011-09-06 17:56:07 +02004520 bus_set_iommu(&pci_bus_type, &intel_iommu_ops);
Fenghua Yu99dcade2009-11-11 07:23:06 -08004521 bus_register_notifier(&pci_bus_type, &device_nb);
Jiang Liu75f05562014-02-19 14:07:37 +08004522 if (si_domain && !hw_pass_through)
4523 register_memory_notifier(&intel_iommu_memory_nb);
Fenghua Yu99dcade2009-11-11 07:23:06 -08004524
Eugeni Dodonov8bc1f852011-11-23 16:42:14 -02004525 intel_iommu_enabled = 1;
4526
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004527 return 0;
Jiang Liu9bdc5312014-01-06 14:18:27 +08004528
4529out_free_reserved_range:
4530 put_iova_domain(&reserved_iova_list);
Jiang Liu9bdc5312014-01-06 14:18:27 +08004531out_free_dmar:
4532 intel_iommu_free_dmars();
Jiang Liu3a5670e2014-02-19 14:07:33 +08004533 up_write(&dmar_global_lock);
4534 iommu_exit_mempool();
Jiang Liu9bdc5312014-01-06 14:18:27 +08004535 return ret;
Keshavamurthy, Anil Sba3959272007-10-21 16:41:49 -07004536}
Keshavamurthy, Anil Se8204822007-10-21 16:41:55 -07004537
Joerg Roedel2452d9d2015-07-23 16:20:14 +02004538static int domain_context_clear_one_cb(struct pci_dev *pdev, u16 alias, void *opaque)
Alex Williamson579305f2014-07-03 09:51:43 -06004539{
4540 struct intel_iommu *iommu = opaque;
4541
Joerg Roedel2452d9d2015-07-23 16:20:14 +02004542 domain_context_clear_one(iommu, PCI_BUS_NUM(alias), alias & 0xff);
Alex Williamson579305f2014-07-03 09:51:43 -06004543 return 0;
4544}
4545
4546/*
4547 * NB - intel-iommu lacks any sort of reference counting for the users of
4548 * dependent devices. If multiple endpoints have intersecting dependent
4549 * devices, unbinding the driver from any one of them will possibly leave
4550 * the others unable to operate.
4551 */
Joerg Roedel2452d9d2015-07-23 16:20:14 +02004552static void domain_context_clear(struct intel_iommu *iommu, struct device *dev)
Han, Weidong3199aa62009-02-26 17:31:12 +08004553{
David Woodhouse0bcb3e22014-03-06 17:12:03 +00004554 if (!iommu || !dev || !dev_is_pci(dev))
Han, Weidong3199aa62009-02-26 17:31:12 +08004555 return;
4556
Joerg Roedel2452d9d2015-07-23 16:20:14 +02004557 pci_for_each_dma_alias(to_pci_dev(dev), &domain_context_clear_one_cb, iommu);
Han, Weidong3199aa62009-02-26 17:31:12 +08004558}
4559
Joerg Roedel127c7612015-07-23 17:44:46 +02004560static void __dmar_remove_one_dev_info(struct device_domain_info *info)
Weidong Hanc7151a82008-12-08 22:51:37 +08004561{
Weidong Hanc7151a82008-12-08 22:51:37 +08004562 struct intel_iommu *iommu;
4563 unsigned long flags;
Weidong Hanc7151a82008-12-08 22:51:37 +08004564
Joerg Roedel55d94042015-07-22 16:50:40 +02004565 assert_spin_locked(&device_domain_lock);
4566
Joerg Roedelb608ac32015-07-21 18:19:08 +02004567 if (WARN_ON(!info))
Weidong Hanc7151a82008-12-08 22:51:37 +08004568 return;
4569
Joerg Roedel127c7612015-07-23 17:44:46 +02004570 iommu = info->iommu;
4571
4572 if (info->dev) {
4573 iommu_disable_dev_iotlb(info);
4574 domain_context_clear(iommu, info->dev);
4575 }
4576
Joerg Roedelb608ac32015-07-21 18:19:08 +02004577 unlink_domain_info(info);
Roland Dreier3e7abe22011-07-20 06:22:21 -07004578
Joerg Roedeld160aca2015-07-22 11:52:53 +02004579 spin_lock_irqsave(&iommu->lock, flags);
Joerg Roedel127c7612015-07-23 17:44:46 +02004580 domain_detach_iommu(info->domain, iommu);
Joerg Roedeld160aca2015-07-22 11:52:53 +02004581 spin_unlock_irqrestore(&iommu->lock, flags);
Joerg Roedel127c7612015-07-23 17:44:46 +02004582
4583 free_devinfo_mem(info);
Weidong Hanc7151a82008-12-08 22:51:37 +08004584}
4585
Joerg Roedel55d94042015-07-22 16:50:40 +02004586static void dmar_remove_one_dev_info(struct dmar_domain *domain,
4587 struct device *dev)
4588{
Joerg Roedel127c7612015-07-23 17:44:46 +02004589 struct device_domain_info *info;
Joerg Roedel55d94042015-07-22 16:50:40 +02004590 unsigned long flags;
4591
Weidong Hanc7151a82008-12-08 22:51:37 +08004592 spin_lock_irqsave(&device_domain_lock, flags);
Joerg Roedel127c7612015-07-23 17:44:46 +02004593 info = dev->archdata.iommu;
4594 __dmar_remove_one_dev_info(info);
Weidong Han5e98c4b2008-12-08 23:03:27 +08004595 spin_unlock_irqrestore(&device_domain_lock, flags);
Weidong Han5e98c4b2008-12-08 23:03:27 +08004596}
4597
4598static int md_domain_init(struct dmar_domain *domain, int guest_width)
4599{
4600 int adjust_width;
4601
Robin Murphy0fb5fe82015-01-12 17:51:16 +00004602 init_iova_domain(&domain->iovad, VTD_PAGE_SIZE, IOVA_START_PFN,
4603 DMA_32BIT_PFN);
Weidong Han5e98c4b2008-12-08 23:03:27 +08004604 domain_reserve_special_ranges(domain);
4605
4606 /* calculate AGAW */
4607 domain->gaw = guest_width;
4608 adjust_width = guestwidth_to_adjustwidth(guest_width);
4609 domain->agaw = width_to_agaw(adjust_width);
4610
Weidong Han5e98c4b2008-12-08 23:03:27 +08004611 domain->iommu_coherency = 0;
Sheng Yangc5b15252009-08-06 13:31:56 +08004612 domain->iommu_snooping = 0;
Youquan Song6dd9a7c2011-05-25 19:13:49 +01004613 domain->iommu_superpage = 0;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004614 domain->max_addr = 0;
Weidong Han5e98c4b2008-12-08 23:03:27 +08004615
4616 /* always allocate the top pgd */
Suresh Siddha4c923d42009-10-02 11:01:24 -07004617 domain->pgd = (struct dma_pte *)alloc_pgtable_page(domain->nid);
Weidong Han5e98c4b2008-12-08 23:03:27 +08004618 if (!domain->pgd)
4619 return -ENOMEM;
4620 domain_flush_cache(domain, domain->pgd, PAGE_SIZE);
4621 return 0;
4622}
4623
Joerg Roedel00a77de2015-03-26 13:43:08 +01004624static struct iommu_domain *intel_iommu_domain_alloc(unsigned type)
Kay, Allen M38717942008-09-09 18:37:29 +03004625{
Joerg Roedel5d450802008-12-03 14:52:32 +01004626 struct dmar_domain *dmar_domain;
Joerg Roedel00a77de2015-03-26 13:43:08 +01004627 struct iommu_domain *domain;
4628
4629 if (type != IOMMU_DOMAIN_UNMANAGED)
4630 return NULL;
Kay, Allen M38717942008-09-09 18:37:29 +03004631
Jiang Liuab8dfe22014-07-11 14:19:27 +08004632 dmar_domain = alloc_domain(DOMAIN_FLAG_VIRTUAL_MACHINE);
Joerg Roedel5d450802008-12-03 14:52:32 +01004633 if (!dmar_domain) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004634 pr_err("Can't allocate dmar_domain\n");
Joerg Roedel00a77de2015-03-26 13:43:08 +01004635 return NULL;
Kay, Allen M38717942008-09-09 18:37:29 +03004636 }
Fenghua Yu2c2e2c32009-06-19 13:47:29 -07004637 if (md_domain_init(dmar_domain, DEFAULT_DOMAIN_ADDRESS_WIDTH)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004638 pr_err("Domain initialization failed\n");
Jiang Liu92d03cc2014-02-19 14:07:28 +08004639 domain_exit(dmar_domain);
Joerg Roedel00a77de2015-03-26 13:43:08 +01004640 return NULL;
Kay, Allen M38717942008-09-09 18:37:29 +03004641 }
Allen Kay8140a952011-10-14 12:32:17 -07004642 domain_update_iommu_cap(dmar_domain);
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004643
Joerg Roedel00a77de2015-03-26 13:43:08 +01004644 domain = &dmar_domain->domain;
Joerg Roedel8a0e7152012-01-26 19:40:54 +01004645 domain->geometry.aperture_start = 0;
4646 domain->geometry.aperture_end = __DOMAIN_MAX_ADDR(dmar_domain->gaw);
4647 domain->geometry.force_aperture = true;
4648
Joerg Roedel00a77de2015-03-26 13:43:08 +01004649 return domain;
Kay, Allen M38717942008-09-09 18:37:29 +03004650}
Kay, Allen M38717942008-09-09 18:37:29 +03004651
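/*
 * Illustrative only (error handling omitted): users such as VFIO reach
 * these callbacks through the generic IOMMU API, e.g.:
 *
 *	struct iommu_domain *dom = iommu_domain_alloc(&pci_bus_type);
 *
 *	iommu_attach_device(dom, dev);
 *	iommu_map(dom, iova, phys, SZ_4K, IOMMU_READ | IOMMU_WRITE);
 */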
Joerg Roedel00a77de2015-03-26 13:43:08 +01004652static void intel_iommu_domain_free(struct iommu_domain *domain)
Kay, Allen M38717942008-09-09 18:37:29 +03004653{
Joerg Roedel00a77de2015-03-26 13:43:08 +01004654 domain_exit(to_dmar_domain(domain));
Kay, Allen M38717942008-09-09 18:37:29 +03004655}
Kay, Allen M38717942008-09-09 18:37:29 +03004656
Joerg Roedel4c5478c2008-12-03 14:58:24 +01004657static int intel_iommu_attach_device(struct iommu_domain *domain,
4658 struct device *dev)
Kay, Allen M38717942008-09-09 18:37:29 +03004659{
Joerg Roedel00a77de2015-03-26 13:43:08 +01004660 struct dmar_domain *dmar_domain = to_dmar_domain(domain);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004661 struct intel_iommu *iommu;
4662 int addr_width;
David Woodhouse156baca2014-03-09 14:00:57 -07004663 u8 bus, devfn;
Kay, Allen M38717942008-09-09 18:37:29 +03004664
Alex Williamsonc875d2c2014-07-03 09:57:02 -06004665 if (device_is_rmrr_locked(dev)) {
4666 dev_warn(dev, "Device is ineligible for IOMMU domain attach due to platform RMRR requirement. Contact your platform vendor.\n");
4667 return -EPERM;
4668 }
4669
David Woodhouse7207d8f2014-03-09 16:31:06 -07004670 /* normally dev is not mapped */
4671 if (unlikely(domain_context_mapped(dev))) {
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004672 struct dmar_domain *old_domain;
4673
David Woodhouse1525a292014-03-06 16:19:30 +00004674 old_domain = find_domain(dev);
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004675 if (old_domain) {
Joerg Roedeld160aca2015-07-22 11:52:53 +02004676 rcu_read_lock();
Joerg Roedelde7e8882015-07-22 11:58:07 +02004677 dmar_remove_one_dev_info(old_domain, dev);
Joerg Roedeld160aca2015-07-22 11:52:53 +02004678 rcu_read_unlock();
Joerg Roedel62c22162014-12-09 12:56:45 +01004679
4680 if (!domain_type_is_vm_or_si(old_domain) &&
4681 list_empty(&old_domain->devices))
4682 domain_exit(old_domain);
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004683 }
4684 }
4685
David Woodhouse156baca2014-03-09 14:00:57 -07004686 iommu = device_to_iommu(dev, &bus, &devfn);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004687 if (!iommu)
4688 return -ENODEV;
4689
4690 /* check if this iommu agaw is sufficient for max mapped address */
4691 addr_width = agaw_to_width(iommu->agaw);
Tom Lyona99c47a2010-05-17 08:20:45 +01004692 if (addr_width > cap_mgaw(iommu->cap))
4693 addr_width = cap_mgaw(iommu->cap);
4694
4695 if (dmar_domain->max_addr > (1LL << addr_width)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004696		pr_err("%s: iommu width (%d) is not sufficient for the mapped address (%llx)\n",
Tom Lyona99c47a2010-05-17 08:20:45 +01004698 __func__, addr_width, dmar_domain->max_addr);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004699 return -EFAULT;
4700 }
Tom Lyona99c47a2010-05-17 08:20:45 +01004701 dmar_domain->gaw = addr_width;
4702
4703 /*
4704 * Knock out extra levels of page tables if necessary
4705 */
4706 while (iommu->agaw < dmar_domain->agaw) {
4707 struct dma_pte *pte;
4708
4709 pte = dmar_domain->pgd;
4710 if (dma_pte_present(pte)) {
Sheng Yang25cbff12010-06-12 19:21:42 +08004711 dmar_domain->pgd = (struct dma_pte *)
4712 phys_to_virt(dma_pte_addr(pte));
Jan Kiszka7a661012010-11-02 08:05:51 +01004713 free_pgtable_page(pte);
Tom Lyona99c47a2010-05-17 08:20:45 +01004714 }
4715 dmar_domain->agaw--;
4716 }
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004717
Joerg Roedel28ccce02015-07-21 14:45:31 +02004718 return domain_add_dev_info(dmar_domain, dev);
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004719}
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004720
Joerg Roedel4c5478c2008-12-03 14:58:24 +01004721static void intel_iommu_detach_device(struct iommu_domain *domain,
4722 struct device *dev)
Kay, Allen M38717942008-09-09 18:37:29 +03004723{
Joerg Roedele6de0f82015-07-22 16:30:36 +02004724 dmar_remove_one_dev_info(to_dmar_domain(domain), dev);
Kay, Allen M38717942008-09-09 18:37:29 +03004725}
Kay, Allen M38717942008-09-09 18:37:29 +03004726
Joerg Roedelb146a1c9f2010-01-20 17:17:37 +01004727static int intel_iommu_map(struct iommu_domain *domain,
4728 unsigned long iova, phys_addr_t hpa,
Ohad Ben-Cohen50090652011-11-10 11:32:25 +02004729 size_t size, int iommu_prot)
Kay, Allen M38717942008-09-09 18:37:29 +03004730{
Joerg Roedel00a77de2015-03-26 13:43:08 +01004731 struct dmar_domain *dmar_domain = to_dmar_domain(domain);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004732 u64 max_addr;
Joerg Roedeldde57a22008-12-03 15:04:09 +01004733 int prot = 0;
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004734 int ret;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004735
Joerg Roedeldde57a22008-12-03 15:04:09 +01004736 if (iommu_prot & IOMMU_READ)
4737 prot |= DMA_PTE_READ;
4738 if (iommu_prot & IOMMU_WRITE)
4739 prot |= DMA_PTE_WRITE;
Sheng Yang9cf06692009-03-18 15:33:07 +08004740 if ((iommu_prot & IOMMU_CACHE) && dmar_domain->iommu_snooping)
4741 prot |= DMA_PTE_SNP;
Joerg Roedeldde57a22008-12-03 15:04:09 +01004742
David Woodhouse163cc522009-06-28 00:51:17 +01004743 max_addr = iova + size;
Joerg Roedeldde57a22008-12-03 15:04:09 +01004744 if (dmar_domain->max_addr < max_addr) {
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004745 u64 end;
4746
4747 /* check if minimum agaw is sufficient for mapped address */
Tom Lyon8954da12010-05-17 08:19:52 +01004748 end = __DOMAIN_MAX_ADDR(dmar_domain->gaw) + 1;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004749 if (end < max_addr) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004750			pr_err("%s: iommu width (%d) is not sufficient for the mapped address (%llx)\n",
Tom Lyon8954da12010-05-17 08:19:52 +01004752 __func__, dmar_domain->gaw, max_addr);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004753 return -EFAULT;
4754 }
Joerg Roedeldde57a22008-12-03 15:04:09 +01004755 dmar_domain->max_addr = max_addr;
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004756 }
David Woodhousead051222009-06-28 14:22:28 +01004757	/* Round up size to the next multiple of PAGE_SIZE if it plus
4758	   the low bits of hpa would take us onto the next page */
David Woodhouse88cb6a72009-06-28 15:03:06 +01004759 size = aligned_nrpages(hpa, size);
David Woodhousead051222009-06-28 14:22:28 +01004760 ret = domain_pfn_mapping(dmar_domain, iova >> VTD_PAGE_SHIFT,
4761 hpa >> VTD_PAGE_SHIFT, size, prot);
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004762 return ret;
Kay, Allen M38717942008-09-09 18:37:29 +03004763}
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004764
Ohad Ben-Cohen50090652011-11-10 11:32:25 +02004765static size_t intel_iommu_unmap(struct iommu_domain *domain,
David Woodhouseea8ea462014-03-05 17:09:32 +00004766 unsigned long iova, size_t size)
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004767{
Joerg Roedel00a77de2015-03-26 13:43:08 +01004768 struct dmar_domain *dmar_domain = to_dmar_domain(domain);
David Woodhouseea8ea462014-03-05 17:09:32 +00004769 struct page *freelist = NULL;
4770 struct intel_iommu *iommu;
4771 unsigned long start_pfn, last_pfn;
4772 unsigned int npages;
Joerg Roedel42e8c182015-07-21 15:50:02 +02004773 int iommu_id, level = 0;
Sheng Yang4b99d352009-07-08 11:52:52 +01004774
David Woodhouse5cf0a762014-03-19 16:07:49 +00004775 /* Cope with horrid API which requires us to unmap more than the
4776 size argument if it happens to be a large-page mapping. */
Joerg Roedeldc02e462015-08-13 11:15:13 +02004777 BUG_ON(!pfn_to_dma_pte(dmar_domain, iova >> VTD_PAGE_SHIFT, &level));
David Woodhouse5cf0a762014-03-19 16:07:49 +00004778
4779 if (size < VTD_PAGE_SIZE << level_to_offset_bits(level))
4780 size = VTD_PAGE_SIZE << level_to_offset_bits(level);
4781
David Woodhouseea8ea462014-03-05 17:09:32 +00004782 start_pfn = iova >> VTD_PAGE_SHIFT;
4783 last_pfn = (iova + size - 1) >> VTD_PAGE_SHIFT;
4784
4785 freelist = domain_unmap(dmar_domain, start_pfn, last_pfn);
4786
4787 npages = last_pfn - start_pfn + 1;
4788
Joerg Roedel29a27712015-07-21 17:17:12 +02004789 for_each_domain_iommu(iommu_id, dmar_domain) {
Joerg Roedela1ddcbe2015-07-21 15:20:32 +02004790 iommu = g_iommus[iommu_id];
David Woodhouseea8ea462014-03-05 17:09:32 +00004791
Joerg Roedel42e8c182015-07-21 15:50:02 +02004792 iommu_flush_iotlb_psi(g_iommus[iommu_id], dmar_domain,
4793 start_pfn, npages, !freelist, 0);
David Woodhouseea8ea462014-03-05 17:09:32 +00004794 }
4795
4796 dma_free_pagelist(freelist);
Weidong Hanfe40f1e2008-12-08 23:10:23 +08004797
David Woodhouse163cc522009-06-28 00:51:17 +01004798 if (dmar_domain->max_addr == iova + size)
4799 dmar_domain->max_addr = iova;
Joerg Roedelb146a1c9f2010-01-20 17:17:37 +01004800
David Woodhouse5cf0a762014-03-19 16:07:49 +00004801 return size;
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004802}
Kay, Allen M38717942008-09-09 18:37:29 +03004803
Joerg Roedeld14d6572008-12-03 15:06:57 +01004804static phys_addr_t intel_iommu_iova_to_phys(struct iommu_domain *domain,
Varun Sethibb5547a2013-03-29 01:23:58 +05304805 dma_addr_t iova)
Kay, Allen M38717942008-09-09 18:37:29 +03004806{
Joerg Roedel00a77de2015-03-26 13:43:08 +01004807 struct dmar_domain *dmar_domain = to_dmar_domain(domain);
Kay, Allen M38717942008-09-09 18:37:29 +03004808 struct dma_pte *pte;
David Woodhouse5cf0a762014-03-19 16:07:49 +00004809 int level = 0;
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004810 u64 phys = 0;
Kay, Allen M38717942008-09-09 18:37:29 +03004811
David Woodhouse5cf0a762014-03-19 16:07:49 +00004812 pte = pfn_to_dma_pte(dmar_domain, iova >> VTD_PAGE_SHIFT, &level);
Kay, Allen M38717942008-09-09 18:37:29 +03004813 if (pte)
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004814 phys = dma_pte_addr(pte);
Kay, Allen M38717942008-09-09 18:37:29 +03004815
Weidong Hanfaa3d6f2008-12-08 23:09:29 +08004816 return phys;
Kay, Allen M38717942008-09-09 18:37:29 +03004817}
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01004818
Joerg Roedel5d587b82014-09-05 10:50:45 +02004819static bool intel_iommu_capable(enum iommu_cap cap)
Sheng Yangdbb9fd82009-03-18 15:33:06 +08004820{
Sheng Yangdbb9fd82009-03-18 15:33:06 +08004821 if (cap == IOMMU_CAP_CACHE_COHERENCY)
Joerg Roedel5d587b82014-09-05 10:50:45 +02004822 return domain_update_iommu_snooping(NULL) == 1;
Tom Lyon323f99c2010-07-02 16:56:14 -04004823 if (cap == IOMMU_CAP_INTR_REMAP)
Joerg Roedel5d587b82014-09-05 10:50:45 +02004824 return irq_remapping_enabled == 1;
Sheng Yangdbb9fd82009-03-18 15:33:06 +08004825
Joerg Roedel5d587b82014-09-05 10:50:45 +02004826 return false;
Sheng Yangdbb9fd82009-03-18 15:33:06 +08004827}
4828
Alex Williamsonabdfdde2012-05-30 14:19:19 -06004829static int intel_iommu_add_device(struct device *dev)
Alex Williamson70ae6f02011-10-21 15:56:11 -04004830{
Alex Williamsona5459cf2014-06-12 16:12:31 -06004831 struct intel_iommu *iommu;
Alex Williamsonabdfdde2012-05-30 14:19:19 -06004832 struct iommu_group *group;
David Woodhouse156baca2014-03-09 14:00:57 -07004833 u8 bus, devfn;
Alex Williamson70ae6f02011-10-21 15:56:11 -04004834
Alex Williamsona5459cf2014-06-12 16:12:31 -06004835 iommu = device_to_iommu(dev, &bus, &devfn);
4836 if (!iommu)
Alex Williamson70ae6f02011-10-21 15:56:11 -04004837 return -ENODEV;
4838
Alex Williamsona5459cf2014-06-12 16:12:31 -06004839 iommu_device_link(iommu->iommu_dev, dev);
Alex Williamsonabdfdde2012-05-30 14:19:19 -06004840
Alex Williamsone17f9ff2014-07-03 09:51:37 -06004841 group = iommu_group_get_for_dev(dev);
Alex Williamson783f1572012-05-30 14:19:43 -06004842
Alex Williamsone17f9ff2014-07-03 09:51:37 -06004843 if (IS_ERR(group))
4844 return PTR_ERR(group);
Alex Williamson70ae6f02011-10-21 15:56:11 -04004845
Alex Williamsonabdfdde2012-05-30 14:19:19 -06004846 iommu_group_put(group);
Alex Williamsone17f9ff2014-07-03 09:51:37 -06004847 return 0;
Alex Williamsonabdfdde2012-05-30 14:19:19 -06004848}
4849
4850static void intel_iommu_remove_device(struct device *dev)
4851{
Alex Williamsona5459cf2014-06-12 16:12:31 -06004852 struct intel_iommu *iommu;
4853 u8 bus, devfn;
4854
4855 iommu = device_to_iommu(dev, &bus, &devfn);
4856 if (!iommu)
4857 return;
4858
Alex Williamsonabdfdde2012-05-30 14:19:19 -06004859 iommu_group_remove_device(dev);
Alex Williamsona5459cf2014-06-12 16:12:31 -06004860
4861 iommu_device_unlink(iommu->iommu_dev, dev);
Alex Williamson70ae6f02011-10-21 15:56:11 -04004862}
4863
Thierry Redingb22f6432014-06-27 09:03:12 +02004864static const struct iommu_ops intel_iommu_ops = {
Joerg Roedel5d587b82014-09-05 10:50:45 +02004865 .capable = intel_iommu_capable,
Joerg Roedel00a77de2015-03-26 13:43:08 +01004866 .domain_alloc = intel_iommu_domain_alloc,
4867 .domain_free = intel_iommu_domain_free,
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01004868 .attach_dev = intel_iommu_attach_device,
4869 .detach_dev = intel_iommu_detach_device,
Joerg Roedelb146a1c9f2010-01-20 17:17:37 +01004870 .map = intel_iommu_map,
4871 .unmap = intel_iommu_unmap,
Olav Haugan315786e2014-10-25 09:55:16 -07004872 .map_sg = default_iommu_map_sg,
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01004873 .iova_to_phys = intel_iommu_iova_to_phys,
Alex Williamsonabdfdde2012-05-30 14:19:19 -06004874 .add_device = intel_iommu_add_device,
4875 .remove_device = intel_iommu_remove_device,
Ohad Ben-Cohen6d1c56a2011-11-10 11:32:30 +02004876 .pgsize_bitmap = INTEL_IOMMU_PGSIZES,
Joerg Roedela8bcbb0d2008-12-03 15:14:02 +01004877};
David Woodhouse9af88142009-02-13 23:18:03 +00004878
Daniel Vetter94526182013-01-20 23:50:13 +01004879static void quirk_iommu_g4x_gfx(struct pci_dev *dev)
4880{
4881 /* G4x/GM45 integrated gfx dmar support is totally busted. */
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004882 pr_info("Disabling IOMMU for graphics on this chipset\n");
Daniel Vetter94526182013-01-20 23:50:13 +01004883 dmar_map_gfx = 0;
4884}
4885
4886DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2a40, quirk_iommu_g4x_gfx);
4887DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e00, quirk_iommu_g4x_gfx);
4888DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e10, quirk_iommu_g4x_gfx);
4889DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e20, quirk_iommu_g4x_gfx);
4890DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e30, quirk_iommu_g4x_gfx);
4891DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e40, quirk_iommu_g4x_gfx);
4892DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e90, quirk_iommu_g4x_gfx);
4893
Greg Kroah-Hartmand34d6512012-12-21 15:05:21 -08004894static void quirk_iommu_rwbf(struct pci_dev *dev)
David Woodhouse9af88142009-02-13 23:18:03 +00004895{
4896 /*
4897 * Mobile 4 Series Chipset neglects to set RWBF capability,
Daniel Vetter210561f2013-01-21 19:48:59 +01004898 * but needs it. Same seems to hold for the desktop versions.
David Woodhouse9af88142009-02-13 23:18:03 +00004899 */
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004900 pr_info("Forcing write-buffer flush capability\n");
David Woodhouse9af88142009-02-13 23:18:03 +00004901 rwbf_quirk = 1;
4902}
4903
4904DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2a40, quirk_iommu_rwbf);
Daniel Vetter210561f2013-01-21 19:48:59 +01004905DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e00, quirk_iommu_rwbf);
4906DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e10, quirk_iommu_rwbf);
4907DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e20, quirk_iommu_rwbf);
4908DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e30, quirk_iommu_rwbf);
4909DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e40, quirk_iommu_rwbf);
4910DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x2e90, quirk_iommu_rwbf);
David Woodhousee0fc7e02009-09-30 09:12:17 -07004911
Adam Jacksoneecfd572010-08-25 21:17:34 +01004912#define GGC 0x52
4913#define GGC_MEMORY_SIZE_MASK (0xf << 8)
4914#define GGC_MEMORY_SIZE_NONE (0x0 << 8)
4915#define GGC_MEMORY_SIZE_1M (0x1 << 8)
4916#define GGC_MEMORY_SIZE_2M (0x3 << 8)
4917#define GGC_MEMORY_VT_ENABLED (0x8 << 8)
4918#define GGC_MEMORY_SIZE_2M_VT (0x9 << 8)
4919#define GGC_MEMORY_SIZE_3M_VT (0xa << 8)
4920#define GGC_MEMORY_SIZE_4M_VT (0xb << 8)
4921
Greg Kroah-Hartmand34d6512012-12-21 15:05:21 -08004922static void quirk_calpella_no_shadow_gtt(struct pci_dev *dev)
David Woodhouse9eecabc2010-09-21 22:28:23 +01004923{
4924 unsigned short ggc;
4925
Adam Jacksoneecfd572010-08-25 21:17:34 +01004926 if (pci_read_config_word(dev, GGC, &ggc))
David Woodhouse9eecabc2010-09-21 22:28:23 +01004927 return;
4928
Adam Jacksoneecfd572010-08-25 21:17:34 +01004929 if (!(ggc & GGC_MEMORY_VT_ENABLED)) {
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004930 pr_info("BIOS has allocated no shadow GTT; disabling IOMMU for graphics\n");
David Woodhouse9eecabc2010-09-21 22:28:23 +01004931 dmar_map_gfx = 0;
David Woodhouse6fbcfb32011-09-25 19:11:14 -07004932 } else if (dmar_map_gfx) {
4933 /* we have to ensure the gfx device is idle before we flush */
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004934 pr_info("Disabling batched IOTLB flush on Ironlake\n");
David Woodhouse6fbcfb32011-09-25 19:11:14 -07004935 intel_iommu_strict = 1;
4936 }
David Woodhouse9eecabc2010-09-21 22:28:23 +01004937}
4938DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x0040, quirk_calpella_no_shadow_gtt);
4939DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x0044, quirk_calpella_no_shadow_gtt);
4940DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x0062, quirk_calpella_no_shadow_gtt);
4941DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_INTEL, 0x006a, quirk_calpella_no_shadow_gtt);
4942
David Woodhousee0fc7e02009-09-30 09:12:17 -07004943/* On Tylersburg chipsets, some BIOSes have been known to enable the
4944 ISOCH DMAR unit for the Azalia sound device, but not give it any
4945 TLB entries, which causes it to deadlock. Check for that. We do
4946 this in a function called from init_dmars(), instead of in a PCI
4947 quirk, because we don't want to print the obnoxious "BIOS broken"
4948 message if VT-d is actually disabled.
4949*/
4950static void __init check_tylersburg_isoch(void)
4951{
4952 struct pci_dev *pdev;
4953 uint32_t vtisochctrl;
4954
4955 /* If there's no Azalia in the system anyway, forget it. */
4956 pdev = pci_get_device(PCI_VENDOR_ID_INTEL, 0x3a3e, NULL);
4957 if (!pdev)
4958 return;
4959 pci_dev_put(pdev);
4960
4961 /* System Management Registers. Might be hidden, in which case
4962 we can't do the sanity check. But that's OK, because the
4963 known-broken BIOSes _don't_ actually hide it, so far. */
4964 pdev = pci_get_device(PCI_VENDOR_ID_INTEL, 0x342e, NULL);
4965 if (!pdev)
4966 return;
4967
4968 if (pci_read_config_dword(pdev, 0x188, &vtisochctrl)) {
4969 pci_dev_put(pdev);
4970 return;
4971 }
4972
4973 pci_dev_put(pdev);
4974
4975 /* If Azalia DMA is routed to the non-isoch DMAR unit, fine. */
4976 if (vtisochctrl & 1)
4977 return;
4978
4979 /* Drop all bits other than the number of TLB entries */
4980 vtisochctrl &= 0x1c;
4981
4982 /* If we have the recommended number of TLB entries (16), fine. */
4983 if (vtisochctrl == 0x10)
4984 return;
4985
4986 /* Zero TLB entries? You get to ride the short bus to school. */
4987 if (!vtisochctrl) {
4988 WARN(1, "Your BIOS is broken; DMA routed to ISOCH DMAR unit but no TLB space.\n"
4989 "BIOS vendor: %s; Ver: %s; Product Version: %s\n",
4990 dmi_get_system_info(DMI_BIOS_VENDOR),
4991 dmi_get_system_info(DMI_BIOS_VERSION),
4992 dmi_get_system_info(DMI_PRODUCT_VERSION));
4993 iommu_identity_mapping |= IDENTMAP_AZALIA;
4994 return;
4995 }
Joerg Roedel9f10e5b2015-06-12 09:57:06 +02004996
4997 pr_warn("Recommended TLB entries for ISOCH unit is 16; your BIOS set %d\n",
David Woodhousee0fc7e02009-09-30 09:12:17 -07004998 vtisochctrl);
4999}