/*
 * Copyright (c) 2006, Intel Corporation.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc., 59 Temple
 * Place - Suite 330, Boston, MA 02111-1307 USA.
 *
 * Copyright (C) 2006-2008 Intel Corporation
 * Copyright IBM Corporation, 2008
 * Copyright 2010 Red Hat, Inc. and/or its affiliates.
 *
 * Author: Allen M. Kay <allen.m.kay@intel.com>
 * Author: Weidong Han <weidong.han@intel.com>
 * Author: Ben-Ami Yassour <benami@il.ibm.com>
 */
#include <linux/list.h>
#include <linux/kvm_host.h>
#include <linux/module.h>
#include <linux/pci.h>
#include <linux/stat.h>
#include <linux/dmar.h>
#include <linux/iommu.h>
#include <linux/intel-iommu.h>
static bool allow_unsafe_assigned_interrupts;
module_param_named(allow_unsafe_assigned_interrupts,
                   allow_unsafe_assigned_interrupts, bool, S_IRUGO | S_IWUSR);
MODULE_PARM_DESC(allow_unsafe_assigned_interrupts,
 "Enable device assignment on platforms without interrupt remapping support.");
static int kvm_iommu_unmap_memslots(struct kvm *kvm);
static void kvm_iommu_put_pages(struct kvm *kvm,
                                gfn_t base_gfn, unsigned long npages);
static void kvm_unpin_pages(struct kvm *kvm, pfn_t pfn, unsigned long npages);
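/*
 * Pin the host pages backing size bytes of guest memory starting at gfn and
 * return the pfn of the first page. Each gfn_to_pfn_memslot() call takes a
 * reference on a page; the references are dropped again, one 4k page at a
 * time, by kvm_unpin_pages().
 */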
static pfn_t kvm_pin_pages(struct kvm_memory_slot *slot, gfn_t gfn,
                           unsigned long size)
{
        gfn_t end_gfn;
        pfn_t pfn;

        pfn     = gfn_to_pfn_memslot(slot, gfn);
        end_gfn = gfn + (size >> PAGE_SHIFT);
        gfn    += 1;

        if (is_error_noslot_pfn(pfn))
                return pfn;

        while (gfn < end_gfn)
                gfn_to_pfn_memslot(slot, gfn++);

        return pfn;
}
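/*
 * Map every page of a memslot into the IOMMU domain. The loop tries to use
 * the largest page size the host mapping allows, halving it until it no
 * longer overruns the memslot and both the gfn and the hva are naturally
 * aligned to it.
 */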
int kvm_iommu_map_pages(struct kvm *kvm, struct kvm_memory_slot *slot)
{
        gfn_t gfn, end_gfn;
        pfn_t pfn;
        int r = 0;
        struct iommu_domain *domain = kvm->arch.iommu_domain;
        int flags;

        /* check if iommu exists and in use */
        if (!domain)
                return 0;

        gfn     = slot->base_gfn;
        end_gfn = gfn + slot->npages;

        flags = IOMMU_READ;
        if (!(slot->flags & KVM_MEM_READONLY))
                flags |= IOMMU_WRITE;
        if (!kvm->arch.iommu_noncoherent)
                flags |= IOMMU_CACHE;

        while (gfn < end_gfn) {
                unsigned long page_size;

                /* Check if already mapped */
                if (iommu_iova_to_phys(domain, gfn_to_gpa(gfn))) {
                        gfn += 1;
                        continue;
                }

                /* Get the page size we could use to map */
                page_size = kvm_host_page_size(kvm, gfn);

                /* Make sure the page_size does not exceed the memslot */
                while ((gfn + (page_size >> PAGE_SHIFT)) > end_gfn)
                        page_size >>= 1;

                /* Make sure gfn is aligned to the page size we want to map */
                while ((gfn << PAGE_SHIFT) & (page_size - 1))
                        page_size >>= 1;

                /* Make sure hva is aligned to the page size we want to map */
                while (__gfn_to_hva_memslot(slot, gfn) & (page_size - 1))
                        page_size >>= 1;

                /*
                 * Pin all pages we are about to map in memory. This is
                 * important because we unmap and unpin in 4kb steps later.
                 */
                pfn = kvm_pin_pages(slot, gfn, page_size);
                if (is_error_noslot_pfn(pfn)) {
                        gfn += 1;
                        continue;
                }

                /* Map into IO address space */
                r = iommu_map(domain, gfn_to_gpa(gfn), pfn_to_hpa(pfn),
                              page_size, flags);
                if (r) {
                        printk(KERN_ERR "kvm_iommu_map_address: "
                               "iommu failed to map pfn=%llx\n", pfn);
                        /* unpin the pages we just pinned before bailing out */
                        kvm_unpin_pages(kvm, pfn, page_size >> PAGE_SHIFT);
                        goto unmap_pages;
                }

                gfn += page_size >> PAGE_SHIFT;
        }

        return 0;

unmap_pages:
        /* the third argument is npages, not an absolute gfn */
        kvm_iommu_put_pages(kvm, slot->base_gfn, gfn - slot->base_gfn);
        return r;
}
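/*
 * Walk all memslots under SRCU and map each one into the IOMMU domain;
 * registers the VM for noncoherent DMA handling first when the domain
 * lacks cache coherency.
 */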
static int kvm_iommu_map_memslots(struct kvm *kvm)
{
        int idx, r = 0;
        struct kvm_memslots *slots;
        struct kvm_memory_slot *memslot;

        if (kvm->arch.iommu_noncoherent)
                kvm_arch_register_noncoherent_dma(kvm);

        idx = srcu_read_lock(&kvm->srcu);
        slots = kvm_memslots(kvm);

        kvm_for_each_memslot(memslot, slots) {
                r = kvm_iommu_map_pages(kvm, memslot);
                if (r)
                        break;
        }

        srcu_read_unlock(&kvm->srcu, idx);

        return r;
}
int kvm_assign_device(struct kvm *kvm,
                      struct kvm_assigned_dev_kernel *assigned_dev)
{
        struct pci_dev *pdev = NULL;
        struct iommu_domain *domain = kvm->arch.iommu_domain;
        int r;
        bool noncoherent;

        /* check if iommu exists and in use */
        if (!domain)
                return 0;

        pdev = assigned_dev->dev;
        if (pdev == NULL)
                return -ENODEV;

        r = iommu_attach_device(domain, &pdev->dev);
        if (r) {
                dev_err(&pdev->dev, "kvm assign device failed ret %d", r);
                return r;
        }

        noncoherent = !iommu_domain_has_cap(kvm->arch.iommu_domain,
                                            IOMMU_CAP_CACHE_COHERENCY);

        /* Check if we need to update the IOMMU page table for guest memory */
        if (noncoherent != kvm->arch.iommu_noncoherent) {
                kvm_iommu_unmap_memslots(kvm);
                kvm->arch.iommu_noncoherent = noncoherent;
                r = kvm_iommu_map_memslots(kvm);
                if (r)
                        goto out_unmap;
        }

        pdev->dev_flags |= PCI_DEV_FLAGS_ASSIGNED;

        dev_info(&pdev->dev, "kvm assign device\n");

        return 0;
out_unmap:
        kvm_iommu_unmap_memslots(kvm);
        return r;
}
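/*
 * Detach an assigned PCI device from the VM's IOMMU domain and clear its
 * assigned flag; the reverse of kvm_assign_device().
 */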
int kvm_deassign_device(struct kvm *kvm,
                        struct kvm_assigned_dev_kernel *assigned_dev)
{
        struct iommu_domain *domain = kvm->arch.iommu_domain;
        struct pci_dev *pdev = NULL;

        /* check if iommu exists and in use */
        if (!domain)
                return 0;

        pdev = assigned_dev->dev;
        if (pdev == NULL)
                return -ENODEV;

        iommu_detach_device(domain, &pdev->dev);

        pdev->dev_flags &= ~PCI_DEV_FLAGS_ASSIGNED;

        dev_info(&pdev->dev, "kvm deassign device\n");

        return 0;
}
int kvm_iommu_map_guest(struct kvm *kvm)
{
        int r;

        if (!iommu_present(&pci_bus_type)) {
                printk(KERN_ERR "%s: iommu not found\n", __func__);
                return -ENODEV;
        }

        mutex_lock(&kvm->slots_lock);

        kvm->arch.iommu_domain = iommu_domain_alloc(&pci_bus_type);
        if (!kvm->arch.iommu_domain) {
                r = -ENOMEM;
                goto out_unlock;
        }

        if (!allow_unsafe_assigned_interrupts &&
            !iommu_domain_has_cap(kvm->arch.iommu_domain,
                                  IOMMU_CAP_INTR_REMAP)) {
                printk(KERN_WARNING "%s: No interrupt remapping support,"
                       " disallowing device assignment."
                       " Re-enable with \"allow_unsafe_assigned_interrupts=1\""
                       " module option.\n", __func__);
                iommu_domain_free(kvm->arch.iommu_domain);
                kvm->arch.iommu_domain = NULL;
                r = -EPERM;
                goto out_unlock;
        }

        r = kvm_iommu_map_memslots(kvm);
        if (r)
                kvm_iommu_unmap_memslots(kvm);

out_unlock:
        mutex_unlock(&kvm->slots_lock);
        return r;
}
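/* Drop the page references taken by kvm_pin_pages(), one 4k page at a time. */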
static void kvm_unpin_pages(struct kvm *kvm, pfn_t pfn, unsigned long npages)
{
        unsigned long i;

        for (i = 0; i < npages; ++i)
                kvm_release_pfn_clean(pfn + i);
}
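/*
 * Tear down the IOMMU mappings for npages of guest memory starting at
 * base_gfn, unpinning the backing pages as each chunk is unmapped.
 */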
static void kvm_iommu_put_pages(struct kvm *kvm,
                                gfn_t base_gfn, unsigned long npages)
{
        struct iommu_domain *domain;
        gfn_t end_gfn, gfn;
        pfn_t pfn;
        u64 phys;

        domain  = kvm->arch.iommu_domain;
        end_gfn = base_gfn + npages;
        gfn     = base_gfn;

        /* check if iommu exists and in use */
        if (!domain)
                return;

        while (gfn < end_gfn) {
                unsigned long unmap_pages;
                size_t size;

                /* Get physical address */
                phys = iommu_iova_to_phys(domain, gfn_to_gpa(gfn));

                if (!phys) {
                        gfn++;
                        continue;
                }

                pfn  = phys >> PAGE_SHIFT;

                /* Unmap address from IO address space */
                size = iommu_unmap(domain, gfn_to_gpa(gfn), PAGE_SIZE);
                /*
                 * size is a byte count and need not be a power of two;
                 * rounding up via get_order() would unpin too many pages.
                 */
                unmap_pages = size >> PAGE_SHIFT;

                /* Unpin all pages we just unmapped to not leak any memory */
                kvm_unpin_pages(kvm, pfn, unmap_pages);

                gfn += unmap_pages;
        }
}
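/* Unmap and unpin an entire memslot. */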
void kvm_iommu_unmap_pages(struct kvm *kvm, struct kvm_memory_slot *slot)
{
        kvm_iommu_put_pages(kvm, slot->base_gfn, slot->npages);
}
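/*
 * Walk all memslots under SRCU and unmap each one, then drop the VM's
 * noncoherent-DMA registration if it was taken by kvm_iommu_map_memslots().
 */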
static int kvm_iommu_unmap_memslots(struct kvm *kvm)
{
        int idx;
        struct kvm_memslots *slots;
        struct kvm_memory_slot *memslot;

        idx = srcu_read_lock(&kvm->srcu);
        slots = kvm_memslots(kvm);

        kvm_for_each_memslot(memslot, slots)
                kvm_iommu_unmap_pages(kvm, memslot);

        srcu_read_unlock(&kvm->srcu, idx);

        if (kvm->arch.iommu_noncoherent)
                kvm_arch_unregister_noncoherent_dma(kvm);

        return 0;
}
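/*
 * Undo kvm_iommu_map_guest(): unmap all guest memory, then free the IOMMU
 * domain once no mappings reference it.
 */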
int kvm_iommu_unmap_guest(struct kvm *kvm)
{
        struct iommu_domain *domain = kvm->arch.iommu_domain;

        /* check if iommu exists and in use */
        if (!domain)
                return 0;

        mutex_lock(&kvm->slots_lock);
        kvm_iommu_unmap_memslots(kvm);
        kvm->arch.iommu_domain = NULL;
        kvm->arch.iommu_noncoherent = false;
        mutex_unlock(&kvm->slots_lock);

        iommu_domain_free(domain);
        return 0;
}