/*
 * Copyright (C) 2014-2016 Broadcom Corporation
 * Copyright (c) 2017 Red Hat, Inc.
 * Written by Prem Mallappa, Eric Auger
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * Author: Prem Mallappa <pmallapp@broadcom.com>
 */
19 #include "qemu/osdep.h"
21 #include "exec/target_page.h"
22 #include "hw/core/cpu.h"
23 #include "hw/qdev-properties.h"
24 #include "qapi/error.h"
25 #include "qemu/jhash.h"
26 #include "qemu/module.h"
28 #include "qemu/error-report.h"
29 #include "hw/arm/smmu-common.h"
30 #include "smmu-internal.h"
/* IOTLB Management */
/*
 * smmu_iotlb_key_hash - hash callback for SMMUIOTLBKey pointers; it is the
 * hash function handed to g_hash_table_new_full() for s->iotlb in
 * smmu_base_realize().
 *
 * The visible statements seed a, b and c with JHASH_INITVAL + sizeof(*key),
 * add asid + level + tg into a, bits [31:0] of iova into b and bits [63:32]
 * of iova into c, then run __jhash_final(a, b, c).
 * NOTE(review): the declaration of a/b/c, original line 45 and the return
 * statement are not visible in this extract -- confirm against the full file.
 */
34 static guint
smmu_iotlb_key_hash(gconstpointer v
)
36 SMMUIOTLBKey
*key
= (SMMUIOTLBKey
*)v
;
40 a
= b
= c
= JHASH_INITVAL
+ sizeof(*key
);
41 a
+= key
->asid
+ key
->level
+ key
->tg
;
42 b
+= extract64(key
->iova
, 0, 32);
43 c
+= extract64(key
->iova
, 32, 32);
46 __jhash_final(a
, b
, c
);
51 static gboolean
smmu_iotlb_key_equal(gconstpointer v1
, gconstpointer v2
)
53 SMMUIOTLBKey
*k1
= (SMMUIOTLBKey
*)v1
, *k2
= (SMMUIOTLBKey
*)v2
;
55 return (k1
->asid
== k2
->asid
) && (k1
->iova
== k2
->iova
) &&
56 (k1
->level
== k2
->level
) && (k1
->tg
== k2
->tg
);
59 SMMUIOTLBKey
smmu_get_iotlb_key(uint16_t asid
, uint64_t iova
,
60 uint8_t tg
, uint8_t level
)
62 SMMUIOTLBKey key
= {.asid
= asid
, .iova
= iova
, .tg
= tg
, .level
= level
};
/*
 * smmu_iotlb_lookup - look up the cached translation covering @iova.
 *
 * tg is derived from tt->granule_sz as (granule_sz - 10) / 2 and the initial
 * level from tt->tsz and the granule stride. The key is built from cfg->asid,
 * @iova rounded down to the block size of the current level, tg and level,
 * and is looked up in bs->iotlb. The hit and miss trace points report
 * cfg->iotlb_hits, cfg->iotlb_misses and the hit percentage.
 * NOTE(review): the declaration of key, any iteration over levels, the
 * hit/miss counter updates and the return statement are not visible in this
 * extract -- confirm against the full file.
 */
67 SMMUTLBEntry
*smmu_iotlb_lookup(SMMUState
*bs
, SMMUTransCfg
*cfg
,
68 SMMUTransTableInfo
*tt
, hwaddr iova
)
70 uint8_t tg
= (tt
->granule_sz
- 10) / 2;
71 uint8_t inputsize
= 64 - tt
->tsz
;
72 uint8_t stride
= tt
->granule_sz
- 3;
73 uint8_t level
= 4 - (inputsize
- 4) / stride
;
74 SMMUTLBEntry
*entry
= NULL
;
77 uint64_t subpage_size
= 1ULL << level_shift(level
, tt
->granule_sz
);
78 uint64_t mask
= subpage_size
- 1;
81 key
= smmu_get_iotlb_key(cfg
->asid
, iova
& ~mask
, tg
, level
);
82 entry
= g_hash_table_lookup(bs
->iotlb
, &key
);
91 trace_smmu_iotlb_lookup_hit(cfg
->asid
, iova
,
92 cfg
->iotlb_hits
, cfg
->iotlb_misses
,
93 100 * cfg
->iotlb_hits
/
94 (cfg
->iotlb_hits
+ cfg
->iotlb_misses
));
97 trace_smmu_iotlb_lookup_miss(cfg
->asid
, iova
,
98 cfg
->iotlb_hits
, cfg
->iotlb_misses
,
99 100 * cfg
->iotlb_hits
/
100 (cfg
->iotlb_hits
+ cfg
->iotlb_misses
));
105 void smmu_iotlb_insert(SMMUState
*bs
, SMMUTransCfg
*cfg
, SMMUTLBEntry
*new)
107 SMMUIOTLBKey
*key
= g_new0(SMMUIOTLBKey
, 1);
108 uint8_t tg
= (new->granule
- 10) / 2;
110 if (g_hash_table_size(bs
->iotlb
) >= SMMU_IOTLB_MAX_SIZE
) {
111 smmu_iotlb_inv_all(bs
);
114 *key
= smmu_get_iotlb_key(cfg
->asid
, new->entry
.iova
, tg
, new->level
);
115 trace_smmu_iotlb_insert(cfg
->asid
, new->entry
.iova
, tg
, new->level
);
116 g_hash_table_insert(bs
->iotlb
, key
, new);
119 void smmu_iotlb_inv_all(SMMUState
*s
)
121 trace_smmu_iotlb_inv_all();
122 g_hash_table_remove_all(s
->iotlb
);
125 static gboolean
smmu_hash_remove_by_asid(gpointer key
, gpointer value
,
128 uint16_t asid
= *(uint16_t *)user_data
;
129 SMMUIOTLBKey
*iotlb_key
= (SMMUIOTLBKey
*)key
;
131 return SMMU_IOTLB_ASID(*iotlb_key
) == asid
;
/*
 * smmu_hash_remove_by_asid_iova - per-entry predicate handed to
 * g_hash_table_foreach_remove() by smmu_iotlb_inv_iova().
 *
 * @key is read as an SMMUIOTLBKey, @value as an SMMUTLBEntry and user_data
 * as an SMMUIOTLBPageInvInfo. When info->asid is non-negative it is compared
 * with the ASID stored in the key. The final expression is true when
 * info->iova, masked with the cached entry addr_mask, equals the cached iova,
 * or when the cached iova, masked with info->mask, equals info->iova.
 * NOTE(review): the user_data parameter declaration and the body of the
 * ASID-mismatch branch are not visible in this extract; presumably that
 * branch keeps the entry -- confirm against the full file.
 */
134 static gboolean
smmu_hash_remove_by_asid_iova(gpointer key
, gpointer value
,
137 SMMUTLBEntry
*iter
= (SMMUTLBEntry
*)value
;
138 IOMMUTLBEntry
*entry
= &iter
->entry
;
139 SMMUIOTLBPageInvInfo
*info
= (SMMUIOTLBPageInvInfo
*)user_data
;
140 SMMUIOTLBKey iotlb_key
= *(SMMUIOTLBKey
*)key
;
142 if (info
->asid
>= 0 && info
->asid
!= SMMU_IOTLB_ASID(iotlb_key
)) {
145 return ((info
->iova
& ~entry
->addr_mask
) == entry
->iova
) ||
146 ((entry
->iova
& ~info
->mask
) == info
->iova
);
/*
 * smmu_iotlb_inv_iova - invalidate IOTLB entries matching @asid and @iova.
 *
 * The granule is tg * 2 + 10 bits, or 12 bits when @tg is 0. With a non-zero
 * @ttl, num_pages == 1 and a non-negative @asid, the exact key
 * (asid, iova, tg, ttl) is first removed from s->iotlb. The table is also
 * scanned with smmu_hash_remove_by_asid_iova, using an info structure whose
 * mask is (num_pages << granule) - 1.
 * NOTE(review): the statement executed when the exact removal succeeds and
 * the last argument of g_hash_table_foreach_remove() are not visible in this
 * extract -- confirm against the full file.
 */
149 void smmu_iotlb_inv_iova(SMMUState
*s
, int asid
, dma_addr_t iova
,
150 uint8_t tg
, uint64_t num_pages
, uint8_t ttl
)
152 /* if tg is not set we use 4KB range invalidation */
153 uint8_t granule
= tg
? tg
* 2 + 10 : 12;
155 if (ttl
&& (num_pages
== 1) && (asid
>= 0)) {
156 SMMUIOTLBKey key
= smmu_get_iotlb_key(asid
, iova
, tg
, ttl
);
158 if (g_hash_table_remove(s
->iotlb
, &key
)) {
162 * if the entry is not found, let's see if it does not
163 * belong to a larger IOTLB entry
167 SMMUIOTLBPageInvInfo info
= {
168 .asid
= asid
, .iova
= iova
,
169 .mask
= (num_pages
* 1 << granule
) - 1};
171 g_hash_table_foreach_remove(s
->iotlb
,
172 smmu_hash_remove_by_asid_iova
,
176 void smmu_iotlb_inv_asid(SMMUState
*s
, uint16_t asid
)
178 trace_smmu_iotlb_inv_asid(asid
);
179 g_hash_table_foreach_remove(s
->iotlb
, smmu_hash_remove_by_asid
, &asid
);
/* VMSAv8-64 Translation */

/**
 * get_pte - Get the content of a page table entry located at
 * @baseaddr + @index * sizeof(*@pte)
 */
/*
 * Reads sizeof(*pte) bytes at @baseaddr + @index * sizeof(*pte) into @pte
 * with dma_memory_read() on address_space_memory, using
 * MEMTXATTRS_UNSPECIFIED. When the read result is not MEMTX_OK, info->type
 * is set to SMMU_PTW_ERR_WALK_EABT. trace_smmu_get_pte() follows the error
 * check.
 * NOTE(review): the declaration of ret and both return statements are not
 * visible in this extract; smmu_ptw_64 tests the result for non-zero --
 * confirm the exact return values against the full file.
 */
188 static int get_pte(dma_addr_t baseaddr
, uint32_t index
, uint64_t *pte
,
189 SMMUPTWEventInfo
*info
)
192 dma_addr_t addr
= baseaddr
+ index
* sizeof(*pte
);
194 /* TODO: guarantee 64-bit single-copy atomicity */
195 ret
= dma_memory_read(&address_space_memory
, addr
, pte
, sizeof(*pte
),
196 MEMTXATTRS_UNSPECIFIED
);
198 if (ret
!= MEMTX_OK
) {
199 info
->type
= SMMU_PTW_ERR_WALK_EABT
;
203 trace_smmu_get_pte(baseaddr
, index
, addr
, *pte
);
/* VMSAv8-64 Translation Table Format Descriptor Decoding */
210 * get_page_pte_address - returns the L3 descriptor output address,
212 * ARM ARM spec: Figure D4-17 VMSAv8-64 level 3 descriptor format
214 static inline hwaddr
get_page_pte_address(uint64_t pte
, int granule_sz
)
216 return PTE_ADDRESS(pte
, granule_sz
);
220 * get_table_pte_address - return table descriptor output address,
221 * ie. address of next level table
222 * ARM ARM Figure D4-16 VMSAv8-64 level0, level1, and level 2 descriptor formats
224 static inline hwaddr
get_table_pte_address(uint64_t pte
, int granule_sz
)
226 return PTE_ADDRESS(pte
, granule_sz
);
/**
 * get_block_pte_address - return block descriptor output address and block size
 * ARM ARM Figure D4-16 VMSAv8-64 level0, level1, and level 2 descriptor formats
 */
/*
 * Computes n = level_shift(level, granule_sz) and returns
 * PTE_ADDRESS(pte, n).
 * NOTE(review): no store through @bsz is visible in this extract (original
 * lines 237-238 are missing) -- confirm against the full file how the block
 * size is reported.
 */
233 static inline hwaddr
get_block_pte_address(uint64_t pte
, int level
,
234 int granule_sz
, uint64_t *bsz
)
236 int n
= level_shift(level
, granule_sz
);
239 return PTE_ADDRESS(pte
, n
);
/*
 * select_tt - choose the translation table description that applies to @iova.
 *
 * Bit 55 of @iova selects TBI1(cfg->tbi) or TBI0(cfg->tbi); when set, the
 * result shortens the high-bit checks by 8 bits (tbi_byte). The branches
 * test, in order: the high bits are all zero for a non-zero tt[0].tsz; the
 * high bits are all one for a non-zero tt[1].tsz; tt[0].tsz is zero;
 * tt[1].tsz is zero. The last case is the gap between both regions.
 * NOTE(review): the statement executed in each branch, and therefore the
 * returned pointer, is not visible in this extract. smmu_ptw_64 treats a
 * NULL result as a translation fault -- confirm against the full file.
 */
242 SMMUTransTableInfo
*select_tt(SMMUTransCfg
*cfg
, dma_addr_t iova
)
244 bool tbi
= extract64(iova
, 55, 1) ? TBI1(cfg
->tbi
) : TBI0(cfg
->tbi
);
245 uint8_t tbi_byte
= tbi
* 8;
247 if (cfg
->tt
[0].tsz
&&
248 !extract64(iova
, 64 - cfg
->tt
[0].tsz
, cfg
->tt
[0].tsz
- tbi_byte
)) {
249 /* there is a ttbr0 region and we are in it (high bits all zero) */
251 } else if (cfg
->tt
[1].tsz
&&
252 sextract64(iova
, 64 - cfg
->tt
[1].tsz
, cfg
->tt
[1].tsz
- tbi_byte
) == -1) {
253 /* there is a ttbr1 region and we are in it (high bits all one) */
255 } else if (!cfg
->tt
[0].tsz
) {
256 /* ttbr0 region is "everything not in the ttbr1 region" */
258 } else if (!cfg
->tt
[1].tsz
) {
259 /* ttbr1 region is "everything not in the ttbr0 region" */
262 /* in the gap between the two regions, this is a Translation fault */
/**
 * smmu_ptw_64 - VMSAv8-64 Walk of the page tables for a given IOVA
 * @cfg: translation config
 * @iova: iova to translate
 * @perm: access type
 * @tlbe: SMMUTLBEntry (out)
 * @info: handle to an error info
 *
 * Return 0 on success, < 0 on error. In case of error, @info is filled
 * and tlbe->entry.perm is set to IOMMU_NONE.
 * Upon success, @tlbe is filled with translated_addr and entry
 * permissions.
 */
/*
 * Page table walk for @iova using the table chosen by select_tt().
 *
 * A missing or disabled table sets info->type to SMMU_PTW_ERR_TRANSLATION.
 * Otherwise the starting level, the index mask and the table base (low 48
 * bits of tt->ttb, aligned with ~indexmask) are derived from tt->tsz and
 * tt->granule_sz. At each level the descriptor is fetched with get_pte():
 *  - an invalid or reserved descriptor is traced;
 *  - a table descriptor is checked against PTE_APTABLE unless tt->had is
 *    set, then baseaddr moves to the next-level table;
 *  - a page or block descriptor yields gpa; a permission fault sets
 *    SMMU_PTW_ERR_PERMISSION, otherwise @tlbe receives translated_addr,
 *    iova & ~mask, addr_mask, perm and granule.
 * The tail sets SMMU_PTW_ERR_TRANSLATION and tlbe->entry.perm = IOMMU_NONE.
 * NOTE(review): the loop header, the declarations of pte/gpa/ap, the
 * assignment of ap for leaf descriptors, the jumps out of each error branch,
 * the remaining arguments of the block-descriptor calls and all return
 * statements are not visible in this extract -- confirm against the full
 * file.
 */
279 static int smmu_ptw_64(SMMUTransCfg
*cfg
,
280 dma_addr_t iova
, IOMMUAccessFlags perm
,
281 SMMUTLBEntry
*tlbe
, SMMUPTWEventInfo
*info
)
283 dma_addr_t baseaddr
, indexmask
;
284 int stage
= cfg
->stage
;
285 SMMUTransTableInfo
*tt
= select_tt(cfg
, iova
);
286 uint8_t level
, granule_sz
, inputsize
, stride
;
288 if (!tt
|| tt
->disabled
) {
289 info
->type
= SMMU_PTW_ERR_TRANSLATION
;
293 granule_sz
= tt
->granule_sz
;
294 stride
= granule_sz
- 3;
295 inputsize
= 64 - tt
->tsz
;
296 level
= 4 - (inputsize
- 4) / stride
;
297 indexmask
= (1ULL << (inputsize
- (stride
* (4 - level
)))) - 1;
298 baseaddr
= extract64(tt
->ttb
, 0, 48);
299 baseaddr
&= ~indexmask
;
302 uint64_t subpage_size
= 1ULL << level_shift(level
, granule_sz
);
303 uint64_t mask
= subpage_size
- 1;
304 uint32_t offset
= iova_level_offset(iova
, inputsize
, level
, granule_sz
);
306 dma_addr_t pte_addr
= baseaddr
+ offset
* sizeof(pte
);
309 if (get_pte(baseaddr
, offset
, &pte
, info
)) {
312 trace_smmu_ptw_level(level
, iova
, subpage_size
,
313 baseaddr
, offset
, pte
);
315 if (is_invalid_pte(pte
) || is_reserved_pte(pte
, level
)) {
316 trace_smmu_ptw_invalid_pte(stage
, level
, baseaddr
,
317 pte_addr
, offset
, pte
);
321 if (is_table_pte(pte
, level
)) {
322 ap
= PTE_APTABLE(pte
);
324 if (is_permission_fault(ap
, perm
) && !tt
->had
) {
325 info
->type
= SMMU_PTW_ERR_PERMISSION
;
328 baseaddr
= get_table_pte_address(pte
, granule_sz
);
331 } else if (is_page_pte(pte
, level
)) {
332 gpa
= get_page_pte_address(pte
, granule_sz
);
333 trace_smmu_ptw_page_pte(stage
, level
, iova
,
334 baseaddr
, pte_addr
, pte
, gpa
);
338 gpa
= get_block_pte_address(pte
, level
, granule_sz
,
340 trace_smmu_ptw_block_pte(stage
, level
, baseaddr
,
341 pte_addr
, pte
, iova
, gpa
,
345 if (is_permission_fault(ap
, perm
)) {
346 info
->type
= SMMU_PTW_ERR_PERMISSION
;
350 tlbe
->entry
.translated_addr
= gpa
;
351 tlbe
->entry
.iova
= iova
& ~mask
;
352 tlbe
->entry
.addr_mask
= mask
;
353 tlbe
->entry
.perm
= PTE_AP_TO_PERM(ap
);
355 tlbe
->granule
= granule_sz
;
358 info
->type
= SMMU_PTW_ERR_TRANSLATION
;
361 tlbe
->entry
.perm
= IOMMU_NONE
;
/**
 * smmu_ptw - Walk the page tables for an IOVA, according to @cfg
 *
 * @cfg: translation configuration
 * @iova: iova to translate
 * @perm: tentative access type
 * @tlbe: returned entry
 * @info: ptw event handle
 *
 * return 0 on success
 */
/*
 * Public entry point of the page table walker: forwards its arguments to
 * smmu_ptw_64() and returns that result. One path ends in
 * g_assert_not_reached(); the in-body note says it is never entered because
 * the derived SMMU model checks the configuration while decoding it.
 * NOTE(review): the condition guarding that path is not visible in this
 * extract -- confirm against the full file.
 */
376 int smmu_ptw(SMMUTransCfg
*cfg
, dma_addr_t iova
, IOMMUAccessFlags perm
,
377 SMMUTLBEntry
*tlbe
, SMMUPTWEventInfo
*info
)
381 * This code path is not entered as we check this while decoding
382 * the configuration data in the derived SMMU model.
384 g_assert_not_reached();
387 return smmu_ptw_64(cfg
, iova
, perm
, tlbe
, info
);
/*
 * The bus number is used for lookup when SID based invalidation occurs.
 * In that case we lazily populate the SMMUPciBus array from the bus hash
 * table. At the time the SMMUPciBus is created (smmu_find_add_as), the bus
 * numbers may not be always initialized yet.
 */
/*
 * smmu_find_smmu_pcibus - find the SMMUPciBus registered for @bus_num.
 *
 * The per-bus-number array s->smmu_pcibus_by_bus_num is read first. The
 * s->smmu_pcibus_by_busptr hash table is then iterated, and the entry whose
 * pci_bus_num() equals @bus_num is stored into the array slot.
 * NOTE(review): the declaration of iter, the check on the cached slot and
 * all return statements are not visible in this extract; smmu_iommu_mr()
 * receives the result -- confirm the not-found value against the full file.
 */
396 SMMUPciBus
*smmu_find_smmu_pcibus(SMMUState
*s
, uint8_t bus_num
)
398 SMMUPciBus
*smmu_pci_bus
= s
->smmu_pcibus_by_bus_num
[bus_num
];
405 g_hash_table_iter_init(&iter
, s
->smmu_pcibus_by_busptr
);
406 while (g_hash_table_iter_next(&iter
, NULL
, (void **)&smmu_pci_bus
)) {
407 if (pci_bus_num(smmu_pci_bus
->bus
) == bus_num
) {
408 s
->smmu_pcibus_by_bus_num
[bus_num
] = smmu_pci_bus
;
/*
 * smmu_find_add_as - callback registered through pci_setup_iommu() in
 * smmu_base_realize(); @opaque is the SMMUState.
 *
 * The SMMUPciBus for @bus is looked up in s->smmu_pcibus_by_busptr. A new
 * one is allocated with room for SMMU_PCI_DEVFN_MAX SMMUDevice pointers and
 * inserted into that table. For the device slot pbdev[devfn], an SMMUDevice
 * is allocated, its IOMMU memory region is initialised with a
 * "<mrtypename>-<devfn>-<index>" name (index is a function-local static
 * counter) and an address space is initialised on top of that region.
 * NOTE(review): the declaration of sdev, the conditions guarding both
 * allocations, the initialisation of the remaining SMMUPciBus/SMMUDevice
 * fields, the release of name and the return statement are not visible in
 * this extract -- confirm against the full file.
 */
416 static AddressSpace
*smmu_find_add_as(PCIBus
*bus
, void *opaque
, int devfn
)
418 SMMUState
*s
= opaque
;
419 SMMUPciBus
*sbus
= g_hash_table_lookup(s
->smmu_pcibus_by_busptr
, bus
);
421 static unsigned int index
;
424 sbus
= g_malloc0(sizeof(SMMUPciBus
) +
425 sizeof(SMMUDevice
*) * SMMU_PCI_DEVFN_MAX
);
427 g_hash_table_insert(s
->smmu_pcibus_by_busptr
, bus
, sbus
);
430 sdev
= sbus
->pbdev
[devfn
];
432 char *name
= g_strdup_printf("%s-%d-%d", s
->mrtypename
, devfn
, index
++);
434 sdev
= sbus
->pbdev
[devfn
] = g_new0(SMMUDevice
, 1);
440 memory_region_init_iommu(&sdev
->iommu
, sizeof(sdev
->iommu
),
442 OBJECT(s
), name
, UINT64_MAX
);
443 address_space_init(&sdev
->as
,
444 MEMORY_REGION(&sdev
->iommu
), name
);
445 trace_smmu_add_mr(name
);
/*
 * smmu_iommu_mr - map a stream ID to a device behind this SMMU.
 *
 * The bus number is PCI_BUS_NUM(sid) and the device/function index is
 * SMMU_PCI_DEVFN(sid). The SMMUPciBus comes from smmu_find_smmu_pcibus() and
 * the device from its pbdev[] array.
 * NOTE(review): the declaration of smmu, any NULL checks on smmu_bus or the
 * device, and the return statements are not visible in this extract --
 * confirm against the full file.
 */
452 IOMMUMemoryRegion
*smmu_iommu_mr(SMMUState
*s
, uint32_t sid
)
454 uint8_t bus_n
, devfn
;
455 SMMUPciBus
*smmu_bus
;
458 bus_n
= PCI_BUS_NUM(sid
);
459 smmu_bus
= smmu_find_smmu_pcibus(s
, bus_n
);
461 devfn
= SMMU_PCI_DEVFN(sid
);
462 smmu
= smmu_bus
->pbdev
[devfn
];
470 /* Unmap all notifiers attached to @mr */
471 static void smmu_inv_notifiers_mr(IOMMUMemoryRegion
*mr
)
475 trace_smmu_inv_notifiers_mr(mr
->parent_obj
.name
);
476 IOMMU_NOTIFIER_FOREACH(n
, mr
) {
477 memory_region_unmap_iommu_notifier_range(n
);
481 /* Unmap all notifiers of all mr's */
482 void smmu_inv_notifiers_all(SMMUState
*s
)
486 QLIST_FOREACH(sdev
, &s
->devices_with_notifiers
, next
) {
487 smmu_inv_notifiers_mr(&sdev
->iommu
);
/*
 * smmu_base_realize - realize handler of the abstract SMMU base device.
 *
 * The parent realize saved in sbc->parent_realize runs first and its error
 * is propagated to @errp. The handler then creates the s->configs table
 * (values released with g_free), the s->iotlb table (hashed and compared
 * with smmu_iotlb_key_hash / smmu_iotlb_key_equal) and the
 * s->smmu_pcibus_by_busptr table. When s->primary_bus is set,
 * smmu_find_add_as is installed with pci_setup_iommu(). The message
 * "SMMU is not attached to any PCI bus!" is reported through @errp.
 * NOTE(review): the condition around error_propagate(), the destroy
 * callbacks of the iotlb table and the else keyword before error_setg() are
 * not visible in this extract -- confirm against the full file.
 */
491 static void smmu_base_realize(DeviceState
*dev
, Error
**errp
)
493 SMMUState
*s
= ARM_SMMU(dev
);
494 SMMUBaseClass
*sbc
= ARM_SMMU_GET_CLASS(dev
);
495 Error
*local_err
= NULL
;
497 sbc
->parent_realize(dev
, &local_err
);
499 error_propagate(errp
, local_err
);
502 s
->configs
= g_hash_table_new_full(NULL
, NULL
, NULL
, g_free
);
503 s
->iotlb
= g_hash_table_new_full(smmu_iotlb_key_hash
, smmu_iotlb_key_equal
,
505 s
->smmu_pcibus_by_busptr
= g_hash_table_new(NULL
, NULL
);
507 if (s
->primary_bus
) {
508 pci_setup_iommu(s
->primary_bus
, smmu_find_add_as
, s
);
510 error_setg(errp
, "SMMU is not attached to any PCI bus!");
514 static void smmu_base_reset_hold(Object
*obj
)
516 SMMUState
*s
= ARM_SMMU(obj
);
518 g_hash_table_remove_all(s
->configs
);
519 g_hash_table_remove_all(s
->iotlb
);
522 static Property smmu_dev_properties
[] = {
523 DEFINE_PROP_UINT8("bus_num", SMMUState
, bus_num
, 0),
524 DEFINE_PROP_LINK("primary-bus", SMMUState
, primary_bus
,
525 TYPE_PCI_BUS
, PCIBus
*),
526 DEFINE_PROP_END_OF_LIST(),
529 static void smmu_base_class_init(ObjectClass
*klass
, void *data
)
531 DeviceClass
*dc
= DEVICE_CLASS(klass
);
532 ResettableClass
*rc
= RESETTABLE_CLASS(klass
);
533 SMMUBaseClass
*sbc
= ARM_SMMU_CLASS(klass
);
535 device_class_set_props(dc
, smmu_dev_properties
);
536 device_class_set_parent_realize(dc
, smmu_base_realize
,
537 &sbc
->parent_realize
);
538 rc
->phases
.hold
= smmu_base_reset_hold
;
/*
 * QOM type description of the SMMU base type: named TYPE_ARM_SMMU, derived
 * from TYPE_SYS_BUS_DEVICE, with SMMUState instances, SMMUBaseClass classes
 * and smmu_base_class_init as class initializer.
 * NOTE(review): original lines 545 and 548 are not visible in this extract,
 * so the initializer may set further fields -- confirm against the full file.
 */
541 static const TypeInfo smmu_base_info
= {
542 .name
= TYPE_ARM_SMMU
,
543 .parent
= TYPE_SYS_BUS_DEVICE
,
544 .instance_size
= sizeof(SMMUState
),
546 .class_size
= sizeof(SMMUBaseClass
),
547 .class_init
= smmu_base_class_init
,
551 static void smmu_base_register_types(void)
553 type_register_static(&smmu_base_info
);
556 type_init(smmu_base_register_types
)