提交 1d9efa73 编写于 作者: P Peter Xu 提交者: Michael S. Tsirkin

intel-iommu: add iommu lock

SECURITY IMPLICATION: this patch fixes a potential race when multiple
threads access the IOMMU IOTLB cache.

Add a per-iommu big lock to protect IOMMU status.  Currently the only
thing to be protected is the IOTLB/context cache, since that can be
accessed even without BQL, e.g., in IO dataplane.

Note that we don't need to protect device page tables since those are
fully controlled by the guest kernel.  However, there is still a
possibility that a malicious driver will program the device to disobey
the rules.  In that case QEMU can't really do anything useful; instead,
the guest itself will be responsible for all uncertainties.

CC: QEMU Stable <qemu-stable@nongnu.org>
Reported-by: Fam Zheng <famz@redhat.com>
Signed-off-by: Peter Xu <peterx@redhat.com>
Reviewed-by: Michael S. Tsirkin <mst@redhat.com>
Signed-off-by: Michael S. Tsirkin <mst@redhat.com>
上级 b4a4ba0d
...@@ -128,6 +128,16 @@ static uint64_t vtd_set_clear_mask_quad(IntelIOMMUState *s, hwaddr addr, ...@@ -128,6 +128,16 @@ static uint64_t vtd_set_clear_mask_quad(IntelIOMMUState *s, hwaddr addr,
return new_val; return new_val;
} }
/*
 * Acquire the per-IOMMU mutex (s->iommu_lock).  Every call must be
 * paired with vtd_iommu_unlock() on the same IntelIOMMUState.
 */
static inline void vtd_iommu_lock(IntelIOMMUState *s)
{
qemu_mutex_lock(&s->iommu_lock);
}
/*
 * Release the per-IOMMU mutex (s->iommu_lock) previously taken with
 * vtd_iommu_lock().
 */
static inline void vtd_iommu_unlock(IntelIOMMUState *s)
{
qemu_mutex_unlock(&s->iommu_lock);
}
/* GHashTable functions */ /* GHashTable functions */
static gboolean vtd_uint64_equal(gconstpointer v1, gconstpointer v2) static gboolean vtd_uint64_equal(gconstpointer v1, gconstpointer v2)
{ {
...@@ -172,9 +182,9 @@ static gboolean vtd_hash_remove_by_page(gpointer key, gpointer value, ...@@ -172,9 +182,9 @@ static gboolean vtd_hash_remove_by_page(gpointer key, gpointer value,
} }
/* Reset all the gen of VTDAddressSpace to zero and set the gen of /* Reset all the gen of VTDAddressSpace to zero and set the gen of
* IntelIOMMUState to 1. * IntelIOMMUState to 1. Must be called with IOMMU lock held.
*/ */
static void vtd_reset_context_cache(IntelIOMMUState *s) static void vtd_reset_context_cache_locked(IntelIOMMUState *s)
{ {
VTDAddressSpace *vtd_as; VTDAddressSpace *vtd_as;
VTDBus *vtd_bus; VTDBus *vtd_bus;
...@@ -197,12 +207,20 @@ static void vtd_reset_context_cache(IntelIOMMUState *s) ...@@ -197,12 +207,20 @@ static void vtd_reset_context_cache(IntelIOMMUState *s)
s->context_cache_gen = 1; s->context_cache_gen = 1;
} }
static void vtd_reset_iotlb(IntelIOMMUState *s) /* Must be called with IOMMU lock held. */
static void vtd_reset_iotlb_locked(IntelIOMMUState *s)
{ {
assert(s->iotlb); assert(s->iotlb);
g_hash_table_remove_all(s->iotlb); g_hash_table_remove_all(s->iotlb);
} }
/*
 * Drop every entry from the IOTLB, taking the IOMMU lock around the
 * reset.  Code paths that already hold the lock call
 * vtd_reset_iotlb_locked() directly instead.
 */
static void vtd_reset_iotlb(IntelIOMMUState *s)
{
vtd_iommu_lock(s);
vtd_reset_iotlb_locked(s);
vtd_iommu_unlock(s);
}
static uint64_t vtd_get_iotlb_key(uint64_t gfn, uint16_t source_id, static uint64_t vtd_get_iotlb_key(uint64_t gfn, uint16_t source_id,
uint32_t level) uint32_t level)
{ {
...@@ -215,6 +233,7 @@ static uint64_t vtd_get_iotlb_gfn(hwaddr addr, uint32_t level) ...@@ -215,6 +233,7 @@ static uint64_t vtd_get_iotlb_gfn(hwaddr addr, uint32_t level)
return (addr & vtd_slpt_level_page_mask(level)) >> VTD_PAGE_SHIFT_4K; return (addr & vtd_slpt_level_page_mask(level)) >> VTD_PAGE_SHIFT_4K;
} }
/* Must be called with IOMMU lock held */
static VTDIOTLBEntry *vtd_lookup_iotlb(IntelIOMMUState *s, uint16_t source_id, static VTDIOTLBEntry *vtd_lookup_iotlb(IntelIOMMUState *s, uint16_t source_id,
hwaddr addr) hwaddr addr)
{ {
...@@ -235,6 +254,7 @@ out: ...@@ -235,6 +254,7 @@ out:
return entry; return entry;
} }
/* Must be called with IOMMU lock held */
static void vtd_update_iotlb(IntelIOMMUState *s, uint16_t source_id, static void vtd_update_iotlb(IntelIOMMUState *s, uint16_t source_id,
uint16_t domain_id, hwaddr addr, uint64_t slpte, uint16_t domain_id, hwaddr addr, uint64_t slpte,
uint8_t access_flags, uint32_t level) uint8_t access_flags, uint32_t level)
...@@ -246,7 +266,7 @@ static void vtd_update_iotlb(IntelIOMMUState *s, uint16_t source_id, ...@@ -246,7 +266,7 @@ static void vtd_update_iotlb(IntelIOMMUState *s, uint16_t source_id,
trace_vtd_iotlb_page_update(source_id, addr, slpte, domain_id); trace_vtd_iotlb_page_update(source_id, addr, slpte, domain_id);
if (g_hash_table_size(s->iotlb) >= VTD_IOTLB_MAX_SIZE) { if (g_hash_table_size(s->iotlb) >= VTD_IOTLB_MAX_SIZE) {
trace_vtd_iotlb_reset("iotlb exceeds size limit"); trace_vtd_iotlb_reset("iotlb exceeds size limit");
vtd_reset_iotlb(s); vtd_reset_iotlb_locked(s);
} }
entry->gfn = gfn; entry->gfn = gfn;
...@@ -1106,7 +1126,7 @@ static bool vtd_do_iommu_translate(VTDAddressSpace *vtd_as, PCIBus *bus, ...@@ -1106,7 +1126,7 @@ static bool vtd_do_iommu_translate(VTDAddressSpace *vtd_as, PCIBus *bus,
IntelIOMMUState *s = vtd_as->iommu_state; IntelIOMMUState *s = vtd_as->iommu_state;
VTDContextEntry ce; VTDContextEntry ce;
uint8_t bus_num = pci_bus_num(bus); uint8_t bus_num = pci_bus_num(bus);
VTDContextCacheEntry *cc_entry = &vtd_as->context_cache_entry; VTDContextCacheEntry *cc_entry;
uint64_t slpte, page_mask; uint64_t slpte, page_mask;
uint32_t level; uint32_t level;
uint16_t source_id = vtd_make_source_id(bus_num, devfn); uint16_t source_id = vtd_make_source_id(bus_num, devfn);
...@@ -1123,6 +1143,10 @@ static bool vtd_do_iommu_translate(VTDAddressSpace *vtd_as, PCIBus *bus, ...@@ -1123,6 +1143,10 @@ static bool vtd_do_iommu_translate(VTDAddressSpace *vtd_as, PCIBus *bus,
*/ */
assert(!vtd_is_interrupt_addr(addr)); assert(!vtd_is_interrupt_addr(addr));
vtd_iommu_lock(s);
cc_entry = &vtd_as->context_cache_entry;
/* Try to fetch slpte from IOTLB */ /* Try to fetch slpte from IOTLB */
iotlb_entry = vtd_lookup_iotlb(s, source_id, addr); iotlb_entry = vtd_lookup_iotlb(s, source_id, addr);
if (iotlb_entry) { if (iotlb_entry) {
...@@ -1182,7 +1206,7 @@ static bool vtd_do_iommu_translate(VTDAddressSpace *vtd_as, PCIBus *bus, ...@@ -1182,7 +1206,7 @@ static bool vtd_do_iommu_translate(VTDAddressSpace *vtd_as, PCIBus *bus,
* IOMMU region can be swapped back. * IOMMU region can be swapped back.
*/ */
vtd_pt_enable_fast_path(s, source_id); vtd_pt_enable_fast_path(s, source_id);
vtd_iommu_unlock(s);
return true; return true;
} }
...@@ -1203,6 +1227,7 @@ static bool vtd_do_iommu_translate(VTDAddressSpace *vtd_as, PCIBus *bus, ...@@ -1203,6 +1227,7 @@ static bool vtd_do_iommu_translate(VTDAddressSpace *vtd_as, PCIBus *bus,
vtd_update_iotlb(s, source_id, VTD_CONTEXT_ENTRY_DID(ce.hi), addr, slpte, vtd_update_iotlb(s, source_id, VTD_CONTEXT_ENTRY_DID(ce.hi), addr, slpte,
access_flags, level); access_flags, level);
out: out:
vtd_iommu_unlock(s);
entry->iova = addr & page_mask; entry->iova = addr & page_mask;
entry->translated_addr = vtd_get_slpte_addr(slpte, s->aw_bits) & page_mask; entry->translated_addr = vtd_get_slpte_addr(slpte, s->aw_bits) & page_mask;
entry->addr_mask = ~page_mask; entry->addr_mask = ~page_mask;
...@@ -1210,6 +1235,7 @@ out: ...@@ -1210,6 +1235,7 @@ out:
return true; return true;
error: error:
vtd_iommu_unlock(s);
entry->iova = 0; entry->iova = 0;
entry->translated_addr = 0; entry->translated_addr = 0;
entry->addr_mask = 0; entry->addr_mask = 0;
...@@ -1258,10 +1284,13 @@ static void vtd_iommu_replay_all(IntelIOMMUState *s) ...@@ -1258,10 +1284,13 @@ static void vtd_iommu_replay_all(IntelIOMMUState *s)
static void vtd_context_global_invalidate(IntelIOMMUState *s) static void vtd_context_global_invalidate(IntelIOMMUState *s)
{ {
trace_vtd_inv_desc_cc_global(); trace_vtd_inv_desc_cc_global();
/* Protects context cache */
vtd_iommu_lock(s);
s->context_cache_gen++; s->context_cache_gen++;
if (s->context_cache_gen == VTD_CONTEXT_CACHE_GEN_MAX) { if (s->context_cache_gen == VTD_CONTEXT_CACHE_GEN_MAX) {
vtd_reset_context_cache(s); vtd_reset_context_cache_locked(s);
} }
vtd_iommu_unlock(s);
vtd_switch_address_space_all(s); vtd_switch_address_space_all(s);
/* /*
* From VT-d spec 6.5.2.1, a global context entry invalidation * From VT-d spec 6.5.2.1, a global context entry invalidation
...@@ -1313,7 +1342,9 @@ static void vtd_context_device_invalidate(IntelIOMMUState *s, ...@@ -1313,7 +1342,9 @@ static void vtd_context_device_invalidate(IntelIOMMUState *s,
if (vtd_as && ((devfn_it & mask) == (devfn & mask))) { if (vtd_as && ((devfn_it & mask) == (devfn & mask))) {
trace_vtd_inv_desc_cc_device(bus_n, VTD_PCI_SLOT(devfn_it), trace_vtd_inv_desc_cc_device(bus_n, VTD_PCI_SLOT(devfn_it),
VTD_PCI_FUNC(devfn_it)); VTD_PCI_FUNC(devfn_it));
vtd_iommu_lock(s);
vtd_as->context_cache_entry.context_cache_gen = 0; vtd_as->context_cache_entry.context_cache_gen = 0;
vtd_iommu_unlock(s);
/* /*
* Do switch address space when needed, in case if the * Do switch address space when needed, in case if the
* device passthrough bit is switched. * device passthrough bit is switched.
...@@ -1377,8 +1408,10 @@ static void vtd_iotlb_domain_invalidate(IntelIOMMUState *s, uint16_t domain_id) ...@@ -1377,8 +1408,10 @@ static void vtd_iotlb_domain_invalidate(IntelIOMMUState *s, uint16_t domain_id)
trace_vtd_inv_desc_iotlb_domain(domain_id); trace_vtd_inv_desc_iotlb_domain(domain_id);
vtd_iommu_lock(s);
g_hash_table_foreach_remove(s->iotlb, vtd_hash_remove_by_domain, g_hash_table_foreach_remove(s->iotlb, vtd_hash_remove_by_domain,
&domain_id); &domain_id);
vtd_iommu_unlock(s);
QLIST_FOREACH(vtd_as, &s->vtd_as_with_notifiers, next) { QLIST_FOREACH(vtd_as, &s->vtd_as_with_notifiers, next) {
if (!vtd_dev_to_context_entry(s, pci_bus_num(vtd_as->bus), if (!vtd_dev_to_context_entry(s, pci_bus_num(vtd_as->bus),
...@@ -1426,7 +1459,9 @@ static void vtd_iotlb_page_invalidate(IntelIOMMUState *s, uint16_t domain_id, ...@@ -1426,7 +1459,9 @@ static void vtd_iotlb_page_invalidate(IntelIOMMUState *s, uint16_t domain_id,
info.domain_id = domain_id; info.domain_id = domain_id;
info.addr = addr; info.addr = addr;
info.mask = ~((1 << am) - 1); info.mask = ~((1 << am) - 1);
vtd_iommu_lock(s);
g_hash_table_foreach_remove(s->iotlb, vtd_hash_remove_by_page, &info); g_hash_table_foreach_remove(s->iotlb, vtd_hash_remove_by_page, &info);
vtd_iommu_unlock(s);
vtd_iotlb_page_invalidate_notify(s, domain_id, addr, am); vtd_iotlb_page_invalidate_notify(s, domain_id, addr, am);
} }
...@@ -2929,8 +2964,10 @@ static void vtd_init(IntelIOMMUState *s) ...@@ -2929,8 +2964,10 @@ static void vtd_init(IntelIOMMUState *s)
s->cap |= VTD_CAP_CM; s->cap |= VTD_CAP_CM;
} }
vtd_reset_context_cache(s); vtd_iommu_lock(s);
vtd_reset_iotlb(s); vtd_reset_context_cache_locked(s);
vtd_reset_iotlb_locked(s);
vtd_iommu_unlock(s);
/* Define registers with default values and bit semantics */ /* Define registers with default values and bit semantics */
vtd_define_long(s, DMAR_VER_REG, 0x10UL, 0, 0); vtd_define_long(s, DMAR_VER_REG, 0x10UL, 0, 0);
...@@ -3070,6 +3107,7 @@ static void vtd_realize(DeviceState *dev, Error **errp) ...@@ -3070,6 +3107,7 @@ static void vtd_realize(DeviceState *dev, Error **errp)
} }
QLIST_INIT(&s->vtd_as_with_notifiers); QLIST_INIT(&s->vtd_as_with_notifiers);
qemu_mutex_init(&s->iommu_lock);
memset(s->vtd_as_by_bus_num, 0, sizeof(s->vtd_as_by_bus_num)); memset(s->vtd_as_by_bus_num, 0, sizeof(s->vtd_as_by_bus_num));
memory_region_init_io(&s->csrmem, OBJECT(s), &vtd_mem_ops, s, memory_region_init_io(&s->csrmem, OBJECT(s), &vtd_mem_ops, s,
"intel_iommu", DMAR_REG_SIZE); "intel_iommu", DMAR_REG_SIZE);
......
...@@ -300,6 +300,12 @@ struct IntelIOMMUState { ...@@ -300,6 +300,12 @@ struct IntelIOMMUState {
OnOffAuto intr_eim; /* Toggle for EIM capability */ OnOffAuto intr_eim; /* Toggle for EIM capability */
bool buggy_eim; /* Force buggy EIM unless eim=off */ bool buggy_eim; /* Force buggy EIM unless eim=off */
uint8_t aw_bits; /* Host/IOVA address width (in bits) */ uint8_t aw_bits; /* Host/IOVA address width (in bits) */
/*
* Protects IOMMU states in general. Currently it protects the
* per-IOMMU IOTLB cache, and context entry cache in VTDAddressSpace.
*/
QemuMutex iommu_lock;
}; };
/* Find the VTD Address space associated with the given bus pointer, /* Find the VTD Address space associated with the given bus pointer,
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册