@@ -2005,6 +2005,11 @@ static const MemoryRegionOps vtd_mem_ops = {
static Property vtd_properties[] = {
DEFINE_PROP_UINT32("version", IntelIOMMUState, version, 0),
+ /*
+ * TODO: currently EIM is disabled by default. We can enable this
+ * after fully support x2apic.
+ */
+ DEFINE_PROP_BOOL("eim", IntelIOMMUState, eim_supported, false),
DEFINE_PROP_END_OF_LIST(),
};
@@ -2364,7 +2369,10 @@ static void vtd_init(IntelIOMMUState *s)
s->ecap = VTD_ECAP_QI | VTD_ECAP_IRO;
if (x86_iommu->intr_supported) {
- s->ecap |= VTD_ECAP_IR | VTD_ECAP_EIM | VTD_ECAP_MHMV;
+ s->ecap |= VTD_ECAP_IR | VTD_ECAP_MHMV;
+ if (s->eim_supported) {
+ s->ecap |= VTD_ECAP_EIM;
+ }
}
vtd_reset_context_cache(s);
@@ -2468,6 +2476,12 @@ static void vtd_realize(DeviceState *dev, Error **errp)
/* Pseudo address space under root PCI bus. */
pcms->ioapic_as = vtd_host_dma_iommu(bus, s, Q35_PSEUDO_DEVFN_IOAPIC);
+ /* EIM bit requires IR */
+ if (s->eim_supported && !x86_iommu->intr_supported) {
+ error_report("EIM (Extended Interrupt Mode) bit requires intremap=on");
+ exit(1);
+ }
+
/* Currently Intel IOMMU IR only support "kernel-irqchip={off|split}" */
if (x86_iommu->intr_supported && kvm_irqchip_in_kernel() &&
!kvm_irqchip_is_split()) {
@@ -289,6 +289,7 @@ struct IntelIOMMUState {
dma_addr_t intr_root; /* Interrupt remapping table pointer */
uint32_t intr_size; /* Number of IR table entries */
bool intr_eime; /* Extended interrupt mode enabled */
+ bool eim_supported; /* Whether to allow EIM bit */
};
/* Find the VTD Address space associated with the given bus pointer,
Adding one extra property for intel-iommu device to decide whether we should support EIM bit for IR. Now we are throwing high 24 bits of dest_id away directly. This will cause interrupt issues with guests that: - enabled x2apic with cluster mode - have more than 8 vcpus (so dest_id[31:8] might be nonzero) Let's make xapic the default one, and for the brave people who would like to try EIM and know the side effects, we can do it by explicitly enabling EIM using: -device intel-iommu,intremap=on,eim=on Even after we have x2apic support, it'll still be good if we can provide a way to switch xapic/x2apic from QEMU side for e.g. debugging purpose, which is an alternative for tuning guest kernel boot parameters. We can switch the default to "on" after x2apic fully supported. Signed-off-by: Peter Xu <peterx@redhat.com> --- hw/i386/intel_iommu.c | 16 +++++++++++++++- include/hw/i386/intel_iommu.h | 1 + 2 files changed, 16 insertions(+), 1 deletion(-)