Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
| 2 | |
| 3 | #define pr_fmt(fmt) "DMAR-IR: " fmt |
| 4 | |
| 5 | #include <linux/interrupt.h> |
| 6 | #include <linux/dmar.h> |
| 7 | #include <linux/spinlock.h> |
| 8 | #include <linux/slab.h> |
| 9 | #include <linux/jiffies.h> |
| 10 | #include <linux/hpet.h> |
| 11 | #include <linux/pci.h> |
| 12 | #include <linux/irq.h> |
| 13 | #include <linux/intel-iommu.h> |
| 14 | #include <linux/acpi.h> |
| 15 | #include <linux/irqdomain.h> |
| 16 | #include <linux/crash_dump.h> |
| 17 | #include <asm/io_apic.h> |
| 18 | #include <asm/smp.h> |
| 19 | #include <asm/cpu.h> |
| 20 | #include <asm/irq_remapping.h> |
| 21 | #include <asm/pci-direct.h> |
| 22 | #include <asm/msidef.h> |
| 23 | |
| 24 | #include "irq_remapping.h" |
| 25 | |
| 26 | enum irq_mode { |
| 27 | IRQ_REMAPPING, |
| 28 | IRQ_POSTING, |
| 29 | }; |
| 30 | |
| 31 | struct ioapic_scope { |
| 32 | struct intel_iommu *iommu; |
| 33 | unsigned int id; |
| 34 | unsigned int bus; /* PCI bus number */ |
| 35 | unsigned int devfn; /* PCI devfn number */ |
| 36 | }; |
| 37 | |
| 38 | struct hpet_scope { |
| 39 | struct intel_iommu *iommu; |
| 40 | u8 id; |
| 41 | unsigned int bus; |
| 42 | unsigned int devfn; |
| 43 | }; |
| 44 | |
| 45 | struct irq_2_iommu { |
| 46 | struct intel_iommu *iommu; |
| 47 | u16 irte_index; |
| 48 | u16 sub_handle; |
| 49 | u8 irte_mask; |
| 50 | enum irq_mode mode; |
| 51 | }; |
| 52 | |
| 53 | struct intel_ir_data { |
| 54 | struct irq_2_iommu irq_2_iommu; |
| 55 | struct irte irte_entry; |
| 56 | union { |
| 57 | struct msi_msg msi_entry; |
| 58 | }; |
| 59 | }; |
| 60 | |
| 61 | #define IR_X2APIC_MODE(mode) (mode ? (1 << 11) : 0) |
| 62 | #define IRTE_DEST(dest) ((eim_mode) ? dest : dest << 8) |
| 63 | |
| 64 | static int __read_mostly eim_mode; |
| 65 | static struct ioapic_scope ir_ioapic[MAX_IO_APICS]; |
| 66 | static struct hpet_scope ir_hpet[MAX_HPET_TBS]; |
| 67 | |
| 68 | /* |
| 69 | * Lock ordering: |
| 70 | * ->dmar_global_lock |
| 71 | * ->irq_2_ir_lock |
| 72 | * ->qi->q_lock |
| 73 | * ->iommu->register_lock |
| 74 | * Note: |
| 75 | * intel_irq_remap_ops.{supported,prepare,enable,disable,reenable} are called |
| 76 | * in single-threaded environment with interrupt disabled, so no need to tabke |
| 77 | * the dmar_global_lock. |
| 78 | */ |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 79 | DEFINE_RAW_SPINLOCK(irq_2_ir_lock); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 80 | static const struct irq_domain_ops intel_ir_domain_ops; |
| 81 | |
| 82 | static void iommu_disable_irq_remapping(struct intel_iommu *iommu); |
| 83 | static int __init parse_ioapics_under_ir(void); |
| 84 | |
| 85 | static bool ir_pre_enabled(struct intel_iommu *iommu) |
| 86 | { |
| 87 | return (iommu->flags & VTD_FLAG_IRQ_REMAP_PRE_ENABLED); |
| 88 | } |
| 89 | |
| 90 | static void clear_ir_pre_enabled(struct intel_iommu *iommu) |
| 91 | { |
| 92 | iommu->flags &= ~VTD_FLAG_IRQ_REMAP_PRE_ENABLED; |
| 93 | } |
| 94 | |
| 95 | static void init_ir_status(struct intel_iommu *iommu) |
| 96 | { |
| 97 | u32 gsts; |
| 98 | |
| 99 | gsts = readl(iommu->reg + DMAR_GSTS_REG); |
| 100 | if (gsts & DMA_GSTS_IRES) |
| 101 | iommu->flags |= VTD_FLAG_IRQ_REMAP_PRE_ENABLED; |
| 102 | } |
| 103 | |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 104 | static int alloc_irte(struct intel_iommu *iommu, |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 105 | struct irq_2_iommu *irq_iommu, u16 count) |
| 106 | { |
| 107 | struct ir_table *table = iommu->ir_table; |
| 108 | unsigned int mask = 0; |
| 109 | unsigned long flags; |
| 110 | int index; |
| 111 | |
| 112 | if (!count || !irq_iommu) |
| 113 | return -1; |
| 114 | |
| 115 | if (count > 1) { |
| 116 | count = __roundup_pow_of_two(count); |
| 117 | mask = ilog2(count); |
| 118 | } |
| 119 | |
| 120 | if (mask > ecap_max_handle_mask(iommu->ecap)) { |
| 121 | pr_err("Requested mask %x exceeds the max invalidation handle" |
| 122 | " mask value %Lx\n", mask, |
| 123 | ecap_max_handle_mask(iommu->ecap)); |
| 124 | return -1; |
| 125 | } |
| 126 | |
| 127 | raw_spin_lock_irqsave(&irq_2_ir_lock, flags); |
| 128 | index = bitmap_find_free_region(table->bitmap, |
| 129 | INTR_REMAP_TABLE_ENTRIES, mask); |
| 130 | if (index < 0) { |
| 131 | pr_warn("IR%d: can't allocate an IRTE\n", iommu->seq_id); |
| 132 | } else { |
| 133 | irq_iommu->iommu = iommu; |
| 134 | irq_iommu->irte_index = index; |
| 135 | irq_iommu->sub_handle = 0; |
| 136 | irq_iommu->irte_mask = mask; |
| 137 | irq_iommu->mode = IRQ_REMAPPING; |
| 138 | } |
| 139 | raw_spin_unlock_irqrestore(&irq_2_ir_lock, flags); |
| 140 | |
| 141 | return index; |
| 142 | } |
| 143 | |
| 144 | static int qi_flush_iec(struct intel_iommu *iommu, int index, int mask) |
| 145 | { |
| 146 | struct qi_desc desc; |
| 147 | |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 148 | desc.qw0 = QI_IEC_IIDEX(index) | QI_IEC_TYPE | QI_IEC_IM(mask) |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 149 | | QI_IEC_SELECTIVE; |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 150 | desc.qw1 = 0; |
| 151 | desc.qw2 = 0; |
| 152 | desc.qw3 = 0; |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 153 | |
| 154 | return qi_submit_sync(&desc, iommu); |
| 155 | } |
| 156 | |
| 157 | static int modify_irte(struct irq_2_iommu *irq_iommu, |
| 158 | struct irte *irte_modified) |
| 159 | { |
| 160 | struct intel_iommu *iommu; |
| 161 | unsigned long flags; |
| 162 | struct irte *irte; |
| 163 | int rc, index; |
| 164 | |
| 165 | if (!irq_iommu) |
| 166 | return -1; |
| 167 | |
| 168 | raw_spin_lock_irqsave(&irq_2_ir_lock, flags); |
| 169 | |
| 170 | iommu = irq_iommu->iommu; |
| 171 | |
| 172 | index = irq_iommu->irte_index + irq_iommu->sub_handle; |
| 173 | irte = &iommu->ir_table->base[index]; |
| 174 | |
| 175 | #if defined(CONFIG_HAVE_CMPXCHG_DOUBLE) |
| 176 | if ((irte->pst == 1) || (irte_modified->pst == 1)) { |
| 177 | bool ret; |
| 178 | |
| 179 | ret = cmpxchg_double(&irte->low, &irte->high, |
| 180 | irte->low, irte->high, |
| 181 | irte_modified->low, irte_modified->high); |
| 182 | /* |
| 183 | * We use cmpxchg16 to atomically update the 128-bit IRTE, |
| 184 | * and it cannot be updated by the hardware or other processors |
| 185 | * behind us, so the return value of cmpxchg16 should be the |
| 186 | * same as the old value. |
| 187 | */ |
| 188 | WARN_ON(!ret); |
| 189 | } else |
| 190 | #endif |
| 191 | { |
| 192 | set_64bit(&irte->low, irte_modified->low); |
| 193 | set_64bit(&irte->high, irte_modified->high); |
| 194 | } |
| 195 | __iommu_flush_cache(iommu, irte, sizeof(*irte)); |
| 196 | |
| 197 | rc = qi_flush_iec(iommu, index, 0); |
| 198 | |
| 199 | /* Update iommu mode according to the IRTE mode */ |
| 200 | irq_iommu->mode = irte->pst ? IRQ_POSTING : IRQ_REMAPPING; |
| 201 | raw_spin_unlock_irqrestore(&irq_2_ir_lock, flags); |
| 202 | |
| 203 | return rc; |
| 204 | } |
| 205 | |
| 206 | static struct intel_iommu *map_hpet_to_ir(u8 hpet_id) |
| 207 | { |
| 208 | int i; |
| 209 | |
| 210 | for (i = 0; i < MAX_HPET_TBS; i++) |
| 211 | if (ir_hpet[i].id == hpet_id && ir_hpet[i].iommu) |
| 212 | return ir_hpet[i].iommu; |
| 213 | return NULL; |
| 214 | } |
| 215 | |
| 216 | static struct intel_iommu *map_ioapic_to_ir(int apic) |
| 217 | { |
| 218 | int i; |
| 219 | |
| 220 | for (i = 0; i < MAX_IO_APICS; i++) |
| 221 | if (ir_ioapic[i].id == apic && ir_ioapic[i].iommu) |
| 222 | return ir_ioapic[i].iommu; |
| 223 | return NULL; |
| 224 | } |
| 225 | |
| 226 | static struct intel_iommu *map_dev_to_ir(struct pci_dev *dev) |
| 227 | { |
| 228 | struct dmar_drhd_unit *drhd; |
| 229 | |
| 230 | drhd = dmar_find_matched_drhd_unit(dev); |
| 231 | if (!drhd) |
| 232 | return NULL; |
| 233 | |
| 234 | return drhd->iommu; |
| 235 | } |
| 236 | |
| 237 | static int clear_entries(struct irq_2_iommu *irq_iommu) |
| 238 | { |
| 239 | struct irte *start, *entry, *end; |
| 240 | struct intel_iommu *iommu; |
| 241 | int index; |
| 242 | |
| 243 | if (irq_iommu->sub_handle) |
| 244 | return 0; |
| 245 | |
| 246 | iommu = irq_iommu->iommu; |
| 247 | index = irq_iommu->irte_index; |
| 248 | |
| 249 | start = iommu->ir_table->base + index; |
| 250 | end = start + (1 << irq_iommu->irte_mask); |
| 251 | |
| 252 | for (entry = start; entry < end; entry++) { |
| 253 | set_64bit(&entry->low, 0); |
| 254 | set_64bit(&entry->high, 0); |
| 255 | } |
| 256 | bitmap_release_region(iommu->ir_table->bitmap, index, |
| 257 | irq_iommu->irte_mask); |
| 258 | |
| 259 | return qi_flush_iec(iommu, index, irq_iommu->irte_mask); |
| 260 | } |
| 261 | |
| 262 | /* |
| 263 | * source validation type |
| 264 | */ |
| 265 | #define SVT_NO_VERIFY 0x0 /* no verification is required */ |
| 266 | #define SVT_VERIFY_SID_SQ 0x1 /* verify using SID and SQ fields */ |
| 267 | #define SVT_VERIFY_BUS 0x2 /* verify bus of request-id */ |
| 268 | |
| 269 | /* |
| 270 | * source-id qualifier |
| 271 | */ |
| 272 | #define SQ_ALL_16 0x0 /* verify all 16 bits of request-id */ |
| 273 | #define SQ_13_IGNORE_1 0x1 /* verify most significant 13 bits, ignore |
| 274 | * the third least significant bit |
| 275 | */ |
| 276 | #define SQ_13_IGNORE_2 0x2 /* verify most significant 13 bits, ignore |
| 277 | * the second and third least significant bits |
| 278 | */ |
| 279 | #define SQ_13_IGNORE_3 0x3 /* verify most significant 13 bits, ignore |
| 280 | * the least three significant bits |
| 281 | */ |
| 282 | |
| 283 | /* |
| 284 | * set SVT, SQ and SID fields of irte to verify |
| 285 | * source ids of interrupt requests |
| 286 | */ |
| 287 | static void set_irte_sid(struct irte *irte, unsigned int svt, |
| 288 | unsigned int sq, unsigned int sid) |
| 289 | { |
| 290 | if (disable_sourceid_checking) |
| 291 | svt = SVT_NO_VERIFY; |
| 292 | irte->svt = svt; |
| 293 | irte->sq = sq; |
| 294 | irte->sid = sid; |
| 295 | } |
| 296 | |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 297 | /* |
| 298 | * Set an IRTE to match only the bus number. Interrupt requests that reference |
| 299 | * this IRTE must have a requester-id whose bus number is between or equal |
| 300 | * to the start_bus and end_bus arguments. |
| 301 | */ |
| 302 | static void set_irte_verify_bus(struct irte *irte, unsigned int start_bus, |
| 303 | unsigned int end_bus) |
| 304 | { |
| 305 | set_irte_sid(irte, SVT_VERIFY_BUS, SQ_ALL_16, |
| 306 | (start_bus << 8) | end_bus); |
| 307 | } |
| 308 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 309 | static int set_ioapic_sid(struct irte *irte, int apic) |
| 310 | { |
| 311 | int i; |
| 312 | u16 sid = 0; |
| 313 | |
| 314 | if (!irte) |
| 315 | return -1; |
| 316 | |
| 317 | down_read(&dmar_global_lock); |
| 318 | for (i = 0; i < MAX_IO_APICS; i++) { |
| 319 | if (ir_ioapic[i].iommu && ir_ioapic[i].id == apic) { |
| 320 | sid = (ir_ioapic[i].bus << 8) | ir_ioapic[i].devfn; |
| 321 | break; |
| 322 | } |
| 323 | } |
| 324 | up_read(&dmar_global_lock); |
| 325 | |
| 326 | if (sid == 0) { |
| 327 | pr_warn("Failed to set source-id of IOAPIC (%d)\n", apic); |
| 328 | return -1; |
| 329 | } |
| 330 | |
| 331 | set_irte_sid(irte, SVT_VERIFY_SID_SQ, SQ_ALL_16, sid); |
| 332 | |
| 333 | return 0; |
| 334 | } |
| 335 | |
| 336 | static int set_hpet_sid(struct irte *irte, u8 id) |
| 337 | { |
| 338 | int i; |
| 339 | u16 sid = 0; |
| 340 | |
| 341 | if (!irte) |
| 342 | return -1; |
| 343 | |
| 344 | down_read(&dmar_global_lock); |
| 345 | for (i = 0; i < MAX_HPET_TBS; i++) { |
| 346 | if (ir_hpet[i].iommu && ir_hpet[i].id == id) { |
| 347 | sid = (ir_hpet[i].bus << 8) | ir_hpet[i].devfn; |
| 348 | break; |
| 349 | } |
| 350 | } |
| 351 | up_read(&dmar_global_lock); |
| 352 | |
| 353 | if (sid == 0) { |
| 354 | pr_warn("Failed to set source-id of HPET block (%d)\n", id); |
| 355 | return -1; |
| 356 | } |
| 357 | |
| 358 | /* |
| 359 | * Should really use SQ_ALL_16. Some platforms are broken. |
| 360 | * While we figure out the right quirks for these broken platforms, use |
| 361 | * SQ_13_IGNORE_3 for now. |
| 362 | */ |
| 363 | set_irte_sid(irte, SVT_VERIFY_SID_SQ, SQ_13_IGNORE_3, sid); |
| 364 | |
| 365 | return 0; |
| 366 | } |
| 367 | |
| 368 | struct set_msi_sid_data { |
| 369 | struct pci_dev *pdev; |
| 370 | u16 alias; |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 371 | int count; |
| 372 | int busmatch_count; |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 373 | }; |
| 374 | |
| 375 | static int set_msi_sid_cb(struct pci_dev *pdev, u16 alias, void *opaque) |
| 376 | { |
| 377 | struct set_msi_sid_data *data = opaque; |
| 378 | |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 379 | if (data->count == 0 || PCI_BUS_NUM(alias) == PCI_BUS_NUM(data->alias)) |
| 380 | data->busmatch_count++; |
| 381 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 382 | data->pdev = pdev; |
| 383 | data->alias = alias; |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 384 | data->count++; |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 385 | |
| 386 | return 0; |
| 387 | } |
| 388 | |
| 389 | static int set_msi_sid(struct irte *irte, struct pci_dev *dev) |
| 390 | { |
| 391 | struct set_msi_sid_data data; |
| 392 | |
| 393 | if (!irte || !dev) |
| 394 | return -1; |
| 395 | |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 396 | data.count = 0; |
| 397 | data.busmatch_count = 0; |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 398 | pci_for_each_dma_alias(dev, set_msi_sid_cb, &data); |
| 399 | |
| 400 | /* |
| 401 | * DMA alias provides us with a PCI device and alias. The only case |
| 402 | * where the it will return an alias on a different bus than the |
| 403 | * device is the case of a PCIe-to-PCI bridge, where the alias is for |
| 404 | * the subordinate bus. In this case we can only verify the bus. |
| 405 | * |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 406 | * If there are multiple aliases, all with the same bus number, |
| 407 | * then all we can do is verify the bus. This is typical in NTB |
| 408 | * hardware which use proxy IDs where the device will generate traffic |
| 409 | * from multiple devfn numbers on the same bus. |
| 410 | * |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 411 | * If the alias device is on a different bus than our source device |
| 412 | * then we have a topology based alias, use it. |
| 413 | * |
| 414 | * Otherwise, the alias is for a device DMA quirk and we cannot |
| 415 | * assume that MSI uses the same requester ID. Therefore use the |
| 416 | * original device. |
| 417 | */ |
| 418 | if (PCI_BUS_NUM(data.alias) != data.pdev->bus->number) |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 419 | set_irte_verify_bus(irte, PCI_BUS_NUM(data.alias), |
| 420 | dev->bus->number); |
| 421 | else if (data.count >= 2 && data.busmatch_count == data.count) |
| 422 | set_irte_verify_bus(irte, dev->bus->number, dev->bus->number); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 423 | else if (data.pdev->bus->number != dev->bus->number) |
| 424 | set_irte_sid(irte, SVT_VERIFY_SID_SQ, SQ_ALL_16, data.alias); |
| 425 | else |
| 426 | set_irte_sid(irte, SVT_VERIFY_SID_SQ, SQ_ALL_16, |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 427 | pci_dev_id(dev)); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 428 | |
| 429 | return 0; |
| 430 | } |
| 431 | |
| 432 | static int iommu_load_old_irte(struct intel_iommu *iommu) |
| 433 | { |
| 434 | struct irte *old_ir_table; |
| 435 | phys_addr_t irt_phys; |
| 436 | unsigned int i; |
| 437 | size_t size; |
| 438 | u64 irta; |
| 439 | |
| 440 | /* Check whether the old ir-table has the same size as ours */ |
| 441 | irta = dmar_readq(iommu->reg + DMAR_IRTA_REG); |
| 442 | if ((irta & INTR_REMAP_TABLE_REG_SIZE_MASK) |
| 443 | != INTR_REMAP_TABLE_REG_SIZE) |
| 444 | return -EINVAL; |
| 445 | |
| 446 | irt_phys = irta & VTD_PAGE_MASK; |
| 447 | size = INTR_REMAP_TABLE_ENTRIES*sizeof(struct irte); |
| 448 | |
| 449 | /* Map the old IR table */ |
| 450 | old_ir_table = memremap(irt_phys, size, MEMREMAP_WB); |
| 451 | if (!old_ir_table) |
| 452 | return -ENOMEM; |
| 453 | |
| 454 | /* Copy data over */ |
| 455 | memcpy(iommu->ir_table->base, old_ir_table, size); |
| 456 | |
| 457 | __iommu_flush_cache(iommu, iommu->ir_table->base, size); |
| 458 | |
| 459 | /* |
| 460 | * Now check the table for used entries and mark those as |
| 461 | * allocated in the bitmap |
| 462 | */ |
| 463 | for (i = 0; i < INTR_REMAP_TABLE_ENTRIES; i++) { |
| 464 | if (iommu->ir_table->base[i].present) |
| 465 | bitmap_set(iommu->ir_table->bitmap, i, 1); |
| 466 | } |
| 467 | |
| 468 | memunmap(old_ir_table); |
| 469 | |
| 470 | return 0; |
| 471 | } |
| 472 | |
| 473 | |
| 474 | static void iommu_set_irq_remapping(struct intel_iommu *iommu, int mode) |
| 475 | { |
| 476 | unsigned long flags; |
| 477 | u64 addr; |
| 478 | u32 sts; |
| 479 | |
| 480 | addr = virt_to_phys((void *)iommu->ir_table->base); |
| 481 | |
| 482 | raw_spin_lock_irqsave(&iommu->register_lock, flags); |
| 483 | |
| 484 | dmar_writeq(iommu->reg + DMAR_IRTA_REG, |
| 485 | (addr) | IR_X2APIC_MODE(mode) | INTR_REMAP_TABLE_REG_SIZE); |
| 486 | |
| 487 | /* Set interrupt-remapping table pointer */ |
| 488 | writel(iommu->gcmd | DMA_GCMD_SIRTP, iommu->reg + DMAR_GCMD_REG); |
| 489 | |
| 490 | IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG, |
| 491 | readl, (sts & DMA_GSTS_IRTPS), sts); |
| 492 | raw_spin_unlock_irqrestore(&iommu->register_lock, flags); |
| 493 | |
| 494 | /* |
| 495 | * Global invalidation of interrupt entry cache to make sure the |
| 496 | * hardware uses the new irq remapping table. |
| 497 | */ |
| 498 | qi_global_iec(iommu); |
| 499 | } |
| 500 | |
| 501 | static void iommu_enable_irq_remapping(struct intel_iommu *iommu) |
| 502 | { |
| 503 | unsigned long flags; |
| 504 | u32 sts; |
| 505 | |
| 506 | raw_spin_lock_irqsave(&iommu->register_lock, flags); |
| 507 | |
| 508 | /* Enable interrupt-remapping */ |
| 509 | iommu->gcmd |= DMA_GCMD_IRE; |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 510 | writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 511 | IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG, |
| 512 | readl, (sts & DMA_GSTS_IRES), sts); |
| 513 | |
Olivier Deprez | 0e64123 | 2021-09-23 10:07:05 +0200 | [diff] [blame^] | 514 | /* Block compatibility-format MSIs */ |
| 515 | if (sts & DMA_GSTS_CFIS) { |
| 516 | iommu->gcmd &= ~DMA_GCMD_CFI; |
| 517 | writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG); |
| 518 | IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG, |
| 519 | readl, !(sts & DMA_GSTS_CFIS), sts); |
| 520 | } |
| 521 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 522 | /* |
| 523 | * With CFI clear in the Global Command register, we should be |
| 524 | * protected from dangerous (i.e. compatibility) interrupts |
| 525 | * regardless of x2apic status. Check just to be sure. |
| 526 | */ |
| 527 | if (sts & DMA_GSTS_CFIS) |
| 528 | WARN(1, KERN_WARNING |
| 529 | "Compatibility-format IRQs enabled despite intr remapping;\n" |
| 530 | "you are vulnerable to IRQ injection.\n"); |
| 531 | |
| 532 | raw_spin_unlock_irqrestore(&iommu->register_lock, flags); |
| 533 | } |
| 534 | |
| 535 | static int intel_setup_irq_remapping(struct intel_iommu *iommu) |
| 536 | { |
| 537 | struct ir_table *ir_table; |
| 538 | struct fwnode_handle *fn; |
| 539 | unsigned long *bitmap; |
| 540 | struct page *pages; |
| 541 | |
| 542 | if (iommu->ir_table) |
| 543 | return 0; |
| 544 | |
| 545 | ir_table = kzalloc(sizeof(struct ir_table), GFP_KERNEL); |
| 546 | if (!ir_table) |
| 547 | return -ENOMEM; |
| 548 | |
| 549 | pages = alloc_pages_node(iommu->node, GFP_KERNEL | __GFP_ZERO, |
| 550 | INTR_REMAP_PAGE_ORDER); |
| 551 | if (!pages) { |
| 552 | pr_err("IR%d: failed to allocate pages of order %d\n", |
| 553 | iommu->seq_id, INTR_REMAP_PAGE_ORDER); |
| 554 | goto out_free_table; |
| 555 | } |
| 556 | |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 557 | bitmap = bitmap_zalloc(INTR_REMAP_TABLE_ENTRIES, GFP_ATOMIC); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 558 | if (bitmap == NULL) { |
| 559 | pr_err("IR%d: failed to allocate bitmap\n", iommu->seq_id); |
| 560 | goto out_free_pages; |
| 561 | } |
| 562 | |
| 563 | fn = irq_domain_alloc_named_id_fwnode("INTEL-IR", iommu->seq_id); |
| 564 | if (!fn) |
| 565 | goto out_free_bitmap; |
| 566 | |
| 567 | iommu->ir_domain = |
| 568 | irq_domain_create_hierarchy(arch_get_ir_parent_domain(), |
| 569 | 0, INTR_REMAP_TABLE_ENTRIES, |
| 570 | fn, &intel_ir_domain_ops, |
| 571 | iommu); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 572 | if (!iommu->ir_domain) { |
Olivier Deprez | 0e64123 | 2021-09-23 10:07:05 +0200 | [diff] [blame^] | 573 | irq_domain_free_fwnode(fn); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 574 | pr_err("IR%d: failed to allocate irqdomain\n", iommu->seq_id); |
| 575 | goto out_free_bitmap; |
| 576 | } |
| 577 | iommu->ir_msi_domain = |
| 578 | arch_create_remap_msi_irq_domain(iommu->ir_domain, |
| 579 | "INTEL-IR-MSI", |
| 580 | iommu->seq_id); |
| 581 | |
| 582 | ir_table->base = page_address(pages); |
| 583 | ir_table->bitmap = bitmap; |
| 584 | iommu->ir_table = ir_table; |
| 585 | |
| 586 | /* |
| 587 | * If the queued invalidation is already initialized, |
| 588 | * shouldn't disable it. |
| 589 | */ |
| 590 | if (!iommu->qi) { |
| 591 | /* |
| 592 | * Clear previous faults. |
| 593 | */ |
| 594 | dmar_fault(-1, iommu); |
| 595 | dmar_disable_qi(iommu); |
| 596 | |
| 597 | if (dmar_enable_qi(iommu)) { |
| 598 | pr_err("Failed to enable queued invalidation\n"); |
| 599 | goto out_free_bitmap; |
| 600 | } |
| 601 | } |
| 602 | |
| 603 | init_ir_status(iommu); |
| 604 | |
| 605 | if (ir_pre_enabled(iommu)) { |
| 606 | if (!is_kdump_kernel()) { |
| 607 | pr_warn("IRQ remapping was enabled on %s but we are not in kdump mode\n", |
| 608 | iommu->name); |
| 609 | clear_ir_pre_enabled(iommu); |
| 610 | iommu_disable_irq_remapping(iommu); |
| 611 | } else if (iommu_load_old_irte(iommu)) |
| 612 | pr_err("Failed to copy IR table for %s from previous kernel\n", |
| 613 | iommu->name); |
| 614 | else |
| 615 | pr_info("Copied IR table for %s from previous kernel\n", |
| 616 | iommu->name); |
| 617 | } |
| 618 | |
| 619 | iommu_set_irq_remapping(iommu, eim_mode); |
| 620 | |
| 621 | return 0; |
| 622 | |
| 623 | out_free_bitmap: |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 624 | bitmap_free(bitmap); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 625 | out_free_pages: |
| 626 | __free_pages(pages, INTR_REMAP_PAGE_ORDER); |
| 627 | out_free_table: |
| 628 | kfree(ir_table); |
| 629 | |
| 630 | iommu->ir_table = NULL; |
| 631 | |
| 632 | return -ENOMEM; |
| 633 | } |
| 634 | |
| 635 | static void intel_teardown_irq_remapping(struct intel_iommu *iommu) |
| 636 | { |
Olivier Deprez | 0e64123 | 2021-09-23 10:07:05 +0200 | [diff] [blame^] | 637 | struct fwnode_handle *fn; |
| 638 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 639 | if (iommu && iommu->ir_table) { |
| 640 | if (iommu->ir_msi_domain) { |
Olivier Deprez | 0e64123 | 2021-09-23 10:07:05 +0200 | [diff] [blame^] | 641 | fn = iommu->ir_msi_domain->fwnode; |
| 642 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 643 | irq_domain_remove(iommu->ir_msi_domain); |
Olivier Deprez | 0e64123 | 2021-09-23 10:07:05 +0200 | [diff] [blame^] | 644 | irq_domain_free_fwnode(fn); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 645 | iommu->ir_msi_domain = NULL; |
| 646 | } |
| 647 | if (iommu->ir_domain) { |
Olivier Deprez | 0e64123 | 2021-09-23 10:07:05 +0200 | [diff] [blame^] | 648 | fn = iommu->ir_domain->fwnode; |
| 649 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 650 | irq_domain_remove(iommu->ir_domain); |
Olivier Deprez | 0e64123 | 2021-09-23 10:07:05 +0200 | [diff] [blame^] | 651 | irq_domain_free_fwnode(fn); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 652 | iommu->ir_domain = NULL; |
| 653 | } |
| 654 | free_pages((unsigned long)iommu->ir_table->base, |
| 655 | INTR_REMAP_PAGE_ORDER); |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 656 | bitmap_free(iommu->ir_table->bitmap); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 657 | kfree(iommu->ir_table); |
| 658 | iommu->ir_table = NULL; |
| 659 | } |
| 660 | } |
| 661 | |
| 662 | /* |
| 663 | * Disable Interrupt Remapping. |
| 664 | */ |
| 665 | static void iommu_disable_irq_remapping(struct intel_iommu *iommu) |
| 666 | { |
| 667 | unsigned long flags; |
| 668 | u32 sts; |
| 669 | |
| 670 | if (!ecap_ir_support(iommu->ecap)) |
| 671 | return; |
| 672 | |
| 673 | /* |
| 674 | * global invalidation of interrupt entry cache before disabling |
| 675 | * interrupt-remapping. |
| 676 | */ |
| 677 | qi_global_iec(iommu); |
| 678 | |
| 679 | raw_spin_lock_irqsave(&iommu->register_lock, flags); |
| 680 | |
| 681 | sts = readl(iommu->reg + DMAR_GSTS_REG); |
| 682 | if (!(sts & DMA_GSTS_IRES)) |
| 683 | goto end; |
| 684 | |
| 685 | iommu->gcmd &= ~DMA_GCMD_IRE; |
| 686 | writel(iommu->gcmd, iommu->reg + DMAR_GCMD_REG); |
| 687 | |
| 688 | IOMMU_WAIT_OP(iommu, DMAR_GSTS_REG, |
| 689 | readl, !(sts & DMA_GSTS_IRES), sts); |
| 690 | |
| 691 | end: |
| 692 | raw_spin_unlock_irqrestore(&iommu->register_lock, flags); |
| 693 | } |
| 694 | |
| 695 | static int __init dmar_x2apic_optout(void) |
| 696 | { |
| 697 | struct acpi_table_dmar *dmar; |
| 698 | dmar = (struct acpi_table_dmar *)dmar_tbl; |
| 699 | if (!dmar || no_x2apic_optout) |
| 700 | return 0; |
| 701 | return dmar->flags & DMAR_X2APIC_OPT_OUT; |
| 702 | } |
| 703 | |
| 704 | static void __init intel_cleanup_irq_remapping(void) |
| 705 | { |
| 706 | struct dmar_drhd_unit *drhd; |
| 707 | struct intel_iommu *iommu; |
| 708 | |
| 709 | for_each_iommu(iommu, drhd) { |
| 710 | if (ecap_ir_support(iommu->ecap)) { |
| 711 | iommu_disable_irq_remapping(iommu); |
| 712 | intel_teardown_irq_remapping(iommu); |
| 713 | } |
| 714 | } |
| 715 | |
| 716 | if (x2apic_supported()) |
| 717 | pr_warn("Failed to enable irq remapping. You are vulnerable to irq-injection attacks.\n"); |
| 718 | } |
| 719 | |
| 720 | static int __init intel_prepare_irq_remapping(void) |
| 721 | { |
| 722 | struct dmar_drhd_unit *drhd; |
| 723 | struct intel_iommu *iommu; |
| 724 | int eim = 0; |
| 725 | |
| 726 | if (irq_remap_broken) { |
| 727 | pr_warn("This system BIOS has enabled interrupt remapping\n" |
| 728 | "on a chipset that contains an erratum making that\n" |
| 729 | "feature unstable. To maintain system stability\n" |
| 730 | "interrupt remapping is being disabled. Please\n" |
| 731 | "contact your BIOS vendor for an update\n"); |
| 732 | add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK); |
| 733 | return -ENODEV; |
| 734 | } |
| 735 | |
| 736 | if (dmar_table_init() < 0) |
| 737 | return -ENODEV; |
| 738 | |
| 739 | if (!dmar_ir_support()) |
| 740 | return -ENODEV; |
| 741 | |
| 742 | if (parse_ioapics_under_ir()) { |
| 743 | pr_info("Not enabling interrupt remapping\n"); |
| 744 | goto error; |
| 745 | } |
| 746 | |
| 747 | /* First make sure all IOMMUs support IRQ remapping */ |
| 748 | for_each_iommu(iommu, drhd) |
| 749 | if (!ecap_ir_support(iommu->ecap)) |
| 750 | goto error; |
| 751 | |
| 752 | /* Detect remapping mode: lapic or x2apic */ |
| 753 | if (x2apic_supported()) { |
| 754 | eim = !dmar_x2apic_optout(); |
| 755 | if (!eim) { |
| 756 | pr_info("x2apic is disabled because BIOS sets x2apic opt out bit."); |
| 757 | pr_info("Use 'intremap=no_x2apic_optout' to override the BIOS setting.\n"); |
| 758 | } |
| 759 | } |
| 760 | |
| 761 | for_each_iommu(iommu, drhd) { |
| 762 | if (eim && !ecap_eim_support(iommu->ecap)) { |
| 763 | pr_info("%s does not support EIM\n", iommu->name); |
| 764 | eim = 0; |
| 765 | } |
| 766 | } |
| 767 | |
| 768 | eim_mode = eim; |
| 769 | if (eim) |
| 770 | pr_info("Queued invalidation will be enabled to support x2apic and Intr-remapping.\n"); |
| 771 | |
| 772 | /* Do the initializations early */ |
| 773 | for_each_iommu(iommu, drhd) { |
| 774 | if (intel_setup_irq_remapping(iommu)) { |
| 775 | pr_err("Failed to setup irq remapping for %s\n", |
| 776 | iommu->name); |
| 777 | goto error; |
| 778 | } |
| 779 | } |
| 780 | |
| 781 | return 0; |
| 782 | |
| 783 | error: |
| 784 | intel_cleanup_irq_remapping(); |
| 785 | return -ENODEV; |
| 786 | } |
| 787 | |
| 788 | /* |
| 789 | * Set Posted-Interrupts capability. |
| 790 | */ |
| 791 | static inline void set_irq_posting_cap(void) |
| 792 | { |
| 793 | struct dmar_drhd_unit *drhd; |
| 794 | struct intel_iommu *iommu; |
| 795 | |
| 796 | if (!disable_irq_post) { |
| 797 | /* |
| 798 | * If IRTE is in posted format, the 'pda' field goes across the |
| 799 | * 64-bit boundary, we need use cmpxchg16b to atomically update |
| 800 | * it. We only expose posted-interrupt when X86_FEATURE_CX16 |
| 801 | * is supported. Actually, hardware platforms supporting PI |
| 802 | * should have X86_FEATURE_CX16 support, this has been confirmed |
| 803 | * with Intel hardware guys. |
| 804 | */ |
| 805 | if (boot_cpu_has(X86_FEATURE_CX16)) |
| 806 | intel_irq_remap_ops.capability |= 1 << IRQ_POSTING_CAP; |
| 807 | |
| 808 | for_each_iommu(iommu, drhd) |
| 809 | if (!cap_pi_support(iommu->cap)) { |
| 810 | intel_irq_remap_ops.capability &= |
| 811 | ~(1 << IRQ_POSTING_CAP); |
| 812 | break; |
| 813 | } |
| 814 | } |
| 815 | } |
| 816 | |
| 817 | static int __init intel_enable_irq_remapping(void) |
| 818 | { |
| 819 | struct dmar_drhd_unit *drhd; |
| 820 | struct intel_iommu *iommu; |
| 821 | bool setup = false; |
| 822 | |
| 823 | /* |
| 824 | * Setup Interrupt-remapping for all the DRHD's now. |
| 825 | */ |
| 826 | for_each_iommu(iommu, drhd) { |
| 827 | if (!ir_pre_enabled(iommu)) |
| 828 | iommu_enable_irq_remapping(iommu); |
| 829 | setup = true; |
| 830 | } |
| 831 | |
| 832 | if (!setup) |
| 833 | goto error; |
| 834 | |
| 835 | irq_remapping_enabled = 1; |
| 836 | |
| 837 | set_irq_posting_cap(); |
| 838 | |
| 839 | pr_info("Enabled IRQ remapping in %s mode\n", eim_mode ? "x2apic" : "xapic"); |
| 840 | |
| 841 | return eim_mode ? IRQ_REMAP_X2APIC_MODE : IRQ_REMAP_XAPIC_MODE; |
| 842 | |
| 843 | error: |
| 844 | intel_cleanup_irq_remapping(); |
| 845 | return -1; |
| 846 | } |
| 847 | |
| 848 | static int ir_parse_one_hpet_scope(struct acpi_dmar_device_scope *scope, |
| 849 | struct intel_iommu *iommu, |
| 850 | struct acpi_dmar_hardware_unit *drhd) |
| 851 | { |
| 852 | struct acpi_dmar_pci_path *path; |
| 853 | u8 bus; |
| 854 | int count, free = -1; |
| 855 | |
| 856 | bus = scope->bus; |
| 857 | path = (struct acpi_dmar_pci_path *)(scope + 1); |
| 858 | count = (scope->length - sizeof(struct acpi_dmar_device_scope)) |
| 859 | / sizeof(struct acpi_dmar_pci_path); |
| 860 | |
| 861 | while (--count > 0) { |
| 862 | /* |
| 863 | * Access PCI directly due to the PCI |
| 864 | * subsystem isn't initialized yet. |
| 865 | */ |
| 866 | bus = read_pci_config_byte(bus, path->device, path->function, |
| 867 | PCI_SECONDARY_BUS); |
| 868 | path++; |
| 869 | } |
| 870 | |
| 871 | for (count = 0; count < MAX_HPET_TBS; count++) { |
| 872 | if (ir_hpet[count].iommu == iommu && |
| 873 | ir_hpet[count].id == scope->enumeration_id) |
| 874 | return 0; |
| 875 | else if (ir_hpet[count].iommu == NULL && free == -1) |
| 876 | free = count; |
| 877 | } |
| 878 | if (free == -1) { |
| 879 | pr_warn("Exceeded Max HPET blocks\n"); |
| 880 | return -ENOSPC; |
| 881 | } |
| 882 | |
| 883 | ir_hpet[free].iommu = iommu; |
| 884 | ir_hpet[free].id = scope->enumeration_id; |
| 885 | ir_hpet[free].bus = bus; |
| 886 | ir_hpet[free].devfn = PCI_DEVFN(path->device, path->function); |
| 887 | pr_info("HPET id %d under DRHD base 0x%Lx\n", |
| 888 | scope->enumeration_id, drhd->address); |
| 889 | |
| 890 | return 0; |
| 891 | } |
| 892 | |
| 893 | static int ir_parse_one_ioapic_scope(struct acpi_dmar_device_scope *scope, |
| 894 | struct intel_iommu *iommu, |
| 895 | struct acpi_dmar_hardware_unit *drhd) |
| 896 | { |
| 897 | struct acpi_dmar_pci_path *path; |
| 898 | u8 bus; |
| 899 | int count, free = -1; |
| 900 | |
| 901 | bus = scope->bus; |
| 902 | path = (struct acpi_dmar_pci_path *)(scope + 1); |
| 903 | count = (scope->length - sizeof(struct acpi_dmar_device_scope)) |
| 904 | / sizeof(struct acpi_dmar_pci_path); |
| 905 | |
| 906 | while (--count > 0) { |
| 907 | /* |
| 908 | * Access PCI directly due to the PCI |
| 909 | * subsystem isn't initialized yet. |
| 910 | */ |
| 911 | bus = read_pci_config_byte(bus, path->device, path->function, |
| 912 | PCI_SECONDARY_BUS); |
| 913 | path++; |
| 914 | } |
| 915 | |
| 916 | for (count = 0; count < MAX_IO_APICS; count++) { |
| 917 | if (ir_ioapic[count].iommu == iommu && |
| 918 | ir_ioapic[count].id == scope->enumeration_id) |
| 919 | return 0; |
| 920 | else if (ir_ioapic[count].iommu == NULL && free == -1) |
| 921 | free = count; |
| 922 | } |
| 923 | if (free == -1) { |
| 924 | pr_warn("Exceeded Max IO APICS\n"); |
| 925 | return -ENOSPC; |
| 926 | } |
| 927 | |
| 928 | ir_ioapic[free].bus = bus; |
| 929 | ir_ioapic[free].devfn = PCI_DEVFN(path->device, path->function); |
| 930 | ir_ioapic[free].iommu = iommu; |
| 931 | ir_ioapic[free].id = scope->enumeration_id; |
| 932 | pr_info("IOAPIC id %d under DRHD base 0x%Lx IOMMU %d\n", |
| 933 | scope->enumeration_id, drhd->address, iommu->seq_id); |
| 934 | |
| 935 | return 0; |
| 936 | } |
| 937 | |
| 938 | static int ir_parse_ioapic_hpet_scope(struct acpi_dmar_header *header, |
| 939 | struct intel_iommu *iommu) |
| 940 | { |
| 941 | int ret = 0; |
| 942 | struct acpi_dmar_hardware_unit *drhd; |
| 943 | struct acpi_dmar_device_scope *scope; |
| 944 | void *start, *end; |
| 945 | |
| 946 | drhd = (struct acpi_dmar_hardware_unit *)header; |
| 947 | start = (void *)(drhd + 1); |
| 948 | end = ((void *)drhd) + header->length; |
| 949 | |
| 950 | while (start < end && ret == 0) { |
| 951 | scope = start; |
| 952 | if (scope->entry_type == ACPI_DMAR_SCOPE_TYPE_IOAPIC) |
| 953 | ret = ir_parse_one_ioapic_scope(scope, iommu, drhd); |
| 954 | else if (scope->entry_type == ACPI_DMAR_SCOPE_TYPE_HPET) |
| 955 | ret = ir_parse_one_hpet_scope(scope, iommu, drhd); |
| 956 | start += scope->length; |
| 957 | } |
| 958 | |
| 959 | return ret; |
| 960 | } |
| 961 | |
| 962 | static void ir_remove_ioapic_hpet_scope(struct intel_iommu *iommu) |
| 963 | { |
| 964 | int i; |
| 965 | |
| 966 | for (i = 0; i < MAX_HPET_TBS; i++) |
| 967 | if (ir_hpet[i].iommu == iommu) |
| 968 | ir_hpet[i].iommu = NULL; |
| 969 | |
| 970 | for (i = 0; i < MAX_IO_APICS; i++) |
| 971 | if (ir_ioapic[i].iommu == iommu) |
| 972 | ir_ioapic[i].iommu = NULL; |
| 973 | } |
| 974 | |
| 975 | /* |
| 976 | * Finds the assocaition between IOAPIC's and its Interrupt-remapping |
| 977 | * hardware unit. |
| 978 | */ |
| 979 | static int __init parse_ioapics_under_ir(void) |
| 980 | { |
| 981 | struct dmar_drhd_unit *drhd; |
| 982 | struct intel_iommu *iommu; |
| 983 | bool ir_supported = false; |
| 984 | int ioapic_idx; |
| 985 | |
| 986 | for_each_iommu(iommu, drhd) { |
| 987 | int ret; |
| 988 | |
| 989 | if (!ecap_ir_support(iommu->ecap)) |
| 990 | continue; |
| 991 | |
| 992 | ret = ir_parse_ioapic_hpet_scope(drhd->hdr, iommu); |
| 993 | if (ret) |
| 994 | return ret; |
| 995 | |
| 996 | ir_supported = true; |
| 997 | } |
| 998 | |
| 999 | if (!ir_supported) |
| 1000 | return -ENODEV; |
| 1001 | |
| 1002 | for (ioapic_idx = 0; ioapic_idx < nr_ioapics; ioapic_idx++) { |
| 1003 | int ioapic_id = mpc_ioapic_id(ioapic_idx); |
| 1004 | if (!map_ioapic_to_ir(ioapic_id)) { |
| 1005 | pr_err(FW_BUG "ioapic %d has no mapping iommu, " |
| 1006 | "interrupt remapping will be disabled\n", |
| 1007 | ioapic_id); |
| 1008 | return -1; |
| 1009 | } |
| 1010 | } |
| 1011 | |
| 1012 | return 0; |
| 1013 | } |
| 1014 | |
| 1015 | static int __init ir_dev_scope_init(void) |
| 1016 | { |
| 1017 | int ret; |
| 1018 | |
| 1019 | if (!irq_remapping_enabled) |
| 1020 | return 0; |
| 1021 | |
| 1022 | down_write(&dmar_global_lock); |
| 1023 | ret = dmar_dev_scope_init(); |
| 1024 | up_write(&dmar_global_lock); |
| 1025 | |
| 1026 | return ret; |
| 1027 | } |
| 1028 | rootfs_initcall(ir_dev_scope_init); |
| 1029 | |
| 1030 | static void disable_irq_remapping(void) |
| 1031 | { |
| 1032 | struct dmar_drhd_unit *drhd; |
| 1033 | struct intel_iommu *iommu = NULL; |
| 1034 | |
| 1035 | /* |
| 1036 | * Disable Interrupt-remapping for all the DRHD's now. |
| 1037 | */ |
| 1038 | for_each_iommu(iommu, drhd) { |
| 1039 | if (!ecap_ir_support(iommu->ecap)) |
| 1040 | continue; |
| 1041 | |
| 1042 | iommu_disable_irq_remapping(iommu); |
| 1043 | } |
| 1044 | |
| 1045 | /* |
| 1046 | * Clear Posted-Interrupts capability. |
| 1047 | */ |
| 1048 | if (!disable_irq_post) |
| 1049 | intel_irq_remap_ops.capability &= ~(1 << IRQ_POSTING_CAP); |
| 1050 | } |
| 1051 | |
| 1052 | static int reenable_irq_remapping(int eim) |
| 1053 | { |
| 1054 | struct dmar_drhd_unit *drhd; |
| 1055 | bool setup = false; |
| 1056 | struct intel_iommu *iommu = NULL; |
| 1057 | |
| 1058 | for_each_iommu(iommu, drhd) |
| 1059 | if (iommu->qi) |
| 1060 | dmar_reenable_qi(iommu); |
| 1061 | |
| 1062 | /* |
| 1063 | * Setup Interrupt-remapping for all the DRHD's now. |
| 1064 | */ |
| 1065 | for_each_iommu(iommu, drhd) { |
| 1066 | if (!ecap_ir_support(iommu->ecap)) |
| 1067 | continue; |
| 1068 | |
| 1069 | /* Set up interrupt remapping for iommu.*/ |
| 1070 | iommu_set_irq_remapping(iommu, eim); |
| 1071 | iommu_enable_irq_remapping(iommu); |
| 1072 | setup = true; |
| 1073 | } |
| 1074 | |
| 1075 | if (!setup) |
| 1076 | goto error; |
| 1077 | |
| 1078 | set_irq_posting_cap(); |
| 1079 | |
| 1080 | return 0; |
| 1081 | |
| 1082 | error: |
| 1083 | /* |
| 1084 | * handle error condition gracefully here! |
| 1085 | */ |
| 1086 | return -1; |
| 1087 | } |
| 1088 | |
| 1089 | static void prepare_irte(struct irte *irte, int vector, unsigned int dest) |
| 1090 | { |
| 1091 | memset(irte, 0, sizeof(*irte)); |
| 1092 | |
| 1093 | irte->present = 1; |
| 1094 | irte->dst_mode = apic->irq_dest_mode; |
| 1095 | /* |
| 1096 | * Trigger mode in the IRTE will always be edge, and for IO-APIC, the |
| 1097 | * actual level or edge trigger will be setup in the IO-APIC |
| 1098 | * RTE. This will help simplify level triggered irq migration. |
| 1099 | * For more details, see the comments (in io_apic.c) explainig IO-APIC |
| 1100 | * irq migration in the presence of interrupt-remapping. |
| 1101 | */ |
| 1102 | irte->trigger_mode = 0; |
| 1103 | irte->dlvry_mode = apic->irq_delivery_mode; |
| 1104 | irte->vector = vector; |
| 1105 | irte->dest_id = IRTE_DEST(dest); |
| 1106 | irte->redir_hint = 1; |
| 1107 | } |
| 1108 | |
| 1109 | static struct irq_domain *intel_get_ir_irq_domain(struct irq_alloc_info *info) |
| 1110 | { |
| 1111 | struct intel_iommu *iommu = NULL; |
| 1112 | |
| 1113 | if (!info) |
| 1114 | return NULL; |
| 1115 | |
| 1116 | switch (info->type) { |
| 1117 | case X86_IRQ_ALLOC_TYPE_IOAPIC: |
| 1118 | iommu = map_ioapic_to_ir(info->ioapic_id); |
| 1119 | break; |
| 1120 | case X86_IRQ_ALLOC_TYPE_HPET: |
| 1121 | iommu = map_hpet_to_ir(info->hpet_id); |
| 1122 | break; |
| 1123 | case X86_IRQ_ALLOC_TYPE_MSI: |
| 1124 | case X86_IRQ_ALLOC_TYPE_MSIX: |
| 1125 | iommu = map_dev_to_ir(info->msi_dev); |
| 1126 | break; |
| 1127 | default: |
| 1128 | BUG_ON(1); |
| 1129 | break; |
| 1130 | } |
| 1131 | |
| 1132 | return iommu ? iommu->ir_domain : NULL; |
| 1133 | } |
| 1134 | |
| 1135 | static struct irq_domain *intel_get_irq_domain(struct irq_alloc_info *info) |
| 1136 | { |
| 1137 | struct intel_iommu *iommu; |
| 1138 | |
| 1139 | if (!info) |
| 1140 | return NULL; |
| 1141 | |
| 1142 | switch (info->type) { |
| 1143 | case X86_IRQ_ALLOC_TYPE_MSI: |
| 1144 | case X86_IRQ_ALLOC_TYPE_MSIX: |
| 1145 | iommu = map_dev_to_ir(info->msi_dev); |
| 1146 | if (iommu) |
| 1147 | return iommu->ir_msi_domain; |
| 1148 | break; |
| 1149 | default: |
| 1150 | break; |
| 1151 | } |
| 1152 | |
| 1153 | return NULL; |
| 1154 | } |
| 1155 | |
| 1156 | struct irq_remap_ops intel_irq_remap_ops = { |
| 1157 | .prepare = intel_prepare_irq_remapping, |
| 1158 | .enable = intel_enable_irq_remapping, |
| 1159 | .disable = disable_irq_remapping, |
| 1160 | .reenable = reenable_irq_remapping, |
| 1161 | .enable_faulting = enable_drhd_fault_handling, |
| 1162 | .get_ir_irq_domain = intel_get_ir_irq_domain, |
| 1163 | .get_irq_domain = intel_get_irq_domain, |
| 1164 | }; |
| 1165 | |
| 1166 | static void intel_ir_reconfigure_irte(struct irq_data *irqd, bool force) |
| 1167 | { |
| 1168 | struct intel_ir_data *ir_data = irqd->chip_data; |
| 1169 | struct irte *irte = &ir_data->irte_entry; |
| 1170 | struct irq_cfg *cfg = irqd_cfg(irqd); |
| 1171 | |
| 1172 | /* |
| 1173 | * Atomically updates the IRTE with the new destination, vector |
| 1174 | * and flushes the interrupt entry cache. |
| 1175 | */ |
| 1176 | irte->vector = cfg->vector; |
| 1177 | irte->dest_id = IRTE_DEST(cfg->dest_apicid); |
| 1178 | |
| 1179 | /* Update the hardware only if the interrupt is in remapped mode. */ |
| 1180 | if (force || ir_data->irq_2_iommu.mode == IRQ_REMAPPING) |
| 1181 | modify_irte(&ir_data->irq_2_iommu, irte); |
| 1182 | } |
| 1183 | |
| 1184 | /* |
| 1185 | * Migrate the IO-APIC irq in the presence of intr-remapping. |
| 1186 | * |
| 1187 | * For both level and edge triggered, irq migration is a simple atomic |
| 1188 | * update(of vector and cpu destination) of IRTE and flush the hardware cache. |
| 1189 | * |
| 1190 | * For level triggered, we eliminate the io-apic RTE modification (with the |
| 1191 | * updated vector information), by using a virtual vector (io-apic pin number). |
| 1192 | * Real vector that is used for interrupting cpu will be coming from |
| 1193 | * the interrupt-remapping table entry. |
| 1194 | * |
| 1195 | * As the migration is a simple atomic update of IRTE, the same mechanism |
| 1196 | * is used to migrate MSI irq's in the presence of interrupt-remapping. |
| 1197 | */ |
| 1198 | static int |
| 1199 | intel_ir_set_affinity(struct irq_data *data, const struct cpumask *mask, |
| 1200 | bool force) |
| 1201 | { |
| 1202 | struct irq_data *parent = data->parent_data; |
| 1203 | struct irq_cfg *cfg = irqd_cfg(data); |
| 1204 | int ret; |
| 1205 | |
| 1206 | ret = parent->chip->irq_set_affinity(parent, mask, force); |
| 1207 | if (ret < 0 || ret == IRQ_SET_MASK_OK_DONE) |
| 1208 | return ret; |
| 1209 | |
| 1210 | intel_ir_reconfigure_irte(data, false); |
| 1211 | /* |
| 1212 | * After this point, all the interrupts will start arriving |
| 1213 | * at the new destination. So, time to cleanup the previous |
| 1214 | * vector allocation. |
| 1215 | */ |
| 1216 | send_cleanup_vector(cfg); |
| 1217 | |
| 1218 | return IRQ_SET_MASK_OK_DONE; |
| 1219 | } |
| 1220 | |
| 1221 | static void intel_ir_compose_msi_msg(struct irq_data *irq_data, |
| 1222 | struct msi_msg *msg) |
| 1223 | { |
| 1224 | struct intel_ir_data *ir_data = irq_data->chip_data; |
| 1225 | |
| 1226 | *msg = ir_data->msi_entry; |
| 1227 | } |
| 1228 | |
| 1229 | static int intel_ir_set_vcpu_affinity(struct irq_data *data, void *info) |
| 1230 | { |
| 1231 | struct intel_ir_data *ir_data = data->chip_data; |
| 1232 | struct vcpu_data *vcpu_pi_info = info; |
| 1233 | |
| 1234 | /* stop posting interrupts, back to remapping mode */ |
| 1235 | if (!vcpu_pi_info) { |
| 1236 | modify_irte(&ir_data->irq_2_iommu, &ir_data->irte_entry); |
| 1237 | } else { |
| 1238 | struct irte irte_pi; |
| 1239 | |
| 1240 | /* |
| 1241 | * We are not caching the posted interrupt entry. We |
| 1242 | * copy the data from the remapped entry and modify |
| 1243 | * the fields which are relevant for posted mode. The |
| 1244 | * cached remapped entry is used for switching back to |
| 1245 | * remapped mode. |
| 1246 | */ |
| 1247 | memset(&irte_pi, 0, sizeof(irte_pi)); |
| 1248 | dmar_copy_shared_irte(&irte_pi, &ir_data->irte_entry); |
| 1249 | |
| 1250 | /* Update the posted mode fields */ |
| 1251 | irte_pi.p_pst = 1; |
| 1252 | irte_pi.p_urgent = 0; |
| 1253 | irte_pi.p_vector = vcpu_pi_info->vector; |
| 1254 | irte_pi.pda_l = (vcpu_pi_info->pi_desc_addr >> |
| 1255 | (32 - PDA_LOW_BIT)) & ~(-1UL << PDA_LOW_BIT); |
| 1256 | irte_pi.pda_h = (vcpu_pi_info->pi_desc_addr >> 32) & |
| 1257 | ~(-1UL << PDA_HIGH_BIT); |
| 1258 | |
| 1259 | modify_irte(&ir_data->irq_2_iommu, &irte_pi); |
| 1260 | } |
| 1261 | |
| 1262 | return 0; |
| 1263 | } |
| 1264 | |
| 1265 | static struct irq_chip intel_ir_chip = { |
| 1266 | .name = "INTEL-IR", |
| 1267 | .irq_ack = apic_ack_irq, |
| 1268 | .irq_set_affinity = intel_ir_set_affinity, |
| 1269 | .irq_compose_msi_msg = intel_ir_compose_msi_msg, |
| 1270 | .irq_set_vcpu_affinity = intel_ir_set_vcpu_affinity, |
| 1271 | }; |
| 1272 | |
| 1273 | static void intel_irq_remapping_prepare_irte(struct intel_ir_data *data, |
| 1274 | struct irq_cfg *irq_cfg, |
| 1275 | struct irq_alloc_info *info, |
| 1276 | int index, int sub_handle) |
| 1277 | { |
| 1278 | struct IR_IO_APIC_route_entry *entry; |
| 1279 | struct irte *irte = &data->irte_entry; |
| 1280 | struct msi_msg *msg = &data->msi_entry; |
| 1281 | |
| 1282 | prepare_irte(irte, irq_cfg->vector, irq_cfg->dest_apicid); |
| 1283 | switch (info->type) { |
| 1284 | case X86_IRQ_ALLOC_TYPE_IOAPIC: |
| 1285 | /* Set source-id of interrupt request */ |
| 1286 | set_ioapic_sid(irte, info->ioapic_id); |
| 1287 | apic_printk(APIC_VERBOSE, KERN_DEBUG "IOAPIC[%d]: Set IRTE entry (P:%d FPD:%d Dst_Mode:%d Redir_hint:%d Trig_Mode:%d Dlvry_Mode:%X Avail:%X Vector:%02X Dest:%08X SID:%04X SQ:%X SVT:%X)\n", |
| 1288 | info->ioapic_id, irte->present, irte->fpd, |
| 1289 | irte->dst_mode, irte->redir_hint, |
| 1290 | irte->trigger_mode, irte->dlvry_mode, |
| 1291 | irte->avail, irte->vector, irte->dest_id, |
| 1292 | irte->sid, irte->sq, irte->svt); |
| 1293 | |
| 1294 | entry = (struct IR_IO_APIC_route_entry *)info->ioapic_entry; |
| 1295 | info->ioapic_entry = NULL; |
| 1296 | memset(entry, 0, sizeof(*entry)); |
| 1297 | entry->index2 = (index >> 15) & 0x1; |
| 1298 | entry->zero = 0; |
| 1299 | entry->format = 1; |
| 1300 | entry->index = (index & 0x7fff); |
| 1301 | /* |
| 1302 | * IO-APIC RTE will be configured with virtual vector. |
| 1303 | * irq handler will do the explicit EOI to the io-apic. |
| 1304 | */ |
| 1305 | entry->vector = info->ioapic_pin; |
| 1306 | entry->mask = 0; /* enable IRQ */ |
| 1307 | entry->trigger = info->ioapic_trigger; |
| 1308 | entry->polarity = info->ioapic_polarity; |
| 1309 | if (info->ioapic_trigger) |
| 1310 | entry->mask = 1; /* Mask level triggered irqs. */ |
| 1311 | break; |
| 1312 | |
| 1313 | case X86_IRQ_ALLOC_TYPE_HPET: |
| 1314 | case X86_IRQ_ALLOC_TYPE_MSI: |
| 1315 | case X86_IRQ_ALLOC_TYPE_MSIX: |
| 1316 | if (info->type == X86_IRQ_ALLOC_TYPE_HPET) |
| 1317 | set_hpet_sid(irte, info->hpet_id); |
| 1318 | else |
| 1319 | set_msi_sid(irte, info->msi_dev); |
| 1320 | |
| 1321 | msg->address_hi = MSI_ADDR_BASE_HI; |
| 1322 | msg->data = sub_handle; |
| 1323 | msg->address_lo = MSI_ADDR_BASE_LO | MSI_ADDR_IR_EXT_INT | |
| 1324 | MSI_ADDR_IR_SHV | |
| 1325 | MSI_ADDR_IR_INDEX1(index) | |
| 1326 | MSI_ADDR_IR_INDEX2(index); |
| 1327 | break; |
| 1328 | |
| 1329 | default: |
| 1330 | BUG_ON(1); |
| 1331 | break; |
| 1332 | } |
| 1333 | } |
| 1334 | |
| 1335 | static void intel_free_irq_resources(struct irq_domain *domain, |
| 1336 | unsigned int virq, unsigned int nr_irqs) |
| 1337 | { |
| 1338 | struct irq_data *irq_data; |
| 1339 | struct intel_ir_data *data; |
| 1340 | struct irq_2_iommu *irq_iommu; |
| 1341 | unsigned long flags; |
| 1342 | int i; |
| 1343 | for (i = 0; i < nr_irqs; i++) { |
| 1344 | irq_data = irq_domain_get_irq_data(domain, virq + i); |
| 1345 | if (irq_data && irq_data->chip_data) { |
| 1346 | data = irq_data->chip_data; |
| 1347 | irq_iommu = &data->irq_2_iommu; |
| 1348 | raw_spin_lock_irqsave(&irq_2_ir_lock, flags); |
| 1349 | clear_entries(irq_iommu); |
| 1350 | raw_spin_unlock_irqrestore(&irq_2_ir_lock, flags); |
| 1351 | irq_domain_reset_irq_data(irq_data); |
| 1352 | kfree(data); |
| 1353 | } |
| 1354 | } |
| 1355 | } |
| 1356 | |
| 1357 | static int intel_irq_remapping_alloc(struct irq_domain *domain, |
| 1358 | unsigned int virq, unsigned int nr_irqs, |
| 1359 | void *arg) |
| 1360 | { |
| 1361 | struct intel_iommu *iommu = domain->host_data; |
| 1362 | struct irq_alloc_info *info = arg; |
| 1363 | struct intel_ir_data *data, *ird; |
| 1364 | struct irq_data *irq_data; |
| 1365 | struct irq_cfg *irq_cfg; |
| 1366 | int i, ret, index; |
| 1367 | |
| 1368 | if (!info || !iommu) |
| 1369 | return -EINVAL; |
| 1370 | if (nr_irqs > 1 && info->type != X86_IRQ_ALLOC_TYPE_MSI && |
| 1371 | info->type != X86_IRQ_ALLOC_TYPE_MSIX) |
| 1372 | return -EINVAL; |
| 1373 | |
| 1374 | /* |
| 1375 | * With IRQ remapping enabled, don't need contiguous CPU vectors |
| 1376 | * to support multiple MSI interrupts. |
| 1377 | */ |
| 1378 | if (info->type == X86_IRQ_ALLOC_TYPE_MSI) |
| 1379 | info->flags &= ~X86_IRQ_ALLOC_CONTIGUOUS_VECTORS; |
| 1380 | |
| 1381 | ret = irq_domain_alloc_irqs_parent(domain, virq, nr_irqs, arg); |
| 1382 | if (ret < 0) |
| 1383 | return ret; |
| 1384 | |
| 1385 | ret = -ENOMEM; |
| 1386 | data = kzalloc(sizeof(*data), GFP_KERNEL); |
| 1387 | if (!data) |
| 1388 | goto out_free_parent; |
| 1389 | |
| 1390 | down_read(&dmar_global_lock); |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 1391 | index = alloc_irte(iommu, &data->irq_2_iommu, nr_irqs); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 1392 | up_read(&dmar_global_lock); |
| 1393 | if (index < 0) { |
| 1394 | pr_warn("Failed to allocate IRTE\n"); |
| 1395 | kfree(data); |
| 1396 | goto out_free_parent; |
| 1397 | } |
| 1398 | |
| 1399 | for (i = 0; i < nr_irqs; i++) { |
| 1400 | irq_data = irq_domain_get_irq_data(domain, virq + i); |
| 1401 | irq_cfg = irqd_cfg(irq_data); |
| 1402 | if (!irq_data || !irq_cfg) { |
Olivier Deprez | 0e64123 | 2021-09-23 10:07:05 +0200 | [diff] [blame^] | 1403 | if (!i) |
| 1404 | kfree(data); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 1405 | ret = -EINVAL; |
| 1406 | goto out_free_data; |
| 1407 | } |
| 1408 | |
| 1409 | if (i > 0) { |
| 1410 | ird = kzalloc(sizeof(*ird), GFP_KERNEL); |
| 1411 | if (!ird) |
| 1412 | goto out_free_data; |
| 1413 | /* Initialize the common data */ |
| 1414 | ird->irq_2_iommu = data->irq_2_iommu; |
| 1415 | ird->irq_2_iommu.sub_handle = i; |
| 1416 | } else { |
| 1417 | ird = data; |
| 1418 | } |
| 1419 | |
| 1420 | irq_data->hwirq = (index << 16) + i; |
| 1421 | irq_data->chip_data = ird; |
| 1422 | irq_data->chip = &intel_ir_chip; |
| 1423 | intel_irq_remapping_prepare_irte(ird, irq_cfg, info, index, i); |
| 1424 | irq_set_status_flags(virq + i, IRQ_MOVE_PCNTXT); |
| 1425 | } |
| 1426 | return 0; |
| 1427 | |
| 1428 | out_free_data: |
| 1429 | intel_free_irq_resources(domain, virq, i); |
| 1430 | out_free_parent: |
| 1431 | irq_domain_free_irqs_common(domain, virq, nr_irqs); |
| 1432 | return ret; |
| 1433 | } |
| 1434 | |
| 1435 | static void intel_irq_remapping_free(struct irq_domain *domain, |
| 1436 | unsigned int virq, unsigned int nr_irqs) |
| 1437 | { |
| 1438 | intel_free_irq_resources(domain, virq, nr_irqs); |
| 1439 | irq_domain_free_irqs_common(domain, virq, nr_irqs); |
| 1440 | } |
| 1441 | |
| 1442 | static int intel_irq_remapping_activate(struct irq_domain *domain, |
| 1443 | struct irq_data *irq_data, bool reserve) |
| 1444 | { |
| 1445 | intel_ir_reconfigure_irte(irq_data, true); |
| 1446 | return 0; |
| 1447 | } |
| 1448 | |
| 1449 | static void intel_irq_remapping_deactivate(struct irq_domain *domain, |
| 1450 | struct irq_data *irq_data) |
| 1451 | { |
| 1452 | struct intel_ir_data *data = irq_data->chip_data; |
| 1453 | struct irte entry; |
| 1454 | |
| 1455 | memset(&entry, 0, sizeof(entry)); |
| 1456 | modify_irte(&data->irq_2_iommu, &entry); |
| 1457 | } |
| 1458 | |
| 1459 | static const struct irq_domain_ops intel_ir_domain_ops = { |
| 1460 | .alloc = intel_irq_remapping_alloc, |
| 1461 | .free = intel_irq_remapping_free, |
| 1462 | .activate = intel_irq_remapping_activate, |
| 1463 | .deactivate = intel_irq_remapping_deactivate, |
| 1464 | }; |
| 1465 | |
| 1466 | /* |
| 1467 | * Support of Interrupt Remapping Unit Hotplug |
| 1468 | */ |
| 1469 | static int dmar_ir_add(struct dmar_drhd_unit *dmaru, struct intel_iommu *iommu) |
| 1470 | { |
| 1471 | int ret; |
| 1472 | int eim = x2apic_enabled(); |
| 1473 | |
| 1474 | if (eim && !ecap_eim_support(iommu->ecap)) { |
| 1475 | pr_info("DRHD %Lx: EIM not supported by DRHD, ecap %Lx\n", |
| 1476 | iommu->reg_phys, iommu->ecap); |
| 1477 | return -ENODEV; |
| 1478 | } |
| 1479 | |
| 1480 | if (ir_parse_ioapic_hpet_scope(dmaru->hdr, iommu)) { |
| 1481 | pr_warn("DRHD %Lx: failed to parse managed IOAPIC/HPET\n", |
| 1482 | iommu->reg_phys); |
| 1483 | return -ENODEV; |
| 1484 | } |
| 1485 | |
| 1486 | /* TODO: check all IOAPICs are covered by IOMMU */ |
| 1487 | |
| 1488 | /* Setup Interrupt-remapping now. */ |
| 1489 | ret = intel_setup_irq_remapping(iommu); |
| 1490 | if (ret) { |
| 1491 | pr_err("Failed to setup irq remapping for %s\n", |
| 1492 | iommu->name); |
| 1493 | intel_teardown_irq_remapping(iommu); |
| 1494 | ir_remove_ioapic_hpet_scope(iommu); |
| 1495 | } else { |
| 1496 | iommu_enable_irq_remapping(iommu); |
| 1497 | } |
| 1498 | |
| 1499 | return ret; |
| 1500 | } |
| 1501 | |
| 1502 | int dmar_ir_hotplug(struct dmar_drhd_unit *dmaru, bool insert) |
| 1503 | { |
| 1504 | int ret = 0; |
| 1505 | struct intel_iommu *iommu = dmaru->iommu; |
| 1506 | |
| 1507 | if (!irq_remapping_enabled) |
| 1508 | return 0; |
| 1509 | if (iommu == NULL) |
| 1510 | return -EINVAL; |
| 1511 | if (!ecap_ir_support(iommu->ecap)) |
| 1512 | return 0; |
| 1513 | if (irq_remapping_cap(IRQ_POSTING_CAP) && |
| 1514 | !cap_pi_support(iommu->cap)) |
| 1515 | return -EBUSY; |
| 1516 | |
| 1517 | if (insert) { |
| 1518 | if (!iommu->ir_table) |
| 1519 | ret = dmar_ir_add(dmaru, iommu); |
| 1520 | } else { |
| 1521 | if (iommu->ir_table) { |
| 1522 | if (!bitmap_empty(iommu->ir_table->bitmap, |
| 1523 | INTR_REMAP_TABLE_ENTRIES)) { |
| 1524 | ret = -EBUSY; |
| 1525 | } else { |
| 1526 | iommu_disable_irq_remapping(iommu); |
| 1527 | intel_teardown_irq_remapping(iommu); |
| 1528 | ir_remove_ioapic_hpet_scope(iommu); |
| 1529 | } |
| 1530 | } |
| 1531 | } |
| 1532 | |
| 1533 | return ret; |
| 1534 | } |