irq_remapping.c 8.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366
  1. #include <linux/seq_file.h>
  2. #include <linux/cpumask.h>
  3. #include <linux/kernel.h>
  4. #include <linux/string.h>
  5. #include <linux/errno.h>
  6. #include <linux/msi.h>
  7. #include <linux/irq.h>
  8. #include <linux/pci.h>
  9. #include <asm/hw_irq.h>
  10. #include <asm/irq_remapping.h>
  11. #include <asm/processor.h>
  12. #include <asm/x86_init.h>
  13. #include <asm/apic.h>
  14. #include <asm/hpet.h>
  15. #include "irq_remapping.h"
  /*
   * Tested throughout this file before calling into remap_ops; it is not
   * assigned anywhere in the part of the file visible here.
   */
  int irq_remapping_enabled;

  /* Raised to 1 by set_irq_remapping_broken(). */
  int irq_remap_broken;

  /* Set to 1 by the "nosid" token of the "intremap" early parameter. */
  int disable_sourceid_checking;

  /* Set to 1 by the "no_x2apic_optout" token of the "intremap" early parameter. */
  int no_x2apic_optout;

  /*
   * Set by the "nointremap" early parameter or the "off" token of "intremap",
   * cleared by the "on" token; irq_remapping_prepare() returns -ENOSYS while
   * it is non-zero.
   */
  static int disable_irq_remap;

  /* Backend operations table selected by irq_remapping_prepare(). */
  static struct irq_remap_ops *remap_ops;

  /* Forward declarations of helpers that are defined further down. */
  static int msi_alloc_remapped_irq(struct pci_dev *pdev, int irq, int nvec);

  static int msi_setup_remapped_irq(struct pci_dev *pdev,
                                    unsigned int irq,
                                    int index,
                                    int sub_handle);

  static int set_remapped_irq_affinity(struct irq_data *data,
                                       const struct cpumask *mask,
                                       bool force);
  28. static bool irq_remapped(struct irq_cfg *cfg)
  29. {
  30. return (cfg->remapped == 1);
  31. }
  32. static void irq_remapping_disable_io_apic(void)
  33. {
  34. /*
  35. * With interrupt-remapping, for now we will use virtual wire A
  36. * mode, as virtual wire B is little complex (need to configure
  37. * both IOAPIC RTE as well as interrupt-remapping table entry).
  38. * As this gets called during crash dump, keep this simple for
  39. * now.
  40. */
  41. if (cpu_has_apic || apic_from_smp_config())
  42. disconnect_bsp_APIC(0);
  43. }
  44. static int do_setup_msi_irqs(struct pci_dev *dev, int nvec)
  45. {
  46. int ret, sub_handle, nvec_pow2, index = 0;
  47. unsigned int irq;
  48. struct msi_desc *msidesc;
  49. msidesc = list_entry(dev->msi_list.next, struct msi_desc, list);
  50. irq = irq_alloc_hwirqs(nvec, dev_to_node(&dev->dev));
  51. if (irq == 0)
  52. return -ENOSPC;
  53. nvec_pow2 = __roundup_pow_of_two(nvec);
  54. for (sub_handle = 0; sub_handle < nvec; sub_handle++) {
  55. if (!sub_handle) {
  56. index = msi_alloc_remapped_irq(dev, irq, nvec_pow2);
  57. if (index < 0) {
  58. ret = index;
  59. goto error;
  60. }
  61. } else {
  62. ret = msi_setup_remapped_irq(dev, irq + sub_handle,
  63. index, sub_handle);
  64. if (ret < 0)
  65. goto error;
  66. }
  67. ret = setup_msi_irq(dev, msidesc, irq, sub_handle);
  68. if (ret < 0)
  69. goto error;
  70. }
  71. return 0;
  72. error:
  73. irq_free_hwirqs(irq, nvec);
  74. /*
  75. * Restore altered MSI descriptor fields and prevent just destroyed
  76. * IRQs from tearing down again in default_teardown_msi_irqs()
  77. */
  78. msidesc->irq = 0;
  79. return ret;
  80. }
  81. static int do_setup_msix_irqs(struct pci_dev *dev, int nvec)
  82. {
  83. int node, ret, sub_handle, index = 0;
  84. struct msi_desc *msidesc;
  85. unsigned int irq;
  86. node = dev_to_node(&dev->dev);
  87. sub_handle = 0;
  88. list_for_each_entry(msidesc, &dev->msi_list, list) {
  89. irq = irq_alloc_hwirq(node);
  90. if (irq == 0)
  91. return -1;
  92. if (sub_handle == 0)
  93. ret = index = msi_alloc_remapped_irq(dev, irq, nvec);
  94. else
  95. ret = msi_setup_remapped_irq(dev, irq, index, sub_handle);
  96. if (ret < 0)
  97. goto error;
  98. ret = setup_msi_irq(dev, msidesc, irq, 0);
  99. if (ret < 0)
  100. goto error;
  101. sub_handle += 1;
  102. irq += 1;
  103. }
  104. return 0;
  105. error:
  106. irq_free_hwirq(irq);
  107. return ret;
  108. }
  109. static int irq_remapping_setup_msi_irqs(struct pci_dev *dev,
  110. int nvec, int type)
  111. {
  112. if (type == PCI_CAP_ID_MSI)
  113. return do_setup_msi_irqs(dev, nvec);
  114. else
  115. return do_setup_msix_irqs(dev, nvec);
  116. }
  /*
   * EOI hook installed into x86_io_apic_ops.eoi_ioapic_pin.
   *
   * Under interrupt remapping the RTE carries the pin number as a virtual
   * vector, while the real vector is programmed in the remapping table
   * entry. The IO-APIC EOI is therefore issued with @pin; @vector is not
   * used.
   */
  static void eoi_ioapic_pin_remapped(int apic, int pin, int vector)
  {
      io_apic_eoi(apic, pin);
  }
  127. static void __init irq_remapping_modify_x86_ops(void)
  128. {
  129. x86_io_apic_ops.disable = irq_remapping_disable_io_apic;
  130. x86_io_apic_ops.set_affinity = set_remapped_irq_affinity;
  131. x86_io_apic_ops.setup_entry = setup_ioapic_remapped_entry;
  132. x86_io_apic_ops.eoi_ioapic_pin = eoi_ioapic_pin_remapped;
  133. x86_msi.setup_msi_irqs = irq_remapping_setup_msi_irqs;
  134. x86_msi.setup_hpet_msi = setup_hpet_msi_remapped;
  135. x86_msi.compose_msi_msg = compose_remapped_msi_msg;
  136. }
  137. static __init int setup_nointremap(char *str)
  138. {
  139. disable_irq_remap = 1;
  140. return 0;
  141. }
  142. early_param("nointremap", setup_nointremap);
  143. static __init int setup_irqremap(char *str)
  144. {
  145. if (!str)
  146. return -EINVAL;
  147. while (*str) {
  148. if (!strncmp(str, "on", 2))
  149. disable_irq_remap = 0;
  150. else if (!strncmp(str, "off", 3))
  151. disable_irq_remap = 1;
  152. else if (!strncmp(str, "nosid", 5))
  153. disable_sourceid_checking = 1;
  154. else if (!strncmp(str, "no_x2apic_optout", 16))
  155. no_x2apic_optout = 1;
  156. str += strcspn(str, ",");
  157. while (*str == ',')
  158. str++;
  159. }
  160. return 0;
  161. }
  162. early_param("intremap", setup_irqremap);
  163. void set_irq_remapping_broken(void)
  164. {
  165. irq_remap_broken = 1;
  166. }
  167. int __init irq_remapping_prepare(void)
  168. {
  169. if (disable_irq_remap)
  170. return -ENOSYS;
  171. if (intel_irq_remap_ops.prepare() == 0)
  172. remap_ops = &intel_irq_remap_ops;
  173. else if (IS_ENABLED(CONFIG_AMD_IOMMU) &&
  174. amd_iommu_irq_ops.prepare() == 0)
  175. remap_ops = &amd_iommu_irq_ops;
  176. else
  177. return -ENOSYS;
  178. return 0;
  179. }
  180. int __init irq_remapping_enable(void)
  181. {
  182. int ret;
  183. if (!remap_ops->enable)
  184. return -ENODEV;
  185. ret = remap_ops->enable();
  186. if (irq_remapping_enabled)
  187. irq_remapping_modify_x86_ops();
  188. return ret;
  189. }
  190. void irq_remapping_disable(void)
  191. {
  192. if (irq_remapping_enabled && remap_ops->disable)
  193. remap_ops->disable();
  194. }
  195. int irq_remapping_reenable(int mode)
  196. {
  197. if (irq_remapping_enabled && remap_ops->reenable)
  198. return remap_ops->reenable(mode);
  199. return 0;
  200. }
  201. int __init irq_remap_enable_fault_handling(void)
  202. {
  203. if (!irq_remapping_enabled)
  204. return 0;
  205. if (!remap_ops->enable_faulting)
  206. return -ENODEV;
  207. return remap_ops->enable_faulting();
  208. }
  209. int setup_ioapic_remapped_entry(int irq,
  210. struct IO_APIC_route_entry *entry,
  211. unsigned int destination, int vector,
  212. struct io_apic_irq_attr *attr)
  213. {
  214. if (!remap_ops->setup_ioapic_entry)
  215. return -ENODEV;
  216. return remap_ops->setup_ioapic_entry(irq, entry, destination,
  217. vector, attr);
  218. }
  219. static int set_remapped_irq_affinity(struct irq_data *data,
  220. const struct cpumask *mask, bool force)
  221. {
  222. if (!config_enabled(CONFIG_SMP) || !remap_ops->set_affinity)
  223. return 0;
  224. return remap_ops->set_affinity(data, mask, force);
  225. }
  226. void free_remapped_irq(int irq)
  227. {
  228. struct irq_cfg *cfg = irq_cfg(irq);
  229. if (irq_remapped(cfg) && remap_ops->free_irq)
  230. remap_ops->free_irq(irq);
  231. }
  232. void compose_remapped_msi_msg(struct pci_dev *pdev,
  233. unsigned int irq, unsigned int dest,
  234. struct msi_msg *msg, u8 hpet_id)
  235. {
  236. struct irq_cfg *cfg = irq_cfg(irq);
  237. if (!irq_remapped(cfg))
  238. native_compose_msi_msg(pdev, irq, dest, msg, hpet_id);
  239. else if (remap_ops->compose_msi_msg)
  240. remap_ops->compose_msi_msg(pdev, irq, dest, msg, hpet_id);
  241. }
  242. static int msi_alloc_remapped_irq(struct pci_dev *pdev, int irq, int nvec)
  243. {
  244. if (!remap_ops->msi_alloc_irq)
  245. return -ENODEV;
  246. return remap_ops->msi_alloc_irq(pdev, irq, nvec);
  247. }
  248. static int msi_setup_remapped_irq(struct pci_dev *pdev, unsigned int irq,
  249. int index, int sub_handle)
  250. {
  251. if (!remap_ops->msi_setup_irq)
  252. return -ENODEV;
  253. return remap_ops->msi_setup_irq(pdev, irq, index, sub_handle);
  254. }
  255. int setup_hpet_msi_remapped(unsigned int irq, unsigned int id)
  256. {
  257. int ret;
  258. if (!remap_ops->alloc_hpet_msi)
  259. return -ENODEV;
  260. ret = remap_ops->alloc_hpet_msi(irq, id);
  261. if (ret)
  262. return -EINVAL;
  263. return default_setup_hpet_msi(irq, id);
  264. }
  265. void panic_if_irq_remap(const char *msg)
  266. {
  267. if (irq_remapping_enabled)
  268. panic(msg);
  269. }
  /*
   * irq_ack callback installed by irq_remap_modify_chip_defaults().
   * Only acknowledges at the local APIC; @data is not used.
   */
  static void ir_ack_apic_edge(struct irq_data *data)
  {
      ack_APIC_irq();
  }
  274. static void ir_ack_apic_level(struct irq_data *data)
  275. {
  276. ack_APIC_irq();
  277. eoi_ioapic_irq(data->irq, irqd_cfg(data));
  278. }
  279. static void ir_print_prefix(struct irq_data *data, struct seq_file *p)
  280. {
  281. seq_printf(p, " IR-%s", data->chip->name);
  282. }
  283. void irq_remap_modify_chip_defaults(struct irq_chip *chip)
  284. {
  285. chip->irq_print_chip = ir_print_prefix;
  286. chip->irq_ack = ir_ack_apic_edge;
  287. chip->irq_eoi = ir_ack_apic_level;
  288. chip->irq_set_affinity = x86_io_apic_ops.set_affinity;
  289. }
  290. bool setup_remapped_irq(int irq, struct irq_cfg *cfg, struct irq_chip *chip)
  291. {
  292. if (!irq_remapped(cfg))
  293. return false;
  294. irq_set_status_flags(irq, IRQ_MOVE_PCNTXT);
  295. irq_remap_modify_chip_defaults(chip);
  296. return true;
  297. }