/*
 * Kernel-based Virtual Machine driver for Linux
 *
 * This header defines architecture specific interfaces, x86 version
 *
 * This work is licensed under the terms of the GNU GPL, version 2. See
 * the COPYING file in the top-level directory.
 *
 */

#ifndef _ASM_X86_KVM_HOST_H
#define _ASM_X86_KVM_HOST_H

#include <linux/types.h>
#include <linux/mm.h>
#include <linux/mmu_notifier.h>
#include <linux/tracepoint.h>
#include <linux/cpumask.h>
#include <linux/irq_work.h>

#include <linux/kvm.h>
#include <linux/kvm_para.h>
#include <linux/kvm_types.h>
#include <linux/perf_event.h>
#include <linux/pvclock_gtod.h>
#include <linux/clocksource.h>
#include <linux/irqbypass.h>
#include <linux/hyperv.h>

#include <asm/apic.h>
#include <asm/pvclock-abi.h>
#include <asm/desc.h>
#include <asm/mtrr.h>
#include <asm/msr-index.h>
#include <asm/asm.h>
#include <asm/kvm_page_track.h>

#define KVM_MAX_VCPUS 288
#define KVM_SOFT_MAX_VCPUS 240
#define KVM_MAX_VCPU_ID 1023
#define KVM_USER_MEM_SLOTS 509
/* memory slots that are not exposed to userspace */
#define KVM_PRIVATE_MEM_SLOTS 3
#define KVM_MEM_SLOTS_NUM (KVM_USER_MEM_SLOTS + KVM_PRIVATE_MEM_SLOTS)

#define KVM_HALT_POLL_NS_DEFAULT 200000

#define KVM_IRQCHIP_NUM_PINS KVM_IOAPIC_NUM_PINS

/* x86-specific vcpu->requests bit members */
#define KVM_REQ_MIGRATE_TIMER KVM_ARCH_REQ(0)
#define KVM_REQ_REPORT_TPR_ACCESS KVM_ARCH_REQ(1)
#define KVM_REQ_TRIPLE_FAULT KVM_ARCH_REQ(2)
#define KVM_REQ_MMU_SYNC KVM_ARCH_REQ(3)
#define KVM_REQ_CLOCK_UPDATE KVM_ARCH_REQ(4)
#define KVM_REQ_EVENT KVM_ARCH_REQ(6)
#define KVM_REQ_APF_HALT KVM_ARCH_REQ(7)
#define KVM_REQ_STEAL_UPDATE KVM_ARCH_REQ(8)
#define KVM_REQ_NMI KVM_ARCH_REQ(9)
#define KVM_REQ_PMU KVM_ARCH_REQ(10)
#define KVM_REQ_PMI KVM_ARCH_REQ(11)
#define KVM_REQ_SMI KVM_ARCH_REQ(12)
#define KVM_REQ_MASTERCLOCK_UPDATE KVM_ARCH_REQ(13)
#define KVM_REQ_MCLOCK_INPROGRESS \
        KVM_ARCH_REQ_FLAGS(14, KVM_REQUEST_WAIT | KVM_REQUEST_NO_WAKEUP)
#define KVM_REQ_SCAN_IOAPIC \
        KVM_ARCH_REQ_FLAGS(15, KVM_REQUEST_WAIT | KVM_REQUEST_NO_WAKEUP)
#define KVM_REQ_GLOBAL_CLOCK_UPDATE KVM_ARCH_REQ(16)
#define KVM_REQ_APIC_PAGE_RELOAD \
        KVM_ARCH_REQ_FLAGS(17, KVM_REQUEST_WAIT | KVM_REQUEST_NO_WAKEUP)
#define KVM_REQ_HV_CRASH KVM_ARCH_REQ(18)
#define KVM_REQ_IOAPIC_EOI_EXIT KVM_ARCH_REQ(19)
#define KVM_REQ_HV_RESET KVM_ARCH_REQ(20)
#define KVM_REQ_HV_EXIT KVM_ARCH_REQ(21)
#define KVM_REQ_HV_STIMER KVM_ARCH_REQ(22)

#define CR0_RESERVED_BITS \
        (~(unsigned long)(X86_CR0_PE | X86_CR0_MP | X86_CR0_EM | X86_CR0_TS \
                          | X86_CR0_ET | X86_CR0_NE | X86_CR0_WP | X86_CR0_AM \
                          | X86_CR0_NW | X86_CR0_CD | X86_CR0_PG))

#define CR3_PCID_INVD BIT_64(63)
#define CR4_RESERVED_BITS \
        (~(unsigned long)(X86_CR4_VME | X86_CR4_PVI | X86_CR4_TSD | X86_CR4_DE \
                          | X86_CR4_PSE | X86_CR4_PAE | X86_CR4_MCE \
                          | X86_CR4_PGE | X86_CR4_PCE | X86_CR4_OSFXSR | X86_CR4_PCIDE \
                          | X86_CR4_OSXSAVE | X86_CR4_SMEP | X86_CR4_FSGSBASE \
                          | X86_CR4_OSXMMEXCPT | X86_CR4_LA57 | X86_CR4_VMXE \
                          | X86_CR4_SMAP | X86_CR4_PKE))

#define CR8_RESERVED_BITS (~(unsigned long)X86_CR8_TPR)

#define INVALID_PAGE (~(hpa_t)0)
#define VALID_PAGE(x) ((x) != INVALID_PAGE)

#define UNMAPPED_GVA (~(gpa_t)0)

/* KVM Hugepage definitions for x86 */
#define KVM_NR_PAGE_SIZES 3
#define KVM_HPAGE_GFN_SHIFT(x) (((x) - 1) * 9)
#define KVM_HPAGE_SHIFT(x) (PAGE_SHIFT + KVM_HPAGE_GFN_SHIFT(x))
#define KVM_HPAGE_SIZE(x) (1UL << KVM_HPAGE_SHIFT(x))
#define KVM_HPAGE_MASK(x) (~(KVM_HPAGE_SIZE(x) - 1))
#define KVM_PAGES_PER_HPAGE(x) (KVM_HPAGE_SIZE(x) / PAGE_SIZE)

static inline gfn_t gfn_to_index(gfn_t gfn, gfn_t base_gfn, int level)
{
        /* KVM_HPAGE_GFN_SHIFT(PT_PAGE_TABLE_LEVEL) must be 0. */
        return (gfn >> KVM_HPAGE_GFN_SHIFT(level)) -
                (base_gfn >> KVM_HPAGE_GFN_SHIFT(level));
}
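
/*
 * Worked example (illustrative, not part of the original header): with 4K
 * base pages (PAGE_SHIFT == 12), level 2 describes a 2MB hugepage:
 *
 *      KVM_HPAGE_GFN_SHIFT(2)  == 9
 *      KVM_HPAGE_SHIFT(2)      == 21
 *      KVM_HPAGE_SIZE(2)       == 2MB
 *      KVM_PAGES_PER_HPAGE(2)  == 512
 *
 * gfn_to_index() then yields the index of the hugepage-sized region that
 * contains @gfn, relative to @base_gfn of the memslot; for instance,
 * gfn_to_index(0x805, 0x800, 2) == 0 since both gfns fall in the same
 * 2MB region.
 */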
#define KVM_PERMILLE_MMU_PAGES 20
#define KVM_MIN_ALLOC_MMU_PAGES 64
#define KVM_MMU_HASH_SHIFT 12
#define KVM_NUM_MMU_PAGES (1 << KVM_MMU_HASH_SHIFT)
#define KVM_MIN_FREE_MMU_PAGES 5
#define KVM_REFILL_PAGES 25
#define KVM_MAX_CPUID_ENTRIES 80
#define KVM_NR_FIXED_MTRR_REGION 88
#define KVM_NR_VAR_MTRR 8

#define ASYNC_PF_PER_VCPU 64

enum kvm_reg {
        VCPU_REGS_RAX = 0,
        VCPU_REGS_RCX = 1,
        VCPU_REGS_RDX = 2,
        VCPU_REGS_RBX = 3,
        VCPU_REGS_RSP = 4,
        VCPU_REGS_RBP = 5,
        VCPU_REGS_RSI = 6,
        VCPU_REGS_RDI = 7,
#ifdef CONFIG_X86_64
        VCPU_REGS_R8 = 8,
        VCPU_REGS_R9 = 9,
        VCPU_REGS_R10 = 10,
        VCPU_REGS_R11 = 11,
        VCPU_REGS_R12 = 12,
        VCPU_REGS_R13 = 13,
        VCPU_REGS_R14 = 14,
        VCPU_REGS_R15 = 15,
#endif
        VCPU_REGS_RIP,
        NR_VCPU_REGS
};

enum kvm_reg_ex {
        VCPU_EXREG_PDPTR = NR_VCPU_REGS,
        VCPU_EXREG_CR3,
        VCPU_EXREG_RFLAGS,
        VCPU_EXREG_SEGMENTS,
};

enum {
        VCPU_SREG_ES,
        VCPU_SREG_CS,
        VCPU_SREG_SS,
        VCPU_SREG_DS,
        VCPU_SREG_FS,
        VCPU_SREG_GS,
        VCPU_SREG_TR,
        VCPU_SREG_LDTR,
};

#include <asm/kvm_emulate.h>

#define KVM_NR_MEM_OBJS 40

#define KVM_NR_DB_REGS 4

#define DR6_BD (1 << 13)
#define DR6_BS (1 << 14)
#define DR6_RTM (1 << 16)
#define DR6_FIXED_1 0xfffe0ff0
#define DR6_INIT 0xffff0ff0
#define DR6_VOLATILE 0x0001e00f

#define DR7_BP_EN_MASK 0x000000ff
#define DR7_GE (1 << 9)
#define DR7_GD (1 << 13)
#define DR7_FIXED_1 0x00000400
#define DR7_VOLATILE 0xffff2bff

#define PFERR_PRESENT_BIT 0
#define PFERR_WRITE_BIT 1
#define PFERR_USER_BIT 2
#define PFERR_RSVD_BIT 3
#define PFERR_FETCH_BIT 4
#define PFERR_PK_BIT 5
#define PFERR_GUEST_FINAL_BIT 32
#define PFERR_GUEST_PAGE_BIT 33

#define PFERR_PRESENT_MASK (1U << PFERR_PRESENT_BIT)
#define PFERR_WRITE_MASK (1U << PFERR_WRITE_BIT)
#define PFERR_USER_MASK (1U << PFERR_USER_BIT)
#define PFERR_RSVD_MASK (1U << PFERR_RSVD_BIT)
#define PFERR_FETCH_MASK (1U << PFERR_FETCH_BIT)
#define PFERR_PK_MASK (1U << PFERR_PK_BIT)
#define PFERR_GUEST_FINAL_MASK (1ULL << PFERR_GUEST_FINAL_BIT)
#define PFERR_GUEST_PAGE_MASK (1ULL << PFERR_GUEST_PAGE_BIT)

#define PFERR_NESTED_GUEST_PAGE (PFERR_GUEST_PAGE_MASK | \
                                 PFERR_WRITE_MASK | \
                                 PFERR_PRESENT_MASK)

/*
 * The mask used to denote special SPTEs, which can be either MMIO SPTEs or
 * Access Tracking SPTEs. We use bit 62 instead of bit 63 to avoid conflicting
 * with the SVE bit in EPT PTEs.
 */
#define SPTE_SPECIAL_MASK (1ULL << 62)

/* apic attention bits */
#define KVM_APIC_CHECK_VAPIC 0
/*
 * The following bit is set with PV-EOI, unset on EOI.
 * We detect PV-EOI changes by the guest by comparing
 * this bit with PV-EOI in guest memory.
 * See the implementation in apic_update_pv_eoi.
 */
#define KVM_APIC_PV_EOI_PENDING 1

struct kvm_kernel_irq_routing_entry;

/*
 * We don't want allocation failures within the mmu code, so we preallocate
 * enough memory for a single page fault in a cache.
 */
struct kvm_mmu_memory_cache {
        int nobjs;
        void *objects[KVM_NR_MEM_OBJS];
};
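
/*
 * Consumption sketch (illustrative only; the real helpers live in
 * arch/x86/kvm/mmu.c and differ in detail): the cache is topped up before
 * mmu_lock is taken, so fault handling can pop objects with no risk of an
 * allocation failure. A minimal pop helper would look like:
 *
 *      static void *example_mmu_cache_alloc(struct kvm_mmu_memory_cache *mc)
 *      {
 *              BUG_ON(!mc->nobjs);
 *              return mc->objects[--mc->nobjs];
 *      }
 */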
/*
 * The pages used as guest page tables on the soft mmu are tracked by
 * kvm_memory_slot.arch.gfn_track, which is 16 bits, so the role bits used
 * by an indirect shadow page cannot be more than 15 bits.
 *
 * Currently, we use 14 bits: @level, @cr4_pae, @quadrant, @access,
 * @nxe, @cr0_wp, @smep_andnot_wp and @smap_andnot_wp.
 */
union kvm_mmu_page_role {
        unsigned word;
        struct {
                unsigned level:4;
                unsigned cr4_pae:1;
                unsigned quadrant:2;
                unsigned direct:1;
                unsigned access:3;
                unsigned invalid:1;
                unsigned nxe:1;
                unsigned cr0_wp:1;
                unsigned smep_andnot_wp:1;
                unsigned smap_andnot_wp:1;
                unsigned ad_disabled:1;
                unsigned :7;

                /*
                 * This is left at the top of the word so that
                 * kvm_memslots_for_spte_role can extract it with a
                 * simple shift. While there is room, give it a whole
                 * byte so it is also faster to load it from memory.
                 */
                unsigned smm:8;
        };
};
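
/*
 * Example (illustrative): because the role bits overlay the single @word,
 * shadow-page roles can be compared and hashed with plain integer
 * operations:
 *
 *      static bool example_role_eq(union kvm_mmu_page_role a,
 *                                  union kvm_mmu_page_role b)
 *      {
 *              return a.word == b.word;
 *      }
 *
 * and, as the comment on @smm notes, kvm_memslots_for_spte_role() can
 * extract @smm with a single shift of @word.
 */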
struct kvm_rmap_head {
        unsigned long val;
};

struct kvm_mmu_page {
        struct list_head link;
        struct hlist_node hash_link;

        /*
         * The following two entries are used to key the shadow page in the
         * hash table.
         */
        gfn_t gfn;
        union kvm_mmu_page_role role;

        u64 *spt;
        /* hold the gfn of each spte inside spt */
        gfn_t *gfns;
        bool unsync;
        int root_count; /* Currently serving as active root */
        unsigned int unsync_children;
        struct kvm_rmap_head parent_ptes; /* rmap pointers to parent sptes */

        /* The page is obsolete if mmu_valid_gen != kvm->arch.mmu_valid_gen. */
        unsigned long mmu_valid_gen;

        DECLARE_BITMAP(unsync_child_bitmap, 512);

#ifdef CONFIG_X86_32
        /*
         * Used out of the mmu-lock to avoid reading spte values while an
         * update is in progress; see the comments in __get_spte_lockless().
         */
        int clear_spte_count;
#endif

        /* Number of writes since the last time traversal visited this page. */
        atomic_t write_flooding_count;
};

struct kvm_pio_request {
        unsigned long count;
        int in;
        int port;
        int size;
};

#define PT64_ROOT_MAX_LEVEL 5

struct rsvd_bits_validate {
        u64 rsvd_bits_mask[2][PT64_ROOT_MAX_LEVEL];
        u64 bad_mt_xwr;
};

/*
 * x86 supports 4 paging modes (5-level 64-bit, 4-level 64-bit, 3-level 32-bit,
 * and 2-level 32-bit). The kvm_mmu structure abstracts the details of the
 * current mmu mode.
 */
struct kvm_mmu {
        void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long root);
        unsigned long (*get_cr3)(struct kvm_vcpu *vcpu);
        u64 (*get_pdptr)(struct kvm_vcpu *vcpu, int index);
        int (*page_fault)(struct kvm_vcpu *vcpu, gva_t gva, u32 err,
                          bool prefault);
        void (*inject_page_fault)(struct kvm_vcpu *vcpu,
                                  struct x86_exception *fault);
        gpa_t (*gva_to_gpa)(struct kvm_vcpu *vcpu, gva_t gva, u32 access,
                            struct x86_exception *exception);
        gpa_t (*translate_gpa)(struct kvm_vcpu *vcpu, gpa_t gpa, u32 access,
                               struct x86_exception *exception);
        int (*sync_page)(struct kvm_vcpu *vcpu,
                         struct kvm_mmu_page *sp);
        void (*invlpg)(struct kvm_vcpu *vcpu, gva_t gva);
        void (*update_pte)(struct kvm_vcpu *vcpu, struct kvm_mmu_page *sp,
                           u64 *spte, const void *pte);
        hpa_t root_hpa;
        union kvm_mmu_page_role base_role;
        u8 root_level;
        u8 shadow_root_level;
        u8 ept_ad;
        bool direct_map;

        /*
         * Bitmap; bit set = permission fault
         * Byte index: page fault error code [4:1]
         * Bit index: pte permissions in ACC_* format
         * (see the lookup sketch after this struct)
         */
        u8 permissions[16];

        /*
         * The pkru_mask indicates if protection key checks are needed. It
         * consists of 16 domains indexed by page fault error code bits [4:1],
         * with PFEC.RSVD replaced by ACC_USER_MASK from the page tables.
         * Each domain has 2 bits which are ANDed with AD and WD from PKRU.
         */
        u32 pkru_mask;

        u64 *pae_root;
        u64 *lm_root;

        /*
         * Check for zero bits in shadow page table entries; these bits
         * include not only hardware-reserved bits but also bits the spte
         * never uses.
         */
        struct rsvd_bits_validate shadow_zero_check;

        struct rsvd_bits_validate guest_rsvd_check;

        /* Can have large pages at levels 2..last_nonleaf_level-1. */
        u8 last_nonleaf_level;

        bool nx;

        u64 pdptrs[4]; /* pae */
};
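
/*
 * Lookup sketch for the @permissions bitmap above (illustrative and
 * simplified; the real permission_fault() in arch/x86/kvm/mmu.h also folds
 * in SMAP and PKU state): the byte index comes from page fault error code
 * bits [4:1], the bit index from the pte's ACC_* permissions, so the check
 * collapses to a table lookup plus a shift:
 *
 *      static bool example_permission_fault(struct kvm_mmu *mmu, u32 pfec,
 *                                           unsigned pte_access)
 *      {
 *              return (mmu->permissions[(pfec >> 1) & 15] >> pte_access) & 1;
 *      }
 */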
enum pmc_type {
        KVM_PMC_GP = 0,
        KVM_PMC_FIXED,
};

struct kvm_pmc {
        enum pmc_type type;
        u8 idx;
        u64 counter;
        u64 eventsel;
        struct perf_event *perf_event;
        struct kvm_vcpu *vcpu;
};

struct kvm_pmu {
        unsigned nr_arch_gp_counters;
        unsigned nr_arch_fixed_counters;
        unsigned available_event_types;
        u64 fixed_ctr_ctrl;
        u64 global_ctrl;
        u64 global_status;
        u64 global_ovf_ctrl;
        u64 counter_bitmask[2];
        u64 global_ctrl_mask;
        u64 reserved_bits;
        u8 version;
        struct kvm_pmc gp_counters[INTEL_PMC_MAX_GENERIC];
        struct kvm_pmc fixed_counters[INTEL_PMC_MAX_FIXED];
        struct irq_work irq_work;
        u64 reprogram_pmi;
};

struct kvm_pmu_ops;

enum {
        KVM_DEBUGREG_BP_ENABLED = 1,
        KVM_DEBUGREG_WONT_EXIT = 2,
        KVM_DEBUGREG_RELOAD = 4,
};

struct kvm_mtrr_range {
        u64 base;
        u64 mask;
        struct list_head node;
};

struct kvm_mtrr {
        struct kvm_mtrr_range var_ranges[KVM_NR_VAR_MTRR];
        mtrr_type fixed_ranges[KVM_NR_FIXED_MTRR_REGION];
        u64 deftype;
        struct list_head head;
};

/* Hyper-V SynIC timer */
struct kvm_vcpu_hv_stimer {
        struct hrtimer timer;
        int index;
        u64 config;
        u64 count;
        u64 exp_time;
        struct hv_message msg;
        bool msg_pending;
};

/* Hyper-V synthetic interrupt controller (SynIC) */
struct kvm_vcpu_hv_synic {
        u64 version;
        u64 control;
        u64 msg_page;
        u64 evt_page;
        atomic64_t sint[HV_SYNIC_SINT_COUNT];
        atomic_t sint_to_gsi[HV_SYNIC_SINT_COUNT];
        DECLARE_BITMAP(auto_eoi_bitmap, 256);
        DECLARE_BITMAP(vec_bitmap, 256);
        bool active;
        bool dont_zero_synic_pages;
};

/* Hyper-V per vcpu emulation context */
struct kvm_vcpu_hv {
        u32 vp_index;
        u64 hv_vapic;
        s64 runtime_offset;
        struct kvm_vcpu_hv_synic synic;
        struct kvm_hyperv_exit exit;
        struct kvm_vcpu_hv_stimer stimer[HV_SYNIC_STIMER_COUNT];
        DECLARE_BITMAP(stimer_pending_bitmap, HV_SYNIC_STIMER_COUNT);
};
struct kvm_vcpu_arch {
        /*
         * rip and regs accesses must go through
         * kvm_{register,rip}_{read,write} functions.
         */
        unsigned long regs[NR_VCPU_REGS];
        u32 regs_avail;
        u32 regs_dirty;

        unsigned long cr0;
        unsigned long cr0_guest_owned_bits;
        unsigned long cr2;
        unsigned long cr3;
        unsigned long cr4;
        unsigned long cr4_guest_owned_bits;
        unsigned long cr8;
        u32 pkru;
        u32 hflags;
        u64 efer;
        u64 apic_base;
        struct kvm_lapic *apic; /* kernel irqchip context */
        bool apicv_active;
        DECLARE_BITMAP(ioapic_handled_vectors, 256);
        unsigned long apic_attention;
        int32_t apic_arb_prio;
        int mp_state;
        u64 ia32_misc_enable_msr;
        u64 smbase;
        bool tpr_access_reporting;
        u64 ia32_xss;

        /*
         * Paging state of the vcpu
         *
         * If the vcpu runs in guest mode with two-level paging, this still
         * saves the paging mode of the L1 guest. This context is always
         * used to handle faults.
         */
        struct kvm_mmu mmu;

        /*
         * Paging state of an L2 guest (used for nested npt)
         *
         * This context saves all the information needed to walk the page
         * tables of an L2 guest. It is only initialized for page table
         * walking and not for faulting, since we never handle L2 page
         * faults on the host.
         */
        struct kvm_mmu nested_mmu;

        /*
         * Pointer to the mmu context currently used for
         * gva_to_gpa translations.
         */
        struct kvm_mmu *walk_mmu;

        struct kvm_mmu_memory_cache mmu_pte_list_desc_cache;
        struct kvm_mmu_memory_cache mmu_page_cache;
        struct kvm_mmu_memory_cache mmu_page_header_cache;

        struct fpu guest_fpu;
        u64 xcr0;
        u64 guest_supported_xcr0;
        u32 guest_xstate_size;

        struct kvm_pio_request pio;
        void *pio_data;

        u8 event_exit_inst_len;

        struct kvm_queued_exception {
                bool pending;
                bool injected;
                bool has_error_code;
                u8 nr;
                u32 error_code;
                u8 nested_apf;
        } exception;

        struct kvm_queued_interrupt {
                bool pending;
                bool soft;
                u8 nr;
        } interrupt;

        int halt_request; /* real mode on Intel only */

        int cpuid_nent;
        struct kvm_cpuid_entry2 cpuid_entries[KVM_MAX_CPUID_ENTRIES];

        int maxphyaddr;

        /* emulate context */
        struct x86_emulate_ctxt emulate_ctxt;
        bool emulate_regs_need_sync_to_vcpu;
        bool emulate_regs_need_sync_from_vcpu;
        int (*complete_userspace_io)(struct kvm_vcpu *vcpu);

        gpa_t time;
        struct pvclock_vcpu_time_info hv_clock;
        unsigned int hw_tsc_khz;
        struct gfn_to_hva_cache pv_time;
        bool pv_time_enabled;
        /* set guest stopped flag in pvclock flags field */
        bool pvclock_set_guest_stopped_request;

        struct {
                u64 msr_val;
                u64 last_steal;
                struct gfn_to_hva_cache stime;
                struct kvm_steal_time steal;
        } st;

        u64 tsc_offset;
        u64 last_guest_tsc;
        u64 last_host_tsc;
        u64 tsc_offset_adjustment;
        u64 this_tsc_nsec;
        u64 this_tsc_write;
        u64 this_tsc_generation;
        bool tsc_catchup;
        bool tsc_always_catchup;
        s8 virtual_tsc_shift;
        u32 virtual_tsc_mult;
        u32 virtual_tsc_khz;
        s64 ia32_tsc_adjust_msr;
        u64 tsc_scaling_ratio;

        atomic_t nmi_queued; /* unprocessed asynchronous NMIs */
        unsigned nmi_pending; /* NMI queued after currently running handler */
        bool nmi_injected; /* Trying to inject an NMI this entry */
        bool smi_pending; /* SMI queued after currently running handler */

        struct kvm_mtrr mtrr_state;
        u64 pat;

        unsigned switch_db_regs;
        unsigned long db[KVM_NR_DB_REGS];
        unsigned long dr6;
        unsigned long dr7;
        unsigned long eff_db[KVM_NR_DB_REGS];
        unsigned long guest_debug_dr7;
        u64 msr_platform_info;
        u64 msr_misc_features_enables;

        u64 mcg_cap;
        u64 mcg_status;
        u64 mcg_ctl;
        u64 mcg_ext_ctl;
        u64 *mce_banks;

        /* Cache MMIO info */
        u64 mmio_gva;
        unsigned access;
        gfn_t mmio_gfn;
        u64 mmio_gen;

        struct kvm_pmu pmu;

        /* used for guest single stepping over the given code position */
        unsigned long singlestep_rip;

        struct kvm_vcpu_hv hyperv;

        cpumask_var_t wbinvd_dirty_mask;

        unsigned long last_retry_eip;
        unsigned long last_retry_addr;

        struct {
                bool halted;
                gfn_t gfns[roundup_pow_of_two(ASYNC_PF_PER_VCPU)];
                struct gfn_to_hva_cache data;
                u64 msr_val;
                u32 id;
                bool send_user_only;
                u32 host_apf_reason;
                unsigned long nested_apf_token;
                bool delivery_as_pf_vmexit;
        } apf;

        /* OSVW MSRs (AMD only) */
        struct {
                u64 length;
                u64 status;
        } osvw;

        struct {
                u64 msr_val;
                struct gfn_to_hva_cache data;
        } pv_eoi;

        /*
         * Indicates whether the access faulted on its page table in the
         * guest; set when fixing a page fault and used to detect
         * unhandleable instructions.
         */
        bool write_fault_to_shadow_pgtable;

        /* set at EPT violation at this point */
        unsigned long exit_qualification;

        /* pv related host specific info */
        struct {
                bool pv_unhalted;
        } pv;

        int pending_ioapic_eoi;
        int pending_external_vector;

        /* GPA available */
        bool gpa_available;
        gpa_t gpa_val;

        /* set if the vcpu was preempted while in kernel mode (CPL = 0) */
        bool preempted_in_kernel;
};
struct kvm_lpage_info {
        int disallow_lpage;
};

struct kvm_arch_memory_slot {
        struct kvm_rmap_head *rmap[KVM_NR_PAGE_SIZES];
        struct kvm_lpage_info *lpage_info[KVM_NR_PAGE_SIZES - 1];
        unsigned short *gfn_track[KVM_PAGE_TRACK_MAX];
};

/*
 * We use as the mode the number of bits allocated in the LDR for the
 * logical processor ID. It happens that these are all powers of two.
 * This makes it very easy to detect cases where the APICs are
 * configured for multiple modes; in that case, we cannot use the map and
 * hence cannot use kvm_irq_delivery_to_apic_fast either.
 */
#define KVM_APIC_MODE_XAPIC_CLUSTER 4
#define KVM_APIC_MODE_XAPIC_FLAT 8
#define KVM_APIC_MODE_X2APIC 16
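
/*
 * Example (illustrative): because the three modes above are distinct
 * powers of two, ORing together the mode of every vCPU's APIC makes a
 * mixed configuration detectable with a single test:
 *
 *      static bool example_apic_modes_mixed(u8 mode)
 *      {
 *              return mode & (mode - 1);
 *      }
 *
 * A nonzero result means more than one mode bit is set, in which case the
 * map (and kvm_irq_delivery_to_apic_fast) cannot be used.
 */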
struct kvm_apic_map {
        struct rcu_head rcu;
        u8 mode;
        u32 max_apic_id;
        union {
                struct kvm_lapic *xapic_flat_map[8];
                struct kvm_lapic *xapic_cluster_map[16][4];
        };
        struct kvm_lapic *phys_map[];
};

/* Hyper-V emulation context */
struct kvm_hv {
        struct mutex hv_lock;
        u64 hv_guest_os_id;
        u64 hv_hypercall;
        u64 hv_tsc_page;

        /* Hyper-V based guest crash (NT kernel bugcheck) parameters */
        u64 hv_crash_param[HV_X64_MSR_CRASH_PARAMS];
        u64 hv_crash_ctl;

        HV_REFERENCE_TSC_PAGE tsc_ref;
};

enum kvm_irqchip_mode {
        KVM_IRQCHIP_NONE,
        KVM_IRQCHIP_KERNEL, /* created with KVM_CREATE_IRQCHIP */
        KVM_IRQCHIP_SPLIT, /* created with KVM_CAP_SPLIT_IRQCHIP */
};

struct kvm_arch {
        unsigned int n_used_mmu_pages;
        unsigned int n_requested_mmu_pages;
        unsigned int n_max_mmu_pages;
        unsigned int indirect_shadow_pages;
        unsigned long mmu_valid_gen;
        /* Hash table of struct kvm_mmu_page. */
        struct hlist_head mmu_page_hash[KVM_NUM_MMU_PAGES];
        struct list_head active_mmu_pages;
        struct list_head zapped_obsolete_pages;
        struct kvm_page_track_notifier_node mmu_sp_tracker;
        struct kvm_page_track_notifier_head track_notifier_head;

        struct list_head assigned_dev_head;
        struct iommu_domain *iommu_domain;
        bool iommu_noncoherent;
#define __KVM_HAVE_ARCH_NONCOHERENT_DMA
        atomic_t noncoherent_dma_count;
#define __KVM_HAVE_ARCH_ASSIGNED_DEVICE
        atomic_t assigned_device_count;
        struct kvm_pic *vpic;
        struct kvm_ioapic *vioapic;
        struct kvm_pit *vpit;
        atomic_t vapics_in_nmi_mode;
        struct mutex apic_map_lock;
        struct kvm_apic_map *apic_map;

        unsigned int tss_addr;
        bool apic_access_page_done;

        gpa_t wall_clock;

        bool ept_identity_pagetable_done;
        gpa_t ept_identity_map_addr;

        unsigned long irq_sources_bitmap;
        s64 kvmclock_offset;
        raw_spinlock_t tsc_write_lock;
        u64 last_tsc_nsec;
        u64 last_tsc_write;
        u32 last_tsc_khz;
        u64 cur_tsc_nsec;
        u64 cur_tsc_write;
        u64 cur_tsc_offset;
        u64 cur_tsc_generation;
        int nr_vcpus_matched_tsc;

        spinlock_t pvclock_gtod_sync_lock;
        bool use_master_clock;
        u64 master_kernel_ns;
        u64 master_cycle_now;
        struct delayed_work kvmclock_update_work;
        struct delayed_work kvmclock_sync_work;

        struct kvm_xen_hvm_config xen_hvm_config;

        /* reads protected by irq_srcu, writes by irq_lock */
        struct hlist_head mask_notifier_list;

        struct kvm_hv hyperv;

#ifdef CONFIG_KVM_MMU_AUDIT
        int audit_point;
#endif

        bool backwards_tsc_observed;
        bool boot_vcpu_runs_old_kvmclock;
        u32 bsp_vcpu_id;

        u64 disabled_quirks;

        enum kvm_irqchip_mode irqchip_mode;
        u8 nr_reserved_ioapic_pins;

        bool disabled_lapic_found;

        /* Struct members for AVIC */
        u32 avic_vm_id;
        u32 ldr_mode;
        struct page *avic_logical_id_table_page;
        struct page *avic_physical_id_table_page;
        struct hlist_node hnode;

        bool x2apic_format;
        bool x2apic_broadcast_quirk_disabled;
};

struct kvm_vm_stat {
        ulong mmu_shadow_zapped;
        ulong mmu_pte_write;
        ulong mmu_pte_updated;
        ulong mmu_pde_zapped;
        ulong mmu_flooded;
        ulong mmu_recycled;
        ulong mmu_cache_miss;
        ulong mmu_unsync;
        ulong remote_tlb_flush;
        ulong lpages;
        ulong max_mmu_page_hash_collisions;
};

struct kvm_vcpu_stat {
        u64 pf_fixed;
        u64 pf_guest;
        u64 tlb_flush;
        u64 invlpg;

        u64 exits;
        u64 io_exits;
        u64 mmio_exits;
        u64 signal_exits;
        u64 irq_window_exits;
        u64 nmi_window_exits;
        u64 halt_exits;
        u64 halt_successful_poll;
        u64 halt_attempted_poll;
        u64 halt_poll_invalid;
        u64 halt_wakeup;
        u64 request_irq_exits;
        u64 irq_exits;
        u64 host_state_reload;
        u64 efer_reload;
        u64 fpu_reload;
        u64 insn_emulation;
        u64 insn_emulation_fail;
        u64 hypercalls;
        u64 irq_injections;
        u64 nmi_injections;
        u64 req_event;
};

struct x86_instruction_info;

struct msr_data {
        bool host_initiated;
        u32 index;
        u64 data;
};

struct kvm_lapic_irq {
        u32 vector;
        u16 delivery_mode;
        u16 dest_mode;
        bool level;
        u16 trig_mode;
        u32 shorthand;
        u32 dest_id;
        bool msi_redir_hint;
};

struct kvm_x86_ops {
        int (*cpu_has_kvm_support)(void); /* __init */
        int (*disabled_by_bios)(void); /* __init */
        int (*hardware_enable)(void);
        void (*hardware_disable)(void);
        void (*check_processor_compatibility)(void *rtn);
        int (*hardware_setup)(void); /* __init */
        void (*hardware_unsetup)(void); /* __exit */
        bool (*cpu_has_accelerated_tpr)(void);
        bool (*cpu_has_high_real_mode_segbase)(void);
        void (*cpuid_update)(struct kvm_vcpu *vcpu);

        int (*vm_init)(struct kvm *kvm);
        void (*vm_destroy)(struct kvm *kvm);

        /* Create, but do not attach this VCPU */
        struct kvm_vcpu *(*vcpu_create)(struct kvm *kvm, unsigned id);
        void (*vcpu_free)(struct kvm_vcpu *vcpu);
        void (*vcpu_reset)(struct kvm_vcpu *vcpu, bool init_event);

        void (*prepare_guest_switch)(struct kvm_vcpu *vcpu);
        void (*vcpu_load)(struct kvm_vcpu *vcpu, int cpu);
        void (*vcpu_put)(struct kvm_vcpu *vcpu);

        void (*update_bp_intercept)(struct kvm_vcpu *vcpu);
        int (*get_msr)(struct kvm_vcpu *vcpu, struct msr_data *msr);
        int (*set_msr)(struct kvm_vcpu *vcpu, struct msr_data *msr);
        u64 (*get_segment_base)(struct kvm_vcpu *vcpu, int seg);
        void (*get_segment)(struct kvm_vcpu *vcpu,
                            struct kvm_segment *var, int seg);
        int (*get_cpl)(struct kvm_vcpu *vcpu);
        void (*set_segment)(struct kvm_vcpu *vcpu,
                            struct kvm_segment *var, int seg);
        void (*get_cs_db_l_bits)(struct kvm_vcpu *vcpu, int *db, int *l);
        void (*decache_cr0_guest_bits)(struct kvm_vcpu *vcpu);
        void (*decache_cr3)(struct kvm_vcpu *vcpu);
        void (*decache_cr4_guest_bits)(struct kvm_vcpu *vcpu);
        void (*set_cr0)(struct kvm_vcpu *vcpu, unsigned long cr0);
        void (*set_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);
        int (*set_cr4)(struct kvm_vcpu *vcpu, unsigned long cr4);
        void (*set_efer)(struct kvm_vcpu *vcpu, u64 efer);
        void (*get_idt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
        void (*set_idt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
        void (*get_gdt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
        void (*set_gdt)(struct kvm_vcpu *vcpu, struct desc_ptr *dt);
        u64 (*get_dr6)(struct kvm_vcpu *vcpu);
        void (*set_dr6)(struct kvm_vcpu *vcpu, unsigned long value);
        void (*sync_dirty_debug_regs)(struct kvm_vcpu *vcpu);
        void (*set_dr7)(struct kvm_vcpu *vcpu, unsigned long value);
        void (*cache_reg)(struct kvm_vcpu *vcpu, enum kvm_reg reg);
        unsigned long (*get_rflags)(struct kvm_vcpu *vcpu);
        void (*set_rflags)(struct kvm_vcpu *vcpu, unsigned long rflags);

        void (*tlb_flush)(struct kvm_vcpu *vcpu);

        void (*run)(struct kvm_vcpu *vcpu);
        int (*handle_exit)(struct kvm_vcpu *vcpu);
        void (*skip_emulated_instruction)(struct kvm_vcpu *vcpu);
        void (*set_interrupt_shadow)(struct kvm_vcpu *vcpu, int mask);
        u32 (*get_interrupt_shadow)(struct kvm_vcpu *vcpu);
        void (*patch_hypercall)(struct kvm_vcpu *vcpu,
                                unsigned char *hypercall_addr);
        void (*set_irq)(struct kvm_vcpu *vcpu);
        void (*set_nmi)(struct kvm_vcpu *vcpu);
        void (*queue_exception)(struct kvm_vcpu *vcpu);
        void (*cancel_injection)(struct kvm_vcpu *vcpu);
        int (*interrupt_allowed)(struct kvm_vcpu *vcpu);
        int (*nmi_allowed)(struct kvm_vcpu *vcpu);
        bool (*get_nmi_mask)(struct kvm_vcpu *vcpu);
        void (*set_nmi_mask)(struct kvm_vcpu *vcpu, bool masked);
        void (*enable_nmi_window)(struct kvm_vcpu *vcpu);
        void (*enable_irq_window)(struct kvm_vcpu *vcpu);
        void (*update_cr8_intercept)(struct kvm_vcpu *vcpu, int tpr, int irr);
        bool (*get_enable_apicv)(struct kvm_vcpu *vcpu);
        void (*refresh_apicv_exec_ctrl)(struct kvm_vcpu *vcpu);
        void (*hwapic_irr_update)(struct kvm_vcpu *vcpu, int max_irr);
        void (*hwapic_isr_update)(struct kvm_vcpu *vcpu, int isr);
        void (*load_eoi_exitmap)(struct kvm_vcpu *vcpu, u64 *eoi_exit_bitmap);
        void (*set_virtual_x2apic_mode)(struct kvm_vcpu *vcpu, bool set);
        void (*set_apic_access_page_addr)(struct kvm_vcpu *vcpu, hpa_t hpa);
        void (*deliver_posted_interrupt)(struct kvm_vcpu *vcpu, int vector);
        int (*sync_pir_to_irr)(struct kvm_vcpu *vcpu);
        int (*set_tss_addr)(struct kvm *kvm, unsigned int addr);
        int (*get_tdp_level)(struct kvm_vcpu *vcpu);
        u64 (*get_mt_mask)(struct kvm_vcpu *vcpu, gfn_t gfn, bool is_mmio);
        int (*get_lpage_level)(void);
        bool (*rdtscp_supported)(void);
        bool (*invpcid_supported)(void);

        void (*set_tdp_cr3)(struct kvm_vcpu *vcpu, unsigned long cr3);

        void (*set_supported_cpuid)(u32 func, struct kvm_cpuid_entry2 *entry);

        bool (*has_wbinvd_exit)(void);

        void (*write_tsc_offset)(struct kvm_vcpu *vcpu, u64 offset);

        void (*get_exit_info)(struct kvm_vcpu *vcpu, u64 *info1, u64 *info2);

        int (*check_intercept)(struct kvm_vcpu *vcpu,
                               struct x86_instruction_info *info,
                               enum x86_intercept_stage stage);
        void (*handle_external_intr)(struct kvm_vcpu *vcpu);
        bool (*mpx_supported)(void);
        bool (*xsaves_supported)(void);

        int (*check_nested_events)(struct kvm_vcpu *vcpu, bool external_intr);

        void (*sched_in)(struct kvm_vcpu *vcpu, int cpu);

        /*
         * Arch-specific dirty logging hooks. These hooks are only supposed
         * to be valid if the specific arch has a hardware-accelerated dirty
         * logging mechanism. Currently only for PML on VMX.
         *
         *  - slot_enable_log_dirty:
         *      called when enabling log dirty mode for the slot.
         *  - slot_disable_log_dirty:
         *      called when disabling log dirty mode for the slot.
         *      also called when slot is created with log dirty disabled.
         *  - flush_log_dirty:
         *      called before reporting dirty_bitmap to userspace.
         *  - enable_log_dirty_pt_masked:
         *      called when reenabling log dirty for the GFNs in the mask
         *      after corresponding bits are cleared in slot->dirty_bitmap.
         */
        void (*slot_enable_log_dirty)(struct kvm *kvm,
                                      struct kvm_memory_slot *slot);
        void (*slot_disable_log_dirty)(struct kvm *kvm,
                                       struct kvm_memory_slot *slot);
        void (*flush_log_dirty)(struct kvm *kvm);
        void (*enable_log_dirty_pt_masked)(struct kvm *kvm,
                                           struct kvm_memory_slot *slot,
                                           gfn_t offset, unsigned long mask);
        int (*write_log_dirty)(struct kvm_vcpu *vcpu);

        /* pmu operations of sub-arch */
        const struct kvm_pmu_ops *pmu_ops;

        /*
         * Architecture specific hooks for vCPU blocking due to
         * HLT instruction.
         * Returns for .pre_block():
         *    - 0 means continue to block the vCPU.
         *    - 1 means we cannot block the vCPU because some event happened
         *      during this period, such as the 'ON' bit in the
         *      posted-interrupts descriptor being set.
         */
        int (*pre_block)(struct kvm_vcpu *vcpu);
        void (*post_block)(struct kvm_vcpu *vcpu);

        void (*vcpu_blocking)(struct kvm_vcpu *vcpu);
        void (*vcpu_unblocking)(struct kvm_vcpu *vcpu);

        int (*update_pi_irte)(struct kvm *kvm, unsigned int host_irq,
                              uint32_t guest_irq, bool set);
        void (*apicv_post_state_restore)(struct kvm_vcpu *vcpu);

        int (*set_hv_timer)(struct kvm_vcpu *vcpu, u64 guest_deadline_tsc);
        void (*cancel_hv_timer)(struct kvm_vcpu *vcpu);

        void (*setup_mce)(struct kvm_vcpu *vcpu);
};
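
/*
 * Sketch of the blocking flow implied by the .pre_block()/.post_block()
 * contract above (illustrative; the real sequence lives in the vcpu-block
 * paths of arch/x86/kvm and virt/kvm):
 *
 *      if (kvm_x86_ops->pre_block && kvm_x86_ops->pre_block(vcpu))
 *              return;
 *      (... halt-poll or wait until woken ...)
 *      if (kvm_x86_ops->post_block)
 *              kvm_x86_ops->post_block(vcpu);
 *
 * A nonzero pre_block() return means an event (e.g. a posted interrupt)
 * is already pending, so the vCPU must not block.
 */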
struct kvm_arch_async_pf {
        u32 token;
        gfn_t gfn;
        unsigned long cr3;
        bool direct_map;
};

extern struct kvm_x86_ops *kvm_x86_ops;

int kvm_mmu_module_init(void);
void kvm_mmu_module_exit(void);

void kvm_mmu_destroy(struct kvm_vcpu *vcpu);
int kvm_mmu_create(struct kvm_vcpu *vcpu);
void kvm_mmu_setup(struct kvm_vcpu *vcpu);
void kvm_mmu_init_vm(struct kvm *kvm);
void kvm_mmu_uninit_vm(struct kvm *kvm);
void kvm_mmu_set_mask_ptes(u64 user_mask, u64 accessed_mask,
                u64 dirty_mask, u64 nx_mask, u64 x_mask, u64 p_mask,
                u64 acc_track_mask, u64 me_mask);

void kvm_mmu_reset_context(struct kvm_vcpu *vcpu);
void kvm_mmu_slot_remove_write_access(struct kvm *kvm,
                                      struct kvm_memory_slot *memslot);
void kvm_mmu_zap_collapsible_sptes(struct kvm *kvm,
                                   const struct kvm_memory_slot *memslot);
void kvm_mmu_slot_leaf_clear_dirty(struct kvm *kvm,
                                   struct kvm_memory_slot *memslot);
void kvm_mmu_slot_largepage_remove_write_access(struct kvm *kvm,
                                        struct kvm_memory_slot *memslot);
void kvm_mmu_slot_set_dirty(struct kvm *kvm,
                            struct kvm_memory_slot *memslot);
void kvm_mmu_clear_dirty_pt_masked(struct kvm *kvm,
                                   struct kvm_memory_slot *slot,
                                   gfn_t gfn_offset, unsigned long mask);
void kvm_mmu_zap_all(struct kvm *kvm);
void kvm_mmu_invalidate_mmio_sptes(struct kvm *kvm, struct kvm_memslots *slots);
unsigned int kvm_mmu_calculate_mmu_pages(struct kvm *kvm);
void kvm_mmu_change_mmu_pages(struct kvm *kvm, unsigned int kvm_nr_mmu_pages);

int load_pdptrs(struct kvm_vcpu *vcpu, struct kvm_mmu *mmu, unsigned long cr3);
bool pdptrs_changed(struct kvm_vcpu *vcpu);

int emulator_write_phys(struct kvm_vcpu *vcpu, gpa_t gpa,
                        const void *val, int bytes);

struct kvm_irq_mask_notifier {
        void (*func)(struct kvm_irq_mask_notifier *kimn, bool masked);
        int irq;
        struct hlist_node link;
};

void kvm_register_irq_mask_notifier(struct kvm *kvm, int irq,
                                    struct kvm_irq_mask_notifier *kimn);
void kvm_unregister_irq_mask_notifier(struct kvm *kvm, int irq,
                                      struct kvm_irq_mask_notifier *kimn);
void kvm_fire_mask_notifiers(struct kvm *kvm, unsigned irqchip, unsigned pin,
                             bool mask);

extern bool tdp_enabled;

u64 vcpu_tsc_khz(struct kvm_vcpu *vcpu);

/* control of guest tsc rate supported? */
extern bool kvm_has_tsc_control;
/* maximum supported tsc_khz for guests */
extern u32 kvm_max_guest_tsc_khz;
/* number of bits of the fractional part of the TSC scaling ratio */
extern u8 kvm_tsc_scaling_ratio_frac_bits;
/* maximum allowed value of TSC scaling ratio */
extern u64 kvm_max_tsc_scaling_ratio;
/* 1ull << kvm_tsc_scaling_ratio_frac_bits */
extern u64 kvm_default_tsc_scaling_ratio;

extern u64 kvm_mce_cap_supported;

enum emulation_result {
        EMULATE_DONE, /* no further processing */
        EMULATE_USER_EXIT, /* kvm_run ready for userspace exit */
        EMULATE_FAIL, /* can't emulate this instruction */
};

#define EMULTYPE_NO_DECODE (1 << 0)
#define EMULTYPE_TRAP_UD (1 << 1)
#define EMULTYPE_SKIP (1 << 2)
#define EMULTYPE_RETRY (1 << 3)
#define EMULTYPE_NO_REEXECUTE (1 << 4)
int x86_emulate_instruction(struct kvm_vcpu *vcpu, unsigned long cr2,
                            int emulation_type, void *insn, int insn_len);

static inline int emulate_instruction(struct kvm_vcpu *vcpu,
                                      int emulation_type)
{
        return x86_emulate_instruction(vcpu, 0, emulation_type, NULL, 0);
}

void kvm_enable_efer_bits(u64);
bool kvm_valid_efer(struct kvm_vcpu *vcpu, u64 efer);
int kvm_get_msr(struct kvm_vcpu *vcpu, struct msr_data *msr);
int kvm_set_msr(struct kvm_vcpu *vcpu, struct msr_data *msr);

struct x86_emulate_ctxt;

int kvm_fast_pio_out(struct kvm_vcpu *vcpu, int size, unsigned short port);
int kvm_fast_pio_in(struct kvm_vcpu *vcpu, int size, unsigned short port);
int kvm_emulate_cpuid(struct kvm_vcpu *vcpu);
int kvm_emulate_halt(struct kvm_vcpu *vcpu);
int kvm_vcpu_halt(struct kvm_vcpu *vcpu);
int kvm_emulate_wbinvd(struct kvm_vcpu *vcpu);

void kvm_get_segment(struct kvm_vcpu *vcpu, struct kvm_segment *var, int seg);
int kvm_load_segment_descriptor(struct kvm_vcpu *vcpu, u16 selector, int seg);
void kvm_vcpu_deliver_sipi_vector(struct kvm_vcpu *vcpu, u8 vector);

int kvm_task_switch(struct kvm_vcpu *vcpu, u16 tss_selector, int idt_index,
                    int reason, bool has_error_code, u32 error_code);

int kvm_set_cr0(struct kvm_vcpu *vcpu, unsigned long cr0);
int kvm_set_cr3(struct kvm_vcpu *vcpu, unsigned long cr3);
int kvm_set_cr4(struct kvm_vcpu *vcpu, unsigned long cr4);
int kvm_set_cr8(struct kvm_vcpu *vcpu, unsigned long cr8);
int kvm_set_dr(struct kvm_vcpu *vcpu, int dr, unsigned long val);
int kvm_get_dr(struct kvm_vcpu *vcpu, int dr, unsigned long *val);
unsigned long kvm_get_cr8(struct kvm_vcpu *vcpu);
void kvm_lmsw(struct kvm_vcpu *vcpu, unsigned long msw);
void kvm_get_cs_db_l_bits(struct kvm_vcpu *vcpu, int *db, int *l);
int kvm_set_xcr(struct kvm_vcpu *vcpu, u32 index, u64 xcr);

int kvm_get_msr_common(struct kvm_vcpu *vcpu, struct msr_data *msr);
int kvm_set_msr_common(struct kvm_vcpu *vcpu, struct msr_data *msr);

unsigned long kvm_get_rflags(struct kvm_vcpu *vcpu);
void kvm_set_rflags(struct kvm_vcpu *vcpu, unsigned long rflags);
bool kvm_rdpmc(struct kvm_vcpu *vcpu);

void kvm_queue_exception(struct kvm_vcpu *vcpu, unsigned nr);
void kvm_queue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
void kvm_requeue_exception(struct kvm_vcpu *vcpu, unsigned nr);
void kvm_requeue_exception_e(struct kvm_vcpu *vcpu, unsigned nr, u32 error_code);
void kvm_inject_page_fault(struct kvm_vcpu *vcpu, struct x86_exception *fault);
int kvm_read_guest_page_mmu(struct kvm_vcpu *vcpu, struct kvm_mmu *mmu,
                            gfn_t gfn, void *data, int offset, int len,
                            u32 access);
bool kvm_require_cpl(struct kvm_vcpu *vcpu, int required_cpl);
bool kvm_require_dr(struct kvm_vcpu *vcpu, int dr);

static inline int __kvm_irq_line_state(unsigned long *irq_state,
                                       int irq_source_id, int level)
{
        /* Logical OR for level-triggered interrupts */
        if (level)
                __set_bit(irq_source_id, irq_state);
        else
                __clear_bit(irq_source_id, irq_state);

        return !!(*irq_state);
}

int kvm_pic_set_irq(struct kvm_pic *pic, int irq, int irq_source_id, int level);
void kvm_pic_clear_all(struct kvm_pic *pic, int irq_source_id);

void kvm_inject_nmi(struct kvm_vcpu *vcpu);

int kvm_mmu_unprotect_page(struct kvm *kvm, gfn_t gfn);
int kvm_mmu_unprotect_page_virt(struct kvm_vcpu *vcpu, gva_t gva);
void __kvm_mmu_free_some_pages(struct kvm_vcpu *vcpu);
int kvm_mmu_load(struct kvm_vcpu *vcpu);
void kvm_mmu_unload(struct kvm_vcpu *vcpu);
void kvm_mmu_sync_roots(struct kvm_vcpu *vcpu);
gpa_t translate_nested_gpa(struct kvm_vcpu *vcpu, gpa_t gpa, u32 access,
                           struct x86_exception *exception);
gpa_t kvm_mmu_gva_to_gpa_read(struct kvm_vcpu *vcpu, gva_t gva,
                              struct x86_exception *exception);
gpa_t kvm_mmu_gva_to_gpa_fetch(struct kvm_vcpu *vcpu, gva_t gva,
                               struct x86_exception *exception);
gpa_t kvm_mmu_gva_to_gpa_write(struct kvm_vcpu *vcpu, gva_t gva,
                               struct x86_exception *exception);
gpa_t kvm_mmu_gva_to_gpa_system(struct kvm_vcpu *vcpu, gva_t gva,
                                struct x86_exception *exception);

void kvm_vcpu_deactivate_apicv(struct kvm_vcpu *vcpu);

int kvm_emulate_hypercall(struct kvm_vcpu *vcpu);

int kvm_mmu_page_fault(struct kvm_vcpu *vcpu, gva_t gva, u64 error_code,
                       void *insn, int insn_len);
void kvm_mmu_invlpg(struct kvm_vcpu *vcpu, gva_t gva);
void kvm_mmu_new_cr3(struct kvm_vcpu *vcpu);

void kvm_enable_tdp(void);
void kvm_disable_tdp(void);

static inline gpa_t translate_gpa(struct kvm_vcpu *vcpu, gpa_t gpa, u32 access,
                                  struct x86_exception *exception)
{
        return gpa;
}

static inline struct kvm_mmu_page *page_header(hpa_t shadow_page)
{
        struct page *page = pfn_to_page(shadow_page >> PAGE_SHIFT);

        return (struct kvm_mmu_page *)page_private(page);
}

static inline u16 kvm_read_ldt(void)
{
        u16 ldt;

        asm("sldt %0" : "=g"(ldt));
        return ldt;
}

static inline void kvm_load_ldt(u16 sel)
{
        asm("lldt %0" : : "rm"(sel));
}

#ifdef CONFIG_X86_64
static inline unsigned long read_msr(unsigned long msr)
{
        u64 value;

        rdmsrl(msr, value);
        return value;
}
#endif

static inline u32 get_rdx_init_val(void)
{
        return 0x600; /* P6 family */
}

static inline void kvm_inject_gp(struct kvm_vcpu *vcpu, u32 error_code)
{
        kvm_queue_exception_e(vcpu, GP_VECTOR, error_code);
}

#define TSS_IOPB_BASE_OFFSET 0x66
#define TSS_BASE_SIZE 0x68
#define TSS_IOPB_SIZE (65536 / 8)
#define TSS_REDIRECTION_SIZE (256 / 8)
#define RMODE_TSS_SIZE \
        (TSS_BASE_SIZE + TSS_REDIRECTION_SIZE + TSS_IOPB_SIZE + 1)

enum {
        TASK_SWITCH_CALL = 0,
        TASK_SWITCH_IRET = 1,
        TASK_SWITCH_JMP = 2,
        TASK_SWITCH_GATE = 3,
};

#define HF_GIF_MASK (1 << 0)
#define HF_HIF_MASK (1 << 1)
#define HF_VINTR_MASK (1 << 2)
#define HF_NMI_MASK (1 << 3)
#define HF_IRET_MASK (1 << 4)
#define HF_GUEST_MASK (1 << 5) /* VCPU is in guest-mode */
#define HF_SMM_MASK (1 << 6)
#define HF_SMM_INSIDE_NMI_MASK (1 << 7)

#define __KVM_VCPU_MULTIPLE_ADDRESS_SPACE
#define KVM_ADDRESS_SPACE_NUM 2

#define kvm_arch_vcpu_memslots_id(vcpu) ((vcpu)->arch.hflags & HF_SMM_MASK ? 1 : 0)
#define kvm_memslots_for_spte_role(kvm, role) __kvm_memslots(kvm, (role).smm)
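
/*
 * Example (illustrative): x86 defines two memslot address spaces so that
 * SMM can see different memory (e.g. SMRAM) than normal mode. A lookup
 * such as
 *
 *      slots = __kvm_memslots(vcpu->kvm, kvm_arch_vcpu_memslots_id(vcpu));
 *
 * therefore resolves to address space 1 whenever HF_SMM_MASK is set in
 * vcpu->arch.hflags, and to address space 0 otherwise.
 */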
/*
 * Hardware virtualization extension instructions may fault if a
 * reboot turns off virtualization while processes are running.
 * Trap the fault and ignore the instruction if that happens.
 */
asmlinkage void kvm_spurious_fault(void);

#define ____kvm_handle_fault_on_reboot(insn, cleanup_insn) \
        "666: " insn "\n\t" \
        "668: \n\t" \
        ".pushsection .fixup, \"ax\" \n" \
        "667: \n\t" \
        cleanup_insn "\n\t" \
        "cmpb $0, kvm_rebooting \n\t" \
        "jne 668b \n\t" \
        __ASM_SIZE(push) " $666b \n\t" \
        "call kvm_spurious_fault \n\t" \
        ".popsection \n\t" \
        _ASM_EXTABLE(666b, 667b)

#define __kvm_handle_fault_on_reboot(insn) \
        ____kvm_handle_fault_on_reboot(insn, "")
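
/*
 * Usage sketch (illustrative): vendor code wraps virtualization
 * instructions that may fault during a reboot, e.g.:
 *
 *      asm volatile(__kvm_handle_fault_on_reboot("vmxoff"));
 *
 * If the instruction faults because virtualization was already turned
 * off, the fixup code checks kvm_rebooting: when a reboot is in progress
 * the fault is ignored and execution resumes after the instruction;
 * otherwise kvm_spurious_fault() is called.
 */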
#define KVM_ARCH_WANT_MMU_NOTIFIER
int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
int kvm_unmap_hva_range(struct kvm *kvm, unsigned long start, unsigned long end);
int kvm_age_hva(struct kvm *kvm, unsigned long start, unsigned long end);
int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);
int kvm_cpu_has_injectable_intr(struct kvm_vcpu *v);
int kvm_cpu_has_interrupt(struct kvm_vcpu *vcpu);
int kvm_arch_interrupt_allowed(struct kvm_vcpu *vcpu);
int kvm_cpu_get_interrupt(struct kvm_vcpu *v);
void kvm_vcpu_reset(struct kvm_vcpu *vcpu, bool init_event);
void kvm_vcpu_reload_apic_access_page(struct kvm_vcpu *vcpu);

void kvm_define_shared_msr(unsigned index, u32 msr);
int kvm_set_shared_msr(unsigned index, u64 val, u64 mask);

u64 kvm_scale_tsc(struct kvm_vcpu *vcpu, u64 tsc);
u64 kvm_read_l1_tsc(struct kvm_vcpu *vcpu, u64 host_tsc);

unsigned long kvm_get_linear_rip(struct kvm_vcpu *vcpu);
bool kvm_is_linear_rip(struct kvm_vcpu *vcpu, unsigned long linear_rip);

void kvm_make_mclock_inprogress_request(struct kvm *kvm);
void kvm_make_scan_ioapic_request(struct kvm *kvm);

void kvm_arch_async_page_not_present(struct kvm_vcpu *vcpu,
                                     struct kvm_async_pf *work);
void kvm_arch_async_page_present(struct kvm_vcpu *vcpu,
                                 struct kvm_async_pf *work);
void kvm_arch_async_page_ready(struct kvm_vcpu *vcpu,
                               struct kvm_async_pf *work);
bool kvm_arch_can_inject_async_page_present(struct kvm_vcpu *vcpu);
extern bool kvm_find_async_pf_gfn(struct kvm_vcpu *vcpu, gfn_t gfn);

int kvm_skip_emulated_instruction(struct kvm_vcpu *vcpu);
int kvm_complete_insn_gp(struct kvm_vcpu *vcpu, int err);

int kvm_is_in_guest(void);

int __x86_set_memory_region(struct kvm *kvm, int id, gpa_t gpa, u32 size);
int x86_set_memory_region(struct kvm *kvm, int id, gpa_t gpa, u32 size);
bool kvm_vcpu_is_reset_bsp(struct kvm_vcpu *vcpu);
bool kvm_vcpu_is_bsp(struct kvm_vcpu *vcpu);

bool kvm_intr_is_single_vcpu(struct kvm *kvm, struct kvm_lapic_irq *irq,
                             struct kvm_vcpu **dest_vcpu);

void kvm_set_msi_irq(struct kvm *kvm, struct kvm_kernel_irq_routing_entry *e,
                     struct kvm_lapic_irq *irq);

static inline void kvm_arch_vcpu_blocking(struct kvm_vcpu *vcpu)
{
        if (kvm_x86_ops->vcpu_blocking)
                kvm_x86_ops->vcpu_blocking(vcpu);
}

static inline void kvm_arch_vcpu_unblocking(struct kvm_vcpu *vcpu)
{
        if (kvm_x86_ops->vcpu_unblocking)
                kvm_x86_ops->vcpu_unblocking(vcpu);
}

static inline void kvm_arch_vcpu_block_finish(struct kvm_vcpu *vcpu) {}

static inline int kvm_cpu_get_apicid(int mps_cpu)
{
#ifdef CONFIG_X86_LOCAL_APIC
        return default_cpu_present_to_apicid(mps_cpu);
#else
        WARN_ON_ONCE(1);
        return BAD_APICID;
#endif
}

#endif /* _ASM_X86_KVM_HOST_H */