pgtable.c 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770
  1. /*
  2. * Copyright IBM Corp. 2007, 2011
  3. * Author(s): Martin Schwidefsky <schwidefsky@de.ibm.com>
  4. */
  5. #include <linux/sched.h>
  6. #include <linux/kernel.h>
  7. #include <linux/errno.h>
  8. #include <linux/gfp.h>
  9. #include <linux/mm.h>
  10. #include <linux/swap.h>
  11. #include <linux/smp.h>
  12. #include <linux/spinlock.h>
  13. #include <linux/rcupdate.h>
  14. #include <linux/slab.h>
  15. #include <linux/swapops.h>
  16. #include <linux/sysctl.h>
  17. #include <linux/ksm.h>
  18. #include <linux/mman.h>
  19. #include <asm/pgtable.h>
  20. #include <asm/pgalloc.h>
  21. #include <asm/tlb.h>
  22. #include <asm/tlbflush.h>
  23. #include <asm/mmu_context.h>
  24. static inline pte_t ptep_flush_direct(struct mm_struct *mm,
  25. unsigned long addr, pte_t *ptep)
  26. {
  27. pte_t old;
  28. old = *ptep;
  29. if (unlikely(pte_val(old) & _PAGE_INVALID))
  30. return old;
  31. atomic_inc(&mm->context.flush_count);
  32. if (MACHINE_HAS_TLB_LC &&
  33. cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
  34. __ptep_ipte(addr, ptep, IPTE_LOCAL);
  35. else
  36. __ptep_ipte(addr, ptep, IPTE_GLOBAL);
  37. atomic_dec(&mm->context.flush_count);
  38. return old;
  39. }
  40. static inline pte_t ptep_flush_lazy(struct mm_struct *mm,
  41. unsigned long addr, pte_t *ptep)
  42. {
  43. pte_t old;
  44. old = *ptep;
  45. if (unlikely(pte_val(old) & _PAGE_INVALID))
  46. return old;
  47. atomic_inc(&mm->context.flush_count);
  48. if (cpumask_equal(&mm->context.cpu_attach_mask,
  49. cpumask_of(smp_processor_id()))) {
  50. pte_val(*ptep) |= _PAGE_INVALID;
  51. mm->context.flush_mm = 1;
  52. } else
  53. __ptep_ipte(addr, ptep, IPTE_GLOBAL);
  54. atomic_dec(&mm->context.flush_count);
  55. return old;
  56. }
  57. static inline pgste_t pgste_get_lock(pte_t *ptep)
  58. {
  59. unsigned long new = 0;
  60. #ifdef CONFIG_PGSTE
  61. unsigned long old;
  62. asm(
  63. " lg %0,%2\n"
  64. "0: lgr %1,%0\n"
  65. " nihh %0,0xff7f\n" /* clear PCL bit in old */
  66. " oihh %1,0x0080\n" /* set PCL bit in new */
  67. " csg %0,%1,%2\n"
  68. " jl 0b\n"
  69. : "=&d" (old), "=&d" (new), "=Q" (ptep[PTRS_PER_PTE])
  70. : "Q" (ptep[PTRS_PER_PTE]) : "cc", "memory");
  71. #endif
  72. return __pgste(new);
  73. }
  74. static inline void pgste_set_unlock(pte_t *ptep, pgste_t pgste)
  75. {
  76. #ifdef CONFIG_PGSTE
  77. asm(
  78. " nihh %1,0xff7f\n" /* clear PCL bit */
  79. " stg %1,%0\n"
  80. : "=Q" (ptep[PTRS_PER_PTE])
  81. : "d" (pgste_val(pgste)), "Q" (ptep[PTRS_PER_PTE])
  82. : "cc", "memory");
  83. #endif
  84. }
  85. static inline pgste_t pgste_get(pte_t *ptep)
  86. {
  87. unsigned long pgste = 0;
  88. #ifdef CONFIG_PGSTE
  89. pgste = *(unsigned long *)(ptep + PTRS_PER_PTE);
  90. #endif
  91. return __pgste(pgste);
  92. }
  93. static inline void pgste_set(pte_t *ptep, pgste_t pgste)
  94. {
  95. #ifdef CONFIG_PGSTE
  96. *(pgste_t *)(ptep + PTRS_PER_PTE) = pgste;
  97. #endif
  98. }
  99. static inline pgste_t pgste_update_all(pte_t pte, pgste_t pgste,
  100. struct mm_struct *mm)
  101. {
  102. #ifdef CONFIG_PGSTE
  103. unsigned long address, bits, skey;
  104. if (!mm_use_skey(mm) || pte_val(pte) & _PAGE_INVALID)
  105. return pgste;
  106. address = pte_val(pte) & PAGE_MASK;
  107. skey = (unsigned long) page_get_storage_key(address);
  108. bits = skey & (_PAGE_CHANGED | _PAGE_REFERENCED);
  109. /* Transfer page changed & referenced bit to guest bits in pgste */
  110. pgste_val(pgste) |= bits << 48; /* GR bit & GC bit */
  111. /* Copy page access key and fetch protection bit to pgste */
  112. pgste_val(pgste) &= ~(PGSTE_ACC_BITS | PGSTE_FP_BIT);
  113. pgste_val(pgste) |= (skey & (_PAGE_ACC_BITS | _PAGE_FP_BIT)) << 56;
  114. #endif
  115. return pgste;
  116. }
  117. static inline void pgste_set_key(pte_t *ptep, pgste_t pgste, pte_t entry,
  118. struct mm_struct *mm)
  119. {
  120. #ifdef CONFIG_PGSTE
  121. unsigned long address;
  122. unsigned long nkey;
  123. if (!mm_use_skey(mm) || pte_val(entry) & _PAGE_INVALID)
  124. return;
  125. VM_BUG_ON(!(pte_val(*ptep) & _PAGE_INVALID));
  126. address = pte_val(entry) & PAGE_MASK;
  127. /*
  128. * Set page access key and fetch protection bit from pgste.
  129. * The guest C/R information is still in the PGSTE, set real
  130. * key C/R to 0.
  131. */
  132. nkey = (pgste_val(pgste) & (PGSTE_ACC_BITS | PGSTE_FP_BIT)) >> 56;
  133. nkey |= (pgste_val(pgste) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 48;
  134. page_set_storage_key(address, nkey, 0);
  135. #endif
  136. }
  137. static inline pgste_t pgste_set_pte(pte_t *ptep, pgste_t pgste, pte_t entry)
  138. {
  139. #ifdef CONFIG_PGSTE
  140. if ((pte_val(entry) & _PAGE_PRESENT) &&
  141. (pte_val(entry) & _PAGE_WRITE) &&
  142. !(pte_val(entry) & _PAGE_INVALID)) {
  143. if (!MACHINE_HAS_ESOP) {
  144. /*
  145. * Without enhanced suppression-on-protection force
  146. * the dirty bit on for all writable ptes.
  147. */
  148. pte_val(entry) |= _PAGE_DIRTY;
  149. pte_val(entry) &= ~_PAGE_PROTECT;
  150. }
  151. if (!(pte_val(entry) & _PAGE_PROTECT))
  152. /* This pte allows write access, set user-dirty */
  153. pgste_val(pgste) |= PGSTE_UC_BIT;
  154. }
  155. #endif
  156. *ptep = entry;
  157. return pgste;
  158. }
  159. static inline pgste_t pgste_pte_notify(struct mm_struct *mm,
  160. unsigned long addr,
  161. pte_t *ptep, pgste_t pgste)
  162. {
  163. #ifdef CONFIG_PGSTE
  164. unsigned long bits;
  165. bits = pgste_val(pgste) & (PGSTE_IN_BIT | PGSTE_VSIE_BIT);
  166. if (bits) {
  167. pgste_val(pgste) ^= bits;
  168. ptep_notify(mm, addr, ptep, bits);
  169. }
  170. #endif
  171. return pgste;
  172. }
  173. static inline pgste_t ptep_xchg_start(struct mm_struct *mm,
  174. unsigned long addr, pte_t *ptep)
  175. {
  176. pgste_t pgste = __pgste(0);
  177. if (mm_has_pgste(mm)) {
  178. pgste = pgste_get_lock(ptep);
  179. pgste = pgste_pte_notify(mm, addr, ptep, pgste);
  180. }
  181. return pgste;
  182. }
  183. static inline void ptep_xchg_commit(struct mm_struct *mm,
  184. unsigned long addr, pte_t *ptep,
  185. pgste_t pgste, pte_t old, pte_t new)
  186. {
  187. if (mm_has_pgste(mm)) {
  188. if (pte_val(old) & _PAGE_INVALID)
  189. pgste_set_key(ptep, pgste, new, mm);
  190. if (pte_val(new) & _PAGE_INVALID) {
  191. pgste = pgste_update_all(old, pgste, mm);
  192. if ((pgste_val(pgste) & _PGSTE_GPS_USAGE_MASK) ==
  193. _PGSTE_GPS_USAGE_UNUSED)
  194. pte_val(old) |= _PAGE_UNUSED;
  195. }
  196. pgste = pgste_set_pte(ptep, pgste, new);
  197. pgste_set_unlock(ptep, pgste);
  198. } else {
  199. *ptep = new;
  200. }
  201. }
  202. pte_t ptep_xchg_direct(struct mm_struct *mm, unsigned long addr,
  203. pte_t *ptep, pte_t new)
  204. {
  205. pgste_t pgste;
  206. pte_t old;
  207. preempt_disable();
  208. pgste = ptep_xchg_start(mm, addr, ptep);
  209. old = ptep_flush_direct(mm, addr, ptep);
  210. ptep_xchg_commit(mm, addr, ptep, pgste, old, new);
  211. preempt_enable();
  212. return old;
  213. }
  214. EXPORT_SYMBOL(ptep_xchg_direct);
  215. pte_t ptep_xchg_lazy(struct mm_struct *mm, unsigned long addr,
  216. pte_t *ptep, pte_t new)
  217. {
  218. pgste_t pgste;
  219. pte_t old;
  220. preempt_disable();
  221. pgste = ptep_xchg_start(mm, addr, ptep);
  222. old = ptep_flush_lazy(mm, addr, ptep);
  223. ptep_xchg_commit(mm, addr, ptep, pgste, old, new);
  224. preempt_enable();
  225. return old;
  226. }
  227. EXPORT_SYMBOL(ptep_xchg_lazy);
  228. pte_t ptep_modify_prot_start(struct mm_struct *mm, unsigned long addr,
  229. pte_t *ptep)
  230. {
  231. pgste_t pgste;
  232. pte_t old;
  233. preempt_disable();
  234. pgste = ptep_xchg_start(mm, addr, ptep);
  235. old = ptep_flush_lazy(mm, addr, ptep);
  236. if (mm_has_pgste(mm)) {
  237. pgste = pgste_update_all(old, pgste, mm);
  238. pgste_set(ptep, pgste);
  239. }
  240. return old;
  241. }
  242. EXPORT_SYMBOL(ptep_modify_prot_start);
  243. void ptep_modify_prot_commit(struct mm_struct *mm, unsigned long addr,
  244. pte_t *ptep, pte_t pte)
  245. {
  246. pgste_t pgste;
  247. if (mm_has_pgste(mm)) {
  248. pgste = pgste_get(ptep);
  249. pgste_set_key(ptep, pgste, pte, mm);
  250. pgste = pgste_set_pte(ptep, pgste, pte);
  251. pgste_set_unlock(ptep, pgste);
  252. } else {
  253. *ptep = pte;
  254. }
  255. preempt_enable();
  256. }
  257. EXPORT_SYMBOL(ptep_modify_prot_commit);
  258. static inline pmd_t pmdp_flush_direct(struct mm_struct *mm,
  259. unsigned long addr, pmd_t *pmdp)
  260. {
  261. pmd_t old;
  262. old = *pmdp;
  263. if (pmd_val(old) & _SEGMENT_ENTRY_INVALID)
  264. return old;
  265. if (!MACHINE_HAS_IDTE) {
  266. __pmdp_csp(pmdp);
  267. return old;
  268. }
  269. atomic_inc(&mm->context.flush_count);
  270. if (MACHINE_HAS_TLB_LC &&
  271. cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
  272. __pmdp_idte(addr, pmdp, IDTE_LOCAL);
  273. else
  274. __pmdp_idte(addr, pmdp, IDTE_GLOBAL);
  275. atomic_dec(&mm->context.flush_count);
  276. return old;
  277. }
  278. static inline pmd_t pmdp_flush_lazy(struct mm_struct *mm,
  279. unsigned long addr, pmd_t *pmdp)
  280. {
  281. pmd_t old;
  282. old = *pmdp;
  283. if (pmd_val(old) & _SEGMENT_ENTRY_INVALID)
  284. return old;
  285. atomic_inc(&mm->context.flush_count);
  286. if (cpumask_equal(&mm->context.cpu_attach_mask,
  287. cpumask_of(smp_processor_id()))) {
  288. pmd_val(*pmdp) |= _SEGMENT_ENTRY_INVALID;
  289. mm->context.flush_mm = 1;
  290. } else if (MACHINE_HAS_IDTE)
  291. __pmdp_idte(addr, pmdp, IDTE_GLOBAL);
  292. else
  293. __pmdp_csp(pmdp);
  294. atomic_dec(&mm->context.flush_count);
  295. return old;
  296. }
  297. pmd_t pmdp_xchg_direct(struct mm_struct *mm, unsigned long addr,
  298. pmd_t *pmdp, pmd_t new)
  299. {
  300. pmd_t old;
  301. preempt_disable();
  302. old = pmdp_flush_direct(mm, addr, pmdp);
  303. *pmdp = new;
  304. preempt_enable();
  305. return old;
  306. }
  307. EXPORT_SYMBOL(pmdp_xchg_direct);
  308. pmd_t pmdp_xchg_lazy(struct mm_struct *mm, unsigned long addr,
  309. pmd_t *pmdp, pmd_t new)
  310. {
  311. pmd_t old;
  312. preempt_disable();
  313. old = pmdp_flush_lazy(mm, addr, pmdp);
  314. *pmdp = new;
  315. preempt_enable();
  316. return old;
  317. }
  318. EXPORT_SYMBOL(pmdp_xchg_lazy);
  319. static inline pud_t pudp_flush_direct(struct mm_struct *mm,
  320. unsigned long addr, pud_t *pudp)
  321. {
  322. pud_t old;
  323. old = *pudp;
  324. if (pud_val(old) & _REGION_ENTRY_INVALID)
  325. return old;
  326. if (!MACHINE_HAS_IDTE) {
  327. /*
  328. * Invalid bit position is the same for pmd and pud, so we can
  329. * re-use _pmd_csp() here
  330. */
  331. __pmdp_csp((pmd_t *) pudp);
  332. return old;
  333. }
  334. atomic_inc(&mm->context.flush_count);
  335. if (MACHINE_HAS_TLB_LC &&
  336. cpumask_equal(mm_cpumask(mm), cpumask_of(smp_processor_id())))
  337. __pudp_idte(addr, pudp, IDTE_LOCAL);
  338. else
  339. __pudp_idte(addr, pudp, IDTE_GLOBAL);
  340. atomic_dec(&mm->context.flush_count);
  341. return old;
  342. }
  343. pud_t pudp_xchg_direct(struct mm_struct *mm, unsigned long addr,
  344. pud_t *pudp, pud_t new)
  345. {
  346. pud_t old;
  347. preempt_disable();
  348. old = pudp_flush_direct(mm, addr, pudp);
  349. *pudp = new;
  350. preempt_enable();
  351. return old;
  352. }
  353. EXPORT_SYMBOL(pudp_xchg_direct);
  354. #ifdef CONFIG_TRANSPARENT_HUGEPAGE
  355. void pgtable_trans_huge_deposit(struct mm_struct *mm, pmd_t *pmdp,
  356. pgtable_t pgtable)
  357. {
  358. struct list_head *lh = (struct list_head *) pgtable;
  359. assert_spin_locked(pmd_lockptr(mm, pmdp));
  360. /* FIFO */
  361. if (!pmd_huge_pte(mm, pmdp))
  362. INIT_LIST_HEAD(lh);
  363. else
  364. list_add(lh, (struct list_head *) pmd_huge_pte(mm, pmdp));
  365. pmd_huge_pte(mm, pmdp) = pgtable;
  366. }
  367. pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm, pmd_t *pmdp)
  368. {
  369. struct list_head *lh;
  370. pgtable_t pgtable;
  371. pte_t *ptep;
  372. assert_spin_locked(pmd_lockptr(mm, pmdp));
  373. /* FIFO */
  374. pgtable = pmd_huge_pte(mm, pmdp);
  375. lh = (struct list_head *) pgtable;
  376. if (list_empty(lh))
  377. pmd_huge_pte(mm, pmdp) = NULL;
  378. else {
  379. pmd_huge_pte(mm, pmdp) = (pgtable_t) lh->next;
  380. list_del(lh);
  381. }
  382. ptep = (pte_t *) pgtable;
  383. pte_val(*ptep) = _PAGE_INVALID;
  384. ptep++;
  385. pte_val(*ptep) = _PAGE_INVALID;
  386. return pgtable;
  387. }
  388. #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
  389. #ifdef CONFIG_PGSTE
  390. void ptep_set_pte_at(struct mm_struct *mm, unsigned long addr,
  391. pte_t *ptep, pte_t entry)
  392. {
  393. pgste_t pgste;
  394. /* the mm_has_pgste() check is done in set_pte_at() */
  395. preempt_disable();
  396. pgste = pgste_get_lock(ptep);
  397. pgste_val(pgste) &= ~_PGSTE_GPS_ZERO;
  398. pgste_set_key(ptep, pgste, entry, mm);
  399. pgste = pgste_set_pte(ptep, pgste, entry);
  400. pgste_set_unlock(ptep, pgste);
  401. preempt_enable();
  402. }
  403. void ptep_set_notify(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
  404. {
  405. pgste_t pgste;
  406. preempt_disable();
  407. pgste = pgste_get_lock(ptep);
  408. pgste_val(pgste) |= PGSTE_IN_BIT;
  409. pgste_set_unlock(ptep, pgste);
  410. preempt_enable();
  411. }
  412. /**
  413. * ptep_force_prot - change access rights of a locked pte
  414. * @mm: pointer to the process mm_struct
  415. * @addr: virtual address in the guest address space
  416. * @ptep: pointer to the page table entry
  417. * @prot: indicates guest access rights: PROT_NONE, PROT_READ or PROT_WRITE
  418. * @bit: pgste bit to set (e.g. for notification)
  419. *
  420. * Returns 0 if the access rights were changed and -EAGAIN if the current
  421. * and requested access rights are incompatible.
  422. */
  423. int ptep_force_prot(struct mm_struct *mm, unsigned long addr,
  424. pte_t *ptep, int prot, unsigned long bit)
  425. {
  426. pte_t entry;
  427. pgste_t pgste;
  428. int pte_i, pte_p;
  429. pgste = pgste_get_lock(ptep);
  430. entry = *ptep;
  431. /* Check pte entry after all locks have been acquired */
  432. pte_i = pte_val(entry) & _PAGE_INVALID;
  433. pte_p = pte_val(entry) & _PAGE_PROTECT;
  434. if ((pte_i && (prot != PROT_NONE)) ||
  435. (pte_p && (prot & PROT_WRITE))) {
  436. pgste_set_unlock(ptep, pgste);
  437. return -EAGAIN;
  438. }
  439. /* Change access rights and set pgste bit */
  440. if (prot == PROT_NONE && !pte_i) {
  441. ptep_flush_direct(mm, addr, ptep);
  442. pgste = pgste_update_all(entry, pgste, mm);
  443. pte_val(entry) |= _PAGE_INVALID;
  444. }
  445. if (prot == PROT_READ && !pte_p) {
  446. ptep_flush_direct(mm, addr, ptep);
  447. pte_val(entry) &= ~_PAGE_INVALID;
  448. pte_val(entry) |= _PAGE_PROTECT;
  449. }
  450. pgste_val(pgste) |= bit;
  451. pgste = pgste_set_pte(ptep, pgste, entry);
  452. pgste_set_unlock(ptep, pgste);
  453. return 0;
  454. }
  455. int ptep_shadow_pte(struct mm_struct *mm, unsigned long saddr,
  456. pte_t *sptep, pte_t *tptep, pte_t pte)
  457. {
  458. pgste_t spgste, tpgste;
  459. pte_t spte, tpte;
  460. int rc = -EAGAIN;
  461. if (!(pte_val(*tptep) & _PAGE_INVALID))
  462. return 0; /* already shadowed */
  463. spgste = pgste_get_lock(sptep);
  464. spte = *sptep;
  465. if (!(pte_val(spte) & _PAGE_INVALID) &&
  466. !((pte_val(spte) & _PAGE_PROTECT) &&
  467. !(pte_val(pte) & _PAGE_PROTECT))) {
  468. pgste_val(spgste) |= PGSTE_VSIE_BIT;
  469. tpgste = pgste_get_lock(tptep);
  470. pte_val(tpte) = (pte_val(spte) & PAGE_MASK) |
  471. (pte_val(pte) & _PAGE_PROTECT);
  472. /* don't touch the storage key - it belongs to parent pgste */
  473. tpgste = pgste_set_pte(tptep, tpgste, tpte);
  474. pgste_set_unlock(tptep, tpgste);
  475. rc = 1;
  476. }
  477. pgste_set_unlock(sptep, spgste);
  478. return rc;
  479. }
  480. void ptep_unshadow_pte(struct mm_struct *mm, unsigned long saddr, pte_t *ptep)
  481. {
  482. pgste_t pgste;
  483. pgste = pgste_get_lock(ptep);
  484. /* notifier is called by the caller */
  485. ptep_flush_direct(mm, saddr, ptep);
  486. /* don't touch the storage key - it belongs to parent pgste */
  487. pgste = pgste_set_pte(ptep, pgste, __pte(_PAGE_INVALID));
  488. pgste_set_unlock(ptep, pgste);
  489. }
  490. static void ptep_zap_swap_entry(struct mm_struct *mm, swp_entry_t entry)
  491. {
  492. if (!non_swap_entry(entry))
  493. dec_mm_counter(mm, MM_SWAPENTS);
  494. else if (is_migration_entry(entry)) {
  495. struct page *page = migration_entry_to_page(entry);
  496. dec_mm_counter(mm, mm_counter(page));
  497. }
  498. free_swap_and_cache(entry);
  499. }
  500. void ptep_zap_unused(struct mm_struct *mm, unsigned long addr,
  501. pte_t *ptep, int reset)
  502. {
  503. unsigned long pgstev;
  504. pgste_t pgste;
  505. pte_t pte;
  506. /* Zap unused and logically-zero pages */
  507. preempt_disable();
  508. pgste = pgste_get_lock(ptep);
  509. pgstev = pgste_val(pgste);
  510. pte = *ptep;
  511. if (!reset && pte_swap(pte) &&
  512. ((pgstev & _PGSTE_GPS_USAGE_MASK) == _PGSTE_GPS_USAGE_UNUSED ||
  513. (pgstev & _PGSTE_GPS_ZERO))) {
  514. ptep_zap_swap_entry(mm, pte_to_swp_entry(pte));
  515. pte_clear(mm, addr, ptep);
  516. }
  517. if (reset)
  518. pgste_val(pgste) &= ~_PGSTE_GPS_USAGE_MASK;
  519. pgste_set_unlock(ptep, pgste);
  520. preempt_enable();
  521. }
  522. void ptep_zap_key(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
  523. {
  524. unsigned long ptev;
  525. pgste_t pgste;
  526. /* Clear storage key */
  527. preempt_disable();
  528. pgste = pgste_get_lock(ptep);
  529. pgste_val(pgste) &= ~(PGSTE_ACC_BITS | PGSTE_FP_BIT |
  530. PGSTE_GR_BIT | PGSTE_GC_BIT);
  531. ptev = pte_val(*ptep);
  532. if (!(ptev & _PAGE_INVALID) && (ptev & _PAGE_WRITE))
  533. page_set_storage_key(ptev & PAGE_MASK, PAGE_DEFAULT_KEY, 1);
  534. pgste_set_unlock(ptep, pgste);
  535. preempt_enable();
  536. }
  537. /*
  538. * Test and reset if a guest page is dirty
  539. */
  540. bool test_and_clear_guest_dirty(struct mm_struct *mm, unsigned long addr)
  541. {
  542. spinlock_t *ptl;
  543. pgste_t pgste;
  544. pte_t *ptep;
  545. pte_t pte;
  546. bool dirty;
  547. ptep = get_locked_pte(mm, addr, &ptl);
  548. if (unlikely(!ptep))
  549. return false;
  550. pgste = pgste_get_lock(ptep);
  551. dirty = !!(pgste_val(pgste) & PGSTE_UC_BIT);
  552. pgste_val(pgste) &= ~PGSTE_UC_BIT;
  553. pte = *ptep;
  554. if (dirty && (pte_val(pte) & _PAGE_PRESENT)) {
  555. pgste = pgste_pte_notify(mm, addr, ptep, pgste);
  556. __ptep_ipte(addr, ptep, IPTE_GLOBAL);
  557. if (MACHINE_HAS_ESOP || !(pte_val(pte) & _PAGE_WRITE))
  558. pte_val(pte) |= _PAGE_PROTECT;
  559. else
  560. pte_val(pte) |= _PAGE_INVALID;
  561. *ptep = pte;
  562. }
  563. pgste_set_unlock(ptep, pgste);
  564. spin_unlock(ptl);
  565. return dirty;
  566. }
  567. EXPORT_SYMBOL_GPL(test_and_clear_guest_dirty);
  568. int set_guest_storage_key(struct mm_struct *mm, unsigned long addr,
  569. unsigned char key, bool nq)
  570. {
  571. unsigned long keyul;
  572. spinlock_t *ptl;
  573. pgste_t old, new;
  574. pte_t *ptep;
  575. ptep = get_locked_pte(mm, addr, &ptl);
  576. if (unlikely(!ptep))
  577. return -EFAULT;
  578. new = old = pgste_get_lock(ptep);
  579. pgste_val(new) &= ~(PGSTE_GR_BIT | PGSTE_GC_BIT |
  580. PGSTE_ACC_BITS | PGSTE_FP_BIT);
  581. keyul = (unsigned long) key;
  582. pgste_val(new) |= (keyul & (_PAGE_CHANGED | _PAGE_REFERENCED)) << 48;
  583. pgste_val(new) |= (keyul & (_PAGE_ACC_BITS | _PAGE_FP_BIT)) << 56;
  584. if (!(pte_val(*ptep) & _PAGE_INVALID)) {
  585. unsigned long address, bits, skey;
  586. address = pte_val(*ptep) & PAGE_MASK;
  587. skey = (unsigned long) page_get_storage_key(address);
  588. bits = skey & (_PAGE_CHANGED | _PAGE_REFERENCED);
  589. skey = key & (_PAGE_ACC_BITS | _PAGE_FP_BIT);
  590. /* Set storage key ACC and FP */
  591. page_set_storage_key(address, skey, !nq);
  592. /* Merge host changed & referenced into pgste */
  593. pgste_val(new) |= bits << 52;
  594. }
  595. /* changing the guest storage key is considered a change of the page */
  596. if ((pgste_val(new) ^ pgste_val(old)) &
  597. (PGSTE_ACC_BITS | PGSTE_FP_BIT | PGSTE_GR_BIT | PGSTE_GC_BIT))
  598. pgste_val(new) |= PGSTE_UC_BIT;
  599. pgste_set_unlock(ptep, new);
  600. pte_unmap_unlock(ptep, ptl);
  601. return 0;
  602. }
  603. EXPORT_SYMBOL(set_guest_storage_key);
  604. /**
  605. * Conditionally set a guest storage key (handling csske).
  606. * oldkey will be updated when either mr or mc is set and a pointer is given.
  607. *
  608. * Returns 0 if a guests storage key update wasn't necessary, 1 if the guest
  609. * storage key was updated and -EFAULT on access errors.
  610. */
  611. int cond_set_guest_storage_key(struct mm_struct *mm, unsigned long addr,
  612. unsigned char key, unsigned char *oldkey,
  613. bool nq, bool mr, bool mc)
  614. {
  615. unsigned char tmp, mask = _PAGE_ACC_BITS | _PAGE_FP_BIT;
  616. int rc;
  617. /* we can drop the pgste lock between getting and setting the key */
  618. if (mr | mc) {
  619. rc = get_guest_storage_key(current->mm, addr, &tmp);
  620. if (rc)
  621. return rc;
  622. if (oldkey)
  623. *oldkey = tmp;
  624. if (!mr)
  625. mask |= _PAGE_REFERENCED;
  626. if (!mc)
  627. mask |= _PAGE_CHANGED;
  628. if (!((tmp ^ key) & mask))
  629. return 0;
  630. }
  631. rc = set_guest_storage_key(current->mm, addr, key, nq);
  632. return rc < 0 ? rc : 1;
  633. }
  634. EXPORT_SYMBOL(cond_set_guest_storage_key);
  635. /**
  636. * Reset a guest reference bit (rrbe), returning the reference and changed bit.
  637. *
  638. * Returns < 0 in case of error, otherwise the cc to be reported to the guest.
  639. */
  640. int reset_guest_reference_bit(struct mm_struct *mm, unsigned long addr)
  641. {
  642. spinlock_t *ptl;
  643. pgste_t old, new;
  644. pte_t *ptep;
  645. int cc = 0;
  646. ptep = get_locked_pte(mm, addr, &ptl);
  647. if (unlikely(!ptep))
  648. return -EFAULT;
  649. new = old = pgste_get_lock(ptep);
  650. /* Reset guest reference bit only */
  651. pgste_val(new) &= ~PGSTE_GR_BIT;
  652. if (!(pte_val(*ptep) & _PAGE_INVALID)) {
  653. cc = page_reset_referenced(pte_val(*ptep) & PAGE_MASK);
  654. /* Merge real referenced bit into host-set */
  655. pgste_val(new) |= ((unsigned long) cc << 53) & PGSTE_HR_BIT;
  656. }
  657. /* Reflect guest's logical view, not physical */
  658. cc |= (pgste_val(old) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 49;
  659. /* Changing the guest storage key is considered a change of the page */
  660. if ((pgste_val(new) ^ pgste_val(old)) & PGSTE_GR_BIT)
  661. pgste_val(new) |= PGSTE_UC_BIT;
  662. pgste_set_unlock(ptep, new);
  663. pte_unmap_unlock(ptep, ptl);
  664. return 0;
  665. }
  666. EXPORT_SYMBOL(reset_guest_reference_bit);
  667. int get_guest_storage_key(struct mm_struct *mm, unsigned long addr,
  668. unsigned char *key)
  669. {
  670. spinlock_t *ptl;
  671. pgste_t pgste;
  672. pte_t *ptep;
  673. ptep = get_locked_pte(mm, addr, &ptl);
  674. if (unlikely(!ptep))
  675. return -EFAULT;
  676. pgste = pgste_get_lock(ptep);
  677. *key = (pgste_val(pgste) & (PGSTE_ACC_BITS | PGSTE_FP_BIT)) >> 56;
  678. if (!(pte_val(*ptep) & _PAGE_INVALID))
  679. *key = page_get_storage_key(pte_val(*ptep) & PAGE_MASK);
  680. /* Reflect guest's logical view, not physical */
  681. *key |= (pgste_val(pgste) & (PGSTE_GR_BIT | PGSTE_GC_BIT)) >> 48;
  682. pgste_set_unlock(ptep, pgste);
  683. pte_unmap_unlock(ptep, ptl);
  684. return 0;
  685. }
  686. EXPORT_SYMBOL(get_guest_storage_key);
  687. #endif