pgtable.h

/* SPDX-License-Identifier: GPL-2.0 */
#ifndef _ASM_POWERPC_BOOK3S_64_PGTABLE_H_
#define _ASM_POWERPC_BOOK3S_64_PGTABLE_H_

#include <asm-generic/5level-fixup.h>

#ifndef __ASSEMBLY__
#include <linux/mmdebug.h>
#include <linux/bug.h>
#endif

/*
 * Common bits between hash and Radix page table
 */
#define _PAGE_BIT_SWAP_TYPE	0

#define _PAGE_NA		0
#define _PAGE_RO		0
#define _PAGE_USER		0

#define _PAGE_EXEC		0x00001 /* execute permission */
#define _PAGE_WRITE		0x00002 /* write access allowed */
#define _PAGE_READ		0x00004 /* read access allowed */
#define _PAGE_RW		(_PAGE_READ | _PAGE_WRITE)
#define _PAGE_RWX		(_PAGE_READ | _PAGE_WRITE | _PAGE_EXEC)
#define _PAGE_PRIVILEGED	0x00008 /* kernel access only */
#define _PAGE_SAO		0x00010 /* Strong access order */
#define _PAGE_NON_IDEMPOTENT	0x00020 /* non idempotent memory */
#define _PAGE_TOLERANT		0x00030 /* tolerant memory, cache inhibited */
#define _PAGE_DIRTY		0x00080 /* C: page changed */
#define _PAGE_ACCESSED		0x00100 /* R: page referenced */
/*
 * Software bits
 */
#define _RPAGE_SW0		0x2000000000000000UL
#define _RPAGE_SW1		0x00800
#define _RPAGE_SW2		0x00400
#define _RPAGE_SW3		0x00200
#define _RPAGE_RSV1		0x1000000000000000UL
#define _RPAGE_RSV2		0x0800000000000000UL
#define _RPAGE_RSV3		0x0400000000000000UL
#define _RPAGE_RSV4		0x0200000000000000UL
#define _RPAGE_RSV5		0x00040UL

#define _PAGE_PTE		0x4000000000000000UL	/* distinguishes PTEs from pointers */
#define _PAGE_PRESENT		0x8000000000000000UL	/* pte contains a translation */
/*
 * We need to mark a pmd pte invalid while splitting. We can do that by
 * clearing the _PAGE_PRESENT bit. But then that will be taken as a swap
 * pte. In order to differentiate between the two, we use a software field
 * when invalidating.
 *
 * We also do this temporary invalidation of a regular pte in
 * ptep_set_access_flags.
 *
 * This is used only when _PAGE_PRESENT is cleared.
 */
#define _PAGE_INVALID		_RPAGE_SW0

/*
 * Top and bottom bits of RPN which can be used by hash
 * translation mode, because we expect them to be zero
 * otherwise.
 */
#define _RPAGE_RPN0		0x01000
#define _RPAGE_RPN1		0x02000
#define _RPAGE_RPN44		0x0100000000000000UL
#define _RPAGE_RPN43		0x0080000000000000UL
#define _RPAGE_RPN42		0x0040000000000000UL
#define _RPAGE_RPN41		0x0020000000000000UL

/* Max physical address bit as per radix table */
#define _RPAGE_PA_MAX		57
/*
 * Max physical address bit we will use for now.
 *
 * This is mostly a hardware limitation and for now Power9 has
 * a 51 bit limit.
 *
 * This is different from the number of physical bits required to address
 * the last byte of memory. That is defined by MAX_PHYSMEM_BITS.
 * MAX_PHYSMEM_BITS is a Linux limitation imposed by the maximum
 * number of sections we can support (SECTIONS_SHIFT).
 *
 * This is different from the Radix page table limitation above and
 * should always be less than that. The limit is chosen such that
 * we can overload the bits between _RPAGE_PA_MAX and _PAGE_PA_MAX
 * for hash Linux page table specific bits.
 *
 * In order to be compatible with future hardware generations we keep
 * some offsets and limit this for now to 53.
 */
#define _PAGE_PA_MAX		53
#define _PAGE_SOFT_DIRTY	_RPAGE_SW3 /* software: software dirty tracking */
#define _PAGE_SPECIAL		_RPAGE_SW2 /* software: special page */
#define _PAGE_DEVMAP		_RPAGE_SW1 /* software: ZONE_DEVICE page */
#define __HAVE_ARCH_PTE_DEVMAP
/*
 * Drivers request cache-inhibited pte mappings using _PAGE_NO_CACHE.
 * Instead of fixing all of them, add an alternate define which
 * maps to a CI pte mapping.
 */
#define _PAGE_NO_CACHE		_PAGE_TOLERANT
/*
 * We support a _RPAGE_PA_MAX-bit real address in the pte. On the Linux
 * side we are limited by _PAGE_PA_MAX. Clear everything above
 * _PAGE_PA_MAX and everything below PAGE_SHIFT.
 */
#define PTE_RPN_MASK	(((1UL << _PAGE_PA_MAX) - 1) & (PAGE_MASK))
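
/*
 * Editor's note, a worked example (not part of the original header): with
 * a 64K base page size (PAGE_SHIFT == 16) and _PAGE_PA_MAX == 53,
 * PTE_RPN_MASK keeps pte bits 16..52, i.e. exactly the real page number:
 *
 *	unsigned long phys = pte_val(pte) & PTE_RPN_MASK;
 *	unsigned long pfn  = phys >> PAGE_SHIFT;
 */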
/*
 * Set of bits not changed in pmd_modify. Even though we have hash specific bits
 * in here, on radix we expect them to be zero.
 */
#define _HPAGE_CHG_MASK (PTE_RPN_MASK | _PAGE_HPTEFLAGS | _PAGE_DIRTY |	\
			 _PAGE_ACCESSED | H_PAGE_THP_HUGE | _PAGE_PTE |	\
			 _PAGE_SOFT_DIRTY)
/*
 * user access blocked by key
 */
#define _PAGE_KERNEL_RW		(_PAGE_PRIVILEGED | _PAGE_RW | _PAGE_DIRTY)
#define _PAGE_KERNEL_RO		(_PAGE_PRIVILEGED | _PAGE_READ)
#define _PAGE_KERNEL_RWX	(_PAGE_PRIVILEGED | _PAGE_DIRTY |	\
				 _PAGE_RW | _PAGE_EXEC)
/*
 * No page size encoding in the linux PTE
 */
#define _PAGE_PSIZE		0
/*
 * _PAGE_CHG_MASK masks of bits that are to be preserved across
 * pgprot changes
 */
#define _PAGE_CHG_MASK	(PTE_RPN_MASK | _PAGE_HPTEFLAGS | _PAGE_DIRTY |	\
			 _PAGE_ACCESSED | _PAGE_SPECIAL | _PAGE_PTE |	\
			 _PAGE_SOFT_DIRTY)

#define H_PTE_PKEY  (H_PTE_PKEY_BIT0 | H_PTE_PKEY_BIT1 | H_PTE_PKEY_BIT2 |	\
		     H_PTE_PKEY_BIT3 | H_PTE_PKEY_BIT4)
/*
 * Mask of bits returned by pte_pgprot()
 */
#define PAGE_PROT_BITS  (_PAGE_SAO | _PAGE_NON_IDEMPOTENT | _PAGE_TOLERANT |	\
			 H_PAGE_4K_PFN | _PAGE_PRIVILEGED | _PAGE_ACCESSED |	\
			 _PAGE_READ | _PAGE_WRITE | _PAGE_DIRTY | _PAGE_EXEC |	\
			 _PAGE_SOFT_DIRTY | H_PTE_PKEY)
/*
 * We define 2 sets of base prot bits, one for basic pages (ie,
 * cacheable kernel and user pages) and one for non cacheable
 * pages. We always set _PAGE_COHERENT when SMP is enabled or
 * the processor might need it for DMA coherency.
 */
#define _PAGE_BASE_NC	(_PAGE_PRESENT | _PAGE_ACCESSED | _PAGE_PSIZE)
#define _PAGE_BASE	(_PAGE_BASE_NC)

/* Permission masks used to generate the __P and __S table,
 *
 * Note: __pgprot is defined in arch/powerpc/include/asm/page.h
 *
 * Write permissions imply read permissions for now (we could make write-only
 * pages on BookE but we don't bother for now). Execute permission control is
 * possible on platforms that define _PAGE_EXEC.
 *
 * Note: due to the way vm flags are laid out, the bits are XWR
 */
#define PAGE_NONE	__pgprot(_PAGE_BASE | _PAGE_PRIVILEGED)
#define PAGE_SHARED	__pgprot(_PAGE_BASE | _PAGE_RW)
#define PAGE_SHARED_X	__pgprot(_PAGE_BASE | _PAGE_RW | _PAGE_EXEC)
#define PAGE_COPY	__pgprot(_PAGE_BASE | _PAGE_READ)
#define PAGE_COPY_X	__pgprot(_PAGE_BASE | _PAGE_READ | _PAGE_EXEC)
#define PAGE_READONLY	__pgprot(_PAGE_BASE | _PAGE_READ)
#define PAGE_READONLY_X	__pgprot(_PAGE_BASE | _PAGE_READ | _PAGE_EXEC)

#define __P000	PAGE_NONE
#define __P001	PAGE_READONLY
#define __P010	PAGE_COPY
#define __P011	PAGE_COPY
#define __P100	PAGE_READONLY_X
#define __P101	PAGE_READONLY_X
#define __P110	PAGE_COPY_X
#define __P111	PAGE_COPY_X

#define __S000	PAGE_NONE
#define __S001	PAGE_READONLY
#define __S010	PAGE_SHARED
#define __S011	PAGE_SHARED
#define __S100	PAGE_READONLY_X
#define __S101	PAGE_READONLY_X
#define __S110	PAGE_SHARED_X
#define __S111	PAGE_SHARED_X

/* Permission masks used for kernel mappings */
#define PAGE_KERNEL	__pgprot(_PAGE_BASE | _PAGE_KERNEL_RW)
#define PAGE_KERNEL_NC	__pgprot(_PAGE_BASE_NC | _PAGE_KERNEL_RW |	\
				 _PAGE_TOLERANT)
#define PAGE_KERNEL_NCG	__pgprot(_PAGE_BASE_NC | _PAGE_KERNEL_RW |	\
				 _PAGE_NON_IDEMPOTENT)
#define PAGE_KERNEL_X	__pgprot(_PAGE_BASE | _PAGE_KERNEL_RWX)
#define PAGE_KERNEL_RO	__pgprot(_PAGE_BASE | _PAGE_KERNEL_RO)
#define PAGE_KERNEL_ROX	__pgprot(_PAGE_BASE | _PAGE_KERNEL_ROX)

/*
 * Protection used for kernel text. We want the debuggers to be able to
 * set breakpoints anywhere, so don't write protect the kernel text
 * on platforms where such control is possible.
 */
#if defined(CONFIG_KGDB) || defined(CONFIG_XMON) || defined(CONFIG_BDI_SWITCH) || \
	defined(CONFIG_KPROBES) || defined(CONFIG_DYNAMIC_FTRACE)
#define PAGE_KERNEL_TEXT	PAGE_KERNEL_X
#else
#define PAGE_KERNEL_TEXT	PAGE_KERNEL_ROX
#endif
/* Make module code happy. We don't set RO yet */
#define PAGE_KERNEL_EXEC	PAGE_KERNEL_X
#define PAGE_AGP		(PAGE_KERNEL_NC)

#ifndef __ASSEMBLY__
/*
 * page table defines
 */
extern unsigned long __pte_index_size;
extern unsigned long __pmd_index_size;
extern unsigned long __pud_index_size;
extern unsigned long __pgd_index_size;
extern unsigned long __pud_cache_index;
#define PTE_INDEX_SIZE  __pte_index_size
#define PMD_INDEX_SIZE  __pmd_index_size
#define PUD_INDEX_SIZE  __pud_index_size
#define PGD_INDEX_SIZE  __pgd_index_size
/* pmd tables use page table fragments */
#define PMD_CACHE_INDEX	0
#define PUD_CACHE_INDEX	__pud_cache_index
/*
 * Because of the use of pte fragments and THP, the sizes of the page
 * tables are not always derived from the index sizes above.
 */
extern unsigned long __pte_table_size;
extern unsigned long __pmd_table_size;
extern unsigned long __pud_table_size;
extern unsigned long __pgd_table_size;
#define PTE_TABLE_SIZE	__pte_table_size
#define PMD_TABLE_SIZE	__pmd_table_size
#define PUD_TABLE_SIZE	__pud_table_size
#define PGD_TABLE_SIZE	__pgd_table_size

extern unsigned long __pmd_val_bits;
extern unsigned long __pud_val_bits;
extern unsigned long __pgd_val_bits;
#define PMD_VAL_BITS	__pmd_val_bits
#define PUD_VAL_BITS	__pud_val_bits
#define PGD_VAL_BITS	__pgd_val_bits

extern unsigned long __pte_frag_nr;
#define PTE_FRAG_NR	__pte_frag_nr
extern unsigned long __pte_frag_size_shift;
#define PTE_FRAG_SIZE_SHIFT	__pte_frag_size_shift
#define PTE_FRAG_SIZE	(1UL << PTE_FRAG_SIZE_SHIFT)

extern unsigned long __pmd_frag_nr;
#define PMD_FRAG_NR	__pmd_frag_nr
extern unsigned long __pmd_frag_size_shift;
#define PMD_FRAG_SIZE_SHIFT	__pmd_frag_size_shift
#define PMD_FRAG_SIZE	(1UL << PMD_FRAG_SIZE_SHIFT)

#define PTRS_PER_PTE	(1 << PTE_INDEX_SIZE)
#define PTRS_PER_PMD	(1 << PMD_INDEX_SIZE)
#define PTRS_PER_PUD	(1 << PUD_INDEX_SIZE)
#define PTRS_PER_PGD	(1 << PGD_INDEX_SIZE)

/* PMD_SHIFT determines what a second-level page table entry can map */
#define PMD_SHIFT	(PAGE_SHIFT + PTE_INDEX_SIZE)
#define PMD_SIZE	(1UL << PMD_SHIFT)
#define PMD_MASK	(~(PMD_SIZE-1))

/* PUD_SHIFT determines what a third-level page table entry can map */
#define PUD_SHIFT	(PMD_SHIFT + PMD_INDEX_SIZE)
#define PUD_SIZE	(1UL << PUD_SHIFT)
#define PUD_MASK	(~(PUD_SIZE-1))

/* PGDIR_SHIFT determines what a fourth-level page table entry can map */
#define PGDIR_SHIFT	(PUD_SHIFT + PUD_INDEX_SIZE)
#define PGDIR_SIZE	(1UL << PGDIR_SHIFT)
#define PGDIR_MASK	(~(PGDIR_SIZE-1))

/* Bits to mask out from a PMD to get to the PTE page */
#define PMD_MASKED_BITS		0xc0000000000000ffUL
/* Bits to mask out from a PUD to get to the PMD page */
#define PUD_MASKED_BITS		0xc0000000000000ffUL
/* Bits to mask out from a PGD to get to the PUD page */
#define PGD_MASKED_BITS		0xc0000000000000ffUL

/*
 * Used as an indicator for rcu callback functions
 */
enum pgtable_index {
	PTE_INDEX = 0,
	PMD_INDEX,
	PUD_INDEX,
	PGD_INDEX,
	/*
	 * Below are used with 4k page size and hugetlb
	 */
	HTLB_16M_INDEX,
	HTLB_16G_INDEX,
};

extern unsigned long __vmalloc_start;
extern unsigned long __vmalloc_end;
#define VMALLOC_START	__vmalloc_start
#define VMALLOC_END	__vmalloc_end

extern unsigned long __kernel_virt_start;
extern unsigned long __kernel_virt_size;
extern unsigned long __kernel_io_start;
#define KERN_VIRT_START __kernel_virt_start
#define KERN_VIRT_SIZE  __kernel_virt_size
#define KERN_IO_START   __kernel_io_start

extern struct page *vmemmap;
extern unsigned long ioremap_bot;
extern unsigned long pci_io_base;
#endif /* __ASSEMBLY__ */

#include <asm/book3s/64/hash.h>
#include <asm/book3s/64/radix.h>

#ifdef CONFIG_PPC_64K_PAGES
#include <asm/book3s/64/pgtable-64k.h>
#else
#include <asm/book3s/64/pgtable-4k.h>
#endif

#include <asm/barrier.h>
/*
 * The second half of the kernel virtual space is used for IO mappings;
 * it is itself carved into the PIO region (ISA and PHB IO space) and
 * the ioremap space.
 *
 *  ISA_IO_BASE = KERN_IO_START, 64K reserved area
 *  PHB_IO_BASE = ISA_IO_BASE + 64K to ISA_IO_BASE + 2G, PHB IO spaces
 *  IOREMAP_BASE = ISA_IO_BASE + 2G to VMALLOC_START + PGTABLE_RANGE
 */
#define FULL_IO_SIZE	0x80000000ul
#define  ISA_IO_BASE	(KERN_IO_START)
#define  ISA_IO_END	(KERN_IO_START + 0x10000ul)
#define  PHB_IO_BASE	(ISA_IO_END)
#define  PHB_IO_END	(KERN_IO_START + FULL_IO_SIZE)
#define IOREMAP_BASE	(PHB_IO_END)
#define IOREMAP_END	(KERN_VIRT_START + KERN_VIRT_SIZE)

/* Advertise special mapping type for AGP */
#define HAVE_PAGE_AGP

#ifndef __ASSEMBLY__
/*
 * This is the default implementation of various PTE accessors. It is
 * used in all cases except Book3S with 64K pages, where we have a
 * concept of sub-pages.
 */
#ifndef __real_pte
#define __real_pte(e, p, o)	((real_pte_t){(e)})
#define __rpte_to_pte(r)	((r).pte)
#define __rpte_to_hidx(r, index)	(pte_val(__rpte_to_pte(r)) >> H_PAGE_F_GIX_SHIFT)

#define pte_iterate_hashed_subpages(rpte, psize, va, index, shift)	\
	do {								\
		index = 0;						\
		shift = mmu_psize_defs[psize].shift;			\

#define pte_iterate_hashed_end() } while(0)

/*
 * We expect this to be called only for user addresses or kernel virtual
 * addresses other than the linear mapping.
 */
#define pte_pagesize_index(mm, addr, pte)	MMU_PAGE_4K

#endif /* __real_pte */

static inline unsigned long pte_update(struct mm_struct *mm, unsigned long addr,
				       pte_t *ptep, unsigned long clr,
				       unsigned long set, int huge)
{
	if (radix_enabled())
		return radix__pte_update(mm, addr, ptep, clr, set, huge);
	return hash__pte_update(mm, addr, ptep, clr, set, huge);
}
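
/*
 * Editor's sketch (not part of the original header): the accessors below
 * are thin wrappers around pte_update(). For example, clearing the
 * referenced bit of a regular (non-huge) pte while fetching the old value:
 *
 *	old = pte_update(mm, addr, ptep, _PAGE_ACCESSED, 0, 0);
 *	young = (old & _PAGE_ACCESSED) != 0;
 *
 * which is exactly what __ptep_test_and_clear_young() below does.
 */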
/*
 * For hash, even if we have _PAGE_ACCESSED = 0, we do a pte_update.
 * We currently remove entries from the hashtable regardless of whether
 * the entry was young or dirty.
 *
 * We should be more intelligent about this, but for the moment we override
 * these functions and force a tlb flush unconditionally.
 *
 * For radix: H_PAGE_HASHPTE should be zero. Hence we can use the same
 * function for both hash and radix.
 */
static inline int __ptep_test_and_clear_young(struct mm_struct *mm,
					      unsigned long addr, pte_t *ptep)
{
	unsigned long old;

	if ((pte_raw(*ptep) & cpu_to_be64(_PAGE_ACCESSED | H_PAGE_HASHPTE)) == 0)
		return 0;
	old = pte_update(mm, addr, ptep, _PAGE_ACCESSED, 0, 0);
	return (old & _PAGE_ACCESSED) != 0;
}

#define __HAVE_ARCH_PTEP_TEST_AND_CLEAR_YOUNG
#define ptep_test_and_clear_young(__vma, __addr, __ptep)	\
({								\
	int __r;						\
	__r = __ptep_test_and_clear_young((__vma)->vm_mm, __addr, __ptep); \
	__r;							\
})

static inline int __pte_write(pte_t pte)
{
	return !!(pte_raw(pte) & cpu_to_be64(_PAGE_WRITE));
}

#ifdef CONFIG_NUMA_BALANCING
#define pte_savedwrite pte_savedwrite
static inline bool pte_savedwrite(pte_t pte)
{
	/*
	 * Saved write ptes are prot none ptes that don't have the
	 * privileged bit set. We mark prot none as one which has
	 * present and privileged bits set and RWX cleared. To mark
	 * protnone which used to have _PAGE_WRITE set we clear
	 * the privileged bit.
	 */
	return !(pte_raw(pte) & cpu_to_be64(_PAGE_RWX | _PAGE_PRIVILEGED));
}
#else
#define pte_savedwrite pte_savedwrite
static inline bool pte_savedwrite(pte_t pte)
{
	return false;
}
#endif

static inline int pte_write(pte_t pte)
{
	return __pte_write(pte) || pte_savedwrite(pte);
}

static inline int pte_read(pte_t pte)
{
	return !!(pte_raw(pte) & cpu_to_be64(_PAGE_READ));
}

#define __HAVE_ARCH_PTEP_SET_WRPROTECT
static inline void ptep_set_wrprotect(struct mm_struct *mm, unsigned long addr,
				      pte_t *ptep)
{
	if (__pte_write(*ptep))
		pte_update(mm, addr, ptep, _PAGE_WRITE, 0, 0);
	else if (unlikely(pte_savedwrite(*ptep)))
		pte_update(mm, addr, ptep, 0, _PAGE_PRIVILEGED, 0);
}

static inline void huge_ptep_set_wrprotect(struct mm_struct *mm,
					   unsigned long addr, pte_t *ptep)
{
	/*
	 * We should not find protnone for hugetlb, but this completes the
	 * interface.
	 */
	if (__pte_write(*ptep))
		pte_update(mm, addr, ptep, _PAGE_WRITE, 0, 1);
	else if (unlikely(pte_savedwrite(*ptep)))
		pte_update(mm, addr, ptep, 0, _PAGE_PRIVILEGED, 1);
}

#define __HAVE_ARCH_PTEP_GET_AND_CLEAR
static inline pte_t ptep_get_and_clear(struct mm_struct *mm,
				       unsigned long addr, pte_t *ptep)
{
	unsigned long old = pte_update(mm, addr, ptep, ~0UL, 0, 0);
	return __pte(old);
}

#define __HAVE_ARCH_PTEP_GET_AND_CLEAR_FULL
static inline pte_t ptep_get_and_clear_full(struct mm_struct *mm,
					    unsigned long addr,
					    pte_t *ptep, int full)
{
	if (full && radix_enabled()) {
		/*
		 * We know that this is a full mm pte clear and
		 * hence can be sure there is no parallel set_pte.
		 */
		return radix__ptep_get_and_clear_full(mm, addr, ptep, full);
	}
	return ptep_get_and_clear(mm, addr, ptep);
}

static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
			     pte_t *ptep)
{
	pte_update(mm, addr, ptep, ~0UL, 0, 0);
}

static inline int pte_dirty(pte_t pte)
{
	return !!(pte_raw(pte) & cpu_to_be64(_PAGE_DIRTY));
}

static inline int pte_young(pte_t pte)
{
	return !!(pte_raw(pte) & cpu_to_be64(_PAGE_ACCESSED));
}

static inline int pte_special(pte_t pte)
{
	return !!(pte_raw(pte) & cpu_to_be64(_PAGE_SPECIAL));
}

static inline pgprot_t pte_pgprot(pte_t pte)
{
	return __pgprot(pte_val(pte) & PAGE_PROT_BITS);
}

#ifdef CONFIG_HAVE_ARCH_SOFT_DIRTY
static inline bool pte_soft_dirty(pte_t pte)
{
	return !!(pte_raw(pte) & cpu_to_be64(_PAGE_SOFT_DIRTY));
}

static inline pte_t pte_mksoft_dirty(pte_t pte)
{
	return __pte(pte_val(pte) | _PAGE_SOFT_DIRTY);
}

static inline pte_t pte_clear_soft_dirty(pte_t pte)
{
	return __pte(pte_val(pte) & ~_PAGE_SOFT_DIRTY);
}
#endif /* CONFIG_HAVE_ARCH_SOFT_DIRTY */

#ifdef CONFIG_NUMA_BALANCING
static inline int pte_protnone(pte_t pte)
{
	return (pte_raw(pte) & cpu_to_be64(_PAGE_PRESENT | _PAGE_PTE | _PAGE_RWX)) ==
		cpu_to_be64(_PAGE_PRESENT | _PAGE_PTE);
}

#define pte_mk_savedwrite pte_mk_savedwrite
static inline pte_t pte_mk_savedwrite(pte_t pte)
{
	/*
	 * Used by the Autonuma subsystem to preserve the write bit
	 * while marking the pte PROT_NONE. Only allow this
	 * on a PROT_NONE pte.
	 */
	VM_BUG_ON((pte_raw(pte) & cpu_to_be64(_PAGE_PRESENT | _PAGE_RWX | _PAGE_PRIVILEGED)) !=
		  cpu_to_be64(_PAGE_PRESENT | _PAGE_PRIVILEGED));
	return __pte(pte_val(pte) & ~_PAGE_PRIVILEGED);
}

#define pte_clear_savedwrite pte_clear_savedwrite
static inline pte_t pte_clear_savedwrite(pte_t pte)
{
	/*
	 * Used by KSM subsystem to make a protnone pte readonly.
	 */
	VM_BUG_ON(!pte_protnone(pte));
	return __pte(pte_val(pte) | _PAGE_PRIVILEGED);
}
#else
#define pte_clear_savedwrite pte_clear_savedwrite
static inline pte_t pte_clear_savedwrite(pte_t pte)
{
	VM_WARN_ON(1);
	return __pte(pte_val(pte) & ~_PAGE_WRITE);
}
#endif /* CONFIG_NUMA_BALANCING */

static inline int pte_present(pte_t pte)
{
	/*
	 * A pte is considered present if _PAGE_PRESENT is set.
	 * We also need to consider a pte present which is marked
	 * invalid during ptep_set_access_flags. Hence we look for _PAGE_INVALID
	 * if we find _PAGE_PRESENT cleared.
	 */
	return !!(pte_raw(pte) & cpu_to_be64(_PAGE_PRESENT | _PAGE_INVALID));
}

#ifdef CONFIG_PPC_MEM_KEYS
extern bool arch_pte_access_permitted(u64 pte, bool write, bool execute);
#else
static inline bool arch_pte_access_permitted(u64 pte, bool write, bool execute)
{
	return true;
}
#endif /* CONFIG_PPC_MEM_KEYS */

#define pte_access_permitted pte_access_permitted
static inline bool pte_access_permitted(pte_t pte, bool write)
{
	unsigned long pteval = pte_val(pte);
	/* Also check for pte_user */
	unsigned long clear_pte_bits = _PAGE_PRIVILEGED;
	/*
	 * _PAGE_READ is needed for any access and will be
	 * cleared for PROT_NONE
	 */
	unsigned long need_pte_bits = _PAGE_PRESENT | _PAGE_READ;

	if (write)
		need_pte_bits |= _PAGE_WRITE;

	if ((pteval & need_pte_bits) != need_pte_bits)
		return false;

	if ((pteval & clear_pte_bits) == clear_pte_bits)
		return false;

	return arch_pte_access_permitted(pte_val(pte), write, 0);
}
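
/*
 * Editor's sketch (not part of the original header), assuming no memory
 * protection key denies the access: a PROT_NONE pte has _PAGE_READ
 * cleared and _PAGE_PRIVILEGED set, so it fails both tests above:
 *
 *	pte_access_permitted(pfn_pte(pfn, PAGE_NONE), false)   == false
 *	pte_access_permitted(pfn_pte(pfn, PAGE_SHARED), false) == true
 */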
/*
 * Conversion functions: convert a page and protection to a page entry,
 * and a page entry and page directory to the page they refer to.
 *
 * Even if PTEs can be unsigned long long, a PFN is always an unsigned
 * long for now.
 */
static inline pte_t pfn_pte(unsigned long pfn, pgprot_t pgprot)
{
	return __pte((((pte_basic_t)(pfn) << PAGE_SHIFT) & PTE_RPN_MASK) |
		     pgprot_val(pgprot));
}

static inline unsigned long pte_pfn(pte_t pte)
{
	return (pte_val(pte) & PTE_RPN_MASK) >> PAGE_SHIFT;
}
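
/*
 * Editor's sketch (not part of the original header): for any pfn whose
 * physical address fits below _PAGE_PA_MAX, the two helpers above are
 * inverses:
 *
 *	pte_t pte = pfn_pte(pfn, PAGE_KERNEL);
 *	VM_BUG_ON(pte_pfn(pte) != pfn);
 */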
/* Generic modifiers for PTE bits */
static inline pte_t pte_wrprotect(pte_t pte)
{
	if (unlikely(pte_savedwrite(pte)))
		return pte_clear_savedwrite(pte);
	return __pte(pte_val(pte) & ~_PAGE_WRITE);
}

static inline pte_t pte_mkclean(pte_t pte)
{
	return __pte(pte_val(pte) & ~_PAGE_DIRTY);
}

static inline pte_t pte_mkold(pte_t pte)
{
	return __pte(pte_val(pte) & ~_PAGE_ACCESSED);
}

static inline pte_t pte_mkwrite(pte_t pte)
{
	/*
	 * write implies read, hence set both
	 */
	return __pte(pte_val(pte) | _PAGE_RW);
}

static inline pte_t pte_mkdirty(pte_t pte)
{
	return __pte(pte_val(pte) | _PAGE_DIRTY | _PAGE_SOFT_DIRTY);
}

static inline pte_t pte_mkyoung(pte_t pte)
{
	return __pte(pte_val(pte) | _PAGE_ACCESSED);
}

static inline pte_t pte_mkspecial(pte_t pte)
{
	return __pte(pte_val(pte) | _PAGE_SPECIAL);
}

static inline pte_t pte_mkhuge(pte_t pte)
{
	return pte;
}

static inline pte_t pte_mkdevmap(pte_t pte)
{
	return __pte(pte_val(pte) | _PAGE_SPECIAL | _PAGE_DEVMAP);
}

/*
 * This is potentially called with a pmd as the argument, in which case it's not
 * safe to check _PAGE_DEVMAP unless we also confirm that _PAGE_PTE is set.
 * That's because the bit we use for _PAGE_DEVMAP is not reserved for software
 * use in page directory entries (ie. non-ptes).
 */
static inline int pte_devmap(pte_t pte)
{
	u64 mask = cpu_to_be64(_PAGE_DEVMAP | _PAGE_PTE);

	return (pte_raw(pte) & mask) == mask;
}

static inline pte_t pte_modify(pte_t pte, pgprot_t newprot)
{
	/* FIXME!! check whether this need to be a conditional */
	return __pte((pte_val(pte) & _PAGE_CHG_MASK) | pgprot_val(newprot));
}

static inline bool pte_user(pte_t pte)
{
	return !(pte_raw(pte) & cpu_to_be64(_PAGE_PRIVILEGED));
}

/* Encode and de-code a swap entry */
#define MAX_SWAPFILES_CHECK() do { \
	BUILD_BUG_ON(MAX_SWAPFILES_SHIFT > SWP_TYPE_BITS); \
	/*							\
	 * Don't have overlapping bits with _PAGE_HPTEFLAGS.	\
	 * We filter HPTEFLAGS on set_pte.			\
	 */							\
	BUILD_BUG_ON(_PAGE_HPTEFLAGS & (0x1f << _PAGE_BIT_SWAP_TYPE)); \
	BUILD_BUG_ON(_PAGE_HPTEFLAGS & _PAGE_SWP_SOFT_DIRTY);	\
	} while (0)
/*
 * For a pte we don't need to handle RADIX_TREE_EXCEPTIONAL_SHIFT.
 */
#define SWP_TYPE_BITS 5
#define __swp_type(x)		(((x).val >> _PAGE_BIT_SWAP_TYPE) \
				& ((1UL << SWP_TYPE_BITS) - 1))
#define __swp_offset(x)		(((x).val & PTE_RPN_MASK) >> PAGE_SHIFT)
#define __swp_entry(type, offset)	((swp_entry_t) { \
				((type) << _PAGE_BIT_SWAP_TYPE) \
				| (((offset) << PAGE_SHIFT) & PTE_RPN_MASK)})
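
/*
 * Editor's sketch (not part of the original header): the swap type lives
 * in the SWP_TYPE_BITS low bits at _PAGE_BIT_SWAP_TYPE and the offset in
 * the RPN field above PAGE_SHIFT, so the two fields never overlap and the
 * encoding round-trips:
 *
 *	swp_entry_t ent = __swp_entry(type, offset);
 *	__swp_type(ent)   == type	(for type < 1UL << SWP_TYPE_BITS)
 *	__swp_offset(ent) == offset	(for offsets that fit in the RPN field)
 */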
/*
 * swp_entry_t must be independent of pte bits. We build a swp_entry_t from
 * the swap type and offset we get from swap, and convert that to a pte to
 * find a matching pte in the Linux page table.
 * Clear bits not found in swap entries here.
 */
#define __pte_to_swp_entry(pte)	((swp_entry_t) { pte_val((pte)) & ~_PAGE_PTE })
#define __swp_entry_to_pte(x)	__pte((x).val | _PAGE_PTE)

#ifdef CONFIG_MEM_SOFT_DIRTY
#define _PAGE_SWP_SOFT_DIRTY	(1UL << (SWP_TYPE_BITS + _PAGE_BIT_SWAP_TYPE))
#else
#define _PAGE_SWP_SOFT_DIRTY	0UL
#endif /* CONFIG_MEM_SOFT_DIRTY */

#ifdef CONFIG_HAVE_ARCH_SOFT_DIRTY
static inline pte_t pte_swp_mksoft_dirty(pte_t pte)
{
	return __pte(pte_val(pte) | _PAGE_SWP_SOFT_DIRTY);
}

static inline bool pte_swp_soft_dirty(pte_t pte)
{
	return !!(pte_raw(pte) & cpu_to_be64(_PAGE_SWP_SOFT_DIRTY));
}

static inline pte_t pte_swp_clear_soft_dirty(pte_t pte)
{
	return __pte(pte_val(pte) & ~_PAGE_SWP_SOFT_DIRTY);
}
#endif /* CONFIG_HAVE_ARCH_SOFT_DIRTY */
static inline bool check_pte_access(unsigned long access, unsigned long ptev)
{
	/*
	 * This checks for the _PAGE_RWX and _PAGE_PRESENT bits.
	 */
	if (access & ~ptev)
		return false;
	/*
	 * This checks for access to privileged space.
	 */
	if ((access & _PAGE_PRIVILEGED) != (ptev & _PAGE_PRIVILEGED))
		return false;

	return true;
}
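
/*
 * Editor's sketch (not part of the original header): for a user read
 * access the caller passes access = _PAGE_READ, so the check only passes
 * for ptes that have _PAGE_READ set and _PAGE_PRIVILEGED clear:
 *
 *	check_pte_access(_PAGE_READ, pte_val(pte))
 */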
/*
 * Generic functions with hash/radix callbacks
 */
static inline void __ptep_set_access_flags(struct vm_area_struct *vma,
					   pte_t *ptep, pte_t entry,
					   unsigned long address,
					   int psize)
{
	if (radix_enabled())
		return radix__ptep_set_access_flags(vma, ptep, entry,
						    address, psize);
	return hash__ptep_set_access_flags(ptep, entry);
}

#define __HAVE_ARCH_PTE_SAME
static inline int pte_same(pte_t pte_a, pte_t pte_b)
{
	if (radix_enabled())
		return radix__pte_same(pte_a, pte_b);
	return hash__pte_same(pte_a, pte_b);
}

static inline int pte_none(pte_t pte)
{
	if (radix_enabled())
		return radix__pte_none(pte);
	return hash__pte_none(pte);
}

static inline void __set_pte_at(struct mm_struct *mm, unsigned long addr,
				pte_t *ptep, pte_t pte, int percpu)
{
	if (radix_enabled())
		return radix__set_pte_at(mm, addr, ptep, pte, percpu);
	return hash__set_pte_at(mm, addr, ptep, pte, percpu);
}

#define _PAGE_CACHE_CTL	(_PAGE_NON_IDEMPOTENT | _PAGE_TOLERANT)

#define pgprot_noncached pgprot_noncached
static inline pgprot_t pgprot_noncached(pgprot_t prot)
{
	return __pgprot((pgprot_val(prot) & ~_PAGE_CACHE_CTL) |
			_PAGE_NON_IDEMPOTENT);
}

#define pgprot_noncached_wc pgprot_noncached_wc
static inline pgprot_t pgprot_noncached_wc(pgprot_t prot)
{
	return __pgprot((pgprot_val(prot) & ~_PAGE_CACHE_CTL) |
			_PAGE_TOLERANT);
}

#define pgprot_cached pgprot_cached
static inline pgprot_t pgprot_cached(pgprot_t prot)
{
	return __pgprot((pgprot_val(prot) & ~_PAGE_CACHE_CTL));
}

#define pgprot_writecombine pgprot_writecombine
static inline pgprot_t pgprot_writecombine(pgprot_t prot)
{
	return pgprot_noncached_wc(prot);
}
/*
 * Check whether a pte mapping has the cache-inhibited property.
 */
static inline bool pte_ci(pte_t pte)
{
	unsigned long pte_v = pte_val(pte);

	if (((pte_v & _PAGE_CACHE_CTL) == _PAGE_TOLERANT) ||
	    ((pte_v & _PAGE_CACHE_CTL) == _PAGE_NON_IDEMPOTENT))
		return true;
	return false;
}
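
/*
 * Editor's sketch (not part of the original header): pgprot_noncached()
 * and pgprot_noncached_wc() above both produce cache-inhibited mappings,
 * while pgprot_cached() does not, for instance:
 *
 *	pte_ci(pfn_pte(pfn, pgprot_noncached(PAGE_KERNEL)))	== true
 *	pte_ci(pfn_pte(pfn, pgprot_cached(PAGE_KERNEL)))	== false
 */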
static inline void pmd_set(pmd_t *pmdp, unsigned long val)
{
	*pmdp = __pmd(val);
}

static inline void pmd_clear(pmd_t *pmdp)
{
	*pmdp = __pmd(0);
}

static inline int pmd_none(pmd_t pmd)
{
	return !pmd_raw(pmd);
}

static inline int pmd_present(pmd_t pmd)
{
	return !pmd_none(pmd);
}

static inline int pmd_bad(pmd_t pmd)
{
	if (radix_enabled())
		return radix__pmd_bad(pmd);
	return hash__pmd_bad(pmd);
}

static inline void pud_set(pud_t *pudp, unsigned long val)
{
	*pudp = __pud(val);
}

static inline void pud_clear(pud_t *pudp)
{
	*pudp = __pud(0);
}

static inline int pud_none(pud_t pud)
{
	return !pud_raw(pud);
}

static inline int pud_present(pud_t pud)
{
	return !pud_none(pud);
}

extern struct page *pud_page(pud_t pud);
extern struct page *pmd_page(pmd_t pmd);

static inline pte_t pud_pte(pud_t pud)
{
	return __pte_raw(pud_raw(pud));
}

static inline pud_t pte_pud(pte_t pte)
{
	return __pud_raw(pte_raw(pte));
}
#define pud_write(pud)		pte_write(pud_pte(pud))

static inline int pud_bad(pud_t pud)
{
	if (radix_enabled())
		return radix__pud_bad(pud);
	return hash__pud_bad(pud);
}

#define pud_access_permitted pud_access_permitted
static inline bool pud_access_permitted(pud_t pud, bool write)
{
	return pte_access_permitted(pud_pte(pud), write);
}

#define pgd_write(pgd)		pte_write(pgd_pte(pgd))
static inline void pgd_set(pgd_t *pgdp, unsigned long val)
{
	*pgdp = __pgd(val);
}

static inline void pgd_clear(pgd_t *pgdp)
{
	*pgdp = __pgd(0);
}

static inline int pgd_none(pgd_t pgd)
{
	return !pgd_raw(pgd);
}

static inline int pgd_present(pgd_t pgd)
{
	return !pgd_none(pgd);
}

static inline pte_t pgd_pte(pgd_t pgd)
{
	return __pte_raw(pgd_raw(pgd));
}

static inline pgd_t pte_pgd(pte_t pte)
{
	return __pgd_raw(pte_raw(pte));
}

static inline int pgd_bad(pgd_t pgd)
{
	if (radix_enabled())
		return radix__pgd_bad(pgd);
	return hash__pgd_bad(pgd);
}

#define pgd_access_permitted pgd_access_permitted
static inline bool pgd_access_permitted(pgd_t pgd, bool write)
{
	return pte_access_permitted(pgd_pte(pgd), write);
}

extern struct page *pgd_page(pgd_t pgd);

/* Pointers in the page table tree are physical addresses */
#define __pgtable_ptr_val(ptr)	__pa(ptr)

#define pmd_page_vaddr(pmd)	__va(pmd_val(pmd) & ~PMD_MASKED_BITS)
#define pud_page_vaddr(pud)	__va(pud_val(pud) & ~PUD_MASKED_BITS)
#define pgd_page_vaddr(pgd)	__va(pgd_val(pgd) & ~PGD_MASKED_BITS)

#define pgd_index(address) (((address) >> (PGDIR_SHIFT)) & (PTRS_PER_PGD - 1))
#define pud_index(address) (((address) >> (PUD_SHIFT)) & (PTRS_PER_PUD - 1))
#define pmd_index(address) (((address) >> (PMD_SHIFT)) & (PTRS_PER_PMD - 1))
#define pte_index(address) (((address) >> (PAGE_SHIFT)) & (PTRS_PER_PTE - 1))

/*
 * Find an entry in a page-table-directory. We combine the address region
 * (the high order N bits) and the pgd portion of the address.
 */
#define pgd_offset(mm, address)	((mm)->pgd + pgd_index(address))

#define pud_offset(pgdp, addr)	\
	(((pud_t *) pgd_page_vaddr(*(pgdp))) + pud_index(addr))
#define pmd_offset(pudp, addr)	\
	(((pmd_t *) pud_page_vaddr(*(pudp))) + pmd_index(addr))
#define pte_offset_kernel(dir, addr)	\
	(((pte_t *) pmd_page_vaddr(*(dir))) + pte_index(addr))

#define pte_offset_map(dir, addr)	pte_offset_kernel((dir), (addr))
#define pte_unmap(pte)			do { } while (0)

/* to find an entry in a kernel page-table-directory */
/* This now only contains the vmalloc pages */
#define pgd_offset_k(address)	pgd_offset(&init_mm, address)

#define pte_ERROR(e) \
	pr_err("%s:%d: bad pte %08lx.\n", __FILE__, __LINE__, pte_val(e))
#define pmd_ERROR(e) \
	pr_err("%s:%d: bad pmd %08lx.\n", __FILE__, __LINE__, pmd_val(e))
#define pud_ERROR(e) \
	pr_err("%s:%d: bad pud %08lx.\n", __FILE__, __LINE__, pud_val(e))
#define pgd_ERROR(e) \
	pr_err("%s:%d: bad pgd %08lx.\n", __FILE__, __LINE__, pgd_val(e))

static inline int map_kernel_page(unsigned long ea, unsigned long pa,
				  unsigned long flags)
{
	if (radix_enabled()) {
#if defined(CONFIG_PPC_RADIX_MMU) && defined(DEBUG_VM)
		unsigned long page_size = 1 << mmu_psize_defs[mmu_io_psize].shift;
		WARN((page_size != PAGE_SIZE), "I/O page size != PAGE_SIZE");
#endif
		return radix__map_kernel_page(ea, pa, __pgprot(flags), PAGE_SIZE);
	}
	return hash__map_kernel_page(ea, pa, flags);
}
static inline int __meminit vmemmap_create_mapping(unsigned long start,
						   unsigned long page_size,
						   unsigned long phys)
{
	if (radix_enabled())
		return radix__vmemmap_create_mapping(start, page_size, phys);
	return hash__vmemmap_create_mapping(start, page_size, phys);
}

#ifdef CONFIG_MEMORY_HOTPLUG
static inline void vmemmap_remove_mapping(unsigned long start,
					  unsigned long page_size)
{
	if (radix_enabled())
		return radix__vmemmap_remove_mapping(start, page_size);
	return hash__vmemmap_remove_mapping(start, page_size);
}
#endif

static inline pte_t pmd_pte(pmd_t pmd)
{
	return __pte_raw(pmd_raw(pmd));
}

static inline pmd_t pte_pmd(pte_t pte)
{
	return __pmd_raw(pte_raw(pte));
}

static inline pte_t *pmdp_ptep(pmd_t *pmd)
{
	return (pte_t *)pmd;
}
#define pmd_pfn(pmd)		pte_pfn(pmd_pte(pmd))
#define pmd_dirty(pmd)		pte_dirty(pmd_pte(pmd))
#define pmd_young(pmd)		pte_young(pmd_pte(pmd))
#define pmd_mkold(pmd)		pte_pmd(pte_mkold(pmd_pte(pmd)))
#define pmd_wrprotect(pmd)	pte_pmd(pte_wrprotect(pmd_pte(pmd)))
#define pmd_mkdirty(pmd)	pte_pmd(pte_mkdirty(pmd_pte(pmd)))
#define pmd_mkclean(pmd)	pte_pmd(pte_mkclean(pmd_pte(pmd)))
#define pmd_mkyoung(pmd)	pte_pmd(pte_mkyoung(pmd_pte(pmd)))
#define pmd_mkwrite(pmd)	pte_pmd(pte_mkwrite(pmd_pte(pmd)))
#define pmd_mk_savedwrite(pmd)	pte_pmd(pte_mk_savedwrite(pmd_pte(pmd)))
#define pmd_clear_savedwrite(pmd)	pte_pmd(pte_clear_savedwrite(pmd_pte(pmd)))

#ifdef CONFIG_HAVE_ARCH_SOFT_DIRTY
#define pmd_soft_dirty(pmd)    pte_soft_dirty(pmd_pte(pmd))
#define pmd_mksoft_dirty(pmd)  pte_pmd(pte_mksoft_dirty(pmd_pte(pmd)))
#define pmd_clear_soft_dirty(pmd) pte_pmd(pte_clear_soft_dirty(pmd_pte(pmd)))
#endif /* CONFIG_HAVE_ARCH_SOFT_DIRTY */

#ifdef CONFIG_NUMA_BALANCING
static inline int pmd_protnone(pmd_t pmd)
{
	return pte_protnone(pmd_pte(pmd));
}
#endif /* CONFIG_NUMA_BALANCING */

#define pmd_write(pmd)		pte_write(pmd_pte(pmd))
#define __pmd_write(pmd)	__pte_write(pmd_pte(pmd))
#define pmd_savedwrite(pmd)	pte_savedwrite(pmd_pte(pmd))

#define pmd_access_permitted pmd_access_permitted
static inline bool pmd_access_permitted(pmd_t pmd, bool write)
{
	return pte_access_permitted(pmd_pte(pmd), write);
}

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
extern pmd_t pfn_pmd(unsigned long pfn, pgprot_t pgprot);
extern pmd_t mk_pmd(struct page *page, pgprot_t pgprot);
extern pmd_t pmd_modify(pmd_t pmd, pgprot_t newprot);
extern void set_pmd_at(struct mm_struct *mm, unsigned long addr,
		       pmd_t *pmdp, pmd_t pmd);
extern void update_mmu_cache_pmd(struct vm_area_struct *vma, unsigned long addr,
				 pmd_t *pmd);
extern int hash__has_transparent_hugepage(void);

static inline int has_transparent_hugepage(void)
{
	if (radix_enabled())
		return radix__has_transparent_hugepage();
	return hash__has_transparent_hugepage();
}
#define has_transparent_hugepage has_transparent_hugepage

static inline unsigned long
pmd_hugepage_update(struct mm_struct *mm, unsigned long addr, pmd_t *pmdp,
		    unsigned long clr, unsigned long set)
{
	if (radix_enabled())
		return radix__pmd_hugepage_update(mm, addr, pmdp, clr, set);
	return hash__pmd_hugepage_update(mm, addr, pmdp, clr, set);
}

static inline int pmd_large(pmd_t pmd)
{
	return !!(pmd_raw(pmd) & cpu_to_be64(_PAGE_PTE));
}

static inline pmd_t pmd_mknotpresent(pmd_t pmd)
{
	return __pmd(pmd_val(pmd) & ~_PAGE_PRESENT);
}
/*
 * For radix we should always find H_PAGE_HASHPTE zero. Hence
 * the below will work for radix too.
 */
static inline int __pmdp_test_and_clear_young(struct mm_struct *mm,
					      unsigned long addr, pmd_t *pmdp)
{
	unsigned long old;

	if ((pmd_raw(*pmdp) & cpu_to_be64(_PAGE_ACCESSED | H_PAGE_HASHPTE)) == 0)
		return 0;
	old = pmd_hugepage_update(mm, addr, pmdp, _PAGE_ACCESSED, 0);
	return ((old & _PAGE_ACCESSED) != 0);
}

#define __HAVE_ARCH_PMDP_SET_WRPROTECT
static inline void pmdp_set_wrprotect(struct mm_struct *mm, unsigned long addr,
				      pmd_t *pmdp)
{
	if (__pmd_write((*pmdp)))
		pmd_hugepage_update(mm, addr, pmdp, _PAGE_WRITE, 0);
	else if (unlikely(pmd_savedwrite(*pmdp)))
		pmd_hugepage_update(mm, addr, pmdp, 0, _PAGE_PRIVILEGED);
}

static inline int pmd_trans_huge(pmd_t pmd)
{
	if (radix_enabled())
		return radix__pmd_trans_huge(pmd);
	return hash__pmd_trans_huge(pmd);
}

#define __HAVE_ARCH_PMD_SAME
static inline int pmd_same(pmd_t pmd_a, pmd_t pmd_b)
{
	if (radix_enabled())
		return radix__pmd_same(pmd_a, pmd_b);
	return hash__pmd_same(pmd_a, pmd_b);
}

static inline pmd_t pmd_mkhuge(pmd_t pmd)
{
	if (radix_enabled())
		return radix__pmd_mkhuge(pmd);
	return hash__pmd_mkhuge(pmd);
}

#define __HAVE_ARCH_PMDP_SET_ACCESS_FLAGS
extern int pmdp_set_access_flags(struct vm_area_struct *vma,
				 unsigned long address, pmd_t *pmdp,
				 pmd_t entry, int dirty);

#define __HAVE_ARCH_PMDP_TEST_AND_CLEAR_YOUNG
extern int pmdp_test_and_clear_young(struct vm_area_struct *vma,
				     unsigned long address, pmd_t *pmdp);

#define __HAVE_ARCH_PMDP_HUGE_GET_AND_CLEAR
static inline pmd_t pmdp_huge_get_and_clear(struct mm_struct *mm,
					    unsigned long addr, pmd_t *pmdp)
{
	if (radix_enabled())
		return radix__pmdp_huge_get_and_clear(mm, addr, pmdp);
	return hash__pmdp_huge_get_and_clear(mm, addr, pmdp);
}

static inline pmd_t pmdp_collapse_flush(struct vm_area_struct *vma,
					unsigned long address, pmd_t *pmdp)
{
	if (radix_enabled())
		return radix__pmdp_collapse_flush(vma, address, pmdp);
	return hash__pmdp_collapse_flush(vma, address, pmdp);
}
#define pmdp_collapse_flush pmdp_collapse_flush

#define __HAVE_ARCH_PGTABLE_DEPOSIT
static inline void pgtable_trans_huge_deposit(struct mm_struct *mm,
					      pmd_t *pmdp, pgtable_t pgtable)
{
	if (radix_enabled())
		return radix__pgtable_trans_huge_deposit(mm, pmdp, pgtable);
	return hash__pgtable_trans_huge_deposit(mm, pmdp, pgtable);
}

#define __HAVE_ARCH_PGTABLE_WITHDRAW
static inline pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm,
						    pmd_t *pmdp)
{
	if (radix_enabled())
		return radix__pgtable_trans_huge_withdraw(mm, pmdp);
	return hash__pgtable_trans_huge_withdraw(mm, pmdp);
}

#define __HAVE_ARCH_PMDP_INVALIDATE
extern pmd_t pmdp_invalidate(struct vm_area_struct *vma, unsigned long address,
			     pmd_t *pmdp);

#define pmd_move_must_withdraw pmd_move_must_withdraw
struct spinlock;
static inline int pmd_move_must_withdraw(struct spinlock *new_pmd_ptl,
					 struct spinlock *old_pmd_ptl,
					 struct vm_area_struct *vma)
{
	if (radix_enabled())
		return false;
	/*
	 * Archs like ppc64 use the pgtable to store per-pmd
	 * specific information. So when we switch the pmd,
	 * we should also withdraw and deposit the pgtable.
	 */
	return true;
}

#define arch_needs_pgtable_deposit arch_needs_pgtable_deposit
static inline bool arch_needs_pgtable_deposit(void)
{
	if (radix_enabled())
		return false;
	return true;
}
extern void serialize_against_pte_lookup(struct mm_struct *mm);

static inline pmd_t pmd_mkdevmap(pmd_t pmd)
{
	return __pmd(pmd_val(pmd) | (_PAGE_PTE | _PAGE_DEVMAP));
}

static inline int pmd_devmap(pmd_t pmd)
{
	return pte_devmap(pmd_pte(pmd));
}

static inline int pud_devmap(pud_t pud)
{
	return 0;
}

static inline int pgd_devmap(pgd_t pgd)
{
	return 0;
}
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */

static inline const int pud_pfn(pud_t pud)
{
	/*
	 * Currently all calls to pud_pfn() are gated around a pud_devmap()
	 * check so this should never be used. If it grows another user we
	 * want to know about it.
	 */
	BUILD_BUG();
	return 0;
}

#endif /* __ASSEMBLY__ */
#endif /* _ASM_POWERPC_BOOK3S_64_PGTABLE_H_ */