hugetlb.h 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569
  1. #ifndef _LINUX_HUGETLB_H
  2. #define _LINUX_HUGETLB_H
  3. #include <linux/mm_types.h>
  4. #include <linux/mmdebug.h>
  5. #include <linux/fs.h>
  6. #include <linux/hugetlb_inline.h>
  7. #include <linux/cgroup.h>
  8. #include <linux/list.h>
  9. #include <linux/kref.h>
  10. #include <asm/pgtable.h>
  11. struct ctl_table;
  12. struct user_struct;
  13. struct mmu_gather;
  14. #ifdef CONFIG_HUGETLB_PAGE
  15. #include <linux/mempolicy.h>
  16. #include <linux/shm.h>
  17. #include <asm/tlbflush.h>
  18. struct hugepage_subpool {
  19. spinlock_t lock;
  20. long count;
  21. long max_hpages; /* Maximum huge pages or -1 if no maximum. */
  22. long used_hpages; /* Used count against maximum, includes */
  23. /* both alloced and reserved pages. */
  24. struct hstate *hstate;
  25. long min_hpages; /* Minimum huge pages or -1 if no minimum. */
  26. long rsv_hpages; /* Pages reserved against global pool to */
  27. /* sasitfy minimum size. */
  28. };
  29. struct resv_map {
  30. struct kref refs;
  31. spinlock_t lock;
  32. struct list_head regions;
  33. long adds_in_progress;
  34. struct list_head region_cache;
  35. long region_cache_count;
  36. };
  37. extern struct resv_map *resv_map_alloc(void);
  38. void resv_map_release(struct kref *ref);
  39. extern spinlock_t hugetlb_lock;
  40. extern int hugetlb_max_hstate __read_mostly;
  /*
   * Walk 'h' over the first hugetlb_max_hstate entries of hstates[].
   * 'h' is expanded several times, so it must not have side effects.
   */
  #define for_each_hstate(h) \
      for ((h) = hstates; (h) < hstates + hugetlb_max_hstate; (h)++)
  43. struct hugepage_subpool *hugepage_new_subpool(struct hstate *h, long max_hpages,
  44. long min_hpages);
  45. void hugepage_put_subpool(struct hugepage_subpool *spool);
  46. void reset_vma_resv_huge_pages(struct vm_area_struct *vma);
  47. int hugetlb_sysctl_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
  48. int hugetlb_overcommit_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
  49. int hugetlb_treat_movable_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
  50. #ifdef CONFIG_NUMA
  51. int hugetlb_mempolicy_sysctl_handler(struct ctl_table *, int,
  52. void __user *, size_t *, loff_t *);
  53. #endif
  /* Copy, follow and unmap operations on hugetlb ranges. */
  int copy_hugetlb_page_range(struct mm_struct *, struct mm_struct *,
                              struct vm_area_struct *);

  long follow_hugetlb_page(struct mm_struct *, struct vm_area_struct *,
                           struct page **, struct vm_area_struct **,
                           unsigned long *, unsigned long *, long,
                           unsigned int, int *);

  void unmap_hugepage_range(struct vm_area_struct *, unsigned long,
                            unsigned long, struct page *);

  void __unmap_hugepage_range_final(struct mmu_gather *tlb,
                                    struct vm_area_struct *vma,
                                    unsigned long start,
                                    unsigned long end,
                                    struct page *ref_page);

  void __unmap_hugepage_range(struct mmu_gather *tlb,
                              struct vm_area_struct *vma,
                              unsigned long start,
                              unsigned long end,
                              struct page *ref_page);
  /* Reporting entry points. */
  void hugetlb_report_meminfo(struct seq_file *);
  int hugetlb_report_node_meminfo(int, char *);
  void hugetlb_show_meminfo(void);

  unsigned long hugetlb_total_pages(void);
  72. int hugetlb_fault(struct mm_struct *mm, struct vm_area_struct *vma,
  73. unsigned long address, unsigned int flags);
  74. int hugetlb_mcopy_atomic_pte(struct mm_struct *dst_mm, pte_t *dst_pte,
  75. struct vm_area_struct *dst_vma,
  76. unsigned long dst_addr,
  77. unsigned long src_addr,
  78. struct page **pagep);
  79. int hugetlb_reserve_pages(struct inode *inode, long from, long to,
  80. struct vm_area_struct *vma,
  81. vm_flags_t vm_flags);
  82. long hugetlb_unreserve_pages(struct inode *inode, long start, long end,
  83. long freed);
  84. int dequeue_hwpoisoned_huge_page(struct page *page);
  85. bool isolate_huge_page(struct page *page, struct list_head *list);
  86. void putback_active_hugepage(struct page *page);
  87. void free_huge_page(struct page *page);
  88. void hugetlb_fix_reserve_counts(struct inode *inode);
  89. extern struct mutex *hugetlb_fault_mutex_table;
  90. u32 hugetlb_fault_mutex_hash(struct hstate *h, struct mm_struct *mm,
  91. struct vm_area_struct *vma,
  92. struct address_space *mapping,
  93. pgoff_t idx, unsigned long address);
  94. pte_t *huge_pmd_share(struct mm_struct *mm, unsigned long addr, pud_t *pud);
  95. extern int hugepages_treat_as_movable;
  96. extern int sysctl_hugetlb_shm_group;
  97. extern struct list_head huge_boot_pages;
  98. /* arch callbacks */
  99. pte_t *huge_pte_alloc(struct mm_struct *mm,
  100. unsigned long addr, unsigned long sz);
  101. pte_t *huge_pte_offset(struct mm_struct *mm, unsigned long addr);
  102. int huge_pmd_unshare(struct mm_struct *mm, unsigned long *addr, pte_t *ptep);
  103. struct page *follow_huge_addr(struct mm_struct *mm, unsigned long address,
  104. int write);
  105. struct page *follow_huge_pmd(struct mm_struct *mm, unsigned long address,
  106. pmd_t *pmd, int flags);
  107. struct page *follow_huge_pud(struct mm_struct *mm, unsigned long address,
  108. pud_t *pud, int flags);
  109. int pmd_huge(pmd_t pmd);
  110. int pud_huge(pud_t pud);
  111. unsigned long hugetlb_change_protection(struct vm_area_struct *vma,
  112. unsigned long address, unsigned long end, pgprot_t newprot);
  113. #else /* !CONFIG_HUGETLB_PAGE */
  /* !CONFIG_HUGETLB_PAGE stub: does nothing. */
  static inline void reset_vma_resv_huge_pages(struct vm_area_struct *vma)
  {
      /* intentionally empty */
  }
  /* !CONFIG_HUGETLB_PAGE stub: always reports zero pages. */
  static inline unsigned long hugetlb_total_pages(void)
  {
      return 0UL;
  }
  /*
   * !CONFIG_HUGETLB_PAGE stubs. follow_hugetlb_page() and
   * copy_hugetlb_page_range() hit BUG() and evaluate to 0;
   * follow_huge_addr() evaluates to ERR_PTR(-EINVAL). None of them
   * evaluates its arguments.
   */
  #define follow_hugetlb_page(m, v, p, vs, a, b, i, w, n) ({ BUG(); 0; })
  #define follow_huge_addr(mm, addr, write)               ERR_PTR(-EINVAL)
  #define copy_hugetlb_page_range(src, dst, vma)          ({ BUG(); 0; })
  /* !CONFIG_HUGETLB_PAGE stub: emits nothing. */
  static inline void hugetlb_report_meminfo(struct seq_file *m)
  {
      /* intentionally empty */
  }

  /* !CONFIG_HUGETLB_PAGE stub: evaluates to 0 without touching its arguments. */
  #define hugetlb_report_node_meminfo(n, buf) 0

  /* !CONFIG_HUGETLB_PAGE stub: emits nothing. */
  static inline void hugetlb_show_meminfo(void)
  {
      /* intentionally empty */
  }
  /*
   * !CONFIG_HUGETLB_PAGE stubs. Each expands to a constant, or to a
   * BUG() for paths that must never be reached; arguments are never
   * evaluated.
   */

  /* Lookups: nothing is ever found. */
  #define follow_huge_pmd(mm, addr, pmd, flags)    NULL
  #define follow_huge_pud(mm, addr, pud, flags)    NULL
  #define huge_pte_offset(mm, address)             0

  #define prepare_hugepage_range(file, addr, len)  (-EINVAL)

  /* Predicates: always false. */
  #define pmd_huge(x)                              0
  #define pud_huge(x)                              0
  #define is_hugepage_only_range(mm, addr, len)    0

  /* Must never be reached. */
  #define hugetlb_free_pgd_range(tlb, addr, end, floor, ceiling) ({BUG(); 0; })
  #define hugetlb_fault(mm, vma, addr, flags)      ({ BUG(); 0; })
  #define hugetlb_mcopy_atomic_pte(dst_mm, dst_pte, dst_vma, dst_addr, \
                                   src_addr, pagep) ({ BUG(); 0; })
  /* !CONFIG_HUGETLB_PAGE stub: nothing to dequeue, always returns 0. */
  static inline int dequeue_hwpoisoned_huge_page(struct page *page)
  {
      (void)page;
      return 0;
  }
  /* !CONFIG_HUGETLB_PAGE stub: no page is ever isolated, so returns false. */
  static inline bool isolate_huge_page(struct page *page, struct list_head *list)
  {
      (void)page;
      (void)list;
      return false;
  }
  /* !CONFIG_HUGETLB_PAGE stub: a no-op statement; 'p' is not evaluated. */
  #define putback_active_hugepage(p)    do {} while (0)
  151. static inline unsigned long hugetlb_change_protection(struct vm_area_struct *vma,
  152. unsigned long address, unsigned long end, pgprot_t newprot)
  153. {
  154. return 0;
  155. }
  /*
   * !CONFIG_HUGETLB_PAGE stubs: both unmap helpers must never be called
   * in this configuration, so each one simply hits BUG().
   */
  static inline void __unmap_hugepage_range_final(struct mmu_gather *tlb,
                                                  struct vm_area_struct *vma,
                                                  unsigned long start,
                                                  unsigned long end,
                                                  struct page *ref_page)
  {
      BUG();
  }

  static inline void __unmap_hugepage_range(struct mmu_gather *tlb,
                                            struct vm_area_struct *vma,
                                            unsigned long start,
                                            unsigned long end,
                                            struct page *ref_page)
  {
      BUG();
  }
  168. #endif /* !CONFIG_HUGETLB_PAGE */
  /*
   * Huge pages at the page global directory level. An architecture that
   * supports huge pages at the pgd level needs to define pgd_huge();
   * otherwise this fallback evaluates to 0.
   */
  #ifndef pgd_huge
  #define pgd_huge(pgd) 0
  #endif

  /* Same fallback for the p4d level. */
  #ifndef p4d_huge
  #define p4d_huge(p4d) 0
  #endif
  179. #ifndef pgd_write
  180. static inline int pgd_write(pgd_t pgd)
  181. {
  182. BUG();
  183. return 0;
  184. }
  185. #endif
  186. #ifndef pud_write
  187. static inline int pud_write(pud_t pud)
  188. {
  189. BUG();
  190. return 0;
  191. }
  192. #endif
  #ifndef is_hugepd
  /*
   * Some architectures require a hugepage directory format in order to
   * support multiple hugepage sizes. For example, a4fe3ce76
   * "powerpc/mm: Allow more flexible layouts for hugepage pagetables"
   * introduced one on powerpc, allowing a more flexible hugepage
   * pagetable layout.
   *
   * When no is_hugepd() macro is defined, the generic fallbacks below
   * apply: nothing is ever a hugepd and gup_huge_pd() returns 0.
   */
  typedef struct { unsigned long pd; } hugepd_t;

  #define is_hugepd(hugepd)    (0)
  #define __hugepd(x)          ((hugepd_t) { (x) })

  static inline int gup_huge_pd(hugepd_t hugepd, unsigned long addr,
                                unsigned pdshift, unsigned long end,
                                int write, struct page **pages, int *nr)
  {
      /* Fallback: does not touch 'pages' or 'nr'. */
      return 0;
  }
  #else
  /* is_hugepd() was defined elsewhere; gup_huge_pd() is only declared here. */
  extern int gup_huge_pd(hugepd_t hugepd, unsigned long addr,
                         unsigned pdshift, unsigned long end,
                         int write, struct page **pages, int *nr);
  #endif
  #define HUGETLB_ANON_FILE "anon_hugepage"

  /* Kinds of hugetlb inode. */
  enum {
      /*
       * The file will be used as an shm file, so shmfs accounting
       * rules apply.
       */
      HUGETLB_SHMFS_INODE     = 1,

      /*
       * The file is being created on the internal vfs mount, and shmfs
       * accounting rules do not apply.
       */
      HUGETLB_ANONHUGE_INODE  = 2,
  };
  228. #ifdef CONFIG_HUGETLBFS
  229. struct hugetlbfs_sb_info {
  230. long max_inodes; /* inodes allowed */
  231. long free_inodes; /* inodes free */
  232. spinlock_t stat_lock;
  233. struct hstate *hstate;
  234. struct hugepage_subpool *spool;
  235. };
  236. static inline struct hugetlbfs_sb_info *HUGETLBFS_SB(struct super_block *sb)
  237. {
  238. return sb->s_fs_info;
  239. }
  240. extern const struct file_operations hugetlbfs_file_operations;
  241. extern const struct vm_operations_struct hugetlb_vm_ops;
  242. struct file *hugetlb_file_setup(const char *name, size_t size, vm_flags_t acct,
  243. struct user_struct **user, int creat_flags,
  244. int page_size_log);
  245. static inline bool is_file_hugepages(struct file *file)
  246. {
  247. if (file->f_op == &hugetlbfs_file_operations)
  248. return true;
  249. return is_file_shm_hugepages(file);
  250. }
  251. #else /* !CONFIG_HUGETLBFS */
  252. #define is_file_hugepages(file) false
  253. static inline struct file *
  254. hugetlb_file_setup(const char *name, size_t size, vm_flags_t acctflag,
  255. struct user_struct **user, int creat_flags,
  256. int page_size_log)
  257. {
  258. return ERR_PTR(-ENOSYS);
  259. }
  260. #endif /* !CONFIG_HUGETLBFS */
  /* Declared only when HAVE_ARCH_HUGETLB_UNMAPPED_AREA is defined. */
  #ifdef HAVE_ARCH_HUGETLB_UNMAPPED_AREA
  unsigned long hugetlb_get_unmapped_area(struct file *file,
                                          unsigned long addr,
                                          unsigned long len,
                                          unsigned long pgoff,
                                          unsigned long flags);
  #endif /* HAVE_ARCH_HUGETLB_UNMAPPED_AREA */
  266. #ifdef CONFIG_HUGETLB_PAGE
  267. #define HSTATE_NAME_LEN 32
  268. /* Defines one hugetlb page size */
  269. struct hstate {
  270. int next_nid_to_alloc;
  271. int next_nid_to_free;
  272. unsigned int order;
  273. unsigned long mask;
  274. unsigned long max_huge_pages;
  275. unsigned long nr_huge_pages;
  276. unsigned long free_huge_pages;
  277. unsigned long resv_huge_pages;
  278. unsigned long surplus_huge_pages;
  279. unsigned long nr_overcommit_huge_pages;
  280. struct list_head hugepage_activelist;
  281. struct list_head hugepage_freelists[MAX_NUMNODES];
  282. unsigned int nr_huge_pages_node[MAX_NUMNODES];
  283. unsigned int free_huge_pages_node[MAX_NUMNODES];
  284. unsigned int surplus_huge_pages_node[MAX_NUMNODES];
  285. #ifdef CONFIG_CGROUP_HUGETLB
  286. /* cgroup control files */
  287. struct cftype cgroup_files[5];
  288. #endif
  289. char name[HSTATE_NAME_LEN];
  290. };
  291. struct huge_bootmem_page {
  292. struct list_head list;
  293. struct hstate *hstate;
  294. #ifdef CONFIG_HIGHMEM
  295. phys_addr_t phys;
  296. #endif
  297. };
  298. struct page *alloc_huge_page(struct vm_area_struct *vma,
  299. unsigned long addr, int avoid_reserve);
  300. struct page *alloc_huge_page_node(struct hstate *h, int nid);
  301. struct page *alloc_huge_page_noerr(struct vm_area_struct *vma,
  302. unsigned long addr, int avoid_reserve);
  303. int huge_add_to_page_cache(struct page *page, struct address_space *mapping,
  304. pgoff_t idx);
  305. /* arch callback */
  306. int __init alloc_bootmem_huge_page(struct hstate *h);
  307. void __init hugetlb_bad_size(void);
  308. void __init hugetlb_add_hstate(unsigned order);
  309. struct hstate *size_to_hstate(unsigned long size);
  310. #ifndef HUGE_MAX_HSTATE
  311. #define HUGE_MAX_HSTATE 1
  312. #endif
  313. extern struct hstate hstates[HUGE_MAX_HSTATE];
  314. extern unsigned int default_hstate_idx;
  315. #define default_hstate (hstates[default_hstate_idx])
  316. static inline struct hstate *hstate_inode(struct inode *i)
  317. {
  318. return HUGETLBFS_SB(i->i_sb)->hstate;
  319. }
  /* hstate of the inode backing file 'f'. */
  static inline struct hstate *hstate_file(struct file *f)
  {
      struct inode *inode = file_inode(f);

      return hstate_inode(inode);
  }
  324. static inline struct hstate *hstate_sizelog(int page_size_log)
  325. {
  326. if (!page_size_log)
  327. return &default_hstate;
  328. return size_to_hstate(1UL << page_size_log);
  329. }
  330. static inline struct hstate *hstate_vma(struct vm_area_struct *vma)
  331. {
  332. return hstate_file(vma->vm_file);
  333. }
  334. static inline unsigned long huge_page_size(struct hstate *h)
  335. {
  336. return (unsigned long)PAGE_SIZE << h->order;
  337. }
  338. extern unsigned long vma_kernel_pagesize(struct vm_area_struct *vma);
  339. extern unsigned long vma_mmu_pagesize(struct vm_area_struct *vma);
  340. static inline unsigned long huge_page_mask(struct hstate *h)
  341. {
  342. return h->mask;
  343. }
  344. static inline unsigned int huge_page_order(struct hstate *h)
  345. {
  346. return h->order;
  347. }
  348. static inline unsigned huge_page_shift(struct hstate *h)
  349. {
  350. return h->order + PAGE_SHIFT;
  351. }
  352. static inline bool hstate_is_gigantic(struct hstate *h)
  353. {
  354. return huge_page_order(h) >= MAX_ORDER;
  355. }
  356. static inline unsigned int pages_per_huge_page(struct hstate *h)
  357. {
  358. return 1 << h->order;
  359. }
  /* Number of 512-byte blocks in one huge page. */
  static inline unsigned int blocks_per_huge_page(struct hstate *h)
  {
      unsigned long bytes = huge_page_size(h);

      return bytes / 512;
  }
  364. #include <asm/hugetlb.h>
  365. #ifndef arch_make_huge_pte
  366. static inline pte_t arch_make_huge_pte(pte_t entry, struct vm_area_struct *vma,
  367. struct page *page, int writable)
  368. {
  369. return entry;
  370. }
  371. #endif
  372. static inline struct hstate *page_hstate(struct page *page)
  373. {
  374. VM_BUG_ON_PAGE(!PageHuge(page), page);
  375. return size_to_hstate(PAGE_SIZE << compound_order(page));
  376. }
  377. static inline unsigned hstate_index_to_shift(unsigned index)
  378. {
  379. return hstates[index].order + PAGE_SHIFT;
  380. }
  381. static inline int hstate_index(struct hstate *h)
  382. {
  383. return h - hstates;
  384. }
  385. pgoff_t __basepage_index(struct page *page);
  386. /* Return page->index in PAGE_SIZE units */
  387. static inline pgoff_t basepage_index(struct page *page)
  388. {
  389. if (!PageCompound(page))
  390. return page->index;
  391. return __basepage_index(page);
  392. }
  /* Takes a pfn range, named start_pfn and end_pfn. */
  int dissolve_free_huge_pages(unsigned long start_pfn, unsigned long end_pfn);
  /*
   * Whether huge pages of this hstate can be migrated.
   *
   * With CONFIG_ARCH_ENABLE_HUGEPAGE_MIGRATION, this is true only for
   * page sizes whose shift equals PMD_SHIFT or PGDIR_SHIFT; without it,
   * migration is never supported.
   */
  static inline bool hugepage_migration_supported(struct hstate *h)
  {
  #ifdef CONFIG_ARCH_ENABLE_HUGEPAGE_MIGRATION
      const unsigned shift = huge_page_shift(h);

      return shift == PMD_SHIFT || shift == PGDIR_SHIFT;
  #else
      return false;
  #endif
  }
  407. static inline spinlock_t *huge_pte_lockptr(struct hstate *h,
  408. struct mm_struct *mm, pte_t *pte)
  409. {
  410. if (huge_page_size(h) == PMD_SIZE)
  411. return pmd_lockptr(mm, (pmd_t *) pte);
  412. VM_BUG_ON(huge_page_size(h) == PAGE_SIZE);
  413. return &mm->page_table_lock;
  414. }
  #ifndef hugepages_supported
  /*
   * Some platforms decide at boot time whether they support huge pages.
   * Some of them, such as powerpc, set HPAGE_SHIFT to 0 when there is no
   * such support, so the default test is simply HPAGE_SHIFT != 0.
   */
  #define hugepages_supported()    (HPAGE_SHIFT != 0)
  #endif
  423. void hugetlb_report_usage(struct seq_file *m, struct mm_struct *mm);
  424. static inline void hugetlb_count_add(long l, struct mm_struct *mm)
  425. {
  426. atomic_long_add(l, &mm->hugetlb_usage);
  427. }
  428. static inline void hugetlb_count_sub(long l, struct mm_struct *mm)
  429. {
  430. atomic_long_sub(l, &mm->hugetlb_usage);
  431. }
  432. #else /* CONFIG_HUGETLB_PAGE */
  /*
   * !CONFIG_HUGETLB_PAGE: struct hstate is an empty placeholder and the
   * helpers below collapse to constants that ignore their arguments.
   */
  struct hstate {};

  /* Allocation never yields a page. */
  #define alloc_huge_page(v, a, r)          NULL
  #define alloc_huge_page_node(h, nid)      NULL
  #define alloc_huge_page_noerr(v, a, r)    NULL
  #define alloc_bootmem_huge_page(h)        NULL

  /* There is no hstate to look up. */
  #define hstate_file(f)                    NULL
  #define hstate_sizelog(s)                 NULL
  #define hstate_vma(v)                     NULL
  #define hstate_inode(i)                   NULL
  #define page_hstate(page)                 NULL

  /* Every "huge" page is an ordinary base page. */
  #define huge_page_size(h)                 PAGE_SIZE
  #define huge_page_mask(h)                 PAGE_MASK
  #define vma_kernel_pagesize(v)            PAGE_SIZE
  #define vma_mmu_pagesize(v)               PAGE_SIZE
  #define huge_page_order(h)                0
  #define huge_page_shift(h)                PAGE_SHIFT
  /* !CONFIG_HUGETLB_PAGE stub: there are no gigantic pages. */
  static inline bool hstate_is_gigantic(struct hstate *h)
  {
      (void)h;
      return false;
  }
  /* !CONFIG_HUGETLB_PAGE stub: always returns 1. */
  static inline unsigned int pages_per_huge_page(struct hstate *h)
  {
      (void)h;
      return 1U;
  }
  /* !CONFIG_HUGETLB_PAGE stubs: both evaluate to 0 and ignore their argument. */
  #define hstate_index_to_shift(index)    0
  #define hstate_index(h)                 0
  459. static inline pgoff_t basepage_index(struct page *page)
  460. {
  461. return page->index;
  462. }
  /* !CONFIG_HUGETLB_PAGE stubs: evaluate to 0 and false, ignoring arguments. */
  #define dissolve_free_huge_pages(s, e)     0
  #define hugepage_migration_supported(h)    false
  465. static inline spinlock_t *huge_pte_lockptr(struct hstate *h,
  466. struct mm_struct *mm, pte_t *pte)
  467. {
  468. return &mm->page_table_lock;
  469. }
  /* !CONFIG_HUGETLB_PAGE stub: there is no hugetlb usage to report. */
  static inline void hugetlb_report_usage(struct seq_file *f, struct mm_struct *m)
  {
  }

  /*
   * !CONFIG_HUGETLB_PAGE stub: no usage counter to update.
   *
   * Provided so that both halves of the add/sub pair exist in this
   * configuration and a caller of hugetlb_count_add() still builds.
   */
  static inline void hugetlb_count_add(long l, struct mm_struct *mm)
  {
  }

  /* !CONFIG_HUGETLB_PAGE stub: no usage counter to update. */
  static inline void hugetlb_count_sub(long l, struct mm_struct *mm)
  {
  }
  476. #endif /* CONFIG_HUGETLB_PAGE */
  477. static inline spinlock_t *huge_pte_lock(struct hstate *h,
  478. struct mm_struct *mm, pte_t *pte)
  479. {
  480. spinlock_t *ptl;
  481. ptl = huge_pte_lockptr(h, mm, pte);
  482. spin_lock(ptl);
  483. return ptl;
  484. }
  485. #endif /* _LINUX_HUGETLB_H */