blob: 087fd5f48c9128752cf7ff8a872f30afab057381 [file] [log] [blame]
Andrew Scullb4b6d4a2019-01-02 15:54:55 +00001/* SPDX-License-Identifier: GPL-2.0 */
2#ifndef _LINUX_HUGETLB_H
3#define _LINUX_HUGETLB_H
4
5#include <linux/mm_types.h>
6#include <linux/mmdebug.h>
7#include <linux/fs.h>
8#include <linux/hugetlb_inline.h>
9#include <linux/cgroup.h>
10#include <linux/list.h>
11#include <linux/kref.h>
12#include <asm/pgtable.h>
13
14struct ctl_table;
15struct user_struct;
16struct mmu_gather;
17
18#ifndef is_hugepd
19/*
20 * Some architectures require a hugepage directory format in order
21 * to support multiple hugepage sizes. For example
22 * a4fe3ce76 "powerpc/mm: Allow more flexible layouts for hugepage pagetables"
23 * introduced the same on powerpc. This allows for a more flexible hugepage
24 * pagetable layout.
25 */
26typedef struct { unsigned long pd; } hugepd_t;
27#define is_hugepd(hugepd) (0)
28#define __hugepd(x) ((hugepd_t) { (x) })
29static inline int gup_huge_pd(hugepd_t hugepd, unsigned long addr,
30 unsigned pdshift, unsigned long end,
31 int write, struct page **pages, int *nr)
32{
33 return 0;
34}
35#else
36extern int gup_huge_pd(hugepd_t hugepd, unsigned long addr,
37 unsigned pdshift, unsigned long end,
38 int write, struct page **pages, int *nr);
39#endif
40
41
42#ifdef CONFIG_HUGETLB_PAGE
43
44#include <linux/mempolicy.h>
45#include <linux/shm.h>
46#include <asm/tlbflush.h>
47
/*
 * Accounting state for a subpool of huge pages belonging to one hstate.
 * See hugepage_new_subpool() / hugepage_put_subpool() declared in this
 * header.
 */
48struct hugepage_subpool {
49 spinlock_t lock;
50 long count; /* NOTE(review): presumably a reference count - confirm. */
51 long max_hpages; /* Maximum huge pages or -1 if no maximum. */
52 long used_hpages; /* Used count against maximum, includes */
53 /* both alloced and reserved pages. */
54 struct hstate *hstate;
55 long min_hpages; /* Minimum huge pages or -1 if no minimum. */
56 long rsv_hpages; /* Pages reserved against global pool to */
57 /* satisfy minimum size. */
58};
59
/*
 * Reservation map. It embeds a kref (@refs); resv_map_alloc() returns a
 * new map and resv_map_release() takes a struct kref pointer.
 * NOTE(review): the roles of the remaining fields are inferred from their
 * names only - confirm against the implementation.
 */
60struct resv_map {
61 struct kref refs;
62 spinlock_t lock;
63 struct list_head regions;
64 long adds_in_progress;
65 struct list_head region_cache;
66 long region_cache_count; /* presumably entries on region_cache - TODO confirm */
67};
68extern struct resv_map *resv_map_alloc(void);
69void resv_map_release(struct kref *ref);
70
71extern spinlock_t hugetlb_lock;
72extern int hugetlb_max_hstate __read_mostly;
73#define for_each_hstate(h) \
74 for ((h) = hstates; (h) < &hstates[hugetlb_max_hstate]; (h)++)
75
76struct hugepage_subpool *hugepage_new_subpool(struct hstate *h, long max_hpages,
77 long min_hpages);
78void hugepage_put_subpool(struct hugepage_subpool *spool);
79
80void reset_vma_resv_huge_pages(struct vm_area_struct *vma);
81int hugetlb_sysctl_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
82int hugetlb_overcommit_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
83int hugetlb_treat_movable_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
84
85#ifdef CONFIG_NUMA
86int hugetlb_mempolicy_sysctl_handler(struct ctl_table *, int,
87 void __user *, size_t *, loff_t *);
88#endif
89
90int copy_hugetlb_page_range(struct mm_struct *, struct mm_struct *, struct vm_area_struct *);
91long follow_hugetlb_page(struct mm_struct *, struct vm_area_struct *,
92 struct page **, struct vm_area_struct **,
93 unsigned long *, unsigned long *, long, unsigned int,
94 int *);
95void unmap_hugepage_range(struct vm_area_struct *,
96 unsigned long, unsigned long, struct page *);
97void __unmap_hugepage_range_final(struct mmu_gather *tlb,
98 struct vm_area_struct *vma,
99 unsigned long start, unsigned long end,
100 struct page *ref_page);
101void __unmap_hugepage_range(struct mmu_gather *tlb, struct vm_area_struct *vma,
102 unsigned long start, unsigned long end,
103 struct page *ref_page);
104void hugetlb_report_meminfo(struct seq_file *);
105int hugetlb_report_node_meminfo(int, char *);
106void hugetlb_show_meminfo(void);
107unsigned long hugetlb_total_pages(void);
108vm_fault_t hugetlb_fault(struct mm_struct *mm, struct vm_area_struct *vma,
109 unsigned long address, unsigned int flags);
110int hugetlb_mcopy_atomic_pte(struct mm_struct *dst_mm, pte_t *dst_pte,
111 struct vm_area_struct *dst_vma,
112 unsigned long dst_addr,
113 unsigned long src_addr,
114 struct page **pagep);
115int hugetlb_reserve_pages(struct inode *inode, long from, long to,
116 struct vm_area_struct *vma,
117 vm_flags_t vm_flags);
118long hugetlb_unreserve_pages(struct inode *inode, long start, long end,
119 long freed);
120bool isolate_huge_page(struct page *page, struct list_head *list);
121void putback_active_hugepage(struct page *page);
122void move_hugetlb_state(struct page *oldpage, struct page *newpage, int reason);
123void free_huge_page(struct page *page);
124void hugetlb_fix_reserve_counts(struct inode *inode);
125extern struct mutex *hugetlb_fault_mutex_table;
126u32 hugetlb_fault_mutex_hash(struct hstate *h, struct mm_struct *mm,
127 struct vm_area_struct *vma,
128 struct address_space *mapping,
129 pgoff_t idx, unsigned long address);
130
131pte_t *huge_pmd_share(struct mm_struct *mm, unsigned long addr, pud_t *pud);
132
133extern int sysctl_hugetlb_shm_group;
134extern struct list_head huge_boot_pages;
135
136/* arch callbacks */
137
138pte_t *huge_pte_alloc(struct mm_struct *mm,
139 unsigned long addr, unsigned long sz);
140pte_t *huge_pte_offset(struct mm_struct *mm,
141 unsigned long addr, unsigned long sz);
142int huge_pmd_unshare(struct mm_struct *mm, unsigned long *addr, pte_t *ptep);
143void adjust_range_if_pmd_sharing_possible(struct vm_area_struct *vma,
144 unsigned long *start, unsigned long *end);
145struct page *follow_huge_addr(struct mm_struct *mm, unsigned long address,
146 int write);
147struct page *follow_huge_pd(struct vm_area_struct *vma,
148 unsigned long address, hugepd_t hpd,
149 int flags, int pdshift);
150struct page *follow_huge_pmd(struct mm_struct *mm, unsigned long address,
151 pmd_t *pmd, int flags);
152struct page *follow_huge_pud(struct mm_struct *mm, unsigned long address,
153 pud_t *pud, int flags);
154struct page *follow_huge_pgd(struct mm_struct *mm, unsigned long address,
155 pgd_t *pgd, int flags);
156
157int pmd_huge(pmd_t pmd);
158int pud_huge(pud_t pud);
159unsigned long hugetlb_change_protection(struct vm_area_struct *vma,
160 unsigned long address, unsigned long end, pgprot_t newprot);
161
162bool is_hugetlb_entry_migration(pte_t pte);
163
164#else /* !CONFIG_HUGETLB_PAGE */
165
/* !CONFIG_HUGETLB_PAGE stub: does nothing. */
static inline void reset_vma_resv_huge_pages(struct vm_area_struct *vma)
{
	/* nothing to do */
}
169
/* !CONFIG_HUGETLB_PAGE stub: always reports zero pages. */
static inline unsigned long hugetlb_total_pages(void)
{
	return 0UL;
}
174
175static inline int huge_pmd_unshare(struct mm_struct *mm, unsigned long *addr,
176 pte_t *ptep)
177{
178 return 0;
179}
180
/* !CONFIG_HUGETLB_PAGE stub: leaves *start and *end untouched. */
static inline void
adjust_range_if_pmd_sharing_possible(struct vm_area_struct *vma,
				     unsigned long *start, unsigned long *end)
{
	/* nothing to adjust */
}
186
187#define follow_hugetlb_page(m,v,p,vs,a,b,i,w,n) ({ BUG(); 0; })
188#define follow_huge_addr(mm, addr, write) ERR_PTR(-EINVAL)
189#define copy_hugetlb_page_range(src, dst, vma) ({ BUG(); 0; })
/* !CONFIG_HUGETLB_PAGE stub: writes nothing to @m. */
static inline void hugetlb_report_meminfo(struct seq_file *m)
{
	/* nothing to report */
}
193#define hugetlb_report_node_meminfo(n, buf) 0
/* !CONFIG_HUGETLB_PAGE stub: does nothing. */
static inline void hugetlb_show_meminfo(void)
{
	/* nothing to show */
}
197#define follow_huge_pd(vma, addr, hpd, flags, pdshift) NULL
198#define follow_huge_pmd(mm, addr, pmd, flags) NULL
199#define follow_huge_pud(mm, addr, pud, flags) NULL
200#define follow_huge_pgd(mm, addr, pgd, flags) NULL
201#define prepare_hugepage_range(file, addr, len) (-EINVAL)
202#define pmd_huge(x) 0
203#define pud_huge(x) 0
204#define is_hugepage_only_range(mm, addr, len) 0
205#define hugetlb_free_pgd_range(tlb, addr, end, floor, ceiling) ({BUG(); 0; })
206#define hugetlb_fault(mm, vma, addr, flags) ({ BUG(); 0; })
207#define hugetlb_mcopy_atomic_pte(dst_mm, dst_pte, dst_vma, dst_addr, \
208 src_addr, pagep) ({ BUG(); 0; })
209#define huge_pte_offset(mm, address, sz) 0
210
/* !CONFIG_HUGETLB_PAGE stub: never isolates anything, returns false. */
static inline bool isolate_huge_page(struct page *page,
				     struct list_head *list)
{
	return false;
}
215#define putback_active_hugepage(p) do {} while (0)
216#define move_hugetlb_state(old, new, reason) do {} while (0)
217
218static inline unsigned long hugetlb_change_protection(struct vm_area_struct *vma,
219 unsigned long address, unsigned long end, pgprot_t newprot)
220{
221 return 0;
222}
223
/* !CONFIG_HUGETLB_PAGE stub: must never be reached, so it hits BUG(). */
static inline void
__unmap_hugepage_range_final(struct mmu_gather *tlb,
			     struct vm_area_struct *vma,
			     unsigned long start, unsigned long end,
			     struct page *ref_page)
{
	BUG();
}
230
/* !CONFIG_HUGETLB_PAGE stub: must never be reached, so it hits BUG(). */
static inline void
__unmap_hugepage_range(struct mmu_gather *tlb, struct vm_area_struct *vma,
		       unsigned long start, unsigned long end,
		       struct page *ref_page)
{
	BUG();
}
237
238#endif /* !CONFIG_HUGETLB_PAGE */
239/*
240 * Hugepages at the page global directory level. If an arch supports
241 * hugepages at the pgd level, it needs to define this.
242 */
243#ifndef pgd_huge
244#define pgd_huge(x) 0
245#endif
246#ifndef p4d_huge
247#define p4d_huge(x) 0
248#endif
249
250#ifndef pgd_write
251static inline int pgd_write(pgd_t pgd)
252{
253 BUG();
254 return 0;
255}
256#endif
257
258#define HUGETLB_ANON_FILE "anon_hugepage"
259
/*
 * Kinds of hugetlb file.
 * NOTE(review): presumably passed as creat_flags to hugetlb_file_setup() -
 * confirm against the callers.
 */
260enum {
261 /*
262 * The file will be used as an shm file so shmfs accounting rules
263 * apply
264 */
265 HUGETLB_SHMFS_INODE = 1,
266 /*
267 * The file is being created on the internal vfs mount and shmfs
268 * accounting rules do not apply
269 */
270 HUGETLB_ANONHUGE_INODE = 2,
271};
272
273#ifdef CONFIG_HUGETLBFS
/*
 * Per-superblock hugetlbfs data; HUGETLBFS_SB() reads it back from
 * sb->s_fs_info.
 */
274struct hugetlbfs_sb_info {
275 long max_inodes; /* inodes allowed */
276 long free_inodes; /* inodes free */
277 spinlock_t stat_lock;
278 struct hstate *hstate; /* returned by hstate_inode() for inodes on this sb */
279 struct hugepage_subpool *spool;
280 kuid_t uid;
281 kgid_t gid;
282 umode_t mode;
283};
284
285static inline struct hugetlbfs_sb_info *HUGETLBFS_SB(struct super_block *sb)
286{
287 return sb->s_fs_info;
288}
289
/*
 * hugetlbfs inode container. The VFS inode is embedded as @vfs_inode so
 * that HUGETLBFS_I() can get back to this structure with container_of().
 */
290struct hugetlbfs_inode_info {
291 struct shared_policy policy;
292 struct inode vfs_inode;
293 unsigned int seals;
294};
295
296static inline struct hugetlbfs_inode_info *HUGETLBFS_I(struct inode *inode)
297{
298 return container_of(inode, struct hugetlbfs_inode_info, vfs_inode);
299}
300
301extern const struct file_operations hugetlbfs_file_operations;
302extern const struct vm_operations_struct hugetlb_vm_ops;
303struct file *hugetlb_file_setup(const char *name, size_t size, vm_flags_t acct,
304 struct user_struct **user, int creat_flags,
305 int page_size_log);
306
307static inline bool is_file_hugepages(struct file *file)
308{
309 if (file->f_op == &hugetlbfs_file_operations)
310 return true;
311
312 return is_file_shm_hugepages(file);
313}
314
315
316#else /* !CONFIG_HUGETLBFS */
317
318#define is_file_hugepages(file) false
319static inline struct file *
320hugetlb_file_setup(const char *name, size_t size, vm_flags_t acctflag,
321 struct user_struct **user, int creat_flags,
322 int page_size_log)
323{
324 return ERR_PTR(-ENOSYS);
325}
326
327#endif /* !CONFIG_HUGETLBFS */
328
329#ifdef HAVE_ARCH_HUGETLB_UNMAPPED_AREA
330unsigned long hugetlb_get_unmapped_area(struct file *file, unsigned long addr,
331 unsigned long len, unsigned long pgoff,
332 unsigned long flags);
333#endif /* HAVE_ARCH_HUGETLB_UNMAPPED_AREA */
334
335#ifdef CONFIG_HUGETLB_PAGE
336
337#define HSTATE_NAME_LEN 32
338/* Defines one hugetlb page size */
/*
 * The per-node arrays below are sized MAX_NUMNODES.
 * NOTE(review): counter semantics are inferred from field names - confirm
 * against the implementation.
 */
339struct hstate {
340 int next_nid_to_alloc;
341 int next_nid_to_free;
342 unsigned int order; /* huge page size is PAGE_SIZE << order, see huge_page_size() */
343 unsigned long mask; /* value returned by huge_page_mask() */
344 unsigned long max_huge_pages;
345 unsigned long nr_huge_pages;
346 unsigned long free_huge_pages;
347 unsigned long resv_huge_pages;
348 unsigned long surplus_huge_pages;
349 unsigned long nr_overcommit_huge_pages;
350 struct list_head hugepage_activelist;
351 struct list_head hugepage_freelists[MAX_NUMNODES];
352 unsigned int nr_huge_pages_node[MAX_NUMNODES];
353 unsigned int free_huge_pages_node[MAX_NUMNODES];
354 unsigned int surplus_huge_pages_node[MAX_NUMNODES];
355#ifdef CONFIG_CGROUP_HUGETLB
356 /* cgroup control files */
357 struct cftype cgroup_files[5];
358#endif
359 char name[HSTATE_NAME_LEN]; /* at most HSTATE_NAME_LEN bytes */
360};
361
/*
 * A huge page tied to an hstate.
 * NOTE(review): presumably queued on huge_boot_pages through @list during
 * boot - confirm against the allocator.
 */
362struct huge_bootmem_page {
363 struct list_head list;
364 struct hstate *hstate;
365};
366
367struct page *alloc_huge_page(struct vm_area_struct *vma,
368 unsigned long addr, int avoid_reserve);
369struct page *alloc_huge_page_node(struct hstate *h, int nid);
370struct page *alloc_huge_page_nodemask(struct hstate *h, int preferred_nid,
371 nodemask_t *nmask);
372struct page *alloc_huge_page_vma(struct hstate *h, struct vm_area_struct *vma,
373 unsigned long address);
374int huge_add_to_page_cache(struct page *page, struct address_space *mapping,
375 pgoff_t idx);
376
377/* arch callback */
378int __init __alloc_bootmem_huge_page(struct hstate *h);
379int __init alloc_bootmem_huge_page(struct hstate *h);
380
381void __init hugetlb_bad_size(void);
382void __init hugetlb_add_hstate(unsigned order);
383struct hstate *size_to_hstate(unsigned long size);
384
385#ifndef HUGE_MAX_HSTATE
386#define HUGE_MAX_HSTATE 1
387#endif
388
389extern struct hstate hstates[HUGE_MAX_HSTATE];
390extern unsigned int default_hstate_idx;
391
392#define default_hstate (hstates[default_hstate_idx])
393
394static inline struct hstate *hstate_inode(struct inode *i)
395{
396 return HUGETLBFS_SB(i->i_sb)->hstate;
397}
398
/* Return the hstate of the inode backing file @f. */
static inline struct hstate *hstate_file(struct file *f)
{
	struct inode *inode = file_inode(f);

	return hstate_inode(inode);
}
403
404static inline struct hstate *hstate_sizelog(int page_size_log)
405{
406 if (!page_size_log)
407 return &default_hstate;
408
409 return size_to_hstate(1UL << page_size_log);
410}
411
412static inline struct hstate *hstate_vma(struct vm_area_struct *vma)
413{
414 return hstate_file(vma->vm_file);
415}
416
417static inline unsigned long huge_page_size(struct hstate *h)
418{
419 return (unsigned long)PAGE_SIZE << h->order;
420}
421
422extern unsigned long vma_kernel_pagesize(struct vm_area_struct *vma);
423
424extern unsigned long vma_mmu_pagesize(struct vm_area_struct *vma);
425
426static inline unsigned long huge_page_mask(struct hstate *h)
427{
428 return h->mask;
429}
430
431static inline unsigned int huge_page_order(struct hstate *h)
432{
433 return h->order;
434}
435
436static inline unsigned huge_page_shift(struct hstate *h)
437{
438 return h->order + PAGE_SHIFT;
439}
440
441static inline bool hstate_is_gigantic(struct hstate *h)
442{
443 return huge_page_order(h) >= MAX_ORDER;
444}
445
446static inline unsigned int pages_per_huge_page(struct hstate *h)
447{
448 return 1 << h->order;
449}
450
/* Number of 512-byte blocks covered by one huge page of @h. */
static inline unsigned int blocks_per_huge_page(struct hstate *h)
{
	const unsigned long bytes = huge_page_size(h);

	return bytes / 512;
}
455
456#include <asm/hugetlb.h>
457
458#ifndef arch_make_huge_pte
459static inline pte_t arch_make_huge_pte(pte_t entry, struct vm_area_struct *vma,
460 struct page *page, int writable)
461{
462 return entry;
463}
464#endif
465
466static inline struct hstate *page_hstate(struct page *page)
467{
468 VM_BUG_ON_PAGE(!PageHuge(page), page);
469 return size_to_hstate(PAGE_SIZE << compound_order(page));
470}
471
472static inline unsigned hstate_index_to_shift(unsigned index)
473{
474 return hstates[index].order + PAGE_SHIFT;
475}
476
477static inline int hstate_index(struct hstate *h)
478{
479 return h - hstates;
480}
481
482pgoff_t __basepage_index(struct page *page);
483
484/* Return page->index in PAGE_SIZE units */
485static inline pgoff_t basepage_index(struct page *page)
486{
487 if (!PageCompound(page))
488 return page->index;
489
490 return __basepage_index(page);
491}
492
493extern int dissolve_free_huge_page(struct page *page);
494extern int dissolve_free_huge_pages(unsigned long start_pfn,
495 unsigned long end_pfn);
/*
 * With CONFIG_ARCH_ENABLE_HUGEPAGE_MIGRATION, true only when the huge page
 * shift of @h equals PMD_SHIFT or PGDIR_SHIFT.  Always false otherwise.
 */
static inline bool hugepage_migration_supported(struct hstate *h)
{
#ifdef CONFIG_ARCH_ENABLE_HUGEPAGE_MIGRATION
	const unsigned int shift = huge_page_shift(h);

	return shift == PMD_SHIFT || shift == PGDIR_SHIFT;
#else
	return false;
#endif
}
508
509static inline spinlock_t *huge_pte_lockptr(struct hstate *h,
510 struct mm_struct *mm, pte_t *pte)
511{
512 if (huge_page_size(h) == PMD_SIZE)
513 return pmd_lockptr(mm, (pmd_t *) pte);
514 VM_BUG_ON(huge_page_size(h) == PAGE_SIZE);
515 return &mm->page_table_lock;
516}
517
518#ifndef hugepages_supported
519/*
520 * Some platforms decide whether they support huge pages at boot
521 * time. Some of them, such as powerpc, set HPAGE_SHIFT to 0
522 * when there is no such support.
523 */
524#define hugepages_supported() (HPAGE_SHIFT != 0)
525#endif
526
527void hugetlb_report_usage(struct seq_file *m, struct mm_struct *mm);
528
529static inline void hugetlb_count_add(long l, struct mm_struct *mm)
530{
531 atomic_long_add(l, &mm->hugetlb_usage);
532}
533
534static inline void hugetlb_count_sub(long l, struct mm_struct *mm)
535{
536 atomic_long_sub(l, &mm->hugetlb_usage);
537}
538
539#ifndef set_huge_swap_pte_at
540static inline void set_huge_swap_pte_at(struct mm_struct *mm, unsigned long addr,
541 pte_t *ptep, pte_t pte, unsigned long sz)
542{
543 set_huge_pte_at(mm, addr, ptep, pte);
544}
545#endif
546#else /* CONFIG_HUGETLB_PAGE */
/* Empty placeholder so that struct hstate still exists without CONFIG_HUGETLB_PAGE. */
547struct hstate {};
548#define alloc_huge_page(v, a, r) NULL
549#define alloc_huge_page_node(h, nid) NULL
550#define alloc_huge_page_nodemask(h, preferred_nid, nmask) NULL
551#define alloc_huge_page_vma(h, vma, address) NULL
552#define alloc_bootmem_huge_page(h) NULL
553#define hstate_file(f) NULL
554#define hstate_sizelog(s) NULL
555#define hstate_vma(v) NULL
556#define hstate_inode(i) NULL
557#define page_hstate(page) NULL
558#define huge_page_size(h) PAGE_SIZE
559#define huge_page_mask(h) PAGE_MASK
560#define vma_kernel_pagesize(v) PAGE_SIZE
561#define vma_mmu_pagesize(v) PAGE_SIZE
562#define huge_page_order(h) 0
563#define huge_page_shift(h) PAGE_SHIFT
/* !CONFIG_HUGETLB_PAGE stub: always false. */
static inline bool hstate_is_gigantic(struct hstate *h)
{
	return false;
}
568
/* !CONFIG_HUGETLB_PAGE stub: always 1. */
static inline unsigned int pages_per_huge_page(struct hstate *h)
{
	return 1U;
}
573
/* !CONFIG_HUGETLB_PAGE stub: always 0, whatever @index is. */
static inline unsigned hstate_index_to_shift(unsigned index)
{
	return 0U;
}
578
/* !CONFIG_HUGETLB_PAGE stub: always 0. */
static inline int hstate_index(struct hstate *h)
{
	return 0;
}
583
584static inline pgoff_t basepage_index(struct page *page)
585{
586 return page->index;
587}
588
/* !CONFIG_HUGETLB_PAGE stub: always returns 0. */
static inline int dissolve_free_huge_page(struct page *page)
{
	return 0;
}
593
/* !CONFIG_HUGETLB_PAGE stub: always returns 0 for any pfn range. */
static inline int dissolve_free_huge_pages(unsigned long start_pfn,
					   unsigned long end_pfn)
{
	return 0;
}
599
/* !CONFIG_HUGETLB_PAGE stub: always false. */
static inline bool hugepage_migration_supported(struct hstate *h)
{
	return false;
}
604
605static inline spinlock_t *huge_pte_lockptr(struct hstate *h,
606 struct mm_struct *mm, pte_t *pte)
607{
608 return &mm->page_table_lock;
609}
610
/* !CONFIG_HUGETLB_PAGE stub: writes nothing to @f. */
static inline void hugetlb_report_usage(struct seq_file *f,
					struct mm_struct *m)
{
	/* nothing to report */
}
614
/* !CONFIG_HUGETLB_PAGE stub: no counter is touched. */
static inline void hugetlb_count_sub(long l, struct mm_struct *mm)
{
	/* nothing to account */
}
618
619static inline void set_huge_swap_pte_at(struct mm_struct *mm, unsigned long addr,
620 pte_t *ptep, pte_t pte, unsigned long sz)
621{
622}
623#endif /* CONFIG_HUGETLB_PAGE */
624
625static inline spinlock_t *huge_pte_lock(struct hstate *h,
626 struct mm_struct *mm, pte_t *pte)
627{
628 spinlock_t *ptl;
629
630 ptl = huge_pte_lockptr(h, mm, pte);
631 spin_lock(ptl);
632 return ptl;
633}
634
635#endif /* _LINUX_HUGETLB_H */