hugetlb.h 15.8 KB
Newer Older
Linus Torvalds's avatar
Linus Torvalds committed
1 2 3
#ifndef _LINUX_HUGETLB_H
#define _LINUX_HUGETLB_H

Linus Torvalds's avatar
Linus Torvalds committed
4
#include <linux/mm_types.h>
5
#include <linux/mmdebug.h>
Alexey Dobriyan's avatar
Alexey Dobriyan committed
6
#include <linux/fs.h>
7
#include <linux/hugetlb_inline.h>
8
#include <linux/cgroup.h>
9 10
#include <linux/list.h>
#include <linux/kref.h>
11
#include <asm/pgtable.h>
Alexey Dobriyan's avatar
Alexey Dobriyan committed
12

13 14
struct ctl_table;
struct user_struct;
15
struct mmu_gather;
16

17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40
#ifndef is_hugepd
/*
 * Some architectures require a hugepage directory format in order to
 * support multiple hugepage sizes. For example, commit a4fe3ce76
 * "powerpc/mm: Allow more flexible layouts for hugepage pagetables"
 * introduced this on powerpc. It allows for a more flexible hugepage
 * pagetable layout.
 */
typedef struct { unsigned long pd; } hugepd_t;
#define is_hugepd(hugepd) (0)
#define __hugepd(x) ((hugepd_t) { (x) })
/*
 * Fallback used when no is_hugepd definition exists (see the enclosing
 * #ifndef is_hugepd): is_hugepd() is a constant 0 here, and this stub
 * ignores all of its arguments and always returns 0.
 */
static inline int gup_huge_pd(hugepd_t hugepd, unsigned long addr,
			      unsigned pdshift, unsigned long end,
			      int write, struct page **pages, int *nr)
{
	return 0;
}
#else
extern int gup_huge_pd(hugepd_t hugepd, unsigned long addr,
		       unsigned pdshift, unsigned long end,
		       int write, struct page **pages, int *nr);
#endif


Linus Torvalds's avatar
Linus Torvalds committed
41 42 43
#ifdef CONFIG_HUGETLB_PAGE

#include <linux/mempolicy.h>
44
#include <linux/shm.h>
David Gibson's avatar
David Gibson committed
45
#include <asm/tlbflush.h>
Linus Torvalds's avatar
Linus Torvalds committed
46

47 48 49
/* Per-subpool huge page accounting; fields are documented inline. */
struct hugepage_subpool {
	spinlock_t lock;
	long count;
	long max_hpages;	/* Maximum huge pages or -1 if no maximum. */
	long used_hpages;	/* Used count against maximum, includes */
				/* both alloced and reserved pages. */
	struct hstate *hstate;
	long min_hpages;	/* Minimum huge pages or -1 if no minimum. */
	long rsv_hpages;	/* Pages reserved against global pool to */
				/* satisfy minimum size. */
};

59 60
struct resv_map {
	struct kref refs;
61
	spinlock_t lock;
62
	struct list_head regions;
63 64 65
	long adds_in_progress;
	struct list_head region_cache;
	long region_cache_count;
66 67 68 69
};
extern struct resv_map *resv_map_alloc(void);
void resv_map_release(struct kref *ref);

70 71 72 73 74
extern spinlock_t hugetlb_lock;
extern int hugetlb_max_hstate __read_mostly;
/*
 * Iterate @h over the entries of the global hstates[] array, from
 * hstates[0] up to (but not including) hstates[hugetlb_max_hstate].
 * @h must be an assignable struct hstate pointer.
 */
#define for_each_hstate(h) \
	for ((h) = hstates; (h) < &hstates[hugetlb_max_hstate]; (h)++)

75 76
struct hugepage_subpool *hugepage_new_subpool(struct hstate *h, long max_hpages,
						long min_hpages);
77 78
void hugepage_put_subpool(struct hugepage_subpool *spool);

79
void reset_vma_resv_huge_pages(struct vm_area_struct *vma);
80 81 82
int hugetlb_sysctl_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
int hugetlb_overcommit_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
int hugetlb_treat_movable_handler(struct ctl_table *, int, void __user *, size_t *, loff_t *);
83 84 85 86 87 88

#ifdef CONFIG_NUMA
int hugetlb_mempolicy_sysctl_handler(struct ctl_table *, int,
					void __user *, size_t *, loff_t *);
#endif

Linus Torvalds's avatar
Linus Torvalds committed
89
int copy_hugetlb_page_range(struct mm_struct *, struct mm_struct *, struct vm_area_struct *);
90 91
long follow_hugetlb_page(struct mm_struct *, struct vm_area_struct *,
			 struct page **, struct vm_area_struct **,
92 93
			 unsigned long *, unsigned long *, long, unsigned int,
			 int *);
94
void unmap_hugepage_range(struct vm_area_struct *,
95
			  unsigned long, unsigned long, struct page *);
96 97 98 99
void __unmap_hugepage_range_final(struct mmu_gather *tlb,
			  struct vm_area_struct *vma,
			  unsigned long start, unsigned long end,
			  struct page *ref_page);
100 101 102
void __unmap_hugepage_range(struct mmu_gather *tlb, struct vm_area_struct *vma,
				unsigned long start, unsigned long end,
				struct page *ref_page);
103
void hugetlb_report_meminfo(struct seq_file *);
Linus Torvalds's avatar
Linus Torvalds committed
104
int hugetlb_report_node_meminfo(int, char *);
105
void hugetlb_show_meminfo(void);
Linus Torvalds's avatar
Linus Torvalds committed
106
unsigned long hugetlb_total_pages(void);
107
int hugetlb_fault(struct mm_struct *mm, struct vm_area_struct *vma,
108
			unsigned long address, unsigned int flags);
109 110 111 112 113
int hugetlb_mcopy_atomic_pte(struct mm_struct *dst_mm, pte_t *dst_pte,
				struct vm_area_struct *dst_vma,
				unsigned long dst_addr,
				unsigned long src_addr,
				struct page **pagep);
114
int hugetlb_reserve_pages(struct inode *inode, long from, long to,
115
						struct vm_area_struct *vma,
116
						vm_flags_t vm_flags);
117 118
long hugetlb_unreserve_pages(struct inode *inode, long start, long end,
						long freed);
119
int dequeue_hwpoisoned_huge_page(struct page *page);
120 121
bool isolate_huge_page(struct page *page, struct list_head *list);
void putback_active_hugepage(struct page *page);
122
void free_huge_page(struct page *page);
123
void hugetlb_fix_reserve_counts(struct inode *inode);
124 125 126 127 128
extern struct mutex *hugetlb_fault_mutex_table;
u32 hugetlb_fault_mutex_hash(struct hstate *h, struct mm_struct *mm,
				struct vm_area_struct *vma,
				struct address_space *mapping,
				pgoff_t idx, unsigned long address);
Linus Torvalds's avatar
Linus Torvalds committed
129

130 131
pte_t *huge_pmd_share(struct mm_struct *mm, unsigned long addr, pud_t *pud);

132
extern int hugepages_treat_as_movable;
Linus Torvalds's avatar
Linus Torvalds committed
133
extern int sysctl_hugetlb_shm_group;
134
extern struct list_head huge_boot_pages;
Linus Torvalds's avatar
Linus Torvalds committed
135

David Gibson's avatar
David Gibson committed
136 137
/* arch callbacks */

138 139
pte_t *huge_pte_alloc(struct mm_struct *mm,
			unsigned long addr, unsigned long sz);
140 141
pte_t *huge_pte_offset(struct mm_struct *mm,
		       unsigned long addr, unsigned long sz);
142
int huge_pmd_unshare(struct mm_struct *mm, unsigned long *addr, pte_t *ptep);
David Gibson's avatar
David Gibson committed
143 144
struct page *follow_huge_addr(struct mm_struct *mm, unsigned long address,
			      int write);
145 146 147
struct page *follow_huge_pd(struct vm_area_struct *vma,
			    unsigned long address, hugepd_t hpd,
			    int flags, int pdshift);
David Gibson's avatar
David Gibson committed
148
struct page *follow_huge_pmd(struct mm_struct *mm, unsigned long address,
149
				pmd_t *pmd, int flags);
Andi Kleen's avatar
Andi Kleen committed
150
struct page *follow_huge_pud(struct mm_struct *mm, unsigned long address,
151
				pud_t *pud, int flags);
152 153 154
struct page *follow_huge_pgd(struct mm_struct *mm, unsigned long address,
			     pgd_t *pgd, int flags);

David Gibson's avatar
David Gibson committed
155
int pmd_huge(pmd_t pmd);
156
int pud_huge(pud_t pud);
157
unsigned long hugetlb_change_protection(struct vm_area_struct *vma,
158
		unsigned long address, unsigned long end, pgprot_t newprot);
David Gibson's avatar
David Gibson committed
159

160
bool is_hugetlb_entry_migration(pte_t pte);
Linus Torvalds's avatar
Linus Torvalds committed
161 162
#else /* !CONFIG_HUGETLB_PAGE */

163 164 165 166
/* !CONFIG_HUGETLB_PAGE stub: nothing to reset, so this does nothing. */
static inline void reset_vma_resv_huge_pages(struct vm_area_struct *vma)
{
}

Linus Torvalds's avatar
Linus Torvalds committed
167 168 169 170 171
/* !CONFIG_HUGETLB_PAGE stub: always reports 0. */
static inline unsigned long hugetlb_total_pages(void)
{
	return 0;
}

172
#define follow_hugetlb_page(m,v,p,vs,a,b,i,w,n)	({ BUG(); 0; })
Linus Torvalds's avatar
Linus Torvalds committed
173 174
#define follow_huge_addr(mm, addr, write)	ERR_PTR(-EINVAL)
#define copy_hugetlb_page_range(src, dst, vma)	({ BUG(); 0; })
175 176 177
/* !CONFIG_HUGETLB_PAGE stub: writes nothing to @m. */
static inline void hugetlb_report_meminfo(struct seq_file *m)
{
}
Linus Torvalds's avatar
Linus Torvalds committed
178
#define hugetlb_report_node_meminfo(n, buf)	0
179 180 181
/* !CONFIG_HUGETLB_PAGE stub: does nothing. */
static inline void hugetlb_show_meminfo(void)
{
}
182
#define follow_huge_pd(vma, addr, hpd, flags, pdshift) NULL
183 184
#define follow_huge_pmd(mm, addr, pmd, flags)	NULL
#define follow_huge_pud(mm, addr, pud, flags)	NULL
185
#define follow_huge_pgd(mm, addr, pgd, flags)	NULL
186
#define prepare_hugepage_range(file, addr, len)	(-EINVAL)
Linus Torvalds's avatar
Linus Torvalds committed
187
#define pmd_huge(x)	0
Andi Kleen's avatar
Andi Kleen committed
188
#define pud_huge(x)	0
Linus Torvalds's avatar
Linus Torvalds committed
189
#define is_hugepage_only_range(mm, addr, len)	0
190
#define hugetlb_free_pgd_range(tlb, addr, end, floor, ceiling) ({BUG(); 0; })
191
#define hugetlb_fault(mm, vma, addr, flags)	({ BUG(); 0; })
192 193
#define hugetlb_mcopy_atomic_pte(dst_mm, dst_pte, dst_vma, dst_addr, \
				src_addr, pagep)	({ BUG(); 0; })
194
#define huge_pte_offset(mm, address, sz)	0
195 196 197 198 199
/* !CONFIG_HUGETLB_PAGE stub: ignores @page and always returns 0. */
static inline int dequeue_hwpoisoned_huge_page(struct page *page)
{
	return 0;
}

200 201 202 203
/* !CONFIG_HUGETLB_PAGE stub: never isolates anything; always returns false. */
static inline bool isolate_huge_page(struct page *page, struct list_head *list)
{
	return false;
}
204
#define putback_active_hugepage(p)	do {} while (0)
Linus Torvalds's avatar
Linus Torvalds committed
205

206 207 208 209 210
/* !CONFIG_HUGETLB_PAGE stub: changes nothing and always returns 0. */
static inline unsigned long hugetlb_change_protection(struct vm_area_struct *vma,
		unsigned long address, unsigned long end, pgprot_t newprot)
{
	return 0;
}
211

212 213 214 215 216 217 218
/*
 * !CONFIG_HUGETLB_PAGE stub: calling this is treated as a bug; the body
 * is an unconditional BUG().
 */
static inline void __unmap_hugepage_range_final(struct mmu_gather *tlb,
			struct vm_area_struct *vma, unsigned long start,
			unsigned long end, struct page *ref_page)
{
	BUG();
}

219 220 221 222 223 224 225
/*
 * !CONFIG_HUGETLB_PAGE stub: calling this is treated as a bug; the body
 * is an unconditional BUG().
 */
static inline void __unmap_hugepage_range(struct mmu_gather *tlb,
			struct vm_area_struct *vma, unsigned long start,
			unsigned long end, struct page *ref_page)
{
	BUG();
}

Linus Torvalds's avatar
Linus Torvalds committed
226
#endif /* !CONFIG_HUGETLB_PAGE */
227 228 229 230 231 232 233
/*
 * Hugepages at the page global directory level. If an architecture
 * supports hugepages at the pgd level, it needs to define this.
 */
#ifndef pgd_huge
#define pgd_huge(x)	0
#endif
234 235 236
#ifndef p4d_huge
#define p4d_huge(x)	0
#endif
237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253

#ifndef pgd_write
/*
 * Fallback used when no pgd_write macro is defined (see the enclosing
 * #ifndef): reaching it is a bug, so it calls BUG(); the return of 0 only
 * satisfies the int return type.
 */
static inline int pgd_write(pgd_t pgd)
{
	BUG();
	return 0;
}
#endif

#ifndef pud_write
/*
 * Fallback used when no pud_write macro is defined (see the enclosing
 * #ifndef): reaching it is a bug, so it calls BUG(); the return of 0 only
 * satisfies the int return type.
 */
static inline int pud_write(pud_t pud)
{
	BUG();
	return 0;
}
#endif

254 255
#define HUGETLB_ANON_FILE "anon_hugepage"

256 257 258 259 260 261
/* Kinds of hugetlb inode; the values are fixed at 1 and 2. */
enum {
	/*
	 * The file will be used as an shm file, so shmfs accounting rules
	 * apply.
	 */
	HUGETLB_SHMFS_INODE     = 1,
	/*
	 * The file is being created on the internal vfs mount and shmfs
	 * accounting rules do not apply.
	 */
	HUGETLB_ANONHUGE_INODE  = 2,
};

Linus Torvalds's avatar
Linus Torvalds committed
269 270 271 272 273
#ifdef CONFIG_HUGETLBFS
/*
 * Per-superblock hugetlbfs data. HUGETLBFS_SB() returns sb->s_fs_info as a
 * pointer to this structure.
 */
struct hugetlbfs_sb_info {
	long	max_inodes;   /* inodes allowed */
	long	free_inodes;  /* inodes free */
	spinlock_t	stat_lock;
	struct hstate *hstate;
	struct hugepage_subpool *spool;
};

/*
 * Return the hugetlbfs private data attached to @sb. This is simply
 * sb->s_fs_info; no check is made that @sb really is a hugetlbfs
 * superblock.
 */
static inline struct hugetlbfs_sb_info *HUGETLBFS_SB(struct super_block *sb)
{
	return sb->s_fs_info;
}

283
extern const struct file_operations hugetlbfs_file_operations;
284
extern const struct vm_operations_struct hugetlb_vm_ops;
285
struct file *hugetlb_file_setup(const char *name, size_t size, vm_flags_t acct,
286 287
				struct user_struct **user, int creat_flags,
				int page_size_log);
Linus Torvalds's avatar
Linus Torvalds committed
288

289
static inline bool is_file_hugepages(struct file *file)
Linus Torvalds's avatar
Linus Torvalds committed
290
{
291
	if (file->f_op == &hugetlbfs_file_operations)
292
		return true;
293

294
	return is_file_shm_hugepages(file);
Linus Torvalds's avatar
Linus Torvalds committed
295 296
}

297

Linus Torvalds's avatar
Linus Torvalds committed
298 299
#else /* !CONFIG_HUGETLBFS */

300
#define is_file_hugepages(file)			false
301
static inline struct file *
302 303
hugetlb_file_setup(const char *name, size_t size, vm_flags_t acctflag,
		struct user_struct **user, int creat_flags,
304
		int page_size_log)
305 306 307
{
	return ERR_PTR(-ENOSYS);
}
Linus Torvalds's avatar
Linus Torvalds committed
308 309 310

#endif /* !CONFIG_HUGETLBFS */

311 312 313 314 315 316
#ifdef HAVE_ARCH_HUGETLB_UNMAPPED_AREA
unsigned long hugetlb_get_unmapped_area(struct file *file, unsigned long addr,
					unsigned long len, unsigned long pgoff,
					unsigned long flags);
#endif /* HAVE_ARCH_HUGETLB_UNMAPPED_AREA */

317 318
#ifdef CONFIG_HUGETLB_PAGE

319
#define HSTATE_NAME_LEN 32
320 321
/* Defines one hugetlb page size */
struct hstate {
322 323
	int next_nid_to_alloc;
	int next_nid_to_free;
324 325 326 327 328 329 330 331
	unsigned int order;
	unsigned long mask;
	unsigned long max_huge_pages;
	unsigned long nr_huge_pages;
	unsigned long free_huge_pages;
	unsigned long resv_huge_pages;
	unsigned long surplus_huge_pages;
	unsigned long nr_overcommit_huge_pages;
332
	struct list_head hugepage_activelist;
333 334 335 336
	struct list_head hugepage_freelists[MAX_NUMNODES];
	unsigned int nr_huge_pages_node[MAX_NUMNODES];
	unsigned int free_huge_pages_node[MAX_NUMNODES];
	unsigned int surplus_huge_pages_node[MAX_NUMNODES];
337 338 339 340
#ifdef CONFIG_CGROUP_HUGETLB
	/* cgroup control files */
	struct cftype cgroup_files[5];
#endif
341
	char name[HSTATE_NAME_LEN];
342 343
};

344 345 346
/*
 * List node pairing a list linkage with the hstate it belongs to. The
 * physical address field only exists on CONFIG_HIGHMEM builds.
 */
struct huge_bootmem_page {
	struct list_head list;
	struct hstate *hstate;
#ifdef CONFIG_HIGHMEM
	phys_addr_t phys;
#endif
};

352 353
struct page *alloc_huge_page(struct vm_area_struct *vma,
				unsigned long addr, int avoid_reserve);
354
struct page *alloc_huge_page_node(struct hstate *h, int nid);
355 356
struct page *alloc_huge_page_noerr(struct vm_area_struct *vma,
				unsigned long addr, int avoid_reserve);
357 358
int huge_add_to_page_cache(struct page *page, struct address_space *mapping,
			pgoff_t idx);
359

360 361 362
/* arch callback */
int __init alloc_bootmem_huge_page(struct hstate *h);

363
void __init hugetlb_bad_size(void);
364 365 366 367 368 369 370 371 372 373 374
void __init hugetlb_add_hstate(unsigned order);
struct hstate *size_to_hstate(unsigned long size);

#ifndef HUGE_MAX_HSTATE
#define HUGE_MAX_HSTATE 1
#endif

extern struct hstate hstates[HUGE_MAX_HSTATE];
extern unsigned int default_hstate_idx;

#define default_hstate (hstates[default_hstate_idx])
375

376
static inline struct hstate *hstate_inode(struct inode *i)
377
{
378
	return HUGETLBFS_SB(i->i_sb)->hstate;
379 380 381 382
}

/* Return the hstate of the inode backing file @f (see hstate_inode()). */
static inline struct hstate *hstate_file(struct file *f)
{
	return hstate_inode(file_inode(f));
}

386 387 388 389
static inline struct hstate *hstate_sizelog(int page_size_log)
{
	if (!page_size_log)
		return &default_hstate;
390 391

	return size_to_hstate(1UL << page_size_log);
392 393
}

394
static inline struct hstate *hstate_vma(struct vm_area_struct *vma)
395
{
396
	return hstate_file(vma->vm_file);
397 398 399 400 401 402 403
}

/*
 * Size of one huge page of @h: PAGE_SIZE shifted left by the hstate's
 * order. The cast makes the shift happen in unsigned long.
 */
static inline unsigned long huge_page_size(struct hstate *h)
{
	return (unsigned long)PAGE_SIZE << h->order;
}

404 405
extern unsigned long vma_kernel_pagesize(struct vm_area_struct *vma);

406 407
extern unsigned long vma_mmu_pagesize(struct vm_area_struct *vma);

408 409 410 411 412 413 414 415 416 417 418 419 420 421 422
/* Accessor: return the mask stored in @h. */
static inline unsigned long huge_page_mask(struct hstate *h)
{
	return h->mask;
}

/* Accessor: return the order stored in @h. */
static inline unsigned int huge_page_order(struct hstate *h)
{
	return h->order;
}

/* Shift of a huge page of @h: the hstate's order plus PAGE_SHIFT. */
static inline unsigned huge_page_shift(struct hstate *h)
{
	return h->order + PAGE_SHIFT;
}

423 424 425 426 427
/* A hstate counts as gigantic when its order is at least MAX_ORDER. */
static inline bool hstate_is_gigantic(struct hstate *h)
{
	return huge_page_order(h) >= MAX_ORDER;
}

428 429 430 431 432 433 434 435 436 437 438 439
/*
 * Number of base pages in one huge page of @h, i.e. 2^order.
 * NOTE(review): the shift is done on a signed int constant, so it is only
 * well defined while h->order stays below 31.
 */
static inline unsigned int pages_per_huge_page(struct hstate *h)
{
	return 1 << h->order;
}

/*
 * Huge page size of @h divided by 512.
 * NOTE(review): 512 is presumably the block (sector) size in bytes --
 * confirm. The unsigned long quotient is narrowed to unsigned int.
 */
static inline unsigned int blocks_per_huge_page(struct hstate *h)
{
	return huge_page_size(h) / 512;
}

#include <asm/hugetlb.h>

440 441 442 443 444 445 446 447
#ifndef arch_make_huge_pte
/*
 * Default used when no arch_make_huge_pte is defined (see the enclosing
 * #ifndef): @entry is returned unchanged and the other arguments are
 * ignored.
 */
static inline pte_t arch_make_huge_pte(pte_t entry, struct vm_area_struct *vma,
				       struct page *page, int writable)
{
	return entry;
}
#endif

448 449
static inline struct hstate *page_hstate(struct page *page)
{
450
	VM_BUG_ON_PAGE(!PageHuge(page), page);
451 452 453
	return size_to_hstate(PAGE_SIZE << compound_order(page));
}

454 455 456 457 458
/*
 * Page shift (order + PAGE_SHIFT) of hstates[@index]. @index is not range
 * checked here; the caller must pass a valid index into hstates[].
 */
static inline unsigned hstate_index_to_shift(unsigned index)
{
	return hstates[index].order + PAGE_SHIFT;
}

459 460 461 462 463
/*
 * Index of @h within the global hstates[] array, computed by pointer
 * subtraction; @h must point into that array.
 */
static inline int hstate_index(struct hstate *h)
{
	return h - hstates;
}

464 465 466 467 468 469 470 471 472 473 474
pgoff_t __basepage_index(struct page *page);

/*
 * Return page->index in PAGE_SIZE units. Non-compound pages already carry
 * it in page->index; compound pages are handed to __basepage_index().
 */
static inline pgoff_t basepage_index(struct page *page)
{
	return PageCompound(page) ? __basepage_index(page) : page->index;
}

475 476
extern int dissolve_free_huge_pages(unsigned long start_pfn,
				    unsigned long end_pfn);
477
static inline bool hugepage_migration_supported(struct hstate *h)
478
{
479
#ifdef CONFIG_ARCH_ENABLE_HUGEPAGE_MIGRATION
480 481 482 483 484
	if ((huge_page_shift(h) == PMD_SHIFT) ||
		(huge_page_shift(h) == PGDIR_SHIFT))
		return true;
	else
		return false;
485
#else
486
	return false;
487
#endif
488
}
489

490 491 492 493 494 495 496 497 498
/*
 * Pick the spinlock that protects huge PTE @pte in @mm.
 *
 * For PMD_SIZE huge pages the lock comes from pmd_lockptr(), with @pte
 * reinterpreted as a pmd_t pointer. Every other size uses
 * mm->page_table_lock; a huge page size equal to PAGE_SIZE is flagged by
 * VM_BUG_ON().
 */
static inline spinlock_t *huge_pte_lockptr(struct hstate *h,
					   struct mm_struct *mm, pte_t *pte)
{
	if (huge_page_size(h) == PMD_SIZE)
		return pmd_lockptr(mm, (pmd_t *) pte);
	VM_BUG_ON(huge_page_size(h) == PAGE_SIZE);
	return &mm->page_table_lock;
}

499 500 501 502 503 504 505 506
#ifndef hugepages_supported
/*
 * Some platforms decide at boot time whether they support huge pages.
 * Some of them, such as powerpc, set HPAGE_SHIFT to 0 when there is
 * no such support.
 */
#define hugepages_supported() (HPAGE_SHIFT != 0)
#endif
507

508 509 510 511 512 513 514 515 516 517 518
void hugetlb_report_usage(struct seq_file *m, struct mm_struct *mm);

/* Atomically add @l to mm->hugetlb_usage. */
static inline void hugetlb_count_add(long l, struct mm_struct *mm)
{
	atomic_long_add(l, &mm->hugetlb_usage);
}

/* Atomically subtract @l from mm->hugetlb_usage. */
static inline void hugetlb_count_sub(long l, struct mm_struct *mm)
{
	atomic_long_sub(l, &mm->hugetlb_usage);
}
519
#else	/* CONFIG_HUGETLB_PAGE */
520
struct hstate {};
521
#define alloc_huge_page(v, a, r) NULL
522
#define alloc_huge_page_node(h, nid) NULL
523
#define alloc_huge_page_noerr(v, a, r) NULL
524
#define alloc_bootmem_huge_page(h) NULL
525
#define hstate_file(f) NULL
526
#define hstate_sizelog(s) NULL
527 528
#define hstate_vma(v) NULL
#define hstate_inode(i) NULL
529
#define page_hstate(page) NULL
530 531
#define huge_page_size(h) PAGE_SIZE
#define huge_page_mask(h) PAGE_MASK
532
#define vma_kernel_pagesize(v) PAGE_SIZE
533
#define vma_mmu_pagesize(v) PAGE_SIZE
534 535
#define huge_page_order(h) 0
#define huge_page_shift(h) PAGE_SHIFT
536 537 538 539 540
/* !CONFIG_HUGETLB_PAGE stub: no hstate is ever gigantic. */
static inline bool hstate_is_gigantic(struct hstate *h)
{
	return false;
}

541 542 543 544
/* !CONFIG_HUGETLB_PAGE stub: always 1, regardless of @h. */
static inline unsigned int pages_per_huge_page(struct hstate *h)
{
	return 1;
}
545
#define hstate_index_to_shift(index) 0
546
#define hstate_index(h) 0
547 548 549 550 551

/* !CONFIG_HUGETLB_PAGE stub: the index is simply page->index. */
static inline pgoff_t basepage_index(struct page *page)
{
	return page->index;
}
552
#define dissolve_free_huge_pages(s, e)	0
553
#define hugepage_migration_supported(h)	false
554 555 556 557 558 559

/*
 * !CONFIG_HUGETLB_PAGE stub: always returns mm->page_table_lock; @h and
 * @pte are ignored.
 */
static inline spinlock_t *huge_pte_lockptr(struct hstate *h,
					   struct mm_struct *mm, pte_t *pte)
{
	return &mm->page_table_lock;
}
560 561 562 563 564 565 566 567

/* !CONFIG_HUGETLB_PAGE stub: reports nothing. */
static inline void hugetlb_report_usage(struct seq_file *f, struct mm_struct *m)
{
}

/* !CONFIG_HUGETLB_PAGE stub: there is no usage counter to adjust. */
static inline void hugetlb_count_sub(long l, struct mm_struct *mm)
{
}
568
#endif	/* CONFIG_HUGETLB_PAGE */
569

570 571 572 573 574 575 576 577 578 579
/*
 * Take the spinlock that huge_pte_lockptr() selects for @pte and hand it
 * back, so the caller can release that same lock afterwards.
 */
static inline spinlock_t *huge_pte_lock(struct hstate *h,
					struct mm_struct *mm, pte_t *pte)
{
	spinlock_t *lock = huge_pte_lockptr(h, mm, pte);

	spin_lock(lock);
	return lock;
}

Linus Torvalds's avatar
Linus Torvalds committed
580
#endif /* _LINUX_HUGETLB_H */