9da61aef0f
free_pgtables() has special logic to call hugetlb_free_pgd_range() instead of the normal free_pgd_range() on hugepage VMAs. However, the test it uses to do so is incorrect: it calls is_hugepage_only_range on a hugepage sized range at the start of the vma. is_hugepage_only_range() will return true if the given range has any intersection with a hugepage address region, and in this case the given region need not be hugepage aligned. So, for example, this test can return true if called on, say, a 4k VMA immediately preceding a (nicely aligned) hugepage VMA. At present we get away with this because the powerpc version of hugetlb_free_pgd_range() is just a call to free_pgd_range(). On ia64 (the only other arch with a non-trivial is_hugepage_only_range()) we get away with it for a different reason; the hugepage area is not contiguous with the rest of the user address space, and VMAs are not permitted in between, so the test can't return a false positive there. Nonetheless this should be fixed. We do that in the patch below by replacing the is_hugepage_only_range() test with an explicit test of the VMA using is_vm_hugetlb_page(). This in turn changes behaviour for platforms where is_hugepage_only_range() returns false always (everything except powerpc and ia64). We address this by ensuring that hugetlb_free_pgd_range() is defined to be identical to free_pgd_range() (instead of a no-op) on everything except ia64. Even so, it will prevent some otherwise possible coalescing of calls down to free_pgd_range(). Since this only happens for hugepage VMAs, removing this small optimization seems unlikely to cause any trouble. This patch causes no regressions on the libhugetlbfs testsuite - ppc64 POWER5 (8-way), ppc64 G5 (2-way) and i386 Pentium M (UP). Signed-off-by: David Gibson <dwg@au1.ibm.com> Cc: William Lee Irwin III <wli@holomorphy.com> Acked-by: Hugh Dickins <hugh@veritas.com> Signed-off-by: Andrew Morton <akpm@osdl.org> Signed-off-by: Linus Torvalds <torvalds@osdl.org>
172 lines
5.3 KiB
C
172 lines
5.3 KiB
C
#ifndef _LINUX_HUGETLB_H
|
|
#define _LINUX_HUGETLB_H
|
|
|
|
#ifdef CONFIG_HUGETLB_PAGE
|
|
|
|
#include <linux/mempolicy.h>
|
|
#include <asm/tlbflush.h>
|
|
|
|
struct ctl_table;
|
|
|
|
static inline int is_vm_hugetlb_page(struct vm_area_struct *vma)
|
|
{
|
|
return vma->vm_flags & VM_HUGETLB;
|
|
}
|
|
|
|
int hugetlb_sysctl_handler(struct ctl_table *, int, struct file *, void __user *, size_t *, loff_t *);
|
|
int copy_hugetlb_page_range(struct mm_struct *, struct mm_struct *, struct vm_area_struct *);
|
|
int follow_hugetlb_page(struct mm_struct *, struct vm_area_struct *, struct page **, struct vm_area_struct **, unsigned long *, int *, int);
|
|
void unmap_hugepage_range(struct vm_area_struct *, unsigned long, unsigned long);
|
|
int hugetlb_prefault(struct address_space *, struct vm_area_struct *);
|
|
int hugetlb_report_meminfo(char *);
|
|
int hugetlb_report_node_meminfo(int, char *);
|
|
unsigned long hugetlb_total_pages(void);
|
|
int hugetlb_fault(struct mm_struct *mm, struct vm_area_struct *vma,
|
|
unsigned long address, int write_access);
|
|
|
|
extern unsigned long max_huge_pages;
|
|
extern const unsigned long hugetlb_zero, hugetlb_infinity;
|
|
extern int sysctl_hugetlb_shm_group;
|
|
|
|
/* arch callbacks */
|
|
|
|
pte_t *huge_pte_alloc(struct mm_struct *mm, unsigned long addr);
|
|
pte_t *huge_pte_offset(struct mm_struct *mm, unsigned long addr);
|
|
struct page *follow_huge_addr(struct mm_struct *mm, unsigned long address,
|
|
int write);
|
|
struct page *follow_huge_pmd(struct mm_struct *mm, unsigned long address,
|
|
pmd_t *pmd, int write);
|
|
int is_aligned_hugepage_range(unsigned long addr, unsigned long len);
|
|
int pmd_huge(pmd_t pmd);
|
|
void hugetlb_change_protection(struct vm_area_struct *vma,
|
|
unsigned long address, unsigned long end, pgprot_t newprot);
|
|
|
|
#ifndef ARCH_HAS_HUGEPAGE_ONLY_RANGE
|
|
#define is_hugepage_only_range(mm, addr, len) 0
|
|
#endif
|
|
|
|
#ifndef ARCH_HAS_HUGETLB_FREE_PGD_RANGE
|
|
#define hugetlb_free_pgd_range free_pgd_range
|
|
#endif
|
|
|
|
#ifndef ARCH_HAS_PREPARE_HUGEPAGE_RANGE
|
|
#define prepare_hugepage_range(addr, len) \
|
|
is_aligned_hugepage_range(addr, len)
|
|
#else
|
|
int prepare_hugepage_range(unsigned long addr, unsigned long len);
|
|
#endif
|
|
|
|
#ifndef ARCH_HAS_SETCLEAR_HUGE_PTE
|
|
#define set_huge_pte_at(mm, addr, ptep, pte) set_pte_at(mm, addr, ptep, pte)
|
|
#define huge_ptep_get_and_clear(mm, addr, ptep) ptep_get_and_clear(mm, addr, ptep)
|
|
#else
|
|
void set_huge_pte_at(struct mm_struct *mm, unsigned long addr,
|
|
pte_t *ptep, pte_t pte);
|
|
pte_t huge_ptep_get_and_clear(struct mm_struct *mm, unsigned long addr,
|
|
pte_t *ptep);
|
|
#endif
|
|
|
|
#ifndef ARCH_HAS_HUGETLB_PREFAULT_HOOK
|
|
#define hugetlb_prefault_arch_hook(mm) do { } while (0)
|
|
#else
|
|
void hugetlb_prefault_arch_hook(struct mm_struct *mm);
|
|
#endif
|
|
|
|
#else /* !CONFIG_HUGETLB_PAGE */
|
|
|
|
static inline int is_vm_hugetlb_page(struct vm_area_struct *vma)
|
|
{
|
|
return 0;
|
|
}
|
|
static inline unsigned long hugetlb_total_pages(void)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
#define follow_hugetlb_page(m,v,p,vs,a,b,i) ({ BUG(); 0; })
|
|
#define follow_huge_addr(mm, addr, write) ERR_PTR(-EINVAL)
|
|
#define copy_hugetlb_page_range(src, dst, vma) ({ BUG(); 0; })
|
|
#define hugetlb_prefault(mapping, vma) ({ BUG(); 0; })
|
|
#define unmap_hugepage_range(vma, start, end) BUG()
|
|
#define hugetlb_report_meminfo(buf) 0
|
|
#define hugetlb_report_node_meminfo(n, buf) 0
|
|
#define follow_huge_pmd(mm, addr, pmd, write) NULL
|
|
#define is_aligned_hugepage_range(addr, len) 0
|
|
#define prepare_hugepage_range(addr, len) (-EINVAL)
|
|
#define pmd_huge(x) 0
|
|
#define is_hugepage_only_range(mm, addr, len) 0
|
|
#define hugetlb_free_pgd_range(tlb, addr, end, floor, ceiling) ({BUG(); 0; })
|
|
#define hugetlb_fault(mm, vma, addr, write) ({ BUG(); 0; })
|
|
|
|
#define hugetlb_change_protection(vma, address, end, newprot)
|
|
|
|
#ifndef HPAGE_MASK
|
|
#define HPAGE_MASK PAGE_MASK /* Keep the compiler happy */
|
|
#define HPAGE_SIZE PAGE_SIZE
|
|
#endif
|
|
|
|
#endif /* !CONFIG_HUGETLB_PAGE */
|
|
|
|
#ifdef CONFIG_HUGETLBFS
|
|
struct hugetlbfs_config {
|
|
uid_t uid;
|
|
gid_t gid;
|
|
umode_t mode;
|
|
long nr_blocks;
|
|
long nr_inodes;
|
|
};
|
|
|
|
struct hugetlbfs_sb_info {
|
|
long max_blocks; /* blocks allowed */
|
|
long free_blocks; /* blocks free */
|
|
long max_inodes; /* inodes allowed */
|
|
long free_inodes; /* inodes free */
|
|
spinlock_t stat_lock;
|
|
};
|
|
|
|
|
|
struct hugetlbfs_inode_info {
|
|
struct shared_policy policy;
|
|
/* Protected by the (global) hugetlb_lock */
|
|
unsigned long prereserved_hpages;
|
|
struct inode vfs_inode;
|
|
};
|
|
|
|
static inline struct hugetlbfs_inode_info *HUGETLBFS_I(struct inode *inode)
|
|
{
|
|
return container_of(inode, struct hugetlbfs_inode_info, vfs_inode);
|
|
}
|
|
|
|
static inline struct hugetlbfs_sb_info *HUGETLBFS_SB(struct super_block *sb)
|
|
{
|
|
return sb->s_fs_info;
|
|
}
|
|
|
|
extern struct file_operations hugetlbfs_file_operations;
|
|
extern struct vm_operations_struct hugetlb_vm_ops;
|
|
struct file *hugetlb_zero_setup(size_t);
|
|
int hugetlb_extend_reservation(struct hugetlbfs_inode_info *info,
|
|
unsigned long atleast_hpages);
|
|
void hugetlb_truncate_reservation(struct hugetlbfs_inode_info *info,
|
|
unsigned long atmost_hpages);
|
|
int hugetlb_get_quota(struct address_space *mapping);
|
|
void hugetlb_put_quota(struct address_space *mapping);
|
|
|
|
static inline int is_file_hugepages(struct file *file)
|
|
{
|
|
return file->f_op == &hugetlbfs_file_operations;
|
|
}
|
|
|
|
static inline void set_file_hugepages(struct file *file)
|
|
{
|
|
file->f_op = &hugetlbfs_file_operations;
|
|
}
|
|
#else /* !CONFIG_HUGETLBFS */
|
|
|
|
#define is_file_hugepages(file) 0
|
|
#define set_file_hugepages(file) BUG()
|
|
#define hugetlb_zero_setup(size) ERR_PTR(-ENOSYS)
|
|
|
|
#endif /* !CONFIG_HUGETLBFS */
|
|
|
|
#endif /* _LINUX_HUGETLB_H */
|