// SPDX-License-Identifier: GPL-2.0
/*
 * IA-32 Huge TLB Page Support for Kernel.
 *
 * Copyright (C) 2002, Rohit Seth <rohit.seth@intel.com>
 */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <linux/init.h>
9*4882a593Smuzhiyun #include <linux/fs.h>
10*4882a593Smuzhiyun #include <linux/mm.h>
11*4882a593Smuzhiyun #include <linux/sched/mm.h>
12*4882a593Smuzhiyun #include <linux/hugetlb.h>
13*4882a593Smuzhiyun #include <linux/pagemap.h>
14*4882a593Smuzhiyun #include <linux/err.h>
15*4882a593Smuzhiyun #include <linux/sysctl.h>
16*4882a593Smuzhiyun #include <linux/compat.h>
17*4882a593Smuzhiyun #include <asm/mman.h>
18*4882a593Smuzhiyun #include <asm/tlb.h>
19*4882a593Smuzhiyun #include <asm/tlbflush.h>
20*4882a593Smuzhiyun #include <asm/elf.h>
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun #if 0 /* This is just for testing */
23*4882a593Smuzhiyun struct page *
24*4882a593Smuzhiyun follow_huge_addr(struct mm_struct *mm, unsigned long address, int write)
25*4882a593Smuzhiyun {
26*4882a593Smuzhiyun unsigned long start = address;
27*4882a593Smuzhiyun int length = 1;
28*4882a593Smuzhiyun int nr;
29*4882a593Smuzhiyun struct page *page;
30*4882a593Smuzhiyun struct vm_area_struct *vma;
31*4882a593Smuzhiyun
32*4882a593Smuzhiyun vma = find_vma(mm, addr);
33*4882a593Smuzhiyun if (!vma || !is_vm_hugetlb_page(vma))
34*4882a593Smuzhiyun return ERR_PTR(-EINVAL);
35*4882a593Smuzhiyun
36*4882a593Smuzhiyun pte = huge_pte_offset(mm, address, vma_mmu_pagesize(vma));
37*4882a593Smuzhiyun
38*4882a593Smuzhiyun /* hugetlb should be locked, and hence, prefaulted */
39*4882a593Smuzhiyun WARN_ON(!pte || pte_none(*pte));
40*4882a593Smuzhiyun
41*4882a593Smuzhiyun page = &pte_page(*pte)[vpfn % (HPAGE_SIZE/PAGE_SIZE)];
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun WARN_ON(!PageHead(page));
44*4882a593Smuzhiyun
45*4882a593Smuzhiyun return page;
46*4882a593Smuzhiyun }
47*4882a593Smuzhiyun
48*4882a593Smuzhiyun int pmd_huge(pmd_t pmd)
49*4882a593Smuzhiyun {
50*4882a593Smuzhiyun return 0;
51*4882a593Smuzhiyun }
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun int pud_huge(pud_t pud)
54*4882a593Smuzhiyun {
55*4882a593Smuzhiyun return 0;
56*4882a593Smuzhiyun }
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun #else
59*4882a593Smuzhiyun
/*
 * pmd_huge() returns 1 if @pmd is a hugetlb-related entry, that is, either a
 * normal hugetlb entry or a non-present (migration or hwpoisoned) hugetlb
 * entry. Otherwise, it returns 0.
 */
int pmd_huge(pmd_t pmd)
{
	/* An empty entry is never a huge mapping. */
	if (pmd_none(pmd))
		return 0;

	/*
	 * Of the PRESENT and PSE bits, only the combination "PRESENT set,
	 * PSE clear" is rejected; every other combination of the two bits
	 * on a non-empty entry is reported as huge.
	 */
	return (pmd_val(pmd) & (_PAGE_PRESENT | _PAGE_PSE)) != _PAGE_PRESENT;
}
70*4882a593Smuzhiyun
/* Returns 1 when @pud has the PSE bit set, 0 otherwise. */
int pud_huge(pud_t pud)
{
	return (pud_val(pud) & _PAGE_PSE) != 0;
}
75*4882a593Smuzhiyun #endif
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun #ifdef CONFIG_HUGETLB_PAGE
hugetlb_get_unmapped_area_bottomup(struct file * file,unsigned long addr,unsigned long len,unsigned long pgoff,unsigned long flags)78*4882a593Smuzhiyun static unsigned long hugetlb_get_unmapped_area_bottomup(struct file *file,
79*4882a593Smuzhiyun unsigned long addr, unsigned long len,
80*4882a593Smuzhiyun unsigned long pgoff, unsigned long flags)
81*4882a593Smuzhiyun {
82*4882a593Smuzhiyun struct hstate *h = hstate_file(file);
83*4882a593Smuzhiyun struct vm_unmapped_area_info info;
84*4882a593Smuzhiyun
85*4882a593Smuzhiyun info.flags = 0;
86*4882a593Smuzhiyun info.length = len;
87*4882a593Smuzhiyun info.low_limit = get_mmap_base(1);
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun /*
90*4882a593Smuzhiyun * If hint address is above DEFAULT_MAP_WINDOW, look for unmapped area
91*4882a593Smuzhiyun * in the full address space.
92*4882a593Smuzhiyun */
93*4882a593Smuzhiyun info.high_limit = in_32bit_syscall() ?
94*4882a593Smuzhiyun task_size_32bit() : task_size_64bit(addr > DEFAULT_MAP_WINDOW);
95*4882a593Smuzhiyun
96*4882a593Smuzhiyun info.align_mask = PAGE_MASK & ~huge_page_mask(h);
97*4882a593Smuzhiyun info.align_offset = 0;
98*4882a593Smuzhiyun return vm_unmapped_area(&info);
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun
hugetlb_get_unmapped_area_topdown(struct file * file,unsigned long addr,unsigned long len,unsigned long pgoff,unsigned long flags)101*4882a593Smuzhiyun static unsigned long hugetlb_get_unmapped_area_topdown(struct file *file,
102*4882a593Smuzhiyun unsigned long addr, unsigned long len,
103*4882a593Smuzhiyun unsigned long pgoff, unsigned long flags)
104*4882a593Smuzhiyun {
105*4882a593Smuzhiyun struct hstate *h = hstate_file(file);
106*4882a593Smuzhiyun struct vm_unmapped_area_info info;
107*4882a593Smuzhiyun
108*4882a593Smuzhiyun info.flags = VM_UNMAPPED_AREA_TOPDOWN;
109*4882a593Smuzhiyun info.length = len;
110*4882a593Smuzhiyun info.low_limit = PAGE_SIZE;
111*4882a593Smuzhiyun info.high_limit = get_mmap_base(0);
112*4882a593Smuzhiyun
113*4882a593Smuzhiyun /*
114*4882a593Smuzhiyun * If hint address is above DEFAULT_MAP_WINDOW, look for unmapped area
115*4882a593Smuzhiyun * in the full address space.
116*4882a593Smuzhiyun */
117*4882a593Smuzhiyun if (addr > DEFAULT_MAP_WINDOW && !in_32bit_syscall())
118*4882a593Smuzhiyun info.high_limit += TASK_SIZE_MAX - DEFAULT_MAP_WINDOW;
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun info.align_mask = PAGE_MASK & ~huge_page_mask(h);
121*4882a593Smuzhiyun info.align_offset = 0;
122*4882a593Smuzhiyun addr = vm_unmapped_area(&info);
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun /*
125*4882a593Smuzhiyun * A failed mmap() very likely causes application failure,
126*4882a593Smuzhiyun * so fall back to the bottom-up function here. This scenario
127*4882a593Smuzhiyun * can happen with large stack limits and large mmap()
128*4882a593Smuzhiyun * allocations.
129*4882a593Smuzhiyun */
130*4882a593Smuzhiyun if (addr & ~PAGE_MASK) {
131*4882a593Smuzhiyun VM_BUG_ON(addr != -ENOMEM);
132*4882a593Smuzhiyun info.flags = 0;
133*4882a593Smuzhiyun info.low_limit = TASK_UNMAPPED_BASE;
134*4882a593Smuzhiyun info.high_limit = TASK_SIZE_LOW;
135*4882a593Smuzhiyun addr = vm_unmapped_area(&info);
136*4882a593Smuzhiyun }
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun return addr;
139*4882a593Smuzhiyun }
140*4882a593Smuzhiyun
141*4882a593Smuzhiyun unsigned long
hugetlb_get_unmapped_area(struct file * file,unsigned long addr,unsigned long len,unsigned long pgoff,unsigned long flags)142*4882a593Smuzhiyun hugetlb_get_unmapped_area(struct file *file, unsigned long addr,
143*4882a593Smuzhiyun unsigned long len, unsigned long pgoff, unsigned long flags)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun struct hstate *h = hstate_file(file);
146*4882a593Smuzhiyun struct mm_struct *mm = current->mm;
147*4882a593Smuzhiyun struct vm_area_struct *vma;
148*4882a593Smuzhiyun
149*4882a593Smuzhiyun if (len & ~huge_page_mask(h))
150*4882a593Smuzhiyun return -EINVAL;
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun if (len > TASK_SIZE)
153*4882a593Smuzhiyun return -ENOMEM;
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun /* No address checking. See comment at mmap_address_hint_valid() */
156*4882a593Smuzhiyun if (flags & MAP_FIXED) {
157*4882a593Smuzhiyun if (prepare_hugepage_range(file, addr, len))
158*4882a593Smuzhiyun return -EINVAL;
159*4882a593Smuzhiyun return addr;
160*4882a593Smuzhiyun }
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun if (addr) {
163*4882a593Smuzhiyun addr &= huge_page_mask(h);
164*4882a593Smuzhiyun if (!mmap_address_hint_valid(addr, len))
165*4882a593Smuzhiyun goto get_unmapped_area;
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun vma = find_vma(mm, addr);
168*4882a593Smuzhiyun if (!vma || addr + len <= vm_start_gap(vma))
169*4882a593Smuzhiyun return addr;
170*4882a593Smuzhiyun }
171*4882a593Smuzhiyun
172*4882a593Smuzhiyun get_unmapped_area:
173*4882a593Smuzhiyun if (mm->get_unmapped_area == arch_get_unmapped_area)
174*4882a593Smuzhiyun return hugetlb_get_unmapped_area_bottomup(file, addr, len,
175*4882a593Smuzhiyun pgoff, flags);
176*4882a593Smuzhiyun else
177*4882a593Smuzhiyun return hugetlb_get_unmapped_area_topdown(file, addr, len,
178*4882a593Smuzhiyun pgoff, flags);
179*4882a593Smuzhiyun }
180*4882a593Smuzhiyun #endif /* CONFIG_HUGETLB_PAGE */
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun #ifdef CONFIG_X86_64
arch_hugetlb_valid_size(unsigned long size)183*4882a593Smuzhiyun bool __init arch_hugetlb_valid_size(unsigned long size)
184*4882a593Smuzhiyun {
185*4882a593Smuzhiyun if (size == PMD_SIZE)
186*4882a593Smuzhiyun return true;
187*4882a593Smuzhiyun else if (size == PUD_SIZE && boot_cpu_has(X86_FEATURE_GBPAGES))
188*4882a593Smuzhiyun return true;
189*4882a593Smuzhiyun else
190*4882a593Smuzhiyun return false;
191*4882a593Smuzhiyun }
192*4882a593Smuzhiyun
193*4882a593Smuzhiyun #ifdef CONFIG_CONTIG_ALLOC
gigantic_pages_init(void)194*4882a593Smuzhiyun static __init int gigantic_pages_init(void)
195*4882a593Smuzhiyun {
196*4882a593Smuzhiyun /* With compaction or CMA we can allocate gigantic pages at runtime */
197*4882a593Smuzhiyun if (boot_cpu_has(X86_FEATURE_GBPAGES))
198*4882a593Smuzhiyun hugetlb_add_hstate(PUD_SHIFT - PAGE_SHIFT);
199*4882a593Smuzhiyun return 0;
200*4882a593Smuzhiyun }
201*4882a593Smuzhiyun arch_initcall(gigantic_pages_init);
202*4882a593Smuzhiyun #endif
203*4882a593Smuzhiyun #endif
204