// SPDX-License-Identifier: GPL-2.0
/*
 * IA-64 Huge TLB Page Support for Kernel.
 *
 * Copyright (C) 2002-2004 Rohit Seth <rohit.seth@intel.com>
 * Copyright (C) 2003-2004 Ken Chen <kenneth.w.chen@intel.com>
 *
 * Sep, 2003: add numa support
 * Feb, 2004: dynamic hugetlb page size via boot parameter
 */

#include <linux/init.h>
#include <linux/fs.h>
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/module.h>
#include <linux/sysctl.h>
#include <linux/log2.h>
#include <asm/mman.h>
#include <asm/tlb.h>
#include <asm/tlbflush.h>

unsigned int hpage_shift = HPAGE_SHIFT_DEFAULT;
EXPORT_SYMBOL(hpage_shift);
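
/*
 * Note: hpage_shift is log2 of the huge page size; HPAGE_SHIFT_DEFAULT
 * is 28 (256 MB huge pages) in this tree's asm/page.h. It can be
 * overridden at boot via the "hugepagesz=" parameter handled by
 * hugetlb_setup_sz() at the bottom of this file.
 */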

pte_t *
huge_pte_alloc(struct mm_struct *mm, struct vm_area_struct *vma,
	       unsigned long addr, unsigned long sz)
{
	unsigned long taddr = htlbpage_to_page(addr);
	pgd_t *pgd;
	p4d_t *p4d;
	pud_t *pud;
	pmd_t *pmd;
	pte_t *pte = NULL;

	pgd = pgd_offset(mm, taddr);
	p4d = p4d_offset(pgd, taddr);
	pud = pud_alloc(mm, p4d, taddr);
	if (pud) {
		pmd = pmd_alloc(mm, pud, taddr);
		if (pmd)
			pte = pte_alloc_map(mm, pmd, taddr);
	}
	return pte;
}
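
/*
 * For reference: huge_pte_alloc() above and huge_pte_offset() below both
 * rescale the faulting address with htlbpage_to_page() before walking an
 * ordinary page table. A sketch of that macro, roughly as defined in
 * arch/ia64/include/asm/page.h (quoted for illustration, not redefined):
 *
 *	#define htlbpage_to_page(x)				\
 *		(((unsigned long) REGION_NUMBER(x) << 61)	\
 *		 | (REGION_OFFSET(x) >> (HPAGE_SHIFT - PAGE_SHIFT)))
 *
 * i.e. the offset within the hugetlb region is divided by
 * HPAGE_SIZE/PAGE_SIZE, so a single PTE per huge page suffices.
 */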

pte_t *
huge_pte_offset (struct mm_struct *mm, unsigned long addr, unsigned long sz)
{
	unsigned long taddr = htlbpage_to_page(addr);
	pgd_t *pgd;
	p4d_t *p4d;
	pud_t *pud;
	pmd_t *pmd;
	pte_t *pte = NULL;

	pgd = pgd_offset(mm, taddr);
	if (pgd_present(*pgd)) {
		/* use the scaled address consistently; p4d is folded on ia64 */
		p4d = p4d_offset(pgd, taddr);
		if (p4d_present(*p4d)) {
			pud = pud_offset(p4d, taddr);
			if (pud_present(*pud)) {
				pmd = pmd_offset(pud, taddr);
				if (pmd_present(*pmd))
					pte = pte_offset_map(pmd, taddr);
			}
		}
	}

	return pte;
}

#define mk_pte_huge(entry) { pte_val(entry) |= _PAGE_P; }

/*
 * Don't actually need to do any preparation, but need to make sure
 * the address is in the right region.
 */
int prepare_hugepage_range(struct file *file,
			unsigned long addr, unsigned long len)
{
	if (len & ~HPAGE_MASK)
		return -EINVAL;
	if (addr & ~HPAGE_MASK)
		return -EINVAL;
	if (REGION_NUMBER(addr) != RGN_HPAGE)
		return -EINVAL;

	return 0;
}
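
/*
 * Worked example (assuming RGN_HPAGE == 4, as in asm/page.h):
 * REGION_NUMBER(addr) is the top three address bits, addr >> 61, so a
 * valid hugetlb address must lie in region 4, i.e. at or above
 * 0x8000000000000000, and must additionally be HPAGE_SIZE-aligned.
 */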

struct page *follow_huge_addr(struct mm_struct *mm, unsigned long addr, int write)
{
	struct page *page;
	pte_t *ptep;

	if (REGION_NUMBER(addr) != RGN_HPAGE)
		return ERR_PTR(-EINVAL);

	ptep = huge_pte_offset(mm, addr, HPAGE_SIZE);
	if (!ptep || pte_none(*ptep))
		return NULL;
	page = pte_page(*ptep);
	/* step to the base page within the huge page that covers addr */
	page += ((addr & ~HPAGE_MASK) >> PAGE_SHIFT);
	return page;
}

/*
 * ia64 implements huge pages via a separate, rescaled page table in the
 * hugetlb region rather than via huge pmd/pud entries, so the generic
 * walkers never see a huge entry at these levels.
 */
int pmd_huge(pmd_t pmd)
{
	return 0;
}

int pud_huge(pud_t pud)
{
	return 0;
}

void hugetlb_free_pgd_range(struct mmu_gather *tlb,
			unsigned long addr, unsigned long end,
			unsigned long floor, unsigned long ceiling)
{
	/*
	 * This is called to free hugetlb page tables.
	 *
	 * The offset of these addresses from the base of the hugetlb
	 * region must be scaled down by HPAGE_SIZE/PAGE_SIZE so that
	 * the standard free_pgd_range will free the right page tables.
	 *
	 * If floor and ceiling are also in the hugetlb region, they
	 * must likewise be scaled down; but if outside, left unchanged.
	 */

	addr = htlbpage_to_page(addr);
	end  = htlbpage_to_page(end);
	if (REGION_NUMBER(floor) == RGN_HPAGE)
		floor = htlbpage_to_page(floor);
	if (REGION_NUMBER(ceiling) == RGN_HPAGE)
		ceiling = htlbpage_to_page(ceiling);

	free_pgd_range(tlb, addr, end, floor, ceiling);
}
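
/*
 * Numeric sketch (assuming PAGE_SHIFT == 14, i.e. 16 KB base pages, and
 * the default HPAGE_SHIFT == 28, i.e. 256 MB huge pages): the region
 * offset shrinks by HPAGE_SIZE/PAGE_SIZE == 1 << 14, so a huge page at
 * region offset 0x10000000 maps to page-table offset 0x4000. One 16 KB
 * leaf page then holds 2048 PTEs covering 2048 * 256 MB = 512 GB of
 * hugetlb address space.
 */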

unsigned long hugetlb_get_unmapped_area(struct file *file, unsigned long addr, unsigned long len,
		unsigned long pgoff, unsigned long flags)
{
	struct vm_unmapped_area_info info;

	if (len > RGN_MAP_LIMIT)
		return -ENOMEM;
	if (len & ~HPAGE_MASK)
		return -EINVAL;

	/* Handle MAP_FIXED */
	if (flags & MAP_FIXED) {
		if (prepare_hugepage_range(file, addr, len))
			return -EINVAL;
		return addr;
	}

	/* This code assumes that RGN_HPAGE != 0. */
	if ((REGION_NUMBER(addr) != RGN_HPAGE) || (addr & (HPAGE_SIZE - 1)))
		addr = HPAGE_REGION_BASE;

	info.flags = 0;
	info.length = len;
	info.low_limit = addr;
	info.high_limit = HPAGE_REGION_BASE + RGN_MAP_LIMIT;
	info.align_mask = PAGE_MASK & (HPAGE_SIZE - 1);
	info.align_offset = 0;
	return vm_unmapped_area(&info);
}
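
/*
 * This path is exercised when user space maps a hugetlbfs file; a
 * minimal sketch (hypothetical mount point and file name, error
 * handling and the exact huge page size constant elided):
 *
 *	int fd = open("/mnt/hugetlbfs/example", O_CREAT | O_RDWR, 0600);
 *	void *p = mmap(NULL, huge_page_size, PROT_READ | PROT_WRITE,
 *		       MAP_SHARED, fd, 0);
 *
 * The kernel then calls hugetlb_get_unmapped_area() above, which places
 * the mapping inside the dedicated hugetlb region and aligns it to
 * HPAGE_SIZE via info.align_mask.
 */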

static int __init hugetlb_setup_sz(char *str)
{
	u64 tr_pages;
	unsigned long long size;

	if (ia64_pal_vm_page_size(&tr_pages, NULL) != 0)
		/*
		 * shouldn't happen, but just in case.
		 */
		tr_pages = 0x15557000UL;

	size = memparse(str, &str);
	if (*str || !is_power_of_2(size) || !(tr_pages & size) ||
		size <= PAGE_SIZE ||
		size >= (1UL << PAGE_SHIFT << MAX_ORDER)) {
		printk(KERN_WARNING "Invalid huge page size specified\n");
		return 1;
	}

	hpage_shift = __ffs(size);
	/*
	 * The boot CPU has already executed ia64_mmu_init() with
	 * HPAGE_SHIFT_DEFAULT; override the region register here with
	 * the new page shift.
	 */
	ia64_set_rr(HPAGE_REGION_BASE, hpage_shift << 2);
	return 0;
}
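
/*
 * Example: booting with "hugepagesz=1G" yields hpage_shift == 30, and
 * hpage_shift << 2 places that value in the page-size (ps) field of the
 * region register, bits 7:2 in the usual ia64 region-register layout,
 * which is why the value is shifted left by two.
 */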
early_param("hugepagesz", hugetlb_setup_sz);