// SPDX-License-Identifier: GPL-2.0-only
/*
 *  linux/arch/arm/mm/copypage-feroceon.S
 *
 *  Copyright (C) 2008 Marvell Semiconductors
 *
 * This handles copy_user_highpage and clear_user_page on Feroceon
 * more optimally than the generic implementations.
 */
10*4882a593Smuzhiyun #include <linux/init.h>
11*4882a593Smuzhiyun #include <linux/highmem.h>
12*4882a593Smuzhiyun
feroceon_copy_user_page(void * kto,const void * kfrom)13*4882a593Smuzhiyun static void feroceon_copy_user_page(void *kto, const void *kfrom)
14*4882a593Smuzhiyun {
15*4882a593Smuzhiyun int tmp;
16*4882a593Smuzhiyun
17*4882a593Smuzhiyun asm volatile ("\
18*4882a593Smuzhiyun 1: ldmia %1!, {r2 - r7, ip, lr} \n\
19*4882a593Smuzhiyun pld [%1, #0] \n\
20*4882a593Smuzhiyun pld [%1, #32] \n\
21*4882a593Smuzhiyun pld [%1, #64] \n\
22*4882a593Smuzhiyun pld [%1, #96] \n\
23*4882a593Smuzhiyun pld [%1, #128] \n\
24*4882a593Smuzhiyun pld [%1, #160] \n\
25*4882a593Smuzhiyun pld [%1, #192] \n\
26*4882a593Smuzhiyun stmia %0, {r2 - r7, ip, lr} \n\
27*4882a593Smuzhiyun ldmia %1!, {r2 - r7, ip, lr} \n\
28*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
29*4882a593Smuzhiyun add %0, %0, #32 \n\
30*4882a593Smuzhiyun stmia %0, {r2 - r7, ip, lr} \n\
31*4882a593Smuzhiyun ldmia %1!, {r2 - r7, ip, lr} \n\
32*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
33*4882a593Smuzhiyun add %0, %0, #32 \n\
34*4882a593Smuzhiyun stmia %0, {r2 - r7, ip, lr} \n\
35*4882a593Smuzhiyun ldmia %1!, {r2 - r7, ip, lr} \n\
36*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
37*4882a593Smuzhiyun add %0, %0, #32 \n\
38*4882a593Smuzhiyun stmia %0, {r2 - r7, ip, lr} \n\
39*4882a593Smuzhiyun ldmia %1!, {r2 - r7, ip, lr} \n\
40*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
41*4882a593Smuzhiyun add %0, %0, #32 \n\
42*4882a593Smuzhiyun stmia %0, {r2 - r7, ip, lr} \n\
43*4882a593Smuzhiyun ldmia %1!, {r2 - r7, ip, lr} \n\
44*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
45*4882a593Smuzhiyun add %0, %0, #32 \n\
46*4882a593Smuzhiyun stmia %0, {r2 - r7, ip, lr} \n\
47*4882a593Smuzhiyun ldmia %1!, {r2 - r7, ip, lr} \n\
48*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
49*4882a593Smuzhiyun add %0, %0, #32 \n\
50*4882a593Smuzhiyun stmia %0, {r2 - r7, ip, lr} \n\
51*4882a593Smuzhiyun ldmia %1!, {r2 - r7, ip, lr} \n\
52*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
53*4882a593Smuzhiyun add %0, %0, #32 \n\
54*4882a593Smuzhiyun stmia %0, {r2 - r7, ip, lr} \n\
55*4882a593Smuzhiyun subs %2, %2, #(32 * 8) \n\
56*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
57*4882a593Smuzhiyun add %0, %0, #32 \n\
58*4882a593Smuzhiyun bne 1b \n\
59*4882a593Smuzhiyun mcr p15, 0, %2, c7, c10, 4 @ drain WB"
60*4882a593Smuzhiyun : "+&r" (kto), "+&r" (kfrom), "=&r" (tmp)
61*4882a593Smuzhiyun : "2" (PAGE_SIZE)
62*4882a593Smuzhiyun : "r2", "r3", "r4", "r5", "r6", "r7", "ip", "lr");
63*4882a593Smuzhiyun }
64*4882a593Smuzhiyun
/*
 * Copy the contents of page @from into page @to.
 *
 * @to:    destination page
 * @from:  source page
 * @vaddr: user virtual address, passed to flush_cache_page() together
 *         with @vma and the source page's pfn
 * @vma:   VMA passed to flush_cache_page()
 *
 * Both pages are mapped with kmap_atomic() for the duration of the copy.
 * The source page is flushed via flush_cache_page() before the copy
 * (NOTE(review): presumably so that data written through the user mapping
 * is visible through the kernel mapping - confirm against the cache
 * model).  The mappings are released in the reverse order of acquisition.
 */
void feroceon_copy_user_highpage(struct page *to, struct page *from,
	unsigned long vaddr, struct vm_area_struct *vma)
{
	void *kto, *kfrom;

	kto = kmap_atomic(to);
	kfrom = kmap_atomic(from);
	flush_cache_page(vma, vaddr, page_to_pfn(from));
	feroceon_copy_user_page(kto, kfrom);
	kunmap_atomic(kfrom);
	kunmap_atomic(kto);
}
77*4882a593Smuzhiyun
feroceon_clear_user_highpage(struct page * page,unsigned long vaddr)78*4882a593Smuzhiyun void feroceon_clear_user_highpage(struct page *page, unsigned long vaddr)
79*4882a593Smuzhiyun {
80*4882a593Smuzhiyun void *ptr, *kaddr = kmap_atomic(page);
81*4882a593Smuzhiyun asm volatile ("\
82*4882a593Smuzhiyun mov r1, %2 \n\
83*4882a593Smuzhiyun mov r2, #0 \n\
84*4882a593Smuzhiyun mov r3, #0 \n\
85*4882a593Smuzhiyun mov r4, #0 \n\
86*4882a593Smuzhiyun mov r5, #0 \n\
87*4882a593Smuzhiyun mov r6, #0 \n\
88*4882a593Smuzhiyun mov r7, #0 \n\
89*4882a593Smuzhiyun mov ip, #0 \n\
90*4882a593Smuzhiyun mov lr, #0 \n\
91*4882a593Smuzhiyun 1: stmia %0, {r2-r7, ip, lr} \n\
92*4882a593Smuzhiyun subs r1, r1, #1 \n\
93*4882a593Smuzhiyun mcr p15, 0, %0, c7, c14, 1 @ clean and invalidate D line\n\
94*4882a593Smuzhiyun add %0, %0, #32 \n\
95*4882a593Smuzhiyun bne 1b \n\
96*4882a593Smuzhiyun mcr p15, 0, r1, c7, c10, 4 @ drain WB"
97*4882a593Smuzhiyun : "=r" (ptr)
98*4882a593Smuzhiyun : "0" (kaddr), "I" (PAGE_SIZE / 32)
99*4882a593Smuzhiyun : "r1", "r2", "r3", "r4", "r5", "r6", "r7", "ip", "lr");
100*4882a593Smuzhiyun kunmap_atomic(kaddr);
101*4882a593Smuzhiyun }
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun struct cpu_user_fns feroceon_user_fns __initdata = {
104*4882a593Smuzhiyun .cpu_clear_user_highpage = feroceon_clear_user_highpage,
105*4882a593Smuzhiyun .cpu_copy_user_highpage = feroceon_copy_user_highpage,
106*4882a593Smuzhiyun };
107*4882a593Smuzhiyun
108