// SPDX-License-Identifier: GPL-2.0
/*
 * Access kernel memory without faulting -- s390 specific implementation.
 *
 * Copyright IBM Corp. 2009, 2015
 *
 * Author(s): Heiko Carstens <heiko.carstens@de.ibm.com>
 *
 */
10*4882a593Smuzhiyun
11*4882a593Smuzhiyun #include <linux/uaccess.h>
12*4882a593Smuzhiyun #include <linux/kernel.h>
13*4882a593Smuzhiyun #include <linux/types.h>
14*4882a593Smuzhiyun #include <linux/errno.h>
15*4882a593Smuzhiyun #include <linux/gfp.h>
16*4882a593Smuzhiyun #include <linux/cpu.h>
17*4882a593Smuzhiyun #include <asm/ctl_reg.h>
18*4882a593Smuzhiyun #include <asm/io.h>
19*4882a593Smuzhiyun #include <asm/stacktrace.h>
20*4882a593Smuzhiyun
s390_kernel_write_odd(void * dst,const void * src,size_t size)21*4882a593Smuzhiyun static notrace long s390_kernel_write_odd(void *dst, const void *src, size_t size)
22*4882a593Smuzhiyun {
23*4882a593Smuzhiyun unsigned long aligned, offset, count;
24*4882a593Smuzhiyun char tmp[8];
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun aligned = (unsigned long) dst & ~7UL;
27*4882a593Smuzhiyun offset = (unsigned long) dst & 7UL;
28*4882a593Smuzhiyun size = min(8UL - offset, size);
29*4882a593Smuzhiyun count = size - 1;
30*4882a593Smuzhiyun asm volatile(
31*4882a593Smuzhiyun " bras 1,0f\n"
32*4882a593Smuzhiyun " mvc 0(1,%4),0(%5)\n"
33*4882a593Smuzhiyun "0: mvc 0(8,%3),0(%0)\n"
34*4882a593Smuzhiyun " ex %1,0(1)\n"
35*4882a593Smuzhiyun " lg %1,0(%3)\n"
36*4882a593Smuzhiyun " lra %0,0(%0)\n"
37*4882a593Smuzhiyun " sturg %1,%0\n"
38*4882a593Smuzhiyun : "+&a" (aligned), "+&a" (count), "=m" (tmp)
39*4882a593Smuzhiyun : "a" (&tmp), "a" (&tmp[offset]), "a" (src)
40*4882a593Smuzhiyun : "cc", "memory", "1");
41*4882a593Smuzhiyun return size;
42*4882a593Smuzhiyun }
43*4882a593Smuzhiyun
44*4882a593Smuzhiyun /*
45*4882a593Smuzhiyun * s390_kernel_write - write to kernel memory bypassing DAT
46*4882a593Smuzhiyun * @dst: destination address
47*4882a593Smuzhiyun * @src: source address
48*4882a593Smuzhiyun * @size: number of bytes to copy
49*4882a593Smuzhiyun *
50*4882a593Smuzhiyun * This function writes to kernel memory bypassing DAT and possible page table
51*4882a593Smuzhiyun * write protection. It writes to the destination using the sturg instruction.
52*4882a593Smuzhiyun * Therefore we have a read-modify-write sequence: the function reads eight
53*4882a593Smuzhiyun * bytes from destination at an eight byte boundary, modifies the bytes
54*4882a593Smuzhiyun * requested and writes the result back in a loop.
55*4882a593Smuzhiyun */
56*4882a593Smuzhiyun static DEFINE_SPINLOCK(s390_kernel_write_lock);
57*4882a593Smuzhiyun
s390_kernel_write(void * dst,const void * src,size_t size)58*4882a593Smuzhiyun notrace void *s390_kernel_write(void *dst, const void *src, size_t size)
59*4882a593Smuzhiyun {
60*4882a593Smuzhiyun void *tmp = dst;
61*4882a593Smuzhiyun unsigned long flags;
62*4882a593Smuzhiyun long copied;
63*4882a593Smuzhiyun
64*4882a593Smuzhiyun spin_lock_irqsave(&s390_kernel_write_lock, flags);
65*4882a593Smuzhiyun if (!(flags & PSW_MASK_DAT)) {
66*4882a593Smuzhiyun memcpy(dst, src, size);
67*4882a593Smuzhiyun } else {
68*4882a593Smuzhiyun while (size) {
69*4882a593Smuzhiyun copied = s390_kernel_write_odd(tmp, src, size);
70*4882a593Smuzhiyun tmp += copied;
71*4882a593Smuzhiyun src += copied;
72*4882a593Smuzhiyun size -= copied;
73*4882a593Smuzhiyun }
74*4882a593Smuzhiyun }
75*4882a593Smuzhiyun spin_unlock_irqrestore(&s390_kernel_write_lock, flags);
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun return dst;
78*4882a593Smuzhiyun }
79*4882a593Smuzhiyun
__memcpy_real(void * dest,void * src,size_t count)80*4882a593Smuzhiyun static int __no_sanitize_address __memcpy_real(void *dest, void *src, size_t count)
81*4882a593Smuzhiyun {
82*4882a593Smuzhiyun register unsigned long _dest asm("2") = (unsigned long) dest;
83*4882a593Smuzhiyun register unsigned long _len1 asm("3") = (unsigned long) count;
84*4882a593Smuzhiyun register unsigned long _src asm("4") = (unsigned long) src;
85*4882a593Smuzhiyun register unsigned long _len2 asm("5") = (unsigned long) count;
86*4882a593Smuzhiyun int rc = -EFAULT;
87*4882a593Smuzhiyun
88*4882a593Smuzhiyun asm volatile (
89*4882a593Smuzhiyun "0: mvcle %1,%2,0x0\n"
90*4882a593Smuzhiyun "1: jo 0b\n"
91*4882a593Smuzhiyun " lhi %0,0x0\n"
92*4882a593Smuzhiyun "2:\n"
93*4882a593Smuzhiyun EX_TABLE(1b,2b)
94*4882a593Smuzhiyun : "+d" (rc), "+d" (_dest), "+d" (_src), "+d" (_len1),
95*4882a593Smuzhiyun "+d" (_len2), "=m" (*((long *) dest))
96*4882a593Smuzhiyun : "m" (*((long *) src))
97*4882a593Smuzhiyun : "cc", "memory");
98*4882a593Smuzhiyun return rc;
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun
_memcpy_real(unsigned long dest,unsigned long src,unsigned long count)101*4882a593Smuzhiyun static unsigned long __no_sanitize_address _memcpy_real(unsigned long dest,
102*4882a593Smuzhiyun unsigned long src,
103*4882a593Smuzhiyun unsigned long count)
104*4882a593Smuzhiyun {
105*4882a593Smuzhiyun int irqs_disabled, rc;
106*4882a593Smuzhiyun unsigned long flags;
107*4882a593Smuzhiyun
108*4882a593Smuzhiyun if (!count)
109*4882a593Smuzhiyun return 0;
110*4882a593Smuzhiyun flags = arch_local_irq_save();
111*4882a593Smuzhiyun irqs_disabled = arch_irqs_disabled_flags(flags);
112*4882a593Smuzhiyun if (!irqs_disabled)
113*4882a593Smuzhiyun trace_hardirqs_off();
114*4882a593Smuzhiyun __arch_local_irq_stnsm(0xf8); // disable DAT
115*4882a593Smuzhiyun rc = __memcpy_real((void *) dest, (void *) src, (size_t) count);
116*4882a593Smuzhiyun if (flags & PSW_MASK_DAT)
117*4882a593Smuzhiyun __arch_local_irq_stosm(0x04); // enable DAT
118*4882a593Smuzhiyun if (!irqs_disabled)
119*4882a593Smuzhiyun trace_hardirqs_on();
120*4882a593Smuzhiyun __arch_local_irq_ssm(flags);
121*4882a593Smuzhiyun return rc;
122*4882a593Smuzhiyun }
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun /*
125*4882a593Smuzhiyun * Copy memory in real mode (kernel to kernel)
126*4882a593Smuzhiyun */
memcpy_real(void * dest,void * src,size_t count)127*4882a593Smuzhiyun int memcpy_real(void *dest, void *src, size_t count)
128*4882a593Smuzhiyun {
129*4882a593Smuzhiyun int rc;
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun if (S390_lowcore.nodat_stack != 0) {
132*4882a593Smuzhiyun preempt_disable();
133*4882a593Smuzhiyun rc = CALL_ON_STACK(_memcpy_real, S390_lowcore.nodat_stack, 3,
134*4882a593Smuzhiyun dest, src, count);
135*4882a593Smuzhiyun preempt_enable();
136*4882a593Smuzhiyun return rc;
137*4882a593Smuzhiyun }
138*4882a593Smuzhiyun /*
139*4882a593Smuzhiyun * This is a really early memcpy_real call, the stacks are
140*4882a593Smuzhiyun * not set up yet. Just call _memcpy_real on the early boot
141*4882a593Smuzhiyun * stack
142*4882a593Smuzhiyun */
143*4882a593Smuzhiyun return _memcpy_real((unsigned long) dest,(unsigned long) src,
144*4882a593Smuzhiyun (unsigned long) count);
145*4882a593Smuzhiyun }
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun /*
148*4882a593Smuzhiyun * Copy memory in absolute mode (kernel to kernel)
149*4882a593Smuzhiyun */
memcpy_absolute(void * dest,void * src,size_t count)150*4882a593Smuzhiyun void memcpy_absolute(void *dest, void *src, size_t count)
151*4882a593Smuzhiyun {
152*4882a593Smuzhiyun unsigned long cr0, flags, prefix;
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun flags = arch_local_irq_save();
155*4882a593Smuzhiyun __ctl_store(cr0, 0, 0);
156*4882a593Smuzhiyun __ctl_clear_bit(0, 28); /* disable lowcore protection */
157*4882a593Smuzhiyun prefix = store_prefix();
158*4882a593Smuzhiyun if (prefix) {
159*4882a593Smuzhiyun local_mcck_disable();
160*4882a593Smuzhiyun set_prefix(0);
161*4882a593Smuzhiyun memcpy(dest, src, count);
162*4882a593Smuzhiyun set_prefix(prefix);
163*4882a593Smuzhiyun local_mcck_enable();
164*4882a593Smuzhiyun } else {
165*4882a593Smuzhiyun memcpy(dest, src, count);
166*4882a593Smuzhiyun }
167*4882a593Smuzhiyun __ctl_load(cr0, 0, 0);
168*4882a593Smuzhiyun arch_local_irq_restore(flags);
169*4882a593Smuzhiyun }
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun /*
172*4882a593Smuzhiyun * Copy memory from kernel (real) to user (virtual)
173*4882a593Smuzhiyun */
copy_to_user_real(void __user * dest,void * src,unsigned long count)174*4882a593Smuzhiyun int copy_to_user_real(void __user *dest, void *src, unsigned long count)
175*4882a593Smuzhiyun {
176*4882a593Smuzhiyun int offs = 0, size, rc;
177*4882a593Smuzhiyun char *buf;
178*4882a593Smuzhiyun
179*4882a593Smuzhiyun buf = (char *) __get_free_page(GFP_KERNEL);
180*4882a593Smuzhiyun if (!buf)
181*4882a593Smuzhiyun return -ENOMEM;
182*4882a593Smuzhiyun rc = -EFAULT;
183*4882a593Smuzhiyun while (offs < count) {
184*4882a593Smuzhiyun size = min(PAGE_SIZE, count - offs);
185*4882a593Smuzhiyun if (memcpy_real(buf, src + offs, size))
186*4882a593Smuzhiyun goto out;
187*4882a593Smuzhiyun if (copy_to_user(dest + offs, buf, size))
188*4882a593Smuzhiyun goto out;
189*4882a593Smuzhiyun offs += size;
190*4882a593Smuzhiyun }
191*4882a593Smuzhiyun rc = 0;
192*4882a593Smuzhiyun out:
193*4882a593Smuzhiyun free_page((unsigned long) buf);
194*4882a593Smuzhiyun return rc;
195*4882a593Smuzhiyun }
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun /*
198*4882a593Smuzhiyun * Check if physical address is within prefix or zero page
199*4882a593Smuzhiyun */
is_swapped(unsigned long addr)200*4882a593Smuzhiyun static int is_swapped(unsigned long addr)
201*4882a593Smuzhiyun {
202*4882a593Smuzhiyun unsigned long lc;
203*4882a593Smuzhiyun int cpu;
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun if (addr < sizeof(struct lowcore))
206*4882a593Smuzhiyun return 1;
207*4882a593Smuzhiyun for_each_online_cpu(cpu) {
208*4882a593Smuzhiyun lc = (unsigned long) lowcore_ptr[cpu];
209*4882a593Smuzhiyun if (addr > lc + sizeof(struct lowcore) - 1 || addr < lc)
210*4882a593Smuzhiyun continue;
211*4882a593Smuzhiyun return 1;
212*4882a593Smuzhiyun }
213*4882a593Smuzhiyun return 0;
214*4882a593Smuzhiyun }
215*4882a593Smuzhiyun
216*4882a593Smuzhiyun /*
217*4882a593Smuzhiyun * Convert a physical pointer for /dev/mem access
218*4882a593Smuzhiyun *
219*4882a593Smuzhiyun * For swapped prefix pages a new buffer is returned that contains a copy of
220*4882a593Smuzhiyun * the absolute memory. The buffer size is maximum one page large.
221*4882a593Smuzhiyun */
xlate_dev_mem_ptr(phys_addr_t addr)222*4882a593Smuzhiyun void *xlate_dev_mem_ptr(phys_addr_t addr)
223*4882a593Smuzhiyun {
224*4882a593Smuzhiyun void *bounce = (void *) addr;
225*4882a593Smuzhiyun unsigned long size;
226*4882a593Smuzhiyun
227*4882a593Smuzhiyun get_online_cpus();
228*4882a593Smuzhiyun preempt_disable();
229*4882a593Smuzhiyun if (is_swapped(addr)) {
230*4882a593Smuzhiyun size = PAGE_SIZE - (addr & ~PAGE_MASK);
231*4882a593Smuzhiyun bounce = (void *) __get_free_page(GFP_ATOMIC);
232*4882a593Smuzhiyun if (bounce)
233*4882a593Smuzhiyun memcpy_absolute(bounce, (void *) addr, size);
234*4882a593Smuzhiyun }
235*4882a593Smuzhiyun preempt_enable();
236*4882a593Smuzhiyun put_online_cpus();
237*4882a593Smuzhiyun return bounce;
238*4882a593Smuzhiyun }
239*4882a593Smuzhiyun
240*4882a593Smuzhiyun /*
241*4882a593Smuzhiyun * Free converted buffer for /dev/mem access (if necessary)
242*4882a593Smuzhiyun */
unxlate_dev_mem_ptr(phys_addr_t addr,void * buf)243*4882a593Smuzhiyun void unxlate_dev_mem_ptr(phys_addr_t addr, void *buf)
244*4882a593Smuzhiyun {
245*4882a593Smuzhiyun if ((void *) addr != buf)
246*4882a593Smuzhiyun free_page((unsigned long) buf);
247*4882a593Smuzhiyun }
248