1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * linux/fs/read_write.c
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright (C) 1991, 1992 Linus Torvalds
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <linux/slab.h>
9*4882a593Smuzhiyun #include <linux/stat.h>
10*4882a593Smuzhiyun #include <linux/sched/xacct.h>
11*4882a593Smuzhiyun #include <linux/fcntl.h>
12*4882a593Smuzhiyun #include <linux/file.h>
13*4882a593Smuzhiyun #include <linux/uio.h>
14*4882a593Smuzhiyun #include <linux/fsnotify.h>
15*4882a593Smuzhiyun #include <linux/security.h>
16*4882a593Smuzhiyun #include <linux/export.h>
17*4882a593Smuzhiyun #include <linux/syscalls.h>
18*4882a593Smuzhiyun #include <linux/pagemap.h>
19*4882a593Smuzhiyun #include <linux/splice.h>
20*4882a593Smuzhiyun #include <linux/compat.h>
21*4882a593Smuzhiyun #include <linux/mount.h>
22*4882a593Smuzhiyun #include <linux/fs.h>
23*4882a593Smuzhiyun #include "internal.h"
24*4882a593Smuzhiyun
25*4882a593Smuzhiyun #include <linux/uaccess.h>
26*4882a593Smuzhiyun #include <asm/unistd.h>
27*4882a593Smuzhiyun
28*4882a593Smuzhiyun const struct file_operations generic_ro_fops = {
29*4882a593Smuzhiyun .llseek = generic_file_llseek,
30*4882a593Smuzhiyun .read_iter = generic_file_read_iter,
31*4882a593Smuzhiyun .mmap = generic_file_readonly_mmap,
32*4882a593Smuzhiyun .splice_read = generic_file_splice_read,
33*4882a593Smuzhiyun };
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun EXPORT_SYMBOL(generic_ro_fops);
36*4882a593Smuzhiyun
unsigned_offsets(struct file * file)37*4882a593Smuzhiyun static inline bool unsigned_offsets(struct file *file)
38*4882a593Smuzhiyun {
39*4882a593Smuzhiyun return file->f_mode & FMODE_UNSIGNED_OFFSET;
40*4882a593Smuzhiyun }
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun /**
43*4882a593Smuzhiyun * vfs_setpos - update the file offset for lseek
44*4882a593Smuzhiyun * @file: file structure in question
45*4882a593Smuzhiyun * @offset: file offset to seek to
46*4882a593Smuzhiyun * @maxsize: maximum file size
47*4882a593Smuzhiyun *
48*4882a593Smuzhiyun * This is a low-level filesystem helper for updating the file offset to
49*4882a593Smuzhiyun * the value specified by @offset if the given offset is valid and it is
50*4882a593Smuzhiyun * not equal to the current file offset.
51*4882a593Smuzhiyun *
52*4882a593Smuzhiyun * Return the specified offset on success and -EINVAL on invalid offset.
53*4882a593Smuzhiyun */
vfs_setpos(struct file * file,loff_t offset,loff_t maxsize)54*4882a593Smuzhiyun loff_t vfs_setpos(struct file *file, loff_t offset, loff_t maxsize)
55*4882a593Smuzhiyun {
56*4882a593Smuzhiyun if (offset < 0 && !unsigned_offsets(file))
57*4882a593Smuzhiyun return -EINVAL;
58*4882a593Smuzhiyun if (offset > maxsize)
59*4882a593Smuzhiyun return -EINVAL;
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun if (offset != file->f_pos) {
62*4882a593Smuzhiyun file->f_pos = offset;
63*4882a593Smuzhiyun file->f_version = 0;
64*4882a593Smuzhiyun }
65*4882a593Smuzhiyun return offset;
66*4882a593Smuzhiyun }
67*4882a593Smuzhiyun EXPORT_SYMBOL(vfs_setpos);
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun /**
70*4882a593Smuzhiyun * generic_file_llseek_size - generic llseek implementation for regular files
71*4882a593Smuzhiyun * @file: file structure to seek on
72*4882a593Smuzhiyun * @offset: file offset to seek to
73*4882a593Smuzhiyun * @whence: type of seek
74*4882a593Smuzhiyun * @size: max size of this file in file system
75*4882a593Smuzhiyun * @eof: offset used for SEEK_END position
76*4882a593Smuzhiyun *
77*4882a593Smuzhiyun * This is a variant of generic_file_llseek that allows passing in a custom
78*4882a593Smuzhiyun * maximum file size and a custom EOF position, for e.g. hashed directories
79*4882a593Smuzhiyun *
80*4882a593Smuzhiyun * Synchronization:
81*4882a593Smuzhiyun * SEEK_SET and SEEK_END are unsynchronized (but atomic on 64bit platforms)
82*4882a593Smuzhiyun * SEEK_CUR is synchronized against other SEEK_CURs, but not read/writes.
83*4882a593Smuzhiyun * read/writes behave like SEEK_SET against seeks.
84*4882a593Smuzhiyun */
85*4882a593Smuzhiyun loff_t
generic_file_llseek_size(struct file * file,loff_t offset,int whence,loff_t maxsize,loff_t eof)86*4882a593Smuzhiyun generic_file_llseek_size(struct file *file, loff_t offset, int whence,
87*4882a593Smuzhiyun loff_t maxsize, loff_t eof)
88*4882a593Smuzhiyun {
89*4882a593Smuzhiyun switch (whence) {
90*4882a593Smuzhiyun case SEEK_END:
91*4882a593Smuzhiyun offset += eof;
92*4882a593Smuzhiyun break;
93*4882a593Smuzhiyun case SEEK_CUR:
94*4882a593Smuzhiyun /*
95*4882a593Smuzhiyun * Here we special-case the lseek(fd, 0, SEEK_CUR)
96*4882a593Smuzhiyun * position-querying operation. Avoid rewriting the "same"
97*4882a593Smuzhiyun * f_pos value back to the file because a concurrent read(),
98*4882a593Smuzhiyun * write() or lseek() might have altered it
99*4882a593Smuzhiyun */
100*4882a593Smuzhiyun if (offset == 0)
101*4882a593Smuzhiyun return file->f_pos;
102*4882a593Smuzhiyun /*
103*4882a593Smuzhiyun * f_lock protects against read/modify/write race with other
104*4882a593Smuzhiyun * SEEK_CURs. Note that parallel writes and reads behave
105*4882a593Smuzhiyun * like SEEK_SET.
106*4882a593Smuzhiyun */
107*4882a593Smuzhiyun spin_lock(&file->f_lock);
108*4882a593Smuzhiyun offset = vfs_setpos(file, file->f_pos + offset, maxsize);
109*4882a593Smuzhiyun spin_unlock(&file->f_lock);
110*4882a593Smuzhiyun return offset;
111*4882a593Smuzhiyun case SEEK_DATA:
112*4882a593Smuzhiyun /*
113*4882a593Smuzhiyun * In the generic case the entire file is data, so as long as
114*4882a593Smuzhiyun * offset isn't at the end of the file then the offset is data.
115*4882a593Smuzhiyun */
116*4882a593Smuzhiyun if ((unsigned long long)offset >= eof)
117*4882a593Smuzhiyun return -ENXIO;
118*4882a593Smuzhiyun break;
119*4882a593Smuzhiyun case SEEK_HOLE:
120*4882a593Smuzhiyun /*
121*4882a593Smuzhiyun * There is a virtual hole at the end of the file, so as long as
122*4882a593Smuzhiyun * offset isn't i_size or larger, return i_size.
123*4882a593Smuzhiyun */
124*4882a593Smuzhiyun if ((unsigned long long)offset >= eof)
125*4882a593Smuzhiyun return -ENXIO;
126*4882a593Smuzhiyun offset = eof;
127*4882a593Smuzhiyun break;
128*4882a593Smuzhiyun }
129*4882a593Smuzhiyun
130*4882a593Smuzhiyun return vfs_setpos(file, offset, maxsize);
131*4882a593Smuzhiyun }
132*4882a593Smuzhiyun EXPORT_SYMBOL(generic_file_llseek_size);
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun /**
135*4882a593Smuzhiyun * generic_file_llseek - generic llseek implementation for regular files
136*4882a593Smuzhiyun * @file: file structure to seek on
137*4882a593Smuzhiyun * @offset: file offset to seek to
138*4882a593Smuzhiyun * @whence: type of seek
139*4882a593Smuzhiyun *
140*4882a593Smuzhiyun * This is a generic implemenation of ->llseek useable for all normal local
141*4882a593Smuzhiyun * filesystems. It just updates the file offset to the value specified by
142*4882a593Smuzhiyun * @offset and @whence.
143*4882a593Smuzhiyun */
generic_file_llseek(struct file * file,loff_t offset,int whence)144*4882a593Smuzhiyun loff_t generic_file_llseek(struct file *file, loff_t offset, int whence)
145*4882a593Smuzhiyun {
146*4882a593Smuzhiyun struct inode *inode = file->f_mapping->host;
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun return generic_file_llseek_size(file, offset, whence,
149*4882a593Smuzhiyun inode->i_sb->s_maxbytes,
150*4882a593Smuzhiyun i_size_read(inode));
151*4882a593Smuzhiyun }
152*4882a593Smuzhiyun EXPORT_SYMBOL(generic_file_llseek);
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun /**
155*4882a593Smuzhiyun * fixed_size_llseek - llseek implementation for fixed-sized devices
156*4882a593Smuzhiyun * @file: file structure to seek on
157*4882a593Smuzhiyun * @offset: file offset to seek to
158*4882a593Smuzhiyun * @whence: type of seek
159*4882a593Smuzhiyun * @size: size of the file
160*4882a593Smuzhiyun *
161*4882a593Smuzhiyun */
fixed_size_llseek(struct file * file,loff_t offset,int whence,loff_t size)162*4882a593Smuzhiyun loff_t fixed_size_llseek(struct file *file, loff_t offset, int whence, loff_t size)
163*4882a593Smuzhiyun {
164*4882a593Smuzhiyun switch (whence) {
165*4882a593Smuzhiyun case SEEK_SET: case SEEK_CUR: case SEEK_END:
166*4882a593Smuzhiyun return generic_file_llseek_size(file, offset, whence,
167*4882a593Smuzhiyun size, size);
168*4882a593Smuzhiyun default:
169*4882a593Smuzhiyun return -EINVAL;
170*4882a593Smuzhiyun }
171*4882a593Smuzhiyun }
172*4882a593Smuzhiyun EXPORT_SYMBOL(fixed_size_llseek);
173*4882a593Smuzhiyun
174*4882a593Smuzhiyun /**
175*4882a593Smuzhiyun * no_seek_end_llseek - llseek implementation for fixed-sized devices
176*4882a593Smuzhiyun * @file: file structure to seek on
177*4882a593Smuzhiyun * @offset: file offset to seek to
178*4882a593Smuzhiyun * @whence: type of seek
179*4882a593Smuzhiyun *
180*4882a593Smuzhiyun */
no_seek_end_llseek(struct file * file,loff_t offset,int whence)181*4882a593Smuzhiyun loff_t no_seek_end_llseek(struct file *file, loff_t offset, int whence)
182*4882a593Smuzhiyun {
183*4882a593Smuzhiyun switch (whence) {
184*4882a593Smuzhiyun case SEEK_SET: case SEEK_CUR:
185*4882a593Smuzhiyun return generic_file_llseek_size(file, offset, whence,
186*4882a593Smuzhiyun OFFSET_MAX, 0);
187*4882a593Smuzhiyun default:
188*4882a593Smuzhiyun return -EINVAL;
189*4882a593Smuzhiyun }
190*4882a593Smuzhiyun }
191*4882a593Smuzhiyun EXPORT_SYMBOL(no_seek_end_llseek);
192*4882a593Smuzhiyun
193*4882a593Smuzhiyun /**
194*4882a593Smuzhiyun * no_seek_end_llseek_size - llseek implementation for fixed-sized devices
195*4882a593Smuzhiyun * @file: file structure to seek on
196*4882a593Smuzhiyun * @offset: file offset to seek to
197*4882a593Smuzhiyun * @whence: type of seek
198*4882a593Smuzhiyun * @size: maximal offset allowed
199*4882a593Smuzhiyun *
200*4882a593Smuzhiyun */
no_seek_end_llseek_size(struct file * file,loff_t offset,int whence,loff_t size)201*4882a593Smuzhiyun loff_t no_seek_end_llseek_size(struct file *file, loff_t offset, int whence, loff_t size)
202*4882a593Smuzhiyun {
203*4882a593Smuzhiyun switch (whence) {
204*4882a593Smuzhiyun case SEEK_SET: case SEEK_CUR:
205*4882a593Smuzhiyun return generic_file_llseek_size(file, offset, whence,
206*4882a593Smuzhiyun size, 0);
207*4882a593Smuzhiyun default:
208*4882a593Smuzhiyun return -EINVAL;
209*4882a593Smuzhiyun }
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun EXPORT_SYMBOL(no_seek_end_llseek_size);
212*4882a593Smuzhiyun
213*4882a593Smuzhiyun /**
214*4882a593Smuzhiyun * noop_llseek - No Operation Performed llseek implementation
215*4882a593Smuzhiyun * @file: file structure to seek on
216*4882a593Smuzhiyun * @offset: file offset to seek to
217*4882a593Smuzhiyun * @whence: type of seek
218*4882a593Smuzhiyun *
219*4882a593Smuzhiyun * This is an implementation of ->llseek useable for the rare special case when
220*4882a593Smuzhiyun * userspace expects the seek to succeed but the (device) file is actually not
221*4882a593Smuzhiyun * able to perform the seek. In this case you use noop_llseek() instead of
222*4882a593Smuzhiyun * falling back to the default implementation of ->llseek.
223*4882a593Smuzhiyun */
noop_llseek(struct file * file,loff_t offset,int whence)224*4882a593Smuzhiyun loff_t noop_llseek(struct file *file, loff_t offset, int whence)
225*4882a593Smuzhiyun {
226*4882a593Smuzhiyun return file->f_pos;
227*4882a593Smuzhiyun }
228*4882a593Smuzhiyun EXPORT_SYMBOL(noop_llseek);
229*4882a593Smuzhiyun
/* llseek implementation that refuses every seek: always returns -ESPIPE. */
loff_t no_llseek(struct file *file, loff_t offset, int whence)
{
	const loff_t err = -ESPIPE;

	return err;
}
EXPORT_SYMBOL(no_llseek);
235*4882a593Smuzhiyun
/*
 * default_llseek - llseek implementation that runs under the inode lock
 * @file:	file structure to seek on
 * @offset:	file offset to seek to
 * @whence:	type of seek
 *
 * Computes the target offset from @whence and stores it in f_pos (resetting
 * f_version) when it differs from the current position. A negative result
 * is accepted only for files with FMODE_UNSIGNED_OFFSET.
 *
 * Returns the resulting position, -ENXIO for SEEK_DATA/SEEK_HOLE at or past
 * i_size, or -EINVAL for a rejected negative offset.
 */
loff_t default_llseek(struct file *file, loff_t offset, int whence)
{
	struct inode *inode = file_inode(file);
	loff_t retval;

	inode_lock(inode);

	switch (whence) {
	case SEEK_CUR:
		/* A zero offset is a pure position query: nothing to store. */
		if (offset == 0) {
			retval = file->f_pos;
			goto out;
		}
		offset += file->f_pos;
		break;
	case SEEK_END:
		offset += i_size_read(inode);
		break;
	case SEEK_DATA:
	case SEEK_HOLE:
		/*
		 * In the generic case the whole file is data with a virtual
		 * hole at i_size: an offset below i_size is data, and the
		 * next hole after it is i_size.
		 */
		if (offset >= inode->i_size) {
			retval = -ENXIO;
			goto out;
		}
		if (whence == SEEK_HOLE)
			offset = inode->i_size;
		break;
	default:
		break;
	}

	if (offset < 0 && !unsigned_offsets(file)) {
		retval = -EINVAL;
		goto out;
	}

	if (offset != file->f_pos) {
		file->f_pos = offset;
		file->f_version = 0;
	}
	retval = offset;
out:
	inode_unlock(inode);
	return retval;
}
EXPORT_SYMBOL(default_llseek);
290*4882a593Smuzhiyun
/*
 * Dispatch a seek to the file's ->llseek method when FMODE_LSEEK is set and
 * the method exists; otherwise fall back to no_llseek().
 */
loff_t vfs_llseek(struct file *file, loff_t offset, int whence)
{
	if ((file->f_mode & FMODE_LSEEK) && file->f_op->llseek)
		return file->f_op->llseek(file, offset, whence);

	return no_llseek(file, offset, whence);
}
EXPORT_SYMBOL(vfs_llseek);
303*4882a593Smuzhiyun
/*
 * Common body of the lseek entry points: look up @fd, seek through
 * vfs_llseek() and narrow the loff_t result to off_t.
 *
 * Returns -EBADF when @fd has no file, -EINVAL when @whence exceeds
 * SEEK_MAX, and -EOVERFLOW when the result does not fit in off_t.
 */
static off_t ksys_lseek(unsigned int fd, off_t offset, unsigned int whence)
{
	struct fd f = fdget_pos(fd);
	off_t retval = -EINVAL;
	loff_t res;

	if (!f.file)
		return -EBADF;

	if (whence > SEEK_MAX)
		goto out;

	res = vfs_llseek(f.file, offset, whence);
	retval = res;
	/* LFS: should only happen on 32 bit platforms */
	if ((loff_t)retval != res)
		retval = -EOVERFLOW;
out:
	fdput_pos(f);
	return retval;
}
321*4882a593Smuzhiyun
/* lseek system call entry point; all work is done by ksys_lseek(). */
SYSCALL_DEFINE3(lseek, unsigned int, fd, off_t, offset, unsigned int, whence)
{
	return ksys_lseek(fd, offset, whence);
}
326*4882a593Smuzhiyun
#ifdef CONFIG_COMPAT
/* Compat lseek entry point: takes a compat_off_t and defers to ksys_lseek(). */
COMPAT_SYSCALL_DEFINE3(lseek, unsigned int, fd, compat_off_t, offset, unsigned int, whence)
{
	return ksys_lseek(fd, offset, whence);
}
#endif
333*4882a593Smuzhiyun
334*4882a593Smuzhiyun #if !defined(CONFIG_64BIT) || defined(CONFIG_COMPAT) || \
335*4882a593Smuzhiyun defined(__ARCH_WANT_SYS_LLSEEK)
SYSCALL_DEFINE5(llseek,unsigned int,fd,unsigned long,offset_high,unsigned long,offset_low,loff_t __user *,result,unsigned int,whence)336*4882a593Smuzhiyun SYSCALL_DEFINE5(llseek, unsigned int, fd, unsigned long, offset_high,
337*4882a593Smuzhiyun unsigned long, offset_low, loff_t __user *, result,
338*4882a593Smuzhiyun unsigned int, whence)
339*4882a593Smuzhiyun {
340*4882a593Smuzhiyun int retval;
341*4882a593Smuzhiyun struct fd f = fdget_pos(fd);
342*4882a593Smuzhiyun loff_t offset;
343*4882a593Smuzhiyun
344*4882a593Smuzhiyun if (!f.file)
345*4882a593Smuzhiyun return -EBADF;
346*4882a593Smuzhiyun
347*4882a593Smuzhiyun retval = -EINVAL;
348*4882a593Smuzhiyun if (whence > SEEK_MAX)
349*4882a593Smuzhiyun goto out_putf;
350*4882a593Smuzhiyun
351*4882a593Smuzhiyun offset = vfs_llseek(f.file, ((loff_t) offset_high << 32) | offset_low,
352*4882a593Smuzhiyun whence);
353*4882a593Smuzhiyun
354*4882a593Smuzhiyun retval = (int)offset;
355*4882a593Smuzhiyun if (offset >= 0) {
356*4882a593Smuzhiyun retval = -EFAULT;
357*4882a593Smuzhiyun if (!copy_to_user(result, &offset, sizeof(offset)))
358*4882a593Smuzhiyun retval = 0;
359*4882a593Smuzhiyun }
360*4882a593Smuzhiyun out_putf:
361*4882a593Smuzhiyun fdput_pos(f);
362*4882a593Smuzhiyun return retval;
363*4882a593Smuzhiyun }
364*4882a593Smuzhiyun #endif
365*4882a593Smuzhiyun
/*
 * rw_verify_area - validate a read or write request before it is issued
 * @read_write:	READ or WRITE
 * @file:	file the I/O targets
 * @ppos:	position of the I/O, or NULL when no position applies
 * @count:	number of bytes requested
 *
 * Rejects a @count that is negative when viewed as ssize_t, rejects
 * negative or wrapping positions unless the file uses unsigned offsets,
 * consults mandatory locks when the inode has a lock context with mandatory
 * locking, and finally asks the security layer for permission.
 *
 * Returns 0 or a positive value from security_file_permission() on success,
 * otherwise a negative errno.
 */
int rw_verify_area(int read_write, struct file *file, const loff_t *ppos, size_t count)
{
	struct inode *inode = file_inode(file);
	bool reading = (read_write == READ);

	if (unlikely((ssize_t) count < 0))
		return -EINVAL;

	/*
	 * Ranged mandatory locking does not apply to streams - it only makes
	 * sense for files where the position has a meaning.
	 */
	if (ppos) {
		loff_t pos = *ppos;

		if (unlikely(pos < 0)) {
			if (!unsigned_offsets(file))
				return -EINVAL;
			if (count >= -pos) /* both values are in 0..LLONG_MAX */
				return -EOVERFLOW;
		} else if (unlikely((loff_t) (pos + count) < 0)) {
			if (!unsigned_offsets(file))
				return -EINVAL;
		}

		if (unlikely(inode->i_flctx && mandatory_lock(inode))) {
			int err = locks_mandatory_area(inode, file, pos,
					pos + count - 1,
					reading ? F_RDLCK : F_WRLCK);

			if (err < 0)
				return err;
		}
	}

	return security_file_permission(file, reading ? MAY_READ : MAY_WRITE);
}
403*4882a593Smuzhiyun
new_sync_read(struct file * filp,char __user * buf,size_t len,loff_t * ppos)404*4882a593Smuzhiyun static ssize_t new_sync_read(struct file *filp, char __user *buf, size_t len, loff_t *ppos)
405*4882a593Smuzhiyun {
406*4882a593Smuzhiyun struct iovec iov = { .iov_base = buf, .iov_len = len };
407*4882a593Smuzhiyun struct kiocb kiocb;
408*4882a593Smuzhiyun struct iov_iter iter;
409*4882a593Smuzhiyun ssize_t ret;
410*4882a593Smuzhiyun
411*4882a593Smuzhiyun init_sync_kiocb(&kiocb, filp);
412*4882a593Smuzhiyun kiocb.ki_pos = (ppos ? *ppos : 0);
413*4882a593Smuzhiyun iov_iter_init(&iter, READ, &iov, 1, len);
414*4882a593Smuzhiyun
415*4882a593Smuzhiyun ret = call_read_iter(filp, &kiocb, &iter);
416*4882a593Smuzhiyun BUG_ON(ret == -EIOCBQUEUED);
417*4882a593Smuzhiyun if (ppos)
418*4882a593Smuzhiyun *ppos = kiocb.ki_pos;
419*4882a593Smuzhiyun return ret;
420*4882a593Smuzhiyun }
421*4882a593Smuzhiyun
warn_unsupported(struct file * file,const char * op)422*4882a593Smuzhiyun static int warn_unsupported(struct file *file, const char *op)
423*4882a593Smuzhiyun {
424*4882a593Smuzhiyun pr_warn_ratelimited(
425*4882a593Smuzhiyun "kernel %s not supported for file %pD4 (pid: %d comm: %.20s)\n",
426*4882a593Smuzhiyun op, file, current->pid, current->comm);
427*4882a593Smuzhiyun return -EINVAL;
428*4882a593Smuzhiyun }
429*4882a593Smuzhiyun
__kernel_read(struct file * file,void * buf,size_t count,loff_t * pos)430*4882a593Smuzhiyun ssize_t __kernel_read(struct file *file, void *buf, size_t count, loff_t *pos)
431*4882a593Smuzhiyun {
432*4882a593Smuzhiyun struct kvec iov = {
433*4882a593Smuzhiyun .iov_base = buf,
434*4882a593Smuzhiyun .iov_len = min_t(size_t, count, MAX_RW_COUNT),
435*4882a593Smuzhiyun };
436*4882a593Smuzhiyun struct kiocb kiocb;
437*4882a593Smuzhiyun struct iov_iter iter;
438*4882a593Smuzhiyun ssize_t ret;
439*4882a593Smuzhiyun
440*4882a593Smuzhiyun if (WARN_ON_ONCE(!(file->f_mode & FMODE_READ)))
441*4882a593Smuzhiyun return -EINVAL;
442*4882a593Smuzhiyun if (!(file->f_mode & FMODE_CAN_READ))
443*4882a593Smuzhiyun return -EINVAL;
444*4882a593Smuzhiyun /*
445*4882a593Smuzhiyun * Also fail if ->read_iter and ->read are both wired up as that
446*4882a593Smuzhiyun * implies very convoluted semantics.
447*4882a593Smuzhiyun */
448*4882a593Smuzhiyun if (unlikely(!file->f_op->read_iter || file->f_op->read))
449*4882a593Smuzhiyun return warn_unsupported(file, "read");
450*4882a593Smuzhiyun
451*4882a593Smuzhiyun init_sync_kiocb(&kiocb, file);
452*4882a593Smuzhiyun kiocb.ki_pos = pos ? *pos : 0;
453*4882a593Smuzhiyun iov_iter_kvec(&iter, READ, &iov, 1, iov.iov_len);
454*4882a593Smuzhiyun ret = file->f_op->read_iter(&kiocb, &iter);
455*4882a593Smuzhiyun if (ret > 0) {
456*4882a593Smuzhiyun if (pos)
457*4882a593Smuzhiyun *pos = kiocb.ki_pos;
458*4882a593Smuzhiyun fsnotify_access(file);
459*4882a593Smuzhiyun add_rchar(current, ret);
460*4882a593Smuzhiyun }
461*4882a593Smuzhiyun inc_syscr(current);
462*4882a593Smuzhiyun return ret;
463*4882a593Smuzhiyun }
464*4882a593Smuzhiyun
kernel_read(struct file * file,void * buf,size_t count,loff_t * pos)465*4882a593Smuzhiyun ssize_t kernel_read(struct file *file, void *buf, size_t count, loff_t *pos)
466*4882a593Smuzhiyun {
467*4882a593Smuzhiyun ssize_t ret;
468*4882a593Smuzhiyun
469*4882a593Smuzhiyun ret = rw_verify_area(READ, file, pos, count);
470*4882a593Smuzhiyun if (ret)
471*4882a593Smuzhiyun return ret;
472*4882a593Smuzhiyun return __kernel_read(file, buf, count, pos);
473*4882a593Smuzhiyun }
474*4882a593Smuzhiyun EXPORT_SYMBOL_NS(kernel_read, ANDROID_GKI_VFS_EXPORT_ONLY);
475*4882a593Smuzhiyun
vfs_read(struct file * file,char __user * buf,size_t count,loff_t * pos)476*4882a593Smuzhiyun ssize_t vfs_read(struct file *file, char __user *buf, size_t count, loff_t *pos)
477*4882a593Smuzhiyun {
478*4882a593Smuzhiyun ssize_t ret;
479*4882a593Smuzhiyun
480*4882a593Smuzhiyun if (!(file->f_mode & FMODE_READ))
481*4882a593Smuzhiyun return -EBADF;
482*4882a593Smuzhiyun if (!(file->f_mode & FMODE_CAN_READ))
483*4882a593Smuzhiyun return -EINVAL;
484*4882a593Smuzhiyun if (unlikely(!access_ok(buf, count)))
485*4882a593Smuzhiyun return -EFAULT;
486*4882a593Smuzhiyun
487*4882a593Smuzhiyun ret = rw_verify_area(READ, file, pos, count);
488*4882a593Smuzhiyun if (ret)
489*4882a593Smuzhiyun return ret;
490*4882a593Smuzhiyun if (count > MAX_RW_COUNT)
491*4882a593Smuzhiyun count = MAX_RW_COUNT;
492*4882a593Smuzhiyun
493*4882a593Smuzhiyun if (file->f_op->read)
494*4882a593Smuzhiyun ret = file->f_op->read(file, buf, count, pos);
495*4882a593Smuzhiyun else if (file->f_op->read_iter)
496*4882a593Smuzhiyun ret = new_sync_read(file, buf, count, pos);
497*4882a593Smuzhiyun else
498*4882a593Smuzhiyun ret = -EINVAL;
499*4882a593Smuzhiyun if (ret > 0) {
500*4882a593Smuzhiyun fsnotify_access(file);
501*4882a593Smuzhiyun add_rchar(current, ret);
502*4882a593Smuzhiyun }
503*4882a593Smuzhiyun inc_syscr(current);
504*4882a593Smuzhiyun return ret;
505*4882a593Smuzhiyun }
506*4882a593Smuzhiyun
new_sync_write(struct file * filp,const char __user * buf,size_t len,loff_t * ppos)507*4882a593Smuzhiyun static ssize_t new_sync_write(struct file *filp, const char __user *buf, size_t len, loff_t *ppos)
508*4882a593Smuzhiyun {
509*4882a593Smuzhiyun struct iovec iov = { .iov_base = (void __user *)buf, .iov_len = len };
510*4882a593Smuzhiyun struct kiocb kiocb;
511*4882a593Smuzhiyun struct iov_iter iter;
512*4882a593Smuzhiyun ssize_t ret;
513*4882a593Smuzhiyun
514*4882a593Smuzhiyun init_sync_kiocb(&kiocb, filp);
515*4882a593Smuzhiyun kiocb.ki_pos = (ppos ? *ppos : 0);
516*4882a593Smuzhiyun iov_iter_init(&iter, WRITE, &iov, 1, len);
517*4882a593Smuzhiyun
518*4882a593Smuzhiyun ret = call_write_iter(filp, &kiocb, &iter);
519*4882a593Smuzhiyun BUG_ON(ret == -EIOCBQUEUED);
520*4882a593Smuzhiyun if (ret > 0 && ppos)
521*4882a593Smuzhiyun *ppos = kiocb.ki_pos;
522*4882a593Smuzhiyun return ret;
523*4882a593Smuzhiyun }
524*4882a593Smuzhiyun
525*4882a593Smuzhiyun /* caller is responsible for file_start_write/file_end_write */
__kernel_write(struct file * file,const void * buf,size_t count,loff_t * pos)526*4882a593Smuzhiyun ssize_t __kernel_write(struct file *file, const void *buf, size_t count, loff_t *pos)
527*4882a593Smuzhiyun {
528*4882a593Smuzhiyun struct kvec iov = {
529*4882a593Smuzhiyun .iov_base = (void *)buf,
530*4882a593Smuzhiyun .iov_len = min_t(size_t, count, MAX_RW_COUNT),
531*4882a593Smuzhiyun };
532*4882a593Smuzhiyun struct kiocb kiocb;
533*4882a593Smuzhiyun struct iov_iter iter;
534*4882a593Smuzhiyun ssize_t ret;
535*4882a593Smuzhiyun
536*4882a593Smuzhiyun if (WARN_ON_ONCE(!(file->f_mode & FMODE_WRITE)))
537*4882a593Smuzhiyun return -EBADF;
538*4882a593Smuzhiyun if (!(file->f_mode & FMODE_CAN_WRITE))
539*4882a593Smuzhiyun return -EINVAL;
540*4882a593Smuzhiyun /*
541*4882a593Smuzhiyun * Also fail if ->write_iter and ->write are both wired up as that
542*4882a593Smuzhiyun * implies very convoluted semantics.
543*4882a593Smuzhiyun */
544*4882a593Smuzhiyun if (unlikely(!file->f_op->write_iter || file->f_op->write))
545*4882a593Smuzhiyun return warn_unsupported(file, "write");
546*4882a593Smuzhiyun
547*4882a593Smuzhiyun init_sync_kiocb(&kiocb, file);
548*4882a593Smuzhiyun kiocb.ki_pos = pos ? *pos : 0;
549*4882a593Smuzhiyun iov_iter_kvec(&iter, WRITE, &iov, 1, iov.iov_len);
550*4882a593Smuzhiyun ret = file->f_op->write_iter(&kiocb, &iter);
551*4882a593Smuzhiyun if (ret > 0) {
552*4882a593Smuzhiyun if (pos)
553*4882a593Smuzhiyun *pos = kiocb.ki_pos;
554*4882a593Smuzhiyun fsnotify_modify(file);
555*4882a593Smuzhiyun add_wchar(current, ret);
556*4882a593Smuzhiyun }
557*4882a593Smuzhiyun inc_syscw(current);
558*4882a593Smuzhiyun return ret;
559*4882a593Smuzhiyun }
560*4882a593Smuzhiyun /*
561*4882a593Smuzhiyun * This "EXPORT_SYMBOL_GPL()" is more of a "EXPORT_SYMBOL_DONTUSE()",
562*4882a593Smuzhiyun * but autofs is one of the few internal kernel users that actually
563*4882a593Smuzhiyun * wants this _and_ can be built as a module. So we need to export
564*4882a593Smuzhiyun * this symbol for autofs, even though it really isn't appropriate
565*4882a593Smuzhiyun * for any other kernel modules.
566*4882a593Smuzhiyun */
567*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(__kernel_write);
568*4882a593Smuzhiyun
kernel_write(struct file * file,const void * buf,size_t count,loff_t * pos)569*4882a593Smuzhiyun ssize_t kernel_write(struct file *file, const void *buf, size_t count,
570*4882a593Smuzhiyun loff_t *pos)
571*4882a593Smuzhiyun {
572*4882a593Smuzhiyun ssize_t ret;
573*4882a593Smuzhiyun
574*4882a593Smuzhiyun ret = rw_verify_area(WRITE, file, pos, count);
575*4882a593Smuzhiyun if (ret)
576*4882a593Smuzhiyun return ret;
577*4882a593Smuzhiyun
578*4882a593Smuzhiyun file_start_write(file);
579*4882a593Smuzhiyun ret = __kernel_write(file, buf, count, pos);
580*4882a593Smuzhiyun file_end_write(file);
581*4882a593Smuzhiyun return ret;
582*4882a593Smuzhiyun }
583*4882a593Smuzhiyun EXPORT_SYMBOL_NS(kernel_write, ANDROID_GKI_VFS_EXPORT_ONLY);
584*4882a593Smuzhiyun
vfs_write(struct file * file,const char __user * buf,size_t count,loff_t * pos)585*4882a593Smuzhiyun ssize_t vfs_write(struct file *file, const char __user *buf, size_t count, loff_t *pos)
586*4882a593Smuzhiyun {
587*4882a593Smuzhiyun ssize_t ret;
588*4882a593Smuzhiyun
589*4882a593Smuzhiyun if (!(file->f_mode & FMODE_WRITE))
590*4882a593Smuzhiyun return -EBADF;
591*4882a593Smuzhiyun if (!(file->f_mode & FMODE_CAN_WRITE))
592*4882a593Smuzhiyun return -EINVAL;
593*4882a593Smuzhiyun if (unlikely(!access_ok(buf, count)))
594*4882a593Smuzhiyun return -EFAULT;
595*4882a593Smuzhiyun
596*4882a593Smuzhiyun ret = rw_verify_area(WRITE, file, pos, count);
597*4882a593Smuzhiyun if (ret)
598*4882a593Smuzhiyun return ret;
599*4882a593Smuzhiyun if (count > MAX_RW_COUNT)
600*4882a593Smuzhiyun count = MAX_RW_COUNT;
601*4882a593Smuzhiyun file_start_write(file);
602*4882a593Smuzhiyun if (file->f_op->write)
603*4882a593Smuzhiyun ret = file->f_op->write(file, buf, count, pos);
604*4882a593Smuzhiyun else if (file->f_op->write_iter)
605*4882a593Smuzhiyun ret = new_sync_write(file, buf, count, pos);
606*4882a593Smuzhiyun else
607*4882a593Smuzhiyun ret = -EINVAL;
608*4882a593Smuzhiyun if (ret > 0) {
609*4882a593Smuzhiyun fsnotify_modify(file);
610*4882a593Smuzhiyun add_wchar(current, ret);
611*4882a593Smuzhiyun }
612*4882a593Smuzhiyun inc_syscw(current);
613*4882a593Smuzhiyun file_end_write(file);
614*4882a593Smuzhiyun return ret;
615*4882a593Smuzhiyun }
616*4882a593Smuzhiyun
617*4882a593Smuzhiyun /* file_ppos returns &file->f_pos or NULL if file is stream */
file_ppos(struct file * file)618*4882a593Smuzhiyun static inline loff_t *file_ppos(struct file *file)
619*4882a593Smuzhiyun {
620*4882a593Smuzhiyun return file->f_mode & FMODE_STREAM ? NULL : &file->f_pos;
621*4882a593Smuzhiyun }
622*4882a593Smuzhiyun
ksys_read(unsigned int fd,char __user * buf,size_t count)623*4882a593Smuzhiyun ssize_t ksys_read(unsigned int fd, char __user *buf, size_t count)
624*4882a593Smuzhiyun {
625*4882a593Smuzhiyun struct fd f = fdget_pos(fd);
626*4882a593Smuzhiyun ssize_t ret = -EBADF;
627*4882a593Smuzhiyun
628*4882a593Smuzhiyun if (f.file) {
629*4882a593Smuzhiyun loff_t pos, *ppos = file_ppos(f.file);
630*4882a593Smuzhiyun if (ppos) {
631*4882a593Smuzhiyun pos = *ppos;
632*4882a593Smuzhiyun ppos = &pos;
633*4882a593Smuzhiyun }
634*4882a593Smuzhiyun ret = vfs_read(f.file, buf, count, ppos);
635*4882a593Smuzhiyun if (ret >= 0 && ppos)
636*4882a593Smuzhiyun f.file->f_pos = pos;
637*4882a593Smuzhiyun fdput_pos(f);
638*4882a593Smuzhiyun }
639*4882a593Smuzhiyun return ret;
640*4882a593Smuzhiyun }
641*4882a593Smuzhiyun
/* read system call entry point; all work is done by ksys_read(). */
SYSCALL_DEFINE3(read, unsigned int, fd, char __user *, buf, size_t, count)
{
	return ksys_read(fd, buf, count);
}
646*4882a593Smuzhiyun
ksys_write(unsigned int fd,const char __user * buf,size_t count)647*4882a593Smuzhiyun ssize_t ksys_write(unsigned int fd, const char __user *buf, size_t count)
648*4882a593Smuzhiyun {
649*4882a593Smuzhiyun struct fd f = fdget_pos(fd);
650*4882a593Smuzhiyun ssize_t ret = -EBADF;
651*4882a593Smuzhiyun
652*4882a593Smuzhiyun if (f.file) {
653*4882a593Smuzhiyun loff_t pos, *ppos = file_ppos(f.file);
654*4882a593Smuzhiyun if (ppos) {
655*4882a593Smuzhiyun pos = *ppos;
656*4882a593Smuzhiyun ppos = &pos;
657*4882a593Smuzhiyun }
658*4882a593Smuzhiyun ret = vfs_write(f.file, buf, count, ppos);
659*4882a593Smuzhiyun if (ret >= 0 && ppos)
660*4882a593Smuzhiyun f.file->f_pos = pos;
661*4882a593Smuzhiyun fdput_pos(f);
662*4882a593Smuzhiyun }
663*4882a593Smuzhiyun
664*4882a593Smuzhiyun return ret;
665*4882a593Smuzhiyun }
666*4882a593Smuzhiyun
/* write system call: passes its arguments straight to ksys_write(). */
SYSCALL_DEFINE3(write, unsigned int, fd, const char __user *, buf,
		size_t, count)
{
	return ksys_write(fd, buf, count);
}
672*4882a593Smuzhiyun
ksys_pread64(unsigned int fd,char __user * buf,size_t count,loff_t pos)673*4882a593Smuzhiyun ssize_t ksys_pread64(unsigned int fd, char __user *buf, size_t count,
674*4882a593Smuzhiyun loff_t pos)
675*4882a593Smuzhiyun {
676*4882a593Smuzhiyun struct fd f;
677*4882a593Smuzhiyun ssize_t ret = -EBADF;
678*4882a593Smuzhiyun
679*4882a593Smuzhiyun if (pos < 0)
680*4882a593Smuzhiyun return -EINVAL;
681*4882a593Smuzhiyun
682*4882a593Smuzhiyun f = fdget(fd);
683*4882a593Smuzhiyun if (f.file) {
684*4882a593Smuzhiyun ret = -ESPIPE;
685*4882a593Smuzhiyun if (f.file->f_mode & FMODE_PREAD)
686*4882a593Smuzhiyun ret = vfs_read(f.file, buf, count, &pos);
687*4882a593Smuzhiyun fdput(f);
688*4882a593Smuzhiyun }
689*4882a593Smuzhiyun
690*4882a593Smuzhiyun return ret;
691*4882a593Smuzhiyun }
692*4882a593Smuzhiyun
/* pread64 system call: passes its arguments straight to ksys_pread64(). */
SYSCALL_DEFINE4(pread64, unsigned int, fd, char __user *, buf,
		size_t, count, loff_t, pos)
{
	return ksys_pread64(fd, buf, count, pos);
}
698*4882a593Smuzhiyun
ksys_pwrite64(unsigned int fd,const char __user * buf,size_t count,loff_t pos)699*4882a593Smuzhiyun ssize_t ksys_pwrite64(unsigned int fd, const char __user *buf,
700*4882a593Smuzhiyun size_t count, loff_t pos)
701*4882a593Smuzhiyun {
702*4882a593Smuzhiyun struct fd f;
703*4882a593Smuzhiyun ssize_t ret = -EBADF;
704*4882a593Smuzhiyun
705*4882a593Smuzhiyun if (pos < 0)
706*4882a593Smuzhiyun return -EINVAL;
707*4882a593Smuzhiyun
708*4882a593Smuzhiyun f = fdget(fd);
709*4882a593Smuzhiyun if (f.file) {
710*4882a593Smuzhiyun ret = -ESPIPE;
711*4882a593Smuzhiyun if (f.file->f_mode & FMODE_PWRITE)
712*4882a593Smuzhiyun ret = vfs_write(f.file, buf, count, &pos);
713*4882a593Smuzhiyun fdput(f);
714*4882a593Smuzhiyun }
715*4882a593Smuzhiyun
716*4882a593Smuzhiyun return ret;
717*4882a593Smuzhiyun }
718*4882a593Smuzhiyun
/* pwrite64 system call: passes its arguments straight to ksys_pwrite64(). */
SYSCALL_DEFINE4(pwrite64, unsigned int, fd, const char __user *, buf,
		size_t, count, loff_t, pos)
{
	return ksys_pwrite64(fd, buf, count, pos);
}
724*4882a593Smuzhiyun
do_iter_readv_writev(struct file * filp,struct iov_iter * iter,loff_t * ppos,int type,rwf_t flags)725*4882a593Smuzhiyun static ssize_t do_iter_readv_writev(struct file *filp, struct iov_iter *iter,
726*4882a593Smuzhiyun loff_t *ppos, int type, rwf_t flags)
727*4882a593Smuzhiyun {
728*4882a593Smuzhiyun struct kiocb kiocb;
729*4882a593Smuzhiyun ssize_t ret;
730*4882a593Smuzhiyun
731*4882a593Smuzhiyun init_sync_kiocb(&kiocb, filp);
732*4882a593Smuzhiyun ret = kiocb_set_rw_flags(&kiocb, flags);
733*4882a593Smuzhiyun if (ret)
734*4882a593Smuzhiyun return ret;
735*4882a593Smuzhiyun kiocb.ki_pos = (ppos ? *ppos : 0);
736*4882a593Smuzhiyun
737*4882a593Smuzhiyun if (type == READ)
738*4882a593Smuzhiyun ret = call_read_iter(filp, &kiocb, iter);
739*4882a593Smuzhiyun else
740*4882a593Smuzhiyun ret = call_write_iter(filp, &kiocb, iter);
741*4882a593Smuzhiyun BUG_ON(ret == -EIOCBQUEUED);
742*4882a593Smuzhiyun if (ppos)
743*4882a593Smuzhiyun *ppos = kiocb.ki_pos;
744*4882a593Smuzhiyun return ret;
745*4882a593Smuzhiyun }
746*4882a593Smuzhiyun
747*4882a593Smuzhiyun /* Do it by hand, with file-ops */
do_loop_readv_writev(struct file * filp,struct iov_iter * iter,loff_t * ppos,int type,rwf_t flags)748*4882a593Smuzhiyun static ssize_t do_loop_readv_writev(struct file *filp, struct iov_iter *iter,
749*4882a593Smuzhiyun loff_t *ppos, int type, rwf_t flags)
750*4882a593Smuzhiyun {
751*4882a593Smuzhiyun ssize_t ret = 0;
752*4882a593Smuzhiyun
753*4882a593Smuzhiyun if (flags & ~RWF_HIPRI)
754*4882a593Smuzhiyun return -EOPNOTSUPP;
755*4882a593Smuzhiyun
756*4882a593Smuzhiyun while (iov_iter_count(iter)) {
757*4882a593Smuzhiyun struct iovec iovec = iov_iter_iovec(iter);
758*4882a593Smuzhiyun ssize_t nr;
759*4882a593Smuzhiyun
760*4882a593Smuzhiyun if (type == READ) {
761*4882a593Smuzhiyun nr = filp->f_op->read(filp, iovec.iov_base,
762*4882a593Smuzhiyun iovec.iov_len, ppos);
763*4882a593Smuzhiyun } else {
764*4882a593Smuzhiyun nr = filp->f_op->write(filp, iovec.iov_base,
765*4882a593Smuzhiyun iovec.iov_len, ppos);
766*4882a593Smuzhiyun }
767*4882a593Smuzhiyun
768*4882a593Smuzhiyun if (nr < 0) {
769*4882a593Smuzhiyun if (!ret)
770*4882a593Smuzhiyun ret = nr;
771*4882a593Smuzhiyun break;
772*4882a593Smuzhiyun }
773*4882a593Smuzhiyun ret += nr;
774*4882a593Smuzhiyun if (nr != iovec.iov_len)
775*4882a593Smuzhiyun break;
776*4882a593Smuzhiyun iov_iter_advance(iter, nr);
777*4882a593Smuzhiyun }
778*4882a593Smuzhiyun
779*4882a593Smuzhiyun return ret;
780*4882a593Smuzhiyun }
781*4882a593Smuzhiyun
do_iter_read(struct file * file,struct iov_iter * iter,loff_t * pos,rwf_t flags)782*4882a593Smuzhiyun static ssize_t do_iter_read(struct file *file, struct iov_iter *iter,
783*4882a593Smuzhiyun loff_t *pos, rwf_t flags)
784*4882a593Smuzhiyun {
785*4882a593Smuzhiyun size_t tot_len;
786*4882a593Smuzhiyun ssize_t ret = 0;
787*4882a593Smuzhiyun
788*4882a593Smuzhiyun if (!(file->f_mode & FMODE_READ))
789*4882a593Smuzhiyun return -EBADF;
790*4882a593Smuzhiyun if (!(file->f_mode & FMODE_CAN_READ))
791*4882a593Smuzhiyun return -EINVAL;
792*4882a593Smuzhiyun
793*4882a593Smuzhiyun tot_len = iov_iter_count(iter);
794*4882a593Smuzhiyun if (!tot_len)
795*4882a593Smuzhiyun goto out;
796*4882a593Smuzhiyun ret = rw_verify_area(READ, file, pos, tot_len);
797*4882a593Smuzhiyun if (ret < 0)
798*4882a593Smuzhiyun return ret;
799*4882a593Smuzhiyun
800*4882a593Smuzhiyun if (file->f_op->read_iter)
801*4882a593Smuzhiyun ret = do_iter_readv_writev(file, iter, pos, READ, flags);
802*4882a593Smuzhiyun else
803*4882a593Smuzhiyun ret = do_loop_readv_writev(file, iter, pos, READ, flags);
804*4882a593Smuzhiyun out:
805*4882a593Smuzhiyun if (ret >= 0)
806*4882a593Smuzhiyun fsnotify_access(file);
807*4882a593Smuzhiyun return ret;
808*4882a593Smuzhiyun }
809*4882a593Smuzhiyun
vfs_iocb_iter_read(struct file * file,struct kiocb * iocb,struct iov_iter * iter)810*4882a593Smuzhiyun ssize_t vfs_iocb_iter_read(struct file *file, struct kiocb *iocb,
811*4882a593Smuzhiyun struct iov_iter *iter)
812*4882a593Smuzhiyun {
813*4882a593Smuzhiyun size_t tot_len;
814*4882a593Smuzhiyun ssize_t ret = 0;
815*4882a593Smuzhiyun
816*4882a593Smuzhiyun if (!file->f_op->read_iter)
817*4882a593Smuzhiyun return -EINVAL;
818*4882a593Smuzhiyun if (!(file->f_mode & FMODE_READ))
819*4882a593Smuzhiyun return -EBADF;
820*4882a593Smuzhiyun if (!(file->f_mode & FMODE_CAN_READ))
821*4882a593Smuzhiyun return -EINVAL;
822*4882a593Smuzhiyun
823*4882a593Smuzhiyun tot_len = iov_iter_count(iter);
824*4882a593Smuzhiyun if (!tot_len)
825*4882a593Smuzhiyun goto out;
826*4882a593Smuzhiyun ret = rw_verify_area(READ, file, &iocb->ki_pos, tot_len);
827*4882a593Smuzhiyun if (ret < 0)
828*4882a593Smuzhiyun return ret;
829*4882a593Smuzhiyun
830*4882a593Smuzhiyun ret = call_read_iter(file, iocb, iter);
831*4882a593Smuzhiyun out:
832*4882a593Smuzhiyun if (ret >= 0)
833*4882a593Smuzhiyun fsnotify_access(file);
834*4882a593Smuzhiyun return ret;
835*4882a593Smuzhiyun }
836*4882a593Smuzhiyun EXPORT_SYMBOL(vfs_iocb_iter_read);
837*4882a593Smuzhiyun
vfs_iter_read(struct file * file,struct iov_iter * iter,loff_t * ppos,rwf_t flags)838*4882a593Smuzhiyun ssize_t vfs_iter_read(struct file *file, struct iov_iter *iter, loff_t *ppos,
839*4882a593Smuzhiyun rwf_t flags)
840*4882a593Smuzhiyun {
841*4882a593Smuzhiyun if (!file->f_op->read_iter)
842*4882a593Smuzhiyun return -EINVAL;
843*4882a593Smuzhiyun return do_iter_read(file, iter, ppos, flags);
844*4882a593Smuzhiyun }
845*4882a593Smuzhiyun EXPORT_SYMBOL(vfs_iter_read);
846*4882a593Smuzhiyun
do_iter_write(struct file * file,struct iov_iter * iter,loff_t * pos,rwf_t flags)847*4882a593Smuzhiyun static ssize_t do_iter_write(struct file *file, struct iov_iter *iter,
848*4882a593Smuzhiyun loff_t *pos, rwf_t flags)
849*4882a593Smuzhiyun {
850*4882a593Smuzhiyun size_t tot_len;
851*4882a593Smuzhiyun ssize_t ret = 0;
852*4882a593Smuzhiyun
853*4882a593Smuzhiyun if (!(file->f_mode & FMODE_WRITE))
854*4882a593Smuzhiyun return -EBADF;
855*4882a593Smuzhiyun if (!(file->f_mode & FMODE_CAN_WRITE))
856*4882a593Smuzhiyun return -EINVAL;
857*4882a593Smuzhiyun
858*4882a593Smuzhiyun tot_len = iov_iter_count(iter);
859*4882a593Smuzhiyun if (!tot_len)
860*4882a593Smuzhiyun return 0;
861*4882a593Smuzhiyun ret = rw_verify_area(WRITE, file, pos, tot_len);
862*4882a593Smuzhiyun if (ret < 0)
863*4882a593Smuzhiyun return ret;
864*4882a593Smuzhiyun
865*4882a593Smuzhiyun if (file->f_op->write_iter)
866*4882a593Smuzhiyun ret = do_iter_readv_writev(file, iter, pos, WRITE, flags);
867*4882a593Smuzhiyun else
868*4882a593Smuzhiyun ret = do_loop_readv_writev(file, iter, pos, WRITE, flags);
869*4882a593Smuzhiyun if (ret > 0)
870*4882a593Smuzhiyun fsnotify_modify(file);
871*4882a593Smuzhiyun return ret;
872*4882a593Smuzhiyun }
873*4882a593Smuzhiyun
vfs_iocb_iter_write(struct file * file,struct kiocb * iocb,struct iov_iter * iter)874*4882a593Smuzhiyun ssize_t vfs_iocb_iter_write(struct file *file, struct kiocb *iocb,
875*4882a593Smuzhiyun struct iov_iter *iter)
876*4882a593Smuzhiyun {
877*4882a593Smuzhiyun size_t tot_len;
878*4882a593Smuzhiyun ssize_t ret = 0;
879*4882a593Smuzhiyun
880*4882a593Smuzhiyun if (!file->f_op->write_iter)
881*4882a593Smuzhiyun return -EINVAL;
882*4882a593Smuzhiyun if (!(file->f_mode & FMODE_WRITE))
883*4882a593Smuzhiyun return -EBADF;
884*4882a593Smuzhiyun if (!(file->f_mode & FMODE_CAN_WRITE))
885*4882a593Smuzhiyun return -EINVAL;
886*4882a593Smuzhiyun
887*4882a593Smuzhiyun tot_len = iov_iter_count(iter);
888*4882a593Smuzhiyun if (!tot_len)
889*4882a593Smuzhiyun return 0;
890*4882a593Smuzhiyun ret = rw_verify_area(WRITE, file, &iocb->ki_pos, tot_len);
891*4882a593Smuzhiyun if (ret < 0)
892*4882a593Smuzhiyun return ret;
893*4882a593Smuzhiyun
894*4882a593Smuzhiyun ret = call_write_iter(file, iocb, iter);
895*4882a593Smuzhiyun if (ret > 0)
896*4882a593Smuzhiyun fsnotify_modify(file);
897*4882a593Smuzhiyun
898*4882a593Smuzhiyun return ret;
899*4882a593Smuzhiyun }
900*4882a593Smuzhiyun EXPORT_SYMBOL(vfs_iocb_iter_write);
901*4882a593Smuzhiyun
vfs_iter_write(struct file * file,struct iov_iter * iter,loff_t * ppos,rwf_t flags)902*4882a593Smuzhiyun ssize_t vfs_iter_write(struct file *file, struct iov_iter *iter, loff_t *ppos,
903*4882a593Smuzhiyun rwf_t flags)
904*4882a593Smuzhiyun {
905*4882a593Smuzhiyun if (!file->f_op->write_iter)
906*4882a593Smuzhiyun return -EINVAL;
907*4882a593Smuzhiyun return do_iter_write(file, iter, ppos, flags);
908*4882a593Smuzhiyun }
909*4882a593Smuzhiyun EXPORT_SYMBOL(vfs_iter_write);
910*4882a593Smuzhiyun
vfs_readv(struct file * file,const struct iovec __user * vec,unsigned long vlen,loff_t * pos,rwf_t flags)911*4882a593Smuzhiyun static ssize_t vfs_readv(struct file *file, const struct iovec __user *vec,
912*4882a593Smuzhiyun unsigned long vlen, loff_t *pos, rwf_t flags)
913*4882a593Smuzhiyun {
914*4882a593Smuzhiyun struct iovec iovstack[UIO_FASTIOV];
915*4882a593Smuzhiyun struct iovec *iov = iovstack;
916*4882a593Smuzhiyun struct iov_iter iter;
917*4882a593Smuzhiyun ssize_t ret;
918*4882a593Smuzhiyun
919*4882a593Smuzhiyun ret = import_iovec(READ, vec, vlen, ARRAY_SIZE(iovstack), &iov, &iter);
920*4882a593Smuzhiyun if (ret >= 0) {
921*4882a593Smuzhiyun ret = do_iter_read(file, &iter, pos, flags);
922*4882a593Smuzhiyun kfree(iov);
923*4882a593Smuzhiyun }
924*4882a593Smuzhiyun
925*4882a593Smuzhiyun return ret;
926*4882a593Smuzhiyun }
927*4882a593Smuzhiyun
vfs_writev(struct file * file,const struct iovec __user * vec,unsigned long vlen,loff_t * pos,rwf_t flags)928*4882a593Smuzhiyun static ssize_t vfs_writev(struct file *file, const struct iovec __user *vec,
929*4882a593Smuzhiyun unsigned long vlen, loff_t *pos, rwf_t flags)
930*4882a593Smuzhiyun {
931*4882a593Smuzhiyun struct iovec iovstack[UIO_FASTIOV];
932*4882a593Smuzhiyun struct iovec *iov = iovstack;
933*4882a593Smuzhiyun struct iov_iter iter;
934*4882a593Smuzhiyun ssize_t ret;
935*4882a593Smuzhiyun
936*4882a593Smuzhiyun ret = import_iovec(WRITE, vec, vlen, ARRAY_SIZE(iovstack), &iov, &iter);
937*4882a593Smuzhiyun if (ret >= 0) {
938*4882a593Smuzhiyun file_start_write(file);
939*4882a593Smuzhiyun ret = do_iter_write(file, &iter, pos, flags);
940*4882a593Smuzhiyun file_end_write(file);
941*4882a593Smuzhiyun kfree(iov);
942*4882a593Smuzhiyun }
943*4882a593Smuzhiyun return ret;
944*4882a593Smuzhiyun }
945*4882a593Smuzhiyun
do_readv(unsigned long fd,const struct iovec __user * vec,unsigned long vlen,rwf_t flags)946*4882a593Smuzhiyun static ssize_t do_readv(unsigned long fd, const struct iovec __user *vec,
947*4882a593Smuzhiyun unsigned long vlen, rwf_t flags)
948*4882a593Smuzhiyun {
949*4882a593Smuzhiyun struct fd f = fdget_pos(fd);
950*4882a593Smuzhiyun ssize_t ret = -EBADF;
951*4882a593Smuzhiyun
952*4882a593Smuzhiyun if (f.file) {
953*4882a593Smuzhiyun loff_t pos, *ppos = file_ppos(f.file);
954*4882a593Smuzhiyun if (ppos) {
955*4882a593Smuzhiyun pos = *ppos;
956*4882a593Smuzhiyun ppos = &pos;
957*4882a593Smuzhiyun }
958*4882a593Smuzhiyun ret = vfs_readv(f.file, vec, vlen, ppos, flags);
959*4882a593Smuzhiyun if (ret >= 0 && ppos)
960*4882a593Smuzhiyun f.file->f_pos = pos;
961*4882a593Smuzhiyun fdput_pos(f);
962*4882a593Smuzhiyun }
963*4882a593Smuzhiyun
964*4882a593Smuzhiyun if (ret > 0)
965*4882a593Smuzhiyun add_rchar(current, ret);
966*4882a593Smuzhiyun inc_syscr(current);
967*4882a593Smuzhiyun return ret;
968*4882a593Smuzhiyun }
969*4882a593Smuzhiyun
do_writev(unsigned long fd,const struct iovec __user * vec,unsigned long vlen,rwf_t flags)970*4882a593Smuzhiyun static ssize_t do_writev(unsigned long fd, const struct iovec __user *vec,
971*4882a593Smuzhiyun unsigned long vlen, rwf_t flags)
972*4882a593Smuzhiyun {
973*4882a593Smuzhiyun struct fd f = fdget_pos(fd);
974*4882a593Smuzhiyun ssize_t ret = -EBADF;
975*4882a593Smuzhiyun
976*4882a593Smuzhiyun if (f.file) {
977*4882a593Smuzhiyun loff_t pos, *ppos = file_ppos(f.file);
978*4882a593Smuzhiyun if (ppos) {
979*4882a593Smuzhiyun pos = *ppos;
980*4882a593Smuzhiyun ppos = &pos;
981*4882a593Smuzhiyun }
982*4882a593Smuzhiyun ret = vfs_writev(f.file, vec, vlen, ppos, flags);
983*4882a593Smuzhiyun if (ret >= 0 && ppos)
984*4882a593Smuzhiyun f.file->f_pos = pos;
985*4882a593Smuzhiyun fdput_pos(f);
986*4882a593Smuzhiyun }
987*4882a593Smuzhiyun
988*4882a593Smuzhiyun if (ret > 0)
989*4882a593Smuzhiyun add_wchar(current, ret);
990*4882a593Smuzhiyun inc_syscw(current);
991*4882a593Smuzhiyun return ret;
992*4882a593Smuzhiyun }
993*4882a593Smuzhiyun
pos_from_hilo(unsigned long high,unsigned long low)994*4882a593Smuzhiyun static inline loff_t pos_from_hilo(unsigned long high, unsigned long low)
995*4882a593Smuzhiyun {
996*4882a593Smuzhiyun #define HALF_LONG_BITS (BITS_PER_LONG / 2)
997*4882a593Smuzhiyun return (((loff_t)high << HALF_LONG_BITS) << HALF_LONG_BITS) | low;
998*4882a593Smuzhiyun }
999*4882a593Smuzhiyun
do_preadv(unsigned long fd,const struct iovec __user * vec,unsigned long vlen,loff_t pos,rwf_t flags)1000*4882a593Smuzhiyun static ssize_t do_preadv(unsigned long fd, const struct iovec __user *vec,
1001*4882a593Smuzhiyun unsigned long vlen, loff_t pos, rwf_t flags)
1002*4882a593Smuzhiyun {
1003*4882a593Smuzhiyun struct fd f;
1004*4882a593Smuzhiyun ssize_t ret = -EBADF;
1005*4882a593Smuzhiyun
1006*4882a593Smuzhiyun if (pos < 0)
1007*4882a593Smuzhiyun return -EINVAL;
1008*4882a593Smuzhiyun
1009*4882a593Smuzhiyun f = fdget(fd);
1010*4882a593Smuzhiyun if (f.file) {
1011*4882a593Smuzhiyun ret = -ESPIPE;
1012*4882a593Smuzhiyun if (f.file->f_mode & FMODE_PREAD)
1013*4882a593Smuzhiyun ret = vfs_readv(f.file, vec, vlen, &pos, flags);
1014*4882a593Smuzhiyun fdput(f);
1015*4882a593Smuzhiyun }
1016*4882a593Smuzhiyun
1017*4882a593Smuzhiyun if (ret > 0)
1018*4882a593Smuzhiyun add_rchar(current, ret);
1019*4882a593Smuzhiyun inc_syscr(current);
1020*4882a593Smuzhiyun return ret;
1021*4882a593Smuzhiyun }
1022*4882a593Smuzhiyun
do_pwritev(unsigned long fd,const struct iovec __user * vec,unsigned long vlen,loff_t pos,rwf_t flags)1023*4882a593Smuzhiyun static ssize_t do_pwritev(unsigned long fd, const struct iovec __user *vec,
1024*4882a593Smuzhiyun unsigned long vlen, loff_t pos, rwf_t flags)
1025*4882a593Smuzhiyun {
1026*4882a593Smuzhiyun struct fd f;
1027*4882a593Smuzhiyun ssize_t ret = -EBADF;
1028*4882a593Smuzhiyun
1029*4882a593Smuzhiyun if (pos < 0)
1030*4882a593Smuzhiyun return -EINVAL;
1031*4882a593Smuzhiyun
1032*4882a593Smuzhiyun f = fdget(fd);
1033*4882a593Smuzhiyun if (f.file) {
1034*4882a593Smuzhiyun ret = -ESPIPE;
1035*4882a593Smuzhiyun if (f.file->f_mode & FMODE_PWRITE)
1036*4882a593Smuzhiyun ret = vfs_writev(f.file, vec, vlen, &pos, flags);
1037*4882a593Smuzhiyun fdput(f);
1038*4882a593Smuzhiyun }
1039*4882a593Smuzhiyun
1040*4882a593Smuzhiyun if (ret > 0)
1041*4882a593Smuzhiyun add_wchar(current, ret);
1042*4882a593Smuzhiyun inc_syscw(current);
1043*4882a593Smuzhiyun return ret;
1044*4882a593Smuzhiyun }
1045*4882a593Smuzhiyun
/* readv system call: do_readv() with no RWF_* flags. */
SYSCALL_DEFINE3(readv, unsigned long, fd, const struct iovec __user *, vec,
		unsigned long, vlen)
{
	return do_readv(fd, vec, vlen, 0);
}
1051*4882a593Smuzhiyun
/* writev system call: do_writev() with no RWF_* flags. */
SYSCALL_DEFINE3(writev, unsigned long, fd, const struct iovec __user *, vec,
		unsigned long, vlen)
{
	return do_writev(fd, vec, vlen, 0);
}
1057*4882a593Smuzhiyun
/*
 * preadv system call: builds the offset from @pos_h/@pos_l with
 * pos_from_hilo() and calls do_preadv() with no RWF_* flags.
 */
SYSCALL_DEFINE5(preadv, unsigned long, fd, const struct iovec __user *, vec,
		unsigned long, vlen, unsigned long, pos_l, unsigned long, pos_h)
{
	return do_preadv(fd, vec, vlen, pos_from_hilo(pos_h, pos_l), 0);
}
1065*4882a593Smuzhiyun
/*
 * preadv2 system call: like preadv but with caller-supplied RWF_* flags.
 * An offset of -1 selects do_readv(), i.e. the descriptor's current
 * position, instead of do_preadv().
 */
SYSCALL_DEFINE6(preadv2, unsigned long, fd, const struct iovec __user *, vec,
		unsigned long, vlen, unsigned long, pos_l, unsigned long, pos_h,
		rwf_t, flags)
{
	loff_t pos = pos_from_hilo(pos_h, pos_l);

	if (pos != -1)
		return do_preadv(fd, vec, vlen, pos, flags);

	return do_readv(fd, vec, vlen, flags);
}
1077*4882a593Smuzhiyun
/*
 * pwritev system call: builds the offset from @pos_h/@pos_l with
 * pos_from_hilo() and calls do_pwritev() with no RWF_* flags.
 */
SYSCALL_DEFINE5(pwritev, unsigned long, fd, const struct iovec __user *, vec,
		unsigned long, vlen, unsigned long, pos_l, unsigned long, pos_h)
{
	return do_pwritev(fd, vec, vlen, pos_from_hilo(pos_h, pos_l), 0);
}
1085*4882a593Smuzhiyun
/*
 * pwritev2 system call: like pwritev but with caller-supplied RWF_* flags.
 * An offset of -1 selects do_writev(), i.e. the descriptor's current
 * position, instead of do_pwritev().
 */
SYSCALL_DEFINE6(pwritev2, unsigned long, fd, const struct iovec __user *, vec,
		unsigned long, vlen, unsigned long, pos_l, unsigned long, pos_h,
		rwf_t, flags)
{
	loff_t pos = pos_from_hilo(pos_h, pos_l);

	if (pos != -1)
		return do_pwritev(fd, vec, vlen, pos, flags);

	return do_writev(fd, vec, vlen, flags);
}
1097*4882a593Smuzhiyun
/*
 * Various compat syscalls.  Note that they all pretend to take a native
 * iovec - import_iovec will properly treat those as compat_iovecs based on
 * in_compat_syscall().
 */
1103*4882a593Smuzhiyun #ifdef CONFIG_COMPAT
1104*4882a593Smuzhiyun #ifdef __ARCH_WANT_COMPAT_SYS_PREADV64
/* compat preadv64: the offset arrives as one loff_t; no RWF_* flags. */
COMPAT_SYSCALL_DEFINE4(preadv64, unsigned long, fd,
		const struct iovec __user *, vec,
		unsigned long, vlen, loff_t, pos)
{
	return do_preadv(fd, vec, vlen, pos, 0);
}
1111*4882a593Smuzhiyun #endif
1112*4882a593Smuzhiyun
/*
 * compat preadv: the offset arrives as two 32-bit halves that are joined
 * into one loff_t; no RWF_* flags.
 */
COMPAT_SYSCALL_DEFINE5(preadv, compat_ulong_t, fd,
		const struct iovec __user *, vec,
		compat_ulong_t, vlen, u32, pos_low, u32, pos_high)
{
	loff_t pos = (loff_t)pos_high;

	pos = (pos << 32) | pos_low;

	return do_preadv(fd, vec, vlen, pos, 0);
}
1121*4882a593Smuzhiyun
1122*4882a593Smuzhiyun #ifdef __ARCH_WANT_COMPAT_SYS_PREADV64V2
/*
 * compat preadv64v2: single loff_t offset plus RWF_* flags.  An offset of
 * -1 selects do_readv() instead of do_preadv().
 */
COMPAT_SYSCALL_DEFINE5(preadv64v2, unsigned long, fd,
		const struct iovec __user *, vec,
		unsigned long, vlen, loff_t, pos, rwf_t, flags)
{
	if (pos != -1)
		return do_preadv(fd, vec, vlen, pos, flags);

	return do_readv(fd, vec, vlen, flags);
}
1131*4882a593Smuzhiyun #endif
1132*4882a593Smuzhiyun
/*
 * compat preadv2: offset in two 32-bit halves plus RWF_* flags.  A joined
 * offset of -1 selects do_readv() instead of do_preadv().
 */
COMPAT_SYSCALL_DEFINE6(preadv2, compat_ulong_t, fd,
		const struct iovec __user *, vec,
		compat_ulong_t, vlen, u32, pos_low, u32, pos_high,
		rwf_t, flags)
{
	loff_t pos = (loff_t)pos_high;

	pos = (pos << 32) | pos_low;
	if (pos != -1)
		return do_preadv(fd, vec, vlen, pos, flags);

	return do_readv(fd, vec, vlen, flags);
}
1144*4882a593Smuzhiyun
1145*4882a593Smuzhiyun #ifdef __ARCH_WANT_COMPAT_SYS_PWRITEV64
/* compat pwritev64: the offset arrives as one loff_t; no RWF_* flags. */
COMPAT_SYSCALL_DEFINE4(pwritev64, unsigned long, fd,
		const struct iovec __user *, vec,
		unsigned long, vlen, loff_t, pos)
{
	return do_pwritev(fd, vec, vlen, pos, 0);
}
1152*4882a593Smuzhiyun #endif
1153*4882a593Smuzhiyun
/*
 * compat pwritev: the offset arrives as two 32-bit halves that are joined
 * into one loff_t; no RWF_* flags.
 */
COMPAT_SYSCALL_DEFINE5(pwritev, compat_ulong_t, fd,
		const struct iovec __user *, vec,
		compat_ulong_t, vlen, u32, pos_low, u32, pos_high)
{
	loff_t pos = (loff_t)pos_high;

	pos = (pos << 32) | pos_low;

	return do_pwritev(fd, vec, vlen, pos, 0);
}
1162*4882a593Smuzhiyun
1163*4882a593Smuzhiyun #ifdef __ARCH_WANT_COMPAT_SYS_PWRITEV64V2
/*
 * compat pwritev64v2: single loff_t offset plus RWF_* flags.  An offset of
 * -1 selects do_writev() instead of do_pwritev().
 */
COMPAT_SYSCALL_DEFINE5(pwritev64v2, unsigned long, fd,
		const struct iovec __user *, vec,
		unsigned long, vlen, loff_t, pos, rwf_t, flags)
{
	if (pos != -1)
		return do_pwritev(fd, vec, vlen, pos, flags);

	return do_writev(fd, vec, vlen, flags);
}
1172*4882a593Smuzhiyun #endif
1173*4882a593Smuzhiyun
/*
 * compat pwritev2: offset in two 32-bit halves plus RWF_* flags.  A joined
 * offset of -1 selects do_writev() instead of do_pwritev().
 */
COMPAT_SYSCALL_DEFINE6(pwritev2, compat_ulong_t, fd,
		const struct iovec __user *, vec,
		compat_ulong_t, vlen, u32, pos_low, u32, pos_high, rwf_t, flags)
{
	loff_t pos = (loff_t)pos_high;

	pos = (pos << 32) | pos_low;
	if (pos != -1)
		return do_pwritev(fd, vec, vlen, pos, flags);

	return do_writev(fd, vec, vlen, flags);
}
1184*4882a593Smuzhiyun #endif /* CONFIG_COMPAT */
1185*4882a593Smuzhiyun
do_sendfile(int out_fd,int in_fd,loff_t * ppos,size_t count,loff_t max)1186*4882a593Smuzhiyun static ssize_t do_sendfile(int out_fd, int in_fd, loff_t *ppos,
1187*4882a593Smuzhiyun size_t count, loff_t max)
1188*4882a593Smuzhiyun {
1189*4882a593Smuzhiyun struct fd in, out;
1190*4882a593Smuzhiyun struct inode *in_inode, *out_inode;
1191*4882a593Smuzhiyun loff_t pos;
1192*4882a593Smuzhiyun loff_t out_pos;
1193*4882a593Smuzhiyun ssize_t retval;
1194*4882a593Smuzhiyun int fl;
1195*4882a593Smuzhiyun
1196*4882a593Smuzhiyun /*
1197*4882a593Smuzhiyun * Get input file, and verify that it is ok..
1198*4882a593Smuzhiyun */
1199*4882a593Smuzhiyun retval = -EBADF;
1200*4882a593Smuzhiyun in = fdget(in_fd);
1201*4882a593Smuzhiyun if (!in.file)
1202*4882a593Smuzhiyun goto out;
1203*4882a593Smuzhiyun if (!(in.file->f_mode & FMODE_READ))
1204*4882a593Smuzhiyun goto fput_in;
1205*4882a593Smuzhiyun retval = -ESPIPE;
1206*4882a593Smuzhiyun if (!ppos) {
1207*4882a593Smuzhiyun pos = in.file->f_pos;
1208*4882a593Smuzhiyun } else {
1209*4882a593Smuzhiyun pos = *ppos;
1210*4882a593Smuzhiyun if (!(in.file->f_mode & FMODE_PREAD))
1211*4882a593Smuzhiyun goto fput_in;
1212*4882a593Smuzhiyun }
1213*4882a593Smuzhiyun retval = rw_verify_area(READ, in.file, &pos, count);
1214*4882a593Smuzhiyun if (retval < 0)
1215*4882a593Smuzhiyun goto fput_in;
1216*4882a593Smuzhiyun if (count > MAX_RW_COUNT)
1217*4882a593Smuzhiyun count = MAX_RW_COUNT;
1218*4882a593Smuzhiyun
1219*4882a593Smuzhiyun /*
1220*4882a593Smuzhiyun * Get output file, and verify that it is ok..
1221*4882a593Smuzhiyun */
1222*4882a593Smuzhiyun retval = -EBADF;
1223*4882a593Smuzhiyun out = fdget(out_fd);
1224*4882a593Smuzhiyun if (!out.file)
1225*4882a593Smuzhiyun goto fput_in;
1226*4882a593Smuzhiyun if (!(out.file->f_mode & FMODE_WRITE))
1227*4882a593Smuzhiyun goto fput_out;
1228*4882a593Smuzhiyun in_inode = file_inode(in.file);
1229*4882a593Smuzhiyun out_inode = file_inode(out.file);
1230*4882a593Smuzhiyun out_pos = out.file->f_pos;
1231*4882a593Smuzhiyun retval = rw_verify_area(WRITE, out.file, &out_pos, count);
1232*4882a593Smuzhiyun if (retval < 0)
1233*4882a593Smuzhiyun goto fput_out;
1234*4882a593Smuzhiyun
1235*4882a593Smuzhiyun if (!max)
1236*4882a593Smuzhiyun max = min(in_inode->i_sb->s_maxbytes, out_inode->i_sb->s_maxbytes);
1237*4882a593Smuzhiyun
1238*4882a593Smuzhiyun if (unlikely(pos + count > max)) {
1239*4882a593Smuzhiyun retval = -EOVERFLOW;
1240*4882a593Smuzhiyun if (pos >= max)
1241*4882a593Smuzhiyun goto fput_out;
1242*4882a593Smuzhiyun count = max - pos;
1243*4882a593Smuzhiyun }
1244*4882a593Smuzhiyun
1245*4882a593Smuzhiyun fl = 0;
1246*4882a593Smuzhiyun #if 0
1247*4882a593Smuzhiyun /*
1248*4882a593Smuzhiyun * We need to debate whether we can enable this or not. The
1249*4882a593Smuzhiyun * man page documents EAGAIN return for the output at least,
1250*4882a593Smuzhiyun * and the application is arguably buggy if it doesn't expect
1251*4882a593Smuzhiyun * EAGAIN on a non-blocking file descriptor.
1252*4882a593Smuzhiyun */
1253*4882a593Smuzhiyun if (in.file->f_flags & O_NONBLOCK)
1254*4882a593Smuzhiyun fl = SPLICE_F_NONBLOCK;
1255*4882a593Smuzhiyun #endif
1256*4882a593Smuzhiyun file_start_write(out.file);
1257*4882a593Smuzhiyun retval = do_splice_direct(in.file, &pos, out.file, &out_pos, count, fl);
1258*4882a593Smuzhiyun file_end_write(out.file);
1259*4882a593Smuzhiyun
1260*4882a593Smuzhiyun if (retval > 0) {
1261*4882a593Smuzhiyun add_rchar(current, retval);
1262*4882a593Smuzhiyun add_wchar(current, retval);
1263*4882a593Smuzhiyun fsnotify_access(in.file);
1264*4882a593Smuzhiyun fsnotify_modify(out.file);
1265*4882a593Smuzhiyun out.file->f_pos = out_pos;
1266*4882a593Smuzhiyun if (ppos)
1267*4882a593Smuzhiyun *ppos = pos;
1268*4882a593Smuzhiyun else
1269*4882a593Smuzhiyun in.file->f_pos = pos;
1270*4882a593Smuzhiyun }
1271*4882a593Smuzhiyun
1272*4882a593Smuzhiyun inc_syscr(current);
1273*4882a593Smuzhiyun inc_syscw(current);
1274*4882a593Smuzhiyun if (pos > max)
1275*4882a593Smuzhiyun retval = -EOVERFLOW;
1276*4882a593Smuzhiyun
1277*4882a593Smuzhiyun fput_out:
1278*4882a593Smuzhiyun fdput(out);
1279*4882a593Smuzhiyun fput_in:
1280*4882a593Smuzhiyun fdput(in);
1281*4882a593Smuzhiyun out:
1282*4882a593Smuzhiyun return retval;
1283*4882a593Smuzhiyun }
1284*4882a593Smuzhiyun
/*
 * sendfile system call with an off_t offset.
 *
 * With a NULL @offset the input file's own position is used and no limit
 * is passed.  Otherwise the offset is fetched from user space, the copy is
 * bounded by MAX_NON_LFS, and the resulting position is written back to
 * @offset whatever do_sendfile() returned.  Either user access failing
 * yields -EFAULT.
 */
SYSCALL_DEFINE4(sendfile, int, out_fd, int, in_fd, off_t __user *, offset, size_t, count)
{
	loff_t pos;
	off_t off;
	ssize_t ret;

	if (!offset)
		return do_sendfile(out_fd, in_fd, NULL, count, 0);

	if (unlikely(get_user(off, offset)))
		return -EFAULT;
	pos = off;
	ret = do_sendfile(out_fd, in_fd, &pos, count, MAX_NON_LFS);
	if (unlikely(put_user(pos, offset)))
		return -EFAULT;

	return ret;
}
1303*4882a593Smuzhiyun
/*
 * sendfile64 system call with a loff_t offset.
 *
 * With a NULL @offset the input file's own position is used.  Otherwise
 * the offset is copied in from user space and the resulting position is
 * written back to @offset whatever do_sendfile() returned.  Either user
 * access failing yields -EFAULT.  No explicit size limit is passed.
 */
SYSCALL_DEFINE4(sendfile64, int, out_fd, int, in_fd, loff_t __user *, offset, size_t, count)
{
	loff_t pos;
	ssize_t ret;

	if (!offset)
		return do_sendfile(out_fd, in_fd, NULL, count, 0);

	if (unlikely(copy_from_user(&pos, offset, sizeof(loff_t))))
		return -EFAULT;
	ret = do_sendfile(out_fd, in_fd, &pos, count, 0);
	if (unlikely(put_user(pos, offset)))
		return -EFAULT;

	return ret;
}
1320*4882a593Smuzhiyun
1321*4882a593Smuzhiyun #ifdef CONFIG_COMPAT
/*
 * Compat sendfile() entry point: @offset points to a compat_off_t and @count
 * is a compat_size_t.
 *
 * When @offset is NULL, do_sendfile() is called with no position pointer and
 * 0 as its final argument.  Otherwise the starting offset is fetched from
 * user space, do_sendfile() is called with MAX_NON_LFS as its final argument,
 * and the resulting position is stored back through @offset.
 */
COMPAT_SYSCALL_DEFINE4(sendfile, int, out_fd, int, in_fd,
		compat_off_t __user *, offset, compat_size_t, count)
{
	loff_t pos;
	off_t start;
	ssize_t copied;

	if (!offset)
		return do_sendfile(out_fd, in_fd, NULL, count, 0);

	if (unlikely(get_user(start, offset)))
		return -EFAULT;

	pos = start;
	copied = do_sendfile(out_fd, in_fd, &pos, count, MAX_NON_LFS);

	/* The position is written back whatever do_sendfile() returned. */
	if (unlikely(put_user(pos, offset)))
		return -EFAULT;

	return copied;
}
1341*4882a593Smuzhiyun
/*
 * Compat sendfile64() entry point: @offset points to a compat_loff_t and
 * @count is a compat_size_t.
 *
 * The offset is copied in as sizeof(loff_t) bytes and do_sendfile() always
 * receives 0 as its final argument.  The resulting position is stored back
 * through @offset.
 */
COMPAT_SYSCALL_DEFINE4(sendfile64, int, out_fd, int, in_fd,
		compat_loff_t __user *, offset, compat_size_t, count)
{
	loff_t pos;
	ssize_t copied;

	if (!offset)
		return do_sendfile(out_fd, in_fd, NULL, count, 0);

	if (unlikely(copy_from_user(&pos, offset, sizeof(loff_t))))
		return -EFAULT;

	copied = do_sendfile(out_fd, in_fd, &pos, count, 0);

	/* The position is written back whatever do_sendfile() returned. */
	if (unlikely(put_user(pos, offset)))
		return -EFAULT;

	return copied;
}
1359*4882a593Smuzhiyun #endif
1360*4882a593Smuzhiyun
1361*4882a593Smuzhiyun /**
1362*4882a593Smuzhiyun * generic_copy_file_range - copy data between two files
1363*4882a593Smuzhiyun * @file_in: file structure to read from
1364*4882a593Smuzhiyun * @pos_in: file offset to read from
1365*4882a593Smuzhiyun * @file_out: file structure to write data to
1366*4882a593Smuzhiyun * @pos_out: file offset to write data to
1367*4882a593Smuzhiyun * @len: amount of data to copy
1368*4882a593Smuzhiyun * @flags: copy flags
1369*4882a593Smuzhiyun *
1370*4882a593Smuzhiyun * This is a generic filesystem helper to copy data from one file to another.
1371*4882a593Smuzhiyun * It has no constraints on the source or destination file owners - the files
1372*4882a593Smuzhiyun * can belong to different superblocks and different filesystem types. Short
1373*4882a593Smuzhiyun * copies are allowed.
1374*4882a593Smuzhiyun *
1375*4882a593Smuzhiyun * This should be called from the @file_out filesystem, as per the
1376*4882a593Smuzhiyun * ->copy_file_range() method.
1377*4882a593Smuzhiyun *
1378*4882a593Smuzhiyun * Returns the number of bytes copied or a negative error indicating the
1379*4882a593Smuzhiyun * failure.
1380*4882a593Smuzhiyun */
1381*4882a593Smuzhiyun
generic_copy_file_range(struct file * file_in,loff_t pos_in,struct file * file_out,loff_t pos_out,size_t len,unsigned int flags)1382*4882a593Smuzhiyun ssize_t generic_copy_file_range(struct file *file_in, loff_t pos_in,
1383*4882a593Smuzhiyun struct file *file_out, loff_t pos_out,
1384*4882a593Smuzhiyun size_t len, unsigned int flags)
1385*4882a593Smuzhiyun {
1386*4882a593Smuzhiyun return do_splice_direct(file_in, &pos_in, file_out, &pos_out,
1387*4882a593Smuzhiyun len > MAX_RW_COUNT ? MAX_RW_COUNT : len, 0);
1388*4882a593Smuzhiyun }
1389*4882a593Smuzhiyun EXPORT_SYMBOL(generic_copy_file_range);
1390*4882a593Smuzhiyun
1391*4882a593Smuzhiyun /*
1392*4882a593Smuzhiyun * Performs necessary checks before doing a file copy
1393*4882a593Smuzhiyun *
1394*4882a593Smuzhiyun * Can adjust amount of bytes to copy via @req_count argument.
1395*4882a593Smuzhiyun * Returns appropriate error code that caller should return or
1396*4882a593Smuzhiyun * zero in case the copy should be allowed.
1397*4882a593Smuzhiyun */
generic_copy_file_checks(struct file * file_in,loff_t pos_in,struct file * file_out,loff_t pos_out,size_t * req_count,unsigned int flags)1398*4882a593Smuzhiyun static int generic_copy_file_checks(struct file *file_in, loff_t pos_in,
1399*4882a593Smuzhiyun struct file *file_out, loff_t pos_out,
1400*4882a593Smuzhiyun size_t *req_count, unsigned int flags)
1401*4882a593Smuzhiyun {
1402*4882a593Smuzhiyun struct inode *inode_in = file_inode(file_in);
1403*4882a593Smuzhiyun struct inode *inode_out = file_inode(file_out);
1404*4882a593Smuzhiyun uint64_t count = *req_count;
1405*4882a593Smuzhiyun loff_t size_in;
1406*4882a593Smuzhiyun int ret;
1407*4882a593Smuzhiyun
1408*4882a593Smuzhiyun ret = generic_file_rw_checks(file_in, file_out);
1409*4882a593Smuzhiyun if (ret)
1410*4882a593Smuzhiyun return ret;
1411*4882a593Smuzhiyun
1412*4882a593Smuzhiyun /*
1413*4882a593Smuzhiyun * We allow some filesystems to handle cross sb copy, but passing
1414*4882a593Smuzhiyun * a file of the wrong filesystem type to filesystem driver can result
1415*4882a593Smuzhiyun * in an attempt to dereference the wrong type of ->private_data, so
1416*4882a593Smuzhiyun * avoid doing that until we really have a good reason.
1417*4882a593Smuzhiyun *
1418*4882a593Smuzhiyun * nfs and cifs define several different file_system_type structures
1419*4882a593Smuzhiyun * and several different sets of file_operations, but they all end up
1420*4882a593Smuzhiyun * using the same ->copy_file_range() function pointer.
1421*4882a593Smuzhiyun */
1422*4882a593Smuzhiyun if (flags & COPY_FILE_SPLICE) {
1423*4882a593Smuzhiyun /* cross sb splice is allowed */
1424*4882a593Smuzhiyun } else if (file_out->f_op->copy_file_range) {
1425*4882a593Smuzhiyun if (file_in->f_op->copy_file_range !=
1426*4882a593Smuzhiyun file_out->f_op->copy_file_range)
1427*4882a593Smuzhiyun return -EXDEV;
1428*4882a593Smuzhiyun } else if (file_inode(file_in)->i_sb != file_inode(file_out)->i_sb) {
1429*4882a593Smuzhiyun return -EXDEV;
1430*4882a593Smuzhiyun }
1431*4882a593Smuzhiyun
1432*4882a593Smuzhiyun /* Don't touch certain kinds of inodes */
1433*4882a593Smuzhiyun if (IS_IMMUTABLE(inode_out))
1434*4882a593Smuzhiyun return -EPERM;
1435*4882a593Smuzhiyun
1436*4882a593Smuzhiyun if (IS_SWAPFILE(inode_in) || IS_SWAPFILE(inode_out))
1437*4882a593Smuzhiyun return -ETXTBSY;
1438*4882a593Smuzhiyun
1439*4882a593Smuzhiyun /* Ensure offsets don't wrap. */
1440*4882a593Smuzhiyun if (pos_in + count < pos_in || pos_out + count < pos_out)
1441*4882a593Smuzhiyun return -EOVERFLOW;
1442*4882a593Smuzhiyun
1443*4882a593Smuzhiyun /* Shorten the copy to EOF */
1444*4882a593Smuzhiyun size_in = i_size_read(inode_in);
1445*4882a593Smuzhiyun if (pos_in >= size_in)
1446*4882a593Smuzhiyun count = 0;
1447*4882a593Smuzhiyun else
1448*4882a593Smuzhiyun count = min(count, size_in - (uint64_t)pos_in);
1449*4882a593Smuzhiyun
1450*4882a593Smuzhiyun ret = generic_write_check_limits(file_out, pos_out, &count);
1451*4882a593Smuzhiyun if (ret)
1452*4882a593Smuzhiyun return ret;
1453*4882a593Smuzhiyun
1454*4882a593Smuzhiyun /* Don't allow overlapped copying within the same file. */
1455*4882a593Smuzhiyun if (inode_in == inode_out &&
1456*4882a593Smuzhiyun pos_out + count > pos_in &&
1457*4882a593Smuzhiyun pos_out < pos_in + count)
1458*4882a593Smuzhiyun return -EINVAL;
1459*4882a593Smuzhiyun
1460*4882a593Smuzhiyun *req_count = count;
1461*4882a593Smuzhiyun return 0;
1462*4882a593Smuzhiyun }
1463*4882a593Smuzhiyun
1464*4882a593Smuzhiyun /*
1465*4882a593Smuzhiyun * copy_file_range() differs from regular file read and write in that it
1466*4882a593Smuzhiyun * specifically allows return partial success. When it does so is up to
1467*4882a593Smuzhiyun * the copy_file_range method.
1468*4882a593Smuzhiyun */
vfs_copy_file_range(struct file * file_in,loff_t pos_in,struct file * file_out,loff_t pos_out,size_t len,unsigned int flags)1469*4882a593Smuzhiyun ssize_t vfs_copy_file_range(struct file *file_in, loff_t pos_in,
1470*4882a593Smuzhiyun struct file *file_out, loff_t pos_out,
1471*4882a593Smuzhiyun size_t len, unsigned int flags)
1472*4882a593Smuzhiyun {
1473*4882a593Smuzhiyun ssize_t ret;
1474*4882a593Smuzhiyun bool splice = flags & COPY_FILE_SPLICE;
1475*4882a593Smuzhiyun
1476*4882a593Smuzhiyun if (flags & ~COPY_FILE_SPLICE)
1477*4882a593Smuzhiyun return -EINVAL;
1478*4882a593Smuzhiyun
1479*4882a593Smuzhiyun ret = generic_copy_file_checks(file_in, pos_in, file_out, pos_out, &len,
1480*4882a593Smuzhiyun flags);
1481*4882a593Smuzhiyun if (unlikely(ret))
1482*4882a593Smuzhiyun return ret;
1483*4882a593Smuzhiyun
1484*4882a593Smuzhiyun ret = rw_verify_area(READ, file_in, &pos_in, len);
1485*4882a593Smuzhiyun if (unlikely(ret))
1486*4882a593Smuzhiyun return ret;
1487*4882a593Smuzhiyun
1488*4882a593Smuzhiyun ret = rw_verify_area(WRITE, file_out, &pos_out, len);
1489*4882a593Smuzhiyun if (unlikely(ret))
1490*4882a593Smuzhiyun return ret;
1491*4882a593Smuzhiyun
1492*4882a593Smuzhiyun if (len == 0)
1493*4882a593Smuzhiyun return 0;
1494*4882a593Smuzhiyun
1495*4882a593Smuzhiyun file_start_write(file_out);
1496*4882a593Smuzhiyun
1497*4882a593Smuzhiyun /*
1498*4882a593Smuzhiyun * Cloning is supported by more file systems, so we implement copy on
1499*4882a593Smuzhiyun * same sb using clone, but for filesystems where both clone and copy
1500*4882a593Smuzhiyun * are supported (e.g. nfs,cifs), we only call the copy method.
1501*4882a593Smuzhiyun */
1502*4882a593Smuzhiyun if (!splice && file_out->f_op->copy_file_range) {
1503*4882a593Smuzhiyun ret = file_out->f_op->copy_file_range(file_in, pos_in,
1504*4882a593Smuzhiyun file_out, pos_out,
1505*4882a593Smuzhiyun len, flags);
1506*4882a593Smuzhiyun goto done;
1507*4882a593Smuzhiyun }
1508*4882a593Smuzhiyun
1509*4882a593Smuzhiyun if (!splice && file_in->f_op->remap_file_range &&
1510*4882a593Smuzhiyun file_inode(file_in)->i_sb == file_inode(file_out)->i_sb) {
1511*4882a593Smuzhiyun ret = file_in->f_op->remap_file_range(file_in, pos_in,
1512*4882a593Smuzhiyun file_out, pos_out,
1513*4882a593Smuzhiyun min_t(loff_t, MAX_RW_COUNT, len),
1514*4882a593Smuzhiyun REMAP_FILE_CAN_SHORTEN);
1515*4882a593Smuzhiyun if (ret > 0)
1516*4882a593Smuzhiyun goto done;
1517*4882a593Smuzhiyun }
1518*4882a593Smuzhiyun
1519*4882a593Smuzhiyun /*
1520*4882a593Smuzhiyun * We can get here for same sb copy of filesystems that do not implement
1521*4882a593Smuzhiyun * ->copy_file_range() in case filesystem does not support clone or in
1522*4882a593Smuzhiyun * case filesystem supports clone but rejected the clone request (e.g.
1523*4882a593Smuzhiyun * because it was not block aligned).
1524*4882a593Smuzhiyun *
1525*4882a593Smuzhiyun * In both cases, fall back to kernel copy so we are able to maintain a
1526*4882a593Smuzhiyun * consistent story about which filesystems support copy_file_range()
1527*4882a593Smuzhiyun * and which filesystems do not, that will allow userspace tools to
1528*4882a593Smuzhiyun * make consistent desicions w.r.t using copy_file_range().
1529*4882a593Smuzhiyun *
1530*4882a593Smuzhiyun * We also get here if caller (e.g. nfsd) requested COPY_FILE_SPLICE.
1531*4882a593Smuzhiyun */
1532*4882a593Smuzhiyun ret = generic_copy_file_range(file_in, pos_in, file_out, pos_out, len,
1533*4882a593Smuzhiyun flags);
1534*4882a593Smuzhiyun
1535*4882a593Smuzhiyun done:
1536*4882a593Smuzhiyun if (ret > 0) {
1537*4882a593Smuzhiyun fsnotify_access(file_in);
1538*4882a593Smuzhiyun add_rchar(current, ret);
1539*4882a593Smuzhiyun fsnotify_modify(file_out);
1540*4882a593Smuzhiyun add_wchar(current, ret);
1541*4882a593Smuzhiyun }
1542*4882a593Smuzhiyun
1543*4882a593Smuzhiyun inc_syscr(current);
1544*4882a593Smuzhiyun inc_syscw(current);
1545*4882a593Smuzhiyun
1546*4882a593Smuzhiyun file_end_write(file_out);
1547*4882a593Smuzhiyun
1548*4882a593Smuzhiyun return ret;
1549*4882a593Smuzhiyun }
1550*4882a593Smuzhiyun EXPORT_SYMBOL(vfs_copy_file_range);
1551*4882a593Smuzhiyun
/*
 * copy_file_range() system call.
 *
 * Each of @off_in and @off_out may be NULL, in which case the f_pos of the
 * corresponding file is used as the starting position and advanced after a
 * successful copy.  When an offset pointer is given, the position is read
 * from it and the updated position is written back to it instead.
 *
 * Returns the result of vfs_copy_file_range(), -EBADF for an invalid
 * descriptor, -EFAULT when an offset cannot be copied from or to user space,
 * or -EINVAL when @flags is non-zero.
 */
SYSCALL_DEFINE6(copy_file_range, int, fd_in, loff_t __user *, off_in,
		int, fd_out, loff_t __user *, off_out,
		size_t, len, unsigned int, flags)
{
	struct fd src;
	struct fd dst;
	loff_t pos_in;
	loff_t pos_out;
	ssize_t ret = -EBADF;

	src = fdget(fd_in);
	if (!src.file)
		goto exit;

	dst = fdget(fd_out);
	if (!dst.file)
		goto put_src;

	/* Work out both starting positions. */
	ret = -EFAULT;
	if (!off_in)
		pos_in = src.file->f_pos;
	else if (copy_from_user(&pos_in, off_in, sizeof(loff_t)))
		goto put_dst;

	if (!off_out)
		pos_out = dst.file->f_pos;
	else if (copy_from_user(&pos_out, off_out, sizeof(loff_t)))
		goto put_dst;

	/* User space may not pass any flag. */
	ret = -EINVAL;
	if (flags != 0)
		goto put_dst;

	ret = vfs_copy_file_range(src.file, pos_in, dst.file, pos_out, len,
				  flags);
	if (ret <= 0)
		goto put_dst;

	/* Data was copied: advance both positions and publish them. */
	pos_in += ret;
	pos_out += ret;

	if (!off_in)
		src.file->f_pos = pos_in;
	else if (copy_to_user(off_in, &pos_in, sizeof(loff_t)))
		ret = -EFAULT;

	if (!off_out)
		dst.file->f_pos = pos_out;
	else if (copy_to_user(off_out, &pos_out, sizeof(loff_t)))
		ret = -EFAULT;

put_dst:
	fdput(dst);
put_src:
	fdput(src);
exit:
	return ret;
}
1617*4882a593Smuzhiyun
1618*4882a593Smuzhiyun /*
1619*4882a593Smuzhiyun * Don't operate on ranges the page cache doesn't support, and don't exceed the
1620*4882a593Smuzhiyun * LFS limits. If pos is under the limit it becomes a short access. If it
1621*4882a593Smuzhiyun * exceeds the limit we return -EFBIG.
1622*4882a593Smuzhiyun */
generic_write_check_limits(struct file * file,loff_t pos,loff_t * count)1623*4882a593Smuzhiyun int generic_write_check_limits(struct file *file, loff_t pos, loff_t *count)
1624*4882a593Smuzhiyun {
1625*4882a593Smuzhiyun struct inode *inode = file->f_mapping->host;
1626*4882a593Smuzhiyun loff_t max_size = inode->i_sb->s_maxbytes;
1627*4882a593Smuzhiyun loff_t limit = rlimit(RLIMIT_FSIZE);
1628*4882a593Smuzhiyun
1629*4882a593Smuzhiyun if (limit != RLIM_INFINITY) {
1630*4882a593Smuzhiyun if (pos >= limit) {
1631*4882a593Smuzhiyun send_sig(SIGXFSZ, current, 0);
1632*4882a593Smuzhiyun return -EFBIG;
1633*4882a593Smuzhiyun }
1634*4882a593Smuzhiyun *count = min(*count, limit - pos);
1635*4882a593Smuzhiyun }
1636*4882a593Smuzhiyun
1637*4882a593Smuzhiyun if (!(file->f_flags & O_LARGEFILE))
1638*4882a593Smuzhiyun max_size = MAX_NON_LFS;
1639*4882a593Smuzhiyun
1640*4882a593Smuzhiyun if (unlikely(pos >= max_size))
1641*4882a593Smuzhiyun return -EFBIG;
1642*4882a593Smuzhiyun
1643*4882a593Smuzhiyun *count = min(*count, max_size - pos);
1644*4882a593Smuzhiyun
1645*4882a593Smuzhiyun return 0;
1646*4882a593Smuzhiyun }
1647*4882a593Smuzhiyun
1648*4882a593Smuzhiyun /*
1649*4882a593Smuzhiyun * Performs necessary checks before doing a write
1650*4882a593Smuzhiyun *
1651*4882a593Smuzhiyun * Can adjust writing position or amount of bytes to write.
1652*4882a593Smuzhiyun * Returns appropriate error code that caller should return or
1653*4882a593Smuzhiyun * zero in case that write should be allowed.
1654*4882a593Smuzhiyun */
generic_write_checks(struct kiocb * iocb,struct iov_iter * from)1655*4882a593Smuzhiyun ssize_t generic_write_checks(struct kiocb *iocb, struct iov_iter *from)
1656*4882a593Smuzhiyun {
1657*4882a593Smuzhiyun struct file *file = iocb->ki_filp;
1658*4882a593Smuzhiyun struct inode *inode = file->f_mapping->host;
1659*4882a593Smuzhiyun loff_t count;
1660*4882a593Smuzhiyun int ret;
1661*4882a593Smuzhiyun
1662*4882a593Smuzhiyun if (IS_SWAPFILE(inode))
1663*4882a593Smuzhiyun return -ETXTBSY;
1664*4882a593Smuzhiyun
1665*4882a593Smuzhiyun if (!iov_iter_count(from))
1666*4882a593Smuzhiyun return 0;
1667*4882a593Smuzhiyun
1668*4882a593Smuzhiyun /* FIXME: this is for backwards compatibility with 2.4 */
1669*4882a593Smuzhiyun if (iocb->ki_flags & IOCB_APPEND)
1670*4882a593Smuzhiyun iocb->ki_pos = i_size_read(inode);
1671*4882a593Smuzhiyun
1672*4882a593Smuzhiyun if ((iocb->ki_flags & IOCB_NOWAIT) && !(iocb->ki_flags & IOCB_DIRECT))
1673*4882a593Smuzhiyun return -EINVAL;
1674*4882a593Smuzhiyun
1675*4882a593Smuzhiyun count = iov_iter_count(from);
1676*4882a593Smuzhiyun ret = generic_write_check_limits(file, iocb->ki_pos, &count);
1677*4882a593Smuzhiyun if (ret)
1678*4882a593Smuzhiyun return ret;
1679*4882a593Smuzhiyun
1680*4882a593Smuzhiyun iov_iter_truncate(from, count);
1681*4882a593Smuzhiyun return iov_iter_count(from);
1682*4882a593Smuzhiyun }
1683*4882a593Smuzhiyun EXPORT_SYMBOL(generic_write_checks);
1684*4882a593Smuzhiyun
1685*4882a593Smuzhiyun /*
1686*4882a593Smuzhiyun * Performs common checks before doing a file copy/clone
1687*4882a593Smuzhiyun * from @file_in to @file_out.
1688*4882a593Smuzhiyun */
generic_file_rw_checks(struct file * file_in,struct file * file_out)1689*4882a593Smuzhiyun int generic_file_rw_checks(struct file *file_in, struct file *file_out)
1690*4882a593Smuzhiyun {
1691*4882a593Smuzhiyun struct inode *inode_in = file_inode(file_in);
1692*4882a593Smuzhiyun struct inode *inode_out = file_inode(file_out);
1693*4882a593Smuzhiyun
1694*4882a593Smuzhiyun /* Don't copy dirs, pipes, sockets... */
1695*4882a593Smuzhiyun if (S_ISDIR(inode_in->i_mode) || S_ISDIR(inode_out->i_mode))
1696*4882a593Smuzhiyun return -EISDIR;
1697*4882a593Smuzhiyun if (!S_ISREG(inode_in->i_mode) || !S_ISREG(inode_out->i_mode))
1698*4882a593Smuzhiyun return -EINVAL;
1699*4882a593Smuzhiyun
1700*4882a593Smuzhiyun if (!(file_in->f_mode & FMODE_READ) ||
1701*4882a593Smuzhiyun !(file_out->f_mode & FMODE_WRITE) ||
1702*4882a593Smuzhiyun (file_out->f_flags & O_APPEND))
1703*4882a593Smuzhiyun return -EBADF;
1704*4882a593Smuzhiyun
1705*4882a593Smuzhiyun return 0;
1706*4882a593Smuzhiyun }
1707