1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * This file contians vfs file ops for 9P2000.
4 *
5 * Copyright (C) 2004 by Eric Van Hensbergen <ericvh@gmail.com>
6 * Copyright (C) 2002 by Ron Minnich <rminnich@lanl.gov>
7 */
8
9#include <linux/module.h>
10#include <linux/errno.h>
11#include <linux/fs.h>
12#include <linux/filelock.h>
13#include <linux/sched.h>
14#include <linux/file.h>
15#include <linux/stat.h>
16#include <linux/string.h>
17#include <linux/list.h>
18#include <linux/pagemap.h>
19#include <linux/utsname.h>
20#include <linux/uaccess.h>
21#include <linux/uio.h>
22#include <linux/slab.h>
23#include <net/9p/9p.h>
24#include <net/9p/client.h>
25
26#include "v9fs.h"
27#include "v9fs_vfs.h"
28#include "fid.h"
29#include "cache.h"
30
31static const struct vm_operations_struct v9fs_mmap_file_vm_ops;
32
33/**
34 * v9fs_file_open - open a file (or directory)
35 * @inode: inode to be opened
36 * @file: file being opened
37 *
38 */
39
40int v9fs_file_open(struct inode *inode, struct file *file)
41{
42 int err;
43 struct v9fs_session_info *v9ses;
44 struct p9_fid *fid;
45 int omode;
46
47 p9_debug(P9_DEBUG_VFS, "inode: %p file: %p\n", inode, file);
48 v9ses = v9fs_inode2v9ses(inode);
49 if (v9fs_proto_dotl(v9ses))
50 omode = v9fs_open_to_dotl_flags(flags: file->f_flags);
51 else
52 omode = v9fs_uflags2omode(uflags: file->f_flags,
53 extended: v9fs_proto_dotu(v9ses));
54 fid = file->private_data;
55 if (!fid) {
56 fid = v9fs_fid_clone(dentry: file_dentry(file));
57 if (IS_ERR(ptr: fid))
58 return PTR_ERR(ptr: fid);
59
60 if ((v9ses->cache & CACHE_WRITEBACK) && (omode & P9_OWRITE)) {
61 int writeback_omode = (omode & ~P9_OWRITE) | P9_ORDWR;
62
63 p9_debug(P9_DEBUG_CACHE, "write-only file with writeback enabled, try opening O_RDWR\n");
64 err = p9_client_open(fid, mode: writeback_omode);
65 if (err < 0) {
66 p9_debug(P9_DEBUG_CACHE, "could not open O_RDWR, disabling caches\n");
67 err = p9_client_open(fid, mode: omode);
68 fid->mode |= P9L_DIRECT;
69 }
70 } else {
71 err = p9_client_open(fid, mode: omode);
72 }
73 if (err < 0) {
74 p9_fid_put(fid);
75 return err;
76 }
77 if ((file->f_flags & O_APPEND) &&
78 (!v9fs_proto_dotu(v9ses) && !v9fs_proto_dotl(v9ses)))
79 generic_file_llseek(file, offset: 0, SEEK_END);
80
81 file->private_data = fid;
82 }
83
84#ifdef CONFIG_9P_FSCACHE
85 if (v9ses->cache & CACHE_FSCACHE)
86 fscache_use_cookie(cookie: v9fs_inode_cookie(v9inode: V9FS_I(inode)),
87 will_modify: file->f_mode & FMODE_WRITE);
88#endif
89 v9fs_fid_add_modes(fid, s_flags: v9ses->flags, s_cache: v9ses->cache, f_flags: file->f_flags);
90 v9fs_open_fid_add(inode, fid: &fid);
91 return 0;
92}
93
94/**
95 * v9fs_file_lock - lock a file (or directory)
96 * @filp: file to be locked
97 * @cmd: lock command
98 * @fl: file lock structure
99 *
100 * Bugs: this looks like a local only lock, we should extend into 9P
101 * by using open exclusive
102 */
103
104static int v9fs_file_lock(struct file *filp, int cmd, struct file_lock *fl)
105{
106 struct inode *inode = file_inode(f: filp);
107
108 p9_debug(P9_DEBUG_VFS, "filp: %p lock: %p\n", filp, fl);
109
110 if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) {
111 filemap_write_and_wait(mapping: inode->i_mapping);
112 invalidate_mapping_pages(mapping: &inode->i_data, start: 0, end: -1);
113 }
114
115 return 0;
116}
117
118static int v9fs_file_do_lock(struct file *filp, int cmd, struct file_lock *fl)
119{
120 struct p9_flock flock;
121 struct p9_fid *fid;
122 uint8_t status = P9_LOCK_ERROR;
123 int res = 0;
124 unsigned char fl_type;
125 struct v9fs_session_info *v9ses;
126
127 fid = filp->private_data;
128 BUG_ON(fid == NULL);
129
130 BUG_ON((fl->fl_flags & FL_POSIX) != FL_POSIX);
131
132 res = locks_lock_file_wait(filp, fl);
133 if (res < 0)
134 goto out;
135
136 /* convert posix lock to p9 tlock args */
137 memset(&flock, 0, sizeof(flock));
138 /* map the lock type */
139 switch (fl->fl_type) {
140 case F_RDLCK:
141 flock.type = P9_LOCK_TYPE_RDLCK;
142 break;
143 case F_WRLCK:
144 flock.type = P9_LOCK_TYPE_WRLCK;
145 break;
146 case F_UNLCK:
147 flock.type = P9_LOCK_TYPE_UNLCK;
148 break;
149 }
150 flock.start = fl->fl_start;
151 if (fl->fl_end == OFFSET_MAX)
152 flock.length = 0;
153 else
154 flock.length = fl->fl_end - fl->fl_start + 1;
155 flock.proc_id = fl->fl_pid;
156 flock.client_id = fid->clnt->name;
157 if (IS_SETLKW(cmd))
158 flock.flags = P9_LOCK_FLAGS_BLOCK;
159
160 v9ses = v9fs_inode2v9ses(inode: file_inode(f: filp));
161
162 /*
163 * if its a blocked request and we get P9_LOCK_BLOCKED as the status
164 * for lock request, keep on trying
165 */
166 for (;;) {
167 res = p9_client_lock_dotl(fid, flock: &flock, status: &status);
168 if (res < 0)
169 goto out_unlock;
170
171 if (status != P9_LOCK_BLOCKED)
172 break;
173 if (status == P9_LOCK_BLOCKED && !IS_SETLKW(cmd))
174 break;
175 if (schedule_timeout_interruptible(timeout: v9ses->session_lock_timeout)
176 != 0)
177 break;
178 /*
179 * p9_client_lock_dotl overwrites flock.client_id with the
180 * server message, free and reuse the client name
181 */
182 if (flock.client_id != fid->clnt->name) {
183 kfree(objp: flock.client_id);
184 flock.client_id = fid->clnt->name;
185 }
186 }
187
188 /* map 9p status to VFS status */
189 switch (status) {
190 case P9_LOCK_SUCCESS:
191 res = 0;
192 break;
193 case P9_LOCK_BLOCKED:
194 res = -EAGAIN;
195 break;
196 default:
197 WARN_ONCE(1, "unknown lock status code: %d\n", status);
198 fallthrough;
199 case P9_LOCK_ERROR:
200 case P9_LOCK_GRACE:
201 res = -ENOLCK;
202 break;
203 }
204
205out_unlock:
206 /*
207 * incase server returned error for lock request, revert
208 * it locally
209 */
210 if (res < 0 && fl->fl_type != F_UNLCK) {
211 fl_type = fl->fl_type;
212 fl->fl_type = F_UNLCK;
213 /* Even if this fails we want to return the remote error */
214 locks_lock_file_wait(filp, fl);
215 fl->fl_type = fl_type;
216 }
217 if (flock.client_id != fid->clnt->name)
218 kfree(objp: flock.client_id);
219out:
220 return res;
221}
222
223static int v9fs_file_getlock(struct file *filp, struct file_lock *fl)
224{
225 struct p9_getlock glock;
226 struct p9_fid *fid;
227 int res = 0;
228
229 fid = filp->private_data;
230 BUG_ON(fid == NULL);
231
232 posix_test_lock(filp, fl);
233 /*
234 * if we have a conflicting lock locally, no need to validate
235 * with server
236 */
237 if (fl->fl_type != F_UNLCK)
238 return res;
239
240 /* convert posix lock to p9 tgetlock args */
241 memset(&glock, 0, sizeof(glock));
242 glock.type = P9_LOCK_TYPE_UNLCK;
243 glock.start = fl->fl_start;
244 if (fl->fl_end == OFFSET_MAX)
245 glock.length = 0;
246 else
247 glock.length = fl->fl_end - fl->fl_start + 1;
248 glock.proc_id = fl->fl_pid;
249 glock.client_id = fid->clnt->name;
250
251 res = p9_client_getlock_dotl(fid, fl: &glock);
252 if (res < 0)
253 goto out;
254 /* map 9p lock type to os lock type */
255 switch (glock.type) {
256 case P9_LOCK_TYPE_RDLCK:
257 fl->fl_type = F_RDLCK;
258 break;
259 case P9_LOCK_TYPE_WRLCK:
260 fl->fl_type = F_WRLCK;
261 break;
262 case P9_LOCK_TYPE_UNLCK:
263 fl->fl_type = F_UNLCK;
264 break;
265 }
266 if (glock.type != P9_LOCK_TYPE_UNLCK) {
267 fl->fl_start = glock.start;
268 if (glock.length == 0)
269 fl->fl_end = OFFSET_MAX;
270 else
271 fl->fl_end = glock.start + glock.length - 1;
272 fl->fl_pid = -glock.proc_id;
273 }
274out:
275 if (glock.client_id != fid->clnt->name)
276 kfree(objp: glock.client_id);
277 return res;
278}
279
280/**
281 * v9fs_file_lock_dotl - lock a file (or directory)
282 * @filp: file to be locked
283 * @cmd: lock command
284 * @fl: file lock structure
285 *
286 */
287
288static int v9fs_file_lock_dotl(struct file *filp, int cmd, struct file_lock *fl)
289{
290 struct inode *inode = file_inode(f: filp);
291 int ret = -ENOLCK;
292
293 p9_debug(P9_DEBUG_VFS, "filp: %p cmd:%d lock: %p name: %pD\n",
294 filp, cmd, fl, filp);
295
296 if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) {
297 filemap_write_and_wait(mapping: inode->i_mapping);
298 invalidate_mapping_pages(mapping: &inode->i_data, start: 0, end: -1);
299 }
300
301 if (IS_SETLK(cmd) || IS_SETLKW(cmd))
302 ret = v9fs_file_do_lock(filp, cmd, fl);
303 else if (IS_GETLK(cmd))
304 ret = v9fs_file_getlock(filp, fl);
305 else
306 ret = -EINVAL;
307 return ret;
308}
309
310/**
311 * v9fs_file_flock_dotl - lock a file
312 * @filp: file to be locked
313 * @cmd: lock command
314 * @fl: file lock structure
315 *
316 */
317
318static int v9fs_file_flock_dotl(struct file *filp, int cmd,
319 struct file_lock *fl)
320{
321 struct inode *inode = file_inode(f: filp);
322 int ret = -ENOLCK;
323
324 p9_debug(P9_DEBUG_VFS, "filp: %p cmd:%d lock: %p name: %pD\n",
325 filp, cmd, fl, filp);
326
327 if (!(fl->fl_flags & FL_FLOCK))
328 goto out_err;
329
330 if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) {
331 filemap_write_and_wait(mapping: inode->i_mapping);
332 invalidate_mapping_pages(mapping: &inode->i_data, start: 0, end: -1);
333 }
334 /* Convert flock to posix lock */
335 fl->fl_flags |= FL_POSIX;
336 fl->fl_flags ^= FL_FLOCK;
337
338 if (IS_SETLK(cmd) | IS_SETLKW(cmd))
339 ret = v9fs_file_do_lock(filp, cmd, fl);
340 else
341 ret = -EINVAL;
342out_err:
343 return ret;
344}
345
346/**
347 * v9fs_file_read_iter - read from a file
348 * @iocb: The operation parameters
349 * @to: The buffer to read into
350 *
351 */
352static ssize_t
353v9fs_file_read_iter(struct kiocb *iocb, struct iov_iter *to)
354{
355 struct p9_fid *fid = iocb->ki_filp->private_data;
356 int ret, err = 0;
357
358 p9_debug(P9_DEBUG_VFS, "fid %d count %zu offset %lld\n",
359 fid->fid, iov_iter_count(to), iocb->ki_pos);
360
361 if (!(fid->mode & P9L_DIRECT)) {
362 p9_debug(P9_DEBUG_VFS, "(cached)\n");
363 return generic_file_read_iter(iocb, to);
364 }
365
366 if (iocb->ki_filp->f_flags & O_NONBLOCK)
367 ret = p9_client_read_once(fid, offset: iocb->ki_pos, to, err: &err);
368 else
369 ret = p9_client_read(fid, offset: iocb->ki_pos, to, err: &err);
370 if (!ret)
371 return err;
372
373 iocb->ki_pos += ret;
374 return ret;
375}
376
377/*
378 * v9fs_file_splice_read - splice-read from a file
379 * @in: The 9p file to read from
380 * @ppos: Where to find/update the file position
381 * @pipe: The pipe to splice into
382 * @len: The maximum amount of data to splice
383 * @flags: SPLICE_F_* flags
384 */
385static ssize_t v9fs_file_splice_read(struct file *in, loff_t *ppos,
386 struct pipe_inode_info *pipe,
387 size_t len, unsigned int flags)
388{
389 struct p9_fid *fid = in->private_data;
390
391 p9_debug(P9_DEBUG_VFS, "fid %d count %zu offset %lld\n",
392 fid->fid, len, *ppos);
393
394 if (fid->mode & P9L_DIRECT)
395 return copy_splice_read(in, ppos, pipe, len, flags);
396 return filemap_splice_read(in, ppos, pipe, len, flags);
397}
398
399/**
400 * v9fs_file_write_iter - write to a file
401 * @iocb: The operation parameters
402 * @from: The data to write
403 *
404 */
405static ssize_t
406v9fs_file_write_iter(struct kiocb *iocb, struct iov_iter *from)
407{
408 struct file *file = iocb->ki_filp;
409 struct p9_fid *fid = file->private_data;
410 ssize_t retval;
411 loff_t origin;
412 int err = 0;
413
414 p9_debug(P9_DEBUG_VFS, "fid %d\n", fid->fid);
415
416 if (!(fid->mode & (P9L_DIRECT | P9L_NOWRITECACHE))) {
417 p9_debug(P9_DEBUG_CACHE, "(cached)\n");
418 return generic_file_write_iter(iocb, from);
419 }
420
421 retval = generic_write_checks(iocb, from);
422 if (retval <= 0)
423 return retval;
424
425 origin = iocb->ki_pos;
426 retval = p9_client_write(fid: file->private_data, offset: iocb->ki_pos, from, err: &err);
427 if (retval > 0) {
428 struct inode *inode = file_inode(f: file);
429 loff_t i_size;
430 unsigned long pg_start, pg_end;
431
432 pg_start = origin >> PAGE_SHIFT;
433 pg_end = (origin + retval - 1) >> PAGE_SHIFT;
434 if (inode->i_mapping && inode->i_mapping->nrpages)
435 invalidate_inode_pages2_range(mapping: inode->i_mapping,
436 start: pg_start, end: pg_end);
437 iocb->ki_pos += retval;
438 i_size = i_size_read(inode);
439 if (iocb->ki_pos > i_size) {
440 inode_add_bytes(inode, bytes: iocb->ki_pos - i_size);
441 /*
442 * Need to serialize against i_size_write() in
443 * v9fs_stat2inode()
444 */
445 v9fs_i_size_write(inode, i_size: iocb->ki_pos);
446 }
447 return retval;
448 }
449 return err;
450}
451
452static int v9fs_file_fsync(struct file *filp, loff_t start, loff_t end,
453 int datasync)
454{
455 struct p9_fid *fid;
456 struct inode *inode = filp->f_mapping->host;
457 struct p9_wstat wstat;
458 int retval;
459
460 retval = file_write_and_wait_range(file: filp, start, end);
461 if (retval)
462 return retval;
463
464 inode_lock(inode);
465 p9_debug(P9_DEBUG_VFS, "filp %p datasync %x\n", filp, datasync);
466
467 fid = filp->private_data;
468 v9fs_blank_wstat(wstat: &wstat);
469
470 retval = p9_client_wstat(fid, wst: &wstat);
471 inode_unlock(inode);
472
473 return retval;
474}
475
476int v9fs_file_fsync_dotl(struct file *filp, loff_t start, loff_t end,
477 int datasync)
478{
479 struct p9_fid *fid;
480 struct inode *inode = filp->f_mapping->host;
481 int retval;
482
483 retval = file_write_and_wait_range(file: filp, start, end);
484 if (retval)
485 return retval;
486
487 inode_lock(inode);
488 p9_debug(P9_DEBUG_VFS, "filp %p datasync %x\n", filp, datasync);
489
490 fid = filp->private_data;
491
492 retval = p9_client_fsync(fid, datasync);
493 inode_unlock(inode);
494
495 return retval;
496}
497
498static int
499v9fs_file_mmap(struct file *filp, struct vm_area_struct *vma)
500{
501 int retval;
502 struct inode *inode = file_inode(f: filp);
503 struct v9fs_session_info *v9ses = v9fs_inode2v9ses(inode);
504
505 p9_debug(P9_DEBUG_MMAP, "filp :%p\n", filp);
506
507 if (!(v9ses->cache & CACHE_WRITEBACK)) {
508 p9_debug(P9_DEBUG_CACHE, "(read-only mmap mode)");
509 return generic_file_readonly_mmap(filp, vma);
510 }
511
512 retval = generic_file_mmap(filp, vma);
513 if (!retval)
514 vma->vm_ops = &v9fs_mmap_file_vm_ops;
515
516 return retval;
517}
518
519static vm_fault_t
520v9fs_vm_page_mkwrite(struct vm_fault *vmf)
521{
522 struct folio *folio = page_folio(vmf->page);
523 struct file *filp = vmf->vma->vm_file;
524 struct inode *inode = file_inode(f: filp);
525
526
527 p9_debug(P9_DEBUG_VFS, "folio %p fid %lx\n",
528 folio, (unsigned long)filp->private_data);
529
530 /* Wait for the page to be written to the cache before we allow it to
531 * be modified. We then assume the entire page will need writing back.
532 */
533#ifdef CONFIG_9P_FSCACHE
534 if (folio_test_fscache(folio) &&
535 folio_wait_fscache_killable(folio) < 0)
536 return VM_FAULT_NOPAGE;
537#endif
538
539 /* Update file times before taking page lock */
540 file_update_time(file: filp);
541
542 if (folio_lock_killable(folio) < 0)
543 return VM_FAULT_RETRY;
544 if (folio_mapping(folio) != inode->i_mapping)
545 goto out_unlock;
546 folio_wait_stable(folio);
547
548 return VM_FAULT_LOCKED;
549out_unlock:
550 folio_unlock(folio);
551 return VM_FAULT_NOPAGE;
552}
553
554static void v9fs_mmap_vm_close(struct vm_area_struct *vma)
555{
556 struct inode *inode;
557
558 struct writeback_control wbc = {
559 .nr_to_write = LONG_MAX,
560 .sync_mode = WB_SYNC_ALL,
561 .range_start = (loff_t)vma->vm_pgoff * PAGE_SIZE,
562 /* absolute end, byte at end included */
563 .range_end = (loff_t)vma->vm_pgoff * PAGE_SIZE +
564 (vma->vm_end - vma->vm_start - 1),
565 };
566
567 if (!(vma->vm_flags & VM_SHARED))
568 return;
569
570 p9_debug(P9_DEBUG_VFS, "9p VMA close, %p, flushing", vma);
571
572 inode = file_inode(f: vma->vm_file);
573 filemap_fdatawrite_wbc(mapping: inode->i_mapping, wbc: &wbc);
574}
575
576static const struct vm_operations_struct v9fs_mmap_file_vm_ops = {
577 .close = v9fs_mmap_vm_close,
578 .fault = filemap_fault,
579 .map_pages = filemap_map_pages,
580 .page_mkwrite = v9fs_vm_page_mkwrite,
581};
582
583const struct file_operations v9fs_file_operations = {
584 .llseek = generic_file_llseek,
585 .read_iter = v9fs_file_read_iter,
586 .write_iter = v9fs_file_write_iter,
587 .open = v9fs_file_open,
588 .release = v9fs_dir_release,
589 .lock = v9fs_file_lock,
590 .mmap = generic_file_readonly_mmap,
591 .splice_read = v9fs_file_splice_read,
592 .splice_write = iter_file_splice_write,
593 .fsync = v9fs_file_fsync,
594};
595
596const struct file_operations v9fs_file_operations_dotl = {
597 .llseek = generic_file_llseek,
598 .read_iter = v9fs_file_read_iter,
599 .write_iter = v9fs_file_write_iter,
600 .open = v9fs_file_open,
601 .release = v9fs_dir_release,
602 .lock = v9fs_file_lock_dotl,
603 .flock = v9fs_file_flock_dotl,
604 .mmap = v9fs_file_mmap,
605 .splice_read = v9fs_file_splice_read,
606 .splice_write = iter_file_splice_write,
607 .fsync = v9fs_file_fsync_dotl,
608};
609

source code of linux/fs/9p/vfs_file.c