| // SPDX-License-Identifier: GPL-2.0-only |
| /* |
| * This file contians vfs file ops for 9P2000. |
| * |
| * Copyright (C) 2004 by Eric Van Hensbergen <ericvh@gmail.com> |
| * Copyright (C) 2002 by Ron Minnich <rminnich@lanl.gov> |
| */ |
| |
| #include <linux/module.h> |
| #include <linux/errno.h> |
| #include <linux/fs.h> |
| #include <linux/filelock.h> |
| #include <linux/sched.h> |
| #include <linux/file.h> |
| #include <linux/stat.h> |
| #include <linux/string.h> |
| #include <linux/list.h> |
| #include <linux/pagemap.h> |
| #include <linux/utsname.h> |
| #include <linux/uaccess.h> |
| #include <linux/uio.h> |
| #include <linux/slab.h> |
| #include <net/9p/9p.h> |
| #include <net/9p/client.h> |
| |
| #include "v9fs.h" |
| #include "v9fs_vfs.h" |
| #include "fid.h" |
| #include "cache.h" |
| |
| static const struct vm_operations_struct v9fs_mmap_file_vm_ops; |
| |
| /** |
| * v9fs_file_open - open a file (or directory) |
| * @inode: inode to be opened |
| * @file: file being opened |
| * |
| */ |
| |
| int v9fs_file_open(struct inode *inode, struct file *file) |
| { |
| int err; |
| struct v9fs_session_info *v9ses; |
| struct p9_fid *fid; |
| int omode; |
| |
| p9_debug(P9_DEBUG_VFS, "inode: %p file: %p\n", inode, file); |
| v9ses = v9fs_inode2v9ses(inode); |
| if (v9fs_proto_dotl(v9ses)) |
| omode = v9fs_open_to_dotl_flags(file->f_flags); |
| else |
| omode = v9fs_uflags2omode(file->f_flags, |
| v9fs_proto_dotu(v9ses)); |
| fid = file->private_data; |
| if (!fid) { |
| fid = v9fs_fid_clone(file_dentry(file)); |
| if (IS_ERR(fid)) |
| return PTR_ERR(fid); |
| |
| if ((v9ses->cache & CACHE_WRITEBACK) && (omode & P9_OWRITE)) { |
| int writeback_omode = (omode & ~P9_OWRITE) | P9_ORDWR; |
| |
| p9_debug(P9_DEBUG_CACHE, "write-only file with writeback enabled, try opening O_RDWR\n"); |
| err = p9_client_open(fid, writeback_omode); |
| if (err < 0) { |
| p9_debug(P9_DEBUG_CACHE, "could not open O_RDWR, disabling caches\n"); |
| err = p9_client_open(fid, omode); |
| fid->mode |= P9L_DIRECT; |
| } |
| } else { |
| err = p9_client_open(fid, omode); |
| } |
| if (err < 0) { |
| p9_fid_put(fid); |
| return err; |
| } |
| if ((file->f_flags & O_APPEND) && |
| (!v9fs_proto_dotu(v9ses) && !v9fs_proto_dotl(v9ses))) |
| generic_file_llseek(file, 0, SEEK_END); |
| |
| file->private_data = fid; |
| } |
| |
| #ifdef CONFIG_9P_FSCACHE |
| if (v9ses->cache & CACHE_FSCACHE) |
| fscache_use_cookie(v9fs_inode_cookie(V9FS_I(inode)), |
| file->f_mode & FMODE_WRITE); |
| #endif |
| v9fs_fid_add_modes(fid, v9ses->flags, v9ses->cache, file->f_flags); |
| v9fs_open_fid_add(inode, &fid); |
| return 0; |
| } |
| |
| /** |
| * v9fs_file_lock - lock a file (or directory) |
| * @filp: file to be locked |
| * @cmd: lock command |
| * @fl: file lock structure |
| * |
| * Bugs: this looks like a local only lock, we should extend into 9P |
| * by using open exclusive |
| */ |
| |
| static int v9fs_file_lock(struct file *filp, int cmd, struct file_lock *fl) |
| { |
| struct inode *inode = file_inode(filp); |
| |
| p9_debug(P9_DEBUG_VFS, "filp: %p lock: %p\n", filp, fl); |
| |
| if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) { |
| filemap_write_and_wait(inode->i_mapping); |
| invalidate_mapping_pages(&inode->i_data, 0, -1); |
| } |
| |
| return 0; |
| } |
| |
| static int v9fs_file_do_lock(struct file *filp, int cmd, struct file_lock *fl) |
| { |
| struct p9_flock flock; |
| struct p9_fid *fid; |
| uint8_t status = P9_LOCK_ERROR; |
| int res = 0; |
| unsigned char fl_type; |
| struct v9fs_session_info *v9ses; |
| |
| fid = filp->private_data; |
| BUG_ON(fid == NULL); |
| |
| BUG_ON((fl->fl_flags & FL_POSIX) != FL_POSIX); |
| |
| res = locks_lock_file_wait(filp, fl); |
| if (res < 0) |
| goto out; |
| |
| /* convert posix lock to p9 tlock args */ |
| memset(&flock, 0, sizeof(flock)); |
| /* map the lock type */ |
| switch (fl->fl_type) { |
| case F_RDLCK: |
| flock.type = P9_LOCK_TYPE_RDLCK; |
| break; |
| case F_WRLCK: |
| flock.type = P9_LOCK_TYPE_WRLCK; |
| break; |
| case F_UNLCK: |
| flock.type = P9_LOCK_TYPE_UNLCK; |
| break; |
| } |
| flock.start = fl->fl_start; |
| if (fl->fl_end == OFFSET_MAX) |
| flock.length = 0; |
| else |
| flock.length = fl->fl_end - fl->fl_start + 1; |
| flock.proc_id = fl->fl_pid; |
| flock.client_id = fid->clnt->name; |
| if (IS_SETLKW(cmd)) |
| flock.flags = P9_LOCK_FLAGS_BLOCK; |
| |
| v9ses = v9fs_inode2v9ses(file_inode(filp)); |
| |
| /* |
| * if its a blocked request and we get P9_LOCK_BLOCKED as the status |
| * for lock request, keep on trying |
| */ |
| for (;;) { |
| res = p9_client_lock_dotl(fid, &flock, &status); |
| if (res < 0) |
| goto out_unlock; |
| |
| if (status != P9_LOCK_BLOCKED) |
| break; |
| if (status == P9_LOCK_BLOCKED && !IS_SETLKW(cmd)) |
| break; |
| if (schedule_timeout_interruptible(v9ses->session_lock_timeout) |
| != 0) |
| break; |
| /* |
| * p9_client_lock_dotl overwrites flock.client_id with the |
| * server message, free and reuse the client name |
| */ |
| if (flock.client_id != fid->clnt->name) { |
| kfree(flock.client_id); |
| flock.client_id = fid->clnt->name; |
| } |
| } |
| |
| /* map 9p status to VFS status */ |
| switch (status) { |
| case P9_LOCK_SUCCESS: |
| res = 0; |
| break; |
| case P9_LOCK_BLOCKED: |
| res = -EAGAIN; |
| break; |
| default: |
| WARN_ONCE(1, "unknown lock status code: %d\n", status); |
| fallthrough; |
| case P9_LOCK_ERROR: |
| case P9_LOCK_GRACE: |
| res = -ENOLCK; |
| break; |
| } |
| |
| out_unlock: |
| /* |
| * incase server returned error for lock request, revert |
| * it locally |
| */ |
| if (res < 0 && fl->fl_type != F_UNLCK) { |
| fl_type = fl->fl_type; |
| fl->fl_type = F_UNLCK; |
| /* Even if this fails we want to return the remote error */ |
| locks_lock_file_wait(filp, fl); |
| fl->fl_type = fl_type; |
| } |
| if (flock.client_id != fid->clnt->name) |
| kfree(flock.client_id); |
| out: |
| return res; |
| } |
| |
| static int v9fs_file_getlock(struct file *filp, struct file_lock *fl) |
| { |
| struct p9_getlock glock; |
| struct p9_fid *fid; |
| int res = 0; |
| |
| fid = filp->private_data; |
| BUG_ON(fid == NULL); |
| |
| posix_test_lock(filp, fl); |
| /* |
| * if we have a conflicting lock locally, no need to validate |
| * with server |
| */ |
| if (fl->fl_type != F_UNLCK) |
| return res; |
| |
| /* convert posix lock to p9 tgetlock args */ |
| memset(&glock, 0, sizeof(glock)); |
| glock.type = P9_LOCK_TYPE_UNLCK; |
| glock.start = fl->fl_start; |
| if (fl->fl_end == OFFSET_MAX) |
| glock.length = 0; |
| else |
| glock.length = fl->fl_end - fl->fl_start + 1; |
| glock.proc_id = fl->fl_pid; |
| glock.client_id = fid->clnt->name; |
| |
| res = p9_client_getlock_dotl(fid, &glock); |
| if (res < 0) |
| goto out; |
| /* map 9p lock type to os lock type */ |
| switch (glock.type) { |
| case P9_LOCK_TYPE_RDLCK: |
| fl->fl_type = F_RDLCK; |
| break; |
| case P9_LOCK_TYPE_WRLCK: |
| fl->fl_type = F_WRLCK; |
| break; |
| case P9_LOCK_TYPE_UNLCK: |
| fl->fl_type = F_UNLCK; |
| break; |
| } |
| if (glock.type != P9_LOCK_TYPE_UNLCK) { |
| fl->fl_start = glock.start; |
| if (glock.length == 0) |
| fl->fl_end = OFFSET_MAX; |
| else |
| fl->fl_end = glock.start + glock.length - 1; |
| fl->fl_pid = -glock.proc_id; |
| } |
| out: |
| if (glock.client_id != fid->clnt->name) |
| kfree(glock.client_id); |
| return res; |
| } |
| |
| /** |
| * v9fs_file_lock_dotl - lock a file (or directory) |
| * @filp: file to be locked |
| * @cmd: lock command |
| * @fl: file lock structure |
| * |
| */ |
| |
| static int v9fs_file_lock_dotl(struct file *filp, int cmd, struct file_lock *fl) |
| { |
| struct inode *inode = file_inode(filp); |
| int ret = -ENOLCK; |
| |
| p9_debug(P9_DEBUG_VFS, "filp: %p cmd:%d lock: %p name: %pD\n", |
| filp, cmd, fl, filp); |
| |
| if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) { |
| filemap_write_and_wait(inode->i_mapping); |
| invalidate_mapping_pages(&inode->i_data, 0, -1); |
| } |
| |
| if (IS_SETLK(cmd) || IS_SETLKW(cmd)) |
| ret = v9fs_file_do_lock(filp, cmd, fl); |
| else if (IS_GETLK(cmd)) |
| ret = v9fs_file_getlock(filp, fl); |
| else |
| ret = -EINVAL; |
| return ret; |
| } |
| |
| /** |
| * v9fs_file_flock_dotl - lock a file |
| * @filp: file to be locked |
| * @cmd: lock command |
| * @fl: file lock structure |
| * |
| */ |
| |
| static int v9fs_file_flock_dotl(struct file *filp, int cmd, |
| struct file_lock *fl) |
| { |
| struct inode *inode = file_inode(filp); |
| int ret = -ENOLCK; |
| |
| p9_debug(P9_DEBUG_VFS, "filp: %p cmd:%d lock: %p name: %pD\n", |
| filp, cmd, fl, filp); |
| |
| if (!(fl->fl_flags & FL_FLOCK)) |
| goto out_err; |
| |
| if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) { |
| filemap_write_and_wait(inode->i_mapping); |
| invalidate_mapping_pages(&inode->i_data, 0, -1); |
| } |
| /* Convert flock to posix lock */ |
| fl->fl_flags |= FL_POSIX; |
| fl->fl_flags ^= FL_FLOCK; |
| |
| if (IS_SETLK(cmd) | IS_SETLKW(cmd)) |
| ret = v9fs_file_do_lock(filp, cmd, fl); |
| else |
| ret = -EINVAL; |
| out_err: |
| return ret; |
| } |
| |
| /** |
| * v9fs_file_read_iter - read from a file |
| * @iocb: The operation parameters |
| * @to: The buffer to read into |
| * |
| */ |
| static ssize_t |
| v9fs_file_read_iter(struct kiocb *iocb, struct iov_iter *to) |
| { |
| struct p9_fid *fid = iocb->ki_filp->private_data; |
| int ret, err = 0; |
| |
| p9_debug(P9_DEBUG_VFS, "fid %d count %zu offset %lld\n", |
| fid->fid, iov_iter_count(to), iocb->ki_pos); |
| |
| if (!(fid->mode & P9L_DIRECT)) { |
| p9_debug(P9_DEBUG_VFS, "(cached)\n"); |
| return generic_file_read_iter(iocb, to); |
| } |
| |
| if (iocb->ki_filp->f_flags & O_NONBLOCK) |
| ret = p9_client_read_once(fid, iocb->ki_pos, to, &err); |
| else |
| ret = p9_client_read(fid, iocb->ki_pos, to, &err); |
| if (!ret) |
| return err; |
| |
| iocb->ki_pos += ret; |
| return ret; |
| } |
| |
| /* |
| * v9fs_file_splice_read - splice-read from a file |
| * @in: The 9p file to read from |
| * @ppos: Where to find/update the file position |
| * @pipe: The pipe to splice into |
| * @len: The maximum amount of data to splice |
| * @flags: SPLICE_F_* flags |
| */ |
| static ssize_t v9fs_file_splice_read(struct file *in, loff_t *ppos, |
| struct pipe_inode_info *pipe, |
| size_t len, unsigned int flags) |
| { |
| struct p9_fid *fid = in->private_data; |
| |
| p9_debug(P9_DEBUG_VFS, "fid %d count %zu offset %lld\n", |
| fid->fid, len, *ppos); |
| |
| if (fid->mode & P9L_DIRECT) |
| return copy_splice_read(in, ppos, pipe, len, flags); |
| return filemap_splice_read(in, ppos, pipe, len, flags); |
| } |
| |
| /** |
| * v9fs_file_write_iter - write to a file |
| * @iocb: The operation parameters |
| * @from: The data to write |
| * |
| */ |
| static ssize_t |
| v9fs_file_write_iter(struct kiocb *iocb, struct iov_iter *from) |
| { |
| struct file *file = iocb->ki_filp; |
| struct p9_fid *fid = file->private_data; |
| ssize_t retval; |
| loff_t origin; |
| int err = 0; |
| |
| p9_debug(P9_DEBUG_VFS, "fid %d\n", fid->fid); |
| |
| if (!(fid->mode & (P9L_DIRECT | P9L_NOWRITECACHE))) { |
| p9_debug(P9_DEBUG_CACHE, "(cached)\n"); |
| return generic_file_write_iter(iocb, from); |
| } |
| |
| retval = generic_write_checks(iocb, from); |
| if (retval <= 0) |
| return retval; |
| |
| origin = iocb->ki_pos; |
| retval = p9_client_write(file->private_data, iocb->ki_pos, from, &err); |
| if (retval > 0) { |
| struct inode *inode = file_inode(file); |
| loff_t i_size; |
| unsigned long pg_start, pg_end; |
| |
| pg_start = origin >> PAGE_SHIFT; |
| pg_end = (origin + retval - 1) >> PAGE_SHIFT; |
| if (inode->i_mapping && inode->i_mapping->nrpages) |
| invalidate_inode_pages2_range(inode->i_mapping, |
| pg_start, pg_end); |
| iocb->ki_pos += retval; |
| i_size = i_size_read(inode); |
| if (iocb->ki_pos > i_size) { |
| inode_add_bytes(inode, iocb->ki_pos - i_size); |
| /* |
| * Need to serialize against i_size_write() in |
| * v9fs_stat2inode() |
| */ |
| v9fs_i_size_write(inode, iocb->ki_pos); |
| } |
| return retval; |
| } |
| return err; |
| } |
| |
| static int v9fs_file_fsync(struct file *filp, loff_t start, loff_t end, |
| int datasync) |
| { |
| struct p9_fid *fid; |
| struct inode *inode = filp->f_mapping->host; |
| struct p9_wstat wstat; |
| int retval; |
| |
| retval = file_write_and_wait_range(filp, start, end); |
| if (retval) |
| return retval; |
| |
| inode_lock(inode); |
| p9_debug(P9_DEBUG_VFS, "filp %p datasync %x\n", filp, datasync); |
| |
| fid = filp->private_data; |
| v9fs_blank_wstat(&wstat); |
| |
| retval = p9_client_wstat(fid, &wstat); |
| inode_unlock(inode); |
| |
| return retval; |
| } |
| |
| int v9fs_file_fsync_dotl(struct file *filp, loff_t start, loff_t end, |
| int datasync) |
| { |
| struct p9_fid *fid; |
| struct inode *inode = filp->f_mapping->host; |
| int retval; |
| |
| retval = file_write_and_wait_range(filp, start, end); |
| if (retval) |
| return retval; |
| |
| inode_lock(inode); |
| p9_debug(P9_DEBUG_VFS, "filp %p datasync %x\n", filp, datasync); |
| |
| fid = filp->private_data; |
| |
| retval = p9_client_fsync(fid, datasync); |
| inode_unlock(inode); |
| |
| return retval; |
| } |
| |
| static int |
| v9fs_file_mmap(struct file *filp, struct vm_area_struct *vma) |
| { |
| int retval; |
| struct inode *inode = file_inode(filp); |
| struct v9fs_session_info *v9ses = v9fs_inode2v9ses(inode); |
| |
| p9_debug(P9_DEBUG_MMAP, "filp :%p\n", filp); |
| |
| if (!(v9ses->cache & CACHE_WRITEBACK)) { |
| p9_debug(P9_DEBUG_CACHE, "(no mmap mode)"); |
| if (vma->vm_flags & VM_MAYSHARE) |
| return -ENODEV; |
| invalidate_inode_pages2(filp->f_mapping); |
| return generic_file_readonly_mmap(filp, vma); |
| } |
| |
| retval = generic_file_mmap(filp, vma); |
| if (!retval) |
| vma->vm_ops = &v9fs_mmap_file_vm_ops; |
| |
| return retval; |
| } |
| |
| static vm_fault_t |
| v9fs_vm_page_mkwrite(struct vm_fault *vmf) |
| { |
| struct folio *folio = page_folio(vmf->page); |
| struct file *filp = vmf->vma->vm_file; |
| struct inode *inode = file_inode(filp); |
| |
| |
| p9_debug(P9_DEBUG_VFS, "folio %p fid %lx\n", |
| folio, (unsigned long)filp->private_data); |
| |
| /* Wait for the page to be written to the cache before we allow it to |
| * be modified. We then assume the entire page will need writing back. |
| */ |
| #ifdef CONFIG_9P_FSCACHE |
| if (folio_test_fscache(folio) && |
| folio_wait_fscache_killable(folio) < 0) |
| return VM_FAULT_NOPAGE; |
| #endif |
| |
| /* Update file times before taking page lock */ |
| file_update_time(filp); |
| |
| if (folio_lock_killable(folio) < 0) |
| return VM_FAULT_RETRY; |
| if (folio_mapping(folio) != inode->i_mapping) |
| goto out_unlock; |
| folio_wait_stable(folio); |
| |
| return VM_FAULT_LOCKED; |
| out_unlock: |
| folio_unlock(folio); |
| return VM_FAULT_NOPAGE; |
| } |
| |
| static void v9fs_mmap_vm_close(struct vm_area_struct *vma) |
| { |
| struct inode *inode; |
| |
| struct writeback_control wbc = { |
| .nr_to_write = LONG_MAX, |
| .sync_mode = WB_SYNC_ALL, |
| .range_start = (loff_t)vma->vm_pgoff * PAGE_SIZE, |
| /* absolute end, byte at end included */ |
| .range_end = (loff_t)vma->vm_pgoff * PAGE_SIZE + |
| (vma->vm_end - vma->vm_start - 1), |
| }; |
| |
| if (!(vma->vm_flags & VM_SHARED)) |
| return; |
| |
| p9_debug(P9_DEBUG_VFS, "9p VMA close, %p, flushing", vma); |
| |
| inode = file_inode(vma->vm_file); |
| filemap_fdatawrite_wbc(inode->i_mapping, &wbc); |
| } |
| |
| static const struct vm_operations_struct v9fs_mmap_file_vm_ops = { |
| .close = v9fs_mmap_vm_close, |
| .fault = filemap_fault, |
| .map_pages = filemap_map_pages, |
| .page_mkwrite = v9fs_vm_page_mkwrite, |
| }; |
| |
| const struct file_operations v9fs_file_operations = { |
| .llseek = generic_file_llseek, |
| .read_iter = v9fs_file_read_iter, |
| .write_iter = v9fs_file_write_iter, |
| .open = v9fs_file_open, |
| .release = v9fs_dir_release, |
| .lock = v9fs_file_lock, |
| .mmap = generic_file_readonly_mmap, |
| .splice_read = v9fs_file_splice_read, |
| .splice_write = iter_file_splice_write, |
| .fsync = v9fs_file_fsync, |
| }; |
| |
| const struct file_operations v9fs_file_operations_dotl = { |
| .llseek = generic_file_llseek, |
| .read_iter = v9fs_file_read_iter, |
| .write_iter = v9fs_file_write_iter, |
| .open = v9fs_file_open, |
| .release = v9fs_dir_release, |
| .lock = v9fs_file_lock_dotl, |
| .flock = v9fs_file_flock_dotl, |
| .mmap = v9fs_file_mmap, |
| .splice_read = v9fs_file_splice_read, |
| .splice_write = iter_file_splice_write, |
| .fsync = v9fs_file_fsync_dotl, |
| }; |