2 * linux/fs/9p/vfs_file.c
4 * This file contains vfs file ops for 9P2000.
6 * Copyright (C) 2004 by Eric Van Hensbergen <ericvh@gmail.com>
7 * Copyright (C) 2002 by Ron Minnich <rminnich@lanl.gov>
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License version 2
11 * as published by the Free Software Foundation.
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to:
20 * Free Software Foundation
21 * 51 Franklin Street, Fifth Floor
22 * Boston, MA 02111-1301 USA
26 #include <linux/module.h>
27 #include <linux/errno.h>
29 #include <linux/sched.h>
30 #include <linux/file.h>
31 #include <linux/stat.h>
32 #include <linux/string.h>
33 #include <linux/inet.h>
34 #include <linux/list.h>
35 #include <linux/pagemap.h>
36 #include <linux/utsname.h>
37 #include <asm/uaccess.h>
38 #include <linux/idr.h>
39 #include <net/9p/9p.h>
40 #include <net/9p/client.h>
47 static const struct vm_operations_struct v9fs_file_vm_ops;
/*
 * Open handler referenced by every file_operations table in this file.
 * NOTE(review): this listing omits some source lines (braces, a few local
 * declarations, several branches); notes below cover visible statements only.
 */
50 * v9fs_file_open - open a file (or directory)
51 * @inode: inode to be opened
52 * @file: file being opened
56 int v9fs_file_open(struct inode *inode, struct file *file)
59 struct v9fs_inode *v9inode;
60 struct v9fs_session_info *v9ses;
64 P9_DPRINTK(P9_DEBUG_VFS, "inode: %p file: %p\n", inode, file);
65 v9inode = V9FS_I(inode);
66 v9ses = v9fs_inode2v9ses(inode);
/*
 * Translate the VFS open flags: 9P2000.L sessions use the dotl flag mapping;
 * the other assignment uses v9fs_uflags2omode(), told whether 9P2000.u is
 * in use (presumably the else branch; the keyword is not visible here).
 */
67 if (v9fs_proto_dotl(v9ses))
68 omode = v9fs_open_to_dotl_flags(file->f_flags);
70 omode = v9fs_uflags2omode(file->f_flags,
71 v9fs_proto_dotu(v9ses));
/*
 * Start from any fid already stored on the file; a fid is cloned from the
 * dentry and opened on the server (the guarding condition is not visible;
 * presumably only when no fid was attached yet).
 */
72 fid = file->private_data;
74 fid = v9fs_fid_clone(file->f_path.dentry);
78 err = p9_client_open(fid, omode);
/* O_TRUNC: reset the locally cached inode size to zero. */
83 if (file->f_flags & O_TRUNC) {
84 i_size_write(inode, 0);
/* Plain 9P2000 (neither .u nor .L) with O_APPEND: seek to end of file here. */
87 if ((file->f_flags & O_APPEND) &&
88 (!v9fs_proto_dotu(v9ses) && !v9fs_proto_dotl(v9ses)))
89 generic_file_llseek(file, 0, SEEK_END);
/* Attach the fid to the file, then set up the writeback fid under v_mutex. */
92 file->private_data = fid;
93 mutex_lock(&v9inode->v_mutex);
/* Only when caching is on, no writeback fid exists yet, and the open is not read-only. */
94 if (v9ses->cache && !v9inode->writeback_fid &&
95 ((file->f_flags & O_ACCMODE) != O_RDONLY)) {
97 * clone a fid and add it to writeback_fid
98 * we do it during open time instead of
99 * page dirty time via write_begin/page_mkwrite
100 * because we want write after unlink usecase
103 fid = v9fs_writeback_fid(file->f_path.dentry);
/* This unlock is presumably on the failure path of v9fs_writeback_fid() — check not visible. */
106 mutex_unlock(&v9inode->v_mutex);
109 v9inode->writeback_fid = (void *) fid;
111 mutex_unlock(&v9inode->v_mutex);
112 #ifdef CONFIG_9P_FSCACHE
/* Built only with CONFIG_9P_FSCACHE; any runtime guard is not visible here. */
114 v9fs_cache_inode_set_cookie(inode, file);
/* Clunk the fid and detach it from the file; presumably the error exit (label not visible). */
118 p9_client_clunk(file->private_data);
119 file->private_data = NULL;
/*
 * .lock handler used by the non-dotl file_operations tables in this file.
 * NOTE(review): the return statements are not visible in this listing.
 */
124 * v9fs_file_lock - lock a file (or directory)
125 * @filp: file to be locked
127 * @fl: file lock structure
129 * Bugs: this looks like a local only lock, we should extend into 9P
130 * by using open exclusive
133 static int v9fs_file_lock(struct file *filp, int cmd, struct file_lock *fl)
136 struct inode *inode = filp->f_path.dentry->d_inode;
138 P9_DPRINTK(P9_DEBUG_VFS, "filp: %p lock: %p\n", filp, fl);
140 /* No mandatory locks */
141 if (__mandatory_lock(inode) && fl->fl_type != F_UNLCK)
/*
 * For a SETLK/SETLKW request that is not an unlock: write back dirty pages
 * and invalidate the inode's cached pages (whole range, 0 .. -1).
 */
144 if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) {
145 filemap_write_and_wait(inode->i_mapping);
146 invalidate_mapping_pages(&inode->i_data, 0, -1);
152 static int v9fs_file_do_lock(struct file *filp, int cmd, struct file_lock *fl)
154 struct p9_flock flock;
158 unsigned char fl_type;
160 fid = filp->private_data;
163 if ((fl->fl_flags & FL_POSIX) != FL_POSIX)
166 res = posix_lock_file_wait(filp, fl);
170 /* convert posix lock to p9 tlock args */
171 memset(&flock, 0, sizeof(flock));
172 /* map the lock type */
173 switch (fl->fl_type) {
175 flock.type = P9_LOCK_TYPE_RDLCK;
178 flock.type = P9_LOCK_TYPE_WRLCK;
181 flock.type = P9_LOCK_TYPE_UNLCK;
184 flock.start = fl->fl_start;
185 if (fl->fl_end == OFFSET_MAX)
188 flock.length = fl->fl_end - fl->fl_start + 1;
189 flock.proc_id = fl->fl_pid;
190 flock.client_id = utsname()->nodename;
192 flock.flags = P9_LOCK_FLAGS_BLOCK;
195 * if its a blocked request and we get P9_LOCK_BLOCKED as the status
196 * for lock request, keep on trying
199 res = p9_client_lock_dotl(fid, &flock, &status);
203 if (status != P9_LOCK_BLOCKED)
205 if (status == P9_LOCK_BLOCKED && !IS_SETLKW(cmd))
207 schedule_timeout_interruptible(P9_LOCK_TIMEOUT);
210 /* map 9p status to VFS status */
212 case P9_LOCK_SUCCESS:
215 case P9_LOCK_BLOCKED:
227 * incase server returned error for lock request, revert
230 if (res < 0 && fl->fl_type != F_UNLCK) {
231 fl_type = fl->fl_type;
232 fl->fl_type = F_UNLCK;
233 res = posix_lock_file_wait(filp, fl);
234 fl->fl_type = fl_type;
/*
 * Test for a conflicting lock: first locally with posix_test_lock(), then
 * on the server with p9_client_getlock_dotl(). The server's answer is
 * written back into @fl.
 * NOTE(review): this listing omits some source lines (braces, returns,
 * break statements, some declarations).
 */
240 static int v9fs_file_getlock(struct file *filp, struct file_lock *fl)
242 struct p9_getlock glock;
246 fid = filp->private_data;
249 posix_test_lock(filp, fl);
251 * if we have a conflicting lock locally, no need to validate
254 if (fl->fl_type != F_UNLCK)
257 /* convert posix lock to p9 tgetlock args */
258 memset(&glock, 0, sizeof(glock));
259 glock.type = P9_LOCK_TYPE_UNLCK;
/* Range is sent as start + length; fl_end is inclusive, hence the +1. */
260 glock.start = fl->fl_start;
261 if (fl->fl_end == OFFSET_MAX)
264 glock.length = fl->fl_end - fl->fl_start + 1;
265 glock.proc_id = fl->fl_pid;
266 glock.client_id = utsname()->nodename;
268 res = p9_client_getlock_dotl(fid, &glock);
271 /* map 9p lock type to os lock type */
272 switch (glock.type) {
273 case P9_LOCK_TYPE_RDLCK:
274 fl->fl_type = F_RDLCK;
276 case P9_LOCK_TYPE_WRLCK:
277 fl->fl_type = F_WRLCK;
279 case P9_LOCK_TYPE_UNLCK:
280 fl->fl_type = F_UNLCK;
/*
 * A lock was reported: copy its range and owner pid into @fl. A reported
 * length of 0 is mapped to fl_end = OFFSET_MAX; otherwise the inclusive
 * end is start + length - 1.
 */
283 if (glock.type != P9_LOCK_TYPE_UNLCK) {
284 fl->fl_start = glock.start;
285 if (glock.length == 0)
286 fl->fl_end = OFFSET_MAX;
288 fl->fl_end = glock.start + glock.length - 1;
289 fl->fl_pid = glock.proc_id;
/*
 * .lock handler used by the *_dotl file_operations tables in this file.
 * NOTE(review): return statements and the fallback for other commands are
 * not visible in this listing.
 */
295 * v9fs_file_lock_dotl - lock a file (or directory)
296 * @filp: file to be locked
298 * @fl: file lock structure
302 static int v9fs_file_lock_dotl(struct file *filp, int cmd, struct file_lock *fl)
304 struct inode *inode = filp->f_path.dentry->d_inode;
307 P9_DPRINTK(P9_DEBUG_VFS, "filp: %p cmd:%d lock: %p name: %s\n", filp,
308 cmd, fl, filp->f_path.dentry->d_name.name);
310 /* No mandatory locks */
311 if (__mandatory_lock(inode) && fl->fl_type != F_UNLCK)
/*
 * For a SETLK/SETLKW request that is not an unlock: write back dirty pages
 * and invalidate the inode's cached pages (whole range, 0 .. -1).
 */
314 if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) {
315 filemap_write_and_wait(inode->i_mapping);
316 invalidate_mapping_pages(&inode->i_data, 0, -1);
/* Dispatch: set/clear requests go to v9fs_file_do_lock(), queries to v9fs_file_getlock(). */
319 if (IS_SETLK(cmd) || IS_SETLKW(cmd))
320 ret = v9fs_file_do_lock(filp, cmd, fl);
321 else if (IS_GETLK(cmd))
322 ret = v9fs_file_getlock(filp, fl);
/*
 * .flock handler used by the *_dotl file_operations tables in this file.
 * The flock request is rewritten in place as a POSIX lock and handed to
 * v9fs_file_do_lock().
 * NOTE(review): this listing omits some source lines (braces, returns, and
 * original line 359, which presumably sets fl_start).
 */
330 * v9fs_file_flock_dotl - lock a file
331 * @filp: file to be locked
333 * @fl: file lock structure
337 static int v9fs_file_flock_dotl(struct file *filp, int cmd,
338 struct file_lock *fl)
340 struct inode *inode = filp->f_path.dentry->d_inode;
343 P9_DPRINTK(P9_DEBUG_VFS, "filp: %p cmd:%d lock: %p name: %s\n", filp,
344 cmd, fl, filp->f_path.dentry->d_name.name);
346 /* No mandatory locks */
347 if (__mandatory_lock(inode) && fl->fl_type != F_UNLCK)
/* Requests without FL_FLOCK are singled out here; the action taken is not visible. */
350 if (!(fl->fl_flags & FL_FLOCK))
/*
 * For a SETLK/SETLKW request that is not an unlock: write back dirty pages
 * and invalidate the inode's cached pages (whole range, 0 .. -1).
 */
353 if ((IS_SETLK(cmd) || IS_SETLKW(cmd)) && fl->fl_type != F_UNLCK) {
354 filemap_write_and_wait(inode->i_mapping);
355 invalidate_mapping_pages(&inode->i_data, 0, -1);
357 /* Convert flock to posix lock */
/* The struct file itself becomes the lock owner; the range runs to OFFSET_MAX. */
358 fl->fl_owner = (fl_owner_t)filp;
360 fl->fl_end = OFFSET_MAX;
/* Set FL_POSIX and toggle FL_FLOCK with XOR (clears it when it was set). */
361 fl->fl_flags |= FL_POSIX;
362 fl->fl_flags ^= FL_FLOCK;
/* Logical OR, matching the same test in v9fs_file_lock_dotl(). */
364 if (IS_SETLK(cmd) || IS_SETLKW(cmd))
365 ret = v9fs_file_do_lock(filp, cmd, fl);
/*
 * Read through a fid using repeated p9_client_read() calls.
 * NOTE(review): the loop head, the accumulation of the result and the
 * return are not visible in this listing.
 */
373 * v9fs_fid_readn - read from a fid
375 * @data: data buffer to read data into
376 * @udata: user data buffer to read data into
377 * @count: size of buffer
378 * @offset: offset at which to read data
382 v9fs_fid_readn(struct p9_fid *fid, char *data, char __user *udata, u32 count,
387 P9_DPRINTK(P9_DEBUG_VFS, "fid %d offset %llu count %d\n", fid->fid,
388 (long long unsigned) offset, count);
/* Chunk size: the fid's iounit when non-zero, else the client's msize minus P9_IOHDRSZ. */
391 size = fid->iounit ? fid->iounit : fid->clnt->msize - P9_IOHDRSZ;
393 n = p9_client_read(fid, data, udata, offset, count);
/* Go around again only while bytes are still wanted and the last read returned a full chunk. */
405 } while (count > 0 && n == size);
/* Thin wrapper: forwards to v9fs_fid_readn() using filp->private_data as the fid. */
414 * v9fs_file_readn - read from a file
415 * @filp: file pointer to read
416 * @data: data buffer to read data into
417 * @udata: user data buffer to read data into
418 * @count: size of buffer
419 * @offset: offset at which to read data
423 v9fs_file_readn(struct file *filp, char *data, char __user *udata, u32 count,
426 return v9fs_fid_readn(filp->private_data, data, udata, count, offset);
/*
 * .read handler of the non-cached file_operations tables; reads into the
 * user buffer @udata via the fid stored in filp->private_data.
 * NOTE(review): the condition choosing between the two read calls, the
 * offset update and the return are not visible in this listing.
 */
430 * v9fs_file_read - read from a file
431 * @filp: file pointer to read
432 * @udata: user data buffer to read data into
433 * @count: size of buffer
434 * @offset: offset at which to read data
439 v9fs_file_read(struct file *filp, char __user *udata, size_t count,
446 P9_DPRINTK(P9_DEBUG_VFS, "count %zu offset %lld\n", count, *offset);
447 fid = filp->private_data;
/* Chunk size: the fid's iounit when non-zero, else the client's msize minus P9_IOHDRSZ. */
449 size = fid->iounit ? fid->iounit : fid->clnt->msize - P9_IOHDRSZ;
/*
 * Two paths: the multi-request helper v9fs_file_readn(), or a single
 * p9_client_read(); presumably selected by comparing count with size.
 */
451 ret = v9fs_file_readn(filp, NULL, udata, count, *offset);
453 ret = p9_client_read(fid, NULL, udata, *offset, count);
/*
 * Write user data through @fid starting at *@offset, optionally invalidate
 * the page-cache range that was written, and grow the inode size if the
 * write went past it.
 * NOTE(review): the write loop head, the updates of total/count/*offset and
 * the return are not visible in this listing.
 */
462 v9fs_file_write_internal(struct inode *inode, struct p9_fid *fid,
463 const char __user *data, size_t count,
464 loff_t *offset, int invalidate)
469 struct p9_client *clnt;
470 loff_t origin = *offset;
471 unsigned long pg_start, pg_end;
473 P9_DPRINTK(P9_DEBUG_VFS, "data %p count %d offset %x\n", data,
474 (int)count, (int)*offset);
/* Each request continues where the previous one stopped (data+total at origin+total). */
478 n = p9_client_write(fid, NULL, data+total, origin+total, count);
/* If asked to and something was written, invalidate the pages spanning [origin, origin+total-1]. */
485 if (invalidate && (total > 0)) {
486 pg_start = origin >> PAGE_CACHE_SHIFT;
487 pg_end = (origin + total - 1) >> PAGE_CACHE_SHIFT;
488 if (inode->i_mapping && inode->i_mapping->nrpages)
489 invalidate_inode_pages2_range(inode->i_mapping,
/* If *offset is now past the cached size, account the added bytes and extend i_size. */
492 i_size = i_size_read(inode);
493 if (*offset > i_size) {
494 inode_add_bytes(inode, *offset - i_size);
495 i_size_write(inode, *offset);
/*
 * .write handler of the non-cached file_operations tables; also called by
 * v9fs_direct_write().
 * NOTE(review): error checks, the fid argument line, the offset update and
 * the return are not visible in this listing.
 */
505 * v9fs_file_write - write to a file
506 * @filp: file pointer to write
507 * @data: data buffer to write data from
508 * @count: size of buffer
509 * @offset: offset at which to write data
513 v9fs_file_write(struct file *filp, const char __user * data,
514 size_t count, loff_t *offset)
/* Work on a local copy of the position; generic_write_checks() may adjust it and count. */
517 loff_t origin = *offset;
520 retval = generic_write_checks(filp, &origin, &count, 0);
/* Guard against a count that would be negative when viewed as ssize_t. */
525 if ((ssize_t) count < 0)
/* Do the write with page-cache invalidation enabled (last argument 1). */
531 retval = v9fs_file_write_internal(filp->f_path.dentry->d_inode,
533 data, count, &origin, 1);
534 /* update offset on successful write */
/*
 * .fsync handler of the non-dotl file_operations tables.
 * Writes back dirty pages in [start, end], then, holding i_mutex, sends a
 * wstat built from a blanked struct p9_wstat on the file's fid.
 * NOTE(review): presumably the blank wstat is how the legacy protocol
 * requests a sync — confirm against the 9P specification. The error check
 * after the writeback and the return are not visible in this listing.
 */
542 static int v9fs_file_fsync(struct file *filp, loff_t start, loff_t end,
546 struct inode *inode = filp->f_mapping->host;
547 struct p9_wstat wstat;
550 retval = filemap_write_and_wait_range(inode->i_mapping, start, end);
554 mutex_lock(&inode->i_mutex);
555 P9_DPRINTK(P9_DEBUG_VFS, "filp %p datasync %x\n", filp, datasync);
557 fid = filp->private_data;
558 v9fs_blank_wstat(&wstat);
560 retval = p9_client_wstat(fid, &wstat);
561 mutex_unlock(&inode->i_mutex);
/*
 * .fsync handler of the *_dotl file_operations tables.
 * Writes back dirty pages in [start, end], then, holding i_mutex, calls
 * p9_client_fsync() on the file's fid, passing @datasync through.
 * NOTE(review): the error check after the writeback and the return are not
 * visible in this listing.
 */
566 int v9fs_file_fsync_dotl(struct file *filp, loff_t start, loff_t end,
570 struct inode *inode = filp->f_mapping->host;
573 retval = filemap_write_and_wait_range(inode->i_mapping, start, end);
577 mutex_lock(&inode->i_mutex);
578 P9_DPRINTK(P9_DEBUG_VFS, "v9fs_file_fsync_dotl: filp %p datasync %x\n",
581 fid = filp->private_data;
583 retval = p9_client_fsync(fid, datasync);
584 mutex_unlock(&inode->i_mutex);
/*
 * .mmap handler of the cached file_operations tables: performs the generic
 * mapping setup, then installs v9fs_file_vm_ops on the vma.
 * NOTE(review): presumably vm_ops is replaced only when generic_file_mmap()
 * succeeded — the check and the return are not visible in this listing.
 */
590 v9fs_file_mmap(struct file *file, struct vm_area_struct *vma)
594 retval = generic_file_mmap(file, vma);
596 vma->vm_ops = &v9fs_file_vm_ops;
/*
 * .page_mkwrite callback installed through v9fs_file_vm_ops.
 * NOTE(review): page locking/unlocking and the jump taken when the mapping
 * check fails are not visible in this listing.
 */
602 v9fs_vm_page_mkwrite(struct vm_area_struct *vma, struct vm_fault *vmf)
604 struct v9fs_inode *v9inode;
605 struct page *page = vmf->page;
606 struct file *filp = vma->vm_file;
607 struct inode *inode = filp->f_path.dentry->d_inode;
610 P9_DPRINTK(P9_DEBUG_VFS, "page %p fid %lx\n",
611 page, (unsigned long)filp->private_data);
613 v9inode = V9FS_I(inode);
614 /* make sure the cache has finished storing the page */
615 v9fs_fscache_wait_on_page_write(inode, page);
/* A writeback fid must already exist on the inode at this point. */
616 BUG_ON(!v9inode->writeback_fid);
/* Page no longer belongs to this inode's mapping: presumably the VM_FAULT_NOPAGE path. */
618 if (page->mapping != inode->i_mapping)
621 return VM_FAULT_LOCKED;
624 return VM_FAULT_NOPAGE;
/*
 * O_DIRECT read path used by v9fs_cached_file_read(): writes back dirty
 * page-cache data for the range, then reads via v9fs_file_read().
 * NOTE(review): the offset/offsetp setup, the use made of the inode size and
 * the end of the writeback range are not visible in this listing.
 */
628 v9fs_direct_read(struct file *filp, char __user *udata, size_t count,
633 struct address_space *mapping;
636 mapping = filp->f_mapping;
637 inode = mapping->host;
640 size = i_size_read(inode);
642 filemap_write_and_wait_range(mapping, offset,
645 return v9fs_file_read(filp, udata, count, offsetp);
/*
 * .read handler of the cached file_operations tables: O_DIRECT files take
 * v9fs_direct_read(), everything else goes through do_sync_read().
 */
649 * v9fs_cached_file_read - read from a file
650 * @filp: file pointer to read
651 * @udata: user data buffer to read data into
652 * @count: size of buffer
653 * @offset: offset at which to read data
657 v9fs_cached_file_read(struct file *filp, char __user *data, size_t count,
660 if (filp->f_flags & O_DIRECT)
661 return v9fs_direct_read(filp, data, count, offset);
662 return do_sync_read(filp, data, count, offset);
/*
 * O_DIRECT write path used by v9fs_cached_file_write(). Under i_mutex it
 * writes back and invalidates the affected page-cache range, then writes
 * via v9fs_file_write(); the last two visible lines drop the mutex and use
 * do_sync_write() instead (the buffered fallback).
 * NOTE(review): labels, gotos, error checks and the normal return are not
 * visible in this listing.
 */
666 v9fs_direct_write(struct file *filp, const char __user * data,
667 size_t count, loff_t *offsetp)
672 struct address_space *mapping;
675 mapping = filp->f_mapping;
676 inode = mapping->host;
680 mutex_lock(&inode->i_mutex);
681 retval = filemap_write_and_wait_range(mapping, offset,
686 * After a write we want buffered reads to be sure to go to disk to get
687 * the new data. We invalidate clean cached page from the region we're
688 * about to write. We do this *before* the write so that if we fail
689 * here we fall back to buffered write
691 if (mapping->nrpages) {
/* First and last page index touched by [offset, offset + count - 1]. */
692 pgoff_t pg_start = offset >> PAGE_CACHE_SHIFT;
693 pgoff_t pg_end = (offset + count - 1) >> PAGE_CACHE_SHIFT;
695 retval = invalidate_inode_pages2_range(mapping,
698 * If a page can not be invalidated, fall back
702 if (retval == -EBUSY)
707 retval = v9fs_file_write(filp, data, count, offsetp);
709 mutex_unlock(&inode->i_mutex);
713 mutex_unlock(&inode->i_mutex);
714 return do_sync_write(filp, data, count, offsetp);
/*
 * .write handler of the cached file_operations tables: O_DIRECT files take
 * v9fs_direct_write(), everything else goes through do_sync_write().
 */
718 * v9fs_cached_file_write - write to a file
719 * @filp: file pointer to write
720 * @data: data buffer to write data from
721 * @count: size of buffer
722 * @offset: offset at which to write data
726 v9fs_cached_file_write(struct file *filp, const char __user * data,
727 size_t count, loff_t *offset)
730 if (filp->f_flags & O_DIRECT)
731 return v9fs_direct_write(filp, data, count, offset);
732 return do_sync_write(filp, data, count, offset);
/*
 * VM operations installed by v9fs_file_mmap(): generic page-cache fault
 * handling plus the 9P page_mkwrite callback.
 */
735 static const struct vm_operations_struct v9fs_file_vm_ops = {
736 .fault = filemap_fault,
737 .page_mkwrite = v9fs_vm_page_mkwrite,
/*
 * File operations table using the cached read/write entry points, the
 * generic aio handlers, v9fs_file_mmap and the non-dotl lock/fsync handlers.
 * NOTE(review): presumably selected for cache-enabled, non-9P2000.L sessions;
 * the selection code is not in this file section.
 */
741 const struct file_operations v9fs_cached_file_operations = {
742 .llseek = generic_file_llseek,
743 .read = v9fs_cached_file_read,
744 .write = v9fs_cached_file_write,
745 .aio_read = generic_file_aio_read,
746 .aio_write = generic_file_aio_write,
747 .open = v9fs_file_open,
748 .release = v9fs_dir_release,
749 .lock = v9fs_file_lock,
750 .mmap = v9fs_file_mmap,
751 .fsync = v9fs_file_fsync,
/*
 * Same cached read/write/mmap entry points as v9fs_cached_file_operations,
 * but with the *_dotl lock and fsync handlers and an additional .flock.
 * NOTE(review): presumably selected for cache-enabled 9P2000.L sessions;
 * the selection code is not in this file section.
 */
754 const struct file_operations v9fs_cached_file_operations_dotl = {
755 .llseek = generic_file_llseek,
756 .read = v9fs_cached_file_read,
757 .write = v9fs_cached_file_write,
758 .aio_read = generic_file_aio_read,
759 .aio_write = generic_file_aio_write,
760 .open = v9fs_file_open,
761 .release = v9fs_dir_release,
762 .lock = v9fs_file_lock_dotl,
763 .flock = v9fs_file_flock_dotl,
764 .mmap = v9fs_file_mmap,
765 .fsync = v9fs_file_fsync_dotl,
/*
 * File operations table using the direct v9fs_file_read/v9fs_file_write
 * entry points, a read-only generic mmap and the non-dotl lock/fsync
 * handlers; no aio handlers are set.
 * NOTE(review): presumably selected for uncached, non-9P2000.L sessions;
 * the selection code is not in this file section.
 */
768 const struct file_operations v9fs_file_operations = {
769 .llseek = generic_file_llseek,
770 .read = v9fs_file_read,
771 .write = v9fs_file_write,
772 .open = v9fs_file_open,
773 .release = v9fs_dir_release,
774 .lock = v9fs_file_lock,
775 .mmap = generic_file_readonly_mmap,
776 .fsync = v9fs_file_fsync,
/*
 * Same direct read/write and read-only mmap as v9fs_file_operations, but
 * with the *_dotl lock and fsync handlers and an additional .flock.
 * NOTE(review): presumably selected for uncached 9P2000.L sessions; the
 * selection code is not in this file section.
 */
779 const struct file_operations v9fs_file_operations_dotl = {
780 .llseek = generic_file_llseek,
781 .read = v9fs_file_read,
782 .write = v9fs_file_write,
783 .open = v9fs_file_open,
784 .release = v9fs_dir_release,
785 .lock = v9fs_file_lock_dotl,
786 .flock = v9fs_file_flock_dotl,
787 .mmap = generic_file_readonly_mmap,
788 .fsync = v9fs_file_fsync_dotl,