mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-04 20:19:47 +08:00 
			
		
		
		
	 9687c85dfb
			
		
	
	
		9687c85dfb
		
	
	
	
	
		
			
			[ 612.157429] ================================================================== [ 612.158275] BUG: KASAN: use-after-free in process_one_work+0x90/0x9b0 [ 612.158801] Read of size 8 at addr ffff88810a31ca60 by task kworker/2:9/2382 [ 612.159611] CPU: 2 PID: 2382 Comm: kworker/2:9 Tainted: G OE 5.13.0-rc2+ #98 [ 612.159623] Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS 1.14.0-1.fc33 04/01/2014 [ 612.159640] Workqueue: 0x0 (deferredclose) [ 612.159669] Call Trace: [ 612.159685] dump_stack+0xbb/0x107 [ 612.159711] print_address_description.constprop.0+0x18/0x140 [ 612.159733] ? process_one_work+0x90/0x9b0 [ 612.159743] ? process_one_work+0x90/0x9b0 [ 612.159754] kasan_report.cold+0x7c/0xd8 [ 612.159778] ? lock_is_held_type+0x80/0x130 [ 612.159789] ? process_one_work+0x90/0x9b0 [ 612.159812] kasan_check_range+0x145/0x1a0 [ 612.159834] process_one_work+0x90/0x9b0 [ 612.159877] ? pwq_dec_nr_in_flight+0x110/0x110 [ 612.159914] ? spin_bug+0x90/0x90 [ 612.159967] worker_thread+0x3b6/0x6c0 [ 612.160023] ? process_one_work+0x9b0/0x9b0 [ 612.160038] kthread+0x1dc/0x200 [ 612.160051] ? kthread_create_worker_on_cpu+0xd0/0xd0 [ 612.160092] ret_from_fork+0x1f/0x30 [ 612.160399] Allocated by task 2358: [ 612.160757] kasan_save_stack+0x1b/0x40 [ 612.160768] __kasan_kmalloc+0x9b/0xd0 [ 612.160778] cifs_new_fileinfo+0xb0/0x960 [cifs] [ 612.161170] cifs_open+0xadf/0xf20 [cifs] [ 612.161421] do_dentry_open+0x2aa/0x6b0 [ 612.161432] path_openat+0xbd9/0xfa0 [ 612.161441] do_filp_open+0x11d/0x230 [ 612.161450] do_sys_openat2+0x115/0x240 [ 612.161460] __x64_sys_openat+0xce/0x140 When mod_delayed_work is called to modify the delay of pending work, it might return false and queue a new work when pending work is already scheduled or when try to grab pending work failed. So, Increase the reference count when new work is scheduled to avoid use-after-free. Signed-off-by: Rohith Surabattula <rohiths@microsoft.com> Signed-off-by: Steve French <stfrench@microsoft.com>
		
			
				
	
	
		
			5006 lines
		
	
	
		
			127 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			5006 lines
		
	
	
		
			127 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  *   fs/cifs/file.c
 | |
|  *
 | |
|  *   vfs operations that deal with files
 | |
|  *
 | |
|  *   Copyright (C) International Business Machines  Corp., 2002,2010
 | |
|  *   Author(s): Steve French (sfrench@us.ibm.com)
 | |
|  *              Jeremy Allison (jra@samba.org)
 | |
|  *
 | |
|  *   This library is free software; you can redistribute it and/or modify
 | |
|  *   it under the terms of the GNU Lesser General Public License as published
 | |
|  *   by the Free Software Foundation; either version 2.1 of the License, or
 | |
|  *   (at your option) any later version.
 | |
|  *
 | |
|  *   This library is distributed in the hope that it will be useful,
 | |
|  *   but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See
 | |
|  *   the GNU Lesser General Public License for more details.
 | |
|  *
 | |
|  *   You should have received a copy of the GNU Lesser General Public License
 | |
|  *   along with this library; if not, write to the Free Software
 | |
|  *   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 | |
|  */
 | |
| #include <linux/fs.h>
 | |
| #include <linux/backing-dev.h>
 | |
| #include <linux/stat.h>
 | |
| #include <linux/fcntl.h>
 | |
| #include <linux/pagemap.h>
 | |
| #include <linux/pagevec.h>
 | |
| #include <linux/writeback.h>
 | |
| #include <linux/task_io_accounting_ops.h>
 | |
| #include <linux/delay.h>
 | |
| #include <linux/mount.h>
 | |
| #include <linux/slab.h>
 | |
| #include <linux/swap.h>
 | |
| #include <linux/mm.h>
 | |
| #include <asm/div64.h>
 | |
| #include "cifsfs.h"
 | |
| #include "cifspdu.h"
 | |
| #include "cifsglob.h"
 | |
| #include "cifsproto.h"
 | |
| #include "cifs_unicode.h"
 | |
| #include "cifs_debug.h"
 | |
| #include "cifs_fs_sb.h"
 | |
| #include "fscache.h"
 | |
| #include "smbdirect.h"
 | |
| #include "fs_context.h"
 | |
| #include "cifs_ioctl.h"
 | |
| 
 | |
| static inline int cifs_convert_flags(unsigned int flags)
 | |
| {
 | |
| 	if ((flags & O_ACCMODE) == O_RDONLY)
 | |
| 		return GENERIC_READ;
 | |
| 	else if ((flags & O_ACCMODE) == O_WRONLY)
 | |
| 		return GENERIC_WRITE;
 | |
| 	else if ((flags & O_ACCMODE) == O_RDWR) {
 | |
| 		/* GENERIC_ALL is too much permission to request
 | |
| 		   can cause unnecessary access denied on create */
 | |
| 		/* return GENERIC_ALL; */
 | |
| 		return (GENERIC_READ | GENERIC_WRITE);
 | |
| 	}
 | |
| 
 | |
| 	return (READ_CONTROL | FILE_WRITE_ATTRIBUTES | FILE_READ_ATTRIBUTES |
 | |
| 		FILE_WRITE_EA | FILE_APPEND_DATA | FILE_WRITE_DATA |
 | |
| 		FILE_READ_DATA);
 | |
| }
 | |
| 
 | |
| static u32 cifs_posix_convert_flags(unsigned int flags)
 | |
| {
 | |
| 	u32 posix_flags = 0;
 | |
| 
 | |
| 	if ((flags & O_ACCMODE) == O_RDONLY)
 | |
| 		posix_flags = SMB_O_RDONLY;
 | |
| 	else if ((flags & O_ACCMODE) == O_WRONLY)
 | |
| 		posix_flags = SMB_O_WRONLY;
 | |
| 	else if ((flags & O_ACCMODE) == O_RDWR)
 | |
| 		posix_flags = SMB_O_RDWR;
 | |
| 
 | |
| 	if (flags & O_CREAT) {
 | |
| 		posix_flags |= SMB_O_CREAT;
 | |
| 		if (flags & O_EXCL)
 | |
| 			posix_flags |= SMB_O_EXCL;
 | |
| 	} else if (flags & O_EXCL)
 | |
| 		cifs_dbg(FYI, "Application %s pid %d has incorrectly set O_EXCL flag but not O_CREAT on file open. Ignoring O_EXCL\n",
 | |
| 			 current->comm, current->tgid);
 | |
| 
 | |
| 	if (flags & O_TRUNC)
 | |
| 		posix_flags |= SMB_O_TRUNC;
 | |
| 	/* be safe and imply O_SYNC for O_DSYNC */
 | |
| 	if (flags & O_DSYNC)
 | |
| 		posix_flags |= SMB_O_SYNC;
 | |
| 	if (flags & O_DIRECTORY)
 | |
| 		posix_flags |= SMB_O_DIRECTORY;
 | |
| 	if (flags & O_NOFOLLOW)
 | |
| 		posix_flags |= SMB_O_NOFOLLOW;
 | |
| 	if (flags & O_DIRECT)
 | |
| 		posix_flags |= SMB_O_DIRECT;
 | |
| 
 | |
| 	return posix_flags;
 | |
| }
 | |
| 
 | |
| static inline int cifs_get_disposition(unsigned int flags)
 | |
| {
 | |
| 	if ((flags & (O_CREAT | O_EXCL)) == (O_CREAT | O_EXCL))
 | |
| 		return FILE_CREATE;
 | |
| 	else if ((flags & (O_CREAT | O_TRUNC)) == (O_CREAT | O_TRUNC))
 | |
| 		return FILE_OVERWRITE_IF;
 | |
| 	else if ((flags & O_CREAT) == O_CREAT)
 | |
| 		return FILE_OPEN_IF;
 | |
| 	else if ((flags & O_TRUNC) == O_TRUNC)
 | |
| 		return FILE_OVERWRITE;
 | |
| 	else
 | |
| 		return FILE_OPEN;
 | |
| }
 | |
| 
 | |
| int cifs_posix_open(const char *full_path, struct inode **pinode,
 | |
| 			struct super_block *sb, int mode, unsigned int f_flags,
 | |
| 			__u32 *poplock, __u16 *pnetfid, unsigned int xid)
 | |
| {
 | |
| 	int rc;
 | |
| 	FILE_UNIX_BASIC_INFO *presp_data;
 | |
| 	__u32 posix_flags = 0;
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(sb);
 | |
| 	struct cifs_fattr fattr;
 | |
| 	struct tcon_link *tlink;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 
 | |
| 	cifs_dbg(FYI, "posix open %s\n", full_path);
 | |
| 
 | |
| 	presp_data = kzalloc(sizeof(FILE_UNIX_BASIC_INFO), GFP_KERNEL);
 | |
| 	if (presp_data == NULL)
 | |
| 		return -ENOMEM;
 | |
| 
 | |
| 	tlink = cifs_sb_tlink(cifs_sb);
 | |
| 	if (IS_ERR(tlink)) {
 | |
| 		rc = PTR_ERR(tlink);
 | |
| 		goto posix_open_ret;
 | |
| 	}
 | |
| 
 | |
| 	tcon = tlink_tcon(tlink);
 | |
| 	mode &= ~current_umask();
 | |
| 
 | |
| 	posix_flags = cifs_posix_convert_flags(f_flags);
 | |
| 	rc = CIFSPOSIXCreate(xid, tcon, posix_flags, mode, pnetfid, presp_data,
 | |
| 			     poplock, full_path, cifs_sb->local_nls,
 | |
| 			     cifs_remap(cifs_sb));
 | |
| 	cifs_put_tlink(tlink);
 | |
| 
 | |
| 	if (rc)
 | |
| 		goto posix_open_ret;
 | |
| 
 | |
| 	if (presp_data->Type == cpu_to_le32(-1))
 | |
| 		goto posix_open_ret; /* open ok, caller does qpathinfo */
 | |
| 
 | |
| 	if (!pinode)
 | |
| 		goto posix_open_ret; /* caller does not need info */
 | |
| 
 | |
| 	cifs_unix_basic_to_fattr(&fattr, presp_data, cifs_sb);
 | |
| 
 | |
| 	/* get new inode and set it up */
 | |
| 	if (*pinode == NULL) {
 | |
| 		cifs_fill_uniqueid(sb, &fattr);
 | |
| 		*pinode = cifs_iget(sb, &fattr);
 | |
| 		if (!*pinode) {
 | |
| 			rc = -ENOMEM;
 | |
| 			goto posix_open_ret;
 | |
| 		}
 | |
| 	} else {
 | |
| 		cifs_revalidate_mapping(*pinode);
 | |
| 		rc = cifs_fattr_to_inode(*pinode, &fattr);
 | |
| 	}
 | |
| 
 | |
| posix_open_ret:
 | |
| 	kfree(presp_data);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_nt_open(const char *full_path, struct inode *inode, struct cifs_sb_info *cifs_sb,
 | |
| 	     struct cifs_tcon *tcon, unsigned int f_flags, __u32 *oplock,
 | |
| 	     struct cifs_fid *fid, unsigned int xid)
 | |
| {
 | |
| 	int rc;
 | |
| 	int desired_access;
 | |
| 	int disposition;
 | |
| 	int create_options = CREATE_NOT_DIR;
 | |
| 	FILE_ALL_INFO *buf;
 | |
| 	struct TCP_Server_Info *server = tcon->ses->server;
 | |
| 	struct cifs_open_parms oparms;
 | |
| 
 | |
| 	if (!server->ops->open)
 | |
| 		return -ENOSYS;
 | |
| 
 | |
| 	desired_access = cifs_convert_flags(f_flags);
 | |
| 
 | |
| /*********************************************************************
 | |
|  *  open flag mapping table:
 | |
|  *
 | |
|  *	POSIX Flag            CIFS Disposition
 | |
|  *	----------            ----------------
 | |
|  *	O_CREAT               FILE_OPEN_IF
 | |
|  *	O_CREAT | O_EXCL      FILE_CREATE
 | |
|  *	O_CREAT | O_TRUNC     FILE_OVERWRITE_IF
 | |
|  *	O_TRUNC               FILE_OVERWRITE
 | |
|  *	none of the above     FILE_OPEN
 | |
|  *
 | |
|  *	Note that there is not a direct match between disposition
 | |
|  *	FILE_SUPERSEDE (ie create whether or not file exists although
 | |
|  *	O_CREAT | O_TRUNC is similar but truncates the existing
 | |
|  *	file rather than creating a new file as FILE_SUPERSEDE does
 | |
|  *	(which uses the attributes / metadata passed in on open call)
 | |
|  *?
 | |
|  *?  O_SYNC is a reasonable match to CIFS writethrough flag
 | |
|  *?  and the read write flags match reasonably.  O_LARGEFILE
 | |
|  *?  is irrelevant because largefile support is always used
 | |
|  *?  by this client. Flags O_APPEND, O_DIRECT, O_DIRECTORY,
 | |
|  *	 O_FASYNC, O_NOFOLLOW, O_NONBLOCK need further investigation
 | |
|  *********************************************************************/
 | |
| 
 | |
| 	disposition = cifs_get_disposition(f_flags);
 | |
| 
 | |
| 	/* BB pass O_SYNC flag through on file attributes .. BB */
 | |
| 
 | |
| 	buf = kmalloc(sizeof(FILE_ALL_INFO), GFP_KERNEL);
 | |
| 	if (!buf)
 | |
| 		return -ENOMEM;
 | |
| 
 | |
| 	/* O_SYNC also has bit for O_DSYNC so following check picks up either */
 | |
| 	if (f_flags & O_SYNC)
 | |
| 		create_options |= CREATE_WRITE_THROUGH;
 | |
| 
 | |
| 	if (f_flags & O_DIRECT)
 | |
| 		create_options |= CREATE_NO_BUFFER;
 | |
| 
 | |
| 	oparms.tcon = tcon;
 | |
| 	oparms.cifs_sb = cifs_sb;
 | |
| 	oparms.desired_access = desired_access;
 | |
| 	oparms.create_options = cifs_create_options(cifs_sb, create_options);
 | |
| 	oparms.disposition = disposition;
 | |
| 	oparms.path = full_path;
 | |
| 	oparms.fid = fid;
 | |
| 	oparms.reconnect = false;
 | |
| 
 | |
| 	rc = server->ops->open(xid, &oparms, oplock, buf);
 | |
| 
 | |
| 	if (rc)
 | |
| 		goto out;
 | |
| 
 | |
| 	/* TODO: Add support for calling posix query info but with passing in fid */
 | |
| 	if (tcon->unix_ext)
 | |
| 		rc = cifs_get_inode_info_unix(&inode, full_path, inode->i_sb,
 | |
| 					      xid);
 | |
| 	else
 | |
| 		rc = cifs_get_inode_info(&inode, full_path, buf, inode->i_sb,
 | |
| 					 xid, fid);
 | |
| 
 | |
| 	if (rc) {
 | |
| 		server->ops->close(xid, tcon, fid);
 | |
| 		if (rc == -ESTALE)
 | |
| 			rc = -EOPENSTALE;
 | |
| 	}
 | |
| 
 | |
| out:
 | |
| 	kfree(buf);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static bool
 | |
| cifs_has_mand_locks(struct cifsInodeInfo *cinode)
 | |
| {
 | |
| 	struct cifs_fid_locks *cur;
 | |
| 	bool has_locks = false;
 | |
| 
 | |
| 	down_read(&cinode->lock_sem);
 | |
| 	list_for_each_entry(cur, &cinode->llist, llist) {
 | |
| 		if (!list_empty(&cur->locks)) {
 | |
| 			has_locks = true;
 | |
| 			break;
 | |
| 		}
 | |
| 	}
 | |
| 	up_read(&cinode->lock_sem);
 | |
| 	return has_locks;
 | |
| }
 | |
| 
 | |
/*
 * Take @sem for writing by polling: try the lock and, while it is not
 * available, sleep 10 ms and try again.
 */
void
cifs_down_write(struct rw_semaphore *sem)
{
	for (;;) {
		if (down_write_trylock(sem))
			return;
		msleep(10);
	}
}
 | |
| 
 | |
| static void cifsFileInfo_put_work(struct work_struct *work);
 | |
| 
 | |
| struct cifsFileInfo *
 | |
| cifs_new_fileinfo(struct cifs_fid *fid, struct file *file,
 | |
| 		  struct tcon_link *tlink, __u32 oplock)
 | |
| {
 | |
| 	struct dentry *dentry = file_dentry(file);
 | |
| 	struct inode *inode = d_inode(dentry);
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(inode);
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	struct cifs_fid_locks *fdlocks;
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(tlink);
 | |
| 	struct TCP_Server_Info *server = tcon->ses->server;
 | |
| 
 | |
| 	cfile = kzalloc(sizeof(struct cifsFileInfo), GFP_KERNEL);
 | |
| 	if (cfile == NULL)
 | |
| 		return cfile;
 | |
| 
 | |
| 	fdlocks = kzalloc(sizeof(struct cifs_fid_locks), GFP_KERNEL);
 | |
| 	if (!fdlocks) {
 | |
| 		kfree(cfile);
 | |
| 		return NULL;
 | |
| 	}
 | |
| 
 | |
| 	INIT_LIST_HEAD(&fdlocks->locks);
 | |
| 	fdlocks->cfile = cfile;
 | |
| 	cfile->llist = fdlocks;
 | |
| 
 | |
| 	cfile->count = 1;
 | |
| 	cfile->pid = current->tgid;
 | |
| 	cfile->uid = current_fsuid();
 | |
| 	cfile->dentry = dget(dentry);
 | |
| 	cfile->f_flags = file->f_flags;
 | |
| 	cfile->invalidHandle = false;
 | |
| 	cfile->deferred_close_scheduled = false;
 | |
| 	cfile->tlink = cifs_get_tlink(tlink);
 | |
| 	INIT_WORK(&cfile->oplock_break, cifs_oplock_break);
 | |
| 	INIT_WORK(&cfile->put, cifsFileInfo_put_work);
 | |
| 	INIT_DELAYED_WORK(&cfile->deferred, smb2_deferred_work_close);
 | |
| 	mutex_init(&cfile->fh_mutex);
 | |
| 	spin_lock_init(&cfile->file_info_lock);
 | |
| 
 | |
| 	cifs_sb_active(inode->i_sb);
 | |
| 
 | |
| 	/*
 | |
| 	 * If the server returned a read oplock and we have mandatory brlocks,
 | |
| 	 * set oplock level to None.
 | |
| 	 */
 | |
| 	if (server->ops->is_read_op(oplock) && cifs_has_mand_locks(cinode)) {
 | |
| 		cifs_dbg(FYI, "Reset oplock val from read to None due to mand locks\n");
 | |
| 		oplock = 0;
 | |
| 	}
 | |
| 
 | |
| 	cifs_down_write(&cinode->lock_sem);
 | |
| 	list_add(&fdlocks->llist, &cinode->llist);
 | |
| 	up_write(&cinode->lock_sem);
 | |
| 
 | |
| 	spin_lock(&tcon->open_file_lock);
 | |
| 	if (fid->pending_open->oplock != CIFS_OPLOCK_NO_CHANGE && oplock)
 | |
| 		oplock = fid->pending_open->oplock;
 | |
| 	list_del(&fid->pending_open->olist);
 | |
| 
 | |
| 	fid->purge_cache = false;
 | |
| 	server->ops->set_fid(cfile, fid, oplock);
 | |
| 
 | |
| 	list_add(&cfile->tlist, &tcon->openFileList);
 | |
| 	atomic_inc(&tcon->num_local_opens);
 | |
| 
 | |
| 	/* if readable file instance put first in list*/
 | |
| 	spin_lock(&cinode->open_file_lock);
 | |
| 	if (file->f_mode & FMODE_READ)
 | |
| 		list_add(&cfile->flist, &cinode->openFileList);
 | |
| 	else
 | |
| 		list_add_tail(&cfile->flist, &cinode->openFileList);
 | |
| 	spin_unlock(&cinode->open_file_lock);
 | |
| 	spin_unlock(&tcon->open_file_lock);
 | |
| 
 | |
| 	if (fid->purge_cache)
 | |
| 		cifs_zap_mapping(inode);
 | |
| 
 | |
| 	file->private_data = cfile;
 | |
| 	return cfile;
 | |
| }
 | |
| 
 | |
| struct cifsFileInfo *
 | |
| cifsFileInfo_get(struct cifsFileInfo *cifs_file)
 | |
| {
 | |
| 	spin_lock(&cifs_file->file_info_lock);
 | |
| 	cifsFileInfo_get_locked(cifs_file);
 | |
| 	spin_unlock(&cifs_file->file_info_lock);
 | |
| 	return cifs_file;
 | |
| }
 | |
| 
 | |
| static void cifsFileInfo_put_final(struct cifsFileInfo *cifs_file)
 | |
| {
 | |
| 	struct inode *inode = d_inode(cifs_file->dentry);
 | |
| 	struct cifsInodeInfo *cifsi = CIFS_I(inode);
 | |
| 	struct cifsLockInfo *li, *tmp;
 | |
| 	struct super_block *sb = inode->i_sb;
 | |
| 
 | |
| 	/*
 | |
| 	 * Delete any outstanding lock records. We'll lose them when the file
 | |
| 	 * is closed anyway.
 | |
| 	 */
 | |
| 	cifs_down_write(&cifsi->lock_sem);
 | |
| 	list_for_each_entry_safe(li, tmp, &cifs_file->llist->locks, llist) {
 | |
| 		list_del(&li->llist);
 | |
| 		cifs_del_lock_waiters(li);
 | |
| 		kfree(li);
 | |
| 	}
 | |
| 	list_del(&cifs_file->llist->llist);
 | |
| 	kfree(cifs_file->llist);
 | |
| 	up_write(&cifsi->lock_sem);
 | |
| 
 | |
| 	cifs_put_tlink(cifs_file->tlink);
 | |
| 	dput(cifs_file->dentry);
 | |
| 	cifs_sb_deactive(sb);
 | |
| 	kfree(cifs_file);
 | |
| }
 | |
| 
 | |
| static void cifsFileInfo_put_work(struct work_struct *work)
 | |
| {
 | |
| 	struct cifsFileInfo *cifs_file = container_of(work,
 | |
| 			struct cifsFileInfo, put);
 | |
| 
 | |
| 	cifsFileInfo_put_final(cifs_file);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * cifsFileInfo_put - release a reference of file priv data
 | |
|  *
 | |
|  * Always potentially wait for oplock handler. See _cifsFileInfo_put().
 | |
|  *
 | |
|  * @cifs_file:	cifs/smb3 specific info (eg refcounts) for an open file
 | |
|  */
 | |
| void cifsFileInfo_put(struct cifsFileInfo *cifs_file)
 | |
| {
 | |
| 	_cifsFileInfo_put(cifs_file, true, true);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * _cifsFileInfo_put - release a reference of file priv data
 | |
|  *
 | |
|  * This may involve closing the filehandle @cifs_file out on the
 | |
|  * server. Must be called without holding tcon->open_file_lock,
 | |
|  * cinode->open_file_lock and cifs_file->file_info_lock.
 | |
|  *
 | |
|  * If @wait_for_oplock_handler is true and we are releasing the last
 | |
|  * reference, wait for any running oplock break handler of the file
 | |
|  * and cancel any pending one.
 | |
|  *
 | |
|  * @cifs_file:	cifs/smb3 specific info (eg refcounts) for an open file
 | |
|  * @wait_oplock_handler: must be false if called from oplock_break_handler
 | |
|  * @offload:	not offloaded on close and oplock breaks
 | |
|  *
 | |
|  */
 | |
| void _cifsFileInfo_put(struct cifsFileInfo *cifs_file,
 | |
| 		       bool wait_oplock_handler, bool offload)
 | |
| {
 | |
| 	struct inode *inode = d_inode(cifs_file->dentry);
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cifs_file->tlink);
 | |
| 	struct TCP_Server_Info *server = tcon->ses->server;
 | |
| 	struct cifsInodeInfo *cifsi = CIFS_I(inode);
 | |
| 	struct super_block *sb = inode->i_sb;
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(sb);
 | |
| 	struct cifs_fid fid;
 | |
| 	struct cifs_pending_open open;
 | |
| 	bool oplock_break_cancelled;
 | |
| 
 | |
| 	spin_lock(&tcon->open_file_lock);
 | |
| 	spin_lock(&cifsi->open_file_lock);
 | |
| 	spin_lock(&cifs_file->file_info_lock);
 | |
| 	if (--cifs_file->count > 0) {
 | |
| 		spin_unlock(&cifs_file->file_info_lock);
 | |
| 		spin_unlock(&cifsi->open_file_lock);
 | |
| 		spin_unlock(&tcon->open_file_lock);
 | |
| 		return;
 | |
| 	}
 | |
| 	spin_unlock(&cifs_file->file_info_lock);
 | |
| 
 | |
| 	if (server->ops->get_lease_key)
 | |
| 		server->ops->get_lease_key(inode, &fid);
 | |
| 
 | |
| 	/* store open in pending opens to make sure we don't miss lease break */
 | |
| 	cifs_add_pending_open_locked(&fid, cifs_file->tlink, &open);
 | |
| 
 | |
| 	/* remove it from the lists */
 | |
| 	list_del(&cifs_file->flist);
 | |
| 	list_del(&cifs_file->tlist);
 | |
| 	atomic_dec(&tcon->num_local_opens);
 | |
| 
 | |
| 	if (list_empty(&cifsi->openFileList)) {
 | |
| 		cifs_dbg(FYI, "closing last open instance for inode %p\n",
 | |
| 			 d_inode(cifs_file->dentry));
 | |
| 		/*
 | |
| 		 * In strict cache mode we need invalidate mapping on the last
 | |
| 		 * close  because it may cause a error when we open this file
 | |
| 		 * again and get at least level II oplock.
 | |
| 		 */
 | |
| 		if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_STRICT_IO)
 | |
| 			set_bit(CIFS_INO_INVALID_MAPPING, &cifsi->flags);
 | |
| 		cifs_set_oplock_level(cifsi, 0);
 | |
| 	}
 | |
| 
 | |
| 	spin_unlock(&cifsi->open_file_lock);
 | |
| 	spin_unlock(&tcon->open_file_lock);
 | |
| 
 | |
| 	oplock_break_cancelled = wait_oplock_handler ?
 | |
| 		cancel_work_sync(&cifs_file->oplock_break) : false;
 | |
| 
 | |
| 	if (!tcon->need_reconnect && !cifs_file->invalidHandle) {
 | |
| 		struct TCP_Server_Info *server = tcon->ses->server;
 | |
| 		unsigned int xid;
 | |
| 
 | |
| 		xid = get_xid();
 | |
| 		if (server->ops->close_getattr)
 | |
| 			server->ops->close_getattr(xid, tcon, cifs_file);
 | |
| 		else if (server->ops->close)
 | |
| 			server->ops->close(xid, tcon, &cifs_file->fid);
 | |
| 		_free_xid(xid);
 | |
| 	}
 | |
| 
 | |
| 	if (oplock_break_cancelled)
 | |
| 		cifs_done_oplock_break(cifsi);
 | |
| 
 | |
| 	cifs_del_pending_open(&open);
 | |
| 
 | |
| 	if (offload)
 | |
| 		queue_work(fileinfo_put_wq, &cifs_file->put);
 | |
| 	else
 | |
| 		cifsFileInfo_put_final(cifs_file);
 | |
| }
 | |
| 
 | |
| int cifs_open(struct inode *inode, struct file *file)
 | |
| 
 | |
| {
 | |
| 	int rc = -EACCES;
 | |
| 	unsigned int xid;
 | |
| 	__u32 oplock;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct tcon_link *tlink;
 | |
| 	struct cifsFileInfo *cfile = NULL;
 | |
| 	void *page;
 | |
| 	const char *full_path;
 | |
| 	bool posix_open_ok = false;
 | |
| 	struct cifs_fid fid;
 | |
| 	struct cifs_pending_open open;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	cifs_sb = CIFS_SB(inode->i_sb);
 | |
| 	if (unlikely(cifs_forced_shutdown(cifs_sb))) {
 | |
| 		free_xid(xid);
 | |
| 		return -EIO;
 | |
| 	}
 | |
| 
 | |
| 	tlink = cifs_sb_tlink(cifs_sb);
 | |
| 	if (IS_ERR(tlink)) {
 | |
| 		free_xid(xid);
 | |
| 		return PTR_ERR(tlink);
 | |
| 	}
 | |
| 	tcon = tlink_tcon(tlink);
 | |
| 	server = tcon->ses->server;
 | |
| 
 | |
| 	page = alloc_dentry_path();
 | |
| 	full_path = build_path_from_dentry(file_dentry(file), page);
 | |
| 	if (IS_ERR(full_path)) {
 | |
| 		rc = PTR_ERR(full_path);
 | |
| 		goto out;
 | |
| 	}
 | |
| 
 | |
| 	cifs_dbg(FYI, "inode = 0x%p file flags are 0x%x for %s\n",
 | |
| 		 inode, file->f_flags, full_path);
 | |
| 
 | |
| 	if (file->f_flags & O_DIRECT &&
 | |
| 	    cifs_sb->mnt_cifs_flags & CIFS_MOUNT_STRICT_IO) {
 | |
| 		if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NO_BRL)
 | |
| 			file->f_op = &cifs_file_direct_nobrl_ops;
 | |
| 		else
 | |
| 			file->f_op = &cifs_file_direct_ops;
 | |
| 	}
 | |
| 
 | |
| 	/* Get the cached handle as SMB2 close is deferred */
 | |
| 	rc = cifs_get_readable_path(tcon, full_path, &cfile);
 | |
| 	if (rc == 0) {
 | |
| 		if (file->f_flags == cfile->f_flags) {
 | |
| 			file->private_data = cfile;
 | |
| 			spin_lock(&CIFS_I(inode)->deferred_lock);
 | |
| 			cifs_del_deferred_close(cfile);
 | |
| 			spin_unlock(&CIFS_I(inode)->deferred_lock);
 | |
| 			goto out;
 | |
| 		} else {
 | |
| 			_cifsFileInfo_put(cfile, true, false);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (server->oplocks)
 | |
| 		oplock = REQ_OPLOCK;
 | |
| 	else
 | |
| 		oplock = 0;
 | |
| 
 | |
| 	if (!tcon->broken_posix_open && tcon->unix_ext &&
 | |
| 	    cap_unix(tcon->ses) && (CIFS_UNIX_POSIX_PATH_OPS_CAP &
 | |
| 				le64_to_cpu(tcon->fsUnixInfo.Capability))) {
 | |
| 		/* can not refresh inode info since size could be stale */
 | |
| 		rc = cifs_posix_open(full_path, &inode, inode->i_sb,
 | |
| 				cifs_sb->ctx->file_mode /* ignored */,
 | |
| 				file->f_flags, &oplock, &fid.netfid, xid);
 | |
| 		if (rc == 0) {
 | |
| 			cifs_dbg(FYI, "posix open succeeded\n");
 | |
| 			posix_open_ok = true;
 | |
| 		} else if ((rc == -EINVAL) || (rc == -EOPNOTSUPP)) {
 | |
| 			if (tcon->ses->serverNOS)
 | |
| 				cifs_dbg(VFS, "server %s of type %s returned unexpected error on SMB posix open, disabling posix open support. Check if server update available.\n",
 | |
| 					 tcon->ses->ip_addr,
 | |
| 					 tcon->ses->serverNOS);
 | |
| 			tcon->broken_posix_open = true;
 | |
| 		} else if ((rc != -EIO) && (rc != -EREMOTE) &&
 | |
| 			 (rc != -EOPNOTSUPP)) /* path not found or net err */
 | |
| 			goto out;
 | |
| 		/*
 | |
| 		 * Else fallthrough to retry open the old way on network i/o
 | |
| 		 * or DFS errors.
 | |
| 		 */
 | |
| 	}
 | |
| 
 | |
| 	if (server->ops->get_lease_key)
 | |
| 		server->ops->get_lease_key(inode, &fid);
 | |
| 
 | |
| 	cifs_add_pending_open(&fid, tlink, &open);
 | |
| 
 | |
| 	if (!posix_open_ok) {
 | |
| 		if (server->ops->get_lease_key)
 | |
| 			server->ops->get_lease_key(inode, &fid);
 | |
| 
 | |
| 		rc = cifs_nt_open(full_path, inode, cifs_sb, tcon,
 | |
| 				  file->f_flags, &oplock, &fid, xid);
 | |
| 		if (rc) {
 | |
| 			cifs_del_pending_open(&open);
 | |
| 			goto out;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	cfile = cifs_new_fileinfo(&fid, file, tlink, oplock);
 | |
| 	if (cfile == NULL) {
 | |
| 		if (server->ops->close)
 | |
| 			server->ops->close(xid, tcon, &fid);
 | |
| 		cifs_del_pending_open(&open);
 | |
| 		rc = -ENOMEM;
 | |
| 		goto out;
 | |
| 	}
 | |
| 
 | |
| 	cifs_fscache_set_inode_cookie(inode, file);
 | |
| 
 | |
| 	if ((oplock & CIFS_CREATE_ACTION) && !posix_open_ok && tcon->unix_ext) {
 | |
| 		/*
 | |
| 		 * Time to set mode which we can not set earlier due to
 | |
| 		 * problems creating new read-only files.
 | |
| 		 */
 | |
| 		struct cifs_unix_set_info_args args = {
 | |
| 			.mode	= inode->i_mode,
 | |
| 			.uid	= INVALID_UID, /* no change */
 | |
| 			.gid	= INVALID_GID, /* no change */
 | |
| 			.ctime	= NO_CHANGE_64,
 | |
| 			.atime	= NO_CHANGE_64,
 | |
| 			.mtime	= NO_CHANGE_64,
 | |
| 			.device	= 0,
 | |
| 		};
 | |
| 		CIFSSMBUnixSetFileInfo(xid, tcon, &args, fid.netfid,
 | |
| 				       cfile->pid);
 | |
| 	}
 | |
| 
 | |
| out:
 | |
| 	free_dentry_path(page);
 | |
| 	free_xid(xid);
 | |
| 	cifs_put_tlink(tlink);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int cifs_push_posix_locks(struct cifsFileInfo *cfile);
 | |
| 
 | |
| /*
 | |
|  * Try to reacquire byte range locks that were released when session
 | |
|  * to server was lost.
 | |
|  */
 | |
| static int
 | |
| cifs_relock_file(struct cifsFileInfo *cfile)
 | |
| {
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	int rc = 0;
 | |
| 
 | |
| 	down_read_nested(&cinode->lock_sem, SINGLE_DEPTH_NESTING);
 | |
| 	if (cinode->can_cache_brlcks) {
 | |
| 		/* can cache locks - no need to relock */
 | |
| 		up_read(&cinode->lock_sem);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	if (cap_unix(tcon->ses) &&
 | |
| 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
 | |
| 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
 | |
| 		rc = cifs_push_posix_locks(cfile);
 | |
| 	else
 | |
| 		rc = tcon->ses->server->ops->push_mand_locks(cfile);
 | |
| 
 | |
| 	up_read(&cinode->lock_sem);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_reopen_file(struct cifsFileInfo *cfile, bool can_flush)
 | |
| {
 | |
| 	int rc = -EACCES;
 | |
| 	unsigned int xid;
 | |
| 	__u32 oplock;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	struct cifsInodeInfo *cinode;
 | |
| 	struct inode *inode;
 | |
| 	void *page;
 | |
| 	const char *full_path;
 | |
| 	int desired_access;
 | |
| 	int disposition = FILE_OPEN;
 | |
| 	int create_options = CREATE_NOT_DIR;
 | |
| 	struct cifs_open_parms oparms;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 	mutex_lock(&cfile->fh_mutex);
 | |
| 	if (!cfile->invalidHandle) {
 | |
| 		mutex_unlock(&cfile->fh_mutex);
 | |
| 		free_xid(xid);
 | |
| 		return 0;
 | |
| 	}
 | |
| 
 | |
| 	inode = d_inode(cfile->dentry);
 | |
| 	cifs_sb = CIFS_SB(inode->i_sb);
 | |
| 	tcon = tlink_tcon(cfile->tlink);
 | |
| 	server = tcon->ses->server;
 | |
| 
 | |
| 	/*
 | |
| 	 * Can not grab rename sem here because various ops, including those
 | |
| 	 * that already have the rename sem can end up causing writepage to get
 | |
| 	 * called and if the server was down that means we end up here, and we
 | |
| 	 * can never tell if the caller already has the rename_sem.
 | |
| 	 */
 | |
| 	page = alloc_dentry_path();
 | |
| 	full_path = build_path_from_dentry(cfile->dentry, page);
 | |
| 	if (IS_ERR(full_path)) {
 | |
| 		mutex_unlock(&cfile->fh_mutex);
 | |
| 		free_dentry_path(page);
 | |
| 		free_xid(xid);
 | |
| 		return PTR_ERR(full_path);
 | |
| 	}
 | |
| 
 | |
| 	cifs_dbg(FYI, "inode = 0x%p file flags 0x%x for %s\n",
 | |
| 		 inode, cfile->f_flags, full_path);
 | |
| 
 | |
| 	if (tcon->ses->server->oplocks)
 | |
| 		oplock = REQ_OPLOCK;
 | |
| 	else
 | |
| 		oplock = 0;
 | |
| 
 | |
| 	if (tcon->unix_ext && cap_unix(tcon->ses) &&
 | |
| 	    (CIFS_UNIX_POSIX_PATH_OPS_CAP &
 | |
| 				le64_to_cpu(tcon->fsUnixInfo.Capability))) {
 | |
| 		/*
 | |
| 		 * O_CREAT, O_EXCL and O_TRUNC already had their effect on the
 | |
| 		 * original open. Must mask them off for a reopen.
 | |
| 		 */
 | |
| 		unsigned int oflags = cfile->f_flags &
 | |
| 						~(O_CREAT | O_EXCL | O_TRUNC);
 | |
| 
 | |
| 		rc = cifs_posix_open(full_path, NULL, inode->i_sb,
 | |
| 				     cifs_sb->ctx->file_mode /* ignored */,
 | |
| 				     oflags, &oplock, &cfile->fid.netfid, xid);
 | |
| 		if (rc == 0) {
 | |
| 			cifs_dbg(FYI, "posix reopen succeeded\n");
 | |
| 			oparms.reconnect = true;
 | |
| 			goto reopen_success;
 | |
| 		}
 | |
| 		/*
 | |
| 		 * fallthrough to retry open the old way on errors, especially
 | |
| 		 * in the reconnect path it is important to retry hard
 | |
| 		 */
 | |
| 	}
 | |
| 
 | |
| 	desired_access = cifs_convert_flags(cfile->f_flags);
 | |
| 
 | |
| 	/* O_SYNC also has bit for O_DSYNC so following check picks up either */
 | |
| 	if (cfile->f_flags & O_SYNC)
 | |
| 		create_options |= CREATE_WRITE_THROUGH;
 | |
| 
 | |
| 	if (cfile->f_flags & O_DIRECT)
 | |
| 		create_options |= CREATE_NO_BUFFER;
 | |
| 
 | |
| 	if (server->ops->get_lease_key)
 | |
| 		server->ops->get_lease_key(inode, &cfile->fid);
 | |
| 
 | |
| 	oparms.tcon = tcon;
 | |
| 	oparms.cifs_sb = cifs_sb;
 | |
| 	oparms.desired_access = desired_access;
 | |
| 	oparms.create_options = cifs_create_options(cifs_sb, create_options);
 | |
| 	oparms.disposition = disposition;
 | |
| 	oparms.path = full_path;
 | |
| 	oparms.fid = &cfile->fid;
 | |
| 	oparms.reconnect = true;
 | |
| 
 | |
| 	/*
 | |
| 	 * Can not refresh inode by passing in file_info buf to be returned by
 | |
| 	 * ops->open and then calling get_inode_info with returned buf since
 | |
| 	 * file might have write behind data that needs to be flushed and server
 | |
| 	 * version of file size can be stale. If we knew for sure that inode was
 | |
| 	 * not dirty locally we could do this.
 | |
| 	 */
 | |
| 	rc = server->ops->open(xid, &oparms, &oplock, NULL);
 | |
| 	if (rc == -ENOENT && oparms.reconnect == false) {
 | |
| 		/* durable handle timeout is expired - open the file again */
 | |
| 		rc = server->ops->open(xid, &oparms, &oplock, NULL);
 | |
| 		/* indicate that we need to relock the file */
 | |
| 		oparms.reconnect = true;
 | |
| 	}
 | |
| 
 | |
| 	if (rc) {
 | |
| 		mutex_unlock(&cfile->fh_mutex);
 | |
| 		cifs_dbg(FYI, "cifs_reopen returned 0x%x\n", rc);
 | |
| 		cifs_dbg(FYI, "oplock: %d\n", oplock);
 | |
| 		goto reopen_error_exit;
 | |
| 	}
 | |
| 
 | |
| reopen_success:
 | |
| 	cfile->invalidHandle = false;
 | |
| 	mutex_unlock(&cfile->fh_mutex);
 | |
| 	cinode = CIFS_I(inode);
 | |
| 
 | |
| 	if (can_flush) {
 | |
| 		rc = filemap_write_and_wait(inode->i_mapping);
 | |
| 		if (!is_interrupt_error(rc))
 | |
| 			mapping_set_error(inode->i_mapping, rc);
 | |
| 
 | |
| 		if (tcon->posix_extensions)
 | |
| 			rc = smb311_posix_get_inode_info(&inode, full_path, inode->i_sb, xid);
 | |
| 		else if (tcon->unix_ext)
 | |
| 			rc = cifs_get_inode_info_unix(&inode, full_path,
 | |
| 						      inode->i_sb, xid);
 | |
| 		else
 | |
| 			rc = cifs_get_inode_info(&inode, full_path, NULL,
 | |
| 						 inode->i_sb, xid, NULL);
 | |
| 	}
 | |
| 	/*
 | |
| 	 * Else we are writing out data to server already and could deadlock if
 | |
| 	 * we tried to flush data, and since we do not know if we have data that
 | |
| 	 * would invalidate the current end of file on the server we can not go
 | |
| 	 * to the server to get the new inode info.
 | |
| 	 */
 | |
| 
 | |
| 	/*
 | |
| 	 * If the server returned a read oplock and we have mandatory brlocks,
 | |
| 	 * set oplock level to None.
 | |
| 	 */
 | |
| 	if (server->ops->is_read_op(oplock) && cifs_has_mand_locks(cinode)) {
 | |
| 		cifs_dbg(FYI, "Reset oplock val from read to None due to mand locks\n");
 | |
| 		oplock = 0;
 | |
| 	}
 | |
| 
 | |
| 	server->ops->set_fid(cfile, &cfile->fid, oplock);
 | |
| 	if (oparms.reconnect)
 | |
| 		cifs_relock_file(cfile);
 | |
| 
 | |
| reopen_error_exit:
 | |
| 	free_dentry_path(page);
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| void smb2_deferred_work_close(struct work_struct *work)
 | |
| {
 | |
| 	struct cifsFileInfo *cfile = container_of(work,
 | |
| 			struct cifsFileInfo, deferred.work);
 | |
| 
 | |
| 	spin_lock(&CIFS_I(d_inode(cfile->dentry))->deferred_lock);
 | |
| 	cifs_del_deferred_close(cfile);
 | |
| 	cfile->deferred_close_scheduled = false;
 | |
| 	spin_unlock(&CIFS_I(d_inode(cfile->dentry))->deferred_lock);
 | |
| 	_cifsFileInfo_put(cfile, true, false);
 | |
| }
 | |
| 
 | |
| int cifs_close(struct inode *inode, struct file *file)
 | |
| {
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(inode);
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
 | |
| 	struct cifs_deferred_close *dclose;
 | |
| 
 | |
| 	if (file->private_data != NULL) {
 | |
| 		cfile = file->private_data;
 | |
| 		file->private_data = NULL;
 | |
| 		dclose = kmalloc(sizeof(struct cifs_deferred_close), GFP_KERNEL);
 | |
| 		if ((cinode->oplock == CIFS_CACHE_RHW_FLG) &&
 | |
| 		    cinode->lease_granted &&
 | |
| 		    dclose) {
 | |
| 			if (test_bit(CIFS_INO_MODIFIED_ATTR, &cinode->flags))
 | |
| 				inode->i_ctime = inode->i_mtime = current_time(inode);
 | |
| 			spin_lock(&cinode->deferred_lock);
 | |
| 			cifs_add_deferred_close(cfile, dclose);
 | |
| 			if (cfile->deferred_close_scheduled &&
 | |
| 			    delayed_work_pending(&cfile->deferred)) {
 | |
| 				/*
 | |
| 				 * If there is no pending work, mod_delayed_work queues new work.
 | |
| 				 * So, Increase the ref count to avoid use-after-free.
 | |
| 				 */
 | |
| 				if (!mod_delayed_work(deferredclose_wq,
 | |
| 						&cfile->deferred, cifs_sb->ctx->acregmax))
 | |
| 					cifsFileInfo_get(cfile);
 | |
| 			} else {
 | |
| 				/* Deferred close for files */
 | |
| 				queue_delayed_work(deferredclose_wq,
 | |
| 						&cfile->deferred, cifs_sb->ctx->acregmax);
 | |
| 				cfile->deferred_close_scheduled = true;
 | |
| 				spin_unlock(&cinode->deferred_lock);
 | |
| 				return 0;
 | |
| 			}
 | |
| 			spin_unlock(&cinode->deferred_lock);
 | |
| 			_cifsFileInfo_put(cfile, true, false);
 | |
| 		} else {
 | |
| 			_cifsFileInfo_put(cfile, true, false);
 | |
| 			kfree(dclose);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	/* return code from the ->release op is always ignored */
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| void
 | |
| cifs_reopen_persistent_handles(struct cifs_tcon *tcon)
 | |
| {
 | |
| 	struct cifsFileInfo *open_file;
 | |
| 	struct list_head *tmp;
 | |
| 	struct list_head *tmp1;
 | |
| 	struct list_head tmp_list;
 | |
| 
 | |
| 	if (!tcon->use_persistent || !tcon->need_reopen_files)
 | |
| 		return;
 | |
| 
 | |
| 	tcon->need_reopen_files = false;
 | |
| 
 | |
| 	cifs_dbg(FYI, "Reopen persistent handles\n");
 | |
| 	INIT_LIST_HEAD(&tmp_list);
 | |
| 
 | |
| 	/* list all files open on tree connection, reopen resilient handles  */
 | |
| 	spin_lock(&tcon->open_file_lock);
 | |
| 	list_for_each(tmp, &tcon->openFileList) {
 | |
| 		open_file = list_entry(tmp, struct cifsFileInfo, tlist);
 | |
| 		if (!open_file->invalidHandle)
 | |
| 			continue;
 | |
| 		cifsFileInfo_get(open_file);
 | |
| 		list_add_tail(&open_file->rlist, &tmp_list);
 | |
| 	}
 | |
| 	spin_unlock(&tcon->open_file_lock);
 | |
| 
 | |
| 	list_for_each_safe(tmp, tmp1, &tmp_list) {
 | |
| 		open_file = list_entry(tmp, struct cifsFileInfo, rlist);
 | |
| 		if (cifs_reopen_file(open_file, false /* do not flush */))
 | |
| 			tcon->need_reopen_files = true;
 | |
| 		list_del_init(&open_file->rlist);
 | |
| 		cifsFileInfo_put(open_file);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| int cifs_closedir(struct inode *inode, struct file *file)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	unsigned int xid;
 | |
| 	struct cifsFileInfo *cfile = file->private_data;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	char *buf;
 | |
| 
 | |
| 	cifs_dbg(FYI, "Closedir inode = 0x%p\n", inode);
 | |
| 
 | |
| 	if (cfile == NULL)
 | |
| 		return rc;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 	tcon = tlink_tcon(cfile->tlink);
 | |
| 	server = tcon->ses->server;
 | |
| 
 | |
| 	cifs_dbg(FYI, "Freeing private data in close dir\n");
 | |
| 	spin_lock(&cfile->file_info_lock);
 | |
| 	if (server->ops->dir_needs_close(cfile)) {
 | |
| 		cfile->invalidHandle = true;
 | |
| 		spin_unlock(&cfile->file_info_lock);
 | |
| 		if (server->ops->close_dir)
 | |
| 			rc = server->ops->close_dir(xid, tcon, &cfile->fid);
 | |
| 		else
 | |
| 			rc = -ENOSYS;
 | |
| 		cifs_dbg(FYI, "Closing uncompleted readdir with rc %d\n", rc);
 | |
| 		/* not much we can do if it fails anyway, ignore rc */
 | |
| 		rc = 0;
 | |
| 	} else
 | |
| 		spin_unlock(&cfile->file_info_lock);
 | |
| 
 | |
| 	buf = cfile->srch_inf.ntwrk_buf_start;
 | |
| 	if (buf) {
 | |
| 		cifs_dbg(FYI, "closedir free smb buf in srch struct\n");
 | |
| 		cfile->srch_inf.ntwrk_buf_start = NULL;
 | |
| 		if (cfile->srch_inf.smallBuf)
 | |
| 			cifs_small_buf_release(buf);
 | |
| 		else
 | |
| 			cifs_buf_release(buf);
 | |
| 	}
 | |
| 
 | |
| 	cifs_put_tlink(cfile->tlink);
 | |
| 	kfree(file->private_data);
 | |
| 	file->private_data = NULL;
 | |
| 	/* BB can we lock the filestruct while this is going on? */
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static struct cifsLockInfo *
 | |
| cifs_lock_init(__u64 offset, __u64 length, __u8 type, __u16 flags)
 | |
| {
 | |
| 	struct cifsLockInfo *lock =
 | |
| 		kmalloc(sizeof(struct cifsLockInfo), GFP_KERNEL);
 | |
| 	if (!lock)
 | |
| 		return lock;
 | |
| 	lock->offset = offset;
 | |
| 	lock->length = length;
 | |
| 	lock->type = type;
 | |
| 	lock->pid = current->tgid;
 | |
| 	lock->flags = flags;
 | |
| 	INIT_LIST_HEAD(&lock->blist);
 | |
| 	init_waitqueue_head(&lock->block_q);
 | |
| 	return lock;
 | |
| }
 | |
| 
 | |
| void
 | |
| cifs_del_lock_waiters(struct cifsLockInfo *lock)
 | |
| {
 | |
| 	struct cifsLockInfo *li, *tmp;
 | |
| 	list_for_each_entry_safe(li, tmp, &lock->blist, blist) {
 | |
| 		list_del_init(&li->blist);
 | |
| 		wake_up(&li->block_q);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| #define CIFS_LOCK_OP	0
 | |
| #define CIFS_READ_OP	1
 | |
| #define CIFS_WRITE_OP	2
 | |
| 
 | |
| /* @rw_check : 0 - no op, 1 - read, 2 - write */
 | |
| static bool
 | |
| cifs_find_fid_lock_conflict(struct cifs_fid_locks *fdlocks, __u64 offset,
 | |
| 			    __u64 length, __u8 type, __u16 flags,
 | |
| 			    struct cifsFileInfo *cfile,
 | |
| 			    struct cifsLockInfo **conf_lock, int rw_check)
 | |
| {
 | |
| 	struct cifsLockInfo *li;
 | |
| 	struct cifsFileInfo *cur_cfile = fdlocks->cfile;
 | |
| 	struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
 | |
| 
 | |
| 	list_for_each_entry(li, &fdlocks->locks, llist) {
 | |
| 		if (offset + length <= li->offset ||
 | |
| 		    offset >= li->offset + li->length)
 | |
| 			continue;
 | |
| 		if (rw_check != CIFS_LOCK_OP && current->tgid == li->pid &&
 | |
| 		    server->ops->compare_fids(cfile, cur_cfile)) {
 | |
| 			/* shared lock prevents write op through the same fid */
 | |
| 			if (!(li->type & server->vals->shared_lock_type) ||
 | |
| 			    rw_check != CIFS_WRITE_OP)
 | |
| 				continue;
 | |
| 		}
 | |
| 		if ((type & server->vals->shared_lock_type) &&
 | |
| 		    ((server->ops->compare_fids(cfile, cur_cfile) &&
 | |
| 		     current->tgid == li->pid) || type == li->type))
 | |
| 			continue;
 | |
| 		if (rw_check == CIFS_LOCK_OP &&
 | |
| 		    (flags & FL_OFDLCK) && (li->flags & FL_OFDLCK) &&
 | |
| 		    server->ops->compare_fids(cfile, cur_cfile))
 | |
| 			continue;
 | |
| 		if (conf_lock)
 | |
| 			*conf_lock = li;
 | |
| 		return true;
 | |
| 	}
 | |
| 	return false;
 | |
| }
 | |
| 
 | |
| bool
 | |
| cifs_find_lock_conflict(struct cifsFileInfo *cfile, __u64 offset, __u64 length,
 | |
| 			__u8 type, __u16 flags,
 | |
| 			struct cifsLockInfo **conf_lock, int rw_check)
 | |
| {
 | |
| 	bool rc = false;
 | |
| 	struct cifs_fid_locks *cur;
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 
 | |
| 	list_for_each_entry(cur, &cinode->llist, llist) {
 | |
| 		rc = cifs_find_fid_lock_conflict(cur, offset, length, type,
 | |
| 						 flags, cfile, conf_lock,
 | |
| 						 rw_check);
 | |
| 		if (rc)
 | |
| 			break;
 | |
| 	}
 | |
| 
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Check if there is another lock that prevents us to set the lock (mandatory
 | |
|  * style). If such a lock exists, update the flock structure with its
 | |
|  * properties. Otherwise, set the flock type to F_UNLCK if we can cache brlocks
 | |
|  * or leave it the same if we can't. Returns 0 if we don't need to request to
 | |
|  * the server or 1 otherwise.
 | |
|  */
 | |
| static int
 | |
| cifs_lock_test(struct cifsFileInfo *cfile, __u64 offset, __u64 length,
 | |
| 	       __u8 type, struct file_lock *flock)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	struct cifsLockInfo *conf_lock;
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 	struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
 | |
| 	bool exist;
 | |
| 
 | |
| 	down_read(&cinode->lock_sem);
 | |
| 
 | |
| 	exist = cifs_find_lock_conflict(cfile, offset, length, type,
 | |
| 					flock->fl_flags, &conf_lock,
 | |
| 					CIFS_LOCK_OP);
 | |
| 	if (exist) {
 | |
| 		flock->fl_start = conf_lock->offset;
 | |
| 		flock->fl_end = conf_lock->offset + conf_lock->length - 1;
 | |
| 		flock->fl_pid = conf_lock->pid;
 | |
| 		if (conf_lock->type & server->vals->shared_lock_type)
 | |
| 			flock->fl_type = F_RDLCK;
 | |
| 		else
 | |
| 			flock->fl_type = F_WRLCK;
 | |
| 	} else if (!cinode->can_cache_brlcks)
 | |
| 		rc = 1;
 | |
| 	else
 | |
| 		flock->fl_type = F_UNLCK;
 | |
| 
 | |
| 	up_read(&cinode->lock_sem);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static void
 | |
| cifs_lock_add(struct cifsFileInfo *cfile, struct cifsLockInfo *lock)
 | |
| {
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 	cifs_down_write(&cinode->lock_sem);
 | |
| 	list_add_tail(&lock->llist, &cfile->llist->locks);
 | |
| 	up_write(&cinode->lock_sem);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Set the byte-range lock (mandatory style). Returns:
 | |
|  * 1) 0, if we set the lock and don't need to request to the server;
 | |
|  * 2) 1, if no locks prevent us but we need to request to the server;
 | |
|  * 3) -EACCES, if there is a lock that prevents us and wait is false.
 | |
|  */
 | |
| static int
 | |
| cifs_lock_add_if(struct cifsFileInfo *cfile, struct cifsLockInfo *lock,
 | |
| 		 bool wait)
 | |
| {
 | |
| 	struct cifsLockInfo *conf_lock;
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 	bool exist;
 | |
| 	int rc = 0;
 | |
| 
 | |
| try_again:
 | |
| 	exist = false;
 | |
| 	cifs_down_write(&cinode->lock_sem);
 | |
| 
 | |
| 	exist = cifs_find_lock_conflict(cfile, lock->offset, lock->length,
 | |
| 					lock->type, lock->flags, &conf_lock,
 | |
| 					CIFS_LOCK_OP);
 | |
| 	if (!exist && cinode->can_cache_brlcks) {
 | |
| 		list_add_tail(&lock->llist, &cfile->llist->locks);
 | |
| 		up_write(&cinode->lock_sem);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	if (!exist)
 | |
| 		rc = 1;
 | |
| 	else if (!wait)
 | |
| 		rc = -EACCES;
 | |
| 	else {
 | |
| 		list_add_tail(&lock->blist, &conf_lock->blist);
 | |
| 		up_write(&cinode->lock_sem);
 | |
| 		rc = wait_event_interruptible(lock->block_q,
 | |
| 					(lock->blist.prev == &lock->blist) &&
 | |
| 					(lock->blist.next == &lock->blist));
 | |
| 		if (!rc)
 | |
| 			goto try_again;
 | |
| 		cifs_down_write(&cinode->lock_sem);
 | |
| 		list_del_init(&lock->blist);
 | |
| 	}
 | |
| 
 | |
| 	up_write(&cinode->lock_sem);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Check if there is another lock that prevents us to set the lock (posix
 | |
|  * style). If such a lock exists, update the flock structure with its
 | |
|  * properties. Otherwise, set the flock type to F_UNLCK if we can cache brlocks
 | |
|  * or leave it the same if we can't. Returns 0 if we don't need to request to
 | |
|  * the server or 1 otherwise.
 | |
|  */
 | |
| static int
 | |
| cifs_posix_lock_test(struct file *file, struct file_lock *flock)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(file_inode(file));
 | |
| 	unsigned char saved_type = flock->fl_type;
 | |
| 
 | |
| 	if ((flock->fl_flags & FL_POSIX) == 0)
 | |
| 		return 1;
 | |
| 
 | |
| 	down_read(&cinode->lock_sem);
 | |
| 	posix_test_lock(file, flock);
 | |
| 
 | |
| 	if (flock->fl_type == F_UNLCK && !cinode->can_cache_brlcks) {
 | |
| 		flock->fl_type = saved_type;
 | |
| 		rc = 1;
 | |
| 	}
 | |
| 
 | |
| 	up_read(&cinode->lock_sem);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Set the byte-range lock (posix style). Returns:
 | |
|  * 1) <0, if the error occurs while setting the lock;
 | |
|  * 2) 0, if we set the lock and don't need to request to the server;
 | |
|  * 3) FILE_LOCK_DEFERRED, if we will wait for some other file_lock;
 | |
|  * 4) FILE_LOCK_DEFERRED + 1, if we need to request to the server.
 | |
|  */
 | |
| static int
 | |
| cifs_posix_lock_set(struct file *file, struct file_lock *flock)
 | |
| {
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(file_inode(file));
 | |
| 	int rc = FILE_LOCK_DEFERRED + 1;
 | |
| 
 | |
| 	if ((flock->fl_flags & FL_POSIX) == 0)
 | |
| 		return rc;
 | |
| 
 | |
| 	cifs_down_write(&cinode->lock_sem);
 | |
| 	if (!cinode->can_cache_brlcks) {
 | |
| 		up_write(&cinode->lock_sem);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	rc = posix_lock_file(file, flock, NULL);
 | |
| 	up_write(&cinode->lock_sem);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| int
 | |
| cifs_push_mandatory_locks(struct cifsFileInfo *cfile)
 | |
| {
 | |
| 	unsigned int xid;
 | |
| 	int rc = 0, stored_rc;
 | |
| 	struct cifsLockInfo *li, *tmp;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	unsigned int num, max_num, max_buf;
 | |
| 	LOCKING_ANDX_RANGE *buf, *cur;
 | |
| 	static const int types[] = {
 | |
| 		LOCKING_ANDX_LARGE_FILES,
 | |
| 		LOCKING_ANDX_SHARED_LOCK | LOCKING_ANDX_LARGE_FILES
 | |
| 	};
 | |
| 	int i;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 	tcon = tlink_tcon(cfile->tlink);
 | |
| 
 | |
| 	/*
 | |
| 	 * Accessing maxBuf is racy with cifs_reconnect - need to store value
 | |
| 	 * and check it before using.
 | |
| 	 */
 | |
| 	max_buf = tcon->ses->server->maxBuf;
 | |
| 	if (max_buf < (sizeof(struct smb_hdr) + sizeof(LOCKING_ANDX_RANGE))) {
 | |
| 		free_xid(xid);
 | |
| 		return -EINVAL;
 | |
| 	}
 | |
| 
 | |
| 	BUILD_BUG_ON(sizeof(struct smb_hdr) + sizeof(LOCKING_ANDX_RANGE) >
 | |
| 		     PAGE_SIZE);
 | |
| 	max_buf = min_t(unsigned int, max_buf - sizeof(struct smb_hdr),
 | |
| 			PAGE_SIZE);
 | |
| 	max_num = (max_buf - sizeof(struct smb_hdr)) /
 | |
| 						sizeof(LOCKING_ANDX_RANGE);
 | |
| 	buf = kcalloc(max_num, sizeof(LOCKING_ANDX_RANGE), GFP_KERNEL);
 | |
| 	if (!buf) {
 | |
| 		free_xid(xid);
 | |
| 		return -ENOMEM;
 | |
| 	}
 | |
| 
 | |
| 	for (i = 0; i < 2; i++) {
 | |
| 		cur = buf;
 | |
| 		num = 0;
 | |
| 		list_for_each_entry_safe(li, tmp, &cfile->llist->locks, llist) {
 | |
| 			if (li->type != types[i])
 | |
| 				continue;
 | |
| 			cur->Pid = cpu_to_le16(li->pid);
 | |
| 			cur->LengthLow = cpu_to_le32((u32)li->length);
 | |
| 			cur->LengthHigh = cpu_to_le32((u32)(li->length>>32));
 | |
| 			cur->OffsetLow = cpu_to_le32((u32)li->offset);
 | |
| 			cur->OffsetHigh = cpu_to_le32((u32)(li->offset>>32));
 | |
| 			if (++num == max_num) {
 | |
| 				stored_rc = cifs_lockv(xid, tcon,
 | |
| 						       cfile->fid.netfid,
 | |
| 						       (__u8)li->type, 0, num,
 | |
| 						       buf);
 | |
| 				if (stored_rc)
 | |
| 					rc = stored_rc;
 | |
| 				cur = buf;
 | |
| 				num = 0;
 | |
| 			} else
 | |
| 				cur++;
 | |
| 		}
 | |
| 
 | |
| 		if (num) {
 | |
| 			stored_rc = cifs_lockv(xid, tcon, cfile->fid.netfid,
 | |
| 					       (__u8)types[i], 0, num, buf);
 | |
| 			if (stored_rc)
 | |
| 				rc = stored_rc;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	kfree(buf);
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static __u32
 | |
| hash_lockowner(fl_owner_t owner)
 | |
| {
 | |
| 	return cifs_lock_secret ^ hash32_ptr((const void *)owner);
 | |
| }
 | |
| 
 | |
| struct lock_to_push {
 | |
| 	struct list_head llist;
 | |
| 	__u64 offset;
 | |
| 	__u64 length;
 | |
| 	__u32 pid;
 | |
| 	__u16 netfid;
 | |
| 	__u8 type;
 | |
| };
 | |
| 
 | |
| static int
 | |
| cifs_push_posix_locks(struct cifsFileInfo *cfile)
 | |
| {
 | |
| 	struct inode *inode = d_inode(cfile->dentry);
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	struct file_lock *flock;
 | |
| 	struct file_lock_context *flctx = inode->i_flctx;
 | |
| 	unsigned int count = 0, i;
 | |
| 	int rc = 0, xid, type;
 | |
| 	struct list_head locks_to_send, *el;
 | |
| 	struct lock_to_push *lck, *tmp;
 | |
| 	__u64 length;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	if (!flctx)
 | |
| 		goto out;
 | |
| 
 | |
| 	spin_lock(&flctx->flc_lock);
 | |
| 	list_for_each(el, &flctx->flc_posix) {
 | |
| 		count++;
 | |
| 	}
 | |
| 	spin_unlock(&flctx->flc_lock);
 | |
| 
 | |
| 	INIT_LIST_HEAD(&locks_to_send);
 | |
| 
 | |
| 	/*
 | |
| 	 * Allocating count locks is enough because no FL_POSIX locks can be
 | |
| 	 * added to the list while we are holding cinode->lock_sem that
 | |
| 	 * protects locking operations of this inode.
 | |
| 	 */
 | |
| 	for (i = 0; i < count; i++) {
 | |
| 		lck = kmalloc(sizeof(struct lock_to_push), GFP_KERNEL);
 | |
| 		if (!lck) {
 | |
| 			rc = -ENOMEM;
 | |
| 			goto err_out;
 | |
| 		}
 | |
| 		list_add_tail(&lck->llist, &locks_to_send);
 | |
| 	}
 | |
| 
 | |
| 	el = locks_to_send.next;
 | |
| 	spin_lock(&flctx->flc_lock);
 | |
| 	list_for_each_entry(flock, &flctx->flc_posix, fl_list) {
 | |
| 		if (el == &locks_to_send) {
 | |
| 			/*
 | |
| 			 * The list ended. We don't have enough allocated
 | |
| 			 * structures - something is really wrong.
 | |
| 			 */
 | |
| 			cifs_dbg(VFS, "Can't push all brlocks!\n");
 | |
| 			break;
 | |
| 		}
 | |
| 		length = 1 + flock->fl_end - flock->fl_start;
 | |
| 		if (flock->fl_type == F_RDLCK || flock->fl_type == F_SHLCK)
 | |
| 			type = CIFS_RDLCK;
 | |
| 		else
 | |
| 			type = CIFS_WRLCK;
 | |
| 		lck = list_entry(el, struct lock_to_push, llist);
 | |
| 		lck->pid = hash_lockowner(flock->fl_owner);
 | |
| 		lck->netfid = cfile->fid.netfid;
 | |
| 		lck->length = length;
 | |
| 		lck->type = type;
 | |
| 		lck->offset = flock->fl_start;
 | |
| 	}
 | |
| 	spin_unlock(&flctx->flc_lock);
 | |
| 
 | |
| 	list_for_each_entry_safe(lck, tmp, &locks_to_send, llist) {
 | |
| 		int stored_rc;
 | |
| 
 | |
| 		stored_rc = CIFSSMBPosixLock(xid, tcon, lck->netfid, lck->pid,
 | |
| 					     lck->offset, lck->length, NULL,
 | |
| 					     lck->type, 0);
 | |
| 		if (stored_rc)
 | |
| 			rc = stored_rc;
 | |
| 		list_del(&lck->llist);
 | |
| 		kfree(lck);
 | |
| 	}
 | |
| 
 | |
| out:
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| err_out:
 | |
| 	list_for_each_entry_safe(lck, tmp, &locks_to_send, llist) {
 | |
| 		list_del(&lck->llist);
 | |
| 		kfree(lck);
 | |
| 	}
 | |
| 	goto out;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_push_locks(struct cifsFileInfo *cfile)
 | |
| {
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	int rc = 0;
 | |
| 
 | |
| 	/* we are going to update can_cache_brlcks here - need a write access */
 | |
| 	cifs_down_write(&cinode->lock_sem);
 | |
| 	if (!cinode->can_cache_brlcks) {
 | |
| 		up_write(&cinode->lock_sem);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	if (cap_unix(tcon->ses) &&
 | |
| 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
 | |
| 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
 | |
| 		rc = cifs_push_posix_locks(cfile);
 | |
| 	else
 | |
| 		rc = tcon->ses->server->ops->push_mand_locks(cfile);
 | |
| 
 | |
| 	cinode->can_cache_brlcks = false;
 | |
| 	up_write(&cinode->lock_sem);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static void
 | |
| cifs_read_flock(struct file_lock *flock, __u32 *type, int *lock, int *unlock,
 | |
| 		bool *wait_flag, struct TCP_Server_Info *server)
 | |
| {
 | |
| 	if (flock->fl_flags & FL_POSIX)
 | |
| 		cifs_dbg(FYI, "Posix\n");
 | |
| 	if (flock->fl_flags & FL_FLOCK)
 | |
| 		cifs_dbg(FYI, "Flock\n");
 | |
| 	if (flock->fl_flags & FL_SLEEP) {
 | |
| 		cifs_dbg(FYI, "Blocking lock\n");
 | |
| 		*wait_flag = true;
 | |
| 	}
 | |
| 	if (flock->fl_flags & FL_ACCESS)
 | |
| 		cifs_dbg(FYI, "Process suspended by mandatory locking - not implemented yet\n");
 | |
| 	if (flock->fl_flags & FL_LEASE)
 | |
| 		cifs_dbg(FYI, "Lease on file - not implemented yet\n");
 | |
| 	if (flock->fl_flags &
 | |
| 	    (~(FL_POSIX | FL_FLOCK | FL_SLEEP |
 | |
| 	       FL_ACCESS | FL_LEASE | FL_CLOSE | FL_OFDLCK)))
 | |
| 		cifs_dbg(FYI, "Unknown lock flags 0x%x\n", flock->fl_flags);
 | |
| 
 | |
| 	*type = server->vals->large_lock_type;
 | |
| 	if (flock->fl_type == F_WRLCK) {
 | |
| 		cifs_dbg(FYI, "F_WRLCK\n");
 | |
| 		*type |= server->vals->exclusive_lock_type;
 | |
| 		*lock = 1;
 | |
| 	} else if (flock->fl_type == F_UNLCK) {
 | |
| 		cifs_dbg(FYI, "F_UNLCK\n");
 | |
| 		*type |= server->vals->unlock_lock_type;
 | |
| 		*unlock = 1;
 | |
| 		/* Check if unlock includes more than one lock range */
 | |
| 	} else if (flock->fl_type == F_RDLCK) {
 | |
| 		cifs_dbg(FYI, "F_RDLCK\n");
 | |
| 		*type |= server->vals->shared_lock_type;
 | |
| 		*lock = 1;
 | |
| 	} else if (flock->fl_type == F_EXLCK) {
 | |
| 		cifs_dbg(FYI, "F_EXLCK\n");
 | |
| 		*type |= server->vals->exclusive_lock_type;
 | |
| 		*lock = 1;
 | |
| 	} else if (flock->fl_type == F_SHLCK) {
 | |
| 		cifs_dbg(FYI, "F_SHLCK\n");
 | |
| 		*type |= server->vals->shared_lock_type;
 | |
| 		*lock = 1;
 | |
| 	} else
 | |
| 		cifs_dbg(FYI, "Unknown type of lock\n");
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_getlk(struct file *file, struct file_lock *flock, __u32 type,
 | |
| 	   bool wait_flag, bool posix_lck, unsigned int xid)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	__u64 length = 1 + flock->fl_end - flock->fl_start;
 | |
| 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	struct TCP_Server_Info *server = tcon->ses->server;
 | |
| 	__u16 netfid = cfile->fid.netfid;
 | |
| 
 | |
| 	if (posix_lck) {
 | |
| 		int posix_lock_type;
 | |
| 
 | |
| 		rc = cifs_posix_lock_test(file, flock);
 | |
| 		if (!rc)
 | |
| 			return rc;
 | |
| 
 | |
| 		if (type & server->vals->shared_lock_type)
 | |
| 			posix_lock_type = CIFS_RDLCK;
 | |
| 		else
 | |
| 			posix_lock_type = CIFS_WRLCK;
 | |
| 		rc = CIFSSMBPosixLock(xid, tcon, netfid,
 | |
| 				      hash_lockowner(flock->fl_owner),
 | |
| 				      flock->fl_start, length, flock,
 | |
| 				      posix_lock_type, wait_flag);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	rc = cifs_lock_test(cfile, flock->fl_start, length, type, flock);
 | |
| 	if (!rc)
 | |
| 		return rc;
 | |
| 
 | |
| 	/* BB we could chain these into one lock request BB */
 | |
| 	rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length, type,
 | |
| 				    1, 0, false);
 | |
| 	if (rc == 0) {
 | |
| 		rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
 | |
| 					    type, 0, 1, false);
 | |
| 		flock->fl_type = F_UNLCK;
 | |
| 		if (rc != 0)
 | |
| 			cifs_dbg(VFS, "Error unlocking previously locked range %d during test of lock\n",
 | |
| 				 rc);
 | |
| 		return 0;
 | |
| 	}
 | |
| 
 | |
| 	if (type & server->vals->shared_lock_type) {
 | |
| 		flock->fl_type = F_WRLCK;
 | |
| 		return 0;
 | |
| 	}
 | |
| 
 | |
| 	type &= ~server->vals->exclusive_lock_type;
 | |
| 
 | |
| 	rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
 | |
| 				    type | server->vals->shared_lock_type,
 | |
| 				    1, 0, false);
 | |
| 	if (rc == 0) {
 | |
| 		rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
 | |
| 			type | server->vals->shared_lock_type, 0, 1, false);
 | |
| 		flock->fl_type = F_RDLCK;
 | |
| 		if (rc != 0)
 | |
| 			cifs_dbg(VFS, "Error unlocking previously locked range %d during test of lock\n",
 | |
| 				 rc);
 | |
| 	} else
 | |
| 		flock->fl_type = F_WRLCK;
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| void
 | |
| cifs_move_llist(struct list_head *source, struct list_head *dest)
 | |
| {
 | |
| 	struct list_head *li, *tmp;
 | |
| 	list_for_each_safe(li, tmp, source)
 | |
| 		list_move(li, dest);
 | |
| }
 | |
| 
 | |
| void
 | |
| cifs_free_llist(struct list_head *llist)
 | |
| {
 | |
| 	struct cifsLockInfo *li, *tmp;
 | |
| 	list_for_each_entry_safe(li, tmp, llist, llist) {
 | |
| 		cifs_del_lock_waiters(li);
 | |
| 		list_del(&li->llist);
 | |
| 		kfree(li);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| int
 | |
| cifs_unlock_range(struct cifsFileInfo *cfile, struct file_lock *flock,
 | |
| 		  unsigned int xid)
 | |
| {
 | |
| 	int rc = 0, stored_rc;
 | |
| 	static const int types[] = {
 | |
| 		LOCKING_ANDX_LARGE_FILES,
 | |
| 		LOCKING_ANDX_SHARED_LOCK | LOCKING_ANDX_LARGE_FILES
 | |
| 	};
 | |
| 	unsigned int i;
 | |
| 	unsigned int max_num, num, max_buf;
 | |
| 	LOCKING_ANDX_RANGE *buf, *cur;
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 	struct cifsLockInfo *li, *tmp;
 | |
| 	__u64 length = 1 + flock->fl_end - flock->fl_start;
 | |
| 	struct list_head tmp_llist;
 | |
| 
 | |
| 	INIT_LIST_HEAD(&tmp_llist);
 | |
| 
 | |
| 	/*
 | |
| 	 * Accessing maxBuf is racy with cifs_reconnect - need to store value
 | |
| 	 * and check it before using.
 | |
| 	 */
 | |
| 	max_buf = tcon->ses->server->maxBuf;
 | |
| 	if (max_buf < (sizeof(struct smb_hdr) + sizeof(LOCKING_ANDX_RANGE)))
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	BUILD_BUG_ON(sizeof(struct smb_hdr) + sizeof(LOCKING_ANDX_RANGE) >
 | |
| 		     PAGE_SIZE);
 | |
| 	max_buf = min_t(unsigned int, max_buf - sizeof(struct smb_hdr),
 | |
| 			PAGE_SIZE);
 | |
| 	max_num = (max_buf - sizeof(struct smb_hdr)) /
 | |
| 						sizeof(LOCKING_ANDX_RANGE);
 | |
| 	buf = kcalloc(max_num, sizeof(LOCKING_ANDX_RANGE), GFP_KERNEL);
 | |
| 	if (!buf)
 | |
| 		return -ENOMEM;
 | |
| 
 | |
| 	cifs_down_write(&cinode->lock_sem);
 | |
| 	for (i = 0; i < 2; i++) {
 | |
| 		cur = buf;
 | |
| 		num = 0;
 | |
| 		list_for_each_entry_safe(li, tmp, &cfile->llist->locks, llist) {
 | |
| 			if (flock->fl_start > li->offset ||
 | |
| 			    (flock->fl_start + length) <
 | |
| 			    (li->offset + li->length))
 | |
| 				continue;
 | |
| 			if (current->tgid != li->pid)
 | |
| 				continue;
 | |
| 			if (types[i] != li->type)
 | |
| 				continue;
 | |
| 			if (cinode->can_cache_brlcks) {
 | |
| 				/*
 | |
| 				 * We can cache brlock requests - simply remove
 | |
| 				 * a lock from the file's list.
 | |
| 				 */
 | |
| 				list_del(&li->llist);
 | |
| 				cifs_del_lock_waiters(li);
 | |
| 				kfree(li);
 | |
| 				continue;
 | |
| 			}
 | |
| 			cur->Pid = cpu_to_le16(li->pid);
 | |
| 			cur->LengthLow = cpu_to_le32((u32)li->length);
 | |
| 			cur->LengthHigh = cpu_to_le32((u32)(li->length>>32));
 | |
| 			cur->OffsetLow = cpu_to_le32((u32)li->offset);
 | |
| 			cur->OffsetHigh = cpu_to_le32((u32)(li->offset>>32));
 | |
| 			/*
 | |
| 			 * We need to save a lock here to let us add it again to
 | |
| 			 * the file's list if the unlock range request fails on
 | |
| 			 * the server.
 | |
| 			 */
 | |
| 			list_move(&li->llist, &tmp_llist);
 | |
| 			if (++num == max_num) {
 | |
| 				stored_rc = cifs_lockv(xid, tcon,
 | |
| 						       cfile->fid.netfid,
 | |
| 						       li->type, num, 0, buf);
 | |
| 				if (stored_rc) {
 | |
| 					/*
 | |
| 					 * We failed on the unlock range
 | |
| 					 * request - add all locks from the tmp
 | |
| 					 * list to the head of the file's list.
 | |
| 					 */
 | |
| 					cifs_move_llist(&tmp_llist,
 | |
| 							&cfile->llist->locks);
 | |
| 					rc = stored_rc;
 | |
| 				} else
 | |
| 					/*
 | |
| 					 * The unlock range request succeed -
 | |
| 					 * free the tmp list.
 | |
| 					 */
 | |
| 					cifs_free_llist(&tmp_llist);
 | |
| 				cur = buf;
 | |
| 				num = 0;
 | |
| 			} else
 | |
| 				cur++;
 | |
| 		}
 | |
| 		if (num) {
 | |
| 			stored_rc = cifs_lockv(xid, tcon, cfile->fid.netfid,
 | |
| 					       types[i], num, 0, buf);
 | |
| 			if (stored_rc) {
 | |
| 				cifs_move_llist(&tmp_llist,
 | |
| 						&cfile->llist->locks);
 | |
| 				rc = stored_rc;
 | |
| 			} else
 | |
| 				cifs_free_llist(&tmp_llist);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	up_write(&cinode->lock_sem);
 | |
| 	kfree(buf);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_setlk(struct file *file, struct file_lock *flock, __u32 type,
 | |
| 	   bool wait_flag, bool posix_lck, int lock, int unlock,
 | |
| 	   unsigned int xid)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	__u64 length = 1 + flock->fl_end - flock->fl_start;
 | |
| 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	struct TCP_Server_Info *server = tcon->ses->server;
 | |
| 	struct inode *inode = d_inode(cfile->dentry);
 | |
| 
 | |
| 	if (posix_lck) {
 | |
| 		int posix_lock_type;
 | |
| 
 | |
| 		rc = cifs_posix_lock_set(file, flock);
 | |
| 		if (rc <= FILE_LOCK_DEFERRED)
 | |
| 			return rc;
 | |
| 
 | |
| 		if (type & server->vals->shared_lock_type)
 | |
| 			posix_lock_type = CIFS_RDLCK;
 | |
| 		else
 | |
| 			posix_lock_type = CIFS_WRLCK;
 | |
| 
 | |
| 		if (unlock == 1)
 | |
| 			posix_lock_type = CIFS_UNLCK;
 | |
| 
 | |
| 		rc = CIFSSMBPosixLock(xid, tcon, cfile->fid.netfid,
 | |
| 				      hash_lockowner(flock->fl_owner),
 | |
| 				      flock->fl_start, length,
 | |
| 				      NULL, posix_lock_type, wait_flag);
 | |
| 		goto out;
 | |
| 	}
 | |
| 
 | |
| 	if (lock) {
 | |
| 		struct cifsLockInfo *lock;
 | |
| 
 | |
| 		lock = cifs_lock_init(flock->fl_start, length, type,
 | |
| 				      flock->fl_flags);
 | |
| 		if (!lock)
 | |
| 			return -ENOMEM;
 | |
| 
 | |
| 		rc = cifs_lock_add_if(cfile, lock, wait_flag);
 | |
| 		if (rc < 0) {
 | |
| 			kfree(lock);
 | |
| 			return rc;
 | |
| 		}
 | |
| 		if (!rc)
 | |
| 			goto out;
 | |
| 
 | |
| 		/*
 | |
| 		 * Windows 7 server can delay breaking lease from read to None
 | |
| 		 * if we set a byte-range lock on a file - break it explicitly
 | |
| 		 * before sending the lock to the server to be sure the next
 | |
| 		 * read won't conflict with non-overlapted locks due to
 | |
| 		 * pagereading.
 | |
| 		 */
 | |
| 		if (!CIFS_CACHE_WRITE(CIFS_I(inode)) &&
 | |
| 					CIFS_CACHE_READ(CIFS_I(inode))) {
 | |
| 			cifs_zap_mapping(inode);
 | |
| 			cifs_dbg(FYI, "Set no oplock for inode=%p due to mand locks\n",
 | |
| 				 inode);
 | |
| 			CIFS_I(inode)->oplock = 0;
 | |
| 		}
 | |
| 
 | |
| 		rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
 | |
| 					    type, 1, 0, wait_flag);
 | |
| 		if (rc) {
 | |
| 			kfree(lock);
 | |
| 			return rc;
 | |
| 		}
 | |
| 
 | |
| 		cifs_lock_add(cfile, lock);
 | |
| 	} else if (unlock)
 | |
| 		rc = server->ops->mand_unlock_range(cfile, flock, xid);
 | |
| 
 | |
| out:
 | |
| 	if ((flock->fl_flags & FL_POSIX) || (flock->fl_flags & FL_FLOCK)) {
 | |
| 		/*
 | |
| 		 * If this is a request to remove all locks because we
 | |
| 		 * are closing the file, it doesn't matter if the
 | |
| 		 * unlocking failed as both cifs.ko and the SMB server
 | |
| 		 * remove the lock on file close
 | |
| 		 */
 | |
| 		if (rc) {
 | |
| 			cifs_dbg(VFS, "%s failed rc=%d\n", __func__, rc);
 | |
| 			if (!(flock->fl_flags & FL_CLOSE))
 | |
| 				return rc;
 | |
| 		}
 | |
| 		rc = locks_lock_file_wait(file, flock);
 | |
| 	}
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| int cifs_flock(struct file *file, int cmd, struct file_lock *fl)
 | |
| {
 | |
| 	int rc, xid;
 | |
| 	int lock = 0, unlock = 0;
 | |
| 	bool wait_flag = false;
 | |
| 	bool posix_lck = false;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	__u32 type;
 | |
| 
 | |
| 	rc = -EACCES;
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	if (!(fl->fl_flags & FL_FLOCK))
 | |
| 		return -ENOLCK;
 | |
| 
 | |
| 	cfile = (struct cifsFileInfo *)file->private_data;
 | |
| 	tcon = tlink_tcon(cfile->tlink);
 | |
| 
 | |
| 	cifs_read_flock(fl, &type, &lock, &unlock, &wait_flag,
 | |
| 			tcon->ses->server);
 | |
| 	cifs_sb = CIFS_FILE_SB(file);
 | |
| 
 | |
| 	if (cap_unix(tcon->ses) &&
 | |
| 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
 | |
| 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
 | |
| 		posix_lck = true;
 | |
| 
 | |
| 	if (!lock && !unlock) {
 | |
| 		/*
 | |
| 		 * if no lock or unlock then nothing to do since we do not
 | |
| 		 * know what it is
 | |
| 		 */
 | |
| 		free_xid(xid);
 | |
| 		return -EOPNOTSUPP;
 | |
| 	}
 | |
| 
 | |
| 	rc = cifs_setlk(file, fl, type, wait_flag, posix_lck, lock, unlock,
 | |
| 			xid);
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| 
 | |
| 
 | |
| }
 | |
| 
 | |
| int cifs_lock(struct file *file, int cmd, struct file_lock *flock)
 | |
| {
 | |
| 	int rc, xid;
 | |
| 	int lock = 0, unlock = 0;
 | |
| 	bool wait_flag = false;
 | |
| 	bool posix_lck = false;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	__u32 type;
 | |
| 
 | |
| 	rc = -EACCES;
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	cifs_dbg(FYI, "Lock parm: 0x%x flockflags: 0x%x flocktype: 0x%x start: %lld end: %lld\n",
 | |
| 		 cmd, flock->fl_flags, flock->fl_type,
 | |
| 		 flock->fl_start, flock->fl_end);
 | |
| 
 | |
| 	cfile = (struct cifsFileInfo *)file->private_data;
 | |
| 	tcon = tlink_tcon(cfile->tlink);
 | |
| 
 | |
| 	cifs_read_flock(flock, &type, &lock, &unlock, &wait_flag,
 | |
| 			tcon->ses->server);
 | |
| 	cifs_sb = CIFS_FILE_SB(file);
 | |
| 
 | |
| 	if (cap_unix(tcon->ses) &&
 | |
| 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
 | |
| 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
 | |
| 		posix_lck = true;
 | |
| 	/*
 | |
| 	 * BB add code here to normalize offset and length to account for
 | |
| 	 * negative length which we can not accept over the wire.
 | |
| 	 */
 | |
| 	if (IS_GETLK(cmd)) {
 | |
| 		rc = cifs_getlk(file, flock, type, wait_flag, posix_lck, xid);
 | |
| 		free_xid(xid);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	if (!lock && !unlock) {
 | |
| 		/*
 | |
| 		 * if no lock or unlock then nothing to do since we do not
 | |
| 		 * know what it is
 | |
| 		 */
 | |
| 		free_xid(xid);
 | |
| 		return -EOPNOTSUPP;
 | |
| 	}
 | |
| 
 | |
| 	rc = cifs_setlk(file, flock, type, wait_flag, posix_lck, lock, unlock,
 | |
| 			xid);
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * update the file size (if needed) after a write. Should be called with
 | |
|  * the inode->i_lock held
 | |
|  */
 | |
| void
 | |
| cifs_update_eof(struct cifsInodeInfo *cifsi, loff_t offset,
 | |
| 		      unsigned int bytes_written)
 | |
| {
 | |
| 	loff_t end_of_write = offset + bytes_written;
 | |
| 
 | |
| 	if (end_of_write > cifsi->server_eof)
 | |
| 		cifsi->server_eof = end_of_write;
 | |
| }
 | |
| 
 | |
| static ssize_t
 | |
| cifs_write(struct cifsFileInfo *open_file, __u32 pid, const char *write_data,
 | |
| 	   size_t write_size, loff_t *offset)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	unsigned int bytes_written = 0;
 | |
| 	unsigned int total_written;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	unsigned int xid;
 | |
| 	struct dentry *dentry = open_file->dentry;
 | |
| 	struct cifsInodeInfo *cifsi = CIFS_I(d_inode(dentry));
 | |
| 	struct cifs_io_parms io_parms = {0};
 | |
| 
 | |
| 	cifs_dbg(FYI, "write %zd bytes to offset %lld of %pd\n",
 | |
| 		 write_size, *offset, dentry);
 | |
| 
 | |
| 	tcon = tlink_tcon(open_file->tlink);
 | |
| 	server = tcon->ses->server;
 | |
| 
 | |
| 	if (!server->ops->sync_write)
 | |
| 		return -ENOSYS;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	for (total_written = 0; write_size > total_written;
 | |
| 	     total_written += bytes_written) {
 | |
| 		rc = -EAGAIN;
 | |
| 		while (rc == -EAGAIN) {
 | |
| 			struct kvec iov[2];
 | |
| 			unsigned int len;
 | |
| 
 | |
| 			if (open_file->invalidHandle) {
 | |
| 				/* we could deadlock if we called
 | |
| 				   filemap_fdatawait from here so tell
 | |
| 				   reopen_file not to flush data to
 | |
| 				   server now */
 | |
| 				rc = cifs_reopen_file(open_file, false);
 | |
| 				if (rc != 0)
 | |
| 					break;
 | |
| 			}
 | |
| 
 | |
| 			len = min(server->ops->wp_retry_size(d_inode(dentry)),
 | |
| 				  (unsigned int)write_size - total_written);
 | |
| 			/* iov[0] is reserved for smb header */
 | |
| 			iov[1].iov_base = (char *)write_data + total_written;
 | |
| 			iov[1].iov_len = len;
 | |
| 			io_parms.pid = pid;
 | |
| 			io_parms.tcon = tcon;
 | |
| 			io_parms.offset = *offset;
 | |
| 			io_parms.length = len;
 | |
| 			rc = server->ops->sync_write(xid, &open_file->fid,
 | |
| 					&io_parms, &bytes_written, iov, 1);
 | |
| 		}
 | |
| 		if (rc || (bytes_written == 0)) {
 | |
| 			if (total_written)
 | |
| 				break;
 | |
| 			else {
 | |
| 				free_xid(xid);
 | |
| 				return rc;
 | |
| 			}
 | |
| 		} else {
 | |
| 			spin_lock(&d_inode(dentry)->i_lock);
 | |
| 			cifs_update_eof(cifsi, *offset, bytes_written);
 | |
| 			spin_unlock(&d_inode(dentry)->i_lock);
 | |
| 			*offset += bytes_written;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	cifs_stats_bytes_written(tcon, total_written);
 | |
| 
 | |
| 	if (total_written > 0) {
 | |
| 		spin_lock(&d_inode(dentry)->i_lock);
 | |
| 		if (*offset > d_inode(dentry)->i_size) {
 | |
| 			i_size_write(d_inode(dentry), *offset);
 | |
| 			d_inode(dentry)->i_blocks = (512 - 1 + *offset) >> 9;
 | |
| 		}
 | |
| 		spin_unlock(&d_inode(dentry)->i_lock);
 | |
| 	}
 | |
| 	mark_inode_dirty_sync(d_inode(dentry));
 | |
| 	free_xid(xid);
 | |
| 	return total_written;
 | |
| }
 | |
| 
 | |
| struct cifsFileInfo *find_readable_file(struct cifsInodeInfo *cifs_inode,
 | |
| 					bool fsuid_only)
 | |
| {
 | |
| 	struct cifsFileInfo *open_file = NULL;
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(cifs_inode->vfs_inode.i_sb);
 | |
| 
 | |
| 	/* only filter by fsuid on multiuser mounts */
 | |
| 	if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MULTIUSER))
 | |
| 		fsuid_only = false;
 | |
| 
 | |
| 	spin_lock(&cifs_inode->open_file_lock);
 | |
| 	/* we could simply get the first_list_entry since write-only entries
 | |
| 	   are always at the end of the list but since the first entry might
 | |
| 	   have a close pending, we go through the whole list */
 | |
| 	list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
 | |
| 		if (fsuid_only && !uid_eq(open_file->uid, current_fsuid()))
 | |
| 			continue;
 | |
| 		if (OPEN_FMODE(open_file->f_flags) & FMODE_READ) {
 | |
| 			if ((!open_file->invalidHandle)) {
 | |
| 				/* found a good file */
 | |
| 				/* lock it so it will not be closed on us */
 | |
| 				cifsFileInfo_get(open_file);
 | |
| 				spin_unlock(&cifs_inode->open_file_lock);
 | |
| 				return open_file;
 | |
| 			} /* else might as well continue, and look for
 | |
| 			     another, or simply have the caller reopen it
 | |
| 			     again rather than trying to fix this handle */
 | |
| 		} else /* write only file */
 | |
| 			break; /* write only files are last so must be done */
 | |
| 	}
 | |
| 	spin_unlock(&cifs_inode->open_file_lock);
 | |
| 	return NULL;
 | |
| }
 | |
| 
 | |
| /* Return -EBADF if no handle is found and general rc otherwise */
 | |
| int
 | |
| cifs_get_writable_file(struct cifsInodeInfo *cifs_inode, int flags,
 | |
| 		       struct cifsFileInfo **ret_file)
 | |
| {
 | |
| 	struct cifsFileInfo *open_file, *inv_file = NULL;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	bool any_available = false;
 | |
| 	int rc = -EBADF;
 | |
| 	unsigned int refind = 0;
 | |
| 	bool fsuid_only = flags & FIND_WR_FSUID_ONLY;
 | |
| 	bool with_delete = flags & FIND_WR_WITH_DELETE;
 | |
| 	*ret_file = NULL;
 | |
| 
 | |
| 	/*
 | |
| 	 * Having a null inode here (because mapping->host was set to zero by
 | |
| 	 * the VFS or MM) should not happen but we had reports of on oops (due
 | |
| 	 * to it being zero) during stress testcases so we need to check for it
 | |
| 	 */
 | |
| 
 | |
| 	if (cifs_inode == NULL) {
 | |
| 		cifs_dbg(VFS, "Null inode passed to cifs_writeable_file\n");
 | |
| 		dump_stack();
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	cifs_sb = CIFS_SB(cifs_inode->vfs_inode.i_sb);
 | |
| 
 | |
| 	/* only filter by fsuid on multiuser mounts */
 | |
| 	if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MULTIUSER))
 | |
| 		fsuid_only = false;
 | |
| 
 | |
| 	spin_lock(&cifs_inode->open_file_lock);
 | |
| refind_writable:
 | |
| 	if (refind > MAX_REOPEN_ATT) {
 | |
| 		spin_unlock(&cifs_inode->open_file_lock);
 | |
| 		return rc;
 | |
| 	}
 | |
| 	list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
 | |
| 		if (!any_available && open_file->pid != current->tgid)
 | |
| 			continue;
 | |
| 		if (fsuid_only && !uid_eq(open_file->uid, current_fsuid()))
 | |
| 			continue;
 | |
| 		if (with_delete && !(open_file->fid.access & DELETE))
 | |
| 			continue;
 | |
| 		if (OPEN_FMODE(open_file->f_flags) & FMODE_WRITE) {
 | |
| 			if (!open_file->invalidHandle) {
 | |
| 				/* found a good writable file */
 | |
| 				cifsFileInfo_get(open_file);
 | |
| 				spin_unlock(&cifs_inode->open_file_lock);
 | |
| 				*ret_file = open_file;
 | |
| 				return 0;
 | |
| 			} else {
 | |
| 				if (!inv_file)
 | |
| 					inv_file = open_file;
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| 	/* couldn't find useable FH with same pid, try any available */
 | |
| 	if (!any_available) {
 | |
| 		any_available = true;
 | |
| 		goto refind_writable;
 | |
| 	}
 | |
| 
 | |
| 	if (inv_file) {
 | |
| 		any_available = false;
 | |
| 		cifsFileInfo_get(inv_file);
 | |
| 	}
 | |
| 
 | |
| 	spin_unlock(&cifs_inode->open_file_lock);
 | |
| 
 | |
| 	if (inv_file) {
 | |
| 		rc = cifs_reopen_file(inv_file, false);
 | |
| 		if (!rc) {
 | |
| 			*ret_file = inv_file;
 | |
| 			return 0;
 | |
| 		}
 | |
| 
 | |
| 		spin_lock(&cifs_inode->open_file_lock);
 | |
| 		list_move_tail(&inv_file->flist, &cifs_inode->openFileList);
 | |
| 		spin_unlock(&cifs_inode->open_file_lock);
 | |
| 		cifsFileInfo_put(inv_file);
 | |
| 		++refind;
 | |
| 		inv_file = NULL;
 | |
| 		spin_lock(&cifs_inode->open_file_lock);
 | |
| 		goto refind_writable;
 | |
| 	}
 | |
| 
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| struct cifsFileInfo *
 | |
| find_writable_file(struct cifsInodeInfo *cifs_inode, int flags)
 | |
| {
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	int rc;
 | |
| 
 | |
| 	rc = cifs_get_writable_file(cifs_inode, flags, &cfile);
 | |
| 	if (rc)
 | |
| 		cifs_dbg(FYI, "Couldn't find writable handle rc=%d\n", rc);
 | |
| 
 | |
| 	return cfile;
 | |
| }
 | |
| 
 | |
| int
 | |
| cifs_get_writable_path(struct cifs_tcon *tcon, const char *name,
 | |
| 		       int flags,
 | |
| 		       struct cifsFileInfo **ret_file)
 | |
| {
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	void *page = alloc_dentry_path();
 | |
| 
 | |
| 	*ret_file = NULL;
 | |
| 
 | |
| 	spin_lock(&tcon->open_file_lock);
 | |
| 	list_for_each_entry(cfile, &tcon->openFileList, tlist) {
 | |
| 		struct cifsInodeInfo *cinode;
 | |
| 		const char *full_path = build_path_from_dentry(cfile->dentry, page);
 | |
| 		if (IS_ERR(full_path)) {
 | |
| 			spin_unlock(&tcon->open_file_lock);
 | |
| 			free_dentry_path(page);
 | |
| 			return PTR_ERR(full_path);
 | |
| 		}
 | |
| 		if (strcmp(full_path, name))
 | |
| 			continue;
 | |
| 
 | |
| 		cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 		spin_unlock(&tcon->open_file_lock);
 | |
| 		free_dentry_path(page);
 | |
| 		return cifs_get_writable_file(cinode, flags, ret_file);
 | |
| 	}
 | |
| 
 | |
| 	spin_unlock(&tcon->open_file_lock);
 | |
| 	free_dentry_path(page);
 | |
| 	return -ENOENT;
 | |
| }
 | |
| 
 | |
| int
 | |
| cifs_get_readable_path(struct cifs_tcon *tcon, const char *name,
 | |
| 		       struct cifsFileInfo **ret_file)
 | |
| {
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	void *page = alloc_dentry_path();
 | |
| 
 | |
| 	*ret_file = NULL;
 | |
| 
 | |
| 	spin_lock(&tcon->open_file_lock);
 | |
| 	list_for_each_entry(cfile, &tcon->openFileList, tlist) {
 | |
| 		struct cifsInodeInfo *cinode;
 | |
| 		const char *full_path = build_path_from_dentry(cfile->dentry, page);
 | |
| 		if (IS_ERR(full_path)) {
 | |
| 			spin_unlock(&tcon->open_file_lock);
 | |
| 			free_dentry_path(page);
 | |
| 			return PTR_ERR(full_path);
 | |
| 		}
 | |
| 		if (strcmp(full_path, name))
 | |
| 			continue;
 | |
| 
 | |
| 		cinode = CIFS_I(d_inode(cfile->dentry));
 | |
| 		spin_unlock(&tcon->open_file_lock);
 | |
| 		free_dentry_path(page);
 | |
| 		*ret_file = find_readable_file(cinode, 0);
 | |
| 		return *ret_file ? 0 : -ENOENT;
 | |
| 	}
 | |
| 
 | |
| 	spin_unlock(&tcon->open_file_lock);
 | |
| 	free_dentry_path(page);
 | |
| 	return -ENOENT;
 | |
| }
 | |
| 
 | |
| static int cifs_partialpagewrite(struct page *page, unsigned from, unsigned to)
 | |
| {
 | |
| 	struct address_space *mapping = page->mapping;
 | |
| 	loff_t offset = (loff_t)page->index << PAGE_SHIFT;
 | |
| 	char *write_data;
 | |
| 	int rc = -EFAULT;
 | |
| 	int bytes_written = 0;
 | |
| 	struct inode *inode;
 | |
| 	struct cifsFileInfo *open_file;
 | |
| 
 | |
| 	if (!mapping || !mapping->host)
 | |
| 		return -EFAULT;
 | |
| 
 | |
| 	inode = page->mapping->host;
 | |
| 
 | |
| 	offset += (loff_t)from;
 | |
| 	write_data = kmap(page);
 | |
| 	write_data += from;
 | |
| 
 | |
| 	if ((to > PAGE_SIZE) || (from > to)) {
 | |
| 		kunmap(page);
 | |
| 		return -EIO;
 | |
| 	}
 | |
| 
 | |
| 	/* racing with truncate? */
 | |
| 	if (offset > mapping->host->i_size) {
 | |
| 		kunmap(page);
 | |
| 		return 0; /* don't care */
 | |
| 	}
 | |
| 
 | |
| 	/* check to make sure that we are not extending the file */
 | |
| 	if (mapping->host->i_size - offset < (loff_t)to)
 | |
| 		to = (unsigned)(mapping->host->i_size - offset);
 | |
| 
 | |
| 	rc = cifs_get_writable_file(CIFS_I(mapping->host), FIND_WR_ANY,
 | |
| 				    &open_file);
 | |
| 	if (!rc) {
 | |
| 		bytes_written = cifs_write(open_file, open_file->pid,
 | |
| 					   write_data, to - from, &offset);
 | |
| 		cifsFileInfo_put(open_file);
 | |
| 		/* Does mm or vfs already set times? */
 | |
| 		inode->i_atime = inode->i_mtime = current_time(inode);
 | |
| 		if ((bytes_written > 0) && (offset))
 | |
| 			rc = 0;
 | |
| 		else if (bytes_written < 0)
 | |
| 			rc = bytes_written;
 | |
| 		else
 | |
| 			rc = -EFAULT;
 | |
| 	} else {
 | |
| 		cifs_dbg(FYI, "No writable handle for write page rc=%d\n", rc);
 | |
| 		if (!is_retryable_error(rc))
 | |
| 			rc = -EIO;
 | |
| 	}
 | |
| 
 | |
| 	kunmap(page);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static struct cifs_writedata *
 | |
| wdata_alloc_and_fillpages(pgoff_t tofind, struct address_space *mapping,
 | |
| 			  pgoff_t end, pgoff_t *index,
 | |
| 			  unsigned int *found_pages)
 | |
| {
 | |
| 	struct cifs_writedata *wdata;
 | |
| 
 | |
| 	wdata = cifs_writedata_alloc((unsigned int)tofind,
 | |
| 				     cifs_writev_complete);
 | |
| 	if (!wdata)
 | |
| 		return NULL;
 | |
| 
 | |
| 	*found_pages = find_get_pages_range_tag(mapping, index, end,
 | |
| 				PAGECACHE_TAG_DIRTY, tofind, wdata->pages);
 | |
| 	return wdata;
 | |
| }
 | |
| 
 | |
| static unsigned int
 | |
| wdata_prepare_pages(struct cifs_writedata *wdata, unsigned int found_pages,
 | |
| 		    struct address_space *mapping,
 | |
| 		    struct writeback_control *wbc,
 | |
| 		    pgoff_t end, pgoff_t *index, pgoff_t *next, bool *done)
 | |
| {
 | |
| 	unsigned int nr_pages = 0, i;
 | |
| 	struct page *page;
 | |
| 
 | |
| 	for (i = 0; i < found_pages; i++) {
 | |
| 		page = wdata->pages[i];
 | |
| 		/*
 | |
| 		 * At this point we hold neither the i_pages lock nor the
 | |
| 		 * page lock: the page may be truncated or invalidated
 | |
| 		 * (changing page->mapping to NULL), or even swizzled
 | |
| 		 * back from swapper_space to tmpfs file mapping
 | |
| 		 */
 | |
| 
 | |
| 		if (nr_pages == 0)
 | |
| 			lock_page(page);
 | |
| 		else if (!trylock_page(page))
 | |
| 			break;
 | |
| 
 | |
| 		if (unlikely(page->mapping != mapping)) {
 | |
| 			unlock_page(page);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		if (!wbc->range_cyclic && page->index > end) {
 | |
| 			*done = true;
 | |
| 			unlock_page(page);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		if (*next && (page->index != *next)) {
 | |
| 			/* Not next consecutive page */
 | |
| 			unlock_page(page);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		if (wbc->sync_mode != WB_SYNC_NONE)
 | |
| 			wait_on_page_writeback(page);
 | |
| 
 | |
| 		if (PageWriteback(page) ||
 | |
| 				!clear_page_dirty_for_io(page)) {
 | |
| 			unlock_page(page);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * This actually clears the dirty bit in the radix tree.
 | |
| 		 * See cifs_writepage() for more commentary.
 | |
| 		 */
 | |
| 		set_page_writeback(page);
 | |
| 		if (page_offset(page) >= i_size_read(mapping->host)) {
 | |
| 			*done = true;
 | |
| 			unlock_page(page);
 | |
| 			end_page_writeback(page);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		wdata->pages[i] = page;
 | |
| 		*next = page->index + 1;
 | |
| 		++nr_pages;
 | |
| 	}
 | |
| 
 | |
| 	/* reset index to refind any pages skipped */
 | |
| 	if (nr_pages == 0)
 | |
| 		*index = wdata->pages[0]->index + 1;
 | |
| 
 | |
| 	/* put any pages we aren't going to use */
 | |
| 	for (i = nr_pages; i < found_pages; i++) {
 | |
| 		put_page(wdata->pages[i]);
 | |
| 		wdata->pages[i] = NULL;
 | |
| 	}
 | |
| 
 | |
| 	return nr_pages;
 | |
| }
 | |
| 
 | |
| static int
 | |
| wdata_send_pages(struct cifs_writedata *wdata, unsigned int nr_pages,
 | |
| 		 struct address_space *mapping, struct writeback_control *wbc)
 | |
| {
 | |
| 	int rc;
 | |
| 
 | |
| 	wdata->sync_mode = wbc->sync_mode;
 | |
| 	wdata->nr_pages = nr_pages;
 | |
| 	wdata->offset = page_offset(wdata->pages[0]);
 | |
| 	wdata->pagesz = PAGE_SIZE;
 | |
| 	wdata->tailsz = min(i_size_read(mapping->host) -
 | |
| 			page_offset(wdata->pages[nr_pages - 1]),
 | |
| 			(loff_t)PAGE_SIZE);
 | |
| 	wdata->bytes = ((nr_pages - 1) * PAGE_SIZE) + wdata->tailsz;
 | |
| 	wdata->pid = wdata->cfile->pid;
 | |
| 
 | |
| 	rc = adjust_credits(wdata->server, &wdata->credits, wdata->bytes);
 | |
| 	if (rc)
 | |
| 		return rc;
 | |
| 
 | |
| 	if (wdata->cfile->invalidHandle)
 | |
| 		rc = -EAGAIN;
 | |
| 	else
 | |
| 		rc = wdata->server->ops->async_writev(wdata,
 | |
| 						      cifs_writedata_release);
 | |
| 
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int cifs_writepages(struct address_space *mapping,
 | |
| 			   struct writeback_control *wbc)
 | |
| {
 | |
| 	struct inode *inode = mapping->host;
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	bool done = false, scanned = false, range_whole = false;
 | |
| 	pgoff_t end, index;
 | |
| 	struct cifs_writedata *wdata;
 | |
| 	struct cifsFileInfo *cfile = NULL;
 | |
| 	int rc = 0;
 | |
| 	int saved_rc = 0;
 | |
| 	unsigned int xid;
 | |
| 
 | |
| 	/*
 | |
| 	 * If wsize is smaller than the page cache size, default to writing
 | |
| 	 * one page at a time via cifs_writepage
 | |
| 	 */
 | |
| 	if (cifs_sb->ctx->wsize < PAGE_SIZE)
 | |
| 		return generic_writepages(mapping, wbc);
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 	if (wbc->range_cyclic) {
 | |
| 		index = mapping->writeback_index; /* Start from prev offset */
 | |
| 		end = -1;
 | |
| 	} else {
 | |
| 		index = wbc->range_start >> PAGE_SHIFT;
 | |
| 		end = wbc->range_end >> PAGE_SHIFT;
 | |
| 		if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
 | |
| 			range_whole = true;
 | |
| 		scanned = true;
 | |
| 	}
 | |
| 	server = cifs_pick_channel(cifs_sb_master_tcon(cifs_sb)->ses);
 | |
| 
 | |
| retry:
 | |
| 	while (!done && index <= end) {
 | |
| 		unsigned int i, nr_pages, found_pages, wsize;
 | |
| 		pgoff_t next = 0, tofind, saved_index = index;
 | |
| 		struct cifs_credits credits_on_stack;
 | |
| 		struct cifs_credits *credits = &credits_on_stack;
 | |
| 		int get_file_rc = 0;
 | |
| 
 | |
| 		if (cfile)
 | |
| 			cifsFileInfo_put(cfile);
 | |
| 
 | |
| 		rc = cifs_get_writable_file(CIFS_I(inode), FIND_WR_ANY, &cfile);
 | |
| 
 | |
| 		/* in case of an error store it to return later */
 | |
| 		if (rc)
 | |
| 			get_file_rc = rc;
 | |
| 
 | |
| 		rc = server->ops->wait_mtu_credits(server, cifs_sb->ctx->wsize,
 | |
| 						   &wsize, credits);
 | |
| 		if (rc != 0) {
 | |
| 			done = true;
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		tofind = min((wsize / PAGE_SIZE) - 1, end - index) + 1;
 | |
| 
 | |
| 		wdata = wdata_alloc_and_fillpages(tofind, mapping, end, &index,
 | |
| 						  &found_pages);
 | |
| 		if (!wdata) {
 | |
| 			rc = -ENOMEM;
 | |
| 			done = true;
 | |
| 			add_credits_and_wake_if(server, credits, 0);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		if (found_pages == 0) {
 | |
| 			kref_put(&wdata->refcount, cifs_writedata_release);
 | |
| 			add_credits_and_wake_if(server, credits, 0);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		nr_pages = wdata_prepare_pages(wdata, found_pages, mapping, wbc,
 | |
| 					       end, &index, &next, &done);
 | |
| 
 | |
| 		/* nothing to write? */
 | |
| 		if (nr_pages == 0) {
 | |
| 			kref_put(&wdata->refcount, cifs_writedata_release);
 | |
| 			add_credits_and_wake_if(server, credits, 0);
 | |
| 			continue;
 | |
| 		}
 | |
| 
 | |
| 		wdata->credits = credits_on_stack;
 | |
| 		wdata->cfile = cfile;
 | |
| 		wdata->server = server;
 | |
| 		cfile = NULL;
 | |
| 
 | |
| 		if (!wdata->cfile) {
 | |
| 			cifs_dbg(VFS, "No writable handle in writepages rc=%d\n",
 | |
| 				 get_file_rc);
 | |
| 			if (is_retryable_error(get_file_rc))
 | |
| 				rc = get_file_rc;
 | |
| 			else
 | |
| 				rc = -EBADF;
 | |
| 		} else
 | |
| 			rc = wdata_send_pages(wdata, nr_pages, mapping, wbc);
 | |
| 
 | |
| 		for (i = 0; i < nr_pages; ++i)
 | |
| 			unlock_page(wdata->pages[i]);
 | |
| 
 | |
| 		/* send failure -- clean up the mess */
 | |
| 		if (rc != 0) {
 | |
| 			add_credits_and_wake_if(server, &wdata->credits, 0);
 | |
| 			for (i = 0; i < nr_pages; ++i) {
 | |
| 				if (is_retryable_error(rc))
 | |
| 					redirty_page_for_writepage(wbc,
 | |
| 							   wdata->pages[i]);
 | |
| 				else
 | |
| 					SetPageError(wdata->pages[i]);
 | |
| 				end_page_writeback(wdata->pages[i]);
 | |
| 				put_page(wdata->pages[i]);
 | |
| 			}
 | |
| 			if (!is_retryable_error(rc))
 | |
| 				mapping_set_error(mapping, rc);
 | |
| 		}
 | |
| 		kref_put(&wdata->refcount, cifs_writedata_release);
 | |
| 
 | |
| 		if (wbc->sync_mode == WB_SYNC_ALL && rc == -EAGAIN) {
 | |
| 			index = saved_index;
 | |
| 			continue;
 | |
| 		}
 | |
| 
 | |
| 		/* Return immediately if we received a signal during writing */
 | |
| 		if (is_interrupt_error(rc)) {
 | |
| 			done = true;
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		if (rc != 0 && saved_rc == 0)
 | |
| 			saved_rc = rc;
 | |
| 
 | |
| 		wbc->nr_to_write -= nr_pages;
 | |
| 		if (wbc->nr_to_write <= 0)
 | |
| 			done = true;
 | |
| 
 | |
| 		index = next;
 | |
| 	}
 | |
| 
 | |
| 	if (!scanned && !done) {
 | |
| 		/*
 | |
| 		 * We hit the last page and there is more work to be done: wrap
 | |
| 		 * back to the start of the file
 | |
| 		 */
 | |
| 		scanned = true;
 | |
| 		index = 0;
 | |
| 		goto retry;
 | |
| 	}
 | |
| 
 | |
| 	if (saved_rc != 0)
 | |
| 		rc = saved_rc;
 | |
| 
 | |
| 	if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
 | |
| 		mapping->writeback_index = index;
 | |
| 
 | |
| 	if (cfile)
 | |
| 		cifsFileInfo_put(cfile);
 | |
| 	free_xid(xid);
 | |
| 	/* Indication to update ctime and mtime as close is deferred */
 | |
| 	set_bit(CIFS_INO_MODIFIED_ATTR, &CIFS_I(inode)->flags);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_writepage_locked(struct page *page, struct writeback_control *wbc)
 | |
| {
 | |
| 	int rc;
 | |
| 	unsigned int xid;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| /* BB add check for wbc flags */
 | |
| 	get_page(page);
 | |
| 	if (!PageUptodate(page))
 | |
| 		cifs_dbg(FYI, "ppw - page not up to date\n");
 | |
| 
 | |
| 	/*
 | |
| 	 * Set the "writeback" flag, and clear "dirty" in the radix tree.
 | |
| 	 *
 | |
| 	 * A writepage() implementation always needs to do either this,
 | |
| 	 * or re-dirty the page with "redirty_page_for_writepage()" in
 | |
| 	 * the case of a failure.
 | |
| 	 *
 | |
| 	 * Just unlocking the page will cause the radix tree tag-bits
 | |
| 	 * to fail to update with the state of the page correctly.
 | |
| 	 */
 | |
| 	set_page_writeback(page);
 | |
| retry_write:
 | |
| 	rc = cifs_partialpagewrite(page, 0, PAGE_SIZE);
 | |
| 	if (is_retryable_error(rc)) {
 | |
| 		if (wbc->sync_mode == WB_SYNC_ALL && rc == -EAGAIN)
 | |
| 			goto retry_write;
 | |
| 		redirty_page_for_writepage(wbc, page);
 | |
| 	} else if (rc != 0) {
 | |
| 		SetPageError(page);
 | |
| 		mapping_set_error(page->mapping, rc);
 | |
| 	} else {
 | |
| 		SetPageUptodate(page);
 | |
| 	}
 | |
| 	end_page_writeback(page);
 | |
| 	put_page(page);
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
/*
 * Write a page with cifs_writepage_locked(), then unlock it.  Returns the
 * rc of the write.
 */
static int cifs_writepage(struct page *page, struct writeback_control *wbc)
{
	int rc;

	rc = cifs_writepage_locked(page, wbc);
	unlock_page(page);

	return rc;
}
 | |
| 
 | |
| static int cifs_write_end(struct file *file, struct address_space *mapping,
 | |
| 			loff_t pos, unsigned len, unsigned copied,
 | |
| 			struct page *page, void *fsdata)
 | |
| {
 | |
| 	int rc;
 | |
| 	struct inode *inode = mapping->host;
 | |
| 	struct cifsFileInfo *cfile = file->private_data;
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
 | |
| 	__u32 pid;
 | |
| 
 | |
| 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
 | |
| 		pid = cfile->pid;
 | |
| 	else
 | |
| 		pid = current->tgid;
 | |
| 
 | |
| 	cifs_dbg(FYI, "write_end for page %p from pos %lld with %d bytes\n",
 | |
| 		 page, pos, copied);
 | |
| 
 | |
| 	if (PageChecked(page)) {
 | |
| 		if (copied == len)
 | |
| 			SetPageUptodate(page);
 | |
| 		ClearPageChecked(page);
 | |
| 	} else if (!PageUptodate(page) && copied == PAGE_SIZE)
 | |
| 		SetPageUptodate(page);
 | |
| 
 | |
| 	if (!PageUptodate(page)) {
 | |
| 		char *page_data;
 | |
| 		unsigned offset = pos & (PAGE_SIZE - 1);
 | |
| 		unsigned int xid;
 | |
| 
 | |
| 		xid = get_xid();
 | |
| 		/* this is probably better than directly calling
 | |
| 		   partialpage_write since in this function the file handle is
 | |
| 		   known which we might as well	leverage */
 | |
| 		/* BB check if anything else missing out of ppw
 | |
| 		   such as updating last write time */
 | |
| 		page_data = kmap(page);
 | |
| 		rc = cifs_write(cfile, pid, page_data + offset, copied, &pos);
 | |
| 		/* if (rc < 0) should we set writebehind rc? */
 | |
| 		kunmap(page);
 | |
| 
 | |
| 		free_xid(xid);
 | |
| 	} else {
 | |
| 		rc = copied;
 | |
| 		pos += copied;
 | |
| 		set_page_dirty(page);
 | |
| 	}
 | |
| 
 | |
| 	if (rc > 0) {
 | |
| 		spin_lock(&inode->i_lock);
 | |
| 		if (pos > inode->i_size) {
 | |
| 			i_size_write(inode, pos);
 | |
| 			inode->i_blocks = (512 - 1 + pos) >> 9;
 | |
| 		}
 | |
| 		spin_unlock(&inode->i_lock);
 | |
| 	}
 | |
| 
 | |
| 	unlock_page(page);
 | |
| 	put_page(page);
 | |
| 	/* Indication to update ctime and mtime as close is deferred */
 | |
| 	set_bit(CIFS_INO_MODIFIED_ATTR, &CIFS_I(inode)->flags);
 | |
| 
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| int cifs_strict_fsync(struct file *file, loff_t start, loff_t end,
 | |
| 		      int datasync)
 | |
| {
 | |
| 	unsigned int xid;
 | |
| 	int rc = 0;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	struct cifsFileInfo *smbfile = file->private_data;
 | |
| 	struct inode *inode = file_inode(file);
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
 | |
| 
 | |
| 	rc = file_write_and_wait_range(file, start, end);
 | |
| 	if (rc) {
 | |
| 		trace_cifs_fsync_err(inode->i_ino, rc);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	cifs_dbg(FYI, "Sync file - name: %pD datasync: 0x%x\n",
 | |
| 		 file, datasync);
 | |
| 
 | |
| 	if (!CIFS_CACHE_READ(CIFS_I(inode))) {
 | |
| 		rc = cifs_zap_mapping(inode);
 | |
| 		if (rc) {
 | |
| 			cifs_dbg(FYI, "rc: %d during invalidate phase\n", rc);
 | |
| 			rc = 0; /* don't care about it in fsync */
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	tcon = tlink_tcon(smbfile->tlink);
 | |
| 	if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOSSYNC)) {
 | |
| 		server = tcon->ses->server;
 | |
| 		if (server->ops->flush)
 | |
| 			rc = server->ops->flush(xid, tcon, &smbfile->fid);
 | |
| 		else
 | |
| 			rc = -ENOSYS;
 | |
| 	}
 | |
| 
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| int cifs_fsync(struct file *file, loff_t start, loff_t end, int datasync)
 | |
| {
 | |
| 	unsigned int xid;
 | |
| 	int rc = 0;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	struct cifsFileInfo *smbfile = file->private_data;
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_FILE_SB(file);
 | |
| 
 | |
| 	rc = file_write_and_wait_range(file, start, end);
 | |
| 	if (rc) {
 | |
| 		trace_cifs_fsync_err(file_inode(file)->i_ino, rc);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	cifs_dbg(FYI, "Sync file - name: %pD datasync: 0x%x\n",
 | |
| 		 file, datasync);
 | |
| 
 | |
| 	tcon = tlink_tcon(smbfile->tlink);
 | |
| 	if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOSSYNC)) {
 | |
| 		server = tcon->ses->server;
 | |
| 		if (server->ops->flush)
 | |
| 			rc = server->ops->flush(xid, tcon, &smbfile->fid);
 | |
| 		else
 | |
| 			rc = -ENOSYS;
 | |
| 	}
 | |
| 
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * As file closes, flush all cached write data for this inode checking
 | |
|  * for write behind errors.
 | |
|  */
 | |
| int cifs_flush(struct file *file, fl_owner_t id)
 | |
| {
 | |
| 	struct inode *inode = file_inode(file);
 | |
| 	int rc = 0;
 | |
| 
 | |
| 	if (file->f_mode & FMODE_WRITE)
 | |
| 		rc = filemap_write_and_wait(inode->i_mapping);
 | |
| 
 | |
| 	cifs_dbg(FYI, "Flush inode %p file %p rc %d\n", inode, file, rc);
 | |
| 	if (rc)
 | |
| 		trace_cifs_flush_err(inode->i_ino, rc);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_write_allocate_pages(struct page **pages, unsigned long num_pages)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	unsigned long i;
 | |
| 
 | |
| 	for (i = 0; i < num_pages; i++) {
 | |
| 		pages[i] = alloc_page(GFP_KERNEL|__GFP_HIGHMEM);
 | |
| 		if (!pages[i]) {
 | |
| 			/*
 | |
| 			 * save number of pages we have already allocated and
 | |
| 			 * return with ENOMEM error
 | |
| 			 */
 | |
| 			num_pages = i;
 | |
| 			rc = -ENOMEM;
 | |
| 			break;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if (rc) {
 | |
| 		for (i = 0; i < num_pages; i++)
 | |
| 			put_page(pages[i]);
 | |
| 	}
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static inline
 | |
| size_t get_numpages(const size_t wsize, const size_t len, size_t *cur_len)
 | |
| {
 | |
| 	size_t num_pages;
 | |
| 	size_t clen;
 | |
| 
 | |
| 	clen = min_t(const size_t, len, wsize);
 | |
| 	num_pages = DIV_ROUND_UP(clen, PAGE_SIZE);
 | |
| 
 | |
| 	if (cur_len)
 | |
| 		*cur_len = clen;
 | |
| 
 | |
| 	return num_pages;
 | |
| }
 | |
| 
 | |
| static void
 | |
| cifs_uncached_writedata_release(struct kref *refcount)
 | |
| {
 | |
| 	int i;
 | |
| 	struct cifs_writedata *wdata = container_of(refcount,
 | |
| 					struct cifs_writedata, refcount);
 | |
| 
 | |
| 	kref_put(&wdata->ctx->refcount, cifs_aio_ctx_release);
 | |
| 	for (i = 0; i < wdata->nr_pages; i++)
 | |
| 		put_page(wdata->pages[i]);
 | |
| 	cifs_writedata_release(refcount);
 | |
| }
 | |
| 
 | |
| static void collect_uncached_write_data(struct cifs_aio_ctx *ctx);
 | |
| 
 | |
| static void
 | |
| cifs_uncached_writev_complete(struct work_struct *work)
 | |
| {
 | |
| 	struct cifs_writedata *wdata = container_of(work,
 | |
| 					struct cifs_writedata, work);
 | |
| 	struct inode *inode = d_inode(wdata->cfile->dentry);
 | |
| 	struct cifsInodeInfo *cifsi = CIFS_I(inode);
 | |
| 
 | |
| 	spin_lock(&inode->i_lock);
 | |
| 	cifs_update_eof(cifsi, wdata->offset, wdata->bytes);
 | |
| 	if (cifsi->server_eof > inode->i_size)
 | |
| 		i_size_write(inode, cifsi->server_eof);
 | |
| 	spin_unlock(&inode->i_lock);
 | |
| 
 | |
| 	complete(&wdata->done);
 | |
| 	collect_uncached_write_data(wdata->ctx);
 | |
| 	/* the below call can possibly free the last ref to aio ctx */
 | |
| 	kref_put(&wdata->refcount, cifs_uncached_writedata_release);
 | |
| }
 | |
| 
 | |
| static int
 | |
| wdata_fill_from_iovec(struct cifs_writedata *wdata, struct iov_iter *from,
 | |
| 		      size_t *len, unsigned long *num_pages)
 | |
| {
 | |
| 	size_t save_len, copied, bytes, cur_len = *len;
 | |
| 	unsigned long i, nr_pages = *num_pages;
 | |
| 
 | |
| 	save_len = cur_len;
 | |
| 	for (i = 0; i < nr_pages; i++) {
 | |
| 		bytes = min_t(const size_t, cur_len, PAGE_SIZE);
 | |
| 		copied = copy_page_from_iter(wdata->pages[i], 0, bytes, from);
 | |
| 		cur_len -= copied;
 | |
| 		/*
 | |
| 		 * If we didn't copy as much as we expected, then that
 | |
| 		 * may mean we trod into an unmapped area. Stop copying
 | |
| 		 * at that point. On the next pass through the big
 | |
| 		 * loop, we'll likely end up getting a zero-length
 | |
| 		 * write and bailing out of it.
 | |
| 		 */
 | |
| 		if (copied < bytes)
 | |
| 			break;
 | |
| 	}
 | |
| 	cur_len = save_len - cur_len;
 | |
| 	*len = cur_len;
 | |
| 
 | |
| 	/*
 | |
| 	 * If we have no data to send, then that probably means that
 | |
| 	 * the copy above failed altogether. That's most likely because
 | |
| 	 * the address in the iovec was bogus. Return -EFAULT and let
 | |
| 	 * the caller free anything we allocated and bail out.
 | |
| 	 */
 | |
| 	if (!cur_len)
 | |
| 		return -EFAULT;
 | |
| 
 | |
| 	/*
 | |
| 	 * i + 1 now represents the number of pages we actually used in
 | |
| 	 * the copy phase above.
 | |
| 	 */
 | |
| 	*num_pages = i + 1;
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_resend_wdata(struct cifs_writedata *wdata, struct list_head *wdata_list,
 | |
| 	struct cifs_aio_ctx *ctx)
 | |
| {
 | |
| 	unsigned int wsize;
 | |
| 	struct cifs_credits credits;
 | |
| 	int rc;
 | |
| 	struct TCP_Server_Info *server = wdata->server;
 | |
| 
 | |
| 	do {
 | |
| 		if (wdata->cfile->invalidHandle) {
 | |
| 			rc = cifs_reopen_file(wdata->cfile, false);
 | |
| 			if (rc == -EAGAIN)
 | |
| 				continue;
 | |
| 			else if (rc)
 | |
| 				break;
 | |
| 		}
 | |
| 
 | |
| 
 | |
| 		/*
 | |
| 		 * Wait for credits to resend this wdata.
 | |
| 		 * Note: we are attempting to resend the whole wdata not in
 | |
| 		 * segments
 | |
| 		 */
 | |
| 		do {
 | |
| 			rc = server->ops->wait_mtu_credits(server, wdata->bytes,
 | |
| 						&wsize, &credits);
 | |
| 			if (rc)
 | |
| 				goto fail;
 | |
| 
 | |
| 			if (wsize < wdata->bytes) {
 | |
| 				add_credits_and_wake_if(server, &credits, 0);
 | |
| 				msleep(1000);
 | |
| 			}
 | |
| 		} while (wsize < wdata->bytes);
 | |
| 		wdata->credits = credits;
 | |
| 
 | |
| 		rc = adjust_credits(server, &wdata->credits, wdata->bytes);
 | |
| 
 | |
| 		if (!rc) {
 | |
| 			if (wdata->cfile->invalidHandle)
 | |
| 				rc = -EAGAIN;
 | |
| 			else {
 | |
| #ifdef CONFIG_CIFS_SMB_DIRECT
 | |
| 				if (wdata->mr) {
 | |
| 					wdata->mr->need_invalidate = true;
 | |
| 					smbd_deregister_mr(wdata->mr);
 | |
| 					wdata->mr = NULL;
 | |
| 				}
 | |
| #endif
 | |
| 				rc = server->ops->async_writev(wdata,
 | |
| 					cifs_uncached_writedata_release);
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		/* If the write was successfully sent, we are done */
 | |
| 		if (!rc) {
 | |
| 			list_add_tail(&wdata->list, wdata_list);
 | |
| 			return 0;
 | |
| 		}
 | |
| 
 | |
| 		/* Roll back credits and retry if needed */
 | |
| 		add_credits_and_wake_if(server, &wdata->credits, 0);
 | |
| 	} while (rc == -EAGAIN);
 | |
| 
 | |
| fail:
 | |
| 	kref_put(&wdata->refcount, cifs_uncached_writedata_release);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_write_from_iter(loff_t offset, size_t len, struct iov_iter *from,
 | |
| 		     struct cifsFileInfo *open_file,
 | |
| 		     struct cifs_sb_info *cifs_sb, struct list_head *wdata_list,
 | |
| 		     struct cifs_aio_ctx *ctx)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	size_t cur_len;
 | |
| 	unsigned long nr_pages, num_pages, i;
 | |
| 	struct cifs_writedata *wdata;
 | |
| 	struct iov_iter saved_from = *from;
 | |
| 	loff_t saved_offset = offset;
 | |
| 	pid_t pid;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	struct page **pagevec;
 | |
| 	size_t start;
 | |
| 	unsigned int xid;
 | |
| 
 | |
| 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
 | |
| 		pid = open_file->pid;
 | |
| 	else
 | |
| 		pid = current->tgid;
 | |
| 
 | |
| 	server = cifs_pick_channel(tlink_tcon(open_file->tlink)->ses);
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	do {
 | |
| 		unsigned int wsize;
 | |
| 		struct cifs_credits credits_on_stack;
 | |
| 		struct cifs_credits *credits = &credits_on_stack;
 | |
| 
 | |
| 		if (open_file->invalidHandle) {
 | |
| 			rc = cifs_reopen_file(open_file, false);
 | |
| 			if (rc == -EAGAIN)
 | |
| 				continue;
 | |
| 			else if (rc)
 | |
| 				break;
 | |
| 		}
 | |
| 
 | |
| 		rc = server->ops->wait_mtu_credits(server, cifs_sb->ctx->wsize,
 | |
| 						   &wsize, credits);
 | |
| 		if (rc)
 | |
| 			break;
 | |
| 
 | |
| 		cur_len = min_t(const size_t, len, wsize);
 | |
| 
 | |
| 		if (ctx->direct_io) {
 | |
| 			ssize_t result;
 | |
| 
 | |
| 			result = iov_iter_get_pages_alloc(
 | |
| 				from, &pagevec, cur_len, &start);
 | |
| 			if (result < 0) {
 | |
| 				cifs_dbg(VFS,
 | |
| 					 "direct_writev couldn't get user pages (rc=%zd) iter type %d iov_offset %zd count %zd\n",
 | |
| 					 result, iov_iter_type(from),
 | |
| 					 from->iov_offset, from->count);
 | |
| 				dump_stack();
 | |
| 
 | |
| 				rc = result;
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				break;
 | |
| 			}
 | |
| 			cur_len = (size_t)result;
 | |
| 			iov_iter_advance(from, cur_len);
 | |
| 
 | |
| 			nr_pages =
 | |
| 				(cur_len + start + PAGE_SIZE - 1) / PAGE_SIZE;
 | |
| 
 | |
| 			wdata = cifs_writedata_direct_alloc(pagevec,
 | |
| 					     cifs_uncached_writev_complete);
 | |
| 			if (!wdata) {
 | |
| 				rc = -ENOMEM;
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				break;
 | |
| 			}
 | |
| 
 | |
| 
 | |
| 			wdata->page_offset = start;
 | |
| 			wdata->tailsz =
 | |
| 				nr_pages > 1 ?
 | |
| 					cur_len - (PAGE_SIZE - start) -
 | |
| 					(nr_pages - 2) * PAGE_SIZE :
 | |
| 					cur_len;
 | |
| 		} else {
 | |
| 			nr_pages = get_numpages(wsize, len, &cur_len);
 | |
| 			wdata = cifs_writedata_alloc(nr_pages,
 | |
| 					     cifs_uncached_writev_complete);
 | |
| 			if (!wdata) {
 | |
| 				rc = -ENOMEM;
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				break;
 | |
| 			}
 | |
| 
 | |
| 			rc = cifs_write_allocate_pages(wdata->pages, nr_pages);
 | |
| 			if (rc) {
 | |
| 				kvfree(wdata->pages);
 | |
| 				kfree(wdata);
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				break;
 | |
| 			}
 | |
| 
 | |
| 			num_pages = nr_pages;
 | |
| 			rc = wdata_fill_from_iovec(
 | |
| 				wdata, from, &cur_len, &num_pages);
 | |
| 			if (rc) {
 | |
| 				for (i = 0; i < nr_pages; i++)
 | |
| 					put_page(wdata->pages[i]);
 | |
| 				kvfree(wdata->pages);
 | |
| 				kfree(wdata);
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				break;
 | |
| 			}
 | |
| 
 | |
| 			/*
 | |
| 			 * Bring nr_pages down to the number of pages we
 | |
| 			 * actually used, and free any pages that we didn't use.
 | |
| 			 */
 | |
| 			for ( ; nr_pages > num_pages; nr_pages--)
 | |
| 				put_page(wdata->pages[nr_pages - 1]);
 | |
| 
 | |
| 			wdata->tailsz = cur_len - ((nr_pages - 1) * PAGE_SIZE);
 | |
| 		}
 | |
| 
 | |
| 		wdata->sync_mode = WB_SYNC_ALL;
 | |
| 		wdata->nr_pages = nr_pages;
 | |
| 		wdata->offset = (__u64)offset;
 | |
| 		wdata->cfile = cifsFileInfo_get(open_file);
 | |
| 		wdata->server = server;
 | |
| 		wdata->pid = pid;
 | |
| 		wdata->bytes = cur_len;
 | |
| 		wdata->pagesz = PAGE_SIZE;
 | |
| 		wdata->credits = credits_on_stack;
 | |
| 		wdata->ctx = ctx;
 | |
| 		kref_get(&ctx->refcount);
 | |
| 
 | |
| 		rc = adjust_credits(server, &wdata->credits, wdata->bytes);
 | |
| 
 | |
| 		if (!rc) {
 | |
| 			if (wdata->cfile->invalidHandle)
 | |
| 				rc = -EAGAIN;
 | |
| 			else
 | |
| 				rc = server->ops->async_writev(wdata,
 | |
| 					cifs_uncached_writedata_release);
 | |
| 		}
 | |
| 
 | |
| 		if (rc) {
 | |
| 			add_credits_and_wake_if(server, &wdata->credits, 0);
 | |
| 			kref_put(&wdata->refcount,
 | |
| 				 cifs_uncached_writedata_release);
 | |
| 			if (rc == -EAGAIN) {
 | |
| 				*from = saved_from;
 | |
| 				iov_iter_advance(from, offset - saved_offset);
 | |
| 				continue;
 | |
| 			}
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		list_add_tail(&wdata->list, wdata_list);
 | |
| 		offset += cur_len;
 | |
| 		len -= cur_len;
 | |
| 	} while (len > 0);
 | |
| 
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static void collect_uncached_write_data(struct cifs_aio_ctx *ctx)
 | |
| {
 | |
| 	struct cifs_writedata *wdata, *tmp;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	struct dentry *dentry = ctx->cfile->dentry;
 | |
| 	int rc;
 | |
| 
 | |
| 	tcon = tlink_tcon(ctx->cfile->tlink);
 | |
| 	cifs_sb = CIFS_SB(dentry->d_sb);
 | |
| 
 | |
| 	mutex_lock(&ctx->aio_mutex);
 | |
| 
 | |
| 	if (list_empty(&ctx->list)) {
 | |
| 		mutex_unlock(&ctx->aio_mutex);
 | |
| 		return;
 | |
| 	}
 | |
| 
 | |
| 	rc = ctx->rc;
 | |
| 	/*
 | |
| 	 * Wait for and collect replies for any successful sends in order of
 | |
| 	 * increasing offset. Once an error is hit, then return without waiting
 | |
| 	 * for any more replies.
 | |
| 	 */
 | |
| restart_loop:
 | |
| 	list_for_each_entry_safe(wdata, tmp, &ctx->list, list) {
 | |
| 		if (!rc) {
 | |
| 			if (!try_wait_for_completion(&wdata->done)) {
 | |
| 				mutex_unlock(&ctx->aio_mutex);
 | |
| 				return;
 | |
| 			}
 | |
| 
 | |
| 			if (wdata->result)
 | |
| 				rc = wdata->result;
 | |
| 			else
 | |
| 				ctx->total_len += wdata->bytes;
 | |
| 
 | |
| 			/* resend call if it's a retryable error */
 | |
| 			if (rc == -EAGAIN) {
 | |
| 				struct list_head tmp_list;
 | |
| 				struct iov_iter tmp_from = ctx->iter;
 | |
| 
 | |
| 				INIT_LIST_HEAD(&tmp_list);
 | |
| 				list_del_init(&wdata->list);
 | |
| 
 | |
| 				if (ctx->direct_io)
 | |
| 					rc = cifs_resend_wdata(
 | |
| 						wdata, &tmp_list, ctx);
 | |
| 				else {
 | |
| 					iov_iter_advance(&tmp_from,
 | |
| 						 wdata->offset - ctx->pos);
 | |
| 
 | |
| 					rc = cifs_write_from_iter(wdata->offset,
 | |
| 						wdata->bytes, &tmp_from,
 | |
| 						ctx->cfile, cifs_sb, &tmp_list,
 | |
| 						ctx);
 | |
| 
 | |
| 					kref_put(&wdata->refcount,
 | |
| 						cifs_uncached_writedata_release);
 | |
| 				}
 | |
| 
 | |
| 				list_splice(&tmp_list, &ctx->list);
 | |
| 				goto restart_loop;
 | |
| 			}
 | |
| 		}
 | |
| 		list_del_init(&wdata->list);
 | |
| 		kref_put(&wdata->refcount, cifs_uncached_writedata_release);
 | |
| 	}
 | |
| 
 | |
| 	cifs_stats_bytes_written(tcon, ctx->total_len);
 | |
| 	set_bit(CIFS_INO_INVALID_MAPPING, &CIFS_I(dentry->d_inode)->flags);
 | |
| 
 | |
| 	ctx->rc = (rc == 0) ? ctx->total_len : rc;
 | |
| 
 | |
| 	mutex_unlock(&ctx->aio_mutex);
 | |
| 
 | |
| 	if (ctx->iocb && ctx->iocb->ki_complete)
 | |
| 		ctx->iocb->ki_complete(ctx->iocb, ctx->rc, 0);
 | |
| 	else
 | |
| 		complete(&ctx->done);
 | |
| }
 | |
| 
 | |
| static ssize_t __cifs_writev(
 | |
| 	struct kiocb *iocb, struct iov_iter *from, bool direct)
 | |
| {
 | |
| 	struct file *file = iocb->ki_filp;
 | |
| 	ssize_t total_written = 0;
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	struct cifs_aio_ctx *ctx;
 | |
| 	struct iov_iter saved_from = *from;
 | |
| 	size_t len = iov_iter_count(from);
 | |
| 	int rc;
 | |
| 
 | |
| 	/*
 | |
| 	 * iov_iter_get_pages_alloc doesn't work with ITER_KVEC.
 | |
| 	 * In this case, fall back to non-direct write function.
 | |
| 	 * this could be improved by getting pages directly in ITER_KVEC
 | |
| 	 */
 | |
| 	if (direct && iov_iter_is_kvec(from)) {
 | |
| 		cifs_dbg(FYI, "use non-direct cifs_writev for kvec I/O\n");
 | |
| 		direct = false;
 | |
| 	}
 | |
| 
 | |
| 	rc = generic_write_checks(iocb, from);
 | |
| 	if (rc <= 0)
 | |
| 		return rc;
 | |
| 
 | |
| 	cifs_sb = CIFS_FILE_SB(file);
 | |
| 	cfile = file->private_data;
 | |
| 	tcon = tlink_tcon(cfile->tlink);
 | |
| 
 | |
| 	if (!tcon->ses->server->ops->async_writev)
 | |
| 		return -ENOSYS;
 | |
| 
 | |
| 	ctx = cifs_aio_ctx_alloc();
 | |
| 	if (!ctx)
 | |
| 		return -ENOMEM;
 | |
| 
 | |
| 	ctx->cfile = cifsFileInfo_get(cfile);
 | |
| 
 | |
| 	if (!is_sync_kiocb(iocb))
 | |
| 		ctx->iocb = iocb;
 | |
| 
 | |
| 	ctx->pos = iocb->ki_pos;
 | |
| 
 | |
| 	if (direct) {
 | |
| 		ctx->direct_io = true;
 | |
| 		ctx->iter = *from;
 | |
| 		ctx->len = len;
 | |
| 	} else {
 | |
| 		rc = setup_aio_ctx_iter(ctx, from, WRITE);
 | |
| 		if (rc) {
 | |
| 			kref_put(&ctx->refcount, cifs_aio_ctx_release);
 | |
| 			return rc;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	/* grab a lock here due to read response handlers can access ctx */
 | |
| 	mutex_lock(&ctx->aio_mutex);
 | |
| 
 | |
| 	rc = cifs_write_from_iter(iocb->ki_pos, ctx->len, &saved_from,
 | |
| 				  cfile, cifs_sb, &ctx->list, ctx);
 | |
| 
 | |
| 	/*
 | |
| 	 * If at least one write was successfully sent, then discard any rc
 | |
| 	 * value from the later writes. If the other write succeeds, then
 | |
| 	 * we'll end up returning whatever was written. If it fails, then
 | |
| 	 * we'll get a new rc value from that.
 | |
| 	 */
 | |
| 	if (!list_empty(&ctx->list))
 | |
| 		rc = 0;
 | |
| 
 | |
| 	mutex_unlock(&ctx->aio_mutex);
 | |
| 
 | |
| 	if (rc) {
 | |
| 		kref_put(&ctx->refcount, cifs_aio_ctx_release);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	if (!is_sync_kiocb(iocb)) {
 | |
| 		kref_put(&ctx->refcount, cifs_aio_ctx_release);
 | |
| 		return -EIOCBQUEUED;
 | |
| 	}
 | |
| 
 | |
| 	rc = wait_for_completion_killable(&ctx->done);
 | |
| 	if (rc) {
 | |
| 		mutex_lock(&ctx->aio_mutex);
 | |
| 		ctx->rc = rc = -EINTR;
 | |
| 		total_written = ctx->total_len;
 | |
| 		mutex_unlock(&ctx->aio_mutex);
 | |
| 	} else {
 | |
| 		rc = ctx->rc;
 | |
| 		total_written = ctx->total_len;
 | |
| 	}
 | |
| 
 | |
| 	kref_put(&ctx->refcount, cifs_aio_ctx_release);
 | |
| 
 | |
| 	if (unlikely(!total_written))
 | |
| 		return rc;
 | |
| 
 | |
| 	iocb->ki_pos += total_written;
 | |
| 	return total_written;
 | |
| }
 | |
| 
 | |
| ssize_t cifs_direct_writev(struct kiocb *iocb, struct iov_iter *from)
 | |
| {
 | |
| 	return __cifs_writev(iocb, from, true);
 | |
| }
 | |
| 
 | |
| ssize_t cifs_user_writev(struct kiocb *iocb, struct iov_iter *from)
 | |
| {
 | |
| 	return __cifs_writev(iocb, from, false);
 | |
| }
 | |
| 
 | |
| static ssize_t
 | |
| cifs_writev(struct kiocb *iocb, struct iov_iter *from)
 | |
| {
 | |
| 	struct file *file = iocb->ki_filp;
 | |
| 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
 | |
| 	struct inode *inode = file->f_mapping->host;
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(inode);
 | |
| 	struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
 | |
| 	ssize_t rc;
 | |
| 
 | |
| 	inode_lock(inode);
 | |
| 	/*
 | |
| 	 * We need to hold the sem to be sure nobody modifies lock list
 | |
| 	 * with a brlock that prevents writing.
 | |
| 	 */
 | |
| 	down_read(&cinode->lock_sem);
 | |
| 
 | |
| 	rc = generic_write_checks(iocb, from);
 | |
| 	if (rc <= 0)
 | |
| 		goto out;
 | |
| 
 | |
| 	if (!cifs_find_lock_conflict(cfile, iocb->ki_pos, iov_iter_count(from),
 | |
| 				     server->vals->exclusive_lock_type, 0,
 | |
| 				     NULL, CIFS_WRITE_OP))
 | |
| 		rc = __generic_file_write_iter(iocb, from);
 | |
| 	else
 | |
| 		rc = -EACCES;
 | |
| out:
 | |
| 	up_read(&cinode->lock_sem);
 | |
| 	inode_unlock(inode);
 | |
| 
 | |
| 	if (rc > 0)
 | |
| 		rc = generic_write_sync(iocb, rc);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| ssize_t
 | |
| cifs_strict_writev(struct kiocb *iocb, struct iov_iter *from)
 | |
| {
 | |
| 	struct inode *inode = file_inode(iocb->ki_filp);
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(inode);
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
 | |
| 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)
 | |
| 						iocb->ki_filp->private_data;
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	ssize_t written;
 | |
| 
 | |
| 	written = cifs_get_writer(cinode);
 | |
| 	if (written)
 | |
| 		return written;
 | |
| 
 | |
| 	if (CIFS_CACHE_WRITE(cinode)) {
 | |
| 		if (cap_unix(tcon->ses) &&
 | |
| 		(CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability))
 | |
| 		  && ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0)) {
 | |
| 			written = generic_file_write_iter(iocb, from);
 | |
| 			goto out;
 | |
| 		}
 | |
| 		written = cifs_writev(iocb, from);
 | |
| 		goto out;
 | |
| 	}
 | |
| 	/*
 | |
| 	 * For non-oplocked files in strict cache mode we need to write the data
 | |
| 	 * to the server exactly from the pos to pos+len-1 rather than flush all
 | |
| 	 * affected pages because it may cause a error with mandatory locks on
 | |
| 	 * these pages but not on the region from pos to ppos+len-1.
 | |
| 	 */
 | |
| 	written = cifs_user_writev(iocb, from);
 | |
| 	if (CIFS_CACHE_READ(cinode)) {
 | |
| 		/*
 | |
| 		 * We have read level caching and we have just sent a write
 | |
| 		 * request to the server thus making data in the cache stale.
 | |
| 		 * Zap the cache and set oplock/lease level to NONE to avoid
 | |
| 		 * reading stale data from the cache. All subsequent read
 | |
| 		 * operations will read new data from the server.
 | |
| 		 */
 | |
| 		cifs_zap_mapping(inode);
 | |
| 		cifs_dbg(FYI, "Set Oplock/Lease to NONE for inode=%p after write\n",
 | |
| 			 inode);
 | |
| 		cinode->oplock = 0;
 | |
| 	}
 | |
| out:
 | |
| 	cifs_put_writer(cinode);
 | |
| 	return written;
 | |
| }
 | |
| 
 | |
| static struct cifs_readdata *
 | |
| cifs_readdata_direct_alloc(struct page **pages, work_func_t complete)
 | |
| {
 | |
| 	struct cifs_readdata *rdata;
 | |
| 
 | |
| 	rdata = kzalloc(sizeof(*rdata), GFP_KERNEL);
 | |
| 	if (rdata != NULL) {
 | |
| 		rdata->pages = pages;
 | |
| 		kref_init(&rdata->refcount);
 | |
| 		INIT_LIST_HEAD(&rdata->list);
 | |
| 		init_completion(&rdata->done);
 | |
| 		INIT_WORK(&rdata->work, complete);
 | |
| 	}
 | |
| 
 | |
| 	return rdata;
 | |
| }
 | |
| 
 | |
| static struct cifs_readdata *
 | |
| cifs_readdata_alloc(unsigned int nr_pages, work_func_t complete)
 | |
| {
 | |
| 	struct page **pages =
 | |
| 		kcalloc(nr_pages, sizeof(struct page *), GFP_KERNEL);
 | |
| 	struct cifs_readdata *ret = NULL;
 | |
| 
 | |
| 	if (pages) {
 | |
| 		ret = cifs_readdata_direct_alloc(pages, complete);
 | |
| 		if (!ret)
 | |
| 			kfree(pages);
 | |
| 	}
 | |
| 
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| void
 | |
| cifs_readdata_release(struct kref *refcount)
 | |
| {
 | |
| 	struct cifs_readdata *rdata = container_of(refcount,
 | |
| 					struct cifs_readdata, refcount);
 | |
| #ifdef CONFIG_CIFS_SMB_DIRECT
 | |
| 	if (rdata->mr) {
 | |
| 		smbd_deregister_mr(rdata->mr);
 | |
| 		rdata->mr = NULL;
 | |
| 	}
 | |
| #endif
 | |
| 	if (rdata->cfile)
 | |
| 		cifsFileInfo_put(rdata->cfile);
 | |
| 
 | |
| 	kvfree(rdata->pages);
 | |
| 	kfree(rdata);
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_read_allocate_pages(struct cifs_readdata *rdata, unsigned int nr_pages)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	struct page *page;
 | |
| 	unsigned int i;
 | |
| 
 | |
| 	for (i = 0; i < nr_pages; i++) {
 | |
| 		page = alloc_page(GFP_KERNEL|__GFP_HIGHMEM);
 | |
| 		if (!page) {
 | |
| 			rc = -ENOMEM;
 | |
| 			break;
 | |
| 		}
 | |
| 		rdata->pages[i] = page;
 | |
| 	}
 | |
| 
 | |
| 	if (rc) {
 | |
| 		unsigned int nr_page_failed = i;
 | |
| 
 | |
| 		for (i = 0; i < nr_page_failed; i++) {
 | |
| 			put_page(rdata->pages[i]);
 | |
| 			rdata->pages[i] = NULL;
 | |
| 		}
 | |
| 	}
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static void
 | |
| cifs_uncached_readdata_release(struct kref *refcount)
 | |
| {
 | |
| 	struct cifs_readdata *rdata = container_of(refcount,
 | |
| 					struct cifs_readdata, refcount);
 | |
| 	unsigned int i;
 | |
| 
 | |
| 	kref_put(&rdata->ctx->refcount, cifs_aio_ctx_release);
 | |
| 	for (i = 0; i < rdata->nr_pages; i++) {
 | |
| 		put_page(rdata->pages[i]);
 | |
| 	}
 | |
| 	cifs_readdata_release(refcount);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * cifs_readdata_to_iov - copy data from pages in response to an iovec
 | |
|  * @rdata:	the readdata response with list of pages holding data
 | |
|  * @iter:	destination for our data
 | |
|  *
 | |
|  * This function copies data from a list of pages in a readdata response into
 | |
|  * an array of iovecs. It will first calculate where the data should go
 | |
|  * based on the info in the readdata and then copy the data into that spot.
 | |
|  */
 | |
| static int
 | |
| cifs_readdata_to_iov(struct cifs_readdata *rdata, struct iov_iter *iter)
 | |
| {
 | |
| 	size_t remaining = rdata->got_bytes;
 | |
| 	unsigned int i;
 | |
| 
 | |
| 	for (i = 0; i < rdata->nr_pages; i++) {
 | |
| 		struct page *page = rdata->pages[i];
 | |
| 		size_t copy = min_t(size_t, remaining, PAGE_SIZE);
 | |
| 		size_t written;
 | |
| 
 | |
| 		if (unlikely(iov_iter_is_pipe(iter))) {
 | |
| 			void *addr = kmap_atomic(page);
 | |
| 
 | |
| 			written = copy_to_iter(addr, copy, iter);
 | |
| 			kunmap_atomic(addr);
 | |
| 		} else
 | |
| 			written = copy_page_to_iter(page, 0, copy, iter);
 | |
| 		remaining -= written;
 | |
| 		if (written < copy && iov_iter_count(iter) > 0)
 | |
| 			break;
 | |
| 	}
 | |
| 	return remaining ? -EFAULT : 0;
 | |
| }
 | |
| 
 | |
| static void collect_uncached_read_data(struct cifs_aio_ctx *ctx);
 | |
| 
 | |
| static void
 | |
| cifs_uncached_readv_complete(struct work_struct *work)
 | |
| {
 | |
| 	struct cifs_readdata *rdata = container_of(work,
 | |
| 						struct cifs_readdata, work);
 | |
| 
 | |
| 	complete(&rdata->done);
 | |
| 	collect_uncached_read_data(rdata->ctx);
 | |
| 	/* the below call can possibly free the last ref to aio ctx */
 | |
| 	kref_put(&rdata->refcount, cifs_uncached_readdata_release);
 | |
| }
 | |
| 
 | |
| static int
 | |
| uncached_fill_pages(struct TCP_Server_Info *server,
 | |
| 		    struct cifs_readdata *rdata, struct iov_iter *iter,
 | |
| 		    unsigned int len)
 | |
| {
 | |
| 	int result = 0;
 | |
| 	unsigned int i;
 | |
| 	unsigned int nr_pages = rdata->nr_pages;
 | |
| 	unsigned int page_offset = rdata->page_offset;
 | |
| 
 | |
| 	rdata->got_bytes = 0;
 | |
| 	rdata->tailsz = PAGE_SIZE;
 | |
| 	for (i = 0; i < nr_pages; i++) {
 | |
| 		struct page *page = rdata->pages[i];
 | |
| 		size_t n;
 | |
| 		unsigned int segment_size = rdata->pagesz;
 | |
| 
 | |
| 		if (i == 0)
 | |
| 			segment_size -= page_offset;
 | |
| 		else
 | |
| 			page_offset = 0;
 | |
| 
 | |
| 
 | |
| 		if (len <= 0) {
 | |
| 			/* no need to hold page hostage */
 | |
| 			rdata->pages[i] = NULL;
 | |
| 			rdata->nr_pages--;
 | |
| 			put_page(page);
 | |
| 			continue;
 | |
| 		}
 | |
| 
 | |
| 		n = len;
 | |
| 		if (len >= segment_size)
 | |
| 			/* enough data to fill the page */
 | |
| 			n = segment_size;
 | |
| 		else
 | |
| 			rdata->tailsz = len;
 | |
| 		len -= n;
 | |
| 
 | |
| 		if (iter)
 | |
| 			result = copy_page_from_iter(
 | |
| 					page, page_offset, n, iter);
 | |
| #ifdef CONFIG_CIFS_SMB_DIRECT
 | |
| 		else if (rdata->mr)
 | |
| 			result = n;
 | |
| #endif
 | |
| 		else
 | |
| 			result = cifs_read_page_from_socket(
 | |
| 					server, page, page_offset, n);
 | |
| 		if (result < 0)
 | |
| 			break;
 | |
| 
 | |
| 		rdata->got_bytes += result;
 | |
| 	}
 | |
| 
 | |
| 	return rdata->got_bytes > 0 && result != -ECONNABORTED ?
 | |
| 						rdata->got_bytes : result;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_uncached_read_into_pages(struct TCP_Server_Info *server,
 | |
| 			      struct cifs_readdata *rdata, unsigned int len)
 | |
| {
 | |
| 	return uncached_fill_pages(server, rdata, NULL, len);
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_uncached_copy_into_pages(struct TCP_Server_Info *server,
 | |
| 			      struct cifs_readdata *rdata,
 | |
| 			      struct iov_iter *iter)
 | |
| {
 | |
| 	return uncached_fill_pages(server, rdata, iter, iter->count);
 | |
| }
 | |
| 
 | |
| static int cifs_resend_rdata(struct cifs_readdata *rdata,
 | |
| 			struct list_head *rdata_list,
 | |
| 			struct cifs_aio_ctx *ctx)
 | |
| {
 | |
| 	unsigned int rsize;
 | |
| 	struct cifs_credits credits;
 | |
| 	int rc;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 
 | |
| 	/* XXX: should we pick a new channel here? */
 | |
| 	server = rdata->server;
 | |
| 
 | |
| 	do {
 | |
| 		if (rdata->cfile->invalidHandle) {
 | |
| 			rc = cifs_reopen_file(rdata->cfile, true);
 | |
| 			if (rc == -EAGAIN)
 | |
| 				continue;
 | |
| 			else if (rc)
 | |
| 				break;
 | |
| 		}
 | |
| 
 | |
| 		/*
 | |
| 		 * Wait for credits to resend this rdata.
 | |
| 		 * Note: we are attempting to resend the whole rdata not in
 | |
| 		 * segments
 | |
| 		 */
 | |
| 		do {
 | |
| 			rc = server->ops->wait_mtu_credits(server, rdata->bytes,
 | |
| 						&rsize, &credits);
 | |
| 
 | |
| 			if (rc)
 | |
| 				goto fail;
 | |
| 
 | |
| 			if (rsize < rdata->bytes) {
 | |
| 				add_credits_and_wake_if(server, &credits, 0);
 | |
| 				msleep(1000);
 | |
| 			}
 | |
| 		} while (rsize < rdata->bytes);
 | |
| 		rdata->credits = credits;
 | |
| 
 | |
| 		rc = adjust_credits(server, &rdata->credits, rdata->bytes);
 | |
| 		if (!rc) {
 | |
| 			if (rdata->cfile->invalidHandle)
 | |
| 				rc = -EAGAIN;
 | |
| 			else {
 | |
| #ifdef CONFIG_CIFS_SMB_DIRECT
 | |
| 				if (rdata->mr) {
 | |
| 					rdata->mr->need_invalidate = true;
 | |
| 					smbd_deregister_mr(rdata->mr);
 | |
| 					rdata->mr = NULL;
 | |
| 				}
 | |
| #endif
 | |
| 				rc = server->ops->async_readv(rdata);
 | |
| 			}
 | |
| 		}
 | |
| 
 | |
| 		/* If the read was successfully sent, we are done */
 | |
| 		if (!rc) {
 | |
| 			/* Add to aio pending list */
 | |
| 			list_add_tail(&rdata->list, rdata_list);
 | |
| 			return 0;
 | |
| 		}
 | |
| 
 | |
| 		/* Roll back credits and retry if needed */
 | |
| 		add_credits_and_wake_if(server, &rdata->credits, 0);
 | |
| 	} while (rc == -EAGAIN);
 | |
| 
 | |
| fail:
 | |
| 	kref_put(&rdata->refcount, cifs_uncached_readdata_release);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_send_async_read(loff_t offset, size_t len, struct cifsFileInfo *open_file,
 | |
| 		     struct cifs_sb_info *cifs_sb, struct list_head *rdata_list,
 | |
| 		     struct cifs_aio_ctx *ctx)
 | |
| {
 | |
| 	struct cifs_readdata *rdata;
 | |
| 	unsigned int npages, rsize;
 | |
| 	struct cifs_credits credits_on_stack;
 | |
| 	struct cifs_credits *credits = &credits_on_stack;
 | |
| 	size_t cur_len;
 | |
| 	int rc;
 | |
| 	pid_t pid;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	struct page **pagevec;
 | |
| 	size_t start;
 | |
| 	struct iov_iter direct_iov = ctx->iter;
 | |
| 
 | |
| 	server = cifs_pick_channel(tlink_tcon(open_file->tlink)->ses);
 | |
| 
 | |
| 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
 | |
| 		pid = open_file->pid;
 | |
| 	else
 | |
| 		pid = current->tgid;
 | |
| 
 | |
| 	if (ctx->direct_io)
 | |
| 		iov_iter_advance(&direct_iov, offset - ctx->pos);
 | |
| 
 | |
| 	do {
 | |
| 		if (open_file->invalidHandle) {
 | |
| 			rc = cifs_reopen_file(open_file, true);
 | |
| 			if (rc == -EAGAIN)
 | |
| 				continue;
 | |
| 			else if (rc)
 | |
| 				break;
 | |
| 		}
 | |
| 
 | |
| 		rc = server->ops->wait_mtu_credits(server, cifs_sb->ctx->rsize,
 | |
| 						   &rsize, credits);
 | |
| 		if (rc)
 | |
| 			break;
 | |
| 
 | |
| 		cur_len = min_t(const size_t, len, rsize);
 | |
| 
 | |
| 		if (ctx->direct_io) {
 | |
| 			ssize_t result;
 | |
| 
 | |
| 			result = iov_iter_get_pages_alloc(
 | |
| 					&direct_iov, &pagevec,
 | |
| 					cur_len, &start);
 | |
| 			if (result < 0) {
 | |
| 				cifs_dbg(VFS,
 | |
| 					 "Couldn't get user pages (rc=%zd) iter type %d iov_offset %zd count %zd\n",
 | |
| 					 result, iov_iter_type(&direct_iov),
 | |
| 					 direct_iov.iov_offset,
 | |
| 					 direct_iov.count);
 | |
| 				dump_stack();
 | |
| 
 | |
| 				rc = result;
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				break;
 | |
| 			}
 | |
| 			cur_len = (size_t)result;
 | |
| 			iov_iter_advance(&direct_iov, cur_len);
 | |
| 
 | |
| 			rdata = cifs_readdata_direct_alloc(
 | |
| 					pagevec, cifs_uncached_readv_complete);
 | |
| 			if (!rdata) {
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				rc = -ENOMEM;
 | |
| 				break;
 | |
| 			}
 | |
| 
 | |
| 			npages = (cur_len + start + PAGE_SIZE-1) / PAGE_SIZE;
 | |
| 			rdata->page_offset = start;
 | |
| 			rdata->tailsz = npages > 1 ?
 | |
| 				cur_len-(PAGE_SIZE-start)-(npages-2)*PAGE_SIZE :
 | |
| 				cur_len;
 | |
| 
 | |
| 		} else {
 | |
| 
 | |
| 			npages = DIV_ROUND_UP(cur_len, PAGE_SIZE);
 | |
| 			/* allocate a readdata struct */
 | |
| 			rdata = cifs_readdata_alloc(npages,
 | |
| 					    cifs_uncached_readv_complete);
 | |
| 			if (!rdata) {
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				rc = -ENOMEM;
 | |
| 				break;
 | |
| 			}
 | |
| 
 | |
| 			rc = cifs_read_allocate_pages(rdata, npages);
 | |
| 			if (rc) {
 | |
| 				kvfree(rdata->pages);
 | |
| 				kfree(rdata);
 | |
| 				add_credits_and_wake_if(server, credits, 0);
 | |
| 				break;
 | |
| 			}
 | |
| 
 | |
| 			rdata->tailsz = PAGE_SIZE;
 | |
| 		}
 | |
| 
 | |
| 		rdata->server = server;
 | |
| 		rdata->cfile = cifsFileInfo_get(open_file);
 | |
| 		rdata->nr_pages = npages;
 | |
| 		rdata->offset = offset;
 | |
| 		rdata->bytes = cur_len;
 | |
| 		rdata->pid = pid;
 | |
| 		rdata->pagesz = PAGE_SIZE;
 | |
| 		rdata->read_into_pages = cifs_uncached_read_into_pages;
 | |
| 		rdata->copy_into_pages = cifs_uncached_copy_into_pages;
 | |
| 		rdata->credits = credits_on_stack;
 | |
| 		rdata->ctx = ctx;
 | |
| 		kref_get(&ctx->refcount);
 | |
| 
 | |
| 		rc = adjust_credits(server, &rdata->credits, rdata->bytes);
 | |
| 
 | |
| 		if (!rc) {
 | |
| 			if (rdata->cfile->invalidHandle)
 | |
| 				rc = -EAGAIN;
 | |
| 			else
 | |
| 				rc = server->ops->async_readv(rdata);
 | |
| 		}
 | |
| 
 | |
| 		if (rc) {
 | |
| 			add_credits_and_wake_if(server, &rdata->credits, 0);
 | |
| 			kref_put(&rdata->refcount,
 | |
| 				cifs_uncached_readdata_release);
 | |
| 			if (rc == -EAGAIN) {
 | |
| 				iov_iter_revert(&direct_iov, cur_len);
 | |
| 				continue;
 | |
| 			}
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		list_add_tail(&rdata->list, rdata_list);
 | |
| 		offset += cur_len;
 | |
| 		len -= cur_len;
 | |
| 	} while (len > 0);
 | |
| 
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static void
 | |
| collect_uncached_read_data(struct cifs_aio_ctx *ctx)
 | |
| {
 | |
| 	struct cifs_readdata *rdata, *tmp;
 | |
| 	struct iov_iter *to = &ctx->iter;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	int rc;
 | |
| 
 | |
| 	cifs_sb = CIFS_SB(ctx->cfile->dentry->d_sb);
 | |
| 
 | |
| 	mutex_lock(&ctx->aio_mutex);
 | |
| 
 | |
| 	if (list_empty(&ctx->list)) {
 | |
| 		mutex_unlock(&ctx->aio_mutex);
 | |
| 		return;
 | |
| 	}
 | |
| 
 | |
| 	rc = ctx->rc;
 | |
| 	/* the loop below should proceed in the order of increasing offsets */
 | |
| again:
 | |
| 	list_for_each_entry_safe(rdata, tmp, &ctx->list, list) {
 | |
| 		if (!rc) {
 | |
| 			if (!try_wait_for_completion(&rdata->done)) {
 | |
| 				mutex_unlock(&ctx->aio_mutex);
 | |
| 				return;
 | |
| 			}
 | |
| 
 | |
| 			if (rdata->result == -EAGAIN) {
 | |
| 				/* resend call if it's a retryable error */
 | |
| 				struct list_head tmp_list;
 | |
| 				unsigned int got_bytes = rdata->got_bytes;
 | |
| 
 | |
| 				list_del_init(&rdata->list);
 | |
| 				INIT_LIST_HEAD(&tmp_list);
 | |
| 
 | |
| 				/*
 | |
| 				 * Got a part of data and then reconnect has
 | |
| 				 * happened -- fill the buffer and continue
 | |
| 				 * reading.
 | |
| 				 */
 | |
| 				if (got_bytes && got_bytes < rdata->bytes) {
 | |
| 					rc = 0;
 | |
| 					if (!ctx->direct_io)
 | |
| 						rc = cifs_readdata_to_iov(rdata, to);
 | |
| 					if (rc) {
 | |
| 						kref_put(&rdata->refcount,
 | |
| 							cifs_uncached_readdata_release);
 | |
| 						continue;
 | |
| 					}
 | |
| 				}
 | |
| 
 | |
| 				if (ctx->direct_io) {
 | |
| 					/*
 | |
| 					 * Re-use rdata as this is a
 | |
| 					 * direct I/O
 | |
| 					 */
 | |
| 					rc = cifs_resend_rdata(
 | |
| 						rdata,
 | |
| 						&tmp_list, ctx);
 | |
| 				} else {
 | |
| 					rc = cifs_send_async_read(
 | |
| 						rdata->offset + got_bytes,
 | |
| 						rdata->bytes - got_bytes,
 | |
| 						rdata->cfile, cifs_sb,
 | |
| 						&tmp_list, ctx);
 | |
| 
 | |
| 					kref_put(&rdata->refcount,
 | |
| 						cifs_uncached_readdata_release);
 | |
| 				}
 | |
| 
 | |
| 				list_splice(&tmp_list, &ctx->list);
 | |
| 
 | |
| 				goto again;
 | |
| 			} else if (rdata->result)
 | |
| 				rc = rdata->result;
 | |
| 			else if (!ctx->direct_io)
 | |
| 				rc = cifs_readdata_to_iov(rdata, to);
 | |
| 
 | |
| 			/* if there was a short read -- discard anything left */
 | |
| 			if (rdata->got_bytes && rdata->got_bytes < rdata->bytes)
 | |
| 				rc = -ENODATA;
 | |
| 
 | |
| 			ctx->total_len += rdata->got_bytes;
 | |
| 		}
 | |
| 		list_del_init(&rdata->list);
 | |
| 		kref_put(&rdata->refcount, cifs_uncached_readdata_release);
 | |
| 	}
 | |
| 
 | |
| 	if (!ctx->direct_io)
 | |
| 		ctx->total_len = ctx->len - iov_iter_count(to);
 | |
| 
 | |
| 	/* mask nodata case */
 | |
| 	if (rc == -ENODATA)
 | |
| 		rc = 0;
 | |
| 
 | |
| 	ctx->rc = (rc == 0) ? (ssize_t)ctx->total_len : rc;
 | |
| 
 | |
| 	mutex_unlock(&ctx->aio_mutex);
 | |
| 
 | |
| 	if (ctx->iocb && ctx->iocb->ki_complete)
 | |
| 		ctx->iocb->ki_complete(ctx->iocb, ctx->rc, 0);
 | |
| 	else
 | |
| 		complete(&ctx->done);
 | |
| }
 | |
| 
 | |
| static ssize_t __cifs_readv(
 | |
| 	struct kiocb *iocb, struct iov_iter *to, bool direct)
 | |
| {
 | |
| 	size_t len;
 | |
| 	struct file *file = iocb->ki_filp;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	struct cifsFileInfo *cfile;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	ssize_t rc, total_read = 0;
 | |
| 	loff_t offset = iocb->ki_pos;
 | |
| 	struct cifs_aio_ctx *ctx;
 | |
| 
 | |
| 	/*
 | |
| 	 * iov_iter_get_pages_alloc() doesn't work with ITER_KVEC,
 | |
| 	 * fall back to data copy read path
 | |
| 	 * this could be improved by getting pages directly in ITER_KVEC
 | |
| 	 */
 | |
| 	if (direct && iov_iter_is_kvec(to)) {
 | |
| 		cifs_dbg(FYI, "use non-direct cifs_user_readv for kvec I/O\n");
 | |
| 		direct = false;
 | |
| 	}
 | |
| 
 | |
| 	len = iov_iter_count(to);
 | |
| 	if (!len)
 | |
| 		return 0;
 | |
| 
 | |
| 	cifs_sb = CIFS_FILE_SB(file);
 | |
| 	cfile = file->private_data;
 | |
| 	tcon = tlink_tcon(cfile->tlink);
 | |
| 
 | |
| 	if (!tcon->ses->server->ops->async_readv)
 | |
| 		return -ENOSYS;
 | |
| 
 | |
| 	if ((file->f_flags & O_ACCMODE) == O_WRONLY)
 | |
| 		cifs_dbg(FYI, "attempting read on write only file instance\n");
 | |
| 
 | |
| 	ctx = cifs_aio_ctx_alloc();
 | |
| 	if (!ctx)
 | |
| 		return -ENOMEM;
 | |
| 
 | |
| 	ctx->cfile = cifsFileInfo_get(cfile);
 | |
| 
 | |
| 	if (!is_sync_kiocb(iocb))
 | |
| 		ctx->iocb = iocb;
 | |
| 
 | |
| 	if (iter_is_iovec(to))
 | |
| 		ctx->should_dirty = true;
 | |
| 
 | |
| 	if (direct) {
 | |
| 		ctx->pos = offset;
 | |
| 		ctx->direct_io = true;
 | |
| 		ctx->iter = *to;
 | |
| 		ctx->len = len;
 | |
| 	} else {
 | |
| 		rc = setup_aio_ctx_iter(ctx, to, READ);
 | |
| 		if (rc) {
 | |
| 			kref_put(&ctx->refcount, cifs_aio_ctx_release);
 | |
| 			return rc;
 | |
| 		}
 | |
| 		len = ctx->len;
 | |
| 	}
 | |
| 
 | |
| 	/* grab a lock here due to read response handlers can access ctx */
 | |
| 	mutex_lock(&ctx->aio_mutex);
 | |
| 
 | |
| 	rc = cifs_send_async_read(offset, len, cfile, cifs_sb, &ctx->list, ctx);
 | |
| 
 | |
| 	/* if at least one read request send succeeded, then reset rc */
 | |
| 	if (!list_empty(&ctx->list))
 | |
| 		rc = 0;
 | |
| 
 | |
| 	mutex_unlock(&ctx->aio_mutex);
 | |
| 
 | |
| 	if (rc) {
 | |
| 		kref_put(&ctx->refcount, cifs_aio_ctx_release);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	if (!is_sync_kiocb(iocb)) {
 | |
| 		kref_put(&ctx->refcount, cifs_aio_ctx_release);
 | |
| 		return -EIOCBQUEUED;
 | |
| 	}
 | |
| 
 | |
| 	rc = wait_for_completion_killable(&ctx->done);
 | |
| 	if (rc) {
 | |
| 		mutex_lock(&ctx->aio_mutex);
 | |
| 		ctx->rc = rc = -EINTR;
 | |
| 		total_read = ctx->total_len;
 | |
| 		mutex_unlock(&ctx->aio_mutex);
 | |
| 	} else {
 | |
| 		rc = ctx->rc;
 | |
| 		total_read = ctx->total_len;
 | |
| 	}
 | |
| 
 | |
| 	kref_put(&ctx->refcount, cifs_aio_ctx_release);
 | |
| 
 | |
| 	if (total_read) {
 | |
| 		iocb->ki_pos += total_read;
 | |
| 		return total_read;
 | |
| 	}
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| ssize_t cifs_direct_readv(struct kiocb *iocb, struct iov_iter *to)
 | |
| {
 | |
| 	return __cifs_readv(iocb, to, true);
 | |
| }
 | |
| 
 | |
| ssize_t cifs_user_readv(struct kiocb *iocb, struct iov_iter *to)
 | |
| {
 | |
| 	return __cifs_readv(iocb, to, false);
 | |
| }
 | |
| 
 | |
| ssize_t
 | |
| cifs_strict_readv(struct kiocb *iocb, struct iov_iter *to)
 | |
| {
 | |
| 	struct inode *inode = file_inode(iocb->ki_filp);
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(inode);
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
 | |
| 	struct cifsFileInfo *cfile = (struct cifsFileInfo *)
 | |
| 						iocb->ki_filp->private_data;
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	int rc = -EACCES;
 | |
| 
 | |
| 	/*
 | |
| 	 * In strict cache mode we need to read from the server all the time
 | |
| 	 * if we don't have level II oplock because the server can delay mtime
 | |
| 	 * change - so we can't make a decision about inode invalidating.
 | |
| 	 * And we can also fail with pagereading if there are mandatory locks
 | |
| 	 * on pages affected by this read but not on the region from pos to
 | |
| 	 * pos+len-1.
 | |
| 	 */
 | |
| 	if (!CIFS_CACHE_READ(cinode))
 | |
| 		return cifs_user_readv(iocb, to);
 | |
| 
 | |
| 	if (cap_unix(tcon->ses) &&
 | |
| 	    (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
 | |
| 	    ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
 | |
| 		return generic_file_read_iter(iocb, to);
 | |
| 
 | |
| 	/*
 | |
| 	 * We need to hold the sem to be sure nobody modifies lock list
 | |
| 	 * with a brlock that prevents reading.
 | |
| 	 */
 | |
| 	down_read(&cinode->lock_sem);
 | |
| 	if (!cifs_find_lock_conflict(cfile, iocb->ki_pos, iov_iter_count(to),
 | |
| 				     tcon->ses->server->vals->shared_lock_type,
 | |
| 				     0, NULL, CIFS_READ_OP))
 | |
| 		rc = generic_file_read_iter(iocb, to);
 | |
| 	up_read(&cinode->lock_sem);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static ssize_t
 | |
| cifs_read(struct file *file, char *read_data, size_t read_size, loff_t *offset)
 | |
| {
 | |
| 	int rc = -EACCES;
 | |
| 	unsigned int bytes_read = 0;
 | |
| 	unsigned int total_read;
 | |
| 	unsigned int current_read_size;
 | |
| 	unsigned int rsize;
 | |
| 	struct cifs_sb_info *cifs_sb;
 | |
| 	struct cifs_tcon *tcon;
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	unsigned int xid;
 | |
| 	char *cur_offset;
 | |
| 	struct cifsFileInfo *open_file;
 | |
| 	struct cifs_io_parms io_parms = {0};
 | |
| 	int buf_type = CIFS_NO_BUFFER;
 | |
| 	__u32 pid;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 	cifs_sb = CIFS_FILE_SB(file);
 | |
| 
 | |
| 	/* FIXME: set up handlers for larger reads and/or convert to async */
 | |
| 	rsize = min_t(unsigned int, cifs_sb->ctx->rsize, CIFSMaxBufSize);
 | |
| 
 | |
| 	if (file->private_data == NULL) {
 | |
| 		rc = -EBADF;
 | |
| 		free_xid(xid);
 | |
| 		return rc;
 | |
| 	}
 | |
| 	open_file = file->private_data;
 | |
| 	tcon = tlink_tcon(open_file->tlink);
 | |
| 	server = cifs_pick_channel(tcon->ses);
 | |
| 
 | |
| 	if (!server->ops->sync_read) {
 | |
| 		free_xid(xid);
 | |
| 		return -ENOSYS;
 | |
| 	}
 | |
| 
 | |
| 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
 | |
| 		pid = open_file->pid;
 | |
| 	else
 | |
| 		pid = current->tgid;
 | |
| 
 | |
| 	if ((file->f_flags & O_ACCMODE) == O_WRONLY)
 | |
| 		cifs_dbg(FYI, "attempting read on write only file instance\n");
 | |
| 
 | |
| 	for (total_read = 0, cur_offset = read_data; read_size > total_read;
 | |
| 	     total_read += bytes_read, cur_offset += bytes_read) {
 | |
| 		do {
 | |
| 			current_read_size = min_t(uint, read_size - total_read,
 | |
| 						  rsize);
 | |
| 			/*
 | |
| 			 * For windows me and 9x we do not want to request more
 | |
| 			 * than it negotiated since it will refuse the read
 | |
| 			 * then.
 | |
| 			 */
 | |
| 			if (!(tcon->ses->capabilities &
 | |
| 				tcon->ses->server->vals->cap_large_files)) {
 | |
| 				current_read_size = min_t(uint,
 | |
| 					current_read_size, CIFSMaxBufSize);
 | |
| 			}
 | |
| 			if (open_file->invalidHandle) {
 | |
| 				rc = cifs_reopen_file(open_file, true);
 | |
| 				if (rc != 0)
 | |
| 					break;
 | |
| 			}
 | |
| 			io_parms.pid = pid;
 | |
| 			io_parms.tcon = tcon;
 | |
| 			io_parms.offset = *offset;
 | |
| 			io_parms.length = current_read_size;
 | |
| 			io_parms.server = server;
 | |
| 			rc = server->ops->sync_read(xid, &open_file->fid, &io_parms,
 | |
| 						    &bytes_read, &cur_offset,
 | |
| 						    &buf_type);
 | |
| 		} while (rc == -EAGAIN);
 | |
| 
 | |
| 		if (rc || (bytes_read == 0)) {
 | |
| 			if (total_read) {
 | |
| 				break;
 | |
| 			} else {
 | |
| 				free_xid(xid);
 | |
| 				return rc;
 | |
| 			}
 | |
| 		} else {
 | |
| 			cifs_stats_bytes_read(tcon, total_read);
 | |
| 			*offset += bytes_read;
 | |
| 		}
 | |
| 	}
 | |
| 	free_xid(xid);
 | |
| 	return total_read;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * If the page is mmap'ed into a process' page tables, then we need to make
 | |
|  * sure that it doesn't change while being written back.
 | |
|  */
 | |
| static vm_fault_t
 | |
| cifs_page_mkwrite(struct vm_fault *vmf)
 | |
| {
 | |
| 	struct page *page = vmf->page;
 | |
| 
 | |
| 	lock_page(page);
 | |
| 	return VM_FAULT_LOCKED;
 | |
| }
 | |
| 
 | |
| static const struct vm_operations_struct cifs_file_vm_ops = {
 | |
| 	.fault = filemap_fault,
 | |
| 	.map_pages = filemap_map_pages,
 | |
| 	.page_mkwrite = cifs_page_mkwrite,
 | |
| };
 | |
| 
 | |
| int cifs_file_strict_mmap(struct file *file, struct vm_area_struct *vma)
 | |
| {
 | |
| 	int xid, rc = 0;
 | |
| 	struct inode *inode = file_inode(file);
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	if (!CIFS_CACHE_READ(CIFS_I(inode)))
 | |
| 		rc = cifs_zap_mapping(inode);
 | |
| 	if (!rc)
 | |
| 		rc = generic_file_mmap(file, vma);
 | |
| 	if (!rc)
 | |
| 		vma->vm_ops = &cifs_file_vm_ops;
 | |
| 
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| int cifs_file_mmap(struct file *file, struct vm_area_struct *vma)
 | |
| {
 | |
| 	int rc, xid;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	rc = cifs_revalidate_file(file);
 | |
| 	if (rc)
 | |
| 		cifs_dbg(FYI, "Validation prior to mmap failed, error=%d\n",
 | |
| 			 rc);
 | |
| 	if (!rc)
 | |
| 		rc = generic_file_mmap(file, vma);
 | |
| 	if (!rc)
 | |
| 		vma->vm_ops = &cifs_file_vm_ops;
 | |
| 
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static void
 | |
| cifs_readv_complete(struct work_struct *work)
 | |
| {
 | |
| 	unsigned int i, got_bytes;
 | |
| 	struct cifs_readdata *rdata = container_of(work,
 | |
| 						struct cifs_readdata, work);
 | |
| 
 | |
| 	got_bytes = rdata->got_bytes;
 | |
| 	for (i = 0; i < rdata->nr_pages; i++) {
 | |
| 		struct page *page = rdata->pages[i];
 | |
| 
 | |
| 		lru_cache_add(page);
 | |
| 
 | |
| 		if (rdata->result == 0 ||
 | |
| 		    (rdata->result == -EAGAIN && got_bytes)) {
 | |
| 			flush_dcache_page(page);
 | |
| 			SetPageUptodate(page);
 | |
| 		}
 | |
| 
 | |
| 		unlock_page(page);
 | |
| 
 | |
| 		if (rdata->result == 0 ||
 | |
| 		    (rdata->result == -EAGAIN && got_bytes))
 | |
| 			cifs_readpage_to_fscache(rdata->mapping->host, page);
 | |
| 
 | |
| 		got_bytes -= min_t(unsigned int, PAGE_SIZE, got_bytes);
 | |
| 
 | |
| 		put_page(page);
 | |
| 		rdata->pages[i] = NULL;
 | |
| 	}
 | |
| 	kref_put(&rdata->refcount, cifs_readdata_release);
 | |
| }
 | |
| 
 | |
| static int
 | |
| readpages_fill_pages(struct TCP_Server_Info *server,
 | |
| 		     struct cifs_readdata *rdata, struct iov_iter *iter,
 | |
| 		     unsigned int len)
 | |
| {
 | |
| 	int result = 0;
 | |
| 	unsigned int i;
 | |
| 	u64 eof;
 | |
| 	pgoff_t eof_index;
 | |
| 	unsigned int nr_pages = rdata->nr_pages;
 | |
| 	unsigned int page_offset = rdata->page_offset;
 | |
| 
 | |
| 	/* determine the eof that the server (probably) has */
 | |
| 	eof = CIFS_I(rdata->mapping->host)->server_eof;
 | |
| 	eof_index = eof ? (eof - 1) >> PAGE_SHIFT : 0;
 | |
| 	cifs_dbg(FYI, "eof=%llu eof_index=%lu\n", eof, eof_index);
 | |
| 
 | |
| 	rdata->got_bytes = 0;
 | |
| 	rdata->tailsz = PAGE_SIZE;
 | |
| 	for (i = 0; i < nr_pages; i++) {
 | |
| 		struct page *page = rdata->pages[i];
 | |
| 		unsigned int to_read = rdata->pagesz;
 | |
| 		size_t n;
 | |
| 
 | |
| 		if (i == 0)
 | |
| 			to_read -= page_offset;
 | |
| 		else
 | |
| 			page_offset = 0;
 | |
| 
 | |
| 		n = to_read;
 | |
| 
 | |
| 		if (len >= to_read) {
 | |
| 			len -= to_read;
 | |
| 		} else if (len > 0) {
 | |
| 			/* enough for partial page, fill and zero the rest */
 | |
| 			zero_user(page, len + page_offset, to_read - len);
 | |
| 			n = rdata->tailsz = len;
 | |
| 			len = 0;
 | |
| 		} else if (page->index > eof_index) {
 | |
| 			/*
 | |
| 			 * The VFS will not try to do readahead past the
 | |
| 			 * i_size, but it's possible that we have outstanding
 | |
| 			 * writes with gaps in the middle and the i_size hasn't
 | |
| 			 * caught up yet. Populate those with zeroed out pages
 | |
| 			 * to prevent the VFS from repeatedly attempting to
 | |
| 			 * fill them until the writes are flushed.
 | |
| 			 */
 | |
| 			zero_user(page, 0, PAGE_SIZE);
 | |
| 			lru_cache_add(page);
 | |
| 			flush_dcache_page(page);
 | |
| 			SetPageUptodate(page);
 | |
| 			unlock_page(page);
 | |
| 			put_page(page);
 | |
| 			rdata->pages[i] = NULL;
 | |
| 			rdata->nr_pages--;
 | |
| 			continue;
 | |
| 		} else {
 | |
| 			/* no need to hold page hostage */
 | |
| 			lru_cache_add(page);
 | |
| 			unlock_page(page);
 | |
| 			put_page(page);
 | |
| 			rdata->pages[i] = NULL;
 | |
| 			rdata->nr_pages--;
 | |
| 			continue;
 | |
| 		}
 | |
| 
 | |
| 		if (iter)
 | |
| 			result = copy_page_from_iter(
 | |
| 					page, page_offset, n, iter);
 | |
| #ifdef CONFIG_CIFS_SMB_DIRECT
 | |
| 		else if (rdata->mr)
 | |
| 			result = n;
 | |
| #endif
 | |
| 		else
 | |
| 			result = cifs_read_page_from_socket(
 | |
| 					server, page, page_offset, n);
 | |
| 		if (result < 0)
 | |
| 			break;
 | |
| 
 | |
| 		rdata->got_bytes += result;
 | |
| 	}
 | |
| 
 | |
| 	return rdata->got_bytes > 0 && result != -ECONNABORTED ?
 | |
| 						rdata->got_bytes : result;
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_readpages_read_into_pages(struct TCP_Server_Info *server,
 | |
| 			       struct cifs_readdata *rdata, unsigned int len)
 | |
| {
 | |
| 	return readpages_fill_pages(server, rdata, NULL, len);
 | |
| }
 | |
| 
 | |
| static int
 | |
| cifs_readpages_copy_into_pages(struct TCP_Server_Info *server,
 | |
| 			       struct cifs_readdata *rdata,
 | |
| 			       struct iov_iter *iter)
 | |
| {
 | |
| 	return readpages_fill_pages(server, rdata, iter, iter->count);
 | |
| }
 | |
| 
 | |
| static int
 | |
| readpages_get_pages(struct address_space *mapping, struct list_head *page_list,
 | |
| 		    unsigned int rsize, struct list_head *tmplist,
 | |
| 		    unsigned int *nr_pages, loff_t *offset, unsigned int *bytes)
 | |
| {
 | |
| 	struct page *page, *tpage;
 | |
| 	unsigned int expected_index;
 | |
| 	int rc;
 | |
| 	gfp_t gfp = readahead_gfp_mask(mapping);
 | |
| 
 | |
| 	INIT_LIST_HEAD(tmplist);
 | |
| 
 | |
| 	page = lru_to_page(page_list);
 | |
| 
 | |
| 	/*
 | |
| 	 * Lock the page and put it in the cache. Since no one else
 | |
| 	 * should have access to this page, we're safe to simply set
 | |
| 	 * PG_locked without checking it first.
 | |
| 	 */
 | |
| 	__SetPageLocked(page);
 | |
| 	rc = add_to_page_cache_locked(page, mapping,
 | |
| 				      page->index, gfp);
 | |
| 
 | |
| 	/* give up if we can't stick it in the cache */
 | |
| 	if (rc) {
 | |
| 		__ClearPageLocked(page);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	/* move first page to the tmplist */
 | |
| 	*offset = (loff_t)page->index << PAGE_SHIFT;
 | |
| 	*bytes = PAGE_SIZE;
 | |
| 	*nr_pages = 1;
 | |
| 	list_move_tail(&page->lru, tmplist);
 | |
| 
 | |
| 	/* now try and add more pages onto the request */
 | |
| 	expected_index = page->index + 1;
 | |
| 	list_for_each_entry_safe_reverse(page, tpage, page_list, lru) {
 | |
| 		/* discontinuity ? */
 | |
| 		if (page->index != expected_index)
 | |
| 			break;
 | |
| 
 | |
| 		/* would this page push the read over the rsize? */
 | |
| 		if (*bytes + PAGE_SIZE > rsize)
 | |
| 			break;
 | |
| 
 | |
| 		__SetPageLocked(page);
 | |
| 		rc = add_to_page_cache_locked(page, mapping, page->index, gfp);
 | |
| 		if (rc) {
 | |
| 			__ClearPageLocked(page);
 | |
| 			break;
 | |
| 		}
 | |
| 		list_move_tail(&page->lru, tmplist);
 | |
| 		(*bytes) += PAGE_SIZE;
 | |
| 		expected_index++;
 | |
| 		(*nr_pages)++;
 | |
| 	}
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int cifs_readpages(struct file *file, struct address_space *mapping,
 | |
| 	struct list_head *page_list, unsigned num_pages)
 | |
| {
 | |
| 	int rc;
 | |
| 	int err = 0;
 | |
| 	struct list_head tmplist;
 | |
| 	struct cifsFileInfo *open_file = file->private_data;
 | |
| 	struct cifs_sb_info *cifs_sb = CIFS_FILE_SB(file);
 | |
| 	struct TCP_Server_Info *server;
 | |
| 	pid_t pid;
 | |
| 	unsigned int xid;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 	/*
 | |
| 	 * Reads as many pages as possible from fscache. Returns -ENOBUFS
 | |
| 	 * immediately if the cookie is negative
 | |
| 	 *
 | |
| 	 * After this point, every page in the list might have PG_fscache set,
 | |
| 	 * so we will need to clean that up off of every page we don't use.
 | |
| 	 */
 | |
| 	rc = cifs_readpages_from_fscache(mapping->host, mapping, page_list,
 | |
| 					 &num_pages);
 | |
| 	if (rc == 0) {
 | |
| 		free_xid(xid);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
 | |
| 		pid = open_file->pid;
 | |
| 	else
 | |
| 		pid = current->tgid;
 | |
| 
 | |
| 	rc = 0;
 | |
| 	server = cifs_pick_channel(tlink_tcon(open_file->tlink)->ses);
 | |
| 
 | |
| 	cifs_dbg(FYI, "%s: file=%p mapping=%p num_pages=%u\n",
 | |
| 		 __func__, file, mapping, num_pages);
 | |
| 
 | |
| 	/*
 | |
| 	 * Start with the page at end of list and move it to private
 | |
| 	 * list. Do the same with any following pages until we hit
 | |
| 	 * the rsize limit, hit an index discontinuity, or run out of
 | |
| 	 * pages. Issue the async read and then start the loop again
 | |
| 	 * until the list is empty.
 | |
| 	 *
 | |
| 	 * Note that list order is important. The page_list is in
 | |
| 	 * the order of declining indexes. When we put the pages in
 | |
| 	 * the rdata->pages, then we want them in increasing order.
 | |
| 	 */
 | |
| 	while (!list_empty(page_list) && !err) {
 | |
| 		unsigned int i, nr_pages, bytes, rsize;
 | |
| 		loff_t offset;
 | |
| 		struct page *page, *tpage;
 | |
| 		struct cifs_readdata *rdata;
 | |
| 		struct cifs_credits credits_on_stack;
 | |
| 		struct cifs_credits *credits = &credits_on_stack;
 | |
| 
 | |
| 		if (open_file->invalidHandle) {
 | |
| 			rc = cifs_reopen_file(open_file, true);
 | |
| 			if (rc == -EAGAIN)
 | |
| 				continue;
 | |
| 			else if (rc)
 | |
| 				break;
 | |
| 		}
 | |
| 
 | |
| 		rc = server->ops->wait_mtu_credits(server, cifs_sb->ctx->rsize,
 | |
| 						   &rsize, credits);
 | |
| 		if (rc)
 | |
| 			break;
 | |
| 
 | |
| 		/*
 | |
| 		 * Give up immediately if rsize is too small to read an entire
 | |
| 		 * page. The VFS will fall back to readpage. We should never
 | |
| 		 * reach this point however since we set ra_pages to 0 when the
 | |
| 		 * rsize is smaller than a cache page.
 | |
| 		 */
 | |
| 		if (unlikely(rsize < PAGE_SIZE)) {
 | |
| 			add_credits_and_wake_if(server, credits, 0);
 | |
| 			free_xid(xid);
 | |
| 			return 0;
 | |
| 		}
 | |
| 
 | |
| 		nr_pages = 0;
 | |
| 		err = readpages_get_pages(mapping, page_list, rsize, &tmplist,
 | |
| 					 &nr_pages, &offset, &bytes);
 | |
| 		if (!nr_pages) {
 | |
| 			add_credits_and_wake_if(server, credits, 0);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		rdata = cifs_readdata_alloc(nr_pages, cifs_readv_complete);
 | |
| 		if (!rdata) {
 | |
| 			/* best to give up if we're out of mem */
 | |
| 			list_for_each_entry_safe(page, tpage, &tmplist, lru) {
 | |
| 				list_del(&page->lru);
 | |
| 				lru_cache_add(page);
 | |
| 				unlock_page(page);
 | |
| 				put_page(page);
 | |
| 			}
 | |
| 			rc = -ENOMEM;
 | |
| 			add_credits_and_wake_if(server, credits, 0);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		rdata->cfile = cifsFileInfo_get(open_file);
 | |
| 		rdata->server = server;
 | |
| 		rdata->mapping = mapping;
 | |
| 		rdata->offset = offset;
 | |
| 		rdata->bytes = bytes;
 | |
| 		rdata->pid = pid;
 | |
| 		rdata->pagesz = PAGE_SIZE;
 | |
| 		rdata->tailsz = PAGE_SIZE;
 | |
| 		rdata->read_into_pages = cifs_readpages_read_into_pages;
 | |
| 		rdata->copy_into_pages = cifs_readpages_copy_into_pages;
 | |
| 		rdata->credits = credits_on_stack;
 | |
| 
 | |
| 		list_for_each_entry_safe(page, tpage, &tmplist, lru) {
 | |
| 			list_del(&page->lru);
 | |
| 			rdata->pages[rdata->nr_pages++] = page;
 | |
| 		}
 | |
| 
 | |
| 		rc = adjust_credits(server, &rdata->credits, rdata->bytes);
 | |
| 
 | |
| 		if (!rc) {
 | |
| 			if (rdata->cfile->invalidHandle)
 | |
| 				rc = -EAGAIN;
 | |
| 			else
 | |
| 				rc = server->ops->async_readv(rdata);
 | |
| 		}
 | |
| 
 | |
| 		if (rc) {
 | |
| 			add_credits_and_wake_if(server, &rdata->credits, 0);
 | |
| 			for (i = 0; i < rdata->nr_pages; i++) {
 | |
| 				page = rdata->pages[i];
 | |
| 				lru_cache_add(page);
 | |
| 				unlock_page(page);
 | |
| 				put_page(page);
 | |
| 			}
 | |
| 			/* Fallback to the readpage in error/reconnect cases */
 | |
| 			kref_put(&rdata->refcount, cifs_readdata_release);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 		kref_put(&rdata->refcount, cifs_readdata_release);
 | |
| 	}
 | |
| 
 | |
| 	/* Any pages that have been shown to fscache but didn't get added to
 | |
| 	 * the pagecache must be uncached before they get returned to the
 | |
| 	 * allocator.
 | |
| 	 */
 | |
| 	cifs_fscache_readpages_cancel(mapping->host, page_list);
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * cifs_readpage_worker must be called with the page pinned
 | |
|  */
 | |
| static int cifs_readpage_worker(struct file *file, struct page *page,
 | |
| 	loff_t *poffset)
 | |
| {
 | |
| 	char *read_data;
 | |
| 	int rc;
 | |
| 
 | |
| 	/* Is the page cached? */
 | |
| 	rc = cifs_readpage_from_fscache(file_inode(file), page);
 | |
| 	if (rc == 0)
 | |
| 		goto read_complete;
 | |
| 
 | |
| 	read_data = kmap(page);
 | |
| 	/* for reads over a certain size could initiate async read ahead */
 | |
| 
 | |
| 	rc = cifs_read(file, read_data, PAGE_SIZE, poffset);
 | |
| 
 | |
| 	if (rc < 0)
 | |
| 		goto io_error;
 | |
| 	else
 | |
| 		cifs_dbg(FYI, "Bytes read %d\n", rc);
 | |
| 
 | |
| 	/* we do not want atime to be less than mtime, it broke some apps */
 | |
| 	file_inode(file)->i_atime = current_time(file_inode(file));
 | |
| 	if (timespec64_compare(&(file_inode(file)->i_atime), &(file_inode(file)->i_mtime)))
 | |
| 		file_inode(file)->i_atime = file_inode(file)->i_mtime;
 | |
| 	else
 | |
| 		file_inode(file)->i_atime = current_time(file_inode(file));
 | |
| 
 | |
| 	if (PAGE_SIZE > rc)
 | |
| 		memset(read_data + rc, 0, PAGE_SIZE - rc);
 | |
| 
 | |
| 	flush_dcache_page(page);
 | |
| 	SetPageUptodate(page);
 | |
| 
 | |
| 	/* send this page to the cache */
 | |
| 	cifs_readpage_to_fscache(file_inode(file), page);
 | |
| 
 | |
| 	rc = 0;
 | |
| 
 | |
| io_error:
 | |
| 	kunmap(page);
 | |
| 	unlock_page(page);
 | |
| 
 | |
| read_complete:
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int cifs_readpage(struct file *file, struct page *page)
 | |
| {
 | |
| 	loff_t offset = (loff_t)page->index << PAGE_SHIFT;
 | |
| 	int rc = -EACCES;
 | |
| 	unsigned int xid;
 | |
| 
 | |
| 	xid = get_xid();
 | |
| 
 | |
| 	if (file->private_data == NULL) {
 | |
| 		rc = -EBADF;
 | |
| 		free_xid(xid);
 | |
| 		return rc;
 | |
| 	}
 | |
| 
 | |
| 	cifs_dbg(FYI, "readpage %p at offset %d 0x%x\n",
 | |
| 		 page, (int)offset, (int)offset);
 | |
| 
 | |
| 	rc = cifs_readpage_worker(file, page, &offset);
 | |
| 
 | |
| 	free_xid(xid);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int is_inode_writable(struct cifsInodeInfo *cifs_inode)
 | |
| {
 | |
| 	struct cifsFileInfo *open_file;
 | |
| 
 | |
| 	spin_lock(&cifs_inode->open_file_lock);
 | |
| 	list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
 | |
| 		if (OPEN_FMODE(open_file->f_flags) & FMODE_WRITE) {
 | |
| 			spin_unlock(&cifs_inode->open_file_lock);
 | |
| 			return 1;
 | |
| 		}
 | |
| 	}
 | |
| 	spin_unlock(&cifs_inode->open_file_lock);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| /* We do not want to update the file size from server for inodes
 | |
|    open for write - to avoid races with writepage extending
 | |
|    the file - in the future we could consider allowing
 | |
|    refreshing the inode only on increases in the file size
 | |
|    but this is tricky to do without racing with writebehind
 | |
|    page caching in the current Linux kernel design */
 | |
| bool is_size_safe_to_change(struct cifsInodeInfo *cifsInode, __u64 end_of_file)
 | |
| {
 | |
| 	if (!cifsInode)
 | |
| 		return true;
 | |
| 
 | |
| 	if (is_inode_writable(cifsInode)) {
 | |
| 		/* This inode is open for write at least once */
 | |
| 		struct cifs_sb_info *cifs_sb;
 | |
| 
 | |
| 		cifs_sb = CIFS_SB(cifsInode->vfs_inode.i_sb);
 | |
| 		if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_DIRECT_IO) {
 | |
| 			/* since no page cache to corrupt on directio
 | |
| 			we can change size safely */
 | |
| 			return true;
 | |
| 		}
 | |
| 
 | |
| 		if (i_size_read(&cifsInode->vfs_inode) < end_of_file)
 | |
| 			return true;
 | |
| 
 | |
| 		return false;
 | |
| 	} else
 | |
| 		return true;
 | |
| }
 | |
| 
 | |
| static int cifs_write_begin(struct file *file, struct address_space *mapping,
 | |
| 			loff_t pos, unsigned len, unsigned flags,
 | |
| 			struct page **pagep, void **fsdata)
 | |
| {
 | |
| 	int oncethru = 0;
 | |
| 	pgoff_t index = pos >> PAGE_SHIFT;
 | |
| 	loff_t offset = pos & (PAGE_SIZE - 1);
 | |
| 	loff_t page_start = pos & PAGE_MASK;
 | |
| 	loff_t i_size;
 | |
| 	struct page *page;
 | |
| 	int rc = 0;
 | |
| 
 | |
| 	cifs_dbg(FYI, "write_begin from %lld len %d\n", (long long)pos, len);
 | |
| 
 | |
| start:
 | |
| 	page = grab_cache_page_write_begin(mapping, index, flags);
 | |
| 	if (!page) {
 | |
| 		rc = -ENOMEM;
 | |
| 		goto out;
 | |
| 	}
 | |
| 
 | |
| 	if (PageUptodate(page))
 | |
| 		goto out;
 | |
| 
 | |
| 	/*
 | |
| 	 * If we write a full page it will be up to date, no need to read from
 | |
| 	 * the server. If the write is short, we'll end up doing a sync write
 | |
| 	 * instead.
 | |
| 	 */
 | |
| 	if (len == PAGE_SIZE)
 | |
| 		goto out;
 | |
| 
 | |
| 	/*
 | |
| 	 * optimize away the read when we have an oplock, and we're not
 | |
| 	 * expecting to use any of the data we'd be reading in. That
 | |
| 	 * is, when the page lies beyond the EOF, or straddles the EOF
 | |
| 	 * and the write will cover all of the existing data.
 | |
| 	 */
 | |
| 	if (CIFS_CACHE_READ(CIFS_I(mapping->host))) {
 | |
| 		i_size = i_size_read(mapping->host);
 | |
| 		if (page_start >= i_size ||
 | |
| 		    (offset == 0 && (pos + len) >= i_size)) {
 | |
| 			zero_user_segments(page, 0, offset,
 | |
| 					   offset + len,
 | |
| 					   PAGE_SIZE);
 | |
| 			/*
 | |
| 			 * PageChecked means that the parts of the page
 | |
| 			 * to which we're not writing are considered up
 | |
| 			 * to date. Once the data is copied to the
 | |
| 			 * page, it can be set uptodate.
 | |
| 			 */
 | |
| 			SetPageChecked(page);
 | |
| 			goto out;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if ((file->f_flags & O_ACCMODE) != O_WRONLY && !oncethru) {
 | |
| 		/*
 | |
| 		 * might as well read a page, it is fast enough. If we get
 | |
| 		 * an error, we don't need to return it. cifs_write_end will
 | |
| 		 * do a sync write instead since PG_uptodate isn't set.
 | |
| 		 */
 | |
| 		cifs_readpage_worker(file, page, &page_start);
 | |
| 		put_page(page);
 | |
| 		oncethru = 1;
 | |
| 		goto start;
 | |
| 	} else {
 | |
| 		/* we could try using another file handle if there is one -
 | |
| 		   but how would we lock it to prevent close of that handle
 | |
| 		   racing with this read? In any case
 | |
| 		   this will be written out by write_end so is fine */
 | |
| 	}
 | |
| out:
 | |
| 	*pagep = page;
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int cifs_release_page(struct page *page, gfp_t gfp)
 | |
| {
 | |
| 	if (PagePrivate(page))
 | |
| 		return 0;
 | |
| 
 | |
| 	return cifs_fscache_release_page(page, gfp);
 | |
| }
 | |
| 
 | |
| static void cifs_invalidate_page(struct page *page, unsigned int offset,
 | |
| 				 unsigned int length)
 | |
| {
 | |
| 	struct cifsInodeInfo *cifsi = CIFS_I(page->mapping->host);
 | |
| 
 | |
| 	if (offset == 0 && length == PAGE_SIZE)
 | |
| 		cifs_fscache_invalidate_page(page, &cifsi->vfs_inode);
 | |
| }
 | |
| 
 | |
| static int cifs_launder_page(struct page *page)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	loff_t range_start = page_offset(page);
 | |
| 	loff_t range_end = range_start + (loff_t)(PAGE_SIZE - 1);
 | |
| 	struct writeback_control wbc = {
 | |
| 		.sync_mode = WB_SYNC_ALL,
 | |
| 		.nr_to_write = 0,
 | |
| 		.range_start = range_start,
 | |
| 		.range_end = range_end,
 | |
| 	};
 | |
| 
 | |
| 	cifs_dbg(FYI, "Launder page: %p\n", page);
 | |
| 
 | |
| 	if (clear_page_dirty_for_io(page))
 | |
| 		rc = cifs_writepage_locked(page, &wbc);
 | |
| 
 | |
| 	cifs_fscache_invalidate_page(page, page->mapping->host);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| void cifs_oplock_break(struct work_struct *work)
 | |
| {
 | |
| 	struct cifsFileInfo *cfile = container_of(work, struct cifsFileInfo,
 | |
| 						  oplock_break);
 | |
| 	struct inode *inode = d_inode(cfile->dentry);
 | |
| 	struct cifsInodeInfo *cinode = CIFS_I(inode);
 | |
| 	struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
 | |
| 	struct TCP_Server_Info *server = tcon->ses->server;
 | |
| 	int rc = 0;
 | |
| 	bool purge_cache = false;
 | |
| 	bool is_deferred = false;
 | |
| 	struct cifs_deferred_close *dclose;
 | |
| 
 | |
| 	wait_on_bit(&cinode->flags, CIFS_INODE_PENDING_WRITERS,
 | |
| 			TASK_UNINTERRUPTIBLE);
 | |
| 
 | |
| 	server->ops->downgrade_oplock(server, cinode, cfile->oplock_level,
 | |
| 				      cfile->oplock_epoch, &purge_cache);
 | |
| 
 | |
| 	if (!CIFS_CACHE_WRITE(cinode) && CIFS_CACHE_READ(cinode) &&
 | |
| 						cifs_has_mand_locks(cinode)) {
 | |
| 		cifs_dbg(FYI, "Reset oplock to None for inode=%p due to mand locks\n",
 | |
| 			 inode);
 | |
| 		cinode->oplock = 0;
 | |
| 	}
 | |
| 
 | |
| 	if (inode && S_ISREG(inode->i_mode)) {
 | |
| 		if (CIFS_CACHE_READ(cinode))
 | |
| 			break_lease(inode, O_RDONLY);
 | |
| 		else
 | |
| 			break_lease(inode, O_WRONLY);
 | |
| 		rc = filemap_fdatawrite(inode->i_mapping);
 | |
| 		if (!CIFS_CACHE_READ(cinode) || purge_cache) {
 | |
| 			rc = filemap_fdatawait(inode->i_mapping);
 | |
| 			mapping_set_error(inode->i_mapping, rc);
 | |
| 			cifs_zap_mapping(inode);
 | |
| 		}
 | |
| 		cifs_dbg(FYI, "Oplock flush inode %p rc %d\n", inode, rc);
 | |
| 		if (CIFS_CACHE_WRITE(cinode))
 | |
| 			goto oplock_break_ack;
 | |
| 	}
 | |
| 
 | |
| 	rc = cifs_push_locks(cfile);
 | |
| 	if (rc)
 | |
| 		cifs_dbg(VFS, "Push locks rc = %d\n", rc);
 | |
| 
 | |
| oplock_break_ack:
 | |
| 	/*
 | |
| 	 * releasing stale oplock after recent reconnect of smb session using
 | |
| 	 * a now incorrect file handle is not a data integrity issue but do
 | |
| 	 * not bother sending an oplock release if session to server still is
 | |
| 	 * disconnected since oplock already released by the server
 | |
| 	 */
 | |
| 	if (!cfile->oplock_break_cancelled) {
 | |
| 		rc = tcon->ses->server->ops->oplock_response(tcon, &cfile->fid,
 | |
| 							     cinode);
 | |
| 		cifs_dbg(FYI, "Oplock release rc = %d\n", rc);
 | |
| 	}
 | |
| 	/*
 | |
| 	 * When oplock break is received and there are no active
 | |
| 	 * file handles but cached, then schedule deferred close immediately.
 | |
| 	 * So, new open will not use cached handle.
 | |
| 	 */
 | |
| 	spin_lock(&CIFS_I(inode)->deferred_lock);
 | |
| 	is_deferred = cifs_is_deferred_close(cfile, &dclose);
 | |
| 	if (is_deferred &&
 | |
| 	    cfile->deferred_close_scheduled &&
 | |
| 	    delayed_work_pending(&cfile->deferred)) {
 | |
| 		/*
 | |
| 		 * If there is no pending work, mod_delayed_work queues new work.
 | |
| 		 * So, Increase the ref count to avoid use-after-free.
 | |
| 		 */
 | |
| 		if (!mod_delayed_work(deferredclose_wq, &cfile->deferred, 0))
 | |
| 			cifsFileInfo_get(cfile);
 | |
| 	}
 | |
| 	spin_unlock(&CIFS_I(inode)->deferred_lock);
 | |
| 	_cifsFileInfo_put(cfile, false /* do not wait for ourself */, false);
 | |
| 	cifs_done_oplock_break(cinode);
 | |
| }
 | |
| 
 | |
/*
 * The presence of cifs_direct_io() in the address space ops vector is what
 * allows open() with O_DIRECT to succeed; it would have failed otherwise.
 *
 * In the non-cached mode (mount with cache=none), direct read and write
 * requests are shunted off, so this method should never be called.
 *
 * Direct IO is not yet supported in the cached mode.
 */
static ssize_t
cifs_direct_io(struct kiocb *iocb, struct iov_iter *iter)
{
	/*
	 * FIXME: direct IO eventually needs to be supported for mounts that
	 * are not forcedirectio. Until then every request is rejected.
	 */
	return -EINVAL;
}
 | |
| 
 | |
| static int cifs_swap_activate(struct swap_info_struct *sis,
 | |
| 			      struct file *swap_file, sector_t *span)
 | |
| {
 | |
| 	struct cifsFileInfo *cfile = swap_file->private_data;
 | |
| 	struct inode *inode = swap_file->f_mapping->host;
 | |
| 	unsigned long blocks;
 | |
| 	long long isize;
 | |
| 
 | |
| 	cifs_dbg(FYI, "swap activate\n");
 | |
| 
 | |
| 	spin_lock(&inode->i_lock);
 | |
| 	blocks = inode->i_blocks;
 | |
| 	isize = inode->i_size;
 | |
| 	spin_unlock(&inode->i_lock);
 | |
| 	if (blocks*512 < isize) {
 | |
| 		pr_warn("swap activate: swapfile has holes\n");
 | |
| 		return -EINVAL;
 | |
| 	}
 | |
| 	*span = sis->pages;
 | |
| 
 | |
| 	pr_warn_once("Swap support over SMB3 is experimental\n");
 | |
| 
 | |
| 	/*
 | |
| 	 * TODO: consider adding ACL (or documenting how) to prevent other
 | |
| 	 * users (on this or other systems) from reading it
 | |
| 	 */
 | |
| 
 | |
| 
 | |
| 	/* TODO: add sk_set_memalloc(inet) or similar */
 | |
| 
 | |
| 	if (cfile)
 | |
| 		cfile->swapfile = true;
 | |
| 	/*
 | |
| 	 * TODO: Since file already open, we can't open with DENY_ALL here
 | |
| 	 * but we could add call to grab a byte range lock to prevent others
 | |
| 	 * from reading or writing the file
 | |
| 	 */
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static void cifs_swap_deactivate(struct file *file)
 | |
| {
 | |
| 	struct cifsFileInfo *cfile = file->private_data;
 | |
| 
 | |
| 	cifs_dbg(FYI, "swap deactivate\n");
 | |
| 
 | |
| 	/* TODO: undo sk_set_memalloc(inet) will eventually be needed */
 | |
| 
 | |
| 	if (cfile)
 | |
| 		cfile->swapfile = false;
 | |
| 
 | |
| 	/* do we need to unpin (or unlock) the file */
 | |
| }
 | |
| 
 | |
| const struct address_space_operations cifs_addr_ops = {
 | |
| 	.readpage = cifs_readpage,
 | |
| 	.readpages = cifs_readpages,
 | |
| 	.writepage = cifs_writepage,
 | |
| 	.writepages = cifs_writepages,
 | |
| 	.write_begin = cifs_write_begin,
 | |
| 	.write_end = cifs_write_end,
 | |
| 	.set_page_dirty = __set_page_dirty_nobuffers,
 | |
| 	.releasepage = cifs_release_page,
 | |
| 	.direct_IO = cifs_direct_io,
 | |
| 	.invalidatepage = cifs_invalidate_page,
 | |
| 	.launder_page = cifs_launder_page,
 | |
| 	/*
 | |
| 	 * TODO: investigate and if useful we could add an cifs_migratePage
 | |
| 	 * helper (under an CONFIG_MIGRATION) in the future, and also
 | |
| 	 * investigate and add an is_dirty_writeback helper if needed
 | |
| 	 */
 | |
| 	.swap_activate = cifs_swap_activate,
 | |
| 	.swap_deactivate = cifs_swap_deactivate,
 | |
| };
 | |
| 
 | |
| /*
 | |
|  * cifs_readpages requires the server to support a buffer large enough to
 | |
|  * contain the header plus one complete page of data.  Otherwise, we need
 | |
|  * to leave cifs_readpages out of the address space operations.
 | |
|  */
 | |
| const struct address_space_operations cifs_addr_ops_smallbuf = {
 | |
| 	.readpage = cifs_readpage,
 | |
| 	.writepage = cifs_writepage,
 | |
| 	.writepages = cifs_writepages,
 | |
| 	.write_begin = cifs_write_begin,
 | |
| 	.write_end = cifs_write_end,
 | |
| 	.set_page_dirty = __set_page_dirty_nobuffers,
 | |
| 	.releasepage = cifs_release_page,
 | |
| 	.invalidatepage = cifs_invalidate_page,
 | |
| 	.launder_page = cifs_launder_page,
 | |
| };
 |