Merge tag 'pci-v3.15-changes' of git://git.kernel.org/pub/scm/linux/kernel/git/helgaa...
[deliverable/linux.git] / fs / cifs / file.c
CommitLineData
1da177e4
LT
1/*
2 * fs/cifs/file.c
3 *
4 * vfs operations that deal with files
fb8c4b14 5 *
f19159dc 6 * Copyright (C) International Business Machines Corp., 2002,2010
1da177e4 7 * Author(s): Steve French (sfrench@us.ibm.com)
7ee1af76 8 * Jeremy Allison (jra@samba.org)
1da177e4
LT
9 *
10 * This library is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU Lesser General Public License as published
12 * by the Free Software Foundation; either version 2.1 of the License, or
13 * (at your option) any later version.
14 *
15 * This library is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
18 * the GNU Lesser General Public License for more details.
19 *
20 * You should have received a copy of the GNU Lesser General Public License
21 * along with this library; if not, write to the Free Software
22 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 */
24#include <linux/fs.h>
37c0eb46 25#include <linux/backing-dev.h>
1da177e4
LT
26#include <linux/stat.h>
27#include <linux/fcntl.h>
28#include <linux/pagemap.h>
29#include <linux/pagevec.h>
37c0eb46 30#include <linux/writeback.h>
6f88cc2e 31#include <linux/task_io_accounting_ops.h>
23e7dd7d 32#include <linux/delay.h>
3bc303c2 33#include <linux/mount.h>
5a0e3ad6 34#include <linux/slab.h>
690c5e31 35#include <linux/swap.h>
1da177e4
LT
36#include <asm/div64.h>
37#include "cifsfs.h"
38#include "cifspdu.h"
39#include "cifsglob.h"
40#include "cifsproto.h"
41#include "cifs_unicode.h"
42#include "cifs_debug.h"
43#include "cifs_fs_sb.h"
9451a9a5 44#include "fscache.h"
1da177e4 45
07b92d0d 46
1da177e4
LT
47static inline int cifs_convert_flags(unsigned int flags)
48{
49 if ((flags & O_ACCMODE) == O_RDONLY)
50 return GENERIC_READ;
51 else if ((flags & O_ACCMODE) == O_WRONLY)
52 return GENERIC_WRITE;
53 else if ((flags & O_ACCMODE) == O_RDWR) {
54 /* GENERIC_ALL is too much permission to request
55 can cause unnecessary access denied on create */
56 /* return GENERIC_ALL; */
57 return (GENERIC_READ | GENERIC_WRITE);
58 }
59
e10f7b55
JL
60 return (READ_CONTROL | FILE_WRITE_ATTRIBUTES | FILE_READ_ATTRIBUTES |
61 FILE_WRITE_EA | FILE_APPEND_DATA | FILE_WRITE_DATA |
62 FILE_READ_DATA);
7fc8f4e9 63}
e10f7b55 64
608712fe 65static u32 cifs_posix_convert_flags(unsigned int flags)
7fc8f4e9 66{
608712fe 67 u32 posix_flags = 0;
e10f7b55 68
7fc8f4e9 69 if ((flags & O_ACCMODE) == O_RDONLY)
608712fe 70 posix_flags = SMB_O_RDONLY;
7fc8f4e9 71 else if ((flags & O_ACCMODE) == O_WRONLY)
608712fe
JL
72 posix_flags = SMB_O_WRONLY;
73 else if ((flags & O_ACCMODE) == O_RDWR)
74 posix_flags = SMB_O_RDWR;
75
07b92d0d 76 if (flags & O_CREAT) {
608712fe 77 posix_flags |= SMB_O_CREAT;
07b92d0d
SF
78 if (flags & O_EXCL)
79 posix_flags |= SMB_O_EXCL;
80 } else if (flags & O_EXCL)
f96637be
JP
81 cifs_dbg(FYI, "Application %s pid %d has incorrectly set O_EXCL flag but not O_CREAT on file open. Ignoring O_EXCL\n",
82 current->comm, current->tgid);
07b92d0d 83
608712fe
JL
84 if (flags & O_TRUNC)
85 posix_flags |= SMB_O_TRUNC;
86 /* be safe and imply O_SYNC for O_DSYNC */
6b2f3d1f 87 if (flags & O_DSYNC)
608712fe 88 posix_flags |= SMB_O_SYNC;
7fc8f4e9 89 if (flags & O_DIRECTORY)
608712fe 90 posix_flags |= SMB_O_DIRECTORY;
7fc8f4e9 91 if (flags & O_NOFOLLOW)
608712fe 92 posix_flags |= SMB_O_NOFOLLOW;
7fc8f4e9 93 if (flags & O_DIRECT)
608712fe 94 posix_flags |= SMB_O_DIRECT;
7fc8f4e9
SF
95
96 return posix_flags;
1da177e4
LT
97}
98
99static inline int cifs_get_disposition(unsigned int flags)
100{
101 if ((flags & (O_CREAT | O_EXCL)) == (O_CREAT | O_EXCL))
102 return FILE_CREATE;
103 else if ((flags & (O_CREAT | O_TRUNC)) == (O_CREAT | O_TRUNC))
104 return FILE_OVERWRITE_IF;
105 else if ((flags & O_CREAT) == O_CREAT)
106 return FILE_OPEN_IF;
55aa2e09
SF
107 else if ((flags & O_TRUNC) == O_TRUNC)
108 return FILE_OVERWRITE;
1da177e4
LT
109 else
110 return FILE_OPEN;
111}
112
608712fe
JL
113int cifs_posix_open(char *full_path, struct inode **pinode,
114 struct super_block *sb, int mode, unsigned int f_flags,
6d5786a3 115 __u32 *poplock, __u16 *pnetfid, unsigned int xid)
608712fe
JL
116{
117 int rc;
118 FILE_UNIX_BASIC_INFO *presp_data;
119 __u32 posix_flags = 0;
120 struct cifs_sb_info *cifs_sb = CIFS_SB(sb);
121 struct cifs_fattr fattr;
122 struct tcon_link *tlink;
96daf2b0 123 struct cifs_tcon *tcon;
608712fe 124
f96637be 125 cifs_dbg(FYI, "posix open %s\n", full_path);
608712fe
JL
126
127 presp_data = kzalloc(sizeof(FILE_UNIX_BASIC_INFO), GFP_KERNEL);
128 if (presp_data == NULL)
129 return -ENOMEM;
130
131 tlink = cifs_sb_tlink(cifs_sb);
132 if (IS_ERR(tlink)) {
133 rc = PTR_ERR(tlink);
134 goto posix_open_ret;
135 }
136
137 tcon = tlink_tcon(tlink);
138 mode &= ~current_umask();
139
140 posix_flags = cifs_posix_convert_flags(f_flags);
141 rc = CIFSPOSIXCreate(xid, tcon, posix_flags, mode, pnetfid, presp_data,
142 poplock, full_path, cifs_sb->local_nls,
143 cifs_sb->mnt_cifs_flags &
144 CIFS_MOUNT_MAP_SPECIAL_CHR);
145 cifs_put_tlink(tlink);
146
147 if (rc)
148 goto posix_open_ret;
149
150 if (presp_data->Type == cpu_to_le32(-1))
151 goto posix_open_ret; /* open ok, caller does qpathinfo */
152
153 if (!pinode)
154 goto posix_open_ret; /* caller does not need info */
155
156 cifs_unix_basic_to_fattr(&fattr, presp_data, cifs_sb);
157
158 /* get new inode and set it up */
159 if (*pinode == NULL) {
160 cifs_fill_uniqueid(sb, &fattr);
161 *pinode = cifs_iget(sb, &fattr);
162 if (!*pinode) {
163 rc = -ENOMEM;
164 goto posix_open_ret;
165 }
166 } else {
167 cifs_fattr_to_inode(*pinode, &fattr);
168 }
169
170posix_open_ret:
171 kfree(presp_data);
172 return rc;
173}
174
eeb910a6
PS
175static int
176cifs_nt_open(char *full_path, struct inode *inode, struct cifs_sb_info *cifs_sb,
fb1214e4
PS
177 struct cifs_tcon *tcon, unsigned int f_flags, __u32 *oplock,
178 struct cifs_fid *fid, unsigned int xid)
eeb910a6
PS
179{
180 int rc;
fb1214e4 181 int desired_access;
eeb910a6 182 int disposition;
3d3ea8e6 183 int create_options = CREATE_NOT_DIR;
eeb910a6 184 FILE_ALL_INFO *buf;
b8c32dbb 185 struct TCP_Server_Info *server = tcon->ses->server;
226730b4 186 struct cifs_open_parms oparms;
eeb910a6 187
b8c32dbb 188 if (!server->ops->open)
fb1214e4
PS
189 return -ENOSYS;
190
191 desired_access = cifs_convert_flags(f_flags);
eeb910a6
PS
192
193/*********************************************************************
194 * open flag mapping table:
195 *
196 * POSIX Flag CIFS Disposition
197 * ---------- ----------------
198 * O_CREAT FILE_OPEN_IF
199 * O_CREAT | O_EXCL FILE_CREATE
200 * O_CREAT | O_TRUNC FILE_OVERWRITE_IF
201 * O_TRUNC FILE_OVERWRITE
202 * none of the above FILE_OPEN
203 *
204 * Note that there is not a direct match between disposition
205 * FILE_SUPERSEDE (ie create whether or not file exists although
206 * O_CREAT | O_TRUNC is similar but truncates the existing
207 * file rather than creating a new file as FILE_SUPERSEDE does
208 * (which uses the attributes / metadata passed in on open call)
209 *?
210 *? O_SYNC is a reasonable match to CIFS writethrough flag
211 *? and the read write flags match reasonably. O_LARGEFILE
212 *? is irrelevant because largefile support is always used
213 *? by this client. Flags O_APPEND, O_DIRECT, O_DIRECTORY,
214 * O_FASYNC, O_NOFOLLOW, O_NONBLOCK need further investigation
215 *********************************************************************/
216
217 disposition = cifs_get_disposition(f_flags);
218
219 /* BB pass O_SYNC flag through on file attributes .. BB */
220
221 buf = kmalloc(sizeof(FILE_ALL_INFO), GFP_KERNEL);
222 if (!buf)
223 return -ENOMEM;
224
3d3ea8e6
SP
225 if (backup_cred(cifs_sb))
226 create_options |= CREATE_OPEN_BACKUP_INTENT;
227
226730b4
PS
228 oparms.tcon = tcon;
229 oparms.cifs_sb = cifs_sb;
230 oparms.desired_access = desired_access;
231 oparms.create_options = create_options;
232 oparms.disposition = disposition;
233 oparms.path = full_path;
234 oparms.fid = fid;
9cbc0b73 235 oparms.reconnect = false;
226730b4
PS
236
237 rc = server->ops->open(xid, &oparms, oplock, buf);
eeb910a6
PS
238
239 if (rc)
240 goto out;
241
242 if (tcon->unix_ext)
243 rc = cifs_get_inode_info_unix(&inode, full_path, inode->i_sb,
244 xid);
245 else
246 rc = cifs_get_inode_info(&inode, full_path, buf, inode->i_sb,
42eacf9e 247 xid, fid);
eeb910a6
PS
248
249out:
250 kfree(buf);
251 return rc;
252}
253
63b7d3a4
PS
254static bool
255cifs_has_mand_locks(struct cifsInodeInfo *cinode)
256{
257 struct cifs_fid_locks *cur;
258 bool has_locks = false;
259
260 down_read(&cinode->lock_sem);
261 list_for_each_entry(cur, &cinode->llist, llist) {
262 if (!list_empty(&cur->locks)) {
263 has_locks = true;
264 break;
265 }
266 }
267 up_read(&cinode->lock_sem);
268 return has_locks;
269}
270
15ecb436 271struct cifsFileInfo *
fb1214e4 272cifs_new_fileinfo(struct cifs_fid *fid, struct file *file,
15ecb436
JL
273 struct tcon_link *tlink, __u32 oplock)
274{
275 struct dentry *dentry = file->f_path.dentry;
276 struct inode *inode = dentry->d_inode;
4b4de76e
PS
277 struct cifsInodeInfo *cinode = CIFS_I(inode);
278 struct cifsFileInfo *cfile;
f45d3416 279 struct cifs_fid_locks *fdlocks;
233839b1 280 struct cifs_tcon *tcon = tlink_tcon(tlink);
63b7d3a4 281 struct TCP_Server_Info *server = tcon->ses->server;
4b4de76e
PS
282
283 cfile = kzalloc(sizeof(struct cifsFileInfo), GFP_KERNEL);
284 if (cfile == NULL)
285 return cfile;
286
f45d3416
PS
287 fdlocks = kzalloc(sizeof(struct cifs_fid_locks), GFP_KERNEL);
288 if (!fdlocks) {
289 kfree(cfile);
290 return NULL;
291 }
292
293 INIT_LIST_HEAD(&fdlocks->locks);
294 fdlocks->cfile = cfile;
295 cfile->llist = fdlocks;
1b4b55a1 296 down_write(&cinode->lock_sem);
f45d3416 297 list_add(&fdlocks->llist, &cinode->llist);
1b4b55a1 298 up_write(&cinode->lock_sem);
f45d3416 299
4b4de76e 300 cfile->count = 1;
4b4de76e
PS
301 cfile->pid = current->tgid;
302 cfile->uid = current_fsuid();
303 cfile->dentry = dget(dentry);
304 cfile->f_flags = file->f_flags;
305 cfile->invalidHandle = false;
306 cfile->tlink = cifs_get_tlink(tlink);
4b4de76e 307 INIT_WORK(&cfile->oplock_break, cifs_oplock_break);
f45d3416 308 mutex_init(&cfile->fh_mutex);
15ecb436 309
24261fc2
MG
310 cifs_sb_active(inode->i_sb);
311
63b7d3a4
PS
312 /*
313 * If the server returned a read oplock and we have mandatory brlocks,
314 * set oplock level to None.
315 */
53ef1016 316 if (server->ops->is_read_op(oplock) && cifs_has_mand_locks(cinode)) {
f96637be 317 cifs_dbg(FYI, "Reset oplock val from read to None due to mand locks\n");
63b7d3a4
PS
318 oplock = 0;
319 }
320
4477288a 321 spin_lock(&cifs_file_list_lock);
63b7d3a4 322 if (fid->pending_open->oplock != CIFS_OPLOCK_NO_CHANGE && oplock)
233839b1
PS
323 oplock = fid->pending_open->oplock;
324 list_del(&fid->pending_open->olist);
325
42873b0a 326 fid->purge_cache = false;
63b7d3a4 327 server->ops->set_fid(cfile, fid, oplock);
233839b1
PS
328
329 list_add(&cfile->tlist, &tcon->openFileList);
15ecb436
JL
330 /* if readable file instance put first in list*/
331 if (file->f_mode & FMODE_READ)
4b4de76e 332 list_add(&cfile->flist, &cinode->openFileList);
15ecb436 333 else
4b4de76e 334 list_add_tail(&cfile->flist, &cinode->openFileList);
4477288a 335 spin_unlock(&cifs_file_list_lock);
15ecb436 336
42873b0a
PS
337 if (fid->purge_cache)
338 cifs_invalidate_mapping(inode);
339
4b4de76e
PS
340 file->private_data = cfile;
341 return cfile;
15ecb436
JL
342}
343
764a1b1a
JL
344struct cifsFileInfo *
345cifsFileInfo_get(struct cifsFileInfo *cifs_file)
346{
347 spin_lock(&cifs_file_list_lock);
348 cifsFileInfo_get_locked(cifs_file);
349 spin_unlock(&cifs_file_list_lock);
350 return cifs_file;
351}
352
cdff08e7
SF
353/*
354 * Release a reference on the file private data. This may involve closing
5f6dbc9e
JL
355 * the filehandle out on the server. Must be called without holding
356 * cifs_file_list_lock.
cdff08e7 357 */
b33879aa
JL
358void cifsFileInfo_put(struct cifsFileInfo *cifs_file)
359{
e66673e3 360 struct inode *inode = cifs_file->dentry->d_inode;
96daf2b0 361 struct cifs_tcon *tcon = tlink_tcon(cifs_file->tlink);
233839b1 362 struct TCP_Server_Info *server = tcon->ses->server;
e66673e3 363 struct cifsInodeInfo *cifsi = CIFS_I(inode);
24261fc2
MG
364 struct super_block *sb = inode->i_sb;
365 struct cifs_sb_info *cifs_sb = CIFS_SB(sb);
cdff08e7 366 struct cifsLockInfo *li, *tmp;
233839b1
PS
367 struct cifs_fid fid;
368 struct cifs_pending_open open;
cdff08e7
SF
369
370 spin_lock(&cifs_file_list_lock);
5f6dbc9e 371 if (--cifs_file->count > 0) {
cdff08e7
SF
372 spin_unlock(&cifs_file_list_lock);
373 return;
374 }
375
233839b1
PS
376 if (server->ops->get_lease_key)
377 server->ops->get_lease_key(inode, &fid);
378
379 /* store open in pending opens to make sure we don't miss lease break */
380 cifs_add_pending_open_locked(&fid, cifs_file->tlink, &open);
381
cdff08e7
SF
382 /* remove it from the lists */
383 list_del(&cifs_file->flist);
384 list_del(&cifs_file->tlist);
385
386 if (list_empty(&cifsi->openFileList)) {
f96637be
JP
387 cifs_dbg(FYI, "closing last open instance for inode %p\n",
388 cifs_file->dentry->d_inode);
25364138
PS
389 /*
390 * In strict cache mode we need invalidate mapping on the last
391 * close because it may cause a error when we open this file
392 * again and get at least level II oplock.
393 */
4f8ba8a0
PS
394 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_STRICT_IO)
395 CIFS_I(inode)->invalid_mapping = true;
c6723628 396 cifs_set_oplock_level(cifsi, 0);
cdff08e7
SF
397 }
398 spin_unlock(&cifs_file_list_lock);
399
ad635942
JL
400 cancel_work_sync(&cifs_file->oplock_break);
401
cdff08e7 402 if (!tcon->need_reconnect && !cifs_file->invalidHandle) {
0ff78a22 403 struct TCP_Server_Info *server = tcon->ses->server;
6d5786a3 404 unsigned int xid;
0ff78a22 405
6d5786a3 406 xid = get_xid();
0ff78a22 407 if (server->ops->close)
760ad0ca
PS
408 server->ops->close(xid, tcon, &cifs_file->fid);
409 _free_xid(xid);
cdff08e7
SF
410 }
411
233839b1
PS
412 cifs_del_pending_open(&open);
413
f45d3416
PS
414 /*
415 * Delete any outstanding lock records. We'll lose them when the file
cdff08e7
SF
416 * is closed anyway.
417 */
1b4b55a1 418 down_write(&cifsi->lock_sem);
f45d3416 419 list_for_each_entry_safe(li, tmp, &cifs_file->llist->locks, llist) {
cdff08e7 420 list_del(&li->llist);
85160e03 421 cifs_del_lock_waiters(li);
cdff08e7 422 kfree(li);
b33879aa 423 }
f45d3416
PS
424 list_del(&cifs_file->llist->llist);
425 kfree(cifs_file->llist);
1b4b55a1 426 up_write(&cifsi->lock_sem);
cdff08e7
SF
427
428 cifs_put_tlink(cifs_file->tlink);
429 dput(cifs_file->dentry);
24261fc2 430 cifs_sb_deactive(sb);
cdff08e7 431 kfree(cifs_file);
b33879aa
JL
432}
433
1da177e4 434int cifs_open(struct inode *inode, struct file *file)
233839b1 435
1da177e4
LT
436{
437 int rc = -EACCES;
6d5786a3 438 unsigned int xid;
590a3fe0 439 __u32 oplock;
1da177e4 440 struct cifs_sb_info *cifs_sb;
b8c32dbb 441 struct TCP_Server_Info *server;
96daf2b0 442 struct cifs_tcon *tcon;
7ffec372 443 struct tcon_link *tlink;
fb1214e4 444 struct cifsFileInfo *cfile = NULL;
1da177e4 445 char *full_path = NULL;
7e12eddb 446 bool posix_open_ok = false;
fb1214e4 447 struct cifs_fid fid;
233839b1 448 struct cifs_pending_open open;
1da177e4 449
6d5786a3 450 xid = get_xid();
1da177e4
LT
451
452 cifs_sb = CIFS_SB(inode->i_sb);
7ffec372
JL
453 tlink = cifs_sb_tlink(cifs_sb);
454 if (IS_ERR(tlink)) {
6d5786a3 455 free_xid(xid);
7ffec372
JL
456 return PTR_ERR(tlink);
457 }
458 tcon = tlink_tcon(tlink);
b8c32dbb 459 server = tcon->ses->server;
1da177e4 460
e6a00296 461 full_path = build_path_from_dentry(file->f_path.dentry);
1da177e4 462 if (full_path == NULL) {
0f3bc09e 463 rc = -ENOMEM;
232341ba 464 goto out;
1da177e4
LT
465 }
466
f96637be 467 cifs_dbg(FYI, "inode = 0x%p file flags are 0x%x for %s\n",
b6b38f70 468 inode, file->f_flags, full_path);
276a74a4 469
233839b1 470 if (server->oplocks)
276a74a4
SF
471 oplock = REQ_OPLOCK;
472 else
473 oplock = 0;
474
64cc2c63 475 if (!tcon->broken_posix_open && tcon->unix_ext &&
29e20f9c
PS
476 cap_unix(tcon->ses) && (CIFS_UNIX_POSIX_PATH_OPS_CAP &
477 le64_to_cpu(tcon->fsUnixInfo.Capability))) {
276a74a4 478 /* can not refresh inode info since size could be stale */
2422f676 479 rc = cifs_posix_open(full_path, &inode, inode->i_sb,
fa588e0c 480 cifs_sb->mnt_file_mode /* ignored */,
fb1214e4 481 file->f_flags, &oplock, &fid.netfid, xid);
276a74a4 482 if (rc == 0) {
f96637be 483 cifs_dbg(FYI, "posix open succeeded\n");
7e12eddb 484 posix_open_ok = true;
64cc2c63
SF
485 } else if ((rc == -EINVAL) || (rc == -EOPNOTSUPP)) {
486 if (tcon->ses->serverNOS)
f96637be
JP
487 cifs_dbg(VFS, "server %s of type %s returned unexpected error on SMB posix open, disabling posix open support. Check if server update available.\n",
488 tcon->ses->serverName,
489 tcon->ses->serverNOS);
64cc2c63 490 tcon->broken_posix_open = true;
276a74a4
SF
491 } else if ((rc != -EIO) && (rc != -EREMOTE) &&
492 (rc != -EOPNOTSUPP)) /* path not found or net err */
493 goto out;
fb1214e4
PS
494 /*
495 * Else fallthrough to retry open the old way on network i/o
496 * or DFS errors.
497 */
276a74a4
SF
498 }
499
233839b1
PS
500 if (server->ops->get_lease_key)
501 server->ops->get_lease_key(inode, &fid);
502
503 cifs_add_pending_open(&fid, tlink, &open);
504
7e12eddb 505 if (!posix_open_ok) {
b8c32dbb
PS
506 if (server->ops->get_lease_key)
507 server->ops->get_lease_key(inode, &fid);
508
7e12eddb 509 rc = cifs_nt_open(full_path, inode, cifs_sb, tcon,
fb1214e4 510 file->f_flags, &oplock, &fid, xid);
233839b1
PS
511 if (rc) {
512 cifs_del_pending_open(&open);
7e12eddb 513 goto out;
233839b1 514 }
7e12eddb 515 }
47c78b7f 516
fb1214e4
PS
517 cfile = cifs_new_fileinfo(&fid, file, tlink, oplock);
518 if (cfile == NULL) {
b8c32dbb
PS
519 if (server->ops->close)
520 server->ops->close(xid, tcon, &fid);
233839b1 521 cifs_del_pending_open(&open);
1da177e4
LT
522 rc = -ENOMEM;
523 goto out;
524 }
1da177e4 525
9451a9a5
SJ
526 cifs_fscache_set_inode_cookie(inode, file);
527
7e12eddb 528 if ((oplock & CIFS_CREATE_ACTION) && !posix_open_ok && tcon->unix_ext) {
fb1214e4
PS
529 /*
530 * Time to set mode which we can not set earlier due to
531 * problems creating new read-only files.
532 */
7e12eddb
PS
533 struct cifs_unix_set_info_args args = {
534 .mode = inode->i_mode,
49418b2c
EB
535 .uid = INVALID_UID, /* no change */
536 .gid = INVALID_GID, /* no change */
7e12eddb
PS
537 .ctime = NO_CHANGE_64,
538 .atime = NO_CHANGE_64,
539 .mtime = NO_CHANGE_64,
540 .device = 0,
541 };
fb1214e4
PS
542 CIFSSMBUnixSetFileInfo(xid, tcon, &args, fid.netfid,
543 cfile->pid);
1da177e4
LT
544 }
545
546out:
1da177e4 547 kfree(full_path);
6d5786a3 548 free_xid(xid);
7ffec372 549 cifs_put_tlink(tlink);
1da177e4
LT
550 return rc;
551}
552
f152fd5f
PS
553static int cifs_push_posix_locks(struct cifsFileInfo *cfile);
554
2ae78ba8
PS
555/*
556 * Try to reacquire byte range locks that were released when session
f152fd5f 557 * to server was lost.
2ae78ba8 558 */
f152fd5f
PS
559static int
560cifs_relock_file(struct cifsFileInfo *cfile)
1da177e4 561{
f152fd5f
PS
562 struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
563 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
564 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
1da177e4
LT
565 int rc = 0;
566
689c3db4 567 down_read(&cinode->lock_sem);
f152fd5f 568 if (cinode->can_cache_brlcks) {
689c3db4
PS
569 /* can cache locks - no need to relock */
570 up_read(&cinode->lock_sem);
f152fd5f
PS
571 return rc;
572 }
573
574 if (cap_unix(tcon->ses) &&
575 (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
576 ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
577 rc = cifs_push_posix_locks(cfile);
578 else
579 rc = tcon->ses->server->ops->push_mand_locks(cfile);
1da177e4 580
689c3db4 581 up_read(&cinode->lock_sem);
1da177e4
LT
582 return rc;
583}
584
2ae78ba8
PS
585static int
586cifs_reopen_file(struct cifsFileInfo *cfile, bool can_flush)
1da177e4
LT
587{
588 int rc = -EACCES;
6d5786a3 589 unsigned int xid;
590a3fe0 590 __u32 oplock;
1da177e4 591 struct cifs_sb_info *cifs_sb;
96daf2b0 592 struct cifs_tcon *tcon;
2ae78ba8
PS
593 struct TCP_Server_Info *server;
594 struct cifsInodeInfo *cinode;
fb8c4b14 595 struct inode *inode;
1da177e4 596 char *full_path = NULL;
2ae78ba8 597 int desired_access;
1da177e4 598 int disposition = FILE_OPEN;
3d3ea8e6 599 int create_options = CREATE_NOT_DIR;
226730b4 600 struct cifs_open_parms oparms;
1da177e4 601
6d5786a3 602 xid = get_xid();
2ae78ba8
PS
603 mutex_lock(&cfile->fh_mutex);
604 if (!cfile->invalidHandle) {
605 mutex_unlock(&cfile->fh_mutex);
0f3bc09e 606 rc = 0;
6d5786a3 607 free_xid(xid);
0f3bc09e 608 return rc;
1da177e4
LT
609 }
610
2ae78ba8 611 inode = cfile->dentry->d_inode;
1da177e4 612 cifs_sb = CIFS_SB(inode->i_sb);
2ae78ba8
PS
613 tcon = tlink_tcon(cfile->tlink);
614 server = tcon->ses->server;
615
616 /*
617 * Can not grab rename sem here because various ops, including those
618 * that already have the rename sem can end up causing writepage to get
619 * called and if the server was down that means we end up here, and we
620 * can never tell if the caller already has the rename_sem.
621 */
622 full_path = build_path_from_dentry(cfile->dentry);
1da177e4 623 if (full_path == NULL) {
3a9f462f 624 rc = -ENOMEM;
2ae78ba8 625 mutex_unlock(&cfile->fh_mutex);
6d5786a3 626 free_xid(xid);
3a9f462f 627 return rc;
1da177e4
LT
628 }
629
f96637be
JP
630 cifs_dbg(FYI, "inode = 0x%p file flags 0x%x for %s\n",
631 inode, cfile->f_flags, full_path);
1da177e4 632
10b9b98e 633 if (tcon->ses->server->oplocks)
1da177e4
LT
634 oplock = REQ_OPLOCK;
635 else
4b18f2a9 636 oplock = 0;
1da177e4 637
29e20f9c 638 if (tcon->unix_ext && cap_unix(tcon->ses) &&
7fc8f4e9 639 (CIFS_UNIX_POSIX_PATH_OPS_CAP &
29e20f9c 640 le64_to_cpu(tcon->fsUnixInfo.Capability))) {
608712fe
JL
641 /*
642 * O_CREAT, O_EXCL and O_TRUNC already had their effect on the
643 * original open. Must mask them off for a reopen.
644 */
2ae78ba8 645 unsigned int oflags = cfile->f_flags &
15886177 646 ~(O_CREAT | O_EXCL | O_TRUNC);
608712fe 647
2422f676 648 rc = cifs_posix_open(full_path, NULL, inode->i_sb,
2ae78ba8 649 cifs_sb->mnt_file_mode /* ignored */,
9cbc0b73 650 oflags, &oplock, &cfile->fid.netfid, xid);
7fc8f4e9 651 if (rc == 0) {
f96637be 652 cifs_dbg(FYI, "posix reopen succeeded\n");
fe090e4e 653 oparms.reconnect = true;
7fc8f4e9
SF
654 goto reopen_success;
655 }
2ae78ba8
PS
656 /*
657 * fallthrough to retry open the old way on errors, especially
658 * in the reconnect path it is important to retry hard
659 */
7fc8f4e9
SF
660 }
661
2ae78ba8 662 desired_access = cifs_convert_flags(cfile->f_flags);
7fc8f4e9 663
3d3ea8e6
SP
664 if (backup_cred(cifs_sb))
665 create_options |= CREATE_OPEN_BACKUP_INTENT;
666
b8c32dbb 667 if (server->ops->get_lease_key)
9cbc0b73 668 server->ops->get_lease_key(inode, &cfile->fid);
b8c32dbb 669
226730b4
PS
670 oparms.tcon = tcon;
671 oparms.cifs_sb = cifs_sb;
672 oparms.desired_access = desired_access;
673 oparms.create_options = create_options;
674 oparms.disposition = disposition;
675 oparms.path = full_path;
9cbc0b73
PS
676 oparms.fid = &cfile->fid;
677 oparms.reconnect = true;
226730b4 678
2ae78ba8
PS
679 /*
680 * Can not refresh inode by passing in file_info buf to be returned by
d81b8a40 681 * ops->open and then calling get_inode_info with returned buf since
2ae78ba8
PS
682 * file might have write behind data that needs to be flushed and server
683 * version of file size can be stale. If we knew for sure that inode was
684 * not dirty locally we could do this.
685 */
226730b4 686 rc = server->ops->open(xid, &oparms, &oplock, NULL);
b33fcf1c
PS
687 if (rc == -ENOENT && oparms.reconnect == false) {
688 /* durable handle timeout is expired - open the file again */
689 rc = server->ops->open(xid, &oparms, &oplock, NULL);
690 /* indicate that we need to relock the file */
691 oparms.reconnect = true;
692 }
693
1da177e4 694 if (rc) {
2ae78ba8 695 mutex_unlock(&cfile->fh_mutex);
f96637be
JP
696 cifs_dbg(FYI, "cifs_reopen returned 0x%x\n", rc);
697 cifs_dbg(FYI, "oplock: %d\n", oplock);
15886177
JL
698 goto reopen_error_exit;
699 }
700
7fc8f4e9 701reopen_success:
2ae78ba8
PS
702 cfile->invalidHandle = false;
703 mutex_unlock(&cfile->fh_mutex);
704 cinode = CIFS_I(inode);
15886177
JL
705
706 if (can_flush) {
707 rc = filemap_write_and_wait(inode->i_mapping);
eb4b756b 708 mapping_set_error(inode->i_mapping, rc);
15886177 709
15886177 710 if (tcon->unix_ext)
2ae78ba8
PS
711 rc = cifs_get_inode_info_unix(&inode, full_path,
712 inode->i_sb, xid);
15886177 713 else
2ae78ba8
PS
714 rc = cifs_get_inode_info(&inode, full_path, NULL,
715 inode->i_sb, xid, NULL);
716 }
717 /*
718 * Else we are writing out data to server already and could deadlock if
719 * we tried to flush data, and since we do not know if we have data that
720 * would invalidate the current end of file on the server we can not go
721 * to the server to get the new inode info.
722 */
723
9cbc0b73
PS
724 server->ops->set_fid(cfile, &cfile->fid, oplock);
725 if (oparms.reconnect)
726 cifs_relock_file(cfile);
15886177
JL
727
728reopen_error_exit:
1da177e4 729 kfree(full_path);
6d5786a3 730 free_xid(xid);
1da177e4
LT
731 return rc;
732}
733
734int cifs_close(struct inode *inode, struct file *file)
735{
77970693
JL
736 if (file->private_data != NULL) {
737 cifsFileInfo_put(file->private_data);
738 file->private_data = NULL;
739 }
7ee1af76 740
cdff08e7
SF
741 /* return code from the ->release op is always ignored */
742 return 0;
1da177e4
LT
743}
744
745int cifs_closedir(struct inode *inode, struct file *file)
746{
747 int rc = 0;
6d5786a3 748 unsigned int xid;
4b4de76e 749 struct cifsFileInfo *cfile = file->private_data;
92fc65a7
PS
750 struct cifs_tcon *tcon;
751 struct TCP_Server_Info *server;
752 char *buf;
1da177e4 753
f96637be 754 cifs_dbg(FYI, "Closedir inode = 0x%p\n", inode);
1da177e4 755
92fc65a7
PS
756 if (cfile == NULL)
757 return rc;
758
6d5786a3 759 xid = get_xid();
92fc65a7
PS
760 tcon = tlink_tcon(cfile->tlink);
761 server = tcon->ses->server;
1da177e4 762
f96637be 763 cifs_dbg(FYI, "Freeing private data in close dir\n");
92fc65a7
PS
764 spin_lock(&cifs_file_list_lock);
765 if (!cfile->srch_inf.endOfSearch && !cfile->invalidHandle) {
766 cfile->invalidHandle = true;
767 spin_unlock(&cifs_file_list_lock);
768 if (server->ops->close_dir)
769 rc = server->ops->close_dir(xid, tcon, &cfile->fid);
770 else
771 rc = -ENOSYS;
f96637be 772 cifs_dbg(FYI, "Closing uncompleted readdir with rc %d\n", rc);
92fc65a7
PS
773 /* not much we can do if it fails anyway, ignore rc */
774 rc = 0;
775 } else
776 spin_unlock(&cifs_file_list_lock);
777
778 buf = cfile->srch_inf.ntwrk_buf_start;
779 if (buf) {
f96637be 780 cifs_dbg(FYI, "closedir free smb buf in srch struct\n");
92fc65a7
PS
781 cfile->srch_inf.ntwrk_buf_start = NULL;
782 if (cfile->srch_inf.smallBuf)
783 cifs_small_buf_release(buf);
784 else
785 cifs_buf_release(buf);
1da177e4 786 }
92fc65a7
PS
787
788 cifs_put_tlink(cfile->tlink);
789 kfree(file->private_data);
790 file->private_data = NULL;
1da177e4 791 /* BB can we lock the filestruct while this is going on? */
6d5786a3 792 free_xid(xid);
1da177e4
LT
793 return rc;
794}
795
85160e03 796static struct cifsLockInfo *
fbd35aca 797cifs_lock_init(__u64 offset, __u64 length, __u8 type)
7ee1af76 798{
a88b4707 799 struct cifsLockInfo *lock =
fb8c4b14 800 kmalloc(sizeof(struct cifsLockInfo), GFP_KERNEL);
a88b4707
PS
801 if (!lock)
802 return lock;
803 lock->offset = offset;
804 lock->length = length;
805 lock->type = type;
a88b4707
PS
806 lock->pid = current->tgid;
807 INIT_LIST_HEAD(&lock->blist);
808 init_waitqueue_head(&lock->block_q);
809 return lock;
85160e03
PS
810}
811
f7ba7fe6 812void
85160e03
PS
813cifs_del_lock_waiters(struct cifsLockInfo *lock)
814{
815 struct cifsLockInfo *li, *tmp;
816 list_for_each_entry_safe(li, tmp, &lock->blist, blist) {
817 list_del_init(&li->blist);
818 wake_up(&li->block_q);
819 }
820}
821
081c0414
PS
822#define CIFS_LOCK_OP 0
823#define CIFS_READ_OP 1
824#define CIFS_WRITE_OP 2
825
826/* @rw_check : 0 - no op, 1 - read, 2 - write */
85160e03 827static bool
f45d3416
PS
828cifs_find_fid_lock_conflict(struct cifs_fid_locks *fdlocks, __u64 offset,
829 __u64 length, __u8 type, struct cifsFileInfo *cfile,
081c0414 830 struct cifsLockInfo **conf_lock, int rw_check)
85160e03 831{
fbd35aca 832 struct cifsLockInfo *li;
f45d3416 833 struct cifsFileInfo *cur_cfile = fdlocks->cfile;
106dc538 834 struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
85160e03 835
f45d3416 836 list_for_each_entry(li, &fdlocks->locks, llist) {
85160e03
PS
837 if (offset + length <= li->offset ||
838 offset >= li->offset + li->length)
839 continue;
081c0414
PS
840 if (rw_check != CIFS_LOCK_OP && current->tgid == li->pid &&
841 server->ops->compare_fids(cfile, cur_cfile)) {
842 /* shared lock prevents write op through the same fid */
843 if (!(li->type & server->vals->shared_lock_type) ||
844 rw_check != CIFS_WRITE_OP)
845 continue;
846 }
f45d3416
PS
847 if ((type & server->vals->shared_lock_type) &&
848 ((server->ops->compare_fids(cfile, cur_cfile) &&
849 current->tgid == li->pid) || type == li->type))
85160e03 850 continue;
579f9053
PS
851 if (conf_lock)
852 *conf_lock = li;
f45d3416 853 return true;
85160e03
PS
854 }
855 return false;
856}
857
579f9053 858bool
55157dfb 859cifs_find_lock_conflict(struct cifsFileInfo *cfile, __u64 offset, __u64 length,
579f9053 860 __u8 type, struct cifsLockInfo **conf_lock,
081c0414 861 int rw_check)
161ebf9f 862{
fbd35aca 863 bool rc = false;
f45d3416 864 struct cifs_fid_locks *cur;
55157dfb 865 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
fbd35aca 866
f45d3416
PS
867 list_for_each_entry(cur, &cinode->llist, llist) {
868 rc = cifs_find_fid_lock_conflict(cur, offset, length, type,
579f9053 869 cfile, conf_lock, rw_check);
fbd35aca
PS
870 if (rc)
871 break;
872 }
fbd35aca
PS
873
874 return rc;
161ebf9f
PS
875}
876
9a5101c8
PS
877/*
878 * Check if there is another lock that prevents us to set the lock (mandatory
879 * style). If such a lock exists, update the flock structure with its
880 * properties. Otherwise, set the flock type to F_UNLCK if we can cache brlocks
881 * or leave it the same if we can't. Returns 0 if we don't need to request to
882 * the server or 1 otherwise.
883 */
85160e03 884static int
fbd35aca
PS
885cifs_lock_test(struct cifsFileInfo *cfile, __u64 offset, __u64 length,
886 __u8 type, struct file_lock *flock)
85160e03
PS
887{
888 int rc = 0;
889 struct cifsLockInfo *conf_lock;
fbd35aca 890 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
106dc538 891 struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
85160e03
PS
892 bool exist;
893
1b4b55a1 894 down_read(&cinode->lock_sem);
85160e03 895
55157dfb 896 exist = cifs_find_lock_conflict(cfile, offset, length, type,
081c0414 897 &conf_lock, CIFS_LOCK_OP);
85160e03
PS
898 if (exist) {
899 flock->fl_start = conf_lock->offset;
900 flock->fl_end = conf_lock->offset + conf_lock->length - 1;
901 flock->fl_pid = conf_lock->pid;
106dc538 902 if (conf_lock->type & server->vals->shared_lock_type)
85160e03
PS
903 flock->fl_type = F_RDLCK;
904 else
905 flock->fl_type = F_WRLCK;
906 } else if (!cinode->can_cache_brlcks)
907 rc = 1;
908 else
909 flock->fl_type = F_UNLCK;
910
1b4b55a1 911 up_read(&cinode->lock_sem);
85160e03
PS
912 return rc;
913}
914
161ebf9f 915static void
fbd35aca 916cifs_lock_add(struct cifsFileInfo *cfile, struct cifsLockInfo *lock)
85160e03 917{
fbd35aca 918 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
1b4b55a1 919 down_write(&cinode->lock_sem);
f45d3416 920 list_add_tail(&lock->llist, &cfile->llist->locks);
1b4b55a1 921 up_write(&cinode->lock_sem);
7ee1af76
JA
922}
923
9a5101c8
PS
924/*
925 * Set the byte-range lock (mandatory style). Returns:
926 * 1) 0, if we set the lock and don't need to request to the server;
927 * 2) 1, if no locks prevent us but we need to request to the server;
928 * 3) -EACCESS, if there is a lock that prevents us and wait is false.
929 */
85160e03 930static int
fbd35aca 931cifs_lock_add_if(struct cifsFileInfo *cfile, struct cifsLockInfo *lock,
161ebf9f 932 bool wait)
85160e03 933{
161ebf9f 934 struct cifsLockInfo *conf_lock;
fbd35aca 935 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
85160e03
PS
936 bool exist;
937 int rc = 0;
938
85160e03
PS
939try_again:
940 exist = false;
1b4b55a1 941 down_write(&cinode->lock_sem);
85160e03 942
55157dfb 943 exist = cifs_find_lock_conflict(cfile, lock->offset, lock->length,
081c0414 944 lock->type, &conf_lock, CIFS_LOCK_OP);
85160e03 945 if (!exist && cinode->can_cache_brlcks) {
f45d3416 946 list_add_tail(&lock->llist, &cfile->llist->locks);
1b4b55a1 947 up_write(&cinode->lock_sem);
85160e03
PS
948 return rc;
949 }
950
951 if (!exist)
952 rc = 1;
953 else if (!wait)
954 rc = -EACCES;
955 else {
956 list_add_tail(&lock->blist, &conf_lock->blist);
1b4b55a1 957 up_write(&cinode->lock_sem);
85160e03
PS
958 rc = wait_event_interruptible(lock->block_q,
959 (lock->blist.prev == &lock->blist) &&
960 (lock->blist.next == &lock->blist));
961 if (!rc)
962 goto try_again;
1b4b55a1 963 down_write(&cinode->lock_sem);
a88b4707 964 list_del_init(&lock->blist);
85160e03
PS
965 }
966
1b4b55a1 967 up_write(&cinode->lock_sem);
85160e03
PS
968 return rc;
969}
970
9a5101c8
PS
971/*
972 * Check if there is another lock that prevents us to set the lock (posix
973 * style). If such a lock exists, update the flock structure with its
974 * properties. Otherwise, set the flock type to F_UNLCK if we can cache brlocks
975 * or leave it the same if we can't. Returns 0 if we don't need to request to
976 * the server or 1 otherwise.
977 */
85160e03 978static int
4f6bcec9
PS
979cifs_posix_lock_test(struct file *file, struct file_lock *flock)
980{
981 int rc = 0;
496ad9aa 982 struct cifsInodeInfo *cinode = CIFS_I(file_inode(file));
4f6bcec9
PS
983 unsigned char saved_type = flock->fl_type;
984
50792760
PS
985 if ((flock->fl_flags & FL_POSIX) == 0)
986 return 1;
987
1b4b55a1 988 down_read(&cinode->lock_sem);
4f6bcec9
PS
989 posix_test_lock(file, flock);
990
991 if (flock->fl_type == F_UNLCK && !cinode->can_cache_brlcks) {
992 flock->fl_type = saved_type;
993 rc = 1;
994 }
995
1b4b55a1 996 up_read(&cinode->lock_sem);
4f6bcec9
PS
997 return rc;
998}
999
9a5101c8
PS
1000/*
1001 * Set the byte-range lock (posix style). Returns:
1002 * 1) 0, if we set the lock and don't need to request to the server;
1003 * 2) 1, if we need to request to the server;
1004 * 3) <0, if the error occurs while setting the lock.
1005 */
4f6bcec9
PS
1006static int
1007cifs_posix_lock_set(struct file *file, struct file_lock *flock)
1008{
496ad9aa 1009 struct cifsInodeInfo *cinode = CIFS_I(file_inode(file));
50792760
PS
1010 int rc = 1;
1011
1012 if ((flock->fl_flags & FL_POSIX) == 0)
1013 return rc;
4f6bcec9 1014
66189be7 1015try_again:
1b4b55a1 1016 down_write(&cinode->lock_sem);
4f6bcec9 1017 if (!cinode->can_cache_brlcks) {
1b4b55a1 1018 up_write(&cinode->lock_sem);
50792760 1019 return rc;
4f6bcec9 1020 }
66189be7
PS
1021
1022 rc = posix_lock_file(file, flock, NULL);
1b4b55a1 1023 up_write(&cinode->lock_sem);
66189be7
PS
1024 if (rc == FILE_LOCK_DEFERRED) {
1025 rc = wait_event_interruptible(flock->fl_wait, !flock->fl_next);
1026 if (!rc)
1027 goto try_again;
1a9e64a7 1028 posix_unblock_lock(flock);
66189be7 1029 }
9ebb389d 1030 return rc;
4f6bcec9
PS
1031}
1032
d39a4f71 1033int
4f6bcec9 1034cifs_push_mandatory_locks(struct cifsFileInfo *cfile)
85160e03 1035{
6d5786a3
PS
1036 unsigned int xid;
1037 int rc = 0, stored_rc;
85160e03
PS
1038 struct cifsLockInfo *li, *tmp;
1039 struct cifs_tcon *tcon;
0013fb4c 1040 unsigned int num, max_num, max_buf;
32b9aaf1
PS
1041 LOCKING_ANDX_RANGE *buf, *cur;
1042 int types[] = {LOCKING_ANDX_LARGE_FILES,
1043 LOCKING_ANDX_SHARED_LOCK | LOCKING_ANDX_LARGE_FILES};
1044 int i;
85160e03 1045
6d5786a3 1046 xid = get_xid();
85160e03
PS
1047 tcon = tlink_tcon(cfile->tlink);
1048
0013fb4c
PS
1049 /*
1050 * Accessing maxBuf is racy with cifs_reconnect - need to store value
1051 * and check it for zero before using.
1052 */
1053 max_buf = tcon->ses->server->maxBuf;
1054 if (!max_buf) {
6d5786a3 1055 free_xid(xid);
0013fb4c
PS
1056 return -EINVAL;
1057 }
1058
1059 max_num = (max_buf - sizeof(struct smb_hdr)) /
1060 sizeof(LOCKING_ANDX_RANGE);
32b9aaf1
PS
1061 buf = kzalloc(max_num * sizeof(LOCKING_ANDX_RANGE), GFP_KERNEL);
1062 if (!buf) {
6d5786a3 1063 free_xid(xid);
e2f2886a 1064 return -ENOMEM;
32b9aaf1
PS
1065 }
1066
1067 for (i = 0; i < 2; i++) {
1068 cur = buf;
1069 num = 0;
f45d3416 1070 list_for_each_entry_safe(li, tmp, &cfile->llist->locks, llist) {
32b9aaf1
PS
1071 if (li->type != types[i])
1072 continue;
1073 cur->Pid = cpu_to_le16(li->pid);
1074 cur->LengthLow = cpu_to_le32((u32)li->length);
1075 cur->LengthHigh = cpu_to_le32((u32)(li->length>>32));
1076 cur->OffsetLow = cpu_to_le32((u32)li->offset);
1077 cur->OffsetHigh = cpu_to_le32((u32)(li->offset>>32));
1078 if (++num == max_num) {
4b4de76e
PS
1079 stored_rc = cifs_lockv(xid, tcon,
1080 cfile->fid.netfid,
04a6aa8a
PS
1081 (__u8)li->type, 0, num,
1082 buf);
32b9aaf1
PS
1083 if (stored_rc)
1084 rc = stored_rc;
1085 cur = buf;
1086 num = 0;
1087 } else
1088 cur++;
1089 }
1090
1091 if (num) {
4b4de76e 1092 stored_rc = cifs_lockv(xid, tcon, cfile->fid.netfid,
04a6aa8a 1093 (__u8)types[i], 0, num, buf);
32b9aaf1
PS
1094 if (stored_rc)
1095 rc = stored_rc;
1096 }
85160e03
PS
1097 }
1098
32b9aaf1 1099 kfree(buf);
6d5786a3 1100 free_xid(xid);
85160e03
PS
1101 return rc;
1102}
1103
4f6bcec9
PS
1104/* copied from fs/locks.c with a name change */
1105#define cifs_for_each_lock(inode, lockp) \
1106 for (lockp = &inode->i_flock; *lockp != NULL; \
1107 lockp = &(*lockp)->fl_next)
1108
d5751469
PS
1109struct lock_to_push {
1110 struct list_head llist;
1111 __u64 offset;
1112 __u64 length;
1113 __u32 pid;
1114 __u16 netfid;
1115 __u8 type;
1116};
1117
4f6bcec9 1118static int
b8db928b 1119cifs_push_posix_locks(struct cifsFileInfo *cfile)
4f6bcec9 1120{
1c8c601a 1121 struct inode *inode = cfile->dentry->d_inode;
4f6bcec9
PS
1122 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
1123 struct file_lock *flock, **before;
d5751469 1124 unsigned int count = 0, i = 0;
4f6bcec9 1125 int rc = 0, xid, type;
d5751469
PS
1126 struct list_head locks_to_send, *el;
1127 struct lock_to_push *lck, *tmp;
4f6bcec9 1128 __u64 length;
4f6bcec9 1129
6d5786a3 1130 xid = get_xid();
4f6bcec9 1131
1c8c601a
JL
1132 spin_lock(&inode->i_lock);
1133 cifs_for_each_lock(inode, before) {
d5751469
PS
1134 if ((*before)->fl_flags & FL_POSIX)
1135 count++;
1136 }
1c8c601a 1137 spin_unlock(&inode->i_lock);
d5751469 1138
4f6bcec9
PS
1139 INIT_LIST_HEAD(&locks_to_send);
1140
d5751469 1141 /*
ce85852b 1142 * Allocating count locks is enough because no FL_POSIX locks can be
1b4b55a1 1143 * added to the list while we are holding cinode->lock_sem that
ce85852b 1144 * protects locking operations of this inode.
d5751469
PS
1145 */
1146 for (; i < count; i++) {
1147 lck = kmalloc(sizeof(struct lock_to_push), GFP_KERNEL);
1148 if (!lck) {
1149 rc = -ENOMEM;
1150 goto err_out;
1151 }
1152 list_add_tail(&lck->llist, &locks_to_send);
1153 }
1154
d5751469 1155 el = locks_to_send.next;
1c8c601a
JL
1156 spin_lock(&inode->i_lock);
1157 cifs_for_each_lock(inode, before) {
ce85852b
PS
1158 flock = *before;
1159 if ((flock->fl_flags & FL_POSIX) == 0)
1160 continue;
d5751469 1161 if (el == &locks_to_send) {
ce85852b
PS
1162 /*
1163 * The list ended. We don't have enough allocated
1164 * structures - something is really wrong.
1165 */
f96637be 1166 cifs_dbg(VFS, "Can't push all brlocks!\n");
d5751469
PS
1167 break;
1168 }
4f6bcec9
PS
1169 length = 1 + flock->fl_end - flock->fl_start;
1170 if (flock->fl_type == F_RDLCK || flock->fl_type == F_SHLCK)
1171 type = CIFS_RDLCK;
1172 else
1173 type = CIFS_WRLCK;
d5751469 1174 lck = list_entry(el, struct lock_to_push, llist);
4f6bcec9 1175 lck->pid = flock->fl_pid;
4b4de76e 1176 lck->netfid = cfile->fid.netfid;
d5751469
PS
1177 lck->length = length;
1178 lck->type = type;
1179 lck->offset = flock->fl_start;
d5751469 1180 el = el->next;
4f6bcec9 1181 }
1c8c601a 1182 spin_unlock(&inode->i_lock);
4f6bcec9
PS
1183
1184 list_for_each_entry_safe(lck, tmp, &locks_to_send, llist) {
4f6bcec9
PS
1185 int stored_rc;
1186
4f6bcec9 1187 stored_rc = CIFSSMBPosixLock(xid, tcon, lck->netfid, lck->pid,
c5fd363d 1188 lck->offset, lck->length, NULL,
4f6bcec9
PS
1189 lck->type, 0);
1190 if (stored_rc)
1191 rc = stored_rc;
1192 list_del(&lck->llist);
1193 kfree(lck);
1194 }
1195
d5751469 1196out:
6d5786a3 1197 free_xid(xid);
4f6bcec9 1198 return rc;
d5751469
PS
1199err_out:
1200 list_for_each_entry_safe(lck, tmp, &locks_to_send, llist) {
1201 list_del(&lck->llist);
1202 kfree(lck);
1203 }
1204 goto out;
4f6bcec9
PS
1205}
1206
9ec3c882 1207static int
b8db928b 1208cifs_push_locks(struct cifsFileInfo *cfile)
9ec3c882 1209{
b8db928b 1210 struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
9ec3c882 1211 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
b8db928b 1212 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
9ec3c882
PS
1213 int rc = 0;
1214
1215 /* we are going to update can_cache_brlcks here - need a write access */
1216 down_write(&cinode->lock_sem);
1217 if (!cinode->can_cache_brlcks) {
1218 up_write(&cinode->lock_sem);
1219 return rc;
1220 }
4f6bcec9 1221
29e20f9c 1222 if (cap_unix(tcon->ses) &&
4f6bcec9
PS
1223 (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
1224 ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
b8db928b
PS
1225 rc = cifs_push_posix_locks(cfile);
1226 else
1227 rc = tcon->ses->server->ops->push_mand_locks(cfile);
4f6bcec9 1228
b8db928b
PS
1229 cinode->can_cache_brlcks = false;
1230 up_write(&cinode->lock_sem);
1231 return rc;
4f6bcec9
PS
1232}
1233
03776f45 1234static void
04a6aa8a 1235cifs_read_flock(struct file_lock *flock, __u32 *type, int *lock, int *unlock,
106dc538 1236 bool *wait_flag, struct TCP_Server_Info *server)
1da177e4 1237{
03776f45 1238 if (flock->fl_flags & FL_POSIX)
f96637be 1239 cifs_dbg(FYI, "Posix\n");
03776f45 1240 if (flock->fl_flags & FL_FLOCK)
f96637be 1241 cifs_dbg(FYI, "Flock\n");
03776f45 1242 if (flock->fl_flags & FL_SLEEP) {
f96637be 1243 cifs_dbg(FYI, "Blocking lock\n");
03776f45 1244 *wait_flag = true;
1da177e4 1245 }
03776f45 1246 if (flock->fl_flags & FL_ACCESS)
f96637be 1247 cifs_dbg(FYI, "Process suspended by mandatory locking - not implemented yet\n");
03776f45 1248 if (flock->fl_flags & FL_LEASE)
f96637be 1249 cifs_dbg(FYI, "Lease on file - not implemented yet\n");
03776f45 1250 if (flock->fl_flags &
3d6d854a
JL
1251 (~(FL_POSIX | FL_FLOCK | FL_SLEEP |
1252 FL_ACCESS | FL_LEASE | FL_CLOSE)))
f96637be 1253 cifs_dbg(FYI, "Unknown lock flags 0x%x\n", flock->fl_flags);
1da177e4 1254
106dc538 1255 *type = server->vals->large_lock_type;
03776f45 1256 if (flock->fl_type == F_WRLCK) {
f96637be 1257 cifs_dbg(FYI, "F_WRLCK\n");
106dc538 1258 *type |= server->vals->exclusive_lock_type;
03776f45
PS
1259 *lock = 1;
1260 } else if (flock->fl_type == F_UNLCK) {
f96637be 1261 cifs_dbg(FYI, "F_UNLCK\n");
106dc538 1262 *type |= server->vals->unlock_lock_type;
03776f45
PS
1263 *unlock = 1;
1264 /* Check if unlock includes more than one lock range */
1265 } else if (flock->fl_type == F_RDLCK) {
f96637be 1266 cifs_dbg(FYI, "F_RDLCK\n");
106dc538 1267 *type |= server->vals->shared_lock_type;
03776f45
PS
1268 *lock = 1;
1269 } else if (flock->fl_type == F_EXLCK) {
f96637be 1270 cifs_dbg(FYI, "F_EXLCK\n");
106dc538 1271 *type |= server->vals->exclusive_lock_type;
03776f45
PS
1272 *lock = 1;
1273 } else if (flock->fl_type == F_SHLCK) {
f96637be 1274 cifs_dbg(FYI, "F_SHLCK\n");
106dc538 1275 *type |= server->vals->shared_lock_type;
03776f45 1276 *lock = 1;
1da177e4 1277 } else
f96637be 1278 cifs_dbg(FYI, "Unknown type of lock\n");
03776f45 1279}
1da177e4 1280
03776f45 1281static int
04a6aa8a 1282cifs_getlk(struct file *file, struct file_lock *flock, __u32 type,
6d5786a3 1283 bool wait_flag, bool posix_lck, unsigned int xid)
03776f45
PS
1284{
1285 int rc = 0;
1286 __u64 length = 1 + flock->fl_end - flock->fl_start;
4f6bcec9
PS
1287 struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
1288 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
106dc538 1289 struct TCP_Server_Info *server = tcon->ses->server;
4b4de76e 1290 __u16 netfid = cfile->fid.netfid;
f05337c6 1291
03776f45
PS
1292 if (posix_lck) {
1293 int posix_lock_type;
4f6bcec9
PS
1294
1295 rc = cifs_posix_lock_test(file, flock);
1296 if (!rc)
1297 return rc;
1298
106dc538 1299 if (type & server->vals->shared_lock_type)
03776f45
PS
1300 posix_lock_type = CIFS_RDLCK;
1301 else
1302 posix_lock_type = CIFS_WRLCK;
4f6bcec9 1303 rc = CIFSSMBPosixLock(xid, tcon, netfid, current->tgid,
c5fd363d 1304 flock->fl_start, length, flock,
4f6bcec9 1305 posix_lock_type, wait_flag);
03776f45
PS
1306 return rc;
1307 }
1da177e4 1308
fbd35aca 1309 rc = cifs_lock_test(cfile, flock->fl_start, length, type, flock);
85160e03
PS
1310 if (!rc)
1311 return rc;
1312
03776f45 1313 /* BB we could chain these into one lock request BB */
d39a4f71
PS
1314 rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length, type,
1315 1, 0, false);
03776f45 1316 if (rc == 0) {
d39a4f71
PS
1317 rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
1318 type, 0, 1, false);
03776f45
PS
1319 flock->fl_type = F_UNLCK;
1320 if (rc != 0)
f96637be
JP
1321 cifs_dbg(VFS, "Error unlocking previously locked range %d during test of lock\n",
1322 rc);
a88b4707 1323 return 0;
1da177e4 1324 }
7ee1af76 1325
106dc538 1326 if (type & server->vals->shared_lock_type) {
03776f45 1327 flock->fl_type = F_WRLCK;
a88b4707 1328 return 0;
7ee1af76
JA
1329 }
1330
d39a4f71
PS
1331 type &= ~server->vals->exclusive_lock_type;
1332
1333 rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
1334 type | server->vals->shared_lock_type,
1335 1, 0, false);
03776f45 1336 if (rc == 0) {
d39a4f71
PS
1337 rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
1338 type | server->vals->shared_lock_type, 0, 1, false);
03776f45
PS
1339 flock->fl_type = F_RDLCK;
1340 if (rc != 0)
f96637be
JP
1341 cifs_dbg(VFS, "Error unlocking previously locked range %d during test of lock\n",
1342 rc);
03776f45
PS
1343 } else
1344 flock->fl_type = F_WRLCK;
1345
a88b4707 1346 return 0;
03776f45
PS
1347}
1348
f7ba7fe6 1349void
9ee305b7
PS
1350cifs_move_llist(struct list_head *source, struct list_head *dest)
1351{
1352 struct list_head *li, *tmp;
1353 list_for_each_safe(li, tmp, source)
1354 list_move(li, dest);
1355}
1356
f7ba7fe6 1357void
9ee305b7
PS
1358cifs_free_llist(struct list_head *llist)
1359{
1360 struct cifsLockInfo *li, *tmp;
1361 list_for_each_entry_safe(li, tmp, llist, llist) {
1362 cifs_del_lock_waiters(li);
1363 list_del(&li->llist);
1364 kfree(li);
1365 }
1366}
1367
d39a4f71 1368int
6d5786a3
PS
1369cifs_unlock_range(struct cifsFileInfo *cfile, struct file_lock *flock,
1370 unsigned int xid)
9ee305b7
PS
1371{
1372 int rc = 0, stored_rc;
1373 int types[] = {LOCKING_ANDX_LARGE_FILES,
1374 LOCKING_ANDX_SHARED_LOCK | LOCKING_ANDX_LARGE_FILES};
1375 unsigned int i;
0013fb4c 1376 unsigned int max_num, num, max_buf;
9ee305b7
PS
1377 LOCKING_ANDX_RANGE *buf, *cur;
1378 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
1379 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
1380 struct cifsLockInfo *li, *tmp;
1381 __u64 length = 1 + flock->fl_end - flock->fl_start;
1382 struct list_head tmp_llist;
1383
1384 INIT_LIST_HEAD(&tmp_llist);
1385
0013fb4c
PS
1386 /*
1387 * Accessing maxBuf is racy with cifs_reconnect - need to store value
1388 * and check it for zero before using.
1389 */
1390 max_buf = tcon->ses->server->maxBuf;
1391 if (!max_buf)
1392 return -EINVAL;
1393
1394 max_num = (max_buf - sizeof(struct smb_hdr)) /
1395 sizeof(LOCKING_ANDX_RANGE);
9ee305b7
PS
1396 buf = kzalloc(max_num * sizeof(LOCKING_ANDX_RANGE), GFP_KERNEL);
1397 if (!buf)
1398 return -ENOMEM;
1399
1b4b55a1 1400 down_write(&cinode->lock_sem);
9ee305b7
PS
1401 for (i = 0; i < 2; i++) {
1402 cur = buf;
1403 num = 0;
f45d3416 1404 list_for_each_entry_safe(li, tmp, &cfile->llist->locks, llist) {
9ee305b7
PS
1405 if (flock->fl_start > li->offset ||
1406 (flock->fl_start + length) <
1407 (li->offset + li->length))
1408 continue;
1409 if (current->tgid != li->pid)
1410 continue;
9ee305b7
PS
1411 if (types[i] != li->type)
1412 continue;
ea319d57 1413 if (cinode->can_cache_brlcks) {
9ee305b7
PS
1414 /*
1415 * We can cache brlock requests - simply remove
fbd35aca 1416 * a lock from the file's list.
9ee305b7
PS
1417 */
1418 list_del(&li->llist);
1419 cifs_del_lock_waiters(li);
1420 kfree(li);
ea319d57 1421 continue;
9ee305b7 1422 }
ea319d57
PS
1423 cur->Pid = cpu_to_le16(li->pid);
1424 cur->LengthLow = cpu_to_le32((u32)li->length);
1425 cur->LengthHigh = cpu_to_le32((u32)(li->length>>32));
1426 cur->OffsetLow = cpu_to_le32((u32)li->offset);
1427 cur->OffsetHigh = cpu_to_le32((u32)(li->offset>>32));
1428 /*
1429 * We need to save a lock here to let us add it again to
1430 * the file's list if the unlock range request fails on
1431 * the server.
1432 */
1433 list_move(&li->llist, &tmp_llist);
1434 if (++num == max_num) {
4b4de76e
PS
1435 stored_rc = cifs_lockv(xid, tcon,
1436 cfile->fid.netfid,
ea319d57
PS
1437 li->type, num, 0, buf);
1438 if (stored_rc) {
1439 /*
1440 * We failed on the unlock range
1441 * request - add all locks from the tmp
1442 * list to the head of the file's list.
1443 */
1444 cifs_move_llist(&tmp_llist,
f45d3416 1445 &cfile->llist->locks);
ea319d57
PS
1446 rc = stored_rc;
1447 } else
1448 /*
1449 * The unlock range request succeed -
1450 * free the tmp list.
1451 */
1452 cifs_free_llist(&tmp_llist);
1453 cur = buf;
1454 num = 0;
1455 } else
1456 cur++;
9ee305b7
PS
1457 }
1458 if (num) {
4b4de76e 1459 stored_rc = cifs_lockv(xid, tcon, cfile->fid.netfid,
9ee305b7
PS
1460 types[i], num, 0, buf);
1461 if (stored_rc) {
f45d3416
PS
1462 cifs_move_llist(&tmp_llist,
1463 &cfile->llist->locks);
9ee305b7
PS
1464 rc = stored_rc;
1465 } else
1466 cifs_free_llist(&tmp_llist);
1467 }
1468 }
1469
1b4b55a1 1470 up_write(&cinode->lock_sem);
9ee305b7
PS
1471 kfree(buf);
1472 return rc;
1473}
1474
03776f45 1475static int
f45d3416 1476cifs_setlk(struct file *file, struct file_lock *flock, __u32 type,
6d5786a3
PS
1477 bool wait_flag, bool posix_lck, int lock, int unlock,
1478 unsigned int xid)
03776f45
PS
1479{
1480 int rc = 0;
1481 __u64 length = 1 + flock->fl_end - flock->fl_start;
1482 struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
1483 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
106dc538 1484 struct TCP_Server_Info *server = tcon->ses->server;
63b7d3a4 1485 struct inode *inode = cfile->dentry->d_inode;
03776f45
PS
1486
1487 if (posix_lck) {
08547b03 1488 int posix_lock_type;
4f6bcec9
PS
1489
1490 rc = cifs_posix_lock_set(file, flock);
1491 if (!rc || rc < 0)
1492 return rc;
1493
106dc538 1494 if (type & server->vals->shared_lock_type)
08547b03
SF
1495 posix_lock_type = CIFS_RDLCK;
1496 else
1497 posix_lock_type = CIFS_WRLCK;
50c2f753 1498
03776f45 1499 if (unlock == 1)
beb84dc8 1500 posix_lock_type = CIFS_UNLCK;
7ee1af76 1501
f45d3416
PS
1502 rc = CIFSSMBPosixLock(xid, tcon, cfile->fid.netfid,
1503 current->tgid, flock->fl_start, length,
1504 NULL, posix_lock_type, wait_flag);
03776f45
PS
1505 goto out;
1506 }
7ee1af76 1507
03776f45 1508 if (lock) {
161ebf9f
PS
1509 struct cifsLockInfo *lock;
1510
fbd35aca 1511 lock = cifs_lock_init(flock->fl_start, length, type);
161ebf9f
PS
1512 if (!lock)
1513 return -ENOMEM;
1514
fbd35aca 1515 rc = cifs_lock_add_if(cfile, lock, wait_flag);
21cb2d90 1516 if (rc < 0) {
161ebf9f 1517 kfree(lock);
21cb2d90
PS
1518 return rc;
1519 }
1520 if (!rc)
85160e03
PS
1521 goto out;
1522
63b7d3a4
PS
1523 /*
1524 * Windows 7 server can delay breaking lease from read to None
1525 * if we set a byte-range lock on a file - break it explicitly
1526 * before sending the lock to the server to be sure the next
1527 * read won't conflict with non-overlapted locks due to
1528 * pagereading.
1529 */
18cceb6a
PS
1530 if (!CIFS_CACHE_WRITE(CIFS_I(inode)) &&
1531 CIFS_CACHE_READ(CIFS_I(inode))) {
63b7d3a4 1532 cifs_invalidate_mapping(inode);
f96637be
JP
1533 cifs_dbg(FYI, "Set no oplock for inode=%p due to mand locks\n",
1534 inode);
18cceb6a 1535 CIFS_I(inode)->oplock = 0;
63b7d3a4
PS
1536 }
1537
d39a4f71
PS
1538 rc = server->ops->mand_lock(xid, cfile, flock->fl_start, length,
1539 type, 1, 0, wait_flag);
161ebf9f
PS
1540 if (rc) {
1541 kfree(lock);
21cb2d90 1542 return rc;
03776f45 1543 }
161ebf9f 1544
fbd35aca 1545 cifs_lock_add(cfile, lock);
9ee305b7 1546 } else if (unlock)
d39a4f71 1547 rc = server->ops->mand_unlock_range(cfile, flock, xid);
03776f45 1548
03776f45
PS
1549out:
1550 if (flock->fl_flags & FL_POSIX)
9ebb389d 1551 posix_lock_file_wait(file, flock);
03776f45
PS
1552 return rc;
1553}
1554
1555int cifs_lock(struct file *file, int cmd, struct file_lock *flock)
1556{
1557 int rc, xid;
1558 int lock = 0, unlock = 0;
1559 bool wait_flag = false;
1560 bool posix_lck = false;
1561 struct cifs_sb_info *cifs_sb;
1562 struct cifs_tcon *tcon;
1563 struct cifsInodeInfo *cinode;
1564 struct cifsFileInfo *cfile;
1565 __u16 netfid;
04a6aa8a 1566 __u32 type;
03776f45
PS
1567
1568 rc = -EACCES;
6d5786a3 1569 xid = get_xid();
03776f45 1570
f96637be
JP
1571 cifs_dbg(FYI, "Lock parm: 0x%x flockflags: 0x%x flocktype: 0x%x start: %lld end: %lld\n",
1572 cmd, flock->fl_flags, flock->fl_type,
1573 flock->fl_start, flock->fl_end);
03776f45 1574
03776f45
PS
1575 cfile = (struct cifsFileInfo *)file->private_data;
1576 tcon = tlink_tcon(cfile->tlink);
106dc538
PS
1577
1578 cifs_read_flock(flock, &type, &lock, &unlock, &wait_flag,
1579 tcon->ses->server);
1580
1581 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
4b4de76e 1582 netfid = cfile->fid.netfid;
496ad9aa 1583 cinode = CIFS_I(file_inode(file));
03776f45 1584
29e20f9c 1585 if (cap_unix(tcon->ses) &&
03776f45
PS
1586 (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
1587 ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
1588 posix_lck = true;
1589 /*
1590 * BB add code here to normalize offset and length to account for
1591 * negative length which we can not accept over the wire.
1592 */
1593 if (IS_GETLK(cmd)) {
4f6bcec9 1594 rc = cifs_getlk(file, flock, type, wait_flag, posix_lck, xid);
6d5786a3 1595 free_xid(xid);
03776f45
PS
1596 return rc;
1597 }
1598
1599 if (!lock && !unlock) {
1600 /*
1601 * if no lock or unlock then nothing to do since we do not
1602 * know what it is
1603 */
6d5786a3 1604 free_xid(xid);
03776f45 1605 return -EOPNOTSUPP;
7ee1af76
JA
1606 }
1607
03776f45
PS
1608 rc = cifs_setlk(file, flock, type, wait_flag, posix_lck, lock, unlock,
1609 xid);
6d5786a3 1610 free_xid(xid);
1da177e4
LT
1611 return rc;
1612}
1613
597b027f
JL
1614/*
1615 * update the file size (if needed) after a write. Should be called with
1616 * the inode->i_lock held
1617 */
72432ffc 1618void
fbec9ab9
JL
1619cifs_update_eof(struct cifsInodeInfo *cifsi, loff_t offset,
1620 unsigned int bytes_written)
1621{
1622 loff_t end_of_write = offset + bytes_written;
1623
1624 if (end_of_write > cifsi->server_eof)
1625 cifsi->server_eof = end_of_write;
1626}
1627
ba9ad725
PS
1628static ssize_t
1629cifs_write(struct cifsFileInfo *open_file, __u32 pid, const char *write_data,
1630 size_t write_size, loff_t *offset)
1da177e4
LT
1631{
1632 int rc = 0;
1633 unsigned int bytes_written = 0;
1634 unsigned int total_written;
1635 struct cifs_sb_info *cifs_sb;
ba9ad725
PS
1636 struct cifs_tcon *tcon;
1637 struct TCP_Server_Info *server;
6d5786a3 1638 unsigned int xid;
7da4b49a
JL
1639 struct dentry *dentry = open_file->dentry;
1640 struct cifsInodeInfo *cifsi = CIFS_I(dentry->d_inode);
fa2989f4 1641 struct cifs_io_parms io_parms;
1da177e4 1642
7da4b49a 1643 cifs_sb = CIFS_SB(dentry->d_sb);
1da177e4 1644
f96637be
JP
1645 cifs_dbg(FYI, "write %zd bytes to offset %lld of %s\n",
1646 write_size, *offset, dentry->d_name.name);
1da177e4 1647
ba9ad725
PS
1648 tcon = tlink_tcon(open_file->tlink);
1649 server = tcon->ses->server;
1650
1651 if (!server->ops->sync_write)
1652 return -ENOSYS;
50c2f753 1653
6d5786a3 1654 xid = get_xid();
1da177e4 1655
1da177e4
LT
1656 for (total_written = 0; write_size > total_written;
1657 total_written += bytes_written) {
1658 rc = -EAGAIN;
1659 while (rc == -EAGAIN) {
ca83ce3d
JL
1660 struct kvec iov[2];
1661 unsigned int len;
1662
1da177e4 1663 if (open_file->invalidHandle) {
1da177e4
LT
1664 /* we could deadlock if we called
1665 filemap_fdatawait from here so tell
fb8c4b14 1666 reopen_file not to flush data to
1da177e4 1667 server now */
15886177 1668 rc = cifs_reopen_file(open_file, false);
1da177e4
LT
1669 if (rc != 0)
1670 break;
1671 }
ca83ce3d
JL
1672
1673 len = min((size_t)cifs_sb->wsize,
1674 write_size - total_written);
1675 /* iov[0] is reserved for smb header */
1676 iov[1].iov_base = (char *)write_data + total_written;
1677 iov[1].iov_len = len;
fa2989f4 1678 io_parms.pid = pid;
ba9ad725
PS
1679 io_parms.tcon = tcon;
1680 io_parms.offset = *offset;
fa2989f4 1681 io_parms.length = len;
ba9ad725
PS
1682 rc = server->ops->sync_write(xid, open_file, &io_parms,
1683 &bytes_written, iov, 1);
1da177e4
LT
1684 }
1685 if (rc || (bytes_written == 0)) {
1686 if (total_written)
1687 break;
1688 else {
6d5786a3 1689 free_xid(xid);
1da177e4
LT
1690 return rc;
1691 }
fbec9ab9 1692 } else {
597b027f 1693 spin_lock(&dentry->d_inode->i_lock);
ba9ad725 1694 cifs_update_eof(cifsi, *offset, bytes_written);
597b027f 1695 spin_unlock(&dentry->d_inode->i_lock);
ba9ad725 1696 *offset += bytes_written;
fbec9ab9 1697 }
1da177e4
LT
1698 }
1699
ba9ad725 1700 cifs_stats_bytes_written(tcon, total_written);
1da177e4 1701
7da4b49a
JL
1702 if (total_written > 0) {
1703 spin_lock(&dentry->d_inode->i_lock);
ba9ad725
PS
1704 if (*offset > dentry->d_inode->i_size)
1705 i_size_write(dentry->d_inode, *offset);
7da4b49a 1706 spin_unlock(&dentry->d_inode->i_lock);
1da177e4 1707 }
7da4b49a 1708 mark_inode_dirty_sync(dentry->d_inode);
6d5786a3 1709 free_xid(xid);
1da177e4
LT
1710 return total_written;
1711}
1712
6508d904
JL
1713struct cifsFileInfo *find_readable_file(struct cifsInodeInfo *cifs_inode,
1714 bool fsuid_only)
630f3f0c
SF
1715{
1716 struct cifsFileInfo *open_file = NULL;
6508d904
JL
1717 struct cifs_sb_info *cifs_sb = CIFS_SB(cifs_inode->vfs_inode.i_sb);
1718
1719 /* only filter by fsuid on multiuser mounts */
1720 if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MULTIUSER))
1721 fsuid_only = false;
630f3f0c 1722
4477288a 1723 spin_lock(&cifs_file_list_lock);
630f3f0c
SF
1724 /* we could simply get the first_list_entry since write-only entries
1725 are always at the end of the list but since the first entry might
1726 have a close pending, we go through the whole list */
1727 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
fef59fd7 1728 if (fsuid_only && !uid_eq(open_file->uid, current_fsuid()))
6508d904 1729 continue;
2e396b83 1730 if (OPEN_FMODE(open_file->f_flags) & FMODE_READ) {
630f3f0c
SF
1731 if (!open_file->invalidHandle) {
1732 /* found a good file */
1733 /* lock it so it will not be closed on us */
764a1b1a 1734 cifsFileInfo_get_locked(open_file);
4477288a 1735 spin_unlock(&cifs_file_list_lock);
630f3f0c
SF
1736 return open_file;
1737 } /* else might as well continue, and look for
1738 another, or simply have the caller reopen it
1739 again rather than trying to fix this handle */
1740 } else /* write only file */
1741 break; /* write only files are last so must be done */
1742 }
4477288a 1743 spin_unlock(&cifs_file_list_lock);
630f3f0c
SF
1744 return NULL;
1745}
630f3f0c 1746
6508d904
JL
1747struct cifsFileInfo *find_writable_file(struct cifsInodeInfo *cifs_inode,
1748 bool fsuid_only)
6148a742 1749{
2c0c2a08 1750 struct cifsFileInfo *open_file, *inv_file = NULL;
d3892294 1751 struct cifs_sb_info *cifs_sb;
2846d386 1752 bool any_available = false;
dd99cd80 1753 int rc;
2c0c2a08 1754 unsigned int refind = 0;
6148a742 1755
60808233
SF
1756 /* Having a null inode here (because mapping->host was set to zero by
1757 the VFS or MM) should not happen but we had reports of on oops (due to
1758 it being zero) during stress testcases so we need to check for it */
1759
fb8c4b14 1760 if (cifs_inode == NULL) {
f96637be 1761 cifs_dbg(VFS, "Null inode passed to cifs_writeable_file\n");
60808233
SF
1762 dump_stack();
1763 return NULL;
1764 }
1765
d3892294
JL
1766 cifs_sb = CIFS_SB(cifs_inode->vfs_inode.i_sb);
1767
6508d904
JL
1768 /* only filter by fsuid on multiuser mounts */
1769 if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MULTIUSER))
1770 fsuid_only = false;
1771
4477288a 1772 spin_lock(&cifs_file_list_lock);
9b22b0b7 1773refind_writable:
2c0c2a08
SP
1774 if (refind > MAX_REOPEN_ATT) {
1775 spin_unlock(&cifs_file_list_lock);
1776 return NULL;
1777 }
6148a742 1778 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
6508d904
JL
1779 if (!any_available && open_file->pid != current->tgid)
1780 continue;
fef59fd7 1781 if (fsuid_only && !uid_eq(open_file->uid, current_fsuid()))
6148a742 1782 continue;
2e396b83 1783 if (OPEN_FMODE(open_file->f_flags) & FMODE_WRITE) {
9b22b0b7
SF
1784 if (!open_file->invalidHandle) {
1785 /* found a good writable file */
764a1b1a 1786 cifsFileInfo_get_locked(open_file);
4477288a 1787 spin_unlock(&cifs_file_list_lock);
9b22b0b7 1788 return open_file;
2c0c2a08
SP
1789 } else {
1790 if (!inv_file)
1791 inv_file = open_file;
9b22b0b7 1792 }
6148a742
SF
1793 }
1794 }
2846d386
JL
1795 /* couldn't find useable FH with same pid, try any available */
1796 if (!any_available) {
1797 any_available = true;
1798 goto refind_writable;
1799 }
2c0c2a08
SP
1800
1801 if (inv_file) {
1802 any_available = false;
764a1b1a 1803 cifsFileInfo_get_locked(inv_file);
2c0c2a08
SP
1804 }
1805
4477288a 1806 spin_unlock(&cifs_file_list_lock);
2c0c2a08
SP
1807
1808 if (inv_file) {
1809 rc = cifs_reopen_file(inv_file, false);
1810 if (!rc)
1811 return inv_file;
1812 else {
1813 spin_lock(&cifs_file_list_lock);
1814 list_move_tail(&inv_file->flist,
1815 &cifs_inode->openFileList);
1816 spin_unlock(&cifs_file_list_lock);
1817 cifsFileInfo_put(inv_file);
1818 spin_lock(&cifs_file_list_lock);
1819 ++refind;
1820 goto refind_writable;
1821 }
1822 }
1823
6148a742
SF
1824 return NULL;
1825}
1826
1da177e4
LT
1827static int cifs_partialpagewrite(struct page *page, unsigned from, unsigned to)
1828{
1829 struct address_space *mapping = page->mapping;
1830 loff_t offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
1831 char *write_data;
1832 int rc = -EFAULT;
1833 int bytes_written = 0;
1da177e4 1834 struct inode *inode;
6148a742 1835 struct cifsFileInfo *open_file;
1da177e4
LT
1836
1837 if (!mapping || !mapping->host)
1838 return -EFAULT;
1839
1840 inode = page->mapping->host;
1da177e4
LT
1841
1842 offset += (loff_t)from;
1843 write_data = kmap(page);
1844 write_data += from;
1845
1846 if ((to > PAGE_CACHE_SIZE) || (from > to)) {
1847 kunmap(page);
1848 return -EIO;
1849 }
1850
1851 /* racing with truncate? */
1852 if (offset > mapping->host->i_size) {
1853 kunmap(page);
1854 return 0; /* don't care */
1855 }
1856
1857 /* check to make sure that we are not extending the file */
1858 if (mapping->host->i_size - offset < (loff_t)to)
fb8c4b14 1859 to = (unsigned)(mapping->host->i_size - offset);
1da177e4 1860
6508d904 1861 open_file = find_writable_file(CIFS_I(mapping->host), false);
6148a742 1862 if (open_file) {
fa2989f4
PS
1863 bytes_written = cifs_write(open_file, open_file->pid,
1864 write_data, to - from, &offset);
6ab409b5 1865 cifsFileInfo_put(open_file);
1da177e4 1866 /* Does mm or vfs already set times? */
6148a742 1867 inode->i_atime = inode->i_mtime = current_fs_time(inode->i_sb);
bb5a9a04 1868 if ((bytes_written > 0) && (offset))
6148a742 1869 rc = 0;
bb5a9a04
SF
1870 else if (bytes_written < 0)
1871 rc = bytes_written;
6148a742 1872 } else {
f96637be 1873 cifs_dbg(FYI, "No writeable filehandles for inode\n");
1da177e4
LT
1874 rc = -EIO;
1875 }
1876
1877 kunmap(page);
1878 return rc;
1879}
1880
1da177e4 1881static int cifs_writepages(struct address_space *mapping,
37c0eb46 1882 struct writeback_control *wbc)
1da177e4 1883{
c3d17b63
JL
1884 struct cifs_sb_info *cifs_sb = CIFS_SB(mapping->host->i_sb);
1885 bool done = false, scanned = false, range_whole = false;
1886 pgoff_t end, index;
1887 struct cifs_writedata *wdata;
c9de5c80 1888 struct TCP_Server_Info *server;
37c0eb46 1889 struct page *page;
37c0eb46 1890 int rc = 0;
50c2f753 1891
37c0eb46 1892 /*
c3d17b63 1893 * If wsize is smaller than the page cache size, default to writing
37c0eb46
SF
1894 * one page at a time via cifs_writepage
1895 */
1896 if (cifs_sb->wsize < PAGE_CACHE_SIZE)
1897 return generic_writepages(mapping, wbc);
1898
111ebb6e 1899 if (wbc->range_cyclic) {
37c0eb46 1900 index = mapping->writeback_index; /* Start from prev offset */
111ebb6e
OH
1901 end = -1;
1902 } else {
1903 index = wbc->range_start >> PAGE_CACHE_SHIFT;
1904 end = wbc->range_end >> PAGE_CACHE_SHIFT;
1905 if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
c3d17b63
JL
1906 range_whole = true;
1907 scanned = true;
37c0eb46
SF
1908 }
1909retry:
c3d17b63
JL
1910 while (!done && index <= end) {
1911 unsigned int i, nr_pages, found_pages;
1912 pgoff_t next = 0, tofind;
1913 struct page **pages;
1914
1915 tofind = min((cifs_sb->wsize / PAGE_CACHE_SIZE) - 1,
1916 end - index) + 1;
1917
c2e87640
JL
1918 wdata = cifs_writedata_alloc((unsigned int)tofind,
1919 cifs_writev_complete);
c3d17b63
JL
1920 if (!wdata) {
1921 rc = -ENOMEM;
1922 break;
1923 }
1924
1925 /*
1926 * find_get_pages_tag seems to return a max of 256 on each
1927 * iteration, so we must call it several times in order to
1928 * fill the array or the wsize is effectively limited to
1929 * 256 * PAGE_CACHE_SIZE.
1930 */
1931 found_pages = 0;
1932 pages = wdata->pages;
1933 do {
1934 nr_pages = find_get_pages_tag(mapping, &index,
1935 PAGECACHE_TAG_DIRTY,
1936 tofind, pages);
1937 found_pages += nr_pages;
1938 tofind -= nr_pages;
1939 pages += nr_pages;
1940 } while (nr_pages && tofind && index <= end);
1941
1942 if (found_pages == 0) {
1943 kref_put(&wdata->refcount, cifs_writedata_release);
1944 break;
1945 }
1946
1947 nr_pages = 0;
1948 for (i = 0; i < found_pages; i++) {
1949 page = wdata->pages[i];
37c0eb46
SF
1950 /*
1951 * At this point we hold neither mapping->tree_lock nor
1952 * lock on the page itself: the page may be truncated or
1953 * invalidated (changing page->mapping to NULL), or even
1954 * swizzled back from swapper_space to tmpfs file
1955 * mapping
1956 */
1957
c3d17b63 1958 if (nr_pages == 0)
37c0eb46 1959 lock_page(page);
529ae9aa 1960 else if (!trylock_page(page))
37c0eb46
SF
1961 break;
1962
1963 if (unlikely(page->mapping != mapping)) {
1964 unlock_page(page);
1965 break;
1966 }
1967
111ebb6e 1968 if (!wbc->range_cyclic && page->index > end) {
c3d17b63 1969 done = true;
37c0eb46
SF
1970 unlock_page(page);
1971 break;
1972 }
1973
1974 if (next && (page->index != next)) {
1975 /* Not next consecutive page */
1976 unlock_page(page);
1977 break;
1978 }
1979
1980 if (wbc->sync_mode != WB_SYNC_NONE)
1981 wait_on_page_writeback(page);
1982
1983 if (PageWriteback(page) ||
cb876f45 1984 !clear_page_dirty_for_io(page)) {
37c0eb46
SF
1985 unlock_page(page);
1986 break;
1987 }
84d2f07e 1988
cb876f45
LT
1989 /*
1990 * This actually clears the dirty bit in the radix tree.
1991 * See cifs_writepage() for more commentary.
1992 */
1993 set_page_writeback(page);
1994
3a98b861 1995 if (page_offset(page) >= i_size_read(mapping->host)) {
c3d17b63 1996 done = true;
84d2f07e 1997 unlock_page(page);
cb876f45 1998 end_page_writeback(page);
84d2f07e
SF
1999 break;
2000 }
2001
c3d17b63
JL
2002 wdata->pages[i] = page;
2003 next = page->index + 1;
2004 ++nr_pages;
2005 }
37c0eb46 2006
c3d17b63
JL
2007 /* reset index to refind any pages skipped */
2008 if (nr_pages == 0)
2009 index = wdata->pages[0]->index + 1;
84d2f07e 2010
c3d17b63
JL
2011 /* put any pages we aren't going to use */
2012 for (i = nr_pages; i < found_pages; i++) {
2013 page_cache_release(wdata->pages[i]);
2014 wdata->pages[i] = NULL;
2015 }
37c0eb46 2016
c3d17b63
JL
2017 /* nothing to write? */
2018 if (nr_pages == 0) {
2019 kref_put(&wdata->refcount, cifs_writedata_release);
2020 continue;
37c0eb46 2021 }
fbec9ab9 2022
c3d17b63
JL
2023 wdata->sync_mode = wbc->sync_mode;
2024 wdata->nr_pages = nr_pages;
2025 wdata->offset = page_offset(wdata->pages[0]);
eddb079d
JL
2026 wdata->pagesz = PAGE_CACHE_SIZE;
2027 wdata->tailsz =
3a98b861
JL
2028 min(i_size_read(mapping->host) -
2029 page_offset(wdata->pages[nr_pages - 1]),
eddb079d
JL
2030 (loff_t)PAGE_CACHE_SIZE);
2031 wdata->bytes = ((nr_pages - 1) * PAGE_CACHE_SIZE) +
2032 wdata->tailsz;
941b853d 2033
c3d17b63
JL
2034 do {
2035 if (wdata->cfile != NULL)
2036 cifsFileInfo_put(wdata->cfile);
2037 wdata->cfile = find_writable_file(CIFS_I(mapping->host),
2038 false);
2039 if (!wdata->cfile) {
f96637be 2040 cifs_dbg(VFS, "No writable handles for inode\n");
c3d17b63
JL
2041 rc = -EBADF;
2042 break;
941b853d 2043 }
fe5f5d2e 2044 wdata->pid = wdata->cfile->pid;
c9de5c80 2045 server = tlink_tcon(wdata->cfile->tlink)->ses->server;
4a5c80d7
SF
2046 rc = server->ops->async_writev(wdata,
2047 cifs_writedata_release);
c3d17b63 2048 } while (wbc->sync_mode == WB_SYNC_ALL && rc == -EAGAIN);
941b853d 2049
c3d17b63
JL
2050 for (i = 0; i < nr_pages; ++i)
2051 unlock_page(wdata->pages[i]);
f3983c21 2052
c3d17b63
JL
2053 /* send failure -- clean up the mess */
2054 if (rc != 0) {
2055 for (i = 0; i < nr_pages; ++i) {
941b853d 2056 if (rc == -EAGAIN)
c3d17b63
JL
2057 redirty_page_for_writepage(wbc,
2058 wdata->pages[i]);
2059 else
2060 SetPageError(wdata->pages[i]);
2061 end_page_writeback(wdata->pages[i]);
2062 page_cache_release(wdata->pages[i]);
37c0eb46 2063 }
941b853d
JL
2064 if (rc != -EAGAIN)
2065 mapping_set_error(mapping, rc);
c3d17b63
JL
2066 }
2067 kref_put(&wdata->refcount, cifs_writedata_release);
941b853d 2068
c3d17b63
JL
2069 wbc->nr_to_write -= nr_pages;
2070 if (wbc->nr_to_write <= 0)
2071 done = true;
b066a48c 2072
c3d17b63 2073 index = next;
37c0eb46 2074 }
c3d17b63 2075
37c0eb46
SF
2076 if (!scanned && !done) {
2077 /*
2078 * We hit the last page and there is more work to be done: wrap
2079 * back to the start of the file
2080 */
c3d17b63 2081 scanned = true;
37c0eb46
SF
2082 index = 0;
2083 goto retry;
2084 }
c3d17b63 2085
111ebb6e 2086 if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
37c0eb46
SF
2087 mapping->writeback_index = index;
2088
1da177e4
LT
2089 return rc;
2090}
1da177e4 2091
9ad1506b
PS
2092static int
2093cifs_writepage_locked(struct page *page, struct writeback_control *wbc)
1da177e4 2094{
9ad1506b 2095 int rc;
6d5786a3 2096 unsigned int xid;
1da177e4 2097
6d5786a3 2098 xid = get_xid();
1da177e4
LT
2099/* BB add check for wbc flags */
2100 page_cache_get(page);
ad7a2926 2101 if (!PageUptodate(page))
f96637be 2102 cifs_dbg(FYI, "ppw - page not up to date\n");
cb876f45
LT
2103
2104 /*
2105 * Set the "writeback" flag, and clear "dirty" in the radix tree.
2106 *
2107 * A writepage() implementation always needs to do either this,
2108 * or re-dirty the page with "redirty_page_for_writepage()" in
2109 * the case of a failure.
2110 *
2111 * Just unlocking the page will cause the radix tree tag-bits
2112 * to fail to update with the state of the page correctly.
2113 */
fb8c4b14 2114 set_page_writeback(page);
9ad1506b 2115retry_write:
1da177e4 2116 rc = cifs_partialpagewrite(page, 0, PAGE_CACHE_SIZE);
9ad1506b
PS
2117 if (rc == -EAGAIN && wbc->sync_mode == WB_SYNC_ALL)
2118 goto retry_write;
2119 else if (rc == -EAGAIN)
2120 redirty_page_for_writepage(wbc, page);
2121 else if (rc != 0)
2122 SetPageError(page);
2123 else
2124 SetPageUptodate(page);
cb876f45
LT
2125 end_page_writeback(page);
2126 page_cache_release(page);
6d5786a3 2127 free_xid(xid);
1da177e4
LT
2128 return rc;
2129}
2130
9ad1506b
PS
2131static int cifs_writepage(struct page *page, struct writeback_control *wbc)
2132{
2133 int rc = cifs_writepage_locked(page, wbc);
2134 unlock_page(page);
2135 return rc;
2136}
2137
d9414774
NP
2138static int cifs_write_end(struct file *file, struct address_space *mapping,
2139 loff_t pos, unsigned len, unsigned copied,
2140 struct page *page, void *fsdata)
1da177e4 2141{
d9414774
NP
2142 int rc;
2143 struct inode *inode = mapping->host;
d4ffff1f
PS
2144 struct cifsFileInfo *cfile = file->private_data;
2145 struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
2146 __u32 pid;
2147
2148 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
2149 pid = cfile->pid;
2150 else
2151 pid = current->tgid;
1da177e4 2152
f96637be 2153 cifs_dbg(FYI, "write_end for page %p from pos %lld with %d bytes\n",
b6b38f70 2154 page, pos, copied);
d9414774 2155
a98ee8c1
JL
2156 if (PageChecked(page)) {
2157 if (copied == len)
2158 SetPageUptodate(page);
2159 ClearPageChecked(page);
2160 } else if (!PageUptodate(page) && copied == PAGE_CACHE_SIZE)
d9414774 2161 SetPageUptodate(page);
ad7a2926 2162
1da177e4 2163 if (!PageUptodate(page)) {
d9414774
NP
2164 char *page_data;
2165 unsigned offset = pos & (PAGE_CACHE_SIZE - 1);
6d5786a3 2166 unsigned int xid;
d9414774 2167
6d5786a3 2168 xid = get_xid();
1da177e4
LT
2169 /* this is probably better than directly calling
2170 partialpage_write since in this function the file handle is
2171 known which we might as well leverage */
2172 /* BB check if anything else missing out of ppw
2173 such as updating last write time */
2174 page_data = kmap(page);
d4ffff1f 2175 rc = cifs_write(cfile, pid, page_data + offset, copied, &pos);
d9414774 2176 /* if (rc < 0) should we set writebehind rc? */
1da177e4 2177 kunmap(page);
d9414774 2178
6d5786a3 2179 free_xid(xid);
fb8c4b14 2180 } else {
d9414774
NP
2181 rc = copied;
2182 pos += copied;
ca8aa29c 2183 set_page_dirty(page);
1da177e4
LT
2184 }
2185
d9414774
NP
2186 if (rc > 0) {
2187 spin_lock(&inode->i_lock);
2188 if (pos > inode->i_size)
2189 i_size_write(inode, pos);
2190 spin_unlock(&inode->i_lock);
2191 }
2192
2193 unlock_page(page);
2194 page_cache_release(page);
2195
1da177e4
LT
2196 return rc;
2197}
2198
02c24a82
JB
2199int cifs_strict_fsync(struct file *file, loff_t start, loff_t end,
2200 int datasync)
1da177e4 2201{
6d5786a3 2202 unsigned int xid;
1da177e4 2203 int rc = 0;
96daf2b0 2204 struct cifs_tcon *tcon;
1d8c4c00 2205 struct TCP_Server_Info *server;
c21dfb69 2206 struct cifsFileInfo *smbfile = file->private_data;
496ad9aa 2207 struct inode *inode = file_inode(file);
8be7e6ba 2208 struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
1da177e4 2209
02c24a82
JB
2210 rc = filemap_write_and_wait_range(inode->i_mapping, start, end);
2211 if (rc)
2212 return rc;
2213 mutex_lock(&inode->i_mutex);
2214
6d5786a3 2215 xid = get_xid();
1da177e4 2216
f96637be
JP
2217 cifs_dbg(FYI, "Sync file - name: %s datasync: 0x%x\n",
2218 file->f_path.dentry->d_name.name, datasync);
50c2f753 2219
18cceb6a 2220 if (!CIFS_CACHE_READ(CIFS_I(inode))) {
6feb9891
PS
2221 rc = cifs_invalidate_mapping(inode);
2222 if (rc) {
f96637be 2223 cifs_dbg(FYI, "rc: %d during invalidate phase\n", rc);
6feb9891
PS
2224 rc = 0; /* don't care about it in fsync */
2225 }
2226 }
eb4b756b 2227
8be7e6ba 2228 tcon = tlink_tcon(smbfile->tlink);
1d8c4c00
PS
2229 if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOSSYNC)) {
2230 server = tcon->ses->server;
2231 if (server->ops->flush)
2232 rc = server->ops->flush(xid, tcon, &smbfile->fid);
2233 else
2234 rc = -ENOSYS;
2235 }
8be7e6ba 2236
6d5786a3 2237 free_xid(xid);
02c24a82 2238 mutex_unlock(&inode->i_mutex);
8be7e6ba
PS
2239 return rc;
2240}
2241
02c24a82 2242int cifs_fsync(struct file *file, loff_t start, loff_t end, int datasync)
8be7e6ba 2243{
6d5786a3 2244 unsigned int xid;
8be7e6ba 2245 int rc = 0;
96daf2b0 2246 struct cifs_tcon *tcon;
1d8c4c00 2247 struct TCP_Server_Info *server;
8be7e6ba
PS
2248 struct cifsFileInfo *smbfile = file->private_data;
2249 struct cifs_sb_info *cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
02c24a82
JB
2250 struct inode *inode = file->f_mapping->host;
2251
2252 rc = filemap_write_and_wait_range(inode->i_mapping, start, end);
2253 if (rc)
2254 return rc;
2255 mutex_lock(&inode->i_mutex);
8be7e6ba 2256
6d5786a3 2257 xid = get_xid();
8be7e6ba 2258
f96637be
JP
2259 cifs_dbg(FYI, "Sync file - name: %s datasync: 0x%x\n",
2260 file->f_path.dentry->d_name.name, datasync);
8be7e6ba
PS
2261
2262 tcon = tlink_tcon(smbfile->tlink);
1d8c4c00
PS
2263 if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOSSYNC)) {
2264 server = tcon->ses->server;
2265 if (server->ops->flush)
2266 rc = server->ops->flush(xid, tcon, &smbfile->fid);
2267 else
2268 rc = -ENOSYS;
2269 }
b298f223 2270
6d5786a3 2271 free_xid(xid);
02c24a82 2272 mutex_unlock(&inode->i_mutex);
1da177e4
LT
2273 return rc;
2274}
2275
1da177e4
LT
2276/*
2277 * As file closes, flush all cached write data for this inode checking
2278 * for write behind errors.
2279 */
75e1fcc0 2280int cifs_flush(struct file *file, fl_owner_t id)
1da177e4 2281{
496ad9aa 2282 struct inode *inode = file_inode(file);
1da177e4
LT
2283 int rc = 0;
2284
eb4b756b 2285 if (file->f_mode & FMODE_WRITE)
d3f1322a 2286 rc = filemap_write_and_wait(inode->i_mapping);
50c2f753 2287
f96637be 2288 cifs_dbg(FYI, "Flush inode %p file %p rc %d\n", inode, file, rc);
1da177e4
LT
2289
2290 return rc;
2291}
2292
72432ffc
PS
2293static int
2294cifs_write_allocate_pages(struct page **pages, unsigned long num_pages)
2295{
2296 int rc = 0;
2297 unsigned long i;
2298
2299 for (i = 0; i < num_pages; i++) {
e94f7ba1 2300 pages[i] = alloc_page(GFP_KERNEL|__GFP_HIGHMEM);
72432ffc
PS
2301 if (!pages[i]) {
2302 /*
2303 * save number of pages we have already allocated and
2304 * return with ENOMEM error
2305 */
2306 num_pages = i;
2307 rc = -ENOMEM;
e94f7ba1 2308 break;
72432ffc
PS
2309 }
2310 }
2311
e94f7ba1
JL
2312 if (rc) {
2313 for (i = 0; i < num_pages; i++)
2314 put_page(pages[i]);
2315 }
72432ffc
PS
2316 return rc;
2317}
2318
2319static inline
2320size_t get_numpages(const size_t wsize, const size_t len, size_t *cur_len)
2321{
2322 size_t num_pages;
2323 size_t clen;
2324
2325 clen = min_t(const size_t, len, wsize);
a7103b99 2326 num_pages = DIV_ROUND_UP(clen, PAGE_SIZE);
72432ffc
PS
2327
2328 if (cur_len)
2329 *cur_len = clen;
2330
2331 return num_pages;
2332}
2333
da82f7e7 2334static void
4a5c80d7 2335cifs_uncached_writedata_release(struct kref *refcount)
da82f7e7
JL
2336{
2337 int i;
4a5c80d7
SF
2338 struct cifs_writedata *wdata = container_of(refcount,
2339 struct cifs_writedata, refcount);
2340
2341 for (i = 0; i < wdata->nr_pages; i++)
2342 put_page(wdata->pages[i]);
2343 cifs_writedata_release(refcount);
2344}
2345
2346static void
2347cifs_uncached_writev_complete(struct work_struct *work)
2348{
da82f7e7
JL
2349 struct cifs_writedata *wdata = container_of(work,
2350 struct cifs_writedata, work);
2351 struct inode *inode = wdata->cfile->dentry->d_inode;
2352 struct cifsInodeInfo *cifsi = CIFS_I(inode);
2353
2354 spin_lock(&inode->i_lock);
2355 cifs_update_eof(cifsi, wdata->offset, wdata->bytes);
2356 if (cifsi->server_eof > inode->i_size)
2357 i_size_write(inode, cifsi->server_eof);
2358 spin_unlock(&inode->i_lock);
2359
2360 complete(&wdata->done);
2361
4a5c80d7 2362 kref_put(&wdata->refcount, cifs_uncached_writedata_release);
da82f7e7
JL
2363}
2364
2365/* attempt to send write to server, retry on any -EAGAIN errors */
2366static int
2367cifs_uncached_retry_writev(struct cifs_writedata *wdata)
2368{
2369 int rc;
c9de5c80
PS
2370 struct TCP_Server_Info *server;
2371
2372 server = tlink_tcon(wdata->cfile->tlink)->ses->server;
da82f7e7
JL
2373
2374 do {
2375 if (wdata->cfile->invalidHandle) {
2376 rc = cifs_reopen_file(wdata->cfile, false);
2377 if (rc != 0)
2378 continue;
2379 }
4a5c80d7
SF
2380 rc = server->ops->async_writev(wdata,
2381 cifs_uncached_writedata_release);
da82f7e7
JL
2382 } while (rc == -EAGAIN);
2383
2384 return rc;
2385}
2386
72432ffc
PS
2387static ssize_t
2388cifs_iovec_write(struct file *file, const struct iovec *iov,
2389 unsigned long nr_segs, loff_t *poffset)
2390{
da82f7e7 2391 unsigned long nr_pages, i;
5d81de8e 2392 size_t bytes, copied, len, cur_len;
76429c14 2393 ssize_t total_written = 0;
3af9d8f2 2394 loff_t offset;
72432ffc 2395 struct iov_iter it;
72432ffc 2396 struct cifsFileInfo *open_file;
da82f7e7 2397 struct cifs_tcon *tcon;
72432ffc 2398 struct cifs_sb_info *cifs_sb;
da82f7e7
JL
2399 struct cifs_writedata *wdata, *tmp;
2400 struct list_head wdata_list;
2401 int rc;
2402 pid_t pid;
72432ffc
PS
2403
2404 len = iov_length(iov, nr_segs);
2405 if (!len)
2406 return 0;
2407
2408 rc = generic_write_checks(file, poffset, &len, 0);
2409 if (rc)
2410 return rc;
2411
da82f7e7 2412 INIT_LIST_HEAD(&wdata_list);
72432ffc 2413 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
72432ffc 2414 open_file = file->private_data;
da82f7e7 2415 tcon = tlink_tcon(open_file->tlink);
c9de5c80
PS
2416
2417 if (!tcon->ses->server->ops->async_writev)
2418 return -ENOSYS;
2419
3af9d8f2 2420 offset = *poffset;
d4ffff1f
PS
2421
2422 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
2423 pid = open_file->pid;
2424 else
2425 pid = current->tgid;
2426
72432ffc 2427 iov_iter_init(&it, iov, nr_segs, len, 0);
72432ffc 2428 do {
da82f7e7
JL
2429 size_t save_len;
2430
2431 nr_pages = get_numpages(cifs_sb->wsize, len, &cur_len);
2432 wdata = cifs_writedata_alloc(nr_pages,
2433 cifs_uncached_writev_complete);
2434 if (!wdata) {
2435 rc = -ENOMEM;
2436 break;
2437 }
2438
2439 rc = cifs_write_allocate_pages(wdata->pages, nr_pages);
2440 if (rc) {
2441 kfree(wdata);
2442 break;
2443 }
2444
2445 save_len = cur_len;
2446 for (i = 0; i < nr_pages; i++) {
5d81de8e 2447 bytes = min_t(const size_t, cur_len, PAGE_SIZE);
da82f7e7 2448 copied = iov_iter_copy_from_user(wdata->pages[i], &it,
5d81de8e 2449 0, bytes);
72432ffc
PS
2450 cur_len -= copied;
2451 iov_iter_advance(&it, copied);
5d81de8e
JL
2452 /*
2453 * If we didn't copy as much as we expected, then that
2454 * may mean we trod into an unmapped area. Stop copying
2455 * at that point. On the next pass through the big
2456 * loop, we'll likely end up getting a zero-length
2457 * write and bailing out of it.
2458 */
2459 if (copied < bytes)
2460 break;
72432ffc 2461 }
72432ffc
PS
2462 cur_len = save_len - cur_len;
2463
5d81de8e
JL
2464 /*
2465 * If we have no data to send, then that probably means that
2466 * the copy above failed altogether. That's most likely because
2467 * the address in the iovec was bogus. Set the rc to -EFAULT,
2468 * free anything we allocated and bail out.
2469 */
2470 if (!cur_len) {
2471 for (i = 0; i < nr_pages; i++)
2472 put_page(wdata->pages[i]);
2473 kfree(wdata);
2474 rc = -EFAULT;
2475 break;
2476 }
2477
2478 /*
2479 * i + 1 now represents the number of pages we actually used in
2480 * the copy phase above. Bring nr_pages down to that, and free
2481 * any pages that we didn't use.
2482 */
2483 for ( ; nr_pages > i + 1; nr_pages--)
2484 put_page(wdata->pages[nr_pages - 1]);
2485
da82f7e7
JL
2486 wdata->sync_mode = WB_SYNC_ALL;
2487 wdata->nr_pages = nr_pages;
2488 wdata->offset = (__u64)offset;
2489 wdata->cfile = cifsFileInfo_get(open_file);
2490 wdata->pid = pid;
2491 wdata->bytes = cur_len;
eddb079d
JL
2492 wdata->pagesz = PAGE_SIZE;
2493 wdata->tailsz = cur_len - ((nr_pages - 1) * PAGE_SIZE);
da82f7e7
JL
2494 rc = cifs_uncached_retry_writev(wdata);
2495 if (rc) {
4a5c80d7
SF
2496 kref_put(&wdata->refcount,
2497 cifs_uncached_writedata_release);
72432ffc
PS
2498 break;
2499 }
2500
da82f7e7
JL
2501 list_add_tail(&wdata->list, &wdata_list);
2502 offset += cur_len;
2503 len -= cur_len;
72432ffc
PS
2504 } while (len > 0);
2505
da82f7e7
JL
2506 /*
2507 * If at least one write was successfully sent, then discard any rc
2508 * value from the later writes. If the other write succeeds, then
2509 * we'll end up returning whatever was written. If it fails, then
2510 * we'll get a new rc value from that.
2511 */
2512 if (!list_empty(&wdata_list))
2513 rc = 0;
2514
2515 /*
2516 * Wait for and collect replies for any successful sends in order of
2517 * increasing offset. Once an error is hit or we get a fatal signal
2518 * while waiting, then return without waiting for any more replies.
2519 */
2520restart_loop:
2521 list_for_each_entry_safe(wdata, tmp, &wdata_list, list) {
2522 if (!rc) {
2523 /* FIXME: freezable too? */
2524 rc = wait_for_completion_killable(&wdata->done);
2525 if (rc)
2526 rc = -EINTR;
2527 else if (wdata->result)
2528 rc = wdata->result;
2529 else
2530 total_written += wdata->bytes;
2531
2532 /* resend call if it's a retryable error */
2533 if (rc == -EAGAIN) {
2534 rc = cifs_uncached_retry_writev(wdata);
2535 goto restart_loop;
2536 }
2537 }
2538 list_del_init(&wdata->list);
4a5c80d7 2539 kref_put(&wdata->refcount, cifs_uncached_writedata_release);
72432ffc
PS
2540 }
2541
da82f7e7
JL
2542 if (total_written > 0)
2543 *poffset += total_written;
72432ffc 2544
da82f7e7
JL
2545 cifs_stats_bytes_written(tcon, total_written);
2546 return total_written ? total_written : (ssize_t)rc;
72432ffc
PS
2547}
2548
0b81c1c4 2549ssize_t cifs_user_writev(struct kiocb *iocb, const struct iovec *iov,
72432ffc
PS
2550 unsigned long nr_segs, loff_t pos)
2551{
2552 ssize_t written;
2553 struct inode *inode;
2554
496ad9aa 2555 inode = file_inode(iocb->ki_filp);
72432ffc
PS
2556
2557 /*
2558 * BB - optimize the way when signing is disabled. We can drop this
2559 * extra memory-to-memory copying and use iovec buffers for constructing
2560 * write request.
2561 */
2562
2563 written = cifs_iovec_write(iocb->ki_filp, iov, nr_segs, &pos);
2564 if (written > 0) {
2565 CIFS_I(inode)->invalid_mapping = true;
2566 iocb->ki_pos = pos;
2567 }
2568
2569 return written;
2570}
2571
579f9053 2572static ssize_t
ca8aa29c
PS
2573cifs_writev(struct kiocb *iocb, const struct iovec *iov,
2574 unsigned long nr_segs, loff_t pos)
72432ffc 2575{
579f9053
PS
2576 struct file *file = iocb->ki_filp;
2577 struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
2578 struct inode *inode = file->f_mapping->host;
2579 struct cifsInodeInfo *cinode = CIFS_I(inode);
2580 struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
2581 ssize_t rc = -EACCES;
6b1168e1 2582 loff_t lock_pos = pos;
72432ffc 2583
6b1168e1
PS
2584 if (file->f_flags & O_APPEND)
2585 lock_pos = i_size_read(inode);
579f9053
PS
2586 /*
2587 * We need to hold the sem to be sure nobody modifies lock list
2588 * with a brlock that prevents writing.
2589 */
2590 down_read(&cinode->lock_sem);
6b1168e1 2591 if (!cifs_find_lock_conflict(cfile, lock_pos, iov_length(iov, nr_segs),
579f9053 2592 server->vals->exclusive_lock_type, NULL,
6b1168e1
PS
2593 CIFS_WRITE_OP))
2594 rc = generic_file_aio_write(iocb, iov, nr_segs, pos);
579f9053 2595 up_read(&cinode->lock_sem);
579f9053
PS
2596 return rc;
2597}
2598
2599ssize_t
2600cifs_strict_writev(struct kiocb *iocb, const struct iovec *iov,
2601 unsigned long nr_segs, loff_t pos)
2602{
496ad9aa 2603 struct inode *inode = file_inode(iocb->ki_filp);
579f9053
PS
2604 struct cifsInodeInfo *cinode = CIFS_I(inode);
2605 struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
2606 struct cifsFileInfo *cfile = (struct cifsFileInfo *)
2607 iocb->ki_filp->private_data;
2608 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
88cf75aa 2609 ssize_t written;
ca8aa29c 2610
18cceb6a 2611 if (CIFS_CACHE_WRITE(cinode)) {
88cf75aa
PS
2612 if (cap_unix(tcon->ses) &&
2613 (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability))
2614 && ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
2615 return generic_file_aio_write(iocb, iov, nr_segs, pos);
2616 return cifs_writev(iocb, iov, nr_segs, pos);
25078105 2617 }
25078105 2618 /*
ca8aa29c
PS
2619 * For non-oplocked files in strict cache mode we need to write the data
2620 * to the server exactly from the pos to pos+len-1 rather than flush all
2621 * affected pages because it may cause a error with mandatory locks on
2622 * these pages but not on the region from pos to ppos+len-1.
72432ffc 2623 */
88cf75aa 2624 written = cifs_user_writev(iocb, iov, nr_segs, pos);
18cceb6a 2625 if (written > 0 && CIFS_CACHE_READ(cinode)) {
88cf75aa
PS
2626 /*
2627 * Windows 7 server can delay breaking level2 oplock if a write
2628 * request comes - break it on the client to prevent reading
2629 * an old data.
2630 */
2631 cifs_invalidate_mapping(inode);
f96637be
JP
2632 cifs_dbg(FYI, "Set no oplock for inode=%p after a write operation\n",
2633 inode);
18cceb6a 2634 cinode->oplock = 0;
88cf75aa
PS
2635 }
2636 return written;
72432ffc
PS
2637}
2638
0471ca3f 2639static struct cifs_readdata *
f4e49cd2 2640cifs_readdata_alloc(unsigned int nr_pages, work_func_t complete)
0471ca3f
JL
2641{
2642 struct cifs_readdata *rdata;
f4e49cd2 2643
c5fab6f4
JL
2644 rdata = kzalloc(sizeof(*rdata) + (sizeof(struct page *) * nr_pages),
2645 GFP_KERNEL);
0471ca3f 2646 if (rdata != NULL) {
6993f74a 2647 kref_init(&rdata->refcount);
1c892549
JL
2648 INIT_LIST_HEAD(&rdata->list);
2649 init_completion(&rdata->done);
0471ca3f 2650 INIT_WORK(&rdata->work, complete);
0471ca3f 2651 }
f4e49cd2 2652
0471ca3f
JL
2653 return rdata;
2654}
2655
6993f74a
JL
2656void
2657cifs_readdata_release(struct kref *refcount)
0471ca3f 2658{
6993f74a
JL
2659 struct cifs_readdata *rdata = container_of(refcount,
2660 struct cifs_readdata, refcount);
2661
2662 if (rdata->cfile)
2663 cifsFileInfo_put(rdata->cfile);
2664
0471ca3f
JL
2665 kfree(rdata);
2666}
2667
1c892549 2668static int
c5fab6f4 2669cifs_read_allocate_pages(struct cifs_readdata *rdata, unsigned int nr_pages)
1c892549
JL
2670{
2671 int rc = 0;
c5fab6f4 2672 struct page *page;
1c892549
JL
2673 unsigned int i;
2674
c5fab6f4 2675 for (i = 0; i < nr_pages; i++) {
1c892549
JL
2676 page = alloc_page(GFP_KERNEL|__GFP_HIGHMEM);
2677 if (!page) {
2678 rc = -ENOMEM;
2679 break;
2680 }
c5fab6f4 2681 rdata->pages[i] = page;
1c892549
JL
2682 }
2683
2684 if (rc) {
c5fab6f4
JL
2685 for (i = 0; i < nr_pages; i++) {
2686 put_page(rdata->pages[i]);
2687 rdata->pages[i] = NULL;
1c892549
JL
2688 }
2689 }
2690 return rc;
2691}
2692
2693static void
2694cifs_uncached_readdata_release(struct kref *refcount)
2695{
1c892549
JL
2696 struct cifs_readdata *rdata = container_of(refcount,
2697 struct cifs_readdata, refcount);
c5fab6f4 2698 unsigned int i;
1c892549 2699
c5fab6f4
JL
2700 for (i = 0; i < rdata->nr_pages; i++) {
2701 put_page(rdata->pages[i]);
2702 rdata->pages[i] = NULL;
1c892549
JL
2703 }
2704 cifs_readdata_release(refcount);
2705}
2706
2a1bb138
JL
2707static int
2708cifs_retry_async_readv(struct cifs_readdata *rdata)
2709{
2710 int rc;
fc9c5966
PS
2711 struct TCP_Server_Info *server;
2712
2713 server = tlink_tcon(rdata->cfile->tlink)->ses->server;
2a1bb138
JL
2714
2715 do {
2716 if (rdata->cfile->invalidHandle) {
2717 rc = cifs_reopen_file(rdata->cfile, true);
2718 if (rc != 0)
2719 continue;
2720 }
fc9c5966 2721 rc = server->ops->async_readv(rdata);
2a1bb138
JL
2722 } while (rc == -EAGAIN);
2723
2724 return rc;
2725}
2726
1c892549
JL
2727/**
2728 * cifs_readdata_to_iov - copy data from pages in response to an iovec
2729 * @rdata: the readdata response with list of pages holding data
2730 * @iov: vector in which we should copy the data
2731 * @nr_segs: number of segments in vector
2732 * @offset: offset into file of the first iovec
2733 * @copied: used to return the amount of data copied to the iov
2734 *
2735 * This function copies data from a list of pages in a readdata response into
2736 * an array of iovecs. It will first calculate where the data should go
2737 * based on the info in the readdata and then copy the data into that spot.
2738 */
2739static ssize_t
2740cifs_readdata_to_iov(struct cifs_readdata *rdata, const struct iovec *iov,
2741 unsigned long nr_segs, loff_t offset, ssize_t *copied)
2742{
2743 int rc = 0;
2744 struct iov_iter ii;
2745 size_t pos = rdata->offset - offset;
1c892549
JL
2746 ssize_t remaining = rdata->bytes;
2747 unsigned char *pdata;
c5fab6f4 2748 unsigned int i;
1c892549
JL
2749
2750 /* set up iov_iter and advance to the correct offset */
2751 iov_iter_init(&ii, iov, nr_segs, iov_length(iov, nr_segs), 0);
2752 iov_iter_advance(&ii, pos);
2753
2754 *copied = 0;
c5fab6f4 2755 for (i = 0; i < rdata->nr_pages; i++) {
1c892549 2756 ssize_t copy;
c5fab6f4 2757 struct page *page = rdata->pages[i];
1c892549
JL
2758
2759 /* copy a whole page or whatever's left */
2760 copy = min_t(ssize_t, remaining, PAGE_SIZE);
2761
2762 /* ...but limit it to whatever space is left in the iov */
2763 copy = min_t(ssize_t, copy, iov_iter_count(&ii));
2764
2765 /* go while there's data to be copied and no errors */
2766 if (copy && !rc) {
2767 pdata = kmap(page);
2768 rc = memcpy_toiovecend(ii.iov, pdata, ii.iov_offset,
2769 (int)copy);
2770 kunmap(page);
2771 if (!rc) {
2772 *copied += copy;
2773 remaining -= copy;
2774 iov_iter_advance(&ii, copy);
2775 }
2776 }
1c892549
JL
2777 }
2778
2779 return rc;
2780}
2781
2782static void
2783cifs_uncached_readv_complete(struct work_struct *work)
2784{
2785 struct cifs_readdata *rdata = container_of(work,
2786 struct cifs_readdata, work);
1c892549
JL
2787
2788 complete(&rdata->done);
2789 kref_put(&rdata->refcount, cifs_uncached_readdata_release);
2790}
2791
2792static int
8321fec4
JL
2793cifs_uncached_read_into_pages(struct TCP_Server_Info *server,
2794 struct cifs_readdata *rdata, unsigned int len)
1c892549 2795{
8321fec4 2796 int total_read = 0, result = 0;
c5fab6f4
JL
2797 unsigned int i;
2798 unsigned int nr_pages = rdata->nr_pages;
8321fec4 2799 struct kvec iov;
1c892549 2800
8321fec4 2801 rdata->tailsz = PAGE_SIZE;
c5fab6f4
JL
2802 for (i = 0; i < nr_pages; i++) {
2803 struct page *page = rdata->pages[i];
2804
8321fec4 2805 if (len >= PAGE_SIZE) {
1c892549 2806 /* enough data to fill the page */
8321fec4
JL
2807 iov.iov_base = kmap(page);
2808 iov.iov_len = PAGE_SIZE;
f96637be
JP
2809 cifs_dbg(FYI, "%u: iov_base=%p iov_len=%zu\n",
2810 i, iov.iov_base, iov.iov_len);
8321fec4
JL
2811 len -= PAGE_SIZE;
2812 } else if (len > 0) {
1c892549 2813 /* enough for partial page, fill and zero the rest */
8321fec4
JL
2814 iov.iov_base = kmap(page);
2815 iov.iov_len = len;
f96637be
JP
2816 cifs_dbg(FYI, "%u: iov_base=%p iov_len=%zu\n",
2817 i, iov.iov_base, iov.iov_len);
8321fec4
JL
2818 memset(iov.iov_base + len, '\0', PAGE_SIZE - len);
2819 rdata->tailsz = len;
2820 len = 0;
1c892549
JL
2821 } else {
2822 /* no need to hold page hostage */
c5fab6f4
JL
2823 rdata->pages[i] = NULL;
2824 rdata->nr_pages--;
1c892549 2825 put_page(page);
8321fec4 2826 continue;
1c892549 2827 }
8321fec4
JL
2828
2829 result = cifs_readv_from_socket(server, &iov, 1, iov.iov_len);
2830 kunmap(page);
2831 if (result < 0)
2832 break;
2833
2834 total_read += result;
1c892549
JL
2835 }
2836
8321fec4 2837 return total_read > 0 ? total_read : result;
1c892549
JL
2838}
2839
a70307ee
PS
2840static ssize_t
2841cifs_iovec_read(struct file *file, const struct iovec *iov,
2842 unsigned long nr_segs, loff_t *poffset)
1da177e4 2843{
1c892549 2844 ssize_t rc;
a70307ee 2845 size_t len, cur_len;
1c892549
JL
2846 ssize_t total_read = 0;
2847 loff_t offset = *poffset;
2848 unsigned int npages;
1da177e4 2849 struct cifs_sb_info *cifs_sb;
1c892549 2850 struct cifs_tcon *tcon;
1da177e4 2851 struct cifsFileInfo *open_file;
1c892549
JL
2852 struct cifs_readdata *rdata, *tmp;
2853 struct list_head rdata_list;
2854 pid_t pid;
a70307ee
PS
2855
2856 if (!nr_segs)
2857 return 0;
2858
2859 len = iov_length(iov, nr_segs);
2860 if (!len)
2861 return 0;
1da177e4 2862
1c892549 2863 INIT_LIST_HEAD(&rdata_list);
e6a00296 2864 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
c21dfb69 2865 open_file = file->private_data;
1c892549 2866 tcon = tlink_tcon(open_file->tlink);
1da177e4 2867
fc9c5966
PS
2868 if (!tcon->ses->server->ops->async_readv)
2869 return -ENOSYS;
2870
d4ffff1f
PS
2871 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
2872 pid = open_file->pid;
2873 else
2874 pid = current->tgid;
2875
ad7a2926 2876 if ((file->f_flags & O_ACCMODE) == O_WRONLY)
f96637be 2877 cifs_dbg(FYI, "attempting read on write only file instance\n");
ad7a2926 2878
1c892549
JL
2879 do {
2880 cur_len = min_t(const size_t, len - total_read, cifs_sb->rsize);
2881 npages = DIV_ROUND_UP(cur_len, PAGE_SIZE);
a70307ee 2882
1c892549
JL
2883 /* allocate a readdata struct */
2884 rdata = cifs_readdata_alloc(npages,
2885 cifs_uncached_readv_complete);
2886 if (!rdata) {
2887 rc = -ENOMEM;
2888 goto error;
1da177e4 2889 }
a70307ee 2890
c5fab6f4 2891 rc = cifs_read_allocate_pages(rdata, npages);
1c892549
JL
2892 if (rc)
2893 goto error;
2894
2895 rdata->cfile = cifsFileInfo_get(open_file);
c5fab6f4 2896 rdata->nr_pages = npages;
1c892549
JL
2897 rdata->offset = offset;
2898 rdata->bytes = cur_len;
2899 rdata->pid = pid;
8321fec4
JL
2900 rdata->pagesz = PAGE_SIZE;
2901 rdata->read_into_pages = cifs_uncached_read_into_pages;
1c892549
JL
2902
2903 rc = cifs_retry_async_readv(rdata);
2904error:
2905 if (rc) {
2906 kref_put(&rdata->refcount,
2907 cifs_uncached_readdata_release);
2908 break;
2909 }
2910
2911 list_add_tail(&rdata->list, &rdata_list);
2912 offset += cur_len;
2913 len -= cur_len;
2914 } while (len > 0);
2915
2916 /* if at least one read request send succeeded, then reset rc */
2917 if (!list_empty(&rdata_list))
2918 rc = 0;
2919
2920 /* the loop below should proceed in the order of increasing offsets */
2921restart_loop:
2922 list_for_each_entry_safe(rdata, tmp, &rdata_list, list) {
2923 if (!rc) {
2924 ssize_t copied;
2925
2926 /* FIXME: freezable sleep too? */
2927 rc = wait_for_completion_killable(&rdata->done);
2928 if (rc)
2929 rc = -EINTR;
2930 else if (rdata->result)
2931 rc = rdata->result;
2932 else {
2933 rc = cifs_readdata_to_iov(rdata, iov,
2934 nr_segs, *poffset,
2935 &copied);
2936 total_read += copied;
2937 }
2938
2939 /* resend call if it's a retryable error */
2940 if (rc == -EAGAIN) {
2941 rc = cifs_retry_async_readv(rdata);
2942 goto restart_loop;
1da177e4 2943 }
1da177e4 2944 }
1c892549
JL
2945 list_del_init(&rdata->list);
2946 kref_put(&rdata->refcount, cifs_uncached_readdata_release);
1da177e4 2947 }
a70307ee 2948
1c892549
JL
2949 cifs_stats_bytes_read(tcon, total_read);
2950 *poffset += total_read;
2951
09a4707e
PS
2952 /* mask nodata case */
2953 if (rc == -ENODATA)
2954 rc = 0;
2955
1c892549 2956 return total_read ? total_read : rc;
1da177e4
LT
2957}
2958
0b81c1c4 2959ssize_t cifs_user_readv(struct kiocb *iocb, const struct iovec *iov,
a70307ee
PS
2960 unsigned long nr_segs, loff_t pos)
2961{
2962 ssize_t read;
2963
2964 read = cifs_iovec_read(iocb->ki_filp, iov, nr_segs, &pos);
2965 if (read > 0)
2966 iocb->ki_pos = pos;
2967
2968 return read;
2969}
2970
579f9053
PS
2971ssize_t
2972cifs_strict_readv(struct kiocb *iocb, const struct iovec *iov,
2973 unsigned long nr_segs, loff_t pos)
a70307ee 2974{
496ad9aa 2975 struct inode *inode = file_inode(iocb->ki_filp);
579f9053
PS
2976 struct cifsInodeInfo *cinode = CIFS_I(inode);
2977 struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
2978 struct cifsFileInfo *cfile = (struct cifsFileInfo *)
2979 iocb->ki_filp->private_data;
2980 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
2981 int rc = -EACCES;
a70307ee
PS
2982
2983 /*
2984 * In strict cache mode we need to read from the server all the time
2985 * if we don't have level II oplock because the server can delay mtime
2986 * change - so we can't make a decision about inode invalidating.
2987 * And we can also fail with pagereading if there are mandatory locks
2988 * on pages affected by this read but not on the region from pos to
2989 * pos+len-1.
2990 */
18cceb6a 2991 if (!CIFS_CACHE_READ(cinode))
579f9053 2992 return cifs_user_readv(iocb, iov, nr_segs, pos);
a70307ee 2993
579f9053
PS
2994 if (cap_unix(tcon->ses) &&
2995 (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
2996 ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
2997 return generic_file_aio_read(iocb, iov, nr_segs, pos);
2998
2999 /*
3000 * We need to hold the sem to be sure nobody modifies lock list
3001 * with a brlock that prevents reading.
3002 */
3003 down_read(&cinode->lock_sem);
3004 if (!cifs_find_lock_conflict(cfile, pos, iov_length(iov, nr_segs),
3005 tcon->ses->server->vals->shared_lock_type,
081c0414 3006 NULL, CIFS_READ_OP))
579f9053
PS
3007 rc = generic_file_aio_read(iocb, iov, nr_segs, pos);
3008 up_read(&cinode->lock_sem);
3009 return rc;
a70307ee 3010}
1da177e4 3011
f9c6e234
PS
3012static ssize_t
3013cifs_read(struct file *file, char *read_data, size_t read_size, loff_t *offset)
1da177e4
LT
3014{
3015 int rc = -EACCES;
3016 unsigned int bytes_read = 0;
3017 unsigned int total_read;
3018 unsigned int current_read_size;
5eba8ab3 3019 unsigned int rsize;
1da177e4 3020 struct cifs_sb_info *cifs_sb;
29e20f9c 3021 struct cifs_tcon *tcon;
f9c6e234 3022 struct TCP_Server_Info *server;
6d5786a3 3023 unsigned int xid;
f9c6e234 3024 char *cur_offset;
1da177e4 3025 struct cifsFileInfo *open_file;
d4ffff1f 3026 struct cifs_io_parms io_parms;
ec637e3f 3027 int buf_type = CIFS_NO_BUFFER;
d4ffff1f 3028 __u32 pid;
1da177e4 3029
6d5786a3 3030 xid = get_xid();
e6a00296 3031 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
1da177e4 3032
5eba8ab3
JL
3033 /* FIXME: set up handlers for larger reads and/or convert to async */
3034 rsize = min_t(unsigned int, cifs_sb->rsize, CIFSMaxBufSize);
3035
1da177e4 3036 if (file->private_data == NULL) {
0f3bc09e 3037 rc = -EBADF;
6d5786a3 3038 free_xid(xid);
0f3bc09e 3039 return rc;
1da177e4 3040 }
c21dfb69 3041 open_file = file->private_data;
29e20f9c 3042 tcon = tlink_tcon(open_file->tlink);
f9c6e234
PS
3043 server = tcon->ses->server;
3044
3045 if (!server->ops->sync_read) {
3046 free_xid(xid);
3047 return -ENOSYS;
3048 }
1da177e4 3049
d4ffff1f
PS
3050 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
3051 pid = open_file->pid;
3052 else
3053 pid = current->tgid;
3054
1da177e4 3055 if ((file->f_flags & O_ACCMODE) == O_WRONLY)
f96637be 3056 cifs_dbg(FYI, "attempting read on write only file instance\n");
1da177e4 3057
f9c6e234
PS
3058 for (total_read = 0, cur_offset = read_data; read_size > total_read;
3059 total_read += bytes_read, cur_offset += bytes_read) {
5eba8ab3 3060 current_read_size = min_t(uint, read_size - total_read, rsize);
29e20f9c
PS
3061 /*
3062 * For windows me and 9x we do not want to request more than it
3063 * negotiated since it will refuse the read then.
3064 */
3065 if ((tcon->ses) && !(tcon->ses->capabilities &
3066 tcon->ses->server->vals->cap_large_files)) {
7748dd6e 3067 current_read_size = min_t(uint, current_read_size,
c974befa 3068 CIFSMaxBufSize);
f9f5c817 3069 }
1da177e4
LT
3070 rc = -EAGAIN;
3071 while (rc == -EAGAIN) {
cdff08e7 3072 if (open_file->invalidHandle) {
15886177 3073 rc = cifs_reopen_file(open_file, true);
1da177e4
LT
3074 if (rc != 0)
3075 break;
3076 }
d4ffff1f 3077 io_parms.pid = pid;
29e20f9c 3078 io_parms.tcon = tcon;
f9c6e234 3079 io_parms.offset = *offset;
d4ffff1f 3080 io_parms.length = current_read_size;
f9c6e234
PS
3081 rc = server->ops->sync_read(xid, open_file, &io_parms,
3082 &bytes_read, &cur_offset,
3083 &buf_type);
1da177e4
LT
3084 }
3085 if (rc || (bytes_read == 0)) {
3086 if (total_read) {
3087 break;
3088 } else {
6d5786a3 3089 free_xid(xid);
1da177e4
LT
3090 return rc;
3091 }
3092 } else {
29e20f9c 3093 cifs_stats_bytes_read(tcon, total_read);
f9c6e234 3094 *offset += bytes_read;
1da177e4
LT
3095 }
3096 }
6d5786a3 3097 free_xid(xid);
1da177e4
LT
3098 return total_read;
3099}
3100
ca83ce3d
JL
3101/*
3102 * If the page is mmap'ed into a process' page tables, then we need to make
3103 * sure that it doesn't change while being written back.
3104 */
3105static int
3106cifs_page_mkwrite(struct vm_area_struct *vma, struct vm_fault *vmf)
3107{
3108 struct page *page = vmf->page;
3109
3110 lock_page(page);
3111 return VM_FAULT_LOCKED;
3112}
3113
3114static struct vm_operations_struct cifs_file_vm_ops = {
3115 .fault = filemap_fault,
3116 .page_mkwrite = cifs_page_mkwrite,
0b173bc4 3117 .remap_pages = generic_file_remap_pages,
ca83ce3d
JL
3118};
3119
7a6a19b1
PS
3120int cifs_file_strict_mmap(struct file *file, struct vm_area_struct *vma)
3121{
3122 int rc, xid;
496ad9aa 3123 struct inode *inode = file_inode(file);
7a6a19b1 3124
6d5786a3 3125 xid = get_xid();
7a6a19b1 3126
18cceb6a 3127 if (!CIFS_CACHE_READ(CIFS_I(inode))) {
6feb9891
PS
3128 rc = cifs_invalidate_mapping(inode);
3129 if (rc)
3130 return rc;
3131 }
7a6a19b1
PS
3132
3133 rc = generic_file_mmap(file, vma);
ca83ce3d
JL
3134 if (rc == 0)
3135 vma->vm_ops = &cifs_file_vm_ops;
6d5786a3 3136 free_xid(xid);
7a6a19b1
PS
3137 return rc;
3138}
3139
1da177e4
LT
3140int cifs_file_mmap(struct file *file, struct vm_area_struct *vma)
3141{
1da177e4
LT
3142 int rc, xid;
3143
6d5786a3 3144 xid = get_xid();
abab095d 3145 rc = cifs_revalidate_file(file);
1da177e4 3146 if (rc) {
f96637be
JP
3147 cifs_dbg(FYI, "Validation prior to mmap failed, error=%d\n",
3148 rc);
6d5786a3 3149 free_xid(xid);
1da177e4
LT
3150 return rc;
3151 }
3152 rc = generic_file_mmap(file, vma);
ca83ce3d
JL
3153 if (rc == 0)
3154 vma->vm_ops = &cifs_file_vm_ops;
6d5786a3 3155 free_xid(xid);
1da177e4
LT
3156 return rc;
3157}
3158
0471ca3f
JL
3159static void
3160cifs_readv_complete(struct work_struct *work)
3161{
c5fab6f4 3162 unsigned int i;
0471ca3f
JL
3163 struct cifs_readdata *rdata = container_of(work,
3164 struct cifs_readdata, work);
0471ca3f 3165
c5fab6f4
JL
3166 for (i = 0; i < rdata->nr_pages; i++) {
3167 struct page *page = rdata->pages[i];
3168
0471ca3f
JL
3169 lru_cache_add_file(page);
3170
3171 if (rdata->result == 0) {
0471ca3f
JL
3172 flush_dcache_page(page);
3173 SetPageUptodate(page);
3174 }
3175
3176 unlock_page(page);
3177
3178 if (rdata->result == 0)
3179 cifs_readpage_to_fscache(rdata->mapping->host, page);
3180
3181 page_cache_release(page);
c5fab6f4 3182 rdata->pages[i] = NULL;
0471ca3f 3183 }
6993f74a 3184 kref_put(&rdata->refcount, cifs_readdata_release);
0471ca3f
JL
3185}
3186
8d5ce4d2 3187static int
8321fec4
JL
3188cifs_readpages_read_into_pages(struct TCP_Server_Info *server,
3189 struct cifs_readdata *rdata, unsigned int len)
8d5ce4d2 3190{
8321fec4 3191 int total_read = 0, result = 0;
c5fab6f4 3192 unsigned int i;
8d5ce4d2
JL
3193 u64 eof;
3194 pgoff_t eof_index;
c5fab6f4 3195 unsigned int nr_pages = rdata->nr_pages;
8321fec4 3196 struct kvec iov;
8d5ce4d2
JL
3197
3198 /* determine the eof that the server (probably) has */
3199 eof = CIFS_I(rdata->mapping->host)->server_eof;
3200 eof_index = eof ? (eof - 1) >> PAGE_CACHE_SHIFT : 0;
f96637be 3201 cifs_dbg(FYI, "eof=%llu eof_index=%lu\n", eof, eof_index);
8d5ce4d2 3202
8321fec4 3203 rdata->tailsz = PAGE_CACHE_SIZE;
c5fab6f4
JL
3204 for (i = 0; i < nr_pages; i++) {
3205 struct page *page = rdata->pages[i];
3206
8321fec4 3207 if (len >= PAGE_CACHE_SIZE) {
8d5ce4d2 3208 /* enough data to fill the page */
8321fec4
JL
3209 iov.iov_base = kmap(page);
3210 iov.iov_len = PAGE_CACHE_SIZE;
f96637be
JP
3211 cifs_dbg(FYI, "%u: idx=%lu iov_base=%p iov_len=%zu\n",
3212 i, page->index, iov.iov_base, iov.iov_len);
8321fec4
JL
3213 len -= PAGE_CACHE_SIZE;
3214 } else if (len > 0) {
8d5ce4d2 3215 /* enough for partial page, fill and zero the rest */
8321fec4
JL
3216 iov.iov_base = kmap(page);
3217 iov.iov_len = len;
f96637be
JP
3218 cifs_dbg(FYI, "%u: idx=%lu iov_base=%p iov_len=%zu\n",
3219 i, page->index, iov.iov_base, iov.iov_len);
8321fec4
JL
3220 memset(iov.iov_base + len,
3221 '\0', PAGE_CACHE_SIZE - len);
3222 rdata->tailsz = len;
3223 len = 0;
8d5ce4d2
JL
3224 } else if (page->index > eof_index) {
3225 /*
3226 * The VFS will not try to do readahead past the
3227 * i_size, but it's possible that we have outstanding
3228 * writes with gaps in the middle and the i_size hasn't
3229 * caught up yet. Populate those with zeroed out pages
3230 * to prevent the VFS from repeatedly attempting to
3231 * fill them until the writes are flushed.
3232 */
3233 zero_user(page, 0, PAGE_CACHE_SIZE);
8d5ce4d2
JL
3234 lru_cache_add_file(page);
3235 flush_dcache_page(page);
3236 SetPageUptodate(page);
3237 unlock_page(page);
3238 page_cache_release(page);
c5fab6f4
JL
3239 rdata->pages[i] = NULL;
3240 rdata->nr_pages--;
8321fec4 3241 continue;
8d5ce4d2
JL
3242 } else {
3243 /* no need to hold page hostage */
8d5ce4d2
JL
3244 lru_cache_add_file(page);
3245 unlock_page(page);
3246 page_cache_release(page);
c5fab6f4
JL
3247 rdata->pages[i] = NULL;
3248 rdata->nr_pages--;
8321fec4 3249 continue;
8d5ce4d2 3250 }
8321fec4
JL
3251
3252 result = cifs_readv_from_socket(server, &iov, 1, iov.iov_len);
3253 kunmap(page);
3254 if (result < 0)
3255 break;
3256
3257 total_read += result;
8d5ce4d2
JL
3258 }
3259
8321fec4 3260 return total_read > 0 ? total_read : result;
8d5ce4d2
JL
3261}
3262
1da177e4
LT
3263static int cifs_readpages(struct file *file, struct address_space *mapping,
3264 struct list_head *page_list, unsigned num_pages)
3265{
690c5e31
JL
3266 int rc;
3267 struct list_head tmplist;
3268 struct cifsFileInfo *open_file = file->private_data;
3269 struct cifs_sb_info *cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
3270 unsigned int rsize = cifs_sb->rsize;
3271 pid_t pid;
1da177e4 3272
690c5e31
JL
3273 /*
3274 * Give up immediately if rsize is too small to read an entire page.
3275 * The VFS will fall back to readpage. We should never reach this
3276 * point however since we set ra_pages to 0 when the rsize is smaller
3277 * than a cache page.
3278 */
3279 if (unlikely(rsize < PAGE_CACHE_SIZE))
3280 return 0;
bfa0d75a 3281
56698236
SJ
3282 /*
3283 * Reads as many pages as possible from fscache. Returns -ENOBUFS
3284 * immediately if the cookie is negative
54afa990
DH
3285 *
3286 * After this point, every page in the list might have PG_fscache set,
3287 * so we will need to clean that up off of every page we don't use.
56698236
SJ
3288 */
3289 rc = cifs_readpages_from_fscache(mapping->host, mapping, page_list,
3290 &num_pages);
3291 if (rc == 0)
690c5e31 3292 return rc;
56698236 3293
d4ffff1f
PS
3294 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
3295 pid = open_file->pid;
3296 else
3297 pid = current->tgid;
3298
690c5e31
JL
3299 rc = 0;
3300 INIT_LIST_HEAD(&tmplist);
1da177e4 3301
f96637be
JP
3302 cifs_dbg(FYI, "%s: file=%p mapping=%p num_pages=%u\n",
3303 __func__, file, mapping, num_pages);
690c5e31
JL
3304
3305 /*
3306 * Start with the page at end of list and move it to private
3307 * list. Do the same with any following pages until we hit
3308 * the rsize limit, hit an index discontinuity, or run out of
3309 * pages. Issue the async read and then start the loop again
3310 * until the list is empty.
3311 *
3312 * Note that list order is important. The page_list is in
3313 * the order of declining indexes. When we put the pages in
3314 * the rdata->pages, then we want them in increasing order.
3315 */
3316 while (!list_empty(page_list)) {
c5fab6f4 3317 unsigned int i;
690c5e31
JL
3318 unsigned int bytes = PAGE_CACHE_SIZE;
3319 unsigned int expected_index;
3320 unsigned int nr_pages = 1;
3321 loff_t offset;
3322 struct page *page, *tpage;
3323 struct cifs_readdata *rdata;
1da177e4
LT
3324
3325 page = list_entry(page_list->prev, struct page, lru);
690c5e31
JL
3326
3327 /*
3328 * Lock the page and put it in the cache. Since no one else
3329 * should have access to this page, we're safe to simply set
3330 * PG_locked without checking it first.
3331 */
3332 __set_page_locked(page);
3333 rc = add_to_page_cache_locked(page, mapping,
3334 page->index, GFP_KERNEL);
3335
3336 /* give up if we can't stick it in the cache */
3337 if (rc) {
3338 __clear_page_locked(page);
3339 break;
3340 }
3341
3342 /* move first page to the tmplist */
1da177e4 3343 offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
690c5e31 3344 list_move_tail(&page->lru, &tmplist);
1da177e4 3345
690c5e31
JL
3346 /* now try and add more pages onto the request */
3347 expected_index = page->index + 1;
3348 list_for_each_entry_safe_reverse(page, tpage, page_list, lru) {
3349 /* discontinuity ? */
3350 if (page->index != expected_index)
fb8c4b14 3351 break;
690c5e31
JL
3352
3353 /* would this page push the read over the rsize? */
3354 if (bytes + PAGE_CACHE_SIZE > rsize)
3355 break;
3356
3357 __set_page_locked(page);
3358 if (add_to_page_cache_locked(page, mapping,
3359 page->index, GFP_KERNEL)) {
3360 __clear_page_locked(page);
3361 break;
3362 }
3363 list_move_tail(&page->lru, &tmplist);
3364 bytes += PAGE_CACHE_SIZE;
3365 expected_index++;
3366 nr_pages++;
1da177e4 3367 }
690c5e31 3368
0471ca3f 3369 rdata = cifs_readdata_alloc(nr_pages, cifs_readv_complete);
690c5e31
JL
3370 if (!rdata) {
3371 /* best to give up if we're out of mem */
3372 list_for_each_entry_safe(page, tpage, &tmplist, lru) {
3373 list_del(&page->lru);
3374 lru_cache_add_file(page);
3375 unlock_page(page);
3376 page_cache_release(page);
3377 }
3378 rc = -ENOMEM;
3379 break;
3380 }
3381
6993f74a 3382 rdata->cfile = cifsFileInfo_get(open_file);
690c5e31
JL
3383 rdata->mapping = mapping;
3384 rdata->offset = offset;
3385 rdata->bytes = bytes;
3386 rdata->pid = pid;
8321fec4
JL
3387 rdata->pagesz = PAGE_CACHE_SIZE;
3388 rdata->read_into_pages = cifs_readpages_read_into_pages;
c5fab6f4
JL
3389
3390 list_for_each_entry_safe(page, tpage, &tmplist, lru) {
3391 list_del(&page->lru);
3392 rdata->pages[rdata->nr_pages++] = page;
3393 }
690c5e31 3394
2a1bb138 3395 rc = cifs_retry_async_readv(rdata);
690c5e31 3396 if (rc != 0) {
c5fab6f4
JL
3397 for (i = 0; i < rdata->nr_pages; i++) {
3398 page = rdata->pages[i];
690c5e31
JL
3399 lru_cache_add_file(page);
3400 unlock_page(page);
3401 page_cache_release(page);
1da177e4 3402 }
6993f74a 3403 kref_put(&rdata->refcount, cifs_readdata_release);
1da177e4
LT
3404 break;
3405 }
6993f74a
JL
3406
3407 kref_put(&rdata->refcount, cifs_readdata_release);
1da177e4
LT
3408 }
3409
54afa990
DH
3410 /* Any pages that have been shown to fscache but didn't get added to
3411 * the pagecache must be uncached before they get returned to the
3412 * allocator.
3413 */
3414 cifs_fscache_readpages_cancel(mapping->host, page_list);
1da177e4
LT
3415 return rc;
3416}
3417
a9e9b7bc
SP
3418/*
3419 * cifs_readpage_worker must be called with the page pinned
3420 */
1da177e4
LT
3421static int cifs_readpage_worker(struct file *file, struct page *page,
3422 loff_t *poffset)
3423{
3424 char *read_data;
3425 int rc;
3426
56698236 3427 /* Is the page cached? */
496ad9aa 3428 rc = cifs_readpage_from_fscache(file_inode(file), page);
56698236
SJ
3429 if (rc == 0)
3430 goto read_complete;
3431
1da177e4
LT
3432 read_data = kmap(page);
3433 /* for reads over a certain size could initiate async read ahead */
fb8c4b14 3434
1da177e4 3435 rc = cifs_read(file, read_data, PAGE_CACHE_SIZE, poffset);
fb8c4b14 3436
1da177e4
LT
3437 if (rc < 0)
3438 goto io_error;
3439 else
f96637be 3440 cifs_dbg(FYI, "Bytes read %d\n", rc);
fb8c4b14 3441
496ad9aa
AV
3442 file_inode(file)->i_atime =
3443 current_fs_time(file_inode(file)->i_sb);
fb8c4b14 3444
1da177e4
LT
3445 if (PAGE_CACHE_SIZE > rc)
3446 memset(read_data + rc, 0, PAGE_CACHE_SIZE - rc);
3447
3448 flush_dcache_page(page);
3449 SetPageUptodate(page);
9dc06558
SJ
3450
3451 /* send this page to the cache */
496ad9aa 3452 cifs_readpage_to_fscache(file_inode(file), page);
9dc06558 3453
1da177e4 3454 rc = 0;
fb8c4b14 3455
1da177e4 3456io_error:
fb8c4b14 3457 kunmap(page);
466bd31b 3458 unlock_page(page);
56698236
SJ
3459
3460read_complete:
1da177e4
LT
3461 return rc;
3462}
3463
3464static int cifs_readpage(struct file *file, struct page *page)
3465{
3466 loff_t offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
3467 int rc = -EACCES;
6d5786a3 3468 unsigned int xid;
1da177e4 3469
6d5786a3 3470 xid = get_xid();
1da177e4
LT
3471
3472 if (file->private_data == NULL) {
0f3bc09e 3473 rc = -EBADF;
6d5786a3 3474 free_xid(xid);
0f3bc09e 3475 return rc;
1da177e4
LT
3476 }
3477
f96637be 3478 cifs_dbg(FYI, "readpage %p at offset %d 0x%x\n",
b6b38f70 3479 page, (int)offset, (int)offset);
1da177e4
LT
3480
3481 rc = cifs_readpage_worker(file, page, &offset);
3482
6d5786a3 3483 free_xid(xid);
1da177e4
LT
3484 return rc;
3485}
3486
a403a0a3
SF
3487static int is_inode_writable(struct cifsInodeInfo *cifs_inode)
3488{
3489 struct cifsFileInfo *open_file;
3490
4477288a 3491 spin_lock(&cifs_file_list_lock);
a403a0a3 3492 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
2e396b83 3493 if (OPEN_FMODE(open_file->f_flags) & FMODE_WRITE) {
4477288a 3494 spin_unlock(&cifs_file_list_lock);
a403a0a3
SF
3495 return 1;
3496 }
3497 }
4477288a 3498 spin_unlock(&cifs_file_list_lock);
a403a0a3
SF
3499 return 0;
3500}
3501
1da177e4
LT
3502/* We do not want to update the file size from server for inodes
3503 open for write - to avoid races with writepage extending
3504 the file - in the future we could consider allowing
fb8c4b14 3505 refreshing the inode only on increases in the file size
1da177e4
LT
3506 but this is tricky to do without racing with writebehind
3507 page caching in the current Linux kernel design */
4b18f2a9 3508bool is_size_safe_to_change(struct cifsInodeInfo *cifsInode, __u64 end_of_file)
1da177e4 3509{
a403a0a3 3510 if (!cifsInode)
4b18f2a9 3511 return true;
50c2f753 3512
a403a0a3
SF
3513 if (is_inode_writable(cifsInode)) {
3514 /* This inode is open for write at least once */
c32a0b68
SF
3515 struct cifs_sb_info *cifs_sb;
3516
c32a0b68 3517 cifs_sb = CIFS_SB(cifsInode->vfs_inode.i_sb);
ad7a2926 3518 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_DIRECT_IO) {
fb8c4b14 3519 /* since no page cache to corrupt on directio
c32a0b68 3520 we can change size safely */
4b18f2a9 3521 return true;
c32a0b68
SF
3522 }
3523
fb8c4b14 3524 if (i_size_read(&cifsInode->vfs_inode) < end_of_file)
4b18f2a9 3525 return true;
7ba52631 3526
4b18f2a9 3527 return false;
23e7dd7d 3528 } else
4b18f2a9 3529 return true;
1da177e4
LT
3530}
3531
d9414774
NP
3532static int cifs_write_begin(struct file *file, struct address_space *mapping,
3533 loff_t pos, unsigned len, unsigned flags,
3534 struct page **pagep, void **fsdata)
1da177e4 3535{
466bd31b 3536 int oncethru = 0;
d9414774
NP
3537 pgoff_t index = pos >> PAGE_CACHE_SHIFT;
3538 loff_t offset = pos & (PAGE_CACHE_SIZE - 1);
a98ee8c1
JL
3539 loff_t page_start = pos & PAGE_MASK;
3540 loff_t i_size;
3541 struct page *page;
3542 int rc = 0;
d9414774 3543
f96637be 3544 cifs_dbg(FYI, "write_begin from %lld len %d\n", (long long)pos, len);
d9414774 3545
466bd31b 3546start:
54566b2c 3547 page = grab_cache_page_write_begin(mapping, index, flags);
a98ee8c1
JL
3548 if (!page) {
3549 rc = -ENOMEM;
3550 goto out;
3551 }
8a236264 3552
a98ee8c1
JL
3553 if (PageUptodate(page))
3554 goto out;
8a236264 3555
a98ee8c1
JL
3556 /*
3557 * If we write a full page it will be up to date, no need to read from
3558 * the server. If the write is short, we'll end up doing a sync write
3559 * instead.
3560 */
3561 if (len == PAGE_CACHE_SIZE)
3562 goto out;
8a236264 3563
a98ee8c1
JL
3564 /*
3565 * optimize away the read when we have an oplock, and we're not
3566 * expecting to use any of the data we'd be reading in. That
3567 * is, when the page lies beyond the EOF, or straddles the EOF
3568 * and the write will cover all of the existing data.
3569 */
18cceb6a 3570 if (CIFS_CACHE_READ(CIFS_I(mapping->host))) {
a98ee8c1
JL
3571 i_size = i_size_read(mapping->host);
3572 if (page_start >= i_size ||
3573 (offset == 0 && (pos + len) >= i_size)) {
3574 zero_user_segments(page, 0, offset,
3575 offset + len,
3576 PAGE_CACHE_SIZE);
3577 /*
3578 * PageChecked means that the parts of the page
3579 * to which we're not writing are considered up
3580 * to date. Once the data is copied to the
3581 * page, it can be set uptodate.
3582 */
3583 SetPageChecked(page);
3584 goto out;
3585 }
3586 }
d9414774 3587
466bd31b 3588 if ((file->f_flags & O_ACCMODE) != O_WRONLY && !oncethru) {
a98ee8c1
JL
3589 /*
3590 * might as well read a page, it is fast enough. If we get
3591 * an error, we don't need to return it. cifs_write_end will
3592 * do a sync write instead since PG_uptodate isn't set.
3593 */
3594 cifs_readpage_worker(file, page, &page_start);
466bd31b
SP
3595 page_cache_release(page);
3596 oncethru = 1;
3597 goto start;
8a236264
SF
3598 } else {
3599 /* we could try using another file handle if there is one -
3600 but how would we lock it to prevent close of that handle
3601 racing with this read? In any case
d9414774 3602 this will be written out by write_end so is fine */
1da177e4 3603 }
a98ee8c1
JL
3604out:
3605 *pagep = page;
3606 return rc;
1da177e4
LT
3607}
3608
85f2d6b4
SJ
3609static int cifs_release_page(struct page *page, gfp_t gfp)
3610{
3611 if (PagePrivate(page))
3612 return 0;
3613
3614 return cifs_fscache_release_page(page, gfp);
3615}
3616
d47992f8
LC
3617static void cifs_invalidate_page(struct page *page, unsigned int offset,
3618 unsigned int length)
85f2d6b4
SJ
3619{
3620 struct cifsInodeInfo *cifsi = CIFS_I(page->mapping->host);
3621
d47992f8 3622 if (offset == 0 && length == PAGE_CACHE_SIZE)
85f2d6b4
SJ
3623 cifs_fscache_invalidate_page(page, &cifsi->vfs_inode);
3624}
3625
9ad1506b
PS
3626static int cifs_launder_page(struct page *page)
3627{
3628 int rc = 0;
3629 loff_t range_start = page_offset(page);
3630 loff_t range_end = range_start + (loff_t)(PAGE_CACHE_SIZE - 1);
3631 struct writeback_control wbc = {
3632 .sync_mode = WB_SYNC_ALL,
3633 .nr_to_write = 0,
3634 .range_start = range_start,
3635 .range_end = range_end,
3636 };
3637
f96637be 3638 cifs_dbg(FYI, "Launder page: %p\n", page);
9ad1506b
PS
3639
3640 if (clear_page_dirty_for_io(page))
3641 rc = cifs_writepage_locked(page, &wbc);
3642
3643 cifs_fscache_invalidate_page(page, page->mapping->host);
3644 return rc;
3645}
3646
9b646972 3647void cifs_oplock_break(struct work_struct *work)
3bc303c2
JL
3648{
3649 struct cifsFileInfo *cfile = container_of(work, struct cifsFileInfo,
3650 oplock_break);
a5e18bc3 3651 struct inode *inode = cfile->dentry->d_inode;
3bc303c2 3652 struct cifsInodeInfo *cinode = CIFS_I(inode);
95a3f2f3 3653 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
eb4b756b 3654 int rc = 0;
3bc303c2 3655
18cceb6a 3656 if (!CIFS_CACHE_WRITE(cinode) && CIFS_CACHE_READ(cinode) &&
63b7d3a4 3657 cifs_has_mand_locks(cinode)) {
f96637be
JP
3658 cifs_dbg(FYI, "Reset oplock to None for inode=%p due to mand locks\n",
3659 inode);
18cceb6a 3660 cinode->oplock = 0;
63b7d3a4
PS
3661 }
3662
3bc303c2 3663 if (inode && S_ISREG(inode->i_mode)) {
18cceb6a 3664 if (CIFS_CACHE_READ(cinode))
8737c930 3665 break_lease(inode, O_RDONLY);
d54ff732 3666 else
8737c930 3667 break_lease(inode, O_WRONLY);
3bc303c2 3668 rc = filemap_fdatawrite(inode->i_mapping);
18cceb6a 3669 if (!CIFS_CACHE_READ(cinode)) {
eb4b756b
JL
3670 rc = filemap_fdatawait(inode->i_mapping);
3671 mapping_set_error(inode->i_mapping, rc);
03eca704 3672 cifs_invalidate_mapping(inode);
3bc303c2 3673 }
f96637be 3674 cifs_dbg(FYI, "Oplock flush inode %p rc %d\n", inode, rc);
3bc303c2
JL
3675 }
3676
85160e03
PS
3677 rc = cifs_push_locks(cfile);
3678 if (rc)
f96637be 3679 cifs_dbg(VFS, "Push locks rc = %d\n", rc);
85160e03 3680
3bc303c2
JL
3681 /*
3682 * releasing stale oplock after recent reconnect of smb session using
3683 * a now incorrect file handle is not a data integrity issue but do
3684 * not bother sending an oplock release if session to server still is
3685 * disconnected since oplock already released by the server
3686 */
cdff08e7 3687 if (!cfile->oplock_break_cancelled) {
95a3f2f3
PS
3688 rc = tcon->ses->server->ops->oplock_response(tcon, &cfile->fid,
3689 cinode);
f96637be 3690 cifs_dbg(FYI, "Oplock release rc = %d\n", rc);
3bc303c2 3691 }
3bc303c2
JL
3692}
3693
dca69288
SF
3694/*
3695 * The presence of cifs_direct_io() in the address space ops vector
3696 * allowes open() O_DIRECT flags which would have failed otherwise.
3697 *
3698 * In the non-cached mode (mount with cache=none), we shunt off direct read and write requests
3699 * so this method should never be called.
3700 *
3701 * Direct IO is not yet supported in the cached mode.
3702 */
3703static ssize_t
3704cifs_direct_io(int rw, struct kiocb *iocb, const struct iovec *iov,
3705 loff_t pos, unsigned long nr_segs)
3706{
3707 /*
3708 * FIXME
3709 * Eventually need to support direct IO for non forcedirectio mounts
3710 */
3711 return -EINVAL;
3712}
3713
3714
f5e54d6e 3715const struct address_space_operations cifs_addr_ops = {
1da177e4
LT
3716 .readpage = cifs_readpage,
3717 .readpages = cifs_readpages,
3718 .writepage = cifs_writepage,
37c0eb46 3719 .writepages = cifs_writepages,
d9414774
NP
3720 .write_begin = cifs_write_begin,
3721 .write_end = cifs_write_end,
1da177e4 3722 .set_page_dirty = __set_page_dirty_nobuffers,
85f2d6b4 3723 .releasepage = cifs_release_page,
dca69288 3724 .direct_IO = cifs_direct_io,
85f2d6b4 3725 .invalidatepage = cifs_invalidate_page,
9ad1506b 3726 .launder_page = cifs_launder_page,
1da177e4 3727};
273d81d6
DK
3728
3729/*
3730 * cifs_readpages requires the server to support a buffer large enough to
3731 * contain the header plus one complete page of data. Otherwise, we need
3732 * to leave cifs_readpages out of the address space operations.
3733 */
f5e54d6e 3734const struct address_space_operations cifs_addr_ops_smallbuf = {
273d81d6
DK
3735 .readpage = cifs_readpage,
3736 .writepage = cifs_writepage,
3737 .writepages = cifs_writepages,
d9414774
NP
3738 .write_begin = cifs_write_begin,
3739 .write_end = cifs_write_end,
273d81d6 3740 .set_page_dirty = __set_page_dirty_nobuffers,
85f2d6b4
SJ
3741 .releasepage = cifs_release_page,
3742 .invalidatepage = cifs_invalidate_page,
9ad1506b 3743 .launder_page = cifs_launder_page,
273d81d6 3744};
This page took 0.714658 seconds and 5 git commands to generate.