]> git.ipfire.org Git - people/ms/linux.git/blame - fs/cifs/file.c
CIFS: Move protocol specific tcon/tdis code to ops struct
[people/ms/linux.git] / fs / cifs / file.c
CommitLineData
1da177e4
LT
1/*
2 * fs/cifs/file.c
3 *
4 * vfs operations that deal with files
fb8c4b14 5 *
f19159dc 6 * Copyright (C) International Business Machines Corp., 2002,2010
1da177e4 7 * Author(s): Steve French (sfrench@us.ibm.com)
7ee1af76 8 * Jeremy Allison (jra@samba.org)
1da177e4
LT
9 *
10 * This library is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU Lesser General Public License as published
12 * by the Free Software Foundation; either version 2.1 of the License, or
13 * (at your option) any later version.
14 *
15 * This library is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
18 * the GNU Lesser General Public License for more details.
19 *
20 * You should have received a copy of the GNU Lesser General Public License
21 * along with this library; if not, write to the Free Software
22 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 */
24#include <linux/fs.h>
37c0eb46 25#include <linux/backing-dev.h>
1da177e4
LT
26#include <linux/stat.h>
27#include <linux/fcntl.h>
28#include <linux/pagemap.h>
29#include <linux/pagevec.h>
37c0eb46 30#include <linux/writeback.h>
6f88cc2e 31#include <linux/task_io_accounting_ops.h>
23e7dd7d 32#include <linux/delay.h>
3bc303c2 33#include <linux/mount.h>
5a0e3ad6 34#include <linux/slab.h>
690c5e31 35#include <linux/swap.h>
1da177e4
LT
36#include <asm/div64.h>
37#include "cifsfs.h"
38#include "cifspdu.h"
39#include "cifsglob.h"
40#include "cifsproto.h"
41#include "cifs_unicode.h"
42#include "cifs_debug.h"
43#include "cifs_fs_sb.h"
9451a9a5 44#include "fscache.h"
1da177e4 45
1da177e4
LT
46static inline int cifs_convert_flags(unsigned int flags)
47{
48 if ((flags & O_ACCMODE) == O_RDONLY)
49 return GENERIC_READ;
50 else if ((flags & O_ACCMODE) == O_WRONLY)
51 return GENERIC_WRITE;
52 else if ((flags & O_ACCMODE) == O_RDWR) {
53 /* GENERIC_ALL is too much permission to request
54 can cause unnecessary access denied on create */
55 /* return GENERIC_ALL; */
56 return (GENERIC_READ | GENERIC_WRITE);
57 }
58
e10f7b55
JL
59 return (READ_CONTROL | FILE_WRITE_ATTRIBUTES | FILE_READ_ATTRIBUTES |
60 FILE_WRITE_EA | FILE_APPEND_DATA | FILE_WRITE_DATA |
61 FILE_READ_DATA);
7fc8f4e9 62}
e10f7b55 63
608712fe 64static u32 cifs_posix_convert_flags(unsigned int flags)
7fc8f4e9 65{
608712fe 66 u32 posix_flags = 0;
e10f7b55 67
7fc8f4e9 68 if ((flags & O_ACCMODE) == O_RDONLY)
608712fe 69 posix_flags = SMB_O_RDONLY;
7fc8f4e9 70 else if ((flags & O_ACCMODE) == O_WRONLY)
608712fe
JL
71 posix_flags = SMB_O_WRONLY;
72 else if ((flags & O_ACCMODE) == O_RDWR)
73 posix_flags = SMB_O_RDWR;
74
75 if (flags & O_CREAT)
76 posix_flags |= SMB_O_CREAT;
77 if (flags & O_EXCL)
78 posix_flags |= SMB_O_EXCL;
79 if (flags & O_TRUNC)
80 posix_flags |= SMB_O_TRUNC;
81 /* be safe and imply O_SYNC for O_DSYNC */
6b2f3d1f 82 if (flags & O_DSYNC)
608712fe 83 posix_flags |= SMB_O_SYNC;
7fc8f4e9 84 if (flags & O_DIRECTORY)
608712fe 85 posix_flags |= SMB_O_DIRECTORY;
7fc8f4e9 86 if (flags & O_NOFOLLOW)
608712fe 87 posix_flags |= SMB_O_NOFOLLOW;
7fc8f4e9 88 if (flags & O_DIRECT)
608712fe 89 posix_flags |= SMB_O_DIRECT;
7fc8f4e9
SF
90
91 return posix_flags;
1da177e4
LT
92}
93
94static inline int cifs_get_disposition(unsigned int flags)
95{
96 if ((flags & (O_CREAT | O_EXCL)) == (O_CREAT | O_EXCL))
97 return FILE_CREATE;
98 else if ((flags & (O_CREAT | O_TRUNC)) == (O_CREAT | O_TRUNC))
99 return FILE_OVERWRITE_IF;
100 else if ((flags & O_CREAT) == O_CREAT)
101 return FILE_OPEN_IF;
55aa2e09
SF
102 else if ((flags & O_TRUNC) == O_TRUNC)
103 return FILE_OVERWRITE;
1da177e4
LT
104 else
105 return FILE_OPEN;
106}
107
608712fe
JL
108int cifs_posix_open(char *full_path, struct inode **pinode,
109 struct super_block *sb, int mode, unsigned int f_flags,
110 __u32 *poplock, __u16 *pnetfid, int xid)
111{
112 int rc;
113 FILE_UNIX_BASIC_INFO *presp_data;
114 __u32 posix_flags = 0;
115 struct cifs_sb_info *cifs_sb = CIFS_SB(sb);
116 struct cifs_fattr fattr;
117 struct tcon_link *tlink;
96daf2b0 118 struct cifs_tcon *tcon;
608712fe
JL
119
120 cFYI(1, "posix open %s", full_path);
121
122 presp_data = kzalloc(sizeof(FILE_UNIX_BASIC_INFO), GFP_KERNEL);
123 if (presp_data == NULL)
124 return -ENOMEM;
125
126 tlink = cifs_sb_tlink(cifs_sb);
127 if (IS_ERR(tlink)) {
128 rc = PTR_ERR(tlink);
129 goto posix_open_ret;
130 }
131
132 tcon = tlink_tcon(tlink);
133 mode &= ~current_umask();
134
135 posix_flags = cifs_posix_convert_flags(f_flags);
136 rc = CIFSPOSIXCreate(xid, tcon, posix_flags, mode, pnetfid, presp_data,
137 poplock, full_path, cifs_sb->local_nls,
138 cifs_sb->mnt_cifs_flags &
139 CIFS_MOUNT_MAP_SPECIAL_CHR);
140 cifs_put_tlink(tlink);
141
142 if (rc)
143 goto posix_open_ret;
144
145 if (presp_data->Type == cpu_to_le32(-1))
146 goto posix_open_ret; /* open ok, caller does qpathinfo */
147
148 if (!pinode)
149 goto posix_open_ret; /* caller does not need info */
150
151 cifs_unix_basic_to_fattr(&fattr, presp_data, cifs_sb);
152
153 /* get new inode and set it up */
154 if (*pinode == NULL) {
155 cifs_fill_uniqueid(sb, &fattr);
156 *pinode = cifs_iget(sb, &fattr);
157 if (!*pinode) {
158 rc = -ENOMEM;
159 goto posix_open_ret;
160 }
161 } else {
162 cifs_fattr_to_inode(*pinode, &fattr);
163 }
164
165posix_open_ret:
166 kfree(presp_data);
167 return rc;
168}
169
eeb910a6
PS
170static int
171cifs_nt_open(char *full_path, struct inode *inode, struct cifs_sb_info *cifs_sb,
96daf2b0 172 struct cifs_tcon *tcon, unsigned int f_flags, __u32 *poplock,
eeb910a6
PS
173 __u16 *pnetfid, int xid)
174{
175 int rc;
176 int desiredAccess;
177 int disposition;
3d3ea8e6 178 int create_options = CREATE_NOT_DIR;
eeb910a6
PS
179 FILE_ALL_INFO *buf;
180
181 desiredAccess = cifs_convert_flags(f_flags);
182
183/*********************************************************************
184 * open flag mapping table:
185 *
186 * POSIX Flag CIFS Disposition
187 * ---------- ----------------
188 * O_CREAT FILE_OPEN_IF
189 * O_CREAT | O_EXCL FILE_CREATE
190 * O_CREAT | O_TRUNC FILE_OVERWRITE_IF
191 * O_TRUNC FILE_OVERWRITE
192 * none of the above FILE_OPEN
193 *
194 * Note that there is not a direct match between disposition
195 * FILE_SUPERSEDE (ie create whether or not file exists although
196 * O_CREAT | O_TRUNC is similar but truncates the existing
197 * file rather than creating a new file as FILE_SUPERSEDE does
198 * (which uses the attributes / metadata passed in on open call)
199 *?
200 *? O_SYNC is a reasonable match to CIFS writethrough flag
201 *? and the read write flags match reasonably. O_LARGEFILE
202 *? is irrelevant because largefile support is always used
203 *? by this client. Flags O_APPEND, O_DIRECT, O_DIRECTORY,
204 * O_FASYNC, O_NOFOLLOW, O_NONBLOCK need further investigation
205 *********************************************************************/
206
207 disposition = cifs_get_disposition(f_flags);
208
209 /* BB pass O_SYNC flag through on file attributes .. BB */
210
211 buf = kmalloc(sizeof(FILE_ALL_INFO), GFP_KERNEL);
212 if (!buf)
213 return -ENOMEM;
214
3d3ea8e6
SP
215 if (backup_cred(cifs_sb))
216 create_options |= CREATE_OPEN_BACKUP_INTENT;
217
eeb910a6
PS
218 if (tcon->ses->capabilities & CAP_NT_SMBS)
219 rc = CIFSSMBOpen(xid, tcon, full_path, disposition,
3d3ea8e6 220 desiredAccess, create_options, pnetfid, poplock, buf,
eeb910a6
PS
221 cifs_sb->local_nls, cifs_sb->mnt_cifs_flags
222 & CIFS_MOUNT_MAP_SPECIAL_CHR);
223 else
224 rc = SMBLegacyOpen(xid, tcon, full_path, disposition,
225 desiredAccess, CREATE_NOT_DIR, pnetfid, poplock, buf,
226 cifs_sb->local_nls, cifs_sb->mnt_cifs_flags
227 & CIFS_MOUNT_MAP_SPECIAL_CHR);
228
229 if (rc)
230 goto out;
231
232 if (tcon->unix_ext)
233 rc = cifs_get_inode_info_unix(&inode, full_path, inode->i_sb,
234 xid);
235 else
236 rc = cifs_get_inode_info(&inode, full_path, buf, inode->i_sb,
237 xid, pnetfid);
238
239out:
240 kfree(buf);
241 return rc;
242}
243
15ecb436
JL
244struct cifsFileInfo *
245cifs_new_fileinfo(__u16 fileHandle, struct file *file,
246 struct tcon_link *tlink, __u32 oplock)
247{
248 struct dentry *dentry = file->f_path.dentry;
249 struct inode *inode = dentry->d_inode;
250 struct cifsInodeInfo *pCifsInode = CIFS_I(inode);
251 struct cifsFileInfo *pCifsFile;
252
253 pCifsFile = kzalloc(sizeof(struct cifsFileInfo), GFP_KERNEL);
254 if (pCifsFile == NULL)
255 return pCifsFile;
256
5f6dbc9e 257 pCifsFile->count = 1;
15ecb436
JL
258 pCifsFile->netfid = fileHandle;
259 pCifsFile->pid = current->tgid;
260 pCifsFile->uid = current_fsuid();
261 pCifsFile->dentry = dget(dentry);
262 pCifsFile->f_flags = file->f_flags;
263 pCifsFile->invalidHandle = false;
15ecb436
JL
264 pCifsFile->tlink = cifs_get_tlink(tlink);
265 mutex_init(&pCifsFile->fh_mutex);
15ecb436 266 INIT_WORK(&pCifsFile->oplock_break, cifs_oplock_break);
fbd35aca 267 INIT_LIST_HEAD(&pCifsFile->llist);
15ecb436 268
4477288a 269 spin_lock(&cifs_file_list_lock);
15ecb436
JL
270 list_add(&pCifsFile->tlist, &(tlink_tcon(tlink)->openFileList));
271 /* if readable file instance put first in list*/
272 if (file->f_mode & FMODE_READ)
273 list_add(&pCifsFile->flist, &pCifsInode->openFileList);
274 else
275 list_add_tail(&pCifsFile->flist, &pCifsInode->openFileList);
4477288a 276 spin_unlock(&cifs_file_list_lock);
15ecb436 277
c6723628 278 cifs_set_oplock_level(pCifsInode, oplock);
85160e03 279 pCifsInode->can_cache_brlcks = pCifsInode->clientCanCacheAll;
15ecb436
JL
280
281 file->private_data = pCifsFile;
282 return pCifsFile;
283}
284
85160e03
PS
285static void cifs_del_lock_waiters(struct cifsLockInfo *lock);
286
cdff08e7
SF
287/*
288 * Release a reference on the file private data. This may involve closing
5f6dbc9e
JL
289 * the filehandle out on the server. Must be called without holding
290 * cifs_file_list_lock.
cdff08e7 291 */
b33879aa
JL
292void cifsFileInfo_put(struct cifsFileInfo *cifs_file)
293{
e66673e3 294 struct inode *inode = cifs_file->dentry->d_inode;
96daf2b0 295 struct cifs_tcon *tcon = tlink_tcon(cifs_file->tlink);
e66673e3 296 struct cifsInodeInfo *cifsi = CIFS_I(inode);
4f8ba8a0 297 struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
cdff08e7
SF
298 struct cifsLockInfo *li, *tmp;
299
300 spin_lock(&cifs_file_list_lock);
5f6dbc9e 301 if (--cifs_file->count > 0) {
cdff08e7
SF
302 spin_unlock(&cifs_file_list_lock);
303 return;
304 }
305
306 /* remove it from the lists */
307 list_del(&cifs_file->flist);
308 list_del(&cifs_file->tlist);
309
310 if (list_empty(&cifsi->openFileList)) {
311 cFYI(1, "closing last open instance for inode %p",
312 cifs_file->dentry->d_inode);
4f8ba8a0
PS
313
314 /* in strict cache mode we need invalidate mapping on the last
315 close because it may cause a error when we open this file
316 again and get at least level II oplock */
317 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_STRICT_IO)
318 CIFS_I(inode)->invalid_mapping = true;
319
c6723628 320 cifs_set_oplock_level(cifsi, 0);
cdff08e7
SF
321 }
322 spin_unlock(&cifs_file_list_lock);
323
ad635942
JL
324 cancel_work_sync(&cifs_file->oplock_break);
325
cdff08e7
SF
326 if (!tcon->need_reconnect && !cifs_file->invalidHandle) {
327 int xid, rc;
328
329 xid = GetXid();
330 rc = CIFSSMBClose(xid, tcon, cifs_file->netfid);
331 FreeXid(xid);
332 }
333
334 /* Delete any outstanding lock records. We'll lose them when the file
335 * is closed anyway.
336 */
d59dad2b 337 mutex_lock(&cifsi->lock_mutex);
fbd35aca 338 list_for_each_entry_safe(li, tmp, &cifs_file->llist, llist) {
cdff08e7 339 list_del(&li->llist);
85160e03 340 cifs_del_lock_waiters(li);
cdff08e7 341 kfree(li);
b33879aa 342 }
d59dad2b 343 mutex_unlock(&cifsi->lock_mutex);
cdff08e7
SF
344
345 cifs_put_tlink(cifs_file->tlink);
346 dput(cifs_file->dentry);
347 kfree(cifs_file);
b33879aa
JL
348}
349
1da177e4
LT
350int cifs_open(struct inode *inode, struct file *file)
351{
352 int rc = -EACCES;
590a3fe0
JL
353 int xid;
354 __u32 oplock;
1da177e4 355 struct cifs_sb_info *cifs_sb;
96daf2b0 356 struct cifs_tcon *tcon;
7ffec372 357 struct tcon_link *tlink;
6ca9f3ba 358 struct cifsFileInfo *pCifsFile = NULL;
1da177e4 359 char *full_path = NULL;
7e12eddb 360 bool posix_open_ok = false;
1da177e4 361 __u16 netfid;
1da177e4
LT
362
363 xid = GetXid();
364
365 cifs_sb = CIFS_SB(inode->i_sb);
7ffec372
JL
366 tlink = cifs_sb_tlink(cifs_sb);
367 if (IS_ERR(tlink)) {
368 FreeXid(xid);
369 return PTR_ERR(tlink);
370 }
371 tcon = tlink_tcon(tlink);
1da177e4 372
e6a00296 373 full_path = build_path_from_dentry(file->f_path.dentry);
1da177e4 374 if (full_path == NULL) {
0f3bc09e 375 rc = -ENOMEM;
232341ba 376 goto out;
1da177e4
LT
377 }
378
b6b38f70
JP
379 cFYI(1, "inode = 0x%p file flags are 0x%x for %s",
380 inode, file->f_flags, full_path);
276a74a4 381
10b9b98e 382 if (tcon->ses->server->oplocks)
276a74a4
SF
383 oplock = REQ_OPLOCK;
384 else
385 oplock = 0;
386
64cc2c63
SF
387 if (!tcon->broken_posix_open && tcon->unix_ext &&
388 (tcon->ses->capabilities & CAP_UNIX) &&
276a74a4
SF
389 (CIFS_UNIX_POSIX_PATH_OPS_CAP &
390 le64_to_cpu(tcon->fsUnixInfo.Capability))) {
276a74a4 391 /* can not refresh inode info since size could be stale */
2422f676 392 rc = cifs_posix_open(full_path, &inode, inode->i_sb,
fa588e0c 393 cifs_sb->mnt_file_mode /* ignored */,
608712fe 394 file->f_flags, &oplock, &netfid, xid);
276a74a4 395 if (rc == 0) {
b6b38f70 396 cFYI(1, "posix open succeeded");
7e12eddb 397 posix_open_ok = true;
64cc2c63
SF
398 } else if ((rc == -EINVAL) || (rc == -EOPNOTSUPP)) {
399 if (tcon->ses->serverNOS)
b6b38f70 400 cERROR(1, "server %s of type %s returned"
64cc2c63
SF
401 " unexpected error on SMB posix open"
402 ", disabling posix open support."
403 " Check if server update available.",
404 tcon->ses->serverName,
b6b38f70 405 tcon->ses->serverNOS);
64cc2c63 406 tcon->broken_posix_open = true;
276a74a4
SF
407 } else if ((rc != -EIO) && (rc != -EREMOTE) &&
408 (rc != -EOPNOTSUPP)) /* path not found or net err */
409 goto out;
64cc2c63
SF
410 /* else fallthrough to retry open the old way on network i/o
411 or DFS errors */
276a74a4
SF
412 }
413
7e12eddb
PS
414 if (!posix_open_ok) {
415 rc = cifs_nt_open(full_path, inode, cifs_sb, tcon,
416 file->f_flags, &oplock, &netfid, xid);
417 if (rc)
418 goto out;
419 }
47c78b7f 420
abfe1eed 421 pCifsFile = cifs_new_fileinfo(netfid, file, tlink, oplock);
6ca9f3ba 422 if (pCifsFile == NULL) {
7e12eddb 423 CIFSSMBClose(xid, tcon, netfid);
1da177e4
LT
424 rc = -ENOMEM;
425 goto out;
426 }
1da177e4 427
9451a9a5
SJ
428 cifs_fscache_set_inode_cookie(inode, file);
429
7e12eddb 430 if ((oplock & CIFS_CREATE_ACTION) && !posix_open_ok && tcon->unix_ext) {
1da177e4
LT
431 /* time to set mode which we can not set earlier due to
432 problems creating new read-only files */
7e12eddb
PS
433 struct cifs_unix_set_info_args args = {
434 .mode = inode->i_mode,
435 .uid = NO_CHANGE_64,
436 .gid = NO_CHANGE_64,
437 .ctime = NO_CHANGE_64,
438 .atime = NO_CHANGE_64,
439 .mtime = NO_CHANGE_64,
440 .device = 0,
441 };
d44a9fe2
JL
442 CIFSSMBUnixSetFileInfo(xid, tcon, &args, netfid,
443 pCifsFile->pid);
1da177e4
LT
444 }
445
446out:
1da177e4
LT
447 kfree(full_path);
448 FreeXid(xid);
7ffec372 449 cifs_put_tlink(tlink);
1da177e4
LT
450 return rc;
451}
452
0418726b 453/* Try to reacquire byte range locks that were released when session */
1da177e4
LT
454/* to server was lost */
455static int cifs_relock_file(struct cifsFileInfo *cifsFile)
456{
457 int rc = 0;
458
459/* BB list all locks open on this file and relock */
460
461 return rc;
462}
463
15886177 464static int cifs_reopen_file(struct cifsFileInfo *pCifsFile, bool can_flush)
1da177e4
LT
465{
466 int rc = -EACCES;
590a3fe0
JL
467 int xid;
468 __u32 oplock;
1da177e4 469 struct cifs_sb_info *cifs_sb;
96daf2b0 470 struct cifs_tcon *tcon;
1da177e4 471 struct cifsInodeInfo *pCifsInode;
fb8c4b14 472 struct inode *inode;
1da177e4
LT
473 char *full_path = NULL;
474 int desiredAccess;
475 int disposition = FILE_OPEN;
3d3ea8e6 476 int create_options = CREATE_NOT_DIR;
1da177e4
LT
477 __u16 netfid;
478
1da177e4 479 xid = GetXid();
f0a71eb8 480 mutex_lock(&pCifsFile->fh_mutex);
4b18f2a9 481 if (!pCifsFile->invalidHandle) {
f0a71eb8 482 mutex_unlock(&pCifsFile->fh_mutex);
0f3bc09e 483 rc = 0;
1da177e4 484 FreeXid(xid);
0f3bc09e 485 return rc;
1da177e4
LT
486 }
487
15886177 488 inode = pCifsFile->dentry->d_inode;
1da177e4 489 cifs_sb = CIFS_SB(inode->i_sb);
13cfb733 490 tcon = tlink_tcon(pCifsFile->tlink);
3a9f462f 491
1da177e4
LT
492/* can not grab rename sem here because various ops, including
493 those that already have the rename sem can end up causing writepage
494 to get called and if the server was down that means we end up here,
495 and we can never tell if the caller already has the rename_sem */
15886177 496 full_path = build_path_from_dentry(pCifsFile->dentry);
1da177e4 497 if (full_path == NULL) {
3a9f462f 498 rc = -ENOMEM;
f0a71eb8 499 mutex_unlock(&pCifsFile->fh_mutex);
1da177e4 500 FreeXid(xid);
3a9f462f 501 return rc;
1da177e4
LT
502 }
503
b6b38f70 504 cFYI(1, "inode = 0x%p file flags 0x%x for %s",
15886177 505 inode, pCifsFile->f_flags, full_path);
1da177e4 506
10b9b98e 507 if (tcon->ses->server->oplocks)
1da177e4
LT
508 oplock = REQ_OPLOCK;
509 else
4b18f2a9 510 oplock = 0;
1da177e4 511
7fc8f4e9
SF
512 if (tcon->unix_ext && (tcon->ses->capabilities & CAP_UNIX) &&
513 (CIFS_UNIX_POSIX_PATH_OPS_CAP &
514 le64_to_cpu(tcon->fsUnixInfo.Capability))) {
608712fe
JL
515
516 /*
517 * O_CREAT, O_EXCL and O_TRUNC already had their effect on the
518 * original open. Must mask them off for a reopen.
519 */
15886177
JL
520 unsigned int oflags = pCifsFile->f_flags &
521 ~(O_CREAT | O_EXCL | O_TRUNC);
608712fe 522
2422f676 523 rc = cifs_posix_open(full_path, NULL, inode->i_sb,
fa588e0c
SF
524 cifs_sb->mnt_file_mode /* ignored */,
525 oflags, &oplock, &netfid, xid);
7fc8f4e9 526 if (rc == 0) {
b6b38f70 527 cFYI(1, "posix reopen succeeded");
7fc8f4e9
SF
528 goto reopen_success;
529 }
530 /* fallthrough to retry open the old way on errors, especially
531 in the reconnect path it is important to retry hard */
532 }
533
15886177 534 desiredAccess = cifs_convert_flags(pCifsFile->f_flags);
7fc8f4e9 535
3d3ea8e6
SP
536 if (backup_cred(cifs_sb))
537 create_options |= CREATE_OPEN_BACKUP_INTENT;
538
1da177e4 539 /* Can not refresh inode by passing in file_info buf to be returned
fb8c4b14
SF
540 by SMBOpen and then calling get_inode_info with returned buf
541 since file might have write behind data that needs to be flushed
1da177e4
LT
542 and server version of file size can be stale. If we knew for sure
543 that inode was not dirty locally we could do this */
544
7fc8f4e9 545 rc = CIFSSMBOpen(xid, tcon, full_path, disposition, desiredAccess,
3d3ea8e6 546 create_options, &netfid, &oplock, NULL,
fb8c4b14 547 cifs_sb->local_nls, cifs_sb->mnt_cifs_flags &
737b758c 548 CIFS_MOUNT_MAP_SPECIAL_CHR);
1da177e4 549 if (rc) {
f0a71eb8 550 mutex_unlock(&pCifsFile->fh_mutex);
b6b38f70
JP
551 cFYI(1, "cifs_open returned 0x%x", rc);
552 cFYI(1, "oplock: %d", oplock);
15886177
JL
553 goto reopen_error_exit;
554 }
555
7fc8f4e9 556reopen_success:
15886177
JL
557 pCifsFile->netfid = netfid;
558 pCifsFile->invalidHandle = false;
559 mutex_unlock(&pCifsFile->fh_mutex);
560 pCifsInode = CIFS_I(inode);
561
562 if (can_flush) {
563 rc = filemap_write_and_wait(inode->i_mapping);
eb4b756b 564 mapping_set_error(inode->i_mapping, rc);
15886177 565
15886177
JL
566 if (tcon->unix_ext)
567 rc = cifs_get_inode_info_unix(&inode,
568 full_path, inode->i_sb, xid);
569 else
570 rc = cifs_get_inode_info(&inode,
571 full_path, NULL, inode->i_sb,
572 xid, NULL);
573 } /* else we are writing out data to server already
574 and could deadlock if we tried to flush data, and
575 since we do not know if we have data that would
576 invalidate the current end of file on the server
577 we can not go to the server to get the new inod
578 info */
e66673e3 579
c6723628 580 cifs_set_oplock_level(pCifsInode, oplock);
e66673e3 581
15886177
JL
582 cifs_relock_file(pCifsFile);
583
584reopen_error_exit:
1da177e4
LT
585 kfree(full_path);
586 FreeXid(xid);
587 return rc;
588}
589
590int cifs_close(struct inode *inode, struct file *file)
591{
77970693
JL
592 if (file->private_data != NULL) {
593 cifsFileInfo_put(file->private_data);
594 file->private_data = NULL;
595 }
7ee1af76 596
cdff08e7
SF
597 /* return code from the ->release op is always ignored */
598 return 0;
1da177e4
LT
599}
600
601int cifs_closedir(struct inode *inode, struct file *file)
602{
603 int rc = 0;
604 int xid;
c21dfb69 605 struct cifsFileInfo *pCFileStruct = file->private_data;
1da177e4
LT
606 char *ptmp;
607
b6b38f70 608 cFYI(1, "Closedir inode = 0x%p", inode);
1da177e4
LT
609
610 xid = GetXid();
611
612 if (pCFileStruct) {
96daf2b0 613 struct cifs_tcon *pTcon = tlink_tcon(pCFileStruct->tlink);
1da177e4 614
b6b38f70 615 cFYI(1, "Freeing private data in close dir");
4477288a 616 spin_lock(&cifs_file_list_lock);
4b18f2a9
SF
617 if (!pCFileStruct->srch_inf.endOfSearch &&
618 !pCFileStruct->invalidHandle) {
619 pCFileStruct->invalidHandle = true;
4477288a 620 spin_unlock(&cifs_file_list_lock);
1da177e4 621 rc = CIFSFindClose(xid, pTcon, pCFileStruct->netfid);
b6b38f70
JP
622 cFYI(1, "Closing uncompleted readdir with rc %d",
623 rc);
1da177e4
LT
624 /* not much we can do if it fails anyway, ignore rc */
625 rc = 0;
ddb4cbfc 626 } else
4477288a 627 spin_unlock(&cifs_file_list_lock);
1da177e4
LT
628 ptmp = pCFileStruct->srch_inf.ntwrk_buf_start;
629 if (ptmp) {
b6b38f70 630 cFYI(1, "closedir free smb buf in srch struct");
1da177e4 631 pCFileStruct->srch_inf.ntwrk_buf_start = NULL;
fb8c4b14 632 if (pCFileStruct->srch_inf.smallBuf)
d47d7c1a
SF
633 cifs_small_buf_release(ptmp);
634 else
635 cifs_buf_release(ptmp);
1da177e4 636 }
13cfb733 637 cifs_put_tlink(pCFileStruct->tlink);
1da177e4
LT
638 kfree(file->private_data);
639 file->private_data = NULL;
640 }
641 /* BB can we lock the filestruct while this is going on? */
642 FreeXid(xid);
643 return rc;
644}
645
85160e03 646static struct cifsLockInfo *
fbd35aca 647cifs_lock_init(__u64 offset, __u64 length, __u8 type)
7ee1af76 648{
a88b4707 649 struct cifsLockInfo *lock =
fb8c4b14 650 kmalloc(sizeof(struct cifsLockInfo), GFP_KERNEL);
a88b4707
PS
651 if (!lock)
652 return lock;
653 lock->offset = offset;
654 lock->length = length;
655 lock->type = type;
a88b4707
PS
656 lock->pid = current->tgid;
657 INIT_LIST_HEAD(&lock->blist);
658 init_waitqueue_head(&lock->block_q);
659 return lock;
85160e03
PS
660}
661
662static void
663cifs_del_lock_waiters(struct cifsLockInfo *lock)
664{
665 struct cifsLockInfo *li, *tmp;
666 list_for_each_entry_safe(li, tmp, &lock->blist, blist) {
667 list_del_init(&li->blist);
668 wake_up(&li->block_q);
669 }
670}
671
672static bool
fbd35aca 673cifs_find_fid_lock_conflict(struct cifsFileInfo *cfile, __u64 offset,
55157dfb 674 __u64 length, __u8 type, struct cifsFileInfo *cur,
fbd35aca 675 struct cifsLockInfo **conf_lock)
85160e03 676{
fbd35aca 677 struct cifsLockInfo *li;
106dc538 678 struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
85160e03 679
fbd35aca 680 list_for_each_entry(li, &cfile->llist, llist) {
85160e03
PS
681 if (offset + length <= li->offset ||
682 offset >= li->offset + li->length)
683 continue;
106dc538 684 else if ((type & server->vals->shared_lock_type) &&
55157dfb
PS
685 ((server->ops->compare_fids(cur, cfile) &&
686 current->tgid == li->pid) || type == li->type))
85160e03
PS
687 continue;
688 else {
689 *conf_lock = li;
690 return true;
691 }
692 }
693 return false;
694}
695
161ebf9f 696static bool
55157dfb
PS
697cifs_find_lock_conflict(struct cifsFileInfo *cfile, __u64 offset, __u64 length,
698 __u8 type, struct cifsLockInfo **conf_lock)
161ebf9f 699{
fbd35aca
PS
700 bool rc = false;
701 struct cifsFileInfo *fid, *tmp;
55157dfb 702 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
fbd35aca
PS
703
704 spin_lock(&cifs_file_list_lock);
705 list_for_each_entry_safe(fid, tmp, &cinode->openFileList, flist) {
706 rc = cifs_find_fid_lock_conflict(fid, offset, length, type,
55157dfb 707 cfile, conf_lock);
fbd35aca
PS
708 if (rc)
709 break;
710 }
711 spin_unlock(&cifs_file_list_lock);
712
713 return rc;
161ebf9f
PS
714}
715
9a5101c8
PS
716/*
717 * Check if there is another lock that prevents us to set the lock (mandatory
718 * style). If such a lock exists, update the flock structure with its
719 * properties. Otherwise, set the flock type to F_UNLCK if we can cache brlocks
720 * or leave it the same if we can't. Returns 0 if we don't need to request to
721 * the server or 1 otherwise.
722 */
85160e03 723static int
fbd35aca
PS
724cifs_lock_test(struct cifsFileInfo *cfile, __u64 offset, __u64 length,
725 __u8 type, struct file_lock *flock)
85160e03
PS
726{
727 int rc = 0;
728 struct cifsLockInfo *conf_lock;
fbd35aca 729 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
106dc538 730 struct TCP_Server_Info *server = tlink_tcon(cfile->tlink)->ses->server;
85160e03
PS
731 bool exist;
732
733 mutex_lock(&cinode->lock_mutex);
734
55157dfb
PS
735 exist = cifs_find_lock_conflict(cfile, offset, length, type,
736 &conf_lock);
85160e03
PS
737 if (exist) {
738 flock->fl_start = conf_lock->offset;
739 flock->fl_end = conf_lock->offset + conf_lock->length - 1;
740 flock->fl_pid = conf_lock->pid;
106dc538 741 if (conf_lock->type & server->vals->shared_lock_type)
85160e03
PS
742 flock->fl_type = F_RDLCK;
743 else
744 flock->fl_type = F_WRLCK;
745 } else if (!cinode->can_cache_brlcks)
746 rc = 1;
747 else
748 flock->fl_type = F_UNLCK;
749
750 mutex_unlock(&cinode->lock_mutex);
751 return rc;
752}
753
161ebf9f 754static void
fbd35aca 755cifs_lock_add(struct cifsFileInfo *cfile, struct cifsLockInfo *lock)
85160e03 756{
fbd35aca 757 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
d59dad2b 758 mutex_lock(&cinode->lock_mutex);
fbd35aca 759 list_add_tail(&lock->llist, &cfile->llist);
d59dad2b 760 mutex_unlock(&cinode->lock_mutex);
7ee1af76
JA
761}
762
9a5101c8
PS
763/*
764 * Set the byte-range lock (mandatory style). Returns:
765 * 1) 0, if we set the lock and don't need to request to the server;
766 * 2) 1, if no locks prevent us but we need to request to the server;
767 * 3) -EACCESS, if there is a lock that prevents us and wait is false.
768 */
85160e03 769static int
fbd35aca 770cifs_lock_add_if(struct cifsFileInfo *cfile, struct cifsLockInfo *lock,
161ebf9f 771 bool wait)
85160e03 772{
161ebf9f 773 struct cifsLockInfo *conf_lock;
fbd35aca 774 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
85160e03
PS
775 bool exist;
776 int rc = 0;
777
85160e03
PS
778try_again:
779 exist = false;
780 mutex_lock(&cinode->lock_mutex);
781
55157dfb
PS
782 exist = cifs_find_lock_conflict(cfile, lock->offset, lock->length,
783 lock->type, &conf_lock);
85160e03 784 if (!exist && cinode->can_cache_brlcks) {
fbd35aca 785 list_add_tail(&lock->llist, &cfile->llist);
85160e03
PS
786 mutex_unlock(&cinode->lock_mutex);
787 return rc;
788 }
789
790 if (!exist)
791 rc = 1;
792 else if (!wait)
793 rc = -EACCES;
794 else {
795 list_add_tail(&lock->blist, &conf_lock->blist);
796 mutex_unlock(&cinode->lock_mutex);
797 rc = wait_event_interruptible(lock->block_q,
798 (lock->blist.prev == &lock->blist) &&
799 (lock->blist.next == &lock->blist));
800 if (!rc)
801 goto try_again;
a88b4707
PS
802 mutex_lock(&cinode->lock_mutex);
803 list_del_init(&lock->blist);
85160e03
PS
804 }
805
85160e03
PS
806 mutex_unlock(&cinode->lock_mutex);
807 return rc;
808}
809
9a5101c8
PS
810/*
811 * Check if there is another lock that prevents us to set the lock (posix
812 * style). If such a lock exists, update the flock structure with its
813 * properties. Otherwise, set the flock type to F_UNLCK if we can cache brlocks
814 * or leave it the same if we can't. Returns 0 if we don't need to request to
815 * the server or 1 otherwise.
816 */
85160e03 817static int
4f6bcec9
PS
818cifs_posix_lock_test(struct file *file, struct file_lock *flock)
819{
820 int rc = 0;
821 struct cifsInodeInfo *cinode = CIFS_I(file->f_path.dentry->d_inode);
822 unsigned char saved_type = flock->fl_type;
823
50792760
PS
824 if ((flock->fl_flags & FL_POSIX) == 0)
825 return 1;
826
4f6bcec9
PS
827 mutex_lock(&cinode->lock_mutex);
828 posix_test_lock(file, flock);
829
830 if (flock->fl_type == F_UNLCK && !cinode->can_cache_brlcks) {
831 flock->fl_type = saved_type;
832 rc = 1;
833 }
834
835 mutex_unlock(&cinode->lock_mutex);
836 return rc;
837}
838
9a5101c8
PS
839/*
840 * Set the byte-range lock (posix style). Returns:
841 * 1) 0, if we set the lock and don't need to request to the server;
842 * 2) 1, if we need to request to the server;
843 * 3) <0, if the error occurs while setting the lock.
844 */
4f6bcec9
PS
845static int
846cifs_posix_lock_set(struct file *file, struct file_lock *flock)
847{
848 struct cifsInodeInfo *cinode = CIFS_I(file->f_path.dentry->d_inode);
50792760
PS
849 int rc = 1;
850
851 if ((flock->fl_flags & FL_POSIX) == 0)
852 return rc;
4f6bcec9 853
66189be7 854try_again:
4f6bcec9
PS
855 mutex_lock(&cinode->lock_mutex);
856 if (!cinode->can_cache_brlcks) {
857 mutex_unlock(&cinode->lock_mutex);
50792760 858 return rc;
4f6bcec9 859 }
66189be7
PS
860
861 rc = posix_lock_file(file, flock, NULL);
9ebb389d 862 mutex_unlock(&cinode->lock_mutex);
66189be7
PS
863 if (rc == FILE_LOCK_DEFERRED) {
864 rc = wait_event_interruptible(flock->fl_wait, !flock->fl_next);
865 if (!rc)
866 goto try_again;
867 locks_delete_block(flock);
868 }
9ebb389d 869 return rc;
4f6bcec9
PS
870}
871
872static int
873cifs_push_mandatory_locks(struct cifsFileInfo *cfile)
85160e03
PS
874{
875 int xid, rc = 0, stored_rc;
876 struct cifsLockInfo *li, *tmp;
877 struct cifs_tcon *tcon;
878 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
0013fb4c 879 unsigned int num, max_num, max_buf;
32b9aaf1
PS
880 LOCKING_ANDX_RANGE *buf, *cur;
881 int types[] = {LOCKING_ANDX_LARGE_FILES,
882 LOCKING_ANDX_SHARED_LOCK | LOCKING_ANDX_LARGE_FILES};
883 int i;
85160e03
PS
884
885 xid = GetXid();
886 tcon = tlink_tcon(cfile->tlink);
887
888 mutex_lock(&cinode->lock_mutex);
889 if (!cinode->can_cache_brlcks) {
890 mutex_unlock(&cinode->lock_mutex);
891 FreeXid(xid);
892 return rc;
893 }
894
0013fb4c
PS
895 /*
896 * Accessing maxBuf is racy with cifs_reconnect - need to store value
897 * and check it for zero before using.
898 */
899 max_buf = tcon->ses->server->maxBuf;
900 if (!max_buf) {
901 mutex_unlock(&cinode->lock_mutex);
902 FreeXid(xid);
903 return -EINVAL;
904 }
905
906 max_num = (max_buf - sizeof(struct smb_hdr)) /
907 sizeof(LOCKING_ANDX_RANGE);
32b9aaf1
PS
908 buf = kzalloc(max_num * sizeof(LOCKING_ANDX_RANGE), GFP_KERNEL);
909 if (!buf) {
910 mutex_unlock(&cinode->lock_mutex);
911 FreeXid(xid);
912 return rc;
913 }
914
915 for (i = 0; i < 2; i++) {
916 cur = buf;
917 num = 0;
fbd35aca 918 list_for_each_entry_safe(li, tmp, &cfile->llist, llist) {
32b9aaf1
PS
919 if (li->type != types[i])
920 continue;
921 cur->Pid = cpu_to_le16(li->pid);
922 cur->LengthLow = cpu_to_le32((u32)li->length);
923 cur->LengthHigh = cpu_to_le32((u32)(li->length>>32));
924 cur->OffsetLow = cpu_to_le32((u32)li->offset);
925 cur->OffsetHigh = cpu_to_le32((u32)(li->offset>>32));
926 if (++num == max_num) {
927 stored_rc = cifs_lockv(xid, tcon, cfile->netfid,
04a6aa8a
PS
928 (__u8)li->type, 0, num,
929 buf);
32b9aaf1
PS
930 if (stored_rc)
931 rc = stored_rc;
932 cur = buf;
933 num = 0;
934 } else
935 cur++;
936 }
937
938 if (num) {
939 stored_rc = cifs_lockv(xid, tcon, cfile->netfid,
04a6aa8a 940 (__u8)types[i], 0, num, buf);
32b9aaf1
PS
941 if (stored_rc)
942 rc = stored_rc;
943 }
85160e03
PS
944 }
945
946 cinode->can_cache_brlcks = false;
947 mutex_unlock(&cinode->lock_mutex);
948
32b9aaf1 949 kfree(buf);
85160e03
PS
950 FreeXid(xid);
951 return rc;
952}
953
4f6bcec9
PS
954/* copied from fs/locks.c with a name change */
955#define cifs_for_each_lock(inode, lockp) \
956 for (lockp = &inode->i_flock; *lockp != NULL; \
957 lockp = &(*lockp)->fl_next)
958
d5751469
PS
959struct lock_to_push {
960 struct list_head llist;
961 __u64 offset;
962 __u64 length;
963 __u32 pid;
964 __u16 netfid;
965 __u8 type;
966};
967
4f6bcec9
PS
968static int
969cifs_push_posix_locks(struct cifsFileInfo *cfile)
970{
971 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
972 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
973 struct file_lock *flock, **before;
d5751469 974 unsigned int count = 0, i = 0;
4f6bcec9 975 int rc = 0, xid, type;
d5751469
PS
976 struct list_head locks_to_send, *el;
977 struct lock_to_push *lck, *tmp;
4f6bcec9 978 __u64 length;
4f6bcec9
PS
979
980 xid = GetXid();
981
982 mutex_lock(&cinode->lock_mutex);
983 if (!cinode->can_cache_brlcks) {
984 mutex_unlock(&cinode->lock_mutex);
985 FreeXid(xid);
986 return rc;
987 }
988
d5751469
PS
989 lock_flocks();
990 cifs_for_each_lock(cfile->dentry->d_inode, before) {
991 if ((*before)->fl_flags & FL_POSIX)
992 count++;
993 }
994 unlock_flocks();
995
4f6bcec9
PS
996 INIT_LIST_HEAD(&locks_to_send);
997
d5751469 998 /*
ce85852b
PS
999 * Allocating count locks is enough because no FL_POSIX locks can be
1000 * added to the list while we are holding cinode->lock_mutex that
1001 * protects locking operations of this inode.
d5751469
PS
1002 */
1003 for (; i < count; i++) {
1004 lck = kmalloc(sizeof(struct lock_to_push), GFP_KERNEL);
1005 if (!lck) {
1006 rc = -ENOMEM;
1007 goto err_out;
1008 }
1009 list_add_tail(&lck->llist, &locks_to_send);
1010 }
1011
d5751469 1012 el = locks_to_send.next;
4f6bcec9
PS
1013 lock_flocks();
1014 cifs_for_each_lock(cfile->dentry->d_inode, before) {
ce85852b
PS
1015 flock = *before;
1016 if ((flock->fl_flags & FL_POSIX) == 0)
1017 continue;
d5751469 1018 if (el == &locks_to_send) {
ce85852b
PS
1019 /*
1020 * The list ended. We don't have enough allocated
1021 * structures - something is really wrong.
1022 */
d5751469
PS
1023 cERROR(1, "Can't push all brlocks!");
1024 break;
1025 }
4f6bcec9
PS
1026 length = 1 + flock->fl_end - flock->fl_start;
1027 if (flock->fl_type == F_RDLCK || flock->fl_type == F_SHLCK)
1028 type = CIFS_RDLCK;
1029 else
1030 type = CIFS_WRLCK;
d5751469 1031 lck = list_entry(el, struct lock_to_push, llist);
4f6bcec9 1032 lck->pid = flock->fl_pid;
d5751469
PS
1033 lck->netfid = cfile->netfid;
1034 lck->length = length;
1035 lck->type = type;
1036 lck->offset = flock->fl_start;
d5751469 1037 el = el->next;
4f6bcec9 1038 }
4f6bcec9
PS
1039 unlock_flocks();
1040
1041 list_for_each_entry_safe(lck, tmp, &locks_to_send, llist) {
4f6bcec9
PS
1042 int stored_rc;
1043
4f6bcec9 1044 stored_rc = CIFSSMBPosixLock(xid, tcon, lck->netfid, lck->pid,
c5fd363d 1045 lck->offset, lck->length, NULL,
4f6bcec9
PS
1046 lck->type, 0);
1047 if (stored_rc)
1048 rc = stored_rc;
1049 list_del(&lck->llist);
1050 kfree(lck);
1051 }
1052
d5751469 1053out:
4f6bcec9
PS
1054 cinode->can_cache_brlcks = false;
1055 mutex_unlock(&cinode->lock_mutex);
1056
1057 FreeXid(xid);
1058 return rc;
d5751469
PS
1059err_out:
1060 list_for_each_entry_safe(lck, tmp, &locks_to_send, llist) {
1061 list_del(&lck->llist);
1062 kfree(lck);
1063 }
1064 goto out;
4f6bcec9
PS
1065}
1066
1067static int
1068cifs_push_locks(struct cifsFileInfo *cfile)
1069{
1070 struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
1071 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
1072
1073 if ((tcon->ses->capabilities & CAP_UNIX) &&
1074 (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
1075 ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
1076 return cifs_push_posix_locks(cfile);
1077
1078 return cifs_push_mandatory_locks(cfile);
1079}
1080
03776f45 1081static void
04a6aa8a 1082cifs_read_flock(struct file_lock *flock, __u32 *type, int *lock, int *unlock,
106dc538 1083 bool *wait_flag, struct TCP_Server_Info *server)
1da177e4 1084{
03776f45 1085 if (flock->fl_flags & FL_POSIX)
b6b38f70 1086 cFYI(1, "Posix");
03776f45 1087 if (flock->fl_flags & FL_FLOCK)
b6b38f70 1088 cFYI(1, "Flock");
03776f45 1089 if (flock->fl_flags & FL_SLEEP) {
b6b38f70 1090 cFYI(1, "Blocking lock");
03776f45 1091 *wait_flag = true;
1da177e4 1092 }
03776f45 1093 if (flock->fl_flags & FL_ACCESS)
b6b38f70 1094 cFYI(1, "Process suspended by mandatory locking - "
03776f45
PS
1095 "not implemented yet");
1096 if (flock->fl_flags & FL_LEASE)
b6b38f70 1097 cFYI(1, "Lease on file - not implemented yet");
03776f45 1098 if (flock->fl_flags &
1da177e4 1099 (~(FL_POSIX | FL_FLOCK | FL_SLEEP | FL_ACCESS | FL_LEASE)))
03776f45 1100 cFYI(1, "Unknown lock flags 0x%x", flock->fl_flags);
1da177e4 1101
106dc538 1102 *type = server->vals->large_lock_type;
03776f45 1103 if (flock->fl_type == F_WRLCK) {
b6b38f70 1104 cFYI(1, "F_WRLCK ");
106dc538 1105 *type |= server->vals->exclusive_lock_type;
03776f45
PS
1106 *lock = 1;
1107 } else if (flock->fl_type == F_UNLCK) {
b6b38f70 1108 cFYI(1, "F_UNLCK");
106dc538 1109 *type |= server->vals->unlock_lock_type;
03776f45
PS
1110 *unlock = 1;
1111 /* Check if unlock includes more than one lock range */
1112 } else if (flock->fl_type == F_RDLCK) {
b6b38f70 1113 cFYI(1, "F_RDLCK");
106dc538 1114 *type |= server->vals->shared_lock_type;
03776f45
PS
1115 *lock = 1;
1116 } else if (flock->fl_type == F_EXLCK) {
b6b38f70 1117 cFYI(1, "F_EXLCK");
106dc538 1118 *type |= server->vals->exclusive_lock_type;
03776f45
PS
1119 *lock = 1;
1120 } else if (flock->fl_type == F_SHLCK) {
b6b38f70 1121 cFYI(1, "F_SHLCK");
106dc538 1122 *type |= server->vals->shared_lock_type;
03776f45 1123 *lock = 1;
1da177e4 1124 } else
b6b38f70 1125 cFYI(1, "Unknown type of lock");
03776f45 1126}
1da177e4 1127
55157dfb
PS
1128static int
1129cifs_mandatory_lock(int xid, struct cifsFileInfo *cfile, __u64 offset,
1130 __u64 length, __u32 type, int lock, int unlock, bool wait)
1131{
1132 return CIFSSMBLock(xid, tlink_tcon(cfile->tlink), cfile->netfid,
1133 current->tgid, length, offset, unlock, lock,
1134 (__u8)type, wait, 0);
1135}
1136
03776f45 1137static int
04a6aa8a 1138cifs_getlk(struct file *file, struct file_lock *flock, __u32 type,
03776f45
PS
1139 bool wait_flag, bool posix_lck, int xid)
1140{
1141 int rc = 0;
1142 __u64 length = 1 + flock->fl_end - flock->fl_start;
4f6bcec9
PS
1143 struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
1144 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
106dc538 1145 struct TCP_Server_Info *server = tcon->ses->server;
03776f45 1146 __u16 netfid = cfile->netfid;
f05337c6 1147
03776f45
PS
1148 if (posix_lck) {
1149 int posix_lock_type;
4f6bcec9
PS
1150
1151 rc = cifs_posix_lock_test(file, flock);
1152 if (!rc)
1153 return rc;
1154
106dc538 1155 if (type & server->vals->shared_lock_type)
03776f45
PS
1156 posix_lock_type = CIFS_RDLCK;
1157 else
1158 posix_lock_type = CIFS_WRLCK;
4f6bcec9 1159 rc = CIFSSMBPosixLock(xid, tcon, netfid, current->tgid,
c5fd363d 1160 flock->fl_start, length, flock,
4f6bcec9 1161 posix_lock_type, wait_flag);
03776f45
PS
1162 return rc;
1163 }
1da177e4 1164
fbd35aca 1165 rc = cifs_lock_test(cfile, flock->fl_start, length, type, flock);
85160e03
PS
1166 if (!rc)
1167 return rc;
1168
03776f45 1169 /* BB we could chain these into one lock request BB */
55157dfb
PS
1170 rc = cifs_mandatory_lock(xid, cfile, flock->fl_start, length, type,
1171 1, 0, false);
03776f45 1172 if (rc == 0) {
55157dfb
PS
1173 rc = cifs_mandatory_lock(xid, cfile, flock->fl_start, length,
1174 type, 0, 1, false);
03776f45
PS
1175 flock->fl_type = F_UNLCK;
1176 if (rc != 0)
1177 cERROR(1, "Error unlocking previously locked "
106dc538 1178 "range %d during test of lock", rc);
a88b4707 1179 return 0;
1da177e4 1180 }
7ee1af76 1181
106dc538 1182 if (type & server->vals->shared_lock_type) {
03776f45 1183 flock->fl_type = F_WRLCK;
a88b4707 1184 return 0;
7ee1af76
JA
1185 }
1186
55157dfb
PS
1187 rc = cifs_mandatory_lock(xid, cfile, flock->fl_start, length,
1188 type | server->vals->shared_lock_type, 1, 0,
1189 false);
03776f45 1190 if (rc == 0) {
55157dfb
PS
1191 rc = cifs_mandatory_lock(xid, cfile, flock->fl_start, length,
1192 type | server->vals->shared_lock_type,
1193 0, 1, false);
03776f45
PS
1194 flock->fl_type = F_RDLCK;
1195 if (rc != 0)
1196 cERROR(1, "Error unlocking previously locked "
1197 "range %d during test of lock", rc);
1198 } else
1199 flock->fl_type = F_WRLCK;
1200
a88b4707 1201 return 0;
03776f45
PS
1202}
1203
9ee305b7
PS
1204static void
1205cifs_move_llist(struct list_head *source, struct list_head *dest)
1206{
1207 struct list_head *li, *tmp;
1208 list_for_each_safe(li, tmp, source)
1209 list_move(li, dest);
1210}
1211
1212static void
1213cifs_free_llist(struct list_head *llist)
1214{
1215 struct cifsLockInfo *li, *tmp;
1216 list_for_each_entry_safe(li, tmp, llist, llist) {
1217 cifs_del_lock_waiters(li);
1218 list_del(&li->llist);
1219 kfree(li);
1220 }
1221}
1222
1223static int
1224cifs_unlock_range(struct cifsFileInfo *cfile, struct file_lock *flock, int xid)
1225{
1226 int rc = 0, stored_rc;
1227 int types[] = {LOCKING_ANDX_LARGE_FILES,
1228 LOCKING_ANDX_SHARED_LOCK | LOCKING_ANDX_LARGE_FILES};
1229 unsigned int i;
0013fb4c 1230 unsigned int max_num, num, max_buf;
9ee305b7
PS
1231 LOCKING_ANDX_RANGE *buf, *cur;
1232 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
1233 struct cifsInodeInfo *cinode = CIFS_I(cfile->dentry->d_inode);
1234 struct cifsLockInfo *li, *tmp;
1235 __u64 length = 1 + flock->fl_end - flock->fl_start;
1236 struct list_head tmp_llist;
1237
1238 INIT_LIST_HEAD(&tmp_llist);
1239
0013fb4c
PS
1240 /*
1241 * Accessing maxBuf is racy with cifs_reconnect - need to store value
1242 * and check it for zero before using.
1243 */
1244 max_buf = tcon->ses->server->maxBuf;
1245 if (!max_buf)
1246 return -EINVAL;
1247
1248 max_num = (max_buf - sizeof(struct smb_hdr)) /
1249 sizeof(LOCKING_ANDX_RANGE);
9ee305b7
PS
1250 buf = kzalloc(max_num * sizeof(LOCKING_ANDX_RANGE), GFP_KERNEL);
1251 if (!buf)
1252 return -ENOMEM;
1253
1254 mutex_lock(&cinode->lock_mutex);
1255 for (i = 0; i < 2; i++) {
1256 cur = buf;
1257 num = 0;
fbd35aca 1258 list_for_each_entry_safe(li, tmp, &cfile->llist, llist) {
9ee305b7
PS
1259 if (flock->fl_start > li->offset ||
1260 (flock->fl_start + length) <
1261 (li->offset + li->length))
1262 continue;
1263 if (current->tgid != li->pid)
1264 continue;
9ee305b7
PS
1265 if (types[i] != li->type)
1266 continue;
ea319d57 1267 if (cinode->can_cache_brlcks) {
9ee305b7
PS
1268 /*
1269 * We can cache brlock requests - simply remove
fbd35aca 1270 * a lock from the file's list.
9ee305b7
PS
1271 */
1272 list_del(&li->llist);
1273 cifs_del_lock_waiters(li);
1274 kfree(li);
ea319d57 1275 continue;
9ee305b7 1276 }
ea319d57
PS
1277 cur->Pid = cpu_to_le16(li->pid);
1278 cur->LengthLow = cpu_to_le32((u32)li->length);
1279 cur->LengthHigh = cpu_to_le32((u32)(li->length>>32));
1280 cur->OffsetLow = cpu_to_le32((u32)li->offset);
1281 cur->OffsetHigh = cpu_to_le32((u32)(li->offset>>32));
1282 /*
1283 * We need to save a lock here to let us add it again to
1284 * the file's list if the unlock range request fails on
1285 * the server.
1286 */
1287 list_move(&li->llist, &tmp_llist);
1288 if (++num == max_num) {
1289 stored_rc = cifs_lockv(xid, tcon, cfile->netfid,
1290 li->type, num, 0, buf);
1291 if (stored_rc) {
1292 /*
1293 * We failed on the unlock range
1294 * request - add all locks from the tmp
1295 * list to the head of the file's list.
1296 */
1297 cifs_move_llist(&tmp_llist,
1298 &cfile->llist);
1299 rc = stored_rc;
1300 } else
1301 /*
1302 * The unlock range request succeed -
1303 * free the tmp list.
1304 */
1305 cifs_free_llist(&tmp_llist);
1306 cur = buf;
1307 num = 0;
1308 } else
1309 cur++;
9ee305b7
PS
1310 }
1311 if (num) {
1312 stored_rc = cifs_lockv(xid, tcon, cfile->netfid,
1313 types[i], num, 0, buf);
1314 if (stored_rc) {
fbd35aca 1315 cifs_move_llist(&tmp_llist, &cfile->llist);
9ee305b7
PS
1316 rc = stored_rc;
1317 } else
1318 cifs_free_llist(&tmp_llist);
1319 }
1320 }
1321
1322 mutex_unlock(&cinode->lock_mutex);
1323 kfree(buf);
1324 return rc;
1325}
1326
03776f45 1327static int
04a6aa8a 1328cifs_setlk(struct file *file, struct file_lock *flock, __u32 type,
03776f45
PS
1329 bool wait_flag, bool posix_lck, int lock, int unlock, int xid)
1330{
1331 int rc = 0;
1332 __u64 length = 1 + flock->fl_end - flock->fl_start;
1333 struct cifsFileInfo *cfile = (struct cifsFileInfo *)file->private_data;
1334 struct cifs_tcon *tcon = tlink_tcon(cfile->tlink);
106dc538 1335 struct TCP_Server_Info *server = tcon->ses->server;
03776f45
PS
1336 __u16 netfid = cfile->netfid;
1337
1338 if (posix_lck) {
08547b03 1339 int posix_lock_type;
4f6bcec9
PS
1340
1341 rc = cifs_posix_lock_set(file, flock);
1342 if (!rc || rc < 0)
1343 return rc;
1344
106dc538 1345 if (type & server->vals->shared_lock_type)
08547b03
SF
1346 posix_lock_type = CIFS_RDLCK;
1347 else
1348 posix_lock_type = CIFS_WRLCK;
50c2f753 1349
03776f45 1350 if (unlock == 1)
beb84dc8 1351 posix_lock_type = CIFS_UNLCK;
7ee1af76 1352
4f6bcec9 1353 rc = CIFSSMBPosixLock(xid, tcon, netfid, current->tgid,
c5fd363d 1354 flock->fl_start, length, NULL,
4f6bcec9 1355 posix_lock_type, wait_flag);
03776f45
PS
1356 goto out;
1357 }
7ee1af76 1358
03776f45 1359 if (lock) {
161ebf9f
PS
1360 struct cifsLockInfo *lock;
1361
fbd35aca 1362 lock = cifs_lock_init(flock->fl_start, length, type);
161ebf9f
PS
1363 if (!lock)
1364 return -ENOMEM;
1365
fbd35aca 1366 rc = cifs_lock_add_if(cfile, lock, wait_flag);
85160e03 1367 if (rc < 0)
161ebf9f
PS
1368 kfree(lock);
1369 if (rc <= 0)
85160e03
PS
1370 goto out;
1371
7f92447a
PS
1372 rc = cifs_mandatory_lock(xid, cfile, flock->fl_start, length,
1373 type, 1, 0, wait_flag);
161ebf9f
PS
1374 if (rc) {
1375 kfree(lock);
1376 goto out;
03776f45 1377 }
161ebf9f 1378
fbd35aca 1379 cifs_lock_add(cfile, lock);
9ee305b7
PS
1380 } else if (unlock)
1381 rc = cifs_unlock_range(cfile, flock, xid);
03776f45 1382
03776f45
PS
1383out:
1384 if (flock->fl_flags & FL_POSIX)
9ebb389d 1385 posix_lock_file_wait(file, flock);
03776f45
PS
1386 return rc;
1387}
1388
1389int cifs_lock(struct file *file, int cmd, struct file_lock *flock)
1390{
1391 int rc, xid;
1392 int lock = 0, unlock = 0;
1393 bool wait_flag = false;
1394 bool posix_lck = false;
1395 struct cifs_sb_info *cifs_sb;
1396 struct cifs_tcon *tcon;
1397 struct cifsInodeInfo *cinode;
1398 struct cifsFileInfo *cfile;
1399 __u16 netfid;
04a6aa8a 1400 __u32 type;
03776f45
PS
1401
1402 rc = -EACCES;
1403 xid = GetXid();
1404
1405 cFYI(1, "Lock parm: 0x%x flockflags: 0x%x flocktype: 0x%x start: %lld "
1406 "end: %lld", cmd, flock->fl_flags, flock->fl_type,
1407 flock->fl_start, flock->fl_end);
1408
03776f45
PS
1409 cfile = (struct cifsFileInfo *)file->private_data;
1410 tcon = tlink_tcon(cfile->tlink);
106dc538
PS
1411
1412 cifs_read_flock(flock, &type, &lock, &unlock, &wait_flag,
1413 tcon->ses->server);
1414
1415 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
03776f45
PS
1416 netfid = cfile->netfid;
1417 cinode = CIFS_I(file->f_path.dentry->d_inode);
1418
1419 if ((tcon->ses->capabilities & CAP_UNIX) &&
1420 (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
1421 ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
1422 posix_lck = true;
1423 /*
1424 * BB add code here to normalize offset and length to account for
1425 * negative length which we can not accept over the wire.
1426 */
1427 if (IS_GETLK(cmd)) {
4f6bcec9 1428 rc = cifs_getlk(file, flock, type, wait_flag, posix_lck, xid);
03776f45
PS
1429 FreeXid(xid);
1430 return rc;
1431 }
1432
1433 if (!lock && !unlock) {
1434 /*
1435 * if no lock or unlock then nothing to do since we do not
1436 * know what it is
1437 */
1438 FreeXid(xid);
1439 return -EOPNOTSUPP;
7ee1af76
JA
1440 }
1441
03776f45
PS
1442 rc = cifs_setlk(file, flock, type, wait_flag, posix_lck, lock, unlock,
1443 xid);
1da177e4
LT
1444 FreeXid(xid);
1445 return rc;
1446}
1447
597b027f
JL
1448/*
1449 * update the file size (if needed) after a write. Should be called with
1450 * the inode->i_lock held
1451 */
72432ffc 1452void
fbec9ab9
JL
1453cifs_update_eof(struct cifsInodeInfo *cifsi, loff_t offset,
1454 unsigned int bytes_written)
1455{
1456 loff_t end_of_write = offset + bytes_written;
1457
1458 if (end_of_write > cifsi->server_eof)
1459 cifsi->server_eof = end_of_write;
1460}
1461
fa2989f4 1462static ssize_t cifs_write(struct cifsFileInfo *open_file, __u32 pid,
7da4b49a
JL
1463 const char *write_data, size_t write_size,
1464 loff_t *poffset)
1da177e4
LT
1465{
1466 int rc = 0;
1467 unsigned int bytes_written = 0;
1468 unsigned int total_written;
1469 struct cifs_sb_info *cifs_sb;
96daf2b0 1470 struct cifs_tcon *pTcon;
7749981e 1471 int xid;
7da4b49a
JL
1472 struct dentry *dentry = open_file->dentry;
1473 struct cifsInodeInfo *cifsi = CIFS_I(dentry->d_inode);
fa2989f4 1474 struct cifs_io_parms io_parms;
1da177e4 1475
7da4b49a 1476 cifs_sb = CIFS_SB(dentry->d_sb);
1da177e4 1477
b6b38f70 1478 cFYI(1, "write %zd bytes to offset %lld of %s", write_size,
7da4b49a 1479 *poffset, dentry->d_name.name);
1da177e4 1480
13cfb733 1481 pTcon = tlink_tcon(open_file->tlink);
50c2f753 1482
1da177e4 1483 xid = GetXid();
1da177e4 1484
1da177e4
LT
1485 for (total_written = 0; write_size > total_written;
1486 total_written += bytes_written) {
1487 rc = -EAGAIN;
1488 while (rc == -EAGAIN) {
ca83ce3d
JL
1489 struct kvec iov[2];
1490 unsigned int len;
1491
1da177e4 1492 if (open_file->invalidHandle) {
1da177e4
LT
1493 /* we could deadlock if we called
1494 filemap_fdatawait from here so tell
fb8c4b14 1495 reopen_file not to flush data to
1da177e4 1496 server now */
15886177 1497 rc = cifs_reopen_file(open_file, false);
1da177e4
LT
1498 if (rc != 0)
1499 break;
1500 }
ca83ce3d
JL
1501
1502 len = min((size_t)cifs_sb->wsize,
1503 write_size - total_written);
1504 /* iov[0] is reserved for smb header */
1505 iov[1].iov_base = (char *)write_data + total_written;
1506 iov[1].iov_len = len;
fa2989f4
PS
1507 io_parms.netfid = open_file->netfid;
1508 io_parms.pid = pid;
1509 io_parms.tcon = pTcon;
1510 io_parms.offset = *poffset;
1511 io_parms.length = len;
1512 rc = CIFSSMBWrite2(xid, &io_parms, &bytes_written, iov,
1513 1, 0);
1da177e4
LT
1514 }
1515 if (rc || (bytes_written == 0)) {
1516 if (total_written)
1517 break;
1518 else {
1519 FreeXid(xid);
1520 return rc;
1521 }
fbec9ab9 1522 } else {
597b027f 1523 spin_lock(&dentry->d_inode->i_lock);
fbec9ab9 1524 cifs_update_eof(cifsi, *poffset, bytes_written);
597b027f 1525 spin_unlock(&dentry->d_inode->i_lock);
1da177e4 1526 *poffset += bytes_written;
fbec9ab9 1527 }
1da177e4
LT
1528 }
1529
a4544347 1530 cifs_stats_bytes_written(pTcon, total_written);
1da177e4 1531
7da4b49a
JL
1532 if (total_written > 0) {
1533 spin_lock(&dentry->d_inode->i_lock);
1534 if (*poffset > dentry->d_inode->i_size)
1535 i_size_write(dentry->d_inode, *poffset);
1536 spin_unlock(&dentry->d_inode->i_lock);
1da177e4 1537 }
7da4b49a 1538 mark_inode_dirty_sync(dentry->d_inode);
1da177e4
LT
1539 FreeXid(xid);
1540 return total_written;
1541}
1542
6508d904
JL
1543struct cifsFileInfo *find_readable_file(struct cifsInodeInfo *cifs_inode,
1544 bool fsuid_only)
630f3f0c
SF
1545{
1546 struct cifsFileInfo *open_file = NULL;
6508d904
JL
1547 struct cifs_sb_info *cifs_sb = CIFS_SB(cifs_inode->vfs_inode.i_sb);
1548
1549 /* only filter by fsuid on multiuser mounts */
1550 if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MULTIUSER))
1551 fsuid_only = false;
630f3f0c 1552
4477288a 1553 spin_lock(&cifs_file_list_lock);
630f3f0c
SF
1554 /* we could simply get the first_list_entry since write-only entries
1555 are always at the end of the list but since the first entry might
1556 have a close pending, we go through the whole list */
1557 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
6508d904
JL
1558 if (fsuid_only && open_file->uid != current_fsuid())
1559 continue;
2e396b83 1560 if (OPEN_FMODE(open_file->f_flags) & FMODE_READ) {
630f3f0c
SF
1561 if (!open_file->invalidHandle) {
1562 /* found a good file */
1563 /* lock it so it will not be closed on us */
6ab409b5 1564 cifsFileInfo_get(open_file);
4477288a 1565 spin_unlock(&cifs_file_list_lock);
630f3f0c
SF
1566 return open_file;
1567 } /* else might as well continue, and look for
1568 another, or simply have the caller reopen it
1569 again rather than trying to fix this handle */
1570 } else /* write only file */
1571 break; /* write only files are last so must be done */
1572 }
4477288a 1573 spin_unlock(&cifs_file_list_lock);
630f3f0c
SF
1574 return NULL;
1575}
630f3f0c 1576
6508d904
JL
1577struct cifsFileInfo *find_writable_file(struct cifsInodeInfo *cifs_inode,
1578 bool fsuid_only)
6148a742 1579{
2c0c2a08 1580 struct cifsFileInfo *open_file, *inv_file = NULL;
d3892294 1581 struct cifs_sb_info *cifs_sb;
2846d386 1582 bool any_available = false;
dd99cd80 1583 int rc;
2c0c2a08 1584 unsigned int refind = 0;
6148a742 1585
60808233
SF
1586 /* Having a null inode here (because mapping->host was set to zero by
1587 the VFS or MM) should not happen but we had reports of on oops (due to
1588 it being zero) during stress testcases so we need to check for it */
1589
fb8c4b14 1590 if (cifs_inode == NULL) {
b6b38f70 1591 cERROR(1, "Null inode passed to cifs_writeable_file");
60808233
SF
1592 dump_stack();
1593 return NULL;
1594 }
1595
d3892294
JL
1596 cifs_sb = CIFS_SB(cifs_inode->vfs_inode.i_sb);
1597
6508d904
JL
1598 /* only filter by fsuid on multiuser mounts */
1599 if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MULTIUSER))
1600 fsuid_only = false;
1601
4477288a 1602 spin_lock(&cifs_file_list_lock);
9b22b0b7 1603refind_writable:
2c0c2a08
SP
1604 if (refind > MAX_REOPEN_ATT) {
1605 spin_unlock(&cifs_file_list_lock);
1606 return NULL;
1607 }
6148a742 1608 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
6508d904
JL
1609 if (!any_available && open_file->pid != current->tgid)
1610 continue;
1611 if (fsuid_only && open_file->uid != current_fsuid())
6148a742 1612 continue;
2e396b83 1613 if (OPEN_FMODE(open_file->f_flags) & FMODE_WRITE) {
9b22b0b7
SF
1614 if (!open_file->invalidHandle) {
1615 /* found a good writable file */
2c0c2a08 1616 cifsFileInfo_get(open_file);
4477288a 1617 spin_unlock(&cifs_file_list_lock);
9b22b0b7 1618 return open_file;
2c0c2a08
SP
1619 } else {
1620 if (!inv_file)
1621 inv_file = open_file;
9b22b0b7 1622 }
6148a742
SF
1623 }
1624 }
2846d386
JL
1625 /* couldn't find useable FH with same pid, try any available */
1626 if (!any_available) {
1627 any_available = true;
1628 goto refind_writable;
1629 }
2c0c2a08
SP
1630
1631 if (inv_file) {
1632 any_available = false;
1633 cifsFileInfo_get(inv_file);
1634 }
1635
4477288a 1636 spin_unlock(&cifs_file_list_lock);
2c0c2a08
SP
1637
1638 if (inv_file) {
1639 rc = cifs_reopen_file(inv_file, false);
1640 if (!rc)
1641 return inv_file;
1642 else {
1643 spin_lock(&cifs_file_list_lock);
1644 list_move_tail(&inv_file->flist,
1645 &cifs_inode->openFileList);
1646 spin_unlock(&cifs_file_list_lock);
1647 cifsFileInfo_put(inv_file);
1648 spin_lock(&cifs_file_list_lock);
1649 ++refind;
1650 goto refind_writable;
1651 }
1652 }
1653
6148a742
SF
1654 return NULL;
1655}
1656
1da177e4
LT
1657static int cifs_partialpagewrite(struct page *page, unsigned from, unsigned to)
1658{
1659 struct address_space *mapping = page->mapping;
1660 loff_t offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
1661 char *write_data;
1662 int rc = -EFAULT;
1663 int bytes_written = 0;
1da177e4 1664 struct inode *inode;
6148a742 1665 struct cifsFileInfo *open_file;
1da177e4
LT
1666
1667 if (!mapping || !mapping->host)
1668 return -EFAULT;
1669
1670 inode = page->mapping->host;
1da177e4
LT
1671
1672 offset += (loff_t)from;
1673 write_data = kmap(page);
1674 write_data += from;
1675
1676 if ((to > PAGE_CACHE_SIZE) || (from > to)) {
1677 kunmap(page);
1678 return -EIO;
1679 }
1680
1681 /* racing with truncate? */
1682 if (offset > mapping->host->i_size) {
1683 kunmap(page);
1684 return 0; /* don't care */
1685 }
1686
1687 /* check to make sure that we are not extending the file */
1688 if (mapping->host->i_size - offset < (loff_t)to)
fb8c4b14 1689 to = (unsigned)(mapping->host->i_size - offset);
1da177e4 1690
6508d904 1691 open_file = find_writable_file(CIFS_I(mapping->host), false);
6148a742 1692 if (open_file) {
fa2989f4
PS
1693 bytes_written = cifs_write(open_file, open_file->pid,
1694 write_data, to - from, &offset);
6ab409b5 1695 cifsFileInfo_put(open_file);
1da177e4 1696 /* Does mm or vfs already set times? */
6148a742 1697 inode->i_atime = inode->i_mtime = current_fs_time(inode->i_sb);
bb5a9a04 1698 if ((bytes_written > 0) && (offset))
6148a742 1699 rc = 0;
bb5a9a04
SF
1700 else if (bytes_written < 0)
1701 rc = bytes_written;
6148a742 1702 } else {
b6b38f70 1703 cFYI(1, "No writeable filehandles for inode");
1da177e4
LT
1704 rc = -EIO;
1705 }
1706
1707 kunmap(page);
1708 return rc;
1709}
1710
e9492871
JL
1711/*
1712 * Marshal up the iov array, reserving the first one for the header. Also,
1713 * set wdata->bytes.
1714 */
1715static void
1716cifs_writepages_marshal_iov(struct kvec *iov, struct cifs_writedata *wdata)
1717{
1718 int i;
1719 struct inode *inode = wdata->cfile->dentry->d_inode;
1720 loff_t size = i_size_read(inode);
1721
1722 /* marshal up the pages into iov array */
1723 wdata->bytes = 0;
1724 for (i = 0; i < wdata->nr_pages; i++) {
1725 iov[i + 1].iov_len = min(size - page_offset(wdata->pages[i]),
1726 (loff_t)PAGE_CACHE_SIZE);
1727 iov[i + 1].iov_base = kmap(wdata->pages[i]);
1728 wdata->bytes += iov[i + 1].iov_len;
1729 }
1730}
1731
1da177e4 1732static int cifs_writepages(struct address_space *mapping,
37c0eb46 1733 struct writeback_control *wbc)
1da177e4 1734{
c3d17b63
JL
1735 struct cifs_sb_info *cifs_sb = CIFS_SB(mapping->host->i_sb);
1736 bool done = false, scanned = false, range_whole = false;
1737 pgoff_t end, index;
1738 struct cifs_writedata *wdata;
37c0eb46 1739 struct page *page;
37c0eb46 1740 int rc = 0;
50c2f753 1741
37c0eb46 1742 /*
c3d17b63 1743 * If wsize is smaller than the page cache size, default to writing
37c0eb46
SF
1744 * one page at a time via cifs_writepage
1745 */
1746 if (cifs_sb->wsize < PAGE_CACHE_SIZE)
1747 return generic_writepages(mapping, wbc);
1748
111ebb6e 1749 if (wbc->range_cyclic) {
37c0eb46 1750 index = mapping->writeback_index; /* Start from prev offset */
111ebb6e
OH
1751 end = -1;
1752 } else {
1753 index = wbc->range_start >> PAGE_CACHE_SHIFT;
1754 end = wbc->range_end >> PAGE_CACHE_SHIFT;
1755 if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
c3d17b63
JL
1756 range_whole = true;
1757 scanned = true;
37c0eb46
SF
1758 }
1759retry:
c3d17b63
JL
1760 while (!done && index <= end) {
1761 unsigned int i, nr_pages, found_pages;
1762 pgoff_t next = 0, tofind;
1763 struct page **pages;
1764
1765 tofind = min((cifs_sb->wsize / PAGE_CACHE_SIZE) - 1,
1766 end - index) + 1;
1767
c2e87640
JL
1768 wdata = cifs_writedata_alloc((unsigned int)tofind,
1769 cifs_writev_complete);
c3d17b63
JL
1770 if (!wdata) {
1771 rc = -ENOMEM;
1772 break;
1773 }
1774
1775 /*
1776 * find_get_pages_tag seems to return a max of 256 on each
1777 * iteration, so we must call it several times in order to
1778 * fill the array or the wsize is effectively limited to
1779 * 256 * PAGE_CACHE_SIZE.
1780 */
1781 found_pages = 0;
1782 pages = wdata->pages;
1783 do {
1784 nr_pages = find_get_pages_tag(mapping, &index,
1785 PAGECACHE_TAG_DIRTY,
1786 tofind, pages);
1787 found_pages += nr_pages;
1788 tofind -= nr_pages;
1789 pages += nr_pages;
1790 } while (nr_pages && tofind && index <= end);
1791
1792 if (found_pages == 0) {
1793 kref_put(&wdata->refcount, cifs_writedata_release);
1794 break;
1795 }
1796
1797 nr_pages = 0;
1798 for (i = 0; i < found_pages; i++) {
1799 page = wdata->pages[i];
37c0eb46
SF
1800 /*
1801 * At this point we hold neither mapping->tree_lock nor
1802 * lock on the page itself: the page may be truncated or
1803 * invalidated (changing page->mapping to NULL), or even
1804 * swizzled back from swapper_space to tmpfs file
1805 * mapping
1806 */
1807
c3d17b63 1808 if (nr_pages == 0)
37c0eb46 1809 lock_page(page);
529ae9aa 1810 else if (!trylock_page(page))
37c0eb46
SF
1811 break;
1812
1813 if (unlikely(page->mapping != mapping)) {
1814 unlock_page(page);
1815 break;
1816 }
1817
111ebb6e 1818 if (!wbc->range_cyclic && page->index > end) {
c3d17b63 1819 done = true;
37c0eb46
SF
1820 unlock_page(page);
1821 break;
1822 }
1823
1824 if (next && (page->index != next)) {
1825 /* Not next consecutive page */
1826 unlock_page(page);
1827 break;
1828 }
1829
1830 if (wbc->sync_mode != WB_SYNC_NONE)
1831 wait_on_page_writeback(page);
1832
1833 if (PageWriteback(page) ||
cb876f45 1834 !clear_page_dirty_for_io(page)) {
37c0eb46
SF
1835 unlock_page(page);
1836 break;
1837 }
84d2f07e 1838
cb876f45
LT
1839 /*
1840 * This actually clears the dirty bit in the radix tree.
1841 * See cifs_writepage() for more commentary.
1842 */
1843 set_page_writeback(page);
1844
84d2f07e 1845 if (page_offset(page) >= mapping->host->i_size) {
c3d17b63 1846 done = true;
84d2f07e 1847 unlock_page(page);
cb876f45 1848 end_page_writeback(page);
84d2f07e
SF
1849 break;
1850 }
1851
c3d17b63
JL
1852 wdata->pages[i] = page;
1853 next = page->index + 1;
1854 ++nr_pages;
1855 }
37c0eb46 1856
c3d17b63
JL
1857 /* reset index to refind any pages skipped */
1858 if (nr_pages == 0)
1859 index = wdata->pages[0]->index + 1;
84d2f07e 1860
c3d17b63
JL
1861 /* put any pages we aren't going to use */
1862 for (i = nr_pages; i < found_pages; i++) {
1863 page_cache_release(wdata->pages[i]);
1864 wdata->pages[i] = NULL;
1865 }
37c0eb46 1866
c3d17b63
JL
1867 /* nothing to write? */
1868 if (nr_pages == 0) {
1869 kref_put(&wdata->refcount, cifs_writedata_release);
1870 continue;
37c0eb46 1871 }
fbec9ab9 1872
c3d17b63
JL
1873 wdata->sync_mode = wbc->sync_mode;
1874 wdata->nr_pages = nr_pages;
1875 wdata->offset = page_offset(wdata->pages[0]);
e9492871 1876 wdata->marshal_iov = cifs_writepages_marshal_iov;
941b853d 1877
c3d17b63
JL
1878 do {
1879 if (wdata->cfile != NULL)
1880 cifsFileInfo_put(wdata->cfile);
1881 wdata->cfile = find_writable_file(CIFS_I(mapping->host),
1882 false);
1883 if (!wdata->cfile) {
1884 cERROR(1, "No writable handles for inode");
1885 rc = -EBADF;
1886 break;
941b853d 1887 }
fe5f5d2e 1888 wdata->pid = wdata->cfile->pid;
c3d17b63
JL
1889 rc = cifs_async_writev(wdata);
1890 } while (wbc->sync_mode == WB_SYNC_ALL && rc == -EAGAIN);
941b853d 1891
c3d17b63
JL
1892 for (i = 0; i < nr_pages; ++i)
1893 unlock_page(wdata->pages[i]);
f3983c21 1894
c3d17b63
JL
1895 /* send failure -- clean up the mess */
1896 if (rc != 0) {
1897 for (i = 0; i < nr_pages; ++i) {
941b853d 1898 if (rc == -EAGAIN)
c3d17b63
JL
1899 redirty_page_for_writepage(wbc,
1900 wdata->pages[i]);
1901 else
1902 SetPageError(wdata->pages[i]);
1903 end_page_writeback(wdata->pages[i]);
1904 page_cache_release(wdata->pages[i]);
37c0eb46 1905 }
941b853d
JL
1906 if (rc != -EAGAIN)
1907 mapping_set_error(mapping, rc);
c3d17b63
JL
1908 }
1909 kref_put(&wdata->refcount, cifs_writedata_release);
941b853d 1910
c3d17b63
JL
1911 wbc->nr_to_write -= nr_pages;
1912 if (wbc->nr_to_write <= 0)
1913 done = true;
b066a48c 1914
c3d17b63 1915 index = next;
37c0eb46 1916 }
c3d17b63 1917
37c0eb46
SF
1918 if (!scanned && !done) {
1919 /*
1920 * We hit the last page and there is more work to be done: wrap
1921 * back to the start of the file
1922 */
c3d17b63 1923 scanned = true;
37c0eb46
SF
1924 index = 0;
1925 goto retry;
1926 }
c3d17b63 1927
111ebb6e 1928 if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
37c0eb46
SF
1929 mapping->writeback_index = index;
1930
1da177e4
LT
1931 return rc;
1932}
1da177e4 1933
9ad1506b
PS
1934static int
1935cifs_writepage_locked(struct page *page, struct writeback_control *wbc)
1da177e4 1936{
9ad1506b 1937 int rc;
1da177e4
LT
1938 int xid;
1939
1940 xid = GetXid();
1941/* BB add check for wbc flags */
1942 page_cache_get(page);
ad7a2926 1943 if (!PageUptodate(page))
b6b38f70 1944 cFYI(1, "ppw - page not up to date");
cb876f45
LT
1945
1946 /*
1947 * Set the "writeback" flag, and clear "dirty" in the radix tree.
1948 *
1949 * A writepage() implementation always needs to do either this,
1950 * or re-dirty the page with "redirty_page_for_writepage()" in
1951 * the case of a failure.
1952 *
1953 * Just unlocking the page will cause the radix tree tag-bits
1954 * to fail to update with the state of the page correctly.
1955 */
fb8c4b14 1956 set_page_writeback(page);
9ad1506b 1957retry_write:
1da177e4 1958 rc = cifs_partialpagewrite(page, 0, PAGE_CACHE_SIZE);
9ad1506b
PS
1959 if (rc == -EAGAIN && wbc->sync_mode == WB_SYNC_ALL)
1960 goto retry_write;
1961 else if (rc == -EAGAIN)
1962 redirty_page_for_writepage(wbc, page);
1963 else if (rc != 0)
1964 SetPageError(page);
1965 else
1966 SetPageUptodate(page);
cb876f45
LT
1967 end_page_writeback(page);
1968 page_cache_release(page);
1da177e4
LT
1969 FreeXid(xid);
1970 return rc;
1971}
1972
9ad1506b
PS
1973static int cifs_writepage(struct page *page, struct writeback_control *wbc)
1974{
1975 int rc = cifs_writepage_locked(page, wbc);
1976 unlock_page(page);
1977 return rc;
1978}
1979
d9414774
NP
1980static int cifs_write_end(struct file *file, struct address_space *mapping,
1981 loff_t pos, unsigned len, unsigned copied,
1982 struct page *page, void *fsdata)
1da177e4 1983{
d9414774
NP
1984 int rc;
1985 struct inode *inode = mapping->host;
d4ffff1f
PS
1986 struct cifsFileInfo *cfile = file->private_data;
1987 struct cifs_sb_info *cifs_sb = CIFS_SB(cfile->dentry->d_sb);
1988 __u32 pid;
1989
1990 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
1991 pid = cfile->pid;
1992 else
1993 pid = current->tgid;
1da177e4 1994
b6b38f70
JP
1995 cFYI(1, "write_end for page %p from pos %lld with %d bytes",
1996 page, pos, copied);
d9414774 1997
a98ee8c1
JL
1998 if (PageChecked(page)) {
1999 if (copied == len)
2000 SetPageUptodate(page);
2001 ClearPageChecked(page);
2002 } else if (!PageUptodate(page) && copied == PAGE_CACHE_SIZE)
d9414774 2003 SetPageUptodate(page);
ad7a2926 2004
1da177e4 2005 if (!PageUptodate(page)) {
d9414774
NP
2006 char *page_data;
2007 unsigned offset = pos & (PAGE_CACHE_SIZE - 1);
2008 int xid;
2009
2010 xid = GetXid();
1da177e4
LT
2011 /* this is probably better than directly calling
2012 partialpage_write since in this function the file handle is
2013 known which we might as well leverage */
2014 /* BB check if anything else missing out of ppw
2015 such as updating last write time */
2016 page_data = kmap(page);
d4ffff1f 2017 rc = cifs_write(cfile, pid, page_data + offset, copied, &pos);
d9414774 2018 /* if (rc < 0) should we set writebehind rc? */
1da177e4 2019 kunmap(page);
d9414774
NP
2020
2021 FreeXid(xid);
fb8c4b14 2022 } else {
d9414774
NP
2023 rc = copied;
2024 pos += copied;
1da177e4
LT
2025 set_page_dirty(page);
2026 }
2027
d9414774
NP
2028 if (rc > 0) {
2029 spin_lock(&inode->i_lock);
2030 if (pos > inode->i_size)
2031 i_size_write(inode, pos);
2032 spin_unlock(&inode->i_lock);
2033 }
2034
2035 unlock_page(page);
2036 page_cache_release(page);
2037
1da177e4
LT
2038 return rc;
2039}
2040
02c24a82
JB
2041int cifs_strict_fsync(struct file *file, loff_t start, loff_t end,
2042 int datasync)
1da177e4
LT
2043{
2044 int xid;
2045 int rc = 0;
96daf2b0 2046 struct cifs_tcon *tcon;
c21dfb69 2047 struct cifsFileInfo *smbfile = file->private_data;
e6a00296 2048 struct inode *inode = file->f_path.dentry->d_inode;
8be7e6ba 2049 struct cifs_sb_info *cifs_sb = CIFS_SB(inode->i_sb);
1da177e4 2050
02c24a82
JB
2051 rc = filemap_write_and_wait_range(inode->i_mapping, start, end);
2052 if (rc)
2053 return rc;
2054 mutex_lock(&inode->i_mutex);
2055
1da177e4
LT
2056 xid = GetXid();
2057
b6b38f70 2058 cFYI(1, "Sync file - name: %s datasync: 0x%x",
7ea80859 2059 file->f_path.dentry->d_name.name, datasync);
50c2f753 2060
6feb9891
PS
2061 if (!CIFS_I(inode)->clientCanCacheRead) {
2062 rc = cifs_invalidate_mapping(inode);
2063 if (rc) {
2064 cFYI(1, "rc: %d during invalidate phase", rc);
2065 rc = 0; /* don't care about it in fsync */
2066 }
2067 }
eb4b756b 2068
8be7e6ba
PS
2069 tcon = tlink_tcon(smbfile->tlink);
2070 if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOSSYNC))
2071 rc = CIFSSMBFlush(xid, tcon, smbfile->netfid);
2072
2073 FreeXid(xid);
02c24a82 2074 mutex_unlock(&inode->i_mutex);
8be7e6ba
PS
2075 return rc;
2076}
2077
02c24a82 2078int cifs_fsync(struct file *file, loff_t start, loff_t end, int datasync)
8be7e6ba
PS
2079{
2080 int xid;
2081 int rc = 0;
96daf2b0 2082 struct cifs_tcon *tcon;
8be7e6ba
PS
2083 struct cifsFileInfo *smbfile = file->private_data;
2084 struct cifs_sb_info *cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
02c24a82
JB
2085 struct inode *inode = file->f_mapping->host;
2086
2087 rc = filemap_write_and_wait_range(inode->i_mapping, start, end);
2088 if (rc)
2089 return rc;
2090 mutex_lock(&inode->i_mutex);
8be7e6ba
PS
2091
2092 xid = GetXid();
2093
2094 cFYI(1, "Sync file - name: %s datasync: 0x%x",
2095 file->f_path.dentry->d_name.name, datasync);
2096
2097 tcon = tlink_tcon(smbfile->tlink);
2098 if (!(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOSSYNC))
2099 rc = CIFSSMBFlush(xid, tcon, smbfile->netfid);
b298f223 2100
1da177e4 2101 FreeXid(xid);
02c24a82 2102 mutex_unlock(&inode->i_mutex);
1da177e4
LT
2103 return rc;
2104}
2105
1da177e4
LT
2106/*
2107 * As file closes, flush all cached write data for this inode checking
2108 * for write behind errors.
2109 */
75e1fcc0 2110int cifs_flush(struct file *file, fl_owner_t id)
1da177e4 2111{
fb8c4b14 2112 struct inode *inode = file->f_path.dentry->d_inode;
1da177e4
LT
2113 int rc = 0;
2114
eb4b756b 2115 if (file->f_mode & FMODE_WRITE)
d3f1322a 2116 rc = filemap_write_and_wait(inode->i_mapping);
50c2f753 2117
b6b38f70 2118 cFYI(1, "Flush inode %p file %p rc %d", inode, file, rc);
1da177e4
LT
2119
2120 return rc;
2121}
2122
72432ffc
PS
2123static int
2124cifs_write_allocate_pages(struct page **pages, unsigned long num_pages)
2125{
2126 int rc = 0;
2127 unsigned long i;
2128
2129 for (i = 0; i < num_pages; i++) {
e94f7ba1 2130 pages[i] = alloc_page(GFP_KERNEL|__GFP_HIGHMEM);
72432ffc
PS
2131 if (!pages[i]) {
2132 /*
2133 * save number of pages we have already allocated and
2134 * return with ENOMEM error
2135 */
2136 num_pages = i;
2137 rc = -ENOMEM;
e94f7ba1 2138 break;
72432ffc
PS
2139 }
2140 }
2141
e94f7ba1
JL
2142 if (rc) {
2143 for (i = 0; i < num_pages; i++)
2144 put_page(pages[i]);
2145 }
72432ffc
PS
2146 return rc;
2147}
2148
2149static inline
2150size_t get_numpages(const size_t wsize, const size_t len, size_t *cur_len)
2151{
2152 size_t num_pages;
2153 size_t clen;
2154
2155 clen = min_t(const size_t, len, wsize);
a7103b99 2156 num_pages = DIV_ROUND_UP(clen, PAGE_SIZE);
72432ffc
PS
2157
2158 if (cur_len)
2159 *cur_len = clen;
2160
2161 return num_pages;
2162}
2163
da82f7e7
JL
2164static void
2165cifs_uncached_marshal_iov(struct kvec *iov, struct cifs_writedata *wdata)
2166{
2167 int i;
2168 size_t bytes = wdata->bytes;
2169
2170 /* marshal up the pages into iov array */
2171 for (i = 0; i < wdata->nr_pages; i++) {
c7ad42b5 2172 iov[i + 1].iov_len = min_t(size_t, bytes, PAGE_SIZE);
da82f7e7
JL
2173 iov[i + 1].iov_base = kmap(wdata->pages[i]);
2174 bytes -= iov[i + 1].iov_len;
2175 }
2176}
2177
2178static void
2179cifs_uncached_writev_complete(struct work_struct *work)
2180{
2181 int i;
2182 struct cifs_writedata *wdata = container_of(work,
2183 struct cifs_writedata, work);
2184 struct inode *inode = wdata->cfile->dentry->d_inode;
2185 struct cifsInodeInfo *cifsi = CIFS_I(inode);
2186
2187 spin_lock(&inode->i_lock);
2188 cifs_update_eof(cifsi, wdata->offset, wdata->bytes);
2189 if (cifsi->server_eof > inode->i_size)
2190 i_size_write(inode, cifsi->server_eof);
2191 spin_unlock(&inode->i_lock);
2192
2193 complete(&wdata->done);
2194
2195 if (wdata->result != -EAGAIN) {
2196 for (i = 0; i < wdata->nr_pages; i++)
2197 put_page(wdata->pages[i]);
2198 }
2199
2200 kref_put(&wdata->refcount, cifs_writedata_release);
2201}
2202
2203/* attempt to send write to server, retry on any -EAGAIN errors */
2204static int
2205cifs_uncached_retry_writev(struct cifs_writedata *wdata)
2206{
2207 int rc;
2208
2209 do {
2210 if (wdata->cfile->invalidHandle) {
2211 rc = cifs_reopen_file(wdata->cfile, false);
2212 if (rc != 0)
2213 continue;
2214 }
2215 rc = cifs_async_writev(wdata);
2216 } while (rc == -EAGAIN);
2217
2218 return rc;
2219}
2220
72432ffc
PS
2221static ssize_t
2222cifs_iovec_write(struct file *file, const struct iovec *iov,
2223 unsigned long nr_segs, loff_t *poffset)
2224{
da82f7e7 2225 unsigned long nr_pages, i;
76429c14
PS
2226 size_t copied, len, cur_len;
2227 ssize_t total_written = 0;
3af9d8f2 2228 loff_t offset;
72432ffc 2229 struct iov_iter it;
72432ffc 2230 struct cifsFileInfo *open_file;
da82f7e7 2231 struct cifs_tcon *tcon;
72432ffc 2232 struct cifs_sb_info *cifs_sb;
da82f7e7
JL
2233 struct cifs_writedata *wdata, *tmp;
2234 struct list_head wdata_list;
2235 int rc;
2236 pid_t pid;
72432ffc
PS
2237
2238 len = iov_length(iov, nr_segs);
2239 if (!len)
2240 return 0;
2241
2242 rc = generic_write_checks(file, poffset, &len, 0);
2243 if (rc)
2244 return rc;
2245
da82f7e7 2246 INIT_LIST_HEAD(&wdata_list);
72432ffc 2247 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
72432ffc 2248 open_file = file->private_data;
da82f7e7 2249 tcon = tlink_tcon(open_file->tlink);
3af9d8f2 2250 offset = *poffset;
d4ffff1f
PS
2251
2252 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
2253 pid = open_file->pid;
2254 else
2255 pid = current->tgid;
2256
72432ffc 2257 iov_iter_init(&it, iov, nr_segs, len, 0);
72432ffc 2258 do {
da82f7e7
JL
2259 size_t save_len;
2260
2261 nr_pages = get_numpages(cifs_sb->wsize, len, &cur_len);
2262 wdata = cifs_writedata_alloc(nr_pages,
2263 cifs_uncached_writev_complete);
2264 if (!wdata) {
2265 rc = -ENOMEM;
2266 break;
2267 }
2268
2269 rc = cifs_write_allocate_pages(wdata->pages, nr_pages);
2270 if (rc) {
2271 kfree(wdata);
2272 break;
2273 }
2274
2275 save_len = cur_len;
2276 for (i = 0; i < nr_pages; i++) {
2277 copied = min_t(const size_t, cur_len, PAGE_SIZE);
2278 copied = iov_iter_copy_from_user(wdata->pages[i], &it,
2279 0, copied);
72432ffc
PS
2280 cur_len -= copied;
2281 iov_iter_advance(&it, copied);
72432ffc 2282 }
72432ffc
PS
2283 cur_len = save_len - cur_len;
2284
da82f7e7
JL
2285 wdata->sync_mode = WB_SYNC_ALL;
2286 wdata->nr_pages = nr_pages;
2287 wdata->offset = (__u64)offset;
2288 wdata->cfile = cifsFileInfo_get(open_file);
2289 wdata->pid = pid;
2290 wdata->bytes = cur_len;
2291 wdata->marshal_iov = cifs_uncached_marshal_iov;
2292 rc = cifs_uncached_retry_writev(wdata);
2293 if (rc) {
2294 kref_put(&wdata->refcount, cifs_writedata_release);
72432ffc
PS
2295 break;
2296 }
2297
da82f7e7
JL
2298 list_add_tail(&wdata->list, &wdata_list);
2299 offset += cur_len;
2300 len -= cur_len;
72432ffc
PS
2301 } while (len > 0);
2302
da82f7e7
JL
2303 /*
2304 * If at least one write was successfully sent, then discard any rc
2305 * value from the later writes. If the other write succeeds, then
2306 * we'll end up returning whatever was written. If it fails, then
2307 * we'll get a new rc value from that.
2308 */
2309 if (!list_empty(&wdata_list))
2310 rc = 0;
2311
2312 /*
2313 * Wait for and collect replies for any successful sends in order of
2314 * increasing offset. Once an error is hit or we get a fatal signal
2315 * while waiting, then return without waiting for any more replies.
2316 */
2317restart_loop:
2318 list_for_each_entry_safe(wdata, tmp, &wdata_list, list) {
2319 if (!rc) {
2320 /* FIXME: freezable too? */
2321 rc = wait_for_completion_killable(&wdata->done);
2322 if (rc)
2323 rc = -EINTR;
2324 else if (wdata->result)
2325 rc = wdata->result;
2326 else
2327 total_written += wdata->bytes;
2328
2329 /* resend call if it's a retryable error */
2330 if (rc == -EAGAIN) {
2331 rc = cifs_uncached_retry_writev(wdata);
2332 goto restart_loop;
2333 }
2334 }
2335 list_del_init(&wdata->list);
2336 kref_put(&wdata->refcount, cifs_writedata_release);
72432ffc
PS
2337 }
2338
da82f7e7
JL
2339 if (total_written > 0)
2340 *poffset += total_written;
72432ffc 2341
da82f7e7
JL
2342 cifs_stats_bytes_written(tcon, total_written);
2343 return total_written ? total_written : (ssize_t)rc;
72432ffc
PS
2344}
2345
0b81c1c4 2346ssize_t cifs_user_writev(struct kiocb *iocb, const struct iovec *iov,
72432ffc
PS
2347 unsigned long nr_segs, loff_t pos)
2348{
2349 ssize_t written;
2350 struct inode *inode;
2351
2352 inode = iocb->ki_filp->f_path.dentry->d_inode;
2353
2354 /*
2355 * BB - optimize the way when signing is disabled. We can drop this
2356 * extra memory-to-memory copying and use iovec buffers for constructing
2357 * write request.
2358 */
2359
2360 written = cifs_iovec_write(iocb->ki_filp, iov, nr_segs, &pos);
2361 if (written > 0) {
2362 CIFS_I(inode)->invalid_mapping = true;
2363 iocb->ki_pos = pos;
2364 }
2365
2366 return written;
2367}
2368
2369ssize_t cifs_strict_writev(struct kiocb *iocb, const struct iovec *iov,
2370 unsigned long nr_segs, loff_t pos)
2371{
2372 struct inode *inode;
2373
2374 inode = iocb->ki_filp->f_path.dentry->d_inode;
2375
2376 if (CIFS_I(inode)->clientCanCacheAll)
2377 return generic_file_aio_write(iocb, iov, nr_segs, pos);
2378
2379 /*
2380 * In strict cache mode we need to write the data to the server exactly
2381 * from the pos to pos+len-1 rather than flush all affected pages
2382 * because it may cause a error with mandatory locks on these pages but
2383 * not on the region from pos to ppos+len-1.
2384 */
2385
2386 return cifs_user_writev(iocb, iov, nr_segs, pos);
2387}
2388
0471ca3f
JL
2389static struct cifs_readdata *
2390cifs_readdata_alloc(unsigned int nr_vecs, work_func_t complete)
2391{
2392 struct cifs_readdata *rdata;
2393
2394 rdata = kzalloc(sizeof(*rdata) +
2395 sizeof(struct kvec) * nr_vecs, GFP_KERNEL);
2396 if (rdata != NULL) {
6993f74a 2397 kref_init(&rdata->refcount);
1c892549
JL
2398 INIT_LIST_HEAD(&rdata->list);
2399 init_completion(&rdata->done);
0471ca3f
JL
2400 INIT_WORK(&rdata->work, complete);
2401 INIT_LIST_HEAD(&rdata->pages);
2402 }
2403 return rdata;
2404}
2405
6993f74a
JL
2406void
2407cifs_readdata_release(struct kref *refcount)
0471ca3f 2408{
6993f74a
JL
2409 struct cifs_readdata *rdata = container_of(refcount,
2410 struct cifs_readdata, refcount);
2411
2412 if (rdata->cfile)
2413 cifsFileInfo_put(rdata->cfile);
2414
0471ca3f
JL
2415 kfree(rdata);
2416}
2417
1c892549
JL
2418static int
2419cifs_read_allocate_pages(struct list_head *list, unsigned int npages)
2420{
2421 int rc = 0;
2422 struct page *page, *tpage;
2423 unsigned int i;
2424
2425 for (i = 0; i < npages; i++) {
2426 page = alloc_page(GFP_KERNEL|__GFP_HIGHMEM);
2427 if (!page) {
2428 rc = -ENOMEM;
2429 break;
2430 }
2431 list_add(&page->lru, list);
2432 }
2433
2434 if (rc) {
2435 list_for_each_entry_safe(page, tpage, list, lru) {
2436 list_del(&page->lru);
2437 put_page(page);
2438 }
2439 }
2440 return rc;
2441}
2442
2443static void
2444cifs_uncached_readdata_release(struct kref *refcount)
2445{
2446 struct page *page, *tpage;
2447 struct cifs_readdata *rdata = container_of(refcount,
2448 struct cifs_readdata, refcount);
2449
2450 list_for_each_entry_safe(page, tpage, &rdata->pages, lru) {
2451 list_del(&page->lru);
2452 put_page(page);
2453 }
2454 cifs_readdata_release(refcount);
2455}
2456
2a1bb138
JL
2457static int
2458cifs_retry_async_readv(struct cifs_readdata *rdata)
2459{
2460 int rc;
2461
2462 do {
2463 if (rdata->cfile->invalidHandle) {
2464 rc = cifs_reopen_file(rdata->cfile, true);
2465 if (rc != 0)
2466 continue;
2467 }
2468 rc = cifs_async_readv(rdata);
2469 } while (rc == -EAGAIN);
2470
2471 return rc;
2472}
2473
1c892549
JL
2474/**
2475 * cifs_readdata_to_iov - copy data from pages in response to an iovec
2476 * @rdata: the readdata response with list of pages holding data
2477 * @iov: vector in which we should copy the data
2478 * @nr_segs: number of segments in vector
2479 * @offset: offset into file of the first iovec
2480 * @copied: used to return the amount of data copied to the iov
2481 *
2482 * This function copies data from a list of pages in a readdata response into
2483 * an array of iovecs. It will first calculate where the data should go
2484 * based on the info in the readdata and then copy the data into that spot.
2485 */
2486static ssize_t
2487cifs_readdata_to_iov(struct cifs_readdata *rdata, const struct iovec *iov,
2488 unsigned long nr_segs, loff_t offset, ssize_t *copied)
2489{
2490 int rc = 0;
2491 struct iov_iter ii;
2492 size_t pos = rdata->offset - offset;
2493 struct page *page, *tpage;
2494 ssize_t remaining = rdata->bytes;
2495 unsigned char *pdata;
2496
2497 /* set up iov_iter and advance to the correct offset */
2498 iov_iter_init(&ii, iov, nr_segs, iov_length(iov, nr_segs), 0);
2499 iov_iter_advance(&ii, pos);
2500
2501 *copied = 0;
2502 list_for_each_entry_safe(page, tpage, &rdata->pages, lru) {
2503 ssize_t copy;
2504
2505 /* copy a whole page or whatever's left */
2506 copy = min_t(ssize_t, remaining, PAGE_SIZE);
2507
2508 /* ...but limit it to whatever space is left in the iov */
2509 copy = min_t(ssize_t, copy, iov_iter_count(&ii));
2510
2511 /* go while there's data to be copied and no errors */
2512 if (copy && !rc) {
2513 pdata = kmap(page);
2514 rc = memcpy_toiovecend(ii.iov, pdata, ii.iov_offset,
2515 (int)copy);
2516 kunmap(page);
2517 if (!rc) {
2518 *copied += copy;
2519 remaining -= copy;
2520 iov_iter_advance(&ii, copy);
2521 }
2522 }
2523
2524 list_del(&page->lru);
2525 put_page(page);
2526 }
2527
2528 return rc;
2529}
2530
2531static void
2532cifs_uncached_readv_complete(struct work_struct *work)
2533{
2534 struct cifs_readdata *rdata = container_of(work,
2535 struct cifs_readdata, work);
2536
2537 /* if the result is non-zero then the pages weren't kmapped */
2538 if (rdata->result == 0) {
2539 struct page *page;
2540
2541 list_for_each_entry(page, &rdata->pages, lru)
2542 kunmap(page);
2543 }
2544
2545 complete(&rdata->done);
2546 kref_put(&rdata->refcount, cifs_uncached_readdata_release);
2547}
2548
2549static int
2550cifs_uncached_read_marshal_iov(struct cifs_readdata *rdata,
2551 unsigned int remaining)
2552{
2553 int len = 0;
2554 struct page *page, *tpage;
2555
2556 rdata->nr_iov = 1;
2557 list_for_each_entry_safe(page, tpage, &rdata->pages, lru) {
2558 if (remaining >= PAGE_SIZE) {
2559 /* enough data to fill the page */
2560 rdata->iov[rdata->nr_iov].iov_base = kmap(page);
2561 rdata->iov[rdata->nr_iov].iov_len = PAGE_SIZE;
2562 cFYI(1, "%u: idx=%lu iov_base=%p iov_len=%zu",
2563 rdata->nr_iov, page->index,
2564 rdata->iov[rdata->nr_iov].iov_base,
2565 rdata->iov[rdata->nr_iov].iov_len);
2566 ++rdata->nr_iov;
2567 len += PAGE_SIZE;
2568 remaining -= PAGE_SIZE;
2569 } else if (remaining > 0) {
2570 /* enough for partial page, fill and zero the rest */
2571 rdata->iov[rdata->nr_iov].iov_base = kmap(page);
2572 rdata->iov[rdata->nr_iov].iov_len = remaining;
2573 cFYI(1, "%u: idx=%lu iov_base=%p iov_len=%zu",
2574 rdata->nr_iov, page->index,
2575 rdata->iov[rdata->nr_iov].iov_base,
2576 rdata->iov[rdata->nr_iov].iov_len);
2577 memset(rdata->iov[rdata->nr_iov].iov_base + remaining,
2578 '\0', PAGE_SIZE - remaining);
2579 ++rdata->nr_iov;
2580 len += remaining;
2581 remaining = 0;
2582 } else {
2583 /* no need to hold page hostage */
2584 list_del(&page->lru);
2585 put_page(page);
2586 }
2587 }
2588
2589 return len;
2590}
2591
a70307ee
PS
2592static ssize_t
2593cifs_iovec_read(struct file *file, const struct iovec *iov,
2594 unsigned long nr_segs, loff_t *poffset)
1da177e4 2595{
1c892549 2596 ssize_t rc;
a70307ee 2597 size_t len, cur_len;
1c892549
JL
2598 ssize_t total_read = 0;
2599 loff_t offset = *poffset;
2600 unsigned int npages;
1da177e4 2601 struct cifs_sb_info *cifs_sb;
1c892549 2602 struct cifs_tcon *tcon;
1da177e4 2603 struct cifsFileInfo *open_file;
1c892549
JL
2604 struct cifs_readdata *rdata, *tmp;
2605 struct list_head rdata_list;
2606 pid_t pid;
a70307ee
PS
2607
2608 if (!nr_segs)
2609 return 0;
2610
2611 len = iov_length(iov, nr_segs);
2612 if (!len)
2613 return 0;
1da177e4 2614
1c892549 2615 INIT_LIST_HEAD(&rdata_list);
e6a00296 2616 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
c21dfb69 2617 open_file = file->private_data;
1c892549 2618 tcon = tlink_tcon(open_file->tlink);
1da177e4 2619
d4ffff1f
PS
2620 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
2621 pid = open_file->pid;
2622 else
2623 pid = current->tgid;
2624
ad7a2926 2625 if ((file->f_flags & O_ACCMODE) == O_WRONLY)
b6b38f70 2626 cFYI(1, "attempting read on write only file instance");
ad7a2926 2627
1c892549
JL
2628 do {
2629 cur_len = min_t(const size_t, len - total_read, cifs_sb->rsize);
2630 npages = DIV_ROUND_UP(cur_len, PAGE_SIZE);
a70307ee 2631
1c892549
JL
2632 /* allocate a readdata struct */
2633 rdata = cifs_readdata_alloc(npages,
2634 cifs_uncached_readv_complete);
2635 if (!rdata) {
2636 rc = -ENOMEM;
2637 goto error;
1da177e4 2638 }
a70307ee 2639
1c892549
JL
2640 rc = cifs_read_allocate_pages(&rdata->pages, npages);
2641 if (rc)
2642 goto error;
2643
2644 rdata->cfile = cifsFileInfo_get(open_file);
2645 rdata->offset = offset;
2646 rdata->bytes = cur_len;
2647 rdata->pid = pid;
2648 rdata->marshal_iov = cifs_uncached_read_marshal_iov;
2649
2650 rc = cifs_retry_async_readv(rdata);
2651error:
2652 if (rc) {
2653 kref_put(&rdata->refcount,
2654 cifs_uncached_readdata_release);
2655 break;
2656 }
2657
2658 list_add_tail(&rdata->list, &rdata_list);
2659 offset += cur_len;
2660 len -= cur_len;
2661 } while (len > 0);
2662
2663 /* if at least one read request send succeeded, then reset rc */
2664 if (!list_empty(&rdata_list))
2665 rc = 0;
2666
2667 /* the loop below should proceed in the order of increasing offsets */
2668restart_loop:
2669 list_for_each_entry_safe(rdata, tmp, &rdata_list, list) {
2670 if (!rc) {
2671 ssize_t copied;
2672
2673 /* FIXME: freezable sleep too? */
2674 rc = wait_for_completion_killable(&rdata->done);
2675 if (rc)
2676 rc = -EINTR;
2677 else if (rdata->result)
2678 rc = rdata->result;
2679 else {
2680 rc = cifs_readdata_to_iov(rdata, iov,
2681 nr_segs, *poffset,
2682 &copied);
2683 total_read += copied;
2684 }
2685
2686 /* resend call if it's a retryable error */
2687 if (rc == -EAGAIN) {
2688 rc = cifs_retry_async_readv(rdata);
2689 goto restart_loop;
1da177e4 2690 }
1da177e4 2691 }
1c892549
JL
2692 list_del_init(&rdata->list);
2693 kref_put(&rdata->refcount, cifs_uncached_readdata_release);
1da177e4 2694 }
a70307ee 2695
1c892549
JL
2696 cifs_stats_bytes_read(tcon, total_read);
2697 *poffset += total_read;
2698
2699 return total_read ? total_read : rc;
1da177e4
LT
2700}
2701
0b81c1c4 2702ssize_t cifs_user_readv(struct kiocb *iocb, const struct iovec *iov,
a70307ee
PS
2703 unsigned long nr_segs, loff_t pos)
2704{
2705 ssize_t read;
2706
2707 read = cifs_iovec_read(iocb->ki_filp, iov, nr_segs, &pos);
2708 if (read > 0)
2709 iocb->ki_pos = pos;
2710
2711 return read;
2712}
2713
2714ssize_t cifs_strict_readv(struct kiocb *iocb, const struct iovec *iov,
2715 unsigned long nr_segs, loff_t pos)
2716{
2717 struct inode *inode;
2718
2719 inode = iocb->ki_filp->f_path.dentry->d_inode;
2720
2721 if (CIFS_I(inode)->clientCanCacheRead)
2722 return generic_file_aio_read(iocb, iov, nr_segs, pos);
2723
2724 /*
2725 * In strict cache mode we need to read from the server all the time
2726 * if we don't have level II oplock because the server can delay mtime
2727 * change - so we can't make a decision about inode invalidating.
2728 * And we can also fail with pagereading if there are mandatory locks
2729 * on pages affected by this read but not on the region from pos to
2730 * pos+len-1.
2731 */
2732
2733 return cifs_user_readv(iocb, iov, nr_segs, pos);
2734}
1da177e4
LT
2735
2736static ssize_t cifs_read(struct file *file, char *read_data, size_t read_size,
a70307ee 2737 loff_t *poffset)
1da177e4
LT
2738{
2739 int rc = -EACCES;
2740 unsigned int bytes_read = 0;
2741 unsigned int total_read;
2742 unsigned int current_read_size;
5eba8ab3 2743 unsigned int rsize;
1da177e4 2744 struct cifs_sb_info *cifs_sb;
96daf2b0 2745 struct cifs_tcon *pTcon;
1da177e4
LT
2746 int xid;
2747 char *current_offset;
2748 struct cifsFileInfo *open_file;
d4ffff1f 2749 struct cifs_io_parms io_parms;
ec637e3f 2750 int buf_type = CIFS_NO_BUFFER;
d4ffff1f 2751 __u32 pid;
1da177e4
LT
2752
2753 xid = GetXid();
e6a00296 2754 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
1da177e4 2755
5eba8ab3
JL
2756 /* FIXME: set up handlers for larger reads and/or convert to async */
2757 rsize = min_t(unsigned int, cifs_sb->rsize, CIFSMaxBufSize);
2758
1da177e4 2759 if (file->private_data == NULL) {
0f3bc09e 2760 rc = -EBADF;
1da177e4 2761 FreeXid(xid);
0f3bc09e 2762 return rc;
1da177e4 2763 }
c21dfb69 2764 open_file = file->private_data;
13cfb733 2765 pTcon = tlink_tcon(open_file->tlink);
1da177e4 2766
d4ffff1f
PS
2767 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
2768 pid = open_file->pid;
2769 else
2770 pid = current->tgid;
2771
1da177e4 2772 if ((file->f_flags & O_ACCMODE) == O_WRONLY)
b6b38f70 2773 cFYI(1, "attempting read on write only file instance");
1da177e4 2774
fb8c4b14 2775 for (total_read = 0, current_offset = read_data;
1da177e4
LT
2776 read_size > total_read;
2777 total_read += bytes_read, current_offset += bytes_read) {
5eba8ab3
JL
2778 current_read_size = min_t(uint, read_size - total_read, rsize);
2779
f9f5c817
SF
2780 /* For windows me and 9x we do not want to request more
2781 than it negotiated since it will refuse the read then */
fb8c4b14 2782 if ((pTcon->ses) &&
f9f5c817 2783 !(pTcon->ses->capabilities & CAP_LARGE_FILES)) {
7748dd6e 2784 current_read_size = min_t(uint, current_read_size,
c974befa 2785 CIFSMaxBufSize);
f9f5c817 2786 }
1da177e4
LT
2787 rc = -EAGAIN;
2788 while (rc == -EAGAIN) {
cdff08e7 2789 if (open_file->invalidHandle) {
15886177 2790 rc = cifs_reopen_file(open_file, true);
1da177e4
LT
2791 if (rc != 0)
2792 break;
2793 }
d4ffff1f
PS
2794 io_parms.netfid = open_file->netfid;
2795 io_parms.pid = pid;
2796 io_parms.tcon = pTcon;
2797 io_parms.offset = *poffset;
2798 io_parms.length = current_read_size;
2799 rc = CIFSSMBRead(xid, &io_parms, &bytes_read,
2800 &current_offset, &buf_type);
1da177e4
LT
2801 }
2802 if (rc || (bytes_read == 0)) {
2803 if (total_read) {
2804 break;
2805 } else {
2806 FreeXid(xid);
2807 return rc;
2808 }
2809 } else {
a4544347 2810 cifs_stats_bytes_read(pTcon, total_read);
1da177e4
LT
2811 *poffset += bytes_read;
2812 }
2813 }
2814 FreeXid(xid);
2815 return total_read;
2816}
2817
ca83ce3d
JL
2818/*
2819 * If the page is mmap'ed into a process' page tables, then we need to make
2820 * sure that it doesn't change while being written back.
2821 */
2822static int
2823cifs_page_mkwrite(struct vm_area_struct *vma, struct vm_fault *vmf)
2824{
2825 struct page *page = vmf->page;
2826
2827 lock_page(page);
2828 return VM_FAULT_LOCKED;
2829}
2830
2831static struct vm_operations_struct cifs_file_vm_ops = {
2832 .fault = filemap_fault,
2833 .page_mkwrite = cifs_page_mkwrite,
2834};
2835
7a6a19b1
PS
2836int cifs_file_strict_mmap(struct file *file, struct vm_area_struct *vma)
2837{
2838 int rc, xid;
2839 struct inode *inode = file->f_path.dentry->d_inode;
2840
2841 xid = GetXid();
2842
6feb9891
PS
2843 if (!CIFS_I(inode)->clientCanCacheRead) {
2844 rc = cifs_invalidate_mapping(inode);
2845 if (rc)
2846 return rc;
2847 }
7a6a19b1
PS
2848
2849 rc = generic_file_mmap(file, vma);
ca83ce3d
JL
2850 if (rc == 0)
2851 vma->vm_ops = &cifs_file_vm_ops;
7a6a19b1
PS
2852 FreeXid(xid);
2853 return rc;
2854}
2855
1da177e4
LT
2856int cifs_file_mmap(struct file *file, struct vm_area_struct *vma)
2857{
1da177e4
LT
2858 int rc, xid;
2859
2860 xid = GetXid();
abab095d 2861 rc = cifs_revalidate_file(file);
1da177e4 2862 if (rc) {
b6b38f70 2863 cFYI(1, "Validation prior to mmap failed, error=%d", rc);
1da177e4
LT
2864 FreeXid(xid);
2865 return rc;
2866 }
2867 rc = generic_file_mmap(file, vma);
ca83ce3d
JL
2868 if (rc == 0)
2869 vma->vm_ops = &cifs_file_vm_ops;
1da177e4
LT
2870 FreeXid(xid);
2871 return rc;
2872}
2873
0471ca3f
JL
2874static void
2875cifs_readv_complete(struct work_struct *work)
2876{
2877 struct cifs_readdata *rdata = container_of(work,
2878 struct cifs_readdata, work);
2879 struct page *page, *tpage;
2880
2881 list_for_each_entry_safe(page, tpage, &rdata->pages, lru) {
2882 list_del(&page->lru);
2883 lru_cache_add_file(page);
2884
2885 if (rdata->result == 0) {
2886 kunmap(page);
2887 flush_dcache_page(page);
2888 SetPageUptodate(page);
2889 }
2890
2891 unlock_page(page);
2892
2893 if (rdata->result == 0)
2894 cifs_readpage_to_fscache(rdata->mapping->host, page);
2895
2896 page_cache_release(page);
2897 }
6993f74a 2898 kref_put(&rdata->refcount, cifs_readdata_release);
0471ca3f
JL
2899}
2900
8d5ce4d2
JL
2901static int
2902cifs_readpages_marshal_iov(struct cifs_readdata *rdata, unsigned int remaining)
2903{
2904 int len = 0;
2905 struct page *page, *tpage;
2906 u64 eof;
2907 pgoff_t eof_index;
2908
2909 /* determine the eof that the server (probably) has */
2910 eof = CIFS_I(rdata->mapping->host)->server_eof;
2911 eof_index = eof ? (eof - 1) >> PAGE_CACHE_SHIFT : 0;
2912 cFYI(1, "eof=%llu eof_index=%lu", eof, eof_index);
2913
2914 rdata->nr_iov = 1;
2915 list_for_each_entry_safe(page, tpage, &rdata->pages, lru) {
2916 if (remaining >= PAGE_CACHE_SIZE) {
2917 /* enough data to fill the page */
2918 rdata->iov[rdata->nr_iov].iov_base = kmap(page);
2919 rdata->iov[rdata->nr_iov].iov_len = PAGE_CACHE_SIZE;
2920 cFYI(1, "%u: idx=%lu iov_base=%p iov_len=%zu",
2921 rdata->nr_iov, page->index,
2922 rdata->iov[rdata->nr_iov].iov_base,
2923 rdata->iov[rdata->nr_iov].iov_len);
2924 ++rdata->nr_iov;
2925 len += PAGE_CACHE_SIZE;
2926 remaining -= PAGE_CACHE_SIZE;
2927 } else if (remaining > 0) {
2928 /* enough for partial page, fill and zero the rest */
2929 rdata->iov[rdata->nr_iov].iov_base = kmap(page);
2930 rdata->iov[rdata->nr_iov].iov_len = remaining;
2931 cFYI(1, "%u: idx=%lu iov_base=%p iov_len=%zu",
2932 rdata->nr_iov, page->index,
2933 rdata->iov[rdata->nr_iov].iov_base,
2934 rdata->iov[rdata->nr_iov].iov_len);
2935 memset(rdata->iov[rdata->nr_iov].iov_base + remaining,
2936 '\0', PAGE_CACHE_SIZE - remaining);
2937 ++rdata->nr_iov;
2938 len += remaining;
2939 remaining = 0;
2940 } else if (page->index > eof_index) {
2941 /*
2942 * The VFS will not try to do readahead past the
2943 * i_size, but it's possible that we have outstanding
2944 * writes with gaps in the middle and the i_size hasn't
2945 * caught up yet. Populate those with zeroed out pages
2946 * to prevent the VFS from repeatedly attempting to
2947 * fill them until the writes are flushed.
2948 */
2949 zero_user(page, 0, PAGE_CACHE_SIZE);
2950 list_del(&page->lru);
2951 lru_cache_add_file(page);
2952 flush_dcache_page(page);
2953 SetPageUptodate(page);
2954 unlock_page(page);
2955 page_cache_release(page);
2956 } else {
2957 /* no need to hold page hostage */
2958 list_del(&page->lru);
2959 lru_cache_add_file(page);
2960 unlock_page(page);
2961 page_cache_release(page);
2962 }
2963 }
2964
2965 return len;
2966}
2967
1da177e4
LT
2968static int cifs_readpages(struct file *file, struct address_space *mapping,
2969 struct list_head *page_list, unsigned num_pages)
2970{
690c5e31
JL
2971 int rc;
2972 struct list_head tmplist;
2973 struct cifsFileInfo *open_file = file->private_data;
2974 struct cifs_sb_info *cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
2975 unsigned int rsize = cifs_sb->rsize;
2976 pid_t pid;
1da177e4 2977
690c5e31
JL
2978 /*
2979 * Give up immediately if rsize is too small to read an entire page.
2980 * The VFS will fall back to readpage. We should never reach this
2981 * point however since we set ra_pages to 0 when the rsize is smaller
2982 * than a cache page.
2983 */
2984 if (unlikely(rsize < PAGE_CACHE_SIZE))
2985 return 0;
bfa0d75a 2986
56698236
SJ
2987 /*
2988 * Reads as many pages as possible from fscache. Returns -ENOBUFS
2989 * immediately if the cookie is negative
2990 */
2991 rc = cifs_readpages_from_fscache(mapping->host, mapping, page_list,
2992 &num_pages);
2993 if (rc == 0)
690c5e31 2994 return rc;
56698236 2995
d4ffff1f
PS
2996 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_RWPIDFORWARD)
2997 pid = open_file->pid;
2998 else
2999 pid = current->tgid;
3000
690c5e31
JL
3001 rc = 0;
3002 INIT_LIST_HEAD(&tmplist);
1da177e4 3003
690c5e31
JL
3004 cFYI(1, "%s: file=%p mapping=%p num_pages=%u", __func__, file,
3005 mapping, num_pages);
3006
3007 /*
3008 * Start with the page at end of list and move it to private
3009 * list. Do the same with any following pages until we hit
3010 * the rsize limit, hit an index discontinuity, or run out of
3011 * pages. Issue the async read and then start the loop again
3012 * until the list is empty.
3013 *
3014 * Note that list order is important. The page_list is in
3015 * the order of declining indexes. When we put the pages in
3016 * the rdata->pages, then we want them in increasing order.
3017 */
3018 while (!list_empty(page_list)) {
3019 unsigned int bytes = PAGE_CACHE_SIZE;
3020 unsigned int expected_index;
3021 unsigned int nr_pages = 1;
3022 loff_t offset;
3023 struct page *page, *tpage;
3024 struct cifs_readdata *rdata;
1da177e4
LT
3025
3026 page = list_entry(page_list->prev, struct page, lru);
690c5e31
JL
3027
3028 /*
3029 * Lock the page and put it in the cache. Since no one else
3030 * should have access to this page, we're safe to simply set
3031 * PG_locked without checking it first.
3032 */
3033 __set_page_locked(page);
3034 rc = add_to_page_cache_locked(page, mapping,
3035 page->index, GFP_KERNEL);
3036
3037 /* give up if we can't stick it in the cache */
3038 if (rc) {
3039 __clear_page_locked(page);
3040 break;
3041 }
3042
3043 /* move first page to the tmplist */
1da177e4 3044 offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
690c5e31 3045 list_move_tail(&page->lru, &tmplist);
1da177e4 3046
690c5e31
JL
3047 /* now try and add more pages onto the request */
3048 expected_index = page->index + 1;
3049 list_for_each_entry_safe_reverse(page, tpage, page_list, lru) {
3050 /* discontinuity ? */
3051 if (page->index != expected_index)
fb8c4b14 3052 break;
690c5e31
JL
3053
3054 /* would this page push the read over the rsize? */
3055 if (bytes + PAGE_CACHE_SIZE > rsize)
3056 break;
3057
3058 __set_page_locked(page);
3059 if (add_to_page_cache_locked(page, mapping,
3060 page->index, GFP_KERNEL)) {
3061 __clear_page_locked(page);
3062 break;
3063 }
3064 list_move_tail(&page->lru, &tmplist);
3065 bytes += PAGE_CACHE_SIZE;
3066 expected_index++;
3067 nr_pages++;
1da177e4 3068 }
690c5e31 3069
0471ca3f 3070 rdata = cifs_readdata_alloc(nr_pages, cifs_readv_complete);
690c5e31
JL
3071 if (!rdata) {
3072 /* best to give up if we're out of mem */
3073 list_for_each_entry_safe(page, tpage, &tmplist, lru) {
3074 list_del(&page->lru);
3075 lru_cache_add_file(page);
3076 unlock_page(page);
3077 page_cache_release(page);
3078 }
3079 rc = -ENOMEM;
3080 break;
3081 }
3082
3083 spin_lock(&cifs_file_list_lock);
690c5e31 3084 spin_unlock(&cifs_file_list_lock);
6993f74a 3085 rdata->cfile = cifsFileInfo_get(open_file);
690c5e31
JL
3086 rdata->mapping = mapping;
3087 rdata->offset = offset;
3088 rdata->bytes = bytes;
3089 rdata->pid = pid;
8d5ce4d2 3090 rdata->marshal_iov = cifs_readpages_marshal_iov;
690c5e31
JL
3091 list_splice_init(&tmplist, &rdata->pages);
3092
2a1bb138 3093 rc = cifs_retry_async_readv(rdata);
690c5e31
JL
3094 if (rc != 0) {
3095 list_for_each_entry_safe(page, tpage, &rdata->pages,
3096 lru) {
3097 list_del(&page->lru);
3098 lru_cache_add_file(page);
3099 unlock_page(page);
3100 page_cache_release(page);
1da177e4 3101 }
6993f74a 3102 kref_put(&rdata->refcount, cifs_readdata_release);
1da177e4
LT
3103 break;
3104 }
6993f74a
JL
3105
3106 kref_put(&rdata->refcount, cifs_readdata_release);
1da177e4
LT
3107 }
3108
1da177e4
LT
3109 return rc;
3110}
3111
3112static int cifs_readpage_worker(struct file *file, struct page *page,
3113 loff_t *poffset)
3114{
3115 char *read_data;
3116 int rc;
3117
56698236
SJ
3118 /* Is the page cached? */
3119 rc = cifs_readpage_from_fscache(file->f_path.dentry->d_inode, page);
3120 if (rc == 0)
3121 goto read_complete;
3122
1da177e4
LT
3123 page_cache_get(page);
3124 read_data = kmap(page);
3125 /* for reads over a certain size could initiate async read ahead */
fb8c4b14 3126
1da177e4 3127 rc = cifs_read(file, read_data, PAGE_CACHE_SIZE, poffset);
fb8c4b14 3128
1da177e4
LT
3129 if (rc < 0)
3130 goto io_error;
3131 else
b6b38f70 3132 cFYI(1, "Bytes read %d", rc);
fb8c4b14 3133
e6a00296
JJS
3134 file->f_path.dentry->d_inode->i_atime =
3135 current_fs_time(file->f_path.dentry->d_inode->i_sb);
fb8c4b14 3136
1da177e4
LT
3137 if (PAGE_CACHE_SIZE > rc)
3138 memset(read_data + rc, 0, PAGE_CACHE_SIZE - rc);
3139
3140 flush_dcache_page(page);
3141 SetPageUptodate(page);
9dc06558
SJ
3142
3143 /* send this page to the cache */
3144 cifs_readpage_to_fscache(file->f_path.dentry->d_inode, page);
3145
1da177e4 3146 rc = 0;
fb8c4b14 3147
1da177e4 3148io_error:
fb8c4b14 3149 kunmap(page);
1da177e4 3150 page_cache_release(page);
56698236
SJ
3151
3152read_complete:
1da177e4
LT
3153 return rc;
3154}
3155
3156static int cifs_readpage(struct file *file, struct page *page)
3157{
3158 loff_t offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
3159 int rc = -EACCES;
3160 int xid;
3161
3162 xid = GetXid();
3163
3164 if (file->private_data == NULL) {
0f3bc09e 3165 rc = -EBADF;
1da177e4 3166 FreeXid(xid);
0f3bc09e 3167 return rc;
1da177e4
LT
3168 }
3169
ac3aa2f8 3170 cFYI(1, "readpage %p at offset %d 0x%x",
b6b38f70 3171 page, (int)offset, (int)offset);
1da177e4
LT
3172
3173 rc = cifs_readpage_worker(file, page, &offset);
3174
3175 unlock_page(page);
3176
3177 FreeXid(xid);
3178 return rc;
3179}
3180
a403a0a3
SF
3181static int is_inode_writable(struct cifsInodeInfo *cifs_inode)
3182{
3183 struct cifsFileInfo *open_file;
3184
4477288a 3185 spin_lock(&cifs_file_list_lock);
a403a0a3 3186 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
2e396b83 3187 if (OPEN_FMODE(open_file->f_flags) & FMODE_WRITE) {
4477288a 3188 spin_unlock(&cifs_file_list_lock);
a403a0a3
SF
3189 return 1;
3190 }
3191 }
4477288a 3192 spin_unlock(&cifs_file_list_lock);
a403a0a3
SF
3193 return 0;
3194}
3195
1da177e4
LT
3196/* We do not want to update the file size from server for inodes
3197 open for write - to avoid races with writepage extending
3198 the file - in the future we could consider allowing
fb8c4b14 3199 refreshing the inode only on increases in the file size
1da177e4
LT
3200 but this is tricky to do without racing with writebehind
3201 page caching in the current Linux kernel design */
4b18f2a9 3202bool is_size_safe_to_change(struct cifsInodeInfo *cifsInode, __u64 end_of_file)
1da177e4 3203{
a403a0a3 3204 if (!cifsInode)
4b18f2a9 3205 return true;
50c2f753 3206
a403a0a3
SF
3207 if (is_inode_writable(cifsInode)) {
3208 /* This inode is open for write at least once */
c32a0b68
SF
3209 struct cifs_sb_info *cifs_sb;
3210
c32a0b68 3211 cifs_sb = CIFS_SB(cifsInode->vfs_inode.i_sb);
ad7a2926 3212 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_DIRECT_IO) {
fb8c4b14 3213 /* since no page cache to corrupt on directio
c32a0b68 3214 we can change size safely */
4b18f2a9 3215 return true;
c32a0b68
SF
3216 }
3217
fb8c4b14 3218 if (i_size_read(&cifsInode->vfs_inode) < end_of_file)
4b18f2a9 3219 return true;
7ba52631 3220
4b18f2a9 3221 return false;
23e7dd7d 3222 } else
4b18f2a9 3223 return true;
1da177e4
LT
3224}
3225
d9414774
NP
3226static int cifs_write_begin(struct file *file, struct address_space *mapping,
3227 loff_t pos, unsigned len, unsigned flags,
3228 struct page **pagep, void **fsdata)
1da177e4 3229{
d9414774
NP
3230 pgoff_t index = pos >> PAGE_CACHE_SHIFT;
3231 loff_t offset = pos & (PAGE_CACHE_SIZE - 1);
a98ee8c1
JL
3232 loff_t page_start = pos & PAGE_MASK;
3233 loff_t i_size;
3234 struct page *page;
3235 int rc = 0;
d9414774 3236
b6b38f70 3237 cFYI(1, "write_begin from %lld len %d", (long long)pos, len);
d9414774 3238
54566b2c 3239 page = grab_cache_page_write_begin(mapping, index, flags);
a98ee8c1
JL
3240 if (!page) {
3241 rc = -ENOMEM;
3242 goto out;
3243 }
8a236264 3244
a98ee8c1
JL
3245 if (PageUptodate(page))
3246 goto out;
8a236264 3247
a98ee8c1
JL
3248 /*
3249 * If we write a full page it will be up to date, no need to read from
3250 * the server. If the write is short, we'll end up doing a sync write
3251 * instead.
3252 */
3253 if (len == PAGE_CACHE_SIZE)
3254 goto out;
8a236264 3255
a98ee8c1
JL
3256 /*
3257 * optimize away the read when we have an oplock, and we're not
3258 * expecting to use any of the data we'd be reading in. That
3259 * is, when the page lies beyond the EOF, or straddles the EOF
3260 * and the write will cover all of the existing data.
3261 */
3262 if (CIFS_I(mapping->host)->clientCanCacheRead) {
3263 i_size = i_size_read(mapping->host);
3264 if (page_start >= i_size ||
3265 (offset == 0 && (pos + len) >= i_size)) {
3266 zero_user_segments(page, 0, offset,
3267 offset + len,
3268 PAGE_CACHE_SIZE);
3269 /*
3270 * PageChecked means that the parts of the page
3271 * to which we're not writing are considered up
3272 * to date. Once the data is copied to the
3273 * page, it can be set uptodate.
3274 */
3275 SetPageChecked(page);
3276 goto out;
3277 }
3278 }
d9414774 3279
a98ee8c1
JL
3280 if ((file->f_flags & O_ACCMODE) != O_WRONLY) {
3281 /*
3282 * might as well read a page, it is fast enough. If we get
3283 * an error, we don't need to return it. cifs_write_end will
3284 * do a sync write instead since PG_uptodate isn't set.
3285 */
3286 cifs_readpage_worker(file, page, &page_start);
8a236264
SF
3287 } else {
3288 /* we could try using another file handle if there is one -
3289 but how would we lock it to prevent close of that handle
3290 racing with this read? In any case
d9414774 3291 this will be written out by write_end so is fine */
1da177e4 3292 }
a98ee8c1
JL
3293out:
3294 *pagep = page;
3295 return rc;
1da177e4
LT
3296}
3297
85f2d6b4
SJ
3298static int cifs_release_page(struct page *page, gfp_t gfp)
3299{
3300 if (PagePrivate(page))
3301 return 0;
3302
3303 return cifs_fscache_release_page(page, gfp);
3304}
3305
3306static void cifs_invalidate_page(struct page *page, unsigned long offset)
3307{
3308 struct cifsInodeInfo *cifsi = CIFS_I(page->mapping->host);
3309
3310 if (offset == 0)
3311 cifs_fscache_invalidate_page(page, &cifsi->vfs_inode);
3312}
3313
9ad1506b
PS
3314static int cifs_launder_page(struct page *page)
3315{
3316 int rc = 0;
3317 loff_t range_start = page_offset(page);
3318 loff_t range_end = range_start + (loff_t)(PAGE_CACHE_SIZE - 1);
3319 struct writeback_control wbc = {
3320 .sync_mode = WB_SYNC_ALL,
3321 .nr_to_write = 0,
3322 .range_start = range_start,
3323 .range_end = range_end,
3324 };
3325
3326 cFYI(1, "Launder page: %p", page);
3327
3328 if (clear_page_dirty_for_io(page))
3329 rc = cifs_writepage_locked(page, &wbc);
3330
3331 cifs_fscache_invalidate_page(page, page->mapping->host);
3332 return rc;
3333}
3334
9b646972 3335void cifs_oplock_break(struct work_struct *work)
3bc303c2
JL
3336{
3337 struct cifsFileInfo *cfile = container_of(work, struct cifsFileInfo,
3338 oplock_break);
a5e18bc3 3339 struct inode *inode = cfile->dentry->d_inode;
3bc303c2 3340 struct cifsInodeInfo *cinode = CIFS_I(inode);
eb4b756b 3341 int rc = 0;
3bc303c2
JL
3342
3343 if (inode && S_ISREG(inode->i_mode)) {
d54ff732 3344 if (cinode->clientCanCacheRead)
8737c930 3345 break_lease(inode, O_RDONLY);
d54ff732 3346 else
8737c930 3347 break_lease(inode, O_WRONLY);
3bc303c2
JL
3348 rc = filemap_fdatawrite(inode->i_mapping);
3349 if (cinode->clientCanCacheRead == 0) {
eb4b756b
JL
3350 rc = filemap_fdatawait(inode->i_mapping);
3351 mapping_set_error(inode->i_mapping, rc);
3bc303c2
JL
3352 invalidate_remote_inode(inode);
3353 }
b6b38f70 3354 cFYI(1, "Oplock flush inode %p rc %d", inode, rc);
3bc303c2
JL
3355 }
3356
85160e03
PS
3357 rc = cifs_push_locks(cfile);
3358 if (rc)
3359 cERROR(1, "Push locks rc = %d", rc);
3360
3bc303c2
JL
3361 /*
3362 * releasing stale oplock after recent reconnect of smb session using
3363 * a now incorrect file handle is not a data integrity issue but do
3364 * not bother sending an oplock release if session to server still is
3365 * disconnected since oplock already released by the server
3366 */
cdff08e7 3367 if (!cfile->oplock_break_cancelled) {
03776f45
PS
3368 rc = CIFSSMBLock(0, tlink_tcon(cfile->tlink), cfile->netfid,
3369 current->tgid, 0, 0, 0, 0,
3370 LOCKING_ANDX_OPLOCK_RELEASE, false,
12fed00d 3371 cinode->clientCanCacheRead ? 1 : 0);
b6b38f70 3372 cFYI(1, "Oplock release rc = %d", rc);
3bc303c2 3373 }
3bc303c2
JL
3374}
3375
f5e54d6e 3376const struct address_space_operations cifs_addr_ops = {
1da177e4
LT
3377 .readpage = cifs_readpage,
3378 .readpages = cifs_readpages,
3379 .writepage = cifs_writepage,
37c0eb46 3380 .writepages = cifs_writepages,
d9414774
NP
3381 .write_begin = cifs_write_begin,
3382 .write_end = cifs_write_end,
1da177e4 3383 .set_page_dirty = __set_page_dirty_nobuffers,
85f2d6b4
SJ
3384 .releasepage = cifs_release_page,
3385 .invalidatepage = cifs_invalidate_page,
9ad1506b 3386 .launder_page = cifs_launder_page,
1da177e4 3387};
273d81d6
DK
3388
3389/*
3390 * cifs_readpages requires the server to support a buffer large enough to
3391 * contain the header plus one complete page of data. Otherwise, we need
3392 * to leave cifs_readpages out of the address space operations.
3393 */
f5e54d6e 3394const struct address_space_operations cifs_addr_ops_smallbuf = {
273d81d6
DK
3395 .readpage = cifs_readpage,
3396 .writepage = cifs_writepage,
3397 .writepages = cifs_writepages,
d9414774
NP
3398 .write_begin = cifs_write_begin,
3399 .write_end = cifs_write_end,
273d81d6 3400 .set_page_dirty = __set_page_dirty_nobuffers,
85f2d6b4
SJ
3401 .releasepage = cifs_release_page,
3402 .invalidatepage = cifs_invalidate_page,
9ad1506b 3403 .launder_page = cifs_launder_page,
273d81d6 3404};