[CIFS] Add new nostrictsync cifs mount option to avoid slow SMB flush
[GitHub/mt8127/android_kernel_alcatel_ttab.git] / fs / cifs / file.c
CommitLineData
1da177e4
LT
1/*
2 * fs/cifs/file.c
3 *
4 * vfs operations that deal with files
fb8c4b14
SF
5 *
6 * Copyright (C) International Business Machines Corp., 2002,2007
1da177e4 7 * Author(s): Steve French (sfrench@us.ibm.com)
7ee1af76 8 * Jeremy Allison (jra@samba.org)
1da177e4
LT
9 *
10 * This library is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU Lesser General Public License as published
12 * by the Free Software Foundation; either version 2.1 of the License, or
13 * (at your option) any later version.
14 *
15 * This library is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
18 * the GNU Lesser General Public License for more details.
19 *
20 * You should have received a copy of the GNU Lesser General Public License
21 * along with this library; if not, write to the Free Software
22 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 */
24#include <linux/fs.h>
37c0eb46 25#include <linux/backing-dev.h>
1da177e4
LT
26#include <linux/stat.h>
27#include <linux/fcntl.h>
28#include <linux/pagemap.h>
29#include <linux/pagevec.h>
37c0eb46 30#include <linux/writeback.h>
6f88cc2e 31#include <linux/task_io_accounting_ops.h>
23e7dd7d 32#include <linux/delay.h>
1da177e4
LT
33#include <asm/div64.h>
34#include "cifsfs.h"
35#include "cifspdu.h"
36#include "cifsglob.h"
37#include "cifsproto.h"
38#include "cifs_unicode.h"
39#include "cifs_debug.h"
40#include "cifs_fs_sb.h"
41
42static inline struct cifsFileInfo *cifs_init_private(
43 struct cifsFileInfo *private_data, struct inode *inode,
44 struct file *file, __u16 netfid)
45{
46 memset(private_data, 0, sizeof(struct cifsFileInfo));
47 private_data->netfid = netfid;
fb8c4b14 48 private_data->pid = current->tgid;
1da177e4 49 init_MUTEX(&private_data->fh_sem);
796e5661 50 mutex_init(&private_data->lock_mutex);
7ee1af76 51 INIT_LIST_HEAD(&private_data->llist);
1da177e4
LT
52 private_data->pfile = file; /* needed for writepage */
53 private_data->pInode = inode;
4b18f2a9
SF
54 private_data->invalidHandle = false;
55 private_data->closePend = false;
23e7dd7d
SF
56 /* we have to track num writers to the inode, since writepages
57 does not tell us which handle the write is for so there can
58 be a close (overlapping with write) of the filehandle that
59 cifs_writepages chose to use */
fb8c4b14 60 atomic_set(&private_data->wrtPending, 0);
1da177e4
LT
61
62 return private_data;
63}
64
65static inline int cifs_convert_flags(unsigned int flags)
66{
67 if ((flags & O_ACCMODE) == O_RDONLY)
68 return GENERIC_READ;
69 else if ((flags & O_ACCMODE) == O_WRONLY)
70 return GENERIC_WRITE;
71 else if ((flags & O_ACCMODE) == O_RDWR) {
72 /* GENERIC_ALL is too much permission to request
73 can cause unnecessary access denied on create */
74 /* return GENERIC_ALL; */
75 return (GENERIC_READ | GENERIC_WRITE);
76 }
77
e10f7b55
JL
78 return (READ_CONTROL | FILE_WRITE_ATTRIBUTES | FILE_READ_ATTRIBUTES |
79 FILE_WRITE_EA | FILE_APPEND_DATA | FILE_WRITE_DATA |
80 FILE_READ_DATA);
81
82
1da177e4
LT
83}
84
85static inline int cifs_get_disposition(unsigned int flags)
86{
87 if ((flags & (O_CREAT | O_EXCL)) == (O_CREAT | O_EXCL))
88 return FILE_CREATE;
89 else if ((flags & (O_CREAT | O_TRUNC)) == (O_CREAT | O_TRUNC))
90 return FILE_OVERWRITE_IF;
91 else if ((flags & O_CREAT) == O_CREAT)
92 return FILE_OPEN_IF;
55aa2e09
SF
93 else if ((flags & O_TRUNC) == O_TRUNC)
94 return FILE_OVERWRITE;
1da177e4
LT
95 else
96 return FILE_OPEN;
97}
98
99/* all arguments to this function must be checked for validity in caller */
100static inline int cifs_open_inode_helper(struct inode *inode, struct file *file,
101 struct cifsInodeInfo *pCifsInode, struct cifsFileInfo *pCifsFile,
102 struct cifsTconInfo *pTcon, int *oplock, FILE_ALL_INFO *buf,
103 char *full_path, int xid)
104{
105 struct timespec temp;
106 int rc;
107
108 /* want handles we can use to read with first
109 in the list so we do not have to walk the
d9414774 110 list to search for one in write_begin */
1da177e4 111 if ((file->f_flags & O_ACCMODE) == O_WRONLY) {
fb8c4b14 112 list_add_tail(&pCifsFile->flist,
1da177e4
LT
113 &pCifsInode->openFileList);
114 } else {
115 list_add(&pCifsFile->flist,
116 &pCifsInode->openFileList);
117 }
118 write_unlock(&GlobalSMBSeslock);
1da177e4
LT
119 if (pCifsInode->clientCanCacheRead) {
120 /* we have the inode open somewhere else
121 no need to discard cache data */
122 goto client_can_cache;
123 }
124
125 /* BB need same check in cifs_create too? */
126 /* if not oplocked, invalidate inode pages if mtime or file
127 size changed */
128 temp = cifs_NTtimeToUnix(le64_to_cpu(buf->LastWriteTime));
e6a00296
JJS
129 if (timespec_equal(&file->f_path.dentry->d_inode->i_mtime, &temp) &&
130 (file->f_path.dentry->d_inode->i_size ==
1da177e4
LT
131 (loff_t)le64_to_cpu(buf->EndOfFile))) {
132 cFYI(1, ("inode unchanged on server"));
133 } else {
e6a00296 134 if (file->f_path.dentry->d_inode->i_mapping) {
1da177e4
LT
135 /* BB no need to lock inode until after invalidate
136 since namei code should already have it locked? */
cea21805
JL
137 rc = filemap_write_and_wait(file->f_path.dentry->d_inode->i_mapping);
138 if (rc != 0)
139 CIFS_I(file->f_path.dentry->d_inode)->write_behind_rc = rc;
1da177e4
LT
140 }
141 cFYI(1, ("invalidating remote inode since open detected it "
142 "changed"));
e6a00296 143 invalidate_remote_inode(file->f_path.dentry->d_inode);
1da177e4
LT
144 }
145
146client_can_cache:
c18c842b 147 if (pTcon->unix_ext)
e6a00296 148 rc = cifs_get_inode_info_unix(&file->f_path.dentry->d_inode,
1da177e4
LT
149 full_path, inode->i_sb, xid);
150 else
e6a00296 151 rc = cifs_get_inode_info(&file->f_path.dentry->d_inode,
8b1327f6 152 full_path, buf, inode->i_sb, xid, NULL);
1da177e4
LT
153
154 if ((*oplock & 0xF) == OPLOCK_EXCLUSIVE) {
4b18f2a9
SF
155 pCifsInode->clientCanCacheAll = true;
156 pCifsInode->clientCanCacheRead = true;
1da177e4 157 cFYI(1, ("Exclusive Oplock granted on inode %p",
e6a00296 158 file->f_path.dentry->d_inode));
1da177e4 159 } else if ((*oplock & 0xF) == OPLOCK_READ)
4b18f2a9 160 pCifsInode->clientCanCacheRead = true;
1da177e4
LT
161
162 return rc;
163}
164
165int cifs_open(struct inode *inode, struct file *file)
166{
167 int rc = -EACCES;
168 int xid, oplock;
169 struct cifs_sb_info *cifs_sb;
170 struct cifsTconInfo *pTcon;
171 struct cifsFileInfo *pCifsFile;
172 struct cifsInodeInfo *pCifsInode;
173 struct list_head *tmp;
174 char *full_path = NULL;
175 int desiredAccess;
176 int disposition;
177 __u16 netfid;
178 FILE_ALL_INFO *buf = NULL;
179
180 xid = GetXid();
181
182 cifs_sb = CIFS_SB(inode->i_sb);
183 pTcon = cifs_sb->tcon;
184
185 if (file->f_flags & O_CREAT) {
186 /* search inode for this file and fill in file->private_data */
e6a00296 187 pCifsInode = CIFS_I(file->f_path.dentry->d_inode);
1da177e4
LT
188 read_lock(&GlobalSMBSeslock);
189 list_for_each(tmp, &pCifsInode->openFileList) {
190 pCifsFile = list_entry(tmp, struct cifsFileInfo,
191 flist);
192 if ((pCifsFile->pfile == NULL) &&
193 (pCifsFile->pid == current->tgid)) {
194 /* mode set in cifs_create */
195
196 /* needed for writepage */
197 pCifsFile->pfile = file;
50c2f753 198
1da177e4
LT
199 file->private_data = pCifsFile;
200 break;
201 }
202 }
203 read_unlock(&GlobalSMBSeslock);
204 if (file->private_data != NULL) {
205 rc = 0;
206 FreeXid(xid);
207 return rc;
208 } else {
209 if (file->f_flags & O_EXCL)
210 cERROR(1, ("could not find file instance for "
26a21b98 211 "new file %p", file));
1da177e4
LT
212 }
213 }
214
e6a00296 215 full_path = build_path_from_dentry(file->f_path.dentry);
1da177e4
LT
216 if (full_path == NULL) {
217 FreeXid(xid);
218 return -ENOMEM;
219 }
220
7521a3c5 221 cFYI(1, ("inode = 0x%p file flags are 0x%x for %s",
1da177e4
LT
222 inode, file->f_flags, full_path));
223 desiredAccess = cifs_convert_flags(file->f_flags);
224
225/*********************************************************************
226 * open flag mapping table:
fb8c4b14 227 *
1da177e4 228 * POSIX Flag CIFS Disposition
fb8c4b14 229 * ---------- ----------------
1da177e4
LT
230 * O_CREAT FILE_OPEN_IF
231 * O_CREAT | O_EXCL FILE_CREATE
232 * O_CREAT | O_TRUNC FILE_OVERWRITE_IF
233 * O_TRUNC FILE_OVERWRITE
234 * none of the above FILE_OPEN
235 *
236 * Note that there is not a direct match between disposition
fb8c4b14 237 * FILE_SUPERSEDE (ie create whether or not file exists although
1da177e4
LT
238 * O_CREAT | O_TRUNC is similar but truncates the existing
239 * file rather than creating a new file as FILE_SUPERSEDE does
240 * (which uses the attributes / metadata passed in on open call)
241 *?
fb8c4b14 242 *? O_SYNC is a reasonable match to CIFS writethrough flag
1da177e4
LT
243 *? and the read write flags match reasonably. O_LARGEFILE
244 *? is irrelevant because largefile support is always used
245 *? by this client. Flags O_APPEND, O_DIRECT, O_DIRECTORY,
246 * O_FASYNC, O_NOFOLLOW, O_NONBLOCK need further investigation
247 *********************************************************************/
248
249 disposition = cifs_get_disposition(file->f_flags);
250
251 if (oplockEnabled)
252 oplock = REQ_OPLOCK;
253 else
4b18f2a9 254 oplock = 0;
1da177e4
LT
255
256 /* BB pass O_SYNC flag through on file attributes .. BB */
257
258 /* Also refresh inode by passing in file_info buf returned by SMBOpen
259 and calling get_inode_info with returned buf (at least helps
260 non-Unix server case) */
261
fb8c4b14
SF
262 /* BB we can not do this if this is the second open of a file
263 and the first handle has writebehind data, we might be
1da177e4
LT
264 able to simply do a filemap_fdatawrite/filemap_fdatawait first */
265 buf = kmalloc(sizeof(FILE_ALL_INFO), GFP_KERNEL);
266 if (!buf) {
267 rc = -ENOMEM;
268 goto out;
269 }
5bafd765
SF
270
271 if (cifs_sb->tcon->ses->capabilities & CAP_NT_SMBS)
fb8c4b14 272 rc = CIFSSMBOpen(xid, pTcon, full_path, disposition,
5bafd765 273 desiredAccess, CREATE_NOT_DIR, &netfid, &oplock, buf,
737b758c
SF
274 cifs_sb->local_nls, cifs_sb->mnt_cifs_flags
275 & CIFS_MOUNT_MAP_SPECIAL_CHR);
5bafd765
SF
276 else
277 rc = -EIO; /* no NT SMB support fall into legacy open below */
278
a9d02ad4
SF
279 if (rc == -EIO) {
280 /* Old server, try legacy style OpenX */
281 rc = SMBLegacyOpen(xid, pTcon, full_path, disposition,
282 desiredAccess, CREATE_NOT_DIR, &netfid, &oplock, buf,
283 cifs_sb->local_nls, cifs_sb->mnt_cifs_flags
284 & CIFS_MOUNT_MAP_SPECIAL_CHR);
285 }
1da177e4 286 if (rc) {
26a21b98 287 cFYI(1, ("cifs_open returned 0x%x", rc));
1da177e4
LT
288 goto out;
289 }
290 file->private_data =
291 kmalloc(sizeof(struct cifsFileInfo), GFP_KERNEL);
292 if (file->private_data == NULL) {
293 rc = -ENOMEM;
294 goto out;
295 }
296 pCifsFile = cifs_init_private(file->private_data, inode, file, netfid);
1da177e4
LT
297 write_lock(&GlobalSMBSeslock);
298 list_add(&pCifsFile->tlist, &pTcon->openFileList);
299
e6a00296 300 pCifsInode = CIFS_I(file->f_path.dentry->d_inode);
1da177e4
LT
301 if (pCifsInode) {
302 rc = cifs_open_inode_helper(inode, file, pCifsInode,
303 pCifsFile, pTcon,
304 &oplock, buf, full_path, xid);
305 } else {
306 write_unlock(&GlobalSMBSeslock);
1da177e4
LT
307 }
308
fb8c4b14 309 if (oplock & CIFS_CREATE_ACTION) {
1da177e4
LT
310 /* time to set mode which we can not set earlier due to
311 problems creating new read-only files */
c18c842b 312 if (pTcon->unix_ext) {
4e1e7fb9
JL
313 struct cifs_unix_set_info_args args = {
314 .mode = inode->i_mode,
315 .uid = NO_CHANGE_64,
316 .gid = NO_CHANGE_64,
317 .ctime = NO_CHANGE_64,
318 .atime = NO_CHANGE_64,
319 .mtime = NO_CHANGE_64,
320 .device = 0,
321 };
322 CIFSSMBUnixSetInfo(xid, pTcon, full_path, &args,
737b758c 323 cifs_sb->local_nls,
fb8c4b14 324 cifs_sb->mnt_cifs_flags &
737b758c 325 CIFS_MOUNT_MAP_SPECIAL_CHR);
1da177e4
LT
326 }
327 }
328
329out:
330 kfree(buf);
331 kfree(full_path);
332 FreeXid(xid);
333 return rc;
334}
335
0418726b 336/* Try to reacquire byte range locks that were released when session */
1da177e4
LT
337/* to server was lost */
338static int cifs_relock_file(struct cifsFileInfo *cifsFile)
339{
340 int rc = 0;
341
342/* BB list all locks open on this file and relock */
343
344 return rc;
345}
346
4b18f2a9 347static int cifs_reopen_file(struct file *file, bool can_flush)
1da177e4
LT
348{
349 int rc = -EACCES;
350 int xid, oplock;
351 struct cifs_sb_info *cifs_sb;
352 struct cifsTconInfo *pTcon;
353 struct cifsFileInfo *pCifsFile;
354 struct cifsInodeInfo *pCifsInode;
fb8c4b14 355 struct inode *inode;
1da177e4
LT
356 char *full_path = NULL;
357 int desiredAccess;
358 int disposition = FILE_OPEN;
359 __u16 netfid;
360
ad7a2926 361 if (file->private_data)
1da177e4 362 pCifsFile = (struct cifsFileInfo *)file->private_data;
ad7a2926 363 else
1da177e4
LT
364 return -EBADF;
365
366 xid = GetXid();
367 down(&pCifsFile->fh_sem);
4b18f2a9 368 if (!pCifsFile->invalidHandle) {
1da177e4
LT
369 up(&pCifsFile->fh_sem);
370 FreeXid(xid);
371 return 0;
372 }
373
e6a00296 374 if (file->f_path.dentry == NULL) {
3a9f462f
SF
375 cERROR(1, ("no valid name if dentry freed"));
376 dump_stack();
377 rc = -EBADF;
378 goto reopen_error_exit;
379 }
380
381 inode = file->f_path.dentry->d_inode;
fb8c4b14 382 if (inode == NULL) {
3a9f462f
SF
383 cERROR(1, ("inode not valid"));
384 dump_stack();
385 rc = -EBADF;
386 goto reopen_error_exit;
1da177e4 387 }
50c2f753 388
1da177e4
LT
389 cifs_sb = CIFS_SB(inode->i_sb);
390 pTcon = cifs_sb->tcon;
3a9f462f 391
1da177e4
LT
392/* can not grab rename sem here because various ops, including
393 those that already have the rename sem can end up causing writepage
394 to get called and if the server was down that means we end up here,
395 and we can never tell if the caller already has the rename_sem */
e6a00296 396 full_path = build_path_from_dentry(file->f_path.dentry);
1da177e4 397 if (full_path == NULL) {
3a9f462f
SF
398 rc = -ENOMEM;
399reopen_error_exit:
1da177e4
LT
400 up(&pCifsFile->fh_sem);
401 FreeXid(xid);
3a9f462f 402 return rc;
1da177e4
LT
403 }
404
3a9f462f 405 cFYI(1, ("inode = 0x%p file flags 0x%x for %s",
fb8c4b14 406 inode, file->f_flags, full_path));
1da177e4
LT
407 desiredAccess = cifs_convert_flags(file->f_flags);
408
409 if (oplockEnabled)
410 oplock = REQ_OPLOCK;
411 else
4b18f2a9 412 oplock = 0;
1da177e4
LT
413
414 /* Can not refresh inode by passing in file_info buf to be returned
fb8c4b14
SF
415 by SMBOpen and then calling get_inode_info with returned buf
416 since file might have write behind data that needs to be flushed
1da177e4
LT
417 and server version of file size can be stale. If we knew for sure
418 that inode was not dirty locally we could do this */
419
1da177e4
LT
420 rc = CIFSSMBOpen(xid, pTcon, full_path, disposition, desiredAccess,
421 CREATE_NOT_DIR, &netfid, &oplock, NULL,
fb8c4b14 422 cifs_sb->local_nls, cifs_sb->mnt_cifs_flags &
737b758c 423 CIFS_MOUNT_MAP_SPECIAL_CHR);
1da177e4
LT
424 if (rc) {
425 up(&pCifsFile->fh_sem);
26a21b98
SF
426 cFYI(1, ("cifs_open returned 0x%x", rc));
427 cFYI(1, ("oplock: %d", oplock));
1da177e4
LT
428 } else {
429 pCifsFile->netfid = netfid;
4b18f2a9 430 pCifsFile->invalidHandle = false;
1da177e4
LT
431 up(&pCifsFile->fh_sem);
432 pCifsInode = CIFS_I(inode);
433 if (pCifsInode) {
434 if (can_flush) {
cea21805
JL
435 rc = filemap_write_and_wait(inode->i_mapping);
436 if (rc != 0)
437 CIFS_I(inode)->write_behind_rc = rc;
1da177e4
LT
438 /* temporarily disable caching while we
439 go to server to get inode info */
4b18f2a9
SF
440 pCifsInode->clientCanCacheAll = false;
441 pCifsInode->clientCanCacheRead = false;
c18c842b 442 if (pTcon->unix_ext)
1da177e4
LT
443 rc = cifs_get_inode_info_unix(&inode,
444 full_path, inode->i_sb, xid);
445 else
446 rc = cifs_get_inode_info(&inode,
447 full_path, NULL, inode->i_sb,
8b1327f6 448 xid, NULL);
1da177e4
LT
449 } /* else we are writing out data to server already
450 and could deadlock if we tried to flush data, and
451 since we do not know if we have data that would
452 invalidate the current end of file on the server
453 we can not go to the server to get the new inod
454 info */
455 if ((oplock & 0xF) == OPLOCK_EXCLUSIVE) {
4b18f2a9
SF
456 pCifsInode->clientCanCacheAll = true;
457 pCifsInode->clientCanCacheRead = true;
1da177e4 458 cFYI(1, ("Exclusive Oplock granted on inode %p",
e6a00296 459 file->f_path.dentry->d_inode));
1da177e4 460 } else if ((oplock & 0xF) == OPLOCK_READ) {
4b18f2a9
SF
461 pCifsInode->clientCanCacheRead = true;
462 pCifsInode->clientCanCacheAll = false;
1da177e4 463 } else {
4b18f2a9
SF
464 pCifsInode->clientCanCacheRead = false;
465 pCifsInode->clientCanCacheAll = false;
1da177e4
LT
466 }
467 cifs_relock_file(pCifsFile);
468 }
469 }
470
471 kfree(full_path);
472 FreeXid(xid);
473 return rc;
474}
475
476int cifs_close(struct inode *inode, struct file *file)
477{
478 int rc = 0;
15745320 479 int xid, timeout;
1da177e4
LT
480 struct cifs_sb_info *cifs_sb;
481 struct cifsTconInfo *pTcon;
482 struct cifsFileInfo *pSMBFile =
483 (struct cifsFileInfo *)file->private_data;
484
485 xid = GetXid();
486
487 cifs_sb = CIFS_SB(inode->i_sb);
488 pTcon = cifs_sb->tcon;
489 if (pSMBFile) {
7ee1af76 490 struct cifsLockInfo *li, *tmp;
ddb4cbfc 491 write_lock(&GlobalSMBSeslock);
4b18f2a9 492 pSMBFile->closePend = true;
1da177e4
LT
493 if (pTcon) {
494 /* no sense reconnecting to close a file that is
495 already closed */
3b795210 496 if (!pTcon->need_reconnect) {
ddb4cbfc 497 write_unlock(&GlobalSMBSeslock);
15745320 498 timeout = 2;
fb8c4b14 499 while ((atomic_read(&pSMBFile->wrtPending) != 0)
15745320 500 && (timeout <= 2048)) {
23e7dd7d
SF
501 /* Give write a better chance to get to
502 server ahead of the close. We do not
503 want to add a wait_q here as it would
504 increase the memory utilization as
505 the struct would be in each open file,
fb8c4b14 506 but this should give enough time to
23e7dd7d 507 clear the socket */
90c81e0b
SF
508 cFYI(DBG2,
509 ("close delay, write pending"));
23e7dd7d
SF
510 msleep(timeout);
511 timeout *= 4;
4891d539 512 }
fb8c4b14 513 if (atomic_read(&pSMBFile->wrtPending))
ddb4cbfc
SF
514 cERROR(1, ("close with pending write"));
515 if (!pTcon->need_reconnect &&
516 !pSMBFile->invalidHandle)
517 rc = CIFSSMBClose(xid, pTcon,
1da177e4 518 pSMBFile->netfid);
ddb4cbfc
SF
519 } else
520 write_unlock(&GlobalSMBSeslock);
521 } else
522 write_unlock(&GlobalSMBSeslock);
7ee1af76
JA
523
524 /* Delete any outstanding lock records.
525 We'll lose them when the file is closed anyway. */
796e5661 526 mutex_lock(&pSMBFile->lock_mutex);
7ee1af76
JA
527 list_for_each_entry_safe(li, tmp, &pSMBFile->llist, llist) {
528 list_del(&li->llist);
529 kfree(li);
530 }
796e5661 531 mutex_unlock(&pSMBFile->lock_mutex);
7ee1af76 532
cbe0476f 533 write_lock(&GlobalSMBSeslock);
1da177e4
LT
534 list_del(&pSMBFile->flist);
535 list_del(&pSMBFile->tlist);
cbe0476f 536 write_unlock(&GlobalSMBSeslock);
15745320
SF
537 timeout = 10;
538 /* We waited above to give the SMBWrite a chance to issue
539 on the wire (so we do not get SMBWrite returning EBADF
540 if writepages is racing with close. Note that writepages
541 does not specify a file handle, so it is possible for a file
542 to be opened twice, and the application close the "wrong"
543 file handle - in these cases we delay long enough to allow
544 the SMBWrite to get on the wire before the SMB Close.
545 We allow total wait here over 45 seconds, more than
546 oplock break time, and more than enough to allow any write
547 to complete on the server, or to time out on the client */
548 while ((atomic_read(&pSMBFile->wrtPending) != 0)
549 && (timeout <= 50000)) {
550 cERROR(1, ("writes pending, delay free of handle"));
551 msleep(timeout);
552 timeout *= 8;
553 }
1da177e4
LT
554 kfree(file->private_data);
555 file->private_data = NULL;
556 } else
557 rc = -EBADF;
558
4efa53f0 559 read_lock(&GlobalSMBSeslock);
1da177e4
LT
560 if (list_empty(&(CIFS_I(inode)->openFileList))) {
561 cFYI(1, ("closing last open instance for inode %p", inode));
562 /* if the file is not open we do not know if we can cache info
563 on this inode, much less write behind and read ahead */
4b18f2a9
SF
564 CIFS_I(inode)->clientCanCacheRead = false;
565 CIFS_I(inode)->clientCanCacheAll = false;
1da177e4 566 }
4efa53f0 567 read_unlock(&GlobalSMBSeslock);
fb8c4b14 568 if ((rc == 0) && CIFS_I(inode)->write_behind_rc)
1da177e4
LT
569 rc = CIFS_I(inode)->write_behind_rc;
570 FreeXid(xid);
571 return rc;
572}
573
574int cifs_closedir(struct inode *inode, struct file *file)
575{
576 int rc = 0;
577 int xid;
578 struct cifsFileInfo *pCFileStruct =
579 (struct cifsFileInfo *)file->private_data;
580 char *ptmp;
581
26a21b98 582 cFYI(1, ("Closedir inode = 0x%p", inode));
1da177e4
LT
583
584 xid = GetXid();
585
586 if (pCFileStruct) {
587 struct cifsTconInfo *pTcon;
fb8c4b14
SF
588 struct cifs_sb_info *cifs_sb =
589 CIFS_SB(file->f_path.dentry->d_sb);
1da177e4
LT
590
591 pTcon = cifs_sb->tcon;
592
593 cFYI(1, ("Freeing private data in close dir"));
ddb4cbfc 594 write_lock(&GlobalSMBSeslock);
4b18f2a9
SF
595 if (!pCFileStruct->srch_inf.endOfSearch &&
596 !pCFileStruct->invalidHandle) {
597 pCFileStruct->invalidHandle = true;
ddb4cbfc 598 write_unlock(&GlobalSMBSeslock);
1da177e4
LT
599 rc = CIFSFindClose(xid, pTcon, pCFileStruct->netfid);
600 cFYI(1, ("Closing uncompleted readdir with rc %d",
601 rc));
602 /* not much we can do if it fails anyway, ignore rc */
603 rc = 0;
ddb4cbfc
SF
604 } else
605 write_unlock(&GlobalSMBSeslock);
1da177e4
LT
606 ptmp = pCFileStruct->srch_inf.ntwrk_buf_start;
607 if (ptmp) {
ec637e3f 608 cFYI(1, ("closedir free smb buf in srch struct"));
1da177e4 609 pCFileStruct->srch_inf.ntwrk_buf_start = NULL;
fb8c4b14 610 if (pCFileStruct->srch_inf.smallBuf)
d47d7c1a
SF
611 cifs_small_buf_release(ptmp);
612 else
613 cifs_buf_release(ptmp);
1da177e4 614 }
1da177e4
LT
615 kfree(file->private_data);
616 file->private_data = NULL;
617 }
618 /* BB can we lock the filestruct while this is going on? */
619 FreeXid(xid);
620 return rc;
621}
622
7ee1af76
JA
623static int store_file_lock(struct cifsFileInfo *fid, __u64 len,
624 __u64 offset, __u8 lockType)
625{
fb8c4b14
SF
626 struct cifsLockInfo *li =
627 kmalloc(sizeof(struct cifsLockInfo), GFP_KERNEL);
7ee1af76
JA
628 if (li == NULL)
629 return -ENOMEM;
630 li->offset = offset;
631 li->length = len;
632 li->type = lockType;
796e5661 633 mutex_lock(&fid->lock_mutex);
7ee1af76 634 list_add(&li->llist, &fid->llist);
796e5661 635 mutex_unlock(&fid->lock_mutex);
7ee1af76
JA
636 return 0;
637}
638
1da177e4
LT
639int cifs_lock(struct file *file, int cmd, struct file_lock *pfLock)
640{
641 int rc, xid;
1da177e4
LT
642 __u32 numLock = 0;
643 __u32 numUnlock = 0;
644 __u64 length;
4b18f2a9 645 bool wait_flag = false;
1da177e4 646 struct cifs_sb_info *cifs_sb;
13a6e42a 647 struct cifsTconInfo *tcon;
08547b03
SF
648 __u16 netfid;
649 __u8 lockType = LOCKING_ANDX_LARGE_FILES;
13a6e42a 650 bool posix_locking = 0;
1da177e4
LT
651
652 length = 1 + pfLock->fl_end - pfLock->fl_start;
653 rc = -EACCES;
654 xid = GetXid();
655
656 cFYI(1, ("Lock parm: 0x%x flockflags: "
657 "0x%x flocktype: 0x%x start: %lld end: %lld",
fb8c4b14
SF
658 cmd, pfLock->fl_flags, pfLock->fl_type, pfLock->fl_start,
659 pfLock->fl_end));
1da177e4
LT
660
661 if (pfLock->fl_flags & FL_POSIX)
d47d7c1a 662 cFYI(1, ("Posix"));
1da177e4 663 if (pfLock->fl_flags & FL_FLOCK)
d47d7c1a 664 cFYI(1, ("Flock"));
1da177e4 665 if (pfLock->fl_flags & FL_SLEEP) {
d47d7c1a 666 cFYI(1, ("Blocking lock"));
4b18f2a9 667 wait_flag = true;
1da177e4
LT
668 }
669 if (pfLock->fl_flags & FL_ACCESS)
670 cFYI(1, ("Process suspended by mandatory locking - "
26a21b98 671 "not implemented yet"));
1da177e4
LT
672 if (pfLock->fl_flags & FL_LEASE)
673 cFYI(1, ("Lease on file - not implemented yet"));
fb8c4b14 674 if (pfLock->fl_flags &
1da177e4
LT
675 (~(FL_POSIX | FL_FLOCK | FL_SLEEP | FL_ACCESS | FL_LEASE)))
676 cFYI(1, ("Unknown lock flags 0x%x", pfLock->fl_flags));
677
678 if (pfLock->fl_type == F_WRLCK) {
679 cFYI(1, ("F_WRLCK "));
680 numLock = 1;
681 } else if (pfLock->fl_type == F_UNLCK) {
d47d7c1a 682 cFYI(1, ("F_UNLCK"));
1da177e4 683 numUnlock = 1;
d47d7c1a
SF
684 /* Check if unlock includes more than
685 one lock range */
1da177e4 686 } else if (pfLock->fl_type == F_RDLCK) {
d47d7c1a 687 cFYI(1, ("F_RDLCK"));
1da177e4
LT
688 lockType |= LOCKING_ANDX_SHARED_LOCK;
689 numLock = 1;
690 } else if (pfLock->fl_type == F_EXLCK) {
d47d7c1a 691 cFYI(1, ("F_EXLCK"));
1da177e4
LT
692 numLock = 1;
693 } else if (pfLock->fl_type == F_SHLCK) {
d47d7c1a 694 cFYI(1, ("F_SHLCK"));
1da177e4
LT
695 lockType |= LOCKING_ANDX_SHARED_LOCK;
696 numLock = 1;
697 } else
d47d7c1a 698 cFYI(1, ("Unknown type of lock"));
1da177e4 699
e6a00296 700 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
13a6e42a 701 tcon = cifs_sb->tcon;
1da177e4
LT
702
703 if (file->private_data == NULL) {
704 FreeXid(xid);
705 return -EBADF;
706 }
08547b03
SF
707 netfid = ((struct cifsFileInfo *)file->private_data)->netfid;
708
13a6e42a
SF
709 if ((tcon->ses->capabilities & CAP_UNIX) &&
710 (CIFS_UNIX_FCNTL_CAP & le64_to_cpu(tcon->fsUnixInfo.Capability)) &&
acc18aa1 711 ((cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NOPOSIXBRL) == 0))
13a6e42a 712 posix_locking = 1;
08547b03
SF
713 /* BB add code here to normalize offset and length to
714 account for negative length which we can not accept over the
715 wire */
1da177e4 716 if (IS_GETLK(cmd)) {
fb8c4b14 717 if (posix_locking) {
08547b03 718 int posix_lock_type;
fb8c4b14 719 if (lockType & LOCKING_ANDX_SHARED_LOCK)
08547b03
SF
720 posix_lock_type = CIFS_RDLCK;
721 else
722 posix_lock_type = CIFS_WRLCK;
13a6e42a 723 rc = CIFSSMBPosixLock(xid, tcon, netfid, 1 /* get */,
fc94cdb9 724 length, pfLock,
08547b03
SF
725 posix_lock_type, wait_flag);
726 FreeXid(xid);
727 return rc;
728 }
729
730 /* BB we could chain these into one lock request BB */
13a6e42a 731 rc = CIFSSMBLock(xid, tcon, netfid, length, pfLock->fl_start,
08547b03 732 0, 1, lockType, 0 /* wait flag */ );
1da177e4 733 if (rc == 0) {
13a6e42a 734 rc = CIFSSMBLock(xid, tcon, netfid, length,
1da177e4
LT
735 pfLock->fl_start, 1 /* numUnlock */ ,
736 0 /* numLock */ , lockType,
737 0 /* wait flag */ );
738 pfLock->fl_type = F_UNLCK;
739 if (rc != 0)
740 cERROR(1, ("Error unlocking previously locked "
08547b03 741 "range %d during test of lock", rc));
1da177e4
LT
742 rc = 0;
743
744 } else {
745 /* if rc == ERR_SHARING_VIOLATION ? */
746 rc = 0; /* do not change lock type to unlock
747 since range in use */
748 }
749
750 FreeXid(xid);
751 return rc;
752 }
7ee1af76
JA
753
754 if (!numLock && !numUnlock) {
755 /* if no lock or unlock then nothing
756 to do since we do not know what it is */
757 FreeXid(xid);
758 return -EOPNOTSUPP;
759 }
760
761 if (posix_locking) {
08547b03 762 int posix_lock_type;
fb8c4b14 763 if (lockType & LOCKING_ANDX_SHARED_LOCK)
08547b03
SF
764 posix_lock_type = CIFS_RDLCK;
765 else
766 posix_lock_type = CIFS_WRLCK;
50c2f753 767
fb8c4b14 768 if (numUnlock == 1)
beb84dc8 769 posix_lock_type = CIFS_UNLCK;
7ee1af76 770
13a6e42a 771 rc = CIFSSMBPosixLock(xid, tcon, netfid, 0 /* set */,
fc94cdb9 772 length, pfLock,
08547b03 773 posix_lock_type, wait_flag);
7ee1af76 774 } else {
fb8c4b14
SF
775 struct cifsFileInfo *fid =
776 (struct cifsFileInfo *)file->private_data;
7ee1af76
JA
777
778 if (numLock) {
13a6e42a 779 rc = CIFSSMBLock(xid, tcon, netfid, length,
fb8c4b14 780 pfLock->fl_start,
7ee1af76
JA
781 0, numLock, lockType, wait_flag);
782
783 if (rc == 0) {
784 /* For Windows locks we must store them. */
785 rc = store_file_lock(fid, length,
786 pfLock->fl_start, lockType);
787 }
788 } else if (numUnlock) {
789 /* For each stored lock that this unlock overlaps
790 completely, unlock it. */
791 int stored_rc = 0;
792 struct cifsLockInfo *li, *tmp;
793
6b70c955 794 rc = 0;
796e5661 795 mutex_lock(&fid->lock_mutex);
7ee1af76
JA
796 list_for_each_entry_safe(li, tmp, &fid->llist, llist) {
797 if (pfLock->fl_start <= li->offset &&
c19eb710 798 (pfLock->fl_start + length) >=
39db810c 799 (li->offset + li->length)) {
13a6e42a 800 stored_rc = CIFSSMBLock(xid, tcon,
fb8c4b14 801 netfid,
7ee1af76 802 li->length, li->offset,
4b18f2a9 803 1, 0, li->type, false);
7ee1af76
JA
804 if (stored_rc)
805 rc = stored_rc;
806
807 list_del(&li->llist);
808 kfree(li);
809 }
810 }
796e5661 811 mutex_unlock(&fid->lock_mutex);
7ee1af76
JA
812 }
813 }
814
d634cc15 815 if (pfLock->fl_flags & FL_POSIX)
1da177e4
LT
816 posix_lock_file_wait(file, pfLock);
817 FreeXid(xid);
818 return rc;
819}
820
821ssize_t cifs_user_write(struct file *file, const char __user *write_data,
822 size_t write_size, loff_t *poffset)
823{
824 int rc = 0;
825 unsigned int bytes_written = 0;
826 unsigned int total_written;
827 struct cifs_sb_info *cifs_sb;
828 struct cifsTconInfo *pTcon;
829 int xid, long_op;
830 struct cifsFileInfo *open_file;
831
e6a00296 832 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
1da177e4
LT
833
834 pTcon = cifs_sb->tcon;
835
836 /* cFYI(1,
837 (" write %d bytes to offset %lld of %s", write_size,
e6a00296 838 *poffset, file->f_path.dentry->d_name.name)); */
1da177e4
LT
839
840 if (file->private_data == NULL)
841 return -EBADF;
c33f8d32 842 open_file = (struct cifsFileInfo *) file->private_data;
50c2f753 843
838726c4
JL
844 rc = generic_write_checks(file, poffset, &write_size, 0);
845 if (rc)
846 return rc;
847
1da177e4 848 xid = GetXid();
1da177e4 849
e6a00296 850 if (*poffset > file->f_path.dentry->d_inode->i_size)
133672ef 851 long_op = CIFS_VLONG_OP; /* writes past EOF take long time */
1da177e4 852 else
133672ef 853 long_op = CIFS_LONG_OP;
1da177e4
LT
854
855 for (total_written = 0; write_size > total_written;
856 total_written += bytes_written) {
857 rc = -EAGAIN;
858 while (rc == -EAGAIN) {
859 if (file->private_data == NULL) {
860 /* file has been closed on us */
861 FreeXid(xid);
862 /* if we have gotten here we have written some data
863 and blocked, and the file has been freed on us while
864 we blocked so return what we managed to write */
865 return total_written;
fb8c4b14 866 }
1da177e4
LT
867 if (open_file->closePend) {
868 FreeXid(xid);
869 if (total_written)
870 return total_written;
871 else
872 return -EBADF;
873 }
874 if (open_file->invalidHandle) {
1da177e4
LT
875 /* we could deadlock if we called
876 filemap_fdatawait from here so tell
877 reopen_file not to flush data to server
878 now */
4b18f2a9 879 rc = cifs_reopen_file(file, false);
1da177e4
LT
880 if (rc != 0)
881 break;
882 }
883
884 rc = CIFSSMBWrite(xid, pTcon,
885 open_file->netfid,
886 min_t(const int, cifs_sb->wsize,
887 write_size - total_written),
888 *poffset, &bytes_written,
889 NULL, write_data + total_written, long_op);
890 }
891 if (rc || (bytes_written == 0)) {
892 if (total_written)
893 break;
894 else {
895 FreeXid(xid);
896 return rc;
897 }
898 } else
899 *poffset += bytes_written;
133672ef 900 long_op = CIFS_STD_OP; /* subsequent writes fast -
1da177e4
LT
901 15 seconds is plenty */
902 }
903
a4544347 904 cifs_stats_bytes_written(pTcon, total_written);
1da177e4
LT
905
906 /* since the write may have blocked check these pointers again */
3677db10
SF
907 if ((file->f_path.dentry) && (file->f_path.dentry->d_inode)) {
908 struct inode *inode = file->f_path.dentry->d_inode;
fb8c4b14
SF
909/* Do not update local mtime - server will set its actual value on write
910 * inode->i_ctime = inode->i_mtime =
3677db10
SF
911 * current_fs_time(inode->i_sb);*/
912 if (total_written > 0) {
913 spin_lock(&inode->i_lock);
914 if (*poffset > file->f_path.dentry->d_inode->i_size)
915 i_size_write(file->f_path.dentry->d_inode,
1da177e4 916 *poffset);
3677db10 917 spin_unlock(&inode->i_lock);
1da177e4 918 }
fb8c4b14 919 mark_inode_dirty_sync(file->f_path.dentry->d_inode);
1da177e4
LT
920 }
921 FreeXid(xid);
922 return total_written;
923}
924
925static ssize_t cifs_write(struct file *file, const char *write_data,
d9414774 926 size_t write_size, loff_t *poffset)
1da177e4
LT
927{
928 int rc = 0;
929 unsigned int bytes_written = 0;
930 unsigned int total_written;
931 struct cifs_sb_info *cifs_sb;
932 struct cifsTconInfo *pTcon;
933 int xid, long_op;
934 struct cifsFileInfo *open_file;
935
e6a00296 936 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
1da177e4
LT
937
938 pTcon = cifs_sb->tcon;
939
fb8c4b14 940 cFYI(1, ("write %zd bytes to offset %lld of %s", write_size,
e6a00296 941 *poffset, file->f_path.dentry->d_name.name));
1da177e4
LT
942
943 if (file->private_data == NULL)
944 return -EBADF;
c33f8d32 945 open_file = (struct cifsFileInfo *)file->private_data;
50c2f753 946
1da177e4 947 xid = GetXid();
1da177e4 948
e6a00296 949 if (*poffset > file->f_path.dentry->d_inode->i_size)
133672ef 950 long_op = CIFS_VLONG_OP; /* writes past EOF can be slow */
1da177e4 951 else
133672ef 952 long_op = CIFS_LONG_OP;
1da177e4
LT
953
954 for (total_written = 0; write_size > total_written;
955 total_written += bytes_written) {
956 rc = -EAGAIN;
957 while (rc == -EAGAIN) {
958 if (file->private_data == NULL) {
959 /* file has been closed on us */
960 FreeXid(xid);
961 /* if we have gotten here we have written some data
962 and blocked, and the file has been freed on us
fb8c4b14 963 while we blocked so return what we managed to
1da177e4
LT
964 write */
965 return total_written;
fb8c4b14 966 }
1da177e4
LT
967 if (open_file->closePend) {
968 FreeXid(xid);
969 if (total_written)
970 return total_written;
971 else
972 return -EBADF;
973 }
974 if (open_file->invalidHandle) {
1da177e4
LT
975 /* we could deadlock if we called
976 filemap_fdatawait from here so tell
fb8c4b14 977 reopen_file not to flush data to
1da177e4 978 server now */
4b18f2a9 979 rc = cifs_reopen_file(file, false);
1da177e4
LT
980 if (rc != 0)
981 break;
982 }
fb8c4b14
SF
983 if (experimEnabled || (pTcon->ses->server &&
984 ((pTcon->ses->server->secMode &
08775834 985 (SECMODE_SIGN_REQUIRED | SECMODE_SIGN_ENABLED))
c01f36a8 986 == 0))) {
3e84469d
SF
987 struct kvec iov[2];
988 unsigned int len;
989
0ae0efad 990 len = min((size_t)cifs_sb->wsize,
3e84469d
SF
991 write_size - total_written);
992 /* iov[0] is reserved for smb header */
993 iov[1].iov_base = (char *)write_data +
994 total_written;
995 iov[1].iov_len = len;
d6e04ae6 996 rc = CIFSSMBWrite2(xid, pTcon,
3e84469d 997 open_file->netfid, len,
d6e04ae6 998 *poffset, &bytes_written,
3e84469d 999 iov, 1, long_op);
d6e04ae6 1000 } else
60808233
SF
1001 rc = CIFSSMBWrite(xid, pTcon,
1002 open_file->netfid,
1003 min_t(const int, cifs_sb->wsize,
1004 write_size - total_written),
1005 *poffset, &bytes_written,
1006 write_data + total_written,
1007 NULL, long_op);
1da177e4
LT
1008 }
1009 if (rc || (bytes_written == 0)) {
1010 if (total_written)
1011 break;
1012 else {
1013 FreeXid(xid);
1014 return rc;
1015 }
1016 } else
1017 *poffset += bytes_written;
133672ef 1018 long_op = CIFS_STD_OP; /* subsequent writes fast -
1da177e4
LT
1019 15 seconds is plenty */
1020 }
1021
a4544347 1022 cifs_stats_bytes_written(pTcon, total_written);
1da177e4
LT
1023
1024 /* since the write may have blocked check these pointers again */
3677db10 1025 if ((file->f_path.dentry) && (file->f_path.dentry->d_inode)) {
004c46b9 1026/*BB We could make this contingent on superblock ATIME flag too */
3677db10
SF
1027/* file->f_path.dentry->d_inode->i_ctime =
1028 file->f_path.dentry->d_inode->i_mtime = CURRENT_TIME;*/
1029 if (total_written > 0) {
1030 spin_lock(&file->f_path.dentry->d_inode->i_lock);
1031 if (*poffset > file->f_path.dentry->d_inode->i_size)
1032 i_size_write(file->f_path.dentry->d_inode,
1033 *poffset);
1034 spin_unlock(&file->f_path.dentry->d_inode->i_lock);
1da177e4 1035 }
3677db10 1036 mark_inode_dirty_sync(file->f_path.dentry->d_inode);
1da177e4
LT
1037 }
1038 FreeXid(xid);
1039 return total_written;
1040}
1041
630f3f0c
SF
1042#ifdef CONFIG_CIFS_EXPERIMENTAL
1043struct cifsFileInfo *find_readable_file(struct cifsInodeInfo *cifs_inode)
1044{
1045 struct cifsFileInfo *open_file = NULL;
1046
1047 read_lock(&GlobalSMBSeslock);
1048 /* we could simply get the first_list_entry since write-only entries
1049 are always at the end of the list but since the first entry might
1050 have a close pending, we go through the whole list */
1051 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
1052 if (open_file->closePend)
1053 continue;
1054 if (open_file->pfile && ((open_file->pfile->f_flags & O_RDWR) ||
1055 (open_file->pfile->f_flags & O_RDONLY))) {
1056 if (!open_file->invalidHandle) {
1057 /* found a good file */
1058 /* lock it so it will not be closed on us */
1059 atomic_inc(&open_file->wrtPending);
1060 read_unlock(&GlobalSMBSeslock);
1061 return open_file;
1062 } /* else might as well continue, and look for
1063 another, or simply have the caller reopen it
1064 again rather than trying to fix this handle */
1065 } else /* write only file */
1066 break; /* write only files are last so must be done */
1067 }
1068 read_unlock(&GlobalSMBSeslock);
1069 return NULL;
1070}
1071#endif
1072
dd99cd80 1073struct cifsFileInfo *find_writable_file(struct cifsInodeInfo *cifs_inode)
6148a742
SF
1074{
1075 struct cifsFileInfo *open_file;
2846d386 1076 bool any_available = false;
dd99cd80 1077 int rc;
6148a742 1078
60808233
SF
1079 /* Having a null inode here (because mapping->host was set to zero by
1080 the VFS or MM) should not happen but we had reports of on oops (due to
1081 it being zero) during stress testcases so we need to check for it */
1082
fb8c4b14
SF
1083 if (cifs_inode == NULL) {
1084 cERROR(1, ("Null inode passed to cifs_writeable_file"));
60808233
SF
1085 dump_stack();
1086 return NULL;
1087 }
1088
6148a742 1089 read_lock(&GlobalSMBSeslock);
9b22b0b7 1090refind_writable:
6148a742 1091 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
2846d386
JL
1092 if (open_file->closePend ||
1093 (!any_available && open_file->pid != current->tgid))
6148a742 1094 continue;
2846d386 1095
6148a742
SF
1096 if (open_file->pfile &&
1097 ((open_file->pfile->f_flags & O_RDWR) ||
1098 (open_file->pfile->f_flags & O_WRONLY))) {
23e7dd7d 1099 atomic_inc(&open_file->wrtPending);
9b22b0b7
SF
1100
1101 if (!open_file->invalidHandle) {
1102 /* found a good writable file */
1103 read_unlock(&GlobalSMBSeslock);
1104 return open_file;
1105 }
8840dee9 1106
6148a742 1107 read_unlock(&GlobalSMBSeslock);
9b22b0b7 1108 /* Had to unlock since following call can block */
4b18f2a9 1109 rc = cifs_reopen_file(open_file->pfile, false);
8840dee9 1110 if (!rc) {
9b22b0b7
SF
1111 if (!open_file->closePend)
1112 return open_file;
1113 else { /* start over in case this was deleted */
1114 /* since the list could be modified */
37c0eb46 1115 read_lock(&GlobalSMBSeslock);
15745320 1116 atomic_dec(&open_file->wrtPending);
9b22b0b7 1117 goto refind_writable;
37c0eb46
SF
1118 }
1119 }
9b22b0b7
SF
1120
1121 /* if it fails, try another handle if possible -
1122 (we can not do this if closePending since
1123 loop could be modified - in which case we
1124 have to start at the beginning of the list
1125 again. Note that it would be bad
1126 to hold up writepages here (rather than
1127 in caller) with continuous retries */
1128 cFYI(1, ("wp failed on reopen file"));
1129 read_lock(&GlobalSMBSeslock);
1130 /* can not use this handle, no write
1131 pending on this one after all */
1132 atomic_dec(&open_file->wrtPending);
8840dee9 1133
9b22b0b7
SF
1134 if (open_file->closePend) /* list could have changed */
1135 goto refind_writable;
1136 /* else we simply continue to the next entry. Thus
1137 we do not loop on reopen errors. If we
1138 can not reopen the file, for example if we
1139 reconnected to a server with another client
1140 racing to delete or lock the file we would not
1141 make progress if we restarted before the beginning
1142 of the loop here. */
6148a742
SF
1143 }
1144 }
2846d386
JL
1145 /* couldn't find useable FH with same pid, try any available */
1146 if (!any_available) {
1147 any_available = true;
1148 goto refind_writable;
1149 }
6148a742
SF
1150 read_unlock(&GlobalSMBSeslock);
1151 return NULL;
1152}
1153
1da177e4
LT
1154static int cifs_partialpagewrite(struct page *page, unsigned from, unsigned to)
1155{
1156 struct address_space *mapping = page->mapping;
1157 loff_t offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
1158 char *write_data;
1159 int rc = -EFAULT;
1160 int bytes_written = 0;
1161 struct cifs_sb_info *cifs_sb;
1162 struct cifsTconInfo *pTcon;
1163 struct inode *inode;
6148a742 1164 struct cifsFileInfo *open_file;
1da177e4
LT
1165
1166 if (!mapping || !mapping->host)
1167 return -EFAULT;
1168
1169 inode = page->mapping->host;
1170 cifs_sb = CIFS_SB(inode->i_sb);
1171 pTcon = cifs_sb->tcon;
1172
1173 offset += (loff_t)from;
1174 write_data = kmap(page);
1175 write_data += from;
1176
1177 if ((to > PAGE_CACHE_SIZE) || (from > to)) {
1178 kunmap(page);
1179 return -EIO;
1180 }
1181
1182 /* racing with truncate? */
1183 if (offset > mapping->host->i_size) {
1184 kunmap(page);
1185 return 0; /* don't care */
1186 }
1187
1188 /* check to make sure that we are not extending the file */
1189 if (mapping->host->i_size - offset < (loff_t)to)
fb8c4b14 1190 to = (unsigned)(mapping->host->i_size - offset);
1da177e4 1191
6148a742
SF
1192 open_file = find_writable_file(CIFS_I(mapping->host));
1193 if (open_file) {
1194 bytes_written = cifs_write(open_file->pfile, write_data,
1195 to-from, &offset);
23e7dd7d 1196 atomic_dec(&open_file->wrtPending);
1da177e4 1197 /* Does mm or vfs already set times? */
6148a742 1198 inode->i_atime = inode->i_mtime = current_fs_time(inode->i_sb);
bb5a9a04 1199 if ((bytes_written > 0) && (offset))
6148a742 1200 rc = 0;
bb5a9a04
SF
1201 else if (bytes_written < 0)
1202 rc = bytes_written;
6148a742 1203 } else {
1da177e4
LT
1204 cFYI(1, ("No writeable filehandles for inode"));
1205 rc = -EIO;
1206 }
1207
1208 kunmap(page);
1209 return rc;
1210}
1211
1da177e4 1212static int cifs_writepages(struct address_space *mapping,
37c0eb46 1213 struct writeback_control *wbc)
1da177e4 1214{
37c0eb46
SF
1215 struct backing_dev_info *bdi = mapping->backing_dev_info;
1216 unsigned int bytes_to_write;
1217 unsigned int bytes_written;
1218 struct cifs_sb_info *cifs_sb;
1219 int done = 0;
111ebb6e 1220 pgoff_t end;
37c0eb46 1221 pgoff_t index;
fb8c4b14
SF
1222 int range_whole = 0;
1223 struct kvec *iov;
84d2f07e 1224 int len;
37c0eb46
SF
1225 int n_iov = 0;
1226 pgoff_t next;
1227 int nr_pages;
1228 __u64 offset = 0;
23e7dd7d 1229 struct cifsFileInfo *open_file;
37c0eb46
SF
1230 struct page *page;
1231 struct pagevec pvec;
1232 int rc = 0;
1233 int scanned = 0;
1da177e4
LT
1234 int xid;
1235
37c0eb46 1236 cifs_sb = CIFS_SB(mapping->host->i_sb);
50c2f753 1237
37c0eb46
SF
1238 /*
1239 * If wsize is smaller that the page cache size, default to writing
1240 * one page at a time via cifs_writepage
1241 */
1242 if (cifs_sb->wsize < PAGE_CACHE_SIZE)
1243 return generic_writepages(mapping, wbc);
1244
fb8c4b14
SF
1245 if ((cifs_sb->tcon->ses) && (cifs_sb->tcon->ses->server))
1246 if (cifs_sb->tcon->ses->server->secMode &
1247 (SECMODE_SIGN_REQUIRED | SECMODE_SIGN_ENABLED))
1248 if (!experimEnabled)
60808233 1249 return generic_writepages(mapping, wbc);
4a77118c 1250
9a0c8230 1251 iov = kmalloc(32 * sizeof(struct kvec), GFP_KERNEL);
fb8c4b14 1252 if (iov == NULL)
9a0c8230
SF
1253 return generic_writepages(mapping, wbc);
1254
1255
37c0eb46
SF
1256 /*
1257 * BB: Is this meaningful for a non-block-device file system?
1258 * If it is, we should test it again after we do I/O
1259 */
1260 if (wbc->nonblocking && bdi_write_congested(bdi)) {
1261 wbc->encountered_congestion = 1;
9a0c8230 1262 kfree(iov);
37c0eb46
SF
1263 return 0;
1264 }
1265
1da177e4
LT
1266 xid = GetXid();
1267
37c0eb46 1268 pagevec_init(&pvec, 0);
111ebb6e 1269 if (wbc->range_cyclic) {
37c0eb46 1270 index = mapping->writeback_index; /* Start from prev offset */
111ebb6e
OH
1271 end = -1;
1272 } else {
1273 index = wbc->range_start >> PAGE_CACHE_SHIFT;
1274 end = wbc->range_end >> PAGE_CACHE_SHIFT;
1275 if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
1276 range_whole = 1;
37c0eb46
SF
1277 scanned = 1;
1278 }
1279retry:
1280 while (!done && (index <= end) &&
1281 (nr_pages = pagevec_lookup_tag(&pvec, mapping, &index,
1282 PAGECACHE_TAG_DIRTY,
1283 min(end - index, (pgoff_t)PAGEVEC_SIZE - 1) + 1))) {
1284 int first;
1285 unsigned int i;
1286
37c0eb46
SF
1287 first = -1;
1288 next = 0;
1289 n_iov = 0;
1290 bytes_to_write = 0;
1291
1292 for (i = 0; i < nr_pages; i++) {
1293 page = pvec.pages[i];
1294 /*
1295 * At this point we hold neither mapping->tree_lock nor
1296 * lock on the page itself: the page may be truncated or
1297 * invalidated (changing page->mapping to NULL), or even
1298 * swizzled back from swapper_space to tmpfs file
1299 * mapping
1300 */
1301
1302 if (first < 0)
1303 lock_page(page);
529ae9aa 1304 else if (!trylock_page(page))
37c0eb46
SF
1305 break;
1306
1307 if (unlikely(page->mapping != mapping)) {
1308 unlock_page(page);
1309 break;
1310 }
1311
111ebb6e 1312 if (!wbc->range_cyclic && page->index > end) {
37c0eb46
SF
1313 done = 1;
1314 unlock_page(page);
1315 break;
1316 }
1317
1318 if (next && (page->index != next)) {
1319 /* Not next consecutive page */
1320 unlock_page(page);
1321 break;
1322 }
1323
1324 if (wbc->sync_mode != WB_SYNC_NONE)
1325 wait_on_page_writeback(page);
1326
1327 if (PageWriteback(page) ||
cb876f45 1328 !clear_page_dirty_for_io(page)) {
37c0eb46
SF
1329 unlock_page(page);
1330 break;
1331 }
84d2f07e 1332
cb876f45
LT
1333 /*
1334 * This actually clears the dirty bit in the radix tree.
1335 * See cifs_writepage() for more commentary.
1336 */
1337 set_page_writeback(page);
1338
84d2f07e
SF
1339 if (page_offset(page) >= mapping->host->i_size) {
1340 done = 1;
1341 unlock_page(page);
cb876f45 1342 end_page_writeback(page);
84d2f07e
SF
1343 break;
1344 }
1345
37c0eb46
SF
1346 /*
1347 * BB can we get rid of this? pages are held by pvec
1348 */
1349 page_cache_get(page);
1350
84d2f07e
SF
1351 len = min(mapping->host->i_size - page_offset(page),
1352 (loff_t)PAGE_CACHE_SIZE);
1353
37c0eb46
SF
1354 /* reserve iov[0] for the smb header */
1355 n_iov++;
1356 iov[n_iov].iov_base = kmap(page);
84d2f07e
SF
1357 iov[n_iov].iov_len = len;
1358 bytes_to_write += len;
37c0eb46
SF
1359
1360 if (first < 0) {
1361 first = i;
1362 offset = page_offset(page);
1363 }
1364 next = page->index + 1;
1365 if (bytes_to_write + PAGE_CACHE_SIZE > cifs_sb->wsize)
1366 break;
1367 }
1368 if (n_iov) {
23e7dd7d
SF
1369 /* Search for a writable handle every time we call
1370 * CIFSSMBWrite2. We can't rely on the last handle
1371 * we used to still be valid
1372 */
1373 open_file = find_writable_file(CIFS_I(mapping->host));
1374 if (!open_file) {
1375 cERROR(1, ("No writable handles for inode"));
1376 rc = -EBADF;
1047abc1 1377 } else {
23e7dd7d
SF
1378 rc = CIFSSMBWrite2(xid, cifs_sb->tcon,
1379 open_file->netfid,
1380 bytes_to_write, offset,
1381 &bytes_written, iov, n_iov,
133672ef 1382 CIFS_LONG_OP);
23e7dd7d
SF
1383 atomic_dec(&open_file->wrtPending);
1384 if (rc || bytes_written < bytes_to_write) {
63135e08 1385 cERROR(1, ("Write2 ret %d, wrote %d",
23e7dd7d
SF
1386 rc, bytes_written));
1387 /* BB what if continued retry is
1388 requested via mount flags? */
cea21805
JL
1389 if (rc == -ENOSPC)
1390 set_bit(AS_ENOSPC, &mapping->flags);
1391 else
1392 set_bit(AS_EIO, &mapping->flags);
23e7dd7d
SF
1393 } else {
1394 cifs_stats_bytes_written(cifs_sb->tcon,
1395 bytes_written);
1396 }
37c0eb46
SF
1397 }
1398 for (i = 0; i < n_iov; i++) {
1399 page = pvec.pages[first + i];
eb9bdaa3
SF
1400 /* Should we also set page error on
1401 success rc but too little data written? */
1402 /* BB investigate retry logic on temporary
1403 server crash cases and how recovery works
fb8c4b14
SF
1404 when page marked as error */
1405 if (rc)
eb9bdaa3 1406 SetPageError(page);
37c0eb46
SF
1407 kunmap(page);
1408 unlock_page(page);
cb876f45 1409 end_page_writeback(page);
37c0eb46
SF
1410 page_cache_release(page);
1411 }
1412 if ((wbc->nr_to_write -= n_iov) <= 0)
1413 done = 1;
1414 index = next;
b066a48c
DK
1415 } else
1416 /* Need to re-find the pages we skipped */
1417 index = pvec.pages[0]->index + 1;
1418
37c0eb46
SF
1419 pagevec_release(&pvec);
1420 }
1421 if (!scanned && !done) {
1422 /*
1423 * We hit the last page and there is more work to be done: wrap
1424 * back to the start of the file
1425 */
1426 scanned = 1;
1427 index = 0;
1428 goto retry;
1429 }
111ebb6e 1430 if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
37c0eb46
SF
1431 mapping->writeback_index = index;
1432
1da177e4 1433 FreeXid(xid);
9a0c8230 1434 kfree(iov);
1da177e4
LT
1435 return rc;
1436}
1da177e4 1437
fb8c4b14 1438static int cifs_writepage(struct page *page, struct writeback_control *wbc)
1da177e4
LT
1439{
1440 int rc = -EFAULT;
1441 int xid;
1442
1443 xid = GetXid();
1444/* BB add check for wbc flags */
1445 page_cache_get(page);
ad7a2926 1446 if (!PageUptodate(page))
1da177e4 1447 cFYI(1, ("ppw - page not up to date"));
cb876f45
LT
1448
1449 /*
1450 * Set the "writeback" flag, and clear "dirty" in the radix tree.
1451 *
1452 * A writepage() implementation always needs to do either this,
1453 * or re-dirty the page with "redirty_page_for_writepage()" in
1454 * the case of a failure.
1455 *
1456 * Just unlocking the page will cause the radix tree tag-bits
1457 * to fail to update with the state of the page correctly.
1458 */
fb8c4b14 1459 set_page_writeback(page);
1da177e4
LT
1460 rc = cifs_partialpagewrite(page, 0, PAGE_CACHE_SIZE);
1461 SetPageUptodate(page); /* BB add check for error and Clearuptodate? */
1462 unlock_page(page);
cb876f45
LT
1463 end_page_writeback(page);
1464 page_cache_release(page);
1da177e4
LT
1465 FreeXid(xid);
1466 return rc;
1467}
1468
d9414774
NP
1469static int cifs_write_end(struct file *file, struct address_space *mapping,
1470 loff_t pos, unsigned len, unsigned copied,
1471 struct page *page, void *fsdata)
1da177e4 1472{
d9414774
NP
1473 int rc;
1474 struct inode *inode = mapping->host;
1da177e4 1475
d9414774
NP
1476 cFYI(1, ("write_end for page %p from pos %lld with %d bytes",
1477 page, pos, copied));
1478
a98ee8c1
JL
1479 if (PageChecked(page)) {
1480 if (copied == len)
1481 SetPageUptodate(page);
1482 ClearPageChecked(page);
1483 } else if (!PageUptodate(page) && copied == PAGE_CACHE_SIZE)
d9414774 1484 SetPageUptodate(page);
ad7a2926 1485
1da177e4 1486 if (!PageUptodate(page)) {
d9414774
NP
1487 char *page_data;
1488 unsigned offset = pos & (PAGE_CACHE_SIZE - 1);
1489 int xid;
1490
1491 xid = GetXid();
1da177e4
LT
1492 /* this is probably better than directly calling
1493 partialpage_write since in this function the file handle is
1494 known which we might as well leverage */
1495 /* BB check if anything else missing out of ppw
1496 such as updating last write time */
1497 page_data = kmap(page);
d9414774
NP
1498 rc = cifs_write(file, page_data + offset, copied, &pos);
1499 /* if (rc < 0) should we set writebehind rc? */
1da177e4 1500 kunmap(page);
d9414774
NP
1501
1502 FreeXid(xid);
fb8c4b14 1503 } else {
d9414774
NP
1504 rc = copied;
1505 pos += copied;
1da177e4
LT
1506 set_page_dirty(page);
1507 }
1508
d9414774
NP
1509 if (rc > 0) {
1510 spin_lock(&inode->i_lock);
1511 if (pos > inode->i_size)
1512 i_size_write(inode, pos);
1513 spin_unlock(&inode->i_lock);
1514 }
1515
1516 unlock_page(page);
1517 page_cache_release(page);
1518
1da177e4
LT
1519 return rc;
1520}
1521
1522int cifs_fsync(struct file *file, struct dentry *dentry, int datasync)
1523{
1524 int xid;
1525 int rc = 0;
b298f223
SF
1526 struct cifsTconInfo *tcon;
1527 struct cifsFileInfo *smbfile =
1528 (struct cifsFileInfo *)file->private_data;
e6a00296 1529 struct inode *inode = file->f_path.dentry->d_inode;
1da177e4
LT
1530
1531 xid = GetXid();
1532
fb8c4b14 1533 cFYI(1, ("Sync file - name: %s datasync: 0x%x",
1da177e4 1534 dentry->d_name.name, datasync));
50c2f753 1535
cea21805
JL
1536 rc = filemap_write_and_wait(inode->i_mapping);
1537 if (rc == 0) {
1538 rc = CIFS_I(inode)->write_behind_rc;
1da177e4 1539 CIFS_I(inode)->write_behind_rc = 0;
b298f223 1540 tcon = CIFS_SB(inode->i_sb)->tcon;
be652445
SF
1541 if (!rc && tcon && smbfile &&
1542 !(cifs_sb->mnt_cifs_flags & CIFS_MOUNT_NO_SSYNC))
b298f223 1543 rc = CIFSSMBFlush(xid, tcon, smbfile->netfid);
cea21805 1544 }
b298f223 1545
1da177e4
LT
1546 FreeXid(xid);
1547 return rc;
1548}
1549
3978d717 1550/* static void cifs_sync_page(struct page *page)
1da177e4
LT
1551{
1552 struct address_space *mapping;
1553 struct inode *inode;
1554 unsigned long index = page->index;
1555 unsigned int rpages = 0;
1556 int rc = 0;
1557
1558 cFYI(1, ("sync page %p",page));
1559 mapping = page->mapping;
1560 if (!mapping)
1561 return 0;
1562 inode = mapping->host;
1563 if (!inode)
3978d717 1564 return; */
1da177e4 1565
fb8c4b14 1566/* fill in rpages then
1da177e4
LT
1567 result = cifs_pagein_inode(inode, index, rpages); */ /* BB finish */
1568
26a21b98 1569/* cFYI(1, ("rpages is %d for sync page of Index %ld", rpages, index));
1da177e4 1570
3978d717 1571#if 0
1da177e4
LT
1572 if (rc < 0)
1573 return rc;
1574 return 0;
3978d717 1575#endif
1da177e4
LT
1576} */
1577
1578/*
1579 * As file closes, flush all cached write data for this inode checking
1580 * for write behind errors.
1581 */
75e1fcc0 1582int cifs_flush(struct file *file, fl_owner_t id)
1da177e4 1583{
fb8c4b14 1584 struct inode *inode = file->f_path.dentry->d_inode;
1da177e4
LT
1585 int rc = 0;
1586
1587 /* Rather than do the steps manually:
1588 lock the inode for writing
1589 loop through pages looking for write behind data (dirty pages)
1590 coalesce into contiguous 16K (or smaller) chunks to write to server
1591 send to server (prefer in parallel)
1592 deal with writebehind errors
1593 unlock inode for writing
1594 filemapfdatawrite appears easier for the time being */
1595
1596 rc = filemap_fdatawrite(inode->i_mapping);
cea21805
JL
1597 /* reset wb rc if we were able to write out dirty pages */
1598 if (!rc) {
1599 rc = CIFS_I(inode)->write_behind_rc;
1da177e4 1600 CIFS_I(inode)->write_behind_rc = 0;
cea21805 1601 }
50c2f753 1602
fb8c4b14 1603 cFYI(1, ("Flush inode %p file %p rc %d", inode, file, rc));
1da177e4
LT
1604
1605 return rc;
1606}
1607
1608ssize_t cifs_user_read(struct file *file, char __user *read_data,
1609 size_t read_size, loff_t *poffset)
1610{
1611 int rc = -EACCES;
1612 unsigned int bytes_read = 0;
1613 unsigned int total_read = 0;
1614 unsigned int current_read_size;
1615 struct cifs_sb_info *cifs_sb;
1616 struct cifsTconInfo *pTcon;
1617 int xid;
1618 struct cifsFileInfo *open_file;
1619 char *smb_read_data;
1620 char __user *current_offset;
1621 struct smb_com_read_rsp *pSMBr;
1622
1623 xid = GetXid();
e6a00296 1624 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
1da177e4
LT
1625 pTcon = cifs_sb->tcon;
1626
1627 if (file->private_data == NULL) {
1628 FreeXid(xid);
1629 return -EBADF;
1630 }
1631 open_file = (struct cifsFileInfo *)file->private_data;
1632
ad7a2926 1633 if ((file->f_flags & O_ACCMODE) == O_WRONLY)
1da177e4 1634 cFYI(1, ("attempting read on write only file instance"));
ad7a2926 1635
1da177e4
LT
1636 for (total_read = 0, current_offset = read_data;
1637 read_size > total_read;
1638 total_read += bytes_read, current_offset += bytes_read) {
fb8c4b14 1639 current_read_size = min_t(const int, read_size - total_read,
1da177e4
LT
1640 cifs_sb->rsize);
1641 rc = -EAGAIN;
1642 smb_read_data = NULL;
1643 while (rc == -EAGAIN) {
ec637e3f 1644 int buf_type = CIFS_NO_BUFFER;
fb8c4b14 1645 if ((open_file->invalidHandle) &&
1da177e4 1646 (!open_file->closePend)) {
4b18f2a9 1647 rc = cifs_reopen_file(file, true);
1da177e4
LT
1648 if (rc != 0)
1649 break;
1650 }
bfa0d75a 1651 rc = CIFSSMBRead(xid, pTcon,
ec637e3f
SF
1652 open_file->netfid,
1653 current_read_size, *poffset,
1654 &bytes_read, &smb_read_data,
1655 &buf_type);
1da177e4 1656 pSMBr = (struct smb_com_read_rsp *)smb_read_data;
1da177e4 1657 if (smb_read_data) {
93544cc6
SF
1658 if (copy_to_user(current_offset,
1659 smb_read_data +
1660 4 /* RFC1001 length field */ +
1661 le16_to_cpu(pSMBr->DataOffset),
ad7a2926 1662 bytes_read))
93544cc6 1663 rc = -EFAULT;
93544cc6 1664
fb8c4b14 1665 if (buf_type == CIFS_SMALL_BUFFER)
ec637e3f 1666 cifs_small_buf_release(smb_read_data);
fb8c4b14 1667 else if (buf_type == CIFS_LARGE_BUFFER)
ec637e3f 1668 cifs_buf_release(smb_read_data);
1da177e4
LT
1669 smb_read_data = NULL;
1670 }
1671 }
1672 if (rc || (bytes_read == 0)) {
1673 if (total_read) {
1674 break;
1675 } else {
1676 FreeXid(xid);
1677 return rc;
1678 }
1679 } else {
a4544347 1680 cifs_stats_bytes_read(pTcon, bytes_read);
1da177e4
LT
1681 *poffset += bytes_read;
1682 }
1683 }
1684 FreeXid(xid);
1685 return total_read;
1686}
1687
1688
1689static ssize_t cifs_read(struct file *file, char *read_data, size_t read_size,
1690 loff_t *poffset)
1691{
1692 int rc = -EACCES;
1693 unsigned int bytes_read = 0;
1694 unsigned int total_read;
1695 unsigned int current_read_size;
1696 struct cifs_sb_info *cifs_sb;
1697 struct cifsTconInfo *pTcon;
1698 int xid;
1699 char *current_offset;
1700 struct cifsFileInfo *open_file;
ec637e3f 1701 int buf_type = CIFS_NO_BUFFER;
1da177e4
LT
1702
1703 xid = GetXid();
e6a00296 1704 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
1da177e4
LT
1705 pTcon = cifs_sb->tcon;
1706
1707 if (file->private_data == NULL) {
1708 FreeXid(xid);
1709 return -EBADF;
1710 }
1711 open_file = (struct cifsFileInfo *)file->private_data;
1712
1713 if ((file->f_flags & O_ACCMODE) == O_WRONLY)
1714 cFYI(1, ("attempting read on write only file instance"));
1715
fb8c4b14 1716 for (total_read = 0, current_offset = read_data;
1da177e4
LT
1717 read_size > total_read;
1718 total_read += bytes_read, current_offset += bytes_read) {
1719 current_read_size = min_t(const int, read_size - total_read,
1720 cifs_sb->rsize);
f9f5c817
SF
1721 /* For windows me and 9x we do not want to request more
1722 than it negotiated since it will refuse the read then */
fb8c4b14 1723 if ((pTcon->ses) &&
f9f5c817
SF
1724 !(pTcon->ses->capabilities & CAP_LARGE_FILES)) {
1725 current_read_size = min_t(const int, current_read_size,
1726 pTcon->ses->server->maxBuf - 128);
1727 }
1da177e4
LT
1728 rc = -EAGAIN;
1729 while (rc == -EAGAIN) {
fb8c4b14 1730 if ((open_file->invalidHandle) &&
1da177e4 1731 (!open_file->closePend)) {
4b18f2a9 1732 rc = cifs_reopen_file(file, true);
1da177e4
LT
1733 if (rc != 0)
1734 break;
1735 }
bfa0d75a 1736 rc = CIFSSMBRead(xid, pTcon,
ec637e3f
SF
1737 open_file->netfid,
1738 current_read_size, *poffset,
1739 &bytes_read, &current_offset,
1740 &buf_type);
1da177e4
LT
1741 }
1742 if (rc || (bytes_read == 0)) {
1743 if (total_read) {
1744 break;
1745 } else {
1746 FreeXid(xid);
1747 return rc;
1748 }
1749 } else {
a4544347 1750 cifs_stats_bytes_read(pTcon, total_read);
1da177e4
LT
1751 *poffset += bytes_read;
1752 }
1753 }
1754 FreeXid(xid);
1755 return total_read;
1756}
1757
1758int cifs_file_mmap(struct file *file, struct vm_area_struct *vma)
1759{
e6a00296 1760 struct dentry *dentry = file->f_path.dentry;
1da177e4
LT
1761 int rc, xid;
1762
1763 xid = GetXid();
1764 rc = cifs_revalidate(dentry);
1765 if (rc) {
1766 cFYI(1, ("Validation prior to mmap failed, error=%d", rc));
1767 FreeXid(xid);
1768 return rc;
1769 }
1770 rc = generic_file_mmap(file, vma);
1771 FreeXid(xid);
1772 return rc;
1773}
1774
1775
fb8c4b14 1776static void cifs_copy_cache_pages(struct address_space *mapping,
1da177e4
LT
1777 struct list_head *pages, int bytes_read, char *data,
1778 struct pagevec *plru_pvec)
1779{
1780 struct page *page;
1781 char *target;
1782
1783 while (bytes_read > 0) {
1784 if (list_empty(pages))
1785 break;
1786
1787 page = list_entry(pages->prev, struct page, lru);
1788 list_del(&page->lru);
1789
1790 if (add_to_page_cache(page, mapping, page->index,
1791 GFP_KERNEL)) {
1792 page_cache_release(page);
1793 cFYI(1, ("Add page cache failed"));
3079ca62
SF
1794 data += PAGE_CACHE_SIZE;
1795 bytes_read -= PAGE_CACHE_SIZE;
1da177e4
LT
1796 continue;
1797 }
1798
fb8c4b14 1799 target = kmap_atomic(page, KM_USER0);
1da177e4
LT
1800
1801 if (PAGE_CACHE_SIZE > bytes_read) {
1802 memcpy(target, data, bytes_read);
1803 /* zero the tail end of this partial page */
fb8c4b14 1804 memset(target + bytes_read, 0,
1da177e4
LT
1805 PAGE_CACHE_SIZE - bytes_read);
1806 bytes_read = 0;
1807 } else {
1808 memcpy(target, data, PAGE_CACHE_SIZE);
1809 bytes_read -= PAGE_CACHE_SIZE;
1810 }
1811 kunmap_atomic(target, KM_USER0);
1812
1813 flush_dcache_page(page);
1814 SetPageUptodate(page);
1815 unlock_page(page);
1816 if (!pagevec_add(plru_pvec, page))
4f98a2fe 1817 __pagevec_lru_add_file(plru_pvec);
1da177e4
LT
1818 data += PAGE_CACHE_SIZE;
1819 }
1820 return;
1821}
1822
1823static int cifs_readpages(struct file *file, struct address_space *mapping,
1824 struct list_head *page_list, unsigned num_pages)
1825{
1826 int rc = -EACCES;
1827 int xid;
1828 loff_t offset;
1829 struct page *page;
1830 struct cifs_sb_info *cifs_sb;
1831 struct cifsTconInfo *pTcon;
2c2130e1 1832 unsigned int bytes_read = 0;
fb8c4b14 1833 unsigned int read_size, i;
1da177e4
LT
1834 char *smb_read_data = NULL;
1835 struct smb_com_read_rsp *pSMBr;
1836 struct pagevec lru_pvec;
1837 struct cifsFileInfo *open_file;
ec637e3f 1838 int buf_type = CIFS_NO_BUFFER;
1da177e4
LT
1839
1840 xid = GetXid();
1841 if (file->private_data == NULL) {
1842 FreeXid(xid);
1843 return -EBADF;
1844 }
1845 open_file = (struct cifsFileInfo *)file->private_data;
e6a00296 1846 cifs_sb = CIFS_SB(file->f_path.dentry->d_sb);
1da177e4 1847 pTcon = cifs_sb->tcon;
bfa0d75a 1848
1da177e4 1849 pagevec_init(&lru_pvec, 0);
61de800d 1850 cFYI(DBG2, ("rpages: num pages %d", num_pages));
1da177e4
LT
1851 for (i = 0; i < num_pages; ) {
1852 unsigned contig_pages;
1853 struct page *tmp_page;
1854 unsigned long expected_index;
1855
1856 if (list_empty(page_list))
1857 break;
1858
1859 page = list_entry(page_list->prev, struct page, lru);
1860 offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
1861
1862 /* count adjacent pages that we will read into */
1863 contig_pages = 0;
fb8c4b14 1864 expected_index =
1da177e4 1865 list_entry(page_list->prev, struct page, lru)->index;
fb8c4b14 1866 list_for_each_entry_reverse(tmp_page, page_list, lru) {
1da177e4
LT
1867 if (tmp_page->index == expected_index) {
1868 contig_pages++;
1869 expected_index++;
1870 } else
fb8c4b14 1871 break;
1da177e4
LT
1872 }
1873 if (contig_pages + i > num_pages)
1874 contig_pages = num_pages - i;
1875
1876 /* for reads over a certain size could initiate async
1877 read ahead */
1878
1879 read_size = contig_pages * PAGE_CACHE_SIZE;
1880 /* Read size needs to be in multiples of one page */
1881 read_size = min_t(const unsigned int, read_size,
1882 cifs_sb->rsize & PAGE_CACHE_MASK);
90c81e0b 1883 cFYI(DBG2, ("rpages: read size 0x%x contiguous pages %d",
75865f8c 1884 read_size, contig_pages));
1da177e4
LT
1885 rc = -EAGAIN;
1886 while (rc == -EAGAIN) {
fb8c4b14 1887 if ((open_file->invalidHandle) &&
1da177e4 1888 (!open_file->closePend)) {
4b18f2a9 1889 rc = cifs_reopen_file(file, true);
1da177e4
LT
1890 if (rc != 0)
1891 break;
1892 }
1893
bfa0d75a 1894 rc = CIFSSMBRead(xid, pTcon,
ec637e3f
SF
1895 open_file->netfid,
1896 read_size, offset,
1897 &bytes_read, &smb_read_data,
1898 &buf_type);
a9d02ad4 1899 /* BB more RC checks ? */
fb8c4b14 1900 if (rc == -EAGAIN) {
1da177e4 1901 if (smb_read_data) {
fb8c4b14 1902 if (buf_type == CIFS_SMALL_BUFFER)
ec637e3f 1903 cifs_small_buf_release(smb_read_data);
fb8c4b14 1904 else if (buf_type == CIFS_LARGE_BUFFER)
ec637e3f 1905 cifs_buf_release(smb_read_data);
1da177e4
LT
1906 smb_read_data = NULL;
1907 }
1908 }
1909 }
1910 if ((rc < 0) || (smb_read_data == NULL)) {
1911 cFYI(1, ("Read error in readpages: %d", rc));
1da177e4
LT
1912 break;
1913 } else if (bytes_read > 0) {
6f88cc2e 1914 task_io_account_read(bytes_read);
1da177e4
LT
1915 pSMBr = (struct smb_com_read_rsp *)smb_read_data;
1916 cifs_copy_cache_pages(mapping, page_list, bytes_read,
1917 smb_read_data + 4 /* RFC1001 hdr */ +
1918 le16_to_cpu(pSMBr->DataOffset), &lru_pvec);
1919
1920 i += bytes_read >> PAGE_CACHE_SHIFT;
a4544347 1921 cifs_stats_bytes_read(pTcon, bytes_read);
2c2130e1 1922 if ((bytes_read & PAGE_CACHE_MASK) != bytes_read) {
1da177e4
LT
1923 i++; /* account for partial page */
1924
fb8c4b14 1925 /* server copy of file can have smaller size
1da177e4 1926 than client */
fb8c4b14
SF
1927 /* BB do we need to verify this common case ?
1928 this case is ok - if we are at server EOF
1da177e4
LT
1929 we will hit it on next read */
1930
05ac9d4b 1931 /* break; */
1da177e4
LT
1932 }
1933 } else {
1934 cFYI(1, ("No bytes read (%d) at offset %lld . "
1935 "Cleaning remaining pages from readahead list",
1936 bytes_read, offset));
fb8c4b14 1937 /* BB turn off caching and do new lookup on
1da177e4 1938 file size at server? */
1da177e4
LT
1939 break;
1940 }
1941 if (smb_read_data) {
fb8c4b14 1942 if (buf_type == CIFS_SMALL_BUFFER)
ec637e3f 1943 cifs_small_buf_release(smb_read_data);
fb8c4b14 1944 else if (buf_type == CIFS_LARGE_BUFFER)
ec637e3f 1945 cifs_buf_release(smb_read_data);
1da177e4
LT
1946 smb_read_data = NULL;
1947 }
1948 bytes_read = 0;
1949 }
1950
4f98a2fe 1951 pagevec_lru_add_file(&lru_pvec);
1da177e4
LT
1952
1953/* need to free smb_read_data buf before exit */
1954 if (smb_read_data) {
fb8c4b14 1955 if (buf_type == CIFS_SMALL_BUFFER)
47c886b3 1956 cifs_small_buf_release(smb_read_data);
fb8c4b14 1957 else if (buf_type == CIFS_LARGE_BUFFER)
47c886b3 1958 cifs_buf_release(smb_read_data);
1da177e4 1959 smb_read_data = NULL;
fb8c4b14 1960 }
1da177e4
LT
1961
1962 FreeXid(xid);
1963 return rc;
1964}
1965
1966static int cifs_readpage_worker(struct file *file, struct page *page,
1967 loff_t *poffset)
1968{
1969 char *read_data;
1970 int rc;
1971
1972 page_cache_get(page);
1973 read_data = kmap(page);
1974 /* for reads over a certain size could initiate async read ahead */
fb8c4b14 1975
1da177e4 1976 rc = cifs_read(file, read_data, PAGE_CACHE_SIZE, poffset);
fb8c4b14 1977
1da177e4
LT
1978 if (rc < 0)
1979 goto io_error;
1980 else
fb8c4b14
SF
1981 cFYI(1, ("Bytes read %d", rc));
1982
e6a00296
JJS
1983 file->f_path.dentry->d_inode->i_atime =
1984 current_fs_time(file->f_path.dentry->d_inode->i_sb);
fb8c4b14 1985
1da177e4
LT
1986 if (PAGE_CACHE_SIZE > rc)
1987 memset(read_data + rc, 0, PAGE_CACHE_SIZE - rc);
1988
1989 flush_dcache_page(page);
1990 SetPageUptodate(page);
1991 rc = 0;
fb8c4b14 1992
1da177e4 1993io_error:
fb8c4b14 1994 kunmap(page);
1da177e4
LT
1995 page_cache_release(page);
1996 return rc;
1997}
1998
1999static int cifs_readpage(struct file *file, struct page *page)
2000{
2001 loff_t offset = (loff_t)page->index << PAGE_CACHE_SHIFT;
2002 int rc = -EACCES;
2003 int xid;
2004
2005 xid = GetXid();
2006
2007 if (file->private_data == NULL) {
2008 FreeXid(xid);
2009 return -EBADF;
2010 }
2011
fb8c4b14 2012 cFYI(1, ("readpage %p at offset %d 0x%x\n",
1da177e4
LT
2013 page, (int)offset, (int)offset));
2014
2015 rc = cifs_readpage_worker(file, page, &offset);
2016
2017 unlock_page(page);
2018
2019 FreeXid(xid);
2020 return rc;
2021}
2022
a403a0a3
SF
2023static int is_inode_writable(struct cifsInodeInfo *cifs_inode)
2024{
2025 struct cifsFileInfo *open_file;
2026
2027 read_lock(&GlobalSMBSeslock);
2028 list_for_each_entry(open_file, &cifs_inode->openFileList, flist) {
2029 if (open_file->closePend)
2030 continue;
2031 if (open_file->pfile &&
2032 ((open_file->pfile->f_flags & O_RDWR) ||
2033 (open_file->pfile->f_flags & O_WRONLY))) {
2034 read_unlock(&GlobalSMBSeslock);
2035 return 1;
2036 }
2037 }
2038 read_unlock(&GlobalSMBSeslock);
2039 return 0;
2040}
2041
1da177e4
LT
2042/* We do not want to update the file size from server for inodes
2043 open for write - to avoid races with writepage extending
2044 the file - in the future we could consider allowing
fb8c4b14 2045 refreshing the inode only on increases in the file size
1da177e4
LT
2046 but this is tricky to do without racing with writebehind
2047 page caching in the current Linux kernel design */
4b18f2a9 2048bool is_size_safe_to_change(struct cifsInodeInfo *cifsInode, __u64 end_of_file)
1da177e4 2049{
a403a0a3 2050 if (!cifsInode)
4b18f2a9 2051 return true;
50c2f753 2052
a403a0a3
SF
2053 if (is_inode_writable(cifsInode)) {
2054 /* This inode is open for write at least once */
c32a0b68
SF
2055 struct cifs_sb_info *cifs_sb;
2056
c32a0b68 2057 cifs_sb = CIFS_SB(cifsInode->vfs_inode.i_sb);
ad7a2926 2058 if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_DIRECT_IO) {
fb8c4b14 2059 /* since no page cache to corrupt on directio
c32a0b68 2060 we can change size safely */
4b18f2a9 2061 return true;
c32a0b68
SF
2062 }
2063
fb8c4b14 2064 if (i_size_read(&cifsInode->vfs_inode) < end_of_file)
4b18f2a9 2065 return true;
7ba52631 2066
4b18f2a9 2067 return false;
23e7dd7d 2068 } else
4b18f2a9 2069 return true;
1da177e4
LT
2070}
2071
d9414774
NP
2072static int cifs_write_begin(struct file *file, struct address_space *mapping,
2073 loff_t pos, unsigned len, unsigned flags,
2074 struct page **pagep, void **fsdata)
1da177e4 2075{
d9414774
NP
2076 pgoff_t index = pos >> PAGE_CACHE_SHIFT;
2077 loff_t offset = pos & (PAGE_CACHE_SIZE - 1);
a98ee8c1
JL
2078 loff_t page_start = pos & PAGE_MASK;
2079 loff_t i_size;
2080 struct page *page;
2081 int rc = 0;
d9414774
NP
2082
2083 cFYI(1, ("write_begin from %lld len %d", (long long)pos, len));
2084
54566b2c 2085 page = grab_cache_page_write_begin(mapping, index, flags);
a98ee8c1
JL
2086 if (!page) {
2087 rc = -ENOMEM;
2088 goto out;
2089 }
8a236264 2090
a98ee8c1
JL
2091 if (PageUptodate(page))
2092 goto out;
8a236264 2093
a98ee8c1
JL
2094 /*
2095 * If we write a full page it will be up to date, no need to read from
2096 * the server. If the write is short, we'll end up doing a sync write
2097 * instead.
2098 */
2099 if (len == PAGE_CACHE_SIZE)
2100 goto out;
8a236264 2101
a98ee8c1
JL
2102 /*
2103 * optimize away the read when we have an oplock, and we're not
2104 * expecting to use any of the data we'd be reading in. That
2105 * is, when the page lies beyond the EOF, or straddles the EOF
2106 * and the write will cover all of the existing data.
2107 */
2108 if (CIFS_I(mapping->host)->clientCanCacheRead) {
2109 i_size = i_size_read(mapping->host);
2110 if (page_start >= i_size ||
2111 (offset == 0 && (pos + len) >= i_size)) {
2112 zero_user_segments(page, 0, offset,
2113 offset + len,
2114 PAGE_CACHE_SIZE);
2115 /*
2116 * PageChecked means that the parts of the page
2117 * to which we're not writing are considered up
2118 * to date. Once the data is copied to the
2119 * page, it can be set uptodate.
2120 */
2121 SetPageChecked(page);
2122 goto out;
2123 }
2124 }
d9414774 2125
a98ee8c1
JL
2126 if ((file->f_flags & O_ACCMODE) != O_WRONLY) {
2127 /*
2128 * might as well read a page, it is fast enough. If we get
2129 * an error, we don't need to return it. cifs_write_end will
2130 * do a sync write instead since PG_uptodate isn't set.
2131 */
2132 cifs_readpage_worker(file, page, &page_start);
8a236264
SF
2133 } else {
2134 /* we could try using another file handle if there is one -
2135 but how would we lock it to prevent close of that handle
2136 racing with this read? In any case
d9414774 2137 this will be written out by write_end so is fine */
1da177e4 2138 }
a98ee8c1
JL
2139out:
2140 *pagep = page;
2141 return rc;
1da177e4
LT
2142}
2143
f5e54d6e 2144const struct address_space_operations cifs_addr_ops = {
1da177e4
LT
2145 .readpage = cifs_readpage,
2146 .readpages = cifs_readpages,
2147 .writepage = cifs_writepage,
37c0eb46 2148 .writepages = cifs_writepages,
d9414774
NP
2149 .write_begin = cifs_write_begin,
2150 .write_end = cifs_write_end,
1da177e4
LT
2151 .set_page_dirty = __set_page_dirty_nobuffers,
2152 /* .sync_page = cifs_sync_page, */
2153 /* .direct_IO = */
2154};
273d81d6
DK
2155
2156/*
2157 * cifs_readpages requires the server to support a buffer large enough to
2158 * contain the header plus one complete page of data. Otherwise, we need
2159 * to leave cifs_readpages out of the address space operations.
2160 */
f5e54d6e 2161const struct address_space_operations cifs_addr_ops_smallbuf = {
273d81d6
DK
2162 .readpage = cifs_readpage,
2163 .writepage = cifs_writepage,
2164 .writepages = cifs_writepages,
d9414774
NP
2165 .write_begin = cifs_write_begin,
2166 .write_end = cifs_write_end,
273d81d6
DK
2167 .set_page_dirty = __set_page_dirty_nobuffers,
2168 /* .sync_page = cifs_sync_page, */
2169 /* .direct_IO = */
2170};