// SPDX-License-Identifier: GPL-2.0
/*
 * NFS server file handle treatment.
 *
 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
 * Portions Copyright (C) 1999 G. Allen Morris III <gam3@acm.org>
 * Extensive rewrite by Neil Brown <neilb@cse.unsw.edu.au> Southern-Spring 1999
 * ... and again Southern-Winter 2001 to support export_operations
 */

#include <linux/exportfs.h>

#include <linux/sunrpc/svcauth_gss.h>
#include "nfsd.h"
#include "vfs.h"
#include "auth.h"
#include "trace.h"

#define NFSDDBG_FACILITY		NFSDDBG_FH


/*
 * our acceptability function.
 * if NOSUBTREECHECK, accept anything
 * if not, require that we can walk up to exp->ex_dentry
 * doing some checks on the 'x' bits
 */
static int nfsd_acceptable(void *expv, struct dentry *dentry)
{
	struct svc_export *exp = expv;
	int rv;
	struct dentry *tdentry;
	struct dentry *parent;

	if (exp->ex_flags & NFSEXP_NOSUBTREECHECK)
		return 1;

	tdentry = dget(dentry);
39
	while (tdentry != exp->ex_path.dentry && !IS_ROOT(tdentry)) {
Linus Torvalds's avatar
Linus Torvalds committed
40 41 42
		/* make sure parents give x permission to user */
		int err;
		parent = dget_parent(tdentry);
43
		err = inode_permission(&nop_mnt_idmap,
44
				       d_inode(parent), MAY_EXEC);
Linus Torvalds's avatar
Linus Torvalds committed
45 46 47 48 49 50 51
		if (err < 0) {
			dput(parent);
			break;
		}
		dput(tdentry);
		tdentry = parent;
	}
52
	if (tdentry != exp->ex_path.dentry)
Al Viro's avatar
Al Viro committed
53
		dprintk("nfsd_acceptable failed at %p %pd\n", tdentry, tdentry);
54
	rv = (tdentry == exp->ex_path.dentry);
Linus Torvalds's avatar
Linus Torvalds committed
55 56 57 58 59 60 61 62 63
	dput(tdentry);
	return rv;
}

/* Type check. The correct error return for type mismatches does not seem to be
 * generally agreed upon. SunOS seems to use EISDIR if file isn't S_IFREG; a
 * comment in the NFSv3 spec says this is incorrect (implementation notes for
 * the write call).
 */
64
static inline __be32
65
nfsd_mode_check(struct dentry *dentry, umode_t requested)
Linus Torvalds's avatar
Linus Torvalds committed
66
{
67
	umode_t mode = d_inode(dentry)->i_mode & S_IFMT;
68 69 70

	if (requested == 0) /* the caller doesn't care */
		return nfs_ok;
71 72 73 74 75
	if (mode == requested) {
		if (mode == S_IFDIR && !d_can_lookup(dentry)) {
			WARN_ON_ONCE(1);
			return nfserr_notdir;
		}
76
		return nfs_ok;
77
	}
78 79 80
	if (mode == S_IFLNK) {
		if (requested == S_IFDIR)
			return nfserr_symlink_not_dir;
81
		return nfserr_symlink;
82
	}
83 84 85 86
	if (requested == S_IFDIR)
		return nfserr_notdir;
	if (mode == S_IFDIR)
		return nfserr_isdir;
87
	return nfserr_wrong_type;
Linus Torvalds's avatar
Linus Torvalds committed
88 89
}

90 91 92
static bool nfsd_originating_port_ok(struct svc_rqst *rqstp,
				     struct svc_cred *cred,
				     struct svc_export *exp)
93
{
94
	if (nfsexp_flags(cred, exp) & NFSEXP_INSECURE_PORT)
95 96
		return true;
	/* We don't require gss requests to use low ports: */
97
	if (cred->cr_flavor >= RPC_AUTH_GSS)
98 99 100 101
		return true;
	return test_bit(RQ_SECURE, &rqstp->rq_flags);
}

102
static __be32 nfsd_setuser_and_check_port(struct svc_rqst *rqstp,
103
					  struct svc_cred *cred,
104 105 106
					  struct svc_export *exp)
{
	/* Check if the request originated from a secure port. */
107
	if (rqstp && !nfsd_originating_port_ok(rqstp, cred, exp)) {
108
		RPC_IFDEBUG(char buf[RPC_MAX_ADDRBUFLEN]);
109 110
		dprintk("nfsd: request from insecure port %s!\n",
		        svc_print_addr(rqstp, buf, sizeof(buf)));
111 112 113 114
		return nfserr_perm;
	}

	/* Set user creds for this exportpoint */
115
	return nfserrno(nfsd_setuser(cred, exp));
116 117
}

118 119
static inline __be32 check_pseudo_root(struct dentry *dentry,
				       struct svc_export *exp)
120 121 122 123 124 125 126
{
	if (!(exp->ex_flags & NFSEXP_V4ROOT))
		return nfs_ok;
	/*
	 * We're exposing only the directories and symlinks that have to be
	 * traversed on the way to real exports:
	 */
127 128
	if (unlikely(!d_is_dir(dentry) &&
		     !d_is_symlink(dentry)))
129 130 131 132 133 134 135 136 137 138 139
		return nfserr_stale;
	/*
	 * A pseudoroot export gives permission to access only one
	 * single directory; the kernel has to make another upcall
	 * before granting access to anything else under it:
	 */
	if (unlikely(dentry != exp->ex_path.dentry))
		return nfserr_stale;
	return nfs_ok;
}

140 141 142 143 144 145 146 147
/*
 * Use the given filehandle to look up the corresponding export and
 * dentry.  On success, the results are used to set fh_export and
 * fh_dentry.
 */
static __be32 nfsd_set_fh_dentry(struct svc_rqst *rqstp, struct svc_fh *fhp)
{
	struct knfsd_fh	*fh = &fhp->fh_handle;
148
	struct fid *fid = NULL;
149 150 151 152
	struct svc_export *exp;
	struct dentry *dentry;
	int fileid_type;
	int data_left = fh->fh_size/4;
153
	int len;
154 155
	__be32 error;

156 157
	error = nfserr_badhandle;
	if (fh->fh_size == 0)
158 159
		return nfserr_nofilehandle;

160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182
	if (fh->fh_version != 1)
		return error;

	if (--data_left < 0)
		return error;
	if (fh->fh_auth_type != 0)
		return error;
	len = key_len(fh->fh_fsid_type) / 4;
	if (len == 0)
		return error;
	if (fh->fh_fsid_type == FSID_MAJOR_MINOR) {
		/* deprecated, convert to type 3 */
		len = key_len(FSID_ENCODE_DEV)/4;
		fh->fh_fsid_type = FSID_ENCODE_DEV;
		/*
		 * struct knfsd_fh uses host-endian fields, which are
		 * sometimes used to hold net-endian values. This
		 * confuses sparse, so we must use __force here to
		 * keep it from complaining.
		 */
		fh->fh_fsid[0] = new_encode_dev(MKDEV(ntohl((__force __be32)fh->fh_fsid[0]),
						      ntohl((__force __be32)fh->fh_fsid[1])));
		fh->fh_fsid[1] = fh->fh_fsid[2];
183
	}
184 185 186
	data_left -= len;
	if (data_left < 0)
		return error;
187 188 189
	exp = rqst_exp_find(&rqstp->rq_chandle, SVC_NET(rqstp),
			    rqstp->rq_client, rqstp->rq_gssclient,
			    fh->fh_fsid_type, fh->fh_fsid);
190
	fid = (struct fid *)(fh->fh_fsid + len);
191 192

	error = nfserr_stale;
193 194 195 196 197
	if (IS_ERR(exp)) {
		trace_nfsd_set_fh_dentry_badexport(rqstp, fhp, PTR_ERR(exp));

		if (PTR_ERR(exp) == -ENOENT)
			return error;
198 199

		return nfserrno(PTR_ERR(exp));
200
	}
201

202 203 204 205 206 207 208 209 210 211
	if (exp->ex_flags & NFSEXP_NOSUBTREECHECK) {
		/* Elevate privileges so that the lack of 'r' or 'x'
		 * permission on some parent directory will
		 * not stop exportfs_decode_fh from being able
		 * to reconnect a directory into the dentry cache.
		 * The same problem can affect "SUBTREECHECK" exports,
		 * but as nfsd_acceptable depends on correct
		 * access control settings being in effect, we cannot
		 * fix that case easily.
		 */
212
		struct cred *new = prepare_creds();
213 214 215 216
		if (!new) {
			error =  nfserrno(-ENOMEM);
			goto out;
		}
217 218 219 220 221
		new->cap_effective =
			cap_raise_nfsd_set(new->cap_effective,
					   new->cap_permitted);
		put_cred(override_creds(new));
		put_cred(new);
222
	} else {
223
		error = nfsd_setuser_and_check_port(rqstp, &rqstp->rq_cred, exp);
224 225 226
		if (error)
			goto out;
	}
227 228 229 230

	/*
	 * Look up the dentry using the NFS file handle.
	 */
231
	error = nfserr_badhandle;
232

233
	fileid_type = fh->fh_fileid_type;
234 235 236 237

	if (fileid_type == FILEID_ROOT)
		dentry = dget(exp->ex_path.dentry);
	else {
238
		dentry = exportfs_decode_fh_raw(exp->ex_path.mnt, fid,
239
						data_left, fileid_type, 0,
240 241
						nfsd_acceptable, exp);
		if (IS_ERR_OR_NULL(dentry)) {
242 243
			trace_nfsd_set_fh_dentry_badhandle(rqstp, fhp,
					dentry ?  PTR_ERR(dentry) : -ESTALE);
244 245 246 247 248 249 250 251
			switch (PTR_ERR(dentry)) {
			case -ENOMEM:
			case -ETIMEDOUT:
				break;
			default:
				dentry = ERR_PTR(-ESTALE);
			}
		}
252 253 254 255 256 257 258 259 260
	}
	if (dentry == NULL)
		goto out;
	if (IS_ERR(dentry)) {
		if (PTR_ERR(dentry) != -EINVAL)
			error = nfserrno(PTR_ERR(dentry));
		goto out;
	}

261
	if (d_is_dir(dentry) &&
262
			(dentry->d_flags & DCACHE_DISCONNECTED)) {
Al Viro's avatar
Al Viro committed
263 264
		printk("nfsd: find_fh_dentry returned a DISCONNECTED directory: %pd2\n",
				dentry);
265 266 267 268
	}

	fhp->fh_dentry = dentry;
	fhp->fh_export = exp;
269 270

	switch (rqstp->rq_vers) {
271 272 273
	case 4:
		if (dentry->d_sb->s_export_op->flags & EXPORT_OP_NOATOMIC_ATTR)
			fhp->fh_no_atomic_attr = true;
274
		fhp->fh_64bit_cookies = true;
275
		break;
276 277 278
	case 3:
		if (dentry->d_sb->s_export_op->flags & EXPORT_OP_NOWCC)
			fhp->fh_no_wcc = true;
279
		fhp->fh_64bit_cookies = true;
280 281
		if (exp->ex_flags & NFSEXP_V4ROOT)
			goto out;
282 283 284
		break;
	case 2:
		fhp->fh_no_wcc = true;
285 286
		if (EX_WGATHER(exp))
			fhp->fh_use_wgather = true;
287 288
		if (exp->ex_flags & NFSEXP_V4ROOT)
			goto out;
289 290
	}

291 292 293 294 295 296
	return 0;
out:
	exp_put(exp);
	return error;
}

297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314
/**
 * fh_verify - filehandle lookup and access checking
 * @rqstp: pointer to current rpc request
 * @fhp: filehandle to be verified
 * @type: expected type of object pointed to by filehandle
 * @access: type of access needed to object
 *
 * Look up a dentry from the on-the-wire filehandle, check the client's
 * access to the export, and set the current task's credentials.
 *
 * Regardless of success or failure of fh_verify(), fh_put() should be
 * called on @fhp when the caller is finished with the filehandle.
 *
 * fh_verify() may be called multiple times on a given filehandle, for
 * example, when processing an NFSv4 compound.  The first call will look
 * up a dentry using the on-the-wire filehandle.  Subsequent calls will
 * skip the lookup and just perform the other checks and possibly change
 * the current task's credentials.
Linus Torvalds's avatar
Linus Torvalds committed
315
 *
316 317 318 319
 * @type specifies the type of object expected using one of the S_IF*
 * constants defined in include/linux/stat.h.  The caller may use zero
 * to indicate that it doesn't care, or a negative integer to indicate
 * that it expects something not of the given type.
Linus Torvalds's avatar
Linus Torvalds committed
320
 *
321
 * @access is formed from the NFSD_MAY_* constants defined in
322
 * fs/nfsd/vfs.h.
Linus Torvalds's avatar
Linus Torvalds committed
323
 */
324
__be32
Al Viro's avatar
Al Viro committed
325
fh_verify(struct svc_rqst *rqstp, struct svc_fh *fhp, umode_t type, int access)
Linus Torvalds's avatar
Linus Torvalds committed
326
{
327
	struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
328
	struct svc_export *exp = NULL;
Linus Torvalds's avatar
Linus Torvalds committed
329
	struct dentry	*dentry;
330
	__be32		error;
Linus Torvalds's avatar
Linus Torvalds committed
331 332

	if (!fhp->fh_dentry) {
333
		error = nfsd_set_fh_dentry(rqstp, fhp);
334 335
		if (error)
			goto out;
Linus Torvalds's avatar
Linus Torvalds committed
336
	}
337 338
	dentry = fhp->fh_dentry;
	exp = fhp->fh_export;
Chuck Lever's avatar
Chuck Lever committed
339 340 341

	trace_nfsd_fh_verify(rqstp, fhp, type, access);

342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357
	/*
	 * We still have to do all these permission checks, even when
	 * fh_dentry is already set:
	 * 	- fh_verify may be called multiple times with different
	 * 	  "access" arguments (e.g. nfsd_proc_create calls
	 * 	  fh_verify(...,NFSD_MAY_EXEC) first, then later (in
	 * 	  nfsd_create) calls fh_verify(...,NFSD_MAY_CREATE).
	 *	- in the NFSv4 case, the filehandle may have been filled
	 *	  in by fh_compose, and given a dentry, but further
	 *	  compound operations performed with that filehandle
	 *	  still need permissions checks.  In the worst case, a
	 *	  mountpoint crossing may have changed the export
	 *	  options, and we may now need to use a different uid
	 *	  (for example, if different id-squashing options are in
	 *	  effect on the new filesystem).
	 */
358
	error = check_pseudo_root(dentry, exp);
359 360 361
	if (error)
		goto out;

362
	error = nfsd_setuser_and_check_port(rqstp, &rqstp->rq_cred, exp);
363 364
	if (error)
		goto out;
365

366
	error = nfsd_mode_check(dentry, type);
Linus Torvalds's avatar
Linus Torvalds committed
367 368 369
	if (error)
		goto out;

370 371 372 373 374
	/*
	 * pseudoflavor restrictions are not enforced on NLM,
	 * which clients virtually always use auth_sys for,
	 * even while using RPCSEC_GSS for NFS.
	 */
375
	if (access & NFSD_MAY_LOCK || access & NFSD_MAY_BYPASS_GSS)
376 377 378 379 380 381 382 383 384 385 386 387 388
		goto skip_pseudoflavor_check;
	/*
	 * Clients may expect to be able to use auth_sys during mount,
	 * even if they use gss for everything else; see section 2.3.2
	 * of rfc 2623.
	 */
	if (access & NFSD_MAY_BYPASS_GSS_ON_ROOT
			&& exp->ex_path.dentry == dentry)
		goto skip_pseudoflavor_check;

	error = check_nfsd_access(exp, rqstp);
	if (error)
		goto out;
389

390
skip_pseudoflavor_check:
Linus Torvalds's avatar
Linus Torvalds committed
391
	/* Finally, check access permissions. */
392
	error = nfsd_permission(&rqstp->rq_cred, exp, dentry, access);
Linus Torvalds's avatar
Linus Torvalds committed
393
out:
394
	trace_nfsd_fh_verify_err(rqstp, fhp, type, access, error);
Linus Torvalds's avatar
Linus Torvalds committed
395
	if (error == nfserr_stale)
396
		nfsd_stats_fh_stale_inc(nn, exp);
Linus Torvalds's avatar
Linus Torvalds committed
397 398 399 400 401 402 403 404 405 406 407
	return error;
}


/*
 * Compose a file handle for an NFS reply.
 *
 * Note that when first composed, the dentry may not yet have
 * an inode.  In this case a call to fh_update should be made
 * before the fh goes out on the wire ...
 */
Christoph Hellwig's avatar
Christoph Hellwig committed
408 409
static void _fh_update(struct svc_fh *fhp, struct svc_export *exp,
		struct dentry *dentry)
Linus Torvalds's avatar
Linus Torvalds committed
410
{
411
	if (dentry != exp->ex_path.dentry) {
Christoph Hellwig's avatar
Christoph Hellwig committed
412
		struct fid *fid = (struct fid *)
413
			(fhp->fh_handle.fh_fsid + fhp->fh_handle.fh_size/4 - 1);
Christoph Hellwig's avatar
Christoph Hellwig committed
414
		int maxsize = (fhp->fh_maxsize - fhp->fh_handle.fh_size)/4;
415 416
		int fh_flags = (exp->ex_flags & NFSEXP_NOSUBTREECHECK) ? 0 :
				EXPORT_FH_CONNECTABLE;
417 418
		int fileid_type =
			exportfs_encode_fh(dentry, fid, &maxsize, fh_flags);
Linus Torvalds's avatar
Linus Torvalds committed
419

Christoph Hellwig's avatar
Christoph Hellwig committed
420
		fhp->fh_handle.fh_fileid_type =
421
			fileid_type > 0 ? fileid_type : FILEID_INVALID;
Christoph Hellwig's avatar
Christoph Hellwig committed
422 423 424 425
		fhp->fh_handle.fh_size += maxsize * 4;
	} else {
		fhp->fh_handle.fh_fileid_type = FILEID_ROOT;
	}
Linus Torvalds's avatar
Linus Torvalds committed
426 427
}

428 429 430 431 432 433 434
static bool is_root_export(struct svc_export *exp)
{
	return exp->ex_path.dentry == exp->ex_path.dentry->d_sb->s_root;
}

static struct super_block *exp_sb(struct svc_export *exp)
{
435
	return exp->ex_path.dentry->d_sb;
436 437 438 439 440 441 442
}

/*
 * Can @exp be identified with an fsid of type @fsid_type?
 *
 *  - device based types need a filesystem flagged FS_REQUIRES_DEV, and
 *    FSID_DEV additionally needs a device number old_valid_dev() accepts;
 *  - FSID_NUM needs the export to carry NFSEXP_FSID;
 *  - UUID based types need the export to have a uuid, and the variants
 *    without an inode number (FSID_UUID8, FSID_UUID16) are only usable
 *    when the export is the root of its filesystem;
 *  - any other type is accepted.
 */
static bool fsid_type_ok_for_exp(u8 fsid_type, struct svc_export *exp)
{
	struct super_block *sb;

	switch (fsid_type) {
	case FSID_DEV:
	case FSID_MAJOR_MINOR:
	case FSID_ENCODE_DEV:
		sb = exp_sb(exp);
		if (fsid_type == FSID_DEV && !old_valid_dev(sb->s_dev))
			return false;
		return (sb->s_type->fs_flags & FS_REQUIRES_DEV) != 0;

	case FSID_NUM:
		return (exp->ex_flags & NFSEXP_FSID) != 0;

	case FSID_UUID8:
	case FSID_UUID16:
	case FSID_UUID4_INUM:
	case FSID_UUID16_INUM:
		if ((fsid_type == FSID_UUID8 || fsid_type == FSID_UUID16) &&
		    !is_root_export(exp))
			return false;
		return exp->ex_uuid != NULL;

	default:
		return true;
	}
}

Linus Torvalds's avatar
Linus Torvalds committed
462

463 464
static void set_version_and_fsid_type(struct svc_fh *fhp, struct svc_export *exp, struct svc_fh *ref_fh)
{
465
	u8 version;
466 467
	u8 fsid_type;
retry:
468
	version = 1;
469
	if (ref_fh && ref_fh->fh_export == exp) {
470
		version = ref_fh->fh_handle.fh_version;
471 472 473 474 475 476
		fsid_type = ref_fh->fh_handle.fh_fsid_type;

		ref_fh = NULL;

		switch (version) {
		case 0xca:
477
			fsid_type = FSID_DEV;
478 479 480 481 482 483 484
			break;
		case 1:
			break;
		default:
			goto retry;
		}

485 486 487 488 489
		/*
		 * As the fsid -> filesystem mapping was guided by
		 * user-space, there is no guarantee that the filesystem
		 * actually supports that fsid type. If it doesn't we
		 * loop around again without ref_fh set.
490
		 */
491 492
		if (!fsid_type_ok_for_exp(fsid_type, exp))
			goto retry;
493 494
	} else if (exp->ex_flags & NFSEXP_FSID) {
		fsid_type = FSID_NUM;
495 496
	} else if (exp->ex_uuid) {
		if (fhp->fh_maxsize >= 64) {
497
			if (is_root_export(exp))
498 499 500 501
				fsid_type = FSID_UUID16;
			else
				fsid_type = FSID_UUID16_INUM;
		} else {
502
			if (is_root_export(exp))
503 504 505 506
				fsid_type = FSID_UUID8;
			else
				fsid_type = FSID_UUID4_INUM;
		}
507
	} else if (!old_valid_dev(exp_sb(exp)->s_dev))
Linus Torvalds's avatar
Linus Torvalds committed
508
		/* for newer device numbers, we must use a newer fsid format */
509
		fsid_type = FSID_ENCODE_DEV;
510
	else
511
		fsid_type = FSID_DEV;
512 513 514 515 516 517 518 519 520 521 522 523 524 525
	fhp->fh_handle.fh_version = version;
	if (version)
		fhp->fh_handle.fh_fsid_type = fsid_type;
}

__be32
fh_compose(struct svc_fh *fhp, struct svc_export *exp, struct dentry *dentry,
	   struct svc_fh *ref_fh)
{
	/* ref_fh is a reference file handle.
	 * if it is non-null and for the same filesystem, then we should compose
	 * a filehandle which is of the same version, where possible.
	 */

526
	struct inode * inode = d_inode(dentry);
527 528
	dev_t ex_dev = exp_sb(exp)->s_dev;

Al Viro's avatar
Al Viro committed
529
	dprintk("nfsd: fh_compose(exp %02x:%02x/%ld %pd2, ino=%ld)\n",
530
		MAJOR(ex_dev), MINOR(ex_dev),
531
		(long) d_inode(exp->ex_path.dentry)->i_ino,
Al Viro's avatar
Al Viro committed
532
		dentry,
533 534 535 536 537 538
		(inode ? inode->i_ino : 0));

	/* Choose filehandle version and fsid type based on
	 * the reference filehandle (if it is in the same export)
	 * or the export options.
	 */
539
	set_version_and_fsid_type(fhp, exp, ref_fh);
Linus Torvalds's avatar
Linus Torvalds committed
540

541 542 543
	/* If we have a ref_fh, then copy the fh_no_wcc setting from it. */
	fhp->fh_no_wcc = ref_fh ? ref_fh->fh_no_wcc : false;

Linus Torvalds's avatar
Linus Torvalds committed
544 545 546
	if (ref_fh == fhp)
		fh_put(ref_fh);

547
	if (fhp->fh_dentry) {
Al Viro's avatar
Al Viro committed
548 549
		printk(KERN_ERR "fh_compose: fh %pd2 not initialized!\n",
		       dentry);
Linus Torvalds's avatar
Linus Torvalds committed
550 551
	}
	if (fhp->fh_maxsize < NFS_FHSIZE)
Al Viro's avatar
Al Viro committed
552
		printk(KERN_ERR "fh_compose: called with maxsize %d! %pd2\n",
553
		       fhp->fh_maxsize,
Al Viro's avatar
Al Viro committed
554
		       dentry);
Linus Torvalds's avatar
Linus Torvalds committed
555 556

	fhp->fh_dentry = dget(dentry); /* our internal copy */
557
	fhp->fh_export = exp_get(exp);
Linus Torvalds's avatar
Linus Torvalds committed
558

559 560 561 562 563 564 565 566 567 568 569 570 571 572
	fhp->fh_handle.fh_size =
		key_len(fhp->fh_handle.fh_fsid_type) + 4;
	fhp->fh_handle.fh_auth_type = 0;

	mk_fsid(fhp->fh_handle.fh_fsid_type,
		fhp->fh_handle.fh_fsid,
		ex_dev,
		d_inode(exp->ex_path.dentry)->i_ino,
		exp->ex_fsid, exp->ex_uuid);

	if (inode)
		_fh_update(fhp, exp, dentry);
	if (fhp->fh_handle.fh_fileid_type == FILEID_INVALID) {
		fh_put(fhp);
573
		return nfserr_stale;
Linus Torvalds's avatar
Linus Torvalds committed
574 575 576 577 578 579 580 581 582
	}

	return 0;
}

/*
 * Update file handle information after changing a dentry.
 * This is only called by nfsd_create, nfsd_create_v3 and nfsd_proc_create
 */
583
__be32
Linus Torvalds's avatar
Linus Torvalds committed
584 585 586
fh_update(struct svc_fh *fhp)
{
	struct dentry *dentry;
587

Linus Torvalds's avatar
Linus Torvalds committed
588 589 590 591
	if (!fhp->fh_dentry)
		goto out_bad;

	dentry = fhp->fh_dentry;
592
	if (d_really_is_negative(dentry))
Linus Torvalds's avatar
Linus Torvalds committed
593
		goto out_negative;
594 595
	if (fhp->fh_handle.fh_fileid_type != FILEID_ROOT)
		return 0;
Christoph Hellwig's avatar
Christoph Hellwig committed
596

597 598
	_fh_update(fhp, fhp->fh_export, dentry);
	if (fhp->fh_handle.fh_fileid_type == FILEID_INVALID)
599
		return nfserr_stale;
Linus Torvalds's avatar
Linus Torvalds committed
600 601 602
	return 0;
out_bad:
	printk(KERN_ERR "fh_update: fh not verified!\n");
603
	return nfserr_serverfault;
Linus Torvalds's avatar
Linus Torvalds committed
604
out_negative:
Al Viro's avatar
Al Viro committed
605 606
	printk(KERN_ERR "fh_update: %pd2 still negative!\n",
		dentry);
607
	return nfserr_serverfault;
Linus Torvalds's avatar
Linus Torvalds committed
608 609
}

610 611 612 613 614
/**
 * fh_fill_pre_attrs - Fill in pre-op attributes
 * @fhp: file handle to be updated
 *
 */
615
__be32 __must_check fh_fill_pre_attrs(struct svc_fh *fhp)
616 617 618 619 620 621 622
{
	bool v4 = (fhp->fh_maxsize == NFS4_FHSIZE);
	struct inode *inode;
	struct kstat stat;
	__be32 err;

	if (fhp->fh_no_wcc || fhp->fh_pre_saved)
623
		return nfs_ok;
624 625 626

	inode = d_inode(fhp->fh_dentry);
	err = fh_getattr(fhp, &stat);
627
	if (err)
628
		return err;
629

630 631 632 633 634 635 636
	if (v4)
		fhp->fh_pre_change = nfsd4_change_attribute(&stat, inode);

	fhp->fh_pre_mtime = stat.mtime;
	fhp->fh_pre_ctime = stat.ctime;
	fhp->fh_pre_size  = stat.size;
	fhp->fh_pre_saved = true;
637
	return nfs_ok;
638 639 640 641 642 643 644
}

/**
 * fh_fill_post_attrs - Fill in post-op attributes
 * @fhp: file handle to be updated
 *
 */
645
__be32 fh_fill_post_attrs(struct svc_fh *fhp)
646 647 648 649 650 651
{
	bool v4 = (fhp->fh_maxsize == NFS4_FHSIZE);
	struct inode *inode = d_inode(fhp->fh_dentry);
	__be32 err;

	if (fhp->fh_no_wcc)
652
		return nfs_ok;
653 654 655 656 657

	if (fhp->fh_post_saved)
		printk("nfsd: inode locked twice during operation.\n");

	err = fh_getattr(fhp, &fhp->fh_post_attr);
658
	if (err)
659
		return err;
660 661

	fhp->fh_post_saved = true;
662 663 664
	if (v4)
		fhp->fh_post_change =
			nfsd4_change_attribute(&fhp->fh_post_attr, inode);
665
	return nfs_ok;
666 667
}

668 669 670 671 672 673 674
/**
 * fh_fill_both_attrs - Fill pre-op and post-op attributes
 * @fhp: file handle to be updated
 *
 * This is used when the directory wasn't changed, but wcc attributes
 * are needed anyway.
 */
675
__be32 __must_check fh_fill_both_attrs(struct svc_fh *fhp)
676
{
677 678 679 680 681 682
	__be32 err;

	err = fh_fill_post_attrs(fhp);
	if (err)
		return err;

683 684 685 686 687
	fhp->fh_pre_change = fhp->fh_post_change;
	fhp->fh_pre_mtime = fhp->fh_post_attr.mtime;
	fhp->fh_pre_ctime = fhp->fh_post_attr.ctime;
	fhp->fh_pre_size = fhp->fh_post_attr.size;
	fhp->fh_pre_saved = true;
688
	return nfs_ok;
689 690
}

Linus Torvalds's avatar
Linus Torvalds committed
691 692 693 694 695 696 697 698 699 700 701
/*
 * Release a file handle.
 */
void
fh_put(struct svc_fh *fhp)
{
	struct dentry * dentry = fhp->fh_dentry;
	struct svc_export * exp = fhp->fh_export;
	if (dentry) {
		fhp->fh_dentry = NULL;
		dput(dentry);
702
		fh_clear_pre_post_attrs(fhp);
Linus Torvalds's avatar
Linus Torvalds committed
703
	}
704
	fh_drop_write(fhp);
Linus Torvalds's avatar
Linus Torvalds committed
705
	if (exp) {
706
		exp_put(exp);
Linus Torvalds's avatar
Linus Torvalds committed
707 708
		fhp->fh_export = NULL;
	}
709
	fhp->fh_no_wcc = false;
Linus Torvalds's avatar
Linus Torvalds committed
710 711 712 713 714 715 716 717 718
	return;
}

/*
 * Shorthand for dprintk()'s: format the raw filehandle of @fhp as
 * "<size>: <hex bytes>".
 *
 * Returns the constant string "bad-fh" when the recorded size is outside
 * 0..64.  Otherwise the result lives in one function-static buffer, so
 * every call overwrites the string returned by the previous call.
 */
char * SVCFH_fmt(struct svc_fh *fhp)
{
	struct knfsd_fh *fh = &fhp->fh_handle;
	/* Sized as: size digits, ':', ' ', three characters per byte, NUL. */
	static char buf[2+1+1+64*3+1];

	if (fh->fh_size < 0 || fh->fh_size> 64)
		return "bad-fh";
	/* Bound the write by the buffer itself, not just by the check above. */
	snprintf(buf, sizeof(buf), "%d: %*ph",
		 fh->fh_size, fh->fh_size, fh->fh_raw);
	return buf;
}
726

727
enum fsid_source fsid_source(const struct svc_fh *fhp)
728 729 730 731 732 733 734
{
	if (fhp->fh_handle.fh_version != 1)
		return FSIDSOURCE_DEV;
	switch(fhp->fh_handle.fh_fsid_type) {
	case FSID_DEV:
	case FSID_ENCODE_DEV:
	case FSID_MAJOR_MINOR:
735
		if (exp_sb(fhp->fh_export)->s_type->fs_flags & FS_REQUIRES_DEV)
736 737
			return FSIDSOURCE_DEV;
		break;
738 739 740
	case FSID_NUM:
		if (fhp->fh_export->ex_flags & NFSEXP_FSID)
			return FSIDSOURCE_FSID;
741 742 743
		break;
	default:
		break;
744
	}
745 746 747 748 749 750 751 752
	/* either a UUID type filehandle, or the filehandle doesn't
	 * match the export.
	 */
	if (fhp->fh_export->ex_flags & NFSEXP_FSID)
		return FSIDSOURCE_FSID;
	if (fhp->fh_export->ex_uuid)
		return FSIDSOURCE_UUID;
	return FSIDSOURCE_DEV;
753
}
754 755

/*
756 757 758 759 760 761 762 763 764 765 766
 * We could use i_version alone as the change attribute.  However, i_version
 * can go backwards on a regular file after an unclean shutdown.  On its own
 * that doesn't necessarily cause a problem, but if i_version goes backwards
 * and then is incremented again it could reuse a value that was previously
 * used before boot, and a client who queried the two values might incorrectly
 * assume nothing changed.
 *
 * By using both ctime and the i_version counter we guarantee that as long as
 * time doesn't go backwards we never reuse an old value. If the filesystem
 * advertises STATX_ATTR_CHANGE_MONOTONIC, then this mitigation is not
 * needed.
767
 *
768 769 770
 * We only need to do this for regular files as well. For directories, we
 * assume that the new change attr is always logged to stable storage in some
 * fashion before the results can be seen.
771
 */
772
u64 nfsd4_change_attribute(const struct kstat *stat, const struct inode *inode)
773
{
774 775 776 777 778 779 780 781 782 783 784 785 786
	u64 chattr;

	if (stat->result_mask & STATX_CHANGE_COOKIE) {
		chattr = stat->change_cookie;
		if (S_ISREG(inode->i_mode) &&
		    !(stat->attributes & STATX_ATTR_CHANGE_MONOTONIC)) {
			chattr += (u64)stat->ctime.tv_sec << 30;
			chattr += stat->ctime.tv_nsec;
		}
	} else {
		chattr = time_to_chattr(&stat->ctime);
	}
	return chattr;
787
}