nfs_commonkrpc.c revision 336899
1/*- 2 * Copyright (c) 1989, 1991, 1993, 1995 3 * The Regents of the University of California. All rights reserved. 4 * 5 * This code is derived from software contributed to Berkeley by 6 * Rick Macklem at The University of Guelph. 7 * 8 * Redistribution and use in source and binary forms, with or without 9 * modification, are permitted provided that the following conditions 10 * are met: 11 * 1. Redistributions of source code must retain the above copyright 12 * notice, this list of conditions and the following disclaimer. 13 * 2. Redistributions in binary form must reproduce the above copyright 14 * notice, this list of conditions and the following disclaimer in the 15 * documentation and/or other materials provided with the distribution. 16 * 4. Neither the name of the University nor the names of its contributors 17 * may be used to endorse or promote products derived from this software 18 * without specific prior written permission. 19 * 20 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 21 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 22 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 23 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 24 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 25 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 26 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 27 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 28 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 29 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 30 * SUCH DAMAGE. 31 * 32 */ 33 34#include <sys/cdefs.h> 35__FBSDID("$FreeBSD: stable/10/sys/fs/nfs/nfs_commonkrpc.c 336899 2018-07-30 12:17:10Z rmacklem $"); 36 37/* 38 * Socket operations for use by nfs 39 */ 40 41#include "opt_kdtrace.h" 42#include "opt_kgssapi.h" 43#include "opt_nfs.h" 44 45#include <sys/param.h> 46#include <sys/systm.h> 47#include <sys/kernel.h> 48#include <sys/limits.h> 49#include <sys/lock.h> 50#include <sys/malloc.h> 51#include <sys/mbuf.h> 52#include <sys/mount.h> 53#include <sys/mutex.h> 54#include <sys/proc.h> 55#include <sys/signalvar.h> 56#include <sys/syscallsubr.h> 57#include <sys/sysctl.h> 58#include <sys/syslog.h> 59#include <sys/vnode.h> 60 61#include <rpc/rpc.h> 62#include <rpc/krpc.h> 63 64#include <kgssapi/krb5/kcrypto.h> 65 66#include <fs/nfs/nfsport.h> 67 68#ifdef KDTRACE_HOOKS 69#include <sys/dtrace_bsd.h> 70 71dtrace_nfsclient_nfs23_start_probe_func_t 72 dtrace_nfscl_nfs234_start_probe; 73 74dtrace_nfsclient_nfs23_done_probe_func_t 75 dtrace_nfscl_nfs234_done_probe; 76 77/* 78 * Registered probes by RPC type. 79 */ 80uint32_t nfscl_nfs2_start_probes[NFSV41_NPROCS + 1]; 81uint32_t nfscl_nfs2_done_probes[NFSV41_NPROCS + 1]; 82 83uint32_t nfscl_nfs3_start_probes[NFSV41_NPROCS + 1]; 84uint32_t nfscl_nfs3_done_probes[NFSV41_NPROCS + 1]; 85 86uint32_t nfscl_nfs4_start_probes[NFSV41_NPROCS + 1]; 87uint32_t nfscl_nfs4_done_probes[NFSV41_NPROCS + 1]; 88#endif 89 90NFSSTATESPINLOCK; 91NFSREQSPINLOCK; 92NFSDLOCKMUTEX; 93NFSCLSTATEMUTEX; 94extern struct nfsstats newnfsstats; 95extern struct nfsreqhead nfsd_reqq; 96extern int nfscl_ticks; 97extern void (*ncl_call_invalcaches)(struct vnode *); 98extern int nfs_numnfscbd; 99extern int nfscl_debuglevel; 100 101SVCPOOL *nfscbd_pool; 102static int nfsrv_gsscallbackson = 0; 103static int nfs_bufpackets = 4; 104static int nfs_reconnects; 105static int nfs3_jukebox_delay = 10; 106static int nfs_skip_wcc_data_onerr = 1; 107 108SYSCTL_DECL(_vfs_nfs); 109 110SYSCTL_INT(_vfs_nfs, OID_AUTO, bufpackets, CTLFLAG_RW, &nfs_bufpackets, 0, 111 "Buffer reservation size 2 < x < 64"); 112SYSCTL_INT(_vfs_nfs, OID_AUTO, reconnects, CTLFLAG_RD, &nfs_reconnects, 0, 113 "Number of times the nfs client has had to reconnect"); 114SYSCTL_INT(_vfs_nfs, OID_AUTO, nfs3_jukebox_delay, CTLFLAG_RW, &nfs3_jukebox_delay, 0, 115 "Number of seconds to delay a retry after receiving EJUKEBOX"); 116SYSCTL_INT(_vfs_nfs, OID_AUTO, skip_wcc_data_onerr, CTLFLAG_RW, &nfs_skip_wcc_data_onerr, 0, 117 "Disable weak cache consistency checking when server returns an error"); 118 119static void nfs_down(struct nfsmount *, struct thread *, const char *, 120 int, int); 121static void nfs_up(struct nfsmount *, struct thread *, const char *, 122 int, int); 123static int nfs_msg(struct thread *, const char *, const char *, int); 124 125struct nfs_cached_auth { 126 int ca_refs; /* refcount, including 1 from the cache */ 127 uid_t ca_uid; /* uid that corresponds to this auth */ 128 AUTH *ca_auth; /* RPC auth handle */ 129}; 130 131static int nfsv2_procid[NFS_V3NPROCS] = { 132 NFSV2PROC_NULL, 133 NFSV2PROC_GETATTR, 134 NFSV2PROC_SETATTR, 135 NFSV2PROC_LOOKUP, 136 NFSV2PROC_NOOP, 137 NFSV2PROC_READLINK, 138 NFSV2PROC_READ, 139 NFSV2PROC_WRITE, 140 NFSV2PROC_CREATE, 141 NFSV2PROC_MKDIR, 142 NFSV2PROC_SYMLINK, 143 NFSV2PROC_CREATE, 144 NFSV2PROC_REMOVE, 145 NFSV2PROC_RMDIR, 146 NFSV2PROC_RENAME, 147 NFSV2PROC_LINK, 148 NFSV2PROC_READDIR, 149 NFSV2PROC_NOOP, 150 NFSV2PROC_STATFS, 151 NFSV2PROC_NOOP, 152 NFSV2PROC_NOOP, 153 NFSV2PROC_NOOP, 154}; 155 156/* 157 * Initialize sockets and congestion for a new NFS connection. 158 * We do not free the sockaddr if error. 159 */ 160int 161newnfs_connect(struct nfsmount *nmp, struct nfssockreq *nrp, 162 struct ucred *cred, NFSPROC_T *p, int callback_retry_mult) 163{ 164 int rcvreserve, sndreserve; 165 int pktscale, pktscalesav; 166 struct sockaddr *saddr; 167 struct ucred *origcred; 168 CLIENT *client; 169 struct netconfig *nconf; 170 struct socket *so; 171 int one = 1, retries, error = 0; 172 struct thread *td = curthread; 173 SVCXPRT *xprt; 174 struct timeval timo; 175 176 /* 177 * We need to establish the socket using the credentials of 178 * the mountpoint. Some parts of this process (such as 179 * sobind() and soconnect()) will use the curent thread's 180 * credential instead of the socket credential. To work 181 * around this, temporarily change the current thread's 182 * credential to that of the mountpoint. 183 * 184 * XXX: It would be better to explicitly pass the correct 185 * credential to sobind() and soconnect(). 186 */ 187 origcred = td->td_ucred; 188 189 /* 190 * Use the credential in nr_cred, if not NULL. 191 */ 192 if (nrp->nr_cred != NULL) 193 td->td_ucred = nrp->nr_cred; 194 else 195 td->td_ucred = cred; 196 saddr = nrp->nr_nam; 197 198 if (saddr->sa_family == AF_INET) 199 if (nrp->nr_sotype == SOCK_DGRAM) 200 nconf = getnetconfigent("udp"); 201 else 202 nconf = getnetconfigent("tcp"); 203 else 204 if (nrp->nr_sotype == SOCK_DGRAM) 205 nconf = getnetconfigent("udp6"); 206 else 207 nconf = getnetconfigent("tcp6"); 208 209 pktscale = nfs_bufpackets; 210 if (pktscale < 2) 211 pktscale = 2; 212 if (pktscale > 64) 213 pktscale = 64; 214 pktscalesav = pktscale; 215 /* 216 * soreserve() can fail if sb_max is too small, so shrink pktscale 217 * and try again if there is an error. 218 * Print a log message suggesting increasing sb_max. 219 * Creating a socket and doing this is necessary since, if the 220 * reservation sizes are too large and will make soreserve() fail, 221 * the connection will work until a large send is attempted and 222 * then it will loop in the krpc code. 223 */ 224 so = NULL; 225 saddr = NFSSOCKADDR(nrp->nr_nam, struct sockaddr *); 226 error = socreate(saddr->sa_family, &so, nrp->nr_sotype, 227 nrp->nr_soproto, td->td_ucred, td); 228 if (error) { 229 td->td_ucred = origcred; 230 goto out; 231 } 232 do { 233 if (error != 0 && pktscale > 2) { 234 if (nmp != NULL && nrp->nr_sotype == SOCK_STREAM && 235 pktscale == pktscalesav) 236 printf("Consider increasing kern.ipc.maxsockbuf\n"); 237 pktscale--; 238 } 239 if (nrp->nr_sotype == SOCK_DGRAM) { 240 if (nmp != NULL) { 241 sndreserve = (NFS_MAXDGRAMDATA + NFS_MAXPKTHDR) * 242 pktscale; 243 rcvreserve = (NFS_MAXDGRAMDATA + NFS_MAXPKTHDR) * 244 pktscale; 245 } else { 246 sndreserve = rcvreserve = 1024 * pktscale; 247 } 248 } else { 249 if (nrp->nr_sotype != SOCK_STREAM) 250 panic("nfscon sotype"); 251 if (nmp != NULL) { 252 sndreserve = (NFS_MAXBSIZE + NFS_MAXXDR + 253 sizeof (u_int32_t)) * pktscale; 254 rcvreserve = (NFS_MAXBSIZE + NFS_MAXXDR + 255 sizeof (u_int32_t)) * pktscale; 256 } else { 257 sndreserve = rcvreserve = 1024 * pktscale; 258 } 259 } 260 error = soreserve(so, sndreserve, rcvreserve); 261 if (error != 0 && nmp != NULL && nrp->nr_sotype == SOCK_STREAM && 262 pktscale <= 2) 263 printf("Must increase kern.ipc.maxsockbuf or reduce" 264 " rsize, wsize\n"); 265 } while (error != 0 && pktscale > 2); 266 soclose(so); 267 if (error) { 268 td->td_ucred = origcred; 269 goto out; 270 } 271 272 client = clnt_reconnect_create(nconf, saddr, nrp->nr_prog, 273 nrp->nr_vers, sndreserve, rcvreserve); 274 CLNT_CONTROL(client, CLSET_WAITCHAN, "newnfsreq"); 275 if (nmp != NULL) { 276 if ((nmp->nm_flag & NFSMNT_INT)) 277 CLNT_CONTROL(client, CLSET_INTERRUPTIBLE, &one); 278 if ((nmp->nm_flag & NFSMNT_RESVPORT)) 279 CLNT_CONTROL(client, CLSET_PRIVPORT, &one); 280 if (NFSHASSOFT(nmp)) { 281 if (nmp->nm_sotype == SOCK_DGRAM) 282 /* 283 * For UDP, the large timeout for a reconnect 284 * will be set to "nm_retry * nm_timeo / 2", so 285 * we only want to do 2 reconnect timeout 286 * retries. 287 */ 288 retries = 2; 289 else 290 retries = nmp->nm_retry; 291 } else 292 retries = INT_MAX; 293 /* cred == NULL for DS connects. */ 294 if (NFSHASNFSV4N(nmp) && cred != NULL) { 295 /* 296 * Make sure the nfscbd_pool doesn't get destroyed 297 * while doing this. 298 */ 299 NFSD_LOCK(); 300 if (nfs_numnfscbd > 0) { 301 nfs_numnfscbd++; 302 NFSD_UNLOCK(); 303 xprt = svc_vc_create_backchannel(nfscbd_pool); 304 CLNT_CONTROL(client, CLSET_BACKCHANNEL, xprt); 305 NFSD_LOCK(); 306 nfs_numnfscbd--; 307 if (nfs_numnfscbd == 0) 308 wakeup(&nfs_numnfscbd); 309 } 310 NFSD_UNLOCK(); 311 } 312 } else { 313 /* 314 * Three cases: 315 * - Null RPC callback to client 316 * - Non-Null RPC callback to client, wait a little longer 317 * - upcalls to nfsuserd and gssd (clp == NULL) 318 */ 319 if (callback_retry_mult == 0) { 320 retries = NFSV4_UPCALLRETRY; 321 CLNT_CONTROL(client, CLSET_PRIVPORT, &one); 322 } else { 323 retries = NFSV4_CALLBACKRETRY * callback_retry_mult; 324 } 325 } 326 CLNT_CONTROL(client, CLSET_RETRIES, &retries); 327 328 if (nmp != NULL) { 329 /* 330 * For UDP, there are 2 timeouts: 331 * - CLSET_RETRY_TIMEOUT sets the initial timeout for the timer 332 * that does a retransmit of an RPC request using the same 333 * socket and xid. This is what you normally want to do, 334 * since NFS servers depend on "same xid" for their 335 * Duplicate Request Cache. 336 * - timeout specified in CLNT_CALL_MBUF(), which specifies when 337 * retransmits on the same socket should fail and a fresh 338 * socket created. Each of these timeouts counts as one 339 * CLSET_RETRIES as set above. 340 * Set the initial retransmit timeout for UDP. This timeout 341 * doesn't exist for TCP and the following call just fails, 342 * which is ok. 343 */ 344 timo.tv_sec = nmp->nm_timeo / NFS_HZ; 345 timo.tv_usec = (nmp->nm_timeo % NFS_HZ) * 1000000 / NFS_HZ; 346 CLNT_CONTROL(client, CLSET_RETRY_TIMEOUT, &timo); 347 } 348 349 mtx_lock(&nrp->nr_mtx); 350 if (nrp->nr_client != NULL) { 351 mtx_unlock(&nrp->nr_mtx); 352 /* 353 * Someone else already connected. 354 */ 355 CLNT_RELEASE(client); 356 } else { 357 nrp->nr_client = client; 358 /* 359 * Protocols that do not require connections may be optionally 360 * left unconnected for servers that reply from a port other 361 * than NFS_PORT. 362 */ 363 if (nmp == NULL || (nmp->nm_flag & NFSMNT_NOCONN) == 0) { 364 mtx_unlock(&nrp->nr_mtx); 365 CLNT_CONTROL(client, CLSET_CONNECT, &one); 366 } else 367 mtx_unlock(&nrp->nr_mtx); 368 } 369 370 371 /* Restore current thread's credentials. */ 372 td->td_ucred = origcred; 373 374out: 375 NFSEXITCODE(error); 376 return (error); 377} 378 379/* 380 * NFS disconnect. Clean up and unlink. 381 */ 382void 383newnfs_disconnect(struct nfssockreq *nrp) 384{ 385 CLIENT *client; 386 387 mtx_lock(&nrp->nr_mtx); 388 if (nrp->nr_client != NULL) { 389 client = nrp->nr_client; 390 nrp->nr_client = NULL; 391 mtx_unlock(&nrp->nr_mtx); 392 rpc_gss_secpurge_call(client); 393 CLNT_CLOSE(client); 394 CLNT_RELEASE(client); 395 } else { 396 mtx_unlock(&nrp->nr_mtx); 397 } 398} 399 400static AUTH * 401nfs_getauth(struct nfssockreq *nrp, int secflavour, char *clnt_principal, 402 char *srv_principal, gss_OID mech_oid, struct ucred *cred) 403{ 404 rpc_gss_service_t svc; 405 AUTH *auth; 406 407 switch (secflavour) { 408 case RPCSEC_GSS_KRB5: 409 case RPCSEC_GSS_KRB5I: 410 case RPCSEC_GSS_KRB5P: 411 if (!mech_oid) { 412 if (!rpc_gss_mech_to_oid_call("kerberosv5", &mech_oid)) 413 return (NULL); 414 } 415 if (secflavour == RPCSEC_GSS_KRB5) 416 svc = rpc_gss_svc_none; 417 else if (secflavour == RPCSEC_GSS_KRB5I) 418 svc = rpc_gss_svc_integrity; 419 else 420 svc = rpc_gss_svc_privacy; 421 422 if (clnt_principal == NULL) 423 auth = rpc_gss_secfind_call(nrp->nr_client, cred, 424 srv_principal, mech_oid, svc); 425 else { 426 auth = rpc_gss_seccreate_call(nrp->nr_client, cred, 427 clnt_principal, srv_principal, "kerberosv5", 428 svc, NULL, NULL, NULL); 429 return (auth); 430 } 431 if (auth != NULL) 432 return (auth); 433 /* fallthrough */ 434 case AUTH_SYS: 435 default: 436 return (authunix_create(cred)); 437 438 } 439} 440 441/* 442 * Callback from the RPC code to generate up/down notifications. 443 */ 444 445struct nfs_feedback_arg { 446 struct nfsmount *nf_mount; 447 int nf_lastmsg; /* last tprintf */ 448 int nf_tprintfmsg; 449 struct thread *nf_td; 450}; 451 452static void 453nfs_feedback(int type, int proc, void *arg) 454{ 455 struct nfs_feedback_arg *nf = (struct nfs_feedback_arg *) arg; 456 struct nfsmount *nmp = nf->nf_mount; 457 time_t now; 458 459 switch (type) { 460 case FEEDBACK_REXMIT2: 461 case FEEDBACK_RECONNECT: 462 now = NFSD_MONOSEC; 463 if (nf->nf_lastmsg + nmp->nm_tprintf_delay < now) { 464 nfs_down(nmp, nf->nf_td, 465 "not responding", 0, NFSSTA_TIMEO); 466 nf->nf_tprintfmsg = TRUE; 467 nf->nf_lastmsg = now; 468 } 469 break; 470 471 case FEEDBACK_OK: 472 nfs_up(nf->nf_mount, nf->nf_td, 473 "is alive again", NFSSTA_TIMEO, nf->nf_tprintfmsg); 474 break; 475 } 476} 477 478/* 479 * newnfs_request - goes something like this 480 * - does the rpc by calling the krpc layer 481 * - break down rpc header and return with nfs reply 482 * nb: always frees up nd_mreq mbuf list 483 */ 484int 485newnfs_request(struct nfsrv_descript *nd, struct nfsmount *nmp, 486 struct nfsclient *clp, struct nfssockreq *nrp, vnode_t vp, 487 struct thread *td, struct ucred *cred, u_int32_t prog, u_int32_t vers, 488 u_char *retsum, int toplevel, u_int64_t *xidp, struct nfsclsession *dssep) 489{ 490 uint32_t retseq, retval, slotseq, *tl; 491 time_t waituntil; 492 int i = 0, j = 0, opcnt, set_sigset = 0, slot; 493 int trycnt, error = 0, usegssname = 0, secflavour = AUTH_SYS; 494 int freeslot, maxslot, reterr, slotpos, timeo; 495 u_int16_t procnum; 496 u_int trylater_delay = 1; 497 struct nfs_feedback_arg nf; 498 struct timeval timo; 499 AUTH *auth; 500 struct rpc_callextra ext; 501 enum clnt_stat stat; 502 struct nfsreq *rep = NULL; 503 char *srv_principal = NULL, *clnt_principal = NULL; 504 sigset_t oldset; 505 struct ucred *authcred; 506 struct nfsclsession *sep; 507 uint8_t sessionid[NFSX_V4SESSIONID]; 508 509 sep = dssep; 510 if (xidp != NULL) 511 *xidp = 0; 512 /* Reject requests while attempting a forced unmount. */ 513 if (nmp != NULL && (nmp->nm_mountp->mnt_kern_flag & MNTK_UNMOUNTF)) { 514 m_freem(nd->nd_mreq); 515 return (ESTALE); 516 } 517 518 /* 519 * Set authcred, which is used to acquire RPC credentials to 520 * the cred argument, by default. The crhold() should not be 521 * necessary, but will ensure that some future code change 522 * doesn't result in the credential being free'd prematurely. 523 */ 524 authcred = crhold(cred); 525 526 /* For client side interruptible mounts, mask off the signals. */ 527 if (nmp != NULL && td != NULL && NFSHASINT(nmp)) { 528 newnfs_set_sigmask(td, &oldset); 529 set_sigset = 1; 530 } 531 532 /* 533 * XXX if not already connected call nfs_connect now. Longer 534 * term, change nfs_mount to call nfs_connect unconditionally 535 * and let clnt_reconnect_create handle reconnects. 536 */ 537 if (nrp->nr_client == NULL) 538 newnfs_connect(nmp, nrp, cred, td, 0); 539 540 /* 541 * For a client side mount, nmp is != NULL and clp == NULL. For 542 * server calls (callbacks or upcalls), nmp == NULL. 543 */ 544 if (clp != NULL) { 545 NFSLOCKSTATE(); 546 if ((clp->lc_flags & LCL_GSS) && nfsrv_gsscallbackson) { 547 secflavour = RPCSEC_GSS_KRB5; 548 if (nd->nd_procnum != NFSPROC_NULL) { 549 if (clp->lc_flags & LCL_GSSINTEGRITY) 550 secflavour = RPCSEC_GSS_KRB5I; 551 else if (clp->lc_flags & LCL_GSSPRIVACY) 552 secflavour = RPCSEC_GSS_KRB5P; 553 } 554 } 555 NFSUNLOCKSTATE(); 556 } else if (nmp != NULL && NFSHASKERB(nmp) && 557 nd->nd_procnum != NFSPROC_NULL) { 558 if (NFSHASALLGSSNAME(nmp) && nmp->nm_krbnamelen > 0) 559 nd->nd_flag |= ND_USEGSSNAME; 560 if ((nd->nd_flag & ND_USEGSSNAME) != 0) { 561 /* 562 * If there is a client side host based credential, 563 * use that, otherwise use the system uid, if set. 564 * The system uid is in the nmp->nm_sockreq.nr_cred 565 * credentials. 566 */ 567 if (nmp->nm_krbnamelen > 0) { 568 usegssname = 1; 569 clnt_principal = nmp->nm_krbname; 570 } else if (nmp->nm_uid != (uid_t)-1) { 571 KASSERT(nmp->nm_sockreq.nr_cred != NULL, 572 ("newnfs_request: NULL nr_cred")); 573 crfree(authcred); 574 authcred = crhold(nmp->nm_sockreq.nr_cred); 575 } 576 } else if (nmp->nm_krbnamelen == 0 && 577 nmp->nm_uid != (uid_t)-1 && cred->cr_uid == (uid_t)0) { 578 /* 579 * If there is no host based principal name and 580 * the system uid is set and this is root, use the 581 * system uid, since root won't have user 582 * credentials in a credentials cache file. 583 * The system uid is in the nmp->nm_sockreq.nr_cred 584 * credentials. 585 */ 586 KASSERT(nmp->nm_sockreq.nr_cred != NULL, 587 ("newnfs_request: NULL nr_cred")); 588 crfree(authcred); 589 authcred = crhold(nmp->nm_sockreq.nr_cred); 590 } 591 if (NFSHASINTEGRITY(nmp)) 592 secflavour = RPCSEC_GSS_KRB5I; 593 else if (NFSHASPRIVACY(nmp)) 594 secflavour = RPCSEC_GSS_KRB5P; 595 else 596 secflavour = RPCSEC_GSS_KRB5; 597 srv_principal = NFSMNT_SRVKRBNAME(nmp); 598 } else if (nmp != NULL && !NFSHASKERB(nmp) && 599 nd->nd_procnum != NFSPROC_NULL && 600 (nd->nd_flag & ND_USEGSSNAME) != 0) { 601 /* 602 * Use the uid that did the mount when the RPC is doing 603 * NFSv4 system operations, as indicated by the 604 * ND_USEGSSNAME flag, for the AUTH_SYS case. 605 * The credentials in nm_sockreq.nr_cred were used for the 606 * mount. 607 */ 608 KASSERT(nmp->nm_sockreq.nr_cred != NULL, 609 ("newnfs_request: NULL nr_cred")); 610 crfree(authcred); 611 authcred = crhold(nmp->nm_sockreq.nr_cred); 612 } 613 614 if (nmp != NULL) { 615 bzero(&nf, sizeof(struct nfs_feedback_arg)); 616 nf.nf_mount = nmp; 617 nf.nf_td = td; 618 nf.nf_lastmsg = NFSD_MONOSEC - 619 ((nmp->nm_tprintf_delay)-(nmp->nm_tprintf_initial_delay)); 620 } 621 622 if (nd->nd_procnum == NFSPROC_NULL) 623 auth = authnone_create(); 624 else if (usegssname) { 625 /* 626 * For this case, the authenticator is held in the 627 * nfssockreq structure, so don't release the reference count 628 * held on it. --> Don't AUTH_DESTROY() it in this function. 629 */ 630 if (nrp->nr_auth == NULL) 631 nrp->nr_auth = nfs_getauth(nrp, secflavour, 632 clnt_principal, srv_principal, NULL, authcred); 633 else 634 rpc_gss_refresh_auth_call(nrp->nr_auth); 635 auth = nrp->nr_auth; 636 } else 637 auth = nfs_getauth(nrp, secflavour, NULL, 638 srv_principal, NULL, authcred); 639 crfree(authcred); 640 if (auth == NULL) { 641 m_freem(nd->nd_mreq); 642 if (set_sigset) 643 newnfs_restore_sigmask(td, &oldset); 644 return (EACCES); 645 } 646 bzero(&ext, sizeof(ext)); 647 ext.rc_auth = auth; 648 if (nmp != NULL) { 649 ext.rc_feedback = nfs_feedback; 650 ext.rc_feedback_arg = &nf; 651 } 652 653 procnum = nd->nd_procnum; 654 if ((nd->nd_flag & ND_NFSV4) && 655 nd->nd_procnum != NFSPROC_NULL && 656 nd->nd_procnum != NFSV4PROC_CBCOMPOUND) 657 procnum = NFSV4PROC_COMPOUND; 658 659 if (nmp != NULL) { 660 NFSINCRGLOBAL(newnfsstats.rpcrequests); 661 662 /* Map the procnum to the old NFSv2 one, as required. */ 663 if ((nd->nd_flag & ND_NFSV2) != 0) { 664 if (nd->nd_procnum < NFS_V3NPROCS) 665 procnum = nfsv2_procid[nd->nd_procnum]; 666 else 667 procnum = NFSV2PROC_NOOP; 668 } 669 670 /* 671 * Now only used for the R_DONTRECOVER case, but until that is 672 * supported within the krpc code, I need to keep a queue of 673 * outstanding RPCs for nfsv4 client requests. 674 */ 675 if ((nd->nd_flag & ND_NFSV4) && procnum == NFSV4PROC_COMPOUND) 676 MALLOC(rep, struct nfsreq *, sizeof(struct nfsreq), 677 M_NFSDREQ, M_WAITOK); 678#ifdef KDTRACE_HOOKS 679 if (dtrace_nfscl_nfs234_start_probe != NULL) { 680 uint32_t probe_id; 681 int probe_procnum; 682 683 if (nd->nd_flag & ND_NFSV4) { 684 probe_id = 685 nfscl_nfs4_start_probes[nd->nd_procnum]; 686 probe_procnum = nd->nd_procnum; 687 } else if (nd->nd_flag & ND_NFSV3) { 688 probe_id = nfscl_nfs3_start_probes[procnum]; 689 probe_procnum = procnum; 690 } else { 691 probe_id = 692 nfscl_nfs2_start_probes[nd->nd_procnum]; 693 probe_procnum = procnum; 694 } 695 if (probe_id != 0) 696 (dtrace_nfscl_nfs234_start_probe) 697 (probe_id, vp, nd->nd_mreq, cred, 698 probe_procnum); 699 } 700#endif 701 } 702 trycnt = 0; 703 freeslot = -1; /* Set to slot that needs to be free'd */ 704tryagain: 705 slot = -1; /* Slot that needs a sequence# increment. */ 706 /* 707 * This timeout specifies when a new socket should be created, 708 * along with new xid values. For UDP, this should be done 709 * infrequently, since retransmits of RPC requests should normally 710 * use the same xid. 711 */ 712 if (nmp == NULL) { 713 timo.tv_usec = 0; 714 if (clp == NULL) 715 timo.tv_sec = NFSV4_UPCALLTIMEO; 716 else 717 timo.tv_sec = NFSV4_CALLBACKTIMEO; 718 } else { 719 if (nrp->nr_sotype != SOCK_DGRAM) { 720 timo.tv_usec = 0; 721 if ((nmp->nm_flag & NFSMNT_NFSV4)) 722 timo.tv_sec = INT_MAX; 723 else 724 timo.tv_sec = NFS_TCPTIMEO; 725 } else { 726 if (NFSHASSOFT(nmp)) { 727 /* 728 * CLSET_RETRIES is set to 2, so this should be 729 * half of the total timeout required. 730 */ 731 timeo = nmp->nm_retry * nmp->nm_timeo / 2; 732 if (timeo < 1) 733 timeo = 1; 734 timo.tv_sec = timeo / NFS_HZ; 735 timo.tv_usec = (timeo % NFS_HZ) * 1000000 / 736 NFS_HZ; 737 } else { 738 /* For UDP hard mounts, use a large value. */ 739 timo.tv_sec = NFS_MAXTIMEO / NFS_HZ; 740 timo.tv_usec = 0; 741 } 742 } 743 744 if (rep != NULL) { 745 rep->r_flags = 0; 746 rep->r_nmp = nmp; 747 /* 748 * Chain request into list of outstanding requests. 749 */ 750 NFSLOCKREQ(); 751 TAILQ_INSERT_TAIL(&nfsd_reqq, rep, r_chain); 752 NFSUNLOCKREQ(); 753 } 754 } 755 756 nd->nd_mrep = NULL; 757 if (clp != NULL && sep != NULL) 758 stat = clnt_bck_call(nrp->nr_client, &ext, procnum, 759 nd->nd_mreq, &nd->nd_mrep, timo, sep->nfsess_xprt); 760 else 761 stat = CLNT_CALL_MBUF(nrp->nr_client, &ext, procnum, 762 nd->nd_mreq, &nd->nd_mrep, timo); 763 764 if (rep != NULL) { 765 /* 766 * RPC done, unlink the request. 767 */ 768 NFSLOCKREQ(); 769 TAILQ_REMOVE(&nfsd_reqq, rep, r_chain); 770 NFSUNLOCKREQ(); 771 } 772 773 /* 774 * If there was a successful reply and a tprintf msg. 775 * tprintf a response. 776 */ 777 if (stat == RPC_SUCCESS) { 778 error = 0; 779 } else if (stat == RPC_TIMEDOUT) { 780 NFSINCRGLOBAL(newnfsstats.rpctimeouts); 781 error = ETIMEDOUT; 782 } else if (stat == RPC_VERSMISMATCH) { 783 NFSINCRGLOBAL(newnfsstats.rpcinvalid); 784 error = EOPNOTSUPP; 785 } else if (stat == RPC_PROGVERSMISMATCH) { 786 NFSINCRGLOBAL(newnfsstats.rpcinvalid); 787 error = EPROTONOSUPPORT; 788 } else if (stat == RPC_INTR) { 789 error = EINTR; 790 } else { 791 NFSINCRGLOBAL(newnfsstats.rpcinvalid); 792 error = EACCES; 793 } 794 if (error) { 795 m_freem(nd->nd_mreq); 796 if (usegssname == 0) 797 AUTH_DESTROY(auth); 798 if (rep != NULL) 799 FREE((caddr_t)rep, M_NFSDREQ); 800 if (set_sigset) 801 newnfs_restore_sigmask(td, &oldset); 802 return (error); 803 } 804 805 KASSERT(nd->nd_mrep != NULL, ("mrep shouldn't be NULL if no error\n")); 806 807 /* 808 * Search for any mbufs that are not a multiple of 4 bytes long 809 * or with m_data not longword aligned. 810 * These could cause pointer alignment problems, so copy them to 811 * well aligned mbufs. 812 */ 813 newnfs_realign(&nd->nd_mrep, M_WAITOK); 814 nd->nd_md = nd->nd_mrep; 815 nd->nd_dpos = NFSMTOD(nd->nd_md, caddr_t); 816 nd->nd_repstat = 0; 817 if (nd->nd_procnum != NFSPROC_NULL && 818 nd->nd_procnum != NFSV4PROC_CBNULL) { 819 /* If sep == NULL, set it to the default in nmp. */ 820 if (sep == NULL && nmp != NULL) 821 sep = nfsmnt_mdssession(nmp); 822 /* 823 * and now the actual NFS xdr. 824 */ 825 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED); 826 nd->nd_repstat = fxdr_unsigned(u_int32_t, *tl); 827 if (nd->nd_repstat >= 10000) 828 NFSCL_DEBUG(1, "proc=%d reps=%d\n", (int)nd->nd_procnum, 829 (int)nd->nd_repstat); 830 831 /* 832 * Get rid of the tag, return count and SEQUENCE result for 833 * NFSv4. 834 */ 835 if ((nd->nd_flag & ND_NFSV4) != 0) { 836 NFSM_DISSECT(tl, u_int32_t *, NFSX_UNSIGNED); 837 i = fxdr_unsigned(int, *tl); 838 error = nfsm_advance(nd, NFSM_RNDUP(i), -1); 839 if (error) 840 goto nfsmout; 841 NFSM_DISSECT(tl, u_int32_t *, 3 * NFSX_UNSIGNED); 842 opcnt = fxdr_unsigned(int, *tl++); 843 i = fxdr_unsigned(int, *tl++); 844 j = fxdr_unsigned(int, *tl); 845 if (j >= 10000) 846 NFSCL_DEBUG(1, "fop=%d fst=%d\n", i, j); 847 /* 848 * If the first op is Sequence, free up the slot. 849 */ 850 if ((nmp != NULL && i == NFSV4OP_SEQUENCE && j != 0) || 851 (clp != NULL && i == NFSV4OP_CBSEQUENCE && j != 0)) 852 NFSCL_DEBUG(1, "failed seq=%d\n", j); 853 if (((nmp != NULL && i == NFSV4OP_SEQUENCE && j == 0) || 854 (clp != NULL && i == NFSV4OP_CBSEQUENCE && 855 j == 0)) && sep != NULL) { 856 if (i == NFSV4OP_SEQUENCE) 857 NFSM_DISSECT(tl, uint32_t *, 858 NFSX_V4SESSIONID + 859 5 * NFSX_UNSIGNED); 860 else 861 NFSM_DISSECT(tl, uint32_t *, 862 NFSX_V4SESSIONID + 863 4 * NFSX_UNSIGNED); 864 mtx_lock(&sep->nfsess_mtx); 865 if (bcmp(tl, sep->nfsess_sessionid, 866 NFSX_V4SESSIONID) == 0) { 867 tl += NFSX_V4SESSIONID / NFSX_UNSIGNED; 868 retseq = fxdr_unsigned(uint32_t, *tl++); 869 slot = fxdr_unsigned(int, *tl++); 870 freeslot = slot; 871 if (retseq != sep->nfsess_slotseq[slot]) 872 printf("retseq diff 0x%x\n", 873 retseq); 874 retval = fxdr_unsigned(uint32_t, *++tl); 875 if ((retval + 1) < sep->nfsess_foreslots 876 ) 877 sep->nfsess_foreslots = (retval 878 + 1); 879 else if ((retval + 1) > 880 sep->nfsess_foreslots) 881 sep->nfsess_foreslots = (retval 882 < 64) ? (retval + 1) : 64; 883 } 884 mtx_unlock(&sep->nfsess_mtx); 885 886 /* Grab the op and status for the next one. */ 887 if (opcnt > 1) { 888 NFSM_DISSECT(tl, uint32_t *, 889 2 * NFSX_UNSIGNED); 890 i = fxdr_unsigned(int, *tl++); 891 j = fxdr_unsigned(int, *tl); 892 } 893 } 894 } 895 if (nd->nd_repstat != 0) { 896 if (nd->nd_repstat == NFSERR_BADSESSION && 897 nmp != NULL && dssep == NULL && 898 (nd->nd_flag & ND_NFSV41) != 0) { 899 /* 900 * If this is a client side MDS RPC, mark 901 * the MDS session defunct and initiate 902 * recovery, as required. 903 * The nfsess_defunct field is protected by 904 * the NFSLOCKMNT()/nm_mtx lock and not the 905 * nfsess_mtx lock to simplify its handling, 906 * for the MDS session. This lock is also 907 * sufficient for nfsess_sessionid, since it 908 * never changes in the structure. 909 */ 910 NFSCL_DEBUG(1, "Got badsession\n"); 911 NFSLOCKCLSTATE(); 912 NFSLOCKMNT(nmp); 913 sep = NFSMNT_MDSSESSION(nmp); 914 if (bcmp(sep->nfsess_sessionid, nd->nd_sequence, 915 NFSX_V4SESSIONID) == 0) { 916 /* Initiate recovery. */ 917 sep->nfsess_defunct = 1; 918 NFSCL_DEBUG(1, "Marked defunct\n"); 919 if (nmp->nm_clp != NULL) { 920 nmp->nm_clp->nfsc_flags |= 921 NFSCLFLAGS_RECOVER; 922 wakeup(nmp->nm_clp); 923 } 924 } 925 NFSUNLOCKCLSTATE(); 926 /* 927 * Sleep for up to 1sec waiting for a new 928 * session. 929 */ 930 mtx_sleep(&nmp->nm_sess, &nmp->nm_mtx, PZERO, 931 "nfsbadsess", hz); 932 /* 933 * Get the session again, in case a new one 934 * has been created during the sleep. 935 */ 936 sep = NFSMNT_MDSSESSION(nmp); 937 NFSUNLOCKMNT(nmp); 938 if ((nd->nd_flag & ND_LOOPBADSESS) != 0) { 939 reterr = nfsv4_sequencelookup(nmp, sep, 940 &slotpos, &maxslot, &slotseq, 941 sessionid); 942 if (reterr == 0) { 943 /* Fill in new session info. */ 944 NFSCL_DEBUG(1, 945 "Filling in new sequence\n"); 946 tl = nd->nd_sequence; 947 bcopy(sessionid, tl, 948 NFSX_V4SESSIONID); 949 tl += NFSX_V4SESSIONID / 950 NFSX_UNSIGNED; 951 *tl++ = txdr_unsigned(slotseq); 952 *tl++ = txdr_unsigned(slotpos); 953 *tl = txdr_unsigned(maxslot); 954 } 955 if (reterr == NFSERR_BADSESSION || 956 reterr == 0) { 957 NFSCL_DEBUG(1, 958 "Badsession looping\n"); 959 m_freem(nd->nd_mrep); 960 nd->nd_mrep = NULL; 961 goto tryagain; 962 } 963 nd->nd_repstat = reterr; 964 NFSCL_DEBUG(1, "Got err=%d\n", reterr); 965 } 966 } 967 if (((nd->nd_repstat == NFSERR_DELAY || 968 nd->nd_repstat == NFSERR_GRACE) && 969 (nd->nd_flag & ND_NFSV4) && 970 nd->nd_procnum != NFSPROC_DELEGRETURN && 971 nd->nd_procnum != NFSPROC_SETATTR && 972 nd->nd_procnum != NFSPROC_READ && 973 nd->nd_procnum != NFSPROC_READDS && 974 nd->nd_procnum != NFSPROC_WRITE && 975 nd->nd_procnum != NFSPROC_WRITEDS && 976 nd->nd_procnum != NFSPROC_OPEN && 977 nd->nd_procnum != NFSPROC_CREATE && 978 nd->nd_procnum != NFSPROC_OPENCONFIRM && 979 nd->nd_procnum != NFSPROC_OPENDOWNGRADE && 980 nd->nd_procnum != NFSPROC_CLOSE && 981 nd->nd_procnum != NFSPROC_LOCK && 982 nd->nd_procnum != NFSPROC_LOCKU) || 983 (nd->nd_repstat == NFSERR_DELAY && 984 (nd->nd_flag & ND_NFSV4) == 0) || 985 nd->nd_repstat == NFSERR_RESOURCE) { 986 if (trylater_delay > NFS_TRYLATERDEL) 987 trylater_delay = NFS_TRYLATERDEL; 988 waituntil = NFSD_MONOSEC + trylater_delay; 989 while (NFSD_MONOSEC < waituntil) 990 (void) nfs_catnap(PZERO, 0, "nfstry"); 991 trylater_delay *= 2; 992 if (slot != -1) { 993 mtx_lock(&sep->nfsess_mtx); 994 sep->nfsess_slotseq[slot]++; 995 *nd->nd_slotseq = txdr_unsigned( 996 sep->nfsess_slotseq[slot]); 997 mtx_unlock(&sep->nfsess_mtx); 998 } 999 m_freem(nd->nd_mrep); 1000 nd->nd_mrep = NULL; 1001 goto tryagain; 1002 } 1003 1004 /* 1005 * If the File Handle was stale, invalidate the 1006 * lookup cache, just in case. 1007 * (vp != NULL implies a client side call) 1008 */ 1009 if (nd->nd_repstat == ESTALE && vp != NULL) { 1010 cache_purge(vp); 1011 if (ncl_call_invalcaches != NULL) 1012 (*ncl_call_invalcaches)(vp); 1013 } 1014 } 1015 if ((nd->nd_flag & ND_NFSV4) != 0) { 1016 /* Free the slot, as required. */ 1017 if (freeslot != -1) 1018 nfsv4_freeslot(sep, freeslot); 1019 /* 1020 * If this op is Putfh, throw its results away. 1021 */ 1022 if (j >= 10000) 1023 NFSCL_DEBUG(1, "nop=%d nst=%d\n", i, j); 1024 if (nmp != NULL && i == NFSV4OP_PUTFH && j == 0) { 1025 NFSM_DISSECT(tl,u_int32_t *,2 * NFSX_UNSIGNED); 1026 i = fxdr_unsigned(int, *tl++); 1027 j = fxdr_unsigned(int, *tl); 1028 if (j >= 10000) 1029 NFSCL_DEBUG(1, "n2op=%d n2st=%d\n", i, 1030 j); 1031 /* 1032 * All Compounds that do an Op that must 1033 * be in sequence consist of NFSV4OP_PUTFH 1034 * followed by one of these. As such, we 1035 * can determine if the seqid# should be 1036 * incremented, here. 1037 */ 1038 if ((i == NFSV4OP_OPEN || 1039 i == NFSV4OP_OPENCONFIRM || 1040 i == NFSV4OP_OPENDOWNGRADE || 1041 i == NFSV4OP_CLOSE || 1042 i == NFSV4OP_LOCK || 1043 i == NFSV4OP_LOCKU) && 1044 (j == 0 || 1045 (j != NFSERR_STALECLIENTID && 1046 j != NFSERR_STALESTATEID && 1047 j != NFSERR_BADSTATEID && 1048 j != NFSERR_BADSEQID && 1049 j != NFSERR_BADXDR && 1050 j != NFSERR_RESOURCE && 1051 j != NFSERR_NOFILEHANDLE))) 1052 nd->nd_flag |= ND_INCRSEQID; 1053 } 1054 /* 1055 * If this op's status is non-zero, mark 1056 * that there is no more data to process. 1057 * The exception is Setattr, which always has xdr 1058 * when it has failed. 1059 */ 1060 if (j != 0 && i != NFSV4OP_SETATTR) 1061 nd->nd_flag |= ND_NOMOREDATA; 1062 1063 /* 1064 * If R_DONTRECOVER is set, replace the stale error 1065 * reply, so that recovery isn't initiated. 1066 */ 1067 if ((nd->nd_repstat == NFSERR_STALECLIENTID || 1068 nd->nd_repstat == NFSERR_BADSESSION || 1069 nd->nd_repstat == NFSERR_STALESTATEID) && 1070 rep != NULL && (rep->r_flags & R_DONTRECOVER)) 1071 nd->nd_repstat = NFSERR_STALEDONTRECOVER; 1072 } 1073 } 1074 1075#ifdef KDTRACE_HOOKS 1076 if (nmp != NULL && dtrace_nfscl_nfs234_done_probe != NULL) { 1077 uint32_t probe_id; 1078 int probe_procnum; 1079 1080 if (nd->nd_flag & ND_NFSV4) { 1081 probe_id = nfscl_nfs4_done_probes[nd->nd_procnum]; 1082 probe_procnum = nd->nd_procnum; 1083 } else if (nd->nd_flag & ND_NFSV3) { 1084 probe_id = nfscl_nfs3_done_probes[procnum]; 1085 probe_procnum = procnum; 1086 } else { 1087 probe_id = nfscl_nfs2_done_probes[nd->nd_procnum]; 1088 probe_procnum = procnum; 1089 } 1090 if (probe_id != 0) 1091 (dtrace_nfscl_nfs234_done_probe)(probe_id, vp, 1092 nd->nd_mreq, cred, probe_procnum, 0); 1093 } 1094#endif 1095 1096 m_freem(nd->nd_mreq); 1097 if (usegssname == 0) 1098 AUTH_DESTROY(auth); 1099 if (rep != NULL) 1100 FREE((caddr_t)rep, M_NFSDREQ); 1101 if (set_sigset) 1102 newnfs_restore_sigmask(td, &oldset); 1103 return (0); 1104nfsmout: 1105 mbuf_freem(nd->nd_mrep); 1106 mbuf_freem(nd->nd_mreq); 1107 if (usegssname == 0) 1108 AUTH_DESTROY(auth); 1109 if (rep != NULL) 1110 FREE((caddr_t)rep, M_NFSDREQ); 1111 if (set_sigset) 1112 newnfs_restore_sigmask(td, &oldset); 1113 return (error); 1114} 1115 1116/* 1117 * Mark all of an nfs mount's outstanding requests with R_SOFTTERM and 1118 * wait for all requests to complete. This is used by forced unmounts 1119 * to terminate any outstanding RPCs. 1120 */ 1121int 1122newnfs_nmcancelreqs(struct nfsmount *nmp) 1123{ 1124 struct nfsclds *dsp; 1125 struct __rpc_client *cl; 1126 1127 if (nmp->nm_sockreq.nr_client != NULL) 1128 CLNT_CLOSE(nmp->nm_sockreq.nr_client); 1129lookformore: 1130 NFSLOCKMNT(nmp); 1131 TAILQ_FOREACH(dsp, &nmp->nm_sess, nfsclds_list) { 1132 NFSLOCKDS(dsp); 1133 if (dsp != TAILQ_FIRST(&nmp->nm_sess) && 1134 (dsp->nfsclds_flags & NFSCLDS_CLOSED) == 0 && 1135 dsp->nfsclds_sockp != NULL && 1136 dsp->nfsclds_sockp->nr_client != NULL) { 1137 dsp->nfsclds_flags |= NFSCLDS_CLOSED; 1138 cl = dsp->nfsclds_sockp->nr_client; 1139 NFSUNLOCKDS(dsp); 1140 NFSUNLOCKMNT(nmp); 1141 CLNT_CLOSE(cl); 1142 goto lookformore; 1143 } 1144 NFSUNLOCKDS(dsp); 1145 } 1146 NFSUNLOCKMNT(nmp); 1147 return (0); 1148} 1149 1150/* 1151 * Any signal that can interrupt an NFS operation in an intr mount 1152 * should be added to this set. SIGSTOP and SIGKILL cannot be masked. 1153 */ 1154int newnfs_sig_set[] = { 1155 SIGINT, 1156 SIGTERM, 1157 SIGHUP, 1158 SIGKILL, 1159 SIGQUIT 1160}; 1161 1162/* 1163 * Check to see if one of the signals in our subset is pending on 1164 * the process (in an intr mount). 1165 */ 1166static int 1167nfs_sig_pending(sigset_t set) 1168{ 1169 int i; 1170 1171 for (i = 0 ; i < sizeof(newnfs_sig_set)/sizeof(int) ; i++) 1172 if (SIGISMEMBER(set, newnfs_sig_set[i])) 1173 return (1); 1174 return (0); 1175} 1176 1177/* 1178 * The set/restore sigmask functions are used to (temporarily) overwrite 1179 * the thread td_sigmask during an RPC call (for example). These are also 1180 * used in other places in the NFS client that might tsleep(). 1181 */ 1182void 1183newnfs_set_sigmask(struct thread *td, sigset_t *oldset) 1184{ 1185 sigset_t newset; 1186 int i; 1187 struct proc *p; 1188 1189 SIGFILLSET(newset); 1190 if (td == NULL) 1191 td = curthread; /* XXX */ 1192 p = td->td_proc; 1193 /* Remove the NFS set of signals from newset */ 1194 PROC_LOCK(p); 1195 mtx_lock(&p->p_sigacts->ps_mtx); 1196 for (i = 0 ; i < sizeof(newnfs_sig_set)/sizeof(int) ; i++) { 1197 /* 1198 * But make sure we leave the ones already masked 1199 * by the process, ie. remove the signal from the 1200 * temporary signalmask only if it wasn't already 1201 * in p_sigmask. 1202 */ 1203 if (!SIGISMEMBER(td->td_sigmask, newnfs_sig_set[i]) && 1204 !SIGISMEMBER(p->p_sigacts->ps_sigignore, newnfs_sig_set[i])) 1205 SIGDELSET(newset, newnfs_sig_set[i]); 1206 } 1207 mtx_unlock(&p->p_sigacts->ps_mtx); 1208 kern_sigprocmask(td, SIG_SETMASK, &newset, oldset, 1209 SIGPROCMASK_PROC_LOCKED); 1210 PROC_UNLOCK(p); 1211} 1212 1213void 1214newnfs_restore_sigmask(struct thread *td, sigset_t *set) 1215{ 1216 if (td == NULL) 1217 td = curthread; /* XXX */ 1218 kern_sigprocmask(td, SIG_SETMASK, set, NULL, 0); 1219} 1220 1221/* 1222 * NFS wrapper to msleep(), that shoves a new p_sigmask and restores the 1223 * old one after msleep() returns. 1224 */ 1225int 1226newnfs_msleep(struct thread *td, void *ident, struct mtx *mtx, int priority, char *wmesg, int timo) 1227{ 1228 sigset_t oldset; 1229 int error; 1230 struct proc *p; 1231 1232 if ((priority & PCATCH) == 0) 1233 return msleep(ident, mtx, priority, wmesg, timo); 1234 if (td == NULL) 1235 td = curthread; /* XXX */ 1236 newnfs_set_sigmask(td, &oldset); 1237 error = msleep(ident, mtx, priority, wmesg, timo); 1238 newnfs_restore_sigmask(td, &oldset); 1239 p = td->td_proc; 1240 return (error); 1241} 1242 1243/* 1244 * Test for a termination condition pending on the process. 1245 * This is used for NFSMNT_INT mounts. 1246 */ 1247int 1248newnfs_sigintr(struct nfsmount *nmp, struct thread *td) 1249{ 1250 struct proc *p; 1251 sigset_t tmpset; 1252 1253 /* Terminate all requests while attempting a forced unmount. */ 1254 if (nmp->nm_mountp->mnt_kern_flag & MNTK_UNMOUNTF) 1255 return (EIO); 1256 if (!(nmp->nm_flag & NFSMNT_INT)) 1257 return (0); 1258 if (td == NULL) 1259 return (0); 1260 p = td->td_proc; 1261 PROC_LOCK(p); 1262 tmpset = p->p_siglist; 1263 SIGSETOR(tmpset, td->td_siglist); 1264 SIGSETNAND(tmpset, td->td_sigmask); 1265 mtx_lock(&p->p_sigacts->ps_mtx); 1266 SIGSETNAND(tmpset, p->p_sigacts->ps_sigignore); 1267 mtx_unlock(&p->p_sigacts->ps_mtx); 1268 if ((SIGNOTEMPTY(p->p_siglist) || SIGNOTEMPTY(td->td_siglist)) 1269 && nfs_sig_pending(tmpset)) { 1270 PROC_UNLOCK(p); 1271 return (EINTR); 1272 } 1273 PROC_UNLOCK(p); 1274 return (0); 1275} 1276 1277static int 1278nfs_msg(struct thread *td, const char *server, const char *msg, int error) 1279{ 1280 struct proc *p; 1281 1282 p = td ? td->td_proc : NULL; 1283 if (error) { 1284 tprintf(p, LOG_INFO, "newnfs server %s: %s, error %d\n", 1285 server, msg, error); 1286 } else { 1287 tprintf(p, LOG_INFO, "newnfs server %s: %s\n", server, msg); 1288 } 1289 return (0); 1290} 1291 1292static void 1293nfs_down(struct nfsmount *nmp, struct thread *td, const char *msg, 1294 int error, int flags) 1295{ 1296 if (nmp == NULL) 1297 return; 1298 mtx_lock(&nmp->nm_mtx); 1299 if ((flags & NFSSTA_TIMEO) && !(nmp->nm_state & NFSSTA_TIMEO)) { 1300 nmp->nm_state |= NFSSTA_TIMEO; 1301 mtx_unlock(&nmp->nm_mtx); 1302 vfs_event_signal(&nmp->nm_mountp->mnt_stat.f_fsid, 1303 VQ_NOTRESP, 0); 1304 } else 1305 mtx_unlock(&nmp->nm_mtx); 1306 mtx_lock(&nmp->nm_mtx); 1307 if ((flags & NFSSTA_LOCKTIMEO) && !(nmp->nm_state & NFSSTA_LOCKTIMEO)) { 1308 nmp->nm_state |= NFSSTA_LOCKTIMEO; 1309 mtx_unlock(&nmp->nm_mtx); 1310 vfs_event_signal(&nmp->nm_mountp->mnt_stat.f_fsid, 1311 VQ_NOTRESPLOCK, 0); 1312 } else 1313 mtx_unlock(&nmp->nm_mtx); 1314 nfs_msg(td, nmp->nm_mountp->mnt_stat.f_mntfromname, msg, error); 1315} 1316 1317static void 1318nfs_up(struct nfsmount *nmp, struct thread *td, const char *msg, 1319 int flags, int tprintfmsg) 1320{ 1321 if (nmp == NULL) 1322 return; 1323 if (tprintfmsg) { 1324 nfs_msg(td, nmp->nm_mountp->mnt_stat.f_mntfromname, msg, 0); 1325 } 1326 1327 mtx_lock(&nmp->nm_mtx); 1328 if ((flags & NFSSTA_TIMEO) && (nmp->nm_state & NFSSTA_TIMEO)) { 1329 nmp->nm_state &= ~NFSSTA_TIMEO; 1330 mtx_unlock(&nmp->nm_mtx); 1331 vfs_event_signal(&nmp->nm_mountp->mnt_stat.f_fsid, 1332 VQ_NOTRESP, 1); 1333 } else 1334 mtx_unlock(&nmp->nm_mtx); 1335 1336 mtx_lock(&nmp->nm_mtx); 1337 if ((flags & NFSSTA_LOCKTIMEO) && (nmp->nm_state & NFSSTA_LOCKTIMEO)) { 1338 nmp->nm_state &= ~NFSSTA_LOCKTIMEO; 1339 mtx_unlock(&nmp->nm_mtx); 1340 vfs_event_signal(&nmp->nm_mountp->mnt_stat.f_fsid, 1341 VQ_NOTRESPLOCK, 1); 1342 } else 1343 mtx_unlock(&nmp->nm_mtx); 1344} 1345 1346