52ec47de1185d0a4fddffa2e3ff79f66eb1fd4c9
[firefly-linux-kernel-4.4.55.git] / fs / nfsd / nfs4state.c
1 /*
2 *  Copyright (c) 2001 The Regents of the University of Michigan.
3 *  All rights reserved.
4 *
5 *  Kendrick Smith <kmsmith@umich.edu>
6 *  Andy Adamson <kandros@umich.edu>
7 *
8 *  Redistribution and use in source and binary forms, with or without
9 *  modification, are permitted provided that the following conditions
10 *  are met:
11 *
12 *  1. Redistributions of source code must retain the above copyright
13 *     notice, this list of conditions and the following disclaimer.
14 *  2. Redistributions in binary form must reproduce the above copyright
15 *     notice, this list of conditions and the following disclaimer in the
16 *     documentation and/or other materials provided with the distribution.
17 *  3. Neither the name of the University nor the names of its
18 *     contributors may be used to endorse or promote products derived
19 *     from this software without specific prior written permission.
20 *
21 *  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
22 *  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
23 *  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
24 *  DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
28 *  BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
29 *  LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
30 *  NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
31 *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 *
33 */
34
35 #include <linux/file.h>
36 #include <linux/fs.h>
37 #include <linux/slab.h>
38 #include <linux/namei.h>
39 #include <linux/swap.h>
40 #include <linux/pagemap.h>
41 #include <linux/ratelimit.h>
42 #include <linux/sunrpc/svcauth_gss.h>
43 #include <linux/sunrpc/addr.h>
44 #include <linux/hash.h>
45 #include "xdr4.h"
46 #include "xdr4cb.h"
47 #include "vfs.h"
48 #include "current_stateid.h"
49
50 #include "netns.h"
51
52 #define NFSDDBG_FACILITY                NFSDDBG_PROC
53
54 #define all_ones {{~0,~0},~0}
55 static const stateid_t one_stateid = {
56         .si_generation = ~0,
57         .si_opaque = all_ones,
58 };
59 static const stateid_t zero_stateid = {
60         /* all fields zero */
61 };
62 static const stateid_t currentstateid = {
63         .si_generation = 1,
64 };
65
66 static u64 current_sessionid = 1;
67
68 #define ZERO_STATEID(stateid) (!memcmp((stateid), &zero_stateid, sizeof(stateid_t)))
69 #define ONE_STATEID(stateid)  (!memcmp((stateid), &one_stateid, sizeof(stateid_t)))
70 #define CURRENT_STATEID(stateid) (!memcmp((stateid), &currentstateid, sizeof(stateid_t)))
71
72 /* forward declarations */
73 static bool check_for_locks(struct nfs4_file *fp, struct nfs4_lockowner *lowner);
74 static void nfs4_free_ol_stateid(struct nfs4_stid *stid);
75
76 /* Locking: */
77
78 /* Currently used for almost all code touching nfsv4 state: */
79 static DEFINE_MUTEX(client_mutex);
80
81 /*
82  * Currently used for the del_recall_lru and file hash table.  In an
83  * effort to decrease the scope of the client_mutex, this spinlock may
84  * eventually cover more:
85  */
86 static DEFINE_SPINLOCK(state_lock);
87
88 /*
89  * A waitqueue for all in-progress 4.0 CLOSE operations that are waiting for
90  * the refcount on the open stateid to drop.
91  */
92 static DECLARE_WAIT_QUEUE_HEAD(close_wq);
93
94 static struct kmem_cache *openowner_slab;
95 static struct kmem_cache *lockowner_slab;
96 static struct kmem_cache *file_slab;
97 static struct kmem_cache *stateid_slab;
98 static struct kmem_cache *deleg_slab;
99
100 void
101 nfs4_lock_state(void)
102 {
103         mutex_lock(&client_mutex);
104 }
105
106 static void free_session(struct nfsd4_session *);
107
108 static bool is_session_dead(struct nfsd4_session *ses)
109 {
110         return ses->se_flags & NFS4_SESSION_DEAD;
111 }
112
113 static __be32 mark_session_dead_locked(struct nfsd4_session *ses, int ref_held_by_me)
114 {
115         if (atomic_read(&ses->se_ref) > ref_held_by_me)
116                 return nfserr_jukebox;
117         ses->se_flags |= NFS4_SESSION_DEAD;
118         return nfs_ok;
119 }
120
121 void
122 nfs4_unlock_state(void)
123 {
124         mutex_unlock(&client_mutex);
125 }
126
127 static bool is_client_expired(struct nfs4_client *clp)
128 {
129         return clp->cl_time == 0;
130 }
131
132 static __be32 mark_client_expired_locked(struct nfs4_client *clp)
133 {
134         if (atomic_read(&clp->cl_refcount))
135                 return nfserr_jukebox;
136         clp->cl_time = 0;
137         return nfs_ok;
138 }
139
140 static __be32 mark_client_expired(struct nfs4_client *clp)
141 {
142         struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
143         __be32 ret;
144
145         spin_lock(&nn->client_lock);
146         ret = mark_client_expired_locked(clp);
147         spin_unlock(&nn->client_lock);
148         return ret;
149 }
150
151 static __be32 get_client_locked(struct nfs4_client *clp)
152 {
153         if (is_client_expired(clp))
154                 return nfserr_expired;
155         atomic_inc(&clp->cl_refcount);
156         return nfs_ok;
157 }
158
159 /* must be called under the client_lock */
160 static inline void
161 renew_client_locked(struct nfs4_client *clp)
162 {
163         struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
164
165         if (is_client_expired(clp)) {
166                 WARN_ON(1);
167                 printk("%s: client (clientid %08x/%08x) already expired\n",
168                         __func__,
169                         clp->cl_clientid.cl_boot,
170                         clp->cl_clientid.cl_id);
171                 return;
172         }
173
174         dprintk("renewing client (clientid %08x/%08x)\n",
175                         clp->cl_clientid.cl_boot,
176                         clp->cl_clientid.cl_id);
177         list_move_tail(&clp->cl_lru, &nn->client_lru);
178         clp->cl_time = get_seconds();
179 }
180
181 static inline void
182 renew_client(struct nfs4_client *clp)
183 {
184         struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
185
186         spin_lock(&nn->client_lock);
187         renew_client_locked(clp);
188         spin_unlock(&nn->client_lock);
189 }
190
191 static void put_client_renew_locked(struct nfs4_client *clp)
192 {
193         if (!atomic_dec_and_test(&clp->cl_refcount))
194                 return;
195         if (!is_client_expired(clp))
196                 renew_client_locked(clp);
197 }
198
199 static void put_client_renew(struct nfs4_client *clp)
200 {
201         struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
202
203         if (!atomic_dec_and_lock(&clp->cl_refcount, &nn->client_lock))
204                 return;
205         if (!is_client_expired(clp))
206                 renew_client_locked(clp);
207         spin_unlock(&nn->client_lock);
208 }
209
210 static __be32 nfsd4_get_session_locked(struct nfsd4_session *ses)
211 {
212         __be32 status;
213
214         if (is_session_dead(ses))
215                 return nfserr_badsession;
216         status = get_client_locked(ses->se_client);
217         if (status)
218                 return status;
219         atomic_inc(&ses->se_ref);
220         return nfs_ok;
221 }
222
223 static void nfsd4_put_session_locked(struct nfsd4_session *ses)
224 {
225         struct nfs4_client *clp = ses->se_client;
226
227         if (atomic_dec_and_test(&ses->se_ref) && is_session_dead(ses))
228                 free_session(ses);
229         put_client_renew_locked(clp);
230 }
231
232 static void nfsd4_put_session(struct nfsd4_session *ses)
233 {
234         struct nfs4_client *clp = ses->se_client;
235         struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
236
237         spin_lock(&nn->client_lock);
238         nfsd4_put_session_locked(ses);
239         spin_unlock(&nn->client_lock);
240 }
241
242 static int
243 same_owner_str(struct nfs4_stateowner *sop, struct xdr_netobj *owner)
244 {
245         return (sop->so_owner.len == owner->len) &&
246                 0 == memcmp(sop->so_owner.data, owner->data, owner->len);
247 }
248
249 static struct nfs4_openowner *
250 find_openstateowner_str_locked(unsigned int hashval, struct nfsd4_open *open,
251                         struct nfs4_client *clp)
252 {
253         struct nfs4_stateowner *so;
254
255         lockdep_assert_held(&clp->cl_lock);
256
257         list_for_each_entry(so, &clp->cl_ownerstr_hashtbl[hashval],
258                             so_strhash) {
259                 if (!so->so_is_open_owner)
260                         continue;
261                 if (same_owner_str(so, &open->op_owner)) {
262                         atomic_inc(&so->so_count);
263                         return openowner(so);
264                 }
265         }
266         return NULL;
267 }
268
269 static struct nfs4_openowner *
270 find_openstateowner_str(unsigned int hashval, struct nfsd4_open *open,
271                         struct nfs4_client *clp)
272 {
273         struct nfs4_openowner *oo;
274
275         spin_lock(&clp->cl_lock);
276         oo = find_openstateowner_str_locked(hashval, open, clp);
277         spin_unlock(&clp->cl_lock);
278         return oo;
279 }
280
281 static inline u32
282 opaque_hashval(const void *ptr, int nbytes)
283 {
284         unsigned char *cptr = (unsigned char *) ptr;
285
286         u32 x = 0;
287         while (nbytes--) {
288                 x *= 37;
289                 x += *cptr++;
290         }
291         return x;
292 }
293
294 static void nfsd4_free_file(struct nfs4_file *f)
295 {
296         kmem_cache_free(file_slab, f);
297 }
298
299 static inline void
300 put_nfs4_file(struct nfs4_file *fi)
301 {
302         might_lock(&state_lock);
303
304         if (atomic_dec_and_lock(&fi->fi_ref, &state_lock)) {
305                 hlist_del(&fi->fi_hash);
306                 spin_unlock(&state_lock);
307                 nfsd4_free_file(fi);
308         }
309 }
310
311 static inline void
312 get_nfs4_file(struct nfs4_file *fi)
313 {
314         atomic_inc(&fi->fi_ref);
315 }
316
317 static struct file *
318 __nfs4_get_fd(struct nfs4_file *f, int oflag)
319 {
320         if (f->fi_fds[oflag])
321                 return get_file(f->fi_fds[oflag]);
322         return NULL;
323 }
324
325 static struct file *
326 find_writeable_file_locked(struct nfs4_file *f)
327 {
328         struct file *ret;
329
330         lockdep_assert_held(&f->fi_lock);
331
332         ret = __nfs4_get_fd(f, O_WRONLY);
333         if (!ret)
334                 ret = __nfs4_get_fd(f, O_RDWR);
335         return ret;
336 }
337
338 static struct file *
339 find_writeable_file(struct nfs4_file *f)
340 {
341         struct file *ret;
342
343         spin_lock(&f->fi_lock);
344         ret = find_writeable_file_locked(f);
345         spin_unlock(&f->fi_lock);
346
347         return ret;
348 }
349
350 static struct file *find_readable_file_locked(struct nfs4_file *f)
351 {
352         struct file *ret;
353
354         lockdep_assert_held(&f->fi_lock);
355
356         ret = __nfs4_get_fd(f, O_RDONLY);
357         if (!ret)
358                 ret = __nfs4_get_fd(f, O_RDWR);
359         return ret;
360 }
361
362 static struct file *
363 find_readable_file(struct nfs4_file *f)
364 {
365         struct file *ret;
366
367         spin_lock(&f->fi_lock);
368         ret = find_readable_file_locked(f);
369         spin_unlock(&f->fi_lock);
370
371         return ret;
372 }
373
374 static struct file *
375 find_any_file(struct nfs4_file *f)
376 {
377         struct file *ret;
378
379         spin_lock(&f->fi_lock);
380         ret = __nfs4_get_fd(f, O_RDWR);
381         if (!ret) {
382                 ret = __nfs4_get_fd(f, O_WRONLY);
383                 if (!ret)
384                         ret = __nfs4_get_fd(f, O_RDONLY);
385         }
386         spin_unlock(&f->fi_lock);
387         return ret;
388 }
389
390 static atomic_long_t num_delegations;
391 unsigned long max_delegations;
392
393 /*
394  * Open owner state (share locks)
395  */
396
397 /* hash tables for lock and open owners */
398 #define OWNER_HASH_BITS              8
399 #define OWNER_HASH_SIZE             (1 << OWNER_HASH_BITS)
400 #define OWNER_HASH_MASK             (OWNER_HASH_SIZE - 1)
401
402 static unsigned int ownerstr_hashval(struct xdr_netobj *ownername)
403 {
404         unsigned int ret;
405
406         ret = opaque_hashval(ownername->data, ownername->len);
407         return ret & OWNER_HASH_MASK;
408 }
409
410 /* hash table for nfs4_file */
411 #define FILE_HASH_BITS                   8
412 #define FILE_HASH_SIZE                  (1 << FILE_HASH_BITS)
413
414 static unsigned int nfsd_fh_hashval(struct knfsd_fh *fh)
415 {
416         return jhash2(fh->fh_base.fh_pad, XDR_QUADLEN(fh->fh_size), 0);
417 }
418
419 static unsigned int file_hashval(struct knfsd_fh *fh)
420 {
421         return nfsd_fh_hashval(fh) & (FILE_HASH_SIZE - 1);
422 }
423
424 static bool nfsd_fh_match(struct knfsd_fh *fh1, struct knfsd_fh *fh2)
425 {
426         return fh1->fh_size == fh2->fh_size &&
427                 !memcmp(fh1->fh_base.fh_pad,
428                                 fh2->fh_base.fh_pad,
429                                 fh1->fh_size);
430 }
431
432 static struct hlist_head file_hashtbl[FILE_HASH_SIZE];
433
434 static void
435 __nfs4_file_get_access(struct nfs4_file *fp, u32 access)
436 {
437         lockdep_assert_held(&fp->fi_lock);
438
439         if (access & NFS4_SHARE_ACCESS_WRITE)
440                 atomic_inc(&fp->fi_access[O_WRONLY]);
441         if (access & NFS4_SHARE_ACCESS_READ)
442                 atomic_inc(&fp->fi_access[O_RDONLY]);
443 }
444
445 static __be32
446 nfs4_file_get_access(struct nfs4_file *fp, u32 access)
447 {
448         lockdep_assert_held(&fp->fi_lock);
449
450         /* Does this access mode make sense? */
451         if (access & ~NFS4_SHARE_ACCESS_BOTH)
452                 return nfserr_inval;
453
454         /* Does it conflict with a deny mode already set? */
455         if ((access & fp->fi_share_deny) != 0)
456                 return nfserr_share_denied;
457
458         __nfs4_file_get_access(fp, access);
459         return nfs_ok;
460 }
461
462 static __be32 nfs4_file_check_deny(struct nfs4_file *fp, u32 deny)
463 {
464         /* Common case is that there is no deny mode. */
465         if (deny) {
466                 /* Does this deny mode make sense? */
467                 if (deny & ~NFS4_SHARE_DENY_BOTH)
468                         return nfserr_inval;
469
470                 if ((deny & NFS4_SHARE_DENY_READ) &&
471                     atomic_read(&fp->fi_access[O_RDONLY]))
472                         return nfserr_share_denied;
473
474                 if ((deny & NFS4_SHARE_DENY_WRITE) &&
475                     atomic_read(&fp->fi_access[O_WRONLY]))
476                         return nfserr_share_denied;
477         }
478         return nfs_ok;
479 }
480
481 static void __nfs4_file_put_access(struct nfs4_file *fp, int oflag)
482 {
483         might_lock(&fp->fi_lock);
484
485         if (atomic_dec_and_lock(&fp->fi_access[oflag], &fp->fi_lock)) {
486                 struct file *f1 = NULL;
487                 struct file *f2 = NULL;
488
489                 swap(f1, fp->fi_fds[oflag]);
490                 if (atomic_read(&fp->fi_access[1 - oflag]) == 0)
491                         swap(f2, fp->fi_fds[O_RDWR]);
492                 spin_unlock(&fp->fi_lock);
493                 if (f1)
494                         fput(f1);
495                 if (f2)
496                         fput(f2);
497         }
498 }
499
500 static void nfs4_file_put_access(struct nfs4_file *fp, u32 access)
501 {
502         WARN_ON_ONCE(access & ~NFS4_SHARE_ACCESS_BOTH);
503
504         if (access & NFS4_SHARE_ACCESS_WRITE)
505                 __nfs4_file_put_access(fp, O_WRONLY);
506         if (access & NFS4_SHARE_ACCESS_READ)
507                 __nfs4_file_put_access(fp, O_RDONLY);
508 }
509
510 static struct nfs4_stid *nfs4_alloc_stid(struct nfs4_client *cl,
511                                          struct kmem_cache *slab)
512 {
513         struct nfs4_stid *stid;
514         int new_id;
515
516         stid = kmem_cache_zalloc(slab, GFP_KERNEL);
517         if (!stid)
518                 return NULL;
519
520         idr_preload(GFP_KERNEL);
521         spin_lock(&cl->cl_lock);
522         new_id = idr_alloc_cyclic(&cl->cl_stateids, stid, 0, 0, GFP_NOWAIT);
523         spin_unlock(&cl->cl_lock);
524         idr_preload_end();
525         if (new_id < 0)
526                 goto out_free;
527         stid->sc_client = cl;
528         stid->sc_stateid.si_opaque.so_id = new_id;
529         stid->sc_stateid.si_opaque.so_clid = cl->cl_clientid;
530         /* Will be incremented before return to client: */
531         atomic_set(&stid->sc_count, 1);
532
533         /*
534          * It shouldn't be a problem to reuse an opaque stateid value.
535          * I don't think it is for 4.1.  But with 4.0 I worry that, for
536          * example, a stray write retransmission could be accepted by
537          * the server when it should have been rejected.  Therefore,
538          * adopt a trick from the sctp code to attempt to maximize the
539          * amount of time until an id is reused, by ensuring they always
540          * "increase" (mod INT_MAX):
541          */
542         return stid;
543 out_free:
544         kmem_cache_free(slab, stid);
545         return NULL;
546 }
547
548 static struct nfs4_ol_stateid * nfs4_alloc_open_stateid(struct nfs4_client *clp)
549 {
550         struct nfs4_stid *stid;
551         struct nfs4_ol_stateid *stp;
552
553         stid = nfs4_alloc_stid(clp, stateid_slab);
554         if (!stid)
555                 return NULL;
556
557         stp = openlockstateid(stid);
558         stp->st_stid.sc_free = nfs4_free_ol_stateid;
559         return stp;
560 }
561
562 static void nfs4_free_deleg(struct nfs4_stid *stid)
563 {
564         kmem_cache_free(deleg_slab, stid);
565         atomic_long_dec(&num_delegations);
566 }
567
568 /*
569  * When we recall a delegation, we should be careful not to hand it
570  * out again straight away.
571  * To ensure this we keep a pair of bloom filters ('new' and 'old')
572  * in which the filehandles of recalled delegations are "stored".
573  * If a filehandle appear in either filter, a delegation is blocked.
574  * When a delegation is recalled, the filehandle is stored in the "new"
575  * filter.
576  * Every 30 seconds we swap the filters and clear the "new" one,
577  * unless both are empty of course.
578  *
579  * Each filter is 256 bits.  We hash the filehandle to 32bit and use the
580  * low 3 bytes as hash-table indices.
581  *
582  * 'blocked_delegations_lock', which is always taken in block_delegations(),
583  * is used to manage concurrent access.  Testing does not need the lock
584  * except when swapping the two filters.
585  */
586 static DEFINE_SPINLOCK(blocked_delegations_lock);
587 static struct bloom_pair {
588         int     entries, old_entries;
589         time_t  swap_time;
590         int     new; /* index into 'set' */
591         DECLARE_BITMAP(set[2], 256);
592 } blocked_delegations;
593
594 static int delegation_blocked(struct knfsd_fh *fh)
595 {
596         u32 hash;
597         struct bloom_pair *bd = &blocked_delegations;
598
599         if (bd->entries == 0)
600                 return 0;
601         if (seconds_since_boot() - bd->swap_time > 30) {
602                 spin_lock(&blocked_delegations_lock);
603                 if (seconds_since_boot() - bd->swap_time > 30) {
604                         bd->entries -= bd->old_entries;
605                         bd->old_entries = bd->entries;
606                         memset(bd->set[bd->new], 0,
607                                sizeof(bd->set[0]));
608                         bd->new = 1-bd->new;
609                         bd->swap_time = seconds_since_boot();
610                 }
611                 spin_unlock(&blocked_delegations_lock);
612         }
613         hash = arch_fast_hash(&fh->fh_base, fh->fh_size, 0);
614         if (test_bit(hash&255, bd->set[0]) &&
615             test_bit((hash>>8)&255, bd->set[0]) &&
616             test_bit((hash>>16)&255, bd->set[0]))
617                 return 1;
618
619         if (test_bit(hash&255, bd->set[1]) &&
620             test_bit((hash>>8)&255, bd->set[1]) &&
621             test_bit((hash>>16)&255, bd->set[1]))
622                 return 1;
623
624         return 0;
625 }
626
627 static void block_delegations(struct knfsd_fh *fh)
628 {
629         u32 hash;
630         struct bloom_pair *bd = &blocked_delegations;
631
632         hash = arch_fast_hash(&fh->fh_base, fh->fh_size, 0);
633
634         spin_lock(&blocked_delegations_lock);
635         __set_bit(hash&255, bd->set[bd->new]);
636         __set_bit((hash>>8)&255, bd->set[bd->new]);
637         __set_bit((hash>>16)&255, bd->set[bd->new]);
638         if (bd->entries == 0)
639                 bd->swap_time = seconds_since_boot();
640         bd->entries += 1;
641         spin_unlock(&blocked_delegations_lock);
642 }
643
644 static struct nfs4_delegation *
645 alloc_init_deleg(struct nfs4_client *clp, struct svc_fh *current_fh)
646 {
647         struct nfs4_delegation *dp;
648         long n;
649
650         dprintk("NFSD alloc_init_deleg\n");
651         n = atomic_long_inc_return(&num_delegations);
652         if (n < 0 || n > max_delegations)
653                 goto out_dec;
654         if (delegation_blocked(&current_fh->fh_handle))
655                 goto out_dec;
656         dp = delegstateid(nfs4_alloc_stid(clp, deleg_slab));
657         if (dp == NULL)
658                 goto out_dec;
659
660         dp->dl_stid.sc_free = nfs4_free_deleg;
661         /*
662          * delegation seqid's are never incremented.  The 4.1 special
663          * meaning of seqid 0 isn't meaningful, really, but let's avoid
664          * 0 anyway just for consistency and use 1:
665          */
666         dp->dl_stid.sc_stateid.si_generation = 1;
667         INIT_LIST_HEAD(&dp->dl_perfile);
668         INIT_LIST_HEAD(&dp->dl_perclnt);
669         INIT_LIST_HEAD(&dp->dl_recall_lru);
670         dp->dl_type = NFS4_OPEN_DELEGATE_READ;
671         INIT_WORK(&dp->dl_recall.cb_work, nfsd4_run_cb_recall);
672         return dp;
673 out_dec:
674         atomic_long_dec(&num_delegations);
675         return NULL;
676 }
677
678 void
679 nfs4_put_stid(struct nfs4_stid *s)
680 {
681         struct nfs4_file *fp = s->sc_file;
682         struct nfs4_client *clp = s->sc_client;
683
684         might_lock(&clp->cl_lock);
685
686         if (!atomic_dec_and_lock(&s->sc_count, &clp->cl_lock)) {
687                 wake_up_all(&close_wq);
688                 return;
689         }
690         idr_remove(&clp->cl_stateids, s->sc_stateid.si_opaque.so_id);
691         spin_unlock(&clp->cl_lock);
692         s->sc_free(s);
693         if (fp)
694                 put_nfs4_file(fp);
695 }
696
697 static void nfs4_put_deleg_lease(struct nfs4_file *fp)
698 {
699         lockdep_assert_held(&state_lock);
700
701         if (!fp->fi_lease)
702                 return;
703         if (atomic_dec_and_test(&fp->fi_delegees)) {
704                 vfs_setlease(fp->fi_deleg_file, F_UNLCK, &fp->fi_lease);
705                 fp->fi_lease = NULL;
706                 fput(fp->fi_deleg_file);
707                 fp->fi_deleg_file = NULL;
708         }
709 }
710
711 static void unhash_stid(struct nfs4_stid *s)
712 {
713         s->sc_type = 0;
714 }
715
716 static void
717 hash_delegation_locked(struct nfs4_delegation *dp, struct nfs4_file *fp)
718 {
719         lockdep_assert_held(&state_lock);
720         lockdep_assert_held(&fp->fi_lock);
721
722         atomic_inc(&dp->dl_stid.sc_count);
723         dp->dl_stid.sc_type = NFS4_DELEG_STID;
724         list_add(&dp->dl_perfile, &fp->fi_delegations);
725         list_add(&dp->dl_perclnt, &dp->dl_stid.sc_client->cl_delegations);
726 }
727
728 static void
729 unhash_delegation_locked(struct nfs4_delegation *dp)
730 {
731         struct nfs4_file *fp = dp->dl_stid.sc_file;
732
733         lockdep_assert_held(&state_lock);
734
735         dp->dl_stid.sc_type = NFS4_CLOSED_DELEG_STID;
736         /* Ensure that deleg break won't try to requeue it */
737         ++dp->dl_time;
738         spin_lock(&fp->fi_lock);
739         list_del_init(&dp->dl_perclnt);
740         list_del_init(&dp->dl_recall_lru);
741         list_del_init(&dp->dl_perfile);
742         spin_unlock(&fp->fi_lock);
743         if (fp)
744                 nfs4_put_deleg_lease(fp);
745 }
746
747 static void destroy_delegation(struct nfs4_delegation *dp)
748 {
749         spin_lock(&state_lock);
750         unhash_delegation_locked(dp);
751         spin_unlock(&state_lock);
752         nfs4_put_stid(&dp->dl_stid);
753 }
754
755 static void revoke_delegation(struct nfs4_delegation *dp)
756 {
757         struct nfs4_client *clp = dp->dl_stid.sc_client;
758
759         WARN_ON(!list_empty(&dp->dl_recall_lru));
760
761         if (clp->cl_minorversion == 0)
762                 nfs4_put_stid(&dp->dl_stid);
763         else {
764                 dp->dl_stid.sc_type = NFS4_REVOKED_DELEG_STID;
765                 spin_lock(&clp->cl_lock);
766                 list_add(&dp->dl_recall_lru, &clp->cl_revoked);
767                 spin_unlock(&clp->cl_lock);
768         }
769 }
770
771 /* 
772  * SETCLIENTID state 
773  */
774
775 static unsigned int clientid_hashval(u32 id)
776 {
777         return id & CLIENT_HASH_MASK;
778 }
779
780 static unsigned int clientstr_hashval(const char *name)
781 {
782         return opaque_hashval(name, 8) & CLIENT_HASH_MASK;
783 }
784
785 /*
786  * We store the NONE, READ, WRITE, and BOTH bits separately in the
787  * st_{access,deny}_bmap field of the stateid, in order to track not
788  * only what share bits are currently in force, but also what
789  * combinations of share bits previous opens have used.  This allows us
790  * to enforce the recommendation of rfc 3530 14.2.19 that the server
791  * return an error if the client attempt to downgrade to a combination
792  * of share bits not explicable by closing some of its previous opens.
793  *
794  * XXX: This enforcement is actually incomplete, since we don't keep
795  * track of access/deny bit combinations; so, e.g., we allow:
796  *
797  *      OPEN allow read, deny write
798  *      OPEN allow both, deny none
799  *      DOWNGRADE allow read, deny none
800  *
801  * which we should reject.
802  */
803 static unsigned int
804 bmap_to_share_mode(unsigned long bmap) {
805         int i;
806         unsigned int access = 0;
807
808         for (i = 1; i < 4; i++) {
809                 if (test_bit(i, &bmap))
810                         access |= i;
811         }
812         return access;
813 }
814
815 /* set share access for a given stateid */
816 static inline void
817 set_access(u32 access, struct nfs4_ol_stateid *stp)
818 {
819         unsigned char mask = 1 << access;
820
821         WARN_ON_ONCE(access > NFS4_SHARE_ACCESS_BOTH);
822         stp->st_access_bmap |= mask;
823 }
824
825 /* clear share access for a given stateid */
826 static inline void
827 clear_access(u32 access, struct nfs4_ol_stateid *stp)
828 {
829         unsigned char mask = 1 << access;
830
831         WARN_ON_ONCE(access > NFS4_SHARE_ACCESS_BOTH);
832         stp->st_access_bmap &= ~mask;
833 }
834
835 /* test whether a given stateid has access */
836 static inline bool
837 test_access(u32 access, struct nfs4_ol_stateid *stp)
838 {
839         unsigned char mask = 1 << access;
840
841         return (bool)(stp->st_access_bmap & mask);
842 }
843
844 /* set share deny for a given stateid */
845 static inline void
846 set_deny(u32 deny, struct nfs4_ol_stateid *stp)
847 {
848         unsigned char mask = 1 << deny;
849
850         WARN_ON_ONCE(deny > NFS4_SHARE_DENY_BOTH);
851         stp->st_deny_bmap |= mask;
852 }
853
854 /* clear share deny for a given stateid */
855 static inline void
856 clear_deny(u32 deny, struct nfs4_ol_stateid *stp)
857 {
858         unsigned char mask = 1 << deny;
859
860         WARN_ON_ONCE(deny > NFS4_SHARE_DENY_BOTH);
861         stp->st_deny_bmap &= ~mask;
862 }
863
864 /* test whether a given stateid is denying specific access */
865 static inline bool
866 test_deny(u32 deny, struct nfs4_ol_stateid *stp)
867 {
868         unsigned char mask = 1 << deny;
869
870         return (bool)(stp->st_deny_bmap & mask);
871 }
872
873 static int nfs4_access_to_omode(u32 access)
874 {
875         switch (access & NFS4_SHARE_ACCESS_BOTH) {
876         case NFS4_SHARE_ACCESS_READ:
877                 return O_RDONLY;
878         case NFS4_SHARE_ACCESS_WRITE:
879                 return O_WRONLY;
880         case NFS4_SHARE_ACCESS_BOTH:
881                 return O_RDWR;
882         }
883         WARN_ON_ONCE(1);
884         return O_RDONLY;
885 }
886
887 /*
888  * A stateid that had a deny mode associated with it is being released
889  * or downgraded. Recalculate the deny mode on the file.
890  */
891 static void
892 recalculate_deny_mode(struct nfs4_file *fp)
893 {
894         struct nfs4_ol_stateid *stp;
895
896         spin_lock(&fp->fi_lock);
897         fp->fi_share_deny = 0;
898         list_for_each_entry(stp, &fp->fi_stateids, st_perfile)
899                 fp->fi_share_deny |= bmap_to_share_mode(stp->st_deny_bmap);
900         spin_unlock(&fp->fi_lock);
901 }
902
903 static void
904 reset_union_bmap_deny(u32 deny, struct nfs4_ol_stateid *stp)
905 {
906         int i;
907         bool change = false;
908
909         for (i = 1; i < 4; i++) {
910                 if ((i & deny) != i) {
911                         change = true;
912                         clear_deny(i, stp);
913                 }
914         }
915
916         /* Recalculate per-file deny mode if there was a change */
917         if (change)
918                 recalculate_deny_mode(stp->st_stid.sc_file);
919 }
920
921 /* release all access and file references for a given stateid */
922 static void
923 release_all_access(struct nfs4_ol_stateid *stp)
924 {
925         int i;
926         struct nfs4_file *fp = stp->st_stid.sc_file;
927
928         if (fp && stp->st_deny_bmap != 0)
929                 recalculate_deny_mode(fp);
930
931         for (i = 1; i < 4; i++) {
932                 if (test_access(i, stp))
933                         nfs4_file_put_access(stp->st_stid.sc_file, i);
934                 clear_access(i, stp);
935         }
936 }
937
938 static void nfs4_put_stateowner(struct nfs4_stateowner *sop)
939 {
940         struct nfs4_client *clp = sop->so_client;
941
942         might_lock(&clp->cl_lock);
943
944         if (!atomic_dec_and_lock(&sop->so_count, &clp->cl_lock))
945                 return;
946         sop->so_ops->so_unhash(sop);
947         spin_unlock(&clp->cl_lock);
948         kfree(sop->so_owner.data);
949         sop->so_ops->so_free(sop);
950 }
951
952 static void unhash_ol_stateid(struct nfs4_ol_stateid *stp)
953 {
954         struct nfs4_file *fp = stp->st_stid.sc_file;
955
956         lockdep_assert_held(&stp->st_stateowner->so_client->cl_lock);
957
958         spin_lock(&fp->fi_lock);
959         list_del(&stp->st_perfile);
960         spin_unlock(&fp->fi_lock);
961         list_del(&stp->st_perstateowner);
962 }
963
964 static void nfs4_free_ol_stateid(struct nfs4_stid *stid)
965 {
966         struct nfs4_ol_stateid *stp = openlockstateid(stid);
967
968         release_all_access(stp);
969         if (stp->st_stateowner)
970                 nfs4_put_stateowner(stp->st_stateowner);
971         kmem_cache_free(stateid_slab, stid);
972 }
973
974 static void nfs4_free_lock_stateid(struct nfs4_stid *stid)
975 {
976         struct nfs4_ol_stateid *stp = openlockstateid(stid);
977         struct nfs4_lockowner *lo = lockowner(stp->st_stateowner);
978         struct file *file;
979
980         file = find_any_file(stp->st_stid.sc_file);
981         if (file)
982                 filp_close(file, (fl_owner_t)lo);
983         nfs4_free_ol_stateid(stid);
984 }
985
986 /*
987  * Put the persistent reference to an already unhashed generic stateid, while
988  * holding the cl_lock. If it's the last reference, then put it onto the
989  * reaplist for later destruction.
990  */
991 static void put_ol_stateid_locked(struct nfs4_ol_stateid *stp,
992                                        struct list_head *reaplist)
993 {
994         struct nfs4_stid *s = &stp->st_stid;
995         struct nfs4_client *clp = s->sc_client;
996
997         lockdep_assert_held(&clp->cl_lock);
998
999         WARN_ON_ONCE(!list_empty(&stp->st_locks));
1000
1001         if (!atomic_dec_and_test(&s->sc_count)) {
1002                 wake_up_all(&close_wq);
1003                 return;
1004         }
1005
1006         idr_remove(&clp->cl_stateids, s->sc_stateid.si_opaque.so_id);
1007         list_add(&stp->st_locks, reaplist);
1008 }
1009
1010 static void unhash_lock_stateid(struct nfs4_ol_stateid *stp)
1011 {
1012         struct nfs4_openowner *oo = openowner(stp->st_openstp->st_stateowner);
1013
1014         lockdep_assert_held(&oo->oo_owner.so_client->cl_lock);
1015
1016         list_del_init(&stp->st_locks);
1017         unhash_ol_stateid(stp);
1018         unhash_stid(&stp->st_stid);
1019 }
1020
1021 static void release_lock_stateid(struct nfs4_ol_stateid *stp)
1022 {
1023         struct nfs4_openowner *oo = openowner(stp->st_openstp->st_stateowner);
1024
1025         spin_lock(&oo->oo_owner.so_client->cl_lock);
1026         unhash_lock_stateid(stp);
1027         spin_unlock(&oo->oo_owner.so_client->cl_lock);
1028         nfs4_put_stid(&stp->st_stid);
1029 }
1030
1031 static void unhash_lockowner_locked(struct nfs4_lockowner *lo)
1032 {
1033         struct nfs4_client *clp = lo->lo_owner.so_client;
1034
1035         lockdep_assert_held(&clp->cl_lock);
1036
1037         list_del_init(&lo->lo_owner.so_strhash);
1038 }
1039
1040 /*
1041  * Free a list of generic stateids that were collected earlier after being
1042  * fully unhashed.
1043  */
1044 static void
1045 free_ol_stateid_reaplist(struct list_head *reaplist)
1046 {
1047         struct nfs4_ol_stateid *stp;
1048
1049         might_sleep();
1050
1051         while (!list_empty(reaplist)) {
1052                 stp = list_first_entry(reaplist, struct nfs4_ol_stateid,
1053                                        st_locks);
1054                 list_del(&stp->st_locks);
1055                 stp->st_stid.sc_free(&stp->st_stid);
1056         }
1057 }
1058
1059 static void release_lockowner(struct nfs4_lockowner *lo)
1060 {
1061         struct nfs4_client *clp = lo->lo_owner.so_client;
1062         struct nfs4_ol_stateid *stp;
1063         struct list_head reaplist;
1064
1065         INIT_LIST_HEAD(&reaplist);
1066
1067         spin_lock(&clp->cl_lock);
1068         unhash_lockowner_locked(lo);
1069         while (!list_empty(&lo->lo_owner.so_stateids)) {
1070                 stp = list_first_entry(&lo->lo_owner.so_stateids,
1071                                 struct nfs4_ol_stateid, st_perstateowner);
1072                 unhash_lock_stateid(stp);
1073                 put_ol_stateid_locked(stp, &reaplist);
1074         }
1075         spin_unlock(&clp->cl_lock);
1076         free_ol_stateid_reaplist(&reaplist);
1077         nfs4_put_stateowner(&lo->lo_owner);
1078 }
1079
1080 static void release_open_stateid_locks(struct nfs4_ol_stateid *open_stp,
1081                                        struct list_head *reaplist)
1082 {
1083         struct nfs4_ol_stateid *stp;
1084
1085         while (!list_empty(&open_stp->st_locks)) {
1086                 stp = list_entry(open_stp->st_locks.next,
1087                                 struct nfs4_ol_stateid, st_locks);
1088                 unhash_lock_stateid(stp);
1089                 put_ol_stateid_locked(stp, reaplist);
1090         }
1091 }
1092
1093 static void unhash_open_stateid(struct nfs4_ol_stateid *stp,
1094                                 struct list_head *reaplist)
1095 {
1096         lockdep_assert_held(&stp->st_stid.sc_client->cl_lock);
1097
1098         unhash_ol_stateid(stp);
1099         release_open_stateid_locks(stp, reaplist);
1100 }
1101
1102 static void release_open_stateid(struct nfs4_ol_stateid *stp)
1103 {
1104         LIST_HEAD(reaplist);
1105
1106         spin_lock(&stp->st_stid.sc_client->cl_lock);
1107         unhash_open_stateid(stp, &reaplist);
1108         put_ol_stateid_locked(stp, &reaplist);
1109         spin_unlock(&stp->st_stid.sc_client->cl_lock);
1110         free_ol_stateid_reaplist(&reaplist);
1111 }
1112
1113 static void unhash_openowner_locked(struct nfs4_openowner *oo)
1114 {
1115         struct nfs4_client *clp = oo->oo_owner.so_client;
1116
1117         lockdep_assert_held(&clp->cl_lock);
1118
1119         list_del_init(&oo->oo_owner.so_strhash);
1120         list_del_init(&oo->oo_perclient);
1121 }
1122
1123 static void release_last_closed_stateid(struct nfs4_openowner *oo)
1124 {
1125         struct nfs4_ol_stateid *s = oo->oo_last_closed_stid;
1126
1127         if (s) {
1128                 list_del_init(&oo->oo_close_lru);
1129                 oo->oo_last_closed_stid = NULL;
1130                 nfs4_put_stid(&s->st_stid);
1131         }
1132 }
1133
1134 static void release_openowner(struct nfs4_openowner *oo)
1135 {
1136         struct nfs4_ol_stateid *stp;
1137         struct nfs4_client *clp = oo->oo_owner.so_client;
1138         struct list_head reaplist;
1139
1140         INIT_LIST_HEAD(&reaplist);
1141
1142         spin_lock(&clp->cl_lock);
1143         unhash_openowner_locked(oo);
1144         while (!list_empty(&oo->oo_owner.so_stateids)) {
1145                 stp = list_first_entry(&oo->oo_owner.so_stateids,
1146                                 struct nfs4_ol_stateid, st_perstateowner);
1147                 unhash_open_stateid(stp, &reaplist);
1148                 put_ol_stateid_locked(stp, &reaplist);
1149         }
1150         spin_unlock(&clp->cl_lock);
1151         free_ol_stateid_reaplist(&reaplist);
1152         release_last_closed_stateid(oo);
1153         nfs4_put_stateowner(&oo->oo_owner);
1154 }
1155
1156 static inline int
1157 hash_sessionid(struct nfs4_sessionid *sessionid)
1158 {
1159         struct nfsd4_sessionid *sid = (struct nfsd4_sessionid *)sessionid;
1160
1161         return sid->sequence % SESSION_HASH_SIZE;
1162 }
1163
1164 #ifdef NFSD_DEBUG
1165 static inline void
1166 dump_sessionid(const char *fn, struct nfs4_sessionid *sessionid)
1167 {
1168         u32 *ptr = (u32 *)(&sessionid->data[0]);
1169         dprintk("%s: %u:%u:%u:%u\n", fn, ptr[0], ptr[1], ptr[2], ptr[3]);
1170 }
1171 #else
1172 static inline void
1173 dump_sessionid(const char *fn, struct nfs4_sessionid *sessionid)
1174 {
1175 }
1176 #endif
1177
1178 /*
1179  * Bump the seqid on cstate->replay_owner, and clear replay_owner if it
1180  * won't be used for replay.
1181  */
1182 void nfsd4_bump_seqid(struct nfsd4_compound_state *cstate, __be32 nfserr)
1183 {
1184         struct nfs4_stateowner *so = cstate->replay_owner;
1185
1186         if (nfserr == nfserr_replay_me)
1187                 return;
1188
1189         if (!seqid_mutating_err(ntohl(nfserr))) {
1190                 nfsd4_cstate_clear_replay(cstate);
1191                 return;
1192         }
1193         if (!so)
1194                 return;
1195         if (so->so_is_open_owner)
1196                 release_last_closed_stateid(openowner(so));
1197         so->so_seqid++;
1198         return;
1199 }
1200
1201 static void
1202 gen_sessionid(struct nfsd4_session *ses)
1203 {
1204         struct nfs4_client *clp = ses->se_client;
1205         struct nfsd4_sessionid *sid;
1206
1207         sid = (struct nfsd4_sessionid *)ses->se_sessionid.data;
1208         sid->clientid = clp->cl_clientid;
1209         sid->sequence = current_sessionid++;
1210         sid->reserved = 0;
1211 }
1212
1213 /*
1214  * The protocol defines ca_maxresponssize_cached to include the size of
1215  * the rpc header, but all we need to cache is the data starting after
1216  * the end of the initial SEQUENCE operation--the rest we regenerate
1217  * each time.  Therefore we can advertise a ca_maxresponssize_cached
1218  * value that is the number of bytes in our cache plus a few additional
1219  * bytes.  In order to stay on the safe side, and not promise more than
1220  * we can cache, those additional bytes must be the minimum possible: 24
1221  * bytes of rpc header (xid through accept state, with AUTH_NULL
1222  * verifier), 12 for the compound header (with zero-length tag), and 44
1223  * for the SEQUENCE op response:
1224  */
1225 #define NFSD_MIN_HDR_SEQ_SZ  (24 + 12 + 44)
1226
1227 static void
1228 free_session_slots(struct nfsd4_session *ses)
1229 {
1230         int i;
1231
1232         for (i = 0; i < ses->se_fchannel.maxreqs; i++)
1233                 kfree(ses->se_slots[i]);
1234 }
1235
1236 /*
1237  * We don't actually need to cache the rpc and session headers, so we
1238  * can allocate a little less for each slot:
1239  */
1240 static inline u32 slot_bytes(struct nfsd4_channel_attrs *ca)
1241 {
1242         u32 size;
1243
1244         if (ca->maxresp_cached < NFSD_MIN_HDR_SEQ_SZ)
1245                 size = 0;
1246         else
1247                 size = ca->maxresp_cached - NFSD_MIN_HDR_SEQ_SZ;
1248         return size + sizeof(struct nfsd4_slot);
1249 }
1250
1251 /*
1252  * XXX: If we run out of reserved DRC memory we could (up to a point)
1253  * re-negotiate active sessions and reduce their slot usage to make
1254  * room for new connections. For now we just fail the create session.
1255  */
1256 static u32 nfsd4_get_drc_mem(struct nfsd4_channel_attrs *ca)
1257 {
1258         u32 slotsize = slot_bytes(ca);
1259         u32 num = ca->maxreqs;
1260         int avail;
1261
1262         spin_lock(&nfsd_drc_lock);
1263         avail = min((unsigned long)NFSD_MAX_MEM_PER_SESSION,
1264                     nfsd_drc_max_mem - nfsd_drc_mem_used);
1265         num = min_t(int, num, avail / slotsize);
1266         nfsd_drc_mem_used += num * slotsize;
1267         spin_unlock(&nfsd_drc_lock);
1268
1269         return num;
1270 }
1271
1272 static void nfsd4_put_drc_mem(struct nfsd4_channel_attrs *ca)
1273 {
1274         int slotsize = slot_bytes(ca);
1275
1276         spin_lock(&nfsd_drc_lock);
1277         nfsd_drc_mem_used -= slotsize * ca->maxreqs;
1278         spin_unlock(&nfsd_drc_lock);
1279 }
1280
1281 static struct nfsd4_session *alloc_session(struct nfsd4_channel_attrs *fattrs,
1282                                            struct nfsd4_channel_attrs *battrs)
1283 {
1284         int numslots = fattrs->maxreqs;
1285         int slotsize = slot_bytes(fattrs);
1286         struct nfsd4_session *new;
1287         int mem, i;
1288
1289         BUILD_BUG_ON(NFSD_MAX_SLOTS_PER_SESSION * sizeof(struct nfsd4_slot *)
1290                         + sizeof(struct nfsd4_session) > PAGE_SIZE);
1291         mem = numslots * sizeof(struct nfsd4_slot *);
1292
1293         new = kzalloc(sizeof(*new) + mem, GFP_KERNEL);
1294         if (!new)
1295                 return NULL;
1296         /* allocate each struct nfsd4_slot and data cache in one piece */
1297         for (i = 0; i < numslots; i++) {
1298                 new->se_slots[i] = kzalloc(slotsize, GFP_KERNEL);
1299                 if (!new->se_slots[i])
1300                         goto out_free;
1301         }
1302
1303         memcpy(&new->se_fchannel, fattrs, sizeof(struct nfsd4_channel_attrs));
1304         memcpy(&new->se_bchannel, battrs, sizeof(struct nfsd4_channel_attrs));
1305
1306         return new;
1307 out_free:
1308         while (i--)
1309                 kfree(new->se_slots[i]);
1310         kfree(new);
1311         return NULL;
1312 }
1313
1314 static void free_conn(struct nfsd4_conn *c)
1315 {
1316         svc_xprt_put(c->cn_xprt);
1317         kfree(c);
1318 }
1319
1320 static void nfsd4_conn_lost(struct svc_xpt_user *u)
1321 {
1322         struct nfsd4_conn *c = container_of(u, struct nfsd4_conn, cn_xpt_user);
1323         struct nfs4_client *clp = c->cn_session->se_client;
1324
1325         spin_lock(&clp->cl_lock);
1326         if (!list_empty(&c->cn_persession)) {
1327                 list_del(&c->cn_persession);
1328                 free_conn(c);
1329         }
1330         nfsd4_probe_callback(clp);
1331         spin_unlock(&clp->cl_lock);
1332 }
1333
1334 static struct nfsd4_conn *alloc_conn(struct svc_rqst *rqstp, u32 flags)
1335 {
1336         struct nfsd4_conn *conn;
1337
1338         conn = kmalloc(sizeof(struct nfsd4_conn), GFP_KERNEL);
1339         if (!conn)
1340                 return NULL;
1341         svc_xprt_get(rqstp->rq_xprt);
1342         conn->cn_xprt = rqstp->rq_xprt;
1343         conn->cn_flags = flags;
1344         INIT_LIST_HEAD(&conn->cn_xpt_user.list);
1345         return conn;
1346 }
1347
1348 static void __nfsd4_hash_conn(struct nfsd4_conn *conn, struct nfsd4_session *ses)
1349 {
1350         conn->cn_session = ses;
1351         list_add(&conn->cn_persession, &ses->se_conns);
1352 }
1353
1354 static void nfsd4_hash_conn(struct nfsd4_conn *conn, struct nfsd4_session *ses)
1355 {
1356         struct nfs4_client *clp = ses->se_client;
1357
1358         spin_lock(&clp->cl_lock);
1359         __nfsd4_hash_conn(conn, ses);
1360         spin_unlock(&clp->cl_lock);
1361 }
1362
1363 static int nfsd4_register_conn(struct nfsd4_conn *conn)
1364 {
1365         conn->cn_xpt_user.callback = nfsd4_conn_lost;
1366         return register_xpt_user(conn->cn_xprt, &conn->cn_xpt_user);
1367 }
1368
1369 static void nfsd4_init_conn(struct svc_rqst *rqstp, struct nfsd4_conn *conn, struct nfsd4_session *ses)
1370 {
1371         int ret;
1372
1373         nfsd4_hash_conn(conn, ses);
1374         ret = nfsd4_register_conn(conn);
1375         if (ret)
1376                 /* oops; xprt is already down: */
1377                 nfsd4_conn_lost(&conn->cn_xpt_user);
1378         /* We may have gained or lost a callback channel: */
1379         nfsd4_probe_callback_sync(ses->se_client);
1380 }
1381
1382 static struct nfsd4_conn *alloc_conn_from_crses(struct svc_rqst *rqstp, struct nfsd4_create_session *cses)
1383 {
1384         u32 dir = NFS4_CDFC4_FORE;
1385
1386         if (cses->flags & SESSION4_BACK_CHAN)
1387                 dir |= NFS4_CDFC4_BACK;
1388         return alloc_conn(rqstp, dir);
1389 }
1390
1391 /* must be called under client_lock */
1392 static void nfsd4_del_conns(struct nfsd4_session *s)
1393 {
1394         struct nfs4_client *clp = s->se_client;
1395         struct nfsd4_conn *c;
1396
1397         spin_lock(&clp->cl_lock);
1398         while (!list_empty(&s->se_conns)) {
1399                 c = list_first_entry(&s->se_conns, struct nfsd4_conn, cn_persession);
1400                 list_del_init(&c->cn_persession);
1401                 spin_unlock(&clp->cl_lock);
1402
1403                 unregister_xpt_user(c->cn_xprt, &c->cn_xpt_user);
1404                 free_conn(c);
1405
1406                 spin_lock(&clp->cl_lock);
1407         }
1408         spin_unlock(&clp->cl_lock);
1409 }
1410
1411 static void __free_session(struct nfsd4_session *ses)
1412 {
1413         free_session_slots(ses);
1414         kfree(ses);
1415 }
1416
1417 static void free_session(struct nfsd4_session *ses)
1418 {
1419         struct nfsd_net *nn = net_generic(ses->se_client->net, nfsd_net_id);
1420
1421         lockdep_assert_held(&nn->client_lock);
1422         nfsd4_del_conns(ses);
1423         nfsd4_put_drc_mem(&ses->se_fchannel);
1424         __free_session(ses);
1425 }
1426
1427 static void init_session(struct svc_rqst *rqstp, struct nfsd4_session *new, struct nfs4_client *clp, struct nfsd4_create_session *cses)
1428 {
1429         int idx;
1430         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
1431
1432         new->se_client = clp;
1433         gen_sessionid(new);
1434
1435         INIT_LIST_HEAD(&new->se_conns);
1436
1437         new->se_cb_seq_nr = 1;
1438         new->se_flags = cses->flags;
1439         new->se_cb_prog = cses->callback_prog;
1440         new->se_cb_sec = cses->cb_sec;
1441         atomic_set(&new->se_ref, 0);
1442         idx = hash_sessionid(&new->se_sessionid);
1443         spin_lock(&nn->client_lock);
1444         list_add(&new->se_hash, &nn->sessionid_hashtbl[idx]);
1445         spin_lock(&clp->cl_lock);
1446         list_add(&new->se_perclnt, &clp->cl_sessions);
1447         spin_unlock(&clp->cl_lock);
1448         spin_unlock(&nn->client_lock);
1449
1450         if (cses->flags & SESSION4_BACK_CHAN) {
1451                 struct sockaddr *sa = svc_addr(rqstp);
1452                 /*
1453                  * This is a little silly; with sessions there's no real
1454                  * use for the callback address.  Use the peer address
1455                  * as a reasonable default for now, but consider fixing
1456                  * the rpc client not to require an address in the
1457                  * future:
1458                  */
1459                 rpc_copy_addr((struct sockaddr *)&clp->cl_cb_conn.cb_addr, sa);
1460                 clp->cl_cb_conn.cb_addrlen = svc_addr_len(sa);
1461         }
1462 }
1463
1464 /* caller must hold client_lock */
1465 static struct nfsd4_session *
1466 __find_in_sessionid_hashtbl(struct nfs4_sessionid *sessionid, struct net *net)
1467 {
1468         struct nfsd4_session *elem;
1469         int idx;
1470         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1471
1472         dump_sessionid(__func__, sessionid);
1473         idx = hash_sessionid(sessionid);
1474         /* Search in the appropriate list */
1475         list_for_each_entry(elem, &nn->sessionid_hashtbl[idx], se_hash) {
1476                 if (!memcmp(elem->se_sessionid.data, sessionid->data,
1477                             NFS4_MAX_SESSIONID_LEN)) {
1478                         return elem;
1479                 }
1480         }
1481
1482         dprintk("%s: session not found\n", __func__);
1483         return NULL;
1484 }
1485
1486 static struct nfsd4_session *
1487 find_in_sessionid_hashtbl(struct nfs4_sessionid *sessionid, struct net *net,
1488                 __be32 *ret)
1489 {
1490         struct nfsd4_session *session;
1491         __be32 status = nfserr_badsession;
1492
1493         session = __find_in_sessionid_hashtbl(sessionid, net);
1494         if (!session)
1495                 goto out;
1496         status = nfsd4_get_session_locked(session);
1497         if (status)
1498                 session = NULL;
1499 out:
1500         *ret = status;
1501         return session;
1502 }
1503
1504 /* caller must hold client_lock */
1505 static void
1506 unhash_session(struct nfsd4_session *ses)
1507 {
1508         list_del(&ses->se_hash);
1509         spin_lock(&ses->se_client->cl_lock);
1510         list_del(&ses->se_perclnt);
1511         spin_unlock(&ses->se_client->cl_lock);
1512 }
1513
1514 /* SETCLIENTID and SETCLIENTID_CONFIRM Helper functions */
1515 static int
1516 STALE_CLIENTID(clientid_t *clid, struct nfsd_net *nn)
1517 {
1518         if (clid->cl_boot == nn->boot_time)
1519                 return 0;
1520         dprintk("NFSD stale clientid (%08x/%08x) boot_time %08lx\n",
1521                 clid->cl_boot, clid->cl_id, nn->boot_time);
1522         return 1;
1523 }
1524
1525 /* 
1526  * XXX Should we use a slab cache ?
1527  * This type of memory management is somewhat inefficient, but we use it
1528  * anyway since SETCLIENTID is not a common operation.
1529  */
1530 static struct nfs4_client *alloc_client(struct xdr_netobj name)
1531 {
1532         struct nfs4_client *clp;
1533         int i;
1534
1535         clp = kzalloc(sizeof(struct nfs4_client), GFP_KERNEL);
1536         if (clp == NULL)
1537                 return NULL;
1538         clp->cl_name.data = kmemdup(name.data, name.len, GFP_KERNEL);
1539         if (clp->cl_name.data == NULL)
1540                 goto err_no_name;
1541         clp->cl_ownerstr_hashtbl = kmalloc(sizeof(struct list_head) *
1542                         OWNER_HASH_SIZE, GFP_KERNEL);
1543         if (!clp->cl_ownerstr_hashtbl)
1544                 goto err_no_hashtbl;
1545         for (i = 0; i < OWNER_HASH_SIZE; i++)
1546                 INIT_LIST_HEAD(&clp->cl_ownerstr_hashtbl[i]);
1547         clp->cl_name.len = name.len;
1548         INIT_LIST_HEAD(&clp->cl_sessions);
1549         idr_init(&clp->cl_stateids);
1550         atomic_set(&clp->cl_refcount, 0);
1551         clp->cl_cb_state = NFSD4_CB_UNKNOWN;
1552         INIT_LIST_HEAD(&clp->cl_idhash);
1553         INIT_LIST_HEAD(&clp->cl_openowners);
1554         INIT_LIST_HEAD(&clp->cl_delegations);
1555         INIT_LIST_HEAD(&clp->cl_lru);
1556         INIT_LIST_HEAD(&clp->cl_callbacks);
1557         INIT_LIST_HEAD(&clp->cl_revoked);
1558         spin_lock_init(&clp->cl_lock);
1559         rpc_init_wait_queue(&clp->cl_cb_waitq, "Backchannel slot table");
1560         return clp;
1561 err_no_hashtbl:
1562         kfree(clp->cl_name.data);
1563 err_no_name:
1564         kfree(clp);
1565         return NULL;
1566 }
1567
1568 static void
1569 free_client(struct nfs4_client *clp)
1570 {
1571         struct nfsd_net __maybe_unused *nn = net_generic(clp->net, nfsd_net_id);
1572
1573         lockdep_assert_held(&nn->client_lock);
1574         while (!list_empty(&clp->cl_sessions)) {
1575                 struct nfsd4_session *ses;
1576                 ses = list_entry(clp->cl_sessions.next, struct nfsd4_session,
1577                                 se_perclnt);
1578                 list_del(&ses->se_perclnt);
1579                 WARN_ON_ONCE(atomic_read(&ses->se_ref));
1580                 free_session(ses);
1581         }
1582         rpc_destroy_wait_queue(&clp->cl_cb_waitq);
1583         free_svc_cred(&clp->cl_cred);
1584         kfree(clp->cl_ownerstr_hashtbl);
1585         kfree(clp->cl_name.data);
1586         idr_destroy(&clp->cl_stateids);
1587         kfree(clp);
1588 }
1589
1590 /* must be called under the client_lock */
1591 static inline void
1592 unhash_client_locked(struct nfs4_client *clp)
1593 {
1594         struct nfsd4_session *ses;
1595
1596         list_del(&clp->cl_lru);
1597         spin_lock(&clp->cl_lock);
1598         list_for_each_entry(ses, &clp->cl_sessions, se_perclnt)
1599                 list_del_init(&ses->se_hash);
1600         spin_unlock(&clp->cl_lock);
1601 }
1602
1603 static void
1604 destroy_client(struct nfs4_client *clp)
1605 {
1606         struct nfs4_openowner *oo;
1607         struct nfs4_delegation *dp;
1608         struct list_head reaplist;
1609         struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1610
1611         INIT_LIST_HEAD(&reaplist);
1612         spin_lock(&state_lock);
1613         while (!list_empty(&clp->cl_delegations)) {
1614                 dp = list_entry(clp->cl_delegations.next, struct nfs4_delegation, dl_perclnt);
1615                 unhash_delegation_locked(dp);
1616                 list_add(&dp->dl_recall_lru, &reaplist);
1617         }
1618         spin_unlock(&state_lock);
1619         while (!list_empty(&reaplist)) {
1620                 dp = list_entry(reaplist.next, struct nfs4_delegation, dl_recall_lru);
1621                 list_del_init(&dp->dl_recall_lru);
1622                 nfs4_put_stid(&dp->dl_stid);
1623         }
1624         while (!list_empty(&clp->cl_revoked)) {
1625                 dp = list_entry(reaplist.next, struct nfs4_delegation, dl_recall_lru);
1626                 list_del_init(&dp->dl_recall_lru);
1627                 nfs4_put_stid(&dp->dl_stid);
1628         }
1629         while (!list_empty(&clp->cl_openowners)) {
1630                 oo = list_entry(clp->cl_openowners.next, struct nfs4_openowner, oo_perclient);
1631                 atomic_inc(&oo->oo_owner.so_count);
1632                 release_openowner(oo);
1633         }
1634         nfsd4_shutdown_callback(clp);
1635         if (clp->cl_cb_conn.cb_xprt)
1636                 svc_xprt_put(clp->cl_cb_conn.cb_xprt);
1637         list_del(&clp->cl_idhash);
1638         if (test_bit(NFSD4_CLIENT_CONFIRMED, &clp->cl_flags))
1639                 rb_erase(&clp->cl_namenode, &nn->conf_name_tree);
1640         else
1641                 rb_erase(&clp->cl_namenode, &nn->unconf_name_tree);
1642         spin_lock(&nn->client_lock);
1643         unhash_client_locked(clp);
1644         WARN_ON_ONCE(atomic_read(&clp->cl_refcount));
1645         free_client(clp);
1646         spin_unlock(&nn->client_lock);
1647 }
1648
1649 static void expire_client(struct nfs4_client *clp)
1650 {
1651         nfsd4_client_record_remove(clp);
1652         destroy_client(clp);
1653 }
1654
1655 static void copy_verf(struct nfs4_client *target, nfs4_verifier *source)
1656 {
1657         memcpy(target->cl_verifier.data, source->data,
1658                         sizeof(target->cl_verifier.data));
1659 }
1660
1661 static void copy_clid(struct nfs4_client *target, struct nfs4_client *source)
1662 {
1663         target->cl_clientid.cl_boot = source->cl_clientid.cl_boot; 
1664         target->cl_clientid.cl_id = source->cl_clientid.cl_id; 
1665 }
1666
1667 static int copy_cred(struct svc_cred *target, struct svc_cred *source)
1668 {
1669         if (source->cr_principal) {
1670                 target->cr_principal =
1671                                 kstrdup(source->cr_principal, GFP_KERNEL);
1672                 if (target->cr_principal == NULL)
1673                         return -ENOMEM;
1674         } else
1675                 target->cr_principal = NULL;
1676         target->cr_flavor = source->cr_flavor;
1677         target->cr_uid = source->cr_uid;
1678         target->cr_gid = source->cr_gid;
1679         target->cr_group_info = source->cr_group_info;
1680         get_group_info(target->cr_group_info);
1681         target->cr_gss_mech = source->cr_gss_mech;
1682         if (source->cr_gss_mech)
1683                 gss_mech_get(source->cr_gss_mech);
1684         return 0;
1685 }
1686
1687 static long long
1688 compare_blob(const struct xdr_netobj *o1, const struct xdr_netobj *o2)
1689 {
1690         long long res;
1691
1692         res = o1->len - o2->len;
1693         if (res)
1694                 return res;
1695         return (long long)memcmp(o1->data, o2->data, o1->len);
1696 }
1697
1698 static int same_name(const char *n1, const char *n2)
1699 {
1700         return 0 == memcmp(n1, n2, HEXDIR_LEN);
1701 }
1702
1703 static int
1704 same_verf(nfs4_verifier *v1, nfs4_verifier *v2)
1705 {
1706         return 0 == memcmp(v1->data, v2->data, sizeof(v1->data));
1707 }
1708
1709 static int
1710 same_clid(clientid_t *cl1, clientid_t *cl2)
1711 {
1712         return (cl1->cl_boot == cl2->cl_boot) && (cl1->cl_id == cl2->cl_id);
1713 }
1714
1715 static bool groups_equal(struct group_info *g1, struct group_info *g2)
1716 {
1717         int i;
1718
1719         if (g1->ngroups != g2->ngroups)
1720                 return false;
1721         for (i=0; i<g1->ngroups; i++)
1722                 if (!gid_eq(GROUP_AT(g1, i), GROUP_AT(g2, i)))
1723                         return false;
1724         return true;
1725 }
1726
1727 /*
1728  * RFC 3530 language requires clid_inuse be returned when the
1729  * "principal" associated with a requests differs from that previously
1730  * used.  We use uid, gid's, and gss principal string as our best
1731  * approximation.  We also don't want to allow non-gss use of a client
1732  * established using gss: in theory cr_principal should catch that
1733  * change, but in practice cr_principal can be null even in the gss case
1734  * since gssd doesn't always pass down a principal string.
1735  */
1736 static bool is_gss_cred(struct svc_cred *cr)
1737 {
1738         /* Is cr_flavor one of the gss "pseudoflavors"?: */
1739         return (cr->cr_flavor > RPC_AUTH_MAXFLAVOR);
1740 }
1741
1742
1743 static bool
1744 same_creds(struct svc_cred *cr1, struct svc_cred *cr2)
1745 {
1746         if ((is_gss_cred(cr1) != is_gss_cred(cr2))
1747                 || (!uid_eq(cr1->cr_uid, cr2->cr_uid))
1748                 || (!gid_eq(cr1->cr_gid, cr2->cr_gid))
1749                 || !groups_equal(cr1->cr_group_info, cr2->cr_group_info))
1750                 return false;
1751         if (cr1->cr_principal == cr2->cr_principal)
1752                 return true;
1753         if (!cr1->cr_principal || !cr2->cr_principal)
1754                 return false;
1755         return 0 == strcmp(cr1->cr_principal, cr2->cr_principal);
1756 }
1757
1758 static bool svc_rqst_integrity_protected(struct svc_rqst *rqstp)
1759 {
1760         struct svc_cred *cr = &rqstp->rq_cred;
1761         u32 service;
1762
1763         if (!cr->cr_gss_mech)
1764                 return false;
1765         service = gss_pseudoflavor_to_service(cr->cr_gss_mech, cr->cr_flavor);
1766         return service == RPC_GSS_SVC_INTEGRITY ||
1767                service == RPC_GSS_SVC_PRIVACY;
1768 }
1769
1770 static bool mach_creds_match(struct nfs4_client *cl, struct svc_rqst *rqstp)
1771 {
1772         struct svc_cred *cr = &rqstp->rq_cred;
1773
1774         if (!cl->cl_mach_cred)
1775                 return true;
1776         if (cl->cl_cred.cr_gss_mech != cr->cr_gss_mech)
1777                 return false;
1778         if (!svc_rqst_integrity_protected(rqstp))
1779                 return false;
1780         if (!cr->cr_principal)
1781                 return false;
1782         return 0 == strcmp(cl->cl_cred.cr_principal, cr->cr_principal);
1783 }
1784
1785 static void gen_clid(struct nfs4_client *clp, struct nfsd_net *nn)
1786 {
1787         static u32 current_clientid = 1;
1788
1789         clp->cl_clientid.cl_boot = nn->boot_time;
1790         clp->cl_clientid.cl_id = current_clientid++; 
1791 }
1792
1793 static void gen_confirm(struct nfs4_client *clp)
1794 {
1795         __be32 verf[2];
1796         static u32 i;
1797
1798         /*
1799          * This is opaque to client, so no need to byte-swap. Use
1800          * __force to keep sparse happy
1801          */
1802         verf[0] = (__force __be32)get_seconds();
1803         verf[1] = (__force __be32)i++;
1804         memcpy(clp->cl_confirm.data, verf, sizeof(clp->cl_confirm.data));
1805 }
1806
1807 static struct nfs4_stid *
1808 find_stateid_locked(struct nfs4_client *cl, stateid_t *t)
1809 {
1810         struct nfs4_stid *ret;
1811
1812         ret = idr_find(&cl->cl_stateids, t->si_opaque.so_id);
1813         if (!ret || !ret->sc_type)
1814                 return NULL;
1815         return ret;
1816 }
1817
1818 static struct nfs4_stid *
1819 find_stateid_by_type(struct nfs4_client *cl, stateid_t *t, char typemask)
1820 {
1821         struct nfs4_stid *s;
1822
1823         spin_lock(&cl->cl_lock);
1824         s = find_stateid_locked(cl, t);
1825         if (s != NULL) {
1826                 if (typemask & s->sc_type)
1827                         atomic_inc(&s->sc_count);
1828                 else
1829                         s = NULL;
1830         }
1831         spin_unlock(&cl->cl_lock);
1832         return s;
1833 }
1834
1835 static struct nfs4_client *create_client(struct xdr_netobj name,
1836                 struct svc_rqst *rqstp, nfs4_verifier *verf)
1837 {
1838         struct nfs4_client *clp;
1839         struct sockaddr *sa = svc_addr(rqstp);
1840         int ret;
1841         struct net *net = SVC_NET(rqstp);
1842         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1843
1844         clp = alloc_client(name);
1845         if (clp == NULL)
1846                 return NULL;
1847
1848         ret = copy_cred(&clp->cl_cred, &rqstp->rq_cred);
1849         if (ret) {
1850                 spin_lock(&nn->client_lock);
1851                 free_client(clp);
1852                 spin_unlock(&nn->client_lock);
1853                 return NULL;
1854         }
1855         INIT_WORK(&clp->cl_cb_null.cb_work, nfsd4_run_cb_null);
1856         clp->cl_time = get_seconds();
1857         clear_bit(0, &clp->cl_cb_slot_busy);
1858         copy_verf(clp, verf);
1859         rpc_copy_addr((struct sockaddr *) &clp->cl_addr, sa);
1860         gen_confirm(clp);
1861         clp->cl_cb_session = NULL;
1862         clp->net = net;
1863         return clp;
1864 }
1865
1866 static void
1867 add_clp_to_name_tree(struct nfs4_client *new_clp, struct rb_root *root)
1868 {
1869         struct rb_node **new = &(root->rb_node), *parent = NULL;
1870         struct nfs4_client *clp;
1871
1872         while (*new) {
1873                 clp = rb_entry(*new, struct nfs4_client, cl_namenode);
1874                 parent = *new;
1875
1876                 if (compare_blob(&clp->cl_name, &new_clp->cl_name) > 0)
1877                         new = &((*new)->rb_left);
1878                 else
1879                         new = &((*new)->rb_right);
1880         }
1881
1882         rb_link_node(&new_clp->cl_namenode, parent, new);
1883         rb_insert_color(&new_clp->cl_namenode, root);
1884 }
1885
1886 static struct nfs4_client *
1887 find_clp_in_name_tree(struct xdr_netobj *name, struct rb_root *root)
1888 {
1889         long long cmp;
1890         struct rb_node *node = root->rb_node;
1891         struct nfs4_client *clp;
1892
1893         while (node) {
1894                 clp = rb_entry(node, struct nfs4_client, cl_namenode);
1895                 cmp = compare_blob(&clp->cl_name, name);
1896                 if (cmp > 0)
1897                         node = node->rb_left;
1898                 else if (cmp < 0)
1899                         node = node->rb_right;
1900                 else
1901                         return clp;
1902         }
1903         return NULL;
1904 }
1905
1906 static void
1907 add_to_unconfirmed(struct nfs4_client *clp)
1908 {
1909         unsigned int idhashval;
1910         struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1911
1912         clear_bit(NFSD4_CLIENT_CONFIRMED, &clp->cl_flags);
1913         add_clp_to_name_tree(clp, &nn->unconf_name_tree);
1914         idhashval = clientid_hashval(clp->cl_clientid.cl_id);
1915         list_add(&clp->cl_idhash, &nn->unconf_id_hashtbl[idhashval]);
1916         renew_client(clp);
1917 }
1918
1919 static void
1920 move_to_confirmed(struct nfs4_client *clp)
1921 {
1922         unsigned int idhashval = clientid_hashval(clp->cl_clientid.cl_id);
1923         struct nfsd_net *nn = net_generic(clp->net, nfsd_net_id);
1924
1925         dprintk("NFSD: move_to_confirm nfs4_client %p\n", clp);
1926         list_move(&clp->cl_idhash, &nn->conf_id_hashtbl[idhashval]);
1927         rb_erase(&clp->cl_namenode, &nn->unconf_name_tree);
1928         add_clp_to_name_tree(clp, &nn->conf_name_tree);
1929         set_bit(NFSD4_CLIENT_CONFIRMED, &clp->cl_flags);
1930         renew_client(clp);
1931 }
1932
1933 static struct nfs4_client *
1934 find_client_in_id_table(struct list_head *tbl, clientid_t *clid, bool sessions)
1935 {
1936         struct nfs4_client *clp;
1937         unsigned int idhashval = clientid_hashval(clid->cl_id);
1938
1939         list_for_each_entry(clp, &tbl[idhashval], cl_idhash) {
1940                 if (same_clid(&clp->cl_clientid, clid)) {
1941                         if ((bool)clp->cl_minorversion != sessions)
1942                                 return NULL;
1943                         renew_client(clp);
1944                         return clp;
1945                 }
1946         }
1947         return NULL;
1948 }
1949
1950 static struct nfs4_client *
1951 find_confirmed_client(clientid_t *clid, bool sessions, struct nfsd_net *nn)
1952 {
1953         struct list_head *tbl = nn->conf_id_hashtbl;
1954
1955         return find_client_in_id_table(tbl, clid, sessions);
1956 }
1957
1958 static struct nfs4_client *
1959 find_unconfirmed_client(clientid_t *clid, bool sessions, struct nfsd_net *nn)
1960 {
1961         struct list_head *tbl = nn->unconf_id_hashtbl;
1962
1963         return find_client_in_id_table(tbl, clid, sessions);
1964 }
1965
1966 static bool clp_used_exchangeid(struct nfs4_client *clp)
1967 {
1968         return clp->cl_exchange_flags != 0;
1969
1970
1971 static struct nfs4_client *
1972 find_confirmed_client_by_name(struct xdr_netobj *name, struct nfsd_net *nn)
1973 {
1974         return find_clp_in_name_tree(name, &nn->conf_name_tree);
1975 }
1976
1977 static struct nfs4_client *
1978 find_unconfirmed_client_by_name(struct xdr_netobj *name, struct nfsd_net *nn)
1979 {
1980         return find_clp_in_name_tree(name, &nn->unconf_name_tree);
1981 }
1982
1983 static void
1984 gen_callback(struct nfs4_client *clp, struct nfsd4_setclientid *se, struct svc_rqst *rqstp)
1985 {
1986         struct nfs4_cb_conn *conn = &clp->cl_cb_conn;
1987         struct sockaddr *sa = svc_addr(rqstp);
1988         u32 scopeid = rpc_get_scope_id(sa);
1989         unsigned short expected_family;
1990
1991         /* Currently, we only support tcp and tcp6 for the callback channel */
1992         if (se->se_callback_netid_len == 3 &&
1993             !memcmp(se->se_callback_netid_val, "tcp", 3))
1994                 expected_family = AF_INET;
1995         else if (se->se_callback_netid_len == 4 &&
1996                  !memcmp(se->se_callback_netid_val, "tcp6", 4))
1997                 expected_family = AF_INET6;
1998         else
1999                 goto out_err;
2000
2001         conn->cb_addrlen = rpc_uaddr2sockaddr(clp->net, se->se_callback_addr_val,
2002                                             se->se_callback_addr_len,
2003                                             (struct sockaddr *)&conn->cb_addr,
2004                                             sizeof(conn->cb_addr));
2005
2006         if (!conn->cb_addrlen || conn->cb_addr.ss_family != expected_family)
2007                 goto out_err;
2008
2009         if (conn->cb_addr.ss_family == AF_INET6)
2010                 ((struct sockaddr_in6 *)&conn->cb_addr)->sin6_scope_id = scopeid;
2011
2012         conn->cb_prog = se->se_callback_prog;
2013         conn->cb_ident = se->se_callback_ident;
2014         memcpy(&conn->cb_saddr, &rqstp->rq_daddr, rqstp->rq_daddrlen);
2015         return;
2016 out_err:
2017         conn->cb_addr.ss_family = AF_UNSPEC;
2018         conn->cb_addrlen = 0;
2019         dprintk(KERN_INFO "NFSD: this client (clientid %08x/%08x) "
2020                 "will not receive delegations\n",
2021                 clp->cl_clientid.cl_boot, clp->cl_clientid.cl_id);
2022
2023         return;
2024 }
2025
2026 /*
2027  * Cache a reply. nfsd4_check_resp_size() has bounded the cache size.
2028  */
2029 static void
2030 nfsd4_store_cache_entry(struct nfsd4_compoundres *resp)
2031 {
2032         struct xdr_buf *buf = resp->xdr.buf;
2033         struct nfsd4_slot *slot = resp->cstate.slot;
2034         unsigned int base;
2035
2036         dprintk("--> %s slot %p\n", __func__, slot);
2037
2038         slot->sl_opcnt = resp->opcnt;
2039         slot->sl_status = resp->cstate.status;
2040
2041         slot->sl_flags |= NFSD4_SLOT_INITIALIZED;
2042         if (nfsd4_not_cached(resp)) {
2043                 slot->sl_datalen = 0;
2044                 return;
2045         }
2046         base = resp->cstate.data_offset;
2047         slot->sl_datalen = buf->len - base;
2048         if (read_bytes_from_xdr_buf(buf, base, slot->sl_data, slot->sl_datalen))
2049                 WARN("%s: sessions DRC could not cache compound\n", __func__);
2050         return;
2051 }
2052
2053 /*
2054  * Encode the replay sequence operation from the slot values.
2055  * If cachethis is FALSE encode the uncached rep error on the next
2056  * operation which sets resp->p and increments resp->opcnt for
2057  * nfs4svc_encode_compoundres.
2058  *
2059  */
2060 static __be32
2061 nfsd4_enc_sequence_replay(struct nfsd4_compoundargs *args,
2062                           struct nfsd4_compoundres *resp)
2063 {
2064         struct nfsd4_op *op;
2065         struct nfsd4_slot *slot = resp->cstate.slot;
2066
2067         /* Encode the replayed sequence operation */
2068         op = &args->ops[resp->opcnt - 1];
2069         nfsd4_encode_operation(resp, op);
2070
2071         /* Return nfserr_retry_uncached_rep in next operation. */
2072         if (args->opcnt > 1 && !(slot->sl_flags & NFSD4_SLOT_CACHETHIS)) {
2073                 op = &args->ops[resp->opcnt++];
2074                 op->status = nfserr_retry_uncached_rep;
2075                 nfsd4_encode_operation(resp, op);
2076         }
2077         return op->status;
2078 }
2079
2080 /*
2081  * The sequence operation is not cached because we can use the slot and
2082  * session values.
2083  */
2084 static __be32
2085 nfsd4_replay_cache_entry(struct nfsd4_compoundres *resp,
2086                          struct nfsd4_sequence *seq)
2087 {
2088         struct nfsd4_slot *slot = resp->cstate.slot;
2089         struct xdr_stream *xdr = &resp->xdr;
2090         __be32 *p;
2091         __be32 status;
2092
2093         dprintk("--> %s slot %p\n", __func__, slot);
2094
2095         status = nfsd4_enc_sequence_replay(resp->rqstp->rq_argp, resp);
2096         if (status)
2097                 return status;
2098
2099         p = xdr_reserve_space(xdr, slot->sl_datalen);
2100         if (!p) {
2101                 WARN_ON_ONCE(1);
2102                 return nfserr_serverfault;
2103         }
2104         xdr_encode_opaque_fixed(p, slot->sl_data, slot->sl_datalen);
2105         xdr_commit_encode(xdr);
2106
2107         resp->opcnt = slot->sl_opcnt;
2108         return slot->sl_status;
2109 }
2110
2111 /*
2112  * Set the exchange_id flags returned by the server.
2113  */
2114 static void
2115 nfsd4_set_ex_flags(struct nfs4_client *new, struct nfsd4_exchange_id *clid)
2116 {
2117         /* pNFS is not supported */
2118         new->cl_exchange_flags |= EXCHGID4_FLAG_USE_NON_PNFS;
2119
2120         /* Referrals are supported, Migration is not. */
2121         new->cl_exchange_flags |= EXCHGID4_FLAG_SUPP_MOVED_REFER;
2122
2123         /* set the wire flags to return to client. */
2124         clid->flags = new->cl_exchange_flags;
2125 }
2126
2127 static bool client_has_state(struct nfs4_client *clp)
2128 {
2129         /*
2130          * Note clp->cl_openowners check isn't quite right: there's no
2131          * need to count owners without stateid's.
2132          *
2133          * Also note we should probably be using this in 4.0 case too.
2134          */
2135         return !list_empty(&clp->cl_openowners)
2136                 || !list_empty(&clp->cl_delegations)
2137                 || !list_empty(&clp->cl_sessions);
2138 }
2139
2140 __be32
2141 nfsd4_exchange_id(struct svc_rqst *rqstp,
2142                   struct nfsd4_compound_state *cstate,
2143                   struct nfsd4_exchange_id *exid)
2144 {
2145         struct nfs4_client *unconf, *conf, *new;
2146         __be32 status;
2147         char                    addr_str[INET6_ADDRSTRLEN];
2148         nfs4_verifier           verf = exid->verifier;
2149         struct sockaddr         *sa = svc_addr(rqstp);
2150         bool    update = exid->flags & EXCHGID4_FLAG_UPD_CONFIRMED_REC_A;
2151         struct nfsd_net         *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
2152
2153         rpc_ntop(sa, addr_str, sizeof(addr_str));
2154         dprintk("%s rqstp=%p exid=%p clname.len=%u clname.data=%p "
2155                 "ip_addr=%s flags %x, spa_how %d\n",
2156                 __func__, rqstp, exid, exid->clname.len, exid->clname.data,
2157                 addr_str, exid->flags, exid->spa_how);
2158
2159         if (exid->flags & ~EXCHGID4_FLAG_MASK_A)
2160                 return nfserr_inval;
2161
2162         switch (exid->spa_how) {
2163         case SP4_MACH_CRED:
2164                 if (!svc_rqst_integrity_protected(rqstp))
2165                         return nfserr_inval;
2166         case SP4_NONE:
2167                 break;
2168         default:                                /* checked by xdr code */
2169                 WARN_ON_ONCE(1);
2170         case SP4_SSV:
2171                 return nfserr_encr_alg_unsupp;
2172         }
2173
2174         /* Cases below refer to rfc 5661 section 18.35.4: */
2175         nfs4_lock_state();
2176         conf = find_confirmed_client_by_name(&exid->clname, nn);
2177         if (conf) {
2178                 bool creds_match = same_creds(&conf->cl_cred, &rqstp->rq_cred);
2179                 bool verfs_match = same_verf(&verf, &conf->cl_verifier);
2180
2181                 if (update) {
2182                         if (!clp_used_exchangeid(conf)) { /* buggy client */
2183                                 status = nfserr_inval;
2184                                 goto out;
2185                         }
2186                         if (!mach_creds_match(conf, rqstp)) {
2187                                 status = nfserr_wrong_cred;
2188                                 goto out;
2189                         }
2190                         if (!creds_match) { /* case 9 */
2191                                 status = nfserr_perm;
2192                                 goto out;
2193                         }
2194                         if (!verfs_match) { /* case 8 */
2195                                 status = nfserr_not_same;
2196                                 goto out;
2197                         }
2198                         /* case 6 */
2199                         exid->flags |= EXCHGID4_FLAG_CONFIRMED_R;
2200                         new = conf;
2201                         goto out_copy;
2202                 }
2203                 if (!creds_match) { /* case 3 */
2204                         if (client_has_state(conf)) {
2205                                 status = nfserr_clid_inuse;
2206                                 goto out;
2207                         }
2208                         expire_client(conf);
2209                         goto out_new;
2210                 }
2211                 if (verfs_match) { /* case 2 */
2212                         conf->cl_exchange_flags |= EXCHGID4_FLAG_CONFIRMED_R;
2213                         new = conf;
2214                         goto out_copy;
2215                 }
2216                 /* case 5, client reboot */
2217                 goto out_new;
2218         }
2219
2220         if (update) { /* case 7 */
2221                 status = nfserr_noent;
2222                 goto out;
2223         }
2224
2225         unconf  = find_unconfirmed_client_by_name(&exid->clname, nn);
2226         if (unconf) /* case 4, possible retry or client restart */
2227                 expire_client(unconf);
2228
2229         /* case 1 (normal case) */
2230 out_new:
2231         new = create_client(exid->clname, rqstp, &verf);
2232         if (new == NULL) {
2233                 status = nfserr_jukebox;
2234                 goto out;
2235         }
2236         new->cl_minorversion = cstate->minorversion;
2237         new->cl_mach_cred = (exid->spa_how == SP4_MACH_CRED);
2238
2239         gen_clid(new, nn);
2240         add_to_unconfirmed(new);
2241 out_copy:
2242         exid->clientid.cl_boot = new->cl_clientid.cl_boot;
2243         exid->clientid.cl_id = new->cl_clientid.cl_id;
2244
2245         exid->seqid = new->cl_cs_slot.sl_seqid + 1;
2246         nfsd4_set_ex_flags(new, exid);
2247
2248         dprintk("nfsd4_exchange_id seqid %d flags %x\n",
2249                 new->cl_cs_slot.sl_seqid, new->cl_exchange_flags);
2250         status = nfs_ok;
2251
2252 out:
2253         nfs4_unlock_state();
2254         return status;
2255 }
2256
2257 static __be32
2258 check_slot_seqid(u32 seqid, u32 slot_seqid, int slot_inuse)
2259 {
2260         dprintk("%s enter. seqid %d slot_seqid %d\n", __func__, seqid,
2261                 slot_seqid);
2262
2263         /* The slot is in use, and no response has been sent. */
2264         if (slot_inuse) {
2265                 if (seqid == slot_seqid)
2266                         return nfserr_jukebox;
2267                 else
2268                         return nfserr_seq_misordered;
2269         }
2270         /* Note unsigned 32-bit arithmetic handles wraparound: */
2271         if (likely(seqid == slot_seqid + 1))
2272                 return nfs_ok;
2273         if (seqid == slot_seqid)
2274                 return nfserr_replay_cache;
2275         return nfserr_seq_misordered;
2276 }
2277
2278 /*
2279  * Cache the create session result into the create session single DRC
2280  * slot cache by saving the xdr structure. sl_seqid has been set.
2281  * Do this for solo or embedded create session operations.
2282  */
2283 static void
2284 nfsd4_cache_create_session(struct nfsd4_create_session *cr_ses,
2285                            struct nfsd4_clid_slot *slot, __be32 nfserr)
2286 {
2287         slot->sl_status = nfserr;
2288         memcpy(&slot->sl_cr_ses, cr_ses, sizeof(*cr_ses));
2289 }
2290
2291 static __be32
2292 nfsd4_replay_create_session(struct nfsd4_create_session *cr_ses,
2293                             struct nfsd4_clid_slot *slot)
2294 {
2295         memcpy(cr_ses, &slot->sl_cr_ses, sizeof(*cr_ses));
2296         return slot->sl_status;
2297 }
2298
2299 #define NFSD_MIN_REQ_HDR_SEQ_SZ ((\
2300                         2 * 2 + /* credential,verifier: AUTH_NULL, length 0 */ \
2301                         1 +     /* MIN tag is length with zero, only length */ \
2302                         3 +     /* version, opcount, opcode */ \
2303                         XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + \
2304                                 /* seqid, slotID, slotID, cache */ \
2305                         4 ) * sizeof(__be32))
2306
2307 #define NFSD_MIN_RESP_HDR_SEQ_SZ ((\
2308                         2 +     /* verifier: AUTH_NULL, length 0 */\
2309                         1 +     /* status */ \
2310                         1 +     /* MIN tag is length with zero, only length */ \
2311                         3 +     /* opcount, opcode, opstatus*/ \
2312                         XDR_QUADLEN(NFS4_MAX_SESSIONID_LEN) + \
2313                                 /* seqid, slotID, slotID, slotID, status */ \
2314                         5 ) * sizeof(__be32))
2315
2316 static __be32 check_forechannel_attrs(struct nfsd4_channel_attrs *ca, struct nfsd_net *nn)
2317 {
2318         u32 maxrpc = nn->nfsd_serv->sv_max_mesg;
2319
2320         if (ca->maxreq_sz < NFSD_MIN_REQ_HDR_SEQ_SZ)
2321                 return nfserr_toosmall;
2322         if (ca->maxresp_sz < NFSD_MIN_RESP_HDR_SEQ_SZ)
2323                 return nfserr_toosmall;
2324         ca->headerpadsz = 0;
2325         ca->maxreq_sz = min_t(u32, ca->maxreq_sz, maxrpc);
2326         ca->maxresp_sz = min_t(u32, ca->maxresp_sz, maxrpc);
2327         ca->maxops = min_t(u32, ca->maxops, NFSD_MAX_OPS_PER_COMPOUND);
2328         ca->maxresp_cached = min_t(u32, ca->maxresp_cached,
2329                         NFSD_SLOT_CACHE_SIZE + NFSD_MIN_HDR_SEQ_SZ);
2330         ca->maxreqs = min_t(u32, ca->maxreqs, NFSD_MAX_SLOTS_PER_SESSION);
2331         /*
2332          * Note decreasing slot size below client's request may make it
2333          * difficult for client to function correctly, whereas
2334          * decreasing the number of slots will (just?) affect
2335          * performance.  When short on memory we therefore prefer to
2336          * decrease number of slots instead of their size.  Clients that
2337          * request larger slots than they need will get poor results:
2338          */
2339         ca->maxreqs = nfsd4_get_drc_mem(ca);
2340         if (!ca->maxreqs)
2341                 return nfserr_jukebox;
2342
2343         return nfs_ok;
2344 }
2345
2346 #define NFSD_CB_MAX_REQ_SZ      ((NFS4_enc_cb_recall_sz + \
2347                                  RPC_MAX_HEADER_WITH_AUTH) * sizeof(__be32))
2348 #define NFSD_CB_MAX_RESP_SZ     ((NFS4_dec_cb_recall_sz + \
2349                                  RPC_MAX_REPHEADER_WITH_AUTH) * sizeof(__be32))
2350
2351 static __be32 check_backchannel_attrs(struct nfsd4_channel_attrs *ca)
2352 {
2353         ca->headerpadsz = 0;
2354
2355         /*
2356          * These RPC_MAX_HEADER macros are overkill, especially since we
2357          * don't even do gss on the backchannel yet.  But this is still
2358          * less than 1k.  Tighten up this estimate in the unlikely event
2359          * it turns out to be a problem for some client:
2360          */
2361         if (ca->maxreq_sz < NFSD_CB_MAX_REQ_SZ)
2362                 return nfserr_toosmall;
2363         if (ca->maxresp_sz < NFSD_CB_MAX_RESP_SZ)
2364                 return nfserr_toosmall;
2365         ca->maxresp_cached = 0;
2366         if (ca->maxops < 2)
2367                 return nfserr_toosmall;
2368
2369         return nfs_ok;
2370 }
2371
2372 static __be32 nfsd4_check_cb_sec(struct nfsd4_cb_sec *cbs)
2373 {
2374         switch (cbs->flavor) {
2375         case RPC_AUTH_NULL:
2376         case RPC_AUTH_UNIX:
2377                 return nfs_ok;
2378         default:
2379                 /*
2380                  * GSS case: the spec doesn't allow us to return this
2381                  * error.  But it also doesn't allow us not to support
2382                  * GSS.
2383                  * I'd rather this fail hard than return some error the
2384                  * client might think it can already handle:
2385                  */
2386                 return nfserr_encr_alg_unsupp;
2387         }
2388 }
2389
2390 __be32
2391 nfsd4_create_session(struct svc_rqst *rqstp,
2392                      struct nfsd4_compound_state *cstate,
2393                      struct nfsd4_create_session *cr_ses)
2394 {
2395         struct sockaddr *sa = svc_addr(rqstp);
2396         struct nfs4_client *conf, *unconf;
2397         struct nfsd4_session *new;
2398         struct nfsd4_conn *conn;
2399         struct nfsd4_clid_slot *cs_slot = NULL;
2400         __be32 status = 0;
2401         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
2402
2403         if (cr_ses->flags & ~SESSION4_FLAG_MASK_A)
2404                 return nfserr_inval;
2405         status = nfsd4_check_cb_sec(&cr_ses->cb_sec);
2406         if (status)
2407                 return status;
2408         status = check_forechannel_attrs(&cr_ses->fore_channel, nn);
2409         if (status)
2410                 return status;
2411         status = check_backchannel_attrs(&cr_ses->back_channel);
2412         if (status)
2413                 goto out_release_drc_mem;
2414         status = nfserr_jukebox;
2415         new = alloc_session(&cr_ses->fore_channel, &cr_ses->back_channel);
2416         if (!new)
2417                 goto out_release_drc_mem;
2418         conn = alloc_conn_from_crses(rqstp, cr_ses);
2419         if (!conn)
2420                 goto out_free_session;
2421
2422         nfs4_lock_state();
2423         unconf = find_unconfirmed_client(&cr_ses->clientid, true, nn);
2424         conf = find_confirmed_client(&cr_ses->clientid, true, nn);
2425         WARN_ON_ONCE(conf && unconf);
2426
2427         if (conf) {
2428                 status = nfserr_wrong_cred;
2429                 if (!mach_creds_match(conf, rqstp))
2430                         goto out_free_conn;
2431                 cs_slot = &conf->cl_cs_slot;
2432                 status = check_slot_seqid(cr_ses->seqid, cs_slot->sl_seqid, 0);
2433                 if (status == nfserr_replay_cache) {
2434                         status = nfsd4_replay_create_session(cr_ses, cs_slot);
2435                         goto out_free_conn;
2436                 } else if (cr_ses->seqid != cs_slot->sl_seqid + 1) {
2437                         status = nfserr_seq_misordered;
2438                         goto out_free_conn;
2439                 }
2440         } else if (unconf) {
2441                 struct nfs4_client *old;
2442                 if (!same_creds(&unconf->cl_cred, &rqstp->rq_cred) ||
2443                     !rpc_cmp_addr(sa, (struct sockaddr *) &unconf->cl_addr)) {
2444                         status = nfserr_clid_inuse;
2445                         goto out_free_conn;
2446                 }
2447                 status = nfserr_wrong_cred;
2448                 if (!mach_creds_match(unconf, rqstp))
2449                         goto out_free_conn;
2450                 cs_slot = &unconf->cl_cs_slot;
2451                 status = check_slot_seqid(cr_ses->seqid, cs_slot->sl_seqid, 0);
2452                 if (status) {
2453                         /* an unconfirmed replay returns misordered */
2454                         status = nfserr_seq_misordered;
2455                         goto out_free_conn;
2456                 }
2457                 old = find_confirmed_client_by_name(&unconf->cl_name, nn);
2458                 if (old) {
2459                         status = mark_client_expired(old);
2460                         if (status)
2461                                 goto out_free_conn;
2462                         expire_client(old);
2463                 }
2464                 move_to_confirmed(unconf);
2465                 conf = unconf;
2466         } else {
2467                 status = nfserr_stale_clientid;
2468                 goto out_free_conn;
2469         }
2470         status = nfs_ok;
2471         /*
2472          * We do not support RDMA or persistent sessions
2473          */
2474         cr_ses->flags &= ~SESSION4_PERSIST;
2475         cr_ses->flags &= ~SESSION4_RDMA;
2476
2477         init_session(rqstp, new, conf, cr_ses);
2478         nfsd4_init_conn(rqstp, conn, new);
2479
2480         memcpy(cr_ses->sessionid.data, new->se_sessionid.data,
2481                NFS4_MAX_SESSIONID_LEN);
2482         cs_slot->sl_seqid++;
2483         cr_ses->seqid = cs_slot->sl_seqid;
2484
2485         /* cache solo and embedded create sessions under the state lock */
2486         nfsd4_cache_create_session(cr_ses, cs_slot, status);
2487         nfs4_unlock_state();
2488         return status;
2489 out_free_conn:
2490         nfs4_unlock_state();
2491         free_conn(conn);
2492 out_free_session:
2493         __free_session(new);
2494 out_release_drc_mem:
2495         nfsd4_put_drc_mem(&cr_ses->fore_channel);
2496         return status;
2497 }
2498
2499 static __be32 nfsd4_map_bcts_dir(u32 *dir)
2500 {
2501         switch (*dir) {
2502         case NFS4_CDFC4_FORE:
2503         case NFS4_CDFC4_BACK:
2504                 return nfs_ok;
2505         case NFS4_CDFC4_FORE_OR_BOTH:
2506         case NFS4_CDFC4_BACK_OR_BOTH:
2507                 *dir = NFS4_CDFC4_BOTH;
2508                 return nfs_ok;
2509         };
2510         return nfserr_inval;
2511 }
2512
2513 __be32 nfsd4_backchannel_ctl(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_backchannel_ctl *bc)
2514 {
2515         struct nfsd4_session *session = cstate->session;
2516         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
2517         __be32 status;
2518
2519         status = nfsd4_check_cb_sec(&bc->bc_cb_sec);
2520         if (status)
2521                 return status;
2522         spin_lock(&nn->client_lock);
2523         session->se_cb_prog = bc->bc_cb_program;
2524         session->se_cb_sec = bc->bc_cb_sec;
2525         spin_unlock(&nn->client_lock);
2526
2527         nfsd4_probe_callback(session->se_client);
2528
2529         return nfs_ok;
2530 }
2531
2532 __be32 nfsd4_bind_conn_to_session(struct svc_rqst *rqstp,
2533                      struct nfsd4_compound_state *cstate,
2534                      struct nfsd4_bind_conn_to_session *bcts)
2535 {
2536         __be32 status;
2537         struct nfsd4_conn *conn;
2538         struct nfsd4_session *session;
2539         struct net *net = SVC_NET(rqstp);
2540         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
2541
2542         if (!nfsd4_last_compound_op(rqstp))
2543                 return nfserr_not_only_op;
2544         nfs4_lock_state();
2545         spin_lock(&nn->client_lock);
2546         session = find_in_sessionid_hashtbl(&bcts->sessionid, net, &status);
2547         spin_unlock(&nn->client_lock);
2548         if (!session)
2549                 goto out_no_session;
2550         status = nfserr_wrong_cred;
2551         if (!mach_creds_match(session->se_client, rqstp))
2552                 goto out;
2553         status = nfsd4_map_bcts_dir(&bcts->dir);
2554         if (status)
2555                 goto out;
2556         conn = alloc_conn(rqstp, bcts->dir);
2557         status = nfserr_jukebox;
2558         if (!conn)
2559                 goto out;
2560         nfsd4_init_conn(rqstp, conn, session);
2561         status = nfs_ok;
2562 out:
2563         nfsd4_put_session(session);
2564 out_no_session:
2565         nfs4_unlock_state();
2566         return status;
2567 }
2568
2569 static bool nfsd4_compound_in_session(struct nfsd4_session *session, struct nfs4_sessionid *sid)
2570 {
2571         if (!session)
2572                 return 0;
2573         return !memcmp(sid, &session->se_sessionid, sizeof(*sid));
2574 }
2575
2576 __be32
2577 nfsd4_destroy_session(struct svc_rqst *r,
2578                       struct nfsd4_compound_state *cstate,
2579                       struct nfsd4_destroy_session *sessionid)
2580 {
2581         struct nfsd4_session *ses;
2582         __be32 status;
2583         int ref_held_by_me = 0;
2584         struct net *net = SVC_NET(r);
2585         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
2586
2587         nfs4_lock_state();
2588         status = nfserr_not_only_op;
2589         if (nfsd4_compound_in_session(cstate->session, &sessionid->sessionid)) {
2590                 if (!nfsd4_last_compound_op(r))
2591                         goto out;
2592                 ref_held_by_me++;
2593         }
2594         dump_sessionid(__func__, &sessionid->sessionid);
2595         spin_lock(&nn->client_lock);
2596         ses = find_in_sessionid_hashtbl(&sessionid->sessionid, net, &status);
2597         if (!ses)
2598                 goto out_client_lock;
2599         status = nfserr_wrong_cred;
2600         if (!mach_creds_match(ses->se_client, r))
2601                 goto out_put_session;
2602         status = mark_session_dead_locked(ses, 1 + ref_held_by_me);
2603         if (status)
2604                 goto out_put_session;
2605         unhash_session(ses);
2606         spin_unlock(&nn->client_lock);
2607
2608         nfsd4_probe_callback_sync(ses->se_client);
2609
2610         spin_lock(&nn->client_lock);
2611         status = nfs_ok;
2612 out_put_session:
2613         nfsd4_put_session_locked(ses);
2614 out_client_lock:
2615         spin_unlock(&nn->client_lock);
2616 out:
2617         nfs4_unlock_state();
2618         return status;
2619 }
2620
2621 static struct nfsd4_conn *__nfsd4_find_conn(struct svc_xprt *xpt, struct nfsd4_session *s)
2622 {
2623         struct nfsd4_conn *c;
2624
2625         list_for_each_entry(c, &s->se_conns, cn_persession) {
2626                 if (c->cn_xprt == xpt) {
2627                         return c;
2628                 }
2629         }
2630         return NULL;
2631 }
2632
2633 static __be32 nfsd4_sequence_check_conn(struct nfsd4_conn *new, struct nfsd4_session *ses)
2634 {
2635         struct nfs4_client *clp = ses->se_client;
2636         struct nfsd4_conn *c;
2637         __be32 status = nfs_ok;
2638         int ret;
2639
2640         spin_lock(&clp->cl_lock);
2641         c = __nfsd4_find_conn(new->cn_xprt, ses);
2642         if (c)
2643                 goto out_free;
2644         status = nfserr_conn_not_bound_to_session;
2645         if (clp->cl_mach_cred)
2646                 goto out_free;
2647         __nfsd4_hash_conn(new, ses);
2648         spin_unlock(&clp->cl_lock);
2649         ret = nfsd4_register_conn(new);
2650         if (ret)
2651                 /* oops; xprt is already down: */
2652                 nfsd4_conn_lost(&new->cn_xpt_user);
2653         return nfs_ok;
2654 out_free:
2655         spin_unlock(&clp->cl_lock);
2656         free_conn(new);
2657         return status;
2658 }
2659
2660 static bool nfsd4_session_too_many_ops(struct svc_rqst *rqstp, struct nfsd4_session *session)
2661 {
2662         struct nfsd4_compoundargs *args = rqstp->rq_argp;
2663
2664         return args->opcnt > session->se_fchannel.maxops;
2665 }
2666
2667 static bool nfsd4_request_too_big(struct svc_rqst *rqstp,
2668                                   struct nfsd4_session *session)
2669 {
2670         struct xdr_buf *xb = &rqstp->rq_arg;
2671
2672         return xb->len > session->se_fchannel.maxreq_sz;
2673 }
2674
2675 __be32
2676 nfsd4_sequence(struct svc_rqst *rqstp,
2677                struct nfsd4_compound_state *cstate,
2678                struct nfsd4_sequence *seq)
2679 {
2680         struct nfsd4_compoundres *resp = rqstp->rq_resp;
2681         struct xdr_stream *xdr = &resp->xdr;
2682         struct nfsd4_session *session;
2683         struct nfs4_client *clp;
2684         struct nfsd4_slot *slot;
2685         struct nfsd4_conn *conn;
2686         __be32 status;
2687         int buflen;
2688         struct net *net = SVC_NET(rqstp);
2689         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
2690
2691         if (resp->opcnt != 1)
2692                 return nfserr_sequence_pos;
2693
2694         /*
2695          * Will be either used or freed by nfsd4_sequence_check_conn
2696          * below.
2697          */
2698         conn = alloc_conn(rqstp, NFS4_CDFC4_FORE);
2699         if (!conn)
2700                 return nfserr_jukebox;
2701
2702         spin_lock(&nn->client_lock);
2703         session = find_in_sessionid_hashtbl(&seq->sessionid, net, &status);
2704         if (!session)
2705                 goto out_no_session;
2706         clp = session->se_client;
2707
2708         status = nfserr_too_many_ops;
2709         if (nfsd4_session_too_many_ops(rqstp, session))
2710                 goto out_put_session;
2711
2712         status = nfserr_req_too_big;
2713         if (nfsd4_request_too_big(rqstp, session))
2714                 goto out_put_session;
2715
2716         status = nfserr_badslot;
2717         if (seq->slotid >= session->se_fchannel.maxreqs)
2718                 goto out_put_session;
2719
2720         slot = session->se_slots[seq->slotid];
2721         dprintk("%s: slotid %d\n", __func__, seq->slotid);
2722
2723         /* We do not negotiate the number of slots yet, so set the
2724          * maxslots to the session maxreqs which is used to encode
2725          * sr_highest_slotid and the sr_target_slot id to maxslots */
2726         seq->maxslots = session->se_fchannel.maxreqs;
2727
2728         status = check_slot_seqid(seq->seqid, slot->sl_seqid,
2729                                         slot->sl_flags & NFSD4_SLOT_INUSE);
2730         if (status == nfserr_replay_cache) {
2731                 status = nfserr_seq_misordered;
2732                 if (!(slot->sl_flags & NFSD4_SLOT_INITIALIZED))
2733                         goto out_put_session;
2734                 cstate->slot = slot;
2735                 cstate->session = session;
2736                 cstate->clp = clp;
2737                 /* Return the cached reply status and set cstate->status
2738                  * for nfsd4_proc_compound processing */
2739                 status = nfsd4_replay_cache_entry(resp, seq);
2740                 cstate->status = nfserr_replay_cache;
2741                 goto out;
2742         }
2743         if (status)
2744                 goto out_put_session;
2745
2746         status = nfsd4_sequence_check_conn(conn, session);
2747         conn = NULL;
2748         if (status)
2749                 goto out_put_session;
2750
2751         buflen = (seq->cachethis) ?
2752                         session->se_fchannel.maxresp_cached :
2753                         session->se_fchannel.maxresp_sz;
2754         status = (seq->cachethis) ? nfserr_rep_too_big_to_cache :
2755                                     nfserr_rep_too_big;
2756         if (xdr_restrict_buflen(xdr, buflen - rqstp->rq_auth_slack))
2757                 goto out_put_session;
2758         svc_reserve(rqstp, buflen);
2759
2760         status = nfs_ok;
2761         /* Success! bump slot seqid */
2762         slot->sl_seqid = seq->seqid;
2763         slot->sl_flags |= NFSD4_SLOT_INUSE;
2764         if (seq->cachethis)
2765                 slot->sl_flags |= NFSD4_SLOT_CACHETHIS;
2766         else
2767                 slot->sl_flags &= ~NFSD4_SLOT_CACHETHIS;
2768
2769         cstate->slot = slot;
2770         cstate->session = session;
2771         cstate->clp = clp;
2772
2773 out:
2774         switch (clp->cl_cb_state) {
2775         case NFSD4_CB_DOWN:
2776                 seq->status_flags = SEQ4_STATUS_CB_PATH_DOWN;
2777                 break;
2778         case NFSD4_CB_FAULT:
2779                 seq->status_flags = SEQ4_STATUS_BACKCHANNEL_FAULT;
2780                 break;
2781         default:
2782                 seq->status_flags = 0;
2783         }
2784         if (!list_empty(&clp->cl_revoked))
2785                 seq->status_flags |= SEQ4_STATUS_RECALLABLE_STATE_REVOKED;
2786 out_no_session:
2787         if (conn)
2788                 free_conn(conn);
2789         spin_unlock(&nn->client_lock);
2790         return status;
2791 out_put_session:
2792         nfsd4_put_session_locked(session);
2793         goto out_no_session;
2794 }
2795
2796 void
2797 nfsd4_sequence_done(struct nfsd4_compoundres *resp)
2798 {
2799         struct nfsd4_compound_state *cs = &resp->cstate;
2800
2801         if (nfsd4_has_session(cs)) {
2802                 if (cs->status != nfserr_replay_cache) {
2803                         nfsd4_store_cache_entry(resp);
2804                         cs->slot->sl_flags &= ~NFSD4_SLOT_INUSE;
2805                 }
2806                 /* Drop session reference that was taken in nfsd4_sequence() */
2807                 nfsd4_put_session(cs->session);
2808         } else if (cs->clp)
2809                 put_client_renew(cs->clp);
2810 }
2811
2812 __be32
2813 nfsd4_destroy_clientid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_destroy_clientid *dc)
2814 {
2815         struct nfs4_client *conf, *unconf, *clp;
2816         __be32 status = 0;
2817         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
2818
2819         nfs4_lock_state();
2820         unconf = find_unconfirmed_client(&dc->clientid, true, nn);
2821         conf = find_confirmed_client(&dc->clientid, true, nn);
2822         WARN_ON_ONCE(conf && unconf);
2823
2824         if (conf) {
2825                 clp = conf;
2826
2827                 if (client_has_state(conf)) {
2828                         status = nfserr_clientid_busy;
2829                         goto out;
2830                 }
2831         } else if (unconf)
2832                 clp = unconf;
2833         else {
2834                 status = nfserr_stale_clientid;
2835                 goto out;
2836         }
2837         if (!mach_creds_match(clp, rqstp)) {
2838                 status = nfserr_wrong_cred;
2839                 goto out;
2840         }
2841         expire_client(clp);
2842 out:
2843         nfs4_unlock_state();
2844         return status;
2845 }
2846
2847 __be32
2848 nfsd4_reclaim_complete(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate, struct nfsd4_reclaim_complete *rc)
2849 {
2850         __be32 status = 0;
2851
2852         if (rc->rca_one_fs) {
2853                 if (!cstate->current_fh.fh_dentry)
2854                         return nfserr_nofilehandle;
2855                 /*
2856                  * We don't take advantage of the rca_one_fs case.
2857                  * That's OK, it's optional, we can safely ignore it.
2858                  */
2859                  return nfs_ok;
2860         }
2861
2862         nfs4_lock_state();
2863         status = nfserr_complete_already;
2864         if (test_and_set_bit(NFSD4_CLIENT_RECLAIM_COMPLETE,
2865                              &cstate->session->se_client->cl_flags))
2866                 goto out;
2867
2868         status = nfserr_stale_clientid;
2869         if (is_client_expired(cstate->session->se_client))
2870                 /*
2871                  * The following error isn't really legal.
2872                  * But we only get here if the client just explicitly
2873                  * destroyed the client.  Surely it no longer cares what
2874                  * error it gets back on an operation for the dead
2875                  * client.
2876                  */
2877                 goto out;
2878
2879         status = nfs_ok;
2880         nfsd4_client_record_create(cstate->session->se_client);
2881 out:
2882         nfs4_unlock_state();
2883         return status;
2884 }
2885
2886 __be32
2887 nfsd4_setclientid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
2888                   struct nfsd4_setclientid *setclid)
2889 {
2890         struct xdr_netobj       clname = setclid->se_name;
2891         nfs4_verifier           clverifier = setclid->se_verf;
2892         struct nfs4_client      *conf, *unconf, *new;
2893         __be32                  status;
2894         struct nfsd_net         *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
2895
2896         /* Cases below refer to rfc 3530 section 14.2.33: */
2897         nfs4_lock_state();
2898         conf = find_confirmed_client_by_name(&clname, nn);
2899         if (conf) {
2900                 /* case 0: */
2901                 status = nfserr_clid_inuse;
2902                 if (clp_used_exchangeid(conf))
2903                         goto out;
2904                 if (!same_creds(&conf->cl_cred, &rqstp->rq_cred)) {
2905                         char addr_str[INET6_ADDRSTRLEN];
2906                         rpc_ntop((struct sockaddr *) &conf->cl_addr, addr_str,
2907                                  sizeof(addr_str));
2908                         dprintk("NFSD: setclientid: string in use by client "
2909                                 "at %s\n", addr_str);
2910                         goto out;
2911                 }
2912         }
2913         unconf = find_unconfirmed_client_by_name(&clname, nn);
2914         if (unconf)
2915                 expire_client(unconf);
2916         status = nfserr_jukebox;
2917         new = create_client(clname, rqstp, &clverifier);
2918         if (new == NULL)
2919                 goto out;
2920         if (conf && same_verf(&conf->cl_verifier, &clverifier))
2921                 /* case 1: probable callback update */
2922                 copy_clid(new, conf);
2923         else /* case 4 (new client) or cases 2, 3 (client reboot): */
2924                 gen_clid(new, nn);
2925         new->cl_minorversion = 0;
2926         gen_callback(new, setclid, rqstp);
2927         add_to_unconfirmed(new);
2928         setclid->se_clientid.cl_boot = new->cl_clientid.cl_boot;
2929         setclid->se_clientid.cl_id = new->cl_clientid.cl_id;
2930         memcpy(setclid->se_confirm.data, new->cl_confirm.data, sizeof(setclid->se_confirm.data));
2931         status = nfs_ok;
2932 out:
2933         nfs4_unlock_state();
2934         return status;
2935 }
2936
2937
2938 __be32
2939 nfsd4_setclientid_confirm(struct svc_rqst *rqstp,
2940                          struct nfsd4_compound_state *cstate,
2941                          struct nfsd4_setclientid_confirm *setclientid_confirm)
2942 {
2943         struct nfs4_client *conf, *unconf;
2944         nfs4_verifier confirm = setclientid_confirm->sc_confirm; 
2945         clientid_t * clid = &setclientid_confirm->sc_clientid;
2946         __be32 status;
2947         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
2948
2949         if (STALE_CLIENTID(clid, nn))
2950                 return nfserr_stale_clientid;
2951         nfs4_lock_state();
2952
2953         conf = find_confirmed_client(clid, false, nn);
2954         unconf = find_unconfirmed_client(clid, false, nn);
2955         /*
2956          * We try hard to give out unique clientid's, so if we get an
2957          * attempt to confirm the same clientid with a different cred,
2958          * there's a bug somewhere.  Let's charitably assume it's our
2959          * bug.
2960          */
2961         status = nfserr_serverfault;
2962         if (unconf && !same_creds(&unconf->cl_cred, &rqstp->rq_cred))
2963                 goto out;
2964         if (conf && !same_creds(&conf->cl_cred, &rqstp->rq_cred))
2965                 goto out;
2966         /* cases below refer to rfc 3530 section 14.2.34: */
2967         if (!unconf || !same_verf(&confirm, &unconf->cl_confirm)) {
2968                 if (conf && !unconf) /* case 2: probable retransmit */
2969                         status = nfs_ok;
2970                 else /* case 4: client hasn't noticed we rebooted yet? */
2971                         status = nfserr_stale_clientid;
2972                 goto out;
2973         }
2974         status = nfs_ok;
2975         if (conf) { /* case 1: callback update */
2976                 nfsd4_change_callback(conf, &unconf->cl_cb_conn);
2977                 nfsd4_probe_callback(conf);
2978                 expire_client(unconf);
2979         } else { /* case 3: normal case; new or rebooted client */
2980                 conf = find_confirmed_client_by_name(&unconf->cl_name, nn);
2981                 if (conf) {
2982                         status = mark_client_expired(conf);
2983                         if (status)
2984                                 goto out;
2985                         expire_client(conf);
2986                 }
2987                 move_to_confirmed(unconf);
2988                 nfsd4_probe_callback(unconf);
2989         }
2990 out:
2991         nfs4_unlock_state();
2992         return status;
2993 }
2994
2995 static struct nfs4_file *nfsd4_alloc_file(void)
2996 {
2997         return kmem_cache_alloc(file_slab, GFP_KERNEL);
2998 }
2999
3000 /* OPEN Share state helper functions */
3001 static void nfsd4_init_file(struct nfs4_file *fp, struct knfsd_fh *fh)
3002 {
3003         unsigned int hashval = file_hashval(fh);
3004
3005         lockdep_assert_held(&state_lock);
3006
3007         atomic_set(&fp->fi_ref, 1);
3008         spin_lock_init(&fp->fi_lock);
3009         INIT_LIST_HEAD(&fp->fi_stateids);
3010         INIT_LIST_HEAD(&fp->fi_delegations);
3011         fh_copy_shallow(&fp->fi_fhandle, fh);
3012         fp->fi_had_conflict = false;
3013         fp->fi_lease = NULL;
3014         fp->fi_share_deny = 0;
3015         memset(fp->fi_fds, 0, sizeof(fp->fi_fds));
3016         memset(fp->fi_access, 0, sizeof(fp->fi_access));
3017         hlist_add_head(&fp->fi_hash, &file_hashtbl[hashval]);
3018 }
3019
3020 void
3021 nfsd4_free_slabs(void)
3022 {
3023         kmem_cache_destroy(openowner_slab);
3024         kmem_cache_destroy(lockowner_slab);
3025         kmem_cache_destroy(file_slab);
3026         kmem_cache_destroy(stateid_slab);
3027         kmem_cache_destroy(deleg_slab);
3028 }
3029
3030 int
3031 nfsd4_init_slabs(void)
3032 {
3033         openowner_slab = kmem_cache_create("nfsd4_openowners",
3034                         sizeof(struct nfs4_openowner), 0, 0, NULL);
3035         if (openowner_slab == NULL)
3036                 goto out;
3037         lockowner_slab = kmem_cache_create("nfsd4_lockowners",
3038                         sizeof(struct nfs4_lockowner), 0, 0, NULL);
3039         if (lockowner_slab == NULL)
3040                 goto out_free_openowner_slab;
3041         file_slab = kmem_cache_create("nfsd4_files",
3042                         sizeof(struct nfs4_file), 0, 0, NULL);
3043         if (file_slab == NULL)
3044                 goto out_free_lockowner_slab;
3045         stateid_slab = kmem_cache_create("nfsd4_stateids",
3046                         sizeof(struct nfs4_ol_stateid), 0, 0, NULL);
3047         if (stateid_slab == NULL)
3048                 goto out_free_file_slab;
3049         deleg_slab = kmem_cache_create("nfsd4_delegations",
3050                         sizeof(struct nfs4_delegation), 0, 0, NULL);
3051         if (deleg_slab == NULL)
3052                 goto out_free_stateid_slab;
3053         return 0;
3054
3055 out_free_stateid_slab:
3056         kmem_cache_destroy(stateid_slab);
3057 out_free_file_slab:
3058         kmem_cache_destroy(file_slab);
3059 out_free_lockowner_slab:
3060         kmem_cache_destroy(lockowner_slab);
3061 out_free_openowner_slab:
3062         kmem_cache_destroy(openowner_slab);
3063 out:
3064         dprintk("nfsd4: out of memory while initializing nfsv4\n");
3065         return -ENOMEM;
3066 }
3067
3068 static void init_nfs4_replay(struct nfs4_replay *rp)
3069 {
3070         rp->rp_status = nfserr_serverfault;
3071         rp->rp_buflen = 0;
3072         rp->rp_buf = rp->rp_ibuf;
3073         mutex_init(&rp->rp_mutex);
3074 }
3075
3076 static void nfsd4_cstate_assign_replay(struct nfsd4_compound_state *cstate,
3077                 struct nfs4_stateowner *so)
3078 {
3079         if (!nfsd4_has_session(cstate)) {
3080                 mutex_lock(&so->so_replay.rp_mutex);
3081                 cstate->replay_owner = so;
3082                 atomic_inc(&so->so_count);
3083         }
3084 }
3085
3086 void nfsd4_cstate_clear_replay(struct nfsd4_compound_state *cstate)
3087 {
3088         struct nfs4_stateowner *so = cstate->replay_owner;
3089
3090         if (so != NULL) {
3091                 cstate->replay_owner = NULL;
3092                 mutex_unlock(&so->so_replay.rp_mutex);
3093                 nfs4_put_stateowner(so);
3094         }
3095 }
3096
3097 static inline void *alloc_stateowner(struct kmem_cache *slab, struct xdr_netobj *owner, struct nfs4_client *clp)
3098 {
3099         struct nfs4_stateowner *sop;
3100
3101         sop = kmem_cache_alloc(slab, GFP_KERNEL);
3102         if (!sop)
3103                 return NULL;
3104
3105         sop->so_owner.data = kmemdup(owner->data, owner->len, GFP_KERNEL);
3106         if (!sop->so_owner.data) {
3107                 kmem_cache_free(slab, sop);
3108                 return NULL;
3109         }
3110         sop->so_owner.len = owner->len;
3111
3112         INIT_LIST_HEAD(&sop->so_stateids);
3113         sop->so_client = clp;
3114         init_nfs4_replay(&sop->so_replay);
3115         atomic_set(&sop->so_count, 1);
3116         return sop;
3117 }
3118
3119 static void hash_openowner(struct nfs4_openowner *oo, struct nfs4_client *clp, unsigned int strhashval)
3120 {
3121         lockdep_assert_held(&clp->cl_lock);
3122
3123         list_add(&oo->oo_owner.so_strhash,
3124                  &clp->cl_ownerstr_hashtbl[strhashval]);
3125         list_add(&oo->oo_perclient, &clp->cl_openowners);
3126 }
3127
3128 static void nfs4_unhash_openowner(struct nfs4_stateowner *so)
3129 {
3130         unhash_openowner_locked(openowner(so));
3131 }
3132
3133 static void nfs4_free_openowner(struct nfs4_stateowner *so)
3134 {
3135         struct nfs4_openowner *oo = openowner(so);
3136
3137         kmem_cache_free(openowner_slab, oo);
3138 }
3139
3140 static const struct nfs4_stateowner_operations openowner_ops = {
3141         .so_unhash =    nfs4_unhash_openowner,
3142         .so_free =      nfs4_free_openowner,
3143 };
3144
3145 static struct nfs4_openowner *
3146 alloc_init_open_stateowner(unsigned int strhashval, struct nfsd4_open *open,
3147                            struct nfsd4_compound_state *cstate)
3148 {
3149         struct nfs4_client *clp = cstate->clp;
3150         struct nfs4_openowner *oo, *ret;
3151
3152         oo = alloc_stateowner(openowner_slab, &open->op_owner, clp);
3153         if (!oo)
3154                 return NULL;
3155         oo->oo_owner.so_ops = &openowner_ops;
3156         oo->oo_owner.so_is_open_owner = 1;
3157         oo->oo_owner.so_seqid = open->op_seqid;
3158         oo->oo_flags = 0;
3159         if (nfsd4_has_session(cstate))
3160                 oo->oo_flags |= NFS4_OO_CONFIRMED;
3161         oo->oo_time = 0;
3162         oo->oo_last_closed_stid = NULL;
3163         INIT_LIST_HEAD(&oo->oo_close_lru);
3164         spin_lock(&clp->cl_lock);
3165         ret = find_openstateowner_str_locked(strhashval, open, clp);
3166         if (ret == NULL) {
3167                 hash_openowner(oo, clp, strhashval);
3168                 ret = oo;
3169         } else
3170                 nfs4_free_openowner(&oo->oo_owner);
3171         spin_unlock(&clp->cl_lock);
3172         return oo;
3173 }
3174
3175 static void init_open_stateid(struct nfs4_ol_stateid *stp, struct nfs4_file *fp, struct nfsd4_open *open) {
3176         struct nfs4_openowner *oo = open->op_openowner;
3177
3178         atomic_inc(&stp->st_stid.sc_count);
3179         stp->st_stid.sc_type = NFS4_OPEN_STID;
3180         INIT_LIST_HEAD(&stp->st_locks);
3181         stp->st_stateowner = &oo->oo_owner;
3182         atomic_inc(&stp->st_stateowner->so_count);
3183         get_nfs4_file(fp);
3184         stp->st_stid.sc_file = fp;
3185         stp->st_access_bmap = 0;
3186         stp->st_deny_bmap = 0;
3187         stp->st_openstp = NULL;
3188         spin_lock(&oo->oo_owner.so_client->cl_lock);
3189         list_add(&stp->st_perstateowner, &oo->oo_owner.so_stateids);
3190         spin_lock(&fp->fi_lock);
3191         list_add(&stp->st_perfile, &fp->fi_stateids);
3192         spin_unlock(&fp->fi_lock);
3193         spin_unlock(&oo->oo_owner.so_client->cl_lock);
3194 }
3195
3196 /*
3197  * In the 4.0 case we need to keep the owners around a little while to handle
3198  * CLOSE replay. We still do need to release any file access that is held by
3199  * them before returning however.
3200  */
3201 static void
3202 move_to_close_lru(struct nfs4_ol_stateid *s, struct net *net)
3203 {
3204         struct nfs4_openowner *oo = openowner(s->st_stateowner);
3205         struct nfsd_net *nn = net_generic(s->st_stid.sc_client->net,
3206                                                 nfsd_net_id);
3207
3208         dprintk("NFSD: move_to_close_lru nfs4_openowner %p\n", oo);
3209
3210         /*
3211          * We know that we hold one reference via nfsd4_close, and another
3212          * "persistent" reference for the client. If the refcount is higher
3213          * than 2, then there are still calls in progress that are using this
3214          * stateid. We can't put the sc_file reference until they are finished.
3215          * Wait for the refcount to drop to 2. Since it has been unhashed,
3216          * there should be no danger of the refcount going back up again at
3217          * this point.
3218          */
3219         wait_event(close_wq, atomic_read(&s->st_stid.sc_count) == 2);
3220
3221         release_all_access(s);
3222         if (s->st_stid.sc_file) {
3223                 put_nfs4_file(s->st_stid.sc_file);
3224                 s->st_stid.sc_file = NULL;
3225         }
3226         release_last_closed_stateid(oo);
3227         oo->oo_last_closed_stid = s;
3228         list_move_tail(&oo->oo_close_lru, &nn->close_lru);
3229         oo->oo_time = get_seconds();
3230 }
3231
3232 /* search file_hashtbl[] for file */
3233 static struct nfs4_file *
3234 find_file_locked(struct knfsd_fh *fh)
3235 {
3236         unsigned int hashval = file_hashval(fh);
3237         struct nfs4_file *fp;
3238
3239         lockdep_assert_held(&state_lock);
3240
3241         hlist_for_each_entry(fp, &file_hashtbl[hashval], fi_hash) {
3242                 if (nfsd_fh_match(&fp->fi_fhandle, fh)) {
3243                         get_nfs4_file(fp);
3244                         return fp;
3245                 }
3246         }
3247         return NULL;
3248 }
3249
3250 static struct nfs4_file *
3251 find_file(struct knfsd_fh *fh)
3252 {
3253         struct nfs4_file *fp;
3254
3255         spin_lock(&state_lock);
3256         fp = find_file_locked(fh);
3257         spin_unlock(&state_lock);
3258         return fp;
3259 }
3260
3261 static struct nfs4_file *
3262 find_or_add_file(struct nfs4_file *new, struct knfsd_fh *fh)
3263 {
3264         struct nfs4_file *fp;
3265
3266         spin_lock(&state_lock);
3267         fp = find_file_locked(fh);
3268         if (fp == NULL) {
3269                 nfsd4_init_file(new, fh);
3270                 fp = new;
3271         }
3272         spin_unlock(&state_lock);
3273
3274         return fp;
3275 }
3276
3277 /*
3278  * Called to check deny when READ with all zero stateid or
3279  * WRITE with all zero or all one stateid
3280  */
3281 static __be32
3282 nfs4_share_conflict(struct svc_fh *current_fh, unsigned int deny_type)
3283 {
3284         struct nfs4_file *fp;
3285         __be32 ret = nfs_ok;
3286
3287         fp = find_file(&current_fh->fh_handle);
3288         if (!fp)
3289                 return ret;
3290         /* Check for conflicting share reservations */
3291         spin_lock(&fp->fi_lock);
3292         if (fp->fi_share_deny & deny_type)
3293                 ret = nfserr_locked;
3294         spin_unlock(&fp->fi_lock);
3295         put_nfs4_file(fp);
3296         return ret;
3297 }
3298
3299 void nfsd4_prepare_cb_recall(struct nfs4_delegation *dp)
3300 {
3301         struct nfsd_net *nn = net_generic(dp->dl_stid.sc_client->net,
3302                                           nfsd_net_id);
3303
3304         block_delegations(&dp->dl_stid.sc_file->fi_fhandle);
3305
3306         /*
3307          * We can't do this in nfsd_break_deleg_cb because it is
3308          * already holding inode->i_lock.
3309          *
3310          * If the dl_time != 0, then we know that it has already been
3311          * queued for a lease break. Don't queue it again.
3312          */
3313         spin_lock(&state_lock);
3314         if (dp->dl_time == 0) {
3315                 dp->dl_time = get_seconds();
3316                 list_add_tail(&dp->dl_recall_lru, &nn->del_recall_lru);
3317         }
3318         spin_unlock(&state_lock);
3319 }
3320
3321 static void nfsd_break_one_deleg(struct nfs4_delegation *dp)
3322 {
3323         /*
3324          * We're assuming the state code never drops its reference
3325          * without first removing the lease.  Since we're in this lease
3326          * callback (and since the lease code is serialized by the kernel
3327          * lock) we know the server hasn't removed the lease yet, we know
3328          * it's safe to take a reference.
3329          */
3330         atomic_inc(&dp->dl_stid.sc_count);
3331         nfsd4_cb_recall(dp);
3332 }
3333
3334 /* Called from break_lease() with i_lock held. */
3335 static void nfsd_break_deleg_cb(struct file_lock *fl)
3336 {
3337         struct nfs4_file *fp = (struct nfs4_file *)fl->fl_owner;
3338         struct nfs4_delegation *dp;
3339
3340         if (!fp) {
3341                 WARN(1, "(%p)->fl_owner NULL\n", fl);
3342                 return;
3343         }
3344         if (fp->fi_had_conflict) {
3345                 WARN(1, "duplicate break on %p\n", fp);
3346                 return;
3347         }
3348         /*
3349          * We don't want the locks code to timeout the lease for us;
3350          * we'll remove it ourself if a delegation isn't returned
3351          * in time:
3352          */
3353         fl->fl_break_time = 0;
3354
3355         spin_lock(&fp->fi_lock);
3356         fp->fi_had_conflict = true;
3357         /*
3358          * If there are no delegations on the list, then we can't count on this
3359          * lease ever being cleaned up. Set the fl_break_time to jiffies so that
3360          * time_out_leases will do it ASAP. The fact that fi_had_conflict is now
3361          * true should keep any new delegations from being hashed.
3362          */
3363         if (list_empty(&fp->fi_delegations))
3364                 fl->fl_break_time = jiffies;
3365         else
3366                 list_for_each_entry(dp, &fp->fi_delegations, dl_perfile)
3367                         nfsd_break_one_deleg(dp);
3368         spin_unlock(&fp->fi_lock);
3369 }
3370
3371 static
3372 int nfsd_change_deleg_cb(struct file_lock **onlist, int arg)
3373 {
3374         if (arg & F_UNLCK)
3375                 return lease_modify(onlist, arg);
3376         else
3377                 return -EAGAIN;
3378 }
3379
3380 static const struct lock_manager_operations nfsd_lease_mng_ops = {
3381         .lm_break = nfsd_break_deleg_cb,
3382         .lm_change = nfsd_change_deleg_cb,
3383 };
3384
3385 static __be32 nfsd4_check_seqid(struct nfsd4_compound_state *cstate, struct nfs4_stateowner *so, u32 seqid)
3386 {
3387         if (nfsd4_has_session(cstate))
3388                 return nfs_ok;
3389         if (seqid == so->so_seqid - 1)
3390                 return nfserr_replay_me;
3391         if (seqid == so->so_seqid)
3392                 return nfs_ok;
3393         return nfserr_bad_seqid;
3394 }
3395
3396 static __be32 lookup_clientid(clientid_t *clid,
3397                 struct nfsd4_compound_state *cstate,
3398                 struct nfsd_net *nn)
3399 {
3400         struct nfs4_client *found;
3401
3402         if (cstate->clp) {
3403                 found = cstate->clp;
3404                 if (!same_clid(&found->cl_clientid, clid))
3405                         return nfserr_stale_clientid;
3406                 return nfs_ok;
3407         }
3408
3409         if (STALE_CLIENTID(clid, nn))
3410                 return nfserr_stale_clientid;
3411
3412         /*
3413          * For v4.1+ we get the client in the SEQUENCE op. If we don't have one
3414          * cached already then we know this is for is for v4.0 and "sessions"
3415          * will be false.
3416          */
3417         WARN_ON_ONCE(cstate->session);
3418         found = find_confirmed_client(clid, false, nn);
3419         if (!found)
3420                 return nfserr_expired;
3421
3422         /* Cache the nfs4_client in cstate! */
3423         cstate->clp = found;
3424         atomic_inc(&found->cl_refcount);
3425         return nfs_ok;
3426 }
3427
3428 __be32
3429 nfsd4_process_open1(struct nfsd4_compound_state *cstate,
3430                     struct nfsd4_open *open, struct nfsd_net *nn)
3431 {
3432         clientid_t *clientid = &open->op_clientid;
3433         struct nfs4_client *clp = NULL;
3434         unsigned int strhashval;
3435         struct nfs4_openowner *oo = NULL;
3436         __be32 status;
3437
3438         if (STALE_CLIENTID(&open->op_clientid, nn))
3439                 return nfserr_stale_clientid;
3440         /*
3441          * In case we need it later, after we've already created the
3442          * file and don't want to risk a further failure:
3443          */
3444         open->op_file = nfsd4_alloc_file();
3445         if (open->op_file == NULL)
3446                 return nfserr_jukebox;
3447
3448         status = lookup_clientid(clientid, cstate, nn);
3449         if (status)
3450                 return status;
3451         clp = cstate->clp;
3452
3453         strhashval = ownerstr_hashval(&open->op_owner);
3454         oo = find_openstateowner_str(strhashval, open, clp);
3455         open->op_openowner = oo;
3456         if (!oo) {
3457                 goto new_owner;
3458         }
3459         if (!(oo->oo_flags & NFS4_OO_CONFIRMED)) {
3460                 /* Replace unconfirmed owners without checking for replay. */
3461                 release_openowner(oo);
3462                 open->op_openowner = NULL;
3463                 goto new_owner;
3464         }
3465         status = nfsd4_check_seqid(cstate, &oo->oo_owner, open->op_seqid);
3466         if (status)
3467                 return status;
3468         goto alloc_stateid;
3469 new_owner:
3470         oo = alloc_init_open_stateowner(strhashval, open, cstate);
3471         if (oo == NULL)
3472                 return nfserr_jukebox;
3473         open->op_openowner = oo;
3474 alloc_stateid:
3475         open->op_stp = nfs4_alloc_open_stateid(clp);
3476         if (!open->op_stp)
3477                 return nfserr_jukebox;
3478         return nfs_ok;
3479 }
3480
3481 static inline __be32
3482 nfs4_check_delegmode(struct nfs4_delegation *dp, int flags)
3483 {
3484         if ((flags & WR_STATE) && (dp->dl_type == NFS4_OPEN_DELEGATE_READ))
3485                 return nfserr_openmode;
3486         else
3487                 return nfs_ok;
3488 }
3489
3490 static int share_access_to_flags(u32 share_access)
3491 {
3492         return share_access == NFS4_SHARE_ACCESS_READ ? RD_STATE : WR_STATE;
3493 }
3494
3495 static struct nfs4_delegation *find_deleg_stateid(struct nfs4_client *cl, stateid_t *s)
3496 {
3497         struct nfs4_stid *ret;
3498
3499         ret = find_stateid_by_type(cl, s, NFS4_DELEG_STID);
3500         if (!ret)
3501                 return NULL;
3502         return delegstateid(ret);
3503 }
3504
3505 static bool nfsd4_is_deleg_cur(struct nfsd4_open *open)
3506 {
3507         return open->op_claim_type == NFS4_OPEN_CLAIM_DELEGATE_CUR ||
3508                open->op_claim_type == NFS4_OPEN_CLAIM_DELEG_CUR_FH;
3509 }
3510
3511 static __be32
3512 nfs4_check_deleg(struct nfs4_client *cl, struct nfsd4_open *open,
3513                 struct nfs4_delegation **dp)
3514 {
3515         int flags;
3516         __be32 status = nfserr_bad_stateid;
3517         struct nfs4_delegation *deleg;
3518
3519         deleg = find_deleg_stateid(cl, &open->op_delegate_stateid);
3520         if (deleg == NULL)
3521                 goto out;
3522         flags = share_access_to_flags(open->op_share_access);
3523         status = nfs4_check_delegmode(deleg, flags);
3524         if (status) {
3525                 nfs4_put_stid(&deleg->dl_stid);
3526                 goto out;
3527         }
3528         *dp = deleg;
3529 out:
3530         if (!nfsd4_is_deleg_cur(open))
3531                 return nfs_ok;
3532         if (status)
3533                 return status;
3534         open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
3535         return nfs_ok;
3536 }
3537
3538 static struct nfs4_ol_stateid *
3539 nfsd4_find_existing_open(struct nfs4_file *fp, struct nfsd4_open *open)
3540 {
3541         struct nfs4_ol_stateid *local, *ret = NULL;
3542         struct nfs4_openowner *oo = open->op_openowner;
3543
3544         spin_lock(&fp->fi_lock);
3545         list_for_each_entry(local, &fp->fi_stateids, st_perfile) {
3546                 /* ignore lock owners */
3547                 if (local->st_stateowner->so_is_open_owner == 0)
3548                         continue;
3549                 if (local->st_stateowner == &oo->oo_owner) {
3550                         ret = local;
3551                         atomic_inc(&ret->st_stid.sc_count);
3552                         break;
3553                 }
3554         }
3555         spin_unlock(&fp->fi_lock);
3556         return ret;
3557 }
3558
3559 static inline int nfs4_access_to_access(u32 nfs4_access)
3560 {
3561         int flags = 0;
3562
3563         if (nfs4_access & NFS4_SHARE_ACCESS_READ)
3564                 flags |= NFSD_MAY_READ;
3565         if (nfs4_access & NFS4_SHARE_ACCESS_WRITE)
3566                 flags |= NFSD_MAY_WRITE;
3567         return flags;
3568 }
3569
3570 static inline __be32
3571 nfsd4_truncate(struct svc_rqst *rqstp, struct svc_fh *fh,
3572                 struct nfsd4_open *open)
3573 {
3574         struct iattr iattr = {
3575                 .ia_valid = ATTR_SIZE,
3576                 .ia_size = 0,
3577         };
3578         if (!open->op_truncate)
3579                 return 0;
3580         if (!(open->op_share_access & NFS4_SHARE_ACCESS_WRITE))
3581                 return nfserr_inval;
3582         return nfsd_setattr(rqstp, fh, &iattr, 0, (time_t)0);
3583 }
3584
3585 static __be32 nfs4_get_vfs_file(struct svc_rqst *rqstp, struct nfs4_file *fp,
3586                 struct svc_fh *cur_fh, struct nfs4_ol_stateid *stp,
3587                 struct nfsd4_open *open)
3588 {
3589         struct file *filp = NULL;
3590         __be32 status;
3591         int oflag = nfs4_access_to_omode(open->op_share_access);
3592         int access = nfs4_access_to_access(open->op_share_access);
3593         unsigned char old_access_bmap, old_deny_bmap;
3594
3595         spin_lock(&fp->fi_lock);
3596
3597         /*
3598          * Are we trying to set a deny mode that would conflict with
3599          * current access?
3600          */
3601         status = nfs4_file_check_deny(fp, open->op_share_deny);
3602         if (status != nfs_ok) {
3603                 spin_unlock(&fp->fi_lock);
3604                 goto out;
3605         }
3606
3607         /* set access to the file */
3608         status = nfs4_file_get_access(fp, open->op_share_access);
3609         if (status != nfs_ok) {
3610                 spin_unlock(&fp->fi_lock);
3611                 goto out;
3612         }
3613
3614         /* Set access bits in stateid */
3615         old_access_bmap = stp->st_access_bmap;
3616         set_access(open->op_share_access, stp);
3617
3618         /* Set new deny mask */
3619         old_deny_bmap = stp->st_deny_bmap;
3620         set_deny(open->op_share_deny, stp);
3621         fp->fi_share_deny |= (open->op_share_deny & NFS4_SHARE_DENY_BOTH);
3622
3623         if (!fp->fi_fds[oflag]) {
3624                 spin_unlock(&fp->fi_lock);
3625                 status = nfsd_open(rqstp, cur_fh, S_IFREG, access, &filp);
3626                 if (status)
3627                         goto out_put_access;
3628                 spin_lock(&fp->fi_lock);
3629                 if (!fp->fi_fds[oflag]) {
3630                         fp->fi_fds[oflag] = filp;
3631                         filp = NULL;
3632                 }
3633         }
3634         spin_unlock(&fp->fi_lock);
3635         if (filp)
3636                 fput(filp);
3637
3638         status = nfsd4_truncate(rqstp, cur_fh, open);
3639         if (status)
3640                 goto out_put_access;
3641 out:
3642         return status;
3643 out_put_access:
3644         stp->st_access_bmap = old_access_bmap;
3645         nfs4_file_put_access(fp, open->op_share_access);
3646         reset_union_bmap_deny(bmap_to_share_mode(old_deny_bmap), stp);
3647         goto out;
3648 }
3649
3650 static __be32
3651 nfs4_upgrade_open(struct svc_rqst *rqstp, struct nfs4_file *fp, struct svc_fh *cur_fh, struct nfs4_ol_stateid *stp, struct nfsd4_open *open)
3652 {
3653         __be32 status;
3654         unsigned char old_deny_bmap;
3655
3656         if (!test_access(open->op_share_access, stp))
3657                 return nfs4_get_vfs_file(rqstp, fp, cur_fh, stp, open);
3658
3659         /* test and set deny mode */
3660         spin_lock(&fp->fi_lock);
3661         status = nfs4_file_check_deny(fp, open->op_share_deny);
3662         if (status == nfs_ok) {
3663                 old_deny_bmap = stp->st_deny_bmap;
3664                 set_deny(open->op_share_deny, stp);
3665                 fp->fi_share_deny |=
3666                                 (open->op_share_deny & NFS4_SHARE_DENY_BOTH);
3667         }
3668         spin_unlock(&fp->fi_lock);
3669
3670         if (status != nfs_ok)
3671                 return status;
3672
3673         status = nfsd4_truncate(rqstp, cur_fh, open);
3674         if (status != nfs_ok)
3675                 reset_union_bmap_deny(old_deny_bmap, stp);
3676         return status;
3677 }
3678
3679 static void
3680 nfs4_set_claim_prev(struct nfsd4_open *open, bool has_session)
3681 {
3682         open->op_openowner->oo_flags |= NFS4_OO_CONFIRMED;
3683 }
3684
3685 /* Should we give out recallable state?: */
3686 static bool nfsd4_cb_channel_good(struct nfs4_client *clp)
3687 {
3688         if (clp->cl_cb_state == NFSD4_CB_UP)
3689                 return true;
3690         /*
3691          * In the sessions case, since we don't have to establish a
3692          * separate connection for callbacks, we assume it's OK
3693          * until we hear otherwise:
3694          */
3695         return clp->cl_minorversion && clp->cl_cb_state == NFSD4_CB_UNKNOWN;
3696 }
3697
3698 static struct file_lock *nfs4_alloc_init_lease(struct nfs4_file *fp, int flag)
3699 {
3700         struct file_lock *fl;
3701
3702         fl = locks_alloc_lock();
3703         if (!fl)
3704                 return NULL;
3705         locks_init_lock(fl);
3706         fl->fl_lmops = &nfsd_lease_mng_ops;
3707         fl->fl_flags = FL_DELEG;
3708         fl->fl_type = flag == NFS4_OPEN_DELEGATE_READ? F_RDLCK: F_WRLCK;
3709         fl->fl_end = OFFSET_MAX;
3710         fl->fl_owner = (fl_owner_t)fp;
3711         fl->fl_pid = current->tgid;
3712         return fl;
3713 }
3714
3715 static int nfs4_setlease(struct nfs4_delegation *dp)
3716 {
3717         struct nfs4_file *fp = dp->dl_stid.sc_file;
3718         struct file_lock *fl;
3719         struct file *filp;
3720         int status = 0;
3721
3722         fl = nfs4_alloc_init_lease(fp, NFS4_OPEN_DELEGATE_READ);
3723         if (!fl)
3724                 return -ENOMEM;
3725         filp = find_readable_file(fp);
3726         if (!filp) {
3727                 /* We should always have a readable file here */
3728                 WARN_ON_ONCE(1);
3729                 return -EBADF;
3730         }
3731         fl->fl_file = filp;
3732         status = vfs_setlease(filp, fl->fl_type, &fl);
3733         if (status) {
3734                 locks_free_lock(fl);
3735                 goto out_fput;
3736         }
3737         spin_lock(&state_lock);
3738         spin_lock(&fp->fi_lock);
3739         /* Did the lease get broken before we took the lock? */
3740         status = -EAGAIN;
3741         if (fp->fi_had_conflict)
3742                 goto out_unlock;
3743         /* Race breaker */
3744         if (fp->fi_lease) {
3745                 status = 0;
3746                 atomic_inc(&fp->fi_delegees);
3747                 hash_delegation_locked(dp, fp);
3748                 goto out_unlock;
3749         }
3750         fp->fi_lease = fl;
3751         fp->fi_deleg_file = filp;
3752         atomic_set(&fp->fi_delegees, 1);
3753         hash_delegation_locked(dp, fp);
3754         spin_unlock(&fp->fi_lock);
3755         spin_unlock(&state_lock);
3756         return 0;
3757 out_unlock:
3758         spin_unlock(&fp->fi_lock);
3759         spin_unlock(&state_lock);
3760 out_fput:
3761         fput(filp);
3762         return status;
3763 }
3764
3765 static struct nfs4_delegation *
3766 nfs4_set_delegation(struct nfs4_client *clp, struct svc_fh *fh,
3767                     struct nfs4_file *fp)
3768 {
3769         int status;
3770         struct nfs4_delegation *dp;
3771
3772         if (fp->fi_had_conflict)
3773                 return ERR_PTR(-EAGAIN);
3774
3775         dp = alloc_init_deleg(clp, fh);
3776         if (!dp)
3777                 return ERR_PTR(-ENOMEM);
3778
3779         get_nfs4_file(fp);
3780         spin_lock(&state_lock);
3781         spin_lock(&fp->fi_lock);
3782         dp->dl_stid.sc_file = fp;
3783         if (!fp->fi_lease) {
3784                 spin_unlock(&fp->fi_lock);
3785                 spin_unlock(&state_lock);
3786                 status = nfs4_setlease(dp);
3787                 goto out;
3788         }
3789         atomic_inc(&fp->fi_delegees);
3790         if (fp->fi_had_conflict) {
3791                 status = -EAGAIN;
3792                 goto out_unlock;
3793         }
3794         hash_delegation_locked(dp, fp);
3795         status = 0;
3796 out_unlock:
3797         spin_unlock(&fp->fi_lock);
3798         spin_unlock(&state_lock);
3799 out:
3800         if (status) {
3801                 nfs4_put_stid(&dp->dl_stid);
3802                 return ERR_PTR(status);
3803         }
3804         return dp;
3805 }
3806
3807 static void nfsd4_open_deleg_none_ext(struct nfsd4_open *open, int status)
3808 {
3809         open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE_EXT;
3810         if (status == -EAGAIN)
3811                 open->op_why_no_deleg = WND4_CONTENTION;
3812         else {
3813                 open->op_why_no_deleg = WND4_RESOURCE;
3814                 switch (open->op_deleg_want) {
3815                 case NFS4_SHARE_WANT_READ_DELEG:
3816                 case NFS4_SHARE_WANT_WRITE_DELEG:
3817                 case NFS4_SHARE_WANT_ANY_DELEG:
3818                         break;
3819                 case NFS4_SHARE_WANT_CANCEL:
3820                         open->op_why_no_deleg = WND4_CANCELLED;
3821                         break;
3822                 case NFS4_SHARE_WANT_NO_DELEG:
3823                         WARN_ON_ONCE(1);
3824                 }
3825         }
3826 }
3827
3828 /*
3829  * Attempt to hand out a delegation.
3830  *
3831  * Note we don't support write delegations, and won't until the vfs has
3832  * proper support for them.
3833  */
3834 static void
3835 nfs4_open_delegation(struct svc_fh *fh, struct nfsd4_open *open,
3836                         struct nfs4_ol_stateid *stp)
3837 {
3838         struct nfs4_delegation *dp;
3839         struct nfs4_openowner *oo = openowner(stp->st_stateowner);
3840         struct nfs4_client *clp = stp->st_stid.sc_client;
3841         int cb_up;
3842         int status = 0;
3843
3844         cb_up = nfsd4_cb_channel_good(oo->oo_owner.so_client);
3845         open->op_recall = 0;
3846         switch (open->op_claim_type) {
3847                 case NFS4_OPEN_CLAIM_PREVIOUS:
3848                         if (!cb_up)
3849                                 open->op_recall = 1;
3850                         if (open->op_delegate_type != NFS4_OPEN_DELEGATE_READ)
3851                                 goto out_no_deleg;
3852                         break;
3853                 case NFS4_OPEN_CLAIM_NULL:
3854                 case NFS4_OPEN_CLAIM_FH:
3855                         /*
3856                          * Let's not give out any delegations till everyone's
3857                          * had the chance to reclaim theirs....
3858                          */
3859                         if (locks_in_grace(clp->net))
3860                                 goto out_no_deleg;
3861                         if (!cb_up || !(oo->oo_flags & NFS4_OO_CONFIRMED))
3862                                 goto out_no_deleg;
3863                         /*
3864                          * Also, if the file was opened for write or
3865                          * create, there's a good chance the client's
3866                          * about to write to it, resulting in an
3867                          * immediate recall (since we don't support
3868                          * write delegations):
3869                          */
3870                         if (open->op_share_access & NFS4_SHARE_ACCESS_WRITE)
3871                                 goto out_no_deleg;
3872                         if (open->op_create == NFS4_OPEN_CREATE)
3873                                 goto out_no_deleg;
3874                         break;
3875                 default:
3876                         goto out_no_deleg;
3877         }
3878         dp = nfs4_set_delegation(clp, fh, stp->st_stid.sc_file);
3879         if (IS_ERR(dp))
3880                 goto out_no_deleg;
3881
3882         memcpy(&open->op_delegate_stateid, &dp->dl_stid.sc_stateid, sizeof(dp->dl_stid.sc_stateid));
3883
3884         dprintk("NFSD: delegation stateid=" STATEID_FMT "\n",
3885                 STATEID_VAL(&dp->dl_stid.sc_stateid));
3886         open->op_delegate_type = NFS4_OPEN_DELEGATE_READ;
3887         nfs4_put_stid(&dp->dl_stid);
3888         return;
3889 out_no_deleg:
3890         open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE;
3891         if (open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS &&
3892             open->op_delegate_type != NFS4_OPEN_DELEGATE_NONE) {
3893                 dprintk("NFSD: WARNING: refusing delegation reclaim\n");
3894                 open->op_recall = 1;
3895         }
3896
3897         /* 4.1 client asking for a delegation? */
3898         if (open->op_deleg_want)
3899                 nfsd4_open_deleg_none_ext(open, status);
3900         return;
3901 }
3902
3903 static void nfsd4_deleg_xgrade_none_ext(struct nfsd4_open *open,
3904                                         struct nfs4_delegation *dp)
3905 {
3906         if (open->op_deleg_want == NFS4_SHARE_WANT_READ_DELEG &&
3907             dp->dl_type == NFS4_OPEN_DELEGATE_WRITE) {
3908                 open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE_EXT;
3909                 open->op_why_no_deleg = WND4_NOT_SUPP_DOWNGRADE;
3910         } else if (open->op_deleg_want == NFS4_SHARE_WANT_WRITE_DELEG &&
3911                    dp->dl_type == NFS4_OPEN_DELEGATE_WRITE) {
3912                 open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE_EXT;
3913                 open->op_why_no_deleg = WND4_NOT_SUPP_UPGRADE;
3914         }
3915         /* Otherwise the client must be confused wanting a delegation
3916          * it already has, therefore we don't return
3917          * NFS4_OPEN_DELEGATE_NONE_EXT and reason.
3918          */
3919 }
3920
3921 /*
3922  * called with nfs4_lock_state() held.
3923  */
3924 __be32
3925 nfsd4_process_open2(struct svc_rqst *rqstp, struct svc_fh *current_fh, struct nfsd4_open *open)
3926 {
3927         struct nfsd4_compoundres *resp = rqstp->rq_resp;
3928         struct nfs4_client *cl = open->op_openowner->oo_owner.so_client;
3929         struct nfs4_file *fp = NULL;
3930         struct nfs4_ol_stateid *stp = NULL;
3931         struct nfs4_delegation *dp = NULL;
3932         __be32 status;
3933
3934         /*
3935          * Lookup file; if found, lookup stateid and check open request,
3936          * and check for delegations in the process of being recalled.
3937          * If not found, create the nfs4_file struct
3938          */
3939         fp = find_or_add_file(open->op_file, &current_fh->fh_handle);
3940         if (fp != open->op_file) {
3941                 status = nfs4_check_deleg(cl, open, &dp);
3942                 if (status)
3943                         goto out;
3944                 stp = nfsd4_find_existing_open(fp, open);
3945         } else {
3946                 open->op_file = NULL;
3947                 status = nfserr_bad_stateid;
3948                 if (nfsd4_is_deleg_cur(open))
3949                         goto out;
3950                 status = nfserr_jukebox;
3951         }
3952
3953         /*
3954          * OPEN the file, or upgrade an existing OPEN.
3955          * If truncate fails, the OPEN fails.
3956          */
3957         if (stp) {
3958                 /* Stateid was found, this is an OPEN upgrade */
3959                 status = nfs4_upgrade_open(rqstp, fp, current_fh, stp, open);
3960                 if (status)
3961                         goto out;
3962         } else {
3963                 stp = open->op_stp;
3964                 open->op_stp = NULL;
3965                 init_open_stateid(stp, fp, open);
3966                 status = nfs4_get_vfs_file(rqstp, fp, current_fh, stp, open);
3967                 if (status) {
3968                         release_open_stateid(stp);
3969                         goto out;
3970                 }
3971         }
3972         update_stateid(&stp->st_stid.sc_stateid);
3973         memcpy(&open->op_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
3974
3975         if (nfsd4_has_session(&resp->cstate)) {
3976                 if (open->op_deleg_want & NFS4_SHARE_WANT_NO_DELEG) {
3977                         open->op_delegate_type = NFS4_OPEN_DELEGATE_NONE_EXT;
3978                         open->op_why_no_deleg = WND4_NOT_WANTED;
3979                         goto nodeleg;
3980                 }
3981         }
3982
3983         /*
3984         * Attempt to hand out a delegation. No error return, because the
3985         * OPEN succeeds even if we fail.
3986         */
3987         nfs4_open_delegation(current_fh, open, stp);
3988 nodeleg:
3989         status = nfs_ok;
3990
3991         dprintk("%s: stateid=" STATEID_FMT "\n", __func__,
3992                 STATEID_VAL(&stp->st_stid.sc_stateid));
3993 out:
3994         /* 4.1 client trying to upgrade/downgrade delegation? */
3995         if (open->op_delegate_type == NFS4_OPEN_DELEGATE_NONE && dp &&
3996             open->op_deleg_want)
3997                 nfsd4_deleg_xgrade_none_ext(open, dp);
3998
3999         if (fp)
4000                 put_nfs4_file(fp);
4001         if (status == 0 && open->op_claim_type == NFS4_OPEN_CLAIM_PREVIOUS)
4002                 nfs4_set_claim_prev(open, nfsd4_has_session(&resp->cstate));
4003         /*
4004         * To finish the open response, we just need to set the rflags.
4005         */
4006         open->op_rflags = NFS4_OPEN_RESULT_LOCKTYPE_POSIX;
4007         if (!(open->op_openowner->oo_flags & NFS4_OO_CONFIRMED) &&
4008             !nfsd4_has_session(&resp->cstate))
4009                 open->op_rflags |= NFS4_OPEN_RESULT_CONFIRM;
4010         if (dp)
4011                 nfs4_put_stid(&dp->dl_stid);
4012         if (stp)
4013                 nfs4_put_stid(&stp->st_stid);
4014
4015         return status;
4016 }
4017
4018 void nfsd4_cleanup_open_state(struct nfsd4_compound_state *cstate,
4019                               struct nfsd4_open *open, __be32 status)
4020 {
4021         if (open->op_openowner) {
4022                 struct nfs4_stateowner *so = &open->op_openowner->oo_owner;
4023
4024                 nfsd4_cstate_assign_replay(cstate, so);
4025                 nfs4_put_stateowner(so);
4026         }
4027         if (open->op_file)
4028                 nfsd4_free_file(open->op_file);
4029         if (open->op_stp)
4030                 nfs4_put_stid(&open->op_stp->st_stid);
4031 }
4032
4033 __be32
4034 nfsd4_renew(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
4035             clientid_t *clid)
4036 {
4037         struct nfs4_client *clp;
4038         __be32 status;
4039         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
4040
4041         nfs4_lock_state();
4042         dprintk("process_renew(%08x/%08x): starting\n", 
4043                         clid->cl_boot, clid->cl_id);
4044         status = lookup_clientid(clid, cstate, nn);
4045         if (status)
4046                 goto out;
4047         clp = cstate->clp;
4048         status = nfserr_cb_path_down;
4049         if (!list_empty(&clp->cl_delegations)
4050                         && clp->cl_cb_state != NFSD4_CB_UP)
4051                 goto out;
4052         status = nfs_ok;
4053 out:
4054         nfs4_unlock_state();
4055         return status;
4056 }
4057
4058 static void
4059 nfsd4_end_grace(struct nfsd_net *nn)
4060 {
4061         /* do nothing if grace period already ended */
4062         if (nn->grace_ended)
4063                 return;
4064
4065         dprintk("NFSD: end of grace period\n");
4066         nn->grace_ended = true;
4067         nfsd4_record_grace_done(nn, nn->boot_time);
4068         locks_end_grace(&nn->nfsd4_manager);
4069         /*
4070          * Now that every NFSv4 client has had the chance to recover and
4071          * to see the (possibly new, possibly shorter) lease time, we
4072          * can safely set the next grace time to the current lease time:
4073          */
4074         nn->nfsd4_grace = nn->nfsd4_lease;
4075 }
4076
4077 static time_t
4078 nfs4_laundromat(struct nfsd_net *nn)
4079 {
4080         struct nfs4_client *clp;
4081         struct nfs4_openowner *oo;
4082         struct nfs4_delegation *dp;
4083         struct list_head *pos, *next, reaplist;
4084         time_t cutoff = get_seconds() - nn->nfsd4_lease;
4085         time_t t, new_timeo = nn->nfsd4_lease;
4086
4087         nfs4_lock_state();
4088
4089         dprintk("NFSD: laundromat service - starting\n");
4090         nfsd4_end_grace(nn);
4091         INIT_LIST_HEAD(&reaplist);
4092         spin_lock(&nn->client_lock);
4093         list_for_each_safe(pos, next, &nn->client_lru) {
4094                 clp = list_entry(pos, struct nfs4_client, cl_lru);
4095                 if (time_after((unsigned long)clp->cl_time, (unsigned long)cutoff)) {
4096                         t = clp->cl_time - cutoff;
4097                         new_timeo = min(new_timeo, t);
4098                         break;
4099                 }
4100                 if (mark_client_expired_locked(clp)) {
4101                         dprintk("NFSD: client in use (clientid %08x)\n",
4102                                 clp->cl_clientid.cl_id);
4103                         continue;
4104                 }
4105                 list_move(&clp->cl_lru, &reaplist);
4106         }
4107         spin_unlock(&nn->client_lock);
4108         list_for_each_safe(pos, next, &reaplist) {
4109                 clp = list_entry(pos, struct nfs4_client, cl_lru);
4110                 dprintk("NFSD: purging unused client (clientid %08x)\n",
4111                         clp->cl_clientid.cl_id);
4112                 expire_client(clp);
4113         }
4114         spin_lock(&state_lock);
4115         list_for_each_safe(pos, next, &nn->del_recall_lru) {
4116                 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
4117                 if (net_generic(dp->dl_stid.sc_client->net, nfsd_net_id) != nn)
4118                         continue;
4119                 if (time_after((unsigned long)dp->dl_time, (unsigned long)cutoff)) {
4120                         t = dp->dl_time - cutoff;
4121                         new_timeo = min(new_timeo, t);
4122                         break;
4123                 }
4124                 unhash_delegation_locked(dp);
4125                 list_add(&dp->dl_recall_lru, &reaplist);
4126         }
4127         spin_unlock(&state_lock);
4128         while (!list_empty(&reaplist)) {
4129                 dp = list_first_entry(&reaplist, struct nfs4_delegation,
4130                                         dl_recall_lru);
4131                 list_del_init(&dp->dl_recall_lru);
4132                 revoke_delegation(dp);
4133         }
4134         list_for_each_safe(pos, next, &nn->close_lru) {
4135                 oo = container_of(pos, struct nfs4_openowner, oo_close_lru);
4136                 if (time_after((unsigned long)oo->oo_time, (unsigned long)cutoff)) {
4137                         t = oo->oo_time - cutoff;
4138                         new_timeo = min(new_timeo, t);
4139                         break;
4140                 }
4141                 release_last_closed_stateid(oo);
4142         }
4143         new_timeo = max_t(time_t, new_timeo, NFSD_LAUNDROMAT_MINTIMEOUT);
4144         nfs4_unlock_state();
4145         return new_timeo;
4146 }
4147
4148 static struct workqueue_struct *laundry_wq;
4149 static void laundromat_main(struct work_struct *);
4150
4151 static void
4152 laundromat_main(struct work_struct *laundry)
4153 {
4154         time_t t;
4155         struct delayed_work *dwork = container_of(laundry, struct delayed_work,
4156                                                   work);
4157         struct nfsd_net *nn = container_of(dwork, struct nfsd_net,
4158                                            laundromat_work);
4159
4160         t = nfs4_laundromat(nn);
4161         dprintk("NFSD: laundromat_main - sleeping for %ld seconds\n", t);
4162         queue_delayed_work(laundry_wq, &nn->laundromat_work, t*HZ);
4163 }
4164
4165 static inline __be32 nfs4_check_fh(struct svc_fh *fhp, struct nfs4_ol_stateid *stp)
4166 {
4167         if (!nfsd_fh_match(&fhp->fh_handle, &stp->st_stid.sc_file->fi_fhandle))
4168                 return nfserr_bad_stateid;
4169         return nfs_ok;
4170 }
4171
4172 static inline int
4173 access_permit_read(struct nfs4_ol_stateid *stp)
4174 {
4175         return test_access(NFS4_SHARE_ACCESS_READ, stp) ||
4176                 test_access(NFS4_SHARE_ACCESS_BOTH, stp) ||
4177                 test_access(NFS4_SHARE_ACCESS_WRITE, stp);
4178 }
4179
4180 static inline int
4181 access_permit_write(struct nfs4_ol_stateid *stp)
4182 {
4183         return test_access(NFS4_SHARE_ACCESS_WRITE, stp) ||
4184                 test_access(NFS4_SHARE_ACCESS_BOTH, stp);
4185 }
4186
4187 static
4188 __be32 nfs4_check_openmode(struct nfs4_ol_stateid *stp, int flags)
4189 {
4190         __be32 status = nfserr_openmode;
4191
4192         /* For lock stateid's, we test the parent open, not the lock: */
4193         if (stp->st_openstp)
4194                 stp = stp->st_openstp;
4195         if ((flags & WR_STATE) && !access_permit_write(stp))
4196                 goto out;
4197         if ((flags & RD_STATE) && !access_permit_read(stp))
4198                 goto out;
4199         status = nfs_ok;
4200 out:
4201         return status;
4202 }
4203
4204 static inline __be32
4205 check_special_stateids(struct net *net, svc_fh *current_fh, stateid_t *stateid, int flags)
4206 {
4207         if (ONE_STATEID(stateid) && (flags & RD_STATE))
4208                 return nfs_ok;
4209         else if (locks_in_grace(net)) {
4210                 /* Answer in remaining cases depends on existence of
4211                  * conflicting state; so we must wait out the grace period. */
4212                 return nfserr_grace;
4213         } else if (flags & WR_STATE)
4214                 return nfs4_share_conflict(current_fh,
4215                                 NFS4_SHARE_DENY_WRITE);
4216         else /* (flags & RD_STATE) && ZERO_STATEID(stateid) */
4217                 return nfs4_share_conflict(current_fh,
4218                                 NFS4_SHARE_DENY_READ);
4219 }
4220
4221 /*
4222  * Allow READ/WRITE during grace period on recovered state only for files
4223  * that are not able to provide mandatory locking.
4224  */
4225 static inline int
4226 grace_disallows_io(struct net *net, struct inode *inode)
4227 {
4228         return locks_in_grace(net) && mandatory_lock(inode);
4229 }
4230
4231 /* Returns true iff a is later than b: */
4232 static bool stateid_generation_after(stateid_t *a, stateid_t *b)
4233 {
4234         return (s32)(a->si_generation - b->si_generation) > 0;
4235 }
4236
4237 static __be32 check_stateid_generation(stateid_t *in, stateid_t *ref, bool has_session)
4238 {
4239         /*
4240          * When sessions are used the stateid generation number is ignored
4241          * when it is zero.
4242          */
4243         if (has_session && in->si_generation == 0)
4244                 return nfs_ok;
4245
4246         if (in->si_generation == ref->si_generation)
4247                 return nfs_ok;
4248
4249         /* If the client sends us a stateid from the future, it's buggy: */
4250         if (stateid_generation_after(in, ref))
4251                 return nfserr_bad_stateid;
4252         /*
4253          * However, we could see a stateid from the past, even from a
4254          * non-buggy client.  For example, if the client sends a lock
4255          * while some IO is outstanding, the lock may bump si_generation
4256          * while the IO is still in flight.  The client could avoid that
4257          * situation by waiting for responses on all the IO requests,
4258          * but better performance may result in retrying IO that
4259          * receives an old_stateid error if requests are rarely
4260          * reordered in flight:
4261          */
4262         return nfserr_old_stateid;
4263 }
4264
4265 static __be32 nfsd4_validate_stateid(struct nfs4_client *cl, stateid_t *stateid)
4266 {
4267         struct nfs4_stid *s;
4268         struct nfs4_ol_stateid *ols;
4269         __be32 status = nfserr_bad_stateid;
4270
4271         if (ZERO_STATEID(stateid) || ONE_STATEID(stateid))
4272                 return status;
4273         /* Client debugging aid. */
4274         if (!same_clid(&stateid->si_opaque.so_clid, &cl->cl_clientid)) {
4275                 char addr_str[INET6_ADDRSTRLEN];
4276                 rpc_ntop((struct sockaddr *)&cl->cl_addr, addr_str,
4277                                  sizeof(addr_str));
4278                 pr_warn_ratelimited("NFSD: client %s testing state ID "
4279                                         "with incorrect client ID\n", addr_str);
4280                 return status;
4281         }
4282         spin_lock(&cl->cl_lock);
4283         s = find_stateid_locked(cl, stateid);
4284         if (!s)
4285                 goto out_unlock;
4286         status = check_stateid_generation(stateid, &s->sc_stateid, 1);
4287         if (status)
4288                 goto out_unlock;
4289         switch (s->sc_type) {
4290         case NFS4_DELEG_STID:
4291                 status = nfs_ok;
4292                 break;
4293         case NFS4_REVOKED_DELEG_STID:
4294                 status = nfserr_deleg_revoked;
4295                 break;
4296         case NFS4_OPEN_STID:
4297         case NFS4_LOCK_STID:
4298                 ols = openlockstateid(s);
4299                 if (ols->st_stateowner->so_is_open_owner
4300                                 && !(openowner(ols->st_stateowner)->oo_flags
4301                                                 & NFS4_OO_CONFIRMED))
4302                         status = nfserr_bad_stateid;
4303                 else
4304                         status = nfs_ok;
4305                 break;
4306         default:
4307                 printk("unknown stateid type %x\n", s->sc_type);
4308                 /* Fallthrough */
4309         case NFS4_CLOSED_STID:
4310         case NFS4_CLOSED_DELEG_STID:
4311                 status = nfserr_bad_stateid;
4312         }
4313 out_unlock:
4314         spin_unlock(&cl->cl_lock);
4315         return status;
4316 }
4317
4318 static __be32
4319 nfsd4_lookup_stateid(struct nfsd4_compound_state *cstate,
4320                      stateid_t *stateid, unsigned char typemask,
4321                      struct nfs4_stid **s, struct nfsd_net *nn)
4322 {
4323         __be32 status;
4324
4325         if (ZERO_STATEID(stateid) || ONE_STATEID(stateid))
4326                 return nfserr_bad_stateid;
4327         status = lookup_clientid(&stateid->si_opaque.so_clid, cstate, nn);
4328         if (status == nfserr_stale_clientid) {
4329                 if (cstate->session)
4330                         return nfserr_bad_stateid;
4331                 return nfserr_stale_stateid;
4332         }
4333         if (status)
4334                 return status;
4335         *s = find_stateid_by_type(cstate->clp, stateid, typemask);
4336         if (!*s)
4337                 return nfserr_bad_stateid;
4338         return nfs_ok;
4339 }
4340
4341 /*
4342 * Checks for stateid operations
4343 */
4344 __be32
4345 nfs4_preprocess_stateid_op(struct net *net, struct nfsd4_compound_state *cstate,
4346                            stateid_t *stateid, int flags, struct file **filpp)
4347 {
4348         struct nfs4_stid *s;
4349         struct nfs4_ol_stateid *stp = NULL;
4350         struct nfs4_delegation *dp = NULL;
4351         struct svc_fh *current_fh = &cstate->current_fh;
4352         struct inode *ino = current_fh->fh_dentry->d_inode;
4353         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
4354         struct file *file = NULL;
4355         __be32 status;
4356
4357         if (filpp)
4358                 *filpp = NULL;
4359
4360         if (grace_disallows_io(net, ino))
4361                 return nfserr_grace;
4362
4363         if (ZERO_STATEID(stateid) || ONE_STATEID(stateid))
4364                 return check_special_stateids(net, current_fh, stateid, flags);
4365
4366         nfs4_lock_state();
4367
4368         status = nfsd4_lookup_stateid(cstate, stateid,
4369                                 NFS4_DELEG_STID|NFS4_OPEN_STID|NFS4_LOCK_STID,
4370                                 &s, nn);
4371         if (status)
4372                 goto unlock_state;
4373         status = check_stateid_generation(stateid, &s->sc_stateid, nfsd4_has_session(cstate));
4374         if (status)
4375                 goto out;
4376         switch (s->sc_type) {
4377         case NFS4_DELEG_STID:
4378                 dp = delegstateid(s);
4379                 status = nfs4_check_delegmode(dp, flags);
4380                 if (status)
4381                         goto out;
4382                 if (filpp) {
4383                         file = dp->dl_stid.sc_file->fi_deleg_file;
4384                         if (!file) {
4385                                 WARN_ON_ONCE(1);
4386                                 status = nfserr_serverfault;
4387                                 goto out;
4388                         }
4389                         get_file(file);
4390                 }
4391                 break;
4392         case NFS4_OPEN_STID:
4393         case NFS4_LOCK_STID:
4394                 stp = openlockstateid(s);
4395                 status = nfs4_check_fh(current_fh, stp);
4396                 if (status)
4397                         goto out;
4398                 if (stp->st_stateowner->so_is_open_owner
4399                     && !(openowner(stp->st_stateowner)->oo_flags & NFS4_OO_CONFIRMED))
4400                         goto out;
4401                 status = nfs4_check_openmode(stp, flags);
4402                 if (status)
4403                         goto out;
4404                 if (filpp) {
4405                         struct nfs4_file *fp = stp->st_stid.sc_file;
4406
4407                         if (flags & RD_STATE)
4408                                 file = find_readable_file(fp);
4409                         else
4410                                 file = find_writeable_file(fp);
4411                 }
4412                 break;
4413         default:
4414                 status = nfserr_bad_stateid;
4415                 goto out;
4416         }
4417         status = nfs_ok;
4418         if (file)
4419                 *filpp = file;
4420 out:
4421         nfs4_put_stid(s);
4422 unlock_state:
4423         nfs4_unlock_state();
4424         return status;
4425 }
4426
4427 /*
4428  * Test if the stateid is valid
4429  */
4430 __be32
4431 nfsd4_test_stateid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
4432                    struct nfsd4_test_stateid *test_stateid)
4433 {
4434         struct nfsd4_test_stateid_id *stateid;
4435         struct nfs4_client *cl = cstate->session->se_client;
4436
4437         nfs4_lock_state();
4438         list_for_each_entry(stateid, &test_stateid->ts_stateid_list, ts_id_list)
4439                 stateid->ts_id_status =
4440                         nfsd4_validate_stateid(cl, &stateid->ts_id_stateid);
4441         nfs4_unlock_state();
4442
4443         return nfs_ok;
4444 }
4445
4446 __be32
4447 nfsd4_free_stateid(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
4448                    struct nfsd4_free_stateid *free_stateid)
4449 {
4450         stateid_t *stateid = &free_stateid->fr_stateid;
4451         struct nfs4_stid *s;
4452         struct nfs4_delegation *dp;
4453         struct nfs4_ol_stateid *stp;
4454         struct nfs4_client *cl = cstate->session->se_client;
4455         __be32 ret = nfserr_bad_stateid;
4456
4457         nfs4_lock_state();
4458         spin_lock(&cl->cl_lock);
4459         s = find_stateid_locked(cl, stateid);
4460         if (!s)
4461                 goto out_unlock;
4462         switch (s->sc_type) {
4463         case NFS4_DELEG_STID:
4464                 ret = nfserr_locks_held;
4465                 break;
4466         case NFS4_OPEN_STID:
4467                 ret = check_stateid_generation(stateid, &s->sc_stateid, 1);
4468                 if (ret)
4469                         break;
4470                 ret = nfserr_locks_held;
4471                 break;
4472         case NFS4_LOCK_STID:
4473                 ret = check_stateid_generation(stateid, &s->sc_stateid, 1);
4474                 if (ret)
4475                         break;
4476                 stp = openlockstateid(s);
4477                 ret = nfserr_locks_held;
4478                 if (check_for_locks(stp->st_stid.sc_file,
4479                                     lockowner(stp->st_stateowner)))
4480                         break;
4481                 unhash_lock_stateid(stp);
4482                 spin_unlock(&cl->cl_lock);
4483                 nfs4_put_stid(s);
4484                 ret = nfs_ok;
4485                 goto out;
4486         case NFS4_REVOKED_DELEG_STID:
4487                 dp = delegstateid(s);
4488                 list_del_init(&dp->dl_recall_lru);
4489                 spin_unlock(&cl->cl_lock);
4490                 nfs4_put_stid(s);
4491                 ret = nfs_ok;
4492                 goto out;
4493         /* Default falls through and returns nfserr_bad_stateid */
4494         }
4495 out_unlock:
4496         spin_unlock(&cl->cl_lock);
4497 out:
4498         nfs4_unlock_state();
4499         return ret;
4500 }
4501
4502 static inline int
4503 setlkflg (int type)
4504 {
4505         return (type == NFS4_READW_LT || type == NFS4_READ_LT) ?
4506                 RD_STATE : WR_STATE;
4507 }
4508
4509 static __be32 nfs4_seqid_op_checks(struct nfsd4_compound_state *cstate, stateid_t *stateid, u32 seqid, struct nfs4_ol_stateid *stp)
4510 {
4511         struct svc_fh *current_fh = &cstate->current_fh;
4512         struct nfs4_stateowner *sop = stp->st_stateowner;
4513         __be32 status;
4514
4515         status = nfsd4_check_seqid(cstate, sop, seqid);
4516         if (status)
4517                 return status;
4518         if (stp->st_stid.sc_type == NFS4_CLOSED_STID
4519                 || stp->st_stid.sc_type == NFS4_REVOKED_DELEG_STID)
4520                 /*
4521                  * "Closed" stateid's exist *only* to return
4522                  * nfserr_replay_me from the previous step, and
4523                  * revoked delegations are kept only for free_stateid.
4524                  */
4525                 return nfserr_bad_stateid;
4526         status = check_stateid_generation(stateid, &stp->st_stid.sc_stateid, nfsd4_has_session(cstate));
4527         if (status)
4528                 return status;
4529         return nfs4_check_fh(current_fh, stp);
4530 }
4531
4532 /* 
4533  * Checks for sequence id mutating operations. 
4534  */
4535 static __be32
4536 nfs4_preprocess_seqid_op(struct nfsd4_compound_state *cstate, u32 seqid,
4537                          stateid_t *stateid, char typemask,
4538                          struct nfs4_ol_stateid **stpp,
4539                          struct nfsd_net *nn)
4540 {
4541         __be32 status;
4542         struct nfs4_stid *s;
4543         struct nfs4_ol_stateid *stp = NULL;
4544
4545         dprintk("NFSD: %s: seqid=%d stateid = " STATEID_FMT "\n", __func__,
4546                 seqid, STATEID_VAL(stateid));
4547
4548         *stpp = NULL;
4549         status = nfsd4_lookup_stateid(cstate, stateid, typemask, &s, nn);
4550         if (status)
4551                 return status;
4552         stp = openlockstateid(s);
4553         nfsd4_cstate_assign_replay(cstate, stp->st_stateowner);
4554
4555         status = nfs4_seqid_op_checks(cstate, stateid, seqid, stp);
4556         if (!status)
4557                 *stpp = stp;
4558         else
4559                 nfs4_put_stid(&stp->st_stid);
4560         return status;
4561 }
4562
4563 static __be32 nfs4_preprocess_confirmed_seqid_op(struct nfsd4_compound_state *cstate, u32 seqid,
4564                                                  stateid_t *stateid, struct nfs4_ol_stateid **stpp, struct nfsd_net *nn)
4565 {
4566         __be32 status;
4567         struct nfs4_openowner *oo;
4568         struct nfs4_ol_stateid *stp;
4569
4570         status = nfs4_preprocess_seqid_op(cstate, seqid, stateid,
4571                                                 NFS4_OPEN_STID, &stp, nn);
4572         if (status)
4573                 return status;
4574         oo = openowner(stp->st_stateowner);
4575         if (!(oo->oo_flags & NFS4_OO_CONFIRMED)) {
4576                 nfs4_put_stid(&stp->st_stid);
4577                 return nfserr_bad_stateid;
4578         }
4579         *stpp = stp;
4580         return nfs_ok;
4581 }
4582
4583 __be32
4584 nfsd4_open_confirm(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
4585                    struct nfsd4_open_confirm *oc)
4586 {
4587         __be32 status;
4588         struct nfs4_openowner *oo;
4589         struct nfs4_ol_stateid *stp;
4590         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
4591
4592         dprintk("NFSD: nfsd4_open_confirm on file %pd\n",
4593                         cstate->current_fh.fh_dentry);
4594
4595         status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0);
4596         if (status)
4597                 return status;
4598
4599         nfs4_lock_state();
4600
4601         status = nfs4_preprocess_seqid_op(cstate,
4602                                         oc->oc_seqid, &oc->oc_req_stateid,
4603                                         NFS4_OPEN_STID, &stp, nn);
4604         if (status)
4605                 goto out;
4606         oo = openowner(stp->st_stateowner);
4607         status = nfserr_bad_stateid;
4608         if (oo->oo_flags & NFS4_OO_CONFIRMED)
4609                 goto put_stateid;
4610         oo->oo_flags |= NFS4_OO_CONFIRMED;
4611         update_stateid(&stp->st_stid.sc_stateid);
4612         memcpy(&oc->oc_resp_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
4613         dprintk("NFSD: %s: success, seqid=%d stateid=" STATEID_FMT "\n",
4614                 __func__, oc->oc_seqid, STATEID_VAL(&stp->st_stid.sc_stateid));
4615
4616         nfsd4_client_record_create(oo->oo_owner.so_client);
4617         status = nfs_ok;
4618 put_stateid:
4619         nfs4_put_stid(&stp->st_stid);
4620 out:
4621         nfsd4_bump_seqid(cstate, status);
4622         nfs4_unlock_state();
4623         return status;
4624 }
4625
4626 static inline void nfs4_stateid_downgrade_bit(struct nfs4_ol_stateid *stp, u32 access)
4627 {
4628         if (!test_access(access, stp))
4629                 return;
4630         nfs4_file_put_access(stp->st_stid.sc_file, access);
4631         clear_access(access, stp);
4632 }
4633
4634 static inline void nfs4_stateid_downgrade(struct nfs4_ol_stateid *stp, u32 to_access)
4635 {
4636         switch (to_access) {
4637         case NFS4_SHARE_ACCESS_READ:
4638                 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_WRITE);
4639                 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_BOTH);
4640                 break;
4641         case NFS4_SHARE_ACCESS_WRITE:
4642                 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_READ);
4643                 nfs4_stateid_downgrade_bit(stp, NFS4_SHARE_ACCESS_BOTH);
4644                 break;
4645         case NFS4_SHARE_ACCESS_BOTH:
4646                 break;
4647         default:
4648                 WARN_ON_ONCE(1);
4649         }
4650 }
4651
4652 __be32
4653 nfsd4_open_downgrade(struct svc_rqst *rqstp,
4654                      struct nfsd4_compound_state *cstate,
4655                      struct nfsd4_open_downgrade *od)
4656 {
4657         __be32 status;
4658         struct nfs4_ol_stateid *stp;
4659         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
4660
4661         dprintk("NFSD: nfsd4_open_downgrade on file %pd\n", 
4662                         cstate->current_fh.fh_dentry);
4663
4664         /* We don't yet support WANT bits: */
4665         if (od->od_deleg_want)
4666                 dprintk("NFSD: %s: od_deleg_want=0x%x ignored\n", __func__,
4667                         od->od_deleg_want);
4668
4669         nfs4_lock_state();
4670         status = nfs4_preprocess_confirmed_seqid_op(cstate, od->od_seqid,
4671                                         &od->od_stateid, &stp, nn);
4672         if (status)
4673                 goto out; 
4674         status = nfserr_inval;
4675         if (!test_access(od->od_share_access, stp)) {
4676                 dprintk("NFSD: access not a subset of current bitmap: 0x%hhx, input access=%08x\n",
4677                         stp->st_access_bmap, od->od_share_access);
4678                 goto put_stateid;
4679         }
4680         if (!test_deny(od->od_share_deny, stp)) {
4681                 dprintk("NFSD: deny not a subset of current bitmap: 0x%hhx, input deny=%08x\n",
4682                         stp->st_deny_bmap, od->od_share_deny);
4683                 goto put_stateid;
4684         }
4685         nfs4_stateid_downgrade(stp, od->od_share_access);
4686
4687         reset_union_bmap_deny(od->od_share_deny, stp);
4688
4689         update_stateid(&stp->st_stid.sc_stateid);
4690         memcpy(&od->od_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
4691         status = nfs_ok;
4692 put_stateid:
4693         nfs4_put_stid(&stp->st_stid);
4694 out:
4695         nfsd4_bump_seqid(cstate, status);
4696         nfs4_unlock_state();
4697         return status;
4698 }
4699
4700 static void nfsd4_close_open_stateid(struct nfs4_ol_stateid *s)
4701 {
4702         struct nfs4_client *clp = s->st_stid.sc_client;
4703         LIST_HEAD(reaplist);
4704
4705         s->st_stid.sc_type = NFS4_CLOSED_STID;
4706         spin_lock(&clp->cl_lock);
4707         unhash_open_stateid(s, &reaplist);
4708
4709         if (clp->cl_minorversion) {
4710                 put_ol_stateid_locked(s, &reaplist);
4711                 spin_unlock(&clp->cl_lock);
4712                 free_ol_stateid_reaplist(&reaplist);
4713         } else {
4714                 spin_unlock(&clp->cl_lock);
4715                 free_ol_stateid_reaplist(&reaplist);
4716                 move_to_close_lru(s, clp->net);
4717         }
4718 }
4719
4720 /*
4721  * nfs4_unlock_state() called after encode
4722  */
4723 __be32
4724 nfsd4_close(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
4725             struct nfsd4_close *close)
4726 {
4727         __be32 status;
4728         struct nfs4_ol_stateid *stp;
4729         struct net *net = SVC_NET(rqstp);
4730         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
4731
4732         dprintk("NFSD: nfsd4_close on file %pd\n", 
4733                         cstate->current_fh.fh_dentry);
4734
4735         nfs4_lock_state();
4736         status = nfs4_preprocess_seqid_op(cstate, close->cl_seqid,
4737                                         &close->cl_stateid,
4738                                         NFS4_OPEN_STID|NFS4_CLOSED_STID,
4739                                         &stp, nn);
4740         nfsd4_bump_seqid(cstate, status);
4741         if (status)
4742                 goto out; 
4743         update_stateid(&stp->st_stid.sc_stateid);
4744         memcpy(&close->cl_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
4745
4746         nfsd4_close_open_stateid(stp);
4747
4748         /* put reference from nfs4_preprocess_seqid_op */
4749         nfs4_put_stid(&stp->st_stid);
4750 out:
4751         nfs4_unlock_state();
4752         return status;
4753 }
4754
4755 __be32
4756 nfsd4_delegreturn(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
4757                   struct nfsd4_delegreturn *dr)
4758 {
4759         struct nfs4_delegation *dp;
4760         stateid_t *stateid = &dr->dr_stateid;
4761         struct nfs4_stid *s;
4762         __be32 status;
4763         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
4764
4765         if ((status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0)))
4766                 return status;
4767
4768         nfs4_lock_state();
4769         status = nfsd4_lookup_stateid(cstate, stateid, NFS4_DELEG_STID, &s, nn);
4770         if (status)
4771                 goto out;
4772         dp = delegstateid(s);
4773         status = check_stateid_generation(stateid, &dp->dl_stid.sc_stateid, nfsd4_has_session(cstate));
4774         if (status)
4775                 goto put_stateid;
4776
4777         destroy_delegation(dp);
4778 put_stateid:
4779         nfs4_put_stid(&dp->dl_stid);
4780 out:
4781         nfs4_unlock_state();
4782
4783         return status;
4784 }
4785
4786
4787 #define LOFF_OVERFLOW(start, len)      ((u64)(len) > ~(u64)(start))
4788
4789 static inline u64
4790 end_offset(u64 start, u64 len)
4791 {
4792         u64 end;
4793
4794         end = start + len;
4795         return end >= start ? end: NFS4_MAX_UINT64;
4796 }
4797
4798 /* last octet in a range */
4799 static inline u64
4800 last_byte_offset(u64 start, u64 len)
4801 {
4802         u64 end;
4803
4804         WARN_ON_ONCE(!len);
4805         end = start + len;
4806         return end > start ? end - 1: NFS4_MAX_UINT64;
4807 }
4808
4809 /*
4810  * TODO: Linux file offsets are _signed_ 64-bit quantities, which means that
4811  * we can't properly handle lock requests that go beyond the (2^63 - 1)-th
4812  * byte, because of sign extension problems.  Since NFSv4 calls for 64-bit
4813  * locking, this prevents us from being completely protocol-compliant.  The
4814  * real solution to this problem is to start using unsigned file offsets in
4815  * the VFS, but this is a very deep change!
4816  */
4817 static inline void
4818 nfs4_transform_lock_offset(struct file_lock *lock)
4819 {
4820         if (lock->fl_start < 0)
4821                 lock->fl_start = OFFSET_MAX;
4822         if (lock->fl_end < 0)
4823                 lock->fl_end = OFFSET_MAX;
4824 }
4825
4826 /* Hack!: For now, we're defining this just so we can use a pointer to it
4827  * as a unique cookie to identify our (NFSv4's) posix locks. */
4828 static const struct lock_manager_operations nfsd_posix_mng_ops  = {
4829 };
4830
4831 static inline void
4832 nfs4_set_lock_denied(struct file_lock *fl, struct nfsd4_lock_denied *deny)
4833 {
4834         struct nfs4_lockowner *lo;
4835
4836         if (fl->fl_lmops == &nfsd_posix_mng_ops) {
4837                 lo = (struct nfs4_lockowner *) fl->fl_owner;
4838                 deny->ld_owner.data = kmemdup(lo->lo_owner.so_owner.data,
4839                                         lo->lo_owner.so_owner.len, GFP_KERNEL);
4840                 if (!deny->ld_owner.data)
4841                         /* We just don't care that much */
4842                         goto nevermind;
4843                 deny->ld_owner.len = lo->lo_owner.so_owner.len;
4844                 deny->ld_clientid = lo->lo_owner.so_client->cl_clientid;
4845         } else {
4846 nevermind:
4847                 deny->ld_owner.len = 0;
4848                 deny->ld_owner.data = NULL;
4849                 deny->ld_clientid.cl_boot = 0;
4850                 deny->ld_clientid.cl_id = 0;
4851         }
4852         deny->ld_start = fl->fl_start;
4853         deny->ld_length = NFS4_MAX_UINT64;
4854         if (fl->fl_end != NFS4_MAX_UINT64)
4855                 deny->ld_length = fl->fl_end - fl->fl_start + 1;        
4856         deny->ld_type = NFS4_READ_LT;
4857         if (fl->fl_type != F_RDLCK)
4858                 deny->ld_type = NFS4_WRITE_LT;
4859 }
4860
4861 static struct nfs4_lockowner *
4862 find_lockowner_str_locked(clientid_t *clid, struct xdr_netobj *owner,
4863                 struct nfs4_client *clp)
4864 {
4865         unsigned int strhashval = ownerstr_hashval(owner);
4866         struct nfs4_stateowner *so;
4867
4868         list_for_each_entry(so, &clp->cl_ownerstr_hashtbl[strhashval],
4869                             so_strhash) {
4870                 if (so->so_is_open_owner)
4871                         continue;
4872                 if (!same_owner_str(so, owner))
4873                         continue;
4874                 atomic_inc(&so->so_count);
4875                 return lockowner(so);
4876         }
4877         return NULL;
4878 }
4879
4880 static struct nfs4_lockowner *
4881 find_lockowner_str(clientid_t *clid, struct xdr_netobj *owner,
4882                 struct nfs4_client *clp)
4883 {
4884         struct nfs4_lockowner *lo;
4885
4886         spin_lock(&clp->cl_lock);
4887         lo = find_lockowner_str_locked(clid, owner, clp);
4888         spin_unlock(&clp->cl_lock);
4889         return lo;
4890 }
4891
4892 static void nfs4_unhash_lockowner(struct nfs4_stateowner *sop)
4893 {
4894         unhash_lockowner_locked(lockowner(sop));
4895 }
4896
4897 static void nfs4_free_lockowner(struct nfs4_stateowner *sop)
4898 {
4899         struct nfs4_lockowner *lo = lockowner(sop);
4900
4901         kmem_cache_free(lockowner_slab, lo);
4902 }
4903
4904 static const struct nfs4_stateowner_operations lockowner_ops = {
4905         .so_unhash =    nfs4_unhash_lockowner,
4906         .so_free =      nfs4_free_lockowner,
4907 };
4908
4909 /*
4910  * Alloc a lock owner structure.
4911  * Called in nfsd4_lock - therefore, OPEN and OPEN_CONFIRM (if needed) has 
4912  * occurred. 
4913  *
4914  * strhashval = ownerstr_hashval
4915  */
4916 static struct nfs4_lockowner *
4917 alloc_init_lock_stateowner(unsigned int strhashval, struct nfs4_client *clp,
4918                            struct nfs4_ol_stateid *open_stp,
4919                            struct nfsd4_lock *lock)
4920 {
4921         struct nfs4_lockowner *lo, *ret;
4922
4923         lo = alloc_stateowner(lockowner_slab, &lock->lk_new_owner, clp);
4924         if (!lo)
4925                 return NULL;
4926         INIT_LIST_HEAD(&lo->lo_owner.so_stateids);
4927         lo->lo_owner.so_is_open_owner = 0;
4928         lo->lo_owner.so_seqid = lock->lk_new_lock_seqid;
4929         lo->lo_owner.so_ops = &lockowner_ops;
4930         spin_lock(&clp->cl_lock);
4931         ret = find_lockowner_str_locked(&clp->cl_clientid,
4932                         &lock->lk_new_owner, clp);
4933         if (ret == NULL) {
4934                 list_add(&lo->lo_owner.so_strhash,
4935                          &clp->cl_ownerstr_hashtbl[strhashval]);
4936                 ret = lo;
4937         } else
4938                 nfs4_free_lockowner(&lo->lo_owner);
4939         spin_unlock(&clp->cl_lock);
4940         return lo;
4941 }
4942
4943 static void
4944 init_lock_stateid(struct nfs4_ol_stateid *stp, struct nfs4_lockowner *lo,
4945                   struct nfs4_file *fp, struct inode *inode,
4946                   struct nfs4_ol_stateid *open_stp)
4947 {
4948         struct nfs4_client *clp = lo->lo_owner.so_client;
4949
4950         lockdep_assert_held(&clp->cl_lock);
4951
4952         atomic_inc(&stp->st_stid.sc_count);
4953         stp->st_stid.sc_type = NFS4_LOCK_STID;
4954         stp->st_stateowner = &lo->lo_owner;
4955         atomic_inc(&lo->lo_owner.so_count);
4956         get_nfs4_file(fp);
4957         stp->st_stid.sc_file = fp;
4958         stp->st_stid.sc_free = nfs4_free_lock_stateid;
4959         stp->st_access_bmap = 0;
4960         stp->st_deny_bmap = open_stp->st_deny_bmap;
4961         stp->st_openstp = open_stp;
4962         list_add(&stp->st_locks, &open_stp->st_locks);
4963         list_add(&stp->st_perstateowner, &lo->lo_owner.so_stateids);
4964         spin_lock(&fp->fi_lock);
4965         list_add(&stp->st_perfile, &fp->fi_stateids);
4966         spin_unlock(&fp->fi_lock);
4967 }
4968
4969 static struct nfs4_ol_stateid *
4970 find_lock_stateid(struct nfs4_lockowner *lo, struct nfs4_file *fp)
4971 {
4972         struct nfs4_ol_stateid *lst;
4973         struct nfs4_client *clp = lo->lo_owner.so_client;
4974
4975         lockdep_assert_held(&clp->cl_lock);
4976
4977         list_for_each_entry(lst, &lo->lo_owner.so_stateids, st_perstateowner) {
4978                 if (lst->st_stid.sc_file == fp) {
4979                         atomic_inc(&lst->st_stid.sc_count);
4980                         return lst;
4981                 }
4982         }
4983         return NULL;
4984 }
4985
4986 static struct nfs4_ol_stateid *
4987 find_or_create_lock_stateid(struct nfs4_lockowner *lo, struct nfs4_file *fi,
4988                             struct inode *inode, struct nfs4_ol_stateid *ost,
4989                             bool *new)
4990 {
4991         struct nfs4_stid *ns = NULL;
4992         struct nfs4_ol_stateid *lst;
4993         struct nfs4_openowner *oo = openowner(ost->st_stateowner);
4994         struct nfs4_client *clp = oo->oo_owner.so_client;
4995
4996         spin_lock(&clp->cl_lock);
4997         lst = find_lock_stateid(lo, fi);
4998         if (lst == NULL) {
4999                 spin_unlock(&clp->cl_lock);
5000                 ns = nfs4_alloc_stid(clp, stateid_slab);
5001                 if (ns == NULL)
5002                         return NULL;
5003
5004                 spin_lock(&clp->cl_lock);
5005                 lst = find_lock_stateid(lo, fi);
5006                 if (likely(!lst)) {
5007                         lst = openlockstateid(ns);
5008                         init_lock_stateid(lst, lo, fi, inode, ost);
5009                         ns = NULL;
5010                         *new = true;
5011                 }
5012         }
5013         spin_unlock(&clp->cl_lock);
5014         if (ns)
5015                 nfs4_put_stid(ns);
5016         return lst;
5017 }
5018
5019 static int
5020 check_lock_length(u64 offset, u64 length)
5021 {
5022         return ((length == 0)  || ((length != NFS4_MAX_UINT64) &&
5023              LOFF_OVERFLOW(offset, length)));
5024 }
5025
5026 static void get_lock_access(struct nfs4_ol_stateid *lock_stp, u32 access)
5027 {
5028         struct nfs4_file *fp = lock_stp->st_stid.sc_file;
5029
5030         lockdep_assert_held(&fp->fi_lock);
5031
5032         if (test_access(access, lock_stp))
5033                 return;
5034         __nfs4_file_get_access(fp, access);
5035         set_access(access, lock_stp);
5036 }
5037
5038 static __be32
5039 lookup_or_create_lock_state(struct nfsd4_compound_state *cstate,
5040                             struct nfs4_ol_stateid *ost,
5041                             struct nfsd4_lock *lock,
5042                             struct nfs4_ol_stateid **lst, bool *new)
5043 {
5044         __be32 status;
5045         struct nfs4_file *fi = ost->st_stid.sc_file;
5046         struct nfs4_openowner *oo = openowner(ost->st_stateowner);
5047         struct nfs4_client *cl = oo->oo_owner.so_client;
5048         struct inode *inode = cstate->current_fh.fh_dentry->d_inode;
5049         struct nfs4_lockowner *lo;
5050         unsigned int strhashval;
5051
5052         lo = find_lockowner_str(&cl->cl_clientid, &lock->v.new.owner, cl);
5053         if (!lo) {
5054                 strhashval = ownerstr_hashval(&lock->v.new.owner);
5055                 lo = alloc_init_lock_stateowner(strhashval, cl, ost, lock);
5056                 if (lo == NULL)
5057                         return nfserr_jukebox;
5058         } else {
5059                 /* with an existing lockowner, seqids must be the same */
5060                 status = nfserr_bad_seqid;
5061                 if (!cstate->minorversion &&
5062                     lock->lk_new_lock_seqid != lo->lo_owner.so_seqid)
5063                         goto out;
5064         }
5065
5066         *lst = find_or_create_lock_stateid(lo, fi, inode, ost, new);
5067         if (*lst == NULL) {
5068                 status = nfserr_jukebox;
5069                 goto out;
5070         }
5071         status = nfs_ok;
5072 out:
5073         nfs4_put_stateowner(&lo->lo_owner);
5074         return status;
5075 }
5076
5077 /*
5078  *  LOCK operation 
5079  */
5080 __be32
5081 nfsd4_lock(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
5082            struct nfsd4_lock *lock)
5083 {
5084         struct nfs4_openowner *open_sop = NULL;
5085         struct nfs4_lockowner *lock_sop = NULL;
5086         struct nfs4_ol_stateid *lock_stp = NULL;
5087         struct nfs4_ol_stateid *open_stp = NULL;
5088         struct nfs4_file *fp;
5089         struct file *filp = NULL;
5090         struct file_lock *file_lock = NULL;
5091         struct file_lock *conflock = NULL;
5092         __be32 status = 0;
5093         int lkflg;
5094         int err;
5095         bool new = false;
5096         struct net *net = SVC_NET(rqstp);
5097         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
5098
5099         dprintk("NFSD: nfsd4_lock: start=%Ld length=%Ld\n",
5100                 (long long) lock->lk_offset,
5101                 (long long) lock->lk_length);
5102
5103         if (check_lock_length(lock->lk_offset, lock->lk_length))
5104                  return nfserr_inval;
5105
5106         if ((status = fh_verify(rqstp, &cstate->current_fh,
5107                                 S_IFREG, NFSD_MAY_LOCK))) {
5108                 dprintk("NFSD: nfsd4_lock: permission denied!\n");
5109                 return status;
5110         }
5111
5112         nfs4_lock_state();
5113
5114         if (lock->lk_is_new) {
5115                 if (nfsd4_has_session(cstate))
5116                         /* See rfc 5661 18.10.3: given clientid is ignored: */
5117                         memcpy(&lock->v.new.clientid,
5118                                 &cstate->session->se_client->cl_clientid,
5119                                 sizeof(clientid_t));
5120
5121                 status = nfserr_stale_clientid;
5122                 if (STALE_CLIENTID(&lock->lk_new_clientid, nn))
5123                         goto out;
5124
5125                 /* validate and update open stateid and open seqid */
5126                 status = nfs4_preprocess_confirmed_seqid_op(cstate,
5127                                         lock->lk_new_open_seqid,
5128                                         &lock->lk_new_open_stateid,
5129                                         &open_stp, nn);
5130                 if (status)
5131                         goto out;
5132                 open_sop = openowner(open_stp->st_stateowner);
5133                 status = nfserr_bad_stateid;
5134                 if (!same_clid(&open_sop->oo_owner.so_client->cl_clientid,
5135                                                 &lock->v.new.clientid))
5136                         goto out;
5137                 status = lookup_or_create_lock_state(cstate, open_stp, lock,
5138                                                         &lock_stp, &new);
5139         } else {
5140                 status = nfs4_preprocess_seqid_op(cstate,
5141                                        lock->lk_old_lock_seqid,
5142                                        &lock->lk_old_lock_stateid,
5143                                        NFS4_LOCK_STID, &lock_stp, nn);
5144         }
5145         if (status)
5146                 goto out;
5147         lock_sop = lockowner(lock_stp->st_stateowner);
5148
5149         lkflg = setlkflg(lock->lk_type);
5150         status = nfs4_check_openmode(lock_stp, lkflg);
5151         if (status)
5152                 goto out;
5153
5154         status = nfserr_grace;
5155         if (locks_in_grace(net) && !lock->lk_reclaim)
5156                 goto out;
5157         status = nfserr_no_grace;
5158         if (!locks_in_grace(net) && lock->lk_reclaim)
5159                 goto out;
5160
5161         file_lock = locks_alloc_lock();
5162         if (!file_lock) {
5163                 dprintk("NFSD: %s: unable to allocate lock!\n", __func__);
5164                 status = nfserr_jukebox;
5165                 goto out;
5166         }
5167
5168         fp = lock_stp->st_stid.sc_file;
5169         locks_init_lock(file_lock);
5170         switch (lock->lk_type) {
5171                 case NFS4_READ_LT:
5172                 case NFS4_READW_LT:
5173                         spin_lock(&fp->fi_lock);
5174                         filp = find_readable_file_locked(fp);
5175                         if (filp)
5176                                 get_lock_access(lock_stp, NFS4_SHARE_ACCESS_READ);
5177                         spin_unlock(&fp->fi_lock);
5178                         file_lock->fl_type = F_RDLCK;
5179                         break;
5180                 case NFS4_WRITE_LT:
5181                 case NFS4_WRITEW_LT:
5182                         spin_lock(&fp->fi_lock);
5183                         filp = find_writeable_file_locked(fp);
5184                         if (filp)
5185                                 get_lock_access(lock_stp, NFS4_SHARE_ACCESS_WRITE);
5186                         spin_unlock(&fp->fi_lock);
5187                         file_lock->fl_type = F_WRLCK;
5188                         break;
5189                 default:
5190                         status = nfserr_inval;
5191                 goto out;
5192         }
5193         if (!filp) {
5194                 status = nfserr_openmode;
5195                 goto out;
5196         }
5197         file_lock->fl_owner = (fl_owner_t)lock_sop;
5198         file_lock->fl_pid = current->tgid;
5199         file_lock->fl_file = filp;
5200         file_lock->fl_flags = FL_POSIX;
5201         file_lock->fl_lmops = &nfsd_posix_mng_ops;
5202         file_lock->fl_start = lock->lk_offset;
5203         file_lock->fl_end = last_byte_offset(lock->lk_offset, lock->lk_length);
5204         nfs4_transform_lock_offset(file_lock);
5205
5206         conflock = locks_alloc_lock();
5207         if (!conflock) {
5208                 dprintk("NFSD: %s: unable to allocate lock!\n", __func__);
5209                 status = nfserr_jukebox;
5210                 goto out;
5211         }
5212
5213         err = vfs_lock_file(filp, F_SETLK, file_lock, conflock);
5214         switch (-err) {
5215         case 0: /* success! */
5216                 update_stateid(&lock_stp->st_stid.sc_stateid);
5217                 memcpy(&lock->lk_resp_stateid, &lock_stp->st_stid.sc_stateid, 
5218                                 sizeof(stateid_t));
5219                 status = 0;
5220                 break;
5221         case (EAGAIN):          /* conflock holds conflicting lock */
5222                 status = nfserr_denied;
5223                 dprintk("NFSD: nfsd4_lock: conflicting lock found!\n");
5224                 nfs4_set_lock_denied(conflock, &lock->lk_denied);
5225                 break;
5226         case (EDEADLK):
5227                 status = nfserr_deadlock;
5228                 break;
5229         default:
5230                 dprintk("NFSD: nfsd4_lock: vfs_lock_file() failed! status %d\n",err);
5231                 status = nfserrno(err);
5232                 break;
5233         }
5234 out:
5235         if (filp)
5236                 fput(filp);
5237         if (lock_stp) {
5238                 /* Bump seqid manually if the 4.0 replay owner is openowner */
5239                 if (cstate->replay_owner &&
5240                     cstate->replay_owner != &lock_sop->lo_owner &&
5241                     seqid_mutating_err(ntohl(status)))
5242                         lock_sop->lo_owner.so_seqid++;
5243
5244                 /*
5245                  * If this is a new, never-before-used stateid, and we are
5246                  * returning an error, then just go ahead and release it.
5247                  */
5248                 if (status && new)
5249                         release_lock_stateid(lock_stp);
5250
5251                 nfs4_put_stid(&lock_stp->st_stid);
5252         }
5253         if (open_stp)
5254                 nfs4_put_stid(&open_stp->st_stid);
5255         nfsd4_bump_seqid(cstate, status);
5256         nfs4_unlock_state();
5257         if (file_lock)
5258                 locks_free_lock(file_lock);
5259         if (conflock)
5260                 locks_free_lock(conflock);
5261         return status;
5262 }
5263
5264 /*
5265  * The NFSv4 spec allows a client to do a LOCKT without holding an OPEN,
5266  * so we do a temporary open here just to get an open file to pass to
5267  * vfs_test_lock.  (Arguably perhaps test_lock should be done with an
5268  * inode operation.)
5269  */
5270 static __be32 nfsd_test_lock(struct svc_rqst *rqstp, struct svc_fh *fhp, struct file_lock *lock)
5271 {
5272         struct file *file;
5273         __be32 err = nfsd_open(rqstp, fhp, S_IFREG, NFSD_MAY_READ, &file);
5274         if (!err) {
5275                 err = nfserrno(vfs_test_lock(file, lock));
5276                 nfsd_close(file);
5277         }
5278         return err;
5279 }
5280
5281 /*
5282  * LOCKT operation
5283  */
5284 __be32
5285 nfsd4_lockt(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
5286             struct nfsd4_lockt *lockt)
5287 {
5288         struct file_lock *file_lock = NULL;
5289         struct nfs4_lockowner *lo = NULL;
5290         __be32 status;
5291         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
5292
5293         if (locks_in_grace(SVC_NET(rqstp)))
5294                 return nfserr_grace;
5295
5296         if (check_lock_length(lockt->lt_offset, lockt->lt_length))
5297                  return nfserr_inval;
5298
5299         nfs4_lock_state();
5300
5301         if (!nfsd4_has_session(cstate)) {
5302                 status = lookup_clientid(&lockt->lt_clientid, cstate, nn);
5303                 if (status)
5304                         goto out;
5305         }
5306
5307         if ((status = fh_verify(rqstp, &cstate->current_fh, S_IFREG, 0)))
5308                 goto out;
5309
5310         file_lock = locks_alloc_lock();
5311         if (!file_lock) {
5312                 dprintk("NFSD: %s: unable to allocate lock!\n", __func__);
5313                 status = nfserr_jukebox;
5314                 goto out;
5315         }
5316         locks_init_lock(file_lock);
5317         switch (lockt->lt_type) {
5318                 case NFS4_READ_LT:
5319                 case NFS4_READW_LT:
5320                         file_lock->fl_type = F_RDLCK;
5321                 break;
5322                 case NFS4_WRITE_LT:
5323                 case NFS4_WRITEW_LT:
5324                         file_lock->fl_type = F_WRLCK;
5325                 break;
5326                 default:
5327                         dprintk("NFSD: nfs4_lockt: bad lock type!\n");
5328                         status = nfserr_inval;
5329                 goto out;
5330         }
5331
5332         lo = find_lockowner_str(&lockt->lt_clientid, &lockt->lt_owner,
5333                                 cstate->clp);
5334         if (lo)
5335                 file_lock->fl_owner = (fl_owner_t)lo;
5336         file_lock->fl_pid = current->tgid;
5337         file_lock->fl_flags = FL_POSIX;
5338
5339         file_lock->fl_start = lockt->lt_offset;
5340         file_lock->fl_end = last_byte_offset(lockt->lt_offset, lockt->lt_length);
5341
5342         nfs4_transform_lock_offset(file_lock);
5343
5344         status = nfsd_test_lock(rqstp, &cstate->current_fh, file_lock);
5345         if (status)
5346                 goto out;
5347
5348         if (file_lock->fl_type != F_UNLCK) {
5349                 status = nfserr_denied;
5350                 nfs4_set_lock_denied(file_lock, &lockt->lt_denied);
5351         }
5352 out:
5353         if (lo)
5354                 nfs4_put_stateowner(&lo->lo_owner);
5355         nfs4_unlock_state();
5356         if (file_lock)
5357                 locks_free_lock(file_lock);
5358         return status;
5359 }
5360
5361 __be32
5362 nfsd4_locku(struct svc_rqst *rqstp, struct nfsd4_compound_state *cstate,
5363             struct nfsd4_locku *locku)
5364 {
5365         struct nfs4_ol_stateid *stp;
5366         struct file *filp = NULL;
5367         struct file_lock *file_lock = NULL;
5368         __be32 status;
5369         int err;
5370         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
5371
5372         dprintk("NFSD: nfsd4_locku: start=%Ld length=%Ld\n",
5373                 (long long) locku->lu_offset,
5374                 (long long) locku->lu_length);
5375
5376         if (check_lock_length(locku->lu_offset, locku->lu_length))
5377                  return nfserr_inval;
5378
5379         nfs4_lock_state();
5380                                                                                 
5381         status = nfs4_preprocess_seqid_op(cstate, locku->lu_seqid,
5382                                         &locku->lu_stateid, NFS4_LOCK_STID,
5383                                         &stp, nn);
5384         if (status)
5385                 goto out;
5386         filp = find_any_file(stp->st_stid.sc_file);
5387         if (!filp) {
5388                 status = nfserr_lock_range;
5389                 goto put_stateid;
5390         }
5391         file_lock = locks_alloc_lock();
5392         if (!file_lock) {
5393                 dprintk("NFSD: %s: unable to allocate lock!\n", __func__);
5394                 status = nfserr_jukebox;
5395                 goto fput;
5396         }
5397         locks_init_lock(file_lock);
5398         file_lock->fl_type = F_UNLCK;
5399         file_lock->fl_owner = (fl_owner_t)lockowner(stp->st_stateowner);
5400         file_lock->fl_pid = current->tgid;
5401         file_lock->fl_file = filp;
5402         file_lock->fl_flags = FL_POSIX;
5403         file_lock->fl_lmops = &nfsd_posix_mng_ops;
5404         file_lock->fl_start = locku->lu_offset;
5405
5406         file_lock->fl_end = last_byte_offset(locku->lu_offset,
5407                                                 locku->lu_length);
5408         nfs4_transform_lock_offset(file_lock);
5409
5410         err = vfs_lock_file(filp, F_SETLK, file_lock, NULL);
5411         if (err) {
5412                 dprintk("NFSD: nfs4_locku: vfs_lock_file failed!\n");
5413                 goto out_nfserr;
5414         }
5415         update_stateid(&stp->st_stid.sc_stateid);
5416         memcpy(&locku->lu_stateid, &stp->st_stid.sc_stateid, sizeof(stateid_t));
5417 fput:
5418         fput(filp);
5419 put_stateid:
5420         nfs4_put_stid(&stp->st_stid);
5421 out:
5422         nfsd4_bump_seqid(cstate, status);
5423         nfs4_unlock_state();
5424         if (file_lock)
5425                 locks_free_lock(file_lock);
5426         return status;
5427
5428 out_nfserr:
5429         status = nfserrno(err);
5430         goto fput;
5431 }
5432
5433 /*
5434  * returns
5435  *      true:  locks held by lockowner
5436  *      false: no locks held by lockowner
5437  */
5438 static bool
5439 check_for_locks(struct nfs4_file *fp, struct nfs4_lockowner *lowner)
5440 {
5441         struct file_lock **flpp;
5442         int status = false;
5443         struct file *filp = find_any_file(fp);
5444         struct inode *inode;
5445
5446         if (!filp) {
5447                 /* Any valid lock stateid should have some sort of access */
5448                 WARN_ON_ONCE(1);
5449                 return status;
5450         }
5451
5452         inode = file_inode(filp);
5453
5454         spin_lock(&inode->i_lock);
5455         for (flpp = &inode->i_flock; *flpp != NULL; flpp = &(*flpp)->fl_next) {
5456                 if ((*flpp)->fl_owner == (fl_owner_t)lowner) {
5457                         status = true;
5458                         break;
5459                 }
5460         }
5461         spin_unlock(&inode->i_lock);
5462         fput(filp);
5463         return status;
5464 }
5465
5466 __be32
5467 nfsd4_release_lockowner(struct svc_rqst *rqstp,
5468                         struct nfsd4_compound_state *cstate,
5469                         struct nfsd4_release_lockowner *rlockowner)
5470 {
5471         clientid_t *clid = &rlockowner->rl_clientid;
5472         struct nfs4_stateowner *sop;
5473         struct nfs4_lockowner *lo = NULL;
5474         struct nfs4_ol_stateid *stp;
5475         struct xdr_netobj *owner = &rlockowner->rl_owner;
5476         unsigned int hashval = ownerstr_hashval(owner);
5477         __be32 status;
5478         struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
5479         struct nfs4_client *clp;
5480
5481         dprintk("nfsd4_release_lockowner clientid: (%08x/%08x):\n",
5482                 clid->cl_boot, clid->cl_id);
5483
5484         nfs4_lock_state();
5485
5486         status = lookup_clientid(clid, cstate, nn);
5487         if (status)
5488                 goto out;
5489
5490         clp = cstate->clp;
5491         /* Find the matching lock stateowner */
5492         spin_lock(&clp->cl_lock);
5493         list_for_each_entry(sop, &clp->cl_ownerstr_hashtbl[hashval],
5494                             so_strhash) {
5495
5496                 if (sop->so_is_open_owner || !same_owner_str(sop, owner))
5497                         continue;
5498
5499                 /* see if there are still any locks associated with it */
5500                 lo = lockowner(sop);
5501                 list_for_each_entry(stp, &sop->so_stateids, st_perstateowner) {
5502                         if (check_for_locks(stp->st_stid.sc_file, lo)) {
5503                                 status = nfserr_locks_held;
5504                                 spin_unlock(&clp->cl_lock);
5505                                 goto out;
5506                         }
5507                 }
5508
5509                 atomic_inc(&sop->so_count);
5510                 break;
5511         }
5512         spin_unlock(&clp->cl_lock);
5513         if (lo)
5514                 release_lockowner(lo);
5515 out:
5516         nfs4_unlock_state();
5517         return status;
5518 }
5519
5520 static inline struct nfs4_client_reclaim *
5521 alloc_reclaim(void)
5522 {
5523         return kmalloc(sizeof(struct nfs4_client_reclaim), GFP_KERNEL);
5524 }
5525
5526 bool
5527 nfs4_has_reclaimed_state(const char *name, struct nfsd_net *nn)
5528 {
5529         struct nfs4_client_reclaim *crp;
5530
5531         crp = nfsd4_find_reclaim_client(name, nn);
5532         return (crp && crp->cr_clp);
5533 }
5534
5535 /*
5536  * failure => all reset bets are off, nfserr_no_grace...
5537  */
5538 struct nfs4_client_reclaim *
5539 nfs4_client_to_reclaim(const char *name, struct nfsd_net *nn)
5540 {
5541         unsigned int strhashval;
5542         struct nfs4_client_reclaim *crp;
5543
5544         dprintk("NFSD nfs4_client_to_reclaim NAME: %.*s\n", HEXDIR_LEN, name);
5545         crp = alloc_reclaim();
5546         if (crp) {
5547                 strhashval = clientstr_hashval(name);
5548                 INIT_LIST_HEAD(&crp->cr_strhash);
5549                 list_add(&crp->cr_strhash, &nn->reclaim_str_hashtbl[strhashval]);
5550                 memcpy(crp->cr_recdir, name, HEXDIR_LEN);
5551                 crp->cr_clp = NULL;
5552                 nn->reclaim_str_hashtbl_size++;
5553         }
5554         return crp;
5555 }
5556
5557 void
5558 nfs4_remove_reclaim_record(struct nfs4_client_reclaim *crp, struct nfsd_net *nn)
5559 {
5560         list_del(&crp->cr_strhash);
5561         kfree(crp);
5562         nn->reclaim_str_hashtbl_size--;
5563 }
5564
5565 void
5566 nfs4_release_reclaim(struct nfsd_net *nn)
5567 {
5568         struct nfs4_client_reclaim *crp = NULL;
5569         int i;
5570
5571         for (i = 0; i < CLIENT_HASH_SIZE; i++) {
5572                 while (!list_empty(&nn->reclaim_str_hashtbl[i])) {
5573                         crp = list_entry(nn->reclaim_str_hashtbl[i].next,
5574                                         struct nfs4_client_reclaim, cr_strhash);
5575                         nfs4_remove_reclaim_record(crp, nn);
5576                 }
5577         }
5578         WARN_ON_ONCE(nn->reclaim_str_hashtbl_size);
5579 }
5580
5581 /*
5582  * called from OPEN, CLAIM_PREVIOUS with a new clientid. */
5583 struct nfs4_client_reclaim *
5584 nfsd4_find_reclaim_client(const char *recdir, struct nfsd_net *nn)
5585 {
5586         unsigned int strhashval;
5587         struct nfs4_client_reclaim *crp = NULL;
5588
5589         dprintk("NFSD: nfs4_find_reclaim_client for recdir %s\n", recdir);
5590
5591         strhashval = clientstr_hashval(recdir);
5592         list_for_each_entry(crp, &nn->reclaim_str_hashtbl[strhashval], cr_strhash) {
5593                 if (same_name(crp->cr_recdir, recdir)) {
5594                         return crp;
5595                 }
5596         }
5597         return NULL;
5598 }
5599
5600 /*
5601 * Called from OPEN. Look for clientid in reclaim list.
5602 */
5603 __be32
5604 nfs4_check_open_reclaim(clientid_t *clid,
5605                 struct nfsd4_compound_state *cstate,
5606                 struct nfsd_net *nn)
5607 {
5608         __be32 status;
5609
5610         /* find clientid in conf_id_hashtbl */
5611         status = lookup_clientid(clid, cstate, nn);
5612         if (status)
5613                 return nfserr_reclaim_bad;
5614
5615         if (nfsd4_client_record_check(cstate->clp))
5616                 return nfserr_reclaim_bad;
5617
5618         return nfs_ok;
5619 }
5620
5621 #ifdef CONFIG_NFSD_FAULT_INJECTION
5622
5623 u64 nfsd_forget_client(struct nfs4_client *clp, u64 max)
5624 {
5625         if (mark_client_expired(clp))
5626                 return 0;
5627         expire_client(clp);
5628         return 1;
5629 }
5630
5631 u64 nfsd_print_client(struct nfs4_client *clp, u64 num)
5632 {
5633         char buf[INET6_ADDRSTRLEN];
5634         rpc_ntop((struct sockaddr *)&clp->cl_addr, buf, sizeof(buf));
5635         printk(KERN_INFO "NFS Client: %s\n", buf);
5636         return 1;
5637 }
5638
5639 static void nfsd_print_count(struct nfs4_client *clp, unsigned int count,
5640                              const char *type)
5641 {
5642         char buf[INET6_ADDRSTRLEN];
5643         rpc_ntop((struct sockaddr *)&clp->cl_addr, buf, sizeof(buf));
5644         printk(KERN_INFO "NFS Client: %s has %u %s\n", buf, count, type);
5645 }
5646
5647 static u64 nfsd_foreach_client_lock(struct nfs4_client *clp, u64 max,
5648                                     void (*func)(struct nfs4_ol_stateid *))
5649 {
5650         struct nfs4_openowner *oop;
5651         struct nfs4_ol_stateid *stp, *st_next;
5652         struct nfs4_ol_stateid *lst, *lst_next;
5653         u64 count = 0;
5654
5655         list_for_each_entry(oop, &clp->cl_openowners, oo_perclient) {
5656                 list_for_each_entry_safe(stp, st_next,
5657                                 &oop->oo_owner.so_stateids, st_perstateowner) {
5658                         list_for_each_entry_safe(lst, lst_next,
5659                                         &stp->st_locks, st_locks) {
5660                                 if (func)
5661                                         func(lst);
5662                                 if (++count == max)
5663                                         return count;
5664                         }
5665                 }
5666         }
5667
5668         return count;
5669 }
5670
5671 u64 nfsd_forget_client_locks(struct nfs4_client *clp, u64 max)
5672 {
5673         return nfsd_foreach_client_lock(clp, max, release_lock_stateid);
5674 }
5675
5676 u64 nfsd_print_client_locks(struct nfs4_client *clp, u64 max)
5677 {
5678         u64 count = nfsd_foreach_client_lock(clp, max, NULL);
5679         nfsd_print_count(clp, count, "locked files");
5680         return count;
5681 }
5682
5683 static u64 nfsd_foreach_client_open(struct nfs4_client *clp, u64 max, void (*func)(struct nfs4_openowner *))
5684 {
5685         struct nfs4_openowner *oop, *next;
5686         u64 count = 0;
5687
5688         list_for_each_entry_safe(oop, next, &clp->cl_openowners, oo_perclient) {
5689                 if (func)
5690                         func(oop);
5691                 if (++count == max)
5692                         break;
5693         }
5694
5695         return count;
5696 }
5697
5698 u64 nfsd_forget_client_openowners(struct nfs4_client *clp, u64 max)
5699 {
5700         return nfsd_foreach_client_open(clp, max, release_openowner);
5701 }
5702
5703 u64 nfsd_print_client_openowners(struct nfs4_client *clp, u64 max)
5704 {
5705         u64 count = nfsd_foreach_client_open(clp, max, NULL);
5706         nfsd_print_count(clp, count, "open files");
5707         return count;
5708 }
5709
5710 static u64 nfsd_find_all_delegations(struct nfs4_client *clp, u64 max,
5711                                      struct list_head *victims)
5712 {
5713         struct nfs4_delegation *dp, *next;
5714         u64 count = 0;
5715
5716         lockdep_assert_held(&state_lock);
5717         list_for_each_entry_safe(dp, next, &clp->cl_delegations, dl_perclnt) {
5718                 if (victims) {
5719                         /*
5720                          * It's not safe to mess with delegations that have a
5721                          * non-zero dl_time. They might have already been broken
5722                          * and could be processed by the laundromat outside of
5723                          * the state_lock. Just leave them be.
5724                          */
5725                         if (dp->dl_time != 0)
5726                                 continue;
5727
5728                         unhash_delegation_locked(dp);
5729                         list_add(&dp->dl_recall_lru, victims);
5730                 }
5731                 if (++count == max)
5732                         break;
5733         }
5734         return count;
5735 }
5736
5737 u64 nfsd_forget_client_delegations(struct nfs4_client *clp, u64 max)
5738 {
5739         struct nfs4_delegation *dp, *next;
5740         LIST_HEAD(victims);
5741         u64 count;
5742
5743         spin_lock(&state_lock);
5744         count = nfsd_find_all_delegations(clp, max, &victims);
5745         spin_unlock(&state_lock);
5746
5747         list_for_each_entry_safe(dp, next, &victims, dl_recall_lru) {
5748                 list_del_init(&dp->dl_recall_lru);
5749                 revoke_delegation(dp);
5750         }
5751
5752         return count;
5753 }
5754
5755 u64 nfsd_recall_client_delegations(struct nfs4_client *clp, u64 max)
5756 {
5757         struct nfs4_delegation *dp;
5758         LIST_HEAD(victims);
5759         u64 count;
5760
5761         spin_lock(&state_lock);
5762         count = nfsd_find_all_delegations(clp, max, &victims);
5763         while (!list_empty(&victims)) {
5764                 dp = list_first_entry(&victims, struct nfs4_delegation,
5765                                         dl_recall_lru);
5766                 list_del_init(&dp->dl_recall_lru);
5767                 dp->dl_time = 0;
5768                 nfsd_break_one_deleg(dp);
5769         }
5770         spin_unlock(&state_lock);
5771
5772         return count;
5773 }
5774
5775 u64 nfsd_print_client_delegations(struct nfs4_client *clp, u64 max)
5776 {
5777         u64 count = 0;
5778
5779         spin_lock(&state_lock);
5780         count = nfsd_find_all_delegations(clp, max, NULL);
5781         spin_unlock(&state_lock);
5782
5783         nfsd_print_count(clp, count, "delegations");
5784         return count;
5785 }
5786
5787 u64 nfsd_for_n_state(u64 max, u64 (*func)(struct nfs4_client *, u64))
5788 {
5789         struct nfs4_client *clp, *next;
5790         u64 count = 0;
5791         struct nfsd_net *nn = net_generic(current->nsproxy->net_ns, nfsd_net_id);
5792
5793         if (!nfsd_netns_ready(nn))
5794                 return 0;
5795
5796         list_for_each_entry_safe(clp, next, &nn->client_lru, cl_lru) {
5797                 count += func(clp, max - count);
5798                 if ((max != 0) && (count >= max))
5799                         break;
5800         }
5801
5802         return count;
5803 }
5804
5805 struct nfs4_client *nfsd_find_client(struct sockaddr_storage *addr, size_t addr_size)
5806 {
5807         struct nfs4_client *clp;
5808         struct nfsd_net *nn = net_generic(current->nsproxy->net_ns, nfsd_net_id);
5809
5810         if (!nfsd_netns_ready(nn))
5811                 return NULL;
5812
5813         list_for_each_entry(clp, &nn->client_lru, cl_lru) {
5814                 if (memcmp(&clp->cl_addr, addr, addr_size) == 0)
5815                         return clp;
5816         }
5817         return NULL;
5818 }
5819
5820 #endif /* CONFIG_NFSD_FAULT_INJECTION */
5821
5822 /*
5823  * Since the lifetime of a delegation isn't limited to that of an open, a
5824  * client may quite reasonably hang on to a delegation as long as it has
5825  * the inode cached.  This becomes an obvious problem the first time a
5826  * client's inode cache approaches the size of the server's total memory.
5827  *
5828  * For now we avoid this problem by imposing a hard limit on the number
5829  * of delegations, which varies according to the server's memory size.
5830  */
5831 static void
5832 set_max_delegations(void)
5833 {
5834         /*
5835          * Allow at most 4 delegations per megabyte of RAM.  Quick
5836          * estimates suggest that in the worst case (where every delegation
5837          * is for a different inode), a delegation could take about 1.5K,
5838          * giving a worst case usage of about 6% of memory.
5839          */
5840         max_delegations = nr_free_buffer_pages() >> (20 - 2 - PAGE_SHIFT);
5841 }
5842
5843 static int nfs4_state_create_net(struct net *net)
5844 {
5845         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
5846         int i;
5847
5848         nn->conf_id_hashtbl = kmalloc(sizeof(struct list_head) *
5849                         CLIENT_HASH_SIZE, GFP_KERNEL);
5850         if (!nn->conf_id_hashtbl)
5851                 goto err;
5852         nn->unconf_id_hashtbl = kmalloc(sizeof(struct list_head) *
5853                         CLIENT_HASH_SIZE, GFP_KERNEL);
5854         if (!nn->unconf_id_hashtbl)
5855                 goto err_unconf_id;
5856         nn->sessionid_hashtbl = kmalloc(sizeof(struct list_head) *
5857                         SESSION_HASH_SIZE, GFP_KERNEL);
5858         if (!nn->sessionid_hashtbl)
5859                 goto err_sessionid;
5860
5861         for (i = 0; i < CLIENT_HASH_SIZE; i++) {
5862                 INIT_LIST_HEAD(&nn->conf_id_hashtbl[i]);
5863                 INIT_LIST_HEAD(&nn->unconf_id_hashtbl[i]);
5864         }
5865         for (i = 0; i < SESSION_HASH_SIZE; i++)
5866                 INIT_LIST_HEAD(&nn->sessionid_hashtbl[i]);
5867         nn->conf_name_tree = RB_ROOT;
5868         nn->unconf_name_tree = RB_ROOT;
5869         INIT_LIST_HEAD(&nn->client_lru);
5870         INIT_LIST_HEAD(&nn->close_lru);
5871         INIT_LIST_HEAD(&nn->del_recall_lru);
5872         spin_lock_init(&nn->client_lock);
5873
5874         INIT_DELAYED_WORK(&nn->laundromat_work, laundromat_main);
5875         get_net(net);
5876
5877         return 0;
5878
5879 err_sessionid:
5880         kfree(nn->unconf_id_hashtbl);
5881 err_unconf_id:
5882         kfree(nn->conf_id_hashtbl);
5883 err:
5884         return -ENOMEM;
5885 }
5886
5887 static void
5888 nfs4_state_destroy_net(struct net *net)
5889 {
5890         int i;
5891         struct nfs4_client *clp = NULL;
5892         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
5893
5894         for (i = 0; i < CLIENT_HASH_SIZE; i++) {
5895                 while (!list_empty(&nn->conf_id_hashtbl[i])) {
5896                         clp = list_entry(nn->conf_id_hashtbl[i].next, struct nfs4_client, cl_idhash);
5897                         destroy_client(clp);
5898                 }
5899         }
5900
5901         for (i = 0; i < CLIENT_HASH_SIZE; i++) {
5902                 while (!list_empty(&nn->unconf_id_hashtbl[i])) {
5903                         clp = list_entry(nn->unconf_id_hashtbl[i].next, struct nfs4_client, cl_idhash);
5904                         destroy_client(clp);
5905                 }
5906         }
5907
5908         kfree(nn->sessionid_hashtbl);
5909         kfree(nn->unconf_id_hashtbl);
5910         kfree(nn->conf_id_hashtbl);
5911         put_net(net);
5912 }
5913
5914 int
5915 nfs4_state_start_net(struct net *net)
5916 {
5917         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
5918         int ret;
5919
5920         ret = nfs4_state_create_net(net);
5921         if (ret)
5922                 return ret;
5923         nfsd4_client_tracking_init(net);
5924         nn->boot_time = get_seconds();
5925         locks_start_grace(net, &nn->nfsd4_manager);
5926         nn->grace_ended = false;
5927         printk(KERN_INFO "NFSD: starting %ld-second grace period (net %p)\n",
5928                nn->nfsd4_grace, net);
5929         queue_delayed_work(laundry_wq, &nn->laundromat_work, nn->nfsd4_grace * HZ);
5930         return 0;
5931 }
5932
5933 /* initialization to perform when the nfsd service is started: */
5934
5935 int
5936 nfs4_state_start(void)
5937 {
5938         int ret;
5939
5940         ret = set_callback_cred();
5941         if (ret)
5942                 return -ENOMEM;
5943         laundry_wq = create_singlethread_workqueue("nfsd4");
5944         if (laundry_wq == NULL) {
5945                 ret = -ENOMEM;
5946                 goto out_recovery;
5947         }
5948         ret = nfsd4_create_callback_queue();
5949         if (ret)
5950                 goto out_free_laundry;
5951
5952         set_max_delegations();
5953
5954         return 0;
5955
5956 out_free_laundry:
5957         destroy_workqueue(laundry_wq);
5958 out_recovery:
5959         return ret;
5960 }
5961
5962 void
5963 nfs4_state_shutdown_net(struct net *net)
5964 {
5965         struct nfs4_delegation *dp = NULL;
5966         struct list_head *pos, *next, reaplist;
5967         struct nfsd_net *nn = net_generic(net, nfsd_net_id);
5968
5969         cancel_delayed_work_sync(&nn->laundromat_work);
5970         locks_end_grace(&nn->nfsd4_manager);
5971
5972         nfs4_lock_state();
5973         INIT_LIST_HEAD(&reaplist);
5974         spin_lock(&state_lock);
5975         list_for_each_safe(pos, next, &nn->del_recall_lru) {
5976                 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
5977                 unhash_delegation_locked(dp);
5978                 list_add(&dp->dl_recall_lru, &reaplist);
5979         }
5980         spin_unlock(&state_lock);
5981         list_for_each_safe(pos, next, &reaplist) {
5982                 dp = list_entry (pos, struct nfs4_delegation, dl_recall_lru);
5983                 list_del_init(&dp->dl_recall_lru);
5984                 nfs4_put_stid(&dp->dl_stid);
5985         }
5986
5987         nfsd4_client_tracking_exit(net);
5988         nfs4_state_destroy_net(net);
5989         nfs4_unlock_state();
5990 }
5991
5992 void
5993 nfs4_state_shutdown(void)
5994 {
5995         destroy_workqueue(laundry_wq);
5996         nfsd4_destroy_callback_queue();
5997 }
5998
5999 static void
6000 get_stateid(struct nfsd4_compound_state *cstate, stateid_t *stateid)
6001 {
6002         if (HAS_STATE_ID(cstate, CURRENT_STATE_ID_FLAG) && CURRENT_STATEID(stateid))
6003                 memcpy(stateid, &cstate->current_stateid, sizeof(stateid_t));
6004 }
6005
6006 static void
6007 put_stateid(struct nfsd4_compound_state *cstate, stateid_t *stateid)
6008 {
6009         if (cstate->minorversion) {
6010                 memcpy(&cstate->current_stateid, stateid, sizeof(stateid_t));
6011                 SET_STATE_ID(cstate, CURRENT_STATE_ID_FLAG);
6012         }
6013 }
6014
6015 void
6016 clear_current_stateid(struct nfsd4_compound_state *cstate)
6017 {
6018         CLEAR_STATE_ID(cstate, CURRENT_STATE_ID_FLAG);
6019 }
6020
6021 /*
6022  * functions to set current state id
6023  */
6024 void
6025 nfsd4_set_opendowngradestateid(struct nfsd4_compound_state *cstate, struct nfsd4_open_downgrade *odp)
6026 {
6027         put_stateid(cstate, &odp->od_stateid);
6028 }
6029
6030 void
6031 nfsd4_set_openstateid(struct nfsd4_compound_state *cstate, struct nfsd4_open *open)
6032 {
6033         put_stateid(cstate, &open->op_stateid);
6034 }
6035
6036 void
6037 nfsd4_set_closestateid(struct nfsd4_compound_state *cstate, struct nfsd4_close *close)
6038 {
6039         put_stateid(cstate, &close->cl_stateid);
6040 }
6041
6042 void
6043 nfsd4_set_lockstateid(struct nfsd4_compound_state *cstate, struct nfsd4_lock *lock)
6044 {
6045         put_stateid(cstate, &lock->lk_resp_stateid);
6046 }
6047
6048 /*
6049  * functions to consume current state id
6050  */
6051
6052 void
6053 nfsd4_get_opendowngradestateid(struct nfsd4_compound_state *cstate, struct nfsd4_open_downgrade *odp)
6054 {
6055         get_stateid(cstate, &odp->od_stateid);
6056 }
6057
6058 void
6059 nfsd4_get_delegreturnstateid(struct nfsd4_compound_state *cstate, struct nfsd4_delegreturn *drp)
6060 {
6061         get_stateid(cstate, &drp->dr_stateid);
6062 }
6063
6064 void
6065 nfsd4_get_freestateid(struct nfsd4_compound_state *cstate, struct nfsd4_free_stateid *fsp)
6066 {
6067         get_stateid(cstate, &fsp->fr_stateid);
6068 }
6069
6070 void
6071 nfsd4_get_setattrstateid(struct nfsd4_compound_state *cstate, struct nfsd4_setattr *setattr)
6072 {
6073         get_stateid(cstate, &setattr->sa_stateid);
6074 }
6075
6076 void
6077 nfsd4_get_closestateid(struct nfsd4_compound_state *cstate, struct nfsd4_close *close)
6078 {
6079         get_stateid(cstate, &close->cl_stateid);
6080 }
6081
6082 void
6083 nfsd4_get_lockustateid(struct nfsd4_compound_state *cstate, struct nfsd4_locku *locku)
6084 {
6085         get_stateid(cstate, &locku->lu_stateid);
6086 }
6087
6088 void
6089 nfsd4_get_readstateid(struct nfsd4_compound_state *cstate, struct nfsd4_read *read)
6090 {
6091         get_stateid(cstate, &read->rd_stateid);
6092 }
6093
6094 void
6095 nfsd4_get_writestateid(struct nfsd4_compound_state *cstate, struct nfsd4_write *write)
6096 {
6097         get_stateid(cstate, &write->wr_stateid);
6098 }