quota: Fix race between dqput() and dquot_scan_active()
[pandora-kernel.git] / fs / quota / dquot.c
1 /*
2  * Implementation of the diskquota system for the LINUX operating system. QUOTA
3  * is implemented using the BSD system call interface as the means of
4  * communication with the user level. This file contains the generic routines
5  * called by the different filesystems on allocation of an inode or block.
6  * These routines take care of the administration needed to have a consistent
7  * diskquota tracking system. The ideas of both user and group quotas are based
8  * on the Melbourne quota system as used on BSD derived systems. The internal
9  * implementation is based on one of the several variants of the LINUX
10  * inode-subsystem with added complexity of the diskquota system.
11  * 
12  * Author:      Marco van Wieringen <mvw@planets.elm.net>
13  *
14  * Fixes:   Dmitry Gorodchanin <pgmdsg@ibi.com>, 11 Feb 96
15  *
16  *              Revised list management to avoid races
17  *              -- Bill Hawes, <whawes@star.net>, 9/98
18  *
19  *              Fixed races in dquot_transfer(), dqget() and dquot_alloc_...().
20  *              As the consequence the locking was moved from dquot_decr_...(),
21  *              dquot_incr_...() to calling functions.
22  *              invalidate_dquots() now writes modified dquots.
23  *              Serialized quota_off() and quota_on() for mount point.
24  *              Fixed a few bugs in grow_dquots().
25  *              Fixed deadlock in write_dquot() - we no longer account quotas on
26  *              quota files
27  *              remove_dquot_ref() moved to inode.c - it now traverses through inodes
28  *              add_dquot_ref() restarts after blocking
29  *              Added check for bogus uid and fixed check for group in quotactl.
30  *              Jan Kara, <jack@suse.cz>, sponsored by SuSE CR, 10-11/99
31  *
32  *              Used struct list_head instead of own list struct
33  *              Invalidation of referenced dquots is no longer possible
34  *              Improved free_dquots list management
35  *              Quota and i_blocks are now updated in one place to avoid races
36  *              Warnings are now delayed so we won't block in critical section
37  *              Write updated not to require dquot lock
38  *              Jan Kara, <jack@suse.cz>, 9/2000
39  *
40  *              Added dynamic quota structure allocation
41  *              Jan Kara <jack@suse.cz> 12/2000
42  *
43  *              Rewritten quota interface. Implemented new quota format and
44  *              formats registering.
45  *              Jan Kara, <jack@suse.cz>, 2001,2002
46  *
47  *              New SMP locking.
48  *              Jan Kara, <jack@suse.cz>, 10/2002
49  *
50  *              Added journalled quota support, fix lock inversion problems
51  *              Jan Kara, <jack@suse.cz>, 2003,2004
52  *
53  * (C) Copyright 1994 - 1997 Marco van Wieringen 
54  */
55
56 #include <linux/errno.h>
57 #include <linux/kernel.h>
58 #include <linux/fs.h>
59 #include <linux/mount.h>
60 #include <linux/mm.h>
61 #include <linux/time.h>
62 #include <linux/types.h>
63 #include <linux/string.h>
64 #include <linux/fcntl.h>
65 #include <linux/stat.h>
66 #include <linux/tty.h>
67 #include <linux/file.h>
68 #include <linux/slab.h>
69 #include <linux/sysctl.h>
70 #include <linux/init.h>
71 #include <linux/module.h>
72 #include <linux/proc_fs.h>
73 #include <linux/security.h>
74 #include <linux/kmod.h>
75 #include <linux/namei.h>
76 #include <linux/buffer_head.h>
77 #include <linux/capability.h>
78 #include <linux/quotaops.h>
79 #include "../internal.h" /* ugh */
80
81 #include <asm/uaccess.h>
82
83 /*
84  * There are three quota SMP locks. dq_list_lock protects all lists with quotas
85  * and quota formats.
86  * dq_data_lock protects data from dq_dqb and also mem_dqinfo structures and
87  * also guards consistency of dquot->dq_dqb with inode->i_blocks, i_bytes.
88  * i_blocks and i_bytes updates itself are guarded by i_lock acquired directly
89  * in inode_add_bytes() and inode_sub_bytes(). dq_state_lock protects
90  * modifications of quota state (on quotaon and quotaoff) and readers who care
91  * about latest values take it as well.
92  *
93  * The spinlock ordering is hence: dq_data_lock > dq_list_lock > i_lock,
94  *   dq_list_lock > dq_state_lock
95  *
96  * Note that some things (e.g. sb pointer, type, id) don't change during
97  * the life of the dquot structure and so needn't be protected by a lock.
98  *
99  * Any operation working on dquots via inode pointers must hold dqptr_sem.  If
100  * operation is just reading pointers from inode (or not using them at all) the
101  * read lock is enough. If pointers are altered function must hold write lock.
102  * Special care needs to be taken about S_NOQUOTA inode flag (marking that
103  * inode is a quota file). Functions adding pointers from inode to dquots have
104  * to check this flag under dqptr_sem and then (if S_NOQUOTA is not set) they
105  * have to do all pointer modifications before dropping dqptr_sem. This makes
106  * sure they cannot race with quotaon which first sets S_NOQUOTA flag and
107  * then drops all pointers to dquots from an inode.
108  *
109  * Each dquot has its dq_lock mutex. Locked dquots might not be referenced
110  * from inodes (dquot_alloc_space() and such don't check the dq_lock).
111  * Currently dquot is locked only when it is being read to memory (or space for
112  * it is being allocated) on the first dqget() and when it is being released on
113  * the last dqput(). The allocation and release operations are serialized by
114  * the dq_lock and by checking the use count in dquot_release().  Write
115  * operations on dquots don't hold dq_lock as they copy data under dq_data_lock
116  * spinlock to internal buffers before writing.
117  *
118  * Lock ordering (including related VFS locks) is the following:
119  *   i_mutex > dqonoff_sem > journal_lock > dqptr_sem > dquot->dq_lock >
120  *   dqio_mutex
121  * The lock ordering of dqptr_sem imposed by quota code is only dqonoff_sem >
122  * dqptr_sem. But filesystem has to count with the fact that functions such as
123  * dquot_alloc_space() acquire dqptr_sem and they usually have to be called
124  * from inside a transaction to keep filesystem consistency after a crash. Also
125  * filesystems usually want to do some IO on dquot from ->mark_dirty which is
126  * called with dqptr_sem held.
127  * i_mutex on quota files is special (it's below dqio_mutex)
128  */
129
130 static __cacheline_aligned_in_smp DEFINE_SPINLOCK(dq_list_lock);	/* guards all dquot lists and the quota format list */
131 static __cacheline_aligned_in_smp DEFINE_SPINLOCK(dq_state_lock);	/* guards quota on/off state changes */
132 __cacheline_aligned_in_smp DEFINE_SPINLOCK(dq_data_lock);	/* guards dq_dqb and mem_dqinfo data; exported below */
133 EXPORT_SYMBOL(dq_data_lock);
134
135 void __quota_error(struct super_block *sb, const char *func,
136                    const char *fmt, ...)
137 {
138         if (printk_ratelimit()) {
139                 va_list args;
140                 struct va_format vaf;
141
142                 va_start(args, fmt);
143
144                 vaf.fmt = fmt;
145                 vaf.va = &args;
146
147                 printk(KERN_ERR "Quota error (device %s): %s: %pV\n",
148                        sb->s_id, func, &vaf);
149
150                 va_end(args);
151         }
152 }
153 EXPORT_SYMBOL(__quota_error);
154
155 #if defined(CONFIG_QUOTA_DEBUG) || defined(CONFIG_PRINT_QUOTA_WARNING)
156 static char *quotatypes[] = INITQFNAMES;	/* quota type names, indexed by dq_type in messages */
157 #endif
158 static struct quota_format_type *quota_formats; /* List of registered formats, linked via qf_next; walked under dq_list_lock */
159 static struct quota_module_name module_names[] = INIT_QUOTA_MODULE_NAMES;	/* format id -> module name; scanned until qm_fmt_id == 0 */
160
161 /* SLAB cache for dquot structures (used by dquot_alloc() and dquot_destroy()) */
162 static struct kmem_cache *dquot_cachep;
163
164 int register_quota_format(struct quota_format_type *fmt)
165 {
166         spin_lock(&dq_list_lock);
167         fmt->qf_next = quota_formats;
168         quota_formats = fmt;
169         spin_unlock(&dq_list_lock);
170         return 0;
171 }
172 EXPORT_SYMBOL(register_quota_format);
173
174 void unregister_quota_format(struct quota_format_type *fmt)
175 {
176         struct quota_format_type **actqf;
177
178         spin_lock(&dq_list_lock);
179         for (actqf = &quota_formats; *actqf && *actqf != fmt;
180              actqf = &(*actqf)->qf_next)
181                 ;
182         if (*actqf)
183                 *actqf = (*actqf)->qf_next;
184         spin_unlock(&dq_list_lock);
185 }
186 EXPORT_SYMBOL(unregister_quota_format);
187
188 static struct quota_format_type *find_quota_format(int id)
189 {
190         struct quota_format_type *actqf;
191
192         spin_lock(&dq_list_lock);
193         for (actqf = quota_formats; actqf && actqf->qf_fmt_id != id;
194              actqf = actqf->qf_next)
195                 ;
196         if (!actqf || !try_module_get(actqf->qf_owner)) {
197                 int qm;
198
199                 spin_unlock(&dq_list_lock);
200                 
201                 for (qm = 0; module_names[qm].qm_fmt_id &&
202                              module_names[qm].qm_fmt_id != id; qm++)
203                         ;
204                 if (!module_names[qm].qm_fmt_id ||
205                     request_module(module_names[qm].qm_mod_name))
206                         return NULL;
207
208                 spin_lock(&dq_list_lock);
209                 for (actqf = quota_formats; actqf && actqf->qf_fmt_id != id;
210                      actqf = actqf->qf_next)
211                         ;
212                 if (actqf && !try_module_get(actqf->qf_owner))
213                         actqf = NULL;
214         }
215         spin_unlock(&dq_list_lock);
216         return actqf;
217 }
218
219 static void put_quota_format(struct quota_format_type *fmt)
220 {
221         module_put(fmt->qf_owner);
222 }
223
224 /*
225  * Dquot List Management:
226  * The quota code uses three lists for dquot management: the inuse_list,
227  * free_dquots, and dquot_hash[] array. A single dquot structure may be
228  * on all three lists, depending on its current state.
229  *
230  * All dquots are placed to the end of inuse_list when first created, and this
231  * list is used for invalidate operation, which must look at every dquot.
232  *
233  * Unused dquots (dq_count == 0) are added to the free_dquots list when freed,
234  * and this list is searched whenever we need an available dquot.  Dquots are
235  * removed from the list as soon as they are used again, and
236  * dqstats.free_dquots gives the number of dquots on the list. When
237  * dquot is invalidated it's completely released from memory.
238  *
239  * Dquots with a specific identity (device, type and id) are placed on
240  * one of the dquot_hash[] hash chains. This provides an efficient search
241  * mechanism to locate a specific dquot.
242  */
243
244 static LIST_HEAD(inuse_list);	/* all allocated dquots, linked via dq_inuse */
245 static LIST_HEAD(free_dquots);	/* unused dquots, linked via dq_free */
246 static unsigned int dq_hash_bits, dq_hash_mask;	/* shift and mask applied by hashfn() */
247 static struct hlist_head *dquot_hash;	/* hash chain heads, indexed by hashfn() */
248
249 struct dqstats dqstats;	/* quota statistics counters; exported below */
250 EXPORT_SYMBOL(dqstats);
251
252 static qsize_t inode_get_rsv_space(struct inode *inode);	/* forward declaration */
253 static void __dquot_initialize(struct inode *inode, int type);	/* forward declaration */
254
255 static inline unsigned int
256 hashfn(const struct super_block *sb, unsigned int id, int type)
257 {
258         unsigned long tmp;
259
260         tmp = (((unsigned long)sb>>L1_CACHE_SHIFT) ^ id) * (MAXQUOTAS - type);
261         return (tmp + (tmp >> dq_hash_bits)) & dq_hash_mask;
262 }
263
264 /*
265  * Following list functions expect dq_list_lock to be held
266  */
267 static inline void insert_dquot_hash(struct dquot *dquot)
268 {
269         struct hlist_head *head;
270         head = dquot_hash + hashfn(dquot->dq_sb, dquot->dq_id, dquot->dq_type);
271         hlist_add_head(&dquot->dq_hash, head);
272 }
273
274 static inline void remove_dquot_hash(struct dquot *dquot)
275 {
276         hlist_del_init(&dquot->dq_hash);
277 }
278
279 static struct dquot *find_dquot(unsigned int hashent, struct super_block *sb,
280                                 unsigned int id, int type)
281 {
282         struct hlist_node *node;
283         struct dquot *dquot;
284
285         hlist_for_each (node, dquot_hash+hashent) {
286                 dquot = hlist_entry(node, struct dquot, dq_hash);
287                 if (dquot->dq_sb == sb && dquot->dq_id == id &&
288                     dquot->dq_type == type)
289                         return dquot;
290         }
291         return NULL;
292 }
293
294 /* Add a dquot to the tail of the free list */
295 static inline void put_dquot_last(struct dquot *dquot)
296 {
297         list_add_tail(&dquot->dq_free, &free_dquots);
298         dqstats_inc(DQST_FREE_DQUOTS);
299 }
300
301 static inline void remove_free_dquot(struct dquot *dquot)
302 {
303         if (list_empty(&dquot->dq_free))
304                 return;
305         list_del_init(&dquot->dq_free);
306         dqstats_dec(DQST_FREE_DQUOTS);
307 }
308
309 static inline void put_inuse(struct dquot *dquot)
310 {
311         /* We add to the back of inuse list so we don't have to restart
312          * when traversing this list and we block */
313         list_add_tail(&dquot->dq_inuse, &inuse_list);
314         dqstats_inc(DQST_ALLOC_DQUOTS);
315 }
316
317 static inline void remove_inuse(struct dquot *dquot)
318 {
319         dqstats_dec(DQST_ALLOC_DQUOTS);
320         list_del(&dquot->dq_inuse);
321 }
322 /*
323  * End of list functions needing dq_list_lock
324  */
325
326 static void wait_on_dquot(struct dquot *dquot)
327 {
328         mutex_lock(&dquot->dq_lock);
329         mutex_unlock(&dquot->dq_lock);
330 }
331
332 static inline int dquot_dirty(struct dquot *dquot)
333 {
334         return test_bit(DQ_MOD_B, &dquot->dq_flags);
335 }
336
337 static inline int mark_dquot_dirty(struct dquot *dquot)
338 {
339         return dquot->dq_sb->dq_op->mark_dirty(dquot);
340 }
341
342 /* Mark dquot dirty in atomic manner, and return it's old dirty flag state */
343 int dquot_mark_dquot_dirty(struct dquot *dquot)
344 {
345         int ret = 1;
346
347         /* If quota is dirty already, we don't have to acquire dq_list_lock */
348         if (test_bit(DQ_MOD_B, &dquot->dq_flags))
349                 return 1;
350
351         spin_lock(&dq_list_lock);
352         if (!test_and_set_bit(DQ_MOD_B, &dquot->dq_flags)) {
353                 list_add(&dquot->dq_dirty, &sb_dqopt(dquot->dq_sb)->
354                                 info[dquot->dq_type].dqi_dirty_list);
355                 ret = 0;
356         }
357         spin_unlock(&dq_list_lock);
358         return ret;
359 }
360 EXPORT_SYMBOL(dquot_mark_dquot_dirty);
361
362 /* Dirtify all the dquots - this can block when journalling */
363 static inline int mark_all_dquot_dirty(struct dquot * const *dquot)
364 {
365         int ret, err, cnt;
366
367         ret = err = 0;
368         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
369                 if (dquot[cnt])
370                         /* Even in case of error we have to continue */
371                         ret = mark_dquot_dirty(dquot[cnt]);
372                 if (!err)
373                         err = ret;
374         }
375         return err;
376 }
377
378 static inline void dqput_all(struct dquot **dquot)
379 {
380         unsigned int cnt;
381
382         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
383                 dqput(dquot[cnt]);
384 }
385
386 /* This function needs dq_list_lock */
387 static inline int clear_dquot_dirty(struct dquot *dquot)
388 {
389         if (!test_and_clear_bit(DQ_MOD_B, &dquot->dq_flags))
390                 return 0;
391         list_del_init(&dquot->dq_dirty);
392         return 1;
393 }
394
395 void mark_info_dirty(struct super_block *sb, int type)
396 {
397         set_bit(DQF_INFO_DIRTY_B, &sb_dqopt(sb)->info[type].dqi_flags);
398 }
399 EXPORT_SYMBOL(mark_info_dirty);
400
401 /*
402  *      Read dquot from disk and alloc space for it
403  */
404
405 int dquot_acquire(struct dquot *dquot)
406 {
407         int ret = 0, ret2 = 0;
408         struct quota_info *dqopt = sb_dqopt(dquot->dq_sb);
409
410         mutex_lock(&dquot->dq_lock);
411         mutex_lock(&dqopt->dqio_mutex);
412         if (!test_bit(DQ_READ_B, &dquot->dq_flags))
413                 ret = dqopt->ops[dquot->dq_type]->read_dqblk(dquot);
414         if (ret < 0)
415                 goto out_iolock;
416         set_bit(DQ_READ_B, &dquot->dq_flags);
417         /* Instantiate dquot if needed */
418         if (!test_bit(DQ_ACTIVE_B, &dquot->dq_flags) && !dquot->dq_off) {
419                 ret = dqopt->ops[dquot->dq_type]->commit_dqblk(dquot);
420                 /* Write the info if needed */
421                 if (info_dirty(&dqopt->info[dquot->dq_type])) {
422                         ret2 = dqopt->ops[dquot->dq_type]->write_file_info(
423                                                 dquot->dq_sb, dquot->dq_type);
424                 }
425                 if (ret < 0)
426                         goto out_iolock;
427                 if (ret2 < 0) {
428                         ret = ret2;
429                         goto out_iolock;
430                 }
431         }
432         set_bit(DQ_ACTIVE_B, &dquot->dq_flags);
433 out_iolock:
434         mutex_unlock(&dqopt->dqio_mutex);
435         mutex_unlock(&dquot->dq_lock);
436         return ret;
437 }
438 EXPORT_SYMBOL(dquot_acquire);
439
440 /*
441  *      Write dquot to disk
442  */
443 int dquot_commit(struct dquot *dquot)
444 {
445         int ret = 0;
446         struct quota_info *dqopt = sb_dqopt(dquot->dq_sb);
447
448         mutex_lock(&dqopt->dqio_mutex);
449         spin_lock(&dq_list_lock);
450         if (!clear_dquot_dirty(dquot)) {
451                 spin_unlock(&dq_list_lock);
452                 goto out_sem;
453         }
454         spin_unlock(&dq_list_lock);
455         /* Inactive dquot can be only if there was error during read/init
456          * => we have better not writing it */
457         if (test_bit(DQ_ACTIVE_B, &dquot->dq_flags))
458                 ret = dqopt->ops[dquot->dq_type]->commit_dqblk(dquot);
459         else
460                 ret = -EIO;
461 out_sem:
462         mutex_unlock(&dqopt->dqio_mutex);
463         return ret;
464 }
465 EXPORT_SYMBOL(dquot_commit);
466
467 /*
468  *      Release dquot
469  */
470 int dquot_release(struct dquot *dquot)
471 {
472         int ret = 0, ret2 = 0;
473         struct quota_info *dqopt = sb_dqopt(dquot->dq_sb);
474
475         mutex_lock(&dquot->dq_lock);
476         /* Check whether we are not racing with some other dqget() */
477         if (atomic_read(&dquot->dq_count) > 1)
478                 goto out_dqlock;
479         mutex_lock(&dqopt->dqio_mutex);
480         if (dqopt->ops[dquot->dq_type]->release_dqblk) {
481                 ret = dqopt->ops[dquot->dq_type]->release_dqblk(dquot);
482                 /* Write the info */
483                 if (info_dirty(&dqopt->info[dquot->dq_type])) {
484                         ret2 = dqopt->ops[dquot->dq_type]->write_file_info(
485                                                 dquot->dq_sb, dquot->dq_type);
486                 }
487                 if (ret >= 0)
488                         ret = ret2;
489         }
490         clear_bit(DQ_ACTIVE_B, &dquot->dq_flags);
491         mutex_unlock(&dqopt->dqio_mutex);
492 out_dqlock:
493         mutex_unlock(&dquot->dq_lock);
494         return ret;
495 }
496 EXPORT_SYMBOL(dquot_release);
497
498 void dquot_destroy(struct dquot *dquot)
499 {
500         kmem_cache_free(dquot_cachep, dquot);
501 }
502 EXPORT_SYMBOL(dquot_destroy);
503
504 static inline void do_destroy_dquot(struct dquot *dquot)
505 {
506         dquot->dq_sb->dq_op->destroy_dquot(dquot);
507 }
508
509 /* Invalidate all dquots on the list. Note that this function is called after
510  * quota is disabled and pointers from inodes removed so there cannot be new
511  * quota users. There can still be some users of quotas due to inodes being
512  * just deleted or pruned by prune_icache() (those are not attached to any
513  * list) or parallel quotactl call. We have to wait for such users.
514  */
515 static void invalidate_dquots(struct super_block *sb, int type)
516 {
517         struct dquot *dquot, *tmp;
518
519 restart:
520         spin_lock(&dq_list_lock);
521         list_for_each_entry_safe(dquot, tmp, &inuse_list, dq_inuse) {
522                 if (dquot->dq_sb != sb)
523                         continue;
524                 if (dquot->dq_type != type)
525                         continue;
526                 /* Wait for dquot users */
527                 if (atomic_read(&dquot->dq_count)) {
528                         DEFINE_WAIT(wait);
529
530                         atomic_inc(&dquot->dq_count);
531                         prepare_to_wait(&dquot->dq_wait_unused, &wait,
532                                         TASK_UNINTERRUPTIBLE);
533                         spin_unlock(&dq_list_lock);
534                         /* Once dqput() wakes us up, we know it's time to free
535                          * the dquot.
536                          * IMPORTANT: we rely on the fact that there is always
537                          * at most one process waiting for dquot to free.
538                          * Otherwise dq_count would be > 1 and we would never
539                          * wake up.
540                          */
541                         if (atomic_read(&dquot->dq_count) > 1)
542                                 schedule();
543                         finish_wait(&dquot->dq_wait_unused, &wait);
544                         dqput(dquot);
545                         /* At this moment dquot() need not exist (it could be
546                          * reclaimed by prune_dqcache(). Hence we must
547                          * restart. */
548                         goto restart;
549                 }
550                 /*
551                  * Quota now has no users and it has been written on last
552                  * dqput()
553                  */
554                 remove_dquot_hash(dquot);
555                 remove_free_dquot(dquot);
556                 remove_inuse(dquot);
557                 do_destroy_dquot(dquot);
558         }
559         spin_unlock(&dq_list_lock);
560 }
561
562 /* Call callback for every active dquot on given filesystem */
563 int dquot_scan_active(struct super_block *sb,
564                       int (*fn)(struct dquot *dquot, unsigned long priv),
565                       unsigned long priv)
566 {
567         struct dquot *dquot, *old_dquot = NULL;
568         int ret = 0;
569
570         mutex_lock(&sb_dqopt(sb)->dqonoff_mutex);
571         spin_lock(&dq_list_lock);
572         list_for_each_entry(dquot, &inuse_list, dq_inuse) {
573                 if (!test_bit(DQ_ACTIVE_B, &dquot->dq_flags))
574                         continue;
575                 if (dquot->dq_sb != sb)
576                         continue;
577                 /* Now we have active dquot so we can just increase use count */
578                 atomic_inc(&dquot->dq_count);
579                 spin_unlock(&dq_list_lock);
580                 dqstats_inc(DQST_LOOKUPS);
581                 dqput(old_dquot);
582                 old_dquot = dquot;
583                 /*
584                  * ->release_dquot() can be racing with us. Our reference
585                  * protects us from new calls to it so just wait for any
586                  * outstanding call and recheck the DQ_ACTIVE_B after that.
587                  */
588                 wait_on_dquot(dquot);
589                 if (test_bit(DQ_ACTIVE_B, &dquot->dq_flags)) {
590                         ret = fn(dquot, priv);
591                         if (ret < 0)
592                                 goto out;
593                 }
594                 spin_lock(&dq_list_lock);
595                 /* We are safe to continue now because our dquot could not
596                  * be moved out of the inuse list while we hold the reference */
597         }
598         spin_unlock(&dq_list_lock);
599 out:
600         dqput(old_dquot);
601         mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
602         return ret;
603 }
604 EXPORT_SYMBOL(dquot_scan_active);
605
606 int dquot_quota_sync(struct super_block *sb, int type, int wait)
607 {
608         struct list_head *dirty;
609         struct dquot *dquot;
610         struct quota_info *dqopt = sb_dqopt(sb);
611         int cnt;
612
613         mutex_lock(&dqopt->dqonoff_mutex);
614         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
615                 if (type != -1 && cnt != type)
616                         continue;
617                 if (!sb_has_quota_active(sb, cnt))
618                         continue;
619                 spin_lock(&dq_list_lock);
620                 dirty = &dqopt->info[cnt].dqi_dirty_list;
621                 while (!list_empty(dirty)) {
622                         dquot = list_first_entry(dirty, struct dquot,
623                                                  dq_dirty);
624                         /* Dirty and inactive can be only bad dquot... */
625                         if (!test_bit(DQ_ACTIVE_B, &dquot->dq_flags)) {
626                                 clear_dquot_dirty(dquot);
627                                 continue;
628                         }
629                         /* Now we have active dquot from which someone is
630                          * holding reference so we can safely just increase
631                          * use count */
632                         atomic_inc(&dquot->dq_count);
633                         spin_unlock(&dq_list_lock);
634                         dqstats_inc(DQST_LOOKUPS);
635                         sb->dq_op->write_dquot(dquot);
636                         dqput(dquot);
637                         spin_lock(&dq_list_lock);
638                 }
639                 spin_unlock(&dq_list_lock);
640         }
641
642         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
643                 if ((cnt == type || type == -1) && sb_has_quota_active(sb, cnt)
644                     && info_dirty(&dqopt->info[cnt]))
645                         sb->dq_op->write_info(sb, cnt);
646         dqstats_inc(DQST_SYNCS);
647         mutex_unlock(&dqopt->dqonoff_mutex);
648
649         if (!wait || (sb_dqopt(sb)->flags & DQUOT_QUOTA_SYS_FILE))
650                 return 0;
651
652         /* This is not very clever (and fast) but currently I don't know about
653          * any other simple way of getting quota data to disk and we must get
654          * them there for userspace to be visible... */
655         if (sb->s_op->sync_fs)
656                 sb->s_op->sync_fs(sb, 1);
657         sync_blockdev(sb->s_bdev);
658
659         /*
660          * Now when everything is written we can discard the pagecache so
661          * that userspace sees the changes.
662          */
663         mutex_lock(&sb_dqopt(sb)->dqonoff_mutex);
664         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
665                 if (type != -1 && cnt != type)
666                         continue;
667                 if (!sb_has_quota_active(sb, cnt))
668                         continue;
669                 mutex_lock_nested(&sb_dqopt(sb)->files[cnt]->i_mutex,
670                                   I_MUTEX_QUOTA);
671                 truncate_inode_pages(&sb_dqopt(sb)->files[cnt]->i_data, 0);
672                 mutex_unlock(&sb_dqopt(sb)->files[cnt]->i_mutex);
673         }
674         mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
675
676         return 0;
677 }
678 EXPORT_SYMBOL(dquot_quota_sync);
679
680 /* Free unused dquots from cache */
681 static void prune_dqcache(int count)
682 {
683         struct list_head *head;
684         struct dquot *dquot;
685
686         head = free_dquots.prev;
687         while (head != &free_dquots && count) {
688                 dquot = list_entry(head, struct dquot, dq_free);
689                 remove_dquot_hash(dquot);
690                 remove_free_dquot(dquot);
691                 remove_inuse(dquot);
692                 do_destroy_dquot(dquot);
693                 count--;
694                 head = free_dquots.prev;
695         }
696 }
697
698 /*
699  * This is called from kswapd when we think we need some
700  * more memory
701  */
702 static int shrink_dqcache_memory(struct shrinker *shrink,
703                                  struct shrink_control *sc)
704 {
705         int nr = sc->nr_to_scan;
706
707         if (nr) {
708                 spin_lock(&dq_list_lock);
709                 prune_dqcache(nr);
710                 spin_unlock(&dq_list_lock);
711         }
712         return ((unsigned)
713                 percpu_counter_read_positive(&dqstats.counter[DQST_FREE_DQUOTS])
714                 /100) * sysctl_vfs_cache_pressure;
715 }
716
717 static struct shrinker dqcache_shrinker = {	/* NOTE(review): presumably registered elsewhere in this file - confirm */
718         .shrink = shrink_dqcache_memory,	/* prunes unused dquots and reports the remaining count */
719         .seeks = DEFAULT_SEEKS,
720 };
721
722 /*
723  * Put reference to dquot
724  * NOTE: If you change this function please check whether dqput_blocks() works right...
725  */
726 void dqput(struct dquot *dquot)
727 {
728         int ret;
729
730         if (!dquot)
731                 return;
732 #ifdef CONFIG_QUOTA_DEBUG
733         if (!atomic_read(&dquot->dq_count)) {
734                 quota_error(dquot->dq_sb, "trying to free free dquot of %s %d",
735                             quotatypes[dquot->dq_type], dquot->dq_id);
736                 BUG();
737         }
738 #endif
739         dqstats_inc(DQST_DROPS);
740 we_slept:
741         spin_lock(&dq_list_lock);
742         if (atomic_read(&dquot->dq_count) > 1) {
743                 /* We have more than one user... nothing to do */
744                 atomic_dec(&dquot->dq_count);
745                 /* Releasing dquot during quotaoff phase? */
746                 if (!sb_has_quota_active(dquot->dq_sb, dquot->dq_type) &&
747                     atomic_read(&dquot->dq_count) == 1)
748                         wake_up(&dquot->dq_wait_unused);
749                 spin_unlock(&dq_list_lock);
750                 return;
751         }
752         /* Need to release dquot? */
753         if (test_bit(DQ_ACTIVE_B, &dquot->dq_flags) && dquot_dirty(dquot)) {
754                 spin_unlock(&dq_list_lock);
755                 /* Commit dquot before releasing */
756                 ret = dquot->dq_sb->dq_op->write_dquot(dquot);
757                 if (ret < 0) {
758                         quota_error(dquot->dq_sb, "Can't write quota structure"
759                                     " (error %d). Quota may get out of sync!",
760                                     ret);
761                         /*
762                          * We clear dirty bit anyway, so that we avoid
763                          * infinite loop here
764                          */
765                         spin_lock(&dq_list_lock);
766                         clear_dquot_dirty(dquot);
767                         spin_unlock(&dq_list_lock);
768                 }
769                 goto we_slept;
770         }
771         /* Clear flag in case dquot was inactive (something bad happened) */
772         clear_dquot_dirty(dquot);
773         if (test_bit(DQ_ACTIVE_B, &dquot->dq_flags)) {
774                 spin_unlock(&dq_list_lock);
775                 dquot->dq_sb->dq_op->release_dquot(dquot);
776                 goto we_slept;
777         }
778         atomic_dec(&dquot->dq_count);
779 #ifdef CONFIG_QUOTA_DEBUG
780         /* sanity check */
781         BUG_ON(!list_empty(&dquot->dq_free));
782 #endif
783         put_dquot_last(dquot);
784         spin_unlock(&dq_list_lock);
785 }
786 EXPORT_SYMBOL(dqput);
787
788 struct dquot *dquot_alloc(struct super_block *sb, int type)
789 {
790         return kmem_cache_zalloc(dquot_cachep, GFP_NOFS);
791 }
792 EXPORT_SYMBOL(dquot_alloc);
793
794 static struct dquot *get_empty_dquot(struct super_block *sb, int type)
795 {
796         struct dquot *dquot;
797
798         dquot = sb->dq_op->alloc_dquot(sb, type);
799         if(!dquot)
800                 return NULL;
801
802         mutex_init(&dquot->dq_lock);
803         INIT_LIST_HEAD(&dquot->dq_free);
804         INIT_LIST_HEAD(&dquot->dq_inuse);
805         INIT_HLIST_NODE(&dquot->dq_hash);
806         INIT_LIST_HEAD(&dquot->dq_dirty);
807         init_waitqueue_head(&dquot->dq_wait_unused);
808         dquot->dq_sb = sb;
809         dquot->dq_type = type;
810         atomic_set(&dquot->dq_count, 1);
811
812         return dquot;
813 }
814
815 /*
816  * Get reference to dquot
817  *
818  * Locking is slightly tricky here. We are guarded from parallel quotaoff()
819  * destroying our dquot by:
820  *   a) checking for quota flags under dq_list_lock and
821  *   b) getting a reference to dquot before we release dq_list_lock
822  */
823 struct dquot *dqget(struct super_block *sb, unsigned int id, int type)
824 {
825         unsigned int hashent = hashfn(sb, id, type);
826         struct dquot *dquot = NULL, *empty = NULL;
827
828         if (!sb_has_quota_active(sb, type))
829                 return NULL;
830 we_slept:
831         spin_lock(&dq_list_lock);
832         spin_lock(&dq_state_lock);
833         if (!sb_has_quota_active(sb, type)) {
834                 spin_unlock(&dq_state_lock);
835                 spin_unlock(&dq_list_lock);
836                 goto out;
837         }
838         spin_unlock(&dq_state_lock);
839
840         dquot = find_dquot(hashent, sb, id, type);
841         if (!dquot) {
842                 if (!empty) {
843                         spin_unlock(&dq_list_lock);
844                         empty = get_empty_dquot(sb, type);
845                         if (!empty)
846                                 schedule();     /* Try to wait for a moment... */
847                         goto we_slept;
848                 }
849                 dquot = empty;
850                 empty = NULL;
851                 dquot->dq_id = id;
852                 /* all dquots go on the inuse_list */
853                 put_inuse(dquot);
854                 /* hash it first so it can be found */
855                 insert_dquot_hash(dquot);
856                 spin_unlock(&dq_list_lock);
857                 dqstats_inc(DQST_LOOKUPS);
858         } else {
859                 if (!atomic_read(&dquot->dq_count))
860                         remove_free_dquot(dquot);
861                 atomic_inc(&dquot->dq_count);
862                 spin_unlock(&dq_list_lock);
863                 dqstats_inc(DQST_CACHE_HITS);
864                 dqstats_inc(DQST_LOOKUPS);
865         }
866         /* Wait for dq_lock - after this we know that either dquot_release() is
867          * already finished or it will be canceled due to dq_count > 1 test */
868         wait_on_dquot(dquot);
869         /* Read the dquot / allocate space in quota file */
870         if (!test_bit(DQ_ACTIVE_B, &dquot->dq_flags) &&
871             sb->dq_op->acquire_dquot(dquot) < 0) {
872                 dqput(dquot);
873                 dquot = NULL;
874                 goto out;
875         }
876 #ifdef CONFIG_QUOTA_DEBUG
877         BUG_ON(!dquot->dq_sb);  /* Has somebody invalidated entry under us? */
878 #endif
879 out:
880         if (empty)
881                 do_destroy_dquot(empty);
882
883         return dquot;
884 }
885 EXPORT_SYMBOL(dqget);
886
887 static int dqinit_needed(struct inode *inode, int type)
888 {
889         int cnt;
890
891         if (IS_NOQUOTA(inode))
892                 return 0;
893         if (type != -1)
894                 return !inode->i_dquot[type];
895         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
896                 if (!inode->i_dquot[cnt])
897                         return 1;
898         return 0;
899 }
900
901 /* This routine is guarded by dqonoff_mutex mutex */
902 static void add_dquot_ref(struct super_block *sb, int type)
903 {
904         struct inode *inode, *old_inode = NULL;
905 #ifdef CONFIG_QUOTA_DEBUG
906         int reserved = 0;
907 #endif
908
909         spin_lock(&inode_sb_list_lock);
910         list_for_each_entry(inode, &sb->s_inodes, i_sb_list) {
911                 spin_lock(&inode->i_lock);
912                 if ((inode->i_state & (I_FREEING|I_WILL_FREE|I_NEW)) ||
913                     !atomic_read(&inode->i_writecount) ||
914                     !dqinit_needed(inode, type)) {
915                         spin_unlock(&inode->i_lock);
916                         continue;
917                 }
918 #ifdef CONFIG_QUOTA_DEBUG
919                 if (unlikely(inode_get_rsv_space(inode) > 0))
920                         reserved = 1;
921 #endif
922                 __iget(inode);
923                 spin_unlock(&inode->i_lock);
924                 spin_unlock(&inode_sb_list_lock);
925
926                 iput(old_inode);
927                 __dquot_initialize(inode, type);
928
929                 /*
930                  * We hold a reference to 'inode' so it couldn't have been
931                  * removed from s_inodes list while we dropped the
932                  * inode_sb_list_lock We cannot iput the inode now as we can be
933                  * holding the last reference and we cannot iput it under
934                  * inode_sb_list_lock. So we keep the reference and iput it
935                  * later.
936                  */
937                 old_inode = inode;
938                 spin_lock(&inode_sb_list_lock);
939         }
940         spin_unlock(&inode_sb_list_lock);
941         iput(old_inode);
942
943 #ifdef CONFIG_QUOTA_DEBUG
944         if (reserved) {
945                 quota_error(sb, "Writes happened before quota was turned on "
946                         "thus quota information is probably inconsistent. "
947                         "Please run quotacheck(8)");
948         }
949 #endif
950 }
951
952 /*
953  * Return 0 if dqput() won't block.
954  * (note that 1 doesn't necessarily mean blocking)
955  */
956 static inline int dqput_blocks(struct dquot *dquot)
957 {
958         if (atomic_read(&dquot->dq_count) <= 1)
959                 return 1;
960         return 0;
961 }
962
963 /*
964  * Remove references to dquots from inode and add dquot to list for freeing
965  * if we have the last reference to dquot
966  * We can't race with anybody because we hold dqptr_sem for writing...
967  */
968 static int remove_inode_dquot_ref(struct inode *inode, int type,
969                                   struct list_head *tofree_head)
970 {
971         struct dquot *dquot = inode->i_dquot[type];
972
973         inode->i_dquot[type] = NULL;
974         if (dquot) {
975                 if (dqput_blocks(dquot)) {
976 #ifdef CONFIG_QUOTA_DEBUG
977                         if (atomic_read(&dquot->dq_count) != 1)
978                                 quota_error(inode->i_sb, "Adding dquot with "
979                                             "dq_count %d to dispose list",
980                                             atomic_read(&dquot->dq_count));
981 #endif
982                         spin_lock(&dq_list_lock);
983                         /* As dquot must have currently users it can't be on
984                          * the free list... */
985                         list_add(&dquot->dq_free, tofree_head);
986                         spin_unlock(&dq_list_lock);
987                         return 1;
988                 }
989                 else
990                         dqput(dquot);   /* We have guaranteed we won't block */
991         }
992         return 0;
993 }
994
995 /*
996  * Free list of dquots
997  * Dquots are removed from inodes and no new references can be got so we are
998  * the only ones holding reference
999  */
1000 static void put_dquot_list(struct list_head *tofree_head)
1001 {
1002         struct list_head *act_head;
1003         struct dquot *dquot;
1004
1005         act_head = tofree_head->next;
1006         while (act_head != tofree_head) {
1007                 dquot = list_entry(act_head, struct dquot, dq_free);
1008                 act_head = act_head->next;
1009                 /* Remove dquot from the list so we won't have problems... */
1010                 list_del_init(&dquot->dq_free);
1011                 dqput(dquot);
1012         }
1013 }
1014
1015 static void remove_dquot_ref(struct super_block *sb, int type,
1016                 struct list_head *tofree_head)
1017 {
1018         struct inode *inode;
1019         int reserved = 0;
1020
1021         spin_lock(&inode_sb_list_lock);
1022         list_for_each_entry(inode, &sb->s_inodes, i_sb_list) {
1023                 /*
1024                  *  We have to scan also I_NEW inodes because they can already
1025                  *  have quota pointer initialized. Luckily, we need to touch
1026                  *  only quota pointers and these have separate locking
1027                  *  (dqptr_sem).
1028                  */
1029                 if (!IS_NOQUOTA(inode)) {
1030                         if (unlikely(inode_get_rsv_space(inode) > 0))
1031                                 reserved = 1;
1032                         remove_inode_dquot_ref(inode, type, tofree_head);
1033                 }
1034         }
1035         spin_unlock(&inode_sb_list_lock);
1036 #ifdef CONFIG_QUOTA_DEBUG
1037         if (reserved) {
1038                 printk(KERN_WARNING "VFS (%s): Writes happened after quota"
1039                         " was disabled thus quota information is probably "
1040                         "inconsistent. Please run quotacheck(8).\n", sb->s_id);
1041         }
1042 #endif
1043 }
1044
1045 /* Gather all references from inodes and drop them */
1046 static void drop_dquot_ref(struct super_block *sb, int type)
1047 {
1048         LIST_HEAD(tofree_head);
1049
1050         if (sb->dq_op) {
1051                 down_write(&sb_dqopt(sb)->dqptr_sem);
1052                 remove_dquot_ref(sb, type, &tofree_head);
1053                 up_write(&sb_dqopt(sb)->dqptr_sem);
1054                 put_dquot_list(&tofree_head);
1055         }
1056 }
1057
1058 static inline void dquot_incr_inodes(struct dquot *dquot, qsize_t number)
1059 {
1060         dquot->dq_dqb.dqb_curinodes += number;
1061 }
1062
1063 static inline void dquot_incr_space(struct dquot *dquot, qsize_t number)
1064 {
1065         dquot->dq_dqb.dqb_curspace += number;
1066 }
1067
1068 static inline void dquot_resv_space(struct dquot *dquot, qsize_t number)
1069 {
1070         dquot->dq_dqb.dqb_rsvspace += number;
1071 }
1072
1073 /*
1074  * Claim reserved quota space
1075  */
1076 static void dquot_claim_reserved_space(struct dquot *dquot, qsize_t number)
1077 {
1078         if (dquot->dq_dqb.dqb_rsvspace < number) {
1079                 WARN_ON_ONCE(1);
1080                 number = dquot->dq_dqb.dqb_rsvspace;
1081         }
1082         dquot->dq_dqb.dqb_curspace += number;
1083         dquot->dq_dqb.dqb_rsvspace -= number;
1084 }
1085
1086 static inline
1087 void dquot_free_reserved_space(struct dquot *dquot, qsize_t number)
1088 {
1089         if (dquot->dq_dqb.dqb_rsvspace >= number)
1090                 dquot->dq_dqb.dqb_rsvspace -= number;
1091         else {
1092                 WARN_ON_ONCE(1);
1093                 dquot->dq_dqb.dqb_rsvspace = 0;
1094         }
1095 }
1096
1097 static void dquot_decr_inodes(struct dquot *dquot, qsize_t number)
1098 {
1099         if (sb_dqopt(dquot->dq_sb)->flags & DQUOT_NEGATIVE_USAGE ||
1100             dquot->dq_dqb.dqb_curinodes >= number)
1101                 dquot->dq_dqb.dqb_curinodes -= number;
1102         else
1103                 dquot->dq_dqb.dqb_curinodes = 0;
1104         if (dquot->dq_dqb.dqb_curinodes <= dquot->dq_dqb.dqb_isoftlimit)
1105                 dquot->dq_dqb.dqb_itime = (time_t) 0;
1106         clear_bit(DQ_INODES_B, &dquot->dq_flags);
1107 }
1108
1109 static void dquot_decr_space(struct dquot *dquot, qsize_t number)
1110 {
1111         if (sb_dqopt(dquot->dq_sb)->flags & DQUOT_NEGATIVE_USAGE ||
1112             dquot->dq_dqb.dqb_curspace >= number)
1113                 dquot->dq_dqb.dqb_curspace -= number;
1114         else
1115                 dquot->dq_dqb.dqb_curspace = 0;
1116         if (dquot->dq_dqb.dqb_curspace <= dquot->dq_dqb.dqb_bsoftlimit)
1117                 dquot->dq_dqb.dqb_btime = (time_t) 0;
1118         clear_bit(DQ_BLKS_B, &dquot->dq_flags);
1119 }
1120
1121 static int warning_issued(struct dquot *dquot, const int warntype)
1122 {
1123         int flag = (warntype == QUOTA_NL_BHARDWARN ||
1124                 warntype == QUOTA_NL_BSOFTLONGWARN) ? DQ_BLKS_B :
1125                 ((warntype == QUOTA_NL_IHARDWARN ||
1126                 warntype == QUOTA_NL_ISOFTLONGWARN) ? DQ_INODES_B : 0);
1127
1128         if (!flag)
1129                 return 0;
1130         return test_and_set_bit(flag, &dquot->dq_flags);
1131 }
1132
1133 #ifdef CONFIG_PRINT_QUOTA_WARNING
1134 static int flag_print_warnings = 1;
1135
1136 static int need_print_warning(struct dquot *dquot)
1137 {
1138         if (!flag_print_warnings)
1139                 return 0;
1140
1141         switch (dquot->dq_type) {
1142                 case USRQUOTA:
1143                         return current_fsuid() == dquot->dq_id;
1144                 case GRPQUOTA:
1145                         return in_group_p(dquot->dq_id);
1146         }
1147         return 0;
1148 }
1149
1150 /* Print warning to user which exceeded quota */
1151 static void print_warning(struct dquot *dquot, const int warntype)
1152 {
1153         char *msg = NULL;
1154         struct tty_struct *tty;
1155
1156         if (warntype == QUOTA_NL_IHARDBELOW ||
1157             warntype == QUOTA_NL_ISOFTBELOW ||
1158             warntype == QUOTA_NL_BHARDBELOW ||
1159             warntype == QUOTA_NL_BSOFTBELOW || !need_print_warning(dquot))
1160                 return;
1161
1162         tty = get_current_tty();
1163         if (!tty)
1164                 return;
1165         tty_write_message(tty, dquot->dq_sb->s_id);
1166         if (warntype == QUOTA_NL_ISOFTWARN || warntype == QUOTA_NL_BSOFTWARN)
1167                 tty_write_message(tty, ": warning, ");
1168         else
1169                 tty_write_message(tty, ": write failed, ");
1170         tty_write_message(tty, quotatypes[dquot->dq_type]);
1171         switch (warntype) {
1172                 case QUOTA_NL_IHARDWARN:
1173                         msg = " file limit reached.\r\n";
1174                         break;
1175                 case QUOTA_NL_ISOFTLONGWARN:
1176                         msg = " file quota exceeded too long.\r\n";
1177                         break;
1178                 case QUOTA_NL_ISOFTWARN:
1179                         msg = " file quota exceeded.\r\n";
1180                         break;
1181                 case QUOTA_NL_BHARDWARN:
1182                         msg = " block limit reached.\r\n";
1183                         break;
1184                 case QUOTA_NL_BSOFTLONGWARN:
1185                         msg = " block quota exceeded too long.\r\n";
1186                         break;
1187                 case QUOTA_NL_BSOFTWARN:
1188                         msg = " block quota exceeded.\r\n";
1189                         break;
1190         }
1191         tty_write_message(tty, msg);
1192         tty_kref_put(tty);
1193 }
1194 #endif
1195
1196 /*
1197  * Write warnings to the console and send warning messages over netlink.
1198  *
1199  * Note that this function can sleep.
1200  */
1201 static void flush_warnings(struct dquot *const *dquots, char *warntype)
1202 {
1203         struct dquot *dq;
1204         int i;
1205
1206         for (i = 0; i < MAXQUOTAS; i++) {
1207                 dq = dquots[i];
1208                 if (dq && warntype[i] != QUOTA_NL_NOWARN &&
1209                     !warning_issued(dq, warntype[i])) {
1210 #ifdef CONFIG_PRINT_QUOTA_WARNING
1211                         print_warning(dq, warntype[i]);
1212 #endif
1213                         quota_send_warning(dq->dq_type, dq->dq_id,
1214                                            dq->dq_sb->s_dev, warntype[i]);
1215                 }
1216         }
1217 }
1218
1219 static int ignore_hardlimit(struct dquot *dquot)
1220 {
1221         struct mem_dqinfo *info = &sb_dqopt(dquot->dq_sb)->info[dquot->dq_type];
1222
1223         return capable(CAP_SYS_RESOURCE) &&
1224                (info->dqi_format->qf_fmt_id != QFMT_VFS_OLD ||
1225                 !(info->dqi_flags & V1_DQF_RSQUASH));
1226 }
1227
1228 /* needs dq_data_lock */
1229 static int check_idq(struct dquot *dquot, qsize_t inodes, char *warntype)
1230 {
1231         qsize_t newinodes = dquot->dq_dqb.dqb_curinodes + inodes;
1232
1233         *warntype = QUOTA_NL_NOWARN;
1234         if (!sb_has_quota_limits_enabled(dquot->dq_sb, dquot->dq_type) ||
1235             test_bit(DQ_FAKE_B, &dquot->dq_flags))
1236                 return 0;
1237
1238         if (dquot->dq_dqb.dqb_ihardlimit &&
1239             newinodes > dquot->dq_dqb.dqb_ihardlimit &&
1240             !ignore_hardlimit(dquot)) {
1241                 *warntype = QUOTA_NL_IHARDWARN;
1242                 return -EDQUOT;
1243         }
1244
1245         if (dquot->dq_dqb.dqb_isoftlimit &&
1246             newinodes > dquot->dq_dqb.dqb_isoftlimit &&
1247             dquot->dq_dqb.dqb_itime &&
1248             get_seconds() >= dquot->dq_dqb.dqb_itime &&
1249             !ignore_hardlimit(dquot)) {
1250                 *warntype = QUOTA_NL_ISOFTLONGWARN;
1251                 return -EDQUOT;
1252         }
1253
1254         if (dquot->dq_dqb.dqb_isoftlimit &&
1255             newinodes > dquot->dq_dqb.dqb_isoftlimit &&
1256             dquot->dq_dqb.dqb_itime == 0) {
1257                 *warntype = QUOTA_NL_ISOFTWARN;
1258                 dquot->dq_dqb.dqb_itime = get_seconds() +
1259                     sb_dqopt(dquot->dq_sb)->info[dquot->dq_type].dqi_igrace;
1260         }
1261
1262         return 0;
1263 }
1264
1265 /* needs dq_data_lock */
1266 static int check_bdq(struct dquot *dquot, qsize_t space, int prealloc, char *warntype)
1267 {
1268         qsize_t tspace;
1269         struct super_block *sb = dquot->dq_sb;
1270
1271         *warntype = QUOTA_NL_NOWARN;
1272         if (!sb_has_quota_limits_enabled(sb, dquot->dq_type) ||
1273             test_bit(DQ_FAKE_B, &dquot->dq_flags))
1274                 return 0;
1275
1276         tspace = dquot->dq_dqb.dqb_curspace + dquot->dq_dqb.dqb_rsvspace
1277                 + space;
1278
1279         if (dquot->dq_dqb.dqb_bhardlimit &&
1280             tspace > dquot->dq_dqb.dqb_bhardlimit &&
1281             !ignore_hardlimit(dquot)) {
1282                 if (!prealloc)
1283                         *warntype = QUOTA_NL_BHARDWARN;
1284                 return -EDQUOT;
1285         }
1286
1287         if (dquot->dq_dqb.dqb_bsoftlimit &&
1288             tspace > dquot->dq_dqb.dqb_bsoftlimit &&
1289             dquot->dq_dqb.dqb_btime &&
1290             get_seconds() >= dquot->dq_dqb.dqb_btime &&
1291             !ignore_hardlimit(dquot)) {
1292                 if (!prealloc)
1293                         *warntype = QUOTA_NL_BSOFTLONGWARN;
1294                 return -EDQUOT;
1295         }
1296
1297         if (dquot->dq_dqb.dqb_bsoftlimit &&
1298             tspace > dquot->dq_dqb.dqb_bsoftlimit &&
1299             dquot->dq_dqb.dqb_btime == 0) {
1300                 if (!prealloc) {
1301                         *warntype = QUOTA_NL_BSOFTWARN;
1302                         dquot->dq_dqb.dqb_btime = get_seconds() +
1303                             sb_dqopt(sb)->info[dquot->dq_type].dqi_bgrace;
1304                 }
1305                 else
1306                         /*
1307                          * We don't allow preallocation to exceed softlimit so exceeding will
1308                          * be always printed
1309                          */
1310                         return -EDQUOT;
1311         }
1312
1313         return 0;
1314 }
1315
1316 static int info_idq_free(struct dquot *dquot, qsize_t inodes)
1317 {
1318         qsize_t newinodes;
1319
1320         if (test_bit(DQ_FAKE_B, &dquot->dq_flags) ||
1321             dquot->dq_dqb.dqb_curinodes <= dquot->dq_dqb.dqb_isoftlimit ||
1322             !sb_has_quota_limits_enabled(dquot->dq_sb, dquot->dq_type))
1323                 return QUOTA_NL_NOWARN;
1324
1325         newinodes = dquot->dq_dqb.dqb_curinodes - inodes;
1326         if (newinodes <= dquot->dq_dqb.dqb_isoftlimit)
1327                 return QUOTA_NL_ISOFTBELOW;
1328         if (dquot->dq_dqb.dqb_curinodes >= dquot->dq_dqb.dqb_ihardlimit &&
1329             newinodes < dquot->dq_dqb.dqb_ihardlimit)
1330                 return QUOTA_NL_IHARDBELOW;
1331         return QUOTA_NL_NOWARN;
1332 }
1333
1334 static int info_bdq_free(struct dquot *dquot, qsize_t space)
1335 {
1336         if (test_bit(DQ_FAKE_B, &dquot->dq_flags) ||
1337             dquot->dq_dqb.dqb_curspace <= dquot->dq_dqb.dqb_bsoftlimit)
1338                 return QUOTA_NL_NOWARN;
1339
1340         if (dquot->dq_dqb.dqb_curspace - space <= dquot->dq_dqb.dqb_bsoftlimit)
1341                 return QUOTA_NL_BSOFTBELOW;
1342         if (dquot->dq_dqb.dqb_curspace >= dquot->dq_dqb.dqb_bhardlimit &&
1343             dquot->dq_dqb.dqb_curspace - space < dquot->dq_dqb.dqb_bhardlimit)
1344                 return QUOTA_NL_BHARDBELOW;
1345         return QUOTA_NL_NOWARN;
1346 }
1347
1348 static int dquot_active(const struct inode *inode)
1349 {
1350         struct super_block *sb = inode->i_sb;
1351
1352         if (IS_NOQUOTA(inode))
1353                 return 0;
1354         return sb_any_quota_loaded(sb) & ~sb_any_quota_suspended(sb);
1355 }
1356
1357 /*
1358  * Initialize quota pointers in inode
1359  *
1360  * We do things in a bit complicated way but by that we avoid calling
1361  * dqget() and thus filesystem callbacks under dqptr_sem.
1362  *
1363  * It is better to call this function outside of any transaction as it
1364  * might need a lot of space in journal for dquot structure allocation.
1365  */
1366 static void __dquot_initialize(struct inode *inode, int type)
1367 {
1368         unsigned int id = 0;
1369         int cnt;
1370         struct dquot *got[MAXQUOTAS];
1371         struct super_block *sb = inode->i_sb;
1372         qsize_t rsv;
1373
1374         /* First test before acquiring mutex - solves deadlocks when we
1375          * re-enter the quota code and are already holding the mutex */
1376         if (!dquot_active(inode))
1377                 return;
1378
1379         /* First get references to structures we might need. */
1380         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1381                 got[cnt] = NULL;
1382                 if (type != -1 && cnt != type)
1383                         continue;
1384                 switch (cnt) {
1385                 case USRQUOTA:
1386                         id = inode->i_uid;
1387                         break;
1388                 case GRPQUOTA:
1389                         id = inode->i_gid;
1390                         break;
1391                 }
1392                 got[cnt] = dqget(sb, id, cnt);
1393         }
1394
1395         down_write(&sb_dqopt(sb)->dqptr_sem);
1396         if (IS_NOQUOTA(inode))
1397                 goto out_err;
1398         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1399                 if (type != -1 && cnt != type)
1400                         continue;
1401                 /* Avoid races with quotaoff() */
1402                 if (!sb_has_quota_active(sb, cnt))
1403                         continue;
1404                 /* We could race with quotaon or dqget() could have failed */
1405                 if (!got[cnt])
1406                         continue;
1407                 if (!inode->i_dquot[cnt]) {
1408                         inode->i_dquot[cnt] = got[cnt];
1409                         got[cnt] = NULL;
1410                         /*
1411                          * Make quota reservation system happy if someone
1412                          * did a write before quota was turned on
1413                          */
1414                         rsv = inode_get_rsv_space(inode);
1415                         if (unlikely(rsv))
1416                                 dquot_resv_space(inode->i_dquot[cnt], rsv);
1417                 }
1418         }
1419 out_err:
1420         up_write(&sb_dqopt(sb)->dqptr_sem);
1421         /* Drop unused references */
1422         dqput_all(got);
1423 }
1424
/* Initialize the quota pointers of @inode for every quota type. */
void dquot_initialize(struct inode *inode)
{
        const int all_types = -1;

        __dquot_initialize(inode, all_types);
}
EXPORT_SYMBOL(dquot_initialize);
1430
1431 /*
1432  *      Release all quotas referenced by inode
1433  */
1434 static void __dquot_drop(struct inode *inode)
1435 {
1436         int cnt;
1437         struct dquot *put[MAXQUOTAS];
1438
1439         down_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
1440         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1441                 put[cnt] = inode->i_dquot[cnt];
1442                 inode->i_dquot[cnt] = NULL;
1443         }
1444         up_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
1445         dqput_all(put);
1446 }
1447
1448 void dquot_drop(struct inode *inode)
1449 {
1450         int cnt;
1451
1452         if (IS_NOQUOTA(inode))
1453                 return;
1454
1455         /*
1456          * Test before calling to rule out calls from proc and such
1457          * where we are not allowed to block. Note that this is
1458          * actually reliable test even without the lock - the caller
1459          * must assure that nobody can come after the DQUOT_DROP and
1460          * add quota pointers back anyway.
1461          */
1462         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1463                 if (inode->i_dquot[cnt])
1464                         break;
1465         }
1466
1467         if (cnt < MAXQUOTAS)
1468                 __dquot_drop(inode);
1469 }
1470 EXPORT_SYMBOL(dquot_drop);
1471
1472 /*
1473  * inode_reserved_space is managed internally by quota, and protected by
1474  * i_lock similar to i_blocks+i_bytes.
1475  */
1476 static qsize_t *inode_reserved_space(struct inode * inode)
1477 {
1478         /* Filesystem must explicitly define it's own method in order to use
1479          * quota reservation interface */
1480         BUG_ON(!inode->i_sb->dq_op->get_reserved_space);
1481         return inode->i_sb->dq_op->get_reserved_space(inode);
1482 }
1483
1484 void inode_add_rsv_space(struct inode *inode, qsize_t number)
1485 {
1486         spin_lock(&inode->i_lock);
1487         *inode_reserved_space(inode) += number;
1488         spin_unlock(&inode->i_lock);
1489 }
1490 EXPORT_SYMBOL(inode_add_rsv_space);
1491
1492 void inode_claim_rsv_space(struct inode *inode, qsize_t number)
1493 {
1494         spin_lock(&inode->i_lock);
1495         *inode_reserved_space(inode) -= number;
1496         __inode_add_bytes(inode, number);
1497         spin_unlock(&inode->i_lock);
1498 }
1499 EXPORT_SYMBOL(inode_claim_rsv_space);
1500
1501 void inode_sub_rsv_space(struct inode *inode, qsize_t number)
1502 {
1503         spin_lock(&inode->i_lock);
1504         *inode_reserved_space(inode) -= number;
1505         spin_unlock(&inode->i_lock);
1506 }
1507 EXPORT_SYMBOL(inode_sub_rsv_space);
1508
1509 static qsize_t inode_get_rsv_space(struct inode *inode)
1510 {
1511         qsize_t ret;
1512
1513         if (!inode->i_sb->dq_op->get_reserved_space)
1514                 return 0;
1515         spin_lock(&inode->i_lock);
1516         ret = *inode_reserved_space(inode);
1517         spin_unlock(&inode->i_lock);
1518         return ret;
1519 }
1520
1521 static void inode_incr_space(struct inode *inode, qsize_t number,
1522                                 int reserve)
1523 {
1524         if (reserve)
1525                 inode_add_rsv_space(inode, number);
1526         else
1527                 inode_add_bytes(inode, number);
1528 }
1529
1530 static void inode_decr_space(struct inode *inode, qsize_t number, int reserve)
1531 {
1532         if (reserve)
1533                 inode_sub_rsv_space(inode, number);
1534         else
1535                 inode_sub_bytes(inode, number);
1536 }
1537
1538 /*
1539  * This functions updates i_blocks+i_bytes fields and quota information
1540  * (together with appropriate checks).
1541  *
1542  * NOTE: We absolutely rely on the fact that caller dirties the inode
1543  * (usually helpers in quotaops.h care about this) and holds a handle for
1544  * the current transaction so that dquot write and inode write go into the
1545  * same transaction.
1546  */
1547
1548 /*
1549  * This operation can block, but only after everything is updated
1550  */
1551 int __dquot_alloc_space(struct inode *inode, qsize_t number, int flags)
1552 {
1553         int cnt, ret = 0;
1554         char warntype[MAXQUOTAS];
1555         int warn = flags & DQUOT_SPACE_WARN;
1556         int reserve = flags & DQUOT_SPACE_RESERVE;
1557         int nofail = flags & DQUOT_SPACE_NOFAIL;
1558
1559         /*
1560          * First test before acquiring mutex - solves deadlocks when we
1561          * re-enter the quota code and are already holding the mutex
1562          */
1563         if (!dquot_active(inode)) {
1564                 inode_incr_space(inode, number, reserve);
1565                 goto out;
1566         }
1567
1568         down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1569         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
1570                 warntype[cnt] = QUOTA_NL_NOWARN;
1571
1572         spin_lock(&dq_data_lock);
1573         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1574                 if (!inode->i_dquot[cnt])
1575                         continue;
1576                 ret = check_bdq(inode->i_dquot[cnt], number, !warn,
1577                                 warntype+cnt);
1578                 if (ret && !nofail) {
1579                         spin_unlock(&dq_data_lock);
1580                         goto out_flush_warn;
1581                 }
1582         }
1583         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1584                 if (!inode->i_dquot[cnt])
1585                         continue;
1586                 if (reserve)
1587                         dquot_resv_space(inode->i_dquot[cnt], number);
1588                 else
1589                         dquot_incr_space(inode->i_dquot[cnt], number);
1590         }
1591         inode_incr_space(inode, number, reserve);
1592         spin_unlock(&dq_data_lock);
1593
1594         if (reserve)
1595                 goto out_flush_warn;
1596         mark_all_dquot_dirty(inode->i_dquot);
1597 out_flush_warn:
1598         flush_warnings(inode->i_dquot, warntype);
1599         up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1600 out:
1601         return ret;
1602 }
1603 EXPORT_SYMBOL(__dquot_alloc_space);
1604
1605 /*
1606  * This operation can block, but only after everything is updated
      *
      * Charge one inode to every dquot attached to @inode.
      *
      * Returns 0 when quota is not active on the inode or when the charge was
      * made; otherwise the non-zero result of check_idq(), in which case
      * dquot_incr_inodes() has not been called for any dquot.
1607  */
1608 int dquot_alloc_inode(const struct inode *inode)
1609 {
1610         int cnt, ret = 0;
1611         char warntype[MAXQUOTAS];
1612
1613         /* First test before acquiring mutex - solves deadlocks when we
1614          * re-enter the quota code and are already holding the mutex */
1615         if (!dquot_active(inode))
1616                 return 0;
1617         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
1618                 warntype[cnt] = QUOTA_NL_NOWARN;
1619         down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1620         spin_lock(&dq_data_lock);
             /* Pass 1: check every attached dquot before any count is raised */
1621         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1622                 if (!inode->i_dquot[cnt])
1623                         continue;
1624                 ret = check_idq(inode->i_dquot[cnt], 1, warntype + cnt);
1625                 if (ret)
1626                         goto warn_put_all;
1627         }
1628
             /* Pass 2: all checks passed, account the inode */
1629         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1630                 if (!inode->i_dquot[cnt])
1631                         continue;
1632                 dquot_incr_inodes(inode->i_dquot[cnt], 1);
1633         }
1634
1635 warn_put_all:
1636         spin_unlock(&dq_data_lock);
             /* Dirty the dquots only if they were changed; warnings go out either way */
1637         if (ret == 0)
1638                 mark_all_dquot_dirty(inode->i_dquot);
1639         flush_warnings(inode->i_dquot, warntype);
1640         up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1641         return ret;
1642 }
1643 EXPORT_SYMBOL(dquot_alloc_inode);
1644
1645 /*
1646  * Convert in-memory reserved quotas to real consumed quotas
      *
      * For every dquot attached to @inode, dquot_claim_reserved_space() is
      * called with @number, and the inode's own accounting is updated through
      * inode_claim_rsv_space(). When quota is not active on the inode only the
      * inode part is done. The dquots are marked dirty here.
      * NOTE(review): "nodirty" presumably refers to the inode not being marked
      * dirty by this function - confirm against callers.
      *
      * Always returns 0.
1647  */
1648 int dquot_claim_space_nodirty(struct inode *inode, qsize_t number)
1649 {
1650         int cnt;
1651
1652         if (!dquot_active(inode)) {
1653                 inode_claim_rsv_space(inode, number);
1654                 return 0;
1655         }
1656
1657         down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1658         spin_lock(&dq_data_lock);
1659         /* Claim reserved quotas to allocated quotas */
1660         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1661                 if (inode->i_dquot[cnt])
1662                         dquot_claim_reserved_space(inode->i_dquot[cnt],
1663                                                         number);
1664         }
1665         /* Update inode bytes */
1666         inode_claim_rsv_space(inode, number);
1667         spin_unlock(&dq_data_lock);
1668         mark_all_dquot_dirty(inode->i_dquot);
1669         up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1670         return 0;
1671 }
1672 EXPORT_SYMBOL(dquot_claim_space_nodirty);
1673
1674 /*
1675  * This operation can block, but only after everything is updated
      *
      * Give back @number units of space for @inode. With DQUOT_SPACE_RESERVE
      * set in @flags the reserved counters are reduced
      * (dquot_free_reserved_space()) and the dquots are not marked dirty;
      * otherwise used space is reduced (dquot_decr_space()) and the dquots are
      * marked dirty. The inode's own accounting is always updated through
      * inode_decr_space(); when quota is not active that is all that happens.
1676  */
1677 void __dquot_free_space(struct inode *inode, qsize_t number, int flags)
1678 {
1679         unsigned int cnt;
1680         char warntype[MAXQUOTAS];
1681         int reserve = flags & DQUOT_SPACE_RESERVE;
1682
1683         /* First test before acquiring mutex - solves deadlocks when we
1684          * re-enter the quota code and are already holding the mutex */
1685         if (!dquot_active(inode)) {
1686                 inode_decr_space(inode, number, reserve);
1687                 return;
1688         }
1689
1690         down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1691         spin_lock(&dq_data_lock);
             /*
              * NOTE(review): warntype[] is written only for slots that have a
              * dquot; flush_warnings() presumably ignores the other slots -
              * confirm.
              */
1692         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1693                 if (!inode->i_dquot[cnt])
1694                         continue;
1695                 warntype[cnt] = info_bdq_free(inode->i_dquot[cnt], number);
1696                 if (reserve)
1697                         dquot_free_reserved_space(inode->i_dquot[cnt], number);
1698                 else
1699                         dquot_decr_space(inode->i_dquot[cnt], number);
1700         }
1701         inode_decr_space(inode, number, reserve);
1702         spin_unlock(&dq_data_lock);
1703
             /* Releasing a reservation skips marking the dquots dirty */
1704         if (reserve)
1705                 goto out_unlock;
1706         mark_all_dquot_dirty(inode->i_dquot);
1707 out_unlock:
1708         flush_warnings(inode->i_dquot, warntype);
1709         up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1710 }
1711 EXPORT_SYMBOL(__dquot_free_space);
1712
1713 /*
1714  * This operation can block, but only after everything is updated
      *
      * Take one inode off every dquot attached to @inode, mark those dquots
      * dirty and flush the warnings computed by info_idq_free(). Does nothing
      * when quota is not active on the inode.
1715  */
1716 void dquot_free_inode(const struct inode *inode)
1717 {
1718         unsigned int cnt;
1719         char warntype[MAXQUOTAS];
1720
1721         /* First test before acquiring mutex - solves deadlocks when we
1722          * re-enter the quota code and are already holding the mutex */
1723         if (!dquot_active(inode))
1724                 return;
1725
1726         down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1727         spin_lock(&dq_data_lock);
             /*
              * NOTE(review): warntype[] is written only for slots that have a
              * dquot; flush_warnings() presumably ignores the other slots -
              * confirm.
              */
1728         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1729                 if (!inode->i_dquot[cnt])
1730                         continue;
1731                 warntype[cnt] = info_idq_free(inode->i_dquot[cnt], 1);
1732                 dquot_decr_inodes(inode->i_dquot[cnt], 1);
1733         }
1734         spin_unlock(&dq_data_lock);
1735         mark_all_dquot_dirty(inode->i_dquot);
1736         flush_warnings(inode->i_dquot, warntype);
1737         up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
1738 }
1739 EXPORT_SYMBOL(dquot_free_inode);
1740
1741 /*
1742  * Transfer the number of inodes and blocks from one diskquota to another.
1743  * On success, dquot references in transfer_to are consumed and references
1744  * to original dquots that need to be released are placed there. On failure,
1745  * references are kept untouched.
1746  *
1747  * This operation can block, but only after everything is updated
1748  * A transaction must be started when entering this function.
1749  *
      * Returns 0 on success or when the inode is IS_NOQUOTA(); otherwise the
      * non-zero result of check_idq()/check_bdq() on a destination dquot, in
      * which case no usage has been moved and inode->i_dquot[] is unchanged.
1750  */
1751 int __dquot_transfer(struct inode *inode, struct dquot **transfer_to)
1752 {
1753         qsize_t space, cur_space;
1754         qsize_t rsv_space = 0;
1755         struct dquot *transfer_from[MAXQUOTAS] = {};
1756         int cnt, ret = 0;
             /* is_valid[cnt] is set for the quota types that really get transferred */
1757         char is_valid[MAXQUOTAS] = {};
1758         char warntype_to[MAXQUOTAS];
1759         char warntype_from_inodes[MAXQUOTAS], warntype_from_space[MAXQUOTAS];
1760
1761         /* First test before acquiring mutex - solves deadlocks when we
1762          * re-enter the quota code and are already holding the mutex */
1763         if (IS_NOQUOTA(inode))
1764                 return 0;
1765         /* Initialize the arrays */
1766         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
1767                 warntype_to[cnt] = QUOTA_NL_NOWARN;
             /* Write side of dqptr_sem: inode->i_dquot[] is rewritten below */
1768         down_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
1769         if (IS_NOQUOTA(inode)) {        /* File without quota accounting? */
1770                 up_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
1771                 return 0;
1772         }
1773         spin_lock(&dq_data_lock);
             /*
              * The limit check and the "freed" warnings use used + reserved
              * space together; the counters themselves are moved separately.
              */
1774         cur_space = inode_get_bytes(inode);
1775         rsv_space = inode_get_rsv_space(inode);
1776         space = cur_space + rsv_space;
1777         /* Build the transfer_from list and check the limits */
1778         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1779                 /*
1780                  * Skip changes for same uid or gid or for turned off quota-type.
1781                  */
1782                 if (!transfer_to[cnt])
1783                         continue;
1784                 /* Avoid races with quotaoff() */
1785                 if (!sb_has_quota_active(inode->i_sb, cnt))
1786                         continue;
1787                 is_valid[cnt] = 1;
1788                 transfer_from[cnt] = inode->i_dquot[cnt];
1789                 ret = check_idq(transfer_to[cnt], 1, warntype_to + cnt);
1790                 if (ret)
1791                         goto over_quota;
1792                 ret = check_bdq(transfer_to[cnt], space, 0, warntype_to + cnt);
1793                 if (ret)
1794                         goto over_quota;
1795         }
1796
1797         /*
1798          * Finally perform the needed transfer from transfer_from to transfer_to
1799          */
1800         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1801                 if (!is_valid[cnt])
1802                         continue;
1803                 /* Due to IO error we might not have transfer_from[] structure */
1804                 if (transfer_from[cnt]) {
1805                         warntype_from_inodes[cnt] =
1806                                 info_idq_free(transfer_from[cnt], 1);
1807                         warntype_from_space[cnt] =
1808                                 info_bdq_free(transfer_from[cnt], space);
1809                         dquot_decr_inodes(transfer_from[cnt], 1);
1810                         dquot_decr_space(transfer_from[cnt], cur_space);
1811                         dquot_free_reserved_space(transfer_from[cnt],
1812                                                   rsv_space);
1813                 }
1814
1815                 dquot_incr_inodes(transfer_to[cnt], 1);
1816                 dquot_incr_space(transfer_to[cnt], cur_space);
1817                 dquot_resv_space(transfer_to[cnt], rsv_space);
1818
1819                 inode->i_dquot[cnt] = transfer_to[cnt];
1820         }
1821         spin_unlock(&dq_data_lock);
1822         up_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
1823
             /* Dirtying and warnings are done after both locks are dropped */
1824         mark_all_dquot_dirty(transfer_from);
1825         mark_all_dquot_dirty(transfer_to);
1826         flush_warnings(transfer_to, warntype_to);
1827         flush_warnings(transfer_from, warntype_from_inodes);
1828         flush_warnings(transfer_from, warntype_from_space);
1829         /* Pass back references to put */
1830         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
1831                 if (is_valid[cnt])
1832                         transfer_to[cnt] = transfer_from[cnt];
1833         return 0;
1834 over_quota:
1835         spin_unlock(&dq_data_lock);
1836         up_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
1837         flush_warnings(transfer_to, warntype_to);
1838         return ret;
1839 }
1840 EXPORT_SYMBOL(__dquot_transfer);
1841
1842 /* Wrapper for transferring ownership of an inode for uid/gid only
1843  * Called from FSXXX_setattr()
      *
      * Looks up the dquot for the new uid and/or gid, but only when the
      * matching ATTR_UID/ATTR_GID bit is set in @iattr and the id differs from
      * the inode's current one, and hands the array to __dquot_transfer().
      * Whatever is left in transfer_to[] afterwards is released with
      * dqput_all().
      *
      * Returns 0 when quota is not active on the inode, otherwise the result
      * of __dquot_transfer().
1844  */
1845 int dquot_transfer(struct inode *inode, struct iattr *iattr)
1846 {
1847         struct dquot *transfer_to[MAXQUOTAS] = {};
1848         struct super_block *sb = inode->i_sb;
1849         int ret;
1850
1851         if (!dquot_active(inode))
1852                 return 0;
1853
1854         if (iattr->ia_valid & ATTR_UID && iattr->ia_uid != inode->i_uid)
1855                 transfer_to[USRQUOTA] = dqget(sb, iattr->ia_uid, USRQUOTA);
1856         if (iattr->ia_valid & ATTR_GID && iattr->ia_gid != inode->i_gid)
1857                 transfer_to[GRPQUOTA] = dqget(sb, iattr->ia_gid, GRPQUOTA);
1858
1859         ret = __dquot_transfer(inode, transfer_to);
1860         dqput_all(transfer_to);
1861         return ret;
1862 }
1863 EXPORT_SYMBOL(dquot_transfer);
1864
1865 /*
1866  * Write info of quota file to disk
      *
      * Calls the ->write_file_info() operation registered for @type with
      * dqio_mutex held and returns its result.
1867  */
1868 int dquot_commit_info(struct super_block *sb, int type)
1869 {
1870         int ret;
1871         struct quota_info *dqopt = sb_dqopt(sb);
1872
1873         mutex_lock(&dqopt->dqio_mutex);
1874         ret = dqopt->ops[type]->write_file_info(sb, type);
1875         mutex_unlock(&dqopt->dqio_mutex);
1876         return ret;
1877 }
1878 EXPORT_SYMBOL(dquot_commit_info);
1879
1880 /*
1881  * Definitions of diskquota operations.
      *
      * Exported, read-only table that points each dquot_operations callback
      * at the corresponding generic dquot_*() routine.
1882  */
1883 const struct dquot_operations dquot_operations = {
1884         .write_dquot    = dquot_commit,
1885         .acquire_dquot  = dquot_acquire,
1886         .release_dquot  = dquot_release,
1887         .mark_dirty     = dquot_mark_dquot_dirty,
1888         .write_info     = dquot_commit_info,
1889         .alloc_dquot    = dquot_alloc,
1890         .destroy_dquot  = dquot_destroy,
1891 };
1892 EXPORT_SYMBOL(dquot_operations);
1893
1894 /*
1895  * Generic helper for ->open on filesystems supporting disk quotas.
      *
      * Runs generic_file_open() and, if that succeeded and the file is opened
      * with FMODE_WRITE, calls dquot_initialize() on the inode. Returns the
      * result of generic_file_open().
1896  */
1897 int dquot_file_open(struct inode *inode, struct file *file)
1898 {
1899         int error;
1900
1901         error = generic_file_open(inode, file);
1902         if (!error && (file->f_mode & FMODE_WRITE))
1903                 dquot_initialize(inode);
1904         return error;
1905 }
1906 EXPORT_SYMBOL(dquot_file_open);
1907
1908 /*
1909  * Turn quota off on a device. type == -1 ==> quotaoff for all types (umount)
      *
      * @flags says what to switch off: DQUOT_USAGE_ENABLED and/or
      * DQUOT_LIMITS_ENABLED, or DQUOT_SUSPENDED on its own to suspend quota.
      *
      * Returns -EINVAL for the flag combinations rejected at the top, -EBUSY
      * when suspending and a quota file inode has i_nlink == 0, otherwise 0
      * (including the case where no quota is loaded at all).
1910  */
1911 int dquot_disable(struct super_block *sb, int type, unsigned int flags)
1912 {
1913         int cnt, ret = 0;
1914         struct quota_info *dqopt = sb_dqopt(sb);
             /* Quota file inodes to clean up once dqonoff_mutex is dropped */
1915         struct inode *toputinode[MAXQUOTAS];
1916
1917         /* Cannot turn off usage accounting without turning off limits, or
1918          * suspend quotas and simultaneously turn quotas off. */
1919         if ((flags & DQUOT_USAGE_ENABLED && !(flags & DQUOT_LIMITS_ENABLED))
1920             || (flags & DQUOT_SUSPENDED && flags & (DQUOT_LIMITS_ENABLED |
1921             DQUOT_USAGE_ENABLED)))
1922                 return -EINVAL;
1923
1924         /* We need to serialize quota_off() for device */
1925         mutex_lock(&dqopt->dqonoff_mutex);
1926
1927         /*
1928          * Skip everything if there's nothing to do. We have to do this because
1929          * sometimes we are called when fill_super() failed and calling
1930          * sync_fs() in such cases does no good.
1931          */
1932         if (!sb_any_quota_loaded(sb)) {
1933                 mutex_unlock(&dqopt->dqonoff_mutex);
1934                 return 0;
1935         }
1936         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
1937                 toputinode[cnt] = NULL;
1938                 if (type != -1 && cnt != type)
1939                         continue;
1940                 if (!sb_has_quota_loaded(sb, cnt))
1941                         continue;
1942
1943                 if (flags & DQUOT_SUSPENDED) {
1944                         spin_lock(&dq_state_lock);
1945                         dqopt->flags |=
1946                                 dquot_state_flag(DQUOT_SUSPENDED, cnt);
1947                         spin_unlock(&dq_state_lock);
1948                 } else {
1949                         spin_lock(&dq_state_lock);
1950                         dqopt->flags &= ~dquot_state_flag(flags, cnt);
1951                         /* Turning off suspended quotas? */
1952                         if (!sb_has_quota_loaded(sb, cnt) &&
1953                             sb_has_quota_suspended(sb, cnt)) {
1954                                 dqopt->flags &= ~dquot_state_flag(
1955                                                         DQUOT_SUSPENDED, cnt);
1956                                 spin_unlock(&dq_state_lock);
                                     /* Only the kept file pointer is left to release here */
1957                                 iput(dqopt->files[cnt]);
1958                                 dqopt->files[cnt] = NULL;
1959                                 continue;
1960                         }
1961                         spin_unlock(&dq_state_lock);
1962                 }
1963
1964                 /* We still have to keep quota loaded? */
1965                 if (sb_has_quota_loaded(sb, cnt) && !(flags & DQUOT_SUSPENDED))
1966                         continue;
1967
1968                 /* Note: these are blocking operations */
1969                 drop_dquot_ref(sb, cnt);
1970                 invalidate_dquots(sb, cnt);
1971                 /*
1972                  * Now all dquots should be invalidated, all writes done so we
1973                  * should be only users of the info. No locks needed.
1974                  */
1975                 if (info_dirty(&dqopt->info[cnt]))
1976                         sb->dq_op->write_info(sb, cnt);
1977                 if (dqopt->ops[cnt]->free_file_info)
1978                         dqopt->ops[cnt]->free_file_info(sb, cnt);
1979                 put_quota_format(dqopt->info[cnt].dqi_format);
1980
                     /* Remember the inode; files[cnt] is cleared only if nothing stays loaded */
1981                 toputinode[cnt] = dqopt->files[cnt];
1982                 if (!sb_has_quota_loaded(sb, cnt))
1983                         dqopt->files[cnt] = NULL;
1984                 dqopt->info[cnt].dqi_flags = 0;
1985                 dqopt->info[cnt].dqi_igrace = 0;
1986                 dqopt->info[cnt].dqi_bgrace = 0;
1987                 dqopt->ops[cnt] = NULL;
1988         }
1989         mutex_unlock(&dqopt->dqonoff_mutex);
1990
1991         /* Skip syncing and setting flags if quota files are hidden */
1992         if (dqopt->flags & DQUOT_QUOTA_SYS_FILE)
1993                 goto put_inodes;
1994
1995         /* Sync the superblock so that buffers with quota data are written to
1996          * disk (and so userspace sees correct data afterwards). */
1997         if (sb->s_op->sync_fs)
1998                 sb->s_op->sync_fs(sb, 1);
1999         sync_blockdev(sb->s_bdev);
2000         /* Now the quota files are just ordinary files and we can set the
2001          * inode flags back. Moreover we discard the pagecache so that
2002          * userspace sees the writes we did bypassing the pagecache. We
2003          * must also discard the blockdev buffers so that we see the
2004          * changes done by userspace on the next quotaon() */
2005         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
2006                 if (toputinode[cnt]) {
2007                         mutex_lock(&dqopt->dqonoff_mutex);
2008                         /* If quota was reenabled in the meantime, we have
2009                          * nothing to do */
2010                         if (!sb_has_quota_loaded(sb, cnt)) {
2011                                 mutex_lock_nested(&toputinode[cnt]->i_mutex,
2012                                                   I_MUTEX_QUOTA);
2013                                 toputinode[cnt]->i_flags &= ~(S_IMMUTABLE |
2014                                   S_NOATIME | S_NOQUOTA);
2015                                 truncate_inode_pages(&toputinode[cnt]->i_data,
2016                                                      0);
2017                                 mutex_unlock(&toputinode[cnt]->i_mutex);
2018                                 mark_inode_dirty_sync(toputinode[cnt]);
2019                         }
2020                         mutex_unlock(&dqopt->dqonoff_mutex);
2021                 }
2022         if (sb->s_bdev)
2023                 invalidate_bdev(sb->s_bdev);
2024 put_inodes:
2025         for (cnt = 0; cnt < MAXQUOTAS; cnt++)
2026                 if (toputinode[cnt]) {
2027                         /* On remount RO, we keep the inode pointer so that we
2028                          * can reenable quota on the subsequent remount RW. We
2029                          * have to check 'flags' variable and not use sb_has_
2030                          * function because another quotaon / quotaoff could
2031                          * change global state before we got here. We refuse
2032                          * to suspend quotas when there is pending delete on
2033                          * the quota file... */
2034                         if (!(flags & DQUOT_SUSPENDED))
2035                                 iput(toputinode[cnt]);
2036                         else if (!toputinode[cnt]->i_nlink)
2037                                 ret = -EBUSY;
2038                 }
2039         return ret;
2040 }
2041 EXPORT_SYMBOL(dquot_disable);
2042
     /*
      * Turn quota of @type off completely: calls dquot_disable() with both
      * DQUOT_USAGE_ENABLED and DQUOT_LIMITS_ENABLED and returns its result.
      */
2043 int dquot_quota_off(struct super_block *sb, int type)
2044 {
2045         return dquot_disable(sb, type,
2046                              DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED);
2047 }
2048 EXPORT_SYMBOL(dquot_quota_off);
2049
2050 /*
2051  *      Turn quotas on on a device
2052  */
2053
2054 /*
2055  * Helper function to turn quotas on when we already have the inode of
2056  * quota file and no quota information is loaded.
      *
      * Returns 0 on success. On success the format reference obtained from
      * find_quota_format() is stored in dqi_format and is not dropped here.
      * Errors:
      *   -ESRCH   no quota format registered for @format_id
      *   -EACCES  @inode is not a regular file
      *   -EROFS   @inode is read-only
      *   -EINVAL  filesystem lacks ->quota_read/->quota_write, @flags lacks
      *            DQUOT_USAGE_ENABLED, or ->check_quota_file() rejected the file
      *   -EBUSY   quota of @type is already loaded
      *   -EIO     igrab() on the quota inode failed
      *   or the negative result of ->read_file_info().
2057  */
2058 static int vfs_load_quota_inode(struct inode *inode, int type, int format_id,
2059         unsigned int flags)
2060 {
2061         struct quota_format_type *fmt = find_quota_format(format_id);
2062         struct super_block *sb = inode->i_sb;
2063         struct quota_info *dqopt = sb_dqopt(sb);
2064         int error;
             /* Stays -1 unless the inode flags get changed below; see out_lock */
2065         int oldflags = -1;
2066
2067         if (!fmt)
2068                 return -ESRCH;
2069         if (!S_ISREG(inode->i_mode)) {
2070                 error = -EACCES;
2071                 goto out_fmt;
2072         }
2073         if (IS_RDONLY(inode)) {
2074                 error = -EROFS;
2075                 goto out_fmt;
2076         }
2077         if (!sb->s_op->quota_write || !sb->s_op->quota_read) {
2078                 error = -EINVAL;
2079                 goto out_fmt;
2080         }
2081         /* Usage always has to be set... */
2082         if (!(flags & DQUOT_USAGE_ENABLED)) {
2083                 error = -EINVAL;
2084                 goto out_fmt;
2085         }
2086
2087         if (!(dqopt->flags & DQUOT_QUOTA_SYS_FILE)) {
2088                 /* As we bypass the pagecache we must now flush all the
2089                  * dirty data and invalidate caches so that kernel sees
2090                  * changes from userspace. It is not enough to just flush
2091                  * the quota file since if blocksize < pagesize, invalidation
2092                  * of the cache could fail because of other unrelated dirty
2093                  * data */
2094                 sync_filesystem(sb);
2095                 invalidate_bdev(sb->s_bdev);
2096         }
2097         mutex_lock(&dqopt->dqonoff_mutex);
2098         if (sb_has_quota_loaded(sb, type)) {
2099                 error = -EBUSY;
2100                 goto out_lock;
2101         }
2102
2103         if (!(dqopt->flags & DQUOT_QUOTA_SYS_FILE)) {
2104                 /* We don't want quota and atime on quota files (deadlocks
2105                  * possible) Also nobody should write to the file - we use
2106                  * special IO operations which ignore the immutable bit. */
2107                 mutex_lock_nested(&inode->i_mutex, I_MUTEX_QUOTA);
2108                 oldflags = inode->i_flags & (S_NOATIME | S_IMMUTABLE |
2109                                              S_NOQUOTA);
2110                 inode->i_flags |= S_NOQUOTA | S_NOATIME | S_IMMUTABLE;
2111                 mutex_unlock(&inode->i_mutex);
2112                 /*
2113                  * When S_NOQUOTA is set, remove dquot references as no more
2114                  * references can be added
2115                  */
2116                 __dquot_drop(inode);
2117         }
2118
             /* error is preset before each step so a bare goto reports the right code */
2119         error = -EIO;
2120         dqopt->files[type] = igrab(inode);
2121         if (!dqopt->files[type])
2122                 goto out_lock;
2123         error = -EINVAL;
2124         if (!fmt->qf_ops->check_quota_file(sb, type))
2125                 goto out_file_init;
2126
2127         dqopt->ops[type] = fmt->qf_ops;
2128         dqopt->info[type].dqi_format = fmt;
2129         dqopt->info[type].dqi_fmt_id = format_id;
2130         INIT_LIST_HEAD(&dqopt->info[type].dqi_dirty_list);
2131         mutex_lock(&dqopt->dqio_mutex);
2132         error = dqopt->ops[type]->read_file_info(sb, type);
2133         if (error < 0) {
2134                 mutex_unlock(&dqopt->dqio_mutex);
2135                 goto out_file_init;
2136         }
2137         mutex_unlock(&dqopt->dqio_mutex);
2138         spin_lock(&dq_state_lock);
2139         dqopt->flags |= dquot_state_flag(flags, type);
2140         spin_unlock(&dq_state_lock);
2141
2142         add_dquot_ref(sb, type);
2143         mutex_unlock(&dqopt->dqonoff_mutex);
2144
2145         return 0;
2146
2147 out_file_init:
             /* Balances the igrab() above */
2148         dqopt->files[type] = NULL;
2149         iput(inode);
2150 out_lock:
2151         if (oldflags != -1) {
2152                 mutex_lock_nested(&inode->i_mutex, I_MUTEX_QUOTA);
2153                 /* Set the flags back (in the case of accidental quotaon()
2154                  * on a wrong file we don't want to mess up the flags) */
2155                 inode->i_flags &= ~(S_NOATIME | S_NOQUOTA | S_IMMUTABLE);
2156                 inode->i_flags |= oldflags;
2157                 mutex_unlock(&inode->i_mutex);
2158         }
2159         mutex_unlock(&dqopt->dqonoff_mutex);
2160 out_fmt:
2161         put_quota_format(fmt);
2162
2163         return error; 
2164 }
2165
2166 /*
      * Reenable quotas on remount RW
      *
      * For @type, or for every quota type when @type == -1: if the type is
      * suspended, take the quota file inode out of dqopt->files[], remember
      * which of usage/limits were enabled, clear all state flags of the type
      * and load the quota file again through vfs_load_quota_inode().
      *
      * NOTE(review): ret is overwritten on every iteration, so with
      * @type == -1 only the result for the last resumed type is returned.
      */
2167 int dquot_resume(struct super_block *sb, int type)
2168 {
2169         struct quota_info *dqopt = sb_dqopt(sb);
2170         struct inode *inode;
2171         int ret = 0, cnt;
2172         unsigned int flags;
2173
2174         for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
2175                 if (type != -1 && cnt != type)
2176                         continue;
2177
2178                 mutex_lock(&dqopt->dqonoff_mutex);
2179                 if (!sb_has_quota_suspended(sb, cnt)) {
2180                         mutex_unlock(&dqopt->dqonoff_mutex);
2181                         continue;
2182                 }
2183                 inode = dqopt->files[cnt];
2184                 dqopt->files[cnt] = NULL;
2185                 spin_lock(&dq_state_lock);
2186                 flags = dqopt->flags & dquot_state_flag(DQUOT_USAGE_ENABLED |
2187                                                         DQUOT_LIMITS_ENABLED,
2188                                                         cnt);
2189                 dqopt->flags &= ~dquot_state_flag(DQUOT_STATE_FLAGS, cnt);
2190                 spin_unlock(&dq_state_lock);
2191                 mutex_unlock(&dqopt->dqonoff_mutex);
2192
                     /* Turn the per-type state bits back into generic DQUOT_* flags */
2193                 flags = dquot_generic_flag(flags, cnt);
2194                 ret = vfs_load_quota_inode(inode, cnt,
2195                                 dqopt->info[cnt].dqi_fmt_id, flags);
                     /* Release the pointer that was taken out of dqopt->files[cnt] above */
2196                 iput(inode);
2197         }
2198
2199         return ret;
2200 }
2201 EXPORT_SYMBOL(dquot_resume);
2202
     /*
      * Turn quota of @type on using the file at @path, with both usage and
      * limits enabled. Returns the security_quota_on() error if that hook
      * refuses, -EXDEV if the file is not on @sb, otherwise the result of
      * vfs_load_quota_inode().
      */
2203 int dquot_quota_on(struct super_block *sb, int type, int format_id,
2204                    struct path *path)
2205 {
2206         int error = security_quota_on(path->dentry);
2207         if (error)
2208                 return error;
2209         /* Quota file not on the same filesystem? */
2210         if (path->mnt->mnt_sb != sb)
2211                 error = -EXDEV;
2212         else
2213                 error = vfs_load_quota_inode(path->dentry->d_inode, type,
2214                                              format_id, DQUOT_USAGE_ENABLED |
2215                                              DQUOT_LIMITS_ENABLED);
2216         return error;
2217 }
2218 EXPORT_SYMBOL(dquot_quota_on);
2219
2220 /*
2221  * More powerful function for turning on quotas allowing setting
2222  * of individual quota flags
      *
      * If quota of @type is already loaded, only the state flags are updated
      * (under dqonoff_mutex); asking for usage or limits that are already
      * enabled returns -EBUSY. Otherwise the quota file is loaded through
      * vfs_load_quota_inode() and its result is returned.
      * @flags == 0 is a no-op returning 0; DQUOT_SUSPENDED in @flags hits
      * BUG_ON().
2223  */
2224 int dquot_enable(struct inode *inode, int type, int format_id,
2225                  unsigned int flags)
2226 {
2227         int ret = 0;
2228         struct super_block *sb = inode->i_sb;
2229         struct quota_info *dqopt = sb_dqopt(sb);
2230
2231         /* Just unsuspend quotas? */
2232         BUG_ON(flags & DQUOT_SUSPENDED);
2233
2234         if (!flags)
2235                 return 0;
2236         /* Just updating flags needed? */
             /* This first check runs without dqonoff_mutex; it is repeated below */
2237         if (sb_has_quota_loaded(sb, type)) {
2238                 mutex_lock(&dqopt->dqonoff_mutex);
2239                 /* Now do a reliable test... */
2240                 if (!sb_has_quota_loaded(sb, type)) {
2241                         mutex_unlock(&dqopt->dqonoff_mutex);
2242                         goto load_quota;
2243                 }
2244                 if (flags & DQUOT_USAGE_ENABLED &&
2245                     sb_has_quota_usage_enabled(sb, type)) {
2246                         ret = -EBUSY;
2247                         goto out_lock;
2248                 }
2249                 if (flags & DQUOT_LIMITS_ENABLED &&
2250                     sb_has_quota_limits_enabled(sb, type)) {
2251                         ret = -EBUSY;
2252                         goto out_lock;
2253                 }
2254                 spin_lock(&dq_state_lock);
2255                 sb_dqopt(sb)->flags |= dquot_state_flag(flags, type);
2256                 spin_unlock(&dq_state_lock);
2257 out_lock:
2258                 mutex_unlock(&dqopt->dqonoff_mutex);
2259                 return ret;
2260         }
2261
2262 load_quota:
2263         return vfs_load_quota_inode(inode, type, format_id, flags);
2264 }
2265 EXPORT_SYMBOL(dquot_enable);
2266
2267 /*
2268  * This function is used when filesystem needs to initialize quotas
2269  * during mount time.
      *
      * Looks up @qf_name in the root directory of @sb (holding the root
      * inode's i_mutex around the lookup) and loads it as the quota file for
      * @type with both usage and limits enabled.
      *
      * Returns the lookup error, -ENOENT if the name has no inode, the
      * security_quota_on() error, or the result of vfs_load_quota_inode().
2270  */
2271 int dquot_quota_on_mount(struct super_block *sb, char *qf_name,
2272                 int format_id, int type)
2273 {
2274         struct dentry *dentry;
2275         int error;
2276
2277         mutex_lock(&sb->s_root->d_inode->i_mutex);
2278         dentry = lookup_one_len(qf_name, sb->s_root, strlen(qf_name));
2279         mutex_unlock(&sb->s_root->d_inode->i_mutex);
2280         if (IS_ERR(dentry))
2281                 return PTR_ERR(dentry);
2282
2283         if (!dentry->d_inode) {
2284                 error = -ENOENT;
2285                 goto out;
2286         }
2287
2288         error = security_quota_on(dentry);
2289         if (!error)
2290                 error = vfs_load_quota_inode(dentry->d_inode, type, format_id,
2291                                 DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED);
2292
2293 out:
             /* The dentry from the lookup is released on success and failure alike */
2294         dput(dentry);
2295         return error;
2296 }
2297 EXPORT_SYMBOL(dquot_quota_on_mount);
2298
     /* Quota blocks to space: shift @blocks left by QIF_DQBLKSIZE_BITS */
2299 static inline qsize_t qbtos(qsize_t blocks)
2300 {
2301         return blocks << QIF_DQBLKSIZE_BITS;
2302 }
2303
     /*
      * Space to quota blocks. Adding QIF_DQBLKSIZE - 1 before the shift rounds
      * up to a whole block (assuming QIF_DQBLKSIZE == 1 << QIF_DQBLKSIZE_BITS
      * - TODO confirm against the header).
      */
2304 static inline qsize_t stoqb(qsize_t space)
2305 {
2306         return (space + QIF_DQBLKSIZE - 1) >> QIF_DQBLKSIZE_BITS;
2307 }
2308
2309 /*
      * Generic routine for getting common part of quota structure
      *
      * Zeroes @di and fills it from @dquot: version, user/group flag and id
      * first, then limits, usage and timers copied with dq_data_lock held.
      * Block limits are passed through stoqb(); d_bcount is reported as used
      * plus reserved space.
      */
2310 static void do_get_dqblk(struct dquot *dquot, struct fs_disk_quota *di)
2311 {
2312         struct mem_dqblk *dm = &dquot->dq_dqb;
2313
2314         memset(di, 0, sizeof(*di));
2315         di->d_version = FS_DQUOT_VERSION;
2316         di->d_flags = dquot->dq_type == USRQUOTA ?
2317                         FS_USER_QUOTA : FS_GROUP_QUOTA;
2318         di->d_id = dquot->dq_id;
2319
2320         spin_lock(&dq_data_lock);
2321         di->d_blk_hardlimit = stoqb(dm->dqb_bhardlimit);
2322         di->d_blk_softlimit = stoqb(dm->dqb_bsoftlimit);
2323         di->d_ino_hardlimit = dm->dqb_ihardlimit;
2324         di->d_ino_softlimit = dm->dqb_isoftlimit;
2325         di->d_bcount = dm->dqb_curspace + dm->dqb_rsvspace;
2326         di->d_icount = dm->dqb_curinodes;
2327         di->d_btimer = dm->dqb_btime;
2328         di->d_itimer = dm->dqb_itime;
2329         spin_unlock(&dq_data_lock);
2330 }
2331
     /*
      * Look up the dquot for (@sb, @id, @type) with dqget(), copy its values
      * into @di through do_get_dqblk() and drop the reference again.
      * Returns -ESRCH when dqget() gives no dquot, otherwise 0.
      */
2332 int dquot_get_dqblk(struct super_block *sb, int type, qid_t id,
2333                     struct fs_disk_quota *di)
2334 {
2335         struct dquot *dquot;
2336
2337         dquot = dqget(sb, id, type);
2338         if (!dquot)
2339                 return -ESRCH;
2340         do_get_dqblk(dquot, di);
2341         dqput(dquot);
2342
2343         return 0;
2344 }
2345 EXPORT_SYMBOL(dquot_get_dqblk);
2346
     /*
      * d_fieldmask bits that do_set_dqblk() accepts; a request with any other
      * bit set is rejected there with -EINVAL.
      */
2347 #define VFS_FS_DQ_MASK \
2348         (FS_DQ_BCOUNT | FS_DQ_BSOFT | FS_DQ_BHARD | \
2349          FS_DQ_ICOUNT | FS_DQ_ISOFT | FS_DQ_IHARD | \
2350          FS_DQ_BTIMER | FS_DQ_ITIMER)
2351
2352 /* Generic routine for setting common part of quota structure */
2353 static int do_set_dqblk(struct dquot *dquot, struct fs_disk_quota *di)
2354 {
2355         struct mem_dqblk *dm = &dquot->dq_dqb;
2356         int check_blim = 0, check_ilim = 0;
2357         struct mem_dqinfo *dqi = &sb_dqopt(dquot->dq_sb)->info[dquot->dq_type];
2358
2359         if (di->d_fieldmask & ~VFS_FS_DQ_MASK)
2360                 return -EINVAL;
2361
2362         if (((di->d_fieldmask & FS_DQ_BSOFT) &&
2363              (di->d_blk_softlimit > dqi->dqi_maxblimit)) ||
2364             ((di->d_fieldmask & FS_DQ_BHARD) &&
2365              (di->d_blk_hardlimit > dqi->dqi_maxblimit)) ||
2366             ((di->d_fieldmask & FS_DQ_ISOFT) &&
2367              (di->d_ino_softlimit > dqi->dqi_maxilimit)) ||
2368             ((di->d_fieldmask & FS_DQ_IHARD) &&
2369              (di->d_ino_hardlimit > dqi->dqi_maxilimit)))
2370                 return -ERANGE;
2371
2372         spin_lock(&dq_data_lock);
2373         if (di->d_fieldmask & FS_DQ_BCOUNT) {
2374                 dm->dqb_curspace = di->d_bcount - dm->dqb_rsvspace;
2375                 check_blim = 1;
2376                 set_bit(DQ_LASTSET_B + QIF_SPACE_B, &dquot->dq_flags);
2377         }
2378
2379         if (di->d_fieldmask & FS_DQ_BSOFT)
2380                 dm->dqb_bsoftlimit = qbtos(di->d_blk_softlimit);
2381         if (di->d_fieldmask & FS_DQ_BHARD)
2382                 dm->dqb_bhardlimit = qbtos(di->d_blk_hardlimit);
2383         if (di->d_fieldmask & (FS_DQ_BSOFT | FS_DQ_BHARD)) {
2384                 check_blim = 1;
2385                 set_bit(DQ_LASTSET_B + QIF_BLIMITS_B, &dquot->dq_flags);
2386         }
2387
2388         if (di->d_fieldmask & FS_DQ_ICOUNT) {
2389                 dm->dqb_curinodes = di->d_icount;
2390                 check_ilim = 1;
2391                 set_bit(DQ_LASTSET_B + QIF_INODES_B, &dquot->dq_flags);
2392         }
2393
2394         if (di->d_fieldmask & FS_DQ_ISOFT)
2395                 dm->dqb_isoftlimit = di->d_ino_softlimit;
2396         if (di->d_fieldmask & FS_DQ_IHARD)
2397                 dm->dqb_ihardlimit = di->d_ino_hardlimit;
2398         if (di->d_fieldmask & (FS_DQ_ISOFT | FS_DQ_IHARD)) {
2399                 check_ilim = 1;
2400                 set_bit(DQ_LASTSET_B + QIF_ILIMITS_B, &dquot->dq_flags);
2401         }
2402
2403         if (di->d_fieldmask & FS_DQ_BTIMER) {
2404                 dm->dqb_btime = di->d_btimer;
2405                 check_blim = 1;
2406                 set_bit(DQ_LASTSET_B + QIF_BTIME_B, &dquot->dq_flags);
2407         }
2408
2409         if (di->d_fieldmask & FS_DQ_ITIMER) {
2410                 dm->dqb_itime = di->d_itimer;
2411                 check_ilim = 1;
2412                 set_bit(DQ_LASTSET_B + QIF_ITIME_B, &dquot->dq_flags);
2413         }
2414
2415         if (check_blim) {
2416                 if (!dm->dqb_bsoftlimit ||
2417                     dm->dqb_curspace < dm->dqb_bsoftlimit) {
2418                         dm->dqb_btime = 0;
2419                         clear_bit(DQ_BLKS_B, &dquot->dq_flags);
2420                 } else if (!(di->d_fieldmask & FS_DQ_BTIMER))
2421                         /* Set grace only if user hasn't provided his own... */
2422                         dm->dqb_btime = get_seconds() + dqi->dqi_bgrace;
2423         }
2424         if (check_ilim) {
2425                 if (!dm->dqb_isoftlimit ||
2426                     dm->dqb_curinodes < dm->dqb_isoftlimit) {
2427                         dm->dqb_itime = 0;
2428                         clear_bit(DQ_INODES_B, &dquot->dq_flags);
2429                 } else if (!(di->d_fieldmask & FS_DQ_ITIMER))
2430                         /* Set grace only if user hasn't provided his own... */
2431                         dm->dqb_itime = get_seconds() + dqi->dqi_igrace;
2432         }
2433         if (dm->dqb_bhardlimit || dm->dqb_bsoftlimit || dm->dqb_ihardlimit ||
2434             dm->dqb_isoftlimit)
2435                 clear_bit(DQ_FAKE_B, &dquot->dq_flags);
2436         else
2437                 set_bit(DQ_FAKE_B, &dquot->dq_flags);
2438         spin_unlock(&dq_data_lock);
2439         mark_dquot_dirty(dquot);
2440
2441         return 0;
2442 }
2443
2444 int dquot_set_dqblk(struct super_block *sb, int type, qid_t id,
2445                   struct fs_disk_quota *di)
2446 {
2447         struct dquot *dquot;
2448         int rc;
2449
2450         dquot = dqget(sb, id, type);
2451         if (!dquot) {
2452                 rc = -ESRCH;
2453                 goto out;
2454         }
2455         rc = do_set_dqblk(dquot, di);
2456         dqput(dquot);
2457 out:
2458         return rc;
2459 }
2460 EXPORT_SYMBOL(dquot_set_dqblk);
2461
2462 /* Generic routine for getting common part of quota file information */
2463 int dquot_get_dqinfo(struct super_block *sb, int type, struct if_dqinfo *ii)
2464 {
2465         struct mem_dqinfo *mi;
2466   
2467         mutex_lock(&sb_dqopt(sb)->dqonoff_mutex);
2468         if (!sb_has_quota_active(sb, type)) {
2469                 mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
2470                 return -ESRCH;
2471         }
2472         mi = sb_dqopt(sb)->info + type;
2473         spin_lock(&dq_data_lock);
2474         ii->dqi_bgrace = mi->dqi_bgrace;
2475         ii->dqi_igrace = mi->dqi_igrace;
2476         ii->dqi_flags = mi->dqi_flags & DQF_MASK;
2477         ii->dqi_valid = IIF_ALL;
2478         spin_unlock(&dq_data_lock);
2479         mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
2480         return 0;
2481 }
2482 EXPORT_SYMBOL(dquot_get_dqinfo);
2483
2484 /* Generic routine for setting common part of quota file information */
2485 int dquot_set_dqinfo(struct super_block *sb, int type, struct if_dqinfo *ii)
2486 {
2487         struct mem_dqinfo *mi;
2488         int err = 0;
2489
2490         mutex_lock(&sb_dqopt(sb)->dqonoff_mutex);
2491         if (!sb_has_quota_active(sb, type)) {
2492                 err = -ESRCH;
2493                 goto out;
2494         }
2495         mi = sb_dqopt(sb)->info + type;
2496         spin_lock(&dq_data_lock);
2497         if (ii->dqi_valid & IIF_BGRACE)
2498                 mi->dqi_bgrace = ii->dqi_bgrace;
2499         if (ii->dqi_valid & IIF_IGRACE)
2500                 mi->dqi_igrace = ii->dqi_igrace;
2501         if (ii->dqi_valid & IIF_FLAGS)
2502                 mi->dqi_flags = (mi->dqi_flags & ~DQF_MASK) |
2503                                 (ii->dqi_flags & DQF_MASK);
2504         spin_unlock(&dq_data_lock);
2505         mark_info_dirty(sb, type);
2506         /* Force write to disk */
2507         sb->dq_op->write_info(sb, type);
2508 out:
2509         mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
2510         return err;
2511 }
2512 EXPORT_SYMBOL(dquot_set_dqinfo);
2513
2514 const struct quotactl_ops dquot_quotactl_ops = {
2515         .quota_on       = dquot_quota_on,
2516         .quota_off      = dquot_quota_off,
2517         .quota_sync     = dquot_quota_sync,
2518         .get_info       = dquot_get_dqinfo,
2519         .set_info       = dquot_set_dqinfo,
2520         .get_dqblk      = dquot_get_dqblk,
2521         .set_dqblk      = dquot_set_dqblk
2522 };
2523 EXPORT_SYMBOL(dquot_quotactl_ops);
2524
2525 static int do_proc_dqstats(struct ctl_table *table, int write,
2526                      void __user *buffer, size_t *lenp, loff_t *ppos)
2527 {
2528         unsigned int type = (int *)table->data - dqstats.stat;
2529
2530         /* Update global table */
2531         dqstats.stat[type] =
2532                         percpu_counter_sum_positive(&dqstats.counter[type]);
2533         return proc_dointvec(table, write, buffer, lenp, ppos);
2534 }
2535
2536 static ctl_table fs_dqstats_table[] = {
2537         {
2538                 .procname       = "lookups",
2539                 .data           = &dqstats.stat[DQST_LOOKUPS],
2540                 .maxlen         = sizeof(int),
2541                 .mode           = 0444,
2542                 .proc_handler   = do_proc_dqstats,
2543         },
2544         {
2545                 .procname       = "drops",
2546                 .data           = &dqstats.stat[DQST_DROPS],
2547                 .maxlen         = sizeof(int),
2548                 .mode           = 0444,
2549                 .proc_handler   = do_proc_dqstats,
2550         },
2551         {
2552                 .procname       = "reads",
2553                 .data           = &dqstats.stat[DQST_READS],
2554                 .maxlen         = sizeof(int),
2555                 .mode           = 0444,
2556                 .proc_handler   = do_proc_dqstats,
2557         },
2558         {
2559                 .procname       = "writes",
2560                 .data           = &dqstats.stat[DQST_WRITES],
2561                 .maxlen         = sizeof(int),
2562                 .mode           = 0444,
2563                 .proc_handler   = do_proc_dqstats,
2564         },
2565         {
2566                 .procname       = "cache_hits",
2567                 .data           = &dqstats.stat[DQST_CACHE_HITS],
2568                 .maxlen         = sizeof(int),
2569                 .mode           = 0444,
2570                 .proc_handler   = do_proc_dqstats,
2571         },
2572         {
2573                 .procname       = "allocated_dquots",
2574                 .data           = &dqstats.stat[DQST_ALLOC_DQUOTS],
2575                 .maxlen         = sizeof(int),
2576                 .mode           = 0444,
2577                 .proc_handler   = do_proc_dqstats,
2578         },
2579         {
2580                 .procname       = "free_dquots",
2581                 .data           = &dqstats.stat[DQST_FREE_DQUOTS],
2582                 .maxlen         = sizeof(int),
2583                 .mode           = 0444,
2584                 .proc_handler   = do_proc_dqstats,
2585         },
2586         {
2587                 .procname       = "syncs",
2588                 .data           = &dqstats.stat[DQST_SYNCS],
2589                 .maxlen         = sizeof(int),
2590                 .mode           = 0444,
2591                 .proc_handler   = do_proc_dqstats,
2592         },
2593 #ifdef CONFIG_PRINT_QUOTA_WARNING
2594         {
2595                 .procname       = "warnings",
2596                 .data           = &flag_print_warnings,
2597                 .maxlen         = sizeof(int),
2598                 .mode           = 0644,
2599                 .proc_handler   = proc_dointvec,
2600         },
2601 #endif
2602         { },
2603 };
2604
2605 static ctl_table fs_table[] = {
2606         {
2607                 .procname       = "quota",
2608                 .mode           = 0555,
2609                 .child          = fs_dqstats_table,
2610         },
2611         { },
2612 };
2613
2614 static ctl_table sys_table[] = {
2615         {
2616                 .procname       = "fs",
2617                 .mode           = 0555,
2618                 .child          = fs_table,
2619         },
2620         { },
2621 };
2622
2623 static int __init dquot_init(void)
2624 {
2625         int i, ret;
2626         unsigned long nr_hash, order;
2627
2628         printk(KERN_NOTICE "VFS: Disk quotas %s\n", __DQUOT_VERSION__);
2629
2630         register_sysctl_table(sys_table);
2631
2632         dquot_cachep = kmem_cache_create("dquot",
2633                         sizeof(struct dquot), sizeof(unsigned long) * 4,
2634                         (SLAB_HWCACHE_ALIGN|SLAB_RECLAIM_ACCOUNT|
2635                                 SLAB_MEM_SPREAD|SLAB_PANIC),
2636                         NULL);
2637
2638         order = 0;
2639         dquot_hash = (struct hlist_head *)__get_free_pages(GFP_ATOMIC, order);
2640         if (!dquot_hash)
2641                 panic("Cannot create dquot hash table");
2642
2643         for (i = 0; i < _DQST_DQSTAT_LAST; i++) {
2644                 ret = percpu_counter_init(&dqstats.counter[i], 0);
2645                 if (ret)
2646                         panic("Cannot create dquot stat counters");
2647         }
2648
2649         /* Find power-of-two hlist_heads which can fit into allocation */
2650         nr_hash = (1UL << order) * PAGE_SIZE / sizeof(struct hlist_head);
2651         dq_hash_bits = 0;
2652         do {
2653                 dq_hash_bits++;
2654         } while (nr_hash >> dq_hash_bits);
2655         dq_hash_bits--;
2656
2657         nr_hash = 1UL << dq_hash_bits;
2658         dq_hash_mask = nr_hash - 1;
2659         for (i = 0; i < nr_hash; i++)
2660                 INIT_HLIST_HEAD(dquot_hash + i);
2661
2662         printk("Dquot-cache hash table entries: %ld (order %ld, %ld bytes)\n",
2663                         nr_hash, order, (PAGE_SIZE << order));
2664
2665         register_shrinker(&dqcache_shrinker);
2666
2667         return 0;
2668 }
2669 module_init(dquot_init);