Merge git://git.kernel.org/pub/scm/linux/kernel/git/x86/linux-2.6-x86
[sfrench/cifs-2.6.git] / fs / gfs2 / ops_fstype.c
1 /*
2  * Copyright (C) Sistina Software, Inc.  1997-2003 All rights reserved.
3  * Copyright (C) 2004-2007 Red Hat, Inc.  All rights reserved.
4  *
5  * This copyrighted material is made available to anyone wishing to use,
6  * modify, copy, or redistribute it subject to the terms and conditions
7  * of the GNU General Public License version 2.
8  */
9
10 #include <linux/sched.h>
11 #include <linux/slab.h>
12 #include <linux/spinlock.h>
13 #include <linux/completion.h>
14 #include <linux/buffer_head.h>
15 #include <linux/blkdev.h>
16 #include <linux/kthread.h>
17 #include <linux/namei.h>
18 #include <linux/mount.h>
19 #include <linux/gfs2_ondisk.h>
20 #include <linux/lm_interface.h>
21
22 #include "gfs2.h"
23 #include "incore.h"
24 #include "bmap.h"
25 #include "daemon.h"
26 #include "glock.h"
27 #include "glops.h"
28 #include "inode.h"
29 #include "lm.h"
30 #include "mount.h"
31 #include "ops_fstype.h"
32 #include "ops_dentry.h"
33 #include "ops_super.h"
34 #include "recovery.h"
35 #include "rgrp.h"
36 #include "super.h"
37 #include "sys.h"
38 #include "util.h"
39 #include "log.h"
40
/*
 * Direction flag passed as the "undo" argument of the init_*() helpers
 * below: DO performs the set-up, UNDO tears it down again.
 */
enum {
        DO   = 0,
        UNDO = 1,
};
43
44 static struct gfs2_sbd *init_sbd(struct super_block *sb)
45 {
46         struct gfs2_sbd *sdp;
47
48         sdp = kzalloc(sizeof(struct gfs2_sbd), GFP_KERNEL);
49         if (!sdp)
50                 return NULL;
51
52         sb->s_fs_info = sdp;
53         sdp->sd_vfs = sb;
54
55         gfs2_tune_init(&sdp->sd_tune);
56
57         INIT_LIST_HEAD(&sdp->sd_reclaim_list);
58         spin_lock_init(&sdp->sd_reclaim_lock);
59         init_waitqueue_head(&sdp->sd_reclaim_wq);
60
61         mutex_init(&sdp->sd_inum_mutex);
62         spin_lock_init(&sdp->sd_statfs_spin);
63
64         spin_lock_init(&sdp->sd_rindex_spin);
65         mutex_init(&sdp->sd_rindex_mutex);
66         INIT_LIST_HEAD(&sdp->sd_rindex_list);
67         INIT_LIST_HEAD(&sdp->sd_rindex_mru_list);
68         INIT_LIST_HEAD(&sdp->sd_rindex_recent_list);
69
70         INIT_LIST_HEAD(&sdp->sd_jindex_list);
71         spin_lock_init(&sdp->sd_jindex_spin);
72         mutex_init(&sdp->sd_jindex_mutex);
73
74         INIT_LIST_HEAD(&sdp->sd_quota_list);
75         spin_lock_init(&sdp->sd_quota_spin);
76         mutex_init(&sdp->sd_quota_mutex);
77
78         spin_lock_init(&sdp->sd_log_lock);
79
80         INIT_LIST_HEAD(&sdp->sd_log_le_buf);
81         INIT_LIST_HEAD(&sdp->sd_log_le_revoke);
82         INIT_LIST_HEAD(&sdp->sd_log_le_rg);
83         INIT_LIST_HEAD(&sdp->sd_log_le_databuf);
84         INIT_LIST_HEAD(&sdp->sd_log_le_ordered);
85
86         mutex_init(&sdp->sd_log_reserve_mutex);
87         INIT_LIST_HEAD(&sdp->sd_ail1_list);
88         INIT_LIST_HEAD(&sdp->sd_ail2_list);
89
90         init_rwsem(&sdp->sd_log_flush_lock);
91         atomic_set(&sdp->sd_log_in_flight, 0);
92         init_waitqueue_head(&sdp->sd_log_flush_wait);
93
94         INIT_LIST_HEAD(&sdp->sd_revoke_list);
95
96         mutex_init(&sdp->sd_freeze_lock);
97
98         return sdp;
99 }
100
101 static void init_vfs(struct super_block *sb, unsigned noatime)
102 {
103         struct gfs2_sbd *sdp = sb->s_fs_info;
104
105         sb->s_magic = GFS2_MAGIC;
106         sb->s_op = &gfs2_super_ops;
107         sb->s_export_op = &gfs2_export_ops;
108         sb->s_time_gran = 1;
109         sb->s_maxbytes = MAX_LFS_FILESIZE;
110
111         if (sb->s_flags & (MS_NOATIME | MS_NODIRATIME))
112                 set_bit(noatime, &sdp->sd_flags);
113
114         /* Don't let the VFS update atimes.  GFS2 handles this itself. */
115         sb->s_flags |= MS_NOATIME | MS_NODIRATIME;
116 }
117
118 static int init_names(struct gfs2_sbd *sdp, int silent)
119 {
120         char *proto, *table;
121         int error = 0;
122
123         proto = sdp->sd_args.ar_lockproto;
124         table = sdp->sd_args.ar_locktable;
125
126         /*  Try to autodetect  */
127
128         if (!proto[0] || !table[0]) {
129                 error = gfs2_read_super(sdp, GFS2_SB_ADDR >> sdp->sd_fsb2bb_shift);
130                 if (error)
131                         return error;
132
133                 error = gfs2_check_sb(sdp, &sdp->sd_sb, silent);
134                 if (error)
135                         goto out;
136
137                 if (!proto[0])
138                         proto = sdp->sd_sb.sb_lockproto;
139                 if (!table[0])
140                         table = sdp->sd_sb.sb_locktable;
141         }
142
143         if (!table[0])
144                 table = sdp->sd_vfs->s_id;
145
146         snprintf(sdp->sd_proto_name, GFS2_FSNAME_LEN, "%s", proto);
147         snprintf(sdp->sd_table_name, GFS2_FSNAME_LEN, "%s", table);
148
149         table = sdp->sd_table_name;
150         while ((table = strchr(table, '/')))
151                 *table = '_';
152
153 out:
154         return error;
155 }
156
157 static int init_locking(struct gfs2_sbd *sdp, struct gfs2_holder *mount_gh,
158                         int undo)
159 {
160         struct task_struct *p;
161         int error = 0;
162
163         if (undo)
164                 goto fail_trans;
165
166         for (sdp->sd_glockd_num = 0;
167              sdp->sd_glockd_num < sdp->sd_args.ar_num_glockd;
168              sdp->sd_glockd_num++) {
169                 p = kthread_run(gfs2_glockd, sdp, "gfs2_glockd");
170                 error = IS_ERR(p);
171                 if (error) {
172                         fs_err(sdp, "can't start glockd thread: %d\n", error);
173                         goto fail;
174                 }
175                 sdp->sd_glockd_process[sdp->sd_glockd_num] = p;
176         }
177
178         error = gfs2_glock_nq_num(sdp,
179                                   GFS2_MOUNT_LOCK, &gfs2_nondisk_glops,
180                                   LM_ST_EXCLUSIVE, LM_FLAG_NOEXP | GL_NOCACHE,
181                                   mount_gh);
182         if (error) {
183                 fs_err(sdp, "can't acquire mount glock: %d\n", error);
184                 goto fail;
185         }
186
187         error = gfs2_glock_nq_num(sdp,
188                                   GFS2_LIVE_LOCK, &gfs2_nondisk_glops,
189                                   LM_ST_SHARED,
190                                   LM_FLAG_NOEXP | GL_EXACT,
191                                   &sdp->sd_live_gh);
192         if (error) {
193                 fs_err(sdp, "can't acquire live glock: %d\n", error);
194                 goto fail_mount;
195         }
196
197         error = gfs2_glock_get(sdp, GFS2_RENAME_LOCK, &gfs2_nondisk_glops,
198                                CREATE, &sdp->sd_rename_gl);
199         if (error) {
200                 fs_err(sdp, "can't create rename glock: %d\n", error);
201                 goto fail_live;
202         }
203
204         error = gfs2_glock_get(sdp, GFS2_TRANS_LOCK, &gfs2_trans_glops,
205                                CREATE, &sdp->sd_trans_gl);
206         if (error) {
207                 fs_err(sdp, "can't create transaction glock: %d\n", error);
208                 goto fail_rename;
209         }
210         set_bit(GLF_STICKY, &sdp->sd_trans_gl->gl_flags);
211
212         return 0;
213
214 fail_trans:
215         gfs2_glock_put(sdp->sd_trans_gl);
216 fail_rename:
217         gfs2_glock_put(sdp->sd_rename_gl);
218 fail_live:
219         gfs2_glock_dq_uninit(&sdp->sd_live_gh);
220 fail_mount:
221         gfs2_glock_dq_uninit(mount_gh);
222 fail:
223         while (sdp->sd_glockd_num--)
224                 kthread_stop(sdp->sd_glockd_process[sdp->sd_glockd_num]);
225
226         return error;
227 }
228
229 static inline struct inode *gfs2_lookup_root(struct super_block *sb,
230                                              u64 no_addr)
231 {
232         return gfs2_inode_lookup(sb, DT_DIR, no_addr, 0, 0);
233 }
234
235 static int init_sb(struct gfs2_sbd *sdp, int silent, int undo)
236 {
237         struct super_block *sb = sdp->sd_vfs;
238         struct gfs2_holder sb_gh;
239         u64 no_addr;
240         struct inode *inode;
241         int error = 0;
242
243         if (undo) {
244                 if (sb->s_root) {
245                         dput(sb->s_root);
246                         sb->s_root = NULL;
247                 }
248                 return 0;
249         }
250
251         error = gfs2_glock_nq_num(sdp, GFS2_SB_LOCK, &gfs2_meta_glops,
252                                  LM_ST_SHARED, 0, &sb_gh);
253         if (error) {
254                 fs_err(sdp, "can't acquire superblock glock: %d\n", error);
255                 return error;
256         }
257
258         error = gfs2_read_sb(sdp, sb_gh.gh_gl, silent);
259         if (error) {
260                 fs_err(sdp, "can't read superblock: %d\n", error);
261                 goto out;
262         }
263
264         /* Set up the buffer cache and SB for real */
265         if (sdp->sd_sb.sb_bsize < bdev_hardsect_size(sb->s_bdev)) {
266                 error = -EINVAL;
267                 fs_err(sdp, "FS block size (%u) is too small for device "
268                        "block size (%u)\n",
269                        sdp->sd_sb.sb_bsize, bdev_hardsect_size(sb->s_bdev));
270                 goto out;
271         }
272         if (sdp->sd_sb.sb_bsize > PAGE_SIZE) {
273                 error = -EINVAL;
274                 fs_err(sdp, "FS block size (%u) is too big for machine "
275                        "page size (%u)\n",
276                        sdp->sd_sb.sb_bsize, (unsigned int)PAGE_SIZE);
277                 goto out;
278         }
279         sb_set_blocksize(sb, sdp->sd_sb.sb_bsize);
280
281         /* Get the root inode */
282         no_addr = sdp->sd_sb.sb_root_dir.no_addr;
283         if (sb->s_type == &gfs2meta_fs_type)
284                 no_addr = sdp->sd_sb.sb_master_dir.no_addr;
285         inode = gfs2_lookup_root(sb, no_addr);
286         if (IS_ERR(inode)) {
287                 error = PTR_ERR(inode);
288                 fs_err(sdp, "can't read in root inode: %d\n", error);
289                 goto out;
290         }
291
292         sb->s_root = d_alloc_root(inode);
293         if (!sb->s_root) {
294                 fs_err(sdp, "can't get root dentry\n");
295                 error = -ENOMEM;
296                 iput(inode);
297         } else
298                 sb->s_root->d_op = &gfs2_dops;
299         
300 out:
301         gfs2_glock_dq_uninit(&sb_gh);
302         return error;
303 }
304
305 /**
306  * map_journal_extents - create a reusable "extent" mapping from all logical
307  * blocks to all physical blocks for the given journal.  This will save
308  * us time when writing journal blocks.  Most journals will have only one
309  * extent that maps all their logical blocks.  That's because gfs2.mkfs
310  * arranges the journal blocks sequentially to maximize performance.
311  * So the extent would map the first block for the entire file length.
312  * However, gfs2_jadd can happen while file activity is happening, so
313  * those journals may not be sequential.  Less likely is the case where
314  * the users created their own journals by mounting the metafs and
315  * laying it out.  But it's still possible.  These journals might have
316  * several extents.
317  *
318  * TODO: This should be done in bigger chunks rather than one block at a time,
319  *       but since it's only done at mount time, I'm not worried about the
320  *       time it takes.
321  */
322 static int map_journal_extents(struct gfs2_sbd *sdp)
323 {
324         struct gfs2_jdesc *jd = sdp->sd_jdesc;
325         unsigned int lb;
326         u64 db, prev_db; /* logical block, disk block, prev disk block */
327         struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
328         struct gfs2_journal_extent *jext = NULL;
329         struct buffer_head bh;
330         int rc = 0;
331
332         prev_db = 0;
333
334         for (lb = 0; lb < ip->i_di.di_size >> sdp->sd_sb.sb_bsize_shift; lb++) {
335                 bh.b_state = 0;
336                 bh.b_blocknr = 0;
337                 bh.b_size = 1 << ip->i_inode.i_blkbits;
338                 rc = gfs2_block_map(jd->jd_inode, lb, &bh, 0);
339                 db = bh.b_blocknr;
340                 if (rc || !db) {
341                         printk(KERN_INFO "GFS2 journal mapping error %d: lb="
342                                "%u db=%llu\n", rc, lb, (unsigned long long)db);
343                         break;
344                 }
345                 if (!prev_db || db != prev_db + 1) {
346                         jext = kzalloc(sizeof(struct gfs2_journal_extent),
347                                        GFP_KERNEL);
348                         if (!jext) {
349                                 printk(KERN_INFO "GFS2 error: out of memory "
350                                        "mapping journal extents.\n");
351                                 rc = -ENOMEM;
352                                 break;
353                         }
354                         jext->dblock = db;
355                         jext->lblock = lb;
356                         jext->blocks = 1;
357                         list_add_tail(&jext->extent_list, &jd->extent_list);
358                 } else {
359                         jext->blocks++;
360                 }
361                 prev_db = db;
362         }
363         return rc;
364 }
365
366 static int init_journal(struct gfs2_sbd *sdp, int undo)
367 {
368         struct gfs2_holder ji_gh;
369         struct task_struct *p;
370         struct gfs2_inode *ip;
371         int jindex = 1;
372         int error = 0;
373
374         if (undo) {
375                 jindex = 0;
376                 goto fail_recoverd;
377         }
378
379         sdp->sd_jindex = gfs2_lookup_simple(sdp->sd_master_dir, "jindex");
380         if (IS_ERR(sdp->sd_jindex)) {
381                 fs_err(sdp, "can't lookup journal index: %d\n", error);
382                 return PTR_ERR(sdp->sd_jindex);
383         }
384         ip = GFS2_I(sdp->sd_jindex);
385         set_bit(GLF_STICKY, &ip->i_gl->gl_flags);
386
387         /* Load in the journal index special file */
388
389         error = gfs2_jindex_hold(sdp, &ji_gh);
390         if (error) {
391                 fs_err(sdp, "can't read journal index: %d\n", error);
392                 goto fail;
393         }
394
395         error = -EINVAL;
396         if (!gfs2_jindex_size(sdp)) {
397                 fs_err(sdp, "no journals!\n");
398                 goto fail_jindex;
399         }
400
401         if (sdp->sd_args.ar_spectator) {
402                 sdp->sd_jdesc = gfs2_jdesc_find(sdp, 0);
403                 atomic_set(&sdp->sd_log_blks_free, sdp->sd_jdesc->jd_blocks);
404         } else {
405                 if (sdp->sd_lockstruct.ls_jid >= gfs2_jindex_size(sdp)) {
406                         fs_err(sdp, "can't mount journal #%u\n",
407                                sdp->sd_lockstruct.ls_jid);
408                         fs_err(sdp, "there are only %u journals (0 - %u)\n",
409                                gfs2_jindex_size(sdp),
410                                gfs2_jindex_size(sdp) - 1);
411                         goto fail_jindex;
412                 }
413                 sdp->sd_jdesc = gfs2_jdesc_find(sdp, sdp->sd_lockstruct.ls_jid);
414
415                 error = gfs2_glock_nq_num(sdp, sdp->sd_lockstruct.ls_jid,
416                                           &gfs2_journal_glops,
417                                           LM_ST_EXCLUSIVE, LM_FLAG_NOEXP,
418                                           &sdp->sd_journal_gh);
419                 if (error) {
420                         fs_err(sdp, "can't acquire journal glock: %d\n", error);
421                         goto fail_jindex;
422                 }
423
424                 ip = GFS2_I(sdp->sd_jdesc->jd_inode);
425                 error = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED,
426                                            LM_FLAG_NOEXP | GL_EXACT | GL_NOCACHE,
427                                            &sdp->sd_jinode_gh);
428                 if (error) {
429                         fs_err(sdp, "can't acquire journal inode glock: %d\n",
430                                error);
431                         goto fail_journal_gh;
432                 }
433
434                 error = gfs2_jdesc_check(sdp->sd_jdesc);
435                 if (error) {
436                         fs_err(sdp, "my journal (%u) is bad: %d\n",
437                                sdp->sd_jdesc->jd_jid, error);
438                         goto fail_jinode_gh;
439                 }
440                 atomic_set(&sdp->sd_log_blks_free, sdp->sd_jdesc->jd_blocks);
441
442                 /* Map the extents for this journal's blocks */
443                 map_journal_extents(sdp);
444         }
445
446         if (sdp->sd_lockstruct.ls_first) {
447                 unsigned int x;
448                 for (x = 0; x < sdp->sd_journals; x++) {
449                         error = gfs2_recover_journal(gfs2_jdesc_find(sdp, x));
450                         if (error) {
451                                 fs_err(sdp, "error recovering journal %u: %d\n",
452                                        x, error);
453                                 goto fail_jinode_gh;
454                         }
455                 }
456
457                 gfs2_lm_others_may_mount(sdp);
458         } else if (!sdp->sd_args.ar_spectator) {
459                 error = gfs2_recover_journal(sdp->sd_jdesc);
460                 if (error) {
461                         fs_err(sdp, "error recovering my journal: %d\n", error);
462                         goto fail_jinode_gh;
463                 }
464         }
465
466         set_bit(SDF_JOURNAL_CHECKED, &sdp->sd_flags);
467         gfs2_glock_dq_uninit(&ji_gh);
468         jindex = 0;
469
470         p = kthread_run(gfs2_recoverd, sdp, "gfs2_recoverd");
471         error = IS_ERR(p);
472         if (error) {
473                 fs_err(sdp, "can't start recoverd thread: %d\n", error);
474                 goto fail_jinode_gh;
475         }
476         sdp->sd_recoverd_process = p;
477
478         return 0;
479
480 fail_recoverd:
481         kthread_stop(sdp->sd_recoverd_process);
482 fail_jinode_gh:
483         if (!sdp->sd_args.ar_spectator)
484                 gfs2_glock_dq_uninit(&sdp->sd_jinode_gh);
485 fail_journal_gh:
486         if (!sdp->sd_args.ar_spectator)
487                 gfs2_glock_dq_uninit(&sdp->sd_journal_gh);
488 fail_jindex:
489         gfs2_jindex_free(sdp);
490         if (jindex)
491                 gfs2_glock_dq_uninit(&ji_gh);
492 fail:
493         iput(sdp->sd_jindex);
494         return error;
495 }
496
497
498 static int init_inodes(struct gfs2_sbd *sdp, int undo)
499 {
500         int error = 0;
501         struct gfs2_inode *ip;
502         struct inode *inode;
503
504         if (undo)
505                 goto fail_qinode;
506
507         inode = gfs2_lookup_root(sdp->sd_vfs, sdp->sd_sb.sb_master_dir.no_addr);
508         if (IS_ERR(inode)) {
509                 error = PTR_ERR(inode);
510                 fs_err(sdp, "can't read in master directory: %d\n", error);
511                 goto fail;
512         }
513         sdp->sd_master_dir = inode;
514
515         error = init_journal(sdp, undo);
516         if (error)
517                 goto fail_master;
518
519         /* Read in the master inode number inode */
520         sdp->sd_inum_inode = gfs2_lookup_simple(sdp->sd_master_dir, "inum");
521         if (IS_ERR(sdp->sd_inum_inode)) {
522                 error = PTR_ERR(sdp->sd_inum_inode);
523                 fs_err(sdp, "can't read in inum inode: %d\n", error);
524                 goto fail_journal;
525         }
526
527
528         /* Read in the master statfs inode */
529         sdp->sd_statfs_inode = gfs2_lookup_simple(sdp->sd_master_dir, "statfs");
530         if (IS_ERR(sdp->sd_statfs_inode)) {
531                 error = PTR_ERR(sdp->sd_statfs_inode);
532                 fs_err(sdp, "can't read in statfs inode: %d\n", error);
533                 goto fail_inum;
534         }
535
536         /* Read in the resource index inode */
537         sdp->sd_rindex = gfs2_lookup_simple(sdp->sd_master_dir, "rindex");
538         if (IS_ERR(sdp->sd_rindex)) {
539                 error = PTR_ERR(sdp->sd_rindex);
540                 fs_err(sdp, "can't get resource index inode: %d\n", error);
541                 goto fail_statfs;
542         }
543         ip = GFS2_I(sdp->sd_rindex);
544         set_bit(GLF_STICKY, &ip->i_gl->gl_flags);
545         sdp->sd_rindex_vn = ip->i_gl->gl_vn - 1;
546
547         /* Read in the quota inode */
548         sdp->sd_quota_inode = gfs2_lookup_simple(sdp->sd_master_dir, "quota");
549         if (IS_ERR(sdp->sd_quota_inode)) {
550                 error = PTR_ERR(sdp->sd_quota_inode);
551                 fs_err(sdp, "can't get quota file inode: %d\n", error);
552                 goto fail_rindex;
553         }
554         return 0;
555
556 fail_qinode:
557         iput(sdp->sd_quota_inode);
558 fail_rindex:
559         gfs2_clear_rgrpd(sdp);
560         iput(sdp->sd_rindex);
561 fail_statfs:
562         iput(sdp->sd_statfs_inode);
563 fail_inum:
564         iput(sdp->sd_inum_inode);
565 fail_journal:
566         init_journal(sdp, UNDO);
567 fail_master:
568         iput(sdp->sd_master_dir);
569 fail:
570         return error;
571 }
572
573 static int init_per_node(struct gfs2_sbd *sdp, int undo)
574 {
575         struct inode *pn = NULL;
576         char buf[30];
577         int error = 0;
578         struct gfs2_inode *ip;
579
580         if (sdp->sd_args.ar_spectator)
581                 return 0;
582
583         if (undo)
584                 goto fail_qc_gh;
585
586         pn = gfs2_lookup_simple(sdp->sd_master_dir, "per_node");
587         if (IS_ERR(pn)) {
588                 error = PTR_ERR(pn);
589                 fs_err(sdp, "can't find per_node directory: %d\n", error);
590                 return error;
591         }
592
593         sprintf(buf, "inum_range%u", sdp->sd_jdesc->jd_jid);
594         sdp->sd_ir_inode = gfs2_lookup_simple(pn, buf);
595         if (IS_ERR(sdp->sd_ir_inode)) {
596                 error = PTR_ERR(sdp->sd_ir_inode);
597                 fs_err(sdp, "can't find local \"ir\" file: %d\n", error);
598                 goto fail;
599         }
600
601         sprintf(buf, "statfs_change%u", sdp->sd_jdesc->jd_jid);
602         sdp->sd_sc_inode = gfs2_lookup_simple(pn, buf);
603         if (IS_ERR(sdp->sd_sc_inode)) {
604                 error = PTR_ERR(sdp->sd_sc_inode);
605                 fs_err(sdp, "can't find local \"sc\" file: %d\n", error);
606                 goto fail_ir_i;
607         }
608
609         sprintf(buf, "quota_change%u", sdp->sd_jdesc->jd_jid);
610         sdp->sd_qc_inode = gfs2_lookup_simple(pn, buf);
611         if (IS_ERR(sdp->sd_qc_inode)) {
612                 error = PTR_ERR(sdp->sd_qc_inode);
613                 fs_err(sdp, "can't find local \"qc\" file: %d\n", error);
614                 goto fail_ut_i;
615         }
616
617         iput(pn);
618         pn = NULL;
619
620         ip = GFS2_I(sdp->sd_ir_inode);
621         error = gfs2_glock_nq_init(ip->i_gl,
622                                    LM_ST_EXCLUSIVE, 0,
623                                    &sdp->sd_ir_gh);
624         if (error) {
625                 fs_err(sdp, "can't lock local \"ir\" file: %d\n", error);
626                 goto fail_qc_i;
627         }
628
629         ip = GFS2_I(sdp->sd_sc_inode);
630         error = gfs2_glock_nq_init(ip->i_gl,
631                                    LM_ST_EXCLUSIVE, 0,
632                                    &sdp->sd_sc_gh);
633         if (error) {
634                 fs_err(sdp, "can't lock local \"sc\" file: %d\n", error);
635                 goto fail_ir_gh;
636         }
637
638         ip = GFS2_I(sdp->sd_qc_inode);
639         error = gfs2_glock_nq_init(ip->i_gl,
640                                    LM_ST_EXCLUSIVE, 0,
641                                    &sdp->sd_qc_gh);
642         if (error) {
643                 fs_err(sdp, "can't lock local \"qc\" file: %d\n", error);
644                 goto fail_ut_gh;
645         }
646
647         return 0;
648
649 fail_qc_gh:
650         gfs2_glock_dq_uninit(&sdp->sd_qc_gh);
651 fail_ut_gh:
652         gfs2_glock_dq_uninit(&sdp->sd_sc_gh);
653 fail_ir_gh:
654         gfs2_glock_dq_uninit(&sdp->sd_ir_gh);
655 fail_qc_i:
656         iput(sdp->sd_qc_inode);
657 fail_ut_i:
658         iput(sdp->sd_sc_inode);
659 fail_ir_i:
660         iput(sdp->sd_ir_inode);
661 fail:
662         if (pn)
663                 iput(pn);
664         return error;
665 }
666
667 static int init_threads(struct gfs2_sbd *sdp, int undo)
668 {
669         struct task_struct *p;
670         int error = 0;
671
672         if (undo)
673                 goto fail_quotad;
674
675         sdp->sd_log_flush_time = jiffies;
676         sdp->sd_jindex_refresh_time = jiffies;
677
678         p = kthread_run(gfs2_logd, sdp, "gfs2_logd");
679         error = IS_ERR(p);
680         if (error) {
681                 fs_err(sdp, "can't start logd thread: %d\n", error);
682                 return error;
683         }
684         sdp->sd_logd_process = p;
685
686         sdp->sd_statfs_sync_time = jiffies;
687         sdp->sd_quota_sync_time = jiffies;
688
689         p = kthread_run(gfs2_quotad, sdp, "gfs2_quotad");
690         error = IS_ERR(p);
691         if (error) {
692                 fs_err(sdp, "can't start quotad thread: %d\n", error);
693                 goto fail;
694         }
695         sdp->sd_quotad_process = p;
696
697         return 0;
698
699
700 fail_quotad:
701         kthread_stop(sdp->sd_quotad_process);
702 fail:
703         kthread_stop(sdp->sd_logd_process);
704         return error;
705 }
706
707 /**
708  * fill_super - Read in superblock
709  * @sb: The VFS superblock
710  * @data: Mount options
711  * @silent: Don't complain if it's not a GFS2 filesystem
712  *
713  * Returns: errno
714  */
715
716 static int fill_super(struct super_block *sb, void *data, int silent)
717 {
718         struct gfs2_sbd *sdp;
719         struct gfs2_holder mount_gh;
720         int error;
721
722         sdp = init_sbd(sb);
723         if (!sdp) {
724                 printk(KERN_WARNING "GFS2: can't alloc struct gfs2_sbd\n");
725                 return -ENOMEM;
726         }
727
728         error = gfs2_mount_args(sdp, (char *)data, 0);
729         if (error) {
730                 printk(KERN_WARNING "GFS2: can't parse mount arguments\n");
731                 goto fail;
732         }
733
734         init_vfs(sb, SDF_NOATIME);
735
736         /* Set up the buffer cache and fill in some fake block size values
737            to allow us to read-in the on-disk superblock. */
738         sdp->sd_sb.sb_bsize = sb_min_blocksize(sb, GFS2_BASIC_BLOCK);
739         sdp->sd_sb.sb_bsize_shift = sb->s_blocksize_bits;
740         sdp->sd_fsb2bb_shift = sdp->sd_sb.sb_bsize_shift -
741                                GFS2_BASIC_BLOCK_SHIFT;
742         sdp->sd_fsb2bb = 1 << sdp->sd_fsb2bb_shift;
743
744         error = init_names(sdp, silent);
745         if (error)
746                 goto fail;
747
748         gfs2_create_debugfs_file(sdp);
749
750         error = gfs2_sys_fs_add(sdp);
751         if (error)
752                 goto fail;
753
754         error = gfs2_lm_mount(sdp, silent);
755         if (error)
756                 goto fail_sys;
757
758         error = init_locking(sdp, &mount_gh, DO);
759         if (error)
760                 goto fail_lm;
761
762         error = init_sb(sdp, silent, DO);
763         if (error)
764                 goto fail_locking;
765
766         error = init_inodes(sdp, DO);
767         if (error)
768                 goto fail_sb;
769
770         error = init_per_node(sdp, DO);
771         if (error)
772                 goto fail_inodes;
773
774         error = gfs2_statfs_init(sdp);
775         if (error) {
776                 fs_err(sdp, "can't initialize statfs subsystem: %d\n", error);
777                 goto fail_per_node;
778         }
779
780         error = init_threads(sdp, DO);
781         if (error)
782                 goto fail_per_node;
783
784         if (!(sb->s_flags & MS_RDONLY)) {
785                 error = gfs2_make_fs_rw(sdp);
786                 if (error) {
787                         fs_err(sdp, "can't make FS RW: %d\n", error);
788                         goto fail_threads;
789                 }
790         }
791
792         gfs2_glock_dq_uninit(&mount_gh);
793
794         return 0;
795
796 fail_threads:
797         init_threads(sdp, UNDO);
798 fail_per_node:
799         init_per_node(sdp, UNDO);
800 fail_inodes:
801         init_inodes(sdp, UNDO);
802 fail_sb:
803         init_sb(sdp, 0, UNDO);
804 fail_locking:
805         init_locking(sdp, &mount_gh, UNDO);
806 fail_lm:
807         gfs2_gl_hash_clear(sdp, WAIT);
808         gfs2_lm_unmount(sdp);
809         while (invalidate_inodes(sb))
810                 yield();
811 fail_sys:
812         gfs2_sys_fs_del(sdp);
813 fail:
814         gfs2_delete_debugfs_file(sdp);
815         kfree(sdp);
816         sb->s_fs_info = NULL;
817         return error;
818 }
819
820 static int gfs2_get_sb(struct file_system_type *fs_type, int flags,
821                 const char *dev_name, void *data, struct vfsmount *mnt)
822 {
823         struct super_block *sb;
824         struct gfs2_sbd *sdp;
825         int error = get_sb_bdev(fs_type, flags, dev_name, data, fill_super, mnt);
826         if (error)
827                 goto out;
828         sb = mnt->mnt_sb;
829         sdp = sb->s_fs_info;
830         sdp->sd_gfs2mnt = mnt;
831 out:
832         return error;
833 }
834
835 static int fill_super_meta(struct super_block *sb, struct super_block *new,
836                            void *data, int silent)
837 {
838         struct gfs2_sbd *sdp = sb->s_fs_info;
839         struct inode *inode;
840         int error = 0;
841
842         new->s_fs_info = sdp;
843         sdp->sd_vfs_meta = sb;
844
845         init_vfs(new, SDF_NOATIME);
846
847         /* Get the master inode */
848         inode = igrab(sdp->sd_master_dir);
849
850         new->s_root = d_alloc_root(inode);
851         if (!new->s_root) {
852                 fs_err(sdp, "can't get root dentry\n");
853                 error = -ENOMEM;
854                 iput(inode);
855         } else
856                 new->s_root->d_op = &gfs2_dops;
857
858         return error;
859 }
860
861 static int set_bdev_super(struct super_block *s, void *data)
862 {
863         s->s_bdev = data;
864         s->s_dev = s->s_bdev->bd_dev;
865         return 0;
866 }
867
868 static int test_bdev_super(struct super_block *s, void *data)
869 {
870         return s->s_bdev == data;
871 }
872
873 static struct super_block* get_gfs2_sb(const char *dev_name)
874 {
875         struct kstat stat;
876         struct nameidata nd;
877         struct file_system_type *fstype;
878         struct super_block *sb = NULL, *s;
879         int error;
880
881         error = path_lookup(dev_name, LOOKUP_FOLLOW, &nd);
882         if (error) {
883                 printk(KERN_WARNING "GFS2: path_lookup on %s returned error\n",
884                        dev_name);
885                 goto out;
886         }
887         error = vfs_getattr(nd.path.mnt, nd.path.dentry, &stat);
888
889         fstype = get_fs_type("gfs2");
890         list_for_each_entry(s, &fstype->fs_supers, s_instances) {
891                 if ((S_ISBLK(stat.mode) && s->s_dev == stat.rdev) ||
892                     (S_ISDIR(stat.mode) &&
893                      s == nd.path.dentry->d_inode->i_sb)) {
894                         sb = s;
895                         goto free_nd;
896                 }
897         }
898
899         printk(KERN_WARNING "GFS2: Unrecognized block device or "
900                "mount point %s\n", dev_name);
901
902 free_nd:
903         path_put(&nd.path);
904 out:
905         return sb;
906 }
907
908 static int gfs2_get_sb_meta(struct file_system_type *fs_type, int flags,
909                             const char *dev_name, void *data, struct vfsmount *mnt)
910 {
911         int error = 0;
912         struct super_block *sb = NULL, *new;
913         struct gfs2_sbd *sdp;
914
915         sb = get_gfs2_sb(dev_name);
916         if (!sb) {
917                 printk(KERN_WARNING "GFS2: gfs2 mount does not exist\n");
918                 error = -ENOENT;
919                 goto error;
920         }
921         sdp = sb->s_fs_info;
922         if (sdp->sd_vfs_meta) {
923                 printk(KERN_WARNING "GFS2: gfs2meta mount already exists\n");
924                 error = -EBUSY;
925                 goto error;
926         }
927         down(&sb->s_bdev->bd_mount_sem);
928         new = sget(fs_type, test_bdev_super, set_bdev_super, sb->s_bdev);
929         up(&sb->s_bdev->bd_mount_sem);
930         if (IS_ERR(new)) {
931                 error = PTR_ERR(new);
932                 goto error;
933         }
934         module_put(fs_type->owner);
935         new->s_flags = flags;
936         strlcpy(new->s_id, sb->s_id, sizeof(new->s_id));
937         sb_set_blocksize(new, sb->s_blocksize);
938         error = fill_super_meta(sb, new, data, flags & MS_SILENT ? 1 : 0);
939         if (error) {
940                 up_write(&new->s_umount);
941                 deactivate_super(new);
942                 goto error;
943         }
944
945         new->s_flags |= MS_ACTIVE;
946
947         /* Grab a reference to the gfs2 mount point */
948         atomic_inc(&sdp->sd_gfs2mnt->mnt_count);
949         return simple_set_mnt(mnt, new);
950 error:
951         return error;
952 }
953
954 static void gfs2_kill_sb(struct super_block *sb)
955 {
956         if (sb->s_fs_info) {
957                 gfs2_delete_debugfs_file(sb->s_fs_info);
958                 gfs2_meta_syncfs(sb->s_fs_info);
959         }
960         kill_block_super(sb);
961 }
962
963 static void gfs2_kill_sb_meta(struct super_block *sb)
964 {
965         struct gfs2_sbd *sdp = sb->s_fs_info;
966         generic_shutdown_super(sb);
967         sdp->sd_vfs_meta = NULL;
968         atomic_dec(&sdp->sd_gfs2mnt->mnt_count);
969 }
970
971 struct file_system_type gfs2_fs_type = {
972         .name = "gfs2",
973         .fs_flags = FS_REQUIRES_DEV,
974         .get_sb = gfs2_get_sb,
975         .kill_sb = gfs2_kill_sb,
976         .owner = THIS_MODULE,
977 };
978
979 struct file_system_type gfs2meta_fs_type = {
980         .name = "gfs2meta",
981         .fs_flags = FS_REQUIRES_DEV,
982         .get_sb = gfs2_get_sb_meta,
983         .kill_sb = gfs2_kill_sb_meta,
984         .owner = THIS_MODULE,
985 };
986