2 * Copyright (C) International Business Machines Corp., 2000-2004
3 * Portions Copyright (C) Christoph Hellwig, 2001-2002
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
13 * the GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 #include <linux/module.h>
22 #include <linux/parser.h>
23 #include <linux/completion.h>
24 #include <linux/vfs.h>
25 #include <linux/quotaops.h>
26 #include <linux/mount.h>
27 #include <linux/moduleparam.h>
28 #include <linux/kthread.h>
29 #include <linux/posix_acl.h>
30 #include <linux/buffer_head.h>
31 #include <linux/exportfs.h>
32 #include <linux/crc32.h>
33 #include <linux/slab.h>
34 #include <asm/uaccess.h>
35 #include <linux/seq_file.h>
37 #include "jfs_incore.h"
38 #include "jfs_filsys.h"
39 #include "jfs_inode.h"
40 #include "jfs_metapage.h"
41 #include "jfs_superblock.h"
45 #include "jfs_debug.h"
/* Module description, author and license declarations. */
47 MODULE_DESCRIPTION("The Journaled Filesystem (JFS)");
48 MODULE_AUTHOR("Steve Best/Dave Kleikamp/Barry Arndt, IBM");
49 MODULE_LICENSE("GPL");
/* Slab cache that jfs_inode_info objects are allocated from and freed to. */
51 static struct kmem_cache * jfs_inode_cachep;
/* Forward declarations; the initialised definitions appear later in this file. */
53 static const struct super_operations jfs_super_operations;
54 static const struct export_operations jfs_export_operations;
55 static struct file_system_type jfs_fs_type;
/* Upper bound on the number of commit threads; also sizes jfsCommitThread[]. */
57 #define MAX_COMMIT_THREADS 64
/*
 * Requested number of commit threads (module parameter).  init_jfs_fs()
 * replaces values below 1 with num_online_cpus() and clamps the result to
 * MAX_COMMIT_THREADS.
 */
58 static int commit_threads = 0;
59 module_param(commit_threads, int, 0);
60 MODULE_PARM_DESC(commit_threads, "Number of commit threads");
/* Handles of the kernel threads started by init_jfs_fs(). */
62 static struct task_struct *jfsCommitThread[MAX_COMMIT_THREADS];
63 struct task_struct *jfsIOthread;
64 struct task_struct *jfsSyncThread;
/* Debug-only log level, exposed as a module parameter with mode 0644. */
66 #ifdef CONFIG_JFS_DEBUG
67 int jfsloglevel = JFS_LOGLEVEL_WARN;
68 module_param(jfsloglevel, int, 0644);
69 MODULE_PARM_DESC(jfsloglevel, "Specify JFS loglevel (0, 1 or 2)");
/*
 * jfs_handle_error - act on a reported filesystem error
 * @sb: superblock of the affected filesystem
 *
 * Tests for a read-only mount, records FM_DIRTY through updateSuper(), and
 * then acts on the JFS_ERR_* policy bits kept in sbi->flag.
 * NOTE(review): the statement guarded by the MS_RDONLY test is not visible
 * in this excerpt - confirm it returns before the superblock is updated.
 */
72 static void jfs_handle_error(struct super_block *sb)
74 struct jfs_sb_info *sbi = JFS_SBI(sb);
76 if (sb->s_flags & MS_RDONLY)
79 updateSuper(sb, FM_DIRTY);
/* JFS_ERR_PANIC is tested first, so it wins over JFS_ERR_REMOUNT_RO. */
81 if (sbi->flag & JFS_ERR_PANIC)
82 panic("JFS (device %s): panic forced after error\n",
84 else if (sbi->flag & JFS_ERR_REMOUNT_RO) {
85 jfs_err("ERROR: (device %s): remounting filesystem "
88 sb->s_flags |= MS_RDONLY;
91 /* nothing is done for continue beyond marking the superblock dirty */
94 void jfs_error(struct super_block *sb, const char * function, ...)
96 static char error_buf[256];
99 va_start(args, function);
100 vsnprintf(error_buf, sizeof(error_buf), function, args);
103 printk(KERN_ERR "ERROR: (device %s): %s\n", sb->s_id, error_buf);
105 jfs_handle_error(sb);
108 static struct inode *jfs_alloc_inode(struct super_block *sb)
110 struct jfs_inode_info *jfs_inode;
112 jfs_inode = kmem_cache_alloc(jfs_inode_cachep, GFP_NOFS);
115 return &jfs_inode->vfs_inode;
118 static void jfs_i_callback(struct rcu_head *head)
120 struct inode *inode = container_of(head, struct inode, i_rcu);
121 struct jfs_inode_info *ji = JFS_IP(inode);
122 kmem_cache_free(jfs_inode_cachep, ji);
125 static void jfs_destroy_inode(struct inode *inode)
127 struct jfs_inode_info *ji = JFS_IP(inode);
129 BUG_ON(!list_empty(&ji->anon_inode_list));
131 spin_lock_irq(&ji->ag_lock);
132 if (ji->active_ag != -1) {
133 struct bmap *bmap = JFS_SBI(inode->i_sb)->bmap;
134 atomic_dec(&bmap->db_active[ji->active_ag]);
137 spin_unlock_irq(&ji->ag_lock);
138 call_rcu(&inode->i_rcu, jfs_i_callback);
/*
 * jfs_statfs - fill in filesystem statistics
 * @dentry: a dentry on the filesystem being queried
 * @buf: kstatfs structure to fill
 *
 * Block figures are read from the block map (sbi->bmap).  The inode figures
 * are an estimate built from the inode map counters and the number of free
 * blocks.  f_fsid is made of two CRC32 values, one per half of sbi->uuid.
 */
141 static int jfs_statfs(struct dentry *dentry, struct kstatfs *buf)
143 struct jfs_sb_info *sbi = JFS_SBI(dentry->d_sb);
145 struct inomap *imap = JFS_IP(sbi->ipimap)->i_imap;
147 jfs_info("In jfs_statfs");
148 buf->f_type = JFS_SUPER_MAGIC;
149 buf->f_bsize = sbi->bsize;
150 buf->f_blocks = sbi->bmap->db_mapsize;
/* Free and available block counts are both reported as db_nfree. */
151 buf->f_bfree = sbi->bmap->db_nfree;
152 buf->f_bavail = sbi->bmap->db_nfree;
154 * If we really return the number of allocated & free inodes, some
155 * applications will fail because they won't see enough free inodes.
156 * We'll try to calculate some guess as to how may inodes we can
159 * buf->f_files = atomic_read(&imap->im_numinos);
160 * buf->f_ffree = atomic_read(&imap->im_numfree);
/*
 * im_numinos plus ((db_nfree >> im_l2nbperiext) << L2INOSPEREXT), clamped
 * to 0xffffffff.
 */
162 maxinodes = min((s64) atomic_read(&imap->im_numinos) +
163 ((sbi->bmap->db_nfree >> imap->im_l2nbperiext)
164 << L2INOSPEREXT), (s64) 0xffffffffLL);
165 buf->f_files = maxinodes;
/* Free inodes = estimate minus the inodes in use (im_numinos - im_numfree). */
166 buf->f_ffree = maxinodes - (atomic_read(&imap->im_numinos) -
167 atomic_read(&imap->im_numfree));
/* val[0] covers the first half of the uuid, val[1] the second half. */
168 buf->f_fsid.val[0] = (u32)crc32_le(0, sbi->uuid, sizeof(sbi->uuid)/2);
169 buf->f_fsid.val[1] = (u32)crc32_le(0, sbi->uuid + sizeof(sbi->uuid)/2,
170 sizeof(sbi->uuid)/2);
172 buf->f_namelen = JFS_NAME_MAX;
/*
 * jfs_put_super - release per-superblock state
 * @sb: superblock being released
 *
 * Disables quota usage and limits for all quota types, logs a failed
 * unmount, unloads the NLS table, and drops the direct-mapping inode after
 * truncating its page cache.
 * NOTE(review): the call that produces rc is not visible in this excerpt.
 */
176 static void jfs_put_super(struct super_block *sb)
178 struct jfs_sb_info *sbi = JFS_SBI(sb);
181 jfs_info("In jfs_put_super");
183 dquot_disable(sb, -1, DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED);
187 jfs_err("jfs_umount failed with return code %d", rc);
189 unload_nls(sbi->nls_tab);
/* Discard every cached page of the direct mapping before the final iput(). */
191 truncate_inode_pages(sbi->direct_inode->i_mapping, 0);
192 iput(sbi->direct_inode);
/* Identifiers that match_token() yields for the entries of tokens[]. */
198 Opt_integrity, Opt_nointegrity, Opt_iocharset, Opt_resize,
199 Opt_resize_nosize, Opt_errors, Opt_ignore, Opt_err, Opt_quota,
200 Opt_usrquota, Opt_grpquota, Opt_uid, Opt_gid, Opt_umask
/*
 * Mount option patterns handed to match_token() by parse_options().
 * Patterns with %s or %u capture their value into args[0].
 * NOTE(review): "quota" is mapped to Opt_ignore even though Opt_quota is
 * declared in the token enum - confirm which token is intended.
 */
203 static const match_table_t tokens = {
204 {Opt_integrity, "integrity"},
205 {Opt_nointegrity, "nointegrity"},
206 {Opt_iocharset, "iocharset=%s"},
207 {Opt_resize, "resize=%u"},
208 {Opt_resize_nosize, "resize"},
209 {Opt_errors, "errors=%s"},
210 {Opt_ignore, "noquota"},
211 {Opt_ignore, "quota"},
212 {Opt_usrquota, "usrquota"},
213 {Opt_grpquota, "grpquota"},
216 {Opt_umask, "umask=%u"},
/*
 * parse_options - parse a comma-separated mount option string
 * @options: option string; it is split in place by strsep()
 * @sb: superblock being mounted or remounted
 * @newLVSize: receives the value of "resize=<n>", or for a bare "resize"
 *             the block device size shifted right by s_blocksize_bits
 *
 * Flag changes are written through the `flag` pointer used in the body; its
 * declaration is on a signature line not visible in this excerpt.  uid, gid
 * and umask are stored directly in the jfs_sb_info, and a newly loaded NLS
 * table replaces sbi->nls_tab once the whole string has been processed.
 * Both visible callers treat a zero return as failure.
 */
220 static int parse_options(char *options, struct super_block *sb, s64 *newLVSize,
223 void *nls_map = (void *)-1; /* -1: no change; NULL: none */
225 struct jfs_sb_info *sbi = JFS_SBI(sb);
232 while ((p = strsep(&options, ",")) != NULL) {
233 substring_t args[MAX_OPT_ARGS];
238 token = match_token(p, tokens, args);
241 *flag &= ~JFS_NOINTEGRITY;
243 case Opt_nointegrity:
244 *flag |= JFS_NOINTEGRITY;
247 /* Silently ignore the quota options */
248 /* Don't do anything ;-) */
/* An iocharset given earlier in the same string left a table loaded. */
251 if (nls_map && nls_map != (void *) -1)
253 if (!strcmp(args[0].from, "none"))
256 nls_map = load_nls(args[0].from);
259 "JFS: charset not found\n");
266 char *resize = args[0].from;
/* Base 0: the prefix of the number selects decimal, octal or hex. */
267 *newLVSize = simple_strtoull(resize, &resize, 0);
270 case Opt_resize_nosize:
272 *newLVSize = sb->s_bdev->bd_inode->i_size >>
273 sb->s_blocksize_bits;
276 "JFS: Cannot determine volume size\n");
281 char *errors = args[0].from;
282 if (!errors || !*errors)
/* The three error policies are mutually exclusive: set one, clear the others. */
284 if (!strcmp(errors, "continue")) {
285 *flag &= ~JFS_ERR_REMOUNT_RO;
286 *flag &= ~JFS_ERR_PANIC;
287 *flag |= JFS_ERR_CONTINUE;
288 } else if (!strcmp(errors, "remount-ro")) {
289 *flag &= ~JFS_ERR_CONTINUE;
290 *flag &= ~JFS_ERR_PANIC;
291 *flag |= JFS_ERR_REMOUNT_RO;
292 } else if (!strcmp(errors, "panic")) {
293 *flag &= ~JFS_ERR_CONTINUE;
294 *flag &= ~JFS_ERR_REMOUNT_RO;
295 *flag |= JFS_ERR_PANIC;
298 "JFS: %s is an invalid error handler\n",
308 *flag |= JFS_USRQUOTA;
311 *flag |= JFS_GRPQUOTA;
318 "JFS: quota operations not supported\n");
323 char *uid = args[0].from;
/* The numeric id is mapped into the mounting task's user namespace. */
324 uid_t val = simple_strtoul(uid, &uid, 0);
325 sbi->uid = make_kuid(current_user_ns(), val);
326 if (!uid_valid(sbi->uid))
332 char *gid = args[0].from;
333 gid_t val = simple_strtoul(gid, &gid, 0);
334 sbi->gid = make_kgid(current_user_ns(), val);
335 if (!gid_valid(sbi->gid))
341 char *umask = args[0].from;
/* umask is parsed as octal; bits outside 0777 are rejected. */
342 sbi->umask = simple_strtoul(umask, &umask, 8);
343 if (sbi->umask & ~0777) {
345 "JFS: Invalid value of umask\n");
351 printk("jfs: Unrecognized mount option \"%s\" "
352 " or missing value\n", p);
/* Install the new NLS table only if an iocharset option was seen. */
357 if (nls_map != (void *) -1) {
358 /* Discard old (if remount) */
359 unload_nls(sbi->nls_tab);
360 sbi->nls_tab = nls_map;
365 if (nls_map && nls_map != (void *) -1)
/*
 * jfs_remount - apply a remount request
 * @sb: superblock being remounted
 * @flags: requested mount flags; only MS_RDONLY is examined in the visible code
 * @data: option string, parsed by parse_options()
 *
 * Options are parsed into a local copy of the mount flag word, which is
 * stored back into the jfs_sb_info on the paths below.  Handles a resize
 * request (which needs a read-write mount), the read-only to read-write
 * and read-write to read-only transitions, and a change of the
 * JFS_NOINTEGRITY bit on a read-write mount.
 */
370 static int jfs_remount(struct super_block *sb, int *flags, char *data)
374 int flag = JFS_SBI(sb)->flag;
377 if (!parse_options(data, sb, &newLVSize, &flag)) {
382 if (sb->s_flags & MS_RDONLY) {
384 "JFS: resize requires volume to be mounted read-write\n");
387 rc = jfs_extendfs(sb, newLVSize, 0);
/* Transition: currently read-only, read-write requested. */
392 if ((sb->s_flags & MS_RDONLY) && !(*flags & MS_RDONLY)) {
394 * Invalidate any previously read metadata. fsck may have
395 * changed the on-disk data since we mounted r/o
397 truncate_inode_pages(JFS_SBI(sb)->direct_inode->i_mapping, 0);
399 JFS_SBI(sb)->flag = flag;
400 ret = jfs_mount_rw(sb, 1);
402 /* mark the fs r/w for quota activity */
403 sb->s_flags &= ~MS_RDONLY;
405 dquot_resume(sb, -1);
/* Transition: currently read-write, read-only requested. */
408 if ((!(sb->s_flags & MS_RDONLY)) && (*flags & MS_RDONLY)) {
409 rc = dquot_suspend(sb, -1);
413 rc = jfs_umount_rw(sb);
414 JFS_SBI(sb)->flag = flag;
/*
 * The integrity setting changed on a read-write mount: jfs_umount_rw()
 * followed by jfs_mount_rw() with the new flag word in place.
 */
417 if ((JFS_SBI(sb)->flag & JFS_NOINTEGRITY) != (flag & JFS_NOINTEGRITY))
418 if (!(sb->s_flags & MS_RDONLY)) {
419 rc = jfs_umount_rw(sb);
423 JFS_SBI(sb)->flag = flag;
424 ret = jfs_mount_rw(sb, 1);
427 JFS_SBI(sb)->flag = flag;
/*
 * jfs_fill_super - set up a superblock at mount time
 * @sb: superblock to initialise
 * @data: mount option string, passed to parse_options()
 * @silent: not referenced in the visible code
 *
 * Allocates the jfs_sb_info, parses options, sets the block size and the
 * operation vectors, creates the direct-mapping inode used for metadata
 * I/O, mounts the filesystem (read-write unless MS_RDONLY) and installs the
 * root dentry.  The tail of the function is the error unwind.
 * ret starts as -EINVAL; on a failed root-inode lookup it is replaced by
 * PTR_ERR(inode).
 */
432 static int jfs_fill_super(struct super_block *sb, void *data, int silent)
434 struct jfs_sb_info *sbi;
438 int flag, ret = -EINVAL;
440 jfs_info("In jfs_read_super: s_flags=0x%lx", sb->s_flags);
442 if (!new_valid_dev(sb->s_bdev->bd_dev))
445 sbi = kzalloc(sizeof (struct jfs_sb_info), GFP_KERNEL);
450 sb->s_max_links = JFS_LINK_MAX;
/* uid/gid start out invalid, meaning no override was given. */
452 sbi->uid = INVALID_UID;
453 sbi->gid = INVALID_GID;
456 /* initialize the mount flag and determine the default error handler */
457 flag = JFS_ERR_REMOUNT_RO;
459 if (!parse_options((char *) data, sb, &newLVSize, &flag))
463 #ifdef CONFIG_JFS_POSIX_ACL
464 sb->s_flags |= MS_POSIXACL;
468 printk(KERN_ERR "resize option for remount only\n");
473 * Initialize blocksize to 4K.
475 sb_set_blocksize(sb, PSIZE);
478 * Set method vectors.
480 sb->s_op = &jfs_super_operations;
481 sb->s_export_op = &jfs_export_operations;
483 sb->dq_op = &dquot_operations;
484 sb->s_qcop = &dquot_quotactl_ops;
488 * Initialize direct-mapping inode/address-space
490 inode = new_inode(sb);
/* The direct inode is given the size of the whole block device. */
496 inode->i_size = sb->s_bdev->bd_inode->i_size;
497 inode->i_mapping->a_ops = &jfs_metapage_aops;
498 insert_inode_hash(inode);
499 mapping_set_gfp_mask(inode->i_mapping, GFP_NOFS);
501 sbi->direct_inode = inode;
506 jfs_err("jfs_mount failed w/return code = %d", rc);
508 goto out_mount_failed;
510 if (sb->s_flags & MS_RDONLY)
513 rc = jfs_mount_rw(sb, 0);
516 jfs_err("jfs_mount_rw failed, return code = %d",
523 sb->s_magic = JFS_SUPER_MAGIC;
/* Volumes flagged JFS_OS2 get the jfs_ci_dentry_operations table. */
525 if (sbi->mntflag & JFS_OS2)
526 sb->s_d_op = &jfs_ci_dentry_operations;
528 inode = jfs_iget(sb, ROOT_I);
530 ret = PTR_ERR(inode);
533 sb->s_root = d_make_root(inode);
537 /* logical blocks are represented by 40 bits in pxd_t, etc. */
538 sb->s_maxbytes = ((u64) sb->s_blocksize) << 40;
539 #if BITS_PER_LONG == 32
541 * Page cache is indexed by long.
542 * I would use MAX_LFS_FILESIZE, but it's only half as big
544 sb->s_maxbytes = min(((u64) PAGE_CACHE_SIZE << 32) - 1, (u64)sb->s_maxbytes);
550 jfs_err("jfs_read_super: get root dentry failed");
555 jfs_err("jfs_umount failed with return code %d", rc);
/* Error unwind: write back and drop the direct mapping, then release the inode. */
558 filemap_write_and_wait(sbi->direct_inode->i_mapping);
559 truncate_inode_pages(sbi->direct_inode->i_mapping, 0);
560 make_bad_inode(sbi->direct_inode);
561 iput(sbi->direct_inode);
562 sbi->direct_inode = NULL;
565 unload_nls(sbi->nls_tab);
/*
 * jfs_freeze - freeze_fs super operation
 * @sb: superblock being frozen
 *
 * Only acts on read-write mounts; the visible step records FM_CLEAN
 * through updateSuper().
 * NOTE(review): the statements between the read-only test and updateSuper()
 * are not visible in this excerpt.
 */
571 static int jfs_freeze(struct super_block *sb)
573 struct jfs_sb_info *sbi = JFS_SBI(sb);
574 struct jfs_log *log = sbi->log;
576 if (!(sb->s_flags & MS_RDONLY)) {
579 updateSuper(sb, FM_CLEAN);
/*
 * jfs_unfreeze - unfreeze_fs super operation
 * @sb: superblock being thawed
 *
 * On read-write mounts, records FM_MOUNT through updateSuper() and
 * re-initialises the log with lmLogInit(), logging a failure of the latter.
 */
584 static int jfs_unfreeze(struct super_block *sb)
586 struct jfs_sb_info *sbi = JFS_SBI(sb);
587 struct jfs_log *log = sbi->log;
590 if (!(sb->s_flags & MS_RDONLY)) {
591 updateSuper(sb, FM_MOUNT);
592 if ((rc = lmLogInit(log)))
593 jfs_err("jfs_unlock failed with return code %d", rc);
/*
 * jfs_do_mount - .mount callback of jfs_fs_type
 *
 * Forwards all arguments to mount_bdev(), with jfs_fill_super() as the
 * superblock fill routine.
 */
600 static struct dentry *jfs_do_mount(struct file_system_type *fs_type,
601 int flags, const char *dev_name, void *data)
603 return mount_bdev(fs_type, flags, dev_name, data, jfs_fill_super);
/*
 * jfs_sync_fs - sync_fs super operation
 * @sb: superblock to sync
 * @wait: passed through to jfs_flush_journal()
 *
 * Writes back quota structures for all quota types, then flushes the
 * journal.
 */
606 static int jfs_sync_fs(struct super_block *sb, int wait)
608 struct jfs_log *log = JFS_SBI(sb)->log;
610 /* log == NULL indicates read-only mount */
613 * Write quota structures to quota file, sync_blockdev() will
614 * write them to disk later
616 dquot_writeback_dquots(sb, -1);
617 jfs_flush_journal(log, wait);
/*
 * jfs_show_options - show_options super operation
 * @seq: seq_file the option text is appended to
 * @root: root dentry of the mount
 *
 * Emits each option as ",name" or ",name=value".  uid and gid are
 * translated into init_user_ns and shown only when valid.  The
 * JFS_ERR_REMOUNT_RO policy produces no output in the visible code.
 * NOTE(review): uid and gid are printed with %d - confirm whether %u is
 * intended for ids above INT_MAX.
 */
624 static int jfs_show_options(struct seq_file *seq, struct dentry *root)
626 struct jfs_sb_info *sbi = JFS_SBI(root->d_sb);
628 if (uid_valid(sbi->uid))
629 seq_printf(seq, ",uid=%d", from_kuid(&init_user_ns, sbi->uid));
630 if (gid_valid(sbi->gid))
631 seq_printf(seq, ",gid=%d", from_kgid(&init_user_ns, sbi->gid));
/* A umask of -1 is treated as "not set" and is not shown. */
632 if (sbi->umask != -1)
633 seq_printf(seq, ",umask=%03o", sbi->umask);
634 if (sbi->flag & JFS_NOINTEGRITY)
635 seq_puts(seq, ",nointegrity");
637 seq_printf(seq, ",iocharset=%s", sbi->nls_tab->charset);
638 if (sbi->flag & JFS_ERR_CONTINUE)
639 seq_printf(seq, ",errors=continue");
640 if (sbi->flag & JFS_ERR_PANIC)
641 seq_printf(seq, ",errors=panic");
644 if (sbi->flag & JFS_USRQUOTA)
645 seq_puts(seq, ",usrquota");
647 if (sbi->flag & JFS_GRPQUOTA)
648 seq_puts(seq, ",grpquota");
656 /* Read data from quotafile - avoid pagecache and such because we cannot afford
657 * acquiring the locks... As quota files are never truncated and quota code
658 * itself serializes the operations (and no one else should touch the files)
659 * we don't have to be afraid of races */
/*
 * @sb: superblock owning the quota file
 * @type: index into sb_dqopt(sb)->files[]
 * @data: destination buffer
 * @len: number of bytes requested
 * @off: byte offset into the quota file
 *
 * Works block by block: each file block is mapped with jfs_get_block(), and
 * the bytes are copied out of a buffer obtained with sb_bread(); an
 * unmapped block reads as zeroes.
 */
660 static ssize_t jfs_quota_read(struct super_block *sb, int type, char *data,
661 size_t len, loff_t off)
663 struct inode *inode = sb_dqopt(sb)->files[type];
664 sector_t blk = off >> sb->s_blocksize_bits;
666 int offset = off & (sb->s_blocksize - 1);
669 struct buffer_head tmp_bh;
670 struct buffer_head *bh;
671 loff_t i_size = i_size_read(inode);
675 if (off+len > i_size)
/* Copy at most up to the end of the current block. */
679 tocopy = sb->s_blocksize - offset < toread ?
680 sb->s_blocksize - offset : toread;
683 tmp_bh.b_size = 1 << inode->i_blkbits;
/* Last argument 0: look the block up without allocating. */
684 err = jfs_get_block(inode, blk, &tmp_bh, 0);
687 if (!buffer_mapped(&tmp_bh)) /* A hole? */
688 memset(data, 0, tocopy);
690 bh = sb_bread(sb, tmp_bh.b_blocknr);
693 memcpy(data, bh->b_data+offset, tocopy);
704 /* Write to quotafile */
/*
 * @sb: superblock owning the quota file
 * @type: index into sb_dqopt(sb)->files[]
 * @data: source buffer
 * @len: number of bytes to write
 * @off: byte offset into the quota file
 *
 * Runs under the quota inode's i_mutex.  Each block is mapped with
 * jfs_get_block() in create mode and written through the buffer cache.
 * If anything was written, i_size is grown to cover it, the timestamps are
 * updated and the number of bytes written (len - towrite) is returned.
 */
705 static ssize_t jfs_quota_write(struct super_block *sb, int type,
706 const char *data, size_t len, loff_t off)
708 struct inode *inode = sb_dqopt(sb)->files[type];
709 sector_t blk = off >> sb->s_blocksize_bits;
711 int offset = off & (sb->s_blocksize - 1);
713 size_t towrite = len;
714 struct buffer_head tmp_bh;
715 struct buffer_head *bh;
717 mutex_lock(&inode->i_mutex);
718 while (towrite > 0) {
719 tocopy = sb->s_blocksize - offset < towrite ?
720 sb->s_blocksize - offset : towrite;
723 tmp_bh.b_size = 1 << inode->i_blkbits;
724 err = jfs_get_block(inode, blk, &tmp_bh, 1);
/*
 * A partial-block write must read the existing contents first; a write
 * covering the whole block only needs the buffer itself.
 */
727 if (offset || tocopy != sb->s_blocksize)
728 bh = sb_bread(sb, tmp_bh.b_blocknr);
730 bh = sb_getblk(sb, tmp_bh.b_blocknr);
736 memcpy(bh->b_data+offset, data, tocopy);
737 flush_dcache_page(bh->b_page);
738 set_buffer_uptodate(bh);
739 mark_buffer_dirty(bh);
/* len == towrite means nothing was written. */
748 if (len == towrite) {
749 mutex_unlock(&inode->i_mutex);
752 if (inode->i_size < off+len-towrite)
753 i_size_write(inode, off+len-towrite);
755 inode->i_mtime = inode->i_ctime = CURRENT_TIME;
756 mark_inode_dirty(inode);
757 mutex_unlock(&inode->i_mutex);
758 return len - towrite;
/* Superblock operations; installed as sb->s_op by jfs_fill_super(). */
763 static const struct super_operations jfs_super_operations = {
764 .alloc_inode = jfs_alloc_inode,
765 .destroy_inode = jfs_destroy_inode,
766 .dirty_inode = jfs_dirty_inode,
767 .write_inode = jfs_write_inode,
768 .evict_inode = jfs_evict_inode,
769 .put_super = jfs_put_super,
770 .sync_fs = jfs_sync_fs,
771 .freeze_fs = jfs_freeze,
772 .unfreeze_fs = jfs_unfreeze,
773 .statfs = jfs_statfs,
774 .remount_fs = jfs_remount,
775 .show_options = jfs_show_options,
777 .quota_read = jfs_quota_read,
778 .quota_write = jfs_quota_write,
/* Export operations; installed as sb->s_export_op by jfs_fill_super(). */
782 static const struct export_operations jfs_export_operations = {
783 .fh_to_dentry = jfs_fh_to_dentry,
784 .fh_to_parent = jfs_fh_to_parent,
785 .get_parent = jfs_get_parent,
/*
 * Filesystem type registered by init_jfs_fs() and unregistered by
 * exit_jfs_fs().  FS_REQUIRES_DEV is set and the superblock is torn down
 * with kill_block_super().
 */
788 static struct file_system_type jfs_fs_type = {
789 .owner = THIS_MODULE,
791 .mount = jfs_do_mount,
792 .kill_sb = kill_block_super,
793 .fs_flags = FS_REQUIRES_DEV,
796 static void init_once(void *foo)
798 struct jfs_inode_info *jfs_ip = (struct jfs_inode_info *) foo;
800 memset(jfs_ip, 0, sizeof(struct jfs_inode_info));
801 INIT_LIST_HEAD(&jfs_ip->anon_inode_list);
802 init_rwsem(&jfs_ip->rdwrlock);
803 mutex_init(&jfs_ip->commit_mutex);
804 init_rwsem(&jfs_ip->xattr_sem);
805 spin_lock_init(&jfs_ip->ag_lock);
806 jfs_ip->active_ag = -1;
807 inode_init_once(&jfs_ip->vfs_inode);
/*
 * init_jfs_fs - module initialisation
 *
 * Creates the "jfs_ip" inode cache, initialises the metapage layer and the
 * transaction manager, starts the I/O, commit and sync kernel threads, and
 * registers the filesystem type.  The tail of the function stops the
 * threads and destroys the inode cache again.
 */
810 static int __init init_jfs_fs(void)
816 kmem_cache_create("jfs_ip", sizeof(struct jfs_inode_info), 0,
817 SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD,
819 if (jfs_inode_cachep == NULL)
823 * Metapage initialization
825 rc = metapage_init();
827 jfs_err("metapage_init failed w/rc = %d", rc);
832 * Transaction Manager initialization
836 jfs_err("txInit failed w/rc = %d", rc);
841 * I/O completion thread (endio)
843 jfsIOthread = kthread_run(jfsIOWait, NULL, "jfsIO");
844 if (IS_ERR(jfsIOthread)) {
845 rc = PTR_ERR(jfsIOthread);
846 jfs_err("init_jfs_fs: fork failed w/rc = %d", rc);
/* Default to one commit thread per online CPU, capped at MAX_COMMIT_THREADS. */
850 if (commit_threads < 1)
851 commit_threads = num_online_cpus();
852 if (commit_threads > MAX_COMMIT_THREADS)
853 commit_threads = MAX_COMMIT_THREADS;
855 for (i = 0; i < commit_threads; i++) {
856 jfsCommitThread[i] = kthread_run(jfs_lazycommit, NULL, "jfsCommit");
857 if (IS_ERR(jfsCommitThread[i])) {
858 rc = PTR_ERR(jfsCommitThread[i]);
859 jfs_err("init_jfs_fs: fork failed w/rc = %d", rc);
861 goto kill_committask;
865 jfsSyncThread = kthread_run(jfs_sync, NULL, "jfsSync");
866 if (IS_ERR(jfsSyncThread)) {
867 rc = PTR_ERR(jfsSyncThread);
868 jfs_err("init_jfs_fs: fork failed w/rc = %d", rc);
869 goto kill_committask;
876 rc = register_filesystem(&jfs_fs_type);
883 kthread_stop(jfsSyncThread);
/*
 * NOTE(review): this loop stops commit_threads threads.  When thread
 * creation failed part-way, only the first i entries hold running threads -
 * confirm commit_threads is lowered to i before the goto (not visible here).
 */
885 for (i = 0; i < commit_threads; i++)
886 kthread_stop(jfsCommitThread[i]);
887 kthread_stop(jfsIOthread);
893 kmem_cache_destroy(jfs_inode_cachep);
/*
 * exit_jfs_fs - module teardown
 *
 * Stops the I/O, commit and sync threads, unregisters the filesystem type
 * and destroys the inode cache.
 * NOTE(review): jfs_destroy_inode() frees inodes through call_rcu();
 * confirm that pending RCU callbacks are drained before
 * kmem_cache_destroy() runs.
 */
897 static void __exit exit_jfs_fs(void)
901 jfs_info("exit_jfs_fs called");
906 kthread_stop(jfsIOthread);
907 for (i = 0; i < commit_threads; i++)
908 kthread_stop(jfsCommitThread[i]);
909 kthread_stop(jfsSyncThread);
913 unregister_filesystem(&jfs_fs_type);
914 kmem_cache_destroy(jfs_inode_cachep);
/* Register init_jfs_fs() and exit_jfs_fs() as the module entry and exit points. */
917 module_init(init_jfs_fs)
918 module_exit(exit_jfs_fs)