/* * Copyright 2000 by Hans Reiser, licensing governed by reiserfs/README * * Trivial changes by Alan Cox to add the LFS fixes * * Trivial Changes: * Rights granted to Hans Reiser to redistribute under other terms providing * he accepts all liability including but not limited to patent, fitness * for purpose, and direct or indirect claims arising from failure to perform. * * NO WARRANTY */ #include #include #include #include #include #include #include #include #include #include #include struct file_system_type reiserfs_fs_type; const char reiserfs_3_5_magic_string[] = REISERFS_SUPER_MAGIC_STRING; const char reiserfs_3_6_magic_string[] = REISER2FS_SUPER_MAGIC_STRING; const char reiserfs_jr_magic_string[] = REISER2FS_JR_SUPER_MAGIC_STRING; int is_reiserfs_3_5 (struct reiserfs_super_block * rs) { return !strncmp (rs->s_v1.s_magic, reiserfs_3_5_magic_string, strlen (reiserfs_3_5_magic_string)); } int is_reiserfs_3_6 (struct reiserfs_super_block * rs) { return !strncmp (rs->s_v1.s_magic, reiserfs_3_6_magic_string, strlen (reiserfs_3_6_magic_string)); } int is_reiserfs_jr (struct reiserfs_super_block * rs) { return !strncmp (rs->s_v1.s_magic, reiserfs_jr_magic_string, strlen (reiserfs_jr_magic_string)); } static int is_any_reiserfs_magic_string (struct reiserfs_super_block * rs) { return (is_reiserfs_3_5 (rs) || is_reiserfs_3_6 (rs) || is_reiserfs_jr (rs)); } static int reiserfs_remount (struct super_block * s, int * flags, char * data); static int reiserfs_statfs (struct super_block * s, struct kstatfs * buf); static void reiserfs_sync_fs (struct super_block * s) { if (!(s->s_flags & MS_RDONLY)) { struct reiserfs_transaction_handle th; reiserfs_write_lock(s); journal_begin(&th, s, 1); journal_end_sync(&th, s, 1); reiserfs_flush_old_commits(s); s->s_dirt = 0; reiserfs_write_unlock(s); } } static void reiserfs_write_super(struct super_block *s) { reiserfs_sync_fs(s); } static void reiserfs_write_super_lockfs (struct super_block * s) { struct reiserfs_transaction_handle th ; reiserfs_write_lock(s); if (!(s->s_flags & MS_RDONLY)) { journal_begin(&th, s, 1) ; reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1); journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB (s)); reiserfs_block_writes(&th) ; journal_end_sync(&th, s, 1) ; } s->s_dirt = 0; reiserfs_write_unlock(s); } void reiserfs_unlockfs(struct super_block *s) { reiserfs_allow_writes(s) ; } extern const struct key MAX_KEY; /* this is used to delete "save link" when there are no items of a file it points to. It can either happen if unlink is completed but "save unlink" removal, or if file has both unlink and truncate pending and as unlink completes first (because key of "save link" protecting unlink is bigger that a key lf "save link" which protects truncate), so there left no items to make truncate completion on */ static void remove_save_link_only (struct super_block * s, struct key * key, int oid_free) { struct reiserfs_transaction_handle th; /* we are going to do one balancing */ journal_begin (&th, s, JOURNAL_PER_BALANCE_CNT); reiserfs_delete_solid_item (&th, key); if (oid_free) /* removals are protected by direct items */ reiserfs_release_objectid (&th, le32_to_cpu (key->k_objectid)); journal_end (&th, s, JOURNAL_PER_BALANCE_CNT); } /* look for uncompleted unlinks and truncates and complete them */ static void finish_unfinished (struct super_block * s) { INITIALIZE_PATH (path); struct cpu_key max_cpu_key, obj_key; struct key save_link_key; int retval; struct item_head * ih; struct buffer_head * bh; int item_pos; char * item; int done; struct inode * inode; int truncate; /* compose key to look for "save" links */ max_cpu_key.version = KEY_FORMAT_3_5; max_cpu_key.on_disk_key = MAX_KEY; max_cpu_key.key_length = 3; done = 0; REISERFS_SB(s)->s_is_unlinked_ok = 1; while (1) { retval = search_item (s, &max_cpu_key, &path); if (retval != ITEM_NOT_FOUND) { reiserfs_warning ("vs-2140: finish_unfinished: search_by_key returned %d\n", retval); break; } bh = get_last_bh (&path); item_pos = get_item_pos (&path); if (item_pos != B_NR_ITEMS (bh)) { reiserfs_warning ("vs-2060: finish_unfinished: wrong position found\n"); break; } item_pos --; ih = B_N_PITEM_HEAD (bh, item_pos); if (le32_to_cpu (ih->ih_key.k_dir_id) != MAX_KEY_OBJECTID) /* there are no "save" links anymore */ break; save_link_key = ih->ih_key; if (is_indirect_le_ih (ih)) truncate = 1; else truncate = 0; /* reiserfs_iget needs k_dirid and k_objectid only */ item = B_I_PITEM (bh, ih); obj_key.on_disk_key.k_dir_id = le32_to_cpu (*(__u32 *)item); obj_key.on_disk_key.k_objectid = le32_to_cpu (ih->ih_key.k_objectid); obj_key.on_disk_key.u.k_offset_v1.k_offset = 0; obj_key.on_disk_key.u.k_offset_v1.k_uniqueness = 0; pathrelse (&path); inode = reiserfs_iget (s, &obj_key); if (!inode) { /* the unlink almost completed, it just did not manage to remove "save" link and release objectid */ reiserfs_warning ("vs-2180: finish_unfinished: iget failed for %K\n", &obj_key); remove_save_link_only (s, &save_link_key, 1); continue; } if (!truncate && inode->i_nlink) { /* file is not unlinked */ reiserfs_warning ("vs-2185: finish_unfinished: file %K is not unlinked\n", &obj_key); remove_save_link_only (s, &save_link_key, 0); continue; } if (truncate && S_ISDIR (inode->i_mode) ) { /* We got a truncate request for a dir which is impossible. The only imaginable way is to execute unfinished truncate request then boot into old kernel, remove the file and create dir with the same key. */ reiserfs_warning("green-2101: impossible truncate on a directory %k. Please report\n", INODE_PKEY (inode)); remove_save_link_only (s, &save_link_key, 0); truncate = 0; iput (inode); continue; } if (truncate) { REISERFS_I(inode) -> i_flags |= i_link_saved_truncate_mask; /* not completed truncate found. New size was committed together with "save" link */ reiserfs_warning ("Truncating %k to %Ld ..", INODE_PKEY (inode), inode->i_size); reiserfs_truncate_file (inode, 0/*don't update modification time*/); remove_save_link (inode, truncate); } else { REISERFS_I(inode) -> i_flags |= i_link_saved_unlink_mask; /* not completed unlink (rmdir) found */ reiserfs_warning ("Removing %k..", INODE_PKEY (inode)); /* removal gets completed in iput */ } iput (inode); printk ("done\n"); done ++; } REISERFS_SB(s)->s_is_unlinked_ok = 0; pathrelse (&path); if (done) reiserfs_warning ("There were %d uncompleted unlinks/truncates. " "Completed\n", done); } /* to protect file being unlinked from getting lost we "safe" link files being unlinked. This link will be deleted in the same transaction with last item of file. mounting the filesytem we scan all these links and remove files which almost got lost */ void add_save_link (struct reiserfs_transaction_handle * th, struct inode * inode, int truncate) { INITIALIZE_PATH (path); int retval; struct cpu_key key; struct item_head ih; __u32 link; /* file can only get one "save link" of each kind */ RFALSE( truncate && ( REISERFS_I(inode) -> i_flags & i_link_saved_truncate_mask ), "saved link already exists for truncated inode %lx", ( long ) inode -> i_ino ); RFALSE( !truncate && ( REISERFS_I(inode) -> i_flags & i_link_saved_unlink_mask ), "saved link already exists for unlinked inode %lx", ( long ) inode -> i_ino ); /* setup key of "save" link */ key.version = KEY_FORMAT_3_5; key.on_disk_key.k_dir_id = MAX_KEY_OBJECTID; key.on_disk_key.k_objectid = inode->i_ino; if (!truncate) { /* unlink, rmdir, rename */ set_cpu_key_k_offset (&key, 1 + inode->i_sb->s_blocksize); set_cpu_key_k_type (&key, TYPE_DIRECT); /* item head of "safe" link */ make_le_item_head (&ih, &key, key.version, 1 + inode->i_sb->s_blocksize, TYPE_DIRECT, 4/*length*/, 0xffff/*free space*/); } else { /* truncate */ if (S_ISDIR (inode->i_mode)) reiserfs_warning("green-2102: Adding a truncate savelink for a directory %k! Please report\n", INODE_PKEY(inode)); set_cpu_key_k_offset (&key, 1); set_cpu_key_k_type (&key, TYPE_INDIRECT); /* item head of "safe" link */ make_le_item_head (&ih, &key, key.version, 1, TYPE_INDIRECT, 4/*length*/, 0/*free space*/); } key.key_length = 3; /* look for its place in the tree */ retval = search_item (inode->i_sb, &key, &path); if (retval != ITEM_NOT_FOUND) { if ( retval != -ENOSPC ) reiserfs_warning ("vs-2100: add_save_link:" "search_by_key (%K) returned %d\n", &key, retval); pathrelse (&path); return; } /* body of "save" link */ link = INODE_PKEY (inode)->k_dir_id; /* put "save" link inot tree */ retval = reiserfs_insert_item (th, &path, &key, &ih, (char *)&link); if (retval) { if (retval != -ENOSPC) reiserfs_warning ("vs-2120: add_save_link: insert_item returned %d\n", retval); } else { if( truncate ) REISERFS_I(inode) -> i_flags |= i_link_saved_truncate_mask; else REISERFS_I(inode) -> i_flags |= i_link_saved_unlink_mask; } } /* this opens transaction unlike add_save_link */ void remove_save_link (struct inode * inode, int truncate) { struct reiserfs_transaction_handle th; struct key key; /* we are going to do one balancing only */ journal_begin (&th, inode->i_sb, JOURNAL_PER_BALANCE_CNT); /* setup key of "save" link */ key.k_dir_id = cpu_to_le32 (MAX_KEY_OBJECTID); key.k_objectid = INODE_PKEY (inode)->k_objectid; if (!truncate) { /* unlink, rmdir, rename */ set_le_key_k_offset (KEY_FORMAT_3_5, &key, 1 + inode->i_sb->s_blocksize); set_le_key_k_type (KEY_FORMAT_3_5, &key, TYPE_DIRECT); } else { /* truncate */ set_le_key_k_offset (KEY_FORMAT_3_5, &key, 1); set_le_key_k_type (KEY_FORMAT_3_5, &key, TYPE_INDIRECT); } if( ( truncate && ( REISERFS_I(inode) -> i_flags & i_link_saved_truncate_mask ) ) || ( !truncate && ( REISERFS_I(inode) -> i_flags & i_link_saved_unlink_mask ) ) ) reiserfs_delete_solid_item (&th, &key); if (!truncate) { reiserfs_release_objectid (&th, inode->i_ino); REISERFS_I(inode) -> i_flags &= ~i_link_saved_unlink_mask; } else REISERFS_I(inode) -> i_flags &= ~i_link_saved_truncate_mask; journal_end (&th, inode->i_sb, JOURNAL_PER_BALANCE_CNT); } static void reiserfs_put_super (struct super_block * s) { int i; struct reiserfs_transaction_handle th ; /* change file system state to current state if it was mounted with read-write permissions */ if (!(s->s_flags & MS_RDONLY)) { journal_begin(&th, s, 10) ; reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1) ; set_sb_umount_state( SB_DISK_SUPER_BLOCK(s), REISERFS_SB(s)->s_mount_state ); journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB (s)); } /* note, journal_release checks for readonly mount, and can decide not ** to do a journal_end */ journal_release(&th, s) ; for (i = 0; i < SB_BMAP_NR (s); i ++) brelse (SB_AP_BITMAP (s)[i].bh); vfree (SB_AP_BITMAP (s)); brelse (SB_BUFFER_WITH_SB (s)); print_statistics (s); if (REISERFS_SB(s)->s_kmallocs != 0) { reiserfs_warning ("vs-2004: reiserfs_put_super: allocated memory left %d\n", REISERFS_SB(s)->s_kmallocs); } if (REISERFS_SB(s)->reserved_blocks != 0) { reiserfs_warning ("green-2005: reiserfs_put_super: reserved blocks left %d\n", REISERFS_SB(s)->reserved_blocks); } reiserfs_proc_info_done( s ); kfree(s->s_fs_info); s->s_fs_info = NULL; return; } static kmem_cache_t * reiserfs_inode_cachep; static struct inode *reiserfs_alloc_inode(struct super_block *sb) { struct reiserfs_inode_info *ei; ei = (struct reiserfs_inode_info *)kmem_cache_alloc(reiserfs_inode_cachep, SLAB_KERNEL); if (!ei) return NULL; return &ei->vfs_inode; } static void reiserfs_destroy_inode(struct inode *inode) { kmem_cache_free(reiserfs_inode_cachep, REISERFS_I(inode)); } static void init_once(void * foo, kmem_cache_t * cachep, unsigned long flags) { struct reiserfs_inode_info *ei = (struct reiserfs_inode_info *) foo; if ((flags & (SLAB_CTOR_VERIFY|SLAB_CTOR_CONSTRUCTOR)) == SLAB_CTOR_CONSTRUCTOR) { INIT_LIST_HEAD(&ei->i_prealloc_list) ; inode_init_once(&ei->vfs_inode); } } static int init_inodecache(void) { reiserfs_inode_cachep = kmem_cache_create("reiser_inode_cache", sizeof(struct reiserfs_inode_info), 0, SLAB_HWCACHE_ALIGN|SLAB_RECLAIM_ACCOUNT, init_once, NULL); if (reiserfs_inode_cachep == NULL) return -ENOMEM; return 0; } static void destroy_inodecache(void) { if (kmem_cache_destroy(reiserfs_inode_cachep)) printk(KERN_INFO "reiserfs_inode_cache: not all structures were freed\n"); } /* we don't mark inodes dirty, we just log them */ static void reiserfs_dirty_inode (struct inode * inode) { struct reiserfs_transaction_handle th ; if (inode->i_sb->s_flags & MS_RDONLY) { reiserfs_warning("clm-6006: writing inode %lu on readonly FS\n", inode->i_ino) ; return ; } reiserfs_write_lock(inode->i_sb); /* this is really only used for atime updates, so they don't have ** to be included in O_SYNC or fsync */ journal_begin(&th, inode->i_sb, 1) ; reiserfs_update_sd (&th, inode); journal_end(&th, inode->i_sb, 1) ; reiserfs_write_unlock(inode->i_sb); } struct super_operations reiserfs_sops = { .alloc_inode = reiserfs_alloc_inode, .destroy_inode = reiserfs_destroy_inode, .write_inode = reiserfs_write_inode, .dirty_inode = reiserfs_dirty_inode, .delete_inode = reiserfs_delete_inode, .put_super = reiserfs_put_super, .write_super = reiserfs_write_super, .write_super_lockfs = reiserfs_write_super_lockfs, .unlockfs = reiserfs_unlockfs, .statfs = reiserfs_statfs, .remount_fs = reiserfs_remount, }; static struct export_operations reiserfs_export_ops = { .encode_fh = reiserfs_encode_fh, .decode_fh = reiserfs_decode_fh, .get_parent = reiserfs_get_parent, .get_dentry = reiserfs_get_dentry, } ; /* this struct is used in reiserfs_getopt () for containing the value for those mount options that have values rather than being toggles. */ typedef struct { char * value; int setmask; /* bitmask which is to set on mount_options bitmask when this value is found, 0 is no bits are to be changed. */ int clrmask; /* bitmask which is to clear on mount_options bitmask when this value is found, 0 is no bits are to be changed. This is applied BEFORE setmask */ } arg_desc_t; /* this struct is used in reiserfs_getopt() for describing the set of reiserfs mount options */ typedef struct { char * option_name; int arg_required; /* 0 if argument is not required, not 0 otherwise */ const arg_desc_t * values; /* list of values accepted by an option */ int setmask; /* bitmask which is to set on mount_options bitmask when this value is found, 0 is no bits are to be changed. */ int clrmask; /* bitmask which is to clear on mount_options bitmask when this value is found, 0 is no bits are to be changed. This is applied BEFORE setmask */ } opt_desc_t; /* possible values for -o data= */ static const arg_desc_t logging_mode[] = { {"ordered", 1<arg_required otherwise */ static int reiserfs_getopt ( struct super_block * s, char ** cur, opt_desc_t * opts, char ** opt_arg, unsigned long * bit_flags) { char * p; /* foo=bar, ^ ^ ^ | | +-- option_end | +-- arg_start +-- option_start */ const opt_desc_t * opt; const arg_desc_t * arg; p = *cur; /* assume argument cannot contain commas */ *cur = strchr (p, ','); if (*cur) { *(*cur) = '\0'; (*cur) ++; } if ( !strncmp (p, "alloc=", 6) ) { /* Ugly special case, probably we should redo options parser so that it can understand several arguments for some options, also so that it can fill several bitfields with option values. */ if ( reiserfs_parse_alloc_options( s, p + 6) ) { return -1; } else { return 0; } } /* for every option in the list */ for (opt = opts; opt->option_name; opt ++) { if (!strncmp (p, opt->option_name, strlen (opt->option_name))) { if (bit_flags) { *bit_flags &= ~opt->clrmask; *bit_flags |= opt->setmask; } break; } } if (!opt->option_name) { printk ("reiserfs_getopt: unknown option \"%s\"\n", p); return -1; } p += strlen (opt->option_name); switch (*p) { case '=': if (!opt->arg_required) { printk ("reiserfs_getopt: the option \"%s\" does not require an argument\n", opt->option_name); return -1; } break; case 0: if (opt->arg_required) { printk ("reiserfs_getopt: the option \"%s\" requires an argument\n", opt->option_name); return -1; } break; default: printk ("reiserfs_getopt: head of option \"%s\" is only correct\n", opt->option_name); return -1; } /* move to the argument, or to next option if argument is not required */ p ++; if ( opt->arg_required && !strlen (p) ) { /* this catches "option=," */ printk ("reiserfs_getopt: empty argument for \"%s\"\n", opt->option_name); return -1; } if (!opt->values) { /* *=NULLopt_arg contains pointer to argument */ *opt_arg = p; return opt->arg_required; } /* values possible for this option are listed in opt->values */ for (arg = opt->values; arg->value; arg ++) { if (!strcmp (p, arg->value)) { if (bit_flags) { *bit_flags &= ~arg->clrmask; *bit_flags |= arg->setmask; } return opt->arg_required; } } printk ("reiserfs_getopt: bad value \"%s\" for option \"%s\"\n", p, opt->option_name); return -1; } /* returns 0 if something is wrong in option string, 1 - otherwise */ static int reiserfs_parse_options (struct super_block * s, char * options, /* string given via mount's -o */ unsigned long * mount_options, /* after the parsing phase, contains the collection of bitflags defining what mount options were selected. */ unsigned long * blocks, /* strtol-ed from NNN of resize=NNN */ char ** jdev_name, unsigned int * commit_max_age) { int c; char * arg = NULL; char * pos; opt_desc_t opts[] = { {"tails", 't', tails, 0, 0}, /* Compatibility stuff, so that -o notail for old setups still work */ {"notail", 0, 0, 0, (1<s_mount_opt &= ~((1 << REISERFS_DATA_LOG) | (1 << REISERFS_DATA_ORDERED) | (1 << REISERFS_DATA_WRITEBACK)); REISERFS_SB(s)->s_mount_opt |= (1 << mode); } static void handle_data_mode(struct super_block *s, unsigned long mount_options) { if (mount_options & (1 << REISERFS_DATA_LOG)) { if (!reiserfs_data_log(s)) { switch_data_mode(s, REISERFS_DATA_LOG); printk("reiserfs: switching to journaled data mode\n"); } } else if (mount_options & (1 << REISERFS_DATA_ORDERED)) { if (!reiserfs_data_ordered(s)) { switch_data_mode(s, REISERFS_DATA_ORDERED); printk("reiserfs: switching to ordered data mode\n"); } } else if (mount_options & (1 << REISERFS_DATA_WRITEBACK)) { if (!reiserfs_data_writeback(s)) { switch_data_mode(s, REISERFS_DATA_WRITEBACK); printk("reiserfs: switching to writeback data mode\n"); } } } static void handle_attrs( struct super_block *s ) { struct reiserfs_super_block * rs; if( reiserfs_attrs( s ) ) { rs = SB_DISK_SUPER_BLOCK (s); if( old_format_only(s) ) { reiserfs_warning( "reiserfs: cannot support attributes on 3.5.x disk format\n" ); REISERFS_SB(s) -> s_mount_opt &= ~ ( 1 << REISERFS_ATTRS ); return; } if( !( le32_to_cpu( rs -> s_flags ) & reiserfs_attrs_cleared ) ) { reiserfs_warning( "reiserfs: cannot support attributes until flag is set in super-block\n" ); REISERFS_SB(s) -> s_mount_opt &= ~ ( 1 << REISERFS_ATTRS ); } } } static int reiserfs_remount (struct super_block * s, int * mount_flags, char * arg) { struct reiserfs_super_block * rs; struct reiserfs_transaction_handle th ; unsigned long blocks; unsigned long mount_options = REISERFS_SB(s)->s_mount_opt; unsigned long safe_mask = 0; unsigned int commit_max_age = 0; rs = SB_DISK_SUPER_BLOCK (s); if (!reiserfs_parse_options(s, arg, &mount_options, &blocks, NULL, &commit_max_age)) return -EINVAL; handle_attrs(s); /* Add options that are safe here */ safe_mask |= 1 << REISERFS_SMALLTAIL; safe_mask |= 1 << REISERFS_LARGETAIL; safe_mask |= 1 << REISERFS_NO_BORDER; safe_mask |= 1 << REISERFS_NO_UNHASHED_RELOCATION; safe_mask |= 1 << REISERFS_HASHED_RELOCATION; safe_mask |= 1 << REISERFS_TEST4; safe_mask |= 1 << REISERFS_ATTRS; /* Update the bitmask, taking care to keep * the bits we're not allowed to change here */ REISERFS_SB(s)->s_mount_opt = (REISERFS_SB(s)->s_mount_opt & ~safe_mask) | (mount_options & safe_mask); if(commit_max_age != 0) { SB_JOURNAL_MAX_COMMIT_AGE(s) = commit_max_age; SB_JOURNAL_MAX_TRANS_AGE(s) = commit_max_age; } else { /* 0 means restore defaults. */ SB_JOURNAL_MAX_COMMIT_AGE(s) = SB_JOURNAL_DEFAULT_MAX_COMMIT_AGE(s); SB_JOURNAL_MAX_TRANS_AGE(s) = JOURNAL_MAX_TRANS_AGE; } if(blocks) { int rc = reiserfs_resize(s, blocks); if (rc != 0) return rc; } if (*mount_flags & MS_RDONLY) { /* remount read-only */ if (s->s_flags & MS_RDONLY) /* it is read-only already */ return 0; /* try to remount file system with read-only permissions */ if (sb_umount_state(rs) == REISERFS_VALID_FS || REISERFS_SB(s)->s_mount_state != REISERFS_VALID_FS) { return 0; } journal_begin(&th, s, 10) ; /* Mounting a rw partition read-only. */ reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1) ; set_sb_umount_state( rs, REISERFS_SB(s)->s_mount_state ); journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB (s)); } else { /* remount read-write */ if (!(s->s_flags & MS_RDONLY)) return 0; /* We are read-write already */ handle_data_mode(s, mount_options); REISERFS_SB(s)->s_mount_state = sb_umount_state(rs) ; s->s_flags &= ~MS_RDONLY ; /* now it is safe to call journal_begin */ journal_begin(&th, s, 10) ; /* Mount a partition which is read-only, read-write */ reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1) ; REISERFS_SB(s)->s_mount_state = sb_umount_state(rs); s->s_flags &= ~MS_RDONLY; set_sb_umount_state( rs, REISERFS_ERROR_FS ); /* mark_buffer_dirty (SB_BUFFER_WITH_SB (s), 1); */ journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB (s)); REISERFS_SB(s)->s_mount_state = REISERFS_VALID_FS ; } /* this will force a full flush of all journal lists */ SB_JOURNAL(s)->j_must_wait = 1 ; journal_end(&th, s, 10) ; s->s_dirt = 0; if (!( *mount_flags & MS_RDONLY ) ) finish_unfinished( s ); return 0; } /* load_bitmap_info_data - Sets up the reiserfs_bitmap_info structure from disk. * @sb - superblock for this filesystem * @bi - the bitmap info to be loaded. Requires that bi->bh is valid. * * This routine counts how many free bits there are, finding the first zero * as a side effect. Could also be implemented as a loop of test_bit() calls, or * a loop of find_first_zero_bit() calls. This implementation is similar to * find_first_zero_bit(), but doesn't return after it finds the first bit. * Should only be called on fs mount, but should be fairly efficient anyways. * * bi->first_zero_hint is considered unset if it == 0, since the bitmap itself * will * invariably occupt block 0 represented in the bitmap. The only * exception to this is when free_count also == 0, since there will be no * free blocks at all. */ static void load_bitmap_info_data (struct super_block *sb, struct reiserfs_bitmap_info *bi) { unsigned long *cur = (unsigned long *)bi->bh->b_data; while ((char *)cur < (bi->bh->b_data + sb->s_blocksize)) { /* No need to scan if all 0's or all 1's. * Since we're only counting 0's, we can simply ignore all 1's */ if (*cur == 0) { if (bi->first_zero_hint == 0) { bi->first_zero_hint = ((char *)cur - bi->bh->b_data) << 3; } bi->free_count += sizeof(unsigned long)*8; } else if (*cur != ~0L) { int b; for (b = 0; b < sizeof(unsigned long)*8; b++) { if (!reiserfs_test_le_bit (b, cur)) { bi->free_count ++; if (bi->first_zero_hint == 0) bi->first_zero_hint = (((char *)cur - bi->bh->b_data) << 3) + b; } } } cur ++; } #ifdef CONFIG_REISERFS_CHECK // This outputs a lot of unneded info on big FSes // reiserfs_warning ("bitmap loaded from block %d: %d free blocks\n", // bi->bh->b_blocknr, bi->free_count); #endif } static int read_bitmaps (struct super_block * s) { int i, bmap_nr; SB_AP_BITMAP (s) = vmalloc (sizeof (struct reiserfs_bitmap_info) * SB_BMAP_NR(s)); if (SB_AP_BITMAP (s) == 0) return 1; memset (SB_AP_BITMAP (s), 0, sizeof (struct reiserfs_bitmap_info) * SB_BMAP_NR(s)); for (i = 0, bmap_nr = REISERFS_DISK_OFFSET_IN_BYTES / s->s_blocksize + 1; i < SB_BMAP_NR(s); i++, bmap_nr = s->s_blocksize * 8 * i) { SB_AP_BITMAP (s)[i].bh = sb_getblk(s, bmap_nr); if (!buffer_uptodate(SB_AP_BITMAP(s)[i].bh)) ll_rw_block(READ, 1, &SB_AP_BITMAP(s)[i].bh); } for (i = 0; i < SB_BMAP_NR(s); i++) { wait_on_buffer(SB_AP_BITMAP (s)[i].bh); if (!buffer_uptodate(SB_AP_BITMAP(s)[i].bh)) { reiserfs_warning("sh-2029: reiserfs read_bitmaps: " "bitmap block (#%lu) reading failed\n", SB_AP_BITMAP(s)[i].bh->b_blocknr); for (i = 0; i < SB_BMAP_NR(s); i++) brelse(SB_AP_BITMAP(s)[i].bh); vfree(SB_AP_BITMAP(s)); SB_AP_BITMAP(s) = NULL; return 1; } load_bitmap_info_data (s, SB_AP_BITMAP (s) + i); } return 0; } static int read_old_bitmaps (struct super_block * s) { int i ; struct reiserfs_super_block * rs = SB_DISK_SUPER_BLOCK(s); int bmp1 = (REISERFS_OLD_DISK_OFFSET_IN_BYTES / s->s_blocksize) + 1; /* first of bitmap blocks */ /* read true bitmap */ SB_AP_BITMAP (s) = vmalloc (sizeof (struct reiserfs_buffer_info *) * sb_bmap_nr(rs)); if (SB_AP_BITMAP (s) == 0) return 1; memset (SB_AP_BITMAP (s), 0, sizeof (struct reiserfs_buffer_info *) * sb_bmap_nr(rs)); for (i = 0; i < sb_bmap_nr(rs); i ++) { SB_AP_BITMAP (s)[i].bh = sb_bread (s, bmp1 + i); if (!SB_AP_BITMAP (s)[i].bh) return 1; load_bitmap_info_data (s, SB_AP_BITMAP (s) + i); } return 0; } void check_bitmap (struct super_block * s) { int i = 0; int free = 0; char * buf; while (i < SB_BLOCK_COUNT (s)) { buf = SB_AP_BITMAP (s)[i / (s->s_blocksize * 8)].bh->b_data; if (!reiserfs_test_le_bit (i % (s->s_blocksize * 8), buf)) free ++; i ++; } if (free != SB_FREE_BLOCKS (s)) reiserfs_warning ("vs-4000: check_bitmap: %d free blocks, must be %d\n", free, SB_FREE_BLOCKS (s)); } static int read_super_block (struct super_block * s, int offset) { struct buffer_head * bh; struct reiserfs_super_block * rs; int fs_blocksize; bh = sb_bread (s, offset / s->s_blocksize); if (!bh) { printk ("sh-2006: read_super_block: " "bread failed (dev %s, block %lu, size %lu)\n", reiserfs_bdevname (s), offset / s->s_blocksize, s->s_blocksize); return 1; } rs = (struct reiserfs_super_block *)bh->b_data; if (!is_any_reiserfs_magic_string (rs)) { brelse (bh); return 1; } // // ok, reiserfs signature (old or new) found in at the given offset // fs_blocksize = sb_blocksize(rs); brelse (bh); sb_set_blocksize (s, fs_blocksize); bh = sb_bread (s, offset / s->s_blocksize); if (!bh) { printk("sh-2007: read_super_block: " "bread failed (dev %s, block %lu, size %lu)\n", reiserfs_bdevname (s), offset / s->s_blocksize, s->s_blocksize); return 1; } rs = (struct reiserfs_super_block *)bh->b_data; if (sb_blocksize(rs) != s->s_blocksize) { printk ("sh-2011: read_super_block: " "can't find a reiserfs filesystem on (dev %s, block %Lu, size %lu)\n", reiserfs_bdevname (s), (unsigned long long)bh->b_blocknr, s->s_blocksize); brelse (bh); return 1; } if ( rs->s_v1.s_root_block == -1 ) { brelse(bh) ; printk("dev %s: Unfinished reiserfsck --rebuild-tree run detected. Please run\n" "reiserfsck --rebuild-tree and wait for a completion. If that fails\n" "get newer reiserfsprogs package\n", reiserfs_bdevname (s)); return 1; } SB_BUFFER_WITH_SB (s) = bh; SB_DISK_SUPER_BLOCK (s) = rs; if (is_reiserfs_jr (rs)) { /* magic is of non-standard journal filesystem, look at s_version to find which format is in use */ if (sb_version(rs) == REISERFS_VERSION_2) printk ("read_super_block: found reiserfs format \"3.6\" " "with non-standard journal\n"); else if (sb_version(rs) == REISERFS_VERSION_1) printk ("read_super_block: found reiserfs format \"3.5\" " "with non-standard journal\n"); else { printk ("sh-2012: read_super_block: found unknown format \"%u\" " "of reiserfs with non-standard magic\n", sb_version(rs)); return 1; } } else /* s_version of standard format may contain incorrect information, so we just look at the magic string */ printk ("found reiserfs format \"%s\" with standard journal\n", is_reiserfs_3_5 (rs) ? "3.5" : "3.6"); s->s_op = &reiserfs_sops; s->s_export_op = &reiserfs_export_ops; /* new format is limited by the 32 bit wide i_blocks field, want to ** be one full block below that. */ s->s_maxbytes = (512LL << 32) - s->s_blocksize ; return 0; } /* after journal replay, reread all bitmap and super blocks */ static int reread_meta_blocks(struct super_block *s) { int i ; ll_rw_block(READ, 1, &(SB_BUFFER_WITH_SB(s))) ; wait_on_buffer(SB_BUFFER_WITH_SB(s)) ; if (!buffer_uptodate(SB_BUFFER_WITH_SB(s))) { printk("reread_meta_blocks, error reading the super\n") ; return 1 ; } for (i = 0; i < SB_BMAP_NR(s) ; i++) { ll_rw_block(READ, 1, &(SB_AP_BITMAP(s)[i].bh)) ; wait_on_buffer(SB_AP_BITMAP(s)[i].bh) ; if (!buffer_uptodate(SB_AP_BITMAP(s)[i].bh)) { printk("reread_meta_blocks, error reading bitmap block number %d at %llu\n", i, (unsigned long long)SB_AP_BITMAP(s)[i].bh->b_blocknr) ; return 1 ; } } return 0 ; } ///////////////////////////////////////////////////// // hash detection stuff // if root directory is empty - we set default - Yura's - hash and // warn about it // FIXME: we look for only one name in a directory. If tea and yura // bith have the same value - we ask user to send report to the // mailing list __u32 find_hash_out (struct super_block * s) { int retval; struct inode * inode; struct cpu_key key; INITIALIZE_PATH (path); struct reiserfs_dir_entry de; __u32 hash = DEFAULT_HASH; inode = s->s_root->d_inode; do { // Some serious "goto"-hater was there ;) u32 teahash, r5hash, yurahash; make_cpu_key (&key, inode, ~0, TYPE_DIRENTRY, 3); retval = search_by_entry_key (s, &key, &path, &de); if (retval == IO_ERROR) { pathrelse (&path); return UNSET_HASH ; } if (retval == NAME_NOT_FOUND) de.de_entry_num --; set_de_name_and_namelen (&de); if (deh_offset( &(de.de_deh[de.de_entry_num]) ) == DOT_DOT_OFFSET) { /* allow override in this case */ if (reiserfs_rupasov_hash(s)) { hash = YURA_HASH ; } reiserfs_warning("reiserfs: FS seems to be empty, autodetect " "is using the default hash\n"); break; } r5hash=GET_HASH_VALUE (r5_hash (de.de_name, de.de_namelen)); teahash=GET_HASH_VALUE (keyed_hash (de.de_name, de.de_namelen)); yurahash=GET_HASH_VALUE (yura_hash (de.de_name, de.de_namelen)); if ( ( (teahash == r5hash) && (GET_HASH_VALUE( deh_offset(&(de.de_deh[de.de_entry_num]))) == r5hash) ) || ( (teahash == yurahash) && (yurahash == GET_HASH_VALUE( deh_offset(&(de.de_deh[de.de_entry_num])))) ) || ( (r5hash == yurahash) && (yurahash == GET_HASH_VALUE( deh_offset(&(de.de_deh[de.de_entry_num])))) ) ) { reiserfs_warning("reiserfs: Unable to automatically detect hash" "function for device %s\n" "please mount with -o hash={tea,rupasov,r5}\n", reiserfs_bdevname (s)); hash = UNSET_HASH; break; } if (GET_HASH_VALUE( deh_offset(&(de.de_deh[de.de_entry_num])) ) == yurahash) hash = YURA_HASH; else if (GET_HASH_VALUE( deh_offset(&(de.de_deh[de.de_entry_num])) ) == teahash) hash = TEA_HASH; else if (GET_HASH_VALUE( deh_offset(&(de.de_deh[de.de_entry_num])) ) == r5hash) hash = R5_HASH; else { reiserfs_warning("reiserfs: Unrecognised hash function for " "device %s\n", reiserfs_bdevname (s)); hash = UNSET_HASH; } } while (0); pathrelse (&path); return hash; } // finds out which hash names are sorted with static int what_hash (struct super_block * s) { __u32 code; code = sb_hash_function_code(SB_DISK_SUPER_BLOCK(s)); /* reiserfs_hash_detect() == true if any of the hash mount options ** were used. We must check them to make sure the user isn't ** using a bad hash value */ if (code == UNSET_HASH || reiserfs_hash_detect(s)) code = find_hash_out (s); if (code != UNSET_HASH && reiserfs_hash_detect(s)) { /* detection has found the hash, and we must check against the ** mount options */ if (reiserfs_rupasov_hash(s) && code != YURA_HASH) { printk("REISERFS: Error, %s hash detected, " "unable to force rupasov hash\n", reiserfs_hashname(code)) ; code = UNSET_HASH ; } else if (reiserfs_tea_hash(s) && code != TEA_HASH) { printk("REISERFS: Error, %s hash detected, " "unable to force tea hash\n", reiserfs_hashname(code)) ; code = UNSET_HASH ; } else if (reiserfs_r5_hash(s) && code != R5_HASH) { printk("REISERFS: Error, %s hash detected, " "unable to force r5 hash\n", reiserfs_hashname(code)) ; code = UNSET_HASH ; } } else { /* find_hash_out was not called or could not determine the hash */ if (reiserfs_rupasov_hash(s)) { code = YURA_HASH ; } else if (reiserfs_tea_hash(s)) { code = TEA_HASH ; } else if (reiserfs_r5_hash(s)) { code = R5_HASH ; } } /* if we are mounted RW, and we have a new valid hash code, update ** the super */ if (code != UNSET_HASH && !(s->s_flags & MS_RDONLY) && code != sb_hash_function_code(SB_DISK_SUPER_BLOCK(s))) { set_sb_hash_function_code(SB_DISK_SUPER_BLOCK(s), code); } return code; } // return pointer to appropriate function static hashf_t hash_function (struct super_block * s) { switch (what_hash (s)) { case TEA_HASH: reiserfs_warning ("Using tea hash to sort names\n"); return keyed_hash; case YURA_HASH: reiserfs_warning ("Using rupasov hash to sort names\n"); return yura_hash; case R5_HASH: reiserfs_warning ("Using r5 hash to sort names\n"); return r5_hash; } return NULL; } // this is used to set up correct value for old partitions int function2code (hashf_t func) { if (func == keyed_hash) return TEA_HASH; if (func == yura_hash) return YURA_HASH; if (func == r5_hash) return R5_HASH; BUG() ; // should never happen return 0; } #define SPRINTK(silent, ...) \ if (!(silent)) \ printk(__VA_ARGS__) static int reiserfs_fill_super (struct super_block * s, void * data, int silent) { struct inode *root_inode; int j; struct reiserfs_transaction_handle th ; int old_format = 0; unsigned long blocks; unsigned int commit_max_age = 0; int jinit_done = 0 ; struct reiserfs_iget_args args ; struct reiserfs_super_block * rs; char *jdev_name; struct reiserfs_sb_info *sbi; int errval = -EINVAL; sbi = kmalloc(sizeof(struct reiserfs_sb_info), GFP_KERNEL); if (!sbi) { errval = -ENOMEM; goto error; } s->s_fs_info = sbi; memset (sbi, 0, sizeof (struct reiserfs_sb_info)); /* Set default values for options: non-aggressive tails */ REISERFS_SB(s)->s_mount_opt = ( 1 << REISERFS_SMALLTAIL ); /* default block allocator option: skip_busy */ REISERFS_SB(s)->s_alloc_options.bits = ( 1 << 5); /* If file grew past 4 blocks, start preallocation blocks for it. */ REISERFS_SB(s)->s_alloc_options.preallocmin = 4; /* Preallocate by 16 blocks (17-1) at once */ REISERFS_SB(s)->s_alloc_options.preallocsize = 17; jdev_name = NULL; if (reiserfs_parse_options (s, (char *) data, &(sbi->s_mount_opt), &blocks, &jdev_name, &commit_max_age) == 0) { goto error; } if (blocks) { SPRINTK(silent, "jmacd-7: reiserfs_fill_super: resize option for remount only\n"); goto error; } /* try old format (undistributed bitmap, super block in 8-th 1k block of a device) */ if (!read_super_block (s, REISERFS_OLD_DISK_OFFSET_IN_BYTES)) old_format = 1; /* try new format (64-th 1k block), which can contain reiserfs super block */ else if (read_super_block (s, REISERFS_DISK_OFFSET_IN_BYTES)) { SPRINTK(silent, "sh-2021: reiserfs_fill_super: can not find reiserfs on %s\n", reiserfs_bdevname (s)); goto error; } rs = SB_DISK_SUPER_BLOCK (s); /* Let's do basic sanity check to verify that underlying device is not smaller than the filesystem. If the check fails then abort and scream, because bad stuff will happen otherwise. */ if ( s->s_bdev && s->s_bdev->bd_inode && i_size_read(s->s_bdev->bd_inode) < sb_block_count(rs)*sb_blocksize(rs)) { SPRINTK(silent, "Filesystem on %s cannot be mounted because it is bigger than the device\n", reiserfs_bdevname(s)); SPRINTK(silent, "You may need to run fsck or increase size of your LVM partition\n"); SPRINTK(silent, "Or may be you forgot to reboot after fdisk when it told you to\n"); goto error; } sbi->s_mount_state = SB_REISERFS_STATE(s); sbi->s_mount_state = REISERFS_VALID_FS ; if (old_format ? read_old_bitmaps(s) : read_bitmaps(s)) { SPRINTK(silent, "jmacd-8: reiserfs_fill_super: unable to read bitmap\n"); goto error; } #ifdef CONFIG_REISERFS_CHECK SPRINTK(silent, "reiserfs:warning: CONFIG_REISERFS_CHECK is set ON\n"); SPRINTK(silent, "reiserfs:warning: - it is slow mode for debugging.\n"); #endif /* make data=ordered the default */ if (!reiserfs_data_log(s) && !reiserfs_data_ordered(s) && !reiserfs_data_writeback(s)) { REISERFS_SB(s)->s_mount_opt |= (1 << REISERFS_DATA_ORDERED); } if (reiserfs_data_log(s)) { printk("reiserfs: using journaled data mode\n"); } else if (reiserfs_data_ordered(s)) { printk("reiserfs: using ordered data mode\n"); } else { printk("reiserfs: using writeback data mode\n"); } // set_device_ro(s->s_dev, 1) ; if( journal_init(s, jdev_name, old_format, commit_max_age) ) { SPRINTK(silent, "sh-2022: reiserfs_fill_super: unable to initialize journal space\n") ; goto error ; } else { jinit_done = 1 ; /* once this is set, journal_release must be called ** if we error out of the mount */ } if (reread_meta_blocks(s)) { SPRINTK(silent, "jmacd-9: reiserfs_fill_super: unable to reread meta blocks after journal init\n") ; goto error ; } if (replay_only (s)) goto error; if (bdev_read_only(s->s_bdev) && !(s->s_flags & MS_RDONLY)) { SPRINTK(silent, "clm-7000: Detected readonly device, marking FS readonly\n") ; s->s_flags |= MS_RDONLY ; } args.objectid = REISERFS_ROOT_OBJECTID ; args.dirid = REISERFS_ROOT_PARENT_OBJECTID ; root_inode = iget5_locked (s, REISERFS_ROOT_OBJECTID, reiserfs_find_actor, reiserfs_init_locked_inode, (void *)(&args)); if (!root_inode) { SPRINTK(silent, "jmacd-10: reiserfs_fill_super: get root inode failed\n"); goto error; } if (root_inode->i_state & I_NEW) { reiserfs_read_locked_inode(root_inode, &args); unlock_new_inode(root_inode); } s->s_root = d_alloc_root(root_inode); if (!s->s_root) { iput(root_inode); goto error; } // define and initialize hash function sbi->s_hash_function = hash_function (s); if (sbi->s_hash_function == NULL) { dput(s->s_root) ; s->s_root = NULL ; goto error ; } if (is_reiserfs_3_5 (rs) || (is_reiserfs_jr (rs) && SB_VERSION (s) == REISERFS_VERSION_1)) set_bit(REISERFS_3_5, &(sbi->s_properties)); else set_bit(REISERFS_3_6, &(sbi->s_properties)); if (!(s->s_flags & MS_RDONLY)) { journal_begin(&th, s, 1) ; reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1) ; set_sb_umount_state( rs, REISERFS_ERROR_FS ); set_sb_fs_state (rs, 0); if (old_format_only(s)) { /* filesystem of format 3.5 either with standard or non-standard journal */ if (convert_reiserfs (s)) { /* and -o conv is given */ if(!silent) reiserfs_warning ("reiserfs: converting 3.5 filesystem to the 3.6 format\n") ; if (is_reiserfs_3_5 (rs)) /* put magic string of 3.6 format. 2.2 will not be able to mount this filesystem anymore */ memcpy (rs->s_v1.s_magic, reiserfs_3_6_magic_string, sizeof (reiserfs_3_6_magic_string)); set_sb_version(rs,REISERFS_VERSION_2); reiserfs_convert_objectid_map_v1(s) ; set_bit(REISERFS_3_6, &(sbi->s_properties)); clear_bit(REISERFS_3_5, &(sbi->s_properties)); } else if (!silent){ reiserfs_warning("reiserfs: using 3.5.x disk format\n") ; } } journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB (s)); journal_end(&th, s, 1) ; /* look for files which were to be removed in previous session */ finish_unfinished (s); } else { if ( old_format_only(s) && !silent) { reiserfs_warning("reiserfs: using 3.5.x disk format\n") ; } } // mark hash in super block: it could be unset. overwrite should be ok set_sb_hash_function_code( rs, function2code(sbi->s_hash_function ) ); handle_attrs( s ); reiserfs_proc_info_init( s ); init_waitqueue_head (&(sbi->s_wait)); sbi->bitmap_lock = SPIN_LOCK_UNLOCKED; return (0); error: if (jinit_done) { /* kill the commit thread, free journal ram */ journal_release_error(NULL, s) ; } if (SB_DISK_SUPER_BLOCK (s)) { for (j = 0; j < SB_BMAP_NR (s); j ++) { if (SB_AP_BITMAP (s)) brelse (SB_AP_BITMAP (s)[j].bh); } if (SB_AP_BITMAP (s)) vfree (SB_AP_BITMAP (s)); } if (SB_BUFFER_WITH_SB (s)) brelse(SB_BUFFER_WITH_SB (s)); if (sbi != NULL) { kfree(sbi); } s->s_fs_info = NULL; return errval; } static int reiserfs_statfs (struct super_block * s, struct kstatfs * buf) { struct reiserfs_super_block * rs = SB_DISK_SUPER_BLOCK (s); buf->f_namelen = (REISERFS_MAX_NAME (s->s_blocksize)); buf->f_bfree = sb_free_blocks(rs); buf->f_bavail = buf->f_bfree; buf->f_blocks = sb_block_count(rs) - sb_bmap_nr(rs) - 1; buf->f_bsize = s->s_blocksize; /* changed to accommodate gcc folks.*/ buf->f_type = REISERFS_SUPER_MAGIC; return 0; } static struct super_block* get_super_block (struct file_system_type *fs_type, int flags, const char *dev_name, void *data) { return get_sb_bdev(fs_type, flags, dev_name, data, reiserfs_fill_super); } static int __init init_reiserfs_fs ( void ) { int ret; if ((ret = init_inodecache ())) { return ret; } reiserfs_proc_info_global_init (); reiserfs_proc_register_global ("version", reiserfs_global_version_in_proc); ret = register_filesystem (& reiserfs_fs_type); if (ret == 0) { return 0; } reiserfs_proc_unregister_global ("version"); reiserfs_proc_info_global_done (); destroy_inodecache (); return ret; } static void __exit exit_reiserfs_fs ( void ) { reiserfs_proc_unregister_global ("version"); reiserfs_proc_info_global_done (); unregister_filesystem (& reiserfs_fs_type); destroy_inodecache (); } struct file_system_type reiserfs_fs_type = { .owner = THIS_MODULE, .name = "reiserfs", .get_sb = get_super_block, .kill_sb = kill_block_super, .fs_flags = FS_REQUIRES_DEV, }; MODULE_DESCRIPTION ("ReiserFS journaled filesystem"); MODULE_AUTHOR ("Hans Reiser "); MODULE_LICENSE ("GPL"); module_init (init_reiserfs_fs); module_exit (exit_reiserfs_fs);