Message ID | 1320372920-21308-1-git-send-email-adityakali@google.com |
---|---|
State | Superseded, archived |
Headers | show |
This version of the patch enables only the quota usage tracking at mount time as suggested in previous patch. The quota limits enforcement is turned on by calling quotaon quotactl. On Thu, Nov 3, 2011 at 7:15 PM, Aditya Kali <adityakali@google.com> wrote: > This patch is an attempt towards supporting quotas as first class > feature in ext4. It is based on the proposal at: > https://ext4.wiki.kernel.org/index.php/Design_For_1st_Class_Quota_in_Ext4 > This patch introduces a new feature - EXT4_FEATURE_RO_COMPAT_QUOTA which, when > turned on, enables quota accounting at mount time iteself. Also, the > quota inodes are stored in two additional superblock fields. > Some changes introduced by this patch that should be pointed out are: > 1) Two new ext4-superblock fields - s_usr_quota_inum and s_grp_quota_inum > for storing the quota inodes in use. > 2) Default quota inodes are: inode#3 for tracking userquota and inode#4 for > tracking group quota. The superblock fields can be set to use other inodes > as well. > 3) If the QUOTA feature and corresponding quota inodes are set in superblock, > the quota usage tracking is turned on at mount time. On 'quotaon' ioctl, the > quota limits enforcement is turned on. 'quotaoff' ioctl turns off only the > limits enforcement in this case. > 4) When QUOTA feature is in use, the quota mount options 'quota', 'usrquota', > 'grpquota' are ignored by the kernel.. > 5) mke2fs or tune2fs can be used to set the QUOTA feature and initialize quota > inodes. The default reserved inodes will not be visible to user as > regular files. > 6) The quota-tools will need to be modified to support hidden quota files on > ext4. E2fsprogs will also include support for creating and fixing quota > files. > 7) Support is only for the new V2 quota file format. > > Signed-off-by: Aditya Kali <adityakali@google.com> > --- > fs/ext4/ext4.h | 6 ++- > fs/ext4/ext4_jbd2.h | 18 ++++++--- > fs/ext4/super.c | 107 +++++++++++++++++++++++++++++++++++++++++++++++++-- > 3 files changed, 120 insertions(+), 11 deletions(-) > > diff --git a/fs/ext4/ext4.h b/fs/ext4/ext4.h > index 5b0e26a..dccfe65 100644 > --- a/fs/ext4/ext4.h > +++ b/fs/ext4/ext4.h > @@ -1170,6 +1170,7 @@ struct ext4_sb_info { > #ifdef CONFIG_QUOTA > char *s_qf_names[MAXQUOTAS]; /* Names of quota files with journalled quota */ > int s_jquota_fmt; /* Format of quota to use */ > + unsigned long s_qf_inums[MAXQUOTAS]; /* Quota file inodes */ > #endif > unsigned int s_want_extra_isize; /* New inodes should reserve # bytes */ > struct rb_root system_blks; > @@ -1269,6 +1270,8 @@ static inline struct timespec ext4_current_time(struct inode *inode) > static inline int ext4_valid_inum(struct super_block *sb, unsigned long ino) > { > return ino == EXT4_ROOT_INO || > + ino == EXT4_USR_QUOTA_INO || > + ino == EXT4_GRP_QUOTA_INO || > ino == EXT4_JOURNAL_INO || > ino == EXT4_RESIZE_INO || > (ino >= EXT4_FIRST_INO(sb) && > @@ -1440,7 +1443,8 @@ static inline void ext4_clear_state_flags(struct ext4_inode_info *ei) > EXT4_FEATURE_RO_COMPAT_EXTRA_ISIZE | \ > EXT4_FEATURE_RO_COMPAT_BTREE_DIR |\ > EXT4_FEATURE_RO_COMPAT_HUGE_FILE |\ > - EXT4_FEATURE_RO_COMPAT_BIGALLOC) > + EXT4_FEATURE_RO_COMPAT_BIGALLOC | \ > + EXT4_FEATURE_RO_COMPAT_QUOTA) > > /* > * Default values for user and/or group using reserved blocks > diff --git a/fs/ext4/ext4_jbd2.h b/fs/ext4/ext4_jbd2.h > index 5802fa1..45de190 100644 > --- a/fs/ext4/ext4_jbd2.h > +++ b/fs/ext4/ext4_jbd2.h > @@ -87,14 +87,20 @@ > #ifdef CONFIG_QUOTA > /* Amount of blocks needed for quota update - we know that the structure was > * allocated so we need to update only data block */ > -#define EXT4_QUOTA_TRANS_BLOCKS(sb) (test_opt(sb, QUOTA) ? 1 : 0) > +#define EXT4_QUOTA_TRANS_BLOCKS(sb) ((test_opt(sb, QUOTA) ||\ > + EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) ?\ > + 1 : 0) > /* Amount of blocks needed for quota insert/delete - we do some block writes > * but inode, sb and group updates are done only once */ > -#define EXT4_QUOTA_INIT_BLOCKS(sb) (test_opt(sb, QUOTA) ? (DQUOT_INIT_ALLOC*\ > - (EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)+3+DQUOT_INIT_REWRITE) : 0) > - > -#define EXT4_QUOTA_DEL_BLOCKS(sb) (test_opt(sb, QUOTA) ? (DQUOT_DEL_ALLOC*\ > - (EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)+3+DQUOT_DEL_REWRITE) : 0) > +#define EXT4_QUOTA_INIT_BLOCKS(sb) ((test_opt(sb, QUOTA) ||\ > + EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) ?\ > + (DQUOT_INIT_ALLOC*(EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)\ > + +3+DQUOT_INIT_REWRITE) : 0) > + > +#define EXT4_QUOTA_DEL_BLOCKS(sb) ((test_opt(sb, QUOTA) ||\ > + EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) ?\ > + (DQUOT_DEL_ALLOC*(EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)\ > + +3+DQUOT_DEL_REWRITE) : 0) > #else > #define EXT4_QUOTA_TRANS_BLOCKS(sb) 0 > #define EXT4_QUOTA_INIT_BLOCKS(sb) 0 > diff --git a/fs/ext4/super.c b/fs/ext4/super.c > index 9953d80..eb40645 100644 > --- a/fs/ext4/super.c > +++ b/fs/ext4/super.c > @@ -1239,6 +1239,9 @@ static int ext4_mark_dquot_dirty(struct dquot *dquot); > static int ext4_write_info(struct super_block *sb, int type); > static int ext4_quota_on(struct super_block *sb, int type, int format_id, > struct path *path); > +static int ext4_quota_on_meta(struct super_block *sb, int type, int format_id); > +static int ext4_quota_enable(struct super_block *sb, int type, int format_id, > + unsigned int flags); > static int ext4_quota_off(struct super_block *sb, int type); > static int ext4_quota_on_mount(struct super_block *sb, int type); > static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data, > @@ -1266,6 +1269,16 @@ static const struct quotactl_ops ext4_qctl_operations = { > .get_dqblk = dquot_get_dqblk, > .set_dqblk = dquot_set_dqblk > }; > + > +static const struct quotactl_ops ext4_new_qctl_operations = { > + .quota_on_meta = ext4_quota_on_meta, > + .quota_off = ext4_quota_off, > + .quota_sync = dquot_quota_sync, > + .get_info = dquot_get_dqinfo, > + .set_info = dquot_set_dqinfo, > + .get_dqblk = dquot_get_dqblk, > + .set_dqblk = dquot_set_dqblk > +}; > #endif > > static const struct super_operations ext4_sops = { > @@ -3610,6 +3623,15 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent) > #ifdef CONFIG_QUOTA > sb->s_qcop = &ext4_qctl_operations; > sb->dq_op = &ext4_quota_operations; > + > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) { > + /* Use new qctl operations with quota on function that does not > + * require user specified quota file path. */ > + sb->s_qcop = &ext4_new_qctl_operations; > + > + sbi->s_qf_inums[USRQUOTA] = es->s_usr_quota_inum; > + sbi->s_qf_inums[GRPQUOTA] = es->s_grp_quota_inum; > + } > #endif > memcpy(sb->s_uuid, es->s_uuid, sizeof(es->s_uuid)); > > @@ -3815,8 +3837,21 @@ no_journal: > } else > descr = "out journal"; > > - ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. " > - "Opts: %s%s%s", descr, sbi->s_es->s_mount_opts, > +#ifdef CONFIG_QUOTA > + /* Enable quota usage during mount. */ > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA) && > + !(sb->s_flags & MS_RDONLY)) { > + ext4_quota_enable(sb, USRQUOTA, QFMT_VFS_V1, > + DQUOT_USAGE_ENABLED); > + ext4_quota_enable(sb, GRPQUOTA, QFMT_VFS_V1, > + DQUOT_USAGE_ENABLED); > + } > +#endif /* CONFIG_QUOTA */ > + > + ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. quota=%s. " > + "Opts: %s%s%s", descr, > + sb_any_quota_loaded(sb) ? "on" : "off", > + sbi->s_es->s_mount_opts, > *sbi->s_es->s_mount_opts ? "; " : "", orig_data); > > if (es->s_error_count) > @@ -4183,6 +4218,12 @@ static int ext4_commit_super(struct super_block *sb, int sync) > es->s_free_inodes_count = > cpu_to_le32(percpu_counter_sum_positive( > &EXT4_SB(sb)->s_freeinodes_counter)); > +#ifdef CONFIG_QUOTA > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) { > + es->s_usr_quota_inum = EXT4_SB(sb)->s_qf_inums[USRQUOTA]; > + es->s_grp_quota_inum = EXT4_SB(sb)->s_qf_inums[GRPQUOTA]; > + } > +#endif > sb->s_dirt = 0; > BUFFER_TRACE(sbh, "marking dirty"); > mark_buffer_dirty(sbh); > @@ -4775,7 +4816,7 @@ static int ext4_quota_on_mount(struct super_block *sb, int type) > * Standard function to be called on quota_on > */ > static int ext4_quota_on(struct super_block *sb, int type, int format_id, > - struct path *path) > + struct path *path) > { > int err; > > @@ -4814,6 +4855,59 @@ static int ext4_quota_on(struct super_block *sb, int type, int format_id, > return dquot_quota_on(sb, type, format_id, path); > } > > +static int ext4_quota_enable(struct super_block *sb, int type, int format_id, > + unsigned int flags) > +{ > + struct ext4_sb_info *sbi = EXT4_SB(sb); > + struct inode *qf_inode; > + int err; > + > + if (!sbi->s_qf_inums[type]) > + return -EPERM; > + > + qf_inode = ext4_iget(sb, sbi->s_qf_inums[type]); > + if (IS_ERR(qf_inode)) { > + ext4_error(sb, "Bad quota inode # %lu", sbi->s_qf_inums[type]); > + return PTR_ERR(qf_inode); > + } > + > + /* > + * When we journal data on quota file, we have to flush journal to see > + * all updates to the file when we bypass pagecache... > + */ > + if (sbi->s_journal && > + ext4_should_journal_data(qf_inode)) { > + /* > + * We don't need to lock updates but journal_flush() could > + * otherwise be livelocked... > + */ > + jbd2_journal_lock_updates(sbi->s_journal); > + err = jbd2_journal_flush(sbi->s_journal); > + jbd2_journal_unlock_updates(sbi->s_journal); > + if (err) > + return err; > + } > + > + err = dquot_enable(qf_inode, type, format_id, flags); > + iput(qf_inode); > + > + return err; > +} > + > +/* > + * New quota_on function that is used when QUOTA feature is set. > + */ > +static int ext4_quota_on_meta(struct super_block *sb, int type, int format_id) > +{ > + if (!EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) > + return -EINVAL; > + > + /* > + * USAGE was enabled at mount time. Only need to enable LIMITS now. > + */ > + return ext4_quota_enable(sb, type, format_id, DQUOT_LIMITS_ENABLED); > +} > + > static int ext4_quota_off(struct super_block *sb, int type) > { > struct inode *inode = sb_dqopt(sb)->files[type]; > @@ -4837,7 +4931,12 @@ static int ext4_quota_off(struct super_block *sb, int type) > ext4_journal_stop(handle); > > out: > - return dquot_quota_off(sb, type); > + /* Disable only the limits if QUOTA feature is set. */ > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) > + return dquot_disable(sb, type, DQUOT_LIMITS_ENABLED); > + else > + return dquot_disable(sb, type, > + DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED); > } > > /* Read data from quotafile - avoid pagecache and such because we cannot afford > -- > 1.7.3.1 > >
On Thu, Nov 03, 2011 at 07:15:20PM -0700, Aditya Kali wrote: > +#ifdef CONFIG_QUOTA > + /* Enable quota usage during mount. */ > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA) && > + !(sb->s_flags & MS_RDONLY)) { > + ext4_quota_enable(sb, USRQUOTA, QFMT_VFS_V1, > + DQUOT_USAGE_ENABLED); > + ext4_quota_enable(sb, GRPQUOTA, QFMT_VFS_V1, > + DQUOT_USAGE_ENABLED); I think we should print an error message if one of the calls to ext4_quota_enable() failed. Space accounting in the quota files won't be accurate any more and e2fsck is required. > +static int ext4_quota_enable(struct super_block *sb, int type, int format_id, > + unsigned int flags) > +{ > + struct ext4_sb_info *sbi = EXT4_SB(sb); > + struct inode *qf_inode; > + int err; > + > + if (!sbi->s_qf_inums[type]) > + return -EPERM; > + > + qf_inode = ext4_iget(sb, sbi->s_qf_inums[type]); > + if (IS_ERR(qf_inode)) { > + ext4_error(sb, "Bad quota inode # %lu", sbi->s_qf_inums[type]); > + return PTR_ERR(qf_inode); > + } > + > + /* > + * When we journal data on quota file, we have to flush journal to see > + * all updates to the file when we bypass pagecache... > + */ > + if (sbi->s_journal && > + ext4_should_journal_data(qf_inode)) { > + /* > + * We don't need to lock updates but journal_flush() could > + * otherwise be livelocked... > + */ > + jbd2_journal_lock_updates(sbi->s_journal); > + err = jbd2_journal_flush(sbi->s_journal); > + jbd2_journal_unlock_updates(sbi->s_journal); > + if (err) > + return err; iput(qf_inode) is missing in this error path. Cheers, Johann -- To unsubscribe from this list: send the line "unsubscribe linux-ext4" in the body of a message to majordomo@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html
On Fri, Nov 04, 2011 at 10:43:10AM -0700, Aditya Kali wrote: > On Fri, Nov 4, 2011 at 2:20 AM, Johann Lombardi <johann@whamcloud.com> wrote: > > On Thu, Nov 03, 2011 at 07:15:20PM -0700, Aditya Kali wrote: > >> +#ifdef CONFIG_QUOTA > >> + /* Enable quota usage during mount. */ > >> + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA) && > >> + !(sb->s_flags & MS_RDONLY)) { > >> + ext4_quota_enable(sb, USRQUOTA, QFMT_VFS_V1, > >> + DQUOT_USAGE_ENABLED); > >> + ext4_quota_enable(sb, GRPQUOTA, QFMT_VFS_V1, > >> + DQUOT_USAGE_ENABLED); > > > > I think we should print an error message if one of the calls to ext4_quota_enable() failed. Space accounting in the quota files won't be accurate any more and e2fsck is required. > > Are you suggesting that we mark the filesystem has having errors if > this fails (use ext4_error() ) or simply print a warning in dmesg? A warning in dmesg is the least we could do IMHO. Marking the filesystem as having errors would be even better, i think. BTW, we have the same problem if CONFIG_QUOTA is not defined. > I am currently marking the filesystem as having errors if ext4_iget() > fails for the quota inode. But dquot_enable() could fail for other > reasons too (specially if we allow using user-specified quota files). Cheers, Johann -- To unsubscribe from this list: send the line "unsubscribe linux-ext4" in the body of a message to majordomo@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html
Thanks for the patch. I did a detailed review of it. I have quite some comments but all of them are easily fixable so I think we should be mostly ready in the next iteration. On Thu 03-11-11 19:15:20, Aditya Kali wrote: > +static const struct quotactl_ops ext4_new_qctl_operations = { ext4_new_qctl_operations is rather poor name. What if you need to create even newer set of operations in future? So I'd rather name them by "what they do" - so something like ext4_sysfile_qctl_operations - meaning that these operations handle quota stored in hidden system files. > + .quota_on_meta = ext4_quota_on_meta, > + .quota_off = ext4_quota_off, > + .quota_sync = dquot_quota_sync, > + .get_info = dquot_get_dqinfo, > + .set_info = dquot_set_dqinfo, > + .get_dqblk = dquot_get_dqblk, > + .set_dqblk = dquot_set_dqblk .. > @@ -3610,6 +3623,15 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent) > #ifdef CONFIG_QUOTA > sb->s_qcop = &ext4_qctl_operations; > sb->dq_op = &ext4_quota_operations; > + > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) { > + /* Use new qctl operations with quota on function that does not > + * require user specified quota file path. */ > + sb->s_qcop = &ext4_new_qctl_operations; > + > + sbi->s_qf_inums[USRQUOTA] = es->s_usr_quota_inum; > + sbi->s_qf_inums[GRPQUOTA] = es->s_grp_quota_inum; You need to convert from ondisk format here - i.e. use le32_to_cpu(). > + } > #endif > memcpy(sb->s_uuid, es->s_uuid, sizeof(es->s_uuid)); > > @@ -3815,8 +3837,21 @@ no_journal: > } else > descr = "out journal"; > > - ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. " > - "Opts: %s%s%s", descr, sbi->s_es->s_mount_opts, > +#ifdef CONFIG_QUOTA > + /* Enable quota usage during mount. */ > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA) && > + !(sb->s_flags & MS_RDONLY)) { > + ext4_quota_enable(sb, USRQUOTA, QFMT_VFS_V1, > + DQUOT_USAGE_ENABLED); > + ext4_quota_enable(sb, GRPQUOTA, QFMT_VFS_V1, > + DQUOT_USAGE_ENABLED); > + } You should check the return value here and fail the mount in case turning quotas on fails... Also you should set DQUOT_QUOTA_SYS_FILE in sb_dqopt(sb)->flags before calling ext4_quota_enable() to indicate that quota file is a hidden system file and generic quota code can then skip some rather costly steps during quota handling to keep user visible and kernel visible content in sync. > +#endif /* CONFIG_QUOTA */ > + > + ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. quota=%s. " > + "Opts: %s%s%s", descr, > + sb_any_quota_loaded(sb) ? "on" : "off", > + sbi->s_es->s_mount_opts, > *sbi->s_es->s_mount_opts ? "; " : "", orig_data); Should info about quotas really be in the message? After all it's just another feature and we definitely don't report all the features filesystem has set. > @@ -4183,6 +4218,12 @@ static int ext4_commit_super(struct super_block *sb, int sync) > es->s_free_inodes_count = > cpu_to_le32(percpu_counter_sum_positive( > &EXT4_SB(sb)->s_freeinodes_counter)); > +#ifdef CONFIG_QUOTA > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) { > + es->s_usr_quota_inum = EXT4_SB(sb)->s_qf_inums[USRQUOTA]; > + es->s_grp_quota_inum = EXT4_SB(sb)->s_qf_inums[GRPQUOTA]; > + } > +#endif Is there really need to reset these numbers? They should be stable during the whole lifetime of a filesystem, no (modulo changes by tune2fs)? If I'm missing something and numbers indeed can change, you should convert them to on disk format - i.e. cpu_to_le32(). > @@ -4814,6 +4855,59 @@ static int ext4_quota_on(struct super_block *sb, int type, int format_id, > return dquot_quota_on(sb, type, format_id, path); > } > > +static int ext4_quota_enable(struct super_block *sb, int type, int format_id, > + unsigned int flags) > +{ > + struct ext4_sb_info *sbi = EXT4_SB(sb); > + struct inode *qf_inode; > + int err; > + > + if (!sbi->s_qf_inums[type]) > + return -EPERM; > + > + qf_inode = ext4_iget(sb, sbi->s_qf_inums[type]); > + if (IS_ERR(qf_inode)) { > + ext4_error(sb, "Bad quota inode # %lu", sbi->s_qf_inums[type]); > + return PTR_ERR(qf_inode); > + } > + > + /* > + * When we journal data on quota file, we have to flush journal to see > + * all updates to the file when we bypass pagecache... > + */ > + if (sbi->s_journal && > + ext4_should_journal_data(qf_inode)) { > + /* > + * We don't need to lock updates but journal_flush() could > + * otherwise be livelocked... > + */ > + jbd2_journal_lock_updates(sbi->s_journal); > + err = jbd2_journal_flush(sbi->s_journal); > + jbd2_journal_unlock_updates(sbi->s_journal); > + if (err) > + return err; > + } Why do you have the above check? Since this function is called only for reserved quota inodes which are hidden, ext4_should_journal_data() will never be true for them. > + > + err = dquot_enable(qf_inode, type, format_id, flags); > + iput(qf_inode); > + > + return err; > +} > @@ -4837,7 +4931,12 @@ static int ext4_quota_off(struct super_block *sb, int type) > ext4_journal_stop(handle); > > out: > - return dquot_quota_off(sb, type); > + /* Disable only the limits if QUOTA feature is set. */ > + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) > + return dquot_disable(sb, type, DQUOT_LIMITS_ENABLED); > + else > + return dquot_disable(sb, type, > + DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED); > } Hmm, most of the work ext4_quota_off() does is unnecessary when quota is handled internally - there's no need to sync the filesystem, no need to update mtime or ctime... So I'd rather provide a new ext4_quota_off() function in case quota feature is enabled and that would just call dquot_disable(sb, type, DQUOT_LIMITS_ENABLED). Honza
Thanks for the feedback. I will address all the comments in next revision. Some comments inline: On Tue, Nov 8, 2011 at 5:55 AM, Jan Kara <jack@suse.cz> wrote: > Thanks for the patch. I did a detailed review of it. I have quite some > comments but all of them are easily fixable so I think we should be mostly > ready in the next iteration. > > On Thu 03-11-11 19:15:20, Aditya Kali wrote: >> +static const struct quotactl_ops ext4_new_qctl_operations = { > ext4_new_qctl_operations is rather poor name. What if you need to create > even newer set of operations in future? So I'd rather name them by "what > they do" - so something like ext4_sysfile_qctl_operations - meaning that these > operations handle quota stored in hidden system files. > >> + .quota_on_meta = ext4_quota_on_meta, >> + .quota_off = ext4_quota_off, >> + .quota_sync = dquot_quota_sync, >> + .get_info = dquot_get_dqinfo, >> + .set_info = dquot_set_dqinfo, >> + .get_dqblk = dquot_get_dqblk, >> + .set_dqblk = dquot_set_dqblk > .. >> @@ -3610,6 +3623,15 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent) >> #ifdef CONFIG_QUOTA >> sb->s_qcop = &ext4_qctl_operations; >> sb->dq_op = &ext4_quota_operations; >> + >> + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) { >> + /* Use new qctl operations with quota on function that does not >> + * require user specified quota file path. */ >> + sb->s_qcop = &ext4_new_qctl_operations; >> + >> + sbi->s_qf_inums[USRQUOTA] = es->s_usr_quota_inum; >> + sbi->s_qf_inums[GRPQUOTA] = es->s_grp_quota_inum; > You need to convert from ondisk format here - i.e. use le32_to_cpu(). > >> + } >> #endif >> memcpy(sb->s_uuid, es->s_uuid, sizeof(es->s_uuid)); >> >> @@ -3815,8 +3837,21 @@ no_journal: >> } else >> descr = "out journal"; >> >> - ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. " >> - "Opts: %s%s%s", descr, sbi->s_es->s_mount_opts, >> +#ifdef CONFIG_QUOTA >> + /* Enable quota usage during mount. */ >> + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA) && >> + !(sb->s_flags & MS_RDONLY)) { >> + ext4_quota_enable(sb, USRQUOTA, QFMT_VFS_V1, >> + DQUOT_USAGE_ENABLED); >> + ext4_quota_enable(sb, GRPQUOTA, QFMT_VFS_V1, >> + DQUOT_USAGE_ENABLED); >> + } > You should check the return value here and fail the mount in case turning > quotas on fails... Also you should set DQUOT_QUOTA_SYS_FILE in > sb_dqopt(sb)->flags before calling ext4_quota_enable() to indicate that > quota file is a hidden system file and generic quota code can then skip > some rather costly steps during quota handling to keep user visible and > kernel visible content in sync. > > >> +#endif /* CONFIG_QUOTA */ >> + >> + ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. quota=%s. " >> + "Opts: %s%s%s", descr, >> + sb_any_quota_loaded(sb) ? "on" : "off", >> + sbi->s_es->s_mount_opts, >> *sbi->s_es->s_mount_opts ? "; " : "", orig_data); > Should info about quotas really be in the message? After all it's just > another feature and we definitely don't report all the features filesystem > has set. > >> @@ -4183,6 +4218,12 @@ static int ext4_commit_super(struct super_block *sb, int sync) >> es->s_free_inodes_count = >> cpu_to_le32(percpu_counter_sum_positive( >> &EXT4_SB(sb)->s_freeinodes_counter)); >> +#ifdef CONFIG_QUOTA >> + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) { >> + es->s_usr_quota_inum = EXT4_SB(sb)->s_qf_inums[USRQUOTA]; >> + es->s_grp_quota_inum = EXT4_SB(sb)->s_qf_inums[GRPQUOTA]; >> + } >> +#endif > Is there really need to reset these numbers? They should be stable > during the whole lifetime of a filesystem, no (modulo changes by tune2fs)? > If I'm missing something and numbers indeed can change, you should convert > them to on disk format - i.e. cpu_to_le32(). > Currently tune2fs does not support enabling quota feature on mounted filesystem. (I think we should probably make it enable quotas on a read-only mount though). Even in that case, this is incorrect. I will remove this. >> @@ -4814,6 +4855,59 @@ static int ext4_quota_on(struct super_block *sb, int type, int format_id, >> return dquot_quota_on(sb, type, format_id, path); >> } >> >> +static int ext4_quota_enable(struct super_block *sb, int type, int format_id, >> + unsigned int flags) >> +{ >> + struct ext4_sb_info *sbi = EXT4_SB(sb); >> + struct inode *qf_inode; >> + int err; >> + >> + if (!sbi->s_qf_inums[type]) >> + return -EPERM; >> + >> + qf_inode = ext4_iget(sb, sbi->s_qf_inums[type]); >> + if (IS_ERR(qf_inode)) { >> + ext4_error(sb, "Bad quota inode # %lu", sbi->s_qf_inums[type]); >> + return PTR_ERR(qf_inode); >> + } >> + >> + /* >> + * When we journal data on quota file, we have to flush journal to see >> + * all updates to the file when we bypass pagecache... >> + */ >> + if (sbi->s_journal && >> + ext4_should_journal_data(qf_inode)) { >> + /* >> + * We don't need to lock updates but journal_flush() could >> + * otherwise be livelocked... >> + */ >> + jbd2_journal_lock_updates(sbi->s_journal); >> + err = jbd2_journal_flush(sbi->s_journal); >> + jbd2_journal_unlock_updates(sbi->s_journal); >> + if (err) >> + return err; >> + } > Why do you have the above check? Since this function is called only for > reserved quota inodes which are hidden, ext4_should_journal_data() will > never be true for them. > This inode could refer to a user-visible file if existing quota file was used by tune2fs. We will need to remove the journal flag on the inode if present at tune2fs time. >> + >> + err = dquot_enable(qf_inode, type, format_id, flags); >> + iput(qf_inode); >> + >> + return err; >> +} >> @@ -4837,7 +4931,12 @@ static int ext4_quota_off(struct super_block *sb, int type) >> ext4_journal_stop(handle); >> >> out: >> - return dquot_quota_off(sb, type); >> + /* Disable only the limits if QUOTA feature is set. */ >> + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) >> + return dquot_disable(sb, type, DQUOT_LIMITS_ENABLED); >> + else >> + return dquot_disable(sb, type, >> + DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED); >> } > Hmm, most of the work ext4_quota_off() does is unnecessary when quota is > handled internally - there's no need to sync the filesystem, no need to > update mtime or ctime... So I'd rather provide a new ext4_quota_off() > function in case quota feature is enabled and that would just call > dquot_disable(sb, type, DQUOT_LIMITS_ENABLED). > > Honza > -- > Jan Kara <jack@suse.cz> > SUSE Labs, CR >
diff --git a/fs/ext4/ext4.h b/fs/ext4/ext4.h index 5b0e26a..dccfe65 100644 --- a/fs/ext4/ext4.h +++ b/fs/ext4/ext4.h @@ -1170,6 +1170,7 @@ struct ext4_sb_info { #ifdef CONFIG_QUOTA char *s_qf_names[MAXQUOTAS]; /* Names of quota files with journalled quota */ int s_jquota_fmt; /* Format of quota to use */ + unsigned long s_qf_inums[MAXQUOTAS]; /* Quota file inodes */ #endif unsigned int s_want_extra_isize; /* New inodes should reserve # bytes */ struct rb_root system_blks; @@ -1269,6 +1270,8 @@ static inline struct timespec ext4_current_time(struct inode *inode) static inline int ext4_valid_inum(struct super_block *sb, unsigned long ino) { return ino == EXT4_ROOT_INO || + ino == EXT4_USR_QUOTA_INO || + ino == EXT4_GRP_QUOTA_INO || ino == EXT4_JOURNAL_INO || ino == EXT4_RESIZE_INO || (ino >= EXT4_FIRST_INO(sb) && @@ -1440,7 +1443,8 @@ static inline void ext4_clear_state_flags(struct ext4_inode_info *ei) EXT4_FEATURE_RO_COMPAT_EXTRA_ISIZE | \ EXT4_FEATURE_RO_COMPAT_BTREE_DIR |\ EXT4_FEATURE_RO_COMPAT_HUGE_FILE |\ - EXT4_FEATURE_RO_COMPAT_BIGALLOC) + EXT4_FEATURE_RO_COMPAT_BIGALLOC | \ + EXT4_FEATURE_RO_COMPAT_QUOTA) /* * Default values for user and/or group using reserved blocks diff --git a/fs/ext4/ext4_jbd2.h b/fs/ext4/ext4_jbd2.h index 5802fa1..45de190 100644 --- a/fs/ext4/ext4_jbd2.h +++ b/fs/ext4/ext4_jbd2.h @@ -87,14 +87,20 @@ #ifdef CONFIG_QUOTA /* Amount of blocks needed for quota update - we know that the structure was * allocated so we need to update only data block */ -#define EXT4_QUOTA_TRANS_BLOCKS(sb) (test_opt(sb, QUOTA) ? 1 : 0) +#define EXT4_QUOTA_TRANS_BLOCKS(sb) ((test_opt(sb, QUOTA) ||\ + EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) ?\ + 1 : 0) /* Amount of blocks needed for quota insert/delete - we do some block writes * but inode, sb and group updates are done only once */ -#define EXT4_QUOTA_INIT_BLOCKS(sb) (test_opt(sb, QUOTA) ? (DQUOT_INIT_ALLOC*\ - (EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)+3+DQUOT_INIT_REWRITE) : 0) - -#define EXT4_QUOTA_DEL_BLOCKS(sb) (test_opt(sb, QUOTA) ? (DQUOT_DEL_ALLOC*\ - (EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)+3+DQUOT_DEL_REWRITE) : 0) +#define EXT4_QUOTA_INIT_BLOCKS(sb) ((test_opt(sb, QUOTA) ||\ + EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) ?\ + (DQUOT_INIT_ALLOC*(EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)\ + +3+DQUOT_INIT_REWRITE) : 0) + +#define EXT4_QUOTA_DEL_BLOCKS(sb) ((test_opt(sb, QUOTA) ||\ + EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) ?\ + (DQUOT_DEL_ALLOC*(EXT4_SINGLEDATA_TRANS_BLOCKS(sb)-3)\ + +3+DQUOT_DEL_REWRITE) : 0) #else #define EXT4_QUOTA_TRANS_BLOCKS(sb) 0 #define EXT4_QUOTA_INIT_BLOCKS(sb) 0 diff --git a/fs/ext4/super.c b/fs/ext4/super.c index 9953d80..eb40645 100644 --- a/fs/ext4/super.c +++ b/fs/ext4/super.c @@ -1239,6 +1239,9 @@ static int ext4_mark_dquot_dirty(struct dquot *dquot); static int ext4_write_info(struct super_block *sb, int type); static int ext4_quota_on(struct super_block *sb, int type, int format_id, struct path *path); +static int ext4_quota_on_meta(struct super_block *sb, int type, int format_id); +static int ext4_quota_enable(struct super_block *sb, int type, int format_id, + unsigned int flags); static int ext4_quota_off(struct super_block *sb, int type); static int ext4_quota_on_mount(struct super_block *sb, int type); static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data, @@ -1266,6 +1269,16 @@ static const struct quotactl_ops ext4_qctl_operations = { .get_dqblk = dquot_get_dqblk, .set_dqblk = dquot_set_dqblk }; + +static const struct quotactl_ops ext4_new_qctl_operations = { + .quota_on_meta = ext4_quota_on_meta, + .quota_off = ext4_quota_off, + .quota_sync = dquot_quota_sync, + .get_info = dquot_get_dqinfo, + .set_info = dquot_set_dqinfo, + .get_dqblk = dquot_get_dqblk, + .set_dqblk = dquot_set_dqblk +}; #endif static const struct super_operations ext4_sops = { @@ -3610,6 +3623,15 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent) #ifdef CONFIG_QUOTA sb->s_qcop = &ext4_qctl_operations; sb->dq_op = &ext4_quota_operations; + + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) { + /* Use new qctl operations with quota on function that does not + * require user specified quota file path. */ + sb->s_qcop = &ext4_new_qctl_operations; + + sbi->s_qf_inums[USRQUOTA] = es->s_usr_quota_inum; + sbi->s_qf_inums[GRPQUOTA] = es->s_grp_quota_inum; + } #endif memcpy(sb->s_uuid, es->s_uuid, sizeof(es->s_uuid)); @@ -3815,8 +3837,21 @@ no_journal: } else descr = "out journal"; - ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. " - "Opts: %s%s%s", descr, sbi->s_es->s_mount_opts, +#ifdef CONFIG_QUOTA + /* Enable quota usage during mount. */ + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA) && + !(sb->s_flags & MS_RDONLY)) { + ext4_quota_enable(sb, USRQUOTA, QFMT_VFS_V1, + DQUOT_USAGE_ENABLED); + ext4_quota_enable(sb, GRPQUOTA, QFMT_VFS_V1, + DQUOT_USAGE_ENABLED); + } +#endif /* CONFIG_QUOTA */ + + ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. quota=%s. " + "Opts: %s%s%s", descr, + sb_any_quota_loaded(sb) ? "on" : "off", + sbi->s_es->s_mount_opts, *sbi->s_es->s_mount_opts ? "; " : "", orig_data); if (es->s_error_count) @@ -4183,6 +4218,12 @@ static int ext4_commit_super(struct super_block *sb, int sync) es->s_free_inodes_count = cpu_to_le32(percpu_counter_sum_positive( &EXT4_SB(sb)->s_freeinodes_counter)); +#ifdef CONFIG_QUOTA + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) { + es->s_usr_quota_inum = EXT4_SB(sb)->s_qf_inums[USRQUOTA]; + es->s_grp_quota_inum = EXT4_SB(sb)->s_qf_inums[GRPQUOTA]; + } +#endif sb->s_dirt = 0; BUFFER_TRACE(sbh, "marking dirty"); mark_buffer_dirty(sbh); @@ -4775,7 +4816,7 @@ static int ext4_quota_on_mount(struct super_block *sb, int type) * Standard function to be called on quota_on */ static int ext4_quota_on(struct super_block *sb, int type, int format_id, - struct path *path) + struct path *path) { int err; @@ -4814,6 +4855,59 @@ static int ext4_quota_on(struct super_block *sb, int type, int format_id, return dquot_quota_on(sb, type, format_id, path); } +static int ext4_quota_enable(struct super_block *sb, int type, int format_id, + unsigned int flags) +{ + struct ext4_sb_info *sbi = EXT4_SB(sb); + struct inode *qf_inode; + int err; + + if (!sbi->s_qf_inums[type]) + return -EPERM; + + qf_inode = ext4_iget(sb, sbi->s_qf_inums[type]); + if (IS_ERR(qf_inode)) { + ext4_error(sb, "Bad quota inode # %lu", sbi->s_qf_inums[type]); + return PTR_ERR(qf_inode); + } + + /* + * When we journal data on quota file, we have to flush journal to see + * all updates to the file when we bypass pagecache... + */ + if (sbi->s_journal && + ext4_should_journal_data(qf_inode)) { + /* + * We don't need to lock updates but journal_flush() could + * otherwise be livelocked... + */ + jbd2_journal_lock_updates(sbi->s_journal); + err = jbd2_journal_flush(sbi->s_journal); + jbd2_journal_unlock_updates(sbi->s_journal); + if (err) + return err; + } + + err = dquot_enable(qf_inode, type, format_id, flags); + iput(qf_inode); + + return err; +} + +/* + * New quota_on function that is used when QUOTA feature is set. + */ +static int ext4_quota_on_meta(struct super_block *sb, int type, int format_id) +{ + if (!EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) + return -EINVAL; + + /* + * USAGE was enabled at mount time. Only need to enable LIMITS now. + */ + return ext4_quota_enable(sb, type, format_id, DQUOT_LIMITS_ENABLED); +} + static int ext4_quota_off(struct super_block *sb, int type) { struct inode *inode = sb_dqopt(sb)->files[type]; @@ -4837,7 +4931,12 @@ static int ext4_quota_off(struct super_block *sb, int type) ext4_journal_stop(handle); out: - return dquot_quota_off(sb, type); + /* Disable only the limits if QUOTA feature is set. */ + if (EXT4_HAS_RO_COMPAT_FEATURE(sb, EXT4_FEATURE_RO_COMPAT_QUOTA)) + return dquot_disable(sb, type, DQUOT_LIMITS_ENABLED); + else + return dquot_disable(sb, type, + DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED); } /* Read data from quotafile - avoid pagecache and such because we cannot afford
This patch is an attempt towards supporting quotas as first class feature in ext4. It is based on the proposal at: https://ext4.wiki.kernel.org/index.php/Design_For_1st_Class_Quota_in_Ext4 This patch introduces a new feature - EXT4_FEATURE_RO_COMPAT_QUOTA which, when turned on, enables quota accounting at mount time iteself. Also, the quota inodes are stored in two additional superblock fields. Some changes introduced by this patch that should be pointed out are: 1) Two new ext4-superblock fields - s_usr_quota_inum and s_grp_quota_inum for storing the quota inodes in use. 2) Default quota inodes are: inode#3 for tracking userquota and inode#4 for tracking group quota. The superblock fields can be set to use other inodes as well. 3) If the QUOTA feature and corresponding quota inodes are set in superblock, the quota usage tracking is turned on at mount time. On 'quotaon' ioctl, the quota limits enforcement is turned on. 'quotaoff' ioctl turns off only the limits enforcement in this case. 4) When QUOTA feature is in use, the quota mount options 'quota', 'usrquota', 'grpquota' are ignored by the kernel.. 5) mke2fs or tune2fs can be used to set the QUOTA feature and initialize quota inodes. The default reserved inodes will not be visible to user as regular files. 6) The quota-tools will need to be modified to support hidden quota files on ext4. E2fsprogs will also include support for creating and fixing quota files. 7) Support is only for the new V2 quota file format. Signed-off-by: Aditya Kali <adityakali@google.com> --- fs/ext4/ext4.h | 6 ++- fs/ext4/ext4_jbd2.h | 18 ++++++--- fs/ext4/super.c | 107 +++++++++++++++++++++++++++++++++++++++++++++++++-- 3 files changed, 120 insertions(+), 11 deletions(-)