On Tue, Jan 21, 2014 at 11:45:17AM -0700, Andreas Dilger wrote: > On Jan 20, 2014, at 11:17 PM, Theodore Ts'o <tytso@xxxxxxx> wrote: > > This feature is enabled via settings in /etc/mke2fs.conf. For > > example: > > > > hugefile = { > > features = extent,huge_file,flex_bg,uninit_bg,dir_nlink,extra_isize,^resize_inode,sparse_super2 > > inode_size = 128 > > packed_meta_blocks = 1 > > make_hugefiles = 1 > > inode_ratio = 4194304 > > hugefiles_dir = /database > > hugefiles_uid = 120 > > hugefiles_gid = 50 > > hugefiles_name = storage > > hugefiles_digits = 4 > > hugefile_size = 1G > > num_hugefiles = 0 > > } > > > > Then "mke2fs -T hugefile /dev/sdXX" will create as many 1G files > > needed to fill the file system. > > How is this different from using fallocate to allocate the files? > Is this just to create a test image for e2fsck or similar? It > might make sense to include f_hugefiles/script and expect.1 for it? Maybe the author of the patches circulating to turn mke2fs into a 'format-and-populate' utility might have an opinion here? :) I'd adapt fuse2fs to use a ext2fs_fallocate function, if one existed. That said, it would have to be more general than this, handling the case where there might be blocks mapped. Hey Ted, if I wrote an ext2fs_fallocate, would you adapt this for it? --D > > Cheers, Andreas > > > Signed-off-by: "Theodore Ts'o" <tytso@xxxxxxx> > > --- > > > > This is an enhancement to mke2fs which I developed for a use case at > > work, where it is convenient to create a set of pre-allocated files > > which use all or most of the space in the file system. I've tried to > > make it to be as general as possible, but I'm still considering whether > > it's appropriate to include this in the e2fprogs sources, perhaps under > > a configure --enable-make-hugefiles option or some such. Nearly all of > > the new code is in a separate file for ease of maintenance. > > > > > > misc/Makefile.in | 3 +- > > misc/mk_hugefiles.c | 385 ++++++++++++++++++++++++++++++++++++++++++++++++++ > > misc/mke2fs.c | 21 +-- > > misc/mke2fs.conf.5.in | 45 ++++++ > > misc/mke2fs.h | 29 ++++ > > 5 files changed, 474 insertions(+), 9 deletions(-) > > create mode 100644 misc/mk_hugefiles.c > > create mode 100644 misc/mke2fs.h > > > > diff --git a/misc/Makefile.in b/misc/Makefile.in > > index 8342940..c5f332b 100644 > > --- a/misc/Makefile.in > > +++ b/misc/Makefile.in > > @@ -42,7 +42,8 @@ LPROGS= @E2INITRD_PROG@ > > > > TUNE2FS_OBJS= tune2fs.o util.o > > MKLPF_OBJS= mklost+found.o > > -MKE2FS_OBJS= mke2fs.o util.o profile.o prof_err.o default_profile.o > > +MKE2FS_OBJS= mke2fs.o util.o profile.o prof_err.o default_profile.o \ > > + mk_hugefiles.o > > CHATTR_OBJS= chattr.o > > LSATTR_OBJS= lsattr.o > > UUIDGEN_OBJS= uuidgen.o > > diff --git a/misc/mk_hugefiles.c b/misc/mk_hugefiles.c > > new file mode 100644 > > index 0000000..c43a2b0 > > --- /dev/null > > +++ b/misc/mk_hugefiles.c > > @@ -0,0 +1,385 @@ > > +/* > > + * mk_hugefiles.c -- create huge files > > + */ > > + > > +#define _XOPEN_SOURCE 600 /* for inclusion of PATH_MAX in Solaris */ > > + > > +#include "config.h" > > +#include <stdio.h> > > +#include <string.h> > > +#include <strings.h> > > +#include <fcntl.h> > > +#include <ctype.h> > > +#include <time.h> > > +#ifdef __linux__ > > +#include <sys/utsname.h> > > +#endif > > +#ifdef HAVE_GETOPT_H > > +#include <getopt.h> > > +#else > > +extern char *optarg; > > +extern int optind; > > +#endif > > +#ifdef HAVE_UNISTD_H > > +#include <unistd.h> > > +#endif > > +#ifdef HAVE_STDLIB_H > > +#include <stdlib.h> > > +#endif > > +#ifdef HAVE_ERRNO_H > > +#include <errno.h> > > +#endif > > +#include <sys/ioctl.h> > > +#include <sys/types.h> > > +#include <sys/stat.h> > > +#include <libgen.h> > > +#include <limits.h> > > +#include <blkid/blkid.h> > > + > > +#include "ext2fs/ext2_fs.h" > > +#include "ext2fs/ext2fsP.h" > > +#include "et/com_err.h" > > +#include "uuid/uuid.h" > > +#include "e2p/e2p.h" > > +#include "ext2fs/ext2fs.h" > > +#include "util.h" > > +#include "profile.h" > > +#include "prof_err.h" > > +#include "nls-enable.h" > > +#include "mke2fs.h" > > + > > +static int uid; > > +static int gid; > > +static blk64_t num_blocks; > > +static blk64_t num_slack; > > +static unsigned long num_files; > > +static blk64_t goal; > > +static char *fn_prefix; > > +static int idx_digits; > > +static char *fn_buf; > > +static char *fn_numbuf; > > + > > +static errcode_t create_directory(ext2_filsys fs, char *dir, > > + ext2_ino_t *ret_ino) > > + > > +{ > > + struct ext2_inode inode; > > + ext2_ino_t ino = EXT2_ROOT_INO; > > + ext2_ino_t newdir; > > + errcode_t retval; > > + char *fn, *cp, *next; > > + > > + fn = malloc(strlen(dir) + 1); > > + if (fn == NULL) > > + return ENOMEM; > > + > > + strcpy(fn, dir); > > + cp = fn; > > + while(1) { > > + next = strchr(cp, '/'); > > + if (next) > > + *next++ = 0; > > + if (*cp) { > > + retval = ext2fs_new_inode(fs, ino, LINUX_S_IFDIR, > > + NULL, &newdir); > > + if (retval) > > + goto errout; > > + > > + retval = ext2fs_mkdir(fs, ino, newdir, cp); > > + if (retval) > > + goto errout; > > + > > + ino = newdir; > > + retval = ext2fs_read_inode(fs, ino, &inode); > > + if (retval) > > + goto errout; > > + > > + inode.i_uid = uid & 0xFFFF; > > + ext2fs_set_i_uid_high(inode, (uid >> 16) & 0xffff); > > + inode.i_gid = gid & 0xFFFF; > > + ext2fs_set_i_gid_high(inode, (gid >> 16) & 0xffff); > > + retval = ext2fs_write_inode(fs, ino, &inode); > > + if (retval) > > + goto errout; > > + } > > + if (next == NULL || *next == '\0') > > + break; > > + cp = next; > > + } > > +errout: > > + free(fn); > > + if (retval == 0) > > + *ret_ino = ino; > > + return retval; > > +} > > + > > +static errcode_t mk_hugefile(ext2_filsys fs, blk64_t num, > > + ext2_ino_t dir, int idx, ext2_ino_t *ino) > > + > > +{ > > + errcode_t retval; > > + blk64_t lblk, blk, bend; > > + __u64 size; > > + blk64_t left; > > + blk64_t count = 0; > > + struct ext2_inode inode; > > + ext2_extent_handle_t handle; > > + > > + retval = ext2fs_new_inode(fs, 0, LINUX_S_IFREG, NULL, ino); > > + if (retval) > > + return retval; > > + > > + memset(&inode, 0, sizeof(struct ext2_inode)); > > + inode.i_mode = LINUX_S_IFREG | (0666 & ~fs->umask); > > + inode.i_links_count = 1; > > + inode.i_uid = uid & 0xFFFF; > > + ext2fs_set_i_uid_high(inode, (uid >> 16) & 0xffff); > > + inode.i_gid = gid & 0xFFFF; > > + ext2fs_set_i_gid_high(inode, (gid >> 16) & 0xffff); > > + > > + retval = ext2fs_write_new_inode(fs, *ino, &inode); > > + if (retval) > > + return retval; > > + > > + ext2fs_inode_alloc_stats2(fs, *ino, +1, 0); > > + > > + retval = ext2fs_extent_open2(fs, *ino, &inode, &handle); > > + if (retval) > > + return retval; > > + > > + lblk = 0; > > + left = num ? num : 1; > > + while (left) { > > + blk64_t pblk, end; > > + blk64_t n = left; > > + > > + retval = ext2fs_find_first_zero_block_bitmap2(fs->block_map, > > + goal, ext2fs_blocks_count(fs->super) - 1, &end); > > + if (retval) > > + return ENOSPC; > > + goal = end; > > + > > + retval = ext2fs_find_first_set_block_bitmap2(fs->block_map, goal, > > + ext2fs_blocks_count(fs->super) - 1, &bend); > > + if (retval == ENOENT) { > > + bend = ext2fs_blocks_count(fs->super); > > + if (num == 0) > > + left = 0; > > + } > > + if (!num || bend - goal < left) > > + n = bend - goal; > > + pblk = goal; > > + if (num) > > + left -= n; > > + goal += n; > > + count += n; > > + ext2fs_block_alloc_stats_range(fs, pblk, n, +1); > > + > > + while (n) { > > + blk64_t l = n; > > + struct ext2fs_extent newextent; > > + > > + if (l > EXT_INIT_MAX_LEN) > > + l = EXT_INIT_MAX_LEN; > > + > > + newextent.e_len = l; > > + newextent.e_pblk = pblk; > > + newextent.e_lblk = lblk; > > + newextent.e_flags = 0; > > + > > + retval = ext2fs_extent_insert(handle, > > + EXT2_EXTENT_INSERT_AFTER, &newextent); > > + if (retval) > > + return retval; > > + pblk += l; > > + lblk += l; > > + n -= l; > > + } > > + } > > + > > + retval = ext2fs_read_inode(fs, *ino, &inode); > > + if (retval) > > + goto errout; > > + > > + retval = ext2fs_iblk_add_blocks(fs, &inode, > > + count / EXT2FS_CLUSTER_RATIO(fs)); > > + if (retval) > > + goto errout; > > + size = (__u64) count * fs->blocksize; > > + inode.i_size = size & 0xffffffff; > > + inode.i_size_high = (size >> 32); > > + > > + retval = ext2fs_write_new_inode(fs, *ino, &inode); > > + if (retval) > > + goto errout; > > + > > + if (idx_digits) > > + sprintf(fn_numbuf, "%0*d", idx_digits, idx); > > + else if (num_files > 1) > > + sprintf(fn_numbuf, "%d", idx); > > + > > +retry: > > + retval = ext2fs_link(fs, dir, fn_buf, *ino, EXT2_FT_REG_FILE); > > + if (retval == EXT2_ET_DIR_NO_SPACE) { > > + retval = ext2fs_expand_dir(fs, dir); > > + if (retval) > > + goto errout; > > + goto retry; > > + } > > + > > + if (retval) > > + goto errout; > > + > > +errout: > > + if (handle) > > + ext2fs_extent_free(handle); > > + > > + return retval; > > +} > > + > > +static blk64_t calc_overhead(ext2_filsys fs, blk64_t num_blocks) > > +{ > > + blk64_t e_blocks, e_blocks2, e_blocks3, e_blocks4; > > + int extents_per_block; > > + int extents = (num_blocks + EXT_INIT_MAX_LEN - 1) / EXT_INIT_MAX_LEN; > > + > > + if (extents <= 4) > > + return 0; > > + > > + /* > > + * This calculation is due to the fact that we are inefficient > > + * in how handle extent splits when appending to the end of > > + * the extent tree. Sigh. We should fix this so that we can > > + * actually store 340 extents per 4k block, instead of only 170. > > + */ > > + extents_per_block = ((fs->blocksize - > > + sizeof(struct ext3_extent_header)) / > > + sizeof(struct ext3_extent)); > > + extents_per_block = (extents_per_block/ 2) - 1; > > + > > + e_blocks = (extents + extents_per_block - 1) / extents_per_block; > > + e_blocks2 = (e_blocks + extents_per_block - 1) / extents_per_block; > > + e_blocks3 = (e_blocks2 + extents_per_block - 1) / extents_per_block; > > + e_blocks4 = (e_blocks3 + extents_per_block - 1) / extents_per_block; > > + return e_blocks + e_blocks2 + e_blocks3 + e_blocks4; > > +} > > + > > +/* > > + * Find the place where we should start allocating blocks for the huge > > + * files. Leave <slack> free blocks at the beginning of the file > > + * system for things like metadata blocks. > > + */ > > +static blk64_t get_start_block(ext2_filsys fs, blk64_t slack) > > +{ > > + errcode_t retval; > > + blk64_t goal = fs->super->s_first_data_block, next; > > + blk64_t last_blk = ext2fs_blocks_count(fs->super) - 1; > > + > > + while (slack) { > > + retval = ext2fs_find_first_zero_block_bitmap2(fs->block_map, > > + goal, last_blk, &goal); > > + if (retval) > > + break; > > + > > + retval = ext2fs_find_first_set_block_bitmap2(fs->block_map, > > + goal, last_blk, &next); > > + if (retval) > > + next = last_blk; > > + next--; > > + > > + if (next - goal > slack) { > > + goal += slack; > > + break; > > + } > > + > > + slack -= (next - goal); > > + goal = next; > > + } > > + return goal; > > +} > > + > > +errcode_t mk_hugefiles(ext2_filsys fs) > > +{ > > + errcode_t retval; > > + ext2_ino_t dir; > > + int i; > > + char *t; > > + > > + if (!get_bool_from_profile(fs_types, "make_hugefiles", 0)) > > + return 0; > > + > > + uid = get_int_from_profile(fs_types, "hugefiles_uid", 0); > > + gid = get_int_from_profile(fs_types, "hugefiles_gid", 0); > > + fs->umask = get_int_from_profile(fs_types, "hugefiles_umask", 077); > > + num_files = get_int_from_profile(fs_types, "num_hugefiles", 0); > > + t = get_string_from_profile(fs_types, "hugefiles_slack", "1M"); > > + num_slack = parse_num_blocks2(t, fs->super->s_log_block_size); > > + t = get_string_from_profile(fs_types, "hugefiles_size", "0"); > > + num_blocks = parse_num_blocks2(t, fs->super->s_log_block_size); > > + > > + retval = create_directory(fs, get_string_from_profile(fs_types, > > + "hugefiles_dir", "/"), &dir); > > + if (retval) > > + return dir; > > + > > + if (num_blocks == 0 && num_files == 0) > > + num_files = 1; > > + > > + if (num_files == 0 && num_blocks) { > > + blk64_t fs_blocks = ext2fs_free_blocks_count(fs->super); > > + > > + fs_blocks -= num_slack; > > + num_files = fs_blocks / num_blocks; > > + fs_blocks -= (num_files / 16) + 1; > > + fs_blocks -= calc_overhead(fs, num_blocks) * num_files; > > + num_files = fs_blocks / num_blocks; > > + } > > + > > + if (num_blocks == 0 && num_files > 1) { > > + blk64_t fs_blocks = ext2fs_free_blocks_count(fs->super); > > + > > + fs_blocks -= num_slack; > > + num_blocks = fs_blocks / num_files; > > + > > + fs_blocks -= calc_overhead(fs, num_blocks) * num_files; > > + fs_blocks -= num_slack; > > + num_blocks = fs_blocks / num_files; > > + printf("Using num_blocks %llu\n", num_blocks); > > + } > > + > > + num_slack += calc_overhead(fs, num_blocks) * num_files; > > + num_slack += (num_files / 16) + 1; /* space for dir entries */ > > + goal = get_start_block(fs, num_slack); > > + > > + fn_prefix = get_string_from_profile(fs_types, "hugefiles_name", > > + "hugefile"); > > + idx_digits = get_int_from_profile(fs_types, "hugefiles_digits", 5); > > + i = int_log10(num_files) + 1; > > + if (idx_digits > i) > > + i = idx_digits; > > + fn_buf = malloc(strlen(fn_prefix) + i + 1); > > + if (!fn_buf) > > + return ENOMEM; > > + strcpy(fn_buf, fn_prefix); > > + fn_numbuf = fn_buf + strlen(fn_prefix); > > + > > + if (!quiet) { > > + printf(_("Creating %d huge file(s) "), num_files); > > + if (num_blocks) > > + printf(_("with %llu blocks each"), num_blocks); > > + fputc('\n', stdout); > > + } > > + for (i=0; i < num_files; i++) { > > + ext2_ino_t ino; > > + > > + retval = mk_hugefile(fs, num_blocks, dir, i, &ino); > > + if (retval) { > > + com_err(program_name, retval, > > + _("while creating huge file %d"), i); > > + goto errout; > > + } > > + } > > +errout: > > + free(fn_buf); > > + return retval; > > +} > > diff --git a/misc/mke2fs.c b/misc/mke2fs.c > > index e798648..9d7673f 100644 > > --- a/misc/mke2fs.c > > +++ b/misc/mke2fs.c > > @@ -62,6 +62,7 @@ extern int optind; > > #include "../version.h" > > #include "nls-enable.h" > > #include "quota/mkquota.h" > > +#include "mke2fs.h" > > > > #define STRIDE_LENGTH 8 > > > > @@ -76,13 +77,13 @@ extern int optind; > > extern int isatty(int); > > extern FILE *fpopen(const char *cmd, const char *mode); > > > > -static const char * program_name = "mke2fs"; > > +const char * program_name = "mke2fs"; > > static const char * device_name /* = NULL */; > > > > /* Command line options */ > > static int cflag; > > -static int verbose; > > -static int quiet; > > +int verbose; > > +int quiet; > > static int super_only; > > static int discard = 1; /* attempt to discard device before fs creation */ > > static int direct_io; > > @@ -107,7 +108,7 @@ static char *volume_label; > > static char *mount_dir; > > char *journal_device; > > static int sync_kludge; /* Set using the MKE2FS_SYNC env. option */ > > -static char **fs_types; > > +char **fs_types; > > > > static profile_t profile; > > > > @@ -142,7 +143,7 @@ static int int_log2(unsigned long long arg) > > return l; > > } > > > > -static int int_log10(unsigned long long arg) > > +int int_log10(unsigned long long arg) > > { > > int l; > > > > @@ -1253,7 +1254,7 @@ static char **parse_fs_type(const char *fs_type, > > return (list.list); > > } > > > > -static char *get_string_from_profile(char **types, const char *opt, > > +char *get_string_from_profile(char **types, const char *opt, > > const char *def_val) > > { > > char *ret = 0; > > @@ -1270,7 +1271,7 @@ static char *get_string_from_profile(char **types, const char *opt, > > return (ret); > > } > > > > -static int get_int_from_profile(char **types, const char *opt, int def_val) > > +int get_int_from_profile(char **types, const char *opt, int def_val) > > { > > int ret; > > char **cpp; > > @@ -1293,7 +1294,7 @@ static double get_double_from_profile(char **types, const char *opt, > > return ret; > > } > > > > -static int get_bool_from_profile(char **types, const char *opt, int def_val) > > +int get_bool_from_profile(char **types, const char *opt, int def_val) > > { > > int ret; > > char **cpp; > > @@ -2847,6 +2848,10 @@ no_journal: > > EXT4_FEATURE_RO_COMPAT_QUOTA)) > > create_quota_inodes(fs); > > > > + retval = mk_hugefiles(fs); > > + if (retval) > > + com_err(program_name, retval, "while creating huge files"); > > + > > if (!quiet) > > printf("%s", _("Writing superblocks and " > > "filesystem accounting information: ")); > > diff --git a/misc/mke2fs.conf.5.in b/misc/mke2fs.conf.5.in > > index 1aba87b..8f628a7 100644 > > --- a/misc/mke2fs.conf.5.in > > +++ b/misc/mke2fs.conf.5.in > > @@ -417,6 +417,51 @@ system feature is enabled. It can be overridden via the > > .B \-C > > command line option to > > .BR mke2fs (8) > > +.TP > > +.I make_hugefiles > > +This boolean relation enables the creation of pre-allocated files as > > +part of formatting the file system. > > +.TP > > +.I hugefiles_uid > > +This relation controls the user ownership for all of the files and > > +directories created by the > > +.I make_hugefiles > > +feature. > > +.TP > > +.I hugefiles_gid > > +This relation controls the group ownership for all of the files and > > +directories created by the > > +.I make_hugefiles > > +feature. > > +.TP > > +.I hugefiles_umask > > +This relation specifies the umask used when creating the files and > > +directories by the > > +.I make_hugefiles > > +feature. > > +.TP > > +.I num_hugefiles > > +This relation specifies the number of huge files to be created. If this > > +relation is not specified, or is set to zero, and the > > +.I hugefiles_size > > +relation is non-zero, then > > +.I make_hugefiles > > +will create as many huge files as can fit to fill the entire file system. > > +.TP > > +.I hugefiles_slack > > +This relation specifies how much space should be reserved for other > > +files. > > +.TP > > +.I hugefiles_size > > +This relation specifies the size of the huge files. If this relation is > > +not specified, the default is to fill th efile system. > > +.TP > > +.I hugefiles_name > > +This relation specifies the base file name for the huge files. > > +.TP > > +.I hugefiles_digits > > +This relation specifies the (zero-padded) width of the field for the > > +huge file number. > > .SH THE [devices] STANZA > > Each tag in the > > .I [devices] > > diff --git a/misc/mke2fs.h b/misc/mke2fs.h > > new file mode 100644 > > index 0000000..73d8c71 > > --- /dev/null > > +++ b/misc/mke2fs.h > > @@ -0,0 +1,29 @@ > > +/* > > + * mke2fs.h > > + * > > + * Copyright (C) 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, > > + * 2003, 2004, 2005 by Theodore Ts'o. > > + * > > + * %Begin-Header% > > + * This file may be redistributed under the terms of the GNU Public > > + * License. > > + * %End-Header% > > + */ > > + > > +/* mke2fs.c */ > > +extern const char * program_name; > > +extern int quiet; > > +extern int verbose; > > +extern char **fs_types; > > + > > +extern char *get_string_from_profile(char **types, const char *opt, > > + const char *def_val); > > +extern int get_int_from_profile(char **types, const char *opt, int def_val); > > +extern int get_bool_from_profile(char **types, const char *opt, int def_val); > > +extern int int_log10(unsigned long long arg); > > + > > +/* mk_hugefiles.c */ > > +extern errcode_t mk_hugefiles(ext2_filsys fs); > > + > > + > > + > > -- > > 1.8.5.rc3.362.gdf10213 > > > > -- > > To unsubscribe from this list: send the line "unsubscribe linux-ext4" in > > the body of a message to majordomo@xxxxxxxxxxxxxxx > > More majordomo info at http://vger.kernel.org/majordomo-info.html > > > Cheers, Andreas > > > > > -- To unsubscribe from this list: send the line "unsubscribe linux-ext4" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html