From: Gerrit Huizenga Updates CKRM Resource Control Filesystem (rcfs) to include full directory structure support. This is the user level API for managing CKRM. Signed-Off-By: Chandra Seetharaman Signed-Off-By: Hubertus Franke Signed-Off-By: Shailabh Nagar Signed-Off-By: Vivek Kashyap Signed-Off-By: Gerrit Huizenga Signed-off-by: Nishanth Aravamudan Signed-off-by: Andrew Morton --- fs/Makefile | 1 fs/rcfs/Makefile | 7 fs/rcfs/dir.c | 220 +++++++++++++++++++++ fs/rcfs/inode.c | 160 +++++++++++++++ fs/rcfs/magic.c | 517 +++++++++++++++++++++++++++++++++++++++++++++++++++ fs/rcfs/rootdir.c | 198 +++++++++++++++++++ fs/rcfs/super.c | 291 ++++++++++++++++++++++++++++ include/linux/rcfs.h | 20 + init/Kconfig | 10 9 files changed, 1417 insertions(+), 7 deletions(-) diff -puN fs/Makefile~ckrm-resource-control-file-system-rcfs fs/Makefile --- 25/fs/Makefile~ckrm-resource-control-file-system-rcfs Wed Jul 13 14:43:50 2005 +++ 25-akpm/fs/Makefile Wed Jul 13 14:43:50 2005 @@ -95,6 +95,7 @@ obj-$(CONFIG_JFS_FS) += jfs/ obj-$(CONFIG_XFS_FS) += xfs/ obj-$(CONFIG_AFS_FS) += afs/ obj-$(CONFIG_BEFS_FS) += befs/ +obj-$(CONFIG_RCFS_FS) += rcfs/ obj-$(CONFIG_HOSTFS) += hostfs/ obj-$(CONFIG_HPPFS) += hppfs/ obj-$(CONFIG_DEBUG_FS) += debugfs/ diff -puN /dev/null fs/rcfs/dir.c --- /dev/null Thu Apr 11 07:25:15 2002 +++ 25-akpm/fs/rcfs/dir.c Wed Jul 13 14:43:50 2005 @@ -0,0 +1,220 @@ +/* + * fs/rcfs/dir.c + * + * Copyright (C) Shailabh Nagar, IBM Corp. 2004 + * Vivek Kashyap, IBM Corp. 2004 + * + * + * Directory operations for rcfs + * + * Latest version, more details at http://ckrm.sf.net + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the version 2 of the GNU General Public License + * as published by the Free Software Foundation. + * + */ + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +#define rcfs_positive(dentry) ((dentry)->d_inode && !d_unhashed((dentry))) + +int rcfs_empty(struct dentry *dentry) +{ + struct dentry *child; + int ret = 0; + + spin_lock(&dcache_lock); + list_for_each_entry(child, &dentry->d_subdirs, d_child) + if (!rcfs_is_magic(child) && rcfs_positive(child)) + goto out; + ret = 1; +out: + spin_unlock(&dcache_lock); + return ret; +} + +/* Directory inode operations */ + +int rcfs_create_coredir(struct inode *dir, struct dentry *dentry) +{ + + struct rcfs_inode_info *ripar, *ridir; + int sz; + + ripar = rcfs_get_inode_info(dir); + ridir = rcfs_get_inode_info(dentry->d_inode); + /* Inform resource controllers - do Core operations */ + if (ckrm_is_core_valid(ripar->core)) { + sz = strlen(ripar->name) + strlen(dentry->d_name.name) + 2; + ridir->name = kmalloc(sz, GFP_KERNEL); + if (!ridir->name) { + return -ENOMEM; + } + snprintf(ridir->name, sz, "%s/%s", ripar->name, + dentry->d_name.name); + ridir->core = (*(ripar->core->classtype->alloc)) + (ripar->core, ridir->name); + } else { + printk(KERN_ERR "rcfs_mkdir: Invalid parent core %p\n", + ripar->core); + return -EINVAL; + } + + return 0; +} + +int rcfs_mkdir(struct inode *dir, struct dentry *dentry, int mode) +{ + + int retval = 0; + struct ckrm_classtype *clstype; + + if (rcfs_mknod(dir, dentry, mode | S_IFDIR, 0)) { + printk(KERN_ERR "rcfs_mkdir: error in rcfs_mknod\n"); + return retval; + } + dir->i_nlink++; + /* Inherit parent's ops since rcfs_mknod assigns noperm ops. */ + dentry->d_inode->i_op = dir->i_op; + dentry->d_inode->i_fop = dir->i_fop; + retval = rcfs_create_coredir(dir, dentry); + if (retval) { + simple_rmdir(dir, dentry); + return retval; + } + /* create the default set of magic files */ + clstype = (rcfs_get_inode_info(dentry->d_inode))->core->classtype; + rcfs_create_magic(dentry, &(((struct rcfs_magf *)clstype->mfdesc)[1]), + clstype->mfcount - 3); + return retval; +} + +int rcfs_rmdir(struct inode *dir, struct dentry *dentry) +{ + struct rcfs_inode_info *ri = rcfs_get_inode_info(dentry->d_inode); + + if (!rcfs_empty(dentry)) { + printk(KERN_ERR "rcfs_rmdir: directory not empty\n"); + return -ENOTEMPTY; + } + /* Core class removal */ + + if (ri->core == NULL) { + printk(KERN_ERR "rcfs_rmdir: core==NULL\n"); + /* likely a race condition */ + return 0; + } + + if ((*(ri->core->classtype->free)) (ri->core)) { + printk(KERN_ERR "rcfs_rmdir: ckrm_free_core_class failed\n"); + goto out; + } + ri->core = NULL; /* just to be safe */ + + /* Clear magic files only after core successfully removed */ + rcfs_clear_magic(dentry); + + return simple_rmdir(dir, dentry); + +out: + return -EBUSY; +} + +int rcfs_unlink(struct inode *dir, struct dentry *dentry) +{ + /* + * -ENOENT and not -ENOPERM to allow rm -rf to work despite + * magic files being present + */ + return -ENOENT; +} + +/* rename is allowed on directories only */ +int +rcfs_rename(struct inode *old_dir, struct dentry *old_dentry, + struct inode *new_dir, struct dentry *new_dentry) +{ + if (S_ISDIR(old_dentry->d_inode->i_mode)) + return simple_rename(old_dir, old_dentry, new_dir, new_dentry); + else + return -EINVAL; +} + +int rcfs_create_noperm(struct inode *dir, struct dentry *dentry, int mode, struct nameidata *nd) +{ + return -EPERM; +} + +int rcfs_symlink_noperm(struct inode *dir, struct dentry *dentry, const char *symname) +{ + return -EPERM; +} + +int rcfs_mkdir_noperm(struct inode *dir, struct dentry *dentry, int mode) +{ + return -EPERM; +} + +int rcfs_rmdir_noperm(struct inode *dir, struct dentry *dentry) +{ + return -EPERM; +} + +int rcfs_link_noperm(struct dentry *old_dentry, struct inode *dir, struct dentry *dentry) +{ + return -EPERM; +} + +int rcfs_unlink_noperm(struct inode *dir, struct dentry *dentry) +{ + return -EPERM; +} + +int rcfs_mknod_noperm(struct inode *dir, struct dentry *dentry, int mode, dev_t dev) +{ + return -EPERM; +} + +int rcfs_rename_noperm(struct inode *old_dir, struct dentry *old_dentry, struct inode *new_dir, struct dentry *new_dentry) +{ + return -EPERM; +} + +struct inode_operations rcfs_dir_inode_operations = { + .create = rcfs_create_noperm, + .lookup = simple_lookup, + .link = rcfs_link_noperm, + .unlink = rcfs_unlink, + .symlink = rcfs_symlink_noperm, + .mkdir = rcfs_mkdir, + .rmdir = rcfs_rmdir, + .mknod = rcfs_mknod_noperm, + .rename = rcfs_rename, +}; + +struct inode_operations rcfs_rootdir_inode_operations = { + .create = rcfs_create_noperm, + .lookup = simple_lookup, + .link = rcfs_link_noperm, + .unlink = rcfs_unlink_noperm, + .symlink = rcfs_symlink_noperm, + .mkdir = rcfs_mkdir_noperm, + .rmdir = rcfs_rmdir_noperm, + .mknod = rcfs_mknod_noperm, + .rename = rcfs_rename_noperm, +}; diff -puN /dev/null fs/rcfs/inode.c --- /dev/null Thu Apr 11 07:25:15 2002 +++ 25-akpm/fs/rcfs/inode.c Wed Jul 13 14:43:50 2005 @@ -0,0 +1,160 @@ +/* + * fs/rcfs/inode.c + * + * Copyright (C) Shailabh Nagar, IBM Corp. 2004 + * Vivek Kashyap, IBM Corp. 2004 + * + * Resource class filesystem (rcfs) forming the + * user interface to Class-based Kernel Resource Management (CKRM). + * + * Latest version, more details at http://ckrm.sf.net + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of version 2 of the GNU General Public License + * as published by the Free Software Foundation. + * + */ + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +/* + * Address of variable used as flag to indicate a magic file, + * value unimportant + */ +int RCFS_IS_MAGIC; + +struct inode *rcfs_get_inode(struct super_block *sb, int mode, dev_t dev) +{ + struct inode *inode = new_inode(sb); + + if (inode) { + inode->i_mode = mode; + inode->i_uid = current->fsuid; + inode->i_gid = current->fsgid; + inode->i_blksize = PAGE_CACHE_SIZE; + inode->i_blocks = 0; + inode->i_atime = inode->i_mtime = inode->i_ctime = CURRENT_TIME; + switch (mode & S_IFMT) { + default: + init_special_inode(inode, mode, dev); + break; + case S_IFREG: + /* Treat as default assignment */ + inode->i_op = &rcfs_file_inode_operations; + break; + case S_IFDIR: + inode->i_op = &rcfs_rootdir_inode_operations; + inode->i_fop = &simple_dir_operations; + + /* + * directory inodes start off with i_nlink == 2 + * (for "." entry) + */ + inode->i_nlink++; + break; + case S_IFLNK: + inode->i_op = &page_symlink_inode_operations; + break; + } + } + return inode; +} + +int rcfs_mknod(struct inode *dir, struct dentry *dentry, int mode, dev_t dev) +{ + struct inode *inode; + int error = -EPERM; + + if (dentry->d_inode) + return -EEXIST; + inode = rcfs_get_inode(dir->i_sb, mode, dev); + if (inode) { + if (dir->i_mode & S_ISGID) { + inode->i_gid = dir->i_gid; + if (S_ISDIR(mode)) + inode->i_mode |= S_ISGID; + } + d_instantiate(dentry, inode); + dget(dentry); + error = 0; + } + return error; +} + +struct dentry *rcfs_create_internal(struct dentry *parent, + struct rcfs_magf *magf, int magic) +{ + struct qstr qstr; + struct dentry *mfdentry; + + /* Get new dentry for name */ + qstr.name = magf->name; + qstr.len = strlen(magf->name); + qstr.hash = full_name_hash(magf->name, qstr.len); + mfdentry = lookup_hash(&qstr, parent); + + if (!IS_ERR(mfdentry)) { + int err; + + down(&parent->d_inode->i_sem); + if (magic && (magf->mode & S_IFDIR)) + err = parent->d_inode->i_op->mkdir(parent->d_inode, + mfdentry, + magf->mode); + else { + err = rcfs_mknod(parent->d_inode, mfdentry, + magf->mode, 0); + /* + * rcfs_mknod doesn't increment parent's link count, + * i_op->mkdir does. + */ + parent->d_inode->i_nlink++; + } + up(&parent->d_inode->i_sem); + if (err) { + dput(mfdentry); + return mfdentry; + } + } + return mfdentry; +} + +int rcfs_delete_internal(struct dentry *mfdentry) +{ + struct dentry *parent; + + if (!mfdentry || !mfdentry->d_parent) + return -EINVAL; + parent = mfdentry->d_parent; + if (!mfdentry->d_inode) { + return 0; + } + down(&mfdentry->d_inode->i_sem); + if (S_ISDIR(mfdentry->d_inode->i_mode)) + simple_rmdir(parent->d_inode, mfdentry); + else + simple_unlink(parent->d_inode, mfdentry); + up(&mfdentry->d_inode->i_sem); + d_delete(mfdentry); + + return 0; +} + +struct inode_operations rcfs_file_inode_operations = { + .getattr = simple_getattr, +}; diff -puN /dev/null fs/rcfs/magic.c --- /dev/null Thu Apr 11 07:25:15 2002 +++ 25-akpm/fs/rcfs/magic.c Wed Jul 13 14:43:50 2005 @@ -0,0 +1,517 @@ +/* + * fs/rcfs/magic.c + * + * Copyright (C) Shailabh Nagar, IBM Corp. 2004 + * (C) Vivek Kashyap, IBM Corp. 2004 + * (C) Chandra Seetharaman, IBM Corp. 2004 + * (C) Hubertus Franke, IBM Corp. 2004 + * + * File operations for common magic files in rcfs, + * the user interface for CKRM. + * + * Latest version, more details at http://ckrm.sf.net + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of version 2 of the GNU General Public License + * as published by the Free Software Foundation. + */ + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +#define MAX_INPUT_SIZE 100U + +static void mkvalidstr(char *s) +{ + char *p; + + for (p = s; *p != '\0'; ++p) { + if (*p < ' ' || *p > '~') { + *p = '\0'; + return; + } + } +} + + +static int +magic_show(struct seq_file *s, void *v) +{ + int rc=0; + ssize_t precnt; + struct ckrm_core_class *core; + struct rcfs_inode_info *rcfs_i = (struct rcfs_inode_info *)s->private; + int (*func) (struct ckrm_core_class *, struct seq_file *) = NULL; + + core = rcfs_i->core; + + if (!ckrm_is_core_valid(core)) + return -EINVAL; + + precnt = s->count; + if (!strcmp(rcfs_i->mfdentry->d_name.name, RCFS_CONFIG_NAME)) { + func = core->classtype->show_config; + } else if (!strcmp(rcfs_i->mfdentry->d_name.name, RCFS_MEMBERS_NAME)) { + func = core->classtype->show_members; + } else if (!strcmp(rcfs_i->mfdentry->d_name.name, RCFS_STATS_NAME)) { + func = core->classtype->show_stats; + } else if (!strcmp(rcfs_i->mfdentry->d_name.name, RCFS_SHARES_NAME)) { + func = core->classtype->show_shares; + } + if (func) + rc = func(core, s); + + if (s->count == precnt) + seq_printf(s, "No data to display\n"); + return rc; +}; + +static int +magic_open(struct inode *inode, struct file *file) +{ + struct rcfs_inode_info *ri; + int ret=-EINVAL; + + if (file->f_dentry) { + ri = rcfs_get_inode_info(file->f_dentry->d_inode); + ret = single_open(file, magic_show, (void *)ri); + } + return ret; +} + +static int +magic_close(struct inode *inode, struct file *file) +{ + return single_release(inode, file); +} + +enum parse_token_t { + parse_res_type, parse_str, parse_err +}; + +static match_table_t parse_tokens = { + {parse_res_type, "res=%s"}, + {parse_str, NULL}, + {parse_err, NULL}, +}; + +static int +magic_parse(const unsigned char *fname, char *options, + char **resstr, char **otherstr) +{ + char *p; + *resstr = NULL; + + if (!options) + return 0; + + while ((p = strsep(&options, ",")) != NULL) { + substring_t args[MAX_OPT_ARGS]; + int token; + + if (!*p) + continue; + + token = match_token(p, parse_tokens, args); + switch (token) { + case parse_res_type: + *resstr = match_strdup(args); + if (!strcmp(fname, RCFS_CONFIG_NAME)) { + char *str = p + strlen(p) + 1; + *otherstr = kmalloc(strlen(str) + 1, + GFP_KERNEL); + if (*otherstr == NULL) { + kfree(*resstr); + *resstr = NULL; + return 0; + } else { + strcpy(*otherstr, str); + return 1; + } + } + break; + case parse_str: + *otherstr = match_strdup(args); + break; + default: + return 0; + } + } + return (*resstr != NULL); +} + +static ssize_t +magic_write(struct file *file, const char __user *buf, + size_t count, loff_t *ppos) +{ + struct rcfs_inode_info *ri = + rcfs_get_inode_info(file->f_dentry->d_parent->d_inode); + char *optbuf, *otherstr=NULL, *resname=NULL; + int done, rc = 0; + struct ckrm_core_class *core ; + int (*func) (struct ckrm_core_class *, const char *, + const char *) = NULL; + + core = ri->core; + if (!ckrm_is_core_valid(core)) + return -EINVAL; + + if (count > MAX_INPUT_SIZE) + return -EINVAL; + + if (!access_ok(VERIFY_READ, buf, count)) + return -EFAULT; + + down(&(ri->vfs_inode.i_sem)); + + optbuf = kmalloc(MAX_INPUT_SIZE+1, GFP_KERNEL); + if (!optbuf) { + up(&(ri->vfs_inode.i_sem)); + return -ENOMEM; + } + __copy_from_user(optbuf, buf, count); + mkvalidstr(optbuf); + done = magic_parse(ri->mfdentry->d_name.name, + optbuf, &resname, &otherstr); + if (!done) { + printk(KERN_ERR "Error parsing data written to %s\n", + ri->mfdentry->d_name.name); + goto out; + } + if (!strcmp(ri->mfdentry->d_name.name, RCFS_CONFIG_NAME)) { + func = core->classtype->set_config; + } else if (!strcmp(ri->mfdentry->d_name.name, RCFS_STATS_NAME)) { + func = core->classtype->reset_stats; + } + if (func) { + rc = func(core, resname, otherstr); + if (rc) { + printk(KERN_ERR "magic_write: %s: error\n", + ri->mfdentry->d_name.name); + } + } +out: + up(&(ri->vfs_inode.i_sem)); + kfree(optbuf); + kfree(otherstr); + kfree(resname); + return rc ? rc : count; +} + +/* + * Shared function used by Target / Reclassify + */ + +static ssize_t +target_reclassify_write(struct file *file, const char __user * buf, + size_t count, loff_t * ppos, int manual) +{ + struct rcfs_inode_info *ri = rcfs_get_inode_info(file->f_dentry->d_inode); + char *optbuf; + int rc = -EINVAL; + struct ckrm_classtype *clstype; + + if (count > MAX_INPUT_SIZE) + return -EINVAL; + if (!access_ok(VERIFY_READ, buf, count)) + return -EFAULT; + down(&(ri->vfs_inode.i_sem)); + optbuf = kmalloc(MAX_INPUT_SIZE, GFP_KERNEL); + __copy_from_user(optbuf, buf, count); + mkvalidstr(optbuf); + clstype = ri->core->classtype; + if (clstype->forced_reclassify) + rc = (*clstype->forced_reclassify) (manual ? ri->core: NULL, optbuf); + up(&(ri->vfs_inode.i_sem)); + kfree(optbuf); + return (!rc ? count : rc); + +} + +/* + * Target + * + * pseudo file for manually reclassifying members to a class + */ + +static ssize_t +target_write(struct file *file, const char __user * buf, + size_t count, loff_t * ppos) +{ + return target_reclassify_write(file, buf, count, ppos, 1); +} + +struct file_operations target_fileops = { + .write = target_write, +}; + +/* + * Reclassify + * + * pseudo file for reclassification of an object through CE + */ + +static ssize_t +reclassify_write(struct file *file, const char __user * buf, + size_t count, loff_t * ppos) +{ + return target_reclassify_write(file, buf, count, ppos, 0); +} + +struct file_operations reclassify_fileops = { + .write = reclassify_write, +}; + +/* + * Config + * + * Set/get configuration parameters of a class. + */ + +/* + * Currently there are no per-class config parameters defined. + * Use existing code as a template + */ + +struct file_operations config_fileops = { + .open = magic_open, + .read = seq_read, + .llseek = seq_lseek, + .release = magic_close, + .write = magic_write, +}; + +/* + * Members + * + * List members of a class + */ + +struct file_operations members_fileops = { + .open = magic_open, + .read = seq_read, + .llseek = seq_lseek, + .release = magic_close, +}; + +/* + * Stats + * + * Get/reset class statistics + * No standard set of stats defined. Each resource controller chooses + * its own set of statistics to maintain and export. + */ + +struct file_operations stats_fileops = { + .open = magic_open, + .read = seq_read, + .llseek = seq_lseek, + .release = magic_close, + .write = magic_write, +}; + +/* + * Shares + * + * Set/get shares of a taskclass. + * Share types and semantics are defined by rcfs and ckrm core + */ + +#define SHARES_MAX_INPUT_SIZE 300U + +/* + * The enums for the share types should match the indices expected by + * array parameter to ckrm_set_resshare + * + * Note only the first NUM_SHAREVAL enums correspond to share types, + * the remaining ones are for token matching purposes + */ + +enum share_token_t { + MY_GUAR, MY_LIM, TOT_GUAR, MAX_LIM, SHARE_RES_TYPE, SHARE_ERR +}; + +/* Token matching for parsing input to this magic file */ +static match_table_t shares_tokens = { + {SHARE_RES_TYPE, "res=%s"}, + {MY_GUAR, "guarantee=%d"}, + {MY_LIM, "limit=%d"}, + {TOT_GUAR, "total_guarantee=%d"}, + {MAX_LIM, "max_limit=%d"}, + {SHARE_ERR, NULL} +}; + +static int +shares_parse(char *options, char **resstr, struct ckrm_shares *shares) +{ + char *p; + int option; + + if (!options) + return 1; + while ((p = strsep(&options, ",")) != NULL) { + substring_t args[MAX_OPT_ARGS]; + int token; + + if (!*p) + continue; + token = match_token(p, shares_tokens, args); + switch (token) { + case SHARE_RES_TYPE: + *resstr = match_strdup(args); + break; + case MY_GUAR: + if (match_int(args, &option)) + return 0; + shares->my_guarantee = option; + break; + case MY_LIM: + if (match_int(args, &option)) + return 0; + shares->my_limit = option; + break; + case TOT_GUAR: + if (match_int(args, &option)) + return 0; + shares->total_guarantee = option; + break; + case MAX_LIM: + if (match_int(args, &option)) + return 0; + shares->max_limit = option; + break; + default: + return 0; + } + } + return 1; +} + +static ssize_t +shares_write(struct file *file, const char __user * buf, + size_t count, loff_t * ppos) +{ + struct inode *inode = file->f_dentry->d_inode; + struct rcfs_inode_info *ri; + char *optbuf; + int rc = 0; + struct ckrm_core_class *core; + int done; + char *resname = NULL; + + struct ckrm_shares newshares = { + CKRM_SHARE_UNCHANGED, + CKRM_SHARE_UNCHANGED, + CKRM_SHARE_UNCHANGED, + CKRM_SHARE_UNCHANGED, + CKRM_SHARE_UNCHANGED, + CKRM_SHARE_UNCHANGED + }; + if (count > SHARES_MAX_INPUT_SIZE) + return -EINVAL; + if (!access_ok(VERIFY_READ, buf, count)) + return -EFAULT; + ri = rcfs_get_inode_info(file->f_dentry->d_parent->d_inode); + if (!ri || !ckrm_is_core_valid((struct ckrm_core_class *) (ri->core))) { + printk(KERN_ERR "shares_write: Error accessing core class\n"); + return -EFAULT; + } + down(&inode->i_sem); + core = ri->core; + optbuf = kmalloc(SHARES_MAX_INPUT_SIZE, GFP_KERNEL); + if (!optbuf) { + up(&inode->i_sem); + return -ENOMEM; + } + __copy_from_user(optbuf, buf, count); + mkvalidstr(optbuf); + done = shares_parse(optbuf, &resname, &newshares); + if (!done) { + printk(KERN_ERR "Error parsing shares\n"); + rc = -EINVAL; + goto write_out; + } + if (core->classtype->set_shares) { + rc = (*core->classtype->set_shares) (core, resname, &newshares); + if (rc) { + printk(KERN_ERR + "shares_write: resctlr share set error\n"); + goto write_out; + } + } + printk(KERN_ERR "Set %s shares to %d %d %d %d\n", + resname, + newshares.my_guarantee, + newshares.my_limit, + newshares.total_guarantee, newshares.max_limit); + rc = count; + +write_out: + up(&inode->i_sem); + kfree(optbuf); + kfree(resname); + return rc; +} + +struct file_operations shares_fileops = { + .open = magic_open, + .read = seq_read, + .llseek = seq_lseek, + .release = magic_close, + .write = shares_write, +}; + +/* + * magic file creation/deletion + */ + +int rcfs_clear_magic(struct dentry *parent) +{ + struct dentry *mftmp, *mfdentry; + + list_for_each_entry_safe(mfdentry, mftmp, &parent->d_subdirs, d_child) { + if (!rcfs_is_magic(mfdentry)) + continue; + if (rcfs_delete_internal(mfdentry)) + printk(KERN_ERR + "rcfs_clear_magic: error deleting one\n"); + } + return 0; +} + +EXPORT_SYMBOL_GPL(rcfs_clear_magic); + +int rcfs_create_magic(struct dentry *parent, struct rcfs_magf magf[], int count) +{ + int i; + struct dentry *mfdentry; + + for (i = 0; i < count; i++) { + mfdentry = rcfs_create_internal(parent, &magf[i], 0); + if (IS_ERR(mfdentry)) { + rcfs_clear_magic(parent); + return -ENOMEM; + } + rcfs_get_inode_info(mfdentry->d_inode)->core = + rcfs_get_inode_info(parent->d_inode)->core; + rcfs_get_inode_info(mfdentry->d_inode)->mfdentry = mfdentry; + mfdentry->d_fsdata = &RCFS_IS_MAGIC; + if (magf[i].i_fop) + mfdentry->d_inode->i_fop = magf[i].i_fop; + if (magf[i].i_op) + mfdentry->d_inode->i_op = magf[i].i_op; + } + return 0; +} + +EXPORT_SYMBOL_GPL(rcfs_create_magic); diff -puN /dev/null fs/rcfs/Makefile --- /dev/null Thu Apr 11 07:25:15 2002 +++ 25-akpm/fs/rcfs/Makefile Wed Jul 13 14:43:50 2005 @@ -0,0 +1,7 @@ +# +# Makefile for rcfs routines. +# + +obj-$(CONFIG_RCFS_FS) += rcfs.o + +rcfs-y := super.o inode.o dir.o rootdir.o magic.o diff -puN /dev/null fs/rcfs/rootdir.c --- /dev/null Thu Apr 11 07:25:15 2002 +++ 25-akpm/fs/rcfs/rootdir.c Wed Jul 13 14:43:50 2005 @@ -0,0 +1,198 @@ +/* + * fs/rcfs/rootdir.c + * + * Copyright (C) Vivek Kashyap, IBM Corp. 2004 + * + * + * Functions for creating root directories and magic files + * for classtypes and classification engines under rcfs + * + * Latest version, more details at http://ckrm.sf.net + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of version 2 of the GNU General Public License + * as published by the Free Software Foundation. + */ + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +struct rbce_eng_callback rcfs_eng_callbacks = { + NULL, NULL +}; + +int rcfs_register_engine(struct rbce_eng_callback * rcbs) +{ + if (!rcbs->mkdir || rcfs_eng_callbacks.mkdir) { + return -EINVAL; + } + rcfs_eng_callbacks = *rcbs; + rcfs_engine_regd++; + return 0; +} + +EXPORT_SYMBOL_GPL(rcfs_register_engine); + +int rcfs_unregister_engine(struct rbce_eng_callback * rcbs) +{ + if (!rcbs->mkdir || !rcfs_eng_callbacks.mkdir || + (rcbs->mkdir != rcfs_eng_callbacks.mkdir)) { + return -EINVAL; + } + rcfs_eng_callbacks.mkdir = NULL; + rcfs_eng_callbacks.rmdir = NULL; + rcfs_engine_regd--; + return 0; +} + +EXPORT_SYMBOL(rcfs_unregister_engine); + +/* + * rcfs_mkroot + * Create and return a "root" dentry under /rcfs. + * Also create associated magic files + * + * @mfdesc: array of rcfs_magf describing root dir and its magic files + * @count: number of entries in mfdesc + * @core: core class to be associated with root + * @rootde: output parameter to return the newly created root dentry + */ + +int rcfs_mkroot(struct rcfs_magf *mfdesc, int mfcount, struct dentry **rootde) +{ + int sz; + struct rcfs_magf *rootdesc = &mfdesc[0]; + struct dentry *dentry; + struct rcfs_inode_info *rootri; + + if ((mfcount < 0) || (!mfdesc)) + return -EINVAL; + + rootdesc = &mfdesc[0]; + printk("allocating classtype root <%s>\n", rootdesc->name); + dentry = rcfs_create_internal(rcfs_rootde, rootdesc, 0); + + if (!dentry) { + printk(KERN_ERR "Could not create %s\n", rootdesc->name); + return -ENOMEM; + } + rootri = rcfs_get_inode_info(dentry->d_inode); + sz = strlen(rootdesc->name) + strlen(RCFS_ROOT) + 2; + rootri->name = kmalloc(sz, GFP_KERNEL); + if (!rootri->name) { + printk(KERN_ERR "Error allocating name for %s\n", + rootdesc->name); + rcfs_delete_internal(dentry); + return -ENOMEM; + } + snprintf(rootri->name, sz, "%s/%s", RCFS_ROOT, rootdesc->name); + if (rootdesc->i_fop) + dentry->d_inode->i_fop = rootdesc->i_fop; + if (rootdesc->i_op) + dentry->d_inode->i_op = rootdesc->i_op; + + /* set output parameters */ + *rootde = dentry; + + return 0; +} + +EXPORT_SYMBOL_GPL(rcfs_mkroot); + +int rcfs_rmroot(struct dentry *rootde) +{ + struct rcfs_inode_info *ri; + + if (!rootde) + return -EINVAL; + + rcfs_clear_magic(rootde); + ri = rcfs_get_inode_info(rootde->d_inode); + kfree(ri->name); + ri->name = NULL; + rcfs_delete_internal(rootde); + return 0; +} + +EXPORT_SYMBOL_GPL(rcfs_rmroot); + +int rcfs_register_classtype(struct ckrm_classtype * clstype) +{ + int rc; + struct rcfs_inode_info *rootri; + struct rcfs_magf *mfdesc; + + if (genmfdesc[clstype->mfidx] == NULL) { + return -ENOMEM; + } + + clstype->mfdesc = (void *)genmfdesc[clstype->mfidx]->rootmf; + clstype->mfcount = genmfdesc[clstype->mfidx]->rootmflen; + + mfdesc = (struct rcfs_magf *)clstype->mfdesc; + + /* rcfs root entry has the same name as the classtype */ + strncpy(mfdesc[0].name, clstype->name, RCFS_MAGF_NAMELEN); + + rc = rcfs_mkroot(mfdesc, clstype->mfcount, + (struct dentry **)&(clstype->rootde)); + if (rc) + return rc; + rootri = rcfs_get_inode_info(((struct dentry *)(clstype->rootde))->d_inode); + rootri->core = clstype->default_class; + clstype->default_class->name = rootri->name; + ckrm_core_grab(clstype->default_class); + + /* Create magic files under root */ + if ((rc = rcfs_create_magic(clstype->rootde, &mfdesc[1], + clstype->mfcount - 1))) { + kfree(rootri->name); + rootri->name = NULL; + rcfs_delete_internal(clstype->rootde); + return rc; + } + return rc; +} + +EXPORT_SYMBOL_GPL(rcfs_register_classtype); + +int rcfs_deregister_classtype(struct ckrm_classtype * clstype) +{ + int rc; + + rc = rcfs_rmroot((struct dentry *)clstype->rootde); + if (!rc) { + clstype->default_class->name = NULL; + ckrm_core_drop(clstype->default_class); + } + return rc; +} + +EXPORT_SYMBOL_GPL(rcfs_deregister_classtype); + +/* Common root and magic file entries. + * root name, root permissions, magic file names and magic file permissions + * are needed by all entities (classtypes and classification engines) existing + * under the rcfs mount point + * + * The common sets of these attributes are listed here as a table. Individual + * classtypes and classification engines can simple specify the index into the + * table to initialize their magf entries. + */ + +struct rcfs_mfdesc *genmfdesc[] = { + NULL, +}; diff -puN /dev/null fs/rcfs/super.c --- /dev/null Thu Apr 11 07:25:15 2002 +++ 25-akpm/fs/rcfs/super.c Wed Jul 13 14:43:50 2005 @@ -0,0 +1,291 @@ +/* + * fs/rcfs/super.c + * + * Copyright (C) Shailabh Nagar, IBM Corp. 2004 + * Vivek Kashyap, IBM Corp. 2004 + * + * Super block operations for rcfs + * + * + * Latest version, more details at http://ckrm.sf.net + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of version 2 of the GNU General Public License + * as published by the Free Software Foundation. + */ + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +static kmem_cache_t *rcfs_inode_cachep; + +inline struct rcfs_inode_info *rcfs_get_inode_info(struct inode *inode) +{ + return container_of(inode, struct rcfs_inode_info, vfs_inode); +} + +static struct inode *rcfs_alloc_inode(struct super_block *sb) +{ + struct rcfs_inode_info *ri; + ri = (struct rcfs_inode_info *)kmem_cache_alloc(rcfs_inode_cachep, + SLAB_KERNEL); + if (!ri) + return NULL; + ri->name = NULL; + return &ri->vfs_inode; +} + +static void rcfs_destroy_inode(struct inode *inode) +{ + struct rcfs_inode_info *ri = rcfs_get_inode_info(inode); + + kfree(ri->name); + kmem_cache_free(rcfs_inode_cachep, ri); +} + +static void +rcfs_init_once(void *foo, kmem_cache_t * cachep, unsigned long flags) +{ + struct rcfs_inode_info *ri = (struct rcfs_inode_info *)foo; + + if ((flags & (SLAB_CTOR_VERIFY | SLAB_CTOR_CONSTRUCTOR)) == + SLAB_CTOR_CONSTRUCTOR) + inode_init_once(&ri->vfs_inode); +} + +int rcfs_init_inodecache(void) +{ + rcfs_inode_cachep = kmem_cache_create("rcfs_inode_cache", + sizeof(struct rcfs_inode_info), + 0, + SLAB_HWCACHE_ALIGN | + SLAB_RECLAIM_ACCOUNT, + rcfs_init_once, NULL); + if (rcfs_inode_cachep == NULL) + return -ENOMEM; + return 0; +} + +void rcfs_destroy_inodecache(void) +{ + pr_debug("destroy inodecache was called\n"); + if (kmem_cache_destroy(rcfs_inode_cachep)) + printk(KERN_INFO + "rcfs_inode_cache: not all structures were freed\n"); +} + +struct super_operations rcfs_super_ops = { + .alloc_inode = rcfs_alloc_inode, + .destroy_inode = rcfs_destroy_inode, + .statfs = simple_statfs, + .drop_inode = generic_delete_inode, +}; + +struct dentry *rcfs_rootde; /* redundant; can also get it from sb */ +static struct inode *rcfs_root; +static struct rcfs_inode_info *rcfs_rootri; + +static int rcfs_fill_super(struct super_block *sb, void *data, int silent) +{ + struct inode *inode; + struct dentry *root; + struct rcfs_inode_info *rootri; + struct ckrm_classtype *clstype; + int i, rc; + + sb->s_fs_info = NULL; + if (rcfs_mounted) { + return -EPERM; + } + rcfs_mounted++; + + sb->s_blocksize = PAGE_CACHE_SIZE; + sb->s_blocksize_bits = PAGE_CACHE_SHIFT; + sb->s_magic = RCFS_MAGIC; + sb->s_op = &rcfs_super_ops; + inode = rcfs_get_inode(sb, S_IFDIR | 0755, 0); + if (!inode) + return -ENOMEM; + inode->i_op = &rcfs_rootdir_inode_operations; + + root = d_alloc_root(inode); + if (!root) { + iput(inode); + return -ENOMEM; + } + sb->s_root = root; + + /* Link inode and core class */ + rootri = rcfs_get_inode_info(inode); + rootri->name = kmalloc(strlen(RCFS_ROOT) + 1, GFP_KERNEL); + if (!rootri->name) { + d_delete(root); + iput(inode); + return -ENOMEM; + } + strcpy(rootri->name, RCFS_ROOT); + rootri->core = NULL; + + rcfs_root = inode; + sb->s_fs_info = rcfs_root = inode; + rcfs_rootde = root; + rcfs_rootri = rootri; + + /* register metatypes */ + for (i = 0; i < CKRM_MAX_CLASSTYPES; i++) { + clstype = ckrm_classtypes[i]; + if (clstype == NULL) + continue; + printk("A non null classtype\n"); + + if ((rc = rcfs_register_classtype(clstype))) + continue; /* could return with an error too */ + } + + /* + * do post-mount initializations needed by CE + * this is distinct from CE registration done on rcfs module load + */ + if (rcfs_engine_regd) { + if (rcfs_eng_callbacks.mnt) + if ((rc = (*rcfs_eng_callbacks.mnt) ())) { + printk(KERN_ERR "Error in CE mnt %d\n", rc); + } + } + /* + * Following comment handled by code above; keep nonetheless if it + * can be done better + * + * register CE's with rcfs + * check if CE loaded + * call rcfs_register_engine for each classtype + * AND rcfs_mkroot (preferably subsume latter in former) + */ + return 0; +} + +static struct super_block *rcfs_get_sb(struct file_system_type *fs_type, + int flags, const char *dev_name, + void *data) +{ + return get_sb_nodev(fs_type, flags, data, rcfs_fill_super); +} + +void rcfs_kill_sb(struct super_block *sb) +{ + int i, rc; + struct ckrm_classtype *clstype; + + if (sb->s_fs_info != rcfs_root) { + generic_shutdown_super(sb); + return; + } + rcfs_mounted--; + + for (i = 0; i < CKRM_MAX_CLASSTYPES; i++) { + clstype = ckrm_classtypes[i]; + if (clstype == NULL || clstype->rootde == NULL) + continue; + + if ((rc = rcfs_deregister_classtype(clstype))) { + printk(KERN_ERR "Error removing classtype %s\n", + clstype->name); + } + } + + /* + * do pre-umount shutdown needed by CE + * this is distinct from CE deregistration done on rcfs module unload + */ + if (rcfs_engine_regd) { + if (rcfs_eng_callbacks.umnt) + if ((rc = (*rcfs_eng_callbacks.umnt) ())) { + printk(KERN_ERR "Error in CE umnt %d\n", rc); + /* TODO: return ; until error handling improves */ + } + } + /* + * Following comment handled by code above; keep nonetheless if it + * can be done better + * + * deregister CE with rcfs + * Check if loaded + * if ce is in one directory /rcfs/ce, + * rcfs_deregister_engine for all classtypes within above + * codebase + * followed by + * rcfs_rmroot here + * if ce in multiple (per-classtype) directories + * call rbce_deregister_engine within ckrm_deregister_classtype + * + * following will automatically clear rcfs root entry including its + * rcfs_inode_info + */ + + generic_shutdown_super(sb); +} + +static struct file_system_type rcfs_fs_type = { + .name = "rcfs", + .get_sb = rcfs_get_sb, + .kill_sb = rcfs_kill_sb, +}; + +struct rcfs_functions my_rcfs_fn = { + .mkroot = rcfs_mkroot, + .rmroot = rcfs_rmroot, + .register_classtype = rcfs_register_classtype, + .deregister_classtype = rcfs_deregister_classtype, +}; + +extern struct rcfs_functions rcfs_fn; + +static int __init init_rcfs_fs(void) +{ + int ret; + + ret = register_filesystem(&rcfs_fs_type); + if (ret) + goto init_register_err; + ret = rcfs_init_inodecache(); + if (ret) + goto init_cache_err; + rcfs_fn = my_rcfs_fn; + /* + * Due to tight coupling of this module with ckrm + * do not allow this module to be removed. + */ + try_module_get(THIS_MODULE); + return ret; + +init_cache_err: + unregister_filesystem(&rcfs_fs_type); +init_register_err: + return ret; +} + +static void __exit exit_rcfs_fs(void) +{ + rcfs_destroy_inodecache(); + unregister_filesystem(&rcfs_fs_type); +} + +module_init(init_rcfs_fs) +module_exit(exit_rcfs_fs) + +MODULE_LICENSE("GPL"); diff -puN include/linux/rcfs.h~ckrm-resource-control-file-system-rcfs include/linux/rcfs.h --- 25/include/linux/rcfs.h~ckrm-resource-control-file-system-rcfs Wed Jul 13 14:43:50 2005 +++ 25-akpm/include/linux/rcfs.h Wed Jul 13 14:43:50 2005 @@ -16,12 +16,24 @@ #define RCFS_MAGF_NAMELEN 20 extern int RCFS_IS_MAGIC; +/* + * Following strings are the names of the system defined files under + * the rcfs filesystem + */ + +#define RCFS_CONFIG_NAME "config" +#define RCFS_MEMBERS_NAME "members" +#define RCFS_STATS_NAME "stats" +#define RCFS_SHARES_NAME "shares" +#define RCFS_RECLASSIFY_NAME "reclassify" + #define rcfs_is_magic(dentry) ((dentry)->d_fsdata == &RCFS_IS_MAGIC) struct rcfs_inode_info { struct ckrm_core_class *core; char *name; struct inode vfs_inode; + struct dentry *mfdentry; }; #define RCFS_DEFAULT_DIR_MODE (S_IFDIR | S_IRUGO | S_IXUGO) @@ -45,16 +57,10 @@ struct rcfs_mfdesc { extern struct rcfs_mfdesc *genmfdesc[]; -struct rcfs_inode_info *RCFS_I(struct inode *inode); - -int rcfs_empty(struct dentry *); +struct rcfs_inode_info *rcfs_get_inode_info(struct inode *inode); struct inode *rcfs_get_inode(struct super_block *, int, dev_t); int rcfs_mknod(struct inode *, struct dentry *, int, dev_t); -int _rcfs_mknod(struct inode *, struct dentry *, int, dev_t); -int rcfs_mkdir(struct inode *, struct dentry *, int); -struct ckrm_core_class *rcfs_make_core(struct dentry *, struct ckrm_core_class *); struct dentry *rcfs_set_magf_byname(char *, void *); - struct dentry *rcfs_create_internal(struct dentry *, struct rcfs_magf *, int); int rcfs_delete_internal(struct dentry *); int rcfs_create_magic(struct dentry *, struct rcfs_magf *, int); diff -puN init/Kconfig~ckrm-resource-control-file-system-rcfs init/Kconfig --- 25/init/Kconfig~ckrm-resource-control-file-system-rcfs Wed Jul 13 14:43:50 2005 +++ 25-akpm/init/Kconfig Wed Jul 13 14:43:50 2005 @@ -160,6 +160,16 @@ config CKRM If you say Y here, enable the Resource Class File System and at least one of the resource controllers below. Say N if you are unsure. +config RCFS_FS + tristate "Resource Class File System (User API)" + depends on CKRM + default m + help + RCFS is the filesystem API for CKRM. Compiling it as a module permits + users to only load RCFS if they intend to use CKRM. + + Say M if unsure, Y to save on module loading. N doesn't make sense + when CKRM has been configured. endmenu config SYSCTL _