Re: [PATCH] ceph: new mount option that specifies fscache uniquifier

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Wed, 2017-06-28 at 16:04 +0800, Yan, Zheng wrote:
> Current ceph uses FSID as primary index key of fscache data. This
> allows ceph to retain cached data across remount. But this causes
> problem (kernel opps, fscache does not support sharing data) when
> a filesystem get mounted several times (with fscache enabled, with
> different mount options).
> 
> The fix is adding a new mount option, which specifies uniquifier
> for fscache.
> 
> Signed-off-by: "Yan, Zheng" <zyan@xxxxxxxxxx>
> ---
>  fs/ceph/cache.c | 92 +++++++++++++++++++++++++++++++++++++++++++++++++++------
>  fs/ceph/super.c | 41 +++++++++++++++++--------
>  fs/ceph/super.h |  1 +
>  3 files changed, 113 insertions(+), 21 deletions(-)
> 
> diff --git a/fs/ceph/cache.c b/fs/ceph/cache.c
> index 4e7421c..fd11728 100644
> --- a/fs/ceph/cache.c
> +++ b/fs/ceph/cache.c
> @@ -35,18 +35,34 @@ struct fscache_netfs ceph_cache_netfs = {
>  	.version	= 0,
>  };
>  
> +static DEFINE_MUTEX(ceph_fscache_lock);
> +static LIST_HEAD(ceph_fscache_list);
> +
> +struct ceph_fscache_entry {
> +	struct list_head list;
> +	struct fscache_cookie *fscache;
> +	struct ceph_fsid fsid;
> +	size_t uniq_len;
> +	char uniquifier[0];
> +};
> +
>  static uint16_t ceph_fscache_session_get_key(const void *cookie_netfs_data,
>  					     void *buffer, uint16_t maxbuf)
>  {
>  	const struct ceph_fs_client* fsc = cookie_netfs_data;
> -	uint16_t klen;
> +	const char *fscache_uniq = fsc->mount_options->fscache_uniq;
> +	uint16_t fsid_len, uniq_len;
>  
> -	klen = sizeof(fsc->client->fsid);
> -	if (klen > maxbuf)
> +	fsid_len = sizeof(fsc->client->fsid);
> +	uniq_len = fscache_uniq ? strlen(fscache_uniq) : 0;
> +	if (fsid_len + uniq_len > maxbuf)
>  		return 0;
>  
> -	memcpy(buffer, &fsc->client->fsid, klen);
> -	return klen;
> +	memcpy(buffer, &fsc->client->fsid, fsid_len);
> +	if (uniq_len)
> +		memcpy(buffer + fsid_len, fscache_uniq, uniq_len);
> +
> +	return fsid_len + uniq_len;
>  }
>  
>  static const struct fscache_cookie_def ceph_fscache_fsid_object_def = {
> @@ -67,13 +83,54 @@ void ceph_fscache_unregister(void)
>  
>  int ceph_fscache_register_fs(struct ceph_fs_client* fsc)
>  {
> +	const struct ceph_fsid *fsid = &fsc->client->fsid;
> +	const char *fscache_uniq = fsc->mount_options->fscache_uniq;
> +	size_t uniq_len = fscache_uniq ? strlen(fscache_uniq) : 0;
> +	struct ceph_fscache_entry *ent;
> +	int err = 0;
> +
> +	mutex_lock(&ceph_fscache_lock);
> +	list_for_each_entry(ent, &ceph_fscache_list, list) {
> +		if (memcmp(&ent->fsid, fsid, sizeof(*fsid)))
> +			continue;
> +		if (ent->uniq_len != uniq_len)
> +			continue;
> +		if (uniq_len && memcmp(ent->uniquifier, fscache_uniq, uniq_len))
> +			continue;
> +
> +		pr_err("fscache cookie already registered for fsid %pU\n", fsid);
> +		pr_err("  use fsc=%%s mount option to specify a uniquifier\n");
> +		err = -EBUSY;
> +		goto out_unlock;
> +	}
> +
> +	ent = kzalloc(sizeof(*ent) + uniq_len, GFP_KERNEL);
> +	if (!ent) {
> +		err = -ENOMEM;
> +		goto out_unlock;
> +	}
> +
>  	fsc->fscache = fscache_acquire_cookie(ceph_cache_netfs.primary_index,
>  					      &ceph_fscache_fsid_object_def,
>  					      fsc, true);
> -	if (!fsc->fscache)
> -		pr_err("Unable to register fsid: %p fscache cookie\n", fsc);
>  
> -	return 0;
> +	if (fsc->fscache) {
> +		memcpy(&ent->fsid, fsid, sizeof(*fsid));
> +		if (uniq_len > 0) {
> +			memcpy(&ent->uniquifier, fscache_uniq, uniq_len);
> +			ent->uniq_len = uniq_len;
> +		}
> +		ent->fscache = fsc->fscache;
> +		list_add_tail(&ent->list, &ceph_fscache_list);
> +	} else {
> +		kfree(ent);
> +		pr_err("unable to register fscache cookie for fsid %pU\n",
> +		       fsid);
> +		/* all other fs ignore this error */
> +	}
> +out_unlock:
> +	mutex_unlock(&ceph_fscache_lock);
> +	return err;
>  }
>  
>  static uint16_t ceph_fscache_inode_get_key(const void *cookie_netfs_data,
> @@ -349,7 +406,24 @@ void ceph_invalidate_fscache_page(struct inode* inode, struct page *page)
>  
>  void ceph_fscache_unregister_fs(struct ceph_fs_client* fsc)
>  {
> -	fscache_relinquish_cookie(fsc->fscache, 0);
> +	if (fscache_cookie_valid(fsc->fscache)) {
> +		struct ceph_fscache_entry *ent;
> +		bool found = false;
> +
> +		mutex_lock(&ceph_fscache_lock);
> +		list_for_each_entry(ent, &ceph_fscache_list, list) {
> +			if (ent->fscache == fsc->fscache) {
> +				list_del(&ent->list);
> +				kfree(ent);
> +				found = true;
> +				break;
> +			}
> +		}
> +		WARN_ON_ONCE(!found);
> +		mutex_unlock(&ceph_fscache_lock);
> +
> +		__fscache_relinquish_cookie(fsc->fscache, 0);
> +	}
>  	fsc->fscache = NULL;
>  }
>  
> diff --git a/fs/ceph/super.c b/fs/ceph/super.c
> index 14e78dd..aa06a8c 100644
> --- a/fs/ceph/super.c
> +++ b/fs/ceph/super.c
> @@ -121,6 +121,7 @@ enum {
>  	/* int args above */
>  	Opt_snapdirname,
>  	Opt_mds_namespace,
> +	Opt_fscache_uniq,
>  	Opt_last_string,
>  	/* string args above */
>  	Opt_dirstat,
> @@ -158,6 +159,7 @@ static match_table_t fsopt_tokens = {
>  	/* int args above */
>  	{Opt_snapdirname, "snapdirname=%s"},
>  	{Opt_mds_namespace, "mds_namespace=%s"},
> +	{Opt_fscache_uniq, "fsc=%s"},
>  	/* string args above */
>  	{Opt_dirstat, "dirstat"},
>  	{Opt_nodirstat, "nodirstat"},
> @@ -223,6 +225,14 @@ static int parse_fsopt_token(char *c, void *private)
>  		if (!fsopt->mds_namespace)
>  			return -ENOMEM;
>  		break;
> +	case Opt_fscache_uniq:
> +		fsopt->fscache_uniq = kstrndup(argstr[0].from,
> +					       argstr[0].to-argstr[0].from,
> +					       GFP_KERNEL);
> +		if (!fsopt->fscache_uniq)
> +			return -ENOMEM;
> +		fsopt->flags |= CEPH_MOUNT_OPT_FSCACHE;
> +		break;
>  		/* misc */
>  	case Opt_wsize:
>  		fsopt->wsize = intval;
> @@ -317,6 +327,7 @@ static void destroy_mount_options(struct ceph_mount_options *args)
>  	kfree(args->snapdir_name);
>  	kfree(args->mds_namespace);
>  	kfree(args->server_path);
> +	kfree(args->fscache_uniq);
>  	kfree(args);
>  }
>  
> @@ -350,10 +361,12 @@ static int compare_mount_options(struct ceph_mount_options *new_fsopt,
>  	ret = strcmp_null(fsopt1->mds_namespace, fsopt2->mds_namespace);
>  	if (ret)
>  		return ret;
> -
>  	ret = strcmp_null(fsopt1->server_path, fsopt2->server_path);
>  	if (ret)
>  		return ret;
> +	ret = strcmp_null(fsopt1->fscache_uniq, fsopt2->fscache_uniq);
> +	if (ret)
> +		return ret;
>  
>  	return ceph_compare_options(new_opt, fsc->client);
>  }
> @@ -475,8 +488,12 @@ static int ceph_show_options(struct seq_file *m, struct dentry *root)
>  		seq_puts(m, ",noasyncreaddir");
>  	if ((fsopt->flags & CEPH_MOUNT_OPT_DCACHE) == 0)
>  		seq_puts(m, ",nodcache");
> -	if (fsopt->flags & CEPH_MOUNT_OPT_FSCACHE)
> -		seq_puts(m, ",fsc");
> +	if (fsopt->flags & CEPH_MOUNT_OPT_FSCACHE) {
> +		if (fsopt->fscache_uniq)
> +			seq_printf(m, ",fsc=%s", fsopt->fscache_uniq);
> +		else
> +			seq_puts(m, ",fsc");
> +	}
>  	if (fsopt->flags & CEPH_MOUNT_OPT_NOPOOLPERM)
>  		seq_puts(m, ",nopoolperm");
>  
> @@ -597,18 +614,11 @@ static struct ceph_fs_client *create_fs_client(struct ceph_mount_options *fsopt,
>  	if (!fsc->wb_pagevec_pool)
>  		goto fail_trunc_wq;
>  
> -	/* setup fscache */
> -	if ((fsopt->flags & CEPH_MOUNT_OPT_FSCACHE) &&
> -	    (ceph_fscache_register_fs(fsc) != 0))
> -		goto fail_fscache;
> -
>  	/* caps */
>  	fsc->min_caps = fsopt->max_readdir;
>  
>  	return fsc;
>  
> -fail_fscache:
> -	ceph_fscache_unregister_fs(fsc);
>  fail_trunc_wq:
>  	destroy_workqueue(fsc->trunc_wq);
>  fail_pg_inv_wq:
> @@ -626,8 +636,6 @@ static void destroy_fs_client(struct ceph_fs_client *fsc)
>  {
>  	dout("destroy_fs_client %p\n", fsc);
>  
> -	ceph_fscache_unregister_fs(fsc);
> -
>  	destroy_workqueue(fsc->wb_wq);
>  	destroy_workqueue(fsc->pg_inv_wq);
>  	destroy_workqueue(fsc->trunc_wq);
> @@ -820,6 +828,13 @@ static struct dentry *ceph_real_mount(struct ceph_fs_client *fsc)
>  		if (err < 0)
>  			goto out;
>  
> +		/* setup fscache */
> +		if (fsc->mount_options->flags & CEPH_MOUNT_OPT_FSCACHE) {
> +			err = ceph_fscache_register_fs(fsc);
> +			if (err < 0)
> +				goto out;
> +		}
> +
>  		if (!fsc->mount_options->server_path) {
>  			path = "";
>  			dout("mount opening path \\t\n");
> @@ -1042,6 +1057,8 @@ static void ceph_kill_sb(struct super_block *s)
>  	fsc->client->extra_mon_dispatch = NULL;
>  	ceph_fs_debugfs_cleanup(fsc);
>  
> +	ceph_fscache_unregister_fs(fsc);
> +
>  	ceph_mdsc_destroy(fsc);
>  
>  	destroy_fs_client(fsc);
> diff --git a/fs/ceph/super.h b/fs/ceph/super.h
> index f8a0aba..f02a222 100644
> --- a/fs/ceph/super.h
> +++ b/fs/ceph/super.h
> @@ -73,6 +73,7 @@ struct ceph_mount_options {
>  	char *snapdir_name;   /* default ".snap" */
>  	char *mds_namespace;  /* default NULL */
>  	char *server_path;    /* default  "/" */
> +	char *fscache_uniq;   /* default NULL */
>  };
>  
>  struct ceph_fs_client {

Acked-by: Jeff Layton <jlayton@xxxxxxxxxx>
--
To unsubscribe from this list: send the line "unsubscribe ceph-devel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html



[Index of Archives]     [CEPH Users]     [Ceph Large]     [Information on CEPH]     [Linux BTRFS]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]
  Powered by Linux