Re: [PATCH v1] NFSD: Add a switch to disable nfsd_splice_read()

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 




> On Jan 24, 2024, at 3:34 PM, Jeff Layton <jlayton@xxxxxxxxxx> wrote:
> 
> On Tue, 2024-01-23 at 11:12 -0500, Chuck Lever wrote:
>> From: Chuck Lever <chuck.lever@xxxxxxxxxx>
>> 
>> This enables us to ensure that testing properly covers the readv
>> paths as well as the spliced read paths, which are more commonly
>> used. Also this makes it easier to do benchmark comparisons between
>> splice and vectored reads.
>> 
>> Suggested-by: Jeff Layton <jlayton@xxxxxxxxxx>
>> Signed-off-by: Chuck Lever <chuck.lever@xxxxxxxxxx>
>> ---
>> Documentation/netlink/specs/nfsd.yaml |   19 +++++++
>> fs/nfsd/netlink.c                     |   17 ++++++
>> fs/nfsd/netlink.h                     |    3 +
>> fs/nfsd/netns.h                       |    1 
>> fs/nfsd/nfsctl.c                      |   45 ++++++++++++++++
>> include/uapi/linux/nfsd_netlink.h     |    8 +++
>> tools/net/ynl/generated/nfsd-user.c   |   95 +++++++++++++++++++++++++++++++++
>> tools/net/ynl/generated/nfsd-user.h   |   47 ++++++++++++++++
>> 8 files changed, 235 insertions(+)
>> 
> 
> I think this makes sense. How are you testing it,

So far it's only been regression testing. Nothing breaks.


> and how do you forsee
> us using this interface? Will we need a new program in nfs-utils or will
> you extend an existing one?

We could add a command line option to rpc.nfsd. That doesn't
seem convenient for automated testers, though.


>> diff --git a/Documentation/netlink/specs/nfsd.yaml b/Documentation/netlink/specs/nfsd.yaml
>> index 05acc73e2e33..1a3c5e78b388 100644
>> --- a/Documentation/netlink/specs/nfsd.yaml
>> +++ b/Documentation/netlink/specs/nfsd.yaml
>> @@ -62,6 +62,12 @@ attribute-sets:
>>         name: compound-ops
>>         type: u32
>>         multi-attr: true
>> +  -
>> +    name: splice-read
>> +    attributes:
>> +      -
>> +        name: enabled
>> +        type: u32
>> 
>> operations:
>>   list:
>> @@ -87,3 +93,16 @@ operations:
>>             - sport
>>             - dport
>>             - compound-ops
>> +    -
>> +      name: splice-read
>> +      doc: Disable the use of splice for NFS READ operations
>> +      attribute-set: splice-read
>> +      flags: [ admin-perm ]
>> +      do:
>> +        request:
>> +          attributes:
>> +            - enabled
>> +      dump:
>> +        reply:
>> +          attributes:
>> +            - enabled
>> diff --git a/fs/nfsd/netlink.c b/fs/nfsd/netlink.c
>> index 0e1d635ec5f9..c47f3527d30b 100644
>> --- a/fs/nfsd/netlink.c
>> +++ b/fs/nfsd/netlink.c
>> @@ -10,6 +10,11 @@
>> 
>> #include <uapi/linux/nfsd_netlink.h>
>> 
>> +/* NFSD_CMD_SPLICE_READ - do */
>> +static const struct nla_policy nfsd_splice_read_nl_policy[NFSD_A_SPLICE_READ_ENABLED + 1] = {
>> + [NFSD_A_SPLICE_READ_ENABLED] = { .type = NLA_U32, },
>> +};
>> +
>> /* Ops table for nfsd */
>> static const struct genl_split_ops nfsd_nl_ops[] = {
>> {
>> @@ -19,6 +24,18 @@ static const struct genl_split_ops nfsd_nl_ops[] = {
>> .done = nfsd_nl_rpc_status_get_done,
>> .flags = GENL_CMD_CAP_DUMP,
>> },
>> + {
>> + .cmd = NFSD_CMD_SPLICE_READ,
>> + .doit = nfsd_nl_splice_read_doit,
>> + .policy = nfsd_splice_read_nl_policy,
>> + .maxattr = NFSD_A_SPLICE_READ_ENABLED,
>> + .flags = GENL_ADMIN_PERM | GENL_CMD_CAP_DO,
>> + },
>> + {
>> + .cmd = NFSD_CMD_SPLICE_READ,
>> + .dumpit = nfsd_nl_splice_read_dumpit,
>> + .flags = GENL_ADMIN_PERM | GENL_CMD_CAP_DUMP,
>> + },
>> };
>> 
>> struct genl_family nfsd_nl_family __ro_after_init = {
>> diff --git a/fs/nfsd/netlink.h b/fs/nfsd/netlink.h
>> index d83dd6bdee92..2d96d0f093bb 100644
>> --- a/fs/nfsd/netlink.h
>> +++ b/fs/nfsd/netlink.h
>> @@ -16,6 +16,9 @@ int nfsd_nl_rpc_status_get_done(struct netlink_callback *cb);
>> 
>> int nfsd_nl_rpc_status_get_dumpit(struct sk_buff *skb,
>>   struct netlink_callback *cb);
>> +int nfsd_nl_splice_read_doit(struct sk_buff *skb, struct genl_info *info);
>> +int nfsd_nl_splice_read_dumpit(struct sk_buff *skb,
>> +        struct netlink_callback *cb);
>> 
>> extern struct genl_family nfsd_nl_family;
>> 
>> diff --git a/fs/nfsd/netns.h b/fs/nfsd/netns.h
>> index 74b4360779a1..3b9e09fecbfc 100644
>> --- a/fs/nfsd/netns.h
>> +++ b/fs/nfsd/netns.h
>> @@ -109,6 +109,7 @@ struct nfsd_net {
>> 
>> bool nfsd_net_up;
>> bool lockd_up;
>> + bool spliced_reads;
>> 
>> seqlock_t writeverf_lock;
>> unsigned char writeverf[8];
>> diff --git a/fs/nfsd/nfsctl.c b/fs/nfsd/nfsctl.c
>> index 8e6dbe9e0b65..86f466dbc784 100644
>> --- a/fs/nfsd/nfsctl.c
>> +++ b/fs/nfsd/nfsctl.c
>> @@ -1696,6 +1696,51 @@ int nfsd_nl_rpc_status_get_done(struct netlink_callback *cb)
>> return 0;
>> }
>> 
>> +/**
>> + * nfsd_nl_splice_read_doit - Set the value of splice_read
>> + * @skb: call buffer
>> + * @info: netlink metadata and command arguments
>> + *
>> + * Returns zero on success, or a negative errno.
>> + */
>> +int nfsd_nl_splice_read_doit(struct sk_buff *skb, struct genl_info *info)
>> +{
>> + struct nfsd_net *nn = net_generic(sock_net(skb->sk), nfsd_net_id);
>> + u32 newval;
>> +
>> + if (GENL_REQ_ATTR_CHECK(info, NFSD_A_SPLICE_READ_ENABLED))
>> + return -EINVAL;
>> +
>> + newval = nla_get_u32(info->attrs[NFSD_A_SPLICE_READ_ENABLED]);
>> + nn->spliced_reads = newval ? true : false;
>> + return 0;
>> +}
>> +
>> +/**
>> + * nfsd_nl_splice_read_dumpit - Return the value of splice_read
>> + * @skb: reply buffer
>> + * @cb: netlink metadata and command arguments
>> + *
>> + * Returns the size of the reply or a negative errno.
>> + */
>> +int nfsd_nl_splice_read_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
>> +{
>> + struct nfsd_net *nn = net_generic(sock_net(skb->sk), nfsd_net_id);
>> + void *hdr;
>> +
>> + hdr = genlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
>> +   &nfsd_nl_family, 0, NFSD_CMD_SPLICE_READ);
>> + if (!hdr)
>> + return -ENOBUFS;
>> +
>> + if (nla_put_s32(skb, NFSD_A_SPLICE_READ_ENABLED,
>> + (nn->spliced_reads ? 1 : 0)))
>> + return -ENOBUFS;
>> +
>> + genlmsg_end(skb, hdr);
>> + return 0;
>> +}
>> +
>> /**
>>  * nfsd_net_init - Prepare the nfsd_net portion of a new net namespace
>>  * @net: a freshly-created network namespace
>> diff --git a/include/uapi/linux/nfsd_netlink.h b/include/uapi/linux/nfsd_netlink.h
>> index 3cd044edee5d..c2542ed18b50 100644
>> --- a/include/uapi/linux/nfsd_netlink.h
>> +++ b/include/uapi/linux/nfsd_netlink.h
>> @@ -29,8 +29,16 @@ enum {
>> NFSD_A_RPC_STATUS_MAX = (__NFSD_A_RPC_STATUS_MAX - 1)
>> };
>> 
>> +enum {
>> + NFSD_A_SPLICE_READ_ENABLED = 1,
>> +
>> + __NFSD_A_SPLICE_READ_MAX,
>> + NFSD_A_SPLICE_READ_MAX = (__NFSD_A_SPLICE_READ_MAX - 1)
>> +};
>> +
>> enum {
>> NFSD_CMD_RPC_STATUS_GET = 1,
>> + NFSD_CMD_SPLICE_READ,
>> 
>> __NFSD_CMD_MAX,
>> NFSD_CMD_MAX = (__NFSD_CMD_MAX - 1)
>> diff --git a/tools/net/ynl/generated/nfsd-user.c b/tools/net/ynl/generated/nfsd-user.c
>> index 360b6448c6e9..14957bdfbe9c 100644
>> --- a/tools/net/ynl/generated/nfsd-user.c
>> +++ b/tools/net/ynl/generated/nfsd-user.c
>> @@ -15,6 +15,7 @@
>> /* Enums */
>> static const char * const nfsd_op_strmap[] = {
>> [NFSD_CMD_RPC_STATUS_GET] = "rpc-status-get",
>> + [NFSD_CMD_SPLICE_READ] = "splice-read",
>> };
>> 
>> const char *nfsd_op_str(int op)
>> @@ -47,6 +48,15 @@ struct ynl_policy_nest nfsd_rpc_status_nest = {
>> .table = nfsd_rpc_status_policy,
>> };
>> 
>> +struct ynl_policy_attr nfsd_splice_read_policy[NFSD_A_SPLICE_READ_MAX + 1] = {
>> + [NFSD_A_SPLICE_READ_ENABLED] = { .name = "enabled", .type = YNL_PT_U32, },
>> +};
>> +
>> +struct ynl_policy_nest nfsd_splice_read_nest = {
>> + .max_attr = NFSD_A_SPLICE_READ_MAX,
>> + .table = nfsd_splice_read_policy,
>> +};
>> +
>> /* Common nested types */
>> /* ============== NFSD_CMD_RPC_STATUS_GET ============== */
>> /* NFSD_CMD_RPC_STATUS_GET - dump */
>> @@ -198,6 +208,91 @@ nfsd_rpc_status_get_dump(struct ynl_sock *ys)
>> return NULL;
>> }
>> 
>> +/* ============== NFSD_CMD_SPLICE_READ ============== */
>> +/* NFSD_CMD_SPLICE_READ - do */
>> +void nfsd_splice_read_req_free(struct nfsd_splice_read_req *req)
>> +{
>> + free(req);
>> +}
>> +
>> +int nfsd_splice_read(struct ynl_sock *ys, struct nfsd_splice_read_req *req)
>> +{
>> + struct nlmsghdr *nlh;
>> + int err;
>> +
>> + nlh = ynl_gemsg_start_req(ys, ys->family_id, NFSD_CMD_SPLICE_READ, 1);
>> + ys->req_policy = &nfsd_splice_read_nest;
>> +
>> + if (req->_present.enabled)
>> + mnl_attr_put_u32(nlh, NFSD_A_SPLICE_READ_ENABLED, req->enabled);
>> +
>> + err = ynl_exec(ys, nlh, NULL);
>> + if (err < 0)
>> + return -1;
>> +
>> + return 0;
>> +}
>> +
>> +/* NFSD_CMD_SPLICE_READ - dump */
>> +int nfsd_splice_read_rsp_dump_parse(const struct nlmsghdr *nlh, void *data)
>> +{
>> + struct nfsd_splice_read_rsp_dump *dst;
>> + struct ynl_parse_arg *yarg = data;
>> + const struct nlattr *attr;
>> +
>> + dst = yarg->data;
>> +
>> + mnl_attr_for_each(attr, nlh, sizeof(struct genlmsghdr)) {
>> + unsigned int type = mnl_attr_get_type(attr);
>> +
>> + if (type == NFSD_A_SPLICE_READ_ENABLED) {
>> + if (ynl_attr_validate(yarg, attr))
>> + return MNL_CB_ERROR;
>> + dst->_present.enabled = 1;
>> + dst->enabled = mnl_attr_get_u32(attr);
>> + }
>> + }
>> +
>> + return MNL_CB_OK;
>> +}
>> +
>> +void nfsd_splice_read_rsp_list_free(struct nfsd_splice_read_rsp_list *rsp)
>> +{
>> + struct nfsd_splice_read_rsp_list *next = rsp;
>> +
>> + while ((void *)next != YNL_LIST_END) {
>> + rsp = next;
>> + next = rsp->next;
>> +
>> + free(rsp);
>> + }
>> +}
>> +
>> +struct nfsd_splice_read_rsp_list *nfsd_splice_read_dump(struct ynl_sock *ys)
>> +{
>> + struct ynl_dump_state yds = {};
>> + struct nlmsghdr *nlh;
>> + int err;
>> +
>> + yds.ys = ys;
>> + yds.alloc_sz = sizeof(struct nfsd_splice_read_rsp_list);
>> + yds.cb = nfsd_splice_read_rsp_dump_parse;
>> + yds.rsp_cmd = NFSD_CMD_SPLICE_READ;
>> + yds.rsp_policy = &nfsd_splice_read_nest;
>> +
>> + nlh = ynl_gemsg_start_dump(ys, ys->family_id, NFSD_CMD_SPLICE_READ, 1);
>> +
>> + err = ynl_exec_dump(ys, nlh, &yds);
>> + if (err < 0)
>> + goto free_list;
>> +
>> + return yds.first;
>> +
>> +free_list:
>> + nfsd_splice_read_rsp_list_free(yds.first);
>> + return NULL;
>> +}
>> +
>> const struct ynl_family ynl_nfsd_family =  {
>> .name = "nfsd",
>> };
>> diff --git a/tools/net/ynl/generated/nfsd-user.h b/tools/net/ynl/generated/nfsd-user.h
>> index 989c6e209ced..5732c5a665e7 100644
>> --- a/tools/net/ynl/generated/nfsd-user.h
>> +++ b/tools/net/ynl/generated/nfsd-user.h
>> @@ -64,4 +64,51 @@ nfsd_rpc_status_get_rsp_list_free(struct nfsd_rpc_status_get_rsp_list *rsp);
>> struct nfsd_rpc_status_get_rsp_list *
>> nfsd_rpc_status_get_dump(struct ynl_sock *ys);
>> 
>> +/* ============== NFSD_CMD_SPLICE_READ ============== */
>> +/* NFSD_CMD_SPLICE_READ - do */
>> +struct nfsd_splice_read_req {
>> + struct {
>> + __u32 enabled:1;
>> + } _present;
>> +
>> + __u32 enabled;
>> +};
>> +
>> +static inline struct nfsd_splice_read_req *nfsd_splice_read_req_alloc(void)
>> +{
>> + return calloc(1, sizeof(struct nfsd_splice_read_req));
>> +}
>> +void nfsd_splice_read_req_free(struct nfsd_splice_read_req *req);
>> +
>> +static inline void
>> +nfsd_splice_read_req_set_enabled(struct nfsd_splice_read_req *req,
>> +  __u32 enabled)
>> +{
>> + req->_present.enabled = 1;
>> + req->enabled = enabled;
>> +}
>> +
>> +/*
>> + * Disable the use of splice for NFS READ operations
>> + */
>> +int nfsd_splice_read(struct ynl_sock *ys, struct nfsd_splice_read_req *req);
>> +
>> +/* NFSD_CMD_SPLICE_READ - dump */
>> +struct nfsd_splice_read_rsp_dump {
>> + struct {
>> + __u32 enabled:1;
>> + } _present;
>> +
>> + __u32 enabled;
>> +};
>> +
>> +struct nfsd_splice_read_rsp_list {
>> + struct nfsd_splice_read_rsp_list *next;
>> + struct nfsd_splice_read_rsp_dump obj __attribute__ ((aligned (8)));
>> +};
>> +
>> +void nfsd_splice_read_rsp_list_free(struct nfsd_splice_read_rsp_list *rsp);
>> +
>> +struct nfsd_splice_read_rsp_list *nfsd_splice_read_dump(struct ynl_sock *ys);
>> +
>> #endif /* _LINUX_NFSD_GEN_H */
>> 
>> 
>> 
> 
> -- 
> Jeff Layton <jlayton@xxxxxxxxxx>


--
Chuck Lever






[Index of Archives]     [Linux Filesystem Development]     [Linux USB Development]     [Linux Media Development]     [Video for Linux]     [Linux NILFS]     [Linux Audio Users]     [Yosemite Info]     [Linux SCSI]

  Powered by Linux