Re: [PATCH v1] NFSD: Add a switch to disable nfsd_splice_read()

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 




> On Jan 24, 2024, at 5:26 PM, Jeff Layton <jlayton@xxxxxxxxxx> wrote:
> 
> On Wed, 2024-01-24 at 21:56 +0000, Chuck Lever III wrote:
>> 
>>> On Jan 24, 2024, at 3:34 PM, Jeff Layton <jlayton@xxxxxxxxxx> wrote:
>>> 
>>> On Tue, 2024-01-23 at 11:12 -0500, Chuck Lever wrote:
>>>> From: Chuck Lever <chuck.lever@xxxxxxxxxx>
>>>> 
>>>> This enables us to ensure that testing properly covers the readv
>>>> paths as well as the spliced read paths, which are more commonly
>>>> used. Also this makes it easier to do benchmark comparisons between
>>>> splice and vectored reads.
>>>> 
>>>> Suggested-by: Jeff Layton <jlayton@xxxxxxxxxx>
>>>> Signed-off-by: Chuck Lever <chuck.lever@xxxxxxxxxx>
>>>> ---
>>>> Documentation/netlink/specs/nfsd.yaml |   19 +++++++
>>>> fs/nfsd/netlink.c                     |   17 ++++++
>>>> fs/nfsd/netlink.h                     |    3 +
>>>> fs/nfsd/netns.h                       |    1 
>>>> fs/nfsd/nfsctl.c                      |   45 ++++++++++++++++
>>>> include/uapi/linux/nfsd_netlink.h     |    8 +++
>>>> tools/net/ynl/generated/nfsd-user.c   |   95 +++++++++++++++++++++++++++++++++
>>>> tools/net/ynl/generated/nfsd-user.h   |   47 ++++++++++++++++
>>>> 8 files changed, 235 insertions(+)
>>>> 
>>> 
>>> I think this makes sense. How are you testing it,
>> 
>> So far it's only been regression testing. Nothing breaks.
>> 
>> 
>>> and how do you foresee
>>> us using this interface? Will we need a new program in nfs-utils or will
>>> you extend an existing one?
>> 
>> We could add a command line option to rpc.nfsd. That doesn't
>> seem convenient for automated testers, though.
>> 
> 
> It's starting to feel like we ought to create a new nfsdctl program or
> something. It could dump the new stats and allow you to twiddle knobs
> like this one.

I thought Lorenzo had one already? I agree, switching to vectored
reads sounds like something that tool should handle.


> Maybe we could teach it to start up and shut down the
> server too so it eventually could replace rpc.nfsd?
> 
> That might be simpler than plumbing netlink support into rpc.nfsd.
> 
>> 
>>>> diff --git a/Documentation/netlink/specs/nfsd.yaml b/Documentation/netlink/specs/nfsd.yaml
>>>> index 05acc73e2e33..1a3c5e78b388 100644
>>>> --- a/Documentation/netlink/specs/nfsd.yaml
>>>> +++ b/Documentation/netlink/specs/nfsd.yaml
>>>> @@ -62,6 +62,12 @@ attribute-sets:
>>>>        name: compound-ops
>>>>        type: u32
>>>>        multi-attr: true
>>>> +  -
>>>> +    name: splice-read
>>>> +    attributes:
>>>> +      -
>>>> +        name: enabled
>>>> +        type: u32
>>>> 
>>>> operations:
>>>>  list:
>>>> @@ -87,3 +93,16 @@ operations:
>>>>            - sport
>>>>            - dport
>>>>            - compound-ops
>>>> +    -
>>>> +      name: splice-read
>>>> +      doc: Disable the use of splice for NFS READ operations
>>>> +      attribute-set: splice-read
>>>> +      flags: [ admin-perm ]
>>>> +      do:
>>>> +        request:
>>>> +          attributes:
>>>> +            - enabled
>>>> +      dump:
>>>> +        reply:
>>>> +          attributes:
>>>> +            - enabled
>>>> diff --git a/fs/nfsd/netlink.c b/fs/nfsd/netlink.c
>>>> index 0e1d635ec5f9..c47f3527d30b 100644
>>>> --- a/fs/nfsd/netlink.c
>>>> +++ b/fs/nfsd/netlink.c
>>>> @@ -10,6 +10,11 @@
>>>> 
>>>> #include <uapi/linux/nfsd_netlink.h>
>>>> 
>>>> +/* NFSD_CMD_SPLICE_READ - do */
>>>> +static const struct nla_policy nfsd_splice_read_nl_policy[NFSD_A_SPLICE_READ_ENABLED + 1] = {
>>>> + [NFSD_A_SPLICE_READ_ENABLED] = { .type = NLA_U32, },
>>>> +};
>>>> +
>>>> /* Ops table for nfsd */
>>>> static const struct genl_split_ops nfsd_nl_ops[] = {
>>>> {
>>>> @@ -19,6 +24,18 @@ static const struct genl_split_ops nfsd_nl_ops[] = {
>>>> .done = nfsd_nl_rpc_status_get_done,
>>>> .flags = GENL_CMD_CAP_DUMP,
>>>> },
>>>> + {
>>>> + .cmd = NFSD_CMD_SPLICE_READ,
>>>> + .doit = nfsd_nl_splice_read_doit,
>>>> + .policy = nfsd_splice_read_nl_policy,
>>>> + .maxattr = NFSD_A_SPLICE_READ_ENABLED,
>>>> + .flags = GENL_ADMIN_PERM | GENL_CMD_CAP_DO,
>>>> + },
>>>> + {
>>>> + .cmd = NFSD_CMD_SPLICE_READ,
>>>> + .dumpit = nfsd_nl_splice_read_dumpit,
>>>> + .flags = GENL_ADMIN_PERM | GENL_CMD_CAP_DUMP,
>>>> + },
>>>> };
>>>> 
>>>> struct genl_family nfsd_nl_family __ro_after_init = {
>>>> diff --git a/fs/nfsd/netlink.h b/fs/nfsd/netlink.h
>>>> index d83dd6bdee92..2d96d0f093bb 100644
>>>> --- a/fs/nfsd/netlink.h
>>>> +++ b/fs/nfsd/netlink.h
>>>> @@ -16,6 +16,9 @@ int nfsd_nl_rpc_status_get_done(struct netlink_callback *cb);
>>>> 
>>>> int nfsd_nl_rpc_status_get_dumpit(struct sk_buff *skb,
>>>>  struct netlink_callback *cb);
>>>> +int nfsd_nl_splice_read_doit(struct sk_buff *skb, struct genl_info *info);
>>>> +int nfsd_nl_splice_read_dumpit(struct sk_buff *skb,
>>>> +        struct netlink_callback *cb);
>>>> 
>>>> extern struct genl_family nfsd_nl_family;
>>>> 
>>>> diff --git a/fs/nfsd/netns.h b/fs/nfsd/netns.h
>>>> index 74b4360779a1..3b9e09fecbfc 100644
>>>> --- a/fs/nfsd/netns.h
>>>> +++ b/fs/nfsd/netns.h
>>>> @@ -109,6 +109,7 @@ struct nfsd_net {
>>>> 
>>>> bool nfsd_net_up;
>>>> bool lockd_up;
>>>> + bool spliced_reads;
>>>> 
>>>> seqlock_t writeverf_lock;
>>>> unsigned char writeverf[8];
>>>> diff --git a/fs/nfsd/nfsctl.c b/fs/nfsd/nfsctl.c
>>>> index 8e6dbe9e0b65..86f466dbc784 100644
>>>> --- a/fs/nfsd/nfsctl.c
>>>> +++ b/fs/nfsd/nfsctl.c
>>>> @@ -1696,6 +1696,51 @@ int nfsd_nl_rpc_status_get_done(struct netlink_callback *cb)
>>>> return 0;
>>>> }
>>>> 
>>>> +/**
>>>> + * nfsd_nl_splice_read_doit - Set the value of splice_read
>>>> + * @skb: call buffer
>>>> + * @info: netlink metadata and command arguments
>>>> + *
>>>> + * Returns zero on success, or a negative errno.
>>>> + */
>>>> +int nfsd_nl_splice_read_doit(struct sk_buff *skb, struct genl_info *info)
>>>> +{
>>>> + struct nfsd_net *nn = net_generic(sock_net(skb->sk), nfsd_net_id);
>>>> + u32 newval;
>>>> +
>>>> + if (GENL_REQ_ATTR_CHECK(info, NFSD_A_SPLICE_READ_ENABLED))
>>>> + return -EINVAL;
>>>> +
>>>> + newval = nla_get_u32(info->attrs[NFSD_A_SPLICE_READ_ENABLED]);
>>>> + nn->spliced_reads = newval ? true : false;
>>>> + return 0;
>>>> +}
>>>> +
>>>> +/**
>>>> + * nfsd_nl_splice_read_dumpit - Return the value of splice_read
>>>> + * @skb: reply buffer
>>>> + * @cb: netlink metadata and command arguments
>>>> + *
>>>> + * Returns zero on success, or a negative errno.
>>>> + */
>>>> +int nfsd_nl_splice_read_dumpit(struct sk_buff *skb, struct netlink_callback *cb)
>>>> +{
>>>> + struct nfsd_net *nn = net_generic(sock_net(skb->sk), nfsd_net_id);
>>>> + void *hdr;
>>>> +
>>>> + hdr = genlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
>>>> +   &nfsd_nl_family, 0, NFSD_CMD_SPLICE_READ);
>>>> + if (!hdr)
>>>> + return -ENOBUFS;
>>>> +
>>>> + if (nla_put_s32(skb, NFSD_A_SPLICE_READ_ENABLED,
>>>> + (nn->spliced_reads ? 1 : 0)))
>>>> + return -ENOBUFS;
>>>> +
>>>> + genlmsg_end(skb, hdr);
>>>> + return 0;
>>>> +}
>>>> +
>>>> /**
>>>> * nfsd_net_init - Prepare the nfsd_net portion of a new net namespace
>>>> * @net: a freshly-created network namespace
>>>> diff --git a/include/uapi/linux/nfsd_netlink.h b/include/uapi/linux/nfsd_netlink.h
>>>> index 3cd044edee5d..c2542ed18b50 100644
>>>> --- a/include/uapi/linux/nfsd_netlink.h
>>>> +++ b/include/uapi/linux/nfsd_netlink.h
>>>> @@ -29,8 +29,16 @@ enum {
>>>> NFSD_A_RPC_STATUS_MAX = (__NFSD_A_RPC_STATUS_MAX - 1)
>>>> };
>>>> 
>>>> +enum {
>>>> + NFSD_A_SPLICE_READ_ENABLED = 1,
>>>> +
>>>> + __NFSD_A_SPLICE_READ_MAX,
>>>> + NFSD_A_SPLICE_READ_MAX = (__NFSD_A_SPLICE_READ_MAX - 1)
>>>> +};
>>>> +
>>>> enum {
>>>> NFSD_CMD_RPC_STATUS_GET = 1,
>>>> + NFSD_CMD_SPLICE_READ,
>>>> 
>>>> __NFSD_CMD_MAX,
>>>> NFSD_CMD_MAX = (__NFSD_CMD_MAX - 1)
>>>> diff --git a/tools/net/ynl/generated/nfsd-user.c b/tools/net/ynl/generated/nfsd-user.c
>>>> index 360b6448c6e9..14957bdfbe9c 100644
>>>> --- a/tools/net/ynl/generated/nfsd-user.c
>>>> +++ b/tools/net/ynl/generated/nfsd-user.c
>>>> @@ -15,6 +15,7 @@
>>>> /* Enums */
>>>> static const char * const nfsd_op_strmap[] = {
>>>> [NFSD_CMD_RPC_STATUS_GET] = "rpc-status-get",
>>>> + [NFSD_CMD_SPLICE_READ] = "splice-read",
>>>> };
>>>> 
>>>> const char *nfsd_op_str(int op)
>>>> @@ -47,6 +48,15 @@ struct ynl_policy_nest nfsd_rpc_status_nest = {
>>>> .table = nfsd_rpc_status_policy,
>>>> };
>>>> 
>>>> +struct ynl_policy_attr nfsd_splice_read_policy[NFSD_A_SPLICE_READ_MAX + 1] = {
>>>> + [NFSD_A_SPLICE_READ_ENABLED] = { .name = "enabled", .type = YNL_PT_U32, },
>>>> +};
>>>> +
>>>> +struct ynl_policy_nest nfsd_splice_read_nest = {
>>>> + .max_attr = NFSD_A_SPLICE_READ_MAX,
>>>> + .table = nfsd_splice_read_policy,
>>>> +};
>>>> +
>>>> /* Common nested types */
>>>> /* ============== NFSD_CMD_RPC_STATUS_GET ============== */
>>>> /* NFSD_CMD_RPC_STATUS_GET - dump */
>>>> @@ -198,6 +208,91 @@ nfsd_rpc_status_get_dump(struct ynl_sock *ys)
>>>> return NULL;
>>>> }
>>>> 
>>>> +/* ============== NFSD_CMD_SPLICE_READ ============== */
>>>> +/* NFSD_CMD_SPLICE_READ - do */
>>>> +void nfsd_splice_read_req_free(struct nfsd_splice_read_req *req)
>>>> +{
>>>> + free(req);
>>>> +}
>>>> +
>>>> +int nfsd_splice_read(struct ynl_sock *ys, struct nfsd_splice_read_req *req)
>>>> +{
>>>> + struct nlmsghdr *nlh;
>>>> + int err;
>>>> +
>>>> + nlh = ynl_gemsg_start_req(ys, ys->family_id, NFSD_CMD_SPLICE_READ, 1);
>>>> + ys->req_policy = &nfsd_splice_read_nest;
>>>> +
>>>> + if (req->_present.enabled)
>>>> + mnl_attr_put_u32(nlh, NFSD_A_SPLICE_READ_ENABLED, req->enabled);
>>>> +
>>>> + err = ynl_exec(ys, nlh, NULL);
>>>> + if (err < 0)
>>>> + return -1;
>>>> +
>>>> + return 0;
>>>> +}
>>>> +
>>>> +/* NFSD_CMD_SPLICE_READ - dump */
>>>> +int nfsd_splice_read_rsp_dump_parse(const struct nlmsghdr *nlh, void *data)
>>>> +{
>>>> + struct nfsd_splice_read_rsp_dump *dst;
>>>> + struct ynl_parse_arg *yarg = data;
>>>> + const struct nlattr *attr;
>>>> +
>>>> + dst = yarg->data;
>>>> +
>>>> + mnl_attr_for_each(attr, nlh, sizeof(struct genlmsghdr)) {
>>>> + unsigned int type = mnl_attr_get_type(attr);
>>>> +
>>>> + if (type == NFSD_A_SPLICE_READ_ENABLED) {
>>>> + if (ynl_attr_validate(yarg, attr))
>>>> + return MNL_CB_ERROR;
>>>> + dst->_present.enabled = 1;
>>>> + dst->enabled = mnl_attr_get_u32(attr);
>>>> + }
>>>> + }
>>>> +
>>>> + return MNL_CB_OK;
>>>> +}
>>>> +
>>>> +void nfsd_splice_read_rsp_list_free(struct nfsd_splice_read_rsp_list *rsp)
>>>> +{
>>>> + struct nfsd_splice_read_rsp_list *next = rsp;
>>>> +
>>>> + while ((void *)next != YNL_LIST_END) {
>>>> + rsp = next;
>>>> + next = rsp->next;
>>>> +
>>>> + free(rsp);
>>>> + }
>>>> +}
>>>> +
>>>> +struct nfsd_splice_read_rsp_list *nfsd_splice_read_dump(struct ynl_sock *ys)
>>>> +{
>>>> + struct ynl_dump_state yds = {};
>>>> + struct nlmsghdr *nlh;
>>>> + int err;
>>>> +
>>>> + yds.ys = ys;
>>>> + yds.alloc_sz = sizeof(struct nfsd_splice_read_rsp_list);
>>>> + yds.cb = nfsd_splice_read_rsp_dump_parse;
>>>> + yds.rsp_cmd = NFSD_CMD_SPLICE_READ;
>>>> + yds.rsp_policy = &nfsd_splice_read_nest;
>>>> +
>>>> + nlh = ynl_gemsg_start_dump(ys, ys->family_id, NFSD_CMD_SPLICE_READ, 1);
>>>> +
>>>> + err = ynl_exec_dump(ys, nlh, &yds);
>>>> + if (err < 0)
>>>> + goto free_list;
>>>> +
>>>> + return yds.first;
>>>> +
>>>> +free_list:
>>>> + nfsd_splice_read_rsp_list_free(yds.first);
>>>> + return NULL;
>>>> +}
>>>> +
>>>> const struct ynl_family ynl_nfsd_family =  {
>>>> .name = "nfsd",
>>>> };
>>>> diff --git a/tools/net/ynl/generated/nfsd-user.h b/tools/net/ynl/generated/nfsd-user.h
>>>> index 989c6e209ced..5732c5a665e7 100644
>>>> --- a/tools/net/ynl/generated/nfsd-user.h
>>>> +++ b/tools/net/ynl/generated/nfsd-user.h
>>>> @@ -64,4 +64,51 @@ nfsd_rpc_status_get_rsp_list_free(struct nfsd_rpc_status_get_rsp_list *rsp);
>>>> struct nfsd_rpc_status_get_rsp_list *
>>>> nfsd_rpc_status_get_dump(struct ynl_sock *ys);
>>>> 
>>>> +/* ============== NFSD_CMD_SPLICE_READ ============== */
>>>> +/* NFSD_CMD_SPLICE_READ - do */
>>>> +struct nfsd_splice_read_req {
>>>> + struct {
>>>> + __u32 enabled:1;
>>>> + } _present;
>>>> +
>>>> + __u32 enabled;
>>>> +};
>>>> +
>>>> +static inline struct nfsd_splice_read_req *nfsd_splice_read_req_alloc(void)
>>>> +{
>>>> + return calloc(1, sizeof(struct nfsd_splice_read_req));
>>>> +}
>>>> +void nfsd_splice_read_req_free(struct nfsd_splice_read_req *req);
>>>> +
>>>> +static inline void
>>>> +nfsd_splice_read_req_set_enabled(struct nfsd_splice_read_req *req,
>>>> +  __u32 enabled)
>>>> +{
>>>> + req->_present.enabled = 1;
>>>> + req->enabled = enabled;
>>>> +}
>>>> +
>>>> +/*
>>>> + * Disable the use of splice for NFS READ operations
>>>> + */
>>>> +int nfsd_splice_read(struct ynl_sock *ys, struct nfsd_splice_read_req *req);
>>>> +
>>>> +/* NFSD_CMD_SPLICE_READ - dump */
>>>> +struct nfsd_splice_read_rsp_dump {
>>>> + struct {
>>>> + __u32 enabled:1;
>>>> + } _present;
>>>> +
>>>> + __u32 enabled;
>>>> +};
>>>> +
>>>> +struct nfsd_splice_read_rsp_list {
>>>> + struct nfsd_splice_read_rsp_list *next;
>>>> + struct nfsd_splice_read_rsp_dump obj __attribute__ ((aligned (8)));
>>>> +};
>>>> +
>>>> +void nfsd_splice_read_rsp_list_free(struct nfsd_splice_read_rsp_list *rsp);
>>>> +
>>>> +struct nfsd_splice_read_rsp_list *nfsd_splice_read_dump(struct ynl_sock *ys);
>>>> +
>>>> #endif /* _LINUX_NFSD_GEN_H */
>>>> 
>>>> 
>>>> 
>>> 
>>> -- 
>>> Jeff Layton <jlayton@xxxxxxxxxx>
>> 
>> 
>> --
>> Chuck Lever
>> 
>> 
> 
> -- 
> Jeff Layton <jlayton@xxxxxxxxxx>


--
Chuck Lever






[Index of Archives]     [Linux Filesystem Development]     [Linux USB Development]     [Linux Media Development]     [Video for Linux]     [Linux NILFS]     [Linux Audio Users]     [Yosemite Info]     [Linux SCSI]

  Powered by Linux