Re: [PATCHv3 2/2] IPVS: Add genetlink interface implementation

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Fri, 8 Aug 2008, Julius Volz wrote:

> This still had two bugs:
> - policies for IPVS_DEST_ATTR_FWD_METHOD and IPVS_SVC_ATTR_FLAGS
>   were swapped
> - svc not initialized to NULL at the beginning of ip_vs_genl_set_cmd()
> 
> The version below fixes this:
> 
> ----
> Add the implementation of the new Generic Netlink interface to IPVS and
> keep the old set/getsockopt interface for userspace backwards
> compatibility.
> 
> Signed-off-by: Julius Volz <juliusv@xxxxxxxxxx>
> 
>  1 files changed, 880 insertions(+), 0 deletions(-)
> 
> diff --git a/net/ipv4/ipvs/ip_vs_ctl.c b/net/ipv4/ipvs/ip_vs_ctl.c
> index 9a5ace0..8038420 100644
> --- a/net/ipv4/ipvs/ip_vs_ctl.c
> +++ b/net/ipv4/ipvs/ip_vs_ctl.c
> @@ -37,6 +37,7 @@
>  #include <net/ip.h>
>  #include <net/route.h>
>  #include <net/sock.h>
> +#include <net/genetlink.h>
>  
>  #include <asm/uaccess.h>
>  
> @@ -2305,6 +2306,877 @@ static struct nf_sockopt_ops ip_vs_sockopts = {
>  	.owner		= THIS_MODULE,
>  };
>  
> +/*
> + * Generic Netlink interface
> + */
> +
> +/* IPVS genetlink family */
> +static struct genl_family ip_vs_genl_family = {
> +	.id		= GENL_ID_GENERATE,
> +	.hdrsize	= 0,
> +	.name		= IPVS_GENL_NAME,
> +	.version	= IPVS_GENL_VERSION,
> +	.maxattr	= IPVS_CMD_MAX,
> +};
> +
> +/* Policy used for first-level command attributes */
> +static const struct nla_policy ip_vs_cmd_policy[IPVS_CMD_ATTR_MAX + 1] = {
> +	[IPVS_CMD_ATTR_SERVICE]		= { .type = NLA_NESTED },
> +	[IPVS_CMD_ATTR_DEST]		= { .type = NLA_NESTED },
> +	[IPVS_CMD_ATTR_DAEMON]		= { .type = NLA_NESTED },
> +	[IPVS_CMD_ATTR_TIMEOUT_TCP]	= { .type = NLA_U32 },
> +	[IPVS_CMD_ATTR_TIMEOUT_TCP_FIN]	= { .type = NLA_U32 },
> +	[IPVS_CMD_ATTR_TIMEOUT_UDP]	= { .type = NLA_U32 },
> +};
> +
> +/* Policy used for attributes in nested attribute IPVS_CMD_ATTR_DAEMON */
> +static const struct nla_policy ip_vs_daemon_policy[IPVS_DAEMON_ATTR_MAX + 1] = {
> +	[IPVS_DAEMON_ATTR_STATE]	= { .type = NLA_U32 },
> +	[IPVS_DAEMON_ATTR_MCAST_IFN]	= { .type = NLA_NUL_STRING,
> +					    .len = IP_VS_IFNAME_MAXLEN },
> +	[IPVS_DAEMON_ATTR_SYNC_ID]	= { .type = NLA_U32 },
> +};
> +
> +/* Policy used for attributes in nested attribute IPVS_CMD_ATTR_SERVICE */
> +static const struct nla_policy ip_vs_svc_policy[IPVS_SVC_ATTR_MAX + 1] = {
> +	[IPVS_SVC_ATTR_AF]		= { .type = NLA_U16 },
> +	[IPVS_SVC_ATTR_PROTOCOL]	= { .type = NLA_U16 },
> +	[IPVS_SVC_ATTR_ADDR]		= { .type = NLA_BINARY,
> +					    .len = sizeof(union nf_inet_addr) },
> +	[IPVS_SVC_ATTR_PORT]		= { .type = NLA_U16 },
> +	[IPVS_SVC_ATTR_FWMARK]		= { .type = NLA_U32 },
> +	[IPVS_SVC_ATTR_SCHED_NAME]	= { .type = NLA_NUL_STRING,
> +					    .len = IP_VS_SCHEDNAME_MAXLEN },
> +	[IPVS_SVC_ATTR_FLAGS]		= { .type = NLA_BINARY,
> +					    .len = sizeof(struct ip_vs_flags) },
> +	[IPVS_SVC_ATTR_TIMEOUT]		= { .type = NLA_U32 },
> +	[IPVS_SVC_ATTR_NETMASK]		= { .type = NLA_U32 },
> +	[IPVS_SVC_ATTR_STATS]		= { .type = NLA_NESTED },
> +};
> +
> +/* Policy used for attributes in nested attribute IPVS_CMD_ATTR_DEST */
> +static const struct nla_policy ip_vs_dest_policy[IPVS_DEST_ATTR_MAX + 1] = {
> +	[IPVS_DEST_ATTR_ADDR]		= { .type = NLA_BINARY,
> +					    .len = sizeof(union nf_inet_addr) },
> +	[IPVS_DEST_ATTR_PORT]		= { .type = NLA_U16 },
> +	[IPVS_DEST_ATTR_FWD_METHOD]	= { .type = NLA_U32 },
> +	[IPVS_DEST_ATTR_WEIGHT]		= { .type = NLA_U32 },
> +	[IPVS_DEST_ATTR_U_THRESH]	= { .type = NLA_U32 },
> +	[IPVS_DEST_ATTR_L_THRESH]	= { .type = NLA_U32 },
> +	[IPVS_DEST_ATTR_ACTIVE_CONNS]	= { .type = NLA_U32 },
> +	[IPVS_DEST_ATTR_INACT_CONNS]	= { .type = NLA_U32 },
> +	[IPVS_DEST_ATTR_PERSIST_CONNS]	= { .type = NLA_U32 },
> +	[IPVS_DEST_ATTR_STATS]		= { .type = NLA_NESTED },
> +};
> +
> +static int ip_vs_genl_fill_stats(struct sk_buff *skb, int container_type,
> +				 struct ip_vs_stats *stats)
> +{
> +	struct nlattr *nl_stats = nla_nest_start(skb, container_type);
> +	if (!nl_stats)
> +		return -EMSGSIZE;
> +
> +	spin_lock_bh(&stats->lock);
> +
> +	NLA_PUT_U32(skb, IPVS_STATS_ATTR_CONNS, stats->conns);
> +	NLA_PUT_U32(skb, IPVS_STATS_ATTR_INPKTS, stats->inpkts);
> +	NLA_PUT_U32(skb, IPVS_STATS_ATTR_OUTPKTS, stats->outpkts);
> +	NLA_PUT_U64(skb, IPVS_STATS_ATTR_INBYTES, stats->inbytes);
> +	NLA_PUT_U64(skb, IPVS_STATS_ATTR_OUTBYTES, stats->outbytes);
> +	NLA_PUT_U32(skb, IPVS_STATS_ATTR_CPS, stats->cps);
> +	NLA_PUT_U32(skb, IPVS_STATS_ATTR_INPPS, stats->inpps);
> +	NLA_PUT_U32(skb, IPVS_STATS_ATTR_OUTPPS, stats->outpps);
> +	NLA_PUT_U32(skb, IPVS_STATS_ATTR_INBPS, stats->inbps);
> +	NLA_PUT_U32(skb, IPVS_STATS_ATTR_OUTBPS, stats->outbps);
> +
> +	spin_unlock_bh(&stats->lock);
> +
> +	nla_nest_end(skb, nl_stats);
> +
> +	return 0;
> +
> +nla_put_failure:
> +	spin_unlock_bh(&stats->lock);
> +	nla_nest_cancel(skb, nl_stats);
> +	return -EMSGSIZE;
> +}
> +
> +static int ip_vs_genl_fill_service(struct sk_buff *skb,
> +				   struct ip_vs_service *svc)
> +{
> +	struct nlattr *nl_service;
> +	struct ip_vs_flags flags = { .flags = svc->flags,
> +				     .mask = ~0 };
> +
> +	nl_service = nla_nest_start(skb, IPVS_CMD_ATTR_SERVICE);
> +	if (!nl_service)
> +		return -EMSGSIZE;
> +
> +	NLA_PUT_U16(skb, IPVS_SVC_ATTR_AF, AF_INET);
> +
> +	if (svc->fwmark) {
> +		NLA_PUT_U32(skb, IPVS_SVC_ATTR_FWMARK, svc->fwmark);
> +	} else {
> +		NLA_PUT_U16(skb, IPVS_SVC_ATTR_PROTOCOL, svc->protocol);
> +		NLA_PUT(skb, IPVS_SVC_ATTR_ADDR, sizeof(svc->addr), &svc->addr);
> +		NLA_PUT_U16(skb, IPVS_SVC_ATTR_PORT, svc->port);
> +	}
> +
> +	NLA_PUT_STRING(skb, IPVS_SVC_ATTR_SCHED_NAME, svc->scheduler->name);
> +	NLA_PUT(skb, IPVS_SVC_ATTR_FLAGS, sizeof(flags), &flags);
> +	NLA_PUT_U32(skb, IPVS_SVC_ATTR_TIMEOUT, svc->timeout / HZ);
> +	NLA_PUT_U32(skb, IPVS_SVC_ATTR_NETMASK, svc->netmask);
> +
> +	if (ip_vs_genl_fill_stats(skb, IPVS_SVC_ATTR_STATS, &svc->stats))
> +		goto nla_put_failure;
> +
> +	nla_nest_end(skb, nl_service);
> +
> +	return 0;
> +
> +nla_put_failure:
> +	nla_nest_cancel(skb, nl_service);
> +	return -EMSGSIZE;
> +}
> +
> +static int ip_vs_genl_dump_service(struct sk_buff *skb,
> +				   struct ip_vs_service *svc,
> +				   struct netlink_callback *cb)
> +{
> +	void *hdr;
> +
> +	hdr = genlmsg_put(skb, NETLINK_CB(cb->skb).pid, cb->nlh->nlmsg_seq,
> +			  &ip_vs_genl_family, NLM_F_MULTI,
> +			  IPVS_CMD_NEW_SERVICE);
> +	if (!hdr)
> +		return -EMSGSIZE;
> +
> +	if (ip_vs_genl_fill_service(skb, svc) < 0)
> +		goto nla_put_failure;
> +
> +	return genlmsg_end(skb, hdr);
> +
> +nla_put_failure:
> +	genlmsg_cancel(skb, hdr);
> +	return -EMSGSIZE;
> +}
> +
> +static int ip_vs_genl_dump_services(struct sk_buff *skb,
> +				    struct netlink_callback *cb)
> +{
> +	int idx = 0, i;
> +	int start = cb->args[0];
> +	struct ip_vs_service *svc;
> +
> +	mutex_lock(&__ip_vs_mutex);
> +	for (i = 0; i < IP_VS_SVC_TAB_SIZE; i++) {
> +		list_for_each_entry(svc, &ip_vs_svc_table[i], s_list) {
> +			if (++idx <= start)
> +				continue;
> +			if (ip_vs_genl_dump_service(skb, svc, cb) < 0) {
> +				idx--;
> +				goto nla_put_failure;
> +			}
> +		}
> +	}
> +
> +	for (i = 0; i < IP_VS_SVC_TAB_SIZE; i++) {
> +		list_for_each_entry(svc, &ip_vs_svc_fwm_table[i], f_list) {
> +			if (++idx <= start)
> +				continue;
> +			if (ip_vs_genl_dump_service(skb, svc, cb) < 0) {
> +				idx--;
> +				goto nla_put_failure;
> +			}
> +		}
> +	}
> +
> +nla_put_failure:
> +	mutex_unlock(&__ip_vs_mutex);
> +	cb->args[0] = idx;
> +
> +	return skb->len;
> +}
> +
> +static int ip_vs_genl_parse_service(struct ip_vs_service_user *usvc,
> +				    struct nlattr *nla, int full_entry)
> +{
> +	struct nlattr *attrs[IPVS_SVC_ATTR_MAX + 1];
> +	struct nlattr *nla_af, *nla_port, *nla_fwmark, *nla_protocol, *nla_addr;
> +
> +	/* Parse mandatory identifying service fields first */
> +	if (nla == NULL ||
> +	    nla_parse_nested(attrs, IPVS_SVC_ATTR_MAX, nla, ip_vs_svc_policy))
> +		return -EINVAL;
> +
> +	nla_af		= attrs[IPVS_SVC_ATTR_AF];
> +	nla_protocol	= attrs[IPVS_SVC_ATTR_PROTOCOL];
> +	nla_addr	= attrs[IPVS_SVC_ATTR_ADDR];
> +	nla_port	= attrs[IPVS_SVC_ATTR_PORT];
> +	nla_fwmark	= attrs[IPVS_SVC_ATTR_FWMARK];
> +
> +	if (!(nla_af && (nla_fwmark || (nla_port && nla_protocol && nla_addr))))
> +		return -EINVAL;
> +
> +	/* For now, only support IPv4 */
> +	if (nla_get_u16(nla_af) != AF_INET)
> +		return -EAFNOSUPPORT;
> +
> +	if (nla_fwmark) {
> +		usvc->protocol = IPPROTO_TCP;
> +		usvc->fwmark = nla_get_u32(nla_fwmark);
> +	} else {
> +		usvc->protocol = nla_get_u16(nla_protocol);
> +		nla_memcpy(&usvc->addr, nla_addr, sizeof(usvc->addr));
> +		usvc->port = nla_get_u16(nla_port);
> +		usvc->fwmark = 0;
> +	}
> +
> +	/* If a full entry was requested, check for the additional fields */
> +	if (full_entry) {
> +		struct nlattr *nla_sched, *nla_flags, *nla_timeout,
> +			      *nla_netmask;
> +		struct ip_vs_flags flags;
> +		struct ip_vs_service *svc;
> +
> +		nla_sched = attrs[IPVS_SVC_ATTR_SCHED_NAME];
> +		nla_flags = attrs[IPVS_SVC_ATTR_FLAGS];
> +		nla_timeout = attrs[IPVS_SVC_ATTR_TIMEOUT];
> +		nla_netmask = attrs[IPVS_SVC_ATTR_NETMASK];
> +
> +		if (!(nla_sched && nla_flags && nla_timeout && nla_netmask))
> +			return -EINVAL;
> +
> +		nla_memcpy(&flags, nla_flags, sizeof(flags));
> +
> +		/* prefill flags from service if it already exists */
> +		if (usvc->fwmark)
> +			svc = __ip_vs_svc_fwm_get(usvc->fwmark);
> +		else
> +			svc = __ip_vs_service_get(usvc->protocol, usvc->addr,
> +						  usvc->port);
> +		if (svc) {
> +			usvc->flags = svc->flags;
> +			ip_vs_service_put(svc);
> +		} else
> +			usvc->flags = 0;
> +
> +		/* set new flags from userland */
> +		usvc->flags = (usvc->flags & ~flags.mask) |
> +			      (flags.flags & flags.mask);
> +
> +		strlcpy(usvc->sched_name, nla_data(nla_sched),
> +			sizeof(usvc->sched_name));
> +		usvc->timeout = nla_get_u32(nla_timeout);
> +		usvc->netmask = nla_get_u32(nla_netmask);
> +	}
> +
> +	return 0;
> +}
> +
> +static struct ip_vs_service *ip_vs_genl_find_service(struct nlattr *nla)
> +{
> +	struct ip_vs_service_user usvc;
> +	int ret;
> +
> +	ret = ip_vs_genl_parse_service(&usvc, nla, 0);
> +	if (ret)
> +		return ERR_PTR(ret);
> +
> +	if (usvc.fwmark)
> +		return __ip_vs_svc_fwm_get(usvc.fwmark);
> +	else
> +		return __ip_vs_service_get(usvc.protocol, usvc.addr,
> +					   usvc.port);
> +}
> +
> +static int ip_vs_genl_fill_dest(struct sk_buff *skb, struct ip_vs_dest *dest)
> +{
> +	struct nlattr *nl_dest;
> +
> +	nl_dest = nla_nest_start(skb, IPVS_CMD_ATTR_DEST);
> +	if (!nl_dest)
> +		return -EMSGSIZE;
> +
> +	NLA_PUT(skb, IPVS_DEST_ATTR_ADDR, sizeof(dest->addr), &dest->addr);
> +	NLA_PUT_U16(skb, IPVS_DEST_ATTR_PORT, dest->port);
> +
> +	NLA_PUT_U32(skb, IPVS_DEST_ATTR_FWD_METHOD,
> +		    atomic_read(&dest->conn_flags) & IP_VS_CONN_F_FWD_MASK);
> +	NLA_PUT_U32(skb, IPVS_DEST_ATTR_WEIGHT, atomic_read(&dest->weight));
> +	NLA_PUT_U32(skb, IPVS_DEST_ATTR_U_THRESH, dest->u_threshold);
> +	NLA_PUT_U32(skb, IPVS_DEST_ATTR_L_THRESH, dest->l_threshold);
> +	NLA_PUT_U32(skb, IPVS_DEST_ATTR_ACTIVE_CONNS,
> +		    atomic_read(&dest->activeconns));
> +	NLA_PUT_U32(skb, IPVS_DEST_ATTR_INACT_CONNS,
> +		    atomic_read(&dest->inactconns));
> +	NLA_PUT_U32(skb, IPVS_DEST_ATTR_PERSIST_CONNS,
> +		    atomic_read(&dest->persistconns));
> +
> +	if (ip_vs_genl_fill_stats(skb, IPVS_DEST_ATTR_STATS, &dest->stats))
> +		goto nla_put_failure;
> +
> +	nla_nest_end(skb, nl_dest);
> +
> +	return 0;
> +
> +nla_put_failure:
> +	nla_nest_cancel(skb, nl_dest);
> +	return -EMSGSIZE;
> +}
> +
> +static int ip_vs_genl_dump_dest(struct sk_buff *skb, struct ip_vs_dest *dest,
> +				struct netlink_callback *cb)
> +{
> +	void *hdr;
> +
> +	hdr = genlmsg_put(skb, NETLINK_CB(cb->skb).pid, cb->nlh->nlmsg_seq,
> +			  &ip_vs_genl_family, NLM_F_MULTI,
> +			  IPVS_CMD_NEW_DEST);
> +	if (!hdr)
> +		return -EMSGSIZE;
> +
> +	if (ip_vs_genl_fill_dest(skb, dest) < 0)
> +		goto nla_put_failure;
> +
> +	return genlmsg_end(skb, hdr);
> +
> +nla_put_failure:
> +	genlmsg_cancel(skb, hdr);
> +	return -EMSGSIZE;
> +}
> +
> +static int ip_vs_genl_dump_dests(struct sk_buff *skb,
> +				 struct netlink_callback *cb)
> +{
> +	int idx = 0;
> +	int start = cb->args[0];
> +	struct ip_vs_service *svc;
> +	struct ip_vs_dest *dest;
> +	struct nlattr *attrs[IPVS_CMD_ATTR_MAX + 1];
> +
> +	mutex_lock(&__ip_vs_mutex);
> +
> +	/* Try to find the service for which to dump destinations */
> +	if (nlmsg_parse(cb->nlh, GENL_HDRLEN, attrs,
> +			IPVS_CMD_ATTR_MAX, ip_vs_cmd_policy))
> +		goto out_err;
> +
> +	svc = ip_vs_genl_find_service(attrs[IPVS_CMD_ATTR_SERVICE]);
> +	if (IS_ERR(svc) || svc == NULL)
> +		goto out_err;
> +
> +	/* Dump the destinations */
> +	list_for_each_entry(dest, &svc->destinations, n_list) {
> +		if (++idx <= start)
> +			continue;
> +		if (ip_vs_genl_dump_dest(skb, dest, cb) < 0) {
> +			idx--;
> +			goto nla_put_failure;
> +		}
> +	}
> +
> +nla_put_failure:
> +	cb->args[0] = idx;
> +	ip_vs_service_put(svc);
> +
> +out_err:
> +	mutex_unlock(&__ip_vs_mutex);
> +
> +	return skb->len;
> +}
> +
> +static int ip_vs_genl_parse_dest(struct ip_vs_dest_user *udest,
> +				 struct nlattr *nla, int full_entry)
> +{
> +	struct nlattr *attrs[IPVS_DEST_ATTR_MAX + 1];
> +	struct nlattr *nla_addr, *nla_port;
> +
> +	/* Parse mandatory identifying destination fields first */
> +	if (nla == NULL ||
> +	    nla_parse_nested(attrs, IPVS_DEST_ATTR_MAX, nla, ip_vs_dest_policy))
> +		return -EINVAL;
> +
> +	nla_addr	= attrs[IPVS_DEST_ATTR_ADDR];
> +	nla_port	= attrs[IPVS_DEST_ATTR_PORT];
> +
> +	if (!(nla_addr && nla_port))
> +		return -EINVAL;
> +
> +	nla_memcpy(&udest->addr, nla_addr, sizeof(udest->addr));
> +	udest->port = nla_get_u16(nla_port);
> +
> +	/* If a full entry was requested, check for the additional fields */
> +	if (full_entry) {
> +		struct nlattr *nla_fwd, *nla_weight, *nla_u_thresh,
> +			      *nla_l_thresh;
> +
> +		nla_fwd		= attrs[IPVS_DEST_ATTR_FWD_METHOD];
> +		nla_weight	= attrs[IPVS_DEST_ATTR_WEIGHT];
> +		nla_u_thresh	= attrs[IPVS_DEST_ATTR_U_THRESH];
> +		nla_l_thresh	= attrs[IPVS_DEST_ATTR_L_THRESH];
> +
> +		if (!(nla_fwd && nla_weight && nla_u_thresh && nla_l_thresh))
> +			return -EINVAL;
> +
> +		udest->conn_flags = nla_get_u32(nla_fwd)
> +				    & IP_VS_CONN_F_FWD_MASK;
> +		udest->weight = nla_get_u32(nla_weight);
> +		udest->u_threshold = nla_get_u32(nla_u_thresh);
> +		udest->l_threshold = nla_get_u32(nla_l_thresh);
> +	}
> +
> +	return 0;
> +}
> +
> +static int ip_vs_genl_fill_daemon(struct sk_buff *skb, __be32 state,
> +				  const char *mcast_ifn, __be32 syncid)
> +{
> +	struct nlattr *nl_daemon;
> +
> +	nl_daemon = nla_nest_start(skb, IPVS_CMD_ATTR_DAEMON);
> +	if (!nl_daemon)
> +		return -EMSGSIZE;
> +
> +	NLA_PUT_U32(skb, IPVS_DAEMON_ATTR_STATE, state);
> +	NLA_PUT_STRING(skb, IPVS_DAEMON_ATTR_MCAST_IFN, mcast_ifn);
> +	NLA_PUT_U32(skb, IPVS_DAEMON_ATTR_SYNC_ID, syncid);
> +
> +	nla_nest_end(skb, nl_daemon);
> +
> +	return 0;
> +
> +nla_put_failure:
> +	nla_nest_cancel(skb, nl_daemon);
> +	return -EMSGSIZE;
> +}
> +
> +static int ip_vs_genl_dump_daemon(struct sk_buff *skb, __be32 state,
> +				  const char *mcast_ifn, __be32 syncid,
> +				  struct netlink_callback *cb)
> +{
> +	void *hdr;
> +	hdr = genlmsg_put(skb, NETLINK_CB(cb->skb).pid, cb->nlh->nlmsg_seq,
> +			  &ip_vs_genl_family, NLM_F_MULTI,
> +			  IPVS_CMD_NEW_DAEMON);
> +	if (!hdr)
> +		return -EMSGSIZE;
> +
> +	if (ip_vs_genl_fill_daemon(skb, state, mcast_ifn, syncid))
> +		goto nla_put_failure;
> +
> +	return genlmsg_end(skb, hdr);
> +
> +nla_put_failure:
> +	genlmsg_cancel(skb, hdr);
> +	return -EMSGSIZE;
> +}
> +
> +static int ip_vs_genl_dump_daemons(struct sk_buff *skb,
> +				   struct netlink_callback *cb)
> +{
> +	mutex_lock(&__ip_vs_mutex);
> +	if ((ip_vs_sync_state & IP_VS_STATE_MASTER) && !cb->args[0]) {
> +		if (ip_vs_genl_dump_daemon(skb, IP_VS_STATE_MASTER,
> +					   ip_vs_master_mcast_ifn,
> +					   ip_vs_master_syncid, cb) < 0)
> +			goto nla_put_failure;
> +
> +		cb->args[0] = 1;
> +	}
> +
> +	if ((ip_vs_sync_state & IP_VS_STATE_BACKUP) && !cb->args[1]) {
> +		if (ip_vs_genl_dump_daemon(skb, IP_VS_STATE_BACKUP,
> +					   ip_vs_backup_mcast_ifn,
> +					   ip_vs_backup_syncid, cb) < 0)
> +			goto nla_put_failure;
> +
> +		cb->args[1] = 1;
> +	}
> +
> +nla_put_failure:
> +	mutex_unlock(&__ip_vs_mutex);
> +
> +	return skb->len;
> +}
> +
> +static int ip_vs_genl_new_daemon(struct nlattr **attrs)
> +{
> +	if (!(attrs[IPVS_DAEMON_ATTR_STATE] &&
> +	      attrs[IPVS_DAEMON_ATTR_MCAST_IFN] &&
> +	      attrs[IPVS_DAEMON_ATTR_SYNC_ID]))
> +		return -EINVAL;
> +
> +	return start_sync_thread(nla_get_u32(attrs[IPVS_DAEMON_ATTR_STATE]),
> +				 nla_data(attrs[IPVS_DAEMON_ATTR_MCAST_IFN]),
> +				 nla_get_u32(attrs[IPVS_DAEMON_ATTR_SYNC_ID]));
> +}
> +
> +static int ip_vs_genl_del_daemon(struct nlattr **attrs)
> +{
> +	if (!attrs[IPVS_DAEMON_ATTR_STATE])
> +		return -EINVAL;
> +
> +	return stop_sync_thread(nla_get_u32(attrs[IPVS_DAEMON_ATTR_STATE]));
> +}
> +
> +static int ip_vs_genl_set_config(struct nlattr **attrs)
> +{
> +	struct ip_vs_timeout_user t;
> +
> +	__ip_vs_get_timeouts(&t);
> +
> +	if (attrs[IPVS_CMD_ATTR_TIMEOUT_TCP])
> +		t.tcp_timeout = nla_get_u32(attrs[IPVS_CMD_ATTR_TIMEOUT_TCP]);
> +
> +	if (attrs[IPVS_CMD_ATTR_TIMEOUT_TCP_FIN])
> +		t.tcp_fin_timeout =
> +			nla_get_u32(attrs[IPVS_CMD_ATTR_TIMEOUT_TCP_FIN]);
> +
> +	if (attrs[IPVS_CMD_ATTR_TIMEOUT_UDP])
> +		t.udp_timeout = nla_get_u32(attrs[IPVS_CMD_ATTR_TIMEOUT_UDP]);
> +
> +	return ip_vs_set_timeout(&t);
> +}
> +
> +static int ip_vs_genl_set_cmd(struct sk_buff *skb, struct genl_info *info)
> +{
> +	struct ip_vs_service *svc = NULL;
> +	struct ip_vs_service_user usvc;
> +	struct ip_vs_dest_user udest;
> +	int ret = 0, cmd;
> +	int need_full_svc = 0, need_full_dest = 0;
> +
> +	cmd = info->genlhdr->cmd;
> +
> +	mutex_lock(&__ip_vs_mutex);
> +
> +	if (cmd == IPVS_CMD_FLUSH) {
> +		ret = ip_vs_flush();
> +		goto out;
> +	} else if (cmd == IPVS_CMD_SET_CONFIG) {
> +		ret = ip_vs_genl_set_config(info->attrs);
> +		goto out;
> +	} else if (cmd == IPVS_CMD_NEW_DAEMON ||
> +		   cmd == IPVS_CMD_DEL_DAEMON) {
> +
> +		struct nlattr *daemon_attrs[IPVS_DAEMON_ATTR_MAX + 1];
> +
> +		if (!info->attrs[IPVS_CMD_ATTR_DAEMON] ||
> +		    nla_parse_nested(daemon_attrs, IPVS_DAEMON_ATTR_MAX,
> +				     info->attrs[IPVS_CMD_ATTR_DAEMON],
> +				     ip_vs_daemon_policy)) {
> +			ret = -EINVAL;
> +			goto out;
> +		}
> +
> +		if (cmd == IPVS_CMD_NEW_DAEMON)
> +			ret = ip_vs_genl_new_daemon(daemon_attrs);
> +		else
> +			ret = ip_vs_genl_del_daemon(daemon_attrs);
> +		goto out;
> +	} else if (cmd == IPVS_CMD_ZERO &&
> +		   !info->attrs[IPVS_CMD_ATTR_SERVICE]) {
> +		ret = ip_vs_zero_all();
> +		goto out;
> +	}
> +
> +	/* All following commands require a service argument, so check if we
> +	 * received a valid one. We need a full service specification when
> +	 * adding / editing a service. Only identifying members otherwise. */
> +	if (cmd == IPVS_CMD_NEW_SERVICE || cmd == IPVS_CMD_SET_SERVICE)
> +		need_full_svc = 1;
> +
> +	ret = ip_vs_genl_parse_service(&usvc,
> +				       info->attrs[IPVS_CMD_ATTR_SERVICE],
> +				       need_full_svc);
> +	if (ret)
> +		goto out;
> +
> +	/* Lookup the exact service by <protocol, addr, port> or fwmark */
> +	if (usvc.fwmark == 0)
> +		svc = __ip_vs_service_get(usvc.protocol, usvc.addr, usvc.port);
> +	else
> +		svc = __ip_vs_svc_fwm_get(usvc.fwmark);
> +
> +	/* Unless we're adding a new service, the service must already exist */
> +	if ((cmd != IPVS_CMD_NEW_SERVICE) && (svc == NULL)) {
> +		ret = -ESRCH;
> +		goto out;
> +	}
> +
> +	/* Destination commands require a valid destination argument. For
> +	 * adding / editing a destination, we need a full destination
> +	 * specification. */
> +	if (cmd == IPVS_CMD_NEW_DEST || cmd == IPVS_CMD_SET_DEST ||
> +	    cmd == IPVS_CMD_DEL_DEST) {
> +		if (cmd != IPVS_CMD_DEL_DEST)
> +			need_full_dest = 1;
> +
> +		ret = ip_vs_genl_parse_dest(&udest,
> +					    info->attrs[IPVS_CMD_ATTR_DEST],
> +					    need_full_dest);
> +		if (ret)
> +			goto out;
> +	}
> +
> +	switch (cmd) {
> +	case IPVS_CMD_NEW_SERVICE:
> +		if (svc == NULL)
> +			ret = ip_vs_add_service(&usvc, &svc);
> +		else
> +			ret = -EEXIST;
> +		break;
> +	case IPVS_CMD_SET_SERVICE:
> +		ret = ip_vs_edit_service(svc, &usvc);
> +		break;
> +	case IPVS_CMD_DEL_SERVICE:
> +		ret = ip_vs_del_service(svc);
> +		break;
> +	case IPVS_CMD_NEW_DEST:
> +		ret = ip_vs_add_dest(svc, &udest);
> +		break;
> +	case IPVS_CMD_SET_DEST:
> +		ret = ip_vs_edit_dest(svc, &udest);
> +		break;
> +	case IPVS_CMD_DEL_DEST:
> +		ret = ip_vs_del_dest(svc, &udest);
> +		break;
> +	case IPVS_CMD_ZERO:
> +		ret = ip_vs_zero_service(svc);
> +		break;
> +	default:
> +		ret = -EINVAL;
> +	}
> +
> +out:
> +	if (svc)
> +		ip_vs_service_put(svc);
> +	mutex_unlock(&__ip_vs_mutex);
> +
> +	return ret;
> +}
> +
> +static int ip_vs_genl_get_cmd(struct sk_buff *skb, struct genl_info *info)
> +{
> +	struct sk_buff *msg;
> +	void *reply;
> +	int ret, cmd, reply_cmd;
> +
> +	mutex_lock(&__ip_vs_mutex);
> +
> +	cmd = info->genlhdr->cmd;
> +
> +	msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL);
> +	if (!msg) {
> +		ret = -ENOMEM;
> +		goto out_err;
> +	}
> +
> +	if (cmd == IPVS_CMD_GET_SERVICE)
> +		reply_cmd = IPVS_CMD_NEW_SERVICE;
> +	else if (cmd == IPVS_CMD_GET_INFO)
> +		reply_cmd = IPVS_CMD_SET_INFO;
> +	else if (cmd == IPVS_CMD_GET_CONFIG)
> +		reply_cmd = IPVS_CMD_SET_CONFIG;
> +	else {
> +		IP_VS_ERR("unknown Generic Netlink command\n");
> +		ret = -EINVAL;
> +		goto out;
> +	}
> +
> +	reply = genlmsg_put_reply(msg, info, &ip_vs_genl_family, 0, reply_cmd);
> +	if (reply == NULL)
> +		goto nla_put_failure;

And for what it's worth, the code above doesn't require __ip_vs_mutex, you 
can defer the locking until here for concurrency improvement.

> +
> +	switch (cmd) {
> +	case IPVS_CMD_GET_SERVICE:
> +	{
> +		struct ip_vs_service *svc;
> +
> +		svc = ip_vs_genl_find_service(info->attrs[IPVS_CMD_ATTR_SERVICE]);
> +		if (IS_ERR(svc)) {
> +			ret = PTR_ERR(svc);
> +			goto out_err;
> +		} else if (svc) {
> +			ret = ip_vs_genl_fill_service(msg, svc);
> +			ip_vs_service_put(svc);
> +			if (ret)
> +				goto nla_put_failure;
> +		} else {
> +			ret = -ESRCH;
> +			goto out_err;
> +		}
> +
> +		break;
> +	}
> +
> +	case IPVS_CMD_GET_CONFIG:
> +	{
> +		struct ip_vs_timeout_user t;
> +
> +		__ip_vs_get_timeouts(&t);
> +#ifdef CONFIG_IP_VS_PROTO_TCP
> +		NLA_PUT_U32(msg, IPVS_CMD_ATTR_TIMEOUT_TCP, t.tcp_timeout);
> +		NLA_PUT_U32(msg, IPVS_CMD_ATTR_TIMEOUT_TCP_FIN,
> +			    t.tcp_fin_timeout);
> +#endif
> +#ifdef CONFIG_IP_VS_PROTO_UDP
> +		NLA_PUT_U32(msg, IPVS_CMD_ATTR_TIMEOUT_UDP, t.udp_timeout);
> +#endif
> +
> +		break;
> +	}
> +
> +	case IPVS_CMD_GET_INFO:
> +		NLA_PUT_U32(msg, IPVS_INFO_ATTR_VERSION, IP_VS_VERSION_CODE);
> +		NLA_PUT_U32(msg, IPVS_INFO_ATTR_CONN_TAB_SIZE,
> +			    IP_VS_CONN_TAB_SIZE);
> +		break;
> +	}
> +
> +	genlmsg_end(msg, reply);
> +	ret = genlmsg_unicast(msg, info->snd_pid);
> +	goto out;
> +
> +nla_put_failure:
> +	IP_VS_ERR("not enough space in Netlink message\n");
> +	ret = -EMSGSIZE;
> +
> +out_err:
> +	if (msg)
> +		nlmsg_free(msg);
> +out:
> +	mutex_unlock(&__ip_vs_mutex);
> +
> +	return ret;
> +}
> +
> +
> +static struct genl_ops ip_vs_genl_ops[] __read_mostly = {
> +	/* SET commands */
> +	{
> +		.cmd	= IPVS_CMD_NEW_SERVICE,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_SET_SERVICE,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_DEL_SERVICE,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_GET_SERVICE,
> +		.flags	= GENL_ADMIN_PERM,
> +		.doit	= ip_vs_genl_get_cmd,
> +		.dumpit	= ip_vs_genl_dump_services,
> +		.policy	= ip_vs_cmd_policy,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_NEW_DEST,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_SET_DEST,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_DEL_DEST,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_GET_DEST,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.dumpit	= ip_vs_genl_dump_dests,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_NEW_DAEMON,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_DEL_DAEMON,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_GET_DAEMON,
> +		.flags	= GENL_ADMIN_PERM,
> +		.dumpit	= ip_vs_genl_dump_daemons,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_SET_CONFIG,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_GET_CONFIG,
> +		.flags	= GENL_ADMIN_PERM,
> +		.doit	= ip_vs_genl_get_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_GET_INFO,
> +		.flags	= GENL_ADMIN_PERM,
> +		.doit	= ip_vs_genl_get_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_ZERO,
> +		.flags	= GENL_ADMIN_PERM,
> +		.policy	= ip_vs_cmd_policy,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +	{
> +		.cmd	= IPVS_CMD_FLUSH,
> +		.flags	= GENL_ADMIN_PERM,
> +		.doit	= ip_vs_genl_set_cmd,
> +	},
> +};
> +
> +int ip_vs_genl_register(void)
> +{
> +	int ret, i;
> +
> +	ret = genl_register_family(&ip_vs_genl_family);
> +	if (ret)
> +		return ret;
> +
> +	for (i = 0; i < ARRAY_SIZE(ip_vs_genl_ops); i++) {
> +		ret = genl_register_ops(&ip_vs_genl_family, &ip_vs_genl_ops[i]);
> +		if (ret)
> +			goto err_out;
> +	}
> +	return 0;
> +
> +err_out:
> +	genl_unregister_family(&ip_vs_genl_family);
> +	return ret;
> +}
> +
> +void ip_vs_genl_unregister(void)
> +{
> +	genl_unregister_family(&ip_vs_genl_family);
> +}
> +
> +/* End of Generic Netlink interface definitions */
> +
>  
>  int ip_vs_control_init(void)
>  {
> @@ -2319,6 +3191,13 @@ int ip_vs_control_init(void)
>  		return ret;
>  	}
>  
> +	ret = ip_vs_genl_register();
> +	if (ret) {
> +		IP_VS_ERR("cannot register Generic Netlink interface.\n");
> +		nf_unregister_sockopt(&ip_vs_sockopts);
> +		return ret;
> +	}
> +
>  	proc_net_fops_create(&init_net, "ip_vs", 0, &ip_vs_info_fops);
>  	proc_net_fops_create(&init_net, "ip_vs_stats",0, &ip_vs_stats_fops);
>  
> @@ -2355,6 +3234,7 @@ void ip_vs_control_cleanup(void)
>  	unregister_sysctl_table(sysctl_header);
>  	proc_net_remove(&init_net, "ip_vs_stats");
>  	proc_net_remove(&init_net, "ip_vs");
> +	ip_vs_genl_unregister();
>  	nf_unregister_sockopt(&ip_vs_sockopts);
>  	LeaveFunction(2);
>  }
> 
--
To unsubscribe from this list: send the line "unsubscribe lvs-devel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at  http://vger.kernel.org/majordomo-info.html

[Index of Archives]     [Linux Filesystem Devel]     [Linux NFS]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Yosemite News]     [Linux SCSI]     [X.Org]

  Powered by Linux