/*-
 * SPDX-License-Identifier: BSD-2-Clause
 *
 * Copyright (c) 2022 Alexander V. Chernikov <melifaro@FreeBSD.org>
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <sys/types.h>
#include <sys/ck.h>
#include <sys/epoch.h>
#include <sys/eventhandler.h>
#include <sys/kernel.h>
#include <sys/jail.h>
#include <sys/lock.h>
#include <sys/malloc.h>
#include <sys/priv.h>
#include <sys/proc.h>
#include <sys/socket.h>
#include <sys/sx.h>

#include <netlink/netlink.h>
#include <netlink/netlink_ctl.h>
#include <netlink/netlink_generic.h>
#include <netlink/netlink_var.h>

#define	DEBUG_MOD_NAME	nl_generic
#define	DEBUG_MAX_LEVEL	LOG_DEBUG3
#include <netlink/netlink_debug.h>
_DECLARE_DEBUG(LOG_INFO);

static int nlctrl_handle_getfamily(struct nlmsghdr *, struct nl_pstate *);

static struct genl_cmd nlctrl_cmds[] = {
	[CTRL_CMD_GETFAMILY] = {
		.cmd_num = CTRL_CMD_GETFAMILY,
		.cmd_name = "GETFAMILY",
		.cmd_cb = nlctrl_handle_getfamily,
		.cmd_flags = GENL_CMD_CAP_DO | GENL_CMD_CAP_DUMP |
		    GENL_CMD_CAP_HASPOL,
	},
};

static struct genl_family {
	const char	*family_name;
	uint16_t	family_hdrsize;
	uint16_t	family_version;
	uint16_t	family_attr_max;
	uint16_t	family_cmd_size;
	uint16_t	family_num_groups;
	struct genl_cmd	*family_cmds;
} families[MAX_FAMILIES] = {
	[CTRL_FAMILY_ID] = {
		.family_name = CTRL_FAMILY_NAME,
		.family_hdrsize = 0,
		.family_version = 2,
		.family_attr_max = CTRL_ATTR_MAX,
		.family_cmd_size = CTRL_CMD_GETFAMILY + 1,
		.family_cmds = nlctrl_cmds,
		.family_num_groups = 1,
	},
};

static struct genl_group {
	struct genl_family	*group_family;
	const char		*group_name;
} groups[MAX_GROUPS] = {
	[CTRL_GROUP_ID] = {
		.group_family = &families[CTRL_FAMILY_ID],
		.group_name = CTRL_GROUP_NAME,
	},
};

static inline struct genl_family *
genl_family(uint16_t family_id)
{
	struct genl_family *gf;

	gf = &families[family_id - GENL_MIN_ID];
	KASSERT(family_id - GENL_MIN_ID < MAX_FAMILIES &&
	    gf->family_name != NULL, ("family %u does not exist", family_id));
	return (gf);
}

static inline uint16_t
genl_family_id(const struct genl_family *gf)
{
	MPASS(gf >= &families[0] && gf < &families[MAX_FAMILIES]);
	return ((uint16_t)(gf - &families[0]) + GENL_MIN_ID);
}

/*
 * Handler called by netlink subsystem when matching netlink message is received
 */
static int
genl_handle_message(struct nlmsghdr *hdr, struct nl_pstate *npt)
{
	struct nlpcb *nlp = npt->nlp;
	struct genl_family *gf;
	uint16_t family_id;
	int error = 0;

	if (__predict_false(hdr->nlmsg_len < sizeof(struct nlmsghdr) +
	    GENL_HDRLEN)) {
		NLP_LOG(LOG_DEBUG, nlp, "invalid message size: %d",
		    hdr->nlmsg_len);
		return (EINVAL);
	}

	family_id = hdr->nlmsg_type - GENL_MIN_ID;
	gf = &families[family_id];
	if (__predict_false(family_id >= MAX_FAMILIES ||
	    gf->family_name == NULL)) {
		NLP_LOG(LOG_DEBUG, nlp, "invalid message type: %d",
		    hdr->nlmsg_type);
		return (ENOTSUP);
	}

	struct genlmsghdr *ghdr = (struct genlmsghdr *)(hdr + 1);

	if (ghdr->cmd >= gf->family_cmd_size || gf->family_cmds[ghdr->cmd].cmd_cb == NULL) {
		NLP_LOG(LOG_DEBUG, nlp, "family %s: invalid cmd %d",
		    gf->family_name, ghdr->cmd);
		return (ENOTSUP);
	}

	struct genl_cmd *cmd = &gf->family_cmds[ghdr->cmd];

	if (cmd->cmd_priv != 0 && !nlp_has_priv(nlp, cmd->cmd_priv)) {
		NLP_LOG(LOG_DEBUG, nlp, "family %s: cmd %d priv_check() failed",
		    gf->family_name, ghdr->cmd);
		return (EPERM);
	}

	if (cmd->cmd_securelevel > 0 &&
	    securelevel_ge(nlp_get_cred(nlp), cmd->cmd_securelevel)) {
		NLP_LOG(LOG_DEBUG, nlp, "family %s: cmd %d securelevel_gt() failed",
		    gf->family_name, ghdr->cmd);
		return (EPERM);
	}

	NLP_LOG(LOG_DEBUG2, nlp, "received family %s cmd %s(%d) len %d",
	    gf->family_name, cmd->cmd_name, ghdr->cmd, hdr->nlmsg_len);

	error = cmd->cmd_cb(hdr, npt);

	return (error);
}

static uint32_t
get_cmd_flags(const struct genl_cmd *cmd)
{
	uint32_t flags = cmd->cmd_flags;
	if (cmd->cmd_priv != 0)
		flags |= GENL_ADMIN_PERM;
	return (flags);
}

static int
dump_family(struct nlmsghdr *hdr, struct genlmsghdr *ghdr,
    const struct genl_family *gf, struct nl_writer *nw)
{
	if (!nlmsg_reply(nw, hdr, sizeof(struct genlmsghdr)))
		goto enomem;

	struct genlmsghdr *ghdr_new = nlmsg_reserve_object(nw, struct genlmsghdr);
	ghdr_new->cmd = ghdr->cmd;
	ghdr_new->version = gf->family_version;
	ghdr_new->reserved = 0;

        nlattr_add_string(nw, CTRL_ATTR_FAMILY_NAME, gf->family_name);
        nlattr_add_u16(nw, CTRL_ATTR_FAMILY_ID, genl_family_id(gf));
        nlattr_add_u32(nw, CTRL_ATTR_VERSION, gf->family_version);
        nlattr_add_u32(nw, CTRL_ATTR_HDRSIZE, gf->family_hdrsize);
        nlattr_add_u32(nw, CTRL_ATTR_MAXATTR, gf->family_attr_max);

	if (gf->family_cmd_size > 0) {
		int off = nlattr_add_nested(nw, CTRL_ATTR_OPS);
		if (off == 0)
			goto enomem;
		for (int i = 0, cnt=0; i < gf->family_cmd_size; i++) {
			struct genl_cmd *cmd = &gf->family_cmds[i];
			if (cmd->cmd_cb == NULL)
				continue;
			int cmd_off = nlattr_add_nested(nw, ++cnt);
			if (cmd_off == 0)
				goto enomem;

			nlattr_add_u32(nw, CTRL_ATTR_OP_ID, cmd->cmd_num);
			nlattr_add_u32(nw, CTRL_ATTR_OP_FLAGS, get_cmd_flags(cmd));
			nlattr_set_len(nw, cmd_off);
		}
		nlattr_set_len(nw, off);
	}
	if (gf->family_num_groups > 0) {
		int off = nlattr_add_nested(nw, CTRL_ATTR_MCAST_GROUPS);
		if (off == 0)
			goto enomem;
		for (u_int i = 0, cnt = 0; i < MAX_GROUPS; i++) {
			struct genl_group *gg = &groups[i];

			if (gg->group_family != gf)
				continue;

			int cmd_off = nlattr_add_nested(nw, ++cnt);
			if (cmd_off == 0)
				goto enomem;
			nlattr_add_u32(nw, CTRL_ATTR_MCAST_GRP_ID, i + MIN_GROUP_NUM);
			nlattr_add_string(nw, CTRL_ATTR_MCAST_GRP_NAME, gg->group_name);
			nlattr_set_len(nw, cmd_off);
		}
		nlattr_set_len(nw, off);
	}
	if (nlmsg_end(nw))
		return (0);
enomem:
        NL_LOG(LOG_DEBUG, "unable to dump family %s state (ENOMEM)", gf->family_name);
        nlmsg_abort(nw);
	return (ENOMEM);
}

struct nl_parsed_family {
	char		*family_name;
	uint16_t	family_id;
	uint8_t		version;
};

#define	_IN(_field)	offsetof(struct genlmsghdr, _field)
#define	_OUT(_field)	offsetof(struct nl_parsed_family, _field)
static const struct nlfield_parser nlf_p_generic[] = {
	{ .off_in = _IN(version), .off_out = _OUT(version), .cb = nlf_get_u8 },
};

static struct nlattr_parser nla_p_generic[] = {
	{ .type = CTRL_ATTR_FAMILY_ID , .off = _OUT(family_id), .cb = nlattr_get_uint16 },
	{ .type = CTRL_ATTR_FAMILY_NAME , .off = _OUT(family_name), .cb = nlattr_get_string },
};
#undef _IN
#undef _OUT
NL_DECLARE_PARSER(genl_parser, struct genlmsghdr, nlf_p_generic, nla_p_generic);

static int
nlctrl_handle_getfamily(struct nlmsghdr *hdr, struct nl_pstate *npt)
{
	int error = 0;

	struct nl_parsed_family attrs = {};
	error = nl_parse_nlmsg(hdr, &genl_parser, npt, &attrs);
	if (error != 0)
		return (error);

	struct genlmsghdr ghdr = {
		.cmd = CTRL_CMD_NEWFAMILY,
	};

	if (attrs.family_id != 0 || attrs.family_name != NULL) {
		for (u_int i = 0; i < MAX_FAMILIES; i++) {
			struct genl_family *gf = &families[i];

			if (gf->family_name == NULL)
				continue;
			if (attrs.family_id != 0 &&
			    attrs.family_id != genl_family_id(gf))
				continue;
			if (attrs.family_name != NULL &&
			    strcmp(attrs.family_name, gf->family_name) != 0)
				continue;
			return (dump_family(hdr, &ghdr, gf, npt->nw));
		}
		return (ENOENT);
	}

	hdr->nlmsg_flags = hdr->nlmsg_flags | NLM_F_MULTI;
	for (u_int i = 0; i < MAX_FAMILIES; i++) {
		struct genl_family *gf = &families[i];

		if (gf->family_name != NULL) {
			error = dump_family(hdr, &ghdr, gf, npt->nw);
			if (error != 0)
				break;
		}
	}

	if (!nlmsg_end_dump(npt->nw, error, hdr)) {
                NL_LOG(LOG_DEBUG, "Unable to finalize the dump");
                return (ENOMEM);
        }

	return (error);
}

static void
nlctrl_notify(void *arg __unused, const char *family_name __unused,
    uint16_t family_id, u_int cmd)
{
	struct nlmsghdr hdr = {.nlmsg_type = NETLINK_GENERIC };
	struct genlmsghdr ghdr = { .cmd = cmd };
	struct genl_family *gf;
	struct nl_writer nw;

	gf = genl_family(family_id);
	if (!nl_writer_group(&nw, NLMSG_SMALL, NETLINK_GENERIC, CTRL_GROUP_ID,
	    0, false)) {
		NL_LOG(LOG_DEBUG, "error allocating group writer");
		return;
	}

	dump_family(&hdr, &ghdr, gf, &nw);
	nlmsg_flush(&nw);
}

static const struct nlhdr_parser *all_parsers[] = { &genl_parser };
static eventhandler_tag family_event_tag;

static void
genl_load_all(void *u __unused)
{
	NL_VERIFY_PARSERS(all_parsers);
	family_event_tag = EVENTHANDLER_REGISTER(genl_family_event,
	    nlctrl_notify, NULL, EVENTHANDLER_PRI_ANY);
	netlink_register_proto(NETLINK_GENERIC, "NETLINK_GENERIC",
	    genl_handle_message);
}
SYSINIT(genl_load_all, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, genl_load_all, NULL);

static void
genl_unload(void *u __unused)
{
	netlink_unregister_proto(NETLINK_GENERIC);
	EVENTHANDLER_DEREGISTER(genl_family_event, family_event_tag);
	NET_EPOCH_WAIT();
}
SYSUNINIT(genl_unload, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, genl_unload, NULL);

/*
 * Public KPI for NETLINK_GENERIC families/groups registration logic below.
 */

static struct sx sx_lock;
SX_SYSINIT(genl_lock, &sx_lock, "genetlink lock");
#define	GENL_LOCK()		sx_xlock(&sx_lock)
#define	GENL_UNLOCK()		sx_xunlock(&sx_lock)
#define	GENL_ASSERT_LOCKED()	sx_assert(&sx_lock, SA_LOCKED)
#define	GENL_ASSERT_XLOCKED()	sx_assert(&sx_lock, SA_XLOCKED)

uint16_t
genl_register_family(const char *family_name, size_t hdrsize,
    uint16_t family_version, uint16_t max_attr_idx)
{
	struct genl_family *gf;
	uint16_t family_id;

	MPASS(family_name != NULL);

	GENL_LOCK();
	for (u_int i = 0; i < MAX_FAMILIES; i++)
		if (families[i].family_name != NULL &&
		    strcmp(families[i].family_name, family_name) == 0) {
			GENL_UNLOCK();
			return (0);
		}

	/* Microoptimization: index 0 is reserved for the control family. */
	gf = NULL;
	for (u_int i = 1; i < MAX_FAMILIES; i++)
		if (families[i].family_name == NULL) {
			gf = &families[i];
			break;
		}
	KASSERT(gf, ("%s: maximum of %u generic netlink families allocated",
	    __func__, MAX_FAMILIES));

	*gf = (struct genl_family) {
	    .family_name = family_name,
	    .family_version = family_version,
	    .family_hdrsize = hdrsize,
	    .family_attr_max = max_attr_idx,
	};
	family_id = genl_family_id(gf);
	GENL_UNLOCK();

	NL_LOG(LOG_DEBUG2, "Registered family %s id %d", gf->family_name,
	    family_id);
	EVENTHANDLER_INVOKE(genl_family_event, gf->family_name, family_id,
	    CTRL_CMD_NEWFAMILY);

	return (family_id);
}

void
genl_unregister_family(uint16_t family_id)
{
	struct genl_family *gf;

	GENL_LOCK();
	gf = genl_family(family_id);

	EVENTHANDLER_INVOKE(genl_family_event, gf->family_name,
	    family_id, CTRL_CMD_DELFAMILY);
	for (u_int i = 0; i < MAX_GROUPS; i++) {
		struct genl_group *gg = &groups[i];
		if (gg->group_family == gf && gg->group_name != NULL) {
			gg->group_family = NULL;
			gg->group_name = NULL;
		}
	}
	if (gf->family_cmds != NULL)
		free(gf->family_cmds, M_NETLINK);
	bzero(gf, sizeof(*gf));
	GENL_UNLOCK();
}

bool
genl_register_cmds(uint16_t family_id, const struct genl_cmd *cmds,
    u_int count)
{
	struct genl_family *gf;
	uint16_t cmd_size;

	GENL_LOCK();
	gf = genl_family(family_id);

	cmd_size = gf->family_cmd_size;

	for (u_int i = 0; i < count; i++) {
		MPASS(cmds[i].cmd_cb != NULL);
		if (cmds[i].cmd_num >= cmd_size)
			cmd_size = cmds[i].cmd_num + 1;
	}

	if (cmd_size > gf->family_cmd_size) {
		void *old_data;

		/* need to realloc */
		size_t sz = cmd_size * sizeof(struct genl_cmd);
		void *data = malloc(sz, M_NETLINK, M_WAITOK | M_ZERO);

		memcpy(data, gf->family_cmds,
		    gf->family_cmd_size * sizeof(struct genl_cmd));
		old_data = gf->family_cmds;
		gf->family_cmds = data;
		gf->family_cmd_size = cmd_size;
		free(old_data, M_NETLINK);
	}

	for (u_int i = 0; i < count; i++) {
		const struct genl_cmd *cmd = &cmds[i];

		MPASS(gf->family_cmds[cmd->cmd_num].cmd_cb == NULL);
		gf->family_cmds[cmd->cmd_num] = cmds[i];
		NL_LOG(LOG_DEBUG2, "Adding cmd %s(%d) to family %s",
		    cmd->cmd_name, cmd->cmd_num, gf->family_name);
	}
	GENL_UNLOCK();
	return (true);
}

uint32_t
genl_register_group(uint16_t family_id, const char *group_name)
{
	struct genl_family *gf;
	uint32_t group_id = 0;

	MPASS(group_name != NULL);

	GENL_LOCK();
	gf = genl_family(family_id);

	for (u_int i = 0; i < MAX_GROUPS; i++)
		if (groups[i].group_family == gf &&
		    strcmp(groups[i].group_name, group_name) == 0) {
			GENL_UNLOCK();
			return (0);
		}

	/* Microoptimization: index 0 is reserved for the control family */
	for (u_int i = 1; i < MAX_GROUPS; i++) {
		struct genl_group *gg = &groups[i];
		if (gg->group_family == NULL) {
			gf->family_num_groups++;
			gg->group_family = gf;
			gg->group_name = group_name;
			group_id = i + MIN_GROUP_NUM;
			break;
		}
	}
	GENL_UNLOCK();

	return (group_id);
}

void
genl_unregister_group(uint16_t family_id, uint32_t group_id)
{
	struct genl_family *gf;
	struct genl_group *gg;

	MPASS(group_id > MIN_GROUP_NUM &&
	    group_id < MIN_GROUP_NUM + MAX_GROUPS);

	nl_clear_group(group_id);

	group_id -= MIN_GROUP_NUM;

	GENL_LOCK();
	gf = genl_family(family_id);
	gg = &groups[group_id];

	MPASS(gg->group_family == gf);
	MPASS(gf->family_num_groups > 0);

	gf->family_num_groups--;
	gg->group_family = NULL;
	gg->group_name = NULL;
	GENL_UNLOCK();
}
