summaryrefslogtreecommitdiff
path: root/usr/src/lib/libipadm/common/ipadm_ngz.c
diff options
context:
space:
mode:
Diffstat (limited to 'usr/src/lib/libipadm/common/ipadm_ngz.c')
-rw-r--r--usr/src/lib/libipadm/common/ipadm_ngz.c485
1 files changed, 485 insertions, 0 deletions
diff --git a/usr/src/lib/libipadm/common/ipadm_ngz.c b/usr/src/lib/libipadm/common/ipadm_ngz.c
new file mode 100644
index 0000000000..e5f59fe6d2
--- /dev/null
+++ b/usr/src/lib/libipadm/common/ipadm_ngz.c
@@ -0,0 +1,485 @@
+/*
+ * CDDL HEADER START
+ *
+ * The contents of this file are subject to the terms of the
+ * Common Development and Distribution License (the "License").
+ * You may not use this file except in compliance with the License.
+ *
+ * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
+ * or http://www.opensolaris.org/os/licensing.
+ * See the License for the specific language governing permissions
+ * and limitations under the License.
+ *
+ * When distributing Covered Code, include this CDDL HEADER in each
+ * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
+ * If applicable, add the following below this CDDL HEADER, with the
+ * fields enclosed by brackets "[]" replaced with your own identifying
+ * information: Portions Copyright [yyyy] [name of copyright owner]
+ *
+ * CDDL HEADER END
+ */
+/*
+ * Copyright (c) 2010, Oracle and/or its affiliates. All rights reserved.
+ */
+
+#include <errno.h>
+#include <fcntl.h>
+#include <priv_utils.h>
+#include <signal.h>
+#include <stdlib.h>
+#include <stdio.h>
+#include <strings.h>
+#include <sys/param.h>
+#include <sys/stat.h>
+#include <unistd.h>
+#include <zone.h>
+#include <libipadm.h>
+#include <libdladm.h>
+#include <libdllink.h>
+#include <net/route.h>
+#include <netinet/in.h>
+#include <net/route.h>
+#include <errno.h>
+#include <inet/ip.h>
+#include <string.h>
+#include <libinetutil.h>
+#include <unistd.h>
+#include <libipadm_impl.h>
+#include <sys/brand.h>
+
+#define ROUNDUP_LONG(a) \
+ ((a) > 0 ? (1 + (((a) - 1) | (sizeof (long) - 1))) : sizeof (long))
+#define HOST_MASK 0xffffffffU
+
+typedef struct ngz_walk_data_s {
+ ipadm_handle_t ngz_iph;
+ zoneid_t ngz_zoneid;
+ char *ngz_ifname;
+ boolean_t ngz_s10c;
+ ipadm_status_t ngz_ipstatus;
+ persist_cb_t ngz_persist_if;
+} ngz_walk_data_t;
+
+/*
+ * Tell the kernel to add, delete or change a route
+ */
+static void
+i_ipadm_rtioctl4(int rtsock,
+ int action, /* RTM_DELETE, etc */
+ in_addr_t dst,
+ in_addr_t gate,
+ uint_t masklen,
+ char *ifname,
+ uint8_t metric,
+ int flags)
+{
+ static int rt_sock_seqno = 0;
+ struct {
+ struct rt_msghdr w_rtm;
+ struct sockaddr_in w_dst;
+ struct sockaddr_in w_gate;
+ uint8_t w_space[512];
+ } w;
+ struct sockaddr_in w_mask;
+ struct sockaddr_dl w_ifp;
+ uint8_t *cp;
+ long cc;
+
+again:
+ (void) memset(&w, 0, sizeof (w));
+ (void) memset(&w_mask, 0, sizeof (w_mask));
+ (void) memset(&w_ifp, 0, sizeof (w_ifp));
+ cp = w.w_space;
+ w.w_rtm.rtm_msglen = sizeof (struct rt_msghdr) +
+ 2 * ROUNDUP_LONG(sizeof (struct sockaddr_in));
+ w.w_rtm.rtm_version = RTM_VERSION;
+ w.w_rtm.rtm_type = action;
+ w.w_rtm.rtm_flags = (flags | RTF_ZONE);
+ w.w_rtm.rtm_seq = ++rt_sock_seqno;
+ w.w_rtm.rtm_addrs = RTA_DST|RTA_GATEWAY;
+ if (metric != 0 || action == RTM_CHANGE) {
+ w.w_rtm.rtm_rmx.rmx_hopcount = metric;
+ w.w_rtm.rtm_inits |= RTV_HOPCOUNT;
+ }
+ w.w_dst.sin_family = AF_INET;
+ w.w_dst.sin_addr.s_addr = dst;
+ w.w_gate.sin_family = AF_INET;
+ w.w_gate.sin_addr.s_addr = gate;
+ if (masklen == HOST_MASK) {
+ w.w_rtm.rtm_flags |= RTF_HOST;
+ } else {
+ struct sockaddr_storage m4;
+
+ w.w_rtm.rtm_addrs |= RTA_NETMASK;
+ w_mask.sin_family = AF_INET;
+ if (plen2mask(masklen, AF_INET, &m4) != 0) {
+ return;
+ }
+ w_mask.sin_addr = ((struct sockaddr_in *)&m4)->sin_addr;
+ (void) memmove(cp, &w_mask, sizeof (w_mask));
+ cp += ROUNDUP_LONG(sizeof (struct sockaddr_in));
+ w.w_rtm.rtm_msglen += ROUNDUP_LONG(sizeof (struct sockaddr_in));
+ }
+ w_ifp.sdl_family = AF_LINK;
+ w.w_rtm.rtm_addrs |= RTA_IFP;
+ w_ifp.sdl_index = if_nametoindex(ifname);
+ (void) memmove(cp, &w_ifp, sizeof (w_ifp));
+ w.w_rtm.rtm_msglen += ROUNDUP_LONG(sizeof (struct sockaddr_dl));
+
+ cc = write(rtsock, &w, w.w_rtm.rtm_msglen);
+ if (cc < 0) {
+ if (errno == ESRCH && (action == RTM_CHANGE ||
+ action == RTM_DELETE)) {
+ if (action == RTM_CHANGE) {
+ action = RTM_ADD;
+ goto again;
+ }
+ return;
+ }
+ return;
+ } else if (cc != w.w_rtm.rtm_msglen) {
+ return;
+ }
+}
+
+static void
+i_ipadm_rtioctl6(int rtsock,
+ int action, /* RTM_DELETE, etc */
+ in6_addr_t dst,
+ in6_addr_t gate,
+ uint_t prefix_length,
+ char *ifname,
+ int flags)
+{
+ static int rt_sock_seqno = 0;
+ struct {
+ struct rt_msghdr w_rtm;
+ struct sockaddr_in6 w_dst;
+ struct sockaddr_in6 w_gate;
+ uint8_t w_space[512];
+ } w;
+ struct sockaddr_in6 w_mask;
+ struct sockaddr_dl w_ifp;
+ uint8_t *cp;
+ long cc;
+
+again:
+ (void) memset(&w, 0, sizeof (w));
+ (void) memset(&w_mask, 0, sizeof (w_mask));
+ (void) memset(&w_ifp, 0, sizeof (w_ifp));
+ cp = w.w_space;
+ w.w_rtm.rtm_msglen = sizeof (struct rt_msghdr) +
+ 2 * ROUNDUP_LONG(sizeof (struct sockaddr_in6));
+ w.w_rtm.rtm_version = RTM_VERSION;
+ w.w_rtm.rtm_type = action;
+ w.w_rtm.rtm_flags = (flags | RTF_ZONE);
+ w.w_rtm.rtm_seq = ++rt_sock_seqno;
+ w.w_rtm.rtm_addrs = RTA_DST|RTA_GATEWAY;
+ w.w_dst.sin6_family = AF_INET6;
+ w.w_dst.sin6_addr = dst;
+ w.w_gate.sin6_family = AF_INET6;
+ w.w_gate.sin6_addr = gate;
+ if (prefix_length == IPV6_ABITS) {
+ w.w_rtm.rtm_flags |= RTF_HOST;
+ } else {
+ struct sockaddr_storage m6;
+
+ w.w_rtm.rtm_addrs |= RTA_NETMASK;
+ w_mask.sin6_family = AF_INET6;
+ if (plen2mask(prefix_length, AF_INET6, &m6) != 0) {
+ return;
+ }
+ w_mask.sin6_addr = ((struct sockaddr_in6 *)&m6)->sin6_addr;
+ (void) memmove(cp, &w_mask, sizeof (w_mask));
+ cp += ROUNDUP_LONG(sizeof (struct sockaddr_in6));
+ w.w_rtm.rtm_msglen +=
+ ROUNDUP_LONG(sizeof (struct sockaddr_in6));
+ }
+ w_ifp.sdl_family = AF_LINK;
+ w.w_rtm.rtm_addrs |= RTA_IFP;
+ w_ifp.sdl_index = if_nametoindex(ifname);
+ (void) memmove(cp, &w_ifp, sizeof (w_ifp));
+ w.w_rtm.rtm_msglen += ROUNDUP_LONG(sizeof (struct sockaddr_dl));
+
+ cc = write(rtsock, &w, w.w_rtm.rtm_msglen);
+ if (cc < 0) {
+ if (errno == ESRCH && (action == RTM_CHANGE ||
+ action == RTM_DELETE)) {
+ if (action == RTM_CHANGE) {
+ action = RTM_ADD;
+ goto again;
+ }
+ return;
+ }
+ return;
+ } else if (cc != w.w_rtm.rtm_msglen) {
+ return;
+ }
+}
+
+/*
+ * Return TRUE if running in a Solaris 10 Container.
+ */
+static boolean_t
+i_ipadm_zone_is_s10c(zoneid_t zoneid)
+{
+ char brand[MAXNAMELEN];
+
+ if (zone_getattr(zoneid, ZONE_ATTR_BRAND, brand, sizeof (brand)) < 0)
+ return (B_FALSE);
+ return (strcmp(brand, NATIVE_BRAND_NAME) != 0);
+}
+
+/*
+ * Configure addresses on link. `buf' is a string of comma-separated
+ * IP addresses.
+ */
+static ipadm_status_t
+i_ipadm_ngz_addr(ipadm_handle_t iph, char *link, char *buf)
+{
+ ipadm_status_t ipstatus;
+ ipadm_addrobj_t ipaddr;
+ char *cp;
+
+ for (cp = strtok(buf, ","); cp != NULL; cp = strtok(NULL, ",")) {
+ ipstatus = ipadm_create_addrobj(IPADM_ADDR_STATIC, link,
+ &ipaddr);
+ if (ipstatus != IPADM_SUCCESS)
+ return (ipstatus);
+ /*
+ * ipadm_set_addr does the appropriate name resolution and
+ * sets up the ipadm_static_addr field.
+ */
+ ipstatus = ipadm_set_addr(ipaddr, cp, AF_UNSPEC);
+ if (ipstatus != IPADM_SUCCESS) {
+ ipadm_destroy_addrobj(ipaddr);
+ return (ipstatus);
+ }
+
+ ipstatus = ipadm_create_addr(iph, ipaddr,
+ (IPADM_OPT_ACTIVE | IPADM_OPT_UP));
+ if (ipstatus != IPADM_SUCCESS) {
+ ipadm_destroy_addrobj(ipaddr);
+ return (ipstatus);
+ }
+ ipadm_destroy_addrobj(ipaddr);
+ }
+ return (IPADM_SUCCESS);
+}
+
+/*
+ * The (*persist_if)() will set up persistent information for the interface,
+ * based on what interface families are required, so just resolve the
+ * address and inform the callback about the linkname, and required address
+ * families.
+ */
+static ipadm_status_t
+i_ipadm_ngz_persist_if(char *link, char *buf,
+ void (*ngz_persist_if)(char *, boolean_t, boolean_t))
+{
+ char *cp, *slashp, addr[INET6_ADDRSTRLEN];
+ ipadm_status_t ipstatus;
+ struct sockaddr_storage ss;
+ boolean_t v4 = B_FALSE;
+ boolean_t v6 = B_FALSE;
+
+ for (cp = strtok(buf, ","); cp != NULL; cp = strtok(NULL, ",")) {
+ /* remove the /<masklen> that's always added by zoneadmd */
+ slashp = strchr(cp, '/');
+ (void) strlcpy(addr, cp, (slashp - cp + 1));
+
+ /* resolve the address to find the family */
+ bzero(&ss, sizeof (ss));
+ ipstatus = i_ipadm_resolve_addr(addr, AF_UNSPEC, &ss);
+ if (ipstatus != IPADM_SUCCESS)
+ return (ipstatus);
+ switch (ss.ss_family) {
+ case AF_INET:
+ v4 = B_TRUE;
+ break;
+ case AF_INET6:
+ v6 = B_TRUE;
+ break;
+ default:
+ return (IPADM_BAD_ADDR);
+ }
+ }
+ (*ngz_persist_if)(link, v4, v6);
+ return (IPADM_SUCCESS);
+}
+
+static void
+i_ipadm_create_ngz_route(int rtsock, char *link, uint8_t *buf, size_t buflen)
+{
+ struct in6_addr defrouter;
+ boolean_t isv6;
+ struct in_addr gw4;
+ uint8_t *cp;
+ const in6_addr_t ipv6_all_zeros = { 0, 0, 0, 0 };
+
+ if (rtsock == -1)
+ return;
+
+ for (cp = buf; cp < buf + buflen; cp += sizeof (defrouter)) {
+ bcopy(cp, &defrouter, sizeof (defrouter));
+ if (IN6_IS_ADDR_UNSPECIFIED(&defrouter))
+ break;
+ isv6 = !IN6_IS_ADDR_V4MAPPED(&defrouter);
+ if (isv6) {
+ i_ipadm_rtioctl6(rtsock, RTM_ADD, ipv6_all_zeros,
+ defrouter, 0, link, RTF_GATEWAY);
+ } else {
+ IN6_V4MAPPED_TO_INADDR(&defrouter, &gw4);
+ i_ipadm_rtioctl4(rtsock, RTM_ADD, INADDR_ANY,
+ gw4.s_addr, 0, link, 0, RTF_GATEWAY);
+ }
+ }
+}
+
+/*
+ * Wrapper function to zone_getattr() for retrieving from-gz attributes that
+ * were made availabe for exclusive IP non-global zones by zoneadmd from teh
+ * global zone.
+ */
+static ipadm_status_t
+i_ipadm_zone_get_network(zoneid_t zoneid, datalink_id_t linkid, int type,
+ void *buf, size_t *bufsize)
+{
+ zone_net_data_t *zndata;
+
+ zndata = calloc(1, sizeof (*zndata) + *bufsize);
+ if (zndata == NULL)
+ return (IPADM_NO_MEMORY);
+ zndata->zn_type = type;
+ zndata->zn_linkid = linkid;
+ zndata->zn_len = *bufsize;
+
+ if (zone_getattr(zoneid, ZONE_ATTR_NETWORK, zndata,
+ sizeof (*zndata) + *bufsize) < 0) {
+ return (ipadm_errno2status(errno));
+ }
+ *bufsize = zndata->zn_len;
+ bcopy(zndata->zn_val, buf, *bufsize);
+ return (IPADM_SUCCESS);
+}
+
+/*
+ * Callback function that configures a single datalink in a non-global zone.
+ */
+static int
+i_ipadm_zone_network_attr(dladm_handle_t dh, datalink_id_t linkid, void *arg)
+{
+ ngz_walk_data_t *nwd = arg;
+ zoneid_t zoneid = nwd->ngz_zoneid;
+ uint8_t buf[PIPE_BUF];
+ dladm_status_t dlstatus;
+ ipadm_status_t ipstatus;
+ char link[MAXLINKNAMELEN];
+ ipadm_handle_t iph = nwd->ngz_iph;
+ int rtsock = iph->iph_rtsock;
+ char *ifname = nwd->ngz_ifname;
+ boolean_t s10c = nwd->ngz_s10c;
+ boolean_t is_ipmgmtd = (iph->iph_flags & IPH_IPMGMTD);
+ size_t bufsize = sizeof (buf);
+
+ bzero(buf, bufsize);
+ ipstatus = i_ipadm_zone_get_network(zoneid, linkid,
+ ZONE_NETWORK_ADDRESS, buf, &bufsize);
+ if (ipstatus != IPADM_SUCCESS)
+ goto fail;
+
+ dlstatus = dladm_datalink_id2info(dh, linkid, NULL, NULL,
+ NULL, link, sizeof (link));
+ if (dlstatus != DLADM_STATUS_OK)
+ return (DLADM_WALK_CONTINUE);
+
+ /*
+ * if ifname has been specified, then skip interfaces that don't match
+ */
+ if (ifname != NULL && strcmp(ifname, link) != 0)
+ return (DLADM_WALK_CONTINUE);
+
+ /*
+ * Plumb the interface and configure addresses on for S10 Containers.
+ * We need to always do this for S10C because ipadm persistent
+ * configuration is not available in S10C. For ipkg zones,
+ * we skip the actual plumbing/configuration, but will call the
+ * (*ngz_persist_if)() callback to create the persistent state for the
+ * interface. The interface will be configured in ipkg zones when
+ * ipadm_enable_if() is invoked to restore persistent configuration.
+ */
+ if (is_ipmgmtd && !s10c) {
+ (void) i_ipadm_ngz_persist_if(link, (char *)buf,
+ nwd->ngz_persist_if);
+ return (DLADM_WALK_CONTINUE);
+ }
+ ipstatus = i_ipadm_ngz_addr(iph, link, (char *)buf);
+ if (ipstatus != IPADM_SUCCESS)
+ goto fail;
+
+ /* apply any default router information. */
+ bufsize = sizeof (buf);
+ bzero(buf, bufsize);
+ ipstatus = i_ipadm_zone_get_network(zoneid, linkid,
+ ZONE_NETWORK_DEFROUTER, buf, &bufsize);
+ if (ipstatus != IPADM_SUCCESS)
+ goto fail;
+
+ i_ipadm_create_ngz_route(rtsock, link, buf, bufsize);
+
+ return (DLADM_WALK_CONTINUE);
+fail:
+ if (ifname != NULL) {
+ nwd->ngz_ipstatus = ipstatus;
+ return (DLADM_WALK_TERMINATE);
+ }
+ return (DLADM_WALK_CONTINUE);
+}
+
+/*
+ * ipmgmt_net_from_gz_init() initializes exclusive-IP stack non-global zones by
+ * extracting configuration that has been saved in the kernel and applying
+ * that information to the appropriate datalinks for the zone. If an ifname
+ * argument is passed in, only the selected IP interface corresponding to
+ * datalink will be initialized, otherwise all datalinks will be plumbed for IP
+ * and IP address and route information will be configured.
+ */
+ipadm_status_t
+ipadm_init_net_from_gz(ipadm_handle_t iph, char *ifname,
+ void (*persist_if)(char *, boolean_t, boolean_t))
+{
+ ngz_walk_data_t nwd;
+ uint64_t flags;
+ dladm_handle_t dlh = iph->iph_dlh;
+ datalink_id_t linkid;
+
+ if (iph->iph_zoneid == GLOBAL_ZONEID)
+ return (IPADM_NOTSUP);
+
+ if (ifname != NULL &&
+ i_ipadm_get_flags(iph, ifname, AF_INET, &flags) != IPADM_SUCCESS &&
+ i_ipadm_get_flags(iph, ifname, AF_INET6, &flags) != IPADM_SUCCESS)
+ return (IPADM_ENXIO);
+
+ if (ifname != NULL && !(flags & IFF_L3PROTECT))
+ return (IPADM_SUCCESS); /* nothing to initialize */
+
+ nwd.ngz_iph = iph;
+ nwd.ngz_zoneid = iph->iph_zoneid;
+ nwd.ngz_ifname = ifname;
+ nwd.ngz_persist_if = persist_if;
+ nwd.ngz_s10c = i_ipadm_zone_is_s10c(iph->iph_zoneid);
+ nwd.ngz_ipstatus = IPADM_SUCCESS;
+ if (ifname != NULL) {
+ if (dladm_name2info(dlh, ifname, &linkid, NULL, NULL,
+ NULL) != DLADM_STATUS_OK) {
+ return (IPADM_ENXIO);
+ }
+ (void) i_ipadm_zone_network_attr(dlh, linkid, &nwd);
+ } else {
+ (void) dladm_walk_datalink_id(i_ipadm_zone_network_attr, dlh,
+ &nwd, DATALINK_CLASS_ALL, DATALINK_ANY_MEDIATYPE,
+ DLADM_OPT_PERSIST);
+ }
+ return (nwd.ngz_ipstatus);
+}