nsjail/net.c

369 lines
9.0 KiB
C
Raw Normal View History

2015-05-15 05:44:48 +08:00
/*
nsjail - networking routines
-----------------------------------------
Copyright 2014 Google Inc. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
#include "net.h"
#include <arpa/inet.h>
#include <errno.h>
2016-02-29 07:14:36 +08:00
#include <net/if.h>
#include <net/route.h>
#include <netinet/ip6.h>
#include <netinet/tcp.h>
2015-05-15 05:44:48 +08:00
#include <sched.h>
#include <stdio.h>
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
#include <strings.h>
2016-02-29 07:14:36 +08:00
#include <sys/ioctl.h>
#include <sys/resource.h>
2015-05-15 05:44:48 +08:00
#include <sys/socket.h>
#include <sys/time.h>
2015-05-15 05:44:48 +08:00
#include <sys/types.h>
#include <sys/wait.h>
2015-05-15 05:44:48 +08:00
#include <unistd.h>
#include "log.h"
2016-02-29 07:14:36 +08:00
static bool netSystemSbinIp(struct nsjconf_t *nsjconf, char *const *argv)
{
2016-02-29 07:14:36 +08:00
if (nsjconf->clone_newnet == false) {
LOG_W
("CLONE_NEWNET not enabled. All changes would affect the global networking namespace");
return false;
}
int pid = fork();
if (pid == -1) {
PLOG_E("fork()");
return false;
}
if (pid == 0) {
2016-02-29 06:40:34 +08:00
fexecve(nsjconf->sbinip_fd, argv, environ);
PLOG_E("fexecve('fd=%d')", nsjconf->sbinip_fd);
_exit(1);
}
for (;;) {
int status;
while (wait4(pid, &status, __WALL, NULL) != pid) ;
if (WIFEXITED(status)) {
if (WEXITSTATUS(status) == 0) {
return true;
}
2016-02-29 06:40:34 +08:00
LOG_W("'/sbin/ip' returned with exit status: %d", WEXITSTATUS(status));
return false;
}
if (WIFSIGNALED(status)) {
2016-02-29 06:40:34 +08:00
LOG_W("'/sbin/ip' killed with signal: %d", WTERMSIG(status));
return false;
}
if (WIFSTOPPED(status)) {
continue;
}
if (WIFCONTINUED(status)) {
continue;
}
2016-02-29 07:14:36 +08:00
LOG_W("Unknown exit status for '/sbin/ip' (pid=%d): %d", pid, status);
kill(pid, SIGKILL);
}
}
/*
 * Interface name used in this file: netCloneMacVtapAndNS() passes it as the
 * "name" argument of 'ip link set', and netConfigureVs() configures and brings
 * up the interface carrying this name.
 */
#define IFACE_NAME "vs"
bool netCloneMacVtapAndNS(struct nsjconf_t *nsjconf, int pid)
{
if (nsjconf->iface == NULL) {
return true;
}
2016-02-29 07:14:36 +08:00
char iface[IF_NAMESIZE];
2016-02-28 23:52:37 +08:00
snprintf(iface, sizeof(iface), "NS.TAP.%d", pid);
char *const argv_add[] =
2016-02-29 06:40:34 +08:00
{ "ip", "link", "add", "link", nsjconf->iface, iface, "type", "macvtap", NULL };
if (netSystemSbinIp(nsjconf, argv_add) == false) {
LOG_E("Couldn't create MACVTAP interface for '%s'", nsjconf->iface);
return false;
}
char pid_str[256];
snprintf(pid_str, sizeof(pid_str), "%d", pid);
2015-08-16 02:10:07 +08:00
char *const argv_netns[] =
{ "ip", "link", "set", "dev", iface, "netns", pid_str, "name", IFACE_NAME,
2016-02-29 06:23:24 +08:00
NULL
};
2016-02-29 06:40:34 +08:00
if (netSystemSbinIp(nsjconf, argv_netns) == false) {
LOG_E("Couldn't put interface '%s' into NS of PID '%d'", iface, pid);
return false;
}
return true;
}
2015-05-15 05:44:48 +08:00
/*
 * Tells whether 'fd' is a socket by querying its SO_TYPE option: the query
 * only succeeds on sockets. Returns false for any fd on which getsockopt()
 * fails (including invalid descriptors).
 */
static bool netIsSocket(int fd)
{
	int sock_type;
	socklen_t len = sizeof(sock_type);

	return getsockopt(fd, SOL_SOCKET, SO_TYPE, &sock_type, &len) != -1;
}
/*
 * Enforces nsjconf->max_conns_per_ip for the peer of 'connsock'.
 *
 * Counts the entries of nsjconf->pids whose remote_addr carries the same IPv6
 * address as the peer of 'connsock'. Returns false (and logs a warning) when
 * that count has already reached the limit, true otherwise. A limit of 0
 * disables the check.
 */
bool netLimitConns(struct nsjconf_t * nsjconf, int connsock)
{
	/* 0 means 'unlimited' */
	if (nsjconf->max_conns_per_ip == 0) {
		return true;
	}

	/*
	 * netConnToText() leaves 'addr' untouched when connsock is not a socket or
	 * when getpeername() fails, so start from a well-defined (all-zero) value
	 * instead of comparing indeterminate stack contents.
	 */
	struct sockaddr_in6 addr;
	memset(&addr, 0, sizeof(addr));
	char cs_addr[64];
	netConnToText(connsock, true /* remote */ , cs_addr, sizeof(cs_addr), &addr);

	unsigned int cnt = 0;
	struct pids_t *p;
	TAILQ_FOREACH(p, &nsjconf->pids, pointers) {
		/* Compare the whole 16-byte address, not just its first byte */
		if (memcmp
		    (addr.sin6_addr.s6_addr, p->remote_addr.sin6_addr.s6_addr,
		     sizeof(addr.sin6_addr.s6_addr)) == 0) {
			cnt++;
		}
	}

	if (cnt >= nsjconf->max_conns_per_ip) {
		LOG_W("Rejecting connection from '%s', max_conns_per_ip limit reached: %u", cs_addr,
		      nsjconf->max_conns_per_ip);
		return false;
	}

	return true;
}
2016-02-26 01:27:48 +08:00
/*
 * Creates an AF_INET6 TCP socket bound to bindhost:port and puts it into the
 * listening state (SO_REUSEADDR is set before bind()).
 *
 * bindhost: textual IPv6 address accepted by inet_pton(AF_INET6, ...)
 * port:     TCP port, must be within 1..65535
 *
 * Returns the listening descriptor, or -1 on failure. The socket is closed on
 * every failure path after it has been created.
 */
int netGetRecvSocket(const char *bindhost, int port)
{
	if (port < 1 || port > 65535) {
		LOG_F("TCP port %d out of bounds (1 <= port <= 65535)", port);
		/* NOTE(review): LOG_F presumably terminates; return anyway in case it doesn't */
		return -1;
	}

	struct in6_addr in6a;
	if (inet_pton(AF_INET6, bindhost, &in6a) != 1) {
		PLOG_E("Couldn't convert '%s' into AF_INET6 address", bindhost);
		return -1;
	}

	int sockfd = socket(AF_INET6, SOCK_STREAM, 0);
	if (sockfd == -1) {
		PLOG_E("socket(AF_INET6)");
		return -1;
	}

	int so = 1;
	if (setsockopt(sockfd, SOL_SOCKET, SO_REUSEADDR, &so, sizeof(so)) == -1) {
		PLOG_E("setsockopt(%d, SO_REUSEADDR)", sockfd);
		close(sockfd);
		return -1;
	}

	struct sockaddr_in6 addr = {
		.sin6_family = AF_INET6,
		.sin6_port = htons(port),
		.sin6_flowinfo = 0,
		.sin6_addr = in6a,
		.sin6_scope_id = 0,
	};
	if (bind(sockfd, (struct sockaddr *)&addr, sizeof(addr)) == -1) {
		PLOG_E("bind(host:[%s], port:%d)", bindhost, port);
		close(sockfd);
		return -1;
	}

	if (listen(sockfd, SOMAXCONN) == -1) {
		PLOG_E("listen(%d)", SOMAXCONN);
		close(sockfd);
		return -1;
	}

	char ss_addr[64];
	netConnToText(sockfd, false /* remote */ , ss_addr, sizeof(ss_addr), NULL);
	LOG_I("Listening on %s", ss_addr);

	return sockfd;
}
/*
 * Accepts one connection on 'listenfd', logs both endpoints and tries to
 * enable TCP_CORK on the new socket (a failure there is only warned about).
 *
 * Returns the connected descriptor, or -1 if accept() failed; an EINTR
 * failure is not logged.
 */
int netAcceptConn(int listenfd)
{
	struct sockaddr_in6 peer;
	socklen_t peer_len = sizeof(peer);

	int connfd = accept(listenfd, (struct sockaddr *)&peer, &peer_len);
	if (connfd == -1) {
		if (errno == EINTR) {
			return -1;
		}
		PLOG_E("accept(%d)", listenfd);
		return -1;
	}

	char remote_txt[64];
	char local_txt[64];
	netConnToText(connfd, true /* remote */ , remote_txt, sizeof(remote_txt), NULL);
	netConnToText(connfd, false /* remote */ , local_txt, sizeof(local_txt), NULL);
	LOG_I("New connection from: %s on: %s", remote_txt, local_txt);

	int cork = 1;
	if (setsockopt(connfd, SOL_TCP, TCP_CORK, &cork, sizeof(cork)) == -1) {
		PLOG_W("setsockopt(%d, TCP_CORK)", connfd);
	}

	return connfd;
}
/*
 * Writes a textual "[address]:port" description of one endpoint of 'fd' into
 * buf (at most 's' bytes, always via snprintf).
 *
 * fd:           descriptor to describe
 * remote:       true -> peer address (getpeername), false -> local address
 *               (getsockname)
 * buf, s:       output buffer and its size
 * addr_or_null: if non-NULL, receives a copy of the raw socket address; it is
 *               left untouched when fd is not a socket or the address lookup
 *               fails
 *
 * Special outputs: "[STANDALONE_MODE]" when fd is not a socket, "[unknown]"
 * when the address lookup fails, "[unknown]:port" when inet_ntop() fails.
 */
void netConnToText(int fd, bool remote, char *buf, size_t s, struct sockaddr_in6 *addr_or_null)
{
	if (netIsSocket(fd) == false) {
		snprintf(buf, s, "[STANDALONE_MODE]");
		return;
	}

	struct sockaddr_in6 addr;
	socklen_t addrlen = sizeof(addr);
	if (remote) {
		if (getpeername(fd, (struct sockaddr *)&addr, &addrlen) == -1) {
			PLOG_W("getpeername(%d)", fd);
			snprintf(buf, s, "[unknown]");
			return;
		}
	} else {
		if (getsockname(fd, (struct sockaddr *)&addr, &addrlen) == -1) {
			PLOG_W("getsockname(%d)", fd);
			snprintf(buf, s, "[unknown]");
			return;
		}
	}

	if (addr_or_null) {
		memcpy(addr_or_null, &addr, sizeof(*addr_or_null));
	}

	/*
	 * Fixed-size scratch buffer large enough for any textual IPv6 address;
	 * avoids a caller-sized VLA (undefined for s == 0, unbounded stack use).
	 */
	char tmp[INET6_ADDRSTRLEN];
	if (inet_ntop(AF_INET6, addr.sin6_addr.s6_addr, tmp, sizeof(tmp)) == NULL) {
		PLOG_W("inet_ntop()");
		snprintf(buf, s, "[unknown]:%hu", ntohs(addr.sin6_port));
		return;
	}

	snprintf(buf, s, "[%s]:%hu", tmp, ntohs(addr.sin6_port));
}
2016-02-29 07:14:36 +08:00
bool netIfaceUp(const char *ifacename)
{
int sock = socket(AF_INET, SOCK_STREAM, IPPROTO_IP);
if (sock == -1) {
PLOG_E("socket(AF_INET, SOCK_STREAM, IPPROTO_IP)");
return false;
}
struct ifreq ifr;
snprintf(ifr.ifr_name, IF_NAMESIZE, "%s", ifacename);
if (ioctl(sock, SIOCGIFFLAGS, &ifr) == -1) {
PLOG_E("ioctl(iface='%s', SIOCGIFFLAGS, IFF_UP)", ifacename);
2016-02-29 07:14:36 +08:00
close(sock);
return false;
}
ifr.ifr_flags |= (IFF_UP | IFF_RUNNING);
if (ioctl(sock, SIOCSIFFLAGS, &ifr) == -1) {
PLOG_E("ioctl(iface='%s', SIOCSIFFLAGS, IFF_UP)", ifacename);
close(sock);
return false;
}
close(sock);
return true;
}
/*
 * Configures the IFACE_NAME interface from the values stored in nsjconf:
 *   1. sets its IPv4 address        (nsjconf->iface_vs_ip, SIOCSIFADDR)
 *   2. sets its IPv4 netmask        (nsjconf->iface_vs_nm, SIOCSIFNETMASK)
 *   3. brings it up                 (netIfaceUp)
 *   4. adds a route with destination 0.0.0.0, mask 0.0.0.0 and gateway
 *      nsjconf->iface_vs_gw         (SIOCADDRT, RTF_UP | RTF_GATEWAY)
 *
 * Returns true if every step succeeds, false on the first failure. The helper
 * socket is closed on every path, including a netIfaceUp() failure.
 */
bool netConfigureVs(struct nsjconf_t * nsjconf)
{
	struct ifreq ifr;
	/* Zero the request so no indeterminate bytes are handed to the kernel */
	memset(&ifr, '\0', sizeof(ifr));
	snprintf(ifr.ifr_name, IF_NAMESIZE, "%s", IFACE_NAME);
	struct in_addr addr;

	int sock = socket(AF_INET, SOCK_STREAM, IPPROTO_IP);
	if (sock == -1) {
		PLOG_E("socket(AF_INET, SOCK_STREAM, IPPROTO_IP)");
		return false;
	}

	bool ret = false;

	/* 1. Interface address */
	if (inet_pton(AF_INET, nsjconf->iface_vs_ip, &addr) != 1) {
		PLOG_E("Cannot convert '%s' into an IPv4 address", nsjconf->iface_vs_ip);
		goto out;
	}
	struct sockaddr_in *sa = (struct sockaddr_in *)(&ifr.ifr_addr);
	sa->sin_family = AF_INET;
	sa->sin_addr = addr;
	if (ioctl(sock, SIOCSIFADDR, &ifr) == -1) {
		PLOG_E("ioctl(iface='%s', SIOCSIFADDR, '%s')", IFACE_NAME, nsjconf->iface_vs_ip);
		goto out;
	}

	/* 2. Netmask */
	if (inet_pton(AF_INET, nsjconf->iface_vs_nm, &addr) != 1) {
		PLOG_E("Cannot convert '%s' into an IPv4 netmask", nsjconf->iface_vs_nm);
		goto out;
	}
	sa->sin_family = AF_INET;
	sa->sin_addr = addr;
	if (ioctl(sock, SIOCSIFNETMASK, &ifr) == -1) {
		PLOG_E("ioctl(iface='%s', SIOCSIFNETMASK, '%s')", IFACE_NAME, nsjconf->iface_vs_nm);
		goto out;
	}

	/* 3. Bring the interface up before adding the route */
	if (netIfaceUp(IFACE_NAME) == false) {
		goto out;
	}

	/* 4. Route: destination 0.0.0.0 / mask 0.0.0.0 via the configured gateway */
	if (inet_pton(AF_INET, nsjconf->iface_vs_gw, &addr) != 1) {
		PLOG_E("Cannot convert '%s' into an IPv4 GW address", nsjconf->iface_vs_gw);
		goto out;
	}
	struct rtentry rt;
	memset(&rt, '\0', sizeof(rt));
	struct sockaddr_in *sdest = (struct sockaddr_in *)(&rt.rt_dst);
	struct sockaddr_in *smask = (struct sockaddr_in *)(&rt.rt_genmask);
	struct sockaddr_in *sgate = (struct sockaddr_in *)(&rt.rt_gateway);
	sdest->sin_family = AF_INET;
	sdest->sin_addr.s_addr = INADDR_ANY;
	smask->sin_family = AF_INET;
	smask->sin_addr.s_addr = INADDR_ANY;
	sgate->sin_family = AF_INET;
	sgate->sin_addr = addr;
	rt.rt_flags = RTF_UP | RTF_GATEWAY;
	if (ioctl(sock, SIOCADDRT, &rt) == -1) {
		PLOG_E("ioctl(SIOCADDRT, '%s')", nsjconf->iface_vs_gw);
		goto out;
	}

	ret = true;

 out:
	close(sock);
	return ret;
}