Type: fix Change-Id: I0ce8183ded601bdab031c9689ca361414fed165f Signed-off-by: Nathan Skrzypczak <nathan.skrzypczak@gmail.com>
639 lines
15 KiB
C
639 lines
15 KiB
C
/*
|
|
* Copyright (c) 2015 Cisco and/or its affiliates.
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at:
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
/*
|
|
Copyright (c) 2001, 2002, 2003, 2005 Eliot Dresselhaus
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining
|
|
a copy of this software and associated documentation files (the
|
|
"Software"), to deal in the Software without restriction, including
|
|
without limitation the rights to use, copy, modify, merge, publish,
|
|
distribute, sublicense, and/or sell copies of the Software, and to
|
|
permit persons to whom the Software is furnished to do so, subject to
|
|
the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be
|
|
included in all copies or substantial portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
|
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
|
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
|
|
LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
|
|
OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
|
WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <string.h> /* strchr */
|
|
#define __USE_GNU
|
|
#define _GNU_SOURCE
|
|
#include <sys/types.h>
|
|
#include <sys/socket.h>
|
|
#include <sys/un.h>
|
|
#include <sys/stat.h>
|
|
#include <netinet/in.h>
|
|
#include <arpa/inet.h>
|
|
#include <netdb.h>
|
|
#include <unistd.h>
|
|
#include <fcntl.h>
|
|
|
|
#include <vppinfra/mem.h>
|
|
#include <vppinfra/vec.h>
|
|
#include <vppinfra/socket.h>
|
|
#include <vppinfra/linux/netns.h>
|
|
#include <vppinfra/format.h>
|
|
#include <vppinfra/error.h>
|
|
|
|
#ifndef __GLIBC__
|
|
/* IPPORT_USERRESERVED is not part of musl libc. */
|
|
#define IPPORT_USERRESERVED 5000
|
|
#endif
|
|
|
|
__clib_export void
|
|
clib_socket_tx_add_formatted (clib_socket_t * s, char *fmt, ...)
|
|
{
|
|
va_list va;
|
|
va_start (va, fmt);
|
|
clib_socket_tx_add_va_formatted (s, fmt, &va);
|
|
va_end (va);
|
|
}
|
|
|
|
/* Return and bind to an unused port. */
|
|
static word
|
|
find_free_port (word sock)
|
|
{
|
|
word port;
|
|
|
|
for (port = IPPORT_USERRESERVED; port < 1 << 16; port++)
|
|
{
|
|
struct sockaddr_in a;
|
|
|
|
clib_memset (&a, 0, sizeof (a)); /* Warnings be gone */
|
|
|
|
a.sin_family = PF_INET;
|
|
a.sin_addr.s_addr = INADDR_ANY;
|
|
a.sin_port = htons (port);
|
|
|
|
if (bind (sock, (struct sockaddr *) &a, sizeof (a)) >= 0)
|
|
break;
|
|
}
|
|
|
|
return port < 1 << 16 ? port : -1;
|
|
}
|
|
|
|
/* Convert a config string to a struct sockaddr and length for use
|
|
with bind or connect. */
|
|
static clib_error_t *
|
|
socket_config (char *config,
|
|
void *addr, socklen_t * addr_len, u32 ip4_default_address)
|
|
{
|
|
clib_error_t *error = 0;
|
|
|
|
if (!config)
|
|
config = "";
|
|
|
|
/* Anything that begins with a / is a local PF_LOCAL socket. */
|
|
if (config[0] == '/')
|
|
{
|
|
struct sockaddr_un *su = addr;
|
|
su->sun_family = PF_LOCAL;
|
|
clib_memcpy (&su->sun_path, config,
|
|
clib_min (sizeof (su->sun_path), 1 + strlen (config)));
|
|
*addr_len = sizeof (su[0]);
|
|
}
|
|
|
|
/* Treat everything that starts with @ as an abstract socket. */
|
|
else if (config[0] == '@')
|
|
{
|
|
struct sockaddr_un *su = addr;
|
|
su->sun_family = PF_LOCAL;
|
|
clib_memcpy (&su->sun_path, config,
|
|
clib_min (sizeof (su->sun_path), 1 + strlen (config)));
|
|
|
|
*addr_len = sizeof (su->sun_family) + strlen (config);
|
|
su->sun_path[0] = '\0';
|
|
}
|
|
|
|
/* Hostname or hostname:port or port. */
|
|
else
|
|
{
|
|
char *host_name;
|
|
int port = -1;
|
|
struct sockaddr_in *sa = addr;
|
|
|
|
host_name = 0;
|
|
port = -1;
|
|
if (config[0] != 0)
|
|
{
|
|
unformat_input_t i;
|
|
|
|
unformat_init_string (&i, config, strlen (config));
|
|
if (unformat (&i, "%s:%d", &host_name, &port)
|
|
|| unformat (&i, "%s:0x%x", &host_name, &port))
|
|
;
|
|
else if (unformat (&i, "%s", &host_name))
|
|
;
|
|
else
|
|
error = clib_error_return (0, "unknown input `%U'",
|
|
format_unformat_error, &i);
|
|
unformat_free (&i);
|
|
|
|
if (error)
|
|
goto done;
|
|
}
|
|
|
|
sa->sin_family = PF_INET;
|
|
*addr_len = sizeof (sa[0]);
|
|
if (port != -1)
|
|
sa->sin_port = htons (port);
|
|
else
|
|
sa->sin_port = 0;
|
|
|
|
if (host_name)
|
|
{
|
|
struct in_addr host_addr;
|
|
|
|
/* Recognize localhost to avoid host lookup in most common cast. */
|
|
if (!strcmp (host_name, "localhost"))
|
|
sa->sin_addr.s_addr = htonl (INADDR_LOOPBACK);
|
|
|
|
else if (inet_aton (host_name, &host_addr))
|
|
sa->sin_addr = host_addr;
|
|
|
|
else if (host_name && strlen (host_name) > 0)
|
|
{
|
|
struct hostent *host = gethostbyname (host_name);
|
|
if (!host)
|
|
error = clib_error_return (0, "unknown host `%s'", config);
|
|
else
|
|
clib_memcpy (&sa->sin_addr.s_addr, host->h_addr_list[0],
|
|
host->h_length);
|
|
}
|
|
|
|
else
|
|
sa->sin_addr.s_addr = htonl (ip4_default_address);
|
|
|
|
vec_free (host_name);
|
|
if (error)
|
|
goto done;
|
|
}
|
|
}
|
|
|
|
done:
|
|
return error;
|
|
}
|
|
|
|
static clib_error_t *
|
|
default_socket_write (clib_socket_t * s)
|
|
{
|
|
clib_error_t *err = 0;
|
|
word written = 0;
|
|
word fd = 0;
|
|
word tx_len;
|
|
|
|
fd = s->fd;
|
|
|
|
/* Map standard input to standard output.
|
|
Typically, fd is a socket for which read/write both work. */
|
|
if (fd == 0)
|
|
fd = 1;
|
|
|
|
tx_len = vec_len (s->tx_buffer);
|
|
written = write (fd, s->tx_buffer, tx_len);
|
|
|
|
/* Ignore certain errors. */
|
|
if (written < 0 && !unix_error_is_fatal (errno))
|
|
written = 0;
|
|
|
|
/* A "real" error occurred. */
|
|
if (written < 0)
|
|
{
|
|
err = clib_error_return_unix (0, "write %wd bytes (fd %d, '%s')",
|
|
tx_len, s->fd, s->config);
|
|
vec_free (s->tx_buffer);
|
|
goto done;
|
|
}
|
|
|
|
/* Reclaim the transmitted part of the tx buffer on successful writes. */
|
|
else if (written > 0)
|
|
{
|
|
if (written == tx_len)
|
|
_vec_len (s->tx_buffer) = 0;
|
|
else
|
|
vec_delete (s->tx_buffer, written, 0);
|
|
}
|
|
|
|
/* If a non-fatal error occurred AND
|
|
the buffer is full, then we must free it. */
|
|
else if (written == 0 && tx_len > 64 * 1024)
|
|
{
|
|
vec_free (s->tx_buffer);
|
|
}
|
|
|
|
done:
|
|
return err;
|
|
}
|
|
|
|
static clib_error_t *
|
|
default_socket_read (clib_socket_t * sock, int n_bytes)
|
|
{
|
|
word fd, n_read;
|
|
u8 *buf;
|
|
|
|
/* RX side of socket is down once end of file is reached. */
|
|
if (sock->flags & CLIB_SOCKET_F_RX_END_OF_FILE)
|
|
return 0;
|
|
|
|
fd = sock->fd;
|
|
|
|
n_bytes = clib_max (n_bytes, 4096);
|
|
vec_add2 (sock->rx_buffer, buf, n_bytes);
|
|
|
|
if ((n_read = read (fd, buf, n_bytes)) < 0)
|
|
{
|
|
n_read = 0;
|
|
|
|
/* Ignore certain errors. */
|
|
if (!unix_error_is_fatal (errno))
|
|
goto non_fatal;
|
|
|
|
return clib_error_return_unix (0, "read %d bytes (fd %d, '%s')",
|
|
n_bytes, sock->fd, sock->config);
|
|
}
|
|
|
|
/* Other side closed the socket. */
|
|
if (n_read == 0)
|
|
sock->flags |= CLIB_SOCKET_F_RX_END_OF_FILE;
|
|
|
|
non_fatal:
|
|
_vec_len (sock->rx_buffer) += n_read - n_bytes;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static clib_error_t *
|
|
default_socket_close (clib_socket_t * s)
|
|
{
|
|
if (close (s->fd) < 0)
|
|
return clib_error_return_unix (0, "close (fd %d, %s)", s->fd, s->config);
|
|
return 0;
|
|
}
|
|
|
|
static clib_error_t *
|
|
default_socket_sendmsg (clib_socket_t * s, void *msg, int msglen,
|
|
int fds[], int num_fds)
|
|
{
|
|
struct msghdr mh = { 0 };
|
|
struct iovec iov[1];
|
|
char ctl[CMSG_SPACE (sizeof (int) * num_fds)];
|
|
int rv;
|
|
|
|
iov[0].iov_base = msg;
|
|
iov[0].iov_len = msglen;
|
|
mh.msg_iov = iov;
|
|
mh.msg_iovlen = 1;
|
|
|
|
if (num_fds > 0)
|
|
{
|
|
struct cmsghdr *cmsg;
|
|
clib_memset (&ctl, 0, sizeof (ctl));
|
|
mh.msg_control = ctl;
|
|
mh.msg_controllen = sizeof (ctl);
|
|
cmsg = CMSG_FIRSTHDR (&mh);
|
|
cmsg->cmsg_len = CMSG_LEN (sizeof (int) * num_fds);
|
|
cmsg->cmsg_level = SOL_SOCKET;
|
|
cmsg->cmsg_type = SCM_RIGHTS;
|
|
memcpy (CMSG_DATA (cmsg), fds, sizeof (int) * num_fds);
|
|
}
|
|
rv = sendmsg (s->fd, &mh, 0);
|
|
if (rv < 0)
|
|
return clib_error_return_unix (0, "sendmsg");
|
|
return 0;
|
|
}
|
|
|
|
|
|
static clib_error_t *
|
|
default_socket_recvmsg (clib_socket_t * s, void *msg, int msglen,
|
|
int fds[], int num_fds)
|
|
{
|
|
#ifdef __linux__
|
|
char ctl[CMSG_SPACE (sizeof (int) * num_fds) +
|
|
CMSG_SPACE (sizeof (struct ucred))];
|
|
struct ucred *cr = 0;
|
|
#else
|
|
char ctl[CMSG_SPACE (sizeof (int) * num_fds)];
|
|
#endif
|
|
struct msghdr mh = { 0 };
|
|
struct iovec iov[1];
|
|
ssize_t size;
|
|
struct cmsghdr *cmsg;
|
|
|
|
iov[0].iov_base = msg;
|
|
iov[0].iov_len = msglen;
|
|
mh.msg_iov = iov;
|
|
mh.msg_iovlen = 1;
|
|
mh.msg_control = ctl;
|
|
mh.msg_controllen = sizeof (ctl);
|
|
|
|
clib_memset (ctl, 0, sizeof (ctl));
|
|
|
|
/* receive the incoming message */
|
|
size = recvmsg (s->fd, &mh, 0);
|
|
if (size != msglen)
|
|
{
|
|
return (size == 0) ? clib_error_return (0, "disconnected") :
|
|
clib_error_return_unix (0, "recvmsg: malformed message (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
}
|
|
|
|
cmsg = CMSG_FIRSTHDR (&mh);
|
|
while (cmsg)
|
|
{
|
|
if (cmsg->cmsg_level == SOL_SOCKET)
|
|
{
|
|
#ifdef __linux__
|
|
if (cmsg->cmsg_type == SCM_CREDENTIALS)
|
|
{
|
|
cr = (struct ucred *) CMSG_DATA (cmsg);
|
|
s->uid = cr->uid;
|
|
s->gid = cr->gid;
|
|
s->pid = cr->pid;
|
|
}
|
|
else
|
|
#endif
|
|
if (cmsg->cmsg_type == SCM_RIGHTS)
|
|
{
|
|
clib_memcpy_fast (fds, CMSG_DATA (cmsg),
|
|
num_fds * sizeof (int));
|
|
}
|
|
}
|
|
cmsg = CMSG_NXTHDR (&mh, cmsg);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
socket_init_funcs (clib_socket_t * s)
|
|
{
|
|
if (!s->write_func)
|
|
s->write_func = default_socket_write;
|
|
if (!s->read_func)
|
|
s->read_func = default_socket_read;
|
|
if (!s->close_func)
|
|
s->close_func = default_socket_close;
|
|
if (!s->sendmsg_func)
|
|
s->sendmsg_func = default_socket_sendmsg;
|
|
if (!s->recvmsg_func)
|
|
s->recvmsg_func = default_socket_recvmsg;
|
|
}
|
|
|
|
__clib_export clib_error_t *
|
|
clib_socket_init (clib_socket_t * s)
|
|
{
|
|
union
|
|
{
|
|
struct sockaddr sa;
|
|
struct sockaddr_un su;
|
|
} addr;
|
|
socklen_t addr_len = 0;
|
|
int socket_type, rv;
|
|
clib_error_t *error = 0;
|
|
word port;
|
|
|
|
error = socket_config (s->config, &addr.sa, &addr_len,
|
|
(s->flags & CLIB_SOCKET_F_IS_SERVER
|
|
? INADDR_LOOPBACK : INADDR_ANY));
|
|
if (error)
|
|
goto done;
|
|
|
|
socket_init_funcs (s);
|
|
|
|
socket_type = s->flags & CLIB_SOCKET_F_SEQPACKET ?
|
|
SOCK_SEQPACKET : SOCK_STREAM;
|
|
|
|
s->fd = socket (addr.sa.sa_family, socket_type, 0);
|
|
if (s->fd < 0)
|
|
{
|
|
error = clib_error_return_unix (0, "socket (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
goto done;
|
|
}
|
|
|
|
port = 0;
|
|
if (addr.sa.sa_family == PF_INET)
|
|
port = ((struct sockaddr_in *) &addr)->sin_port;
|
|
|
|
if (s->flags & CLIB_SOCKET_F_IS_SERVER)
|
|
{
|
|
uword need_bind = 1;
|
|
|
|
if (addr.sa.sa_family == PF_INET)
|
|
{
|
|
if (port == 0)
|
|
{
|
|
port = find_free_port (s->fd);
|
|
if (port < 0)
|
|
{
|
|
error = clib_error_return (0, "no free port (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
goto done;
|
|
}
|
|
need_bind = 0;
|
|
}
|
|
}
|
|
if (addr.sa.sa_family == PF_LOCAL &&
|
|
((struct sockaddr_un *) &addr)->sun_path[0] != 0)
|
|
unlink (((struct sockaddr_un *) &addr)->sun_path);
|
|
|
|
/* Make address available for multiple users. */
|
|
{
|
|
int v = 1;
|
|
if (setsockopt (s->fd, SOL_SOCKET, SO_REUSEADDR, &v, sizeof (v)) < 0)
|
|
clib_unix_warning ("setsockopt SO_REUSEADDR fails");
|
|
}
|
|
|
|
#if __linux__
|
|
if (addr.sa.sa_family == PF_LOCAL && s->flags & CLIB_SOCKET_F_PASSCRED)
|
|
{
|
|
int x = 1;
|
|
if (setsockopt (s->fd, SOL_SOCKET, SO_PASSCRED, &x, sizeof (x)) < 0)
|
|
{
|
|
error = clib_error_return_unix (0, "setsockopt (SO_PASSCRED, "
|
|
"fd %d, '%s')", s->fd,
|
|
s->config);
|
|
goto done;
|
|
}
|
|
}
|
|
#endif
|
|
|
|
if (need_bind && bind (s->fd, &addr.sa, addr_len) < 0)
|
|
{
|
|
error = clib_error_return_unix (0, "bind (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
goto done;
|
|
}
|
|
|
|
if (listen (s->fd, 5) < 0)
|
|
{
|
|
error = clib_error_return_unix (0, "listen (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
goto done;
|
|
}
|
|
if (addr.sa.sa_family == PF_LOCAL &&
|
|
s->flags & CLIB_SOCKET_F_ALLOW_GROUP_WRITE &&
|
|
((struct sockaddr_un *) &addr)->sun_path[0] != 0)
|
|
{
|
|
struct stat st = { 0 };
|
|
if (stat (((struct sockaddr_un *) &addr)->sun_path, &st) < 0)
|
|
{
|
|
error = clib_error_return_unix (0, "stat (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
goto done;
|
|
}
|
|
st.st_mode |= S_IWGRP;
|
|
if (chmod (((struct sockaddr_un *) &addr)->sun_path, st.st_mode) <
|
|
0)
|
|
{
|
|
error =
|
|
clib_error_return_unix (0, "chmod (fd %d, '%s', mode %o)",
|
|
s->fd, s->config, st.st_mode);
|
|
goto done;
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
if ((s->flags & CLIB_SOCKET_F_NON_BLOCKING_CONNECT)
|
|
&& fcntl (s->fd, F_SETFL, O_NONBLOCK) < 0)
|
|
{
|
|
error = clib_error_return_unix (0, "fcntl NONBLOCK (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
goto done;
|
|
}
|
|
|
|
while ((rv = connect (s->fd, &addr.sa, addr_len)) < 0
|
|
&& errno == EAGAIN)
|
|
;
|
|
if (rv < 0 && !((s->flags & CLIB_SOCKET_F_NON_BLOCKING_CONNECT) &&
|
|
errno == EINPROGRESS))
|
|
{
|
|
error = clib_error_return_unix (0, "connect (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
goto done;
|
|
}
|
|
/* Connect was blocking so set fd to non-blocking now unless
|
|
* blocking mode explicitly requested. */
|
|
if (!(s->flags & CLIB_SOCKET_F_NON_BLOCKING_CONNECT) &&
|
|
!(s->flags & CLIB_SOCKET_F_BLOCKING) &&
|
|
fcntl (s->fd, F_SETFL, O_NONBLOCK) < 0)
|
|
{
|
|
error = clib_error_return_unix (0, "fcntl NONBLOCK2 (fd %d, '%s')",
|
|
s->fd, s->config);
|
|
goto done;
|
|
}
|
|
}
|
|
|
|
return error;
|
|
|
|
done:
|
|
if (s->fd > 0)
|
|
close (s->fd);
|
|
return error;
|
|
}
|
|
|
|
__clib_export clib_error_t *
|
|
clib_socket_init_netns (clib_socket_t *s, u8 *namespace)
|
|
{
|
|
if (namespace == NULL || namespace[0] == 0)
|
|
return clib_socket_init (s);
|
|
|
|
clib_error_t *error;
|
|
int old_netns_fd, nfd = -1;
|
|
|
|
old_netns_fd = clib_netns_open (NULL /* self */);
|
|
if ((nfd = clib_netns_open (namespace)) == -1)
|
|
{
|
|
error = clib_error_return_unix (0, "clib_netns_open '%s'", namespace);
|
|
goto done;
|
|
}
|
|
|
|
if (clib_setns (nfd) == -1)
|
|
{
|
|
error = clib_error_return_unix (0, "setns '%s'", namespace);
|
|
goto done;
|
|
}
|
|
|
|
error = clib_socket_init (s);
|
|
|
|
done:
|
|
if (clib_setns (old_netns_fd) == -1)
|
|
clib_warning ("Cannot set old ns");
|
|
|
|
close (old_netns_fd);
|
|
|
|
if (-1 != nfd)
|
|
close (nfd);
|
|
|
|
return error;
|
|
}
|
|
|
|
__clib_export clib_error_t *
|
|
clib_socket_accept (clib_socket_t * server, clib_socket_t * client)
|
|
{
|
|
clib_error_t *err = 0;
|
|
socklen_t len = 0;
|
|
|
|
clib_memset (client, 0, sizeof (client[0]));
|
|
|
|
/* Accept the new socket connection. */
|
|
client->fd = accept (server->fd, 0, 0);
|
|
if (client->fd < 0)
|
|
return clib_error_return_unix (0, "accept (fd %d, '%s')",
|
|
server->fd, server->config);
|
|
|
|
/* Set the new socket to be non-blocking. */
|
|
if (fcntl (client->fd, F_SETFL, O_NONBLOCK) < 0)
|
|
{
|
|
err = clib_error_return_unix (0, "fcntl O_NONBLOCK (fd %d)",
|
|
client->fd);
|
|
goto close_client;
|
|
}
|
|
|
|
/* Get peer info. */
|
|
len = sizeof (client->peer);
|
|
if (getpeername (client->fd, (struct sockaddr *) &client->peer, &len) < 0)
|
|
{
|
|
err = clib_error_return_unix (0, "getpeername (fd %d)", client->fd);
|
|
goto close_client;
|
|
}
|
|
|
|
client->flags = CLIB_SOCKET_F_IS_CLIENT;
|
|
|
|
socket_init_funcs (client);
|
|
return 0;
|
|
|
|
close_client:
|
|
close (client->fd);
|
|
return err;
|
|
}
|
|
|
|
/*
|
|
* fd.io coding-style-patch-verification: ON
|
|
*
|
|
* Local Variables:
|
|
* eval: (c-set-style "gnu")
|
|
* End:
|
|
*/
|