X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=lib%2Fsocket-util.c;h=935e7477771b494edcc09170c490492b1d62e913;hb=520e9a2acdcf6136bf0a20586df6351ecf72dd3e;hp=16a321c201804343bd285b56d41232422fefafe7;hpb=5136ce492c414f377f7be9ae32b259abb9f76580;p=openvswitch diff --git a/lib/socket-util.c b/lib/socket-util.c index 16a321c2..935e7477 100644 --- a/lib/socket-util.c +++ b/lib/socket-util.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2008, 2009, 2010 Nicira Networks. + * Copyright (c) 2008, 2009, 2010, 2011 Nicira Networks. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -19,6 +19,7 @@ #include #include #include +#include #include #include #include @@ -30,11 +31,33 @@ #include #include #include +#include "dynamic-string.h" #include "fatal-signal.h" +#include "packets.h" #include "util.h" #include "vlog.h" +#if AF_PACKET && __linux__ +#include +#endif +#ifdef HAVE_NETLINK +#include "netlink-protocol.h" +#include "netlink-socket.h" +#endif -VLOG_DEFINE_THIS_MODULE(socket_util) +VLOG_DEFINE_THIS_MODULE(socket_util); + +/* #ifdefs make it a pain to maintain code: you have to try to build both ways. + * Thus, this file compiles all of the code regardless of the target, by + * writing "if (LINUX)" instead of "#ifdef __linux__". */ +#ifdef __linux__ +#define LINUX 1 +#else +#define LINUX 0 +#endif + +#ifndef O_DIRECTORY +#define O_DIRECTORY 0 +#endif /* Sets 'fd' to non-blocking mode. Returns 0 if successful, otherwise a * positive errno value. */ @@ -98,25 +121,39 @@ get_max_fds(void) * address, into a numeric IP address in '*addr'. Returns 0 if successful, * otherwise a positive errno value. */ int -lookup_ip(const char *host_name, struct in_addr *addr) +lookup_ip(const char *host_name, struct in_addr *addr) { if (!inet_aton(host_name, addr)) { - struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 5); + static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 5); VLOG_ERR_RL(&rl, "\"%s\" is not a valid IP address", host_name); return ENOENT; } return 0; } +/* Translates 'host_name', which must be a string representation of an IPv6 + * address, into a numeric IPv6 address in '*addr'. Returns 0 if successful, + * otherwise a positive errno value. */ +int +lookup_ipv6(const char *host_name, struct in6_addr *addr) +{ + if (inet_pton(AF_INET6, host_name, addr) != 1) { + static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 5); + VLOG_ERR_RL(&rl, "\"%s\" is not a valid IPv6 address", host_name); + return ENOENT; + } + return 0; +} + /* Returns the error condition associated with socket 'fd' and resets the * socket's error status. */ int -get_socket_error(int fd) +get_socket_error(int fd) { int error; socklen_t len = sizeof(error); if (getsockopt(fd, SOL_SOCKET, SO_ERROR, &error, &len) < 0) { - struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(5, 10); + static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(5, 10); error = errno; VLOG_ERR_RL(&rl, "getsockopt(SO_ERROR): %s", strerror(error)); } @@ -124,7 +161,7 @@ get_socket_error(int fd) } int -check_connection_completion(int fd) +check_connection_completion(int fd) { struct pollfd pfd; int retval; @@ -171,12 +208,7 @@ drain_rcvbuf(int fd) * * On other Unix-like OSes, MSG_TRUNC has no effect in the flags * argument. */ -#ifdef __linux__ -#define BUFFER_SIZE 1 -#else -#define BUFFER_SIZE 2048 -#endif - char buffer[BUFFER_SIZE]; + char buffer[LINUX ? 1 : 2048]; ssize_t n_bytes = recv(fd, buffer, sizeof buffer, MSG_TRUNC | MSG_DONTWAIT); if (n_bytes <= 0 || n_bytes >= rcvbuf) { @@ -208,15 +240,89 @@ drain_fd(int fd, size_t n_packets) /* Stores in '*un' a sockaddr_un that refers to file 'name'. Stores in * '*un_len' the size of the sockaddr_un. */ static void -make_sockaddr_un(const char *name, struct sockaddr_un* un, socklen_t *un_len) +make_sockaddr_un__(const char *name, struct sockaddr_un *un, socklen_t *un_len) { un->sun_family = AF_UNIX; - strncpy(un->sun_path, name, sizeof un->sun_path); - un->sun_path[sizeof un->sun_path - 1] = '\0'; + ovs_strzcpy(un->sun_path, name, sizeof un->sun_path); *un_len = (offsetof(struct sockaddr_un, sun_path) + strlen (un->sun_path) + 1); } +/* Stores in '*un' a sockaddr_un that refers to file 'name'. Stores in + * '*un_len' the size of the sockaddr_un. + * + * Returns 0 on success, otherwise a positive errno value. On success, + * '*dirfdp' is either -1 or a nonnegative file descriptor that the caller + * should close after using '*un' to bind or connect. On failure, '*dirfdp' is + * -1. */ +static int +make_sockaddr_un(const char *name, struct sockaddr_un *un, socklen_t *un_len, + int *dirfdp) +{ + enum { MAX_UN_LEN = sizeof un->sun_path - 1 }; + + *dirfdp = -1; + if (strlen(name) > MAX_UN_LEN) { + static struct vlog_rate_limit rl = VLOG_RATE_LIMIT_INIT(1, 1); + + if (LINUX) { + /* 'name' is too long to fit in a sockaddr_un, but we have a + * workaround for that on Linux: shorten it by opening a file + * descriptor for the directory part of the name and indirecting + * through /proc/self/fd//. */ + char *dir, *base; + char *short_name; + int dirfd; + + dir = dir_name(name); + base = base_name(name); + + dirfd = open(dir, O_DIRECTORY | O_RDONLY); + if (dirfd < 0) { + free(base); + free(dir); + return errno; + } + + short_name = xasprintf("/proc/self/fd/%d/%s", dirfd, base); + free(dir); + free(base); + + if (strlen(short_name) <= MAX_UN_LEN) { + make_sockaddr_un__(short_name, un, un_len); + free(short_name); + *dirfdp = dirfd; + return 0; + } + free(short_name); + close(dirfd); + + VLOG_WARN_RL(&rl, "Unix socket name %s is longer than maximum " + "%d bytes (even shortened)", name, MAX_UN_LEN); + } else { + /* 'name' is too long and we have no workaround. */ + VLOG_WARN_RL(&rl, "Unix socket name %s is longer than maximum " + "%d bytes", name, MAX_UN_LEN); + } + + return ENAMETOOLONG; + } else { + make_sockaddr_un__(name, un, un_len); + return 0; + } +} + +/* Binds Unix domain socket 'fd' to a file with permissions 0700. */ +static int +bind_unix_socket(int fd, struct sockaddr *sun, socklen_t sun_len) +{ + /* According to _Unix Network Programming_, umask should affect bind(). */ + mode_t old_umask = umask(0077); + int error = bind(fd, sun, sun_len) ? errno : 0; + umask(old_umask); + return error; +} + /* Creates a Unix domain socket in the given 'style' (either SOCK_DGRAM or * SOCK_STREAM) that is bound to '*bind_path' (if 'bind_path' is non-null) and * connected to '*connect_path' (if 'connect_path' is non-null). If 'nonblock' @@ -243,9 +349,11 @@ make_unix_socket(int style, bool nonblock, bool passcred OVS_UNUSED, if (nonblock) { int flags = fcntl(fd, F_GETFL, 0); if (flags == -1) { + error = errno; goto error; } if (fcntl(fd, F_SETFL, flags | O_NONBLOCK) == -1) { + error = errno; goto error; } } @@ -253,13 +361,21 @@ make_unix_socket(int style, bool nonblock, bool passcred OVS_UNUSED, if (bind_path) { struct sockaddr_un un; socklen_t un_len; - make_sockaddr_un(bind_path, &un, &un_len); - if (unlink(un.sun_path) && errno != ENOENT) { - VLOG_WARN("unlinking \"%s\": %s\n", un.sun_path, strerror(errno)); + int dirfd; + + if (unlink(bind_path) && errno != ENOENT) { + VLOG_WARN("unlinking \"%s\": %s\n", bind_path, strerror(errno)); } fatal_signal_add_file_to_unlink(bind_path); - if (bind(fd, (struct sockaddr*) &un, un_len) - || fchmod(fd, S_IRWXU)) { + + error = make_sockaddr_un(bind_path, &un, &un_len, &dirfd); + if (!error) { + error = bind_unix_socket(fd, (struct sockaddr *) &un, un_len); + } + if (dirfd >= 0) { + close(dirfd); + } + if (error) { goto error; } } @@ -267,10 +383,18 @@ make_unix_socket(int style, bool nonblock, bool passcred OVS_UNUSED, if (connect_path) { struct sockaddr_un un; socklen_t un_len; - make_sockaddr_un(connect_path, &un, &un_len); - if (connect(fd, (struct sockaddr*) &un, un_len) + int dirfd; + + error = make_sockaddr_un(connect_path, &un, &un_len, &dirfd); + if (!error + && connect(fd, (struct sockaddr*) &un, un_len) && errno != EINPROGRESS) { - printf("connect failed with %s\n", strerror(errno)); + error = errno; + } + if (dirfd >= 0) { + close(dirfd); + } + if (error) { goto error; } } @@ -279,6 +403,7 @@ make_unix_socket(int style, bool nonblock, bool passcred OVS_UNUSED, if (passcred) { int enable = 1; if (setsockopt(fd, SOL_SOCKET, SO_PASSCRED, &enable, sizeof(enable))) { + error = errno; goto error; } } @@ -287,7 +412,9 @@ make_unix_socket(int style, bool nonblock, bool passcred OVS_UNUSED, return fd; error: - error = errno == EAGAIN ? EPROTO : errno; + if (error == EAGAIN) { + error = EPROTO; + } if (bind_path) { fatal_signal_remove_file_to_unlink(bind_path); } @@ -303,10 +430,10 @@ get_unix_name_len(socklen_t sun_len) : 0); } -uint32_t -guess_netmask(uint32_t ip) +ovs_be32 +guess_netmask(ovs_be32 ip_) { - ip = ntohl(ip); + uint32_t ip = ntohl(ip_); return ((ip >> 31) == 0 ? htonl(0xff000000) /* Class A */ : (ip >> 30) == 2 ? htonl(0xffff0000) /* Class B */ : (ip >> 29) == 6 ? htonl(0xffffff00) /* Class C */ @@ -457,7 +584,7 @@ inet_open_passive(int style, const char *target_, int default_port, struct sockaddr_in sin; const char *host_name; const char *port_string; - int fd, error, port; + int fd = 0, error, port; unsigned int yes = 1; /* Address defaults. */ @@ -660,3 +787,155 @@ get_mtime(const char *file_name, struct timespec *mtime) } } +void +xpipe(int fds[2]) +{ + if (pipe(fds)) { + VLOG_FATAL("failed to create pipe (%s)", strerror(errno)); + } +} + +static int +getsockopt_int(int fd, int level, int optname, int *valuep) +{ + socklen_t len = sizeof *valuep; + + return (getsockopt(fd, level, optname, valuep, &len) ? errno + : len == sizeof *valuep ? 0 + : EINVAL); +} + +static void +describe_sockaddr(struct ds *string, int fd, + int (*getaddr)(int, struct sockaddr *, socklen_t *)) +{ + struct sockaddr_storage ss; + socklen_t len = sizeof ss; + + if (!getaddr(fd, (struct sockaddr *) &ss, &len)) { + if (ss.ss_family == AF_INET) { + struct sockaddr_in sin; + + memcpy(&sin, &ss, sizeof sin); + ds_put_format(string, IP_FMT":%"PRIu16, + IP_ARGS(&sin.sin_addr.s_addr), ntohs(sin.sin_port)); + } else if (ss.ss_family == AF_UNIX) { + struct sockaddr_un sun; + const char *null; + size_t maxlen; + + memcpy(&sun, &ss, sizeof sun); + maxlen = len - offsetof(struct sockaddr_un, sun_path); + null = memchr(sun.sun_path, '\0', maxlen); + ds_put_buffer(string, sun.sun_path, + null ? null - sun.sun_path : maxlen); + } +#ifdef HAVE_NETLINK + else if (ss.ss_family == AF_NETLINK) { + int protocol; + +/* SO_PROTOCOL was introduced in 2.6.32. Support it regardless of the version + * of the Linux kernel headers in use at build time. */ +#ifndef SO_PROTOCOL +#define SO_PROTOCOL 38 +#endif + + if (!getsockopt_int(fd, SOL_SOCKET, SO_PROTOCOL, &protocol)) { + switch (protocol) { + case NETLINK_ROUTE: + ds_put_cstr(string, "NETLINK_ROUTE"); + break; + + case NETLINK_GENERIC: + ds_put_cstr(string, "NETLINK_GENERIC"); + break; + + default: + ds_put_format(string, "AF_NETLINK family %d", protocol); + break; + } + } else { + ds_put_cstr(string, "AF_NETLINK"); + } + } +#endif +#if AF_PACKET && __linux__ + else if (ss.ss_family == AF_PACKET) { + struct sockaddr_ll sll; + + memcpy(&sll, &ss, sizeof sll); + ds_put_cstr(string, "AF_PACKET"); + if (sll.sll_ifindex) { + char name[IFNAMSIZ]; + + if (if_indextoname(sll.sll_ifindex, name)) { + ds_put_format(string, "(%s)", name); + } else { + ds_put_format(string, "(ifindex=%d)", sll.sll_ifindex); + } + } + if (sll.sll_protocol) { + ds_put_format(string, "(protocol=0x%"PRIu16")", + ntohs(sll.sll_protocol)); + } + } +#endif + else if (ss.ss_family == AF_UNSPEC) { + ds_put_cstr(string, "AF_UNSPEC"); + } else { + ds_put_format(string, "AF_%d", (int) ss.ss_family); + } + } +} + + +#ifdef __linux__ +static void +put_fd_filename(struct ds *string, int fd) +{ + char buf[1024]; + char *linkname; + int n; + + linkname = xasprintf("/proc/self/fd/%d", fd); + n = readlink(linkname, buf, sizeof buf); + if (n > 0) { + ds_put_char(string, ' '); + ds_put_buffer(string, buf, n); + if (n > sizeof buf) { + ds_put_cstr(string, "..."); + } + } + free(linkname); +} +#endif + +/* Returns a malloc()'d string describing 'fd', for use in logging. */ +char * +describe_fd(int fd) +{ + struct ds string; + struct stat s; + + ds_init(&string); + if (fstat(fd, &s)) { + ds_put_format(&string, "fstat failed (%s)", strerror(errno)); + } else if (S_ISSOCK(s.st_mode)) { + describe_sockaddr(&string, fd, getsockname); + ds_put_cstr(&string, "<->"); + describe_sockaddr(&string, fd, getpeername); + } else { + ds_put_cstr(&string, (isatty(fd) ? "tty" + : S_ISDIR(s.st_mode) ? "directory" + : S_ISCHR(s.st_mode) ? "character device" + : S_ISBLK(s.st_mode) ? "block device" + : S_ISREG(s.st_mode) ? "file" + : S_ISFIFO(s.st_mode) ? "FIFO" + : S_ISLNK(s.st_mode) ? "symbolic link" + : "unknown")); +#ifdef __linux__ + put_fd_filename(&string, fd); +#endif + } + return ds_steal_cstr(&string); +}