| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511 |
- /* This Source Code Form is subject to the terms of the Mozilla Public
- * License, v. 2.0. If a copy of the MPL was not distributed with this
- * file, You can obtain one at https://mozilla.org/MPL/2.0/.
- *
- * (c) ZeroTier, Inc.
- * https://www.zerotier.com/
- */
- #include "BSDEthernetTap.hpp"
- #include "../node/Constants.hpp"
- #include "../node/Mutex.hpp"
- #include "../node/Utils.hpp"
- #include "OSUtils.hpp"
- #include <algorithm>
- #include <arpa/inet.h>
- #include <errno.h>
- #include <fcntl.h>
- #include <ifaddrs.h>
- #include <map>
- #include <net/if.h>
- #include <net/if_arp.h>
- #include <net/if_dl.h>
- #include <net/if_media.h>
- #include <net/route.h>
- #include <netinet/in.h>
- #include <pthread_np.h>
- #include <sched.h>
- #include <set>
- #include <signal.h>
- #include <stdint.h>
- #include <stdio.h>
- #include <stdlib.h>
- #include <string.h>
- #include <string>
- #include <sys/cdefs.h>
- #include <sys/ioctl.h>
- #include <sys/param.h>
- #include <sys/select.h>
- #include <sys/socket.h>
- #include <sys/stat.h>
- #include <sys/types.h>
- #include <sys/uio.h>
- #include <sys/wait.h>
- #include <unistd.h>
- #include <utility>
- #define ZT_BASE32_CHARS "0123456789abcdefghijklmnopqrstuv"
- #define ZT_TAP_BUF_SIZE (1024 * 16)
- // ff:ff:ff:ff:ff:ff with no ADI
- static const ZeroTier::MulticastGroup _blindWildcardMulticastGroup(ZeroTier::MAC(0xff), 0);
- namespace ZeroTier {
- BSDEthernetTap::BSDEthernetTap(
- const char* homePath,
- unsigned int concurrency,
- bool pinning,
- const MAC& mac,
- unsigned int mtu,
- unsigned int metric,
- uint64_t nwid,
- const char* friendlyName,
- void (*handler)(void*, void*, uint64_t, const MAC&, const MAC&, unsigned int, unsigned int, const void*, unsigned int),
- void* arg)
- : _handler(handler)
- , _concurrency(concurrency)
- , _pinning(pinning)
- , _arg(arg)
- , _nwid(nwid)
- , _mtu(mtu)
- , _metric(metric)
- , _fd(0)
- , _enabled(true)
- , _lastIfAddrsUpdate(0)
- {
- static Mutex globalTapCreateLock;
- char devpath[64], ethaddr[64], mtustr[32], metstr[32], tmpdevname[32];
- Mutex::Lock _gl(globalTapCreateLock);
- #ifdef __FreeBSD__
- /* FreeBSD allows long interface names and interface renaming */
- _dev = "zt";
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 60) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 55) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 50) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 45) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 40) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 35) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 30) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 25) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 20) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 15) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 10) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)((nwid >> 5) & 0x1f)]);
- _dev.push_back(ZT_BASE32_CHARS[(unsigned long)(nwid & 0x1f)]);
- std::vector<std::string> devFiles(OSUtils::listDirectory("/dev"));
- for (int i = 9993; i < (9993 + 128); ++i) {
- OSUtils::ztsnprintf(tmpdevname, sizeof(tmpdevname), "tap%d", i);
- OSUtils::ztsnprintf(devpath, sizeof(devpath), "/dev/%s", tmpdevname);
- if (std::find(devFiles.begin(), devFiles.end(), std::string(tmpdevname)) == devFiles.end()) {
- long cpid = (long)vfork();
- if (cpid == 0) {
- #ifdef ZT_TRACE
- fprintf(stderr, "DEBUG: ifconfig %s create" ZT_EOL_S, tmpdevname);
- #endif
- ::execl("/sbin/ifconfig", "/sbin/ifconfig", tmpdevname, "create", (const char*)0);
- ::_exit(-1);
- }
- else if (cpid > 0) {
- int exitcode = -1;
- ::waitpid(cpid, &exitcode, 0);
- }
- else
- throw std::runtime_error("fork() failed");
- struct stat stattmp;
- if (! stat(devpath, &stattmp)) {
- cpid = (long)vfork();
- if (cpid == 0) {
- #ifdef ZT_TRACE
- fprintf(stderr, "DEBUG: ifconfig %s name %s" ZT_EOL_S, tmpdevname, _dev.c_str());
- #endif
- ::execl("/sbin/ifconfig", "/sbin/ifconfig", tmpdevname, "name", _dev.c_str(), (const char*)0);
- ::_exit(-1);
- }
- else if (cpid > 0) {
- int exitcode = -1;
- ::waitpid(cpid, &exitcode, 0);
- if (exitcode)
- throw std::runtime_error("ifconfig rename operation failed");
- }
- else
- throw std::runtime_error("fork() failed");
- _fd = ::open(devpath, O_RDWR);
- if (_fd > 0)
- break;
- else
- throw std::runtime_error("unable to open created tap device");
- }
- else {
- throw std::runtime_error("cannot find /dev node for newly created tap device");
- }
- }
- }
- #else
- /* Other BSDs like OpenBSD only have a limited number of tap devices that cannot be renamed */
- for (int i = 0; i < 64; ++i) {
- OSUtils::ztsnprintf(tmpdevname, sizeof(tmpdevname), "tap%d", i);
- OSUtils::ztsnprintf(devpath, sizeof(devpath), "/dev/%s", tmpdevname);
- _fd = ::open(devpath, O_RDWR);
- if (_fd > 0) {
- _dev = tmpdevname;
- break;
- }
- }
- #endif
- if (_fd <= 0)
- throw std::runtime_error("unable to open TAP device or no more devices available");
- if (fcntl(_fd, F_SETFL, fcntl(_fd, F_GETFL) & ~O_NONBLOCK) == -1) {
- ::close(_fd);
- throw std::runtime_error("unable to set flags on file descriptor for TAP device");
- }
- // Configure MAC address and MTU, bring interface up
- OSUtils::ztsnprintf(ethaddr, sizeof(ethaddr), "%.2x:%.2x:%.2x:%.2x:%.2x:%.2x", (int)mac[0], (int)mac[1], (int)mac[2], (int)mac[3], (int)mac[4], (int)mac[5]);
- OSUtils::ztsnprintf(mtustr, sizeof(mtustr), "%u", _mtu);
- OSUtils::ztsnprintf(metstr, sizeof(metstr), "%u", _metric);
- long cpid = (long)vfork();
- if (cpid == 0) {
- #ifdef ZT_TRACE
- fprintf(stderr, "DEBUG: ifconfig %s lladdr %s mtu %s metric %s up" ZT_EOL_S, _dev.c_str(), ethaddr, mtustr, metstr);
- #endif
- ::execl("/sbin/ifconfig", "/sbin/ifconfig", _dev.c_str(), "lladdr", ethaddr, "mtu", mtustr, "metric", metstr, "up", (const char*)0);
- ::_exit(-1);
- }
- else if (cpid > 0) {
- int exitcode = -1;
- ::waitpid(cpid, &exitcode, 0);
- if (exitcode) {
- ::close(_fd);
- throw std::runtime_error("ifconfig failure setting link-layer address and activating tap interface");
- }
- }
- // Set close-on-exec so that devices cannot persist if we fork/exec for update
- fcntl(_fd, F_SETFD, fcntl(_fd, F_GETFD) | FD_CLOEXEC);
- ::pipe(_shutdownSignalPipe);
- _thread = Thread::start(this);
- }
- BSDEthernetTap::~BSDEthernetTap()
- {
- ::write(_shutdownSignalPipe[1], "\0", 1); // causes thread to exit
- ::close(_fd);
- ::close(_shutdownSignalPipe[0]);
- ::close(_shutdownSignalPipe[1]);
- long cpid = (long)vfork();
- if (cpid == 0) {
- #ifdef ZT_TRACE
- fprintf(stderr, "DEBUG: ifconfig %s destroy" ZT_EOL_S, _dev.c_str());
- #endif
- ::execl("/sbin/ifconfig", "/sbin/ifconfig", _dev.c_str(), "destroy", (const char*)0);
- ::_exit(-1);
- }
- else if (cpid > 0) {
- int exitcode = -1;
- ::waitpid(cpid, &exitcode, 0);
- }
- Thread::join(_thread);
- for (std::thread& t : _rxThreads) {
- t.join();
- }
- }
- void BSDEthernetTap::setEnabled(bool en)
- {
- _enabled = en;
- }
- bool BSDEthernetTap::enabled() const
- {
- return _enabled;
- }
- static bool ___removeIp(const std::string& _dev, const InetAddress& ip)
- {
- long cpid = (long)vfork();
- if (cpid == 0) {
- char ipbuf[64];
- #ifdef ZT_TRACE
- fprintf(stderr, "DEBUG: ifconfig %s inet %s -alias" ZT_EOL_S, _dev.c_str(), ip.toIpString(ipbuf));
- #endif
- execl("/sbin/ifconfig", "/sbin/ifconfig", _dev.c_str(), "inet", ip.toIpString(ipbuf), "-alias", (const char*)0);
- _exit(-1);
- }
- else if (cpid > 0) {
- int exitcode = -1;
- waitpid(cpid, &exitcode, 0);
- return (exitcode == 0);
- }
- return false; // never reached, make compiler shut up about return value
- }
- bool BSDEthernetTap::addIp(const InetAddress& ip)
- {
- if (! ip)
- return false;
- std::vector<InetAddress> allIps(ips());
- if (std::find(allIps.begin(), allIps.end(), ip) != allIps.end())
- return true; // IP/netmask already assigned
- // Remove and reconfigure if address is the same but netmask is different
- for (std::vector<InetAddress>::iterator i(allIps.begin()); i != allIps.end(); ++i) {
- if ((i->ipsEqual(ip)) && (i->netmaskBits() != ip.netmaskBits())) {
- if (___removeIp(_dev, *i))
- break;
- }
- }
- long cpid = (long)vfork();
- if (cpid == 0) {
- char tmp[128];
- #ifdef ZT_TRACE
- fprintf(stderr, "DEBUG: ifconfig %s %s %s alias" ZT_EOL_S, _dev.c_str(), ip.isV4() ? "inet" : "inet6", ip.toString(tmp));
- #endif
- ::execl("/sbin/ifconfig", "/sbin/ifconfig", _dev.c_str(), ip.isV4() ? "inet" : "inet6", ip.toString(tmp), "alias", (const char*)0);
- ::_exit(-1);
- }
- else if (cpid > 0) {
- int exitcode = -1;
- ::waitpid(cpid, &exitcode, 0);
- return (exitcode == 0);
- }
- return false;
- }
- bool BSDEthernetTap::removeIp(const InetAddress& ip)
- {
- if (! ip)
- return false;
- std::vector<InetAddress> allIps(ips());
- if (std::find(allIps.begin(), allIps.end(), ip) != allIps.end()) {
- if (___removeIp(_dev, ip))
- return true;
- }
- return false;
- }
- std::vector<InetAddress> BSDEthernetTap::ips() const
- {
- uint64_t now = OSUtils::now();
- if ((now - _lastIfAddrsUpdate) <= GETIFADDRS_CACHE_TIME) {
- return _ifaddrs;
- }
- _lastIfAddrsUpdate = now;
- struct ifaddrs* ifa = (struct ifaddrs*)0;
- if (getifaddrs(&ifa))
- return std::vector<InetAddress>();
- std::vector<InetAddress> r;
- struct ifaddrs* p = ifa;
- while (p) {
- if ((! strcmp(p->ifa_name, _dev.c_str())) && (p->ifa_addr) && (p->ifa_netmask) && (p->ifa_addr->sa_family == p->ifa_netmask->sa_family)) {
- switch (p->ifa_addr->sa_family) {
- case AF_INET: {
- struct sockaddr_in* sin = (struct sockaddr_in*)p->ifa_addr;
- struct sockaddr_in* nm = (struct sockaddr_in*)p->ifa_netmask;
- r.push_back(InetAddress(&(sin->sin_addr.s_addr), 4, Utils::countBits((uint32_t)nm->sin_addr.s_addr)));
- } break;
- case AF_INET6: {
- struct sockaddr_in6* sin = (struct sockaddr_in6*)p->ifa_addr;
- struct sockaddr_in6* nm = (struct sockaddr_in6*)p->ifa_netmask;
- uint32_t b[4];
- memcpy(b, nm->sin6_addr.s6_addr, sizeof(b));
- r.push_back(InetAddress(sin->sin6_addr.s6_addr, 16, Utils::countBits(b[0]) + Utils::countBits(b[1]) + Utils::countBits(b[2]) + Utils::countBits(b[3])));
- } break;
- }
- }
- p = p->ifa_next;
- }
- if (ifa)
- freeifaddrs(ifa);
- std::sort(r.begin(), r.end());
- std::unique(r.begin(), r.end());
- _ifaddrs = r;
- return r;
- }
- void BSDEthernetTap::put(const MAC& from, const MAC& to, unsigned int etherType, const void* data, unsigned int len)
- {
- char putBuf[ZT_MAX_MTU + 64];
- if ((_fd > 0) && (len <= _mtu) && (_enabled)) {
- to.copyTo(putBuf, 6);
- from.copyTo(putBuf + 6, 6);
- *((uint16_t*)(putBuf + 12)) = htons((uint16_t)etherType);
- memcpy(putBuf + 14, data, len);
- len += 14;
- ::write(_fd, putBuf, len);
- }
- }
- std::string BSDEthernetTap::deviceName() const
- {
- return _dev;
- }
- void BSDEthernetTap::setFriendlyName(const char* friendlyName)
- {
- }
- void BSDEthernetTap::scanMulticastGroups(std::vector<MulticastGroup>& added, std::vector<MulticastGroup>& removed)
- {
- std::vector<MulticastGroup> newGroups;
- #ifndef __OpenBSD__
- struct ifmaddrs* ifmap = (struct ifmaddrs*)0;
- if (! getifmaddrs(&ifmap)) {
- struct ifmaddrs* p = ifmap;
- while (p) {
- if (p->ifma_addr->sa_family == AF_LINK) {
- struct sockaddr_dl* in = (struct sockaddr_dl*)p->ifma_name;
- struct sockaddr_dl* la = (struct sockaddr_dl*)p->ifma_addr;
- if ((la->sdl_alen == 6) && (in->sdl_nlen <= _dev.length()) && (! memcmp(_dev.data(), in->sdl_data, in->sdl_nlen)))
- newGroups.push_back(MulticastGroup(MAC(la->sdl_data + la->sdl_nlen, 6), 0));
- }
- p = p->ifma_next;
- }
- freeifmaddrs(ifmap);
- }
- #endif // __OpenBSD__
- std::vector<InetAddress> allIps(ips());
- for (std::vector<InetAddress>::iterator ip(allIps.begin()); ip != allIps.end(); ++ip)
- newGroups.push_back(MulticastGroup::deriveMulticastGroupForAddressResolution(*ip));
- std::sort(newGroups.begin(), newGroups.end());
- std::unique(newGroups.begin(), newGroups.end());
- for (std::vector<MulticastGroup>::iterator m(newGroups.begin()); m != newGroups.end(); ++m) {
- if (! std::binary_search(_multicastGroups.begin(), _multicastGroups.end(), *m))
- added.push_back(*m);
- }
- for (std::vector<MulticastGroup>::iterator m(_multicastGroups.begin()); m != _multicastGroups.end(); ++m) {
- if (! std::binary_search(newGroups.begin(), newGroups.end(), *m))
- removed.push_back(*m);
- }
- _multicastGroups.swap(newGroups);
- }
- void BSDEthernetTap::setMtu(unsigned int mtu)
- {
- if (mtu != _mtu) {
- _mtu = mtu;
- long cpid = (long)vfork();
- if (cpid == 0) {
- char tmp[64];
- OSUtils::ztsnprintf(tmp, sizeof(tmp), "%u", mtu);
- #ifdef ZT_TRACE
- fprintf(stderr, "DEBUG: ifconfig %s mtu %s" ZT_EOL_S, _dev.c_str(), tmp);
- #endif
- execl("/sbin/ifconfig", "/sbin/ifconfig", _dev.c_str(), "mtu", tmp, (const char*)0);
- _exit(-1);
- }
- else if (cpid > 0) {
- int exitcode = -1;
- waitpid(cpid, &exitcode, 0);
- }
- }
- }
- void BSDEthernetTap::threadMain() throw()
- {
- // Wait for a moment after startup -- wait for Network to finish
- // constructing itself.
- Thread::sleep(500);
- #ifndef __OpenBSD__
- bool pinning = _pinning;
- for (unsigned int i = 0; i < _concurrency; ++i) {
- _rxThreads.push_back(std::thread([this, i, pinning] {
- if (pinning) {
- int pinCore = i % _concurrency;
- fprintf(stderr, "Pinning thread %d to core %d\n", i, pinCore);
- pthread_t self = pthread_self();
- cpu_set_t cpuset;
- CPU_ZERO(&cpuset);
- CPU_SET(pinCore, &cpuset);
- // int rc = sched_setaffinity(self, sizeof(cpu_set_t), &cpuset);
- int rc = pthread_setaffinity_np(self, sizeof(cpu_set_t), &cpuset);
- if (rc != 0) {
- fprintf(stderr, "Failed to pin thread %d to core %d: %s\n", i, pinCore, strerror(errno));
- exit(1);
- }
- }
- #endif // __OpenBSD__
- uint8_t b[ZT_TAP_BUF_SIZE];
- MAC to, from;
- fd_set readfds, nullfds;
- int n, nfds, r;
- FD_ZERO(&readfds);
- FD_ZERO(&nullfds);
- nfds = (int)std::max(_shutdownSignalPipe[0], _fd) + 1;
- r = 0;
- for (;;) {
- FD_SET(_shutdownSignalPipe[0], &readfds);
- FD_SET(_fd, &readfds);
- select(nfds, &readfds, &nullfds, &nullfds, (struct timeval*)0);
- if (FD_ISSET(_shutdownSignalPipe[0], &readfds)) // writes to shutdown pipe terminate thread
- break;
- if (FD_ISSET(_fd, &readfds)) {
- n = (int)::read(_fd, b + r, sizeof(b) - r);
- if (n < 0) {
- if ((errno != EINTR) && (errno != ETIMEDOUT))
- break;
- }
- else {
- // Some tap drivers like to send the ethernet frame and the
- // payload in two chunks, so handle that by accumulating
- // data until we have at least a frame.
- r += n;
- if (r > 14) {
- if (r > ((int)_mtu + 14)) // sanity check for weird TAP behavior on some platforms
- r = _mtu + 14;
- if (_enabled) {
- to.setTo(b, 6);
- from.setTo(b + 6, 6);
- unsigned int etherType = ntohs(((const uint16_t*)b)[6]);
- _handler(_arg, (void*)0, _nwid, from, to, etherType, 0, (const void*)(b + 14), r - 14);
- }
- r = 0;
- }
- }
- }
- }
- #ifndef __OpenBSD__
- }));
- }
- #endif // __OpenBSD__
- }
- } // namespace ZeroTier
|