ExtOsdep.cpp 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623
  1. /* This Source Code Form is subject to the terms of the Mozilla Public
  2. * License, v. 2.0. If a copy of the MPL was not distributed with this
  3. * file, You can obtain one at https://mozilla.org/MPL/2.0/.
  4. *
  5. * (c) ZeroTier, Inc.
  6. * https://www.zerotier.com/
  7. */
  8. #include "ExtOsdep.hpp"
  9. #include "../node/AtomicCounter.hpp"
  10. #include <fcntl.h>
  11. #include <iostream>
  12. #include <list>
  13. #include <sys/times.h>
  14. #include <unistd.h>
  15. #define ZT_TAP_BUF_SIZE 16384
  16. namespace ZeroTier {
  17. static int eodFd = -1;
  18. static Mutex eodMutex;
  19. static int eodMgmtFd = -1;
  20. struct EodRoute {
  21. InetAddress target;
  22. InetAddress via;
  23. InetAddress src;
  24. std::string ifname;
  25. };
  26. static std::list<EodRoute> allRoutes;
  27. template <typename T> static void __eodSend(const T& t)
  28. {
  29. write(eodFd, &t, sizeof(t));
  30. }
  31. static void strncpyx(char* dest, const char* src, size_t n)
  32. {
  33. strncpy(dest, src, n);
  34. if (n > 1) {
  35. dest[n - 1] = 0;
  36. }
  37. }
  38. static int __eodWait(unsigned char msg, unsigned char* d, unsigned l, unsigned maxl = 0, int* recvfd = nullptr)
  39. {
  40. if (! maxl) {
  41. maxl = l;
  42. }
  43. auto start = times(NULL);
  44. while (1) {
  45. msghdr mh;
  46. iovec iov;
  47. struct {
  48. size_t cmsg_len;
  49. int cmsg_level;
  50. int cmsg_type;
  51. int fd;
  52. } __attribute__((packed)) cmsg;
  53. memset(&mh, 0, sizeof(mh));
  54. mh.msg_iov = &iov;
  55. mh.msg_iovlen = 1;
  56. if (recvfd) {
  57. mh.msg_control = &cmsg;
  58. mh.msg_controllen = sizeof(cmsg);
  59. }
  60. iov.iov_base = d;
  61. iov.iov_len = maxl;
  62. int r = recvmsg(eodFd, &mh, MSG_TRUNC | MSG_CMSG_CLOEXEC);
  63. if (r > 0) {
  64. if (recvfd && mh.msg_controllen >= sizeof(cmsg) && cmsg.cmsg_len == sizeof(cmsg) && cmsg.cmsg_level == SOL_SOCKET && cmsg.cmsg_type == SCM_RIGHTS) {
  65. *recvfd = cmsg.fd;
  66. fprintf(stderr, "eodWait: received fd %d\n", *recvfd);
  67. }
  68. if (d[0] != msg) {
  69. fprintf(stderr, "eodWait: wrong msg, expected %u got %u\n", msg, d[0]);
  70. return -1;
  71. }
  72. if ((unsigned)r < l || (unsigned)r > maxl) {
  73. fprintf(stderr, "eodWait: wrong len, expected %u got %d\n", l, r);
  74. return -1;
  75. }
  76. return r;
  77. }
  78. if (times(NULL) - start > 500) {
  79. fprintf(stderr, "eodWait: timeout\n");
  80. return -1;
  81. }
  82. usleep(100000);
  83. }
  84. }
  85. template <typename T> static bool __eodWait(unsigned msg, T& t)
  86. {
  87. return __eodWait(msg, (unsigned char*)&t, sizeof(T)) == (int)sizeof(T);
  88. }
  89. template <typename M, typename R> static bool __eodXchg(const M& m, unsigned rm, R& r)
  90. {
  91. __eodSend(m);
  92. return __eodWait(rm, r);
  93. }
  94. template <typename M, typename R> static bool eodXchg(const M& m, unsigned rm, R& r)
  95. {
  96. Mutex::Lock l(eodMutex);
  97. return __eodXchg(m, rm, r);
  98. }
  99. void ExtOsdep::init(int fd1, int fd2)
  100. {
  101. eodFd = fd1;
  102. eodMgmtFd = fd2;
  103. fcntl(eodMgmtFd, F_SETFL, O_NONBLOCK);
  104. }
  105. void ExtOsdep::started(int* f, void** cp)
  106. {
  107. *f = eodMgmtFd;
  108. *cp = (void*)eodMgmtFd;
  109. unsigned char msg = ZT_EOD_MSG_STARTED;
  110. Mutex::Lock l(eodMutex);
  111. __eodSend(msg);
  112. }
  113. static std::string mgmtrd;
  114. static std::string mgmtwr;
  115. bool ExtOsdep::mgmtWritable(void* cookie)
  116. {
  117. if (cookie != (void*)eodMgmtFd) {
  118. return false;
  119. }
  120. if (mgmtwr.size() == 0) {
  121. return true;
  122. }
  123. auto sz = write(eodMgmtFd, mgmtwr.data(), mgmtwr.size());
  124. if (sz <= 0) {
  125. return false;
  126. }
  127. mgmtwr.erase(mgmtwr.begin(), mgmtwr.begin() + sz);
  128. return mgmtwr.empty();
  129. }
  130. bool ExtOsdep::mgmtRecv(void* cookie, void* data, unsigned long len, std::function<unsigned(unsigned, const std::string&, const std::string&, std::string&)> cb)
  131. {
  132. if (cookie != (void*)eodMgmtFd) {
  133. return false;
  134. }
  135. mgmtrd.append((char*)data, len);
  136. while (1) {
  137. auto req = (zt_eod_mgmt_req*)mgmtrd.data();
  138. if (mgmtrd.size() < sizeof(*req)) {
  139. break;
  140. }
  141. unsigned reqsz = sizeof(*req) + req->pathlen + req->datalen;
  142. if (mgmtrd.size() < reqsz) {
  143. break;
  144. }
  145. std::string resp;
  146. char* p = (char*)req->data;
  147. zt_eod_mgmt_reply rep;
  148. rep.scode = cb(req->method, std::string(p, p + req->pathlen), std::string(p + req->pathlen, p + req->pathlen + req->datalen), resp);
  149. rep.datalen = resp.size();
  150. mgmtrd.erase(mgmtrd.begin(), mgmtrd.begin() + reqsz);
  151. mgmtwr.append((char*)&rep, sizeof(rep));
  152. mgmtwr.append(resp);
  153. auto sz = write(eodMgmtFd, mgmtwr.data(), mgmtwr.size());
  154. if (sz > 0) {
  155. mgmtwr.erase(mgmtwr.begin(), mgmtwr.begin() + sz);
  156. }
  157. }
  158. return ! mgmtwr.empty();
  159. }
  160. void ExtOsdep::routeAddDel(bool add, const InetAddress& target, const InetAddress& via, const InetAddress& src, const char* ifname)
  161. {
  162. Mutex::Lock l(eodMutex);
  163. std::string ifn;
  164. if (ifname) {
  165. ifn = ifname;
  166. }
  167. if (add) {
  168. for (auto x = allRoutes.begin(); x != allRoutes.end(); ++x) {
  169. if (x->target == target && x->via == via && x->src == src && x->ifname == ifn) {
  170. return;
  171. }
  172. }
  173. allRoutes.push_back({ target, via, src, ifn });
  174. }
  175. else {
  176. bool found = false;
  177. for (auto x = allRoutes.begin(); x != allRoutes.end(); ++x) {
  178. if (x->target == target && x->via == via && x->src == src && x->ifname == ifn) {
  179. allRoutes.erase(x);
  180. found = true;
  181. break;
  182. }
  183. }
  184. if (! found) {
  185. return;
  186. }
  187. }
  188. zt_eod_msg_route req;
  189. memset(&req, 0, sizeof(req));
  190. req.cmd = add ? ZT_EOD_MSG_ADDROUTE : ZT_EOD_MSG_DELROUTE;
  191. req.afi = target.isV4() ? 1 : 2;
  192. req.dstlen = target.netmaskBits();
  193. memcpy(req.dst, target.rawIpData(), target.isV4() ? 4 : 16);
  194. if (ifname) {
  195. strncpyx(req.dev, ifname, sizeof(req.dev));
  196. }
  197. if (via) {
  198. memcpy(req.gw, via.rawIpData(), target.isV4() ? 4 : 16);
  199. }
  200. if (src) {
  201. memcpy(req.src, src.rawIpData(), target.isV4() ? 4 : 16);
  202. }
  203. unsigned char resp;
  204. __eodXchg(req, add ? ZT_EOD_MSG_ADDROUTERESP : ZT_EOD_MSG_DELROUTERESP, resp);
  205. }
  206. bool ExtOsdep::getBindAddrs(std::map<InetAddress, std::string>& ret)
  207. {
  208. Mutex::Lock l(eodMutex);
  209. unsigned char req = ZT_EOD_MSG_GETBINDADDRS;
  210. __eodSend(req);
  211. zt_eod_msg_getbindaddrsresp* resp;
  212. unsigned char buf[ZT_EOD_MAXMSGSIZE];
  213. int r = __eodWait(ZT_EOD_MSG_GETBINDADDRSRESP, (unsigned char*)buf, sizeof(*resp), sizeof(buf));
  214. if (r < (int)sizeof(*resp)) {
  215. return false;
  216. }
  217. int c = (r - (int)sizeof(*resp)) / sizeof(resp->addrs[0]);
  218. resp = (zt_eod_msg_getbindaddrsresp*)buf;
  219. for (int i = 0; i < c; ++i) {
  220. ret[InetAddress(resp->addrs[i].data, resp->addrs[i].afi == 1 ? 4 : 16, resp->addrs[i].len)] = resp->addrs[i].ifname;
  221. }
  222. return resp->result;
  223. }
  224. ExtOsdepTap::ExtOsdepTap(
  225. const char* homePath,
  226. const MAC& mac,
  227. unsigned int mtu,
  228. unsigned int metric,
  229. uint64_t nwid,
  230. const char* friendlyName,
  231. void (*handler)(void*, void*, uint64_t, const MAC&, const MAC&, unsigned int, unsigned int, const void*, unsigned int),
  232. void* arg)
  233. : _handler(handler)
  234. , _arg(arg)
  235. , _nwid(nwid)
  236. , _mac(mac)
  237. , _homePath(homePath)
  238. , _mtu(mtu)
  239. , _fd(0)
  240. , _enabled(true)
  241. , _run(true)
  242. {
  243. zt_eod_msg_addtap req;
  244. req.cmd = ZT_EOD_MSG_ADDTAP;
  245. req.nwid = nwid;
  246. req.mtu = mtu;
  247. req.metric = metric;
  248. strncpyx(req.fname, friendlyName, sizeof(req.fname));
  249. mac.copyTo(req.mac, 6);
  250. zt_eod_msg_addtapresp resp;
  251. Mutex::Lock l(eodMutex);
  252. __eodSend(req);
  253. _fd = -1;
  254. if (__eodWait(ZT_EOD_MSG_ADDTAPRESP, (unsigned char*)&resp, sizeof(resp), sizeof(resp), &_fd) != sizeof(resp)) {
  255. throw std::runtime_error(std::string("could not create TAP"));
  256. }
  257. _dev = resp.name;
  258. if (_dev.empty() || _fd < 0) {
  259. throw std::runtime_error(std::string("could not create TAP"));
  260. }
  261. fcntl(_fd, F_SETFL, O_NONBLOCK);
  262. (void)::pipe(_shutdownSignalPipe);
  263. for (unsigned int t = 0; t < 2; ++t) {
  264. _tapReaderThread[t] = std::thread([this, t] {
  265. fd_set readfds, nullfds;
  266. int n, nfds, r;
  267. void* buf = nullptr;
  268. std::vector<void*> buffers;
  269. if (! _run) {
  270. return;
  271. }
  272. FD_ZERO(&readfds);
  273. FD_ZERO(&nullfds);
  274. nfds = (int)std::max(_shutdownSignalPipe[0], _fd) + 1;
  275. r = 0;
  276. for (;;) {
  277. FD_SET(_shutdownSignalPipe[0], &readfds);
  278. FD_SET(_fd, &readfds);
  279. select(nfds, &readfds, &nullfds, &nullfds, (struct timeval*)0);
  280. if (FD_ISSET(_shutdownSignalPipe[0], &readfds)) { // writes to shutdown pipe terminate thread
  281. break;
  282. }
  283. if (FD_ISSET(_fd, &readfds)) {
  284. for (;;) { // read until there are no more packets, then return to outer select() loop
  285. if (! buf) {
  286. // To reduce use of the mutex, we keep a local buffer vector and
  287. // swap (which is a pointer swap) with the global one when it's
  288. // empty. This retrieves a batch of buffers to use.
  289. if (buffers.empty()) {
  290. std::lock_guard<std::mutex> l(_buffers_l);
  291. buffers.swap(_buffers);
  292. }
  293. if (buffers.empty()) {
  294. buf = malloc(ZT_TAP_BUF_SIZE);
  295. if (! buf) {
  296. break;
  297. }
  298. }
  299. else {
  300. buf = buffers.back();
  301. buffers.pop_back();
  302. }
  303. }
  304. n = (int)::read(_fd, reinterpret_cast<uint8_t*>(buf) + r, ZT_TAP_BUF_SIZE - r);
  305. if (n > 0) {
  306. // Some tap drivers like to send the ethernet frame and the
  307. // payload in two chunks, so handle that by accumulating
  308. // data until we have at least a frame.
  309. r += n;
  310. if (r > 14) {
  311. if (r > ((int)_mtu + 14)) { // sanity check for weird TAP behavior on some platforms
  312. r = _mtu + 14;
  313. }
  314. if (_enabled && _tapqsize.load() < 1000) {
  315. ++_tapqsize;
  316. _tapq.post(std::pair<void*, int>(buf, r));
  317. buf = nullptr;
  318. }
  319. r = 0;
  320. }
  321. }
  322. else {
  323. r = 0;
  324. break;
  325. }
  326. }
  327. }
  328. }
  329. });
  330. }
  331. _tapProcessorThread = std::thread([this] {
  332. MAC to, from;
  333. std::pair<void*, int> qi;
  334. while (_tapq.get(qi)) {
  335. --_tapqsize;
  336. uint8_t* const b = reinterpret_cast<uint8_t*>(qi.first);
  337. if (b) {
  338. to.setTo(b, 6);
  339. from.setTo(b + 6, 6);
  340. unsigned int etherType = Utils::ntoh(((const uint16_t*)b)[6]);
  341. _handler(_arg, nullptr, _nwid, from, to, etherType, 0, (const void*)(b + 14), (unsigned int)(qi.second - 14));
  342. {
  343. std::lock_guard<std::mutex> l(_buffers_l);
  344. if (_buffers.size() < 128) {
  345. _buffers.push_back(qi.first);
  346. }
  347. else {
  348. free(qi.first);
  349. }
  350. }
  351. }
  352. else {
  353. break;
  354. }
  355. }
  356. });
  357. }
  358. ExtOsdepTap::~ExtOsdepTap()
  359. {
  360. _run = false;
  361. (void)::write(_shutdownSignalPipe[1], "\0", 1); // causes reader thread(s) to exit
  362. _tapq.post(std::pair<void*, int>(nullptr, 0)); // causes processor thread to exit
  363. _tapReaderThread[0].join();
  364. _tapReaderThread[1].join();
  365. _tapProcessorThread.join();
  366. ::close(_fd);
  367. ::close(_shutdownSignalPipe[0]);
  368. ::close(_shutdownSignalPipe[1]);
  369. for (std::vector<void*>::iterator i(_buffers.begin()); i != _buffers.end(); ++i) {
  370. free(*i);
  371. }
  372. std::vector<std::pair<void*, int> > dv(_tapq.drain());
  373. for (std::vector<std::pair<void*, int> >::iterator i(dv.begin()); i != dv.end(); ++i) {
  374. if (i->first) {
  375. free(i->first);
  376. }
  377. }
  378. zt_eod_msg_deltap req;
  379. req.cmd = ZT_EOD_MSG_DELTAP;
  380. strcpy(req.name, _dev.c_str());
  381. unsigned char resp;
  382. eodXchg(req, ZT_EOD_MSG_DELTAPRESP, resp);
  383. }
  384. void ExtOsdepTap::setEnabled(bool en)
  385. {
  386. _enabled = en;
  387. }
  388. bool ExtOsdepTap::enabled() const
  389. {
  390. return _enabled;
  391. }
  392. void ExtOsdepTap::doRemoveIp(const InetAddress& ip)
  393. {
  394. zt_eod_msg_ip req;
  395. req.cmd = ZT_EOD_MSG_DELIP;
  396. strcpy(req.name, _dev.c_str());
  397. req.afi = ip.isV4() ? 1 : 2;
  398. req.len = ip.netmaskBits();
  399. memcpy(req.data, ip.rawIpData(), ip.isV4() ? 4 : 16);
  400. unsigned char resp;
  401. __eodXchg(req, ZT_EOD_MSG_DELIPRESP, resp);
  402. }
  403. bool ExtOsdepTap::addIp(const InetAddress& ip)
  404. {
  405. Mutex::Lock l(eodMutex);
  406. for (auto i = allIps.begin(); i != allIps.end(); ++i) {
  407. if (*i == ip) {
  408. return true;
  409. }
  410. if (i->ipsEqual(ip)) {
  411. doRemoveIp(*i);
  412. }
  413. }
  414. zt_eod_msg_ip req;
  415. req.cmd = ZT_EOD_MSG_ADDIP;
  416. strcpy(req.name, _dev.c_str());
  417. req.afi = ip.isV4() ? 1 : 2;
  418. req.len = ip.netmaskBits();
  419. memcpy(req.data, ip.rawIpData(), ip.isV4() ? 4 : 16);
  420. unsigned char resp;
  421. __eodXchg(req, ZT_EOD_MSG_ADDIPRESP, resp);
  422. allIps.push_back(ip);
  423. return true;
  424. }
  425. bool ExtOsdepTap::addIps(std::vector<InetAddress> ips)
  426. {
  427. return false;
  428. }
  429. bool ExtOsdepTap::removeIp(const InetAddress& ip)
  430. {
  431. Mutex::Lock l(eodMutex);
  432. for (auto i = allIps.begin(); i != allIps.end(); ++i) {
  433. if (*i == ip) {
  434. doRemoveIp(*i);
  435. return true;
  436. }
  437. }
  438. return false;
  439. }
  440. std::vector<InetAddress> ExtOsdepTap::ips() const
  441. {
  442. std::vector<InetAddress> ret;
  443. Mutex::Lock l(eodMutex);
  444. zt_eod_msg_getips req;
  445. req.cmd = ZT_EOD_MSG_GETIPS;
  446. strcpy(req.name, _dev.c_str());
  447. __eodSend(req);
  448. zt_eod_msg_getipsresp* resp;
  449. unsigned char buf[ZT_EOD_MAXMSGSIZE];
  450. int r = __eodWait(ZT_EOD_MSG_GETIPSRESP, (unsigned char*)buf, sizeof(*resp), sizeof(buf));
  451. if (r < (int)sizeof(*resp)) {
  452. return ret;
  453. }
  454. int c = (r - (int)sizeof(*resp)) / sizeof(resp->addrs[0]);
  455. resp = (zt_eod_msg_getipsresp*)buf;
  456. for (int i = 0; i < c; ++i) {
  457. ret.push_back(InetAddress(resp->addrs[i].data, resp->addrs[i].afi == 1 ? 4 : 16, resp->addrs[i].len));
  458. }
  459. return ret;
  460. }
  461. void ExtOsdepTap::put(const MAC& from, const MAC& to, unsigned int etherType, const void* data, unsigned int len)
  462. {
  463. char putBuf[ZT_MAX_MTU + 64];
  464. if ((_fd > 0) && (len <= _mtu) && (_enabled)) {
  465. to.copyTo(putBuf, 6);
  466. from.copyTo(putBuf + 6, 6);
  467. *((uint16_t*)(putBuf + 12)) = htons((uint16_t)etherType);
  468. memcpy(putBuf + 14, data, len);
  469. len += 14;
  470. (void)::write(_fd, putBuf, len);
  471. }
  472. }
  473. std::string ExtOsdepTap::deviceName() const
  474. {
  475. return _dev;
  476. }
  477. void ExtOsdepTap::setFriendlyName(const char* friendlyName)
  478. {
  479. }
  480. void ExtOsdepTap::scanMulticastGroups(std::vector<MulticastGroup>& added, std::vector<MulticastGroup>& removed)
  481. {
  482. char *ptr, *ptr2;
  483. unsigned char mac[6];
  484. std::vector<MulticastGroup> newGroups;
  485. int fd = ::open("/proc/net/dev_mcast", O_RDONLY);
  486. if (fd > 0) {
  487. char buf[131072];
  488. int n = (int)::read(fd, buf, sizeof(buf));
  489. if ((n > 0) && (n < (int)sizeof(buf))) {
  490. buf[n] = (char)0;
  491. for (char* l = strtok_r(buf, "\r\n", &ptr); (l); l = strtok_r((char*)0, "\r\n", &ptr)) {
  492. int fno = 0;
  493. char* devname = (char*)0;
  494. char* mcastmac = (char*)0;
  495. for (char* f = strtok_r(l, " \t", &ptr2); (f); f = strtok_r((char*)0, " \t", &ptr2)) {
  496. if (fno == 1) {
  497. devname = f;
  498. }
  499. else if (fno == 4) {
  500. mcastmac = f;
  501. }
  502. ++fno;
  503. }
  504. if ((devname) && (! strcmp(devname, _dev.c_str())) && (mcastmac) && (Utils::unhex(mcastmac, mac, 6) == 6)) {
  505. newGroups.push_back(MulticastGroup(MAC(mac, 6), 0));
  506. }
  507. }
  508. }
  509. ::close(fd);
  510. }
  511. std::vector<InetAddress> allIps(ips());
  512. for (std::vector<InetAddress>::iterator ip(allIps.begin()); ip != allIps.end(); ++ip) {
  513. newGroups.push_back(MulticastGroup::deriveMulticastGroupForAddressResolution(*ip));
  514. }
  515. std::sort(newGroups.begin(), newGroups.end());
  516. newGroups.erase(std::unique(newGroups.begin(), newGroups.end()), newGroups.end());
  517. for (std::vector<MulticastGroup>::iterator m(newGroups.begin()); m != newGroups.end(); ++m) {
  518. if (! std::binary_search(_multicastGroups.begin(), _multicastGroups.end(), *m)) {
  519. added.push_back(*m);
  520. }
  521. }
  522. for (std::vector<MulticastGroup>::iterator m(_multicastGroups.begin()); m != _multicastGroups.end(); ++m) {
  523. if (! std::binary_search(newGroups.begin(), newGroups.end(), *m)) {
  524. removed.push_back(*m);
  525. }
  526. }
  527. _multicastGroups.swap(newGroups);
  528. }
  529. void ExtOsdepTap::setMtu(unsigned int mtu)
  530. {
  531. if (mtu == _mtu) {
  532. return;
  533. }
  534. _mtu = mtu;
  535. zt_eod_msg_setmtu req;
  536. req.cmd = ZT_EOD_MSG_SETMTU;
  537. strcpy(req.name, _dev.c_str());
  538. req.mtu = mtu;
  539. unsigned char resp;
  540. eodXchg(req, ZT_EOD_MSG_SETMTURESP, resp);
  541. }
  542. } // namespace ZeroTier