PostgreSQL.cpp 62 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842
  1. /*
  2. * Copyright (c)2019 ZeroTier, Inc.
  3. *
  4. * Use of this software is governed by the Business Source License included
  5. * in the LICENSE.TXT file in the project's root directory.
  6. *
  7. * Change Date: 2025-01-01
  8. *
  9. * On the date above, in accordance with the Business Source License, use
  10. * of this software will be governed by version 2.0 of the Apache License.
  11. */
  12. /****/
  13. #include "PostgreSQL.hpp"
  14. #ifdef ZT_CONTROLLER_USE_LIBPQ
  15. #include "../node/Constants.hpp"
  16. #include "../node/SHA512.hpp"
  17. #include "EmbeddedNetworkController.hpp"
  18. #include "../version.h"
  19. #include "Redis.hpp"
  20. #include <libpq-fe.h>
  21. #include <sstream>
  22. #include <iomanip>
  23. #include <climits>
  24. #include <chrono>
  25. // #define REDIS_TRACE 1
  26. using json = nlohmann::json;
  27. namespace {
  28. static const int DB_MINIMUM_VERSION = 38;
  /**
   * Current local time as human-readable text, used as a log-line prefix.
   *
   * @return The buffer handed back by ctime() with its trailing newline cut
   *         off, or "" when ctime() returns NULL. The storage belongs to the
   *         C library and is overwritten by later ctime()/asctime() calls.
   */
  static const char *_timestr()
  {
      const time_t now = time(0);
      char *const stamp = ctime(&now);
      if (stamp == nullptr)
          return "";

      // ctime() terminates its text with '\n'; end the string there instead.
      for (char *cursor = stamp; *cursor; ++cursor) {
          if (*cursor == '\n') {
              *cursor = (char)0;
              break;
          }
      }
      return stamp;
  }
  45. /*
  46. std::string join(const std::vector<std::string> &elements, const char * const separator)
  47. {
  48. switch(elements.size()) {
  49. case 0:
  50. return "";
  51. case 1:
  52. return elements[0];
  53. default:
  54. std::ostringstream os;
  55. std::copy(elements.begin(), elements.end()-1, std::ostream_iterator<std::string>(os, separator));
  56. os << *elements.rbegin();
  57. return os.str();
  58. }
  59. }
  60. */
  /**
   * Break a string into the pieces found between occurrences of a delimiter.
   *
   * Uses std::getline semantics: empty pieces between adjacent delimiters are
   * kept, an empty input yields no pieces, and a trailing delimiter does not
   * produce a final empty piece.
   *
   * @param str   Text to split
   * @param delim Separator character
   * @return Pieces in order of appearance
   */
  std::vector<std::string> split(std::string str, char delim){
      std::vector<std::string> pieces;
      std::istringstream reader(str);
      for (std::string piece; std::getline(reader, piece, delim); ) {
          pieces.push_back(piece);
      }
      return pieces;
  }
  /**
   * Percent-encode a string for use inside a URL component.
   *
   * ASCII letters, digits and '-', '_', '.', '~' are copied unchanged; every
   * other byte is written as '%' followed by two uppercase hex digits.
   *
   * The classification is done on the byte value with explicit ASCII ranges
   * rather than isalnum(): passing a negative plain char to isalnum() is
   * undefined behaviour, and its answer depends on the process locale.
   *
   * @param value Raw text (treated as a sequence of bytes)
   * @return Encoded text
   */
  std::string url_encode(const std::string &value) {
      static const char kHexDigits[] = "0123456789ABCDEF";

      std::string escaped;
      escaped.reserve(value.size());

      for (const char ch : value) {
          const unsigned char byte = static_cast<unsigned char>(ch);
          const bool unreserved =
              (byte >= 'A' && byte <= 'Z') ||
              (byte >= 'a' && byte <= 'z') ||
              (byte >= '0' && byte <= '9') ||
              byte == '-' || byte == '_' || byte == '.' || byte == '~';

          if (unreserved) {
              escaped += ch;
              continue;
          }

          // Any other byte is percent-encoded.
          escaped += '%';
          escaped += kHexDigits[byte >> 4];
          escaped += kHexDigits[byte & 0x0F];
      }
      return escaped;
  }
  88. } // anonymous namespace
  89. using namespace ZeroTier;
  90. MemberNotificationReceiver::MemberNotificationReceiver(PostgreSQL *p, pqxx::connection &c, const std::string &channel)
  91. : pqxx::notification_receiver(c, channel)
  92. , _psql(p)
  93. {
  94. fprintf(stderr, "initialize MemberNotificationReceiver\n");
  95. }
  96. void MemberNotificationReceiver::operator() (const std::string &payload, int packend_pid) {
  97. fprintf(stderr, "Member Notification received: %s\n", payload.c_str());
  98. Metrics::pgsql_mem_notification++;
  99. json tmp(json::parse(payload));
  100. json &ov = tmp["old_val"];
  101. json &nv = tmp["new_val"];
  102. json oldConfig, newConfig;
  103. if (ov.is_object()) oldConfig = ov;
  104. if (nv.is_object()) newConfig = nv;
  105. if (oldConfig.is_object() || newConfig.is_object()) {
  106. _psql->_memberChanged(oldConfig,newConfig,(_psql->_ready>=2));
  107. fprintf(stderr, "payload sent\n");
  108. }
  109. }
  110. NetworkNotificationReceiver::NetworkNotificationReceiver(PostgreSQL *p, pqxx::connection &c, const std::string &channel)
  111. : pqxx::notification_receiver(c, channel)
  112. , _psql(p)
  113. {
  114. fprintf(stderr, "initialize NetworkNotificationReceiver\n");
  115. }
  116. void NetworkNotificationReceiver::operator() (const std::string &payload, int packend_pid) {
  117. fprintf(stderr, "Network Notification received: %s\n", payload.c_str());
  118. Metrics::pgsql_net_notification++;
  119. json tmp(json::parse(payload));
  120. json &ov = tmp["old_val"];
  121. json &nv = tmp["new_val"];
  122. json oldConfig, newConfig;
  123. if (ov.is_object()) oldConfig = ov;
  124. if (nv.is_object()) newConfig = nv;
  125. if (oldConfig.is_object() || newConfig.is_object()) {
  126. _psql->_networkChanged(oldConfig,newConfig,(_psql->_ready>=2));
  127. fprintf(stderr, "payload sent\n");
  128. }
  129. }
  // Attrs:      ordered list of (string, string) pairs.
  // Item:       a string paired with its Attrs.
  // ItemStream: ordered list of Items.
  using Attrs      = std::vector< std::pair<std::string, std::string> >;
  using Item       = std::pair<std::string, Attrs>;
  using ItemStream = std::vector<Item>;
  133. PostgreSQL::PostgreSQL(const Identity &myId, const char *path, int listenPort, RedisConfig *rc)
  134. : DB()
  135. , _pool()
  136. , _myId(myId)
  137. , _myAddress(myId.address())
  138. , _ready(0)
  139. , _connected(1)
  140. , _run(1)
  141. , _waitNoticePrinted(false)
  142. , _listenPort(listenPort)
  143. , _rc(rc)
  144. , _redis(NULL)
  145. , _cluster(NULL)
  146. , _redisMemberStatus(false)
  147. {
  148. char myAddress[64];
  149. _myAddressStr = myId.address().toString(myAddress);
  150. _connString = std::string(path);
  151. auto f = std::make_shared<PostgresConnFactory>(_connString);
  152. _pool = std::make_shared<ConnectionPool<PostgresConnection> >(
  153. 15, 5, std::static_pointer_cast<ConnectionFactory>(f));
  154. memset(_ssoPsk, 0, sizeof(_ssoPsk));
  155. char *const ssoPskHex = getenv("ZT_SSO_PSK");
  156. #ifdef ZT_TRACE
  157. fprintf(stderr, "ZT_SSO_PSK: %s\n", ssoPskHex);
  158. #endif
  159. if (ssoPskHex) {
  160. // SECURITY: note that ssoPskHex will always be null-terminated if libc actually
  161. // returns something non-NULL. If the hex encodes something shorter than 48 bytes,
  162. // it will be padded at the end with zeroes. If longer, it'll be truncated.
  163. Utils::unhex(ssoPskHex, _ssoPsk, sizeof(_ssoPsk));
  164. }
  165. const char *redisMemberStatus = getenv("ZT_REDIS_MEMBER_STATUS");
  166. if (redisMemberStatus && (strcmp(redisMemberStatus, "true") == 0)) {
  167. _redisMemberStatus = true;
  168. fprintf(stderr, "Using redis for member status\n");
  169. }
  170. auto c = _pool->borrow();
  171. pqxx::work txn{*c->c};
  172. pqxx::row r{txn.exec1("SELECT version FROM ztc_database")};
  173. int dbVersion = r[0].as<int>();
  174. txn.commit();
  175. if (dbVersion < DB_MINIMUM_VERSION) {
  176. fprintf(stderr, "Central database schema version too low. This controller version requires a minimum schema version of %d. Please upgrade your Central instance", DB_MINIMUM_VERSION);
  177. exit(1);
  178. }
  179. _pool->unborrow(c);
  180. if (_rc != NULL) {
  181. sw::redis::ConnectionOptions opts;
  182. sw::redis::ConnectionPoolOptions poolOpts;
  183. opts.host = _rc->hostname;
  184. opts.port = _rc->port;
  185. opts.password = _rc->password;
  186. opts.db = 0;
  187. opts.keep_alive = true;
  188. opts.connect_timeout = std::chrono::seconds(3);
  189. poolOpts.size = 25;
  190. poolOpts.wait_timeout = std::chrono::seconds(5);
  191. poolOpts.connection_lifetime = std::chrono::minutes(3);
  192. poolOpts.connection_idle_time = std::chrono::minutes(1);
  193. if (_rc->clusterMode) {
  194. fprintf(stderr, "Using Redis in Cluster Mode\n");
  195. _cluster = std::make_shared<sw::redis::RedisCluster>(opts, poolOpts);
  196. } else {
  197. fprintf(stderr, "Using Redis in Standalone Mode\n");
  198. _redis = std::make_shared<sw::redis::Redis>(opts, poolOpts);
  199. }
  200. }
  201. _readyLock.lock();
  202. fprintf(stderr, "[%s] NOTICE: %.10llx controller PostgreSQL waiting for initial data download..." ZT_EOL_S, ::_timestr(), (unsigned long long)_myAddress.toInt());
  203. _waitNoticePrinted = true;
  204. initializeNetworks();
  205. initializeMembers();
  206. _heartbeatThread = std::thread(&PostgreSQL::heartbeat, this);
  207. _membersDbWatcher = std::thread(&PostgreSQL::membersDbWatcher, this);
  208. _networksDbWatcher = std::thread(&PostgreSQL::networksDbWatcher, this);
  209. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  210. _commitThread[i] = std::thread(&PostgreSQL::commitThread, this);
  211. }
  212. _onlineNotificationThread = std::thread(&PostgreSQL::onlineNotificationThread, this);
  213. }
  214. PostgreSQL::~PostgreSQL()
  215. {
  216. _run = 0;
  217. std::this_thread::sleep_for(std::chrono::milliseconds(100));
  218. _heartbeatThread.join();
  219. _membersDbWatcher.join();
  220. _networksDbWatcher.join();
  221. _commitQueue.stop();
  222. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  223. _commitThread[i].join();
  224. }
  225. _onlineNotificationThread.join();
  226. }
  227. bool PostgreSQL::waitForReady()
  228. {
  229. while (_ready < 2) {
  230. _readyLock.lock();
  231. _readyLock.unlock();
  232. }
  233. return true;
  234. }
  235. bool PostgreSQL::isReady()
  236. {
  237. return ((_ready == 2)&&(_connected));
  238. }
  239. bool PostgreSQL::save(nlohmann::json &record,bool notifyListeners)
  240. {
  241. bool modified = false;
  242. try {
  243. if (!record.is_object()) {
  244. fprintf(stderr, "record is not an object?!?\n");
  245. return false;
  246. }
  247. const std::string objtype = record["objtype"];
  248. if (objtype == "network") {
  249. //fprintf(stderr, "network save\n");
  250. const uint64_t nwid = OSUtils::jsonIntHex(record["id"],0ULL);
  251. if (nwid) {
  252. nlohmann::json old;
  253. get(nwid,old);
  254. if ((!old.is_object())||(!_compareRecords(old,record))) {
  255. record["revision"] = OSUtils::jsonInt(record["revision"],0ULL) + 1ULL;
  256. _commitQueue.post(std::pair<nlohmann::json,bool>(record,notifyListeners));
  257. modified = true;
  258. }
  259. }
  260. } else if (objtype == "member") {
  261. std::string networkId = record["nwid"];
  262. std::string memberId = record["id"];
  263. const uint64_t nwid = OSUtils::jsonIntHex(record["nwid"],0ULL);
  264. const uint64_t id = OSUtils::jsonIntHex(record["id"],0ULL);
  265. //fprintf(stderr, "member save %s-%s\n", networkId.c_str(), memberId.c_str());
  266. if ((id)&&(nwid)) {
  267. nlohmann::json network,old;
  268. get(nwid,network,id,old);
  269. if ((!old.is_object())||(!_compareRecords(old,record))) {
  270. //fprintf(stderr, "commit queue post\n");
  271. record["revision"] = OSUtils::jsonInt(record["revision"],0ULL) + 1ULL;
  272. _commitQueue.post(std::pair<nlohmann::json,bool>(record,notifyListeners));
  273. modified = true;
  274. } else {
  275. //fprintf(stderr, "no change\n");
  276. }
  277. }
  278. } else {
  279. fprintf(stderr, "uhh waaat\n");
  280. }
  281. } catch (std::exception &e) {
  282. fprintf(stderr, "Error on PostgreSQL::save: %s\n", e.what());
  283. } catch (...) {
  284. fprintf(stderr, "Unknown error on PostgreSQL::save\n");
  285. }
  286. return modified;
  287. }
  288. void PostgreSQL::eraseNetwork(const uint64_t networkId)
  289. {
  290. fprintf(stderr, "PostgreSQL::eraseNetwork\n");
  291. char tmp2[24];
  292. waitForReady();
  293. Utils::hex(networkId, tmp2);
  294. std::pair<nlohmann::json,bool> tmp;
  295. tmp.first["id"] = tmp2;
  296. tmp.first["objtype"] = "_delete_network";
  297. tmp.second = true;
  298. _commitQueue.post(tmp);
  299. nlohmann::json nullJson;
  300. _networkChanged(tmp.first, nullJson, true);
  301. }
  302. void PostgreSQL::eraseMember(const uint64_t networkId, const uint64_t memberId)
  303. {
  304. fprintf(stderr, "PostgreSQL::eraseMember\n");
  305. char tmp2[24];
  306. waitForReady();
  307. std::pair<nlohmann::json,bool> tmp, nw;
  308. Utils::hex(networkId, tmp2);
  309. tmp.first["nwid"] = tmp2;
  310. Utils::hex(memberId, tmp2);
  311. tmp.first["id"] = tmp2;
  312. tmp.first["objtype"] = "_delete_member";
  313. tmp.second = true;
  314. _commitQueue.post(tmp);
  315. nlohmann::json nullJson;
  316. _memberChanged(tmp.first, nullJson, true);
  317. }
  318. void PostgreSQL::nodeIsOnline(const uint64_t networkId, const uint64_t memberId, const InetAddress &physicalAddress)
  319. {
  320. std::lock_guard<std::mutex> l(_lastOnline_l);
  321. std::pair<int64_t, InetAddress> &i = _lastOnline[std::pair<uint64_t,uint64_t>(networkId, memberId)];
  322. i.first = OSUtils::now();
  323. if (physicalAddress) {
  324. i.second = physicalAddress;
  325. }
  326. }
  327. AuthInfo PostgreSQL::getSSOAuthInfo(const nlohmann::json &member, const std::string &redirectURL)
  328. {
  329. Metrics::db_get_sso_info++;
  330. // NONCE is just a random character string. no semantic meaning
  331. // state = HMAC SHA384 of Nonce based on shared sso key
  332. //
  333. // need nonce timeout in database? make sure it's used within X time
  334. // X is 5 minutes for now. Make configurable later?
  335. //
  336. // how do we tell when a nonce is used? if auth_expiration_time is set
  337. std::string networkId = member["nwid"];
  338. std::string memberId = member["id"];
  339. char authenticationURL[4096] = {0};
  340. AuthInfo info;
  341. info.enabled = true;
  342. //if (memberId == "a10dccea52" && networkId == "8056c2e21c24673d") {
  343. // fprintf(stderr, "invalid authinfo for grant's machine\n");
  344. // info.version=1;
  345. // return info;
  346. //}
  347. // fprintf(stderr, "PostgreSQL::updateMemberOnLoad: %s-%s\n", networkId.c_str(), memberId.c_str());
  348. std::shared_ptr<PostgresConnection> c;
  349. try {
  350. c = _pool->borrow();
  351. pqxx::work w(*c->c);
  352. char nonceBytes[16] = {0};
  353. std::string nonce = "";
  354. // check if the member exists first.
  355. pqxx::row count = w.exec_params1("SELECT count(id) FROM ztc_member WHERE id = $1 AND network_id = $2 AND deleted = false", memberId, networkId);
  356. if (count[0].as<int>() == 1) {
  357. // get active nonce, if exists.
  358. pqxx::result r = w.exec_params("SELECT nonce FROM ztc_sso_expiry "
  359. "WHERE network_id = $1 AND member_id = $2 "
  360. "AND ((NOW() AT TIME ZONE 'UTC') <= authentication_expiry_time) AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  361. networkId, memberId);
  362. if (r.size() == 0) {
  363. // no active nonce.
  364. // find an unused nonce, if one exists.
  365. pqxx::result r = w.exec_params("SELECT nonce FROM ztc_sso_expiry "
  366. "WHERE network_id = $1 AND member_id = $2 "
  367. "AND authentication_expiry_time IS NULL AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  368. networkId, memberId);
  369. if (r.size() == 1) {
  370. // we have an existing nonce. Use it
  371. nonce = r.at(0)[0].as<std::string>();
  372. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  373. } else if (r.empty()) {
  374. // create a nonce
  375. Utils::getSecureRandom(nonceBytes, 16);
  376. char nonceBuf[64] = {0};
  377. Utils::hex(nonceBytes, sizeof(nonceBytes), nonceBuf);
  378. nonce = std::string(nonceBuf);
  379. pqxx::result ir = w.exec_params0("INSERT INTO ztc_sso_expiry "
  380. "(nonce, nonce_expiration, network_id, member_id) VALUES "
  381. "($1, TO_TIMESTAMP($2::double precision/1000), $3, $4)",
  382. nonce, OSUtils::now() + 300000, networkId, memberId);
  383. w.commit();
  384. } else {
  385. // > 1 ?!? Thats an error!
  386. fprintf(stderr, "> 1 unused nonce!\n");
  387. exit(6);
  388. }
  389. } else if (r.size() == 1) {
  390. nonce = r.at(0)[0].as<std::string>();
  391. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  392. } else {
  393. // more than 1 nonce in use? Uhhh...
  394. fprintf(stderr, "> 1 nonce in use for network member?!?\n");
  395. exit(7);
  396. }
  397. r = w.exec_params(
  398. "SELECT oc.client_id, oc.authorization_endpoint, oc.issuer, oc.provider, oc.sso_impl_version "
  399. "FROM ztc_network AS n "
  400. "INNER JOIN ztc_org o "
  401. " ON o.owner_id = n.owner_id "
  402. "LEFT OUTER JOIN ztc_network_oidc_config noc "
  403. " ON noc.network_id = n.id "
  404. "LEFT OUTER JOIN ztc_oidc_config oc "
  405. " ON noc.client_id = oc.client_id AND noc.org_id = o.org_id "
  406. "WHERE n.id = $1 AND n.sso_enabled = true", networkId);
  407. std::string client_id = "";
  408. std::string authorization_endpoint = "";
  409. std::string issuer = "";
  410. std::string provider = "";
  411. uint64_t sso_version = 0;
  412. if (r.size() == 1) {
  413. client_id = r.at(0)[0].as<std::optional<std::string>>().value_or("");
  414. authorization_endpoint = r.at(0)[1].as<std::optional<std::string>>().value_or("");
  415. issuer = r.at(0)[2].as<std::optional<std::string>>().value_or("");
  416. provider = r.at(0)[3].as<std::optional<std::string>>().value_or("");
  417. sso_version = r.at(0)[4].as<std::optional<uint64_t>>().value_or(1);
  418. } else if (r.size() > 1) {
  419. fprintf(stderr, "ERROR: More than one auth endpoint for an organization?!?!? NetworkID: %s\n", networkId.c_str());
  420. } else {
  421. fprintf(stderr, "No client or auth endpoint?!?\n");
  422. }
  423. info.version = sso_version;
  424. // no catch all else because we don't actually care if no records exist here. just continue as normal.
  425. if ((!client_id.empty())&&(!authorization_endpoint.empty())) {
  426. uint8_t state[48];
  427. HMACSHA384(_ssoPsk, nonceBytes, sizeof(nonceBytes), state);
  428. char state_hex[256];
  429. Utils::hex(state, 48, state_hex);
  430. if (info.version == 0) {
  431. char url[2048] = {0};
  432. OSUtils::ztsnprintf(url, sizeof(authenticationURL),
  433. "%s?response_type=id_token&response_mode=form_post&scope=openid+email+profile&redirect_uri=%s&nonce=%s&state=%s&client_id=%s",
  434. authorization_endpoint.c_str(),
  435. url_encode(redirectURL).c_str(),
  436. nonce.c_str(),
  437. state_hex,
  438. client_id.c_str());
  439. info.authenticationURL = std::string(url);
  440. } else if (info.version == 1) {
  441. info.ssoClientID = client_id;
  442. info.issuerURL = issuer;
  443. info.ssoProvider = provider;
  444. info.ssoNonce = nonce;
  445. info.ssoState = std::string(state_hex) + "_" +networkId;
  446. info.centralAuthURL = redirectURL;
  447. #ifdef ZT_DEBUG
  448. fprintf(
  449. stderr,
  450. "ssoClientID: %s\nissuerURL: %s\nssoNonce: %s\nssoState: %s\ncentralAuthURL: %s\nprovider: %s\n",
  451. info.ssoClientID.c_str(),
  452. info.issuerURL.c_str(),
  453. info.ssoNonce.c_str(),
  454. info.ssoState.c_str(),
  455. info.centralAuthURL.c_str(),
  456. provider.c_str());
  457. #endif
  458. }
  459. } else {
  460. fprintf(stderr, "client_id: %s\nauthorization_endpoint: %s\n", client_id.c_str(), authorization_endpoint.c_str());
  461. }
  462. }
  463. _pool->unborrow(c);
  464. } catch (std::exception &e) {
  465. if (c) {
  466. _pool->unborrow(c);
  467. }
  468. fprintf(stderr, "ERROR: Error updating member on load for network %s: %s\n", networkId.c_str(), e.what());
  469. }
  470. return info; //std::string(authenticationURL);
  471. }
  472. void PostgreSQL::initializeNetworks()
  473. {
  474. try {
  475. std::string setKey = "networks:{" + _myAddressStr + "}";
  476. fprintf(stderr, "Initializing Networks...\n");
  477. if (_redisMemberStatus) {
  478. fprintf(stderr, "Init Redis for networks...\n");
  479. try {
  480. if (_rc->clusterMode) {
  481. _cluster->del(setKey);
  482. } else {
  483. _redis->del(setKey);
  484. }
  485. } catch (sw::redis::Error &e) {
  486. // ignore. if this key doesn't exist, there's no reason to delete it
  487. }
  488. }
  489. std::unordered_set<std::string> networkSet;
  490. char qbuf[2048] = {0};
  491. sprintf(qbuf,
  492. "SELECT n.id, (EXTRACT(EPOCH FROM n.creation_time AT TIME ZONE 'UTC')*1000)::bigint as creation_time, n.capabilities, "
  493. "n.enable_broadcast, (EXTRACT(EPOCH FROM n.last_modified AT TIME ZONE 'UTC')*1000)::bigint AS last_modified, n.mtu, n.multicast_limit, n.name, n.private, n.remote_trace_level, "
  494. "n.remote_trace_target, n.revision, n.rules, n.tags, n.v4_assign_mode, n.v6_assign_mode, n.sso_enabled, (CASE WHEN n.sso_enabled THEN noc.client_id ELSE NULL END) as client_id, "
  495. "(CASE WHEN n.sso_enabled THEN oc.authorization_endpoint ELSE NULL END) as authorization_endpoint, "
  496. "(CASE WHEN n.sso_enabled THEN oc.provider ELSE NULL END) as provider, d.domain, d.servers, "
  497. "ARRAY(SELECT CONCAT(host(ip_range_start),'|', host(ip_range_end)) FROM ztc_network_assignment_pool WHERE network_id = n.id) AS assignment_pool, "
  498. "ARRAY(SELECT CONCAT(host(address),'/',bits::text,'|',COALESCE(host(via), 'NULL'))FROM ztc_network_route WHERE network_id = n.id) AS routes "
  499. "FROM ztc_network n "
  500. "LEFT OUTER JOIN ztc_org o "
  501. " ON o.owner_id = n.owner_id "
  502. "LEFT OUTER JOIN ztc_network_oidc_config noc "
  503. " ON noc.network_id = n.id "
  504. "LEFT OUTER JOIN ztc_oidc_config oc "
  505. " ON noc.client_id = oc.client_id AND oc.org_id = o.org_id "
  506. "LEFT OUTER JOIN ztc_network_dns d "
  507. " ON d.network_id = n.id "
  508. "WHERE deleted = false AND controller_id = '%s'", _myAddressStr.c_str());
  509. auto c = _pool->borrow();
  510. auto c2 = _pool->borrow();
  511. pqxx::work w{*c->c};
  512. fprintf(stderr, "Load networks from psql...\n");
  513. auto stream = pqxx::stream_from::query(w, qbuf);
  514. std::tuple<
  515. std::string // network ID
  516. , std::optional<int64_t> // creationTime
  517. , std::optional<std::string> // capabilities
  518. , std::optional<bool> // enableBroadcast
  519. , std::optional<uint64_t> // lastModified
  520. , std::optional<int> // mtu
  521. , std::optional<int> // multicastLimit
  522. , std::optional<std::string> // name
  523. , bool // private
  524. , std::optional<int> // remoteTraceLevel
  525. , std::optional<std::string> // remoteTraceTarget
  526. , std::optional<uint64_t> // revision
  527. , std::optional<std::string> // rules
  528. , std::optional<std::string> // tags
  529. , std::optional<std::string> // v4AssignMode
  530. , std::optional<std::string> // v6AssignMode
  531. , std::optional<bool> // ssoEnabled
  532. , std::optional<std::string> // clientId
  533. , std::optional<std::string> // authorizationEndpoint
  534. , std::optional<std::string> // ssoProvider
  535. , std::optional<std::string> // domain
  536. , std::optional<std::string> // servers
  537. , std::string // assignmentPoolString
  538. , std::string // routeString
  539. > row;
  540. uint64_t count = 0;
  541. auto tmp = std::chrono::high_resolution_clock::now();
  542. uint64_t total = 0;
  543. while (stream >> row) {
  544. auto start = std::chrono::high_resolution_clock::now();
  545. json empty;
  546. json config;
  547. initNetwork(config);
  548. std::string nwid = std::get<0>(row);
  549. std::optional<int64_t> creationTime = std::get<1>(row);
  550. std::optional<std::string> capabilities = std::get<2>(row);
  551. std::optional<bool> enableBroadcast = std::get<3>(row);
  552. std::optional<uint64_t> lastModified = std::get<4>(row);
  553. std::optional<int> mtu = std::get<5>(row);
  554. std::optional<int> multicastLimit = std::get<6>(row);
  555. std::optional<std::string> name = std::get<7>(row);
  556. bool isPrivate = std::get<8>(row);
  557. std::optional<int> remoteTraceLevel = std::get<9>(row);
  558. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  559. std::optional<uint64_t> revision = std::get<11>(row);
  560. std::optional<std::string> rules = std::get<12>(row);
  561. std::optional<std::string> tags = std::get<13>(row);
  562. std::optional<std::string> v4AssignMode = std::get<14>(row);
  563. std::optional<std::string> v6AssignMode = std::get<15>(row);
  564. std::optional<bool> ssoEnabled = std::get<16>(row);
  565. std::optional<std::string> clientId = std::get<17>(row);
  566. std::optional<std::string> authorizationEndpoint = std::get<18>(row);
  567. std::optional<std::string> ssoProvider = std::get<19>(row);
  568. std::optional<std::string> dnsDomain = std::get<20>(row);
  569. std::optional<std::string> dnsServers = std::get<21>(row);
  570. std::string assignmentPoolString = std::get<22>(row);
  571. std::string routesString = std::get<23>(row);
  572. config["id"] = nwid;
  573. config["nwid"] = nwid;
  574. config["creationTime"] = creationTime.value_or(0);
  575. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  576. config["enableBroadcast"] = enableBroadcast.value_or(false);
  577. config["lastModified"] = lastModified.value_or(0);
  578. config["mtu"] = mtu.value_or(2800);
  579. config["multicastLimit"] = multicastLimit.value_or(64);
  580. config["name"] = name.value_or("");
  581. config["private"] = isPrivate;
  582. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  583. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  584. config["revision"] = revision.value_or(0);
  585. config["rules"] = json::parse(rules.value_or("[]"));
  586. config["tags"] = json::parse(tags.value_or("[]"));
  587. config["v4AssignMode"] = json::parse(v4AssignMode.value_or("{}"));
  588. config["v6AssignMode"] = json::parse(v6AssignMode.value_or("{}"));
  589. config["ssoEnabled"] = ssoEnabled.value_or(false);
  590. config["objtype"] = "network";
  591. config["ipAssignmentPools"] = json::array();
  592. config["routes"] = json::array();
  593. config["clientId"] = clientId.value_or("");
  594. config["authorizationEndpoint"] = authorizationEndpoint.value_or("");
  595. config["provider"] = ssoProvider.value_or("");
  596. networkSet.insert(nwid);
  597. if (dnsDomain.has_value()) {
  598. std::string serverList = dnsServers.value();
  599. json obj;
  600. auto servers = json::array();
  601. if (serverList.rfind("{",0) != std::string::npos) {
  602. serverList = serverList.substr(1, serverList.size()-2);
  603. std::stringstream ss(serverList);
  604. while(ss.good()) {
  605. std::string server;
  606. std::getline(ss, server, ',');
  607. servers.push_back(server);
  608. }
  609. }
  610. obj["domain"] = dnsDomain.value();
  611. obj["servers"] = servers;
  612. config["dns"] = obj;
  613. }
  614. config["ipAssignmentPools"] = json::array();
  615. if (assignmentPoolString != "{}") {
  616. std::string tmp = assignmentPoolString.substr(1, assignmentPoolString.size()-2);
  617. std::vector<std::string> assignmentPools = split(tmp, ',');
  618. for (auto it = assignmentPools.begin(); it != assignmentPools.end(); ++it) {
  619. std::vector<std::string> r = split(*it, '|');
  620. json ip;
  621. ip["ipRangeStart"] = r[0];
  622. ip["ipRangeEnd"] = r[1];
  623. config["ipAssignmentPools"].push_back(ip);
  624. }
  625. }
  626. config["routes"] = json::array();
  627. if (routesString != "{}") {
  628. std::string tmp = routesString.substr(1, routesString.size()-2);
  629. std::vector<std::string> routes = split(tmp, ',');
  630. for (auto it = routes.begin(); it != routes.end(); ++it) {
  631. std::vector<std::string> r = split(*it, '|');
  632. json route;
  633. route["target"] = r[0];
  634. route["via"] = ((route["via"] == "NULL")? nullptr : r[1]);
  635. config["routes"].push_back(route);
  636. }
  637. }
  638. Metrics::network_count++;
  639. _networkChanged(empty, config, false);
  640. auto end = std::chrono::high_resolution_clock::now();
  641. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);;
  642. total += dur.count();
  643. ++count;
  644. if (count > 0 && count % 10000 == 0) {
  645. fprintf(stderr, "Averaging %llu us per network\n", (total/count));
  646. }
  647. }
  648. if (count > 0) {
  649. fprintf(stderr, "Took %llu us per network to load\n", (total/count));
  650. }
  651. stream.complete();
  652. w.commit();
  653. _pool->unborrow(c2);
  654. _pool->unborrow(c);
  655. fprintf(stderr, "done.\n");
  656. if (!networkSet.empty()) {
  657. if (_redisMemberStatus) {
  658. fprintf(stderr, "adding networks to redis...\n");
  659. if (_rc->clusterMode) {
  660. auto tx = _cluster->transaction(_myAddressStr, true, false);
  661. tx.sadd(setKey, networkSet.begin(), networkSet.end());
  662. tx.exec();
  663. } else {
  664. auto tx = _redis->transaction(true, false);
  665. tx.sadd(setKey, networkSet.begin(), networkSet.end());
  666. tx.exec();
  667. }
  668. fprintf(stderr, "done.\n");
  669. }
  670. }
  671. if (++this->_ready == 2) {
  672. if (_waitNoticePrinted) {
  673. fprintf(stderr,"[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S,_timestr(),(unsigned long long)_myAddress.toInt());
  674. }
  675. _readyLock.unlock();
  676. }
  677. fprintf(stderr, "network init done.\n");
  678. } catch (sw::redis::Error &e) {
  679. fprintf(stderr, "ERROR: Error initializing networks in Redis: %s\n", e.what());
  680. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  681. exit(-1);
  682. } catch (std::exception &e) {
  683. fprintf(stderr, "ERROR: Error initializing networks: %s\n", e.what());
  684. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  685. exit(-1);
  686. }
  687. }
  688. void PostgreSQL::initializeMembers()
  689. {
  690. std::string memberId;
  691. std::string networkId;
  692. try {
  693. std::unordered_map<std::string, std::string> networkMembers;
  694. fprintf(stderr, "Initializing Members...\n");
  695. std::string setKeyBase = "network-nodes-all:{" + _myAddressStr + "}:";
  696. if (_redisMemberStatus) {
  697. fprintf(stderr, "Initialize Redis for members...\n");
  698. std::unique_lock<std::shared_mutex> l(_networks_l);
  699. std::unordered_set<std::string> deletes;
  700. for ( auto it : _networks) {
  701. uint64_t nwid_i = it.first;
  702. char nwidTmp[64] = {0};
  703. OSUtils::ztsnprintf(nwidTmp, sizeof(nwidTmp), "%.16llx", nwid_i);
  704. std::string nwid(nwidTmp);
  705. std::string key = setKeyBase + nwid;
  706. deletes.insert(key);
  707. }
  708. if (!deletes.empty()) {
  709. try {
  710. if (_rc->clusterMode) {
  711. auto tx = _cluster->transaction(_myAddressStr, true, false);
  712. for (std::string k : deletes) {
  713. tx.del(k);
  714. }
  715. tx.exec();
  716. } else {
  717. auto tx = _redis->transaction(true, false);
  718. for (std::string k : deletes) {
  719. tx.del(k);
  720. }
  721. tx.exec();
  722. }
  723. } catch (sw::redis::Error &e) {
  724. // ignore
  725. }
  726. }
  727. }
  728. char qbuf[2048];
  729. sprintf(qbuf,
  730. "SELECT m.id, m.network_id, m.active_bridge, m.authorized, m.capabilities, "
  731. "(EXTRACT(EPOCH FROM m.creation_time AT TIME ZONE 'UTC')*1000)::bigint, m.identity, "
  732. "(EXTRACT(EPOCH FROM m.last_authorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  733. "(EXTRACT(EPOCH FROM m.last_deauthorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  734. "m.remote_trace_level, m.remote_trace_target, m.tags, m.v_major, m.v_minor, m.v_rev, m.v_proto, "
  735. "m.no_auto_assign_ips, m.revision, m.sso_exempt, "
  736. "(CASE WHEN n.sso_enabled = TRUE AND m.sso_exempt = FALSE THEN "
  737. " ( "
  738. " SELECT (EXTRACT(EPOCH FROM e.authentication_expiry_time)*1000)::bigint "
  739. " FROM ztc_sso_expiry e "
  740. " INNER JOIN ztc_network n1 "
  741. " ON n1.id = e.network_id AND n1.deleted = TRUE "
  742. " WHERE e.network_id = m.network_id AND e.member_id = m.id AND n.sso_enabled = TRUE AND e.authentication_expiry_time IS NOT NULL "
  743. " ORDER BY e.authentication_expiry_time DESC LIMIT 1 "
  744. " ) "
  745. " ELSE NULL "
  746. " END) AS authentication_expiry_time, "
  747. "ARRAY(SELECT DISTINCT address FROM ztc_member_ip_assignment WHERE member_id = m.id AND network_id = m.network_id) AS assigned_addresses "
  748. "FROM ztc_member m "
  749. "INNER JOIN ztc_network n "
  750. " ON n.id = m.network_id "
  751. "WHERE n.controller_id = '%s' AND n.deleted = FALSE AND m.deleted = FALSE", _myAddressStr.c_str());
  752. auto c = _pool->borrow();
  753. auto c2 = _pool->borrow();
  754. pqxx::work w{*c->c};
  755. fprintf(stderr, "Load members from psql...\n");
  756. auto stream = pqxx::stream_from::query(w, qbuf);
  757. std::tuple<
  758. std::string // memberId
  759. , std::string // memberId
  760. , std::optional<bool> // activeBridge
  761. , std::optional<bool> // authorized
  762. , std::optional<std::string> // capabilities
  763. , std::optional<uint64_t> // creationTime
  764. , std::optional<std::string> // identity
  765. , std::optional<uint64_t> // lastAuthorizedTime
  766. , std::optional<uint64_t> // lastDeauthorizedTime
  767. , std::optional<int> // remoteTraceLevel
  768. , std::optional<std::string> // remoteTraceTarget
  769. , std::optional<std::string> // tags
  770. , std::optional<int> // vMajor
  771. , std::optional<int> // vMinor
  772. , std::optional<int> // vRev
  773. , std::optional<int> // vProto
  774. , std::optional<bool> // noAutoAssignIps
  775. , std::optional<uint64_t> // revision
  776. , std::optional<bool> // ssoExempt
  777. , std::optional<uint64_t> // authenticationExpiryTime
  778. , std::string // assignedAddresses
  779. > row;
  780. uint64_t count = 0;
  781. auto tmp = std::chrono::high_resolution_clock::now();
  782. uint64_t total = 0;
  783. while (stream >> row) {
  784. auto start = std::chrono::high_resolution_clock::now();
  785. json empty;
  786. json config;
  787. initMember(config);
  788. memberId = std::get<0>(row);
  789. networkId = std::get<1>(row);
  790. std::optional<bool> activeBridge = std::get<2>(row);
  791. std::optional<bool> authorized = std::get<3>(row);
  792. std::optional<std::string> capabilities = std::get<4>(row);
  793. std::optional<uint64_t> creationTime = std::get<5>(row);
  794. std::optional<std::string> identity = std::get<6>(row);
  795. std::optional<uint64_t> lastAuthorizedTime = std::get<7>(row);
  796. std::optional<uint64_t> lastDeauthorizedTime = std::get<8>(row);
  797. std::optional<int> remoteTraceLevel = std::get<9>(row);
  798. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  799. std::optional<std::string> tags = std::get<11>(row);
  800. std::optional<int> vMajor = std::get<12>(row);
  801. std::optional<int> vMinor = std::get<13>(row);
  802. std::optional<int> vRev = std::get<14>(row);
  803. std::optional<int> vProto = std::get<15>(row);
  804. std::optional<bool> noAutoAssignIps = std::get<16>(row);
  805. std::optional<uint64_t> revision = std::get<17>(row);
  806. std::optional<bool> ssoExempt = std::get<18>(row);
  807. std::optional<uint64_t> authenticationExpiryTime = std::get<19>(row);
  808. std::string assignedAddresses = std::get<20>(row);
  809. networkMembers.insert(std::pair<std::string, std::string>(setKeyBase+networkId, memberId));
  810. config["id"] = memberId;
  811. config["address"] = memberId;
  812. config["nwid"] = networkId;
  813. config["activeBridge"] = activeBridge.value_or(false);
  814. config["authorized"] = authorized.value_or(false);
  815. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  816. config["creationTime"] = creationTime.value_or(0);
  817. config["identity"] = identity.value_or("");
  818. config["lastAuthorizedTime"] = lastAuthorizedTime.value_or(0);
  819. config["lastDeauthorizedTime"] = lastDeauthorizedTime.value_or(0);
  820. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  821. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  822. config["tags"] = json::parse(tags.value_or("[]"));
  823. config["vMajor"] = vMajor.value_or(-1);
  824. config["vMinor"] = vMinor.value_or(-1);
  825. config["vRev"] = vRev.value_or(-1);
  826. config["vProto"] = vProto.value_or(-1);
  827. config["noAutoAssignIps"] = noAutoAssignIps.value_or(false);
  828. config["revision"] = revision.value_or(0);
  829. config["ssoExempt"] = ssoExempt.value_or(false);
  830. config["authenticationExpiryTime"] = authenticationExpiryTime.value_or(0);
  831. config["objtype"] = "member";
  832. config["ipAssignments"] = json::array();
  833. if (assignedAddresses != "{}") {
  834. std::string tmp = assignedAddresses.substr(1, assignedAddresses.size()-2);
  835. std::vector<std::string> addrs = split(tmp, ',');
  836. for (auto it = addrs.begin(); it != addrs.end(); ++it) {
  837. config["ipAssignments"].push_back(*it);
  838. }
  839. }
  840. Metrics::member_count++;
  841. _memberChanged(empty, config, false);
  842. memberId = "";
  843. networkId = "";
  844. auto end = std::chrono::high_resolution_clock::now();
  845. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);
  846. total += dur.count();
  847. ++count;
  848. if (count > 0 && count % 10000 == 0) {
  849. fprintf(stderr, "Averaging %llu us per member\n", (total/count));
  850. }
  851. }
  852. if (count > 0) {
  853. fprintf(stderr, "Took %llu us per member to load\n", (total/count));
  854. }
  855. stream.complete();
  856. w.commit();
  857. _pool->unborrow(c2);
  858. _pool->unborrow(c);
  859. fprintf(stderr, "done.\n");
  860. if (!networkMembers.empty()) {
  861. if (_redisMemberStatus) {
  862. fprintf(stderr, "Load member data into redis...\n");
  863. if (_rc->clusterMode) {
  864. auto tx = _cluster->transaction(_myAddressStr, true, false);
  865. for (auto it : networkMembers) {
  866. tx.sadd(it.first, it.second);
  867. }
  868. tx.exec();
  869. } else {
  870. auto tx = _redis->transaction(true, false);
  871. for (auto it : networkMembers) {
  872. tx.sadd(it.first, it.second);
  873. }
  874. tx.exec();
  875. }
  876. fprintf(stderr, "done.\n");
  877. }
  878. }
  879. fprintf(stderr, "Done loading members...\n");
  880. if (++this->_ready == 2) {
  881. if (_waitNoticePrinted) {
  882. fprintf(stderr,"[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S,_timestr(),(unsigned long long)_myAddress.toInt());
  883. }
  884. _readyLock.unlock();
  885. }
  886. } catch (sw::redis::Error &e) {
  887. fprintf(stderr, "ERROR: Error initializing members (redis): %s\n", e.what());
  888. exit(-1);
  889. } catch (std::exception &e) {
  890. fprintf(stderr, "ERROR: Error initializing member: %s-%s %s\n", networkId.c_str(), memberId.c_str(), e.what());
  891. exit(-1);
  892. }
  893. }
  894. void PostgreSQL::heartbeat()
  895. {
  896. char publicId[1024];
  897. char hostnameTmp[1024];
  898. _myId.toString(false,publicId);
  899. if (gethostname(hostnameTmp, sizeof(hostnameTmp))!= 0) {
  900. hostnameTmp[0] = (char)0;
  901. } else {
  902. for (int i = 0; i < (int)sizeof(hostnameTmp); ++i) {
  903. if ((hostnameTmp[i] == '.')||(hostnameTmp[i] == 0)) {
  904. hostnameTmp[i] = (char)0;
  905. break;
  906. }
  907. }
  908. }
  909. const char *controllerId = _myAddressStr.c_str();
  910. const char *publicIdentity = publicId;
  911. const char *hostname = hostnameTmp;
  912. while (_run == 1) {
  913. // fprintf(stderr, "%s: heartbeat\n", controllerId);
  914. auto c = _pool->borrow();
  915. int64_t ts = OSUtils::now();
  916. if(c->c) {
  917. std::string major = std::to_string(ZEROTIER_ONE_VERSION_MAJOR);
  918. std::string minor = std::to_string(ZEROTIER_ONE_VERSION_MINOR);
  919. std::string rev = std::to_string(ZEROTIER_ONE_VERSION_REVISION);
  920. std::string build = std::to_string(ZEROTIER_ONE_VERSION_BUILD);
  921. std::string now = std::to_string(ts);
  922. std::string host_port = std::to_string(_listenPort);
  923. std::string use_redis = (_rc != NULL) ? "true" : "false";
  924. std::string redis_mem_status = (_redisMemberStatus) ? "true" : "false";
  925. try {
  926. pqxx::work w{*c->c};
  927. pqxx::result res =
  928. w.exec0("INSERT INTO ztc_controller (id, cluster_host, last_alive, public_identity, v_major, v_minor, v_rev, v_build, host_port, use_redis, redis_member_status) "
  929. "VALUES ("+w.quote(controllerId)+", "+w.quote(hostname)+", TO_TIMESTAMP("+now+"::double precision/1000), "+
  930. w.quote(publicIdentity)+", "+major+", "+minor+", "+rev+", "+build+", "+host_port+", "+use_redis+", "+redis_mem_status+") "
  931. "ON CONFLICT (id) DO UPDATE SET cluster_host = EXCLUDED.cluster_host, last_alive = EXCLUDED.last_alive, "
  932. "public_identity = EXCLUDED.public_identity, v_major = EXCLUDED.v_major, v_minor = EXCLUDED.v_minor, "
  933. "v_rev = EXCLUDED.v_rev, v_build = EXCLUDED.v_rev, host_port = EXCLUDED.host_port, "
  934. "use_redis = EXCLUDED.use_redis, redis_member_status = EXCLUDED.redis_member_status");
  935. w.commit();
  936. } catch (std::exception &e) {
  937. fprintf(stderr, "%s: Heartbeat update failed: %s\n", controllerId, e.what());
  938. _pool->unborrow(c);
  939. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  940. continue;
  941. }
  942. }
  943. _pool->unborrow(c);
  944. try {
  945. if (_redisMemberStatus) {
  946. if (_rc->clusterMode) {
  947. _cluster->zadd("controllers", "controllerId", ts);
  948. } else {
  949. _redis->zadd("controllers", "controllerId", ts);
  950. }
  951. }
  952. } catch (sw::redis::Error &e) {
  953. fprintf(stderr, "ERROR: Redis error in heartbeat thread: %s\n", e.what());
  954. }
  955. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  956. }
  957. fprintf(stderr, "Exited heartbeat thread\n");
  958. }
  959. void PostgreSQL::membersDbWatcher()
  960. {
  961. if (_rc) {
  962. _membersWatcher_Redis();
  963. } else {
  964. _membersWatcher_Postgres();
  965. }
  966. if (_run == 1) {
  967. fprintf(stderr, "ERROR: %s membersDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  968. exit(9);
  969. }
  970. fprintf(stderr, "Exited membersDbWatcher\n");
  971. }
  972. void PostgreSQL::_membersWatcher_Postgres() {
  973. auto c = _pool->borrow();
  974. std::string stream = "member_" + _myAddressStr;
  975. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  976. MemberNotificationReceiver m(this, *c->c, stream);
  977. while(_run == 1) {
  978. c->c->await_notification(5, 0);
  979. }
  980. _pool->unborrow(c);
  981. }
  982. void PostgreSQL::_membersWatcher_Redis() {
  983. char buf[11] = {0};
  984. std::string key = "member-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  985. std::string lastID = "0";
  986. fprintf(stderr, "Listening to member stream: %s\n", key.c_str());
  987. while (_run == 1) {
  988. try {
  989. json tmp;
  990. std::unordered_map<std::string, ItemStream> result;
  991. if (_rc->clusterMode) {
  992. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  993. } else {
  994. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  995. }
  996. if (!result.empty()) {
  997. for (auto element : result) {
  998. #ifdef REDIS_TRACE
  999. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  1000. #endif
  1001. for (auto rec : element.second) {
  1002. std::string id = rec.first;
  1003. auto attrs = rec.second;
  1004. #ifdef REDIS_TRACE
  1005. fprintf(stdout, "Record ID: %s\n", id.c_str());
  1006. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  1007. #endif
  1008. for (auto a : attrs) {
  1009. #ifdef REDIS_TRACE
  1010. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  1011. #endif
  1012. try {
  1013. tmp = json::parse(a.second);
  1014. json &ov = tmp["old_val"];
  1015. json &nv = tmp["new_val"];
  1016. json oldConfig, newConfig;
  1017. if (ov.is_object()) oldConfig = ov;
  1018. if (nv.is_object()) newConfig = nv;
  1019. if (oldConfig.is_object()||newConfig.is_object()) {
  1020. _memberChanged(oldConfig,newConfig,(this->_ready >= 2));
  1021. }
  1022. } catch (...) {
  1023. fprintf(stderr, "json parse error in networkWatcher_Redis\n");
  1024. }
  1025. }
  1026. if (_rc->clusterMode) {
  1027. _cluster->xdel(key, id);
  1028. } else {
  1029. _redis->xdel(key, id);
  1030. }
  1031. lastID = id;
  1032. Metrics::redis_mem_notification++;
  1033. }
  1034. }
  1035. }
  1036. } catch (sw::redis::Error &e) {
  1037. fprintf(stderr, "Error in Redis members watcher: %s\n", e.what());
  1038. }
  1039. }
  1040. fprintf(stderr, "membersWatcher ended\n");
  1041. }
  1042. void PostgreSQL::networksDbWatcher()
  1043. {
  1044. if (_rc) {
  1045. _networksWatcher_Redis();
  1046. } else {
  1047. _networksWatcher_Postgres();
  1048. }
  1049. if (_run == 1) {
  1050. fprintf(stderr, "ERROR: %s networksDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1051. exit(8);
  1052. }
  1053. fprintf(stderr, "Exited networksDbWatcher\n");
  1054. }
  1055. void PostgreSQL::_networksWatcher_Postgres() {
  1056. std::string stream = "network_" + _myAddressStr;
  1057. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  1058. auto c = _pool->borrow();
  1059. NetworkNotificationReceiver n(this, *c->c, stream);
  1060. while(_run == 1) {
  1061. c->c->await_notification(5,0);
  1062. }
  1063. }
  1064. void PostgreSQL::_networksWatcher_Redis() {
  1065. char buf[11] = {0};
  1066. std::string key = "network-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  1067. std::string lastID = "0";
  1068. while (_run == 1) {
  1069. try {
  1070. json tmp;
  1071. std::unordered_map<std::string, ItemStream> result;
  1072. if (_rc->clusterMode) {
  1073. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1074. } else {
  1075. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1076. }
  1077. if (!result.empty()) {
  1078. for (auto element : result) {
  1079. #ifdef REDIS_TRACE
  1080. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  1081. #endif
  1082. for (auto rec : element.second) {
  1083. std::string id = rec.first;
  1084. auto attrs = rec.second;
  1085. #ifdef REDIS_TRACE
  1086. fprintf(stdout, "Record ID: %s\n", id.c_str());
  1087. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  1088. #endif
  1089. for (auto a : attrs) {
  1090. #ifdef REDIS_TRACE
  1091. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  1092. #endif
  1093. try {
  1094. tmp = json::parse(a.second);
  1095. json &ov = tmp["old_val"];
  1096. json &nv = tmp["new_val"];
  1097. json oldConfig, newConfig;
  1098. if (ov.is_object()) oldConfig = ov;
  1099. if (nv.is_object()) newConfig = nv;
  1100. if (oldConfig.is_object()||newConfig.is_object()) {
  1101. _networkChanged(oldConfig,newConfig,(this->_ready >= 2));
  1102. }
  1103. } catch (...) {
  1104. fprintf(stderr, "json parse error in networkWatcher_Redis\n");
  1105. }
  1106. }
  1107. if (_rc->clusterMode) {
  1108. _cluster->xdel(key, id);
  1109. } else {
  1110. _redis->xdel(key, id);
  1111. }
  1112. lastID = id;
  1113. }
  1114. Metrics::redis_net_notification++;
  1115. }
  1116. }
  1117. } catch (sw::redis::Error &e) {
  1118. fprintf(stderr, "Error in Redis networks watcher: %s\n", e.what());
  1119. }
  1120. }
  1121. fprintf(stderr, "networksWatcher ended\n");
  1122. }
  1123. void PostgreSQL::commitThread()
  1124. {
  1125. fprintf(stderr, "%s: commitThread start\n", _myAddressStr.c_str());
  1126. std::pair<nlohmann::json,bool> qitem;
  1127. while(_commitQueue.get(qitem)&(_run == 1)) {
  1128. //fprintf(stderr, "commitThread tick\n");
  1129. if (!qitem.first.is_object()) {
  1130. fprintf(stderr, "not an object\n");
  1131. continue;
  1132. }
  1133. std::shared_ptr<PostgresConnection> c;
  1134. try {
  1135. c = _pool->borrow();
  1136. } catch (std::exception &e) {
  1137. fprintf(stderr, "ERROR: %s\n", e.what());
  1138. continue;
  1139. }
  1140. if (!c) {
  1141. fprintf(stderr, "Error getting database connection\n");
  1142. continue;
  1143. }
  1144. Metrics::pgsql_commit_ticks++;
  1145. try {
  1146. nlohmann::json &config = (qitem.first);
  1147. const std::string objtype = config["objtype"];
  1148. if (objtype == "member") {
  1149. // fprintf(stderr, "%s: commitThread: member\n", _myAddressStr.c_str());
  1150. std::string memberId;
  1151. std::string networkId;
  1152. try {
  1153. pqxx::work w(*c->c);
  1154. memberId = config["id"];
  1155. networkId = config["nwid"];
  1156. std::string target = "NULL";
  1157. if (!config["remoteTraceTarget"].is_null()) {
  1158. target = config["remoteTraceTarget"];
  1159. }
  1160. pqxx::row nwrow = w.exec_params1("SELECT COUNT(id) FROM ztc_network WHERE id = $1", networkId);
  1161. int nwcount = nwrow[0].as<int>();
  1162. if (nwcount != 1) {
  1163. fprintf(stderr, "network %s does not exist. skipping member upsert\n", networkId.c_str());
  1164. w.abort();
  1165. _pool->unborrow(c);
  1166. continue;
  1167. }
  1168. pqxx::result res = w.exec_params0(
  1169. "INSERT INTO ztc_member (id, network_id, active_bridge, authorized, capabilities, "
  1170. "identity, last_authorized_time, last_deauthorized_time, no_auto_assign_ips, "
  1171. "remote_trace_level, remote_trace_target, revision, tags, v_major, v_minor, v_rev, v_proto) "
  1172. "VALUES ($1, $2, $3, $4, $5, $6, "
  1173. "TO_TIMESTAMP($7::double precision/1000), TO_TIMESTAMP($8::double precision/1000), "
  1174. "$9, $10, $11, $12, $13, $14, $15, $16, $17) ON CONFLICT (network_id, id) DO UPDATE SET "
  1175. "active_bridge = EXCLUDED.active_bridge, authorized = EXCLUDED.authorized, capabilities = EXCLUDED.capabilities, "
  1176. "identity = EXCLUDED.identity, last_authorized_time = EXCLUDED.last_authorized_time, "
  1177. "last_deauthorized_time = EXCLUDED.last_deauthorized_time, no_auto_assign_ips = EXCLUDED.no_auto_assign_ips, "
  1178. "remote_trace_level = EXCLUDED.remote_trace_level, remote_trace_target = EXCLUDED.remote_trace_target, "
  1179. "revision = EXCLUDED.revision+1, tags = EXCLUDED.tags, v_major = EXCLUDED.v_major, "
  1180. "v_minor = EXCLUDED.v_minor, v_rev = EXCLUDED.v_rev, v_proto = EXCLUDED.v_proto",
  1181. memberId,
  1182. networkId,
  1183. (bool)config["activeBridge"],
  1184. (bool)config["authorized"],
  1185. OSUtils::jsonDump(config["capabilities"], -1),
  1186. OSUtils::jsonString(config["identity"], ""),
  1187. (uint64_t)config["lastAuthorizedTime"],
  1188. (uint64_t)config["lastDeauthorizedTime"],
  1189. (bool)config["noAutoAssignIps"],
  1190. (int)config["remoteTraceLevel"],
  1191. target,
  1192. (uint64_t)config["revision"],
  1193. OSUtils::jsonDump(config["tags"], -1),
  1194. (int)config["vMajor"],
  1195. (int)config["vMinor"],
  1196. (int)config["vRev"],
  1197. (int)config["vProto"]);
  1198. res = w.exec_params0("DELETE FROM ztc_member_ip_assignment WHERE member_id = $1 AND network_id = $2",
  1199. memberId, networkId);
  1200. std::vector<std::string> assignments;
  1201. bool ipAssignError = false;
  1202. for (auto i = config["ipAssignments"].begin(); i != config["ipAssignments"].end(); ++i) {
  1203. std::string addr = *i;
  1204. if (std::find(assignments.begin(), assignments.end(), addr) != assignments.end()) {
  1205. continue;
  1206. }
  1207. res = w.exec_params0(
  1208. "INSERT INTO ztc_member_ip_assignment (member_id, network_id, address) VALUES ($1, $2, $3) ON CONFLICT (network_id, member_id, address) DO NOTHING",
  1209. memberId, networkId, addr);
  1210. assignments.push_back(addr);
  1211. }
  1212. if (ipAssignError) {
  1213. fprintf(stderr, "%s: ipAssignError\n", _myAddressStr.c_str());
  1214. w.abort();
  1215. _pool->unborrow(c);
  1216. c.reset();
  1217. continue;
  1218. }
  1219. w.commit();
  1220. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1221. const uint64_t memberidInt = OSUtils::jsonIntHex(config["id"], 0ULL);
  1222. if (nwidInt && memberidInt) {
  1223. nlohmann::json nwOrig;
  1224. nlohmann::json memOrig;
  1225. nlohmann::json memNew(config);
  1226. get(nwidInt, nwOrig, memberidInt, memOrig);
  1227. _memberChanged(memOrig, memNew, qitem.second);
  1228. } else {
  1229. fprintf(stderr, "%s: Can't notify of change. Error parsing nwid or memberid: %llu-%llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt, (unsigned long long)memberidInt);
  1230. }
  1231. } catch (std::exception &e) {
  1232. fprintf(stderr, "%s ERROR: Error updating member %s-%s: %s\n", _myAddressStr.c_str(), networkId.c_str(), memberId.c_str(), e.what());
  1233. }
  1234. } else if (objtype == "network") {
  1235. try {
  1236. // fprintf(stderr, "%s: commitThread: network\n", _myAddressStr.c_str());
  1237. pqxx::work w(*c->c);
  1238. std::string id = config["id"];
  1239. std::string remoteTraceTarget = "";
  1240. if(!config["remoteTraceTarget"].is_null()) {
  1241. remoteTraceTarget = config["remoteTraceTarget"];
  1242. }
  1243. std::string rulesSource = "";
  1244. if (config["rulesSource"].is_string()) {
  1245. rulesSource = config["rulesSource"];
  1246. }
  1247. // This ugly query exists because when we want to mirror networks to/from
  1248. // another data store (e.g. FileDB or LFDB) it is possible to get a network
  1249. // that doesn't exist in Central's database. This does an upsert and sets
  1250. // the owner_id to the "first" global admin in the user DB if the record
  1251. // did not previously exist. If the record already exists owner_id is left
  1252. // unchanged, so owner_id should be left out of the update clause.
  1253. pqxx::result res = w.exec_params0(
  1254. "INSERT INTO ztc_network (id, creation_time, owner_id, controller_id, capabilities, enable_broadcast, "
  1255. "last_modified, mtu, multicast_limit, name, private, "
  1256. "remote_trace_level, remote_trace_target, rules, rules_source, "
  1257. "tags, v4_assign_mode, v6_assign_mode, sso_enabled) VALUES ("
  1258. "$1, TO_TIMESTAMP($5::double precision/1000), "
  1259. "(SELECT user_id AS owner_id FROM ztc_global_permissions WHERE authorize = true AND del = true AND modify = true AND read = true LIMIT 1),"
  1260. "$2, $3, $4, TO_TIMESTAMP($5::double precision/1000), "
  1261. "$6, $7, $8, $9, $10, $11, $12, $13, $14, $15, $16, $17) "
  1262. "ON CONFLICT (id) DO UPDATE set controller_id = EXCLUDED.controller_id, "
  1263. "capabilities = EXCLUDED.capabilities, enable_broadcast = EXCLUDED.enable_broadcast, "
  1264. "last_modified = EXCLUDED.last_modified, mtu = EXCLUDED.mtu, "
  1265. "multicast_limit = EXCLUDED.multicast_limit, name = EXCLUDED.name, "
  1266. "private = EXCLUDED.private, remote_trace_level = EXCLUDED.remote_trace_level, "
  1267. "remote_trace_target = EXCLUDED.remote_trace_target, rules = EXCLUDED.rules, "
  1268. "rules_source = EXCLUDED.rules_source, tags = EXCLUDED.tags, "
  1269. "v4_assign_mode = EXCLUDED.v4_assign_mode, v6_assign_mode = EXCLUDED.v6_assign_mode, "
  1270. "sso_enabled = EXCLUDED.sso_enabled",
  1271. id,
  1272. _myAddressStr,
  1273. OSUtils::jsonDump(config["capabilities"], -1),
  1274. (bool)config["enableBroadcast"],
  1275. OSUtils::now(),
  1276. (int)config["mtu"],
  1277. (int)config["multicastLimit"],
  1278. OSUtils::jsonString(config["name"],""),
  1279. (bool)config["private"],
  1280. (int)config["remoteTraceLevel"],
  1281. remoteTraceTarget,
  1282. OSUtils::jsonDump(config["rules"], -1),
  1283. rulesSource,
  1284. OSUtils::jsonDump(config["tags"], -1),
  1285. OSUtils::jsonDump(config["v4AssignMode"],-1),
  1286. OSUtils::jsonDump(config["v6AssignMode"], -1),
  1287. OSUtils::jsonBool(config["ssoEnabled"], false));
  1288. res = w.exec_params0("DELETE FROM ztc_network_assignment_pool WHERE network_id = $1", 0);
  1289. auto pool = config["ipAssignmentPools"];
  1290. bool err = false;
  1291. for (auto i = pool.begin(); i != pool.end(); ++i) {
  1292. std::string start = (*i)["ipRangeStart"];
  1293. std::string end = (*i)["ipRangeEnd"];
  1294. res = w.exec_params0(
  1295. "INSERT INTO ztc_network_assignment_pool (network_id, ip_range_start, ip_range_end) "
  1296. "VALUES ($1, $2, $3)", id, start, end);
  1297. }
  1298. res = w.exec_params0("DELETE FROM ztc_network_route WHERE network_id = $1", id);
  1299. auto routes = config["routes"];
  1300. err = false;
  1301. for (auto i = routes.begin(); i != routes.end(); ++i) {
  1302. std::string t = (*i)["target"];
  1303. std::vector<std::string> target;
  1304. std::istringstream f(t);
  1305. std::string s;
  1306. while(std::getline(f, s, '/')) {
  1307. target.push_back(s);
  1308. }
  1309. if (target.empty() || target.size() != 2) {
  1310. continue;
  1311. }
  1312. std::string targetAddr = target[0];
  1313. std::string targetBits = target[1];
  1314. std::string via = "NULL";
  1315. if (!(*i)["via"].is_null()) {
  1316. via = (*i)["via"];
  1317. }
  1318. res = w.exec_params0("INSERT INTO ztc_network_route (network_id, address, bits, via) VALUES ($1, $2, $3, $4)",
  1319. id, targetAddr, targetBits, (via == "NULL" ? NULL : via.c_str()));
  1320. }
  1321. if (err) {
  1322. fprintf(stderr, "%s: route add error\n", _myAddressStr.c_str());
  1323. w.abort();
  1324. _pool->unborrow(c);
  1325. continue;
  1326. }
  1327. auto dns = config["dns"];
  1328. std::string domain = dns["domain"];
  1329. std::stringstream servers;
  1330. servers << "{";
  1331. for (auto j = dns["servers"].begin(); j < dns["servers"].end(); ++j) {
  1332. servers << *j;
  1333. if ( (j+1) != dns["servers"].end()) {
  1334. servers << ",";
  1335. }
  1336. }
  1337. servers << "}";
  1338. std::string s = servers.str();
  1339. res = w.exec_params0("INSERT INTO ztc_network_dns (network_id, domain, servers) VALUES ($1, $2, $3) ON CONFLICT (network_id) DO UPDATE SET domain = EXCLUDED.domain, servers = EXCLUDED.servers",
  1340. id, domain, s);
  1341. w.commit();
  1342. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1343. if (nwidInt) {
  1344. nlohmann::json nwOrig;
  1345. nlohmann::json nwNew(config);
  1346. get(nwidInt, nwOrig);
  1347. _networkChanged(nwOrig, nwNew, qitem.second);
  1348. } else {
  1349. fprintf(stderr, "%s: Can't notify network changed: %llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt);
  1350. }
  1351. } catch (std::exception &e) {
  1352. fprintf(stderr, "%s ERROR: Error updating network: %s\n", _myAddressStr.c_str(), e.what());
  1353. }
  1354. if (_redisMemberStatus) {
  1355. try {
  1356. std::string id = config["id"];
  1357. std::string controllerId = _myAddressStr.c_str();
  1358. std::string key = "networks:{" + controllerId + "}";
  1359. if (_rc->clusterMode) {
  1360. _cluster->sadd(key, id);
  1361. } else {
  1362. _redis->sadd(key, id);
  1363. }
  1364. } catch (sw::redis::Error &e) {
  1365. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1366. }
  1367. }
  1368. } else if (objtype == "_delete_network") {
  1369. // fprintf(stderr, "%s: commitThread: delete network\n", _myAddressStr.c_str());
  1370. try {
  1371. pqxx::work w(*c->c);
  1372. std::string networkId = config["nwid"];
  1373. pqxx::result res = w.exec_params0("UPDATE ztc_network SET deleted = true WHERE id = $1",
  1374. networkId);
  1375. w.commit();
  1376. } catch (std::exception &e) {
  1377. fprintf(stderr, "%s ERROR: Error deleting network: %s\n", _myAddressStr.c_str(), e.what());
  1378. }
  1379. if (_redisMemberStatus) {
  1380. try {
  1381. std::string id = config["id"];
  1382. std::string controllerId = _myAddressStr.c_str();
  1383. std::string key = "networks:{" + controllerId + "}";
  1384. if (_rc->clusterMode) {
  1385. _cluster->srem(key, id);
  1386. _cluster->del("network-nodes-online:{"+controllerId+"}:"+id);
  1387. } else {
  1388. _redis->srem(key, id);
  1389. _redis->del("network-nodes-online:{"+controllerId+"}:"+id);
  1390. }
  1391. } catch (sw::redis::Error &e) {
  1392. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1393. }
  1394. }
  1395. } else if (objtype == "_delete_member") {
  1396. // fprintf(stderr, "%s commitThread: delete member\n", _myAddressStr.c_str());
  1397. try {
  1398. pqxx::work w(*c->c);
  1399. std::string memberId = config["id"];
  1400. std::string networkId = config["nwid"];
  1401. pqxx::result res = w.exec_params0(
  1402. "UPDATE ztc_member SET hidden = true, deleted = true WHERE id = $1 AND network_id = $2",
  1403. memberId, networkId);
  1404. w.commit();
  1405. } catch (std::exception &e) {
  1406. fprintf(stderr, "%s ERROR: Error deleting member: %s\n", _myAddressStr.c_str(), e.what());
  1407. }
  1408. if (_redisMemberStatus) {
  1409. try {
  1410. std::string memberId = config["id"];
  1411. std::string networkId = config["nwid"];
  1412. std::string controllerId = _myAddressStr.c_str();
  1413. std::string key = "network-nodes-all:{" + controllerId + "}:" + networkId;
  1414. if (_rc->clusterMode) {
  1415. _cluster->srem(key, memberId);
  1416. _cluster->del("member:{"+controllerId+"}:"+networkId+":"+memberId);
  1417. } else {
  1418. _redis->srem(key, memberId);
  1419. _redis->del("member:{"+controllerId+"}:"+networkId+":"+memberId);
  1420. }
  1421. } catch (sw::redis::Error &e) {
  1422. fprintf(stderr, "ERROR: Error deleting member from Redis: %s\n", e.what());
  1423. }
  1424. }
  1425. } else {
  1426. fprintf(stderr, "%s ERROR: unknown objtype\n", _myAddressStr.c_str());
  1427. }
  1428. } catch (std::exception &e) {
  1429. fprintf(stderr, "%s ERROR: Error getting objtype: %s\n", _myAddressStr.c_str(), e.what());
  1430. }
  1431. _pool->unborrow(c);
  1432. c.reset();
  1433. }
  1434. fprintf(stderr, "%s commitThread finished\n", _myAddressStr.c_str());
  1435. }
  1436. void PostgreSQL::onlineNotificationThread()
  1437. {
  1438. waitForReady();
  1439. if (_redisMemberStatus) {
  1440. onlineNotification_Redis();
  1441. } else {
  1442. onlineNotification_Postgres();
  1443. }
  1444. }
  1445. /**
  1446. * ONLY UNCOMMENT FOR TEMPORARY DB MAINTENANCE
  1447. *
  1448. * This define temporarily turns off writing to the member status table
  1449. * so it can be reindexed when the indexes get too large.
  1450. */
  1451. // #define DISABLE_MEMBER_STATUS 1
  1452. void PostgreSQL::onlineNotification_Postgres()
  1453. {
  1454. _connected = 1;
  1455. nlohmann::json jtmp1, jtmp2;
  1456. while (_run == 1) {
  1457. auto c = _pool->borrow();
  1458. auto c2 = _pool->borrow();
  1459. try {
  1460. fprintf(stderr, "%s onlineNotification_Postgres\n", _myAddressStr.c_str());
  1461. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > lastOnline;
  1462. {
  1463. std::lock_guard<std::mutex> l(_lastOnline_l);
  1464. lastOnline.swap(_lastOnline);
  1465. }
  1466. #ifndef DISABLE_MEMBER_STATUS
  1467. pqxx::work w(*c->c);
  1468. pqxx::work w2(*c2->c);
  1469. fprintf(stderr, "online notification tick\n");
  1470. bool firstRun = true;
  1471. bool memberAdded = false;
  1472. int updateCount = 0;
  1473. pqxx::pipeline pipe(w);
  1474. for (auto i=lastOnline.begin(); i != lastOnline.end(); ++i) {
  1475. updateCount += 1;
  1476. uint64_t nwid_i = i->first.first;
  1477. char nwidTmp[64];
  1478. char memTmp[64];
  1479. char ipTmp[64];
  1480. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1481. OSUtils::ztsnprintf(memTmp,sizeof(memTmp), "%.10llx", i->first.second);
  1482. if(!get(nwid_i, jtmp1, i->first.second, jtmp2)) {
  1483. continue; // skip non existent networks/members
  1484. }
  1485. std::string networkId(nwidTmp);
  1486. std::string memberId(memTmp);
  1487. try {
  1488. pqxx::row r = w2.exec_params1("SELECT id, network_id FROM ztc_member WHERE network_id = $1 AND id = $2",
  1489. networkId, memberId);
  1490. } catch (pqxx::unexpected_rows &e) {
  1491. continue;
  1492. }
  1493. int64_t ts = i->second.first;
  1494. std::string ipAddr = i->second.second.toIpString(ipTmp);
  1495. std::string timestamp = std::to_string(ts);
  1496. std::stringstream memberUpdate;
  1497. memberUpdate << "INSERT INTO ztc_member_status (network_id, member_id, address, last_updated) VALUES "
  1498. << "('" << networkId << "', '" << memberId << "', ";
  1499. if (ipAddr.empty()) {
  1500. memberUpdate << "NULL, ";
  1501. } else {
  1502. memberUpdate << "'" << ipAddr << "', ";
  1503. }
  1504. memberUpdate << "TO_TIMESTAMP(" << timestamp << "::double precision/1000)) "
  1505. << " ON CONFLICT (network_id, member_id) DO UPDATE SET address = EXCLUDED.address, last_updated = EXCLUDED.last_updated";
  1506. pipe.insert(memberUpdate.str());
  1507. Metrics::pgsql_node_checkin++;
  1508. }
  1509. while(!pipe.empty()) {
  1510. pipe.retrieve();
  1511. }
  1512. pipe.complete();
  1513. w.commit();
  1514. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), updateCount);
  1515. #endif
  1516. } catch (std::exception &e) {
  1517. fprintf(stderr, "%s: error in onlinenotification thread: %s\n", _myAddressStr.c_str(), e.what());
  1518. }
  1519. _pool->unborrow(c2);
  1520. _pool->unborrow(c);
  1521. ConnectionPoolStats stats = _pool->get_stats();
  1522. fprintf(stderr, "%s pool stats: in use size: %llu, available size: %llu, total: %llu\n",
  1523. _myAddressStr.c_str(), stats.borrowed_size, stats.pool_size, (stats.borrowed_size + stats.pool_size));
  1524. std::this_thread::sleep_for(std::chrono::seconds(10));
  1525. }
  1526. fprintf(stderr, "%s: Fell out of run loop in onlineNotificationThread\n", _myAddressStr.c_str());
  1527. if (_run == 1) {
  1528. fprintf(stderr, "ERROR: %s onlineNotificationThread should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1529. exit(6);
  1530. }
  1531. }
  1532. void PostgreSQL::onlineNotification_Redis()
  1533. {
  1534. _connected = 1;
  1535. char buf[11] = {0};
  1536. std::string controllerId = std::string(_myAddress.toString(buf));
  1537. while (_run == 1) {
  1538. fprintf(stderr, "onlineNotification tick\n");
  1539. auto start = std::chrono::high_resolution_clock::now();
  1540. uint64_t count = 0;
  1541. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > lastOnline;
  1542. {
  1543. std::lock_guard<std::mutex> l(_lastOnline_l);
  1544. lastOnline.swap(_lastOnline);
  1545. }
  1546. try {
  1547. if (!lastOnline.empty()) {
  1548. if (_rc->clusterMode) {
  1549. auto tx = _cluster->transaction(controllerId, true, false);
  1550. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1551. } else {
  1552. auto tx = _redis->transaction(true, false);
  1553. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1554. }
  1555. }
  1556. } catch (sw::redis::Error &e) {
  1557. fprintf(stderr, "Error in online notification thread (redis): %s\n", e.what());
  1558. }
  1559. auto end = std::chrono::high_resolution_clock::now();
  1560. auto dur = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
  1561. auto total = dur.count();
  1562. fprintf(stderr, "onlineNotification ran in %llu ms\n", total);
  1563. std::this_thread::sleep_for(std::chrono::seconds(5));
  1564. }
  1565. }
  1566. uint64_t PostgreSQL::_doRedisUpdate(sw::redis::Transaction &tx, std::string &controllerId,
  1567. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > &lastOnline)
  1568. {
  1569. nlohmann::json jtmp1, jtmp2;
  1570. uint64_t count = 0;
  1571. for (auto i=lastOnline.begin(); i != lastOnline.end(); ++i) {
  1572. uint64_t nwid_i = i->first.first;
  1573. uint64_t memberid_i = i->first.second;
  1574. char nwidTmp[64];
  1575. char memTmp[64];
  1576. char ipTmp[64];
  1577. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1578. OSUtils::ztsnprintf(memTmp,sizeof(memTmp), "%.10llx", memberid_i);
  1579. if (!get(nwid_i, jtmp1, memberid_i, jtmp2)){
  1580. continue; // skip non existent members/networks
  1581. }
  1582. std::string networkId(nwidTmp);
  1583. std::string memberId(memTmp);
  1584. int64_t ts = i->second.first;
  1585. std::string ipAddr = i->second.second.toIpString(ipTmp);
  1586. std::string timestamp = std::to_string(ts);
  1587. std::unordered_map<std::string, std::string> record = {
  1588. {"id", memberId},
  1589. {"address", ipAddr},
  1590. {"last_updated", std::to_string(ts)}
  1591. };
  1592. tx.zadd("nodes-online:{"+controllerId+"}", memberId, ts)
  1593. .zadd("nodes-online2:{"+controllerId+"}", networkId+"-"+memberId, ts)
  1594. .zadd("network-nodes-online:{"+controllerId+"}:"+networkId, memberId, ts)
  1595. .zadd("active-networks:{"+controllerId+"}", networkId, ts)
  1596. .sadd("network-nodes-all:{"+controllerId+"}:"+networkId, memberId)
  1597. .hmset("member:{"+controllerId+"}:"+networkId+":"+memberId, record.begin(), record.end());
  1598. ++count;
  1599. Metrics::redis_node_checkin++;
  1600. }
  1601. // expire records from all-nodes and network-nodes member list
  1602. uint64_t expireOld = OSUtils::now() - 300000;
  1603. tx.zremrangebyscore("nodes-online:{"+controllerId+"}",
  1604. sw::redis::RightBoundedInterval<double>(expireOld,
  1605. sw::redis::BoundType::LEFT_OPEN));
  1606. tx.zremrangebyscore("nodes-online2:{"+controllerId+"}",
  1607. sw::redis::RightBoundedInterval<double>(expireOld,
  1608. sw::redis::BoundType::LEFT_OPEN));
  1609. tx.zremrangebyscore("active-networks:{"+controllerId+"}",
  1610. sw::redis::RightBoundedInterval<double>(expireOld,
  1611. sw::redis::BoundType::LEFT_OPEN));
  1612. {
  1613. std::shared_lock<std::shared_mutex> l(_networks_l);
  1614. for (const auto &it : _networks) {
  1615. uint64_t nwid_i = it.first;
  1616. char nwidTmp[64];
  1617. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1618. tx.zremrangebyscore("network-nodes-online:{"+controllerId+"}:"+nwidTmp,
  1619. sw::redis::RightBoundedInterval<double>(expireOld, sw::redis::BoundType::LEFT_OPEN));
  1620. }
  1621. }
  1622. tx.exec();
  1623. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), count);
  1624. return count;
  1625. }
  1626. #endif //ZT_CONTROLLER_USE_LIBPQ