PostgreSQL.cpp 60 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797
  1. /*
  2. * Copyright (c)2019 ZeroTier, Inc.
  3. *
  4. * Use of this software is governed by the Business Source License included
  5. * in the LICENSE.TXT file in the project's root directory.
  6. *
  7. * Change Date: 2025-01-01
  8. *
  9. * On the date above, in accordance with the Business Source License, use
  10. * of this software will be governed by version 2.0 of the Apache License.
  11. */
  12. /****/
  13. #include "PostgreSQL.hpp"
  14. #ifdef ZT_CONTROLLER_USE_LIBPQ
  15. #include "../node/Constants.hpp"
  16. #include "../node/SHA512.hpp"
  17. #include "EmbeddedNetworkController.hpp"
  18. #include "../version.h"
  19. #include "Redis.hpp"
  20. #include <libpq-fe.h>
  21. #include <sstream>
  22. #include <iomanip>
  23. #include <climits>
  24. #include <chrono>
  25. // #define REDIS_TRACE 1
  26. using json = nlohmann::json;
  27. namespace {
  28. static const int DB_MINIMUM_VERSION = 20;
  // Returns the current local time as text in ctime() format with the trailing
  // newline removed, or "" if ctime() yields no string.
  // The returned pointer refers to the buffer handed back by ctime(); it is not
  // owned by the caller.
  static const char *_timestr()
  {
      const time_t now = time(0);
      char *const stamp = ctime(&now);
      if (stamp == nullptr) {
          return "";
      }
      // Cut the string at the first newline, if there is one.
      for (char *cursor = stamp; *cursor != '\0'; ++cursor) {
          if (*cursor == '\n') {
              *cursor = '\0';
              break;
          }
      }
      return stamp;
  }
  45. /*
  46. std::string join(const std::vector<std::string> &elements, const char * const separator)
  47. {
  48. switch(elements.size()) {
  49. case 0:
  50. return "";
  51. case 1:
  52. return elements[0];
  53. default:
  54. std::ostringstream os;
  55. std::copy(elements.begin(), elements.end()-1, std::ostream_iterator<std::string>(os, separator));
  56. os << *elements.rbegin();
  57. return os.str();
  58. }
  59. }
  60. */
  // Splits `str` into the pieces separated by `delim`.
  // Adjacent delimiters and a leading delimiter yield empty pieces; an empty
  // input yields no pieces, and a single trailing delimiter does not add a
  // trailing empty piece.
  std::vector<std::string> split(std::string str, char delim){
      std::vector<std::string> pieces;
      std::string::size_type cursor = 0;
      while (cursor < str.size()) {
          const std::string::size_type hit = str.find(delim, cursor);
          if (hit == std::string::npos) {
              // Last piece: everything up to the end of the input.
              pieces.push_back(str.substr(cursor));
              break;
          }
          pieces.push_back(str.substr(cursor, hit - cursor));
          cursor = hit + 1;
      }
      return pieces;
  }
  // Percent-encodes `value` for use inside a URL.
  // ASCII letters, digits and '-', '_', '.', '~' are copied through unchanged;
  // every other byte becomes "%XX" with two upper-case hex digits.
  // The classification is done on the unsigned byte value with explicit ASCII
  // ranges, so bytes >= 0x80 are always escaped and the result does not depend
  // on the C locale (passing a negative char to isalnum() is undefined).
  std::string url_encode(const std::string &value) {
      static const char hexDigits[] = "0123456789ABCDEF";

      std::string escaped;
      escaped.reserve(value.size() * 3); // worst case: every byte is escaped

      for (const char ch : value) {
          const unsigned char byte = static_cast<unsigned char>(ch);
          const bool unreserved =
              (byte >= 'A' && byte <= 'Z') ||
              (byte >= 'a' && byte <= 'z') ||
              (byte >= '0' && byte <= '9') ||
              byte == '-' || byte == '_' || byte == '.' || byte == '~';
          if (unreserved) {
              escaped.push_back(ch);
              continue;
          }
          escaped.push_back('%');
          escaped.push_back(hexDigits[byte >> 4]);
          escaped.push_back(hexDigits[byte & 0x0F]);
      }
      return escaped;
  }
  88. } // anonymous namespace
  89. using namespace ZeroTier;
  90. MemberNotificationReceiver::MemberNotificationReceiver(PostgreSQL *p, pqxx::connection &c, const std::string &channel)
  91. : pqxx::notification_receiver(c, channel)
  92. , _psql(p)
  93. {
  94. fprintf(stderr, "initialize MemberNotificaitonReceiver\n");
  95. }
  96. void MemberNotificationReceiver::operator() (const std::string &payload, int packend_pid) {
  97. fprintf(stderr, "Member Notification received: %s\n", payload.c_str());
  98. json tmp(json::parse(payload));
  99. json &ov = tmp["old_val"];
  100. json &nv = tmp["new_val"];
  101. json oldConfig, newConfig;
  102. if (ov.is_object()) oldConfig = ov;
  103. if (nv.is_object()) newConfig = nv;
  104. if (oldConfig.is_object() || newConfig.is_object()) {
  105. _psql->_memberChanged(oldConfig,newConfig,(_psql->_ready>=2));
  106. fprintf(stderr, "payload sent\n");
  107. }
  108. }
  109. NetworkNotificationReceiver::NetworkNotificationReceiver(PostgreSQL *p, pqxx::connection &c, const std::string &channel)
  110. : pqxx::notification_receiver(c, channel)
  111. , _psql(p)
  112. {
  113. fprintf(stderr, "initialize NetworkNotificationReceiver\n");
  114. }
  115. void NetworkNotificationReceiver::operator() (const std::string &payload, int packend_pid) {
  116. fprintf(stderr, "Network Notificaiton received: %s\n", payload.c_str());
  117. json tmp(json::parse(payload));
  118. json &ov = tmp["old_val"];
  119. json &nv = tmp["new_val"];
  120. json oldConfig, newConfig;
  121. if (ov.is_object()) oldConfig = ov;
  122. if (nv.is_object()) newConfig = nv;
  123. if (oldConfig.is_object() || newConfig.is_object()) {
  124. _psql->_networkChanged(oldConfig,newConfig,(_psql->_ready>=2));
  125. fprintf(stderr, "payload sent\n");
  126. }
  127. }
  // Generic string containers. Their users are not visible in this part of the
  // file (NOTE(review): presumably Redis stream entries - confirm).
  // Attrs: ordered list of (string, string) pairs.
  using Attrs = std::vector<std::pair<std::string, std::string>>;
  // Item: a string paired with its Attrs.
  using Item = std::pair<std::string, Attrs>;
  // ItemStream: ordered list of Items.
  using ItemStream = std::vector<Item>;
  131. PostgreSQL::PostgreSQL(const Identity &myId, const char *path, int listenPort, RedisConfig *rc)
  132. : DB()
  133. , _pool()
  134. , _myId(myId)
  135. , _myAddress(myId.address())
  136. , _ready(0)
  137. , _connected(1)
  138. , _run(1)
  139. , _waitNoticePrinted(false)
  140. , _listenPort(listenPort)
  141. , _rc(rc)
  142. , _redis(NULL)
  143. , _cluster(NULL)
  144. , _redisMemberStatus(false)
  145. {
  146. char myAddress[64];
  147. _myAddressStr = myId.address().toString(myAddress);
  148. _connString = std::string(path);
  149. auto f = std::make_shared<PostgresConnFactory>(_connString);
  150. _pool = std::make_shared<ConnectionPool<PostgresConnection> >(
  151. 15, 5, std::static_pointer_cast<ConnectionFactory>(f));
  152. memset(_ssoPsk, 0, sizeof(_ssoPsk));
  153. char *const ssoPskHex = getenv("ZT_SSO_PSK");
  154. #ifdef ZT_TRACE
  155. fprintf(stderr, "ZT_SSO_PSK: %s\n", ssoPskHex);
  156. #endif
  157. if (ssoPskHex) {
  158. // SECURITY: note that ssoPskHex will always be null-terminated if libc acatually
  159. // returns something non-NULL. If the hex encodes something shorter than 48 bytes,
  160. // it will be padded at the end with zeroes. If longer, it'll be truncated.
  161. Utils::unhex(ssoPskHex, _ssoPsk, sizeof(_ssoPsk));
  162. }
  163. const char *redisMemberStatus = getenv("ZT_REDIS_MEMBER_STATUS");
  164. if (redisMemberStatus && (strcmp(redisMemberStatus, "true") == 0)) {
  165. _redisMemberStatus = true;
  166. fprintf(stderr, "Using redis for member status\n");
  167. }
  168. auto c = _pool->borrow();
  169. pqxx::work txn{*c->c};
  170. pqxx::row r{txn.exec1("SELECT version FROM ztc_database")};
  171. int dbVersion = r[0].as<int>();
  172. txn.commit();
  173. if (dbVersion < DB_MINIMUM_VERSION) {
  174. fprintf(stderr, "Central database schema version too low. This controller version requires a minimum schema version of %d. Please upgrade your Central instance", DB_MINIMUM_VERSION);
  175. exit(1);
  176. }
  177. _pool->unborrow(c);
  178. if (_rc != NULL) {
  179. sw::redis::ConnectionOptions opts;
  180. sw::redis::ConnectionPoolOptions poolOpts;
  181. opts.host = _rc->hostname;
  182. opts.port = _rc->port;
  183. opts.password = _rc->password;
  184. opts.db = 0;
  185. opts.keep_alive = true;
  186. opts.connect_timeout = std::chrono::seconds(3);
  187. poolOpts.size = 25;
  188. poolOpts.wait_timeout = std::chrono::seconds(5);
  189. poolOpts.connection_lifetime = std::chrono::minutes(3);
  190. poolOpts.connection_idle_time = std::chrono::minutes(1);
  191. if (_rc->clusterMode) {
  192. fprintf(stderr, "Using Redis in Cluster Mode\n");
  193. _cluster = std::make_shared<sw::redis::RedisCluster>(opts, poolOpts);
  194. } else {
  195. fprintf(stderr, "Using Redis in Standalone Mode\n");
  196. _redis = std::make_shared<sw::redis::Redis>(opts, poolOpts);
  197. }
  198. }
  199. _readyLock.lock();
  200. fprintf(stderr, "[%s] NOTICE: %.10llx controller PostgreSQL waiting for initial data download..." ZT_EOL_S, ::_timestr(), (unsigned long long)_myAddress.toInt());
  201. _waitNoticePrinted = true;
  202. initializeNetworks();
  203. initializeMembers();
  204. _heartbeatThread = std::thread(&PostgreSQL::heartbeat, this);
  205. _membersDbWatcher = std::thread(&PostgreSQL::membersDbWatcher, this);
  206. _networksDbWatcher = std::thread(&PostgreSQL::networksDbWatcher, this);
  207. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  208. _commitThread[i] = std::thread(&PostgreSQL::commitThread, this);
  209. }
  210. _onlineNotificationThread = std::thread(&PostgreSQL::onlineNotificationThread, this);
  211. }
  212. PostgreSQL::~PostgreSQL()
  213. {
  214. _run = 0;
  215. std::this_thread::sleep_for(std::chrono::milliseconds(100));
  216. _heartbeatThread.join();
  217. _membersDbWatcher.join();
  218. _networksDbWatcher.join();
  219. _commitQueue.stop();
  220. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  221. _commitThread[i].join();
  222. }
  223. _onlineNotificationThread.join();
  224. }
  225. bool PostgreSQL::waitForReady()
  226. {
  227. while (_ready < 2) {
  228. _readyLock.lock();
  229. _readyLock.unlock();
  230. }
  231. return true;
  232. }
  233. bool PostgreSQL::isReady()
  234. {
  235. return ((_ready == 2)&&(_connected));
  236. }
  237. bool PostgreSQL::save(nlohmann::json &record,bool notifyListeners)
  238. {
  239. bool modified = false;
  240. try {
  241. if (!record.is_object()) {
  242. fprintf(stderr, "record is not an object?!?\n");
  243. return false;
  244. }
  245. const std::string objtype = record["objtype"];
  246. if (objtype == "network") {
  247. //fprintf(stderr, "network save\n");
  248. const uint64_t nwid = OSUtils::jsonIntHex(record["id"],0ULL);
  249. if (nwid) {
  250. nlohmann::json old;
  251. get(nwid,old);
  252. if ((!old.is_object())||(!_compareRecords(old,record))) {
  253. record["revision"] = OSUtils::jsonInt(record["revision"],0ULL) + 1ULL;
  254. _commitQueue.post(std::pair<nlohmann::json,bool>(record,notifyListeners));
  255. modified = true;
  256. }
  257. }
  258. } else if (objtype == "member") {
  259. std::string networkId = record["nwid"];
  260. std::string memberId = record["id"];
  261. const uint64_t nwid = OSUtils::jsonIntHex(record["nwid"],0ULL);
  262. const uint64_t id = OSUtils::jsonIntHex(record["id"],0ULL);
  263. //fprintf(stderr, "member save %s-%s\n", networkId.c_str(), memberId.c_str());
  264. if ((id)&&(nwid)) {
  265. nlohmann::json network,old;
  266. get(nwid,network,id,old);
  267. if ((!old.is_object())||(!_compareRecords(old,record))) {
  268. //fprintf(stderr, "commit queue post\n");
  269. record["revision"] = OSUtils::jsonInt(record["revision"],0ULL) + 1ULL;
  270. _commitQueue.post(std::pair<nlohmann::json,bool>(record,notifyListeners));
  271. modified = true;
  272. } else {
  273. //fprintf(stderr, "no change\n");
  274. }
  275. }
  276. } else {
  277. fprintf(stderr, "uhh waaat\n");
  278. }
  279. } catch (std::exception &e) {
  280. fprintf(stderr, "Error on PostgreSQL::save: %s\n", e.what());
  281. } catch (...) {
  282. fprintf(stderr, "Unknown error on PostgreSQL::save\n");
  283. }
  284. return modified;
  285. }
  286. void PostgreSQL::eraseNetwork(const uint64_t networkId)
  287. {
  288. fprintf(stderr, "PostgreSQL::eraseNetwork\n");
  289. char tmp2[24];
  290. waitForReady();
  291. Utils::hex(networkId, tmp2);
  292. std::pair<nlohmann::json,bool> tmp;
  293. tmp.first["id"] = tmp2;
  294. tmp.first["objtype"] = "_delete_network";
  295. tmp.second = true;
  296. _commitQueue.post(tmp);
  297. nlohmann::json nullJson;
  298. _networkChanged(tmp.first, nullJson, true);
  299. }
  300. void PostgreSQL::eraseMember(const uint64_t networkId, const uint64_t memberId)
  301. {
  302. fprintf(stderr, "PostgreSQL::eraseMember\n");
  303. char tmp2[24];
  304. waitForReady();
  305. std::pair<nlohmann::json,bool> tmp, nw;
  306. Utils::hex(networkId, tmp2);
  307. tmp.first["nwid"] = tmp2;
  308. Utils::hex(memberId, tmp2);
  309. tmp.first["id"] = tmp2;
  310. tmp.first["objtype"] = "_delete_member";
  311. tmp.second = true;
  312. _commitQueue.post(tmp);
  313. nlohmann::json nullJson;
  314. _memberChanged(tmp.first, nullJson, true);
  315. }
  316. void PostgreSQL::nodeIsOnline(const uint64_t networkId, const uint64_t memberId, const InetAddress &physicalAddress)
  317. {
  318. std::lock_guard<std::mutex> l(_lastOnline_l);
  319. std::pair<int64_t, InetAddress> &i = _lastOnline[std::pair<uint64_t,uint64_t>(networkId, memberId)];
  320. i.first = OSUtils::now();
  321. if (physicalAddress) {
  322. i.second = physicalAddress;
  323. }
  324. }
  325. AuthInfo PostgreSQL::getSSOAuthInfo(const nlohmann::json &member, const std::string &redirectURL)
  326. {
  327. // NONCE is just a random character string. no semantic meaning
  328. // state = HMAC SHA384 of Nonce based on shared sso key
  329. //
  330. // need nonce timeout in database? make sure it's used within X time
  331. // X is 5 minutes for now. Make configurable later?
  332. //
  333. // how do we tell when a nonce is used? if auth_expiration_time is set
  334. std::string networkId = member["nwid"];
  335. std::string memberId = member["id"];
  336. char authenticationURL[4096] = {0};
  337. AuthInfo info;
  338. info.enabled = true;
  339. // fprintf(stderr, "PostgreSQL::updateMemberOnLoad: %s-%s\n", networkId.c_str(), memberId.c_str());
  340. try {
  341. auto c = _pool->borrow();
  342. pqxx::work w(*c->c);
  343. char nonceBytes[16] = {0};
  344. std::string nonce = "";
  345. // check if the member exists first.
  346. pqxx::row count = w.exec_params1("SELECT count(id) FROM ztc_member WHERE id = $1 AND network_id = $2 AND deleted = false", memberId, networkId);
  347. if (count[0].as<int>() == 1) {
  348. // get active nonce, if exists.
  349. pqxx::result r = w.exec_params("SELECT nonce FROM ztc_sso_expiry "
  350. "WHERE network_id = $1 AND member_id = $2 "
  351. "AND ((NOW() AT TIME ZONE 'UTC') <= authentication_expiry_time) AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  352. networkId, memberId);
  353. if (r.size() == 0) {
  354. // no active nonce.
  355. // find an unused nonce, if one exists.
  356. pqxx::result r = w.exec_params("SELECT nonce FROM ztc_sso_expiry "
  357. "WHERE network_id = $1 AND member_id = $2 "
  358. "AND authentication_expiry_time IS NULL AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  359. networkId, memberId);
  360. if (r.size() == 1) {
  361. // we have an existing nonce. Use it
  362. nonce = r.at(0)[0].as<std::string>();
  363. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  364. } else if (r.empty()) {
  365. // create a nonce
  366. Utils::getSecureRandom(nonceBytes, 16);
  367. char nonceBuf[64] = {0};
  368. Utils::hex(nonceBytes, sizeof(nonceBytes), nonceBuf);
  369. nonce = std::string(nonceBuf);
  370. pqxx::result ir = w.exec_params0("INSERT INTO ztc_sso_expiry "
  371. "(nonce, nonce_expiration, network_id, member_id) VALUES "
  372. "($1, TO_TIMESTAMP($2::double precision/1000), $3, $4)",
  373. nonce, OSUtils::now() + 300000, networkId, memberId);
  374. w.commit();
  375. } else {
  376. // > 1 ?!? Thats an error!
  377. fprintf(stderr, "> 1 unused nonce!\n");
  378. exit(6);
  379. }
  380. } else if (r.size() == 1) {
  381. nonce = r.at(0)[0].as<std::string>();
  382. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  383. } else {
  384. // more than 1 nonce in use? Uhhh...
  385. fprintf(stderr, "> 1 nonce in use for network member?!?\n");
  386. exit(7);
  387. }
  388. r = w.exec_params("SELECT oc.client_id, oc.authorization_endpoint, oc.issuer, oc.sso_impl_version "
  389. "FROM ztc_network n "
  390. "INNER JOIN ztc_network_oidc_config noc "
  391. " ON noc.network_id = n.id "
  392. "INNER JOIN ztc_oidc_config oc "
  393. " ON noc.client_id = oc.client_id "
  394. "WHERE n.id = $1 AND n.sso_enabled = true", networkId);
  395. std::string client_id = "";
  396. std::string authorization_endpoint = "";
  397. std::string issuer = "";
  398. uint64_t sso_version = 0;
  399. if (r.size() == 1) {
  400. client_id = r.at(0)[0].as<std::string>();
  401. authorization_endpoint = r.at(0)[1].as<std::string>();
  402. issuer = r.at(0)[2].as<std::string>();
  403. sso_version = r.at(0)[3].as<uint64_t>();
  404. } else if (r.size() > 1) {
  405. fprintf(stderr, "ERROR: More than one auth endpoint for an organization?!?!? NetworkID: %s\n", networkId.c_str());
  406. } else {
  407. fprintf(stderr, "No client or auth endpoint?!?\n");
  408. }
  409. info.version = sso_version;
  410. // no catch all else because we don't actually care if no records exist here. just continue as normal.
  411. if ((!client_id.empty())&&(!authorization_endpoint.empty())) {
  412. uint8_t state[48];
  413. HMACSHA384(_ssoPsk, nonceBytes, sizeof(nonceBytes), state);
  414. char state_hex[256];
  415. Utils::hex(state, 48, state_hex);
  416. if (info.version == 0) {
  417. char url[2048] = {0};
  418. OSUtils::ztsnprintf(url, sizeof(authenticationURL),
  419. "%s?response_type=id_token&response_mode=form_post&scope=openid+email+profile&redirect_uri=%s&nonce=%s&state=%s&client_id=%s",
  420. authorization_endpoint.c_str(),
  421. url_encode(redirectURL).c_str(),
  422. nonce.c_str(),
  423. state_hex,
  424. client_id.c_str());
  425. info.authenticationURL = std::string(url);
  426. } else if (info.version == 1) {
  427. info.ssoClientID = client_id;
  428. info.issuerURL = issuer;
  429. info.ssoNonce = nonce;
  430. info.ssoState = std::string(state_hex) + "_" +networkId;
  431. info.centralAuthURL = redirectURL;
  432. #ifdef ZT_DEBUG
  433. fprintf(
  434. stderr,
  435. "ssoClientID: %s\nissuerURL: %s\nssoNonce: %s\nssoState: %s\ncentralAuthURL: %s\n",
  436. info.ssoClientID.c_str(),
  437. info.issuerURL.c_str(),
  438. info.ssoNonce.c_str(),
  439. info.ssoState.c_str(),
  440. info.centralAuthURL.c_str());
  441. #endif
  442. }
  443. } else {
  444. fprintf(stderr, "client_id: %s\nauthorization_endpoint: %s\n", client_id.c_str(), authorization_endpoint.c_str());
  445. }
  446. }
  447. _pool->unborrow(c);
  448. } catch (std::exception &e) {
  449. fprintf(stderr, "ERROR: Error updating member on load: %s\n", e.what());
  450. }
  451. return info; //std::string(authenticationURL);
  452. }
  453. void PostgreSQL::initializeNetworks()
  454. {
  455. try {
  456. std::string setKey = "networks:{" + _myAddressStr + "}";
  457. fprintf(stderr, "Initializing Networks...\n");
  458. if (_redisMemberStatus) {
  459. fprintf(stderr, "Init Redis for networks...\n");
  460. try {
  461. if (_rc->clusterMode) {
  462. _cluster->del(setKey);
  463. } else {
  464. _redis->del(setKey);
  465. }
  466. } catch (sw::redis::Error &e) {
  467. // ignore. if this key doesn't exist, there's no reason to delete it
  468. }
  469. }
  470. std::unordered_set<std::string> networkSet;
  471. char qbuf[2048] = {0};
  472. sprintf(qbuf, "SELECT n.id, (EXTRACT(EPOCH FROM n.creation_time AT TIME ZONE 'UTC')*1000)::bigint as creation_time, n.capabilities, "
  473. "n.enable_broadcast, (EXTRACT(EPOCH FROM n.last_modified AT TIME ZONE 'UTC')*1000)::bigint AS last_modified, n.mtu, n.multicast_limit, n.name, n.private, n.remote_trace_level, "
  474. "n.remote_trace_target, n.revision, n.rules, n.tags, n.v4_assign_mode, n.v6_assign_mode, n.sso_enabled, (CASE WHEN n.sso_enabled THEN o.client_id ELSE NULL END) as client_id, "
  475. "(CASE WHEN n.sso_enabled THEN o.authorization_endpoint ELSE NULL END) as authorization_endpoint, d.domain, d.servers, "
  476. "ARRAY(SELECT CONCAT(host(ip_range_start),'|', host(ip_range_end)) FROM ztc_network_assignment_pool WHERE network_id = n.id) AS assignment_pool, "
  477. "ARRAY(SELECT CONCAT(host(address),'/',bits::text,'|',COALESCE(host(via), 'NULL'))FROM ztc_network_route WHERE network_id = n.id) AS routes "
  478. "FROM ztc_network n "
  479. "LEFT OUTER JOIN ztc_org o "
  480. " ON o.owner_id = n.owner_id "
  481. "LEFT OUTER JOIN ztc_network_dns d "
  482. " ON d.network_id = n.id "
  483. "WHERE deleted = false AND controller_id = '%s'", _myAddressStr.c_str());
  484. auto c = _pool->borrow();
  485. auto c2 = _pool->borrow();
  486. pqxx::work w{*c->c};
  487. fprintf(stderr, "Load networks from psql...\n");
  488. auto stream = pqxx::stream_from::query(w, qbuf);
  489. std::tuple<
  490. std::string // network ID
  491. , std::optional<int64_t> // creationTime
  492. , std::optional<std::string> // capabilities
  493. , std::optional<bool> // enableBroadcast
  494. , std::optional<uint64_t> // lastModified
  495. , std::optional<int> // mtu
  496. , std::optional<int> // multicastLimit
  497. , std::optional<std::string> // name
  498. , bool // private
  499. , std::optional<int> // remoteTraceLevel
  500. , std::optional<std::string> // remoteTraceTarget
  501. , std::optional<uint64_t> // revision
  502. , std::optional<std::string> // rules
  503. , std::optional<std::string> // tags
  504. , std::optional<std::string> // v4AssignMode
  505. , std::optional<std::string> // v6AssignMode
  506. , std::optional<bool> // ssoEnabled
  507. , std::optional<std::string> // clientId
  508. , std::optional<std::string> // authorizationEndpoint
  509. , std::optional<std::string> // domain
  510. , std::optional<std::string> // servers
  511. , std::string // assignmentPoolString
  512. , std::string // routeString
  513. > row;
  514. uint64_t count = 0;
  515. auto tmp = std::chrono::high_resolution_clock::now();
  516. uint64_t total = 0;
  517. while (stream >> row) {
  518. auto start = std::chrono::high_resolution_clock::now();
  519. json empty;
  520. json config;
  521. initNetwork(config);
  522. std::string nwid = std::get<0>(row);
  523. std::optional<int64_t> creationTime = std::get<1>(row);
  524. std::optional<std::string> capabilities = std::get<2>(row);
  525. std::optional<bool> enableBroadcast = std::get<3>(row);
  526. std::optional<uint64_t> lastModified = std::get<4>(row);
  527. std::optional<int> mtu = std::get<5>(row);
  528. std::optional<int> multicastLimit = std::get<6>(row);
  529. std::optional<std::string> name = std::get<7>(row);
  530. bool isPrivate = std::get<8>(row);
  531. std::optional<int> remoteTraceLevel = std::get<9>(row);
  532. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  533. std::optional<uint64_t> revision = std::get<11>(row);
  534. std::optional<std::string> rules = std::get<12>(row);
  535. std::optional<std::string> tags = std::get<13>(row);
  536. std::optional<std::string> v4AssignMode = std::get<14>(row);
  537. std::optional<std::string> v6AssignMode = std::get<15>(row);
  538. std::optional<bool> ssoEnabled = std::get<16>(row);
  539. std::optional<std::string> clientId = std::get<17>(row);
  540. std::optional<std::string> authorizationEndpoint = std::get<18>(row);
  541. std::optional<std::string> dnsDomain = std::get<19>(row);
  542. std::optional<std::string> dnsServers = std::get<20>(row);
  543. std::string assignmentPoolString = std::get<21>(row);
  544. std::string routesString = std::get<22>(row);
  545. config["id"] = nwid;
  546. config["nwid"] = nwid;
  547. config["creationTime"] = creationTime.value_or(0);
  548. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  549. config["enableBroadcast"] = enableBroadcast.value_or(false);
  550. config["lastModified"] = lastModified.value_or(0);
  551. config["mtu"] = mtu.value_or(2800);
  552. config["multicastLimit"] = multicastLimit.value_or(64);
  553. config["name"] = name.value_or("");
  554. config["private"] = isPrivate;
  555. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  556. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  557. config["revision"] = revision.value_or(0);
  558. config["rules"] = json::parse(rules.value_or("[]"));
  559. config["tags"] = json::parse(tags.value_or("[]"));
  560. config["v4AssignMode"] = json::parse(v4AssignMode.value_or("{}"));
  561. config["v6AssignMode"] = json::parse(v6AssignMode.value_or("{}"));
  562. config["ssoEnabled"] = ssoEnabled.value_or(false);
  563. config["objtype"] = "network";
  564. config["ipAssignmentPools"] = json::array();
  565. config["routes"] = json::array();
  566. config["clientId"] = clientId.value_or("");
  567. config["authorizationEndpoint"] = authorizationEndpoint.value_or("");
  568. networkSet.insert(nwid);
  569. if (dnsDomain.has_value()) {
  570. std::string serverList = dnsServers.value();
  571. json obj;
  572. auto servers = json::array();
  573. if (serverList.rfind("{",0) != std::string::npos) {
  574. serverList = serverList.substr(1, serverList.size()-2);
  575. std::stringstream ss(serverList);
  576. while(ss.good()) {
  577. std::string server;
  578. std::getline(ss, server, ',');
  579. servers.push_back(server);
  580. }
  581. }
  582. obj["domain"] = dnsDomain.value();
  583. obj["servers"] = servers;
  584. config["dns"] = obj;
  585. }
  586. config["ipAssignmentPools"] = json::array();
  587. if (assignmentPoolString != "{}") {
  588. std::string tmp = assignmentPoolString.substr(1, assignmentPoolString.size()-2);
  589. std::vector<std::string> assignmentPools = split(tmp, ',');
  590. for (auto it = assignmentPools.begin(); it != assignmentPools.end(); ++it) {
  591. std::vector<std::string> r = split(*it, '|');
  592. json ip;
  593. ip["ipRangeStart"] = r[0];
  594. ip["ipRangeEnd"] = r[1];
  595. config["ipAssignmentPools"].push_back(ip);
  596. }
  597. }
  598. config["routes"] = json::array();
  599. if (routesString != "{}") {
  600. std::string tmp = routesString.substr(1, routesString.size()-2);
  601. std::vector<std::string> routes = split(tmp, ',');
  602. for (auto it = routes.begin(); it != routes.end(); ++it) {
  603. std::vector<std::string> r = split(*it, '|');
  604. json route;
  605. route["target"] = r[0];
  606. route["via"] = ((route["via"] == "NULL")? nullptr : r[1]);
  607. config["routes"].push_back(route);
  608. }
  609. }
  610. _networkChanged(empty, config, false);
  611. auto end = std::chrono::high_resolution_clock::now();
  612. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);;
  613. total += dur.count();
  614. ++count;
  615. if (count > 0 && count % 10000 == 0) {
  616. fprintf(stderr, "Averaging %llu us per network\n", (total/count));
  617. }
  618. }
  619. if (count > 0) {
  620. fprintf(stderr, "Took %llu us per network to load\n", (total/count));
  621. }
  622. stream.complete();
  623. w.commit();
  624. _pool->unborrow(c2);
  625. _pool->unborrow(c);
  626. fprintf(stderr, "done.\n");
  627. if (!networkSet.empty()) {
  628. if (_redisMemberStatus) {
  629. fprintf(stderr, "adding networks to redis...\n");
  630. if (_rc->clusterMode) {
  631. auto tx = _cluster->transaction(_myAddressStr, true, false);
  632. tx.sadd(setKey, networkSet.begin(), networkSet.end());
  633. tx.exec();
  634. } else {
  635. auto tx = _redis->transaction(true, false);
  636. tx.sadd(setKey, networkSet.begin(), networkSet.end());
  637. tx.exec();
  638. }
  639. fprintf(stderr, "done.\n");
  640. }
  641. }
  642. if (++this->_ready == 2) {
  643. if (_waitNoticePrinted) {
  644. fprintf(stderr,"[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S,_timestr(),(unsigned long long)_myAddress.toInt());
  645. }
  646. _readyLock.unlock();
  647. }
  648. fprintf(stderr, "network init done.\n");
  649. } catch (sw::redis::Error &e) {
  650. fprintf(stderr, "ERROR: Error initializing networks in Redis: %s\n", e.what());
  651. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  652. exit(-1);
  653. } catch (std::exception &e) {
  654. fprintf(stderr, "ERROR: Error initializing networks: %s\n", e.what());
  655. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  656. exit(-1);
  657. }
  658. }
  659. void PostgreSQL::initializeMembers()
  660. {
  661. std::string memberId;
  662. std::string networkId;
  663. try {
  664. std::unordered_map<std::string, std::string> networkMembers;
  665. fprintf(stderr, "Initializing Members...\n");
  666. std::string setKeyBase = "network-nodes-all:{" + _myAddressStr + "}:";
  667. if (_redisMemberStatus) {
  668. fprintf(stderr, "Initialize Redis for members...\n");
  669. std::lock_guard<std::mutex> l(_networks_l);
  670. std::unordered_set<std::string> deletes;
  671. for ( auto it : _networks) {
  672. uint64_t nwid_i = it.first;
  673. char nwidTmp[64] = {0};
  674. OSUtils::ztsnprintf(nwidTmp, sizeof(nwidTmp), "%.16llx", nwid_i);
  675. std::string nwid(nwidTmp);
  676. std::string key = setKeyBase + nwid;
  677. deletes.insert(key);
  678. }
  679. if (!deletes.empty()) {
  680. try {
  681. if (_rc->clusterMode) {
  682. auto tx = _cluster->transaction(_myAddressStr, true, false);
  683. for (std::string k : deletes) {
  684. tx.del(k);
  685. }
  686. tx.exec();
  687. } else {
  688. auto tx = _redis->transaction(true, false);
  689. for (std::string k : deletes) {
  690. tx.del(k);
  691. }
  692. tx.exec();
  693. }
  694. } catch (sw::redis::Error &e) {
  695. // ignore
  696. }
  697. }
  698. }
  699. char qbuf[2048];
  700. sprintf(qbuf, "SELECT m.id, m.network_id, m.active_bridge, m.authorized, m.capabilities, (EXTRACT(EPOCH FROM m.creation_time AT TIME ZONE 'UTC')*1000)::bigint, m.identity, "
  701. " (EXTRACT(EPOCH FROM m.last_authorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  702. " (EXTRACT(EPOCH FROM m.last_deauthorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  703. " m.remote_trace_level, m.remote_trace_target, m.tags, m.v_major, m.v_minor, m.v_rev, m.v_proto, "
  704. " m.no_auto_assign_ips, m.revision, sso_exempt, "
  705. " (SELECT (EXTRACT(EPOCH FROM e.authentication_expiry_time)*1000)::bigint "
  706. " FROM ztc_sso_expiry e "
  707. " INNER JOIN ztc_network n1 "
  708. " ON n.id = e.network_id "
  709. " WHERE e.network_id = m.network_id AND e.member_id = m.id AND n.sso_enabled = TRUE AND e.authentication_expiry_time IS NOT NULL "
  710. " ORDER BY e.authentication_expiry_time DESC LIMIT 1) AS authentication_expiry_time, "
  711. " ARRAY(SELECT DISTINCT address FROM ztc_member_ip_assignment WHERE member_id = m.id AND network_id = m.network_id) AS assigned_addresses "
  712. "FROM ztc_member m "
  713. "INNER JOIN ztc_network n "
  714. " ON n.id = m.network_id "
  715. "WHERE n.controller_id = '%s' AND m.deleted = false", _myAddressStr.c_str());
  716. auto c = _pool->borrow();
  717. auto c2 = _pool->borrow();
  718. pqxx::work w{*c->c};
  719. fprintf(stderr, "Load members from psql...\n");
  720. auto stream = pqxx::stream_from::query(w, qbuf);
  721. std::tuple<
  722. std::string // memberId
  723. , std::string // memberId
  724. , std::optional<bool> // activeBridge
  725. , std::optional<bool> // authorized
  726. , std::optional<std::string> // capabilities
  727. , std::optional<uint64_t> // creationTime
  728. , std::optional<std::string> // identity
  729. , std::optional<uint64_t> // lastAuthorizedTime
  730. , std::optional<uint64_t> // lastDeauthorizedTime
  731. , std::optional<int> // remoteTraceLevel
  732. , std::optional<std::string> // remoteTraceTarget
  733. , std::optional<std::string> // tags
  734. , std::optional<int> // vMajor
  735. , std::optional<int> // vMinor
  736. , std::optional<int> // vRev
  737. , std::optional<int> // vProto
  738. , std::optional<bool> // noAutoAssignIps
  739. , std::optional<uint64_t> // revision
  740. , std::optional<bool> // ssoExempt
  741. , std::optional<uint64_t> // authenticationExpiryTime
  742. , std::string // assignedAddresses
  743. > row;
  744. uint64_t count = 0;
  745. auto tmp = std::chrono::high_resolution_clock::now();
  746. uint64_t total = 0;
  747. while (stream >> row) {
  748. auto start = std::chrono::high_resolution_clock::now();
  749. json empty;
  750. json config;
  751. initMember(config);
  752. memberId = std::get<0>(row);
  753. networkId = std::get<1>(row);
  754. std::optional<bool> activeBridge = std::get<2>(row);
  755. std::optional<bool> authorized = std::get<3>(row);
  756. std::optional<std::string> capabilities = std::get<4>(row);
  757. std::optional<uint64_t> creationTime = std::get<5>(row);
  758. std::optional<std::string> identity = std::get<6>(row);
  759. std::optional<uint64_t> lastAuthorizedTime = std::get<7>(row);
  760. std::optional<uint64_t> lastDeauthorizedTime = std::get<8>(row);
  761. std::optional<int> remoteTraceLevel = std::get<9>(row);
  762. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  763. std::optional<std::string> tags = std::get<11>(row);
  764. std::optional<int> vMajor = std::get<12>(row);
  765. std::optional<int> vMinor = std::get<13>(row);
  766. std::optional<int> vRev = std::get<14>(row);
  767. std::optional<int> vProto = std::get<15>(row);
  768. std::optional<bool> noAutoAssignIps = std::get<16>(row);
  769. std::optional<uint64_t> revision = std::get<17>(row);
  770. std::optional<bool> ssoExempt = std::get<18>(row);
  771. std::optional<uint64_t> authenticationExpiryTime = std::get<19>(row);
  772. std::string assignedAddresses = std::get<20>(row);
  773. networkMembers.insert(std::pair<std::string, std::string>(setKeyBase+networkId, memberId));
  774. config["id"] = memberId;
  775. config["address"] = memberId;
  776. config["nwid"] = networkId;
  777. config["activeBridge"] = activeBridge.value_or(false);
  778. config["authorized"] = authorized.value_or(false);
  779. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  780. config["creationTime"] = creationTime.value_or(0);
  781. config["identity"] = identity.value_or("");
  782. config["lastAuthorizedTime"] = lastAuthorizedTime.value_or(0);
  783. config["lastDeauthorizedTime"] = lastDeauthorizedTime.value_or(0);
  784. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  785. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  786. config["tags"] = json::parse(tags.value_or("[]"));
  787. config["vMajor"] = vMajor.value_or(-1);
  788. config["vMinor"] = vMinor.value_or(-1);
  789. config["vRev"] = vRev.value_or(-1);
  790. config["vProto"] = vProto.value_or(-1);
  791. config["noAutoAssignIps"] = noAutoAssignIps.value_or(false);
  792. config["revision"] = revision.value_or(0);
  793. config["ssoExempt"] = ssoExempt.value_or(false);
  794. config["authenticationExpiryTime"] = authenticationExpiryTime.value_or(0);
  795. config["objtype"] = "member";
  796. config["ipAssignments"] = json::array();
  797. if (assignedAddresses != "{}") {
  798. std::string tmp = assignedAddresses.substr(1, assignedAddresses.size()-2);
  799. std::vector<std::string> addrs = split(tmp, ',');
  800. for (auto it = addrs.begin(); it != addrs.end(); ++it) {
  801. config["ipAssignments"].push_back(*it);
  802. }
  803. }
  804. _memberChanged(empty, config, false);
  805. memberId = "";
  806. networkId = "";
  807. auto end = std::chrono::high_resolution_clock::now();
  808. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);
  809. total += dur.count();
  810. ++count;
  811. if (count > 0 && count % 10000 == 0) {
  812. fprintf(stderr, "Averaging %llu us per member\n", (total/count));
  813. }
  814. }
  815. if (count > 0) {
  816. fprintf(stderr, "Took %llu us per member to load\n", (total/count));
  817. }
  818. stream.complete();
  819. w.commit();
  820. _pool->unborrow(c2);
  821. _pool->unborrow(c);
  822. fprintf(stderr, "done.\n");
  823. if (!networkMembers.empty()) {
  824. if (_redisMemberStatus) {
  825. fprintf(stderr, "Load member data into redis...\n");
  826. if (_rc->clusterMode) {
  827. auto tx = _cluster->transaction(_myAddressStr, true, false);
  828. for (auto it : networkMembers) {
  829. tx.sadd(it.first, it.second);
  830. }
  831. tx.exec();
  832. } else {
  833. auto tx = _redis->transaction(true, false);
  834. for (auto it : networkMembers) {
  835. tx.sadd(it.first, it.second);
  836. }
  837. tx.exec();
  838. }
  839. fprintf(stderr, "done.\n");
  840. }
  841. }
  842. fprintf(stderr, "Done loading members...\n");
  843. if (++this->_ready == 2) {
  844. if (_waitNoticePrinted) {
  845. fprintf(stderr,"[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S,_timestr(),(unsigned long long)_myAddress.toInt());
  846. }
  847. _readyLock.unlock();
  848. }
  849. } catch (sw::redis::Error &e) {
  850. fprintf(stderr, "ERROR: Error initializing members (redis): %s\n", e.what());
  851. exit(-1);
  852. } catch (std::exception &e) {
  853. fprintf(stderr, "ERROR: Error initializing member: %s-%s %s\n", networkId.c_str(), memberId.c_str(), e.what());
  854. exit(-1);
  855. }
  856. }
  857. void PostgreSQL::heartbeat()
  858. {
  859. char publicId[1024];
  860. char hostnameTmp[1024];
  861. _myId.toString(false,publicId);
  862. if (gethostname(hostnameTmp, sizeof(hostnameTmp))!= 0) {
  863. hostnameTmp[0] = (char)0;
  864. } else {
  865. for (int i = 0; i < (int)sizeof(hostnameTmp); ++i) {
  866. if ((hostnameTmp[i] == '.')||(hostnameTmp[i] == 0)) {
  867. hostnameTmp[i] = (char)0;
  868. break;
  869. }
  870. }
  871. }
  872. const char *controllerId = _myAddressStr.c_str();
  873. const char *publicIdentity = publicId;
  874. const char *hostname = hostnameTmp;
  875. while (_run == 1) {
  876. // fprintf(stderr, "%s: heartbeat\n", controllerId);
  877. auto c = _pool->borrow();
  878. int64_t ts = OSUtils::now();
  879. if(c->c) {
  880. pqxx::work w{*c->c};
  881. std::string major = std::to_string(ZEROTIER_ONE_VERSION_MAJOR);
  882. std::string minor = std::to_string(ZEROTIER_ONE_VERSION_MINOR);
  883. std::string rev = std::to_string(ZEROTIER_ONE_VERSION_REVISION);
  884. std::string build = std::to_string(ZEROTIER_ONE_VERSION_BUILD);
  885. std::string now = std::to_string(ts);
  886. std::string host_port = std::to_string(_listenPort);
  887. std::string use_redis = (_rc != NULL) ? "true" : "false";
  888. std::string redis_mem_status = (_redisMemberStatus) ? "true" : "false";
  889. try {
  890. pqxx::result res = w.exec0("INSERT INTO ztc_controller (id, cluster_host, last_alive, public_identity, v_major, v_minor, v_rev, v_build, host_port, use_redis, redis_member_status) "
  891. "VALUES ("+w.quote(controllerId)+", "+w.quote(hostname)+", TO_TIMESTAMP("+now+"::double precision/1000), "+
  892. w.quote(publicIdentity)+", "+major+", "+minor+", "+rev+", "+build+", "+host_port+", "+use_redis+", "+redis_mem_status+") "
  893. "ON CONFLICT (id) DO UPDATE SET cluster_host = EXCLUDED.cluster_host, last_alive = EXCLUDED.last_alive, "
  894. "public_identity = EXCLUDED.public_identity, v_major = EXCLUDED.v_major, v_minor = EXCLUDED.v_minor, "
  895. "v_rev = EXCLUDED.v_rev, v_build = EXCLUDED.v_rev, host_port = EXCLUDED.host_port, "
  896. "use_redis = EXCLUDED.use_redis, redis_member_status = EXCLUDED.redis_member_status");
  897. } catch (std::exception &e) {
  898. fprintf(stderr, "Heartbeat update failed: %s\n", e.what());
  899. w.abort();
  900. _pool->unborrow(c);
  901. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  902. continue;
  903. }
  904. w.commit();
  905. }
  906. _pool->unborrow(c);
  907. try {
  908. if (_redisMemberStatus) {
  909. if (_rc->clusterMode) {
  910. _cluster->zadd("controllers", "controllerId", ts);
  911. } else {
  912. _redis->zadd("controllers", "controllerId", ts);
  913. }
  914. }
  915. } catch (sw::redis::Error &e) {
  916. fprintf(stderr, "ERROR: Redis error in heartbeat thread: %s\n", e.what());
  917. }
  918. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  919. }
  920. fprintf(stderr, "Exited heartbeat thread\n");
  921. }
  922. void PostgreSQL::membersDbWatcher()
  923. {
  924. if (_rc) {
  925. _membersWatcher_Redis();
  926. } else {
  927. _membersWatcher_Postgres();
  928. }
  929. if (_run == 1) {
  930. fprintf(stderr, "ERROR: %s membersDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  931. exit(9);
  932. }
  933. fprintf(stderr, "Exited membersDbWatcher\n");
  934. }
  935. void PostgreSQL::_membersWatcher_Postgres() {
  936. auto c = _pool->borrow();
  937. std::string stream = "member_" + _myAddressStr;
  938. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  939. MemberNotificationReceiver m(this, *c->c, stream);
  940. while(_run == 1) {
  941. c->c->await_notification(5, 0);
  942. }
  943. _pool->unborrow(c);
  944. }
  945. void PostgreSQL::_membersWatcher_Redis() {
  946. char buf[11] = {0};
  947. std::string key = "member-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  948. std::string lastID = "0";
  949. fprintf(stderr, "Listening to member stream: %s\n", key.c_str());
  950. while (_run == 1) {
  951. try {
  952. json tmp;
  953. std::unordered_map<std::string, ItemStream> result;
  954. if (_rc->clusterMode) {
  955. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  956. } else {
  957. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  958. }
  959. if (!result.empty()) {
  960. for (auto element : result) {
  961. #ifdef REDIS_TRACE
  962. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  963. #endif
  964. for (auto rec : element.second) {
  965. std::string id = rec.first;
  966. auto attrs = rec.second;
  967. #ifdef REDIS_TRACE
  968. fprintf(stdout, "Record ID: %s\n", id.c_str());
  969. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  970. #endif
  971. for (auto a : attrs) {
  972. #ifdef REDIS_TRACE
  973. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  974. #endif
  975. try {
  976. tmp = json::parse(a.second);
  977. json &ov = tmp["old_val"];
  978. json &nv = tmp["new_val"];
  979. json oldConfig, newConfig;
  980. if (ov.is_object()) oldConfig = ov;
  981. if (nv.is_object()) newConfig = nv;
  982. if (oldConfig.is_object()||newConfig.is_object()) {
  983. _memberChanged(oldConfig,newConfig,(this->_ready >= 2));
  984. }
  985. } catch (...) {
  986. fprintf(stderr, "json parse error in networkWatcher_Redis\n");
  987. }
  988. }
  989. if (_rc->clusterMode) {
  990. _cluster->xdel(key, id);
  991. } else {
  992. _redis->xdel(key, id);
  993. }
  994. lastID = id;
  995. }
  996. }
  997. }
  998. } catch (sw::redis::Error &e) {
  999. fprintf(stderr, "Error in Redis members watcher: %s\n", e.what());
  1000. }
  1001. }
  1002. fprintf(stderr, "membersWatcher ended\n");
  1003. }
  1004. void PostgreSQL::networksDbWatcher()
  1005. {
  1006. if (_rc) {
  1007. _networksWatcher_Redis();
  1008. } else {
  1009. _networksWatcher_Postgres();
  1010. }
  1011. if (_run == 1) {
  1012. fprintf(stderr, "ERROR: %s networksDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1013. exit(8);
  1014. }
  1015. fprintf(stderr, "Exited networksDbWatcher\n");
  1016. }
  1017. void PostgreSQL::_networksWatcher_Postgres() {
  1018. std::string stream = "network_" + _myAddressStr;
  1019. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  1020. auto c = _pool->borrow();
  1021. NetworkNotificationReceiver n(this, *c->c, stream);
  1022. while(_run == 1) {
  1023. c->c->await_notification(5,0);
  1024. }
  1025. }
  1026. void PostgreSQL::_networksWatcher_Redis() {
  1027. char buf[11] = {0};
  1028. std::string key = "network-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  1029. std::string lastID = "0";
  1030. while (_run == 1) {
  1031. try {
  1032. json tmp;
  1033. std::unordered_map<std::string, ItemStream> result;
  1034. if (_rc->clusterMode) {
  1035. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1036. } else {
  1037. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1038. }
  1039. if (!result.empty()) {
  1040. for (auto element : result) {
  1041. #ifdef REDIS_TRACE
  1042. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  1043. #endif
  1044. for (auto rec : element.second) {
  1045. std::string id = rec.first;
  1046. auto attrs = rec.second;
  1047. #ifdef REDIS_TRACE
  1048. fprintf(stdout, "Record ID: %s\n", id.c_str());
  1049. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  1050. #endif
  1051. for (auto a : attrs) {
  1052. #ifdef REDIS_TRACE
  1053. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  1054. #endif
  1055. try {
  1056. tmp = json::parse(a.second);
  1057. json &ov = tmp["old_val"];
  1058. json &nv = tmp["new_val"];
  1059. json oldConfig, newConfig;
  1060. if (ov.is_object()) oldConfig = ov;
  1061. if (nv.is_object()) newConfig = nv;
  1062. if (oldConfig.is_object()||newConfig.is_object()) {
  1063. _networkChanged(oldConfig,newConfig,(this->_ready >= 2));
  1064. }
  1065. } catch (...) {
  1066. fprintf(stderr, "json parse error in networkWatcher_Redis\n");
  1067. }
  1068. }
  1069. if (_rc->clusterMode) {
  1070. _cluster->xdel(key, id);
  1071. } else {
  1072. _redis->xdel(key, id);
  1073. }
  1074. lastID = id;
  1075. }
  1076. }
  1077. }
  1078. } catch (sw::redis::Error &e) {
  1079. fprintf(stderr, "Error in Redis networks watcher: %s\n", e.what());
  1080. }
  1081. }
  1082. fprintf(stderr, "networksWatcher ended\n");
  1083. }
  1084. void PostgreSQL::commitThread()
  1085. {
  1086. fprintf(stderr, "%s: commitThread start\n", _myAddressStr.c_str());
  1087. std::pair<nlohmann::json,bool> qitem;
  1088. while(_commitQueue.get(qitem)&(_run == 1)) {
  1089. //fprintf(stderr, "commitThread tick\n");
  1090. if (!qitem.first.is_object()) {
  1091. fprintf(stderr, "not an object\n");
  1092. continue;
  1093. }
  1094. std::shared_ptr<PostgresConnection> c;
  1095. try {
  1096. c = _pool->borrow();
  1097. } catch (std::exception &e) {
  1098. fprintf(stderr, "ERROR: %s\n", e.what());
  1099. continue;
  1100. }
  1101. if (!c) {
  1102. fprintf(stderr, "Error getting database connection\n");
  1103. continue;
  1104. }
  1105. try {
  1106. nlohmann::json &config = (qitem.first);
  1107. const std::string objtype = config["objtype"];
  1108. if (objtype == "member") {
  1109. // fprintf(stderr, "%s: commitThread: member\n", _myAddressStr.c_str());
  1110. std::string memberId;
  1111. std::string networkId;
  1112. try {
  1113. pqxx::work w(*c->c);
  1114. memberId = config["id"];
  1115. networkId = config["nwid"];
  1116. std::string target = "NULL";
  1117. if (!config["remoteTraceTarget"].is_null()) {
  1118. target = config["remoteTraceTarget"];
  1119. }
  1120. pqxx::row nwrow = w.exec_params1("SELECT COUNT(id) FROM ztc_network WHERE id = $1", networkId);
  1121. int nwcount = nwrow[0].as<int>();
  1122. if (nwcount != 1) {
  1123. fprintf(stderr, "network %s does not exist. skipping member upsert\n", networkId.c_str());
  1124. w.abort();
  1125. _pool->unborrow(c);
  1126. continue;
  1127. }
  1128. pqxx::result res = w.exec_params0(
  1129. "INSERT INTO ztc_member (id, network_id, active_bridge, authorized, capabilities, "
  1130. "identity, last_authorized_time, last_deauthorized_time, no_auto_assign_ips, "
  1131. "remote_trace_level, remote_trace_target, revision, tags, v_major, v_minor, v_rev, v_proto) "
  1132. "VALUES ($1, $2, $3, $4, $5, $6, "
  1133. "TO_TIMESTAMP($7::double precision/1000), TO_TIMESTAMP($8::double precision/1000), "
  1134. "$9, $10, $11, $12, $13, $14, $15, $16, $17) ON CONFLICT (network_id, id) DO UPDATE SET "
  1135. "active_bridge = EXCLUDED.active_bridge, authorized = EXCLUDED.authorized, capabilities = EXCLUDED.capabilities, "
  1136. "identity = EXCLUDED.identity, last_authorized_time = EXCLUDED.last_authorized_time, "
  1137. "last_deauthorized_time = EXCLUDED.last_deauthorized_time, no_auto_assign_ips = EXCLUDED.no_auto_assign_ips, "
  1138. "remote_trace_level = EXCLUDED.remote_trace_level, remote_trace_target = EXCLUDED.remote_trace_target, "
  1139. "revision = EXCLUDED.revision+1, tags = EXCLUDED.tags, v_major = EXCLUDED.v_major, "
  1140. "v_minor = EXCLUDED.v_minor, v_rev = EXCLUDED.v_rev, v_proto = EXCLUDED.v_proto",
  1141. memberId,
  1142. networkId,
  1143. (bool)config["activeBridge"],
  1144. (bool)config["authorized"],
  1145. OSUtils::jsonDump(config["capabilities"], -1),
  1146. OSUtils::jsonString(config["identity"], ""),
  1147. (uint64_t)config["lastAuthorizedTime"],
  1148. (uint64_t)config["lastDeauthorizedTime"],
  1149. (bool)config["noAutoAssignIps"],
  1150. (int)config["remoteTraceLevel"],
  1151. target,
  1152. (uint64_t)config["revision"],
  1153. OSUtils::jsonDump(config["tags"], -1),
  1154. (int)config["vMajor"],
  1155. (int)config["vMinor"],
  1156. (int)config["vRev"],
  1157. (int)config["vProto"]);
  1158. res = w.exec_params0("DELETE FROM ztc_member_ip_assignment WHERE member_id = $1 AND network_id = $2",
  1159. memberId, networkId);
  1160. std::vector<std::string> assignments;
  1161. bool ipAssignError = false;
  1162. for (auto i = config["ipAssignments"].begin(); i != config["ipAssignments"].end(); ++i) {
  1163. std::string addr = *i;
  1164. if (std::find(assignments.begin(), assignments.end(), addr) != assignments.end()) {
  1165. continue;
  1166. }
  1167. res = w.exec_params0(
  1168. "INSERT INTO ztc_member_ip_assignment (member_id, network_id, address) VALUES ($1, $2, $3) ON CONFLICT (network_id, member_id, address) DO NOTHING",
  1169. memberId, networkId, addr);
  1170. assignments.push_back(addr);
  1171. }
  1172. if (ipAssignError) {
  1173. fprintf(stderr, "%s: ipAssignError\n", _myAddressStr.c_str());
  1174. w.abort();
  1175. _pool->unborrow(c);
  1176. c.reset();
  1177. continue;
  1178. }
  1179. w.commit();
  1180. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1181. const uint64_t memberidInt = OSUtils::jsonIntHex(config["id"], 0ULL);
  1182. if (nwidInt && memberidInt) {
  1183. nlohmann::json nwOrig;
  1184. nlohmann::json memOrig;
  1185. nlohmann::json memNew(config);
  1186. get(nwidInt, nwOrig, memberidInt, memOrig);
  1187. _memberChanged(memOrig, memNew, qitem.second);
  1188. } else {
  1189. fprintf(stderr, "%s: Can't notify of change. Error parsing nwid or memberid: %llu-%llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt, (unsigned long long)memberidInt);
  1190. }
  1191. } catch (std::exception &e) {
  1192. fprintf(stderr, "%s ERROR: Error updating member %s-%s: %s\n", _myAddressStr.c_str(), networkId.c_str(), memberId.c_str(), e.what());
  1193. }
  1194. } else if (objtype == "network") {
  1195. try {
  1196. // fprintf(stderr, "%s: commitThread: network\n", _myAddressStr.c_str());
  1197. pqxx::work w(*c->c);
  1198. std::string id = config["id"];
  1199. std::string remoteTraceTarget = "";
  1200. if(!config["remoteTraceTarget"].is_null()) {
  1201. remoteTraceTarget = config["remoteTraceTarget"];
  1202. }
  1203. std::string rulesSource = "";
  1204. if (config["rulesSource"].is_string()) {
  1205. rulesSource = config["rulesSource"];
  1206. }
  1207. // This ugly query exists because when we want to mirror networks to/from
  1208. // another data store (e.g. FileDB or LFDB) it is possible to get a network
  1209. // that doesn't exist in Central's database. This does an upsert and sets
  1210. // the owner_id to the "first" global admin in the user DB if the record
  1211. // did not previously exist. If the record already exists owner_id is left
  1212. // unchanged, so owner_id should be left out of the update clause.
  1213. pqxx::result res = w.exec_params0(
  1214. "INSERT INTO ztc_network (id, creation_time, owner_id, controller_id, capabilities, enable_broadcast, "
  1215. "last_modified, mtu, multicast_limit, name, private, "
  1216. "remote_trace_level, remote_trace_target, rules, rules_source, "
  1217. "tags, v4_assign_mode, v6_assign_mode, sso_enabled) VALUES ("
  1218. "$1, TO_TIMESTAMP($5::double precision/1000), "
  1219. "(SELECT user_id AS owner_id FROM ztc_global_permissions WHERE authorize = true AND del = true AND modify = true AND read = true LIMIT 1),"
  1220. "$2, $3, $4, TO_TIMESTAMP($5::double precision/1000), "
  1221. "$6, $7, $8, $9, $10, $11, $12, $13, $14, $15, $16, $17) "
  1222. "ON CONFLICT (id) DO UPDATE set controller_id = EXCLUDED.controller_id, "
  1223. "capabilities = EXCLUDED.capabilities, enable_broadcast = EXCLUDED.enable_broadcast, "
  1224. "last_modified = EXCLUDED.last_modified, mtu = EXCLUDED.mtu, "
  1225. "multicast_limit = EXCLUDED.multicast_limit, name = EXCLUDED.name, "
  1226. "private = EXCLUDED.private, remote_trace_level = EXCLUDED.remote_trace_level, "
  1227. "remote_trace_target = EXCLUDED.remote_trace_target, rules = EXCLUDED.rules, "
  1228. "rules_source = EXCLUDED.rules_source, tags = EXCLUDED.tags, "
  1229. "v4_assign_mode = EXCLUDED.v4_assign_mode, v6_assign_mode = EXCLUDED.v6_assign_mode, "
  1230. "sso_enabled = EXCLUDED.sso_enabled",
  1231. id,
  1232. _myAddressStr,
  1233. OSUtils::jsonDump(config["capabilitles"], -1),
  1234. (bool)config["enableBroadcast"],
  1235. OSUtils::now(),
  1236. (int)config["mtu"],
  1237. (int)config["multicastLimit"],
  1238. OSUtils::jsonString(config["name"],""),
  1239. (bool)config["private"],
  1240. (int)config["remoteTraceLevel"],
  1241. remoteTraceTarget,
  1242. OSUtils::jsonDump(config["rules"], -1),
  1243. rulesSource,
  1244. OSUtils::jsonDump(config["tags"], -1),
  1245. OSUtils::jsonDump(config["v4AssignMode"],-1),
  1246. OSUtils::jsonDump(config["v6AssignMode"], -1),
  1247. OSUtils::jsonBool(config["ssoEnabled"], false));
  1248. res = w.exec_params0("DELETE FROM ztc_network_assignment_pool WHERE network_id = $1", 0);
  1249. auto pool = config["ipAssignmentPools"];
  1250. bool err = false;
  1251. for (auto i = pool.begin(); i != pool.end(); ++i) {
  1252. std::string start = (*i)["ipRangeStart"];
  1253. std::string end = (*i)["ipRangeEnd"];
  1254. res = w.exec_params0(
  1255. "INSERT INTO ztc_network_assignment_pool (network_id, ip_range_start, ip_range_end) "
  1256. "VALUES ($1, $2, $3)", id, start, end);
  1257. }
  1258. res = w.exec_params0("DELETE FROM ztc_network_route WHERE network_id = $1", id);
  1259. auto routes = config["routes"];
  1260. err = false;
  1261. for (auto i = routes.begin(); i != routes.end(); ++i) {
  1262. std::string t = (*i)["target"];
  1263. std::vector<std::string> target;
  1264. std::istringstream f(t);
  1265. std::string s;
  1266. while(std::getline(f, s, '/')) {
  1267. target.push_back(s);
  1268. }
  1269. if (target.empty() || target.size() != 2) {
  1270. continue;
  1271. }
  1272. std::string targetAddr = target[0];
  1273. std::string targetBits = target[1];
  1274. std::string via = "NULL";
  1275. if (!(*i)["via"].is_null()) {
  1276. via = (*i)["via"];
  1277. }
  1278. res = w.exec_params0("INSERT INTO ztc_network_route (network_id, address, bits, via) VALUES ($1, $2, $3, $4)",
  1279. id, targetAddr, targetBits, (via == "NULL" ? NULL : via.c_str()));
  1280. }
  1281. if (err) {
  1282. fprintf(stderr, "%s: route add error\n", _myAddressStr.c_str());
  1283. w.abort();
  1284. _pool->unborrow(c);
  1285. continue;
  1286. }
  1287. auto dns = config["dns"];
  1288. std::string domain = dns["domain"];
  1289. std::stringstream servers;
  1290. servers << "{";
  1291. for (auto j = dns["servers"].begin(); j < dns["servers"].end(); ++j) {
  1292. servers << *j;
  1293. if ( (j+1) != dns["servers"].end()) {
  1294. servers << ",";
  1295. }
  1296. }
  1297. servers << "}";
  1298. std::string s = servers.str();
  1299. res = w.exec_params0("INSERT INTO ztc_network_dns (network_id, domain, servers) VALUES ($1, $2, $3) ON CONFLICT (network_id) DO UPDATE SET domain = EXCLUDED.domain, servers = EXCLUDED.servers",
  1300. id, domain, s);
  1301. w.commit();
  1302. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1303. if (nwidInt) {
  1304. nlohmann::json nwOrig;
  1305. nlohmann::json nwNew(config);
  1306. get(nwidInt, nwOrig);
  1307. _networkChanged(nwOrig, nwNew, qitem.second);
  1308. } else {
  1309. fprintf(stderr, "%s: Can't notify network changed: %llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt);
  1310. }
  1311. } catch (std::exception &e) {
  1312. fprintf(stderr, "%s ERROR: Error updating network: %s\n", _myAddressStr.c_str(), e.what());
  1313. }
  1314. if (_redisMemberStatus) {
  1315. try {
  1316. std::string id = config["id"];
  1317. std::string controllerId = _myAddressStr.c_str();
  1318. std::string key = "networks:{" + controllerId + "}";
  1319. if (_rc->clusterMode) {
  1320. _cluster->sadd(key, id);
  1321. } else {
  1322. _redis->sadd(key, id);
  1323. }
  1324. } catch (sw::redis::Error &e) {
  1325. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1326. }
  1327. }
  1328. } else if (objtype == "_delete_network") {
  1329. // fprintf(stderr, "%s: commitThread: delete network\n", _myAddressStr.c_str());
  1330. try {
  1331. pqxx::work w(*c->c);
  1332. std::string networkId = config["nwid"];
  1333. pqxx::result res = w.exec_params0("UPDATE ztc_network SET deleted = true WHERE id = $1",
  1334. networkId);
  1335. w.commit();
  1336. } catch (std::exception &e) {
  1337. fprintf(stderr, "%s ERROR: Error deleting network: %s\n", _myAddressStr.c_str(), e.what());
  1338. }
  1339. if (_redisMemberStatus) {
  1340. try {
  1341. std::string id = config["id"];
  1342. std::string controllerId = _myAddressStr.c_str();
  1343. std::string key = "networks:{" + controllerId + "}";
  1344. if (_rc->clusterMode) {
  1345. _cluster->srem(key, id);
  1346. _cluster->del("network-nodes-online:{"+controllerId+"}:"+id);
  1347. } else {
  1348. _redis->srem(key, id);
  1349. _redis->del("network-nodes-online:{"+controllerId+"}:"+id);
  1350. }
  1351. } catch (sw::redis::Error &e) {
  1352. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1353. }
  1354. }
  1355. } else if (objtype == "_delete_member") {
  1356. // fprintf(stderr, "%s commitThread: delete member\n", _myAddressStr.c_str());
  1357. try {
  1358. pqxx::work w(*c->c);
  1359. std::string memberId = config["id"];
  1360. std::string networkId = config["nwid"];
  1361. pqxx::result res = w.exec_params0(
  1362. "UPDATE ztc_member SET hidden = true, deleted = true WHERE id = $1 AND network_id = $2",
  1363. memberId, networkId);
  1364. w.commit();
  1365. } catch (std::exception &e) {
  1366. fprintf(stderr, "%s ERROR: Error deleting member: %s\n", _myAddressStr.c_str(), e.what());
  1367. }
  1368. if (_redisMemberStatus) {
  1369. try {
  1370. std::string memberId = config["id"];
  1371. std::string networkId = config["nwid"];
  1372. std::string controllerId = _myAddressStr.c_str();
  1373. std::string key = "network-nodes-all:{" + controllerId + "}:" + networkId;
  1374. if (_rc->clusterMode) {
  1375. _cluster->srem(key, memberId);
  1376. _cluster->del("member:{"+controllerId+"}:"+networkId+":"+memberId);
  1377. } else {
  1378. _redis->srem(key, memberId);
  1379. _redis->del("member:{"+controllerId+"}:"+networkId+":"+memberId);
  1380. }
  1381. } catch (sw::redis::Error &e) {
  1382. fprintf(stderr, "ERROR: Error deleting member from Redis: %s\n", e.what());
  1383. }
  1384. }
  1385. } else {
  1386. fprintf(stderr, "%s ERROR: unknown objtype\n", _myAddressStr.c_str());
  1387. }
  1388. } catch (std::exception &e) {
  1389. fprintf(stderr, "%s ERROR: Error getting objtype: %s\n", _myAddressStr.c_str(), e.what());
  1390. }
  1391. _pool->unborrow(c);
  1392. c.reset();
  1393. std::this_thread::sleep_for(std::chrono::milliseconds(100));
  1394. }
  1395. fprintf(stderr, "%s commitThread finished\n", _myAddressStr.c_str());
  1396. }
  1397. void PostgreSQL::onlineNotificationThread()
  1398. {
  1399. waitForReady();
  1400. if (_redisMemberStatus) {
  1401. onlineNotification_Redis();
  1402. } else {
  1403. onlineNotification_Postgres();
  1404. }
  1405. }
  /**
   * ONLY UNCOMMENT FOR TEMPORARY DB MAINTENANCE
   *
   * This define temporarily turns off writing to the member status table
   * so it can be reindexed when the indexes get too large.
   */
  // #define DISABLE_MEMBER_STATUS 1
  1413. void PostgreSQL::onlineNotification_Postgres()
  1414. {
  1415. _connected = 1;
  1416. nlohmann::json jtmp1, jtmp2;
  1417. while (_run == 1) {
  1418. auto c = _pool->borrow();
  1419. auto c2 = _pool->borrow();
  1420. try {
  1421. fprintf(stderr, "%s onlineNotification_Postgres\n", _myAddressStr.c_str());
  1422. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > lastOnline;
  1423. {
  1424. std::lock_guard<std::mutex> l(_lastOnline_l);
  1425. lastOnline.swap(_lastOnline);
  1426. }
  1427. #ifndef DISABLE_MEMBER_STATUS
  1428. pqxx::work w(*c->c);
  1429. pqxx::work w2(*c2->c);
  1430. fprintf(stderr, "online notification tick\n");
  1431. bool firstRun = true;
  1432. bool memberAdded = false;
  1433. int updateCount = 0;
  1434. pqxx::pipeline pipe(w);
  1435. for (auto i=lastOnline.begin(); i != lastOnline.end(); ++i) {
  1436. updateCount += 1;
  1437. uint64_t nwid_i = i->first.first;
  1438. char nwidTmp[64];
  1439. char memTmp[64];
  1440. char ipTmp[64];
  1441. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1442. OSUtils::ztsnprintf(memTmp,sizeof(memTmp), "%.10llx", i->first.second);
  1443. if(!get(nwid_i, jtmp1, i->first.second, jtmp2)) {
  1444. continue; // skip non existent networks/members
  1445. }
  1446. std::string networkId(nwidTmp);
  1447. std::string memberId(memTmp);
  1448. try {
  1449. pqxx::row r = w2.exec_params1("SELECT id, network_id FROM ztc_member WHERE network_id = $1 AND id = $2",
  1450. networkId, memberId);
  1451. } catch (pqxx::unexpected_rows &e) {
  1452. continue;
  1453. }
  1454. int64_t ts = i->second.first;
  1455. std::string ipAddr = i->second.second.toIpString(ipTmp);
  1456. std::string timestamp = std::to_string(ts);
  1457. std::stringstream memberUpdate;
  1458. memberUpdate << "INSERT INTO ztc_member_status (network_id, member_id, address, last_updated) VALUES "
  1459. << "('" << networkId << "', '" << memberId << "', ";
  1460. if (ipAddr.empty()) {
  1461. memberUpdate << "NULL, ";
  1462. } else {
  1463. memberUpdate << "'" << ipAddr << "', ";
  1464. }
  1465. memberUpdate << "TO_TIMESTAMP(" << timestamp << "::double precision/1000)) "
  1466. << " ON CONFLICT (network_id, member_id) DO UPDATE SET address = EXCLUDED.address, last_updated = EXCLUDED.last_updated";
  1467. pipe.insert(memberUpdate.str());
  1468. }
  1469. while(!pipe.empty()) {
  1470. pipe.retrieve();
  1471. }
  1472. pipe.complete();
  1473. w.commit();
  1474. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), updateCount);
  1475. #endif
  1476. } catch (std::exception &e) {
  1477. fprintf(stderr, "%s: error in onlinenotification thread: %s\n", _myAddressStr.c_str(), e.what());
  1478. }
  1479. _pool->unborrow(c2);
  1480. _pool->unborrow(c);
  1481. ConnectionPoolStats stats = _pool->get_stats();
  1482. fprintf(stderr, "%s pool stats: in use size: %llu, available size: %llu, total: %llu\n",
  1483. _myAddressStr.c_str(), stats.borrowed_size, stats.pool_size, (stats.borrowed_size + stats.pool_size));
  1484. std::this_thread::sleep_for(std::chrono::seconds(10));
  1485. }
  1486. fprintf(stderr, "%s: Fell out of run loop in onlineNotificationThread\n", _myAddressStr.c_str());
  1487. if (_run == 1) {
  1488. fprintf(stderr, "ERROR: %s onlineNotificationThread should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1489. exit(6);
  1490. }
  1491. }
  1492. void PostgreSQL::onlineNotification_Redis()
  1493. {
  1494. _connected = 1;
  1495. char buf[11] = {0};
  1496. std::string controllerId = std::string(_myAddress.toString(buf));
  1497. while (_run == 1) {
  1498. fprintf(stderr, "onlineNotification tick\n");
  1499. auto start = std::chrono::high_resolution_clock::now();
  1500. uint64_t count = 0;
  1501. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > lastOnline;
  1502. {
  1503. std::lock_guard<std::mutex> l(_lastOnline_l);
  1504. lastOnline.swap(_lastOnline);
  1505. }
  1506. try {
  1507. if (!lastOnline.empty()) {
  1508. if (_rc->clusterMode) {
  1509. auto tx = _cluster->transaction(controllerId, true, false);
  1510. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1511. } else {
  1512. auto tx = _redis->transaction(true, false);
  1513. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1514. }
  1515. }
  1516. } catch (sw::redis::Error &e) {
  1517. fprintf(stderr, "Error in online notification thread (redis): %s\n", e.what());
  1518. }
  1519. auto end = std::chrono::high_resolution_clock::now();
  1520. auto dur = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
  1521. auto total = dur.count();
  1522. fprintf(stderr, "onlineNotification ran in %llu ms\n", total);
  1523. std::this_thread::sleep_for(std::chrono::seconds(5));
  1524. }
  1525. }
  1526. uint64_t PostgreSQL::_doRedisUpdate(sw::redis::Transaction &tx, std::string &controllerId,
  1527. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > &lastOnline)
  1528. {
  1529. nlohmann::json jtmp1, jtmp2;
  1530. uint64_t count = 0;
  1531. for (auto i=lastOnline.begin(); i != lastOnline.end(); ++i) {
  1532. uint64_t nwid_i = i->first.first;
  1533. uint64_t memberid_i = i->first.second;
  1534. char nwidTmp[64];
  1535. char memTmp[64];
  1536. char ipTmp[64];
  1537. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1538. OSUtils::ztsnprintf(memTmp,sizeof(memTmp), "%.10llx", memberid_i);
  1539. if (!get(nwid_i, jtmp1, memberid_i, jtmp2)){
  1540. continue; // skip non existent members/networks
  1541. }
  1542. std::string networkId(nwidTmp);
  1543. std::string memberId(memTmp);
  1544. int64_t ts = i->second.first;
  1545. std::string ipAddr = i->second.second.toIpString(ipTmp);
  1546. std::string timestamp = std::to_string(ts);
  1547. std::unordered_map<std::string, std::string> record = {
  1548. {"id", memberId},
  1549. {"address", ipAddr},
  1550. {"last_updated", std::to_string(ts)}
  1551. };
  1552. tx.zadd("nodes-online:{"+controllerId+"}", memberId, ts)
  1553. .zadd("nodes-online2:{"+controllerId+"}", networkId+"-"+memberId, ts)
  1554. .zadd("network-nodes-online:{"+controllerId+"}:"+networkId, memberId, ts)
  1555. .zadd("active-networks:{"+controllerId+"}", networkId, ts)
  1556. .sadd("network-nodes-all:{"+controllerId+"}:"+networkId, memberId)
  1557. .hmset("member:{"+controllerId+"}:"+networkId+":"+memberId, record.begin(), record.end());
  1558. ++count;
  1559. }
  1560. // expire records from all-nodes and network-nodes member list
  1561. uint64_t expireOld = OSUtils::now() - 300000;
  1562. tx.zremrangebyscore("nodes-online:{"+controllerId+"}",
  1563. sw::redis::RightBoundedInterval<double>(expireOld,
  1564. sw::redis::BoundType::LEFT_OPEN));
  1565. tx.zremrangebyscore("nodes-online2:{"+controllerId+"}",
  1566. sw::redis::RightBoundedInterval<double>(expireOld,
  1567. sw::redis::BoundType::LEFT_OPEN));
  1568. tx.zremrangebyscore("active-networks:{"+controllerId+"}",
  1569. sw::redis::RightBoundedInterval<double>(expireOld,
  1570. sw::redis::BoundType::LEFT_OPEN));
  1571. {
  1572. std::lock_guard<std::mutex> l(_networks_l);
  1573. for (const auto &it : _networks) {
  1574. uint64_t nwid_i = it.first;
  1575. char nwidTmp[64];
  1576. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1577. tx.zremrangebyscore("network-nodes-online:{"+controllerId+"}:"+nwidTmp,
  1578. sw::redis::RightBoundedInterval<double>(expireOld, sw::redis::BoundType::LEFT_OPEN));
  1579. }
  1580. }
  1581. tx.exec();
  1582. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), count);
  1583. return count;
  1584. }
  1585. #endif //ZT_CONTROLLER_USE_LIBPQ