PostgreSQL.cpp 60 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787
  1. /*
  2. * Copyright (c)2019 ZeroTier, Inc.
  3. *
  4. * Use of this software is governed by the Business Source License included
  5. * in the LICENSE.TXT file in the project's root directory.
  6. *
  7. * Change Date: 2025-01-01
  8. *
  9. * On the date above, in accordance with the Business Source License, use
  10. * of this software will be governed by version 2.0 of the Apache License.
  11. */
  12. /****/
  13. #include "PostgreSQL.hpp"
  14. #ifdef ZT_CONTROLLER_USE_LIBPQ
  15. #include "../node/Constants.hpp"
  16. #include "../node/SHA512.hpp"
  17. #include "EmbeddedNetworkController.hpp"
  18. #include "../version.h"
  19. #include "Redis.hpp"
  20. #include <libpq-fe.h>
  21. #include <sstream>
  22. #include <iomanip>
  23. #include <climits>
  24. #include <chrono>
  25. // #define REDIS_TRACE 1
  26. using json = nlohmann::json;
  27. namespace {
  28. static const int DB_MINIMUM_VERSION = 20;
  // Current time as text in ctime() format with the trailing newline removed.
  // The returned pointer is whatever ctime() handed back (edited in place), or
  // an empty literal when ctime() returns a null pointer.
  static const char *_timestr()
  {
      time_t now = time(0);
      char *const stamp = ctime(&now);
      if (!stamp)
          return "";
      // Cut the string at the first newline, if there is one.
      for (char *cursor = stamp; *cursor; ++cursor) {
          if (*cursor == '\n') {
              *cursor = (char)0;
              break;
          }
      }
      return stamp;
  }
  45. /*
  46. std::string join(const std::vector<std::string> &elements, const char * const separator)
  47. {
  48. switch(elements.size()) {
  49. case 0:
  50. return "";
  51. case 1:
  52. return elements[0];
  53. default:
  54. std::ostringstream os;
  55. std::copy(elements.begin(), elements.end()-1, std::ostream_iterator<std::string>(os, separator));
  56. os << *elements.rbegin();
  57. return os.str();
  58. }
  59. }
  60. */
  // Splits `str` on every occurrence of `delim`.
  // Empty fields between delimiters are kept; a delimiter at the very end of
  // the input does not produce an extra empty trailing token, and an empty
  // input produces no tokens at all.
  std::vector<std::string> split(std::string str, char delim){
      std::vector<std::string> pieces;
      std::string::size_type from = 0;
      while (from < str.size()) {
          const std::string::size_type hit = str.find(delim, from);
          if (hit == std::string::npos) {
              // Last field: everything up to the end of the input.
              pieces.push_back(str.substr(from));
              break;
          }
          pieces.push_back(str.substr(from, hit - from));
          from = hit + 1;
      }
      return pieces;
  }
  // Percent-encodes `value` for use inside a URL component.
  //
  // ASCII letters, ASCII digits and the characters '-', '_', '.', '~' are
  // copied through unchanged; every other byte is written as "%XX" with two
  // upper-case hexadecimal digits.
  //
  // Bytes are classified as unsigned values restricted to the ASCII range:
  // calling isalnum() with a negative plain char is undefined behaviour, and
  // a non-"C" locale could otherwise let high bytes through unencoded.
  std::string url_encode(const std::string &value) {
      static const char kHexDigits[] = "0123456789ABCDEF";

      std::string escaped;
      escaped.reserve(value.size());

      for (const char ch : value) {
          const unsigned char byte = static_cast<unsigned char>(ch);

          // Keep alphanumeric and other accepted characters intact
          const bool asciiAlnum = (byte < 0x80) && (isalnum(byte) != 0);
          if (asciiAlnum || ch == '-' || ch == '_' || ch == '.' || ch == '~') {
              escaped.push_back(ch);
              continue;
          }

          // Any other characters are percent-encoded
          escaped.push_back('%');
          escaped.push_back(kHexDigits[byte >> 4]);
          escaped.push_back(kHexDigits[byte & 0x0F]);
      }

      return escaped;
  }
  88. } // anonymous namespace
  89. using namespace ZeroTier;
  90. MemberNotificationReceiver::MemberNotificationReceiver(PostgreSQL *p, pqxx::connection &c, const std::string &channel)
  91. : pqxx::notification_receiver(c, channel)
  92. , _psql(p)
  93. {
  94. fprintf(stderr, "initialize MemberNotificaitonReceiver\n");
  95. }
  96. void MemberNotificationReceiver::operator() (const std::string &payload, int packend_pid) {
  97. fprintf(stderr, "Member Notification received: %s\n", payload.c_str());
  98. json tmp(json::parse(payload));
  99. json &ov = tmp["old_val"];
  100. json &nv = tmp["new_val"];
  101. json oldConfig, newConfig;
  102. if (ov.is_object()) oldConfig = ov;
  103. if (nv.is_object()) newConfig = nv;
  104. if (oldConfig.is_object() || newConfig.is_object()) {
  105. _psql->_memberChanged(oldConfig,newConfig,(_psql->_ready>=2));
  106. fprintf(stderr, "payload sent\n");
  107. }
  108. }
  109. NetworkNotificationReceiver::NetworkNotificationReceiver(PostgreSQL *p, pqxx::connection &c, const std::string &channel)
  110. : pqxx::notification_receiver(c, channel)
  111. , _psql(p)
  112. {
  113. fprintf(stderr, "initialize NetworkNotificationReceiver\n");
  114. }
  115. void NetworkNotificationReceiver::operator() (const std::string &payload, int packend_pid) {
  116. fprintf(stderr, "Network Notificaiton received: %s\n", payload.c_str());
  117. json tmp(json::parse(payload));
  118. json &ov = tmp["old_val"];
  119. json &nv = tmp["new_val"];
  120. json oldConfig, newConfig;
  121. if (ov.is_object()) oldConfig = ov;
  122. if (nv.is_object()) newConfig = nv;
  123. if (oldConfig.is_object() || newConfig.is_object()) {
  124. _psql->_networkChanged(oldConfig,newConfig,(_psql->_ready>=2));
  125. fprintf(stderr, "payload sent\n");
  126. }
  127. }
  128. using Attrs = std::vector<std::pair<std::string, std::string>>;
  129. using Item = std::pair<std::string, Attrs>;
  130. using ItemStream = std::vector<Item>;
  131. PostgreSQL::PostgreSQL(const Identity &myId, const char *path, int listenPort, RedisConfig *rc)
  132. : DB()
  133. , _pool()
  134. , _myId(myId)
  135. , _myAddress(myId.address())
  136. , _ready(0)
  137. , _connected(1)
  138. , _run(1)
  139. , _waitNoticePrinted(false)
  140. , _listenPort(listenPort)
  141. , _rc(rc)
  142. , _redis(NULL)
  143. , _cluster(NULL)
  144. , _redisMemberStatus(false)
  145. {
  146. char myAddress[64];
  147. _myAddressStr = myId.address().toString(myAddress);
  148. _connString = std::string(path);
  149. auto f = std::make_shared<PostgresConnFactory>(_connString);
  150. _pool = std::make_shared<ConnectionPool<PostgresConnection> >(
  151. 15, 5, std::static_pointer_cast<ConnectionFactory>(f));
  152. memset(_ssoPsk, 0, sizeof(_ssoPsk));
  153. char *const ssoPskHex = getenv("ZT_SSO_PSK");
  154. #ifdef ZT_TRACE
  155. fprintf(stderr, "ZT_SSO_PSK: %s\n", ssoPskHex);
  156. #endif
  157. if (ssoPskHex) {
  158. // SECURITY: note that ssoPskHex will always be null-terminated if libc acatually
  159. // returns something non-NULL. If the hex encodes something shorter than 48 bytes,
  160. // it will be padded at the end with zeroes. If longer, it'll be truncated.
  161. Utils::unhex(ssoPskHex, _ssoPsk, sizeof(_ssoPsk));
  162. }
  163. const char *redisMemberStatus = getenv("ZT_REDIS_MEMBER_STATUS");
  164. if (redisMemberStatus && (strcmp(redisMemberStatus, "true") == 0)) {
  165. _redisMemberStatus = true;
  166. fprintf(stderr, "Using redis for member status\n");
  167. }
  168. auto c = _pool->borrow();
  169. pqxx::work txn{*c->c};
  170. pqxx::row r{txn.exec1("SELECT version FROM ztc_database")};
  171. int dbVersion = r[0].as<int>();
  172. txn.commit();
  173. if (dbVersion < DB_MINIMUM_VERSION) {
  174. fprintf(stderr, "Central database schema version too low. This controller version requires a minimum schema version of %d. Please upgrade your Central instance", DB_MINIMUM_VERSION);
  175. exit(1);
  176. }
  177. _pool->unborrow(c);
  178. if (_rc != NULL) {
  179. sw::redis::ConnectionOptions opts;
  180. sw::redis::ConnectionPoolOptions poolOpts;
  181. opts.host = _rc->hostname;
  182. opts.port = _rc->port;
  183. opts.password = _rc->password;
  184. opts.db = 0;
  185. opts.keep_alive = true;
  186. opts.connect_timeout = std::chrono::seconds(5);
  187. poolOpts.size = 25;
  188. poolOpts.wait_timeout = std::chrono::milliseconds(1000);
  189. poolOpts.connection_lifetime = std::chrono::minutes(5);
  190. if (_rc->clusterMode) {
  191. fprintf(stderr, "Using Redis in Cluster Mode\n");
  192. _cluster = std::make_shared<sw::redis::RedisCluster>(opts, poolOpts);
  193. } else {
  194. fprintf(stderr, "Using Redis in Standalone Mode\n");
  195. _redis = std::make_shared<sw::redis::Redis>(opts, poolOpts);
  196. }
  197. }
  198. _readyLock.lock();
  199. fprintf(stderr, "[%s] NOTICE: %.10llx controller PostgreSQL waiting for initial data download..." ZT_EOL_S, ::_timestr(), (unsigned long long)_myAddress.toInt());
  200. _waitNoticePrinted = true;
  201. initializeNetworks();
  202. initializeMembers();
  203. _heartbeatThread = std::thread(&PostgreSQL::heartbeat, this);
  204. _membersDbWatcher = std::thread(&PostgreSQL::membersDbWatcher, this);
  205. _networksDbWatcher = std::thread(&PostgreSQL::networksDbWatcher, this);
  206. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  207. _commitThread[i] = std::thread(&PostgreSQL::commitThread, this);
  208. }
  209. _onlineNotificationThread = std::thread(&PostgreSQL::onlineNotificationThread, this);
  210. }
  211. PostgreSQL::~PostgreSQL()
  212. {
  213. _run = 0;
  214. std::this_thread::sleep_for(std::chrono::milliseconds(100));
  215. _heartbeatThread.join();
  216. _membersDbWatcher.join();
  217. _networksDbWatcher.join();
  218. _commitQueue.stop();
  219. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  220. _commitThread[i].join();
  221. }
  222. _onlineNotificationThread.join();
  223. }
  224. bool PostgreSQL::waitForReady()
  225. {
  226. while (_ready < 2) {
  227. _readyLock.lock();
  228. _readyLock.unlock();
  229. }
  230. return true;
  231. }
  232. bool PostgreSQL::isReady()
  233. {
  234. return ((_ready == 2)&&(_connected));
  235. }
  236. bool PostgreSQL::save(nlohmann::json &record,bool notifyListeners)
  237. {
  238. bool modified = false;
  239. try {
  240. if (!record.is_object()) {
  241. fprintf(stderr, "record is not an object?!?\n");
  242. return false;
  243. }
  244. const std::string objtype = record["objtype"];
  245. if (objtype == "network") {
  246. //fprintf(stderr, "network save\n");
  247. const uint64_t nwid = OSUtils::jsonIntHex(record["id"],0ULL);
  248. if (nwid) {
  249. nlohmann::json old;
  250. get(nwid,old);
  251. if ((!old.is_object())||(!_compareRecords(old,record))) {
  252. record["revision"] = OSUtils::jsonInt(record["revision"],0ULL) + 1ULL;
  253. _commitQueue.post(std::pair<nlohmann::json,bool>(record,notifyListeners));
  254. modified = true;
  255. }
  256. }
  257. } else if (objtype == "member") {
  258. std::string networkId = record["nwid"];
  259. std::string memberId = record["id"];
  260. const uint64_t nwid = OSUtils::jsonIntHex(record["nwid"],0ULL);
  261. const uint64_t id = OSUtils::jsonIntHex(record["id"],0ULL);
  262. //fprintf(stderr, "member save %s-%s\n", networkId.c_str(), memberId.c_str());
  263. if ((id)&&(nwid)) {
  264. nlohmann::json network,old;
  265. get(nwid,network,id,old);
  266. if ((!old.is_object())||(!_compareRecords(old,record))) {
  267. //fprintf(stderr, "commit queue post\n");
  268. record["revision"] = OSUtils::jsonInt(record["revision"],0ULL) + 1ULL;
  269. _commitQueue.post(std::pair<nlohmann::json,bool>(record,notifyListeners));
  270. modified = true;
  271. } else {
  272. //fprintf(stderr, "no change\n");
  273. }
  274. }
  275. } else {
  276. fprintf(stderr, "uhh waaat\n");
  277. }
  278. } catch (std::exception &e) {
  279. fprintf(stderr, "Error on PostgreSQL::save: %s\n", e.what());
  280. } catch (...) {
  281. fprintf(stderr, "Unknown error on PostgreSQL::save\n");
  282. }
  283. return modified;
  284. }
  285. void PostgreSQL::eraseNetwork(const uint64_t networkId)
  286. {
  287. fprintf(stderr, "PostgreSQL::eraseNetwork\n");
  288. char tmp2[24];
  289. waitForReady();
  290. Utils::hex(networkId, tmp2);
  291. std::pair<nlohmann::json,bool> tmp;
  292. tmp.first["id"] = tmp2;
  293. tmp.first["objtype"] = "_delete_network";
  294. tmp.second = true;
  295. _commitQueue.post(tmp);
  296. nlohmann::json nullJson;
  297. _networkChanged(tmp.first, nullJson, true);
  298. }
  299. void PostgreSQL::eraseMember(const uint64_t networkId, const uint64_t memberId)
  300. {
  301. fprintf(stderr, "PostgreSQL::eraseMember\n");
  302. char tmp2[24];
  303. waitForReady();
  304. std::pair<nlohmann::json,bool> tmp, nw;
  305. Utils::hex(networkId, tmp2);
  306. tmp.first["nwid"] = tmp2;
  307. Utils::hex(memberId, tmp2);
  308. tmp.first["id"] = tmp2;
  309. tmp.first["objtype"] = "_delete_member";
  310. tmp.second = true;
  311. _commitQueue.post(tmp);
  312. nlohmann::json nullJson;
  313. _memberChanged(tmp.first, nullJson, true);
  314. }
  315. void PostgreSQL::nodeIsOnline(const uint64_t networkId, const uint64_t memberId, const InetAddress &physicalAddress)
  316. {
  317. std::lock_guard<std::mutex> l(_lastOnline_l);
  318. std::pair<int64_t, InetAddress> &i = _lastOnline[std::pair<uint64_t,uint64_t>(networkId, memberId)];
  319. i.first = OSUtils::now();
  320. if (physicalAddress) {
  321. i.second = physicalAddress;
  322. }
  323. }
  324. AuthInfo PostgreSQL::getSSOAuthInfo(const nlohmann::json &member, const std::string &redirectURL)
  325. {
  326. // NONCE is just a random character string. no semantic meaning
  327. // state = HMAC SHA384 of Nonce based on shared sso key
  328. //
  329. // need nonce timeout in database? make sure it's used within X time
  330. // X is 5 minutes for now. Make configurable later?
  331. //
  332. // how do we tell when a nonce is used? if auth_expiration_time is set
  333. std::string networkId = member["nwid"];
  334. std::string memberId = member["id"];
  335. char authenticationURL[4096] = {0};
  336. AuthInfo info;
  337. info.enabled = true;
  338. // fprintf(stderr, "PostgreSQL::updateMemberOnLoad: %s-%s\n", networkId.c_str(), memberId.c_str());
  339. try {
  340. auto c = _pool->borrow();
  341. pqxx::work w(*c->c);
  342. char nonceBytes[16] = {0};
  343. std::string nonce = "";
  344. // check if the member exists first.
  345. pqxx::row count = w.exec_params1("SELECT count(id) FROM ztc_member WHERE id = $1 AND network_id = $2 AND deleted = false", memberId, networkId);
  346. if (count[0].as<int>() == 1) {
  347. // get active nonce, if exists.
  348. pqxx::result r = w.exec_params("SELECT nonce FROM ztc_sso_expiry "
  349. "WHERE network_id = $1 AND member_id = $2 "
  350. "AND ((NOW() AT TIME ZONE 'UTC') <= authentication_expiry_time) AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  351. networkId, memberId);
  352. if (r.size() == 0) {
  353. // no active nonce.
  354. // find an unused nonce, if one exists.
  355. pqxx::result r = w.exec_params("SELECT nonce FROM ztc_sso_expiry "
  356. "WHERE network_id = $1 AND member_id = $2 "
  357. "AND authentication_expiry_time IS NULL AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  358. networkId, memberId);
  359. if (r.size() == 1) {
  360. // we have an existing nonce. Use it
  361. nonce = r.at(0)[0].as<std::string>();
  362. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  363. } else if (r.empty()) {
  364. // create a nonce
  365. Utils::getSecureRandom(nonceBytes, 16);
  366. char nonceBuf[64] = {0};
  367. Utils::hex(nonceBytes, sizeof(nonceBytes), nonceBuf);
  368. nonce = std::string(nonceBuf);
  369. pqxx::result ir = w.exec_params0("INSERT INTO ztc_sso_expiry "
  370. "(nonce, nonce_expiration, network_id, member_id) VALUES "
  371. "($1, TO_TIMESTAMP($2::double precision/1000), $3, $4)",
  372. nonce, OSUtils::now() + 300000, networkId, memberId);
  373. w.commit();
  374. } else {
  375. // > 1 ?!? Thats an error!
  376. fprintf(stderr, "> 1 unused nonce!\n");
  377. exit(6);
  378. }
  379. } else if (r.size() == 1) {
  380. nonce = r.at(0)[0].as<std::string>();
  381. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  382. } else {
  383. // more than 1 nonce in use? Uhhh...
  384. fprintf(stderr, "> 1 nonce in use for network member?!?\n");
  385. exit(7);
  386. }
  387. r = w.exec_params("SELECT org.client_id, org.authorization_endpoint, org.issuer, org.sso_impl_version "
  388. "FROM ztc_network AS nw, ztc_org AS org "
  389. "WHERE nw.id = $1 AND nw.sso_enabled = true AND org.owner_id = nw.owner_id", networkId);
  390. std::string client_id = "";
  391. std::string authorization_endpoint = "";
  392. std::string issuer = "";
  393. uint64_t sso_version = 0;
  394. if (r.size() == 1) {
  395. client_id = r.at(0)[0].as<std::string>();
  396. authorization_endpoint = r.at(0)[1].as<std::string>();
  397. issuer = r.at(0)[2].as<std::string>();
  398. sso_version = r.at(0)[3].as<uint64_t>();
  399. } else if (r.size() > 1) {
  400. fprintf(stderr, "ERROR: More than one auth endpoint for an organization?!?!? NetworkID: %s\n", networkId.c_str());
  401. } else {
  402. fprintf(stderr, "No client or auth endpoint?!?\n");
  403. }
  404. info.version = sso_version;
  405. // no catch all else because we don't actually care if no records exist here. just continue as normal.
  406. if ((!client_id.empty())&&(!authorization_endpoint.empty())) {
  407. uint8_t state[48];
  408. HMACSHA384(_ssoPsk, nonceBytes, sizeof(nonceBytes), state);
  409. char state_hex[256];
  410. Utils::hex(state, 48, state_hex);
  411. if (info.version == 0) {
  412. char url[2048] = {0};
  413. OSUtils::ztsnprintf(url, sizeof(authenticationURL),
  414. "%s?response_type=id_token&response_mode=form_post&scope=openid+email+profile&redirect_uri=%s&nonce=%s&state=%s&client_id=%s",
  415. authorization_endpoint.c_str(),
  416. url_encode(redirectURL).c_str(),
  417. nonce.c_str(),
  418. state_hex,
  419. client_id.c_str());
  420. info.authenticationURL = std::string(url);
  421. } else if (info.version == 1) {
  422. info.ssoClientID = client_id;
  423. info.issuerURL = issuer;
  424. info.ssoNonce = nonce;
  425. info.ssoState = std::string(state_hex) + "_" +networkId;
  426. info.centralAuthURL = redirectURL;
  427. #ifdef ZT_DEBUG
  428. fprintf(
  429. stderr,
  430. "ssoClientID: %s\nissuerURL: %s\nssoNonce: %s\nssoState: %s\ncentralAuthURL: %s\n",
  431. info.ssoClientID.c_str(),
  432. info.issuerURL.c_str(),
  433. info.ssoNonce.c_str(),
  434. info.ssoState.c_str(),
  435. info.centralAuthURL.c_str());
  436. #endif
  437. }
  438. } else {
  439. fprintf(stderr, "client_id: %s\nauthorization_endpoint: %s\n", client_id.c_str(), authorization_endpoint.c_str());
  440. }
  441. }
  442. _pool->unborrow(c);
  443. } catch (std::exception &e) {
  444. fprintf(stderr, "ERROR: Error updating member on load: %s\n", e.what());
  445. }
  446. return info; //std::string(authenticationURL);
  447. }
  448. void PostgreSQL::initializeNetworks()
  449. {
  450. try {
  451. std::string setKey = "networks:{" + _myAddressStr + "}";
  452. fprintf(stderr, "Initializing Networks...\n");
  453. if (_redisMemberStatus) {
  454. fprintf(stderr, "Init Redis for networks...\n");
  455. try {
  456. if (_rc->clusterMode) {
  457. _cluster->del(setKey);
  458. } else {
  459. _redis->del(setKey);
  460. }
  461. } catch (sw::redis::Error &e) {
  462. // ignore. if this key doesn't exist, there's no reason to delete it
  463. }
  464. }
  465. std::unordered_set<std::string> networkSet;
  466. char qbuf[2048] = {0};
  467. sprintf(qbuf, "SELECT n.id, (EXTRACT(EPOCH FROM n.creation_time AT TIME ZONE 'UTC')*1000)::bigint as creation_time, n.capabilities, "
  468. "n.enable_broadcast, (EXTRACT(EPOCH FROM n.last_modified AT TIME ZONE 'UTC')*1000)::bigint AS last_modified, n.mtu, n.multicast_limit, n.name, n.private, n.remote_trace_level, "
  469. "n.remote_trace_target, n.revision, n.rules, n.tags, n.v4_assign_mode, n.v6_assign_mode, n.sso_enabled, (CASE WHEN n.sso_enabled THEN o.client_id ELSE NULL END) as client_id, "
  470. "(CASE WHEN n.sso_enabled THEN o.authorization_endpoint ELSE NULL END) as authorization_endpoint, d.domain, d.servers, "
  471. "ARRAY(SELECT CONCAT(host(ip_range_start),'|', host(ip_range_end)) FROM ztc_network_assignment_pool WHERE network_id = n.id) AS assignment_pool, "
  472. "ARRAY(SELECT CONCAT(host(address),'/',bits::text,'|',COALESCE(host(via), 'NULL'))FROM ztc_network_route WHERE network_id = n.id) AS routes "
  473. "FROM ztc_network n "
  474. "LEFT OUTER JOIN ztc_org o "
  475. " ON o.owner_id = n.owner_id "
  476. "LEFT OUTER JOIN ztc_network_dns d "
  477. " ON d.network_id = n.id "
  478. "WHERE deleted = false AND controller_id = '%s'", _myAddressStr.c_str());
  479. auto c = _pool->borrow();
  480. auto c2 = _pool->borrow();
  481. pqxx::work w{*c->c};
  482. fprintf(stderr, "Load networks from psql...\n");
  483. auto stream = pqxx::stream_from::query(w, qbuf);
  484. std::tuple<
  485. std::string // network ID
  486. , std::optional<int64_t> // creationTime
  487. , std::optional<std::string> // capabilities
  488. , std::optional<bool> // enableBroadcast
  489. , std::optional<uint64_t> // lastModified
  490. , std::optional<int> // mtu
  491. , std::optional<int> // multicastLimit
  492. , std::optional<std::string> // name
  493. , bool // private
  494. , std::optional<int> // remoteTraceLevel
  495. , std::optional<std::string> // remoteTraceTarget
  496. , std::optional<uint64_t> // revision
  497. , std::optional<std::string> // rules
  498. , std::optional<std::string> // tags
  499. , std::optional<std::string> // v4AssignMode
  500. , std::optional<std::string> // v6AssignMode
  501. , std::optional<bool> // ssoEnabled
  502. , std::optional<std::string> // clientId
  503. , std::optional<std::string> // authorizationEndpoint
  504. , std::optional<std::string> // domain
  505. , std::optional<std::string> // servers
  506. , std::string // assignmentPoolString
  507. , std::string // routeString
  508. > row;
  509. uint64_t count = 0;
  510. auto tmp = std::chrono::high_resolution_clock::now();
  511. uint64_t total = 0;
  512. while (stream >> row) {
  513. auto start = std::chrono::high_resolution_clock::now();
  514. json empty;
  515. json config;
  516. initNetwork(config);
  517. std::string nwid = std::get<0>(row);
  518. std::optional<int64_t> creationTime = std::get<1>(row);
  519. std::optional<std::string> capabilities = std::get<2>(row);
  520. std::optional<bool> enableBroadcast = std::get<3>(row);
  521. std::optional<uint64_t> lastModified = std::get<4>(row);
  522. std::optional<int> mtu = std::get<5>(row);
  523. std::optional<int> multicastLimit = std::get<6>(row);
  524. std::optional<std::string> name = std::get<7>(row);
  525. bool isPrivate = std::get<8>(row);
  526. std::optional<int> remoteTraceLevel = std::get<9>(row);
  527. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  528. std::optional<uint64_t> revision = std::get<11>(row);
  529. std::optional<std::string> rules = std::get<12>(row);
  530. std::optional<std::string> tags = std::get<13>(row);
  531. std::optional<std::string> v4AssignMode = std::get<14>(row);
  532. std::optional<std::string> v6AssignMode = std::get<15>(row);
  533. std::optional<bool> ssoEnabled = std::get<16>(row);
  534. std::optional<std::string> clientId = std::get<17>(row);
  535. std::optional<std::string> authorizationEndpoint = std::get<18>(row);
  536. std::optional<std::string> dnsDomain = std::get<19>(row);
  537. std::optional<std::string> dnsServers = std::get<20>(row);
  538. std::string assignmentPoolString = std::get<21>(row);
  539. std::string routesString = std::get<22>(row);
  540. config["id"] = nwid;
  541. config["nwid"] = nwid;
  542. config["creationTime"] = creationTime.value_or(0);
  543. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  544. config["enableBroadcast"] = enableBroadcast.value_or(false);
  545. config["lastModified"] = lastModified.value_or(0);
  546. config["mtu"] = mtu.value_or(2800);
  547. config["multicastLimit"] = multicastLimit.value_or(64);
  548. config["name"] = name.value_or("");
  549. config["private"] = isPrivate;
  550. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  551. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  552. config["revision"] = revision.value_or(0);
  553. config["rules"] = json::parse(rules.value_or("[]"));
  554. config["tags"] = json::parse(tags.value_or("[]"));
  555. config["v4AssignMode"] = json::parse(v4AssignMode.value_or("{}"));
  556. config["v6AssignMode"] = json::parse(v6AssignMode.value_or("{}"));
  557. config["ssoEnabled"] = ssoEnabled.value_or(false);
  558. config["objtype"] = "network";
  559. config["ipAssignmentPools"] = json::array();
  560. config["routes"] = json::array();
  561. config["clientId"] = clientId.value_or("");
  562. config["authorizationEndpoint"] = authorizationEndpoint.value_or("");
  563. networkSet.insert(nwid);
  564. if (dnsDomain.has_value()) {
  565. std::string serverList = dnsServers.value();
  566. json obj;
  567. auto servers = json::array();
  568. if (serverList.rfind("{",0) != std::string::npos) {
  569. serverList = serverList.substr(1, serverList.size()-2);
  570. std::stringstream ss(serverList);
  571. while(ss.good()) {
  572. std::string server;
  573. std::getline(ss, server, ',');
  574. servers.push_back(server);
  575. }
  576. }
  577. obj["domain"] = dnsDomain.value();
  578. obj["servers"] = servers;
  579. config["dns"] = obj;
  580. }
  581. config["ipAssignmentPools"] = json::array();
  582. if (assignmentPoolString != "{}") {
  583. std::string tmp = assignmentPoolString.substr(1, assignmentPoolString.size()-2);
  584. std::vector<std::string> assignmentPools = split(tmp, ',');
  585. for (auto it = assignmentPools.begin(); it != assignmentPools.end(); ++it) {
  586. std::vector<std::string> r = split(*it, '|');
  587. json ip;
  588. ip["ipRangeStart"] = r[0];
  589. ip["ipRangeEnd"] = r[1];
  590. config["ipAssignmentPools"].push_back(ip);
  591. }
  592. }
  593. config["routes"] = json::array();
  594. if (routesString != "{}") {
  595. std::string tmp = routesString.substr(1, routesString.size()-2);
  596. std::vector<std::string> routes = split(tmp, ',');
  597. for (auto it = routes.begin(); it != routes.end(); ++it) {
  598. std::vector<std::string> r = split(*it, '|');
  599. json route;
  600. route["target"] = r[0];
  601. route["via"] = ((route["via"] == "NULL")? nullptr : r[1]);
  602. config["routes"].push_back(route);
  603. }
  604. }
  605. _networkChanged(empty, config, false);
  606. auto end = std::chrono::high_resolution_clock::now();
  607. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);;
  608. total += dur.count();
  609. ++count;
  610. if (count > 0 && count % 10000 == 0) {
  611. fprintf(stderr, "Averaging %llu us per network\n", (total/count));
  612. }
  613. }
  614. if (count > 0) {
  615. fprintf(stderr, "Took %llu us per network to load\n", (total/count));
  616. }
  617. stream.complete();
  618. w.commit();
  619. _pool->unborrow(c2);
  620. _pool->unborrow(c);
  621. fprintf(stderr, "done.\n");
  622. if (!networkSet.empty()) {
  623. if (_redisMemberStatus) {
  624. fprintf(stderr, "adding networks to redis...\n");
  625. if (_rc->clusterMode) {
  626. auto tx = _cluster->transaction(_myAddressStr, true);
  627. tx.sadd(setKey, networkSet.begin(), networkSet.end());
  628. tx.exec();
  629. } else {
  630. auto tx = _redis->transaction(true);
  631. tx.sadd(setKey, networkSet.begin(), networkSet.end());
  632. tx.exec();
  633. }
  634. fprintf(stderr, "done.\n");
  635. }
  636. }
  637. if (++this->_ready == 2) {
  638. if (_waitNoticePrinted) {
  639. fprintf(stderr,"[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S,_timestr(),(unsigned long long)_myAddress.toInt());
  640. }
  641. _readyLock.unlock();
  642. }
  643. fprintf(stderr, "network init done.\n");
  644. } catch (sw::redis::Error &e) {
  645. fprintf(stderr, "ERROR: Error initializing networks in Redis: %s\n", e.what());
  646. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  647. exit(-1);
  648. } catch (std::exception &e) {
  649. fprintf(stderr, "ERROR: Error initializing networks: %s\n", e.what());
  650. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  651. exit(-1);
  652. }
  653. }
  654. void PostgreSQL::initializeMembers()
  655. {
  656. std::string memberId;
  657. std::string networkId;
  658. try {
  659. std::unordered_map<std::string, std::string> networkMembers;
  660. fprintf(stderr, "Initializing Members...\n");
  661. std::string setKeyBase = "network-nodes-all:{" + _myAddressStr + "}:";
  662. if (_redisMemberStatus) {
  663. fprintf(stderr, "Initialize Redis for members...\n");
  664. std::lock_guard<std::mutex> l(_networks_l);
  665. std::unordered_set<std::string> deletes;
  666. for ( auto it : _networks) {
  667. uint64_t nwid_i = it.first;
  668. char nwidTmp[64] = {0};
  669. OSUtils::ztsnprintf(nwidTmp, sizeof(nwidTmp), "%.16llx", nwid_i);
  670. std::string nwid(nwidTmp);
  671. std::string key = setKeyBase + nwid;
  672. deletes.insert(key);
  673. }
  674. if (!deletes.empty()) {
  675. try {
  676. if (_rc->clusterMode) {
  677. auto tx = _cluster->transaction(_myAddressStr, true);
  678. for (std::string k : deletes) {
  679. tx.del(k);
  680. }
  681. tx.exec();
  682. } else {
  683. auto tx = _redis->transaction(true);
  684. for (std::string k : deletes) {
  685. tx.del(k);
  686. }
  687. tx.exec();
  688. }
  689. } catch (sw::redis::Error &e) {
  690. // ignore
  691. }
  692. }
  693. }
  694. char qbuf[2048];
  695. sprintf(qbuf, "SELECT m.id, m.network_id, m.active_bridge, m.authorized, m.capabilities, (EXTRACT(EPOCH FROM m.creation_time AT TIME ZONE 'UTC')*1000)::bigint, m.identity, "
  696. " (EXTRACT(EPOCH FROM m.last_authorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  697. " (EXTRACT(EPOCH FROM m.last_deauthorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  698. " m.remote_trace_level, m.remote_trace_target, m.tags, m.v_major, m.v_minor, m.v_rev, m.v_proto, "
  699. " m.no_auto_assign_ips, m.revision, sso_exempt, "
  700. " (SELECT (EXTRACT(EPOCH FROM e.authentication_expiry_time)*1000)::bigint "
  701. " FROM ztc_sso_expiry e "
  702. " INNER JOIN ztc_network n1 "
  703. " ON n.id = e.network_id "
  704. " WHERE e.network_id = m.network_id AND e.member_id = m.id AND n.sso_enabled = TRUE AND e.authentication_expiry_time IS NOT NULL "
  705. " ORDER BY e.authentication_expiry_time DESC LIMIT 1) AS authentication_expiry_time, "
  706. " ARRAY(SELECT DISTINCT address FROM ztc_member_ip_assignment WHERE member_id = m.id AND network_id = m.network_id) AS assigned_addresses "
  707. "FROM ztc_member m "
  708. "INNER JOIN ztc_network n "
  709. " ON n.id = m.network_id "
  710. "WHERE n.controller_id = '%s' AND m.deleted = false", _myAddressStr.c_str());
  711. auto c = _pool->borrow();
  712. auto c2 = _pool->borrow();
  713. pqxx::work w{*c->c};
  714. fprintf(stderr, "Load members from psql...\n");
  715. auto stream = pqxx::stream_from::query(w, qbuf);
  716. std::tuple<
  717. std::string // memberId
  718. , std::string // memberId
  719. , std::optional<bool> // activeBridge
  720. , std::optional<bool> // authorized
  721. , std::optional<std::string> // capabilities
  722. , std::optional<uint64_t> // creationTime
  723. , std::optional<std::string> // identity
  724. , std::optional<uint64_t> // lastAuthorizedTime
  725. , std::optional<uint64_t> // lastDeauthorizedTime
  726. , std::optional<int> // remoteTraceLevel
  727. , std::optional<std::string> // remoteTraceTarget
  728. , std::optional<std::string> // tags
  729. , std::optional<int> // vMajor
  730. , std::optional<int> // vMinor
  731. , std::optional<int> // vRev
  732. , std::optional<int> // vProto
  733. , std::optional<bool> // noAutoAssignIps
  734. , std::optional<uint64_t> // revision
  735. , std::optional<bool> // ssoExempt
  736. , std::optional<uint64_t> // authenticationExpiryTime
  737. , std::string // assignedAddresses
  738. > row;
  739. uint64_t count = 0;
  740. auto tmp = std::chrono::high_resolution_clock::now();
  741. uint64_t total = 0;
  742. while (stream >> row) {
  743. auto start = std::chrono::high_resolution_clock::now();
  744. json empty;
  745. json config;
  746. initMember(config);
  747. memberId = std::get<0>(row);
  748. networkId = std::get<1>(row);
  749. std::optional<bool> activeBridge = std::get<2>(row);
  750. std::optional<bool> authorized = std::get<3>(row);
  751. std::optional<std::string> capabilities = std::get<4>(row);
  752. std::optional<uint64_t> creationTime = std::get<5>(row);
  753. std::optional<std::string> identity = std::get<6>(row);
  754. std::optional<uint64_t> lastAuthorizedTime = std::get<7>(row);
  755. std::optional<uint64_t> lastDeauthorizedTime = std::get<8>(row);
  756. std::optional<int> remoteTraceLevel = std::get<9>(row);
  757. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  758. std::optional<std::string> tags = std::get<11>(row);
  759. std::optional<int> vMajor = std::get<12>(row);
  760. std::optional<int> vMinor = std::get<13>(row);
  761. std::optional<int> vRev = std::get<14>(row);
  762. std::optional<int> vProto = std::get<15>(row);
  763. std::optional<bool> noAutoAssignIps = std::get<16>(row);
  764. std::optional<uint64_t> revision = std::get<17>(row);
  765. std::optional<bool> ssoExempt = std::get<18>(row);
  766. std::optional<uint64_t> authenticationExpiryTime = std::get<19>(row);
  767. std::string assignedAddresses = std::get<20>(row);
  768. networkMembers.insert(std::pair<std::string, std::string>(setKeyBase+networkId, memberId));
  769. config["id"] = memberId;
  770. config["address"] = memberId;
  771. config["nwid"] = networkId;
  772. config["activeBridge"] = activeBridge.value_or(false);
  773. config["authorized"] = authorized.value_or(false);
  774. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  775. config["creationTime"] = creationTime.value_or(0);
  776. config["identity"] = identity.value_or("");
  777. config["lastAuthorizedTime"] = lastAuthorizedTime.value_or(0);
  778. config["lastDeauthorizedTime"] = lastDeauthorizedTime.value_or(0);
  779. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  780. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  781. config["tags"] = json::parse(tags.value_or("[]"));
  782. config["vMajor"] = vMajor.value_or(-1);
  783. config["vMinor"] = vMinor.value_or(-1);
  784. config["vRev"] = vRev.value_or(-1);
  785. config["vProto"] = vProto.value_or(-1);
  786. config["noAutoAssignIps"] = noAutoAssignIps.value_or(false);
  787. config["revision"] = revision.value_or(0);
  788. config["ssoExempt"] = ssoExempt.value_or(false);
  789. config["authenticationExpiryTime"] = authenticationExpiryTime.value_or(0);
  790. config["objtype"] = "member";
  791. config["ipAssignments"] = json::array();
  792. if (assignedAddresses != "{}") {
  793. std::string tmp = assignedAddresses.substr(1, assignedAddresses.size()-2);
  794. std::vector<std::string> addrs = split(tmp, ',');
  795. for (auto it = addrs.begin(); it != addrs.end(); ++it) {
  796. config["ipAssignments"].push_back(*it);
  797. }
  798. }
  799. _memberChanged(empty, config, false);
  800. memberId = "";
  801. networkId = "";
  802. auto end = std::chrono::high_resolution_clock::now();
  803. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);
  804. total += dur.count();
  805. ++count;
  806. if (count > 0 && count % 10000 == 0) {
  807. fprintf(stderr, "Averaging %llu us per member\n", (total/count));
  808. }
  809. }
  810. if (count > 0) {
  811. fprintf(stderr, "Took %llu us per member to load\n", (total/count));
  812. }
  813. stream.complete();
  814. w.commit();
  815. _pool->unborrow(c2);
  816. _pool->unborrow(c);
  817. fprintf(stderr, "done.\n");
  818. if (!networkMembers.empty()) {
  819. if (_redisMemberStatus) {
  820. fprintf(stderr, "Load member data into redis...\n");
  821. if (_rc->clusterMode) {
  822. auto tx = _cluster->transaction(_myAddressStr, true);
  823. for (auto it : networkMembers) {
  824. tx.sadd(it.first, it.second);
  825. }
  826. tx.exec();
  827. } else {
  828. auto tx = _redis->transaction(true);
  829. for (auto it : networkMembers) {
  830. tx.sadd(it.first, it.second);
  831. }
  832. tx.exec();
  833. }
  834. fprintf(stderr, "done.\n");
  835. }
  836. }
  837. fprintf(stderr, "Done loading members...\n");
  838. if (++this->_ready == 2) {
  839. if (_waitNoticePrinted) {
  840. fprintf(stderr,"[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S,_timestr(),(unsigned long long)_myAddress.toInt());
  841. }
  842. _readyLock.unlock();
  843. }
  844. } catch (sw::redis::Error &e) {
  845. fprintf(stderr, "ERROR: Error initializing members (redis): %s\n", e.what());
  846. } catch (std::exception &e) {
  847. fprintf(stderr, "ERROR: Error initializing member: %s-%s %s\n", networkId.c_str(), memberId.c_str(), e.what());
  848. exit(-1);
  849. }
  850. }
  851. void PostgreSQL::heartbeat()
  852. {
  853. char publicId[1024];
  854. char hostnameTmp[1024];
  855. _myId.toString(false,publicId);
  856. if (gethostname(hostnameTmp, sizeof(hostnameTmp))!= 0) {
  857. hostnameTmp[0] = (char)0;
  858. } else {
  859. for (int i = 0; i < (int)sizeof(hostnameTmp); ++i) {
  860. if ((hostnameTmp[i] == '.')||(hostnameTmp[i] == 0)) {
  861. hostnameTmp[i] = (char)0;
  862. break;
  863. }
  864. }
  865. }
  866. const char *controllerId = _myAddressStr.c_str();
  867. const char *publicIdentity = publicId;
  868. const char *hostname = hostnameTmp;
  869. while (_run == 1) {
  870. // fprintf(stderr, "%s: heartbeat\n", controllerId);
  871. auto c = _pool->borrow();
  872. int64_t ts = OSUtils::now();
  873. if(c->c) {
  874. pqxx::work w{*c->c};
  875. std::string major = std::to_string(ZEROTIER_ONE_VERSION_MAJOR);
  876. std::string minor = std::to_string(ZEROTIER_ONE_VERSION_MINOR);
  877. std::string rev = std::to_string(ZEROTIER_ONE_VERSION_REVISION);
  878. std::string build = std::to_string(ZEROTIER_ONE_VERSION_BUILD);
  879. std::string now = std::to_string(ts);
  880. std::string host_port = std::to_string(_listenPort);
  881. std::string use_redis = (_rc != NULL) ? "true" : "false";
  882. std::string redis_mem_status = (_redisMemberStatus) ? "true" : "false";
  883. try {
  884. pqxx::result res = w.exec0("INSERT INTO ztc_controller (id, cluster_host, last_alive, public_identity, v_major, v_minor, v_rev, v_build, host_port, use_redis, redis_member_status) "
  885. "VALUES ("+w.quote(controllerId)+", "+w.quote(hostname)+", TO_TIMESTAMP("+now+"::double precision/1000), "+
  886. w.quote(publicIdentity)+", "+major+", "+minor+", "+rev+", "+build+", "+host_port+", "+use_redis+", "+redis_mem_status+") "
  887. "ON CONFLICT (id) DO UPDATE SET cluster_host = EXCLUDED.cluster_host, last_alive = EXCLUDED.last_alive, "
  888. "public_identity = EXCLUDED.public_identity, v_major = EXCLUDED.v_major, v_minor = EXCLUDED.v_minor, "
  889. "v_rev = EXCLUDED.v_rev, v_build = EXCLUDED.v_rev, host_port = EXCLUDED.host_port, "
  890. "use_redis = EXCLUDED.use_redis, redis_member_status = EXCLUDED.redis_member_status");
  891. } catch (std::exception &e) {
  892. fprintf(stderr, "Heartbeat update failed: %s\n", e.what());
  893. w.abort();
  894. _pool->unborrow(c);
  895. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  896. continue;
  897. }
  898. w.commit();
  899. }
  900. _pool->unborrow(c);
  901. if (_redisMemberStatus) {
  902. if (_rc->clusterMode) {
  903. _cluster->zadd("controllers", "controllerId", ts);
  904. } else {
  905. _redis->zadd("controllers", "controllerId", ts);
  906. }
  907. }
  908. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  909. }
  910. fprintf(stderr, "Exited heartbeat thread\n");
  911. }
  912. void PostgreSQL::membersDbWatcher()
  913. {
  914. if (_rc) {
  915. _membersWatcher_Redis();
  916. } else {
  917. _membersWatcher_Postgres();
  918. }
  919. if (_run == 1) {
  920. fprintf(stderr, "ERROR: %s membersDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  921. exit(9);
  922. }
  923. fprintf(stderr, "Exited membersDbWatcher\n");
  924. }
  925. void PostgreSQL::_membersWatcher_Postgres() {
  926. auto c = _pool->borrow();
  927. std::string stream = "member_" + _myAddressStr;
  928. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  929. MemberNotificationReceiver m(this, *c->c, stream);
  930. while(_run == 1) {
  931. c->c->await_notification(5, 0);
  932. }
  933. _pool->unborrow(c);
  934. }
  935. void PostgreSQL::_membersWatcher_Redis() {
  936. char buf[11] = {0};
  937. std::string key = "member-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  938. std::string lastID = "0";
  939. fprintf(stderr, "Listening to member stream: %s\n", key.c_str());
  940. while (_run == 1) {
  941. try {
  942. json tmp;
  943. std::unordered_map<std::string, ItemStream> result;
  944. if (_rc->clusterMode) {
  945. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  946. } else {
  947. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  948. }
  949. if (!result.empty()) {
  950. for (auto element : result) {
  951. #ifdef REDIS_TRACE
  952. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  953. #endif
  954. for (auto rec : element.second) {
  955. std::string id = rec.first;
  956. auto attrs = rec.second;
  957. #ifdef REDIS_TRACE
  958. fprintf(stdout, "Record ID: %s\n", id.c_str());
  959. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  960. #endif
  961. for (auto a : attrs) {
  962. #ifdef REDIS_TRACE
  963. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  964. #endif
  965. try {
  966. tmp = json::parse(a.second);
  967. json &ov = tmp["old_val"];
  968. json &nv = tmp["new_val"];
  969. json oldConfig, newConfig;
  970. if (ov.is_object()) oldConfig = ov;
  971. if (nv.is_object()) newConfig = nv;
  972. if (oldConfig.is_object()||newConfig.is_object()) {
  973. _memberChanged(oldConfig,newConfig,(this->_ready >= 2));
  974. }
  975. } catch (...) {
  976. fprintf(stderr, "json parse error in networkWatcher_Redis\n");
  977. }
  978. }
  979. if (_rc->clusterMode) {
  980. _cluster->xdel(key, id);
  981. } else {
  982. _redis->xdel(key, id);
  983. }
  984. lastID = id;
  985. }
  986. }
  987. }
  988. } catch (sw::redis::Error &e) {
  989. fprintf(stderr, "Error in Redis members watcher: %s\n", e.what());
  990. }
  991. }
  992. fprintf(stderr, "membersWatcher ended\n");
  993. }
  994. void PostgreSQL::networksDbWatcher()
  995. {
  996. if (_rc) {
  997. _networksWatcher_Redis();
  998. } else {
  999. _networksWatcher_Postgres();
  1000. }
  1001. if (_run == 1) {
  1002. fprintf(stderr, "ERROR: %s networksDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1003. exit(8);
  1004. }
  1005. fprintf(stderr, "Exited networksDbWatcher\n");
  1006. }
  1007. void PostgreSQL::_networksWatcher_Postgres() {
  1008. std::string stream = "network_" + _myAddressStr;
  1009. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  1010. auto c = _pool->borrow();
  1011. NetworkNotificationReceiver n(this, *c->c, stream);
  1012. while(_run == 1) {
  1013. c->c->await_notification(5,0);
  1014. }
  1015. }
  1016. void PostgreSQL::_networksWatcher_Redis() {
  1017. char buf[11] = {0};
  1018. std::string key = "network-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  1019. std::string lastID = "0";
  1020. while (_run == 1) {
  1021. try {
  1022. json tmp;
  1023. std::unordered_map<std::string, ItemStream> result;
  1024. if (_rc->clusterMode) {
  1025. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1026. } else {
  1027. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1028. }
  1029. if (!result.empty()) {
  1030. for (auto element : result) {
  1031. #ifdef REDIS_TRACE
  1032. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  1033. #endif
  1034. for (auto rec : element.second) {
  1035. std::string id = rec.first;
  1036. auto attrs = rec.second;
  1037. #ifdef REDIS_TRACE
  1038. fprintf(stdout, "Record ID: %s\n", id.c_str());
  1039. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  1040. #endif
  1041. for (auto a : attrs) {
  1042. #ifdef REDIS_TRACE
  1043. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  1044. #endif
  1045. try {
  1046. tmp = json::parse(a.second);
  1047. json &ov = tmp["old_val"];
  1048. json &nv = tmp["new_val"];
  1049. json oldConfig, newConfig;
  1050. if (ov.is_object()) oldConfig = ov;
  1051. if (nv.is_object()) newConfig = nv;
  1052. if (oldConfig.is_object()||newConfig.is_object()) {
  1053. _networkChanged(oldConfig,newConfig,(this->_ready >= 2));
  1054. }
  1055. } catch (...) {
  1056. fprintf(stderr, "json parse error in networkWatcher_Redis\n");
  1057. }
  1058. }
  1059. if (_rc->clusterMode) {
  1060. _cluster->xdel(key, id);
  1061. } else {
  1062. _redis->xdel(key, id);
  1063. }
  1064. lastID = id;
  1065. }
  1066. }
  1067. }
  1068. } catch (sw::redis::Error &e) {
  1069. fprintf(stderr, "Error in Redis networks watcher: %s\n", e.what());
  1070. }
  1071. }
  1072. fprintf(stderr, "networksWatcher ended\n");
  1073. }
  1074. void PostgreSQL::commitThread()
  1075. {
  1076. fprintf(stderr, "%s: commitThread start\n", _myAddressStr.c_str());
  1077. std::pair<nlohmann::json,bool> qitem;
  1078. while(_commitQueue.get(qitem)&(_run == 1)) {
  1079. //fprintf(stderr, "commitThread tick\n");
  1080. if (!qitem.first.is_object()) {
  1081. fprintf(stderr, "not an object\n");
  1082. continue;
  1083. }
  1084. std::shared_ptr<PostgresConnection> c;
  1085. try {
  1086. c = _pool->borrow();
  1087. } catch (std::exception &e) {
  1088. fprintf(stderr, "ERROR: %s\n", e.what());
  1089. continue;
  1090. }
  1091. if (!c) {
  1092. fprintf(stderr, "Error getting database connection\n");
  1093. continue;
  1094. }
  1095. try {
  1096. nlohmann::json &config = (qitem.first);
  1097. const std::string objtype = config["objtype"];
  1098. if (objtype == "member") {
  1099. // fprintf(stderr, "%s: commitThread: member\n", _myAddressStr.c_str());
  1100. std::string memberId;
  1101. std::string networkId;
  1102. try {
  1103. pqxx::work w(*c->c);
  1104. memberId = config["id"];
  1105. networkId = config["nwid"];
  1106. std::string target = "NULL";
  1107. if (!config["remoteTraceTarget"].is_null()) {
  1108. target = config["remoteTraceTarget"];
  1109. }
  1110. pqxx::row nwrow = w.exec_params1("SELECT COUNT(id) FROM ztc_network WHERE id = $1", networkId);
  1111. int nwcount = nwrow[0].as<int>();
  1112. if (nwcount != 1) {
  1113. fprintf(stderr, "network %s does not exist. skipping member upsert\n", networkId.c_str());
  1114. w.abort();
  1115. _pool->unborrow(c);
  1116. continue;
  1117. }
  1118. pqxx::result res = w.exec_params0(
  1119. "INSERT INTO ztc_member (id, network_id, active_bridge, authorized, capabilities, "
  1120. "identity, last_authorized_time, last_deauthorized_time, no_auto_assign_ips, "
  1121. "remote_trace_level, remote_trace_target, revision, tags, v_major, v_minor, v_rev, v_proto) "
  1122. "VALUES ($1, $2, $3, $4, $5, $6, "
  1123. "TO_TIMESTAMP($7::double precision/1000), TO_TIMESTAMP($8::double precision/1000), "
  1124. "$9, $10, $11, $12, $13, $14, $15, $16, $17) ON CONFLICT (network_id, id) DO UPDATE SET "
  1125. "active_bridge = EXCLUDED.active_bridge, authorized = EXCLUDED.authorized, capabilities = EXCLUDED.capabilities, "
  1126. "identity = EXCLUDED.identity, last_authorized_time = EXCLUDED.last_authorized_time, "
  1127. "last_deauthorized_time = EXCLUDED.last_deauthorized_time, no_auto_assign_ips = EXCLUDED.no_auto_assign_ips, "
  1128. "remote_trace_level = EXCLUDED.remote_trace_level, remote_trace_target = EXCLUDED.remote_trace_target, "
  1129. "revision = EXCLUDED.revision+1, tags = EXCLUDED.tags, v_major = EXCLUDED.v_major, "
  1130. "v_minor = EXCLUDED.v_minor, v_rev = EXCLUDED.v_rev, v_proto = EXCLUDED.v_proto",
  1131. memberId,
  1132. networkId,
  1133. (bool)config["activeBridge"],
  1134. (bool)config["authorized"],
  1135. OSUtils::jsonDump(config["capabilities"], -1),
  1136. OSUtils::jsonString(config["identity"], ""),
  1137. (uint64_t)config["lastAuthorizedTime"],
  1138. (uint64_t)config["lastDeauthorizedTime"],
  1139. (bool)config["noAutoAssignIps"],
  1140. (int)config["remoteTraceLevel"],
  1141. target,
  1142. (uint64_t)config["revision"],
  1143. OSUtils::jsonDump(config["tags"], -1),
  1144. (int)config["vMajor"],
  1145. (int)config["vMinor"],
  1146. (int)config["vRev"],
  1147. (int)config["vProto"]);
  1148. res = w.exec_params0("DELETE FROM ztc_member_ip_assignment WHERE member_id = $1 AND network_id = $2",
  1149. memberId, networkId);
  1150. std::vector<std::string> assignments;
  1151. bool ipAssignError = false;
  1152. for (auto i = config["ipAssignments"].begin(); i != config["ipAssignments"].end(); ++i) {
  1153. std::string addr = *i;
  1154. if (std::find(assignments.begin(), assignments.end(), addr) != assignments.end()) {
  1155. continue;
  1156. }
  1157. res = w.exec_params0(
  1158. "INSERT INTO ztc_member_ip_assignment (member_id, network_id, address) VALUES ($1, $2, $3) ON CONFLICT (network_id, member_id, address) DO NOTHING",
  1159. memberId, networkId, addr);
  1160. assignments.push_back(addr);
  1161. }
  1162. if (ipAssignError) {
  1163. fprintf(stderr, "%s: ipAssignError\n", _myAddressStr.c_str());
  1164. w.abort();
  1165. _pool->unborrow(c);
  1166. c.reset();
  1167. continue;
  1168. }
  1169. w.commit();
  1170. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1171. const uint64_t memberidInt = OSUtils::jsonIntHex(config["id"], 0ULL);
  1172. if (nwidInt && memberidInt) {
  1173. nlohmann::json nwOrig;
  1174. nlohmann::json memOrig;
  1175. nlohmann::json memNew(config);
  1176. get(nwidInt, nwOrig, memberidInt, memOrig);
  1177. _memberChanged(memOrig, memNew, qitem.second);
  1178. } else {
  1179. fprintf(stderr, "%s: Can't notify of change. Error parsing nwid or memberid: %llu-%llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt, (unsigned long long)memberidInt);
  1180. }
  1181. } catch (std::exception &e) {
  1182. fprintf(stderr, "%s ERROR: Error updating member %s-%s: %s\n", _myAddressStr.c_str(), networkId.c_str(), memberId.c_str(), e.what());
  1183. }
  1184. } else if (objtype == "network") {
  1185. try {
  1186. // fprintf(stderr, "%s: commitThread: network\n", _myAddressStr.c_str());
  1187. pqxx::work w(*c->c);
  1188. std::string id = config["id"];
  1189. std::string remoteTraceTarget = "";
  1190. if(!config["remoteTraceTarget"].is_null()) {
  1191. remoteTraceTarget = config["remoteTraceTarget"];
  1192. }
  1193. std::string rulesSource = "";
  1194. if (config["rulesSource"].is_string()) {
  1195. rulesSource = config["rulesSource"];
  1196. }
  1197. // This ugly query exists because when we want to mirror networks to/from
  1198. // another data store (e.g. FileDB or LFDB) it is possible to get a network
  1199. // that doesn't exist in Central's database. This does an upsert and sets
  1200. // the owner_id to the "first" global admin in the user DB if the record
  1201. // did not previously exist. If the record already exists owner_id is left
  1202. // unchanged, so owner_id should be left out of the update clause.
  1203. pqxx::result res = w.exec_params0(
  1204. "INSERT INTO ztc_network (id, creation_time, owner_id, controller_id, capabilities, enable_broadcast, "
  1205. "last_modified, mtu, multicast_limit, name, private, "
  1206. "remote_trace_level, remote_trace_target, rules, rules_source, "
  1207. "tags, v4_assign_mode, v6_assign_mode, sso_enabled) VALUES ("
  1208. "$1, TO_TIMESTAMP($5::double precision/1000), "
  1209. "(SELECT user_id AS owner_id FROM ztc_global_permissions WHERE authorize = true AND del = true AND modify = true AND read = true LIMIT 1),"
  1210. "$2, $3, $4, TO_TIMESTAMP($5::double precision/1000), "
  1211. "$6, $7, $8, $9, $10, $11, $12, $13, $14, $15, $16, $17) "
  1212. "ON CONFLICT (id) DO UPDATE set controller_id = EXCLUDED.controller_id, "
  1213. "capabilities = EXCLUDED.capabilities, enable_broadcast = EXCLUDED.enable_broadcast, "
  1214. "last_modified = EXCLUDED.last_modified, mtu = EXCLUDED.mtu, "
  1215. "multicast_limit = EXCLUDED.multicast_limit, name = EXCLUDED.name, "
  1216. "private = EXCLUDED.private, remote_trace_level = EXCLUDED.remote_trace_level, "
  1217. "remote_trace_target = EXCLUDED.remote_trace_target, rules = EXCLUDED.rules, "
  1218. "rules_source = EXCLUDED.rules_source, tags = EXCLUDED.tags, "
  1219. "v4_assign_mode = EXCLUDED.v4_assign_mode, v6_assign_mode = EXCLUDED.v6_assign_mode, "
  1220. "sso_enabled = EXCLUDED.sso_enabled",
  1221. id,
  1222. _myAddressStr,
  1223. OSUtils::jsonDump(config["capabilitles"], -1),
  1224. (bool)config["enableBroadcast"],
  1225. OSUtils::now(),
  1226. (int)config["mtu"],
  1227. (int)config["multicastLimit"],
  1228. OSUtils::jsonString(config["name"],""),
  1229. (bool)config["private"],
  1230. (int)config["remoteTraceLevel"],
  1231. remoteTraceTarget,
  1232. OSUtils::jsonDump(config["rules"], -1),
  1233. rulesSource,
  1234. OSUtils::jsonDump(config["tags"], -1),
  1235. OSUtils::jsonDump(config["v4AssignMode"],-1),
  1236. OSUtils::jsonDump(config["v6AssignMode"], -1),
  1237. OSUtils::jsonBool(config["ssoEnabled"], false));
  1238. res = w.exec_params0("DELETE FROM ztc_network_assignment_pool WHERE network_id = $1", 0);
  1239. auto pool = config["ipAssignmentPools"];
  1240. bool err = false;
  1241. for (auto i = pool.begin(); i != pool.end(); ++i) {
  1242. std::string start = (*i)["ipRangeStart"];
  1243. std::string end = (*i)["ipRangeEnd"];
  1244. res = w.exec_params0(
  1245. "INSERT INTO ztc_network_assignment_pool (network_id, ip_range_start, ip_range_end) "
  1246. "VALUES ($1, $2, $3)", id, start, end);
  1247. }
  1248. res = w.exec_params0("DELETE FROM ztc_network_route WHERE network_id = $1", id);
  1249. auto routes = config["routes"];
  1250. err = false;
  1251. for (auto i = routes.begin(); i != routes.end(); ++i) {
  1252. std::string t = (*i)["target"];
  1253. std::vector<std::string> target;
  1254. std::istringstream f(t);
  1255. std::string s;
  1256. while(std::getline(f, s, '/')) {
  1257. target.push_back(s);
  1258. }
  1259. if (target.empty() || target.size() != 2) {
  1260. continue;
  1261. }
  1262. std::string targetAddr = target[0];
  1263. std::string targetBits = target[1];
  1264. std::string via = "NULL";
  1265. if (!(*i)["via"].is_null()) {
  1266. via = (*i)["via"];
  1267. }
  1268. res = w.exec_params0("INSERT INTO ztc_network_route (network_id, address, bits, via) VALUES ($1, $2, $3, $4)",
  1269. id, targetAddr, targetBits, (via == "NULL" ? NULL : via.c_str()));
  1270. }
  1271. if (err) {
  1272. fprintf(stderr, "%s: route add error\n", _myAddressStr.c_str());
  1273. w.abort();
  1274. _pool->unborrow(c);
  1275. continue;
  1276. }
  1277. auto dns = config["dns"];
  1278. std::string domain = dns["domain"];
  1279. std::stringstream servers;
  1280. servers << "{";
  1281. for (auto j = dns["servers"].begin(); j < dns["servers"].end(); ++j) {
  1282. servers << *j;
  1283. if ( (j+1) != dns["servers"].end()) {
  1284. servers << ",";
  1285. }
  1286. }
  1287. servers << "}";
  1288. std::string s = servers.str();
  1289. res = w.exec_params0("INSERT INTO ztc_network_dns (network_id, domain, servers) VALUES ($1, $2, $3) ON CONFLICT (network_id) DO UPDATE SET domain = EXCLUDED.domain, servers = EXCLUDED.servers",
  1290. id, domain, s);
  1291. w.commit();
  1292. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1293. if (nwidInt) {
  1294. nlohmann::json nwOrig;
  1295. nlohmann::json nwNew(config);
  1296. get(nwidInt, nwOrig);
  1297. _networkChanged(nwOrig, nwNew, qitem.second);
  1298. } else {
  1299. fprintf(stderr, "%s: Can't notify network changed: %llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt);
  1300. }
  1301. } catch (std::exception &e) {
  1302. fprintf(stderr, "%s ERROR: Error updating network: %s\n", _myAddressStr.c_str(), e.what());
  1303. }
  1304. if (_redisMemberStatus) {
  1305. try {
  1306. std::string id = config["id"];
  1307. std::string controllerId = _myAddressStr.c_str();
  1308. std::string key = "networks:{" + controllerId + "}";
  1309. if (_rc->clusterMode) {
  1310. _cluster->sadd(key, id);
  1311. } else {
  1312. _redis->sadd(key, id);
  1313. }
  1314. } catch (sw::redis::Error &e) {
  1315. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1316. }
  1317. }
  1318. } else if (objtype == "_delete_network") {
  1319. // fprintf(stderr, "%s: commitThread: delete network\n", _myAddressStr.c_str());
  1320. try {
  1321. pqxx::work w(*c->c);
  1322. std::string networkId = config["nwid"];
  1323. pqxx::result res = w.exec_params0("UPDATE ztc_network SET deleted = true WHERE id = $1",
  1324. networkId);
  1325. w.commit();
  1326. } catch (std::exception &e) {
  1327. fprintf(stderr, "%s ERROR: Error deleting network: %s\n", _myAddressStr.c_str(), e.what());
  1328. }
  1329. if (_redisMemberStatus) {
  1330. try {
  1331. std::string id = config["id"];
  1332. std::string controllerId = _myAddressStr.c_str();
  1333. std::string key = "networks:{" + controllerId + "}";
  1334. if (_rc->clusterMode) {
  1335. _cluster->srem(key, id);
  1336. _cluster->del("network-nodes-online:{"+controllerId+"}:"+id);
  1337. } else {
  1338. _redis->srem(key, id);
  1339. _redis->del("network-nodes-online:{"+controllerId+"}:"+id);
  1340. }
  1341. } catch (sw::redis::Error &e) {
  1342. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1343. }
  1344. }
  1345. } else if (objtype == "_delete_member") {
  1346. // fprintf(stderr, "%s commitThread: delete member\n", _myAddressStr.c_str());
  1347. try {
  1348. pqxx::work w(*c->c);
  1349. std::string memberId = config["id"];
  1350. std::string networkId = config["nwid"];
  1351. pqxx::result res = w.exec_params0(
  1352. "UPDATE ztc_member SET hidden = true, deleted = true WHERE id = $1 AND network_id = $2",
  1353. memberId, networkId);
  1354. w.commit();
  1355. } catch (std::exception &e) {
  1356. fprintf(stderr, "%s ERROR: Error deleting member: %s\n", _myAddressStr.c_str(), e.what());
  1357. }
  1358. if (_redisMemberStatus) {
  1359. try {
  1360. std::string memberId = config["id"];
  1361. std::string networkId = config["nwid"];
  1362. std::string controllerId = _myAddressStr.c_str();
  1363. std::string key = "network-nodes-all:{" + controllerId + "}:" + networkId;
  1364. if (_rc->clusterMode) {
  1365. _cluster->srem(key, memberId);
  1366. _cluster->del("member:{"+controllerId+"}:"+networkId+":"+memberId);
  1367. } else {
  1368. _redis->srem(key, memberId);
  1369. _redis->del("member:{"+controllerId+"}:"+networkId+":"+memberId);
  1370. }
  1371. } catch (sw::redis::Error &e) {
  1372. fprintf(stderr, "ERROR: Error deleting member from Redis: %s\n", e.what());
  1373. }
  1374. }
  1375. } else {
  1376. fprintf(stderr, "%s ERROR: unknown objtype\n", _myAddressStr.c_str());
  1377. }
  1378. } catch (std::exception &e) {
  1379. fprintf(stderr, "%s ERROR: Error getting objtype: %s\n", _myAddressStr.c_str(), e.what());
  1380. }
  1381. _pool->unborrow(c);
  1382. c.reset();
  1383. std::this_thread::sleep_for(std::chrono::milliseconds(100));
  1384. }
  1385. fprintf(stderr, "%s commitThread finished\n", _myAddressStr.c_str());
  1386. }
  1387. void PostgreSQL::onlineNotificationThread()
  1388. {
  1389. waitForReady();
  1390. if (_redisMemberStatus) {
  1391. onlineNotification_Redis();
  1392. } else {
  1393. onlineNotification_Postgres();
  1394. }
  1395. }
  /**
   * ONLY UNCOMMENT FOR TEMPORARY DB MAINTENANCE
   *
   * This define temporarily turns off writing to the member status table
   * so it can be reindexed when the indexes get too large.
   */
  1402. // #define DISABLE_MEMBER_STATUS 1
  1403. void PostgreSQL::onlineNotification_Postgres()
  1404. {
  1405. _connected = 1;
  1406. nlohmann::json jtmp1, jtmp2;
  1407. while (_run == 1) {
  1408. auto c = _pool->borrow();
  1409. auto c2 = _pool->borrow();
  1410. try {
  1411. fprintf(stderr, "%s onlineNotification_Postgres\n", _myAddressStr.c_str());
  1412. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > lastOnline;
  1413. {
  1414. std::lock_guard<std::mutex> l(_lastOnline_l);
  1415. lastOnline.swap(_lastOnline);
  1416. }
  1417. #ifndef DISABLE_MEMBER_STATUS
  1418. pqxx::work w(*c->c);
  1419. pqxx::work w2(*c2->c);
  1420. fprintf(stderr, "online notification tick\n");
  1421. bool firstRun = true;
  1422. bool memberAdded = false;
  1423. int updateCount = 0;
  1424. pqxx::pipeline pipe(w);
  1425. for (auto i=lastOnline.begin(); i != lastOnline.end(); ++i) {
  1426. updateCount += 1;
  1427. uint64_t nwid_i = i->first.first;
  1428. char nwidTmp[64];
  1429. char memTmp[64];
  1430. char ipTmp[64];
  1431. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1432. OSUtils::ztsnprintf(memTmp,sizeof(memTmp), "%.10llx", i->first.second);
  1433. if(!get(nwid_i, jtmp1, i->first.second, jtmp2)) {
  1434. continue; // skip non existent networks/members
  1435. }
  1436. std::string networkId(nwidTmp);
  1437. std::string memberId(memTmp);
  1438. try {
  1439. pqxx::row r = w2.exec_params1("SELECT id, network_id FROM ztc_member WHERE network_id = $1 AND id = $2",
  1440. networkId, memberId);
  1441. } catch (pqxx::unexpected_rows &e) {
  1442. continue;
  1443. }
  1444. int64_t ts = i->second.first;
  1445. std::string ipAddr = i->second.second.toIpString(ipTmp);
  1446. std::string timestamp = std::to_string(ts);
  1447. std::stringstream memberUpdate;
  1448. memberUpdate << "INSERT INTO ztc_member_status (network_id, member_id, address, last_updated) VALUES "
  1449. << "('" << networkId << "', '" << memberId << "', ";
  1450. if (ipAddr.empty()) {
  1451. memberUpdate << "NULL, ";
  1452. } else {
  1453. memberUpdate << "'" << ipAddr << "', ";
  1454. }
  1455. memberUpdate << "TO_TIMESTAMP(" << timestamp << "::double precision/1000)) "
  1456. << " ON CONFLICT (network_id, member_id) DO UPDATE SET address = EXCLUDED.address, last_updated = EXCLUDED.last_updated";
  1457. pipe.insert(memberUpdate.str());
  1458. }
  1459. while(!pipe.empty()) {
  1460. pipe.retrieve();
  1461. }
  1462. pipe.complete();
  1463. w.commit();
  1464. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), updateCount);
  1465. #endif
  1466. } catch (std::exception &e) {
  1467. fprintf(stderr, "%s: error in onlinenotification thread: %s\n", _myAddressStr.c_str(), e.what());
  1468. }
  1469. _pool->unborrow(c2);
  1470. _pool->unborrow(c);
  1471. ConnectionPoolStats stats = _pool->get_stats();
  1472. fprintf(stderr, "%s pool stats: in use size: %llu, available size: %llu, total: %llu\n",
  1473. _myAddressStr.c_str(), stats.borrowed_size, stats.pool_size, (stats.borrowed_size + stats.pool_size));
  1474. std::this_thread::sleep_for(std::chrono::seconds(10));
  1475. }
  1476. fprintf(stderr, "%s: Fell out of run loop in onlineNotificationThread\n", _myAddressStr.c_str());
  1477. if (_run == 1) {
  1478. fprintf(stderr, "ERROR: %s onlineNotificationThread should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1479. exit(6);
  1480. }
  1481. }
  1482. void PostgreSQL::onlineNotification_Redis()
  1483. {
  1484. _connected = 1;
  1485. char buf[11] = {0};
  1486. std::string controllerId = std::string(_myAddress.toString(buf));
  1487. while (_run == 1) {
  1488. fprintf(stderr, "onlineNotification tick\n");
  1489. auto start = std::chrono::high_resolution_clock::now();
  1490. uint64_t count = 0;
  1491. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > lastOnline;
  1492. {
  1493. std::lock_guard<std::mutex> l(_lastOnline_l);
  1494. lastOnline.swap(_lastOnline);
  1495. }
  1496. try {
  1497. if (!lastOnline.empty()) {
  1498. if (_rc->clusterMode) {
  1499. auto tx = _cluster->transaction(controllerId, true);
  1500. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1501. } else {
  1502. auto tx = _redis->transaction(true);
  1503. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1504. }
  1505. }
  1506. } catch (sw::redis::Error &e) {
  1507. fprintf(stderr, "Error in online notification thread (redis): %s\n", e.what());
  1508. }
  1509. auto end = std::chrono::high_resolution_clock::now();
  1510. auto dur = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
  1511. auto total = dur.count();
  1512. fprintf(stderr, "onlineNotification ran in %llu ms\n", total);
  1513. std::this_thread::sleep_for(std::chrono::seconds(5));
  1514. }
  1515. }
  1516. uint64_t PostgreSQL::_doRedisUpdate(sw::redis::Transaction &tx, std::string &controllerId,
  1517. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > &lastOnline)
  1518. {
  1519. nlohmann::json jtmp1, jtmp2;
  1520. uint64_t count = 0;
  1521. for (auto i=lastOnline.begin(); i != lastOnline.end(); ++i) {
  1522. uint64_t nwid_i = i->first.first;
  1523. uint64_t memberid_i = i->first.second;
  1524. char nwidTmp[64];
  1525. char memTmp[64];
  1526. char ipTmp[64];
  1527. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1528. OSUtils::ztsnprintf(memTmp,sizeof(memTmp), "%.10llx", memberid_i);
  1529. if (!get(nwid_i, jtmp1, memberid_i, jtmp2)){
  1530. continue; // skip non existent members/networks
  1531. }
  1532. std::string networkId(nwidTmp);
  1533. std::string memberId(memTmp);
  1534. int64_t ts = i->second.first;
  1535. std::string ipAddr = i->second.second.toIpString(ipTmp);
  1536. std::string timestamp = std::to_string(ts);
  1537. std::unordered_map<std::string, std::string> record = {
  1538. {"id", memberId},
  1539. {"address", ipAddr},
  1540. {"last_updated", std::to_string(ts)}
  1541. };
  1542. tx.zadd("nodes-online:{"+controllerId+"}", memberId, ts)
  1543. .zadd("nodes-online2:{"+controllerId+"}", networkId+"-"+memberId, ts)
  1544. .zadd("network-nodes-online:{"+controllerId+"}:"+networkId, memberId, ts)
  1545. .zadd("active-networks:{"+controllerId+"}", networkId, ts)
  1546. .sadd("network-nodes-all:{"+controllerId+"}:"+networkId, memberId)
  1547. .hmset("member:{"+controllerId+"}:"+networkId+":"+memberId, record.begin(), record.end());
  1548. ++count;
  1549. }
  1550. // expire records from all-nodes and network-nodes member list
  1551. uint64_t expireOld = OSUtils::now() - 300000;
  1552. tx.zremrangebyscore("nodes-online:{"+controllerId+"}",
  1553. sw::redis::RightBoundedInterval<double>(expireOld,
  1554. sw::redis::BoundType::LEFT_OPEN));
  1555. tx.zremrangebyscore("nodes-online2:{"+controllerId+"}",
  1556. sw::redis::RightBoundedInterval<double>(expireOld,
  1557. sw::redis::BoundType::LEFT_OPEN));
  1558. tx.zremrangebyscore("active-networks:{"+controllerId+"}",
  1559. sw::redis::RightBoundedInterval<double>(expireOld,
  1560. sw::redis::BoundType::LEFT_OPEN));
  1561. {
  1562. std::lock_guard<std::mutex> l(_networks_l);
  1563. for (const auto &it : _networks) {
  1564. uint64_t nwid_i = it.first;
  1565. char nwidTmp[64];
  1566. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1567. tx.zremrangebyscore("network-nodes-online:{"+controllerId+"}:"+nwidTmp,
  1568. sw::redis::RightBoundedInterval<double>(expireOld, sw::redis::BoundType::LEFT_OPEN));
  1569. }
  1570. }
  1571. tx.exec();
  1572. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), count);
  1573. return count;
  1574. }
  1575. #endif //ZT_CONTROLLER_USE_LIBPQ