PostgreSQL.cpp 62 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838
  1. /*
  2. * Copyright (c)2019 ZeroTier, Inc.
  3. *
  4. * Use of this software is governed by the Business Source License included
  5. * in the LICENSE.TXT file in the project's root directory.
  6. *
  7. * Change Date: 2025-01-01
  8. *
  9. * On the date above, in accordance with the Business Source License, use
  10. * of this software will be governed by version 2.0 of the Apache License.
  11. */
  12. /****/
  13. #include "PostgreSQL.hpp"
  14. #ifdef ZT_CONTROLLER_USE_LIBPQ
  15. #include "../node/Constants.hpp"
  16. #include "../node/SHA512.hpp"
  17. #include "EmbeddedNetworkController.hpp"
  18. #include "../version.h"
  19. #include "Redis.hpp"
  20. #include <libpq-fe.h>
  21. #include <sstream>
  22. #include <iomanip>
  23. #include <climits>
  24. #include <chrono>
  25. // #define REDIS_TRACE 1
  26. using json = nlohmann::json;
  27. namespace {
  28. static const int DB_MINIMUM_VERSION = 38;
  29. static const char *_timestr()
  30. {
  31. time_t t = time(0);
  32. char *ts = ctime(&t);
  33. char *p = ts;
  34. if (!p)
  35. return "";
  36. while (*p) {
  37. if (*p == '\n') {
  38. *p = (char)0;
  39. break;
  40. }
  41. ++p;
  42. }
  43. return ts;
  44. }
  45. /*
  46. std::string join(const std::vector<std::string> &elements, const char * const separator)
  47. {
  48. switch(elements.size()) {
  49. case 0:
  50. return "";
  51. case 1:
  52. return elements[0];
  53. default:
  54. std::ostringstream os;
  55. std::copy(elements.begin(), elements.end()-1, std::ostream_iterator<std::string>(os, separator));
  56. os << *elements.rbegin();
  57. return os.str();
  58. }
  59. }
  60. */
  61. std::vector<std::string> split(std::string str, char delim){
  62. std::istringstream iss(str);
  63. std::vector<std::string> tokens;
  64. std::string item;
  65. while(std::getline(iss, item, delim)) {
  66. tokens.push_back(item);
  67. }
  68. return tokens;
  69. }
  70. std::string url_encode(const std::string &value) {
  71. std::ostringstream escaped;
  72. escaped.fill('0');
  73. escaped << std::hex;
  74. for (std::string::const_iterator i = value.begin(), n = value.end(); i != n; ++i) {
  75. std::string::value_type c = (*i);
  76. // Keep alphanumeric and other accepted characters intact
  77. if (isalnum(c) || c == '-' || c == '_' || c == '.' || c == '~') {
  78. escaped << c;
  79. continue;
  80. }
  81. // Any other characters are percent-encoded
  82. escaped << std::uppercase;
  83. escaped << '%' << std::setw(2) << int((unsigned char) c);
  84. escaped << std::nouppercase;
  85. }
  86. return escaped.str();
  87. }
  88. } // anonymous namespace
  89. using namespace ZeroTier;
  90. MemberNotificationReceiver::MemberNotificationReceiver(PostgreSQL *p, pqxx::connection &c, const std::string &channel)
  91. : pqxx::notification_receiver(c, channel)
  92. , _psql(p)
  93. {
  94. fprintf(stderr, "initialize MemberNotificationReceiver\n");
  95. }
  96. void MemberNotificationReceiver::operator() (const std::string &payload, int packend_pid) {
  97. fprintf(stderr, "Member Notification received: %s\n", payload.c_str());
  98. Metrics::pgsql_mem_notification++;
  99. json tmp(json::parse(payload));
  100. json &ov = tmp["old_val"];
  101. json &nv = tmp["new_val"];
  102. json oldConfig, newConfig;
  103. if (ov.is_object()) oldConfig = ov;
  104. if (nv.is_object()) newConfig = nv;
  105. if (oldConfig.is_object() || newConfig.is_object()) {
  106. _psql->_memberChanged(oldConfig,newConfig,(_psql->_ready>=2));
  107. fprintf(stderr, "payload sent\n");
  108. }
  109. }
  110. NetworkNotificationReceiver::NetworkNotificationReceiver(PostgreSQL *p, pqxx::connection &c, const std::string &channel)
  111. : pqxx::notification_receiver(c, channel)
  112. , _psql(p)
  113. {
  114. fprintf(stderr, "initialize NetworkNotificationReceiver\n");
  115. }
  116. void NetworkNotificationReceiver::operator() (const std::string &payload, int packend_pid) {
  117. fprintf(stderr, "Network Notification received: %s\n", payload.c_str());
  118. Metrics::pgsql_net_notification++;
  119. json tmp(json::parse(payload));
  120. json &ov = tmp["old_val"];
  121. json &nv = tmp["new_val"];
  122. json oldConfig, newConfig;
  123. if (ov.is_object()) oldConfig = ov;
  124. if (nv.is_object()) newConfig = nv;
  125. if (oldConfig.is_object() || newConfig.is_object()) {
  126. _psql->_networkChanged(oldConfig,newConfig,(_psql->_ready>=2));
  127. fprintf(stderr, "payload sent\n");
  128. }
  129. }
  130. using Attrs = std::vector<std::pair<std::string, std::string>>;
  131. using Item = std::pair<std::string, Attrs>;
  132. using ItemStream = std::vector<Item>;
  133. PostgreSQL::PostgreSQL(const Identity &myId, const char *path, int listenPort, RedisConfig *rc)
  134. : DB()
  135. , _pool()
  136. , _myId(myId)
  137. , _myAddress(myId.address())
  138. , _ready(0)
  139. , _connected(1)
  140. , _run(1)
  141. , _waitNoticePrinted(false)
  142. , _listenPort(listenPort)
  143. , _rc(rc)
  144. , _redis(NULL)
  145. , _cluster(NULL)
  146. , _redisMemberStatus(false)
  147. {
  148. char myAddress[64];
  149. _myAddressStr = myId.address().toString(myAddress);
  150. _connString = std::string(path);
  151. auto f = std::make_shared<PostgresConnFactory>(_connString);
  152. _pool = std::make_shared<ConnectionPool<PostgresConnection> >(
  153. 15, 5, std::static_pointer_cast<ConnectionFactory>(f));
  154. memset(_ssoPsk, 0, sizeof(_ssoPsk));
  155. char *const ssoPskHex = getenv("ZT_SSO_PSK");
  156. #ifdef ZT_TRACE
  157. fprintf(stderr, "ZT_SSO_PSK: %s\n", ssoPskHex);
  158. #endif
  159. if (ssoPskHex) {
  160. // SECURITY: note that ssoPskHex will always be null-terminated if libc actually
  161. // returns something non-NULL. If the hex encodes something shorter than 48 bytes,
  162. // it will be padded at the end with zeroes. If longer, it'll be truncated.
  163. Utils::unhex(ssoPskHex, _ssoPsk, sizeof(_ssoPsk));
  164. }
  165. const char *redisMemberStatus = getenv("ZT_REDIS_MEMBER_STATUS");
  166. if (redisMemberStatus && (strcmp(redisMemberStatus, "true") == 0)) {
  167. _redisMemberStatus = true;
  168. fprintf(stderr, "Using redis for member status\n");
  169. }
  170. auto c = _pool->borrow();
  171. pqxx::work txn{*c->c};
  172. pqxx::row r{txn.exec1("SELECT version FROM ztc_database")};
  173. int dbVersion = r[0].as<int>();
  174. txn.commit();
  175. if (dbVersion < DB_MINIMUM_VERSION) {
  176. fprintf(stderr, "Central database schema version too low. This controller version requires a minimum schema version of %d. Please upgrade your Central instance", DB_MINIMUM_VERSION);
  177. exit(1);
  178. }
  179. _pool->unborrow(c);
  180. if (_rc != NULL) {
  181. sw::redis::ConnectionOptions opts;
  182. sw::redis::ConnectionPoolOptions poolOpts;
  183. opts.host = _rc->hostname;
  184. opts.port = _rc->port;
  185. opts.password = _rc->password;
  186. opts.db = 0;
  187. opts.keep_alive = true;
  188. opts.connect_timeout = std::chrono::seconds(3);
  189. poolOpts.size = 25;
  190. poolOpts.wait_timeout = std::chrono::seconds(5);
  191. poolOpts.connection_lifetime = std::chrono::minutes(3);
  192. poolOpts.connection_idle_time = std::chrono::minutes(1);
  193. if (_rc->clusterMode) {
  194. fprintf(stderr, "Using Redis in Cluster Mode\n");
  195. _cluster = std::make_shared<sw::redis::RedisCluster>(opts, poolOpts);
  196. } else {
  197. fprintf(stderr, "Using Redis in Standalone Mode\n");
  198. _redis = std::make_shared<sw::redis::Redis>(opts, poolOpts);
  199. }
  200. }
  201. _readyLock.lock();
  202. fprintf(stderr, "[%s] NOTICE: %.10llx controller PostgreSQL waiting for initial data download..." ZT_EOL_S, ::_timestr(), (unsigned long long)_myAddress.toInt());
  203. _waitNoticePrinted = true;
  204. initializeNetworks();
  205. initializeMembers();
  206. _heartbeatThread = std::thread(&PostgreSQL::heartbeat, this);
  207. _membersDbWatcher = std::thread(&PostgreSQL::membersDbWatcher, this);
  208. _networksDbWatcher = std::thread(&PostgreSQL::networksDbWatcher, this);
  209. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  210. _commitThread[i] = std::thread(&PostgreSQL::commitThread, this);
  211. }
  212. _onlineNotificationThread = std::thread(&PostgreSQL::onlineNotificationThread, this);
  213. }
  214. PostgreSQL::~PostgreSQL()
  215. {
  216. _run = 0;
  217. std::this_thread::sleep_for(std::chrono::milliseconds(100));
  218. _heartbeatThread.join();
  219. _membersDbWatcher.join();
  220. _networksDbWatcher.join();
  221. _commitQueue.stop();
  222. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  223. _commitThread[i].join();
  224. }
  225. _onlineNotificationThread.join();
  226. }
  227. bool PostgreSQL::waitForReady()
  228. {
  229. while (_ready < 2) {
  230. _readyLock.lock();
  231. _readyLock.unlock();
  232. }
  233. return true;
  234. }
  235. bool PostgreSQL::isReady()
  236. {
  237. return ((_ready == 2)&&(_connected));
  238. }
  239. bool PostgreSQL::save(nlohmann::json &record,bool notifyListeners)
  240. {
  241. bool modified = false;
  242. try {
  243. if (!record.is_object()) {
  244. fprintf(stderr, "record is not an object?!?\n");
  245. return false;
  246. }
  247. const std::string objtype = record["objtype"];
  248. if (objtype == "network") {
  249. //fprintf(stderr, "network save\n");
  250. const uint64_t nwid = OSUtils::jsonIntHex(record["id"],0ULL);
  251. if (nwid) {
  252. nlohmann::json old;
  253. get(nwid,old);
  254. if ((!old.is_object())||(!_compareRecords(old,record))) {
  255. record["revision"] = OSUtils::jsonInt(record["revision"],0ULL) + 1ULL;
  256. _commitQueue.post(std::pair<nlohmann::json,bool>(record,notifyListeners));
  257. modified = true;
  258. }
  259. }
  260. } else if (objtype == "member") {
  261. std::string networkId = record["nwid"];
  262. std::string memberId = record["id"];
  263. const uint64_t nwid = OSUtils::jsonIntHex(record["nwid"],0ULL);
  264. const uint64_t id = OSUtils::jsonIntHex(record["id"],0ULL);
  265. //fprintf(stderr, "member save %s-%s\n", networkId.c_str(), memberId.c_str());
  266. if ((id)&&(nwid)) {
  267. nlohmann::json network,old;
  268. get(nwid,network,id,old);
  269. if ((!old.is_object())||(!_compareRecords(old,record))) {
  270. //fprintf(stderr, "commit queue post\n");
  271. record["revision"] = OSUtils::jsonInt(record["revision"],0ULL) + 1ULL;
  272. _commitQueue.post(std::pair<nlohmann::json,bool>(record,notifyListeners));
  273. modified = true;
  274. } else {
  275. //fprintf(stderr, "no change\n");
  276. }
  277. }
  278. } else {
  279. fprintf(stderr, "uhh waaat\n");
  280. }
  281. } catch (std::exception &e) {
  282. fprintf(stderr, "Error on PostgreSQL::save: %s\n", e.what());
  283. } catch (...) {
  284. fprintf(stderr, "Unknown error on PostgreSQL::save\n");
  285. }
  286. return modified;
  287. }
  288. void PostgreSQL::eraseNetwork(const uint64_t networkId)
  289. {
  290. fprintf(stderr, "PostgreSQL::eraseNetwork\n");
  291. char tmp2[24];
  292. waitForReady();
  293. Utils::hex(networkId, tmp2);
  294. std::pair<nlohmann::json,bool> tmp;
  295. tmp.first["id"] = tmp2;
  296. tmp.first["objtype"] = "_delete_network";
  297. tmp.second = true;
  298. _commitQueue.post(tmp);
  299. nlohmann::json nullJson;
  300. _networkChanged(tmp.first, nullJson, true);
  301. }
  302. void PostgreSQL::eraseMember(const uint64_t networkId, const uint64_t memberId)
  303. {
  304. fprintf(stderr, "PostgreSQL::eraseMember\n");
  305. char tmp2[24];
  306. waitForReady();
  307. std::pair<nlohmann::json,bool> tmp, nw;
  308. Utils::hex(networkId, tmp2);
  309. tmp.first["nwid"] = tmp2;
  310. Utils::hex(memberId, tmp2);
  311. tmp.first["id"] = tmp2;
  312. tmp.first["objtype"] = "_delete_member";
  313. tmp.second = true;
  314. _commitQueue.post(tmp);
  315. nlohmann::json nullJson;
  316. _memberChanged(tmp.first, nullJson, true);
  317. }
  318. void PostgreSQL::nodeIsOnline(const uint64_t networkId, const uint64_t memberId, const InetAddress &physicalAddress)
  319. {
  320. std::lock_guard<std::mutex> l(_lastOnline_l);
  321. std::pair<int64_t, InetAddress> &i = _lastOnline[std::pair<uint64_t,uint64_t>(networkId, memberId)];
  322. i.first = OSUtils::now();
  323. if (physicalAddress) {
  324. i.second = physicalAddress;
  325. }
  326. }
  327. AuthInfo PostgreSQL::getSSOAuthInfo(const nlohmann::json &member, const std::string &redirectURL)
  328. {
  329. Metrics::db_get_sso_info++;
  330. // NONCE is just a random character string. no semantic meaning
  331. // state = HMAC SHA384 of Nonce based on shared sso key
  332. //
  333. // need nonce timeout in database? make sure it's used within X time
  334. // X is 5 minutes for now. Make configurable later?
  335. //
  336. // how do we tell when a nonce is used? if auth_expiration_time is set
  337. std::string networkId = member["nwid"];
  338. std::string memberId = member["id"];
  339. char authenticationURL[4096] = {0};
  340. AuthInfo info;
  341. info.enabled = true;
  342. //if (memberId == "a10dccea52" && networkId == "8056c2e21c24673d") {
  343. // fprintf(stderr, "invalid authinfo for grant's machine\n");
  344. // info.version=1;
  345. // return info;
  346. //}
  347. // fprintf(stderr, "PostgreSQL::updateMemberOnLoad: %s-%s\n", networkId.c_str(), memberId.c_str());
  348. std::shared_ptr<PostgresConnection> c;
  349. try {
  350. c = _pool->borrow();
  351. pqxx::work w(*c->c);
  352. char nonceBytes[16] = {0};
  353. std::string nonce = "";
  354. // check if the member exists first.
  355. pqxx::row count = w.exec_params1("SELECT count(id) FROM ztc_member WHERE id = $1 AND network_id = $2 AND deleted = false", memberId, networkId);
  356. if (count[0].as<int>() == 1) {
  357. // get active nonce, if exists.
  358. pqxx::result r = w.exec_params("SELECT nonce FROM ztc_sso_expiry "
  359. "WHERE network_id = $1 AND member_id = $2 "
  360. "AND ((NOW() AT TIME ZONE 'UTC') <= authentication_expiry_time) AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  361. networkId, memberId);
  362. if (r.size() == 0) {
  363. // no active nonce.
  364. // find an unused nonce, if one exists.
  365. pqxx::result r = w.exec_params("SELECT nonce FROM ztc_sso_expiry "
  366. "WHERE network_id = $1 AND member_id = $2 "
  367. "AND authentication_expiry_time IS NULL AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  368. networkId, memberId);
  369. if (r.size() == 1) {
  370. // we have an existing nonce. Use it
  371. nonce = r.at(0)[0].as<std::string>();
  372. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  373. } else if (r.empty()) {
  374. // create a nonce
  375. Utils::getSecureRandom(nonceBytes, 16);
  376. char nonceBuf[64] = {0};
  377. Utils::hex(nonceBytes, sizeof(nonceBytes), nonceBuf);
  378. nonce = std::string(nonceBuf);
  379. pqxx::result ir = w.exec_params0("INSERT INTO ztc_sso_expiry "
  380. "(nonce, nonce_expiration, network_id, member_id) VALUES "
  381. "($1, TO_TIMESTAMP($2::double precision/1000), $3, $4)",
  382. nonce, OSUtils::now() + 300000, networkId, memberId);
  383. w.commit();
  384. } else {
  385. // > 1 ?!? Thats an error!
  386. fprintf(stderr, "> 1 unused nonce!\n");
  387. exit(6);
  388. }
  389. } else if (r.size() == 1) {
  390. nonce = r.at(0)[0].as<std::string>();
  391. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  392. } else {
  393. // more than 1 nonce in use? Uhhh...
  394. fprintf(stderr, "> 1 nonce in use for network member?!?\n");
  395. exit(7);
  396. }
  397. r = w.exec_params(
  398. "SELECT oc.client_id, oc.authorization_endpoint, oc.issuer, oc.provider, oc.sso_impl_version "
  399. "FROM ztc_network AS n "
  400. "INNER JOIN ztc_org o "
  401. " ON o.owner_id = n.owner_id "
  402. "LEFT OUTER JOIN ztc_network_oidc_config noc "
  403. " ON noc.network_id = n.id "
  404. "LEFT OUTER JOIN ztc_oidc_config oc "
  405. " ON noc.client_id = oc.client_id AND oc.org_id = o.org_id "
  406. "WHERE n.id = $1 AND n.sso_enabled = true", networkId);
  407. std::string client_id = "";
  408. std::string authorization_endpoint = "";
  409. std::string issuer = "";
  410. std::string provider = "";
  411. uint64_t sso_version = 0;
  412. if (r.size() == 1) {
  413. client_id = r.at(0)[0].as<std::optional<std::string>>().value_or("");
  414. authorization_endpoint = r.at(0)[1].as<std::optional<std::string>>().value_or("");
  415. issuer = r.at(0)[2].as<std::optional<std::string>>().value_or("");
  416. provider = r.at(0)[3].as<std::optional<std::string>>().value_or("");
  417. sso_version = r.at(0)[4].as<std::optional<uint64_t>>().value_or(1);
  418. } else if (r.size() > 1) {
  419. fprintf(stderr, "ERROR: More than one auth endpoint for an organization?!?!? NetworkID: %s\n", networkId.c_str());
  420. } else {
  421. fprintf(stderr, "No client or auth endpoint?!?\n");
  422. }
  423. info.version = sso_version;
  424. // no catch all else because we don't actually care if no records exist here. just continue as normal.
  425. if ((!client_id.empty())&&(!authorization_endpoint.empty())) {
  426. uint8_t state[48];
  427. HMACSHA384(_ssoPsk, nonceBytes, sizeof(nonceBytes), state);
  428. char state_hex[256];
  429. Utils::hex(state, 48, state_hex);
  430. if (info.version == 0) {
  431. char url[2048] = {0};
  432. OSUtils::ztsnprintf(url, sizeof(authenticationURL),
  433. "%s?response_type=id_token&response_mode=form_post&scope=openid+email+profile&redirect_uri=%s&nonce=%s&state=%s&client_id=%s",
  434. authorization_endpoint.c_str(),
  435. url_encode(redirectURL).c_str(),
  436. nonce.c_str(),
  437. state_hex,
  438. client_id.c_str());
  439. info.authenticationURL = std::string(url);
  440. } else if (info.version == 1) {
  441. info.ssoClientID = client_id;
  442. info.issuerURL = issuer;
  443. info.ssoProvider = provider;
  444. info.ssoNonce = nonce;
  445. info.ssoState = std::string(state_hex) + "_" +networkId;
  446. info.centralAuthURL = redirectURL;
  447. #ifdef ZT_DEBUG
  448. fprintf(
  449. stderr,
  450. "ssoClientID: %s\nissuerURL: %s\nssoNonce: %s\nssoState: %s\ncentralAuthURL: %s\nprovider: %s\n",
  451. info.ssoClientID.c_str(),
  452. info.issuerURL.c_str(),
  453. info.ssoNonce.c_str(),
  454. info.ssoState.c_str(),
  455. info.centralAuthURL.c_str(),
  456. provider.c_str());
  457. #endif
  458. }
  459. } else {
  460. fprintf(stderr, "client_id: %s\nauthorization_endpoint: %s\n", client_id.c_str(), authorization_endpoint.c_str());
  461. }
  462. }
  463. _pool->unborrow(c);
  464. } catch (std::exception &e) {
  465. fprintf(stderr, "ERROR: Error updating member on load for network %s: %s\n", networkId.c_str(), e.what());
  466. }
  467. return info; //std::string(authenticationURL);
  468. }
  469. void PostgreSQL::initializeNetworks()
  470. {
  471. try {
  472. std::string setKey = "networks:{" + _myAddressStr + "}";
  473. fprintf(stderr, "Initializing Networks...\n");
  474. if (_redisMemberStatus) {
  475. fprintf(stderr, "Init Redis for networks...\n");
  476. try {
  477. if (_rc->clusterMode) {
  478. _cluster->del(setKey);
  479. } else {
  480. _redis->del(setKey);
  481. }
  482. } catch (sw::redis::Error &e) {
  483. // ignore. if this key doesn't exist, there's no reason to delete it
  484. }
  485. }
  486. std::unordered_set<std::string> networkSet;
  487. char qbuf[2048] = {0};
  488. sprintf(qbuf,
  489. "SELECT n.id, (EXTRACT(EPOCH FROM n.creation_time AT TIME ZONE 'UTC')*1000)::bigint as creation_time, n.capabilities, "
  490. "n.enable_broadcast, (EXTRACT(EPOCH FROM n.last_modified AT TIME ZONE 'UTC')*1000)::bigint AS last_modified, n.mtu, n.multicast_limit, n.name, n.private, n.remote_trace_level, "
  491. "n.remote_trace_target, n.revision, n.rules, n.tags, n.v4_assign_mode, n.v6_assign_mode, n.sso_enabled, (CASE WHEN n.sso_enabled THEN noc.client_id ELSE NULL END) as client_id, "
  492. "(CASE WHEN n.sso_enabled THEN oc.authorization_endpoint ELSE NULL END) as authorization_endpoint, "
  493. "(CASE WHEN n.sso_enabled THEN oc.provider ELSE NULL END) as provider, d.domain, d.servers, "
  494. "ARRAY(SELECT CONCAT(host(ip_range_start),'|', host(ip_range_end)) FROM ztc_network_assignment_pool WHERE network_id = n.id) AS assignment_pool, "
  495. "ARRAY(SELECT CONCAT(host(address),'/',bits::text,'|',COALESCE(host(via), 'NULL'))FROM ztc_network_route WHERE network_id = n.id) AS routes "
  496. "FROM ztc_network n "
  497. "LEFT OUTER JOIN ztc_org o "
  498. " ON o.owner_id = n.owner_id "
  499. "LEFT OUTER JOIN ztc_network_oidc_config noc "
  500. " ON noc.network_id = n.id "
  501. "LEFT OUTER JOIN ztc_oidc_config oc "
  502. " ON noc.client_id = oc.client_id AND oc.org_id = o.org_id "
  503. "LEFT OUTER JOIN ztc_network_dns d "
  504. " ON d.network_id = n.id "
  505. "WHERE deleted = false AND controller_id = '%s'", _myAddressStr.c_str());
  506. auto c = _pool->borrow();
  507. auto c2 = _pool->borrow();
  508. pqxx::work w{*c->c};
  509. fprintf(stderr, "Load networks from psql...\n");
  510. auto stream = pqxx::stream_from::query(w, qbuf);
  511. std::tuple<
  512. std::string // network ID
  513. , std::optional<int64_t> // creationTime
  514. , std::optional<std::string> // capabilities
  515. , std::optional<bool> // enableBroadcast
  516. , std::optional<uint64_t> // lastModified
  517. , std::optional<int> // mtu
  518. , std::optional<int> // multicastLimit
  519. , std::optional<std::string> // name
  520. , bool // private
  521. , std::optional<int> // remoteTraceLevel
  522. , std::optional<std::string> // remoteTraceTarget
  523. , std::optional<uint64_t> // revision
  524. , std::optional<std::string> // rules
  525. , std::optional<std::string> // tags
  526. , std::optional<std::string> // v4AssignMode
  527. , std::optional<std::string> // v6AssignMode
  528. , std::optional<bool> // ssoEnabled
  529. , std::optional<std::string> // clientId
  530. , std::optional<std::string> // authorizationEndpoint
  531. , std::optional<std::string> // ssoProvider
  532. , std::optional<std::string> // domain
  533. , std::optional<std::string> // servers
  534. , std::string // assignmentPoolString
  535. , std::string // routeString
  536. > row;
  537. uint64_t count = 0;
  538. auto tmp = std::chrono::high_resolution_clock::now();
  539. uint64_t total = 0;
  540. while (stream >> row) {
  541. auto start = std::chrono::high_resolution_clock::now();
  542. json empty;
  543. json config;
  544. initNetwork(config);
  545. std::string nwid = std::get<0>(row);
  546. std::optional<int64_t> creationTime = std::get<1>(row);
  547. std::optional<std::string> capabilities = std::get<2>(row);
  548. std::optional<bool> enableBroadcast = std::get<3>(row);
  549. std::optional<uint64_t> lastModified = std::get<4>(row);
  550. std::optional<int> mtu = std::get<5>(row);
  551. std::optional<int> multicastLimit = std::get<6>(row);
  552. std::optional<std::string> name = std::get<7>(row);
  553. bool isPrivate = std::get<8>(row);
  554. std::optional<int> remoteTraceLevel = std::get<9>(row);
  555. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  556. std::optional<uint64_t> revision = std::get<11>(row);
  557. std::optional<std::string> rules = std::get<12>(row);
  558. std::optional<std::string> tags = std::get<13>(row);
  559. std::optional<std::string> v4AssignMode = std::get<14>(row);
  560. std::optional<std::string> v6AssignMode = std::get<15>(row);
  561. std::optional<bool> ssoEnabled = std::get<16>(row);
  562. std::optional<std::string> clientId = std::get<17>(row);
  563. std::optional<std::string> authorizationEndpoint = std::get<18>(row);
  564. std::optional<std::string> ssoProvider = std::get<19>(row);
  565. std::optional<std::string> dnsDomain = std::get<20>(row);
  566. std::optional<std::string> dnsServers = std::get<21>(row);
  567. std::string assignmentPoolString = std::get<22>(row);
  568. std::string routesString = std::get<23>(row);
  569. config["id"] = nwid;
  570. config["nwid"] = nwid;
  571. config["creationTime"] = creationTime.value_or(0);
  572. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  573. config["enableBroadcast"] = enableBroadcast.value_or(false);
  574. config["lastModified"] = lastModified.value_or(0);
  575. config["mtu"] = mtu.value_or(2800);
  576. config["multicastLimit"] = multicastLimit.value_or(64);
  577. config["name"] = name.value_or("");
  578. config["private"] = isPrivate;
  579. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  580. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  581. config["revision"] = revision.value_or(0);
  582. config["rules"] = json::parse(rules.value_or("[]"));
  583. config["tags"] = json::parse(tags.value_or("[]"));
  584. config["v4AssignMode"] = json::parse(v4AssignMode.value_or("{}"));
  585. config["v6AssignMode"] = json::parse(v6AssignMode.value_or("{}"));
  586. config["ssoEnabled"] = ssoEnabled.value_or(false);
  587. config["objtype"] = "network";
  588. config["ipAssignmentPools"] = json::array();
  589. config["routes"] = json::array();
  590. config["clientId"] = clientId.value_or("");
  591. config["authorizationEndpoint"] = authorizationEndpoint.value_or("");
  592. config["provider"] = ssoProvider.value_or("");
  593. networkSet.insert(nwid);
  594. if (dnsDomain.has_value()) {
  595. std::string serverList = dnsServers.value();
  596. json obj;
  597. auto servers = json::array();
  598. if (serverList.rfind("{",0) != std::string::npos) {
  599. serverList = serverList.substr(1, serverList.size()-2);
  600. std::stringstream ss(serverList);
  601. while(ss.good()) {
  602. std::string server;
  603. std::getline(ss, server, ',');
  604. servers.push_back(server);
  605. }
  606. }
  607. obj["domain"] = dnsDomain.value();
  608. obj["servers"] = servers;
  609. config["dns"] = obj;
  610. }
  611. config["ipAssignmentPools"] = json::array();
  612. if (assignmentPoolString != "{}") {
  613. std::string tmp = assignmentPoolString.substr(1, assignmentPoolString.size()-2);
  614. std::vector<std::string> assignmentPools = split(tmp, ',');
  615. for (auto it = assignmentPools.begin(); it != assignmentPools.end(); ++it) {
  616. std::vector<std::string> r = split(*it, '|');
  617. json ip;
  618. ip["ipRangeStart"] = r[0];
  619. ip["ipRangeEnd"] = r[1];
  620. config["ipAssignmentPools"].push_back(ip);
  621. }
  622. }
  623. config["routes"] = json::array();
  624. if (routesString != "{}") {
  625. std::string tmp = routesString.substr(1, routesString.size()-2);
  626. std::vector<std::string> routes = split(tmp, ',');
  627. for (auto it = routes.begin(); it != routes.end(); ++it) {
  628. std::vector<std::string> r = split(*it, '|');
  629. json route;
  630. route["target"] = r[0];
  631. route["via"] = ((route["via"] == "NULL")? nullptr : r[1]);
  632. config["routes"].push_back(route);
  633. }
  634. }
  635. Metrics::network_count++;
  636. _networkChanged(empty, config, false);
  637. auto end = std::chrono::high_resolution_clock::now();
  638. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);;
  639. total += dur.count();
  640. ++count;
  641. if (count > 0 && count % 10000 == 0) {
  642. fprintf(stderr, "Averaging %llu us per network\n", (total/count));
  643. }
  644. }
  645. if (count > 0) {
  646. fprintf(stderr, "Took %llu us per network to load\n", (total/count));
  647. }
  648. stream.complete();
  649. w.commit();
  650. _pool->unborrow(c2);
  651. _pool->unborrow(c);
  652. fprintf(stderr, "done.\n");
  653. if (!networkSet.empty()) {
  654. if (_redisMemberStatus) {
  655. fprintf(stderr, "adding networks to redis...\n");
  656. if (_rc->clusterMode) {
  657. auto tx = _cluster->transaction(_myAddressStr, true, false);
  658. tx.sadd(setKey, networkSet.begin(), networkSet.end());
  659. tx.exec();
  660. } else {
  661. auto tx = _redis->transaction(true, false);
  662. tx.sadd(setKey, networkSet.begin(), networkSet.end());
  663. tx.exec();
  664. }
  665. fprintf(stderr, "done.\n");
  666. }
  667. }
  668. if (++this->_ready == 2) {
  669. if (_waitNoticePrinted) {
  670. fprintf(stderr,"[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S,_timestr(),(unsigned long long)_myAddress.toInt());
  671. }
  672. _readyLock.unlock();
  673. }
  674. fprintf(stderr, "network init done.\n");
  675. } catch (sw::redis::Error &e) {
  676. fprintf(stderr, "ERROR: Error initializing networks in Redis: %s\n", e.what());
  677. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  678. exit(-1);
  679. } catch (std::exception &e) {
  680. fprintf(stderr, "ERROR: Error initializing networks: %s\n", e.what());
  681. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  682. exit(-1);
  683. }
  684. }
  685. void PostgreSQL::initializeMembers()
  686. {
  687. std::string memberId;
  688. std::string networkId;
  689. try {
  690. std::unordered_map<std::string, std::string> networkMembers;
  691. fprintf(stderr, "Initializing Members...\n");
  692. std::string setKeyBase = "network-nodes-all:{" + _myAddressStr + "}:";
  693. if (_redisMemberStatus) {
  694. fprintf(stderr, "Initialize Redis for members...\n");
  695. std::unique_lock<std::shared_mutex> l(_networks_l);
  696. std::unordered_set<std::string> deletes;
  697. for ( auto it : _networks) {
  698. uint64_t nwid_i = it.first;
  699. char nwidTmp[64] = {0};
  700. OSUtils::ztsnprintf(nwidTmp, sizeof(nwidTmp), "%.16llx", nwid_i);
  701. std::string nwid(nwidTmp);
  702. std::string key = setKeyBase + nwid;
  703. deletes.insert(key);
  704. }
  705. if (!deletes.empty()) {
  706. try {
  707. if (_rc->clusterMode) {
  708. auto tx = _cluster->transaction(_myAddressStr, true, false);
  709. for (std::string k : deletes) {
  710. tx.del(k);
  711. }
  712. tx.exec();
  713. } else {
  714. auto tx = _redis->transaction(true, false);
  715. for (std::string k : deletes) {
  716. tx.del(k);
  717. }
  718. tx.exec();
  719. }
  720. } catch (sw::redis::Error &e) {
  721. // ignore
  722. }
  723. }
  724. }
  725. char qbuf[2048];
  726. sprintf(qbuf,
  727. "SELECT m.id, m.network_id, m.active_bridge, m.authorized, m.capabilities, "
  728. "(EXTRACT(EPOCH FROM m.creation_time AT TIME ZONE 'UTC')*1000)::bigint, m.identity, "
  729. "(EXTRACT(EPOCH FROM m.last_authorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  730. "(EXTRACT(EPOCH FROM m.last_deauthorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  731. "m.remote_trace_level, m.remote_trace_target, m.tags, m.v_major, m.v_minor, m.v_rev, m.v_proto, "
  732. "m.no_auto_assign_ips, m.revision, m.sso_exempt, "
  733. "(CASE WHEN n.sso_enabled = TRUE AND m.sso_exempt = FALSE THEN "
  734. " ( "
  735. " SELECT (EXTRACT(EPOCH FROM e.authentication_expiry_time)*1000)::bigint "
  736. " FROM ztc_sso_expiry e "
  737. " INNER JOIN ztc_network n1 "
  738. " ON n1.id = e.network_id AND n1.deleted = TRUE "
  739. " WHERE e.network_id = m.network_id AND e.member_id = m.id AND n.sso_enabled = TRUE AND e.authentication_expiry_time IS NOT NULL "
  740. " ORDER BY e.authentication_expiry_time DESC LIMIT 1 "
  741. " ) "
  742. " ELSE NULL "
  743. " END) AS authentication_expiry_time, "
  744. "ARRAY(SELECT DISTINCT address FROM ztc_member_ip_assignment WHERE member_id = m.id AND network_id = m.network_id) AS assigned_addresses "
  745. "FROM ztc_member m "
  746. "INNER JOIN ztc_network n "
  747. " ON n.id = m.network_id "
  748. "WHERE n.controller_id = '%s' AND n.deleted = FALSE AND m.deleted = FALSE", _myAddressStr.c_str());
  749. auto c = _pool->borrow();
  750. auto c2 = _pool->borrow();
  751. pqxx::work w{*c->c};
  752. fprintf(stderr, "Load members from psql...\n");
  753. auto stream = pqxx::stream_from::query(w, qbuf);
  754. std::tuple<
  755. std::string // memberId
  756. , std::string // memberId
  757. , std::optional<bool> // activeBridge
  758. , std::optional<bool> // authorized
  759. , std::optional<std::string> // capabilities
  760. , std::optional<uint64_t> // creationTime
  761. , std::optional<std::string> // identity
  762. , std::optional<uint64_t> // lastAuthorizedTime
  763. , std::optional<uint64_t> // lastDeauthorizedTime
  764. , std::optional<int> // remoteTraceLevel
  765. , std::optional<std::string> // remoteTraceTarget
  766. , std::optional<std::string> // tags
  767. , std::optional<int> // vMajor
  768. , std::optional<int> // vMinor
  769. , std::optional<int> // vRev
  770. , std::optional<int> // vProto
  771. , std::optional<bool> // noAutoAssignIps
  772. , std::optional<uint64_t> // revision
  773. , std::optional<bool> // ssoExempt
  774. , std::optional<uint64_t> // authenticationExpiryTime
  775. , std::string // assignedAddresses
  776. > row;
  777. uint64_t count = 0;
  778. auto tmp = std::chrono::high_resolution_clock::now();
  779. uint64_t total = 0;
  780. while (stream >> row) {
  781. auto start = std::chrono::high_resolution_clock::now();
  782. json empty;
  783. json config;
  784. initMember(config);
  785. memberId = std::get<0>(row);
  786. networkId = std::get<1>(row);
  787. std::optional<bool> activeBridge = std::get<2>(row);
  788. std::optional<bool> authorized = std::get<3>(row);
  789. std::optional<std::string> capabilities = std::get<4>(row);
  790. std::optional<uint64_t> creationTime = std::get<5>(row);
  791. std::optional<std::string> identity = std::get<6>(row);
  792. std::optional<uint64_t> lastAuthorizedTime = std::get<7>(row);
  793. std::optional<uint64_t> lastDeauthorizedTime = std::get<8>(row);
  794. std::optional<int> remoteTraceLevel = std::get<9>(row);
  795. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  796. std::optional<std::string> tags = std::get<11>(row);
  797. std::optional<int> vMajor = std::get<12>(row);
  798. std::optional<int> vMinor = std::get<13>(row);
  799. std::optional<int> vRev = std::get<14>(row);
  800. std::optional<int> vProto = std::get<15>(row);
  801. std::optional<bool> noAutoAssignIps = std::get<16>(row);
  802. std::optional<uint64_t> revision = std::get<17>(row);
  803. std::optional<bool> ssoExempt = std::get<18>(row);
  804. std::optional<uint64_t> authenticationExpiryTime = std::get<19>(row);
  805. std::string assignedAddresses = std::get<20>(row);
  806. networkMembers.insert(std::pair<std::string, std::string>(setKeyBase+networkId, memberId));
  807. config["id"] = memberId;
  808. config["address"] = memberId;
  809. config["nwid"] = networkId;
  810. config["activeBridge"] = activeBridge.value_or(false);
  811. config["authorized"] = authorized.value_or(false);
  812. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  813. config["creationTime"] = creationTime.value_or(0);
  814. config["identity"] = identity.value_or("");
  815. config["lastAuthorizedTime"] = lastAuthorizedTime.value_or(0);
  816. config["lastDeauthorizedTime"] = lastDeauthorizedTime.value_or(0);
  817. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  818. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  819. config["tags"] = json::parse(tags.value_or("[]"));
  820. config["vMajor"] = vMajor.value_or(-1);
  821. config["vMinor"] = vMinor.value_or(-1);
  822. config["vRev"] = vRev.value_or(-1);
  823. config["vProto"] = vProto.value_or(-1);
  824. config["noAutoAssignIps"] = noAutoAssignIps.value_or(false);
  825. config["revision"] = revision.value_or(0);
  826. config["ssoExempt"] = ssoExempt.value_or(false);
  827. config["authenticationExpiryTime"] = authenticationExpiryTime.value_or(0);
  828. config["objtype"] = "member";
  829. config["ipAssignments"] = json::array();
  830. if (assignedAddresses != "{}") {
  831. std::string tmp = assignedAddresses.substr(1, assignedAddresses.size()-2);
  832. std::vector<std::string> addrs = split(tmp, ',');
  833. for (auto it = addrs.begin(); it != addrs.end(); ++it) {
  834. config["ipAssignments"].push_back(*it);
  835. }
  836. }
  837. Metrics::member_count++;
  838. _memberChanged(empty, config, false);
  839. memberId = "";
  840. networkId = "";
  841. auto end = std::chrono::high_resolution_clock::now();
  842. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);
  843. total += dur.count();
  844. ++count;
  845. if (count > 0 && count % 10000 == 0) {
  846. fprintf(stderr, "Averaging %llu us per member\n", (total/count));
  847. }
  848. }
  849. if (count > 0) {
  850. fprintf(stderr, "Took %llu us per member to load\n", (total/count));
  851. }
  852. stream.complete();
  853. w.commit();
  854. _pool->unborrow(c2);
  855. _pool->unborrow(c);
  856. fprintf(stderr, "done.\n");
  857. if (!networkMembers.empty()) {
  858. if (_redisMemberStatus) {
  859. fprintf(stderr, "Load member data into redis...\n");
  860. if (_rc->clusterMode) {
  861. auto tx = _cluster->transaction(_myAddressStr, true, false);
  862. for (auto it : networkMembers) {
  863. tx.sadd(it.first, it.second);
  864. }
  865. tx.exec();
  866. } else {
  867. auto tx = _redis->transaction(true, false);
  868. for (auto it : networkMembers) {
  869. tx.sadd(it.first, it.second);
  870. }
  871. tx.exec();
  872. }
  873. fprintf(stderr, "done.\n");
  874. }
  875. }
  876. fprintf(stderr, "Done loading members...\n");
  877. if (++this->_ready == 2) {
  878. if (_waitNoticePrinted) {
  879. fprintf(stderr,"[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S,_timestr(),(unsigned long long)_myAddress.toInt());
  880. }
  881. _readyLock.unlock();
  882. }
  883. } catch (sw::redis::Error &e) {
  884. fprintf(stderr, "ERROR: Error initializing members (redis): %s\n", e.what());
  885. exit(-1);
  886. } catch (std::exception &e) {
  887. fprintf(stderr, "ERROR: Error initializing member: %s-%s %s\n", networkId.c_str(), memberId.c_str(), e.what());
  888. exit(-1);
  889. }
  890. }
  891. void PostgreSQL::heartbeat()
  892. {
  893. char publicId[1024];
  894. char hostnameTmp[1024];
  895. _myId.toString(false,publicId);
  896. if (gethostname(hostnameTmp, sizeof(hostnameTmp))!= 0) {
  897. hostnameTmp[0] = (char)0;
  898. } else {
  899. for (int i = 0; i < (int)sizeof(hostnameTmp); ++i) {
  900. if ((hostnameTmp[i] == '.')||(hostnameTmp[i] == 0)) {
  901. hostnameTmp[i] = (char)0;
  902. break;
  903. }
  904. }
  905. }
  906. const char *controllerId = _myAddressStr.c_str();
  907. const char *publicIdentity = publicId;
  908. const char *hostname = hostnameTmp;
  909. while (_run == 1) {
  910. // fprintf(stderr, "%s: heartbeat\n", controllerId);
  911. auto c = _pool->borrow();
  912. int64_t ts = OSUtils::now();
  913. if(c->c) {
  914. std::string major = std::to_string(ZEROTIER_ONE_VERSION_MAJOR);
  915. std::string minor = std::to_string(ZEROTIER_ONE_VERSION_MINOR);
  916. std::string rev = std::to_string(ZEROTIER_ONE_VERSION_REVISION);
  917. std::string build = std::to_string(ZEROTIER_ONE_VERSION_BUILD);
  918. std::string now = std::to_string(ts);
  919. std::string host_port = std::to_string(_listenPort);
  920. std::string use_redis = (_rc != NULL) ? "true" : "false";
  921. std::string redis_mem_status = (_redisMemberStatus) ? "true" : "false";
  922. try {
  923. pqxx::work w{*c->c};
  924. pqxx::result res =
  925. w.exec0("INSERT INTO ztc_controller (id, cluster_host, last_alive, public_identity, v_major, v_minor, v_rev, v_build, host_port, use_redis, redis_member_status) "
  926. "VALUES ("+w.quote(controllerId)+", "+w.quote(hostname)+", TO_TIMESTAMP("+now+"::double precision/1000), "+
  927. w.quote(publicIdentity)+", "+major+", "+minor+", "+rev+", "+build+", "+host_port+", "+use_redis+", "+redis_mem_status+") "
  928. "ON CONFLICT (id) DO UPDATE SET cluster_host = EXCLUDED.cluster_host, last_alive = EXCLUDED.last_alive, "
  929. "public_identity = EXCLUDED.public_identity, v_major = EXCLUDED.v_major, v_minor = EXCLUDED.v_minor, "
  930. "v_rev = EXCLUDED.v_rev, v_build = EXCLUDED.v_rev, host_port = EXCLUDED.host_port, "
  931. "use_redis = EXCLUDED.use_redis, redis_member_status = EXCLUDED.redis_member_status");
  932. w.commit();
  933. } catch (std::exception &e) {
  934. fprintf(stderr, "%s: Heartbeat update failed: %s\n", controllerId, e.what());
  935. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  936. continue;
  937. }
  938. }
  939. _pool->unborrow(c);
  940. try {
  941. if (_redisMemberStatus) {
  942. if (_rc->clusterMode) {
  943. _cluster->zadd("controllers", "controllerId", ts);
  944. } else {
  945. _redis->zadd("controllers", "controllerId", ts);
  946. }
  947. }
  948. } catch (sw::redis::Error &e) {
  949. fprintf(stderr, "ERROR: Redis error in heartbeat thread: %s\n", e.what());
  950. }
  951. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  952. }
  953. fprintf(stderr, "Exited heartbeat thread\n");
  954. }
  955. void PostgreSQL::membersDbWatcher()
  956. {
  957. if (_rc) {
  958. _membersWatcher_Redis();
  959. } else {
  960. _membersWatcher_Postgres();
  961. }
  962. if (_run == 1) {
  963. fprintf(stderr, "ERROR: %s membersDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  964. exit(9);
  965. }
  966. fprintf(stderr, "Exited membersDbWatcher\n");
  967. }
  968. void PostgreSQL::_membersWatcher_Postgres() {
  969. auto c = _pool->borrow();
  970. std::string stream = "member_" + _myAddressStr;
  971. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  972. MemberNotificationReceiver m(this, *c->c, stream);
  973. while(_run == 1) {
  974. c->c->await_notification(5, 0);
  975. }
  976. _pool->unborrow(c);
  977. }
  978. void PostgreSQL::_membersWatcher_Redis() {
  979. char buf[11] = {0};
  980. std::string key = "member-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  981. std::string lastID = "0";
  982. fprintf(stderr, "Listening to member stream: %s\n", key.c_str());
  983. while (_run == 1) {
  984. try {
  985. json tmp;
  986. std::unordered_map<std::string, ItemStream> result;
  987. if (_rc->clusterMode) {
  988. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  989. } else {
  990. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  991. }
  992. if (!result.empty()) {
  993. for (auto element : result) {
  994. #ifdef REDIS_TRACE
  995. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  996. #endif
  997. for (auto rec : element.second) {
  998. std::string id = rec.first;
  999. auto attrs = rec.second;
  1000. #ifdef REDIS_TRACE
  1001. fprintf(stdout, "Record ID: %s\n", id.c_str());
  1002. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  1003. #endif
  1004. for (auto a : attrs) {
  1005. #ifdef REDIS_TRACE
  1006. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  1007. #endif
  1008. try {
  1009. tmp = json::parse(a.second);
  1010. json &ov = tmp["old_val"];
  1011. json &nv = tmp["new_val"];
  1012. json oldConfig, newConfig;
  1013. if (ov.is_object()) oldConfig = ov;
  1014. if (nv.is_object()) newConfig = nv;
  1015. if (oldConfig.is_object()||newConfig.is_object()) {
  1016. _memberChanged(oldConfig,newConfig,(this->_ready >= 2));
  1017. }
  1018. } catch (...) {
  1019. fprintf(stderr, "json parse error in networkWatcher_Redis\n");
  1020. }
  1021. }
  1022. if (_rc->clusterMode) {
  1023. _cluster->xdel(key, id);
  1024. } else {
  1025. _redis->xdel(key, id);
  1026. }
  1027. lastID = id;
  1028. Metrics::redis_mem_notification++;
  1029. }
  1030. }
  1031. }
  1032. } catch (sw::redis::Error &e) {
  1033. fprintf(stderr, "Error in Redis members watcher: %s\n", e.what());
  1034. }
  1035. }
  1036. fprintf(stderr, "membersWatcher ended\n");
  1037. }
  1038. void PostgreSQL::networksDbWatcher()
  1039. {
  1040. if (_rc) {
  1041. _networksWatcher_Redis();
  1042. } else {
  1043. _networksWatcher_Postgres();
  1044. }
  1045. if (_run == 1) {
  1046. fprintf(stderr, "ERROR: %s networksDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1047. exit(8);
  1048. }
  1049. fprintf(stderr, "Exited networksDbWatcher\n");
  1050. }
  1051. void PostgreSQL::_networksWatcher_Postgres() {
  1052. std::string stream = "network_" + _myAddressStr;
  1053. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  1054. auto c = _pool->borrow();
  1055. NetworkNotificationReceiver n(this, *c->c, stream);
  1056. while(_run == 1) {
  1057. c->c->await_notification(5,0);
  1058. }
  1059. }
  1060. void PostgreSQL::_networksWatcher_Redis() {
  1061. char buf[11] = {0};
  1062. std::string key = "network-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  1063. std::string lastID = "0";
  1064. while (_run == 1) {
  1065. try {
  1066. json tmp;
  1067. std::unordered_map<std::string, ItemStream> result;
  1068. if (_rc->clusterMode) {
  1069. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1070. } else {
  1071. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1072. }
  1073. if (!result.empty()) {
  1074. for (auto element : result) {
  1075. #ifdef REDIS_TRACE
  1076. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  1077. #endif
  1078. for (auto rec : element.second) {
  1079. std::string id = rec.first;
  1080. auto attrs = rec.second;
  1081. #ifdef REDIS_TRACE
  1082. fprintf(stdout, "Record ID: %s\n", id.c_str());
  1083. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  1084. #endif
  1085. for (auto a : attrs) {
  1086. #ifdef REDIS_TRACE
  1087. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  1088. #endif
  1089. try {
  1090. tmp = json::parse(a.second);
  1091. json &ov = tmp["old_val"];
  1092. json &nv = tmp["new_val"];
  1093. json oldConfig, newConfig;
  1094. if (ov.is_object()) oldConfig = ov;
  1095. if (nv.is_object()) newConfig = nv;
  1096. if (oldConfig.is_object()||newConfig.is_object()) {
  1097. _networkChanged(oldConfig,newConfig,(this->_ready >= 2));
  1098. }
  1099. } catch (...) {
  1100. fprintf(stderr, "json parse error in networkWatcher_Redis\n");
  1101. }
  1102. }
  1103. if (_rc->clusterMode) {
  1104. _cluster->xdel(key, id);
  1105. } else {
  1106. _redis->xdel(key, id);
  1107. }
  1108. lastID = id;
  1109. }
  1110. Metrics::redis_net_notification++;
  1111. }
  1112. }
  1113. } catch (sw::redis::Error &e) {
  1114. fprintf(stderr, "Error in Redis networks watcher: %s\n", e.what());
  1115. }
  1116. }
  1117. fprintf(stderr, "networksWatcher ended\n");
  1118. }
  1119. void PostgreSQL::commitThread()
  1120. {
  1121. fprintf(stderr, "%s: commitThread start\n", _myAddressStr.c_str());
  1122. std::pair<nlohmann::json,bool> qitem;
  1123. while(_commitQueue.get(qitem)&(_run == 1)) {
  1124. //fprintf(stderr, "commitThread tick\n");
  1125. if (!qitem.first.is_object()) {
  1126. fprintf(stderr, "not an object\n");
  1127. continue;
  1128. }
  1129. std::shared_ptr<PostgresConnection> c;
  1130. try {
  1131. c = _pool->borrow();
  1132. } catch (std::exception &e) {
  1133. fprintf(stderr, "ERROR: %s\n", e.what());
  1134. continue;
  1135. }
  1136. if (!c) {
  1137. fprintf(stderr, "Error getting database connection\n");
  1138. continue;
  1139. }
  1140. Metrics::pgsql_commit_ticks++;
  1141. try {
  1142. nlohmann::json &config = (qitem.first);
  1143. const std::string objtype = config["objtype"];
  1144. if (objtype == "member") {
  1145. // fprintf(stderr, "%s: commitThread: member\n", _myAddressStr.c_str());
  1146. std::string memberId;
  1147. std::string networkId;
  1148. try {
  1149. pqxx::work w(*c->c);
  1150. memberId = config["id"];
  1151. networkId = config["nwid"];
  1152. std::string target = "NULL";
  1153. if (!config["remoteTraceTarget"].is_null()) {
  1154. target = config["remoteTraceTarget"];
  1155. }
  1156. pqxx::row nwrow = w.exec_params1("SELECT COUNT(id) FROM ztc_network WHERE id = $1", networkId);
  1157. int nwcount = nwrow[0].as<int>();
  1158. if (nwcount != 1) {
  1159. fprintf(stderr, "network %s does not exist. skipping member upsert\n", networkId.c_str());
  1160. w.abort();
  1161. _pool->unborrow(c);
  1162. continue;
  1163. }
  1164. pqxx::result res = w.exec_params0(
  1165. "INSERT INTO ztc_member (id, network_id, active_bridge, authorized, capabilities, "
  1166. "identity, last_authorized_time, last_deauthorized_time, no_auto_assign_ips, "
  1167. "remote_trace_level, remote_trace_target, revision, tags, v_major, v_minor, v_rev, v_proto) "
  1168. "VALUES ($1, $2, $3, $4, $5, $6, "
  1169. "TO_TIMESTAMP($7::double precision/1000), TO_TIMESTAMP($8::double precision/1000), "
  1170. "$9, $10, $11, $12, $13, $14, $15, $16, $17) ON CONFLICT (network_id, id) DO UPDATE SET "
  1171. "active_bridge = EXCLUDED.active_bridge, authorized = EXCLUDED.authorized, capabilities = EXCLUDED.capabilities, "
  1172. "identity = EXCLUDED.identity, last_authorized_time = EXCLUDED.last_authorized_time, "
  1173. "last_deauthorized_time = EXCLUDED.last_deauthorized_time, no_auto_assign_ips = EXCLUDED.no_auto_assign_ips, "
  1174. "remote_trace_level = EXCLUDED.remote_trace_level, remote_trace_target = EXCLUDED.remote_trace_target, "
  1175. "revision = EXCLUDED.revision+1, tags = EXCLUDED.tags, v_major = EXCLUDED.v_major, "
  1176. "v_minor = EXCLUDED.v_minor, v_rev = EXCLUDED.v_rev, v_proto = EXCLUDED.v_proto",
  1177. memberId,
  1178. networkId,
  1179. (bool)config["activeBridge"],
  1180. (bool)config["authorized"],
  1181. OSUtils::jsonDump(config["capabilities"], -1),
  1182. OSUtils::jsonString(config["identity"], ""),
  1183. (uint64_t)config["lastAuthorizedTime"],
  1184. (uint64_t)config["lastDeauthorizedTime"],
  1185. (bool)config["noAutoAssignIps"],
  1186. (int)config["remoteTraceLevel"],
  1187. target,
  1188. (uint64_t)config["revision"],
  1189. OSUtils::jsonDump(config["tags"], -1),
  1190. (int)config["vMajor"],
  1191. (int)config["vMinor"],
  1192. (int)config["vRev"],
  1193. (int)config["vProto"]);
  1194. res = w.exec_params0("DELETE FROM ztc_member_ip_assignment WHERE member_id = $1 AND network_id = $2",
  1195. memberId, networkId);
  1196. std::vector<std::string> assignments;
  1197. bool ipAssignError = false;
  1198. for (auto i = config["ipAssignments"].begin(); i != config["ipAssignments"].end(); ++i) {
  1199. std::string addr = *i;
  1200. if (std::find(assignments.begin(), assignments.end(), addr) != assignments.end()) {
  1201. continue;
  1202. }
  1203. res = w.exec_params0(
  1204. "INSERT INTO ztc_member_ip_assignment (member_id, network_id, address) VALUES ($1, $2, $3) ON CONFLICT (network_id, member_id, address) DO NOTHING",
  1205. memberId, networkId, addr);
  1206. assignments.push_back(addr);
  1207. }
  1208. if (ipAssignError) {
  1209. fprintf(stderr, "%s: ipAssignError\n", _myAddressStr.c_str());
  1210. w.abort();
  1211. _pool->unborrow(c);
  1212. c.reset();
  1213. continue;
  1214. }
  1215. w.commit();
  1216. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1217. const uint64_t memberidInt = OSUtils::jsonIntHex(config["id"], 0ULL);
  1218. if (nwidInt && memberidInt) {
  1219. nlohmann::json nwOrig;
  1220. nlohmann::json memOrig;
  1221. nlohmann::json memNew(config);
  1222. get(nwidInt, nwOrig, memberidInt, memOrig);
  1223. _memberChanged(memOrig, memNew, qitem.second);
  1224. } else {
  1225. fprintf(stderr, "%s: Can't notify of change. Error parsing nwid or memberid: %llu-%llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt, (unsigned long long)memberidInt);
  1226. }
  1227. } catch (std::exception &e) {
  1228. fprintf(stderr, "%s ERROR: Error updating member %s-%s: %s\n", _myAddressStr.c_str(), networkId.c_str(), memberId.c_str(), e.what());
  1229. }
  1230. } else if (objtype == "network") {
  1231. try {
  1232. // fprintf(stderr, "%s: commitThread: network\n", _myAddressStr.c_str());
  1233. pqxx::work w(*c->c);
  1234. std::string id = config["id"];
  1235. std::string remoteTraceTarget = "";
  1236. if(!config["remoteTraceTarget"].is_null()) {
  1237. remoteTraceTarget = config["remoteTraceTarget"];
  1238. }
  1239. std::string rulesSource = "";
  1240. if (config["rulesSource"].is_string()) {
  1241. rulesSource = config["rulesSource"];
  1242. }
  1243. // This ugly query exists because when we want to mirror networks to/from
  1244. // another data store (e.g. FileDB or LFDB) it is possible to get a network
  1245. // that doesn't exist in Central's database. This does an upsert and sets
  1246. // the owner_id to the "first" global admin in the user DB if the record
  1247. // did not previously exist. If the record already exists owner_id is left
  1248. // unchanged, so owner_id should be left out of the update clause.
  1249. pqxx::result res = w.exec_params0(
  1250. "INSERT INTO ztc_network (id, creation_time, owner_id, controller_id, capabilities, enable_broadcast, "
  1251. "last_modified, mtu, multicast_limit, name, private, "
  1252. "remote_trace_level, remote_trace_target, rules, rules_source, "
  1253. "tags, v4_assign_mode, v6_assign_mode, sso_enabled) VALUES ("
  1254. "$1, TO_TIMESTAMP($5::double precision/1000), "
  1255. "(SELECT user_id AS owner_id FROM ztc_global_permissions WHERE authorize = true AND del = true AND modify = true AND read = true LIMIT 1),"
  1256. "$2, $3, $4, TO_TIMESTAMP($5::double precision/1000), "
  1257. "$6, $7, $8, $9, $10, $11, $12, $13, $14, $15, $16, $17) "
  1258. "ON CONFLICT (id) DO UPDATE set controller_id = EXCLUDED.controller_id, "
  1259. "capabilities = EXCLUDED.capabilities, enable_broadcast = EXCLUDED.enable_broadcast, "
  1260. "last_modified = EXCLUDED.last_modified, mtu = EXCLUDED.mtu, "
  1261. "multicast_limit = EXCLUDED.multicast_limit, name = EXCLUDED.name, "
  1262. "private = EXCLUDED.private, remote_trace_level = EXCLUDED.remote_trace_level, "
  1263. "remote_trace_target = EXCLUDED.remote_trace_target, rules = EXCLUDED.rules, "
  1264. "rules_source = EXCLUDED.rules_source, tags = EXCLUDED.tags, "
  1265. "v4_assign_mode = EXCLUDED.v4_assign_mode, v6_assign_mode = EXCLUDED.v6_assign_mode, "
  1266. "sso_enabled = EXCLUDED.sso_enabled",
  1267. id,
  1268. _myAddressStr,
  1269. OSUtils::jsonDump(config["capabilities"], -1),
  1270. (bool)config["enableBroadcast"],
  1271. OSUtils::now(),
  1272. (int)config["mtu"],
  1273. (int)config["multicastLimit"],
  1274. OSUtils::jsonString(config["name"],""),
  1275. (bool)config["private"],
  1276. (int)config["remoteTraceLevel"],
  1277. remoteTraceTarget,
  1278. OSUtils::jsonDump(config["rules"], -1),
  1279. rulesSource,
  1280. OSUtils::jsonDump(config["tags"], -1),
  1281. OSUtils::jsonDump(config["v4AssignMode"],-1),
  1282. OSUtils::jsonDump(config["v6AssignMode"], -1),
  1283. OSUtils::jsonBool(config["ssoEnabled"], false));
  1284. res = w.exec_params0("DELETE FROM ztc_network_assignment_pool WHERE network_id = $1", 0);
  1285. auto pool = config["ipAssignmentPools"];
  1286. bool err = false;
  1287. for (auto i = pool.begin(); i != pool.end(); ++i) {
  1288. std::string start = (*i)["ipRangeStart"];
  1289. std::string end = (*i)["ipRangeEnd"];
  1290. res = w.exec_params0(
  1291. "INSERT INTO ztc_network_assignment_pool (network_id, ip_range_start, ip_range_end) "
  1292. "VALUES ($1, $2, $3)", id, start, end);
  1293. }
  1294. res = w.exec_params0("DELETE FROM ztc_network_route WHERE network_id = $1", id);
  1295. auto routes = config["routes"];
  1296. err = false;
  1297. for (auto i = routes.begin(); i != routes.end(); ++i) {
  1298. std::string t = (*i)["target"];
  1299. std::vector<std::string> target;
  1300. std::istringstream f(t);
  1301. std::string s;
  1302. while(std::getline(f, s, '/')) {
  1303. target.push_back(s);
  1304. }
  1305. if (target.empty() || target.size() != 2) {
  1306. continue;
  1307. }
  1308. std::string targetAddr = target[0];
  1309. std::string targetBits = target[1];
  1310. std::string via = "NULL";
  1311. if (!(*i)["via"].is_null()) {
  1312. via = (*i)["via"];
  1313. }
  1314. res = w.exec_params0("INSERT INTO ztc_network_route (network_id, address, bits, via) VALUES ($1, $2, $3, $4)",
  1315. id, targetAddr, targetBits, (via == "NULL" ? NULL : via.c_str()));
  1316. }
  1317. if (err) {
  1318. fprintf(stderr, "%s: route add error\n", _myAddressStr.c_str());
  1319. w.abort();
  1320. _pool->unborrow(c);
  1321. continue;
  1322. }
  1323. auto dns = config["dns"];
  1324. std::string domain = dns["domain"];
  1325. std::stringstream servers;
  1326. servers << "{";
  1327. for (auto j = dns["servers"].begin(); j < dns["servers"].end(); ++j) {
  1328. servers << *j;
  1329. if ( (j+1) != dns["servers"].end()) {
  1330. servers << ",";
  1331. }
  1332. }
  1333. servers << "}";
  1334. std::string s = servers.str();
  1335. res = w.exec_params0("INSERT INTO ztc_network_dns (network_id, domain, servers) VALUES ($1, $2, $3) ON CONFLICT (network_id) DO UPDATE SET domain = EXCLUDED.domain, servers = EXCLUDED.servers",
  1336. id, domain, s);
  1337. w.commit();
  1338. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1339. if (nwidInt) {
  1340. nlohmann::json nwOrig;
  1341. nlohmann::json nwNew(config);
  1342. get(nwidInt, nwOrig);
  1343. _networkChanged(nwOrig, nwNew, qitem.second);
  1344. } else {
  1345. fprintf(stderr, "%s: Can't notify network changed: %llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt);
  1346. }
  1347. } catch (std::exception &e) {
  1348. fprintf(stderr, "%s ERROR: Error updating network: %s\n", _myAddressStr.c_str(), e.what());
  1349. }
  1350. if (_redisMemberStatus) {
  1351. try {
  1352. std::string id = config["id"];
  1353. std::string controllerId = _myAddressStr.c_str();
  1354. std::string key = "networks:{" + controllerId + "}";
  1355. if (_rc->clusterMode) {
  1356. _cluster->sadd(key, id);
  1357. } else {
  1358. _redis->sadd(key, id);
  1359. }
  1360. } catch (sw::redis::Error &e) {
  1361. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1362. }
  1363. }
  1364. } else if (objtype == "_delete_network") {
  1365. // fprintf(stderr, "%s: commitThread: delete network\n", _myAddressStr.c_str());
  1366. try {
  1367. pqxx::work w(*c->c);
  1368. std::string networkId = config["nwid"];
  1369. pqxx::result res = w.exec_params0("UPDATE ztc_network SET deleted = true WHERE id = $1",
  1370. networkId);
  1371. w.commit();
  1372. } catch (std::exception &e) {
  1373. fprintf(stderr, "%s ERROR: Error deleting network: %s\n", _myAddressStr.c_str(), e.what());
  1374. }
  1375. if (_redisMemberStatus) {
  1376. try {
  1377. std::string id = config["id"];
  1378. std::string controllerId = _myAddressStr.c_str();
  1379. std::string key = "networks:{" + controllerId + "}";
  1380. if (_rc->clusterMode) {
  1381. _cluster->srem(key, id);
  1382. _cluster->del("network-nodes-online:{"+controllerId+"}:"+id);
  1383. } else {
  1384. _redis->srem(key, id);
  1385. _redis->del("network-nodes-online:{"+controllerId+"}:"+id);
  1386. }
  1387. } catch (sw::redis::Error &e) {
  1388. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1389. }
  1390. }
  1391. } else if (objtype == "_delete_member") {
  1392. // fprintf(stderr, "%s commitThread: delete member\n", _myAddressStr.c_str());
  1393. try {
  1394. pqxx::work w(*c->c);
  1395. std::string memberId = config["id"];
  1396. std::string networkId = config["nwid"];
  1397. pqxx::result res = w.exec_params0(
  1398. "UPDATE ztc_member SET hidden = true, deleted = true WHERE id = $1 AND network_id = $2",
  1399. memberId, networkId);
  1400. w.commit();
  1401. } catch (std::exception &e) {
  1402. fprintf(stderr, "%s ERROR: Error deleting member: %s\n", _myAddressStr.c_str(), e.what());
  1403. }
  1404. if (_redisMemberStatus) {
  1405. try {
  1406. std::string memberId = config["id"];
  1407. std::string networkId = config["nwid"];
  1408. std::string controllerId = _myAddressStr.c_str();
  1409. std::string key = "network-nodes-all:{" + controllerId + "}:" + networkId;
  1410. if (_rc->clusterMode) {
  1411. _cluster->srem(key, memberId);
  1412. _cluster->del("member:{"+controllerId+"}:"+networkId+":"+memberId);
  1413. } else {
  1414. _redis->srem(key, memberId);
  1415. _redis->del("member:{"+controllerId+"}:"+networkId+":"+memberId);
  1416. }
  1417. } catch (sw::redis::Error &e) {
  1418. fprintf(stderr, "ERROR: Error deleting member from Redis: %s\n", e.what());
  1419. }
  1420. }
  1421. } else {
  1422. fprintf(stderr, "%s ERROR: unknown objtype\n", _myAddressStr.c_str());
  1423. }
  1424. } catch (std::exception &e) {
  1425. fprintf(stderr, "%s ERROR: Error getting objtype: %s\n", _myAddressStr.c_str(), e.what());
  1426. }
  1427. _pool->unborrow(c);
  1428. c.reset();
  1429. }
  1430. fprintf(stderr, "%s commitThread finished\n", _myAddressStr.c_str());
  1431. }
  1432. void PostgreSQL::onlineNotificationThread()
  1433. {
  1434. waitForReady();
  1435. if (_redisMemberStatus) {
  1436. onlineNotification_Redis();
  1437. } else {
  1438. onlineNotification_Postgres();
  1439. }
  1440. }
  /**
   * ONLY UNCOMMENT FOR TEMPORARY DB MAINTENANCE
   *
   * This define temporarily turns off writing to the member status table
   * so it can be reindexed when the indexes get too large.
   */
  // #define DISABLE_MEMBER_STATUS 1
  1448. void PostgreSQL::onlineNotification_Postgres()
  1449. {
  1450. _connected = 1;
  1451. nlohmann::json jtmp1, jtmp2;
  1452. while (_run == 1) {
  1453. auto c = _pool->borrow();
  1454. auto c2 = _pool->borrow();
  1455. try {
  1456. fprintf(stderr, "%s onlineNotification_Postgres\n", _myAddressStr.c_str());
  1457. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > lastOnline;
  1458. {
  1459. std::lock_guard<std::mutex> l(_lastOnline_l);
  1460. lastOnline.swap(_lastOnline);
  1461. }
  1462. #ifndef DISABLE_MEMBER_STATUS
  1463. pqxx::work w(*c->c);
  1464. pqxx::work w2(*c2->c);
  1465. fprintf(stderr, "online notification tick\n");
  1466. bool firstRun = true;
  1467. bool memberAdded = false;
  1468. int updateCount = 0;
  1469. pqxx::pipeline pipe(w);
  1470. for (auto i=lastOnline.begin(); i != lastOnline.end(); ++i) {
  1471. updateCount += 1;
  1472. uint64_t nwid_i = i->first.first;
  1473. char nwidTmp[64];
  1474. char memTmp[64];
  1475. char ipTmp[64];
  1476. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1477. OSUtils::ztsnprintf(memTmp,sizeof(memTmp), "%.10llx", i->first.second);
  1478. if(!get(nwid_i, jtmp1, i->first.second, jtmp2)) {
  1479. continue; // skip non existent networks/members
  1480. }
  1481. std::string networkId(nwidTmp);
  1482. std::string memberId(memTmp);
  1483. try {
  1484. pqxx::row r = w2.exec_params1("SELECT id, network_id FROM ztc_member WHERE network_id = $1 AND id = $2",
  1485. networkId, memberId);
  1486. } catch (pqxx::unexpected_rows &e) {
  1487. continue;
  1488. }
  1489. int64_t ts = i->second.first;
  1490. std::string ipAddr = i->second.second.toIpString(ipTmp);
  1491. std::string timestamp = std::to_string(ts);
  1492. std::stringstream memberUpdate;
  1493. memberUpdate << "INSERT INTO ztc_member_status (network_id, member_id, address, last_updated) VALUES "
  1494. << "('" << networkId << "', '" << memberId << "', ";
  1495. if (ipAddr.empty()) {
  1496. memberUpdate << "NULL, ";
  1497. } else {
  1498. memberUpdate << "'" << ipAddr << "', ";
  1499. }
  1500. memberUpdate << "TO_TIMESTAMP(" << timestamp << "::double precision/1000)) "
  1501. << " ON CONFLICT (network_id, member_id) DO UPDATE SET address = EXCLUDED.address, last_updated = EXCLUDED.last_updated";
  1502. pipe.insert(memberUpdate.str());
  1503. Metrics::pgsql_node_checkin++;
  1504. }
  1505. while(!pipe.empty()) {
  1506. pipe.retrieve();
  1507. }
  1508. pipe.complete();
  1509. w.commit();
  1510. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), updateCount);
  1511. #endif
  1512. } catch (std::exception &e) {
  1513. fprintf(stderr, "%s: error in onlinenotification thread: %s\n", _myAddressStr.c_str(), e.what());
  1514. }
  1515. _pool->unborrow(c2);
  1516. _pool->unborrow(c);
  1517. ConnectionPoolStats stats = _pool->get_stats();
  1518. fprintf(stderr, "%s pool stats: in use size: %llu, available size: %llu, total: %llu\n",
  1519. _myAddressStr.c_str(), stats.borrowed_size, stats.pool_size, (stats.borrowed_size + stats.pool_size));
  1520. std::this_thread::sleep_for(std::chrono::seconds(10));
  1521. }
  1522. fprintf(stderr, "%s: Fell out of run loop in onlineNotificationThread\n", _myAddressStr.c_str());
  1523. if (_run == 1) {
  1524. fprintf(stderr, "ERROR: %s onlineNotificationThread should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1525. exit(6);
  1526. }
  1527. }
  1528. void PostgreSQL::onlineNotification_Redis()
  1529. {
  1530. _connected = 1;
  1531. char buf[11] = {0};
  1532. std::string controllerId = std::string(_myAddress.toString(buf));
  1533. while (_run == 1) {
  1534. fprintf(stderr, "onlineNotification tick\n");
  1535. auto start = std::chrono::high_resolution_clock::now();
  1536. uint64_t count = 0;
  1537. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > lastOnline;
  1538. {
  1539. std::lock_guard<std::mutex> l(_lastOnline_l);
  1540. lastOnline.swap(_lastOnline);
  1541. }
  1542. try {
  1543. if (!lastOnline.empty()) {
  1544. if (_rc->clusterMode) {
  1545. auto tx = _cluster->transaction(controllerId, true, false);
  1546. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1547. } else {
  1548. auto tx = _redis->transaction(true, false);
  1549. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1550. }
  1551. }
  1552. } catch (sw::redis::Error &e) {
  1553. fprintf(stderr, "Error in online notification thread (redis): %s\n", e.what());
  1554. }
  1555. auto end = std::chrono::high_resolution_clock::now();
  1556. auto dur = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
  1557. auto total = dur.count();
  1558. fprintf(stderr, "onlineNotification ran in %llu ms\n", total);
  1559. std::this_thread::sleep_for(std::chrono::seconds(5));
  1560. }
  1561. }
  1562. uint64_t PostgreSQL::_doRedisUpdate(sw::redis::Transaction &tx, std::string &controllerId,
  1563. std::unordered_map< std::pair<uint64_t,uint64_t>,std::pair<int64_t,InetAddress>,_PairHasher > &lastOnline)
  1564. {
  1565. nlohmann::json jtmp1, jtmp2;
  1566. uint64_t count = 0;
  1567. for (auto i=lastOnline.begin(); i != lastOnline.end(); ++i) {
  1568. uint64_t nwid_i = i->first.first;
  1569. uint64_t memberid_i = i->first.second;
  1570. char nwidTmp[64];
  1571. char memTmp[64];
  1572. char ipTmp[64];
  1573. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1574. OSUtils::ztsnprintf(memTmp,sizeof(memTmp), "%.10llx", memberid_i);
  1575. if (!get(nwid_i, jtmp1, memberid_i, jtmp2)){
  1576. continue; // skip non existent members/networks
  1577. }
  1578. std::string networkId(nwidTmp);
  1579. std::string memberId(memTmp);
  1580. int64_t ts = i->second.first;
  1581. std::string ipAddr = i->second.second.toIpString(ipTmp);
  1582. std::string timestamp = std::to_string(ts);
  1583. std::unordered_map<std::string, std::string> record = {
  1584. {"id", memberId},
  1585. {"address", ipAddr},
  1586. {"last_updated", std::to_string(ts)}
  1587. };
  1588. tx.zadd("nodes-online:{"+controllerId+"}", memberId, ts)
  1589. .zadd("nodes-online2:{"+controllerId+"}", networkId+"-"+memberId, ts)
  1590. .zadd("network-nodes-online:{"+controllerId+"}:"+networkId, memberId, ts)
  1591. .zadd("active-networks:{"+controllerId+"}", networkId, ts)
  1592. .sadd("network-nodes-all:{"+controllerId+"}:"+networkId, memberId)
  1593. .hmset("member:{"+controllerId+"}:"+networkId+":"+memberId, record.begin(), record.end());
  1594. ++count;
  1595. Metrics::redis_node_checkin++;
  1596. }
  1597. // expire records from all-nodes and network-nodes member list
  1598. uint64_t expireOld = OSUtils::now() - 300000;
  1599. tx.zremrangebyscore("nodes-online:{"+controllerId+"}",
  1600. sw::redis::RightBoundedInterval<double>(expireOld,
  1601. sw::redis::BoundType::LEFT_OPEN));
  1602. tx.zremrangebyscore("nodes-online2:{"+controllerId+"}",
  1603. sw::redis::RightBoundedInterval<double>(expireOld,
  1604. sw::redis::BoundType::LEFT_OPEN));
  1605. tx.zremrangebyscore("active-networks:{"+controllerId+"}",
  1606. sw::redis::RightBoundedInterval<double>(expireOld,
  1607. sw::redis::BoundType::LEFT_OPEN));
  1608. {
  1609. std::shared_lock<std::shared_mutex> l(_networks_l);
  1610. for (const auto &it : _networks) {
  1611. uint64_t nwid_i = it.first;
  1612. char nwidTmp[64];
  1613. OSUtils::ztsnprintf(nwidTmp,sizeof(nwidTmp), "%.16llx", nwid_i);
  1614. tx.zremrangebyscore("network-nodes-online:{"+controllerId+"}:"+nwidTmp,
  1615. sw::redis::RightBoundedInterval<double>(expireOld, sw::redis::BoundType::LEFT_OPEN));
  1616. }
  1617. }
  1618. tx.exec();
  1619. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), count);
  1620. return count;
  1621. }
  1622. #endif //ZT_CONTROLLER_USE_LIBPQ