CV1.cpp 70 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114
  1. /*
  2. * Copyright (c)2019 ZeroTier, Inc.
  3. *
  4. * Use of this software is governed by the Business Source License included
  5. * in the LICENSE.TXT file in the project's root directory.
  6. *
  7. * Change Date: 2026-01-01
  8. *
  9. * On the date above, in accordance with the Business Source License, use
  10. * of this software will be governed by version 2.0 of the Apache License.
  11. */
  12. /****/
  13. #include "CV1.hpp"
  14. #ifdef ZT_CONTROLLER_USE_LIBPQ
  15. #include "../node/Constants.hpp"
  16. #include "../node/SHA512.hpp"
  17. #include "../version.h"
  18. #include "CtlUtil.hpp"
  19. #include "EmbeddedNetworkController.hpp"
  20. #include "Redis.hpp"
  21. #include "opentelemetry/trace/provider.h"
  22. #include <chrono>
  23. #include <climits>
  24. #include <iomanip>
  25. #include <libpq-fe.h>
  26. #include <rustybits.h>
  27. #include <sstream>
  28. // #define REDIS_TRACE 1
  29. using json = nlohmann::json;
  30. namespace {
  31. static const int DB_MINIMUM_VERSION = 38;
  32. } // anonymous namespace
  33. using namespace ZeroTier;
  34. using Attrs = std::vector<std::pair<std::string, std::string> >;
  35. using Item = std::pair<std::string, Attrs>;
  36. using ItemStream = std::vector<Item>;
  37. CV1::CV1(const Identity& myId, const char* path, int listenPort, RedisConfig* rc)
  38. : DB()
  39. , _pool()
  40. , _myId(myId)
  41. , _myAddress(myId.address())
  42. , _ready(0)
  43. , _connected(1)
  44. , _run(1)
  45. , _waitNoticePrinted(false)
  46. , _listenPort(listenPort)
  47. , _rc(rc)
  48. , _redis(NULL)
  49. , _cluster(NULL)
  50. , _redisMemberStatus(false)
  51. , _smee(NULL)
  52. {
  53. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  54. auto tracer = provider->GetTracer("cv1");
  55. auto span = tracer->StartSpan("cv1::CV1");
  56. auto scope = tracer->WithActiveSpan(span);
  57. rustybits::init_async_runtime();
  58. char myAddress[64];
  59. _myAddressStr = myId.address().toString(myAddress);
  60. _connString = std::string(path);
  61. auto f = std::make_shared<PostgresConnFactory>(_connString);
  62. _pool = std::make_shared<ConnectionPool<PostgresConnection> >(15, 5, std::static_pointer_cast<ConnectionFactory>(f));
  63. memset(_ssoPsk, 0, sizeof(_ssoPsk));
  64. char* const ssoPskHex = getenv("ZT_SSO_PSK");
  65. #ifdef ZT_TRACE
  66. fprintf(stderr, "ZT_SSO_PSK: %s\n", ssoPskHex);
  67. #endif
  68. if (ssoPskHex) {
  69. // SECURITY: note that ssoPskHex will always be null-terminated if libc actually
  70. // returns something non-NULL. If the hex encodes something shorter than 48 bytes,
  71. // it will be padded at the end with zeroes. If longer, it'll be truncated.
  72. Utils::unhex(ssoPskHex, _ssoPsk, sizeof(_ssoPsk));
  73. }
  74. const char* redisMemberStatus = getenv("ZT_REDIS_MEMBER_STATUS");
  75. if (redisMemberStatus && (strcmp(redisMemberStatus, "true") == 0)) {
  76. _redisMemberStatus = true;
  77. fprintf(stderr, "Using redis for member status\n");
  78. }
  79. auto c = _pool->borrow();
  80. pqxx::work txn { *c->c };
  81. pqxx::row r { txn.exec1("SELECT version FROM ztc_database") };
  82. int dbVersion = r[0].as<int>();
  83. txn.commit();
  84. if (dbVersion < DB_MINIMUM_VERSION) {
  85. fprintf(stderr, "Central database schema version too low. This controller version requires a minimum schema version of %d. Please upgrade your Central instance", DB_MINIMUM_VERSION);
  86. exit(1);
  87. }
  88. _pool->unborrow(c);
  89. if (_rc != NULL) {
  90. auto innerspan = tracer->StartSpan("cv1::CV1::configureRedis");
  91. auto innerscope = tracer->WithActiveSpan(innerspan);
  92. sw::redis::ConnectionOptions opts;
  93. sw::redis::ConnectionPoolOptions poolOpts;
  94. opts.host = _rc->hostname;
  95. opts.port = _rc->port;
  96. opts.password = _rc->password;
  97. opts.db = 0;
  98. opts.keep_alive = true;
  99. opts.connect_timeout = std::chrono::seconds(3);
  100. poolOpts.size = 25;
  101. poolOpts.wait_timeout = std::chrono::seconds(5);
  102. poolOpts.connection_lifetime = std::chrono::minutes(3);
  103. poolOpts.connection_idle_time = std::chrono::minutes(1);
  104. if (_rc->clusterMode) {
  105. innerspan->SetAttribute("cluster_mode", "true");
  106. fprintf(stderr, "Using Redis in Cluster Mode\n");
  107. _cluster = std::make_shared<sw::redis::RedisCluster>(opts, poolOpts);
  108. }
  109. else {
  110. innerspan->SetAttribute("cluster_mode", "false");
  111. fprintf(stderr, "Using Redis in Standalone Mode\n");
  112. _redis = std::make_shared<sw::redis::Redis>(opts, poolOpts);
  113. }
  114. }
  115. _readyLock.lock();
  116. fprintf(stderr, "[%s] NOTICE: %.10llx controller PostgreSQL waiting for initial data download..." ZT_EOL_S, ::_timestr(), (unsigned long long)_myAddress.toInt());
  117. _waitNoticePrinted = true;
  118. initializeNetworks();
  119. initializeMembers();
  120. _heartbeatThread = std::thread(&CV1::heartbeat, this);
  121. _membersDbWatcher = std::thread(&CV1::membersDbWatcher, this);
  122. _networksDbWatcher = std::thread(&CV1::networksDbWatcher, this);
  123. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  124. _commitThread[i] = std::thread(&CV1::commitThread, this);
  125. }
  126. _onlineNotificationThread = std::thread(&CV1::onlineNotificationThread, this);
  127. configureSmee();
  128. }
  129. CV1::~CV1()
  130. {
  131. if (_smee != NULL) {
  132. rustybits::smee_client_delete(_smee);
  133. _smee = NULL;
  134. }
  135. rustybits::shutdown_async_runtime();
  136. _run = 0;
  137. std::this_thread::sleep_for(std::chrono::milliseconds(100));
  138. _heartbeatThread.join();
  139. _membersDbWatcher.join();
  140. _networksDbWatcher.join();
  141. _commitQueue.stop();
  142. for (int i = 0; i < ZT_CENTRAL_CONTROLLER_COMMIT_THREADS; ++i) {
  143. _commitThread[i].join();
  144. }
  145. _onlineNotificationThread.join();
  146. }
  147. void CV1::configureSmee()
  148. {
  149. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  150. auto tracer = provider->GetTracer("cv1");
  151. auto span = tracer->StartSpan("cv1::configureSmee");
  152. auto scope = tracer->WithActiveSpan(span);
  153. const char* TEMPORAL_SCHEME = "ZT_TEMPORAL_SCHEME";
  154. const char* TEMPORAL_HOST = "ZT_TEMPORAL_HOST";
  155. const char* TEMPORAL_PORT = "ZT_TEMPORAL_PORT";
  156. const char* TEMPORAL_NAMESPACE = "ZT_TEMPORAL_NAMESPACE";
  157. const char* SMEE_TASK_QUEUE = "ZT_SMEE_TASK_QUEUE";
  158. const char* scheme = getenv(TEMPORAL_SCHEME);
  159. if (scheme == NULL) {
  160. scheme = "http";
  161. }
  162. const char* host = getenv(TEMPORAL_HOST);
  163. const char* port = getenv(TEMPORAL_PORT);
  164. const char* ns = getenv(TEMPORAL_NAMESPACE);
  165. const char* task_queue = getenv(SMEE_TASK_QUEUE);
  166. if (scheme != NULL && host != NULL && port != NULL && ns != NULL && task_queue != NULL) {
  167. fprintf(stderr, "creating smee client\n");
  168. std::string hostPort = std::string(scheme) + std::string("://") + std::string(host) + std::string(":") + std::string(port);
  169. this->_smee = rustybits::smee_client_new(hostPort.c_str(), ns, task_queue);
  170. }
  171. else {
  172. fprintf(stderr, "Smee client not configured\n");
  173. }
  174. }
  175. bool CV1::waitForReady()
  176. {
  177. while (_ready < 2) {
  178. _readyLock.lock();
  179. _readyLock.unlock();
  180. }
  181. return true;
  182. }
  183. bool CV1::isReady()
  184. {
  185. return ((_ready == 2) && (_connected));
  186. }
  187. bool CV1::save(nlohmann::json& record, bool notifyListeners)
  188. {
  189. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  190. auto tracer = provider->GetTracer("cv1");
  191. auto span = tracer->StartSpan("cv1::save");
  192. auto scope = tracer->WithActiveSpan(span);
  193. bool modified = false;
  194. try {
  195. if (! record.is_object()) {
  196. fprintf(stderr, "record is not an object?!?\n");
  197. return false;
  198. }
  199. const std::string objtype = record["objtype"];
  200. if (objtype == "network") {
  201. // fprintf(stderr, "network save\n");
  202. const uint64_t nwid = OSUtils::jsonIntHex(record["id"], 0ULL);
  203. if (nwid) {
  204. nlohmann::json old;
  205. get(nwid, old);
  206. if ((! old.is_object()) || (! _compareRecords(old, record))) {
  207. record["revision"] = OSUtils::jsonInt(record["revision"], 0ULL) + 1ULL;
  208. _commitQueue.post(std::pair<nlohmann::json, bool>(record, notifyListeners));
  209. modified = true;
  210. }
  211. }
  212. }
  213. else if (objtype == "member") {
  214. std::string networkId = record["nwid"];
  215. std::string memberId = record["id"];
  216. const uint64_t nwid = OSUtils::jsonIntHex(record["nwid"], 0ULL);
  217. const uint64_t id = OSUtils::jsonIntHex(record["id"], 0ULL);
  218. // fprintf(stderr, "member save %s-%s\n", networkId.c_str(), memberId.c_str());
  219. if ((id) && (nwid)) {
  220. nlohmann::json network, old;
  221. get(nwid, network, id, old);
  222. if ((! old.is_object()) || (! _compareRecords(old, record))) {
  223. // fprintf(stderr, "commit queue post\n");
  224. record["revision"] = OSUtils::jsonInt(record["revision"], 0ULL) + 1ULL;
  225. _commitQueue.post(std::pair<nlohmann::json, bool>(record, notifyListeners));
  226. modified = true;
  227. }
  228. else {
  229. // fprintf(stderr, "no change\n");
  230. }
  231. }
  232. }
  233. else {
  234. fprintf(stderr, "uhh waaat\n");
  235. }
  236. }
  237. catch (std::exception& e) {
  238. fprintf(stderr, "Error on PostgreSQL::save: %s\n", e.what());
  239. }
  240. catch (...) {
  241. fprintf(stderr, "Unknown error on PostgreSQL::save\n");
  242. }
  243. return modified;
  244. }
  245. void CV1::eraseNetwork(const uint64_t networkId)
  246. {
  247. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  248. auto tracer = provider->GetTracer("cv1");
  249. auto span = tracer->StartSpan("cv1::eraseNetwork");
  250. auto scope = tracer->WithActiveSpan(span);
  251. char networkIdStr[17];
  252. span->SetAttribute("network_id", Utils::hex(networkId, networkIdStr));
  253. fprintf(stderr, "PostgreSQL::eraseNetwork\n");
  254. char tmp2[24];
  255. waitForReady();
  256. Utils::hex(networkId, tmp2);
  257. std::pair<nlohmann::json, bool> tmp;
  258. tmp.first["id"] = tmp2;
  259. tmp.first["objtype"] = "_delete_network";
  260. tmp.second = true;
  261. _commitQueue.post(tmp);
  262. nlohmann::json nullJson;
  263. _networkChanged(tmp.first, nullJson, true);
  264. }
  265. void CV1::eraseMember(const uint64_t networkId, const uint64_t memberId)
  266. {
  267. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  268. auto tracer = provider->GetTracer("cv1");
  269. auto span = tracer->StartSpan("cv1::eraseMember");
  270. auto scope = tracer->WithActiveSpan(span);
  271. char networkIdStr[17];
  272. char memberIdStr[11];
  273. span->SetAttribute("network_id", Utils::hex(networkId, networkIdStr));
  274. span->SetAttribute("member_id", Utils::hex10(memberId, memberIdStr));
  275. fprintf(stderr, "PostgreSQL::eraseMember\n");
  276. char tmp2[24];
  277. waitForReady();
  278. std::pair<nlohmann::json, bool> tmp, nw;
  279. Utils::hex(networkId, tmp2);
  280. tmp.first["nwid"] = tmp2;
  281. Utils::hex(memberId, tmp2);
  282. tmp.first["id"] = tmp2;
  283. tmp.first["objtype"] = "_delete_member";
  284. tmp.second = true;
  285. _commitQueue.post(tmp);
  286. nlohmann::json nullJson;
  287. _memberChanged(tmp.first, nullJson, true);
  288. }
  289. void CV1::nodeIsOnline(const uint64_t networkId, const uint64_t memberId, const InetAddress& physicalAddress, const char* osArch)
  290. {
  291. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  292. auto tracer = provider->GetTracer("cv1");
  293. auto span = tracer->StartSpan("cv1::nodeIsOnline");
  294. auto scope = tracer->WithActiveSpan(span);
  295. char networkIdStr[17];
  296. char memberIdStr[11];
  297. char ipStr[INET6_ADDRSTRLEN];
  298. span->SetAttribute("network_id", Utils::hex(networkId, networkIdStr));
  299. span->SetAttribute("member_id", Utils::hex10(memberId, memberIdStr));
  300. span->SetAttribute("physical_address", physicalAddress.toString(ipStr));
  301. span->SetAttribute("os_arch", osArch);
  302. std::lock_guard<std::mutex> l(_lastOnline_l);
  303. NodeOnlineRecord& i = _lastOnline[std::pair<uint64_t, uint64_t>(networkId, memberId)];
  304. i.lastSeen = OSUtils::now();
  305. if (physicalAddress) {
  306. i.physicalAddress = physicalAddress;
  307. }
  308. i.osArch = std::string(osArch);
  309. }
  310. void CV1::nodeIsOnline(const uint64_t networkId, const uint64_t memberId, const InetAddress& physicalAddress)
  311. {
  312. this->nodeIsOnline(networkId, memberId, physicalAddress, "unknown/unknown");
  313. }
  314. AuthInfo CV1::getSSOAuthInfo(const nlohmann::json& member, const std::string& redirectURL)
  315. {
  316. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  317. auto tracer = provider->GetTracer("cv1");
  318. auto span = tracer->StartSpan("cv1::getSSOAuthInfo");
  319. auto scope = tracer->WithActiveSpan(span);
  320. Metrics::db_get_sso_info++;
  321. // NONCE is just a random character string. no semantic meaning
  322. // state = HMAC SHA384 of Nonce based on shared sso key
  323. //
  324. // need nonce timeout in database? make sure it's used within X time
  325. // X is 5 minutes for now. Make configurable later?
  326. //
  327. // how do we tell when a nonce is used? if auth_expiration_time is set
  328. std::string networkId = member["nwid"];
  329. std::string memberId = member["id"];
  330. char authenticationURL[4096] = { 0 };
  331. AuthInfo info;
  332. info.enabled = true;
  333. // if (memberId == "a10dccea52" && networkId == "8056c2e21c24673d") {
  334. // fprintf(stderr, "invalid authinfo for grant's machine\n");
  335. // info.version=1;
  336. // return info;
  337. // }
  338. // fprintf(stderr, "PostgreSQL::updateMemberOnLoad: %s-%s\n", networkId.c_str(), memberId.c_str());
  339. std::shared_ptr<PostgresConnection> c;
  340. try {
  341. c = _pool->borrow();
  342. pqxx::work w(*c->c);
  343. char nonceBytes[16] = { 0 };
  344. std::string nonce = "";
  345. // check if the member exists first.
  346. pqxx::row count = w.exec_params1("SELECT count(id) FROM ztc_member WHERE id = $1 AND network_id = $2 AND deleted = false", memberId, networkId);
  347. if (count[0].as<int>() == 1) {
  348. // get active nonce, if exists.
  349. pqxx::result r = w.exec_params(
  350. "SELECT nonce FROM ztc_sso_expiry "
  351. "WHERE network_id = $1 AND member_id = $2 "
  352. "AND ((NOW() AT TIME ZONE 'UTC') <= authentication_expiry_time) AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  353. networkId,
  354. memberId);
  355. if (r.size() == 0) {
  356. // no active nonce.
  357. // find an unused nonce, if one exists.
  358. pqxx::result r = w.exec_params(
  359. "SELECT nonce FROM ztc_sso_expiry "
  360. "WHERE network_id = $1 AND member_id = $2 "
  361. "AND authentication_expiry_time IS NULL AND ((NOW() AT TIME ZONE 'UTC') <= nonce_expiration)",
  362. networkId,
  363. memberId);
  364. if (r.size() == 1) {
  365. // we have an existing nonce. Use it
  366. nonce = r.at(0)[0].as<std::string>();
  367. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  368. }
  369. else if (r.empty()) {
  370. // create a nonce
  371. Utils::getSecureRandom(nonceBytes, 16);
  372. char nonceBuf[64] = { 0 };
  373. Utils::hex(nonceBytes, sizeof(nonceBytes), nonceBuf);
  374. nonce = std::string(nonceBuf);
  375. pqxx::result ir = w.exec_params0(
  376. "INSERT INTO ztc_sso_expiry "
  377. "(nonce, nonce_expiration, network_id, member_id) VALUES "
  378. "($1, TO_TIMESTAMP($2::double precision/1000), $3, $4)",
  379. nonce,
  380. OSUtils::now() + 300000,
  381. networkId,
  382. memberId);
  383. w.commit();
  384. }
  385. else {
  386. // > 1 ?!? Thats an error!
  387. fprintf(stderr, "> 1 unused nonce!\n");
  388. exit(6);
  389. }
  390. }
  391. else if (r.size() == 1) {
  392. nonce = r.at(0)[0].as<std::string>();
  393. Utils::unhex(nonce.c_str(), nonceBytes, sizeof(nonceBytes));
  394. }
  395. else {
  396. // more than 1 nonce in use? Uhhh...
  397. fprintf(stderr, "> 1 nonce in use for network member?!?\n");
  398. exit(7);
  399. }
  400. r = w.exec_params(
  401. "SELECT oc.client_id, oc.authorization_endpoint, oc.issuer, oc.provider, oc.sso_impl_version "
  402. "FROM ztc_network AS n "
  403. "INNER JOIN ztc_org o "
  404. " ON o.owner_id = n.owner_id "
  405. "LEFT OUTER JOIN ztc_network_oidc_config noc "
  406. " ON noc.network_id = n.id "
  407. "LEFT OUTER JOIN ztc_oidc_config oc "
  408. " ON noc.client_id = oc.client_id AND oc.org_id = o.org_id "
  409. "WHERE n.id = $1 AND n.sso_enabled = true",
  410. networkId);
  411. std::string client_id = "";
  412. std::string authorization_endpoint = "";
  413. std::string issuer = "";
  414. std::string provider = "";
  415. uint64_t sso_version = 0;
  416. if (r.size() == 1) {
  417. client_id = r.at(0)[0].as<std::optional<std::string> >().value_or("");
  418. authorization_endpoint = r.at(0)[1].as<std::optional<std::string> >().value_or("");
  419. issuer = r.at(0)[2].as<std::optional<std::string> >().value_or("");
  420. provider = r.at(0)[3].as<std::optional<std::string> >().value_or("");
  421. sso_version = r.at(0)[4].as<std::optional<uint64_t> >().value_or(1);
  422. }
  423. else if (r.size() > 1) {
  424. fprintf(stderr, "ERROR: More than one auth endpoint for an organization?!?!? NetworkID: %s\n", networkId.c_str());
  425. }
  426. else {
  427. fprintf(stderr, "No client or auth endpoint?!?\n");
  428. }
  429. info.version = sso_version;
  430. // no catch all else because we don't actually care if no records exist here. just continue as normal.
  431. if ((! client_id.empty()) && (! authorization_endpoint.empty())) {
  432. uint8_t state[48];
  433. HMACSHA384(_ssoPsk, nonceBytes, sizeof(nonceBytes), state);
  434. char state_hex[256];
  435. Utils::hex(state, 48, state_hex);
  436. if (info.version == 0) {
  437. char url[2048] = { 0 };
  438. OSUtils::ztsnprintf(
  439. url,
  440. sizeof(authenticationURL),
  441. "%s?response_type=id_token&response_mode=form_post&scope=openid+email+profile&redirect_uri=%s&nonce=%s&state=%s&client_id=%s",
  442. authorization_endpoint.c_str(),
  443. url_encode(redirectURL).c_str(),
  444. nonce.c_str(),
  445. state_hex,
  446. client_id.c_str());
  447. info.authenticationURL = std::string(url);
  448. }
  449. else if (info.version == 1) {
  450. info.ssoClientID = client_id;
  451. info.issuerURL = issuer;
  452. info.ssoProvider = provider;
  453. info.ssoNonce = nonce;
  454. info.ssoState = std::string(state_hex) + "_" + networkId;
  455. info.centralAuthURL = redirectURL;
  456. #ifdef ZT_DEBUG
  457. fprintf(
  458. stderr,
  459. "ssoClientID: %s\nissuerURL: %s\nssoNonce: %s\nssoState: %s\ncentralAuthURL: %s\nprovider: %s\n",
  460. info.ssoClientID.c_str(),
  461. info.issuerURL.c_str(),
  462. info.ssoNonce.c_str(),
  463. info.ssoState.c_str(),
  464. info.centralAuthURL.c_str(),
  465. provider.c_str());
  466. #endif
  467. }
  468. }
  469. else {
  470. fprintf(stderr, "client_id: %s\nauthorization_endpoint: %s\n", client_id.c_str(), authorization_endpoint.c_str());
  471. }
  472. }
  473. _pool->unborrow(c);
  474. }
  475. catch (std::exception& e) {
  476. span->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  477. fprintf(stderr, "ERROR: Error updating member on load for network %s: %s\n", networkId.c_str(), e.what());
  478. }
  479. return info; // std::string(authenticationURL);
  480. }
  481. void CV1::initializeNetworks()
  482. {
  483. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  484. auto tracer = provider->GetTracer("cv1");
  485. auto span = tracer->StartSpan("cv1::initializeNetworks");
  486. auto scope = tracer->WithActiveSpan(span);
  487. try {
  488. std::string setKey = "networks:{" + _myAddressStr + "}";
  489. fprintf(stderr, "Initializing Networks...\n");
  490. if (_redisMemberStatus) {
  491. fprintf(stderr, "Init Redis for networks...\n");
  492. try {
  493. if (_rc->clusterMode) {
  494. _cluster->del(setKey);
  495. }
  496. else {
  497. _redis->del(setKey);
  498. }
  499. }
  500. catch (sw::redis::Error& e) {
  501. // ignore. if this key doesn't exist, there's no reason to delete it
  502. }
  503. }
  504. std::unordered_set<std::string> networkSet;
  505. char qbuf[2048] = { 0 };
  506. sprintf(
  507. qbuf,
  508. "SELECT n.id, (EXTRACT(EPOCH FROM n.creation_time AT TIME ZONE 'UTC')*1000)::bigint as creation_time, n.capabilities, "
  509. "n.enable_broadcast, (EXTRACT(EPOCH FROM n.last_modified AT TIME ZONE 'UTC')*1000)::bigint AS last_modified, n.mtu, n.multicast_limit, n.name, n.private, n.remote_trace_level, "
  510. "n.remote_trace_target, n.revision, n.rules, n.tags, n.v4_assign_mode, n.v6_assign_mode, n.sso_enabled, (CASE WHEN n.sso_enabled THEN noc.client_id ELSE NULL END) as client_id, "
  511. "(CASE WHEN n.sso_enabled THEN oc.authorization_endpoint ELSE NULL END) as authorization_endpoint, "
  512. "(CASE WHEN n.sso_enabled THEN oc.provider ELSE NULL END) as provider, d.domain, d.servers, "
  513. "ARRAY(SELECT CONCAT(host(ip_range_start),'|', host(ip_range_end)) FROM ztc_network_assignment_pool WHERE network_id = n.id) AS assignment_pool, "
  514. "ARRAY(SELECT CONCAT(host(address),'/',bits::text,'|',COALESCE(host(via), 'NULL'))FROM ztc_network_route WHERE network_id = n.id) AS routes "
  515. "FROM ztc_network n "
  516. "LEFT OUTER JOIN ztc_org o "
  517. " ON o.owner_id = n.owner_id "
  518. "LEFT OUTER JOIN ztc_network_oidc_config noc "
  519. " ON noc.network_id = n.id "
  520. "LEFT OUTER JOIN ztc_oidc_config oc "
  521. " ON noc.client_id = oc.client_id AND oc.org_id = o.org_id "
  522. "LEFT OUTER JOIN ztc_network_dns d "
  523. " ON d.network_id = n.id "
  524. "WHERE deleted = false AND controller_id = '%s'",
  525. _myAddressStr.c_str());
  526. auto c = _pool->borrow();
  527. auto c2 = _pool->borrow();
  528. pqxx::work w { *c->c };
  529. fprintf(stderr, "Load networks from psql...\n");
  530. auto stream = pqxx::stream_from::query(w, qbuf);
  531. std::tuple<
  532. std::string // network ID
  533. ,
  534. std::optional<int64_t> // creationTime
  535. ,
  536. std::optional<std::string> // capabilities
  537. ,
  538. std::optional<bool> // enableBroadcast
  539. ,
  540. std::optional<uint64_t> // lastModified
  541. ,
  542. std::optional<int> // mtu
  543. ,
  544. std::optional<int> // multicastLimit
  545. ,
  546. std::optional<std::string> // name
  547. ,
  548. bool // private
  549. ,
  550. std::optional<int> // remoteTraceLevel
  551. ,
  552. std::optional<std::string> // remoteTraceTarget
  553. ,
  554. std::optional<uint64_t> // revision
  555. ,
  556. std::optional<std::string> // rules
  557. ,
  558. std::optional<std::string> // tags
  559. ,
  560. std::optional<std::string> // v4AssignMode
  561. ,
  562. std::optional<std::string> // v6AssignMode
  563. ,
  564. std::optional<bool> // ssoEnabled
  565. ,
  566. std::optional<std::string> // clientId
  567. ,
  568. std::optional<std::string> // authorizationEndpoint
  569. ,
  570. std::optional<std::string> // ssoProvider
  571. ,
  572. std::optional<std::string> // domain
  573. ,
  574. std::optional<std::string> // servers
  575. ,
  576. std::string // assignmentPoolString
  577. ,
  578. std::string // routeString
  579. >
  580. row;
  581. uint64_t count = 0;
  582. auto tmp = std::chrono::high_resolution_clock::now();
  583. uint64_t total = 0;
  584. while (stream >> row) {
  585. auto start = std::chrono::high_resolution_clock::now();
  586. json empty;
  587. json config;
  588. initNetwork(config);
  589. std::string nwid = std::get<0>(row);
  590. std::optional<int64_t> creationTime = std::get<1>(row);
  591. std::optional<std::string> capabilities = std::get<2>(row);
  592. std::optional<bool> enableBroadcast = std::get<3>(row);
  593. std::optional<uint64_t> lastModified = std::get<4>(row);
  594. std::optional<int> mtu = std::get<5>(row);
  595. std::optional<int> multicastLimit = std::get<6>(row);
  596. std::optional<std::string> name = std::get<7>(row);
  597. bool isPrivate = std::get<8>(row);
  598. std::optional<int> remoteTraceLevel = std::get<9>(row);
  599. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  600. std::optional<uint64_t> revision = std::get<11>(row);
  601. std::optional<std::string> rules = std::get<12>(row);
  602. std::optional<std::string> tags = std::get<13>(row);
  603. std::optional<std::string> v4AssignMode = std::get<14>(row);
  604. std::optional<std::string> v6AssignMode = std::get<15>(row);
  605. std::optional<bool> ssoEnabled = std::get<16>(row);
  606. std::optional<std::string> clientId = std::get<17>(row);
  607. std::optional<std::string> authorizationEndpoint = std::get<18>(row);
  608. std::optional<std::string> ssoProvider = std::get<19>(row);
  609. std::optional<std::string> dnsDomain = std::get<20>(row);
  610. std::optional<std::string> dnsServers = std::get<21>(row);
  611. std::string assignmentPoolString = std::get<22>(row);
  612. std::string routesString = std::get<23>(row);
  613. config["id"] = nwid;
  614. config["nwid"] = nwid;
  615. config["creationTime"] = creationTime.value_or(0);
  616. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  617. config["enableBroadcast"] = enableBroadcast.value_or(false);
  618. config["lastModified"] = lastModified.value_or(0);
  619. config["mtu"] = mtu.value_or(2800);
  620. config["multicastLimit"] = multicastLimit.value_or(64);
  621. config["name"] = name.value_or("");
  622. config["private"] = isPrivate;
  623. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  624. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  625. config["revision"] = revision.value_or(0);
  626. config["rules"] = json::parse(rules.value_or("[]"));
  627. config["tags"] = json::parse(tags.value_or("[]"));
  628. config["v4AssignMode"] = json::parse(v4AssignMode.value_or("{}"));
  629. config["v6AssignMode"] = json::parse(v6AssignMode.value_or("{}"));
  630. config["ssoEnabled"] = ssoEnabled.value_or(false);
  631. config["objtype"] = "network";
  632. config["ipAssignmentPools"] = json::array();
  633. config["routes"] = json::array();
  634. config["clientId"] = clientId.value_or("");
  635. config["authorizationEndpoint"] = authorizationEndpoint.value_or("");
  636. config["provider"] = ssoProvider.value_or("");
  637. networkSet.insert(nwid);
  638. if (dnsDomain.has_value()) {
  639. std::string serverList = dnsServers.value();
  640. json obj;
  641. auto servers = json::array();
  642. if (serverList.rfind("{", 0) != std::string::npos) {
  643. serverList = serverList.substr(1, serverList.size() - 2);
  644. std::stringstream ss(serverList);
  645. while (ss.good()) {
  646. std::string server;
  647. std::getline(ss, server, ',');
  648. servers.push_back(server);
  649. }
  650. }
  651. obj["domain"] = dnsDomain.value();
  652. obj["servers"] = servers;
  653. config["dns"] = obj;
  654. }
  655. config["ipAssignmentPools"] = json::array();
  656. if (assignmentPoolString != "{}") {
  657. std::string tmp = assignmentPoolString.substr(1, assignmentPoolString.size() - 2);
  658. std::vector<std::string> assignmentPools = split(tmp, ',');
  659. for (auto it = assignmentPools.begin(); it != assignmentPools.end(); ++it) {
  660. std::vector<std::string> r = split(*it, '|');
  661. json ip;
  662. ip["ipRangeStart"] = r[0];
  663. ip["ipRangeEnd"] = r[1];
  664. config["ipAssignmentPools"].push_back(ip);
  665. }
  666. }
  667. config["routes"] = json::array();
  668. if (routesString != "{}") {
  669. std::string tmp = routesString.substr(1, routesString.size() - 2);
  670. std::vector<std::string> routes = split(tmp, ',');
  671. for (auto it = routes.begin(); it != routes.end(); ++it) {
  672. std::vector<std::string> r = split(*it, '|');
  673. json route;
  674. route["target"] = r[0];
  675. route["via"] = ((route["via"] == "NULL") ? nullptr : r[1]);
  676. config["routes"].push_back(route);
  677. }
  678. }
  679. Metrics::network_count++;
  680. _networkChanged(empty, config, false);
  681. auto end = std::chrono::high_resolution_clock::now();
  682. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);
  683. ;
  684. total += dur.count();
  685. ++count;
  686. if (count > 0 && count % 10000 == 0) {
  687. fprintf(stderr, "Averaging %llu us per network\n", (total / count));
  688. }
  689. }
  690. if (count > 0) {
  691. fprintf(stderr, "Took %llu us per network to load\n", (total / count));
  692. }
  693. stream.complete();
  694. w.commit();
  695. _pool->unborrow(c2);
  696. _pool->unborrow(c);
  697. fprintf(stderr, "done.\n");
  698. if (! networkSet.empty()) {
  699. if (_redisMemberStatus) {
  700. fprintf(stderr, "adding networks to redis...\n");
  701. if (_rc->clusterMode) {
  702. auto tx = _cluster->transaction(_myAddressStr, true, false);
  703. uint64_t count = 0;
  704. for (std::string nwid : networkSet) {
  705. tx.sadd(setKey, nwid);
  706. if (++count % 30000 == 0) {
  707. tx.exec();
  708. tx = _cluster->transaction(_myAddressStr, true, false);
  709. }
  710. }
  711. tx.exec();
  712. }
  713. else {
  714. auto tx = _redis->transaction(true, false);
  715. uint64_t count = 0;
  716. for (std::string nwid : networkSet) {
  717. tx.sadd(setKey, nwid);
  718. if (++count % 30000 == 0) {
  719. tx.exec();
  720. tx = _redis->transaction(true, false);
  721. }
  722. }
  723. tx.exec();
  724. }
  725. fprintf(stderr, "done.\n");
  726. }
  727. }
  728. if (++this->_ready == 2) {
  729. if (_waitNoticePrinted) {
  730. fprintf(stderr, "[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S, _timestr(), (unsigned long long)_myAddress.toInt());
  731. }
  732. _readyLock.unlock();
  733. }
  734. fprintf(stderr, "network init done.\n");
  735. }
  736. catch (sw::redis::Error& e) {
  737. span->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  738. fprintf(stderr, "ERROR: Error initializing networks in Redis: %s\n", e.what());
  739. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  740. exit(-1);
  741. }
  742. catch (std::exception& e) {
  743. span->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  744. fprintf(stderr, "ERROR: Error initializing networks: %s\n", e.what());
  745. std::this_thread::sleep_for(std::chrono::milliseconds(5000));
  746. exit(-1);
  747. }
  748. }
  749. void CV1::initializeMembers()
  750. {
  751. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  752. auto tracer = provider->GetTracer("cv1");
  753. auto span = tracer->StartSpan("cv1::initializeMembers");
  754. auto scope = tracer->WithActiveSpan(span);
  755. std::string memberId;
  756. std::string networkId;
  757. try {
  758. std::unordered_map<std::string, std::string> networkMembers;
  759. fprintf(stderr, "Initializing Members...\n");
  760. std::string setKeyBase = "network-nodes-all:{" + _myAddressStr + "}:";
  761. if (_redisMemberStatus) {
  762. fprintf(stderr, "Initialize Redis for members...\n");
  763. std::unique_lock<std::shared_mutex> l(_networks_l);
  764. std::unordered_set<std::string> deletes;
  765. for (auto it : _networks) {
  766. uint64_t nwid_i = it.first;
  767. char nwidTmp[64] = { 0 };
  768. OSUtils::ztsnprintf(nwidTmp, sizeof(nwidTmp), "%.16llx", nwid_i);
  769. std::string nwid(nwidTmp);
  770. std::string key = setKeyBase + nwid;
  771. deletes.insert(key);
  772. }
  773. if (! deletes.empty()) {
  774. try {
  775. if (_rc->clusterMode) {
  776. auto tx = _cluster->transaction(_myAddressStr, true, false);
  777. for (std::string k : deletes) {
  778. tx.del(k);
  779. }
  780. tx.exec();
  781. }
  782. else {
  783. auto tx = _redis->transaction(true, false);
  784. for (std::string k : deletes) {
  785. tx.del(k);
  786. }
  787. tx.exec();
  788. }
  789. }
  790. catch (sw::redis::Error& e) {
  791. // ignore
  792. }
  793. }
  794. }
  795. char qbuf[2048];
  796. sprintf(
  797. qbuf,
  798. "SELECT m.id, m.network_id, m.active_bridge, m.authorized, m.capabilities, "
  799. "(EXTRACT(EPOCH FROM m.creation_time AT TIME ZONE 'UTC')*1000)::bigint, m.identity, "
  800. "(EXTRACT(EPOCH FROM m.last_authorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  801. "(EXTRACT(EPOCH FROM m.last_deauthorized_time AT TIME ZONE 'UTC')*1000)::bigint, "
  802. "m.remote_trace_level, m.remote_trace_target, m.tags, m.v_major, m.v_minor, m.v_rev, m.v_proto, "
  803. "m.no_auto_assign_ips, m.revision, m.sso_exempt, "
  804. "(CASE WHEN n.sso_enabled = TRUE AND m.sso_exempt = FALSE THEN "
  805. " ( "
  806. " SELECT (EXTRACT(EPOCH FROM e.authentication_expiry_time)*1000)::bigint "
  807. " FROM ztc_sso_expiry e "
  808. " INNER JOIN ztc_network n1 "
  809. " ON n1.id = e.network_id AND n1.deleted = TRUE "
  810. " WHERE e.network_id = m.network_id AND e.member_id = m.id AND n.sso_enabled = TRUE AND e.authentication_expiry_time IS NOT NULL "
  811. " ORDER BY e.authentication_expiry_time DESC LIMIT 1 "
  812. " ) "
  813. " ELSE NULL "
  814. " END) AS authentication_expiry_time, "
  815. "ARRAY(SELECT DISTINCT address FROM ztc_member_ip_assignment WHERE member_id = m.id AND network_id = m.network_id) AS assigned_addresses "
  816. "FROM ztc_member m "
  817. "INNER JOIN ztc_network n "
  818. " ON n.id = m.network_id "
  819. "WHERE n.controller_id = '%s' AND n.deleted = FALSE AND m.deleted = FALSE",
  820. _myAddressStr.c_str());
  821. auto c = _pool->borrow();
  822. auto c2 = _pool->borrow();
  823. pqxx::work w { *c->c };
  824. fprintf(stderr, "Load members from psql...\n");
  825. auto stream = pqxx::stream_from::query(w, qbuf);
  826. std::tuple<
  827. std::string // memberId
  828. ,
  829. std::string // memberId
  830. ,
  831. std::optional<bool> // activeBridge
  832. ,
  833. std::optional<bool> // authorized
  834. ,
  835. std::optional<std::string> // capabilities
  836. ,
  837. std::optional<uint64_t> // creationTime
  838. ,
  839. std::optional<std::string> // identity
  840. ,
  841. std::optional<uint64_t> // lastAuthorizedTime
  842. ,
  843. std::optional<uint64_t> // lastDeauthorizedTime
  844. ,
  845. std::optional<int> // remoteTraceLevel
  846. ,
  847. std::optional<std::string> // remoteTraceTarget
  848. ,
  849. std::optional<std::string> // tags
  850. ,
  851. std::optional<int> // vMajor
  852. ,
  853. std::optional<int> // vMinor
  854. ,
  855. std::optional<int> // vRev
  856. ,
  857. std::optional<int> // vProto
  858. ,
  859. std::optional<bool> // noAutoAssignIps
  860. ,
  861. std::optional<uint64_t> // revision
  862. ,
  863. std::optional<bool> // ssoExempt
  864. ,
  865. std::optional<uint64_t> // authenticationExpiryTime
  866. ,
  867. std::string // assignedAddresses
  868. >
  869. row;
  870. uint64_t count = 0;
  871. auto tmp = std::chrono::high_resolution_clock::now();
  872. uint64_t total = 0;
  873. while (stream >> row) {
  874. auto start = std::chrono::high_resolution_clock::now();
  875. json empty;
  876. json config;
  877. initMember(config);
  878. memberId = std::get<0>(row);
  879. networkId = std::get<1>(row);
  880. std::optional<bool> activeBridge = std::get<2>(row);
  881. std::optional<bool> authorized = std::get<3>(row);
  882. std::optional<std::string> capabilities = std::get<4>(row);
  883. std::optional<uint64_t> creationTime = std::get<5>(row);
  884. std::optional<std::string> identity = std::get<6>(row);
  885. std::optional<uint64_t> lastAuthorizedTime = std::get<7>(row);
  886. std::optional<uint64_t> lastDeauthorizedTime = std::get<8>(row);
  887. std::optional<int> remoteTraceLevel = std::get<9>(row);
  888. std::optional<std::string> remoteTraceTarget = std::get<10>(row);
  889. std::optional<std::string> tags = std::get<11>(row);
  890. std::optional<int> vMajor = std::get<12>(row);
  891. std::optional<int> vMinor = std::get<13>(row);
  892. std::optional<int> vRev = std::get<14>(row);
  893. std::optional<int> vProto = std::get<15>(row);
  894. std::optional<bool> noAutoAssignIps = std::get<16>(row);
  895. std::optional<uint64_t> revision = std::get<17>(row);
  896. std::optional<bool> ssoExempt = std::get<18>(row);
  897. std::optional<uint64_t> authenticationExpiryTime = std::get<19>(row);
  898. std::string assignedAddresses = std::get<20>(row);
  899. networkMembers.insert(std::pair<std::string, std::string>(setKeyBase + networkId, memberId));
  900. config["id"] = memberId;
  901. config["address"] = memberId;
  902. config["nwid"] = networkId;
  903. config["activeBridge"] = activeBridge.value_or(false);
  904. config["authorized"] = authorized.value_or(false);
  905. config["capabilities"] = json::parse(capabilities.value_or("[]"));
  906. config["creationTime"] = creationTime.value_or(0);
  907. config["identity"] = identity.value_or("");
  908. config["lastAuthorizedTime"] = lastAuthorizedTime.value_or(0);
  909. config["lastDeauthorizedTime"] = lastDeauthorizedTime.value_or(0);
  910. config["remoteTraceLevel"] = remoteTraceLevel.value_or(0);
  911. config["remoteTraceTarget"] = remoteTraceTarget.value_or("");
  912. config["tags"] = json::parse(tags.value_or("[]"));
  913. config["vMajor"] = vMajor.value_or(-1);
  914. config["vMinor"] = vMinor.value_or(-1);
  915. config["vRev"] = vRev.value_or(-1);
  916. config["vProto"] = vProto.value_or(-1);
  917. config["noAutoAssignIps"] = noAutoAssignIps.value_or(false);
  918. config["revision"] = revision.value_or(0);
  919. config["ssoExempt"] = ssoExempt.value_or(false);
  920. config["authenticationExpiryTime"] = authenticationExpiryTime.value_or(0);
  921. config["objtype"] = "member";
  922. config["ipAssignments"] = json::array();
  923. if (assignedAddresses != "{}") {
  924. std::string tmp = assignedAddresses.substr(1, assignedAddresses.size() - 2);
  925. std::vector<std::string> addrs = split(tmp, ',');
  926. for (auto it = addrs.begin(); it != addrs.end(); ++it) {
  927. config["ipAssignments"].push_back(*it);
  928. }
  929. }
  930. Metrics::member_count++;
  931. _memberChanged(empty, config, false);
  932. memberId = "";
  933. networkId = "";
  934. auto end = std::chrono::high_resolution_clock::now();
  935. auto dur = std::chrono::duration_cast<std::chrono::microseconds>(end - start);
  936. total += dur.count();
  937. ++count;
  938. if (count > 0 && count % 10000 == 0) {
  939. fprintf(stderr, "Averaging %llu us per member\n", (total / count));
  940. }
  941. }
  942. if (count > 0) {
  943. fprintf(stderr, "Took %llu us per member to load\n", (total / count));
  944. }
  945. stream.complete();
  946. w.commit();
  947. _pool->unborrow(c2);
  948. _pool->unborrow(c);
  949. fprintf(stderr, "done.\n");
  950. if (! networkMembers.empty()) {
  951. if (_redisMemberStatus) {
  952. fprintf(stderr, "Load member data into redis...\n");
  953. if (_rc->clusterMode) {
  954. auto tx = _cluster->transaction(_myAddressStr, true, false);
  955. uint64_t count = 0;
  956. for (auto it : networkMembers) {
  957. tx.sadd(it.first, it.second);
  958. if (++count % 30000 == 0) {
  959. tx.exec();
  960. tx = _cluster->transaction(_myAddressStr, true, false);
  961. }
  962. }
  963. tx.exec();
  964. }
  965. else {
  966. auto tx = _redis->transaction(true, false);
  967. uint64_t count = 0;
  968. for (auto it : networkMembers) {
  969. tx.sadd(it.first, it.second);
  970. if (++count % 30000 == 0) {
  971. tx.exec();
  972. tx = _redis->transaction(true, false);
  973. }
  974. }
  975. tx.exec();
  976. }
  977. fprintf(stderr, "done.\n");
  978. }
  979. }
  980. fprintf(stderr, "Done loading members...\n");
  981. if (++this->_ready == 2) {
  982. if (_waitNoticePrinted) {
  983. fprintf(stderr, "[%s] NOTICE: %.10llx controller PostgreSQL data download complete." ZT_EOL_S, _timestr(), (unsigned long long)_myAddress.toInt());
  984. }
  985. _readyLock.unlock();
  986. }
  987. }
  988. catch (sw::redis::Error& e) {
  989. span->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  990. fprintf(stderr, "ERROR: Error initializing members (redis): %s\n", e.what());
  991. exit(-1);
  992. }
  993. catch (std::exception& e) {
  994. span->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  995. fprintf(stderr, "ERROR: Error initializing member: %s-%s %s\n", networkId.c_str(), memberId.c_str(), e.what());
  996. exit(-1);
  997. }
  998. }
  999. void CV1::heartbeat()
  1000. {
  1001. char publicId[1024];
  1002. char hostnameTmp[1024];
  1003. _myId.toString(false, publicId);
  1004. if (gethostname(hostnameTmp, sizeof(hostnameTmp)) != 0) {
  1005. hostnameTmp[0] = (char)0;
  1006. }
  1007. else {
  1008. for (int i = 0; i < (int)sizeof(hostnameTmp); ++i) {
  1009. if ((hostnameTmp[i] == '.') || (hostnameTmp[i] == 0)) {
  1010. hostnameTmp[i] = (char)0;
  1011. break;
  1012. }
  1013. }
  1014. }
  1015. const char* controllerId = _myAddressStr.c_str();
  1016. const char* publicIdentity = publicId;
  1017. const char* hostname = hostnameTmp;
  1018. while (_run == 1) {
  1019. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1020. auto tracer = provider->GetTracer("cv1");
  1021. auto span = tracer->StartSpan("cv1::heartbeat");
  1022. auto scope = tracer->WithActiveSpan(span);
  1023. // fprintf(stderr, "%s: heartbeat\n", controllerId);
  1024. auto c = _pool->borrow();
  1025. int64_t ts = OSUtils::now();
  1026. if (c->c) {
  1027. std::string major = std::to_string(ZEROTIER_ONE_VERSION_MAJOR);
  1028. std::string minor = std::to_string(ZEROTIER_ONE_VERSION_MINOR);
  1029. std::string rev = std::to_string(ZEROTIER_ONE_VERSION_REVISION);
  1030. std::string build = std::to_string(ZEROTIER_ONE_VERSION_BUILD);
  1031. std::string now = std::to_string(ts);
  1032. std::string host_port = std::to_string(_listenPort);
  1033. std::string use_redis = (_rc != NULL) ? "true" : "false";
  1034. std::string redis_mem_status = (_redisMemberStatus) ? "true" : "false";
  1035. try {
  1036. pqxx::work w { *c->c };
  1037. pqxx::result res = w.exec0(
  1038. "INSERT INTO ztc_controller (id, cluster_host, last_alive, public_identity, v_major, v_minor, v_rev, v_build, host_port, use_redis, redis_member_status) "
  1039. "VALUES ("
  1040. + w.quote(controllerId) + ", " + w.quote(hostname) + ", TO_TIMESTAMP(" + now + "::double precision/1000), " + w.quote(publicIdentity) + ", " + major + ", " + minor + ", " + rev + ", " + build + ", " + host_port + ", "
  1041. + use_redis + ", " + redis_mem_status
  1042. + ") "
  1043. "ON CONFLICT (id) DO UPDATE SET cluster_host = EXCLUDED.cluster_host, last_alive = EXCLUDED.last_alive, "
  1044. "public_identity = EXCLUDED.public_identity, v_major = EXCLUDED.v_major, v_minor = EXCLUDED.v_minor, "
  1045. "v_rev = EXCLUDED.v_rev, v_build = EXCLUDED.v_rev, host_port = EXCLUDED.host_port, "
  1046. "use_redis = EXCLUDED.use_redis, redis_member_status = EXCLUDED.redis_member_status");
  1047. w.commit();
  1048. }
  1049. catch (std::exception& e) {
  1050. fprintf(stderr, "%s: Heartbeat update failed: %s\n", controllerId, e.what());
  1051. span->End();
  1052. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  1053. continue;
  1054. }
  1055. }
  1056. _pool->unborrow(c);
  1057. try {
  1058. if (_redisMemberStatus) {
  1059. if (_rc->clusterMode) {
  1060. _cluster->zadd("controllers", "controllerId", ts);
  1061. }
  1062. else {
  1063. _redis->zadd("controllers", "controllerId", ts);
  1064. }
  1065. }
  1066. }
  1067. catch (sw::redis::Error& e) {
  1068. fprintf(stderr, "ERROR: Redis error in heartbeat thread: %s\n", e.what());
  1069. }
  1070. span->End();
  1071. std::this_thread::sleep_for(std::chrono::milliseconds(1000));
  1072. }
  1073. fprintf(stderr, "Exited heartbeat thread\n");
  1074. }
  1075. void CV1::membersDbWatcher()
  1076. {
  1077. if (_rc) {
  1078. _membersWatcher_Redis();
  1079. }
  1080. else {
  1081. _membersWatcher_Postgres();
  1082. }
  1083. if (_run == 1) {
  1084. fprintf(stderr, "ERROR: %s membersDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1085. exit(9);
  1086. }
  1087. fprintf(stderr, "Exited membersDbWatcher\n");
  1088. }
  1089. void CV1::_membersWatcher_Postgres()
  1090. {
  1091. auto c = _pool->borrow();
  1092. std::string stream = "member_" + _myAddressStr;
  1093. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  1094. MemberNotificationReceiver<CV1> m(this, *c->c, stream);
  1095. while (_run == 1) {
  1096. c->c->await_notification(5, 0);
  1097. }
  1098. _pool->unborrow(c);
  1099. }
  1100. void CV1::_membersWatcher_Redis()
  1101. {
  1102. char buf[11] = { 0 };
  1103. std::string key = "member-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  1104. std::string lastID = "0";
  1105. fprintf(stderr, "Listening to member stream: %s\n", key.c_str());
  1106. while (_run == 1) {
  1107. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1108. auto tracer = provider->GetTracer("cv1");
  1109. auto span = tracer->StartSpan("cv1::_membersWatcher_Redis");
  1110. auto scope = tracer->WithActiveSpan(span);
  1111. try {
  1112. json tmp;
  1113. std::unordered_map<std::string, ItemStream> result;
  1114. if (_rc->clusterMode) {
  1115. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1116. }
  1117. else {
  1118. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1119. }
  1120. if (! result.empty()) {
  1121. for (auto element : result) {
  1122. #ifdef REDIS_TRACE
  1123. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  1124. #endif
  1125. for (auto rec : element.second) {
  1126. std::string id = rec.first;
  1127. auto attrs = rec.second;
  1128. #ifdef REDIS_TRACE
  1129. fprintf(stdout, "Record ID: %s\n", id.c_str());
  1130. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  1131. #endif
  1132. for (auto a : attrs) {
  1133. #ifdef REDIS_TRACE
  1134. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  1135. #endif
  1136. try {
  1137. tmp = json::parse(a.second);
  1138. json& ov = tmp["old_val"];
  1139. json& nv = tmp["new_val"];
  1140. json oldConfig, newConfig;
  1141. if (ov.is_object())
  1142. oldConfig = ov;
  1143. if (nv.is_object())
  1144. newConfig = nv;
  1145. if (oldConfig.is_object() || newConfig.is_object()) {
  1146. _memberChanged(oldConfig, newConfig, (this->_ready >= 2));
  1147. }
  1148. }
  1149. catch (...) {
  1150. fprintf(stderr, "json parse error in _membersWatcher_Redis: %s\n", a.second.c_str());
  1151. }
  1152. }
  1153. if (_rc->clusterMode) {
  1154. _cluster->xdel(key, id);
  1155. }
  1156. else {
  1157. _redis->xdel(key, id);
  1158. }
  1159. lastID = id;
  1160. Metrics::redis_mem_notification++;
  1161. }
  1162. }
  1163. }
  1164. }
  1165. catch (sw::redis::Error& e) {
  1166. span->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1167. fprintf(stderr, "Error in Redis members watcher: %s\n", e.what());
  1168. }
  1169. }
  1170. fprintf(stderr, "membersWatcher ended\n");
  1171. }
  1172. void CV1::networksDbWatcher()
  1173. {
  1174. if (_rc) {
  1175. _networksWatcher_Redis();
  1176. }
  1177. else {
  1178. _networksWatcher_Postgres();
  1179. }
  1180. if (_run == 1) {
  1181. fprintf(stderr, "ERROR: %s networksDbWatcher should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1182. exit(8);
  1183. }
  1184. fprintf(stderr, "Exited networksDbWatcher\n");
  1185. }
  1186. void CV1::_networksWatcher_Postgres()
  1187. {
  1188. std::string stream = "network_" + _myAddressStr;
  1189. fprintf(stderr, "Listening to member stream: %s\n", stream.c_str());
  1190. auto c = _pool->borrow();
  1191. NetworkNotificationReceiver<CV1> n(this, *c->c, stream);
  1192. while (_run == 1) {
  1193. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1194. auto tracer = provider->GetTracer("cv1");
  1195. auto span = tracer->StartSpan("cv1::_networksWatcher_Postgres");
  1196. auto scope = tracer->WithActiveSpan(span);
  1197. c->c->await_notification(5, 0);
  1198. }
  1199. }
  1200. void CV1::_networksWatcher_Redis()
  1201. {
  1202. char buf[11] = { 0 };
  1203. std::string key = "network-stream:{" + std::string(_myAddress.toString(buf)) + "}";
  1204. std::string lastID = "0";
  1205. while (_run == 1) {
  1206. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1207. auto tracer = provider->GetTracer("cv1");
  1208. auto span = tracer->StartSpan("cv1::_networksWatcher_Redis");
  1209. auto scope = tracer->WithActiveSpan(span);
  1210. try {
  1211. json tmp;
  1212. std::unordered_map<std::string, ItemStream> result;
  1213. if (_rc->clusterMode) {
  1214. _cluster->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1215. }
  1216. else {
  1217. _redis->xread(key, lastID, std::chrono::seconds(1), 0, std::inserter(result, result.end()));
  1218. }
  1219. if (! result.empty()) {
  1220. for (auto element : result) {
  1221. #ifdef REDIS_TRACE
  1222. fprintf(stdout, "Received notification from: %s\n", element.first.c_str());
  1223. #endif
  1224. for (auto rec : element.second) {
  1225. std::string id = rec.first;
  1226. auto attrs = rec.second;
  1227. #ifdef REDIS_TRACE
  1228. fprintf(stdout, "Record ID: %s\n", id.c_str());
  1229. fprintf(stdout, "attrs len: %lu\n", attrs.size());
  1230. #endif
  1231. for (auto a : attrs) {
  1232. #ifdef REDIS_TRACE
  1233. fprintf(stdout, "key: %s\nvalue: %s\n", a.first.c_str(), a.second.c_str());
  1234. #endif
  1235. try {
  1236. tmp = json::parse(a.second);
  1237. json& ov = tmp["old_val"];
  1238. json& nv = tmp["new_val"];
  1239. json oldConfig, newConfig;
  1240. if (ov.is_object())
  1241. oldConfig = ov;
  1242. if (nv.is_object())
  1243. newConfig = nv;
  1244. if (oldConfig.is_object() || newConfig.is_object()) {
  1245. _networkChanged(oldConfig, newConfig, (this->_ready >= 2));
  1246. }
  1247. }
  1248. catch (std::exception& e) {
  1249. fprintf(stderr, "json parse error in networkWatcher_Redis: what: %s json: %s\n", e.what(), a.second.c_str());
  1250. }
  1251. }
  1252. if (_rc->clusterMode) {
  1253. _cluster->xdel(key, id);
  1254. }
  1255. else {
  1256. _redis->xdel(key, id);
  1257. }
  1258. lastID = id;
  1259. }
  1260. Metrics::redis_net_notification++;
  1261. }
  1262. }
  1263. }
  1264. catch (sw::redis::Error& e) {
  1265. span->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1266. fprintf(stderr, "Error in Redis networks watcher: %s\n", e.what());
  1267. }
  1268. }
  1269. fprintf(stderr, "networksWatcher ended\n");
  1270. }
  1271. void CV1::commitThread()
  1272. {
  1273. fprintf(stderr, "%s: commitThread start\n", _myAddressStr.c_str());
  1274. std::pair<nlohmann::json, bool> qitem;
  1275. while (_commitQueue.get(qitem) && (_run == 1)) {
  1276. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1277. auto tracer = provider->GetTracer("cv1");
  1278. auto span = tracer->StartSpan("cv1::commitThread");
  1279. auto scope = tracer->WithActiveSpan(span);
  1280. // fprintf(stderr, "commitThread tick\n");
  1281. if (! qitem.first.is_object()) {
  1282. fprintf(stderr, "not an object\n");
  1283. continue;
  1284. }
  1285. std::shared_ptr<PostgresConnection> c;
  1286. try {
  1287. c = _pool->borrow();
  1288. }
  1289. catch (std::exception& e) {
  1290. fprintf(stderr, "ERROR: %s\n", e.what());
  1291. continue;
  1292. }
  1293. if (! c) {
  1294. fprintf(stderr, "Error getting database connection\n");
  1295. continue;
  1296. }
  1297. Metrics::pgsql_commit_ticks++;
  1298. try {
  1299. nlohmann::json& config = (qitem.first);
  1300. const std::string objtype = config["objtype"];
  1301. if (objtype == "member") {
  1302. auto mspan = tracer->StartSpan("cv1::commitThread::member");
  1303. auto mscope = tracer->WithActiveSpan(mspan);
  1304. // fprintf(stderr, "%s: commitThread: member\n", _myAddressStr.c_str());
  1305. std::string memberId;
  1306. std::string networkId;
  1307. try {
  1308. pqxx::work w(*c->c);
  1309. memberId = config["id"];
  1310. networkId = config["nwid"];
  1311. std::string target = "NULL";
  1312. if (! config["remoteTraceTarget"].is_null()) {
  1313. target = config["remoteTraceTarget"];
  1314. }
  1315. pqxx::row nwrow = w.exec_params1("SELECT COUNT(id) FROM ztc_network WHERE id = $1", networkId);
  1316. int nwcount = nwrow[0].as<int>();
  1317. if (nwcount != 1) {
  1318. fprintf(stderr, "network %s does not exist. skipping member upsert\n", networkId.c_str());
  1319. w.abort();
  1320. _pool->unborrow(c);
  1321. continue;
  1322. }
  1323. pqxx::row mrow = w.exec_params1("SELECT COUNT(id) FROM ztc_member WHERE id = $1 AND network_id = $2", memberId, networkId);
  1324. int membercount = mrow[0].as<int>();
  1325. bool isNewMember = false;
  1326. if (membercount == 0) {
  1327. // new member
  1328. isNewMember = true;
  1329. pqxx::result res = w.exec_params0(
  1330. "INSERT INTO ztc_member (id, network_id, active_bridge, authorized, capabilities, "
  1331. "identity, last_authorized_time, last_deauthorized_time, no_auto_assign_ips, "
  1332. "remote_trace_level, remote_trace_target, revision, tags, v_major, v_minor, v_rev, v_proto) "
  1333. "VALUES ($1, $2, $3, $4, $5, $6, "
  1334. "TO_TIMESTAMP($7::double precision/1000), TO_TIMESTAMP($8::double precision/1000), "
  1335. "$9, $10, $11, $12, $13, $14, $15, $16, $17)",
  1336. memberId,
  1337. networkId,
  1338. (bool)config["activeBridge"],
  1339. (bool)config["authorized"],
  1340. OSUtils::jsonDump(config["capabilities"], -1),
  1341. OSUtils::jsonString(config["identity"], ""),
  1342. (uint64_t)config["lastAuthorizedTime"],
  1343. (uint64_t)config["lastDeauthorizedTime"],
  1344. (bool)config["noAutoAssignIps"],
  1345. (int)config["remoteTraceLevel"],
  1346. target,
  1347. (uint64_t)config["revision"],
  1348. OSUtils::jsonDump(config["tags"], -1),
  1349. (int)config["vMajor"],
  1350. (int)config["vMinor"],
  1351. (int)config["vRev"],
  1352. (int)config["vProto"]);
  1353. }
  1354. else {
  1355. // existing member
  1356. pqxx::result res = w.exec_params0(
  1357. "UPDATE ztc_member "
  1358. "SET active_bridge = $3, authorized = $4, capabilities = $5, identity = $6, "
  1359. "last_authorized_time = TO_TIMESTAMP($7::double precision/1000), "
  1360. "last_deauthorized_time = TO_TIMESTAMP($8::double precision/1000), "
  1361. "no_auto_assign_ips = $9, remote_trace_level = $10, remote_trace_target= $11, "
  1362. "revision = $12, tags = $13, v_major = $14, v_minor = $15, v_rev = $16, v_proto = $17 "
  1363. "WHERE id = $1 AND network_id = $2",
  1364. memberId,
  1365. networkId,
  1366. (bool)config["activeBridge"],
  1367. (bool)config["authorized"],
  1368. OSUtils::jsonDump(config["capabilities"], -1),
  1369. OSUtils::jsonString(config["identity"], ""),
  1370. (uint64_t)config["lastAuthorizedTime"],
  1371. (uint64_t)config["lastDeauthorizedTime"],
  1372. (bool)config["noAutoAssignIps"],
  1373. (int)config["remoteTraceLevel"],
  1374. target,
  1375. (uint64_t)config["revision"],
  1376. OSUtils::jsonDump(config["tags"], -1),
  1377. (int)config["vMajor"],
  1378. (int)config["vMinor"],
  1379. (int)config["vRev"],
  1380. (int)config["vProto"]);
  1381. }
  1382. if (! isNewMember) {
  1383. pqxx::result res = w.exec_params0("DELETE FROM ztc_member_ip_assignment WHERE member_id = $1 AND network_id = $2", memberId, networkId);
  1384. }
  1385. std::vector<std::string> assignments;
  1386. bool ipAssignError = false;
  1387. for (auto i = config["ipAssignments"].begin(); i != config["ipAssignments"].end(); ++i) {
  1388. std::string addr = *i;
  1389. if (std::find(assignments.begin(), assignments.end(), addr) != assignments.end()) {
  1390. continue;
  1391. }
  1392. pqxx::result res = w.exec_params0("INSERT INTO ztc_member_ip_assignment (member_id, network_id, address) VALUES ($1, $2, $3) ON CONFLICT (network_id, member_id, address) DO NOTHING", memberId, networkId, addr);
  1393. assignments.push_back(addr);
  1394. }
  1395. if (ipAssignError) {
  1396. fprintf(stderr, "%s: ipAssignError\n", _myAddressStr.c_str());
  1397. w.abort();
  1398. _pool->unborrow(c);
  1399. c.reset();
  1400. continue;
  1401. }
  1402. w.commit();
  1403. if (_smee != NULL && isNewMember) {
  1404. pqxx::row row = w.exec_params1(
  1405. "SELECT "
  1406. " count(h.hook_id) "
  1407. "FROM "
  1408. " ztc_hook h "
  1409. " INNER JOIN ztc_org o ON o.org_id = h.org_id "
  1410. " INNER JOIN ztc_network n ON n.owner_id = o.owner_id "
  1411. " WHERE "
  1412. "n.id = $1 ",
  1413. networkId);
  1414. int64_t hookCount = row[0].as<int64_t>();
  1415. if (hookCount > 0) {
  1416. notifyNewMember(networkId, memberId);
  1417. }
  1418. }
  1419. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1420. const uint64_t memberidInt = OSUtils::jsonIntHex(config["id"], 0ULL);
  1421. if (nwidInt && memberidInt) {
  1422. nlohmann::json nwOrig;
  1423. nlohmann::json memOrig;
  1424. nlohmann::json memNew(config);
  1425. get(nwidInt, nwOrig, memberidInt, memOrig);
  1426. _memberChanged(memOrig, memNew, qitem.second);
  1427. }
  1428. else {
  1429. fprintf(stderr, "%s: Can't notify of change. Error parsing nwid or memberid: %llu-%llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt, (unsigned long long)memberidInt);
  1430. }
  1431. }
  1432. catch (std::exception& e) {
  1433. fprintf(stderr, "%s ERROR: Error updating member %s-%s: %s\n", _myAddressStr.c_str(), networkId.c_str(), memberId.c_str(), e.what());
  1434. mspan->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1435. }
  1436. }
  1437. else if (objtype == "network") {
  1438. auto nspan = tracer->StartSpan("cv1::commitThread::network");
  1439. auto nscope = tracer->WithActiveSpan(nspan);
  1440. try {
  1441. // fprintf(stderr, "%s: commitThread: network\n", _myAddressStr.c_str());
  1442. pqxx::work w(*c->c);
  1443. std::string id = config["id"];
  1444. std::string remoteTraceTarget = "";
  1445. if (! config["remoteTraceTarget"].is_null()) {
  1446. remoteTraceTarget = config["remoteTraceTarget"];
  1447. }
  1448. std::string rulesSource = "";
  1449. if (config["rulesSource"].is_string()) {
  1450. rulesSource = config["rulesSource"];
  1451. }
  1452. // This ugly query exists because when we want to mirror networks to/from
  1453. // another data store (e.g. FileDB or LFDB) it is possible to get a network
  1454. // that doesn't exist in Central's database. This does an upsert and sets
  1455. // the owner_id to the "first" global admin in the user DB if the record
  1456. // did not previously exist. If the record already exists owner_id is left
  1457. // unchanged, so owner_id should be left out of the update clause.
  1458. pqxx::result res = w.exec_params0(
  1459. "INSERT INTO ztc_network (id, creation_time, owner_id, controller_id, capabilities, enable_broadcast, "
  1460. "last_modified, mtu, multicast_limit, name, private, "
  1461. "remote_trace_level, remote_trace_target, rules, rules_source, "
  1462. "tags, v4_assign_mode, v6_assign_mode, sso_enabled) VALUES ("
  1463. "$1, TO_TIMESTAMP($5::double precision/1000), "
  1464. "(SELECT user_id AS owner_id FROM ztc_global_permissions WHERE authorize = true AND del = true AND modify = true AND read = true LIMIT 1),"
  1465. "$2, $3, $4, TO_TIMESTAMP($5::double precision/1000), "
  1466. "$6, $7, $8, $9, $10, $11, $12, $13, $14, $15, $16, $17) "
  1467. "ON CONFLICT (id) DO UPDATE set controller_id = EXCLUDED.controller_id, "
  1468. "capabilities = EXCLUDED.capabilities, enable_broadcast = EXCLUDED.enable_broadcast, "
  1469. "last_modified = EXCLUDED.last_modified, mtu = EXCLUDED.mtu, "
  1470. "multicast_limit = EXCLUDED.multicast_limit, name = EXCLUDED.name, "
  1471. "private = EXCLUDED.private, remote_trace_level = EXCLUDED.remote_trace_level, "
  1472. "remote_trace_target = EXCLUDED.remote_trace_target, rules = EXCLUDED.rules, "
  1473. "rules_source = EXCLUDED.rules_source, tags = EXCLUDED.tags, "
  1474. "v4_assign_mode = EXCLUDED.v4_assign_mode, v6_assign_mode = EXCLUDED.v6_assign_mode, "
  1475. "sso_enabled = EXCLUDED.sso_enabled",
  1476. id,
  1477. _myAddressStr,
  1478. OSUtils::jsonDump(config["capabilities"], -1),
  1479. (bool)config["enableBroadcast"],
  1480. OSUtils::now(),
  1481. (int)config["mtu"],
  1482. (int)config["multicastLimit"],
  1483. OSUtils::jsonString(config["name"], ""),
  1484. (bool)config["private"],
  1485. (int)config["remoteTraceLevel"],
  1486. remoteTraceTarget,
  1487. OSUtils::jsonDump(config["rules"], -1),
  1488. rulesSource,
  1489. OSUtils::jsonDump(config["tags"], -1),
  1490. OSUtils::jsonDump(config["v4AssignMode"], -1),
  1491. OSUtils::jsonDump(config["v6AssignMode"], -1),
  1492. OSUtils::jsonBool(config["ssoEnabled"], false));
  1493. res = w.exec_params0("DELETE FROM ztc_network_assignment_pool WHERE network_id = $1", 0);
  1494. auto pool = config["ipAssignmentPools"];
  1495. bool err = false;
  1496. for (auto i = pool.begin(); i != pool.end(); ++i) {
  1497. std::string start = (*i)["ipRangeStart"];
  1498. std::string end = (*i)["ipRangeEnd"];
  1499. res = w.exec_params0(
  1500. "INSERT INTO ztc_network_assignment_pool (network_id, ip_range_start, ip_range_end) "
  1501. "VALUES ($1, $2, $3)",
  1502. id,
  1503. start,
  1504. end);
  1505. }
  1506. res = w.exec_params0("DELETE FROM ztc_network_route WHERE network_id = $1", id);
  1507. auto routes = config["routes"];
  1508. err = false;
  1509. for (auto i = routes.begin(); i != routes.end(); ++i) {
  1510. std::string t = (*i)["target"];
  1511. std::vector<std::string> target;
  1512. std::istringstream f(t);
  1513. std::string s;
  1514. while (std::getline(f, s, '/')) {
  1515. target.push_back(s);
  1516. }
  1517. if (target.empty() || target.size() != 2) {
  1518. continue;
  1519. }
  1520. std::string targetAddr = target[0];
  1521. std::string targetBits = target[1];
  1522. std::string via = "NULL";
  1523. if (! (*i)["via"].is_null()) {
  1524. via = (*i)["via"];
  1525. }
  1526. res = w.exec_params0("INSERT INTO ztc_network_route (network_id, address, bits, via) VALUES ($1, $2, $3, $4)", id, targetAddr, targetBits, (via == "NULL" ? NULL : via.c_str()));
  1527. }
  1528. if (err) {
  1529. fprintf(stderr, "%s: route add error\n", _myAddressStr.c_str());
  1530. w.abort();
  1531. _pool->unborrow(c);
  1532. continue;
  1533. }
  1534. auto dns = config["dns"];
  1535. std::string domain = dns["domain"];
  1536. std::stringstream servers;
  1537. servers << "{";
  1538. for (auto j = dns["servers"].begin(); j < dns["servers"].end(); ++j) {
  1539. servers << *j;
  1540. if ((j + 1) != dns["servers"].end()) {
  1541. servers << ",";
  1542. }
  1543. }
  1544. servers << "}";
  1545. std::string s = servers.str();
  1546. res = w.exec_params0("INSERT INTO ztc_network_dns (network_id, domain, servers) VALUES ($1, $2, $3) ON CONFLICT (network_id) DO UPDATE SET domain = EXCLUDED.domain, servers = EXCLUDED.servers", id, domain, s);
  1547. w.commit();
  1548. const uint64_t nwidInt = OSUtils::jsonIntHex(config["nwid"], 0ULL);
  1549. if (nwidInt) {
  1550. nlohmann::json nwOrig;
  1551. nlohmann::json nwNew(config);
  1552. get(nwidInt, nwOrig);
  1553. _networkChanged(nwOrig, nwNew, qitem.second);
  1554. }
  1555. else {
  1556. fprintf(stderr, "%s: Can't notify network changed: %llu\n", _myAddressStr.c_str(), (unsigned long long)nwidInt);
  1557. }
  1558. }
  1559. catch (std::exception& e) {
  1560. nspan->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1561. fprintf(stderr, "%s ERROR: Error updating network: %s\n", _myAddressStr.c_str(), e.what());
  1562. }
  1563. if (_redisMemberStatus) {
  1564. try {
  1565. std::string id = config["id"];
  1566. std::string controllerId = _myAddressStr.c_str();
  1567. std::string key = "networks:{" + controllerId + "}";
  1568. if (_rc->clusterMode) {
  1569. _cluster->sadd(key, id);
  1570. }
  1571. else {
  1572. _redis->sadd(key, id);
  1573. }
  1574. }
  1575. catch (sw::redis::Error& e) {
  1576. nspan->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1577. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1578. }
  1579. }
  1580. }
  1581. else if (objtype == "_delete_network") {
  1582. auto dspan = tracer->StartSpan("cv1::commitThread::_delete_network");
  1583. auto dscope = tracer->WithActiveSpan(dspan);
  1584. // fprintf(stderr, "%s: commitThread: delete network\n", _myAddressStr.c_str());
  1585. try {
  1586. pqxx::work w(*c->c);
  1587. std::string networkId = config["nwid"];
  1588. pqxx::result res = w.exec_params0("UPDATE ztc_network SET deleted = true WHERE id = $1", networkId);
  1589. w.commit();
  1590. }
  1591. catch (std::exception& e) {
  1592. dspan->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1593. fprintf(stderr, "%s ERROR: Error deleting network: %s\n", _myAddressStr.c_str(), e.what());
  1594. }
  1595. if (_redisMemberStatus) {
  1596. try {
  1597. std::string id = config["id"];
  1598. std::string controllerId = _myAddressStr.c_str();
  1599. std::string key = "networks:{" + controllerId + "}";
  1600. if (_rc->clusterMode) {
  1601. _cluster->srem(key, id);
  1602. _cluster->del("network-nodes-online:{" + controllerId + "}:" + id);
  1603. }
  1604. else {
  1605. _redis->srem(key, id);
  1606. _redis->del("network-nodes-online:{" + controllerId + "}:" + id);
  1607. }
  1608. }
  1609. catch (sw::redis::Error& e) {
  1610. dspan->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1611. fprintf(stderr, "ERROR: Error adding network to Redis: %s\n", e.what());
  1612. }
  1613. }
  1614. }
  1615. else if (objtype == "_delete_member") {
  1616. auto mspan = tracer->StartSpan("cv1::commitThread::_delete_member");
  1617. auto mscope = tracer->WithActiveSpan(mspan);
  1618. // fprintf(stderr, "%s commitThread: delete member\n", _myAddressStr.c_str());
  1619. try {
  1620. pqxx::work w(*c->c);
  1621. std::string memberId = config["id"];
  1622. std::string networkId = config["nwid"];
  1623. pqxx::result res = w.exec_params0("UPDATE ztc_member SET hidden = true, deleted = true WHERE id = $1 AND network_id = $2", memberId, networkId);
  1624. w.commit();
  1625. }
  1626. catch (std::exception& e) {
  1627. mspan->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1628. fprintf(stderr, "%s ERROR: Error deleting member: %s\n", _myAddressStr.c_str(), e.what());
  1629. }
  1630. if (_redisMemberStatus) {
  1631. try {
  1632. std::string memberId = config["id"];
  1633. std::string networkId = config["nwid"];
  1634. std::string controllerId = _myAddressStr.c_str();
  1635. std::string key = "network-nodes-all:{" + controllerId + "}:" + networkId;
  1636. if (_rc->clusterMode) {
  1637. _cluster->srem(key, memberId);
  1638. _cluster->del("member:{" + controllerId + "}:" + networkId + ":" + memberId);
  1639. }
  1640. else {
  1641. _redis->srem(key, memberId);
  1642. _redis->del("member:{" + controllerId + "}:" + networkId + ":" + memberId);
  1643. }
  1644. }
  1645. catch (sw::redis::Error& e) {
  1646. mspan->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1647. fprintf(stderr, "ERROR: Error deleting member from Redis: %s\n", e.what());
  1648. }
  1649. }
  1650. }
  1651. else {
  1652. fprintf(stderr, "%s ERROR: unknown objtype\n", _myAddressStr.c_str());
  1653. }
  1654. }
  1655. catch (std::exception& e) {
  1656. span->SetStatus(opentelemetry::trace::StatusCode::kError, e.what());
  1657. fprintf(stderr, "%s ERROR: Error getting objtype: %s\n", _myAddressStr.c_str(), e.what());
  1658. }
  1659. _pool->unborrow(c);
  1660. c.reset();
  1661. }
  1662. fprintf(stderr, "%s commitThread finished\n", _myAddressStr.c_str());
  1663. }
  1664. void CV1::notifyNewMember(const std::string& networkID, const std::string& memberID)
  1665. {
  1666. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1667. auto tracer = provider->GetTracer("cv1");
  1668. auto span = tracer->StartSpan("cv1::notifyNewMember");
  1669. auto scope = tracer->WithActiveSpan(span);
  1670. rustybits::smee_client_notify_network_joined(_smee, networkID.c_str(), memberID.c_str());
  1671. }
  1672. void CV1::onlineNotificationThread()
  1673. {
  1674. waitForReady();
  1675. if (_redisMemberStatus) {
  1676. onlineNotification_Redis();
  1677. }
  1678. else {
  1679. onlineNotification_Postgres();
  1680. }
  1681. }
  1682. /**
  1683. * ONLY UNCOMMENT FOR TEMPORARY DB MAINTENANCE
  1684. *
  1685. * This define temporarily turns off writing to the member status table
  1686. * so it can be reindexed when the indexes get too large.
  1687. */
  1688. // #define DISABLE_MEMBER_STATUS 1
  1689. void CV1::onlineNotification_Postgres()
  1690. {
  1691. _connected = 1;
  1692. nlohmann::json jtmp1, jtmp2;
  1693. while (_run == 1) {
  1694. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1695. auto tracer = provider->GetTracer("cv1");
  1696. auto span = tracer->StartSpan("cv1::onlineNotification_Postgres");
  1697. auto scope = tracer->WithActiveSpan(span);
  1698. auto c = _pool->borrow();
  1699. auto c2 = _pool->borrow();
  1700. try {
  1701. fprintf(stderr, "%s onlineNotification_Postgres\n", _myAddressStr.c_str());
  1702. std::unordered_map<std::pair<uint64_t, uint64_t>, NodeOnlineRecord, _PairHasher> lastOnline;
  1703. {
  1704. std::lock_guard<std::mutex> l(_lastOnline_l);
  1705. lastOnline.swap(_lastOnline);
  1706. }
  1707. #ifndef DISABLE_MEMBER_STATUS
  1708. pqxx::work w(*c->c);
  1709. pqxx::work w2(*c2->c);
  1710. fprintf(stderr, "online notification tick\n");
  1711. bool firstRun = true;
  1712. bool memberAdded = false;
  1713. int updateCount = 0;
  1714. pqxx::pipeline pipe(w);
  1715. for (auto i = lastOnline.begin(); i != lastOnline.end(); ++i) {
  1716. updateCount += 1;
  1717. uint64_t nwid_i = i->first.first;
  1718. char nwidTmp[64];
  1719. char memTmp[64];
  1720. char ipTmp[64];
  1721. OSUtils::ztsnprintf(nwidTmp, sizeof(nwidTmp), "%.16llx", nwid_i);
  1722. OSUtils::ztsnprintf(memTmp, sizeof(memTmp), "%.10llx", i->first.second);
  1723. if (! get(nwid_i, jtmp1, i->first.second, jtmp2)) {
  1724. continue; // skip non existent networks/members
  1725. }
  1726. std::string networkId(nwidTmp);
  1727. std::string memberId(memTmp);
  1728. try {
  1729. pqxx::row r = w2.exec_params1("SELECT id, network_id FROM ztc_member WHERE network_id = $1 AND id = $2", networkId, memberId);
  1730. }
  1731. catch (pqxx::unexpected_rows& e) {
  1732. continue;
  1733. }
  1734. int64_t ts = i->second.lastSeen;
  1735. std::string ipAddr = i->second.physicalAddress.toIpString(ipTmp);
  1736. std::string timestamp = std::to_string(ts);
  1737. std::string osArch = i->second.osArch;
  1738. std::vector<std::string> osArchSplit = split(osArch, '/');
  1739. std::string os = "unknown";
  1740. std::string arch = "unknown";
  1741. if (osArchSplit.size() == 2) {
  1742. os = osArchSplit[0];
  1743. arch = osArchSplit[1];
  1744. }
  1745. std::stringstream memberUpdate;
  1746. memberUpdate << "INSERT INTO ztc_member_status (network_id, member_id, address, last_updated, os, arch) VALUES "
  1747. << "('" << networkId << "', '" << memberId << "', ";
  1748. if (ipAddr.empty()) {
  1749. memberUpdate << "NULL, ";
  1750. }
  1751. else {
  1752. memberUpdate << "'" << ipAddr << "', ";
  1753. }
  1754. memberUpdate << "TO_TIMESTAMP(" << timestamp << "::double precision/1000), "
  1755. << "'" << os << "', "
  1756. << "'" << arch << "'"
  1757. << ") "
  1758. << " ON CONFLICT (network_id, member_id) DO UPDATE SET address = EXCLUDED.address, last_updated = EXCLUDED.last_updated, "
  1759. << "os = EXCLUDED.os, arch = EXCLUDED.arch";
  1760. pipe.insert(memberUpdate.str());
  1761. Metrics::pgsql_node_checkin++;
  1762. }
  1763. while (! pipe.empty()) {
  1764. pipe.retrieve();
  1765. }
  1766. pipe.complete();
  1767. w.commit();
  1768. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), updateCount);
  1769. #endif
  1770. }
  1771. catch (std::exception& e) {
  1772. fprintf(stderr, "%s: error in onlinenotification thread: %s\n", _myAddressStr.c_str(), e.what());
  1773. }
  1774. _pool->unborrow(c2);
  1775. _pool->unborrow(c);
  1776. ConnectionPoolStats stats = _pool->get_stats();
  1777. fprintf(stderr, "%s pool stats: in use size: %llu, available size: %llu, total: %llu\n", _myAddressStr.c_str(), stats.borrowed_size, stats.pool_size, (stats.borrowed_size + stats.pool_size));
  1778. span->End();
  1779. std::this_thread::sleep_for(std::chrono::seconds(10));
  1780. }
  1781. fprintf(stderr, "%s: Fell out of run loop in onlineNotificationThread\n", _myAddressStr.c_str());
  1782. if (_run == 1) {
  1783. fprintf(stderr, "ERROR: %s onlineNotificationThread should still be running! Exiting Controller.\n", _myAddressStr.c_str());
  1784. exit(6);
  1785. }
  1786. }
  1787. void CV1::onlineNotification_Redis()
  1788. {
  1789. _connected = 1;
  1790. char buf[11] = { 0 };
  1791. std::string controllerId = std::string(_myAddress.toString(buf));
  1792. while (_run == 1) {
  1793. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1794. auto tracer = provider->GetTracer("cv1");
  1795. auto span = tracer->StartSpan("cv1::onlineNotification_Redis");
  1796. auto scope = tracer->WithActiveSpan(span);
  1797. fprintf(stderr, "onlineNotification tick\n");
  1798. auto start = std::chrono::high_resolution_clock::now();
  1799. uint64_t count = 0;
  1800. std::unordered_map<std::pair<uint64_t, uint64_t>, NodeOnlineRecord, _PairHasher> lastOnline;
  1801. {
  1802. std::lock_guard<std::mutex> l(_lastOnline_l);
  1803. lastOnline.swap(_lastOnline);
  1804. }
  1805. try {
  1806. if (! lastOnline.empty()) {
  1807. if (_rc->clusterMode) {
  1808. auto tx = _cluster->transaction(controllerId, true, false);
  1809. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1810. }
  1811. else {
  1812. auto tx = _redis->transaction(true, false);
  1813. count = _doRedisUpdate(tx, controllerId, lastOnline);
  1814. }
  1815. }
  1816. }
  1817. catch (sw::redis::Error& e) {
  1818. fprintf(stderr, "Error in online notification thread (redis): %s\n", e.what());
  1819. }
  1820. auto end = std::chrono::high_resolution_clock::now();
  1821. auto dur = std::chrono::duration_cast<std::chrono::milliseconds>(end - start);
  1822. auto total = dur.count();
  1823. fprintf(stderr, "onlineNotification ran in %llu ms\n", total);
  1824. span->End();
  1825. std::this_thread::sleep_for(std::chrono::seconds(5));
  1826. }
  1827. }
  1828. uint64_t CV1::_doRedisUpdate(sw::redis::Transaction& tx, std::string& controllerId, std::unordered_map<std::pair<uint64_t, uint64_t>, NodeOnlineRecord, _PairHasher>& lastOnline)
  1829. {
  1830. auto provider = opentelemetry::trace::Provider::GetTracerProvider();
  1831. auto tracer = provider->GetTracer("cv1");
  1832. auto span = tracer->StartSpan("cv1::_doRedisUpdate");
  1833. auto scope = tracer->WithActiveSpan(span);
  1834. nlohmann::json jtmp1, jtmp2;
  1835. uint64_t count = 0;
  1836. for (auto i = lastOnline.begin(); i != lastOnline.end(); ++i) {
  1837. uint64_t nwid_i = i->first.first;
  1838. uint64_t memberid_i = i->first.second;
  1839. char nwidTmp[64];
  1840. char memTmp[64];
  1841. char ipTmp[64];
  1842. OSUtils::ztsnprintf(nwidTmp, sizeof(nwidTmp), "%.16llx", nwid_i);
  1843. OSUtils::ztsnprintf(memTmp, sizeof(memTmp), "%.10llx", memberid_i);
  1844. if (! get(nwid_i, jtmp1, memberid_i, jtmp2)) {
  1845. continue; // skip non existent members/networks
  1846. }
  1847. std::string networkId(nwidTmp);
  1848. std::string memberId(memTmp);
  1849. int64_t ts = i->second.lastSeen;
  1850. std::string ipAddr = i->second.physicalAddress.toIpString(ipTmp);
  1851. std::string timestamp = std::to_string(ts);
  1852. std::string osArch = i->second.osArch;
  1853. std::vector<std::string> osArchSplit = split(osArch, '/');
  1854. std::string os = "unknown";
  1855. std::string arch = "unknown";
  1856. if (osArchSplit.size() == 2) {
  1857. os = osArchSplit[0];
  1858. arch = osArchSplit[1];
  1859. }
  1860. std::unordered_map<std::string, std::string> record = { { "id", memberId }, { "address", ipAddr }, { "last_updated", std::to_string(ts) }, { "os", os }, { "arch", arch } };
  1861. tx.zadd("nodes-online:{" + controllerId + "}", memberId, ts)
  1862. .zadd("nodes-online2:{" + controllerId + "}", networkId + "-" + memberId, ts)
  1863. .zadd("network-nodes-online:{" + controllerId + "}:" + networkId, memberId, ts)
  1864. .zadd("active-networks:{" + controllerId + "}", networkId, ts)
  1865. .sadd("network-nodes-all:{" + controllerId + "}:" + networkId, memberId)
  1866. .hmset("member:{" + controllerId + "}:" + networkId + ":" + memberId, record.begin(), record.end());
  1867. ++count;
  1868. Metrics::redis_node_checkin++;
  1869. }
  1870. // expire records from all-nodes and network-nodes member list
  1871. uint64_t expireOld = OSUtils::now() - 300000;
  1872. tx.zremrangebyscore("nodes-online:{" + controllerId + "}", sw::redis::RightBoundedInterval<double>(expireOld, sw::redis::BoundType::LEFT_OPEN));
  1873. tx.zremrangebyscore("nodes-online2:{" + controllerId + "}", sw::redis::RightBoundedInterval<double>(expireOld, sw::redis::BoundType::LEFT_OPEN));
  1874. tx.zremrangebyscore("active-networks:{" + controllerId + "}", sw::redis::RightBoundedInterval<double>(expireOld, sw::redis::BoundType::LEFT_OPEN));
  1875. {
  1876. std::shared_lock<std::shared_mutex> l(_networks_l);
  1877. for (const auto& it : _networks) {
  1878. uint64_t nwid_i = it.first;
  1879. char nwidTmp[64];
  1880. OSUtils::ztsnprintf(nwidTmp, sizeof(nwidTmp), "%.16llx", nwid_i);
  1881. tx.zremrangebyscore("network-nodes-online:{" + controllerId + "}:" + nwidTmp, sw::redis::RightBoundedInterval<double>(expireOld, sw::redis::BoundType::LEFT_OPEN));
  1882. }
  1883. }
  1884. tx.exec();
  1885. fprintf(stderr, "%s: Updated online status of %d members\n", _myAddressStr.c_str(), count);
  1886. return count;
  1887. }
  1888. #endif // ZT_CONTROLLER_USE_LIBPQ