1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440 |
- /* vim: set expandtab ts=4 sw=4: */
- /*
- * You may redistribute this program and/or modify it under the terms of
- * the GNU General Public License as published by the Free Software Foundation,
- * either version 3 of the License, or (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this program. If not, see <http://www.gnu.org/licenses/>.
- */
- #include "dht/Address.h"
- #include "dht/dhtcore/Node.h"
- #include "dht/dhtcore/NodeStore.h"
- #include "dht/dhtcore/NodeList.h"
- #include "util/AddrTools.h"
- #include "util/Assert.h"
- #include "util/Bits.h"
- #include "util/log/Log.h"
- #include "util/version/Version.h"
- #include "switch/NumberCompress.h"
- #include "switch/LabelSplicer.h"
- #include "util/Gcc.h"
- #include "util/Defined.h"
- #include "util/Endian.h"
- #include "util/events/Time.h"
- #include <tree.h>
- /** A list of DHT nodes. */
- struct NodeStore_pvt
- {
- struct NodeStore pub;
- /** A fake link where we are both the parent and child. */
- struct Node_Link* selfLink;
- /** A tree containing all nodes ordered by ipv6 */
- struct NodeRBTree {
- struct Node_Two* rbh_root;
- } nodeTree;
- struct Allocator* alloc;
- /**
- * The links to be freed next time freePendingLinks() is called.
- */
- struct Node_Link* linksToFree;
- /** Nodes which have very likely been reset. */
- struct RumorMill* renumberMill;
- /** The means for this node store to log. */
- struct Log* logger;
- /** To track time, for e.g. figuring out when nodes were last pinged */
- struct EventBase* eventBase;
- Identity
- };
- // My memory is really bad
- #define A_COMES_FIRST 1
- #define B_COMES_FIRST -1
- static int comparePeers(const struct Node_Link* la, const struct Node_Link* lb)
- {
- Identity_check(lb);
- uint64_t a = la->cannonicalLabel;
- uint64_t b = lb->cannonicalLabel;
- int log2Diff = Bits_log2x64(b) - Bits_log2x64(a);
- if (log2Diff) {
- return log2Diff;
- }
- if (Bits_bitReverse64(a) < Bits_bitReverse64(b)) {
- return A_COMES_FIRST;
- } else if (a == b) {
- return 0;
- }
- return B_COMES_FIRST;
- }
- RB_GENERATE_STATIC(PeerRBTree, Node_Link, peerTree, comparePeers)
- static int compareNodes(const struct Node_Two* na, const struct Node_Two* nb)
- {
- Identity_check(nb);
- int ret;
- ret = Address_xorcmp(0, na->address.ip6.ints.one_be, nb->address.ip6.ints.one_be);
- if (ret) { return ret; }
- ret = Address_xorcmp(0, na->address.ip6.ints.two_be, nb->address.ip6.ints.two_be);
- if (ret) { return ret; }
- ret = Address_xorcmp(0, na->address.ip6.ints.three_be, nb->address.ip6.ints.three_be);
- if (ret) { return ret; }
- ret = Address_xorcmp(0, na->address.ip6.ints.four_be, nb->address.ip6.ints.four_be);
- return ret;
- }
- RB_GENERATE_STATIC(NodeRBTree, Node_Two, nodeTree, compareNodes)
- static void freeLink(struct Node_Link* link, struct NodeStore_pvt* store)
- {
- Allocator_realloc(store->alloc, link, 0);
- store->pub.linkCount--;
- }
- static struct Node_Link* getLink(struct NodeStore_pvt* store)
- {
- store->pub.linkCount++;
- return Allocator_calloc(store->alloc, sizeof(struct Node_Link), 1);
- }
- static void logLink(struct NodeStore_pvt* store,
- struct Node_Link* link,
- char* message)
- {
- if (!Defined(Log_DEBUG)) {
- return;
- }
- uint8_t parent[40];
- uint8_t child[40];
- AddrTools_printIp(parent, link->parent->address.ip6.bytes);
- AddrTools_printIp(child, link->child->address.ip6.bytes);
- uint8_t path[20];
- AddrTools_printPath(path, link->cannonicalLabel);
- Log_debug(store->logger, "link[%s]->[%s] [%s] %s", parent, child, path, message);
- }
- static void _checkNode(struct Node_Two* node, struct NodeStore_pvt* store, char* file, int line)
- {
- if (!Defined(PARANOIA)) {
- return;
- }
- Assert_true(node->address.path ==
- EncodingScheme_convertLabel(store->pub.selfNode->encodingScheme,
- node->address.path,
- EncodingScheme_convertLabel_convertTo_CANNONICAL));
- struct Node_Link* link;
- for (link = node->reversePeers; link; link = link->nextPeer) {
- Assert_fileLine(link->child == node, file, line);
- Assert_fileLine(RB_FIND(PeerRBTree, &link->parent->peerTree, link) == link, file, line);
- // This is for you arc
- int ok = 0;
- struct Node_Link* nl = NULL;
- while ((nl = NodeStore_nextLink(link->parent, nl))) {
- if (nl == link) { ok = 1; break; }
- }
- Assert_fileLine(ok, file, line);
- //
- }
- struct Node_Link* lastLink = NULL;
- RB_FOREACH_REVERSE(link, PeerRBTree, &node->peerTree) {
- Assert_fileLine(!EncodingScheme_isSelfRoute(link->parent->encodingScheme,
- link->cannonicalLabel)
- || link == store->selfLink,
- file, line);
- Assert_fileLine(Node_getBestParent(node) || Node_getBestParent(link->child) != link,
- file, line);
- Assert_fileLine(link->parent == node, file, line);
- Assert_fileLine(link->child != node || link == store->selfLink, file, line);
- Assert_fileLine(!lastLink || link->cannonicalLabel != lastLink->cannonicalLabel,
- file, line);
- Assert_fileLine(link->cannonicalLabel < UINT64_MAX && link->cannonicalLabel > 0,
- file, line);
- // Make sure there isn't a link which has a completely wacky link encoding number.
- // Also make sure links are all flushed if a node is discovered to have changed it's
- // encoding scheme...
- Assert_fileLine(link->inverseLinkEncodingFormNumber < link->child->encodingScheme->count,
- file, line);
- struct Node_Link* rlink = NULL;
- for (rlink = link->child->reversePeers; rlink; rlink = rlink->nextPeer) {
- if (rlink == link) {
- break;
- }
- }
- Assert_fileLine(rlink && "child contains reverse link", file, line);
- lastLink = link;
- }
- if (Node_getBestParent(node)) {
- Assert_fileLine(node->address.path != UINT64_MAX, file, line);
- Assert_fileLine(Node_getReach(node) > 0, file, line);
- struct Node_Two* nn = node;
- do {
- Assert_fileLine(
- LabelSplicer_routesThrough(nn->address.path,
- Node_getBestParent(nn)->parent->address.path),
- file,
- line
- );
- nn = Node_getBestParent(nn)->parent;
- } while (nn != store->pub.selfNode);
- } else {
- Assert_fileLine(node->address.path == UINT64_MAX, file, line);
- Assert_fileLine(Node_getReach(node) == 0, file, line);
- }
- }
- #define checkNode(node, store) _checkNode(node, store, Gcc_SHORT_FILE, Gcc_LINE)
- static void _verifyNode(struct Node_Two* node, struct NodeStore_pvt* store, char* file, int line)
- {
- if (!Defined(PARANOIA)) {
- return;
- }
- // #1 check the node (do the basic checks)
- _checkNode(node, store, file, line);
- // #2 make sure all of the node's outgoing links are split properly
- struct Node_Link* link = NULL;
- RB_FOREACH_REVERSE(link, PeerRBTree, &node->peerTree) {
- // make sure any peers of this node are split properly
- struct Node_Link* linkB = link;
- struct Node_Link* linkC = link;
- RB_FOREACH_REVERSE_FROM(linkB, PeerRBTree, linkC) {
- if (linkB == link || link == store->selfLink) { continue; }
- Assert_fileLine(
- !LabelSplicer_routesThrough(linkB->cannonicalLabel, link->cannonicalLabel),
- file, line
- );
- }
- Assert_true(!link->nextInSplitList);
- }
- // #3 make sure looking for the node by address will actually find the correct node.
- if (Node_getBestParent(node)) {
- Assert_fileLine(node == NodeStore_closestNode(&store->pub, node->address.path), file, line);
- }
- // #5 no persistant markings are allowed.
- Assert_true(!node->marked);
- }
- #define verifyNode(node, store) _verifyNode(node, store, Gcc_SHORT_FILE, Gcc_LINE)
- // Verify is more thorough than check because it makes sure all links are split properly.
- static void _verify(struct NodeStore_pvt* store, char* file, int line)
- {
- if (!Defined(PARANOIA)) {
- return;
- }
- Assert_true(Node_getBestParent(store->pub.selfNode) == store->selfLink || !store->selfLink);
- int linkedNodes = 0;
- struct Node_Two* nn = NULL;
- RB_FOREACH(nn, NodeRBTree, &store->nodeTree) {
- _verifyNode(nn, store, file, line);
- if (Node_getBestParent(nn)) { linkedNodes++; }
- }
- Assert_fileLine(linkedNodes == store->pub.linkedNodes, file, line);
- }
- #define verify(store) _verify(store, Gcc_SHORT_FILE, Gcc_LINE)
- static void _check(struct NodeStore_pvt* store, char* file, int line)
- {
- if (!Defined(PARANOIA)) {
- return;
- }
- Assert_true(Node_getBestParent(store->pub.selfNode) == store->selfLink || !store->selfLink);
- struct Node_Two* nn = NULL;
- RB_FOREACH(nn, NodeRBTree, &store->nodeTree) {
- _checkNode(nn, store, file, line);
- }
- }
- #define check(store) _check(store, Gcc_SHORT_FILE, Gcc_LINE)
- /**
- * Extend a route by splicing on another link.
- * This will modify the Encoding Form of the first Director in next section of the route to make
- * it's size greater than or equal to the size of the return route through the parent node in the
- * link.
- *
- * @param routeToParent the label for reaching the parent node
- * @param parentScheme the label encoding scheme used by the parent node
- * @param routeParentToChild the cannonicalLabel for the link from parent to child
- * @param previousLinkEncoding the encoding used for the parent's interface back to the grandparent
- * @return a converted/spliced label or extendRoute_INVALID if it happens that the parent
- * or extendRoute_TOOLONG if the label is too long to represent.
- */
- #define extendRoute_INVALID (((uint64_t)~0)-1)
- #define extendRoute_TOOLONG (((uint64_t)~0))
- static uint64_t extendRoute(uint64_t routeToParent,
- struct EncodingScheme* parentScheme,
- uint64_t routeParentToChild,
- int previousLinkEncoding)
- {
- Assert_true(routeParentToChild != EncodingScheme_convertLabel_INVALID);
- // Make sure they didn't send us a 'silly' route.
- int nextLinkEncoding = EncodingScheme_getFormNum(parentScheme, routeParentToChild);
- if (nextLinkEncoding == EncodingScheme_getFormNum_INVALID) { return extendRoute_INVALID; }
- // If the encoding to get to the parent uses more bits than the encoding to get from parent
- // to child, we need to change the encoding...
- if (previousLinkEncoding > nextLinkEncoding) {
- routeParentToChild =
- EncodingScheme_convertLabel(parentScheme, routeParentToChild, previousLinkEncoding);
- Assert_true(routeParentToChild != EncodingScheme_convertLabel_INVALID);
- }
- return LabelSplicer_splice(routeParentToChild, routeToParent);
- }
- static void update(struct Node_Link* link,
- int64_t linkStateDiff,
- struct NodeStore_pvt* store)
- {
- if (linkStateDiff + link->linkState > UINT32_MAX) {
- link->linkState = UINT32_MAX;
- //logLink(store, link, "link state set to maximum");
- } else if (linkStateDiff + link->linkState < 0) {
- link->linkState = 0;
- logLink(store, link, "link state set to zero");
- } else {
- link->linkState += linkStateDiff;
- }
- }
- static bool isPeer(struct Node_Two* node, struct NodeStore_pvt* store)
- {
- struct Node_Link* bp = Node_getBestParent(node);
- return bp && bp->parent == store->pub.selfNode && Node_isOneHopLink(bp);
- }
- static void setParentReachAndPath(struct Node_Two* node,
- struct Node_Link* parent,
- uint32_t reach,
- uint64_t path,
- struct NodeStore_pvt* store)
- {
- uint64_t oldPath = node->address.path;
- Node_setParentReachAndPath(node, parent, reach, path);
- if (oldPath != path && store->pub.onBestPathChange) {
- store->pub.onBestPathChange(store->pub.onBestPathChangeCtx, node);
- }
- }
- static void unreachable(struct Node_Two* node, struct NodeStore_pvt* store)
- {
- struct Node_Link* next = NULL;
- RB_FOREACH_REVERSE(next, PeerRBTree, &node->peerTree) {
- if (Node_getBestParent(next->child) == next) { unreachable(next->child, store); }
- }
- // We think the link is down, so reset the link state.
- struct Node_Link* bp = Node_getBestParent(node);
- if (bp) {
- update(bp, -UINT32_MAX, store);
- store->pub.linkedNodes--;
- }
- setParentReachAndPath(node, NULL, 0, UINT64_MAX, store);
- }
- /** Adds the reach of path A->B to path B->C to get the expected reach of A->C. */
- static uint32_t addReach(uint32_t reachAB, uint32_t reachBC)
- {
- uint64_t b = reachAB;
- uint64_t c = reachBC;
- uint64_t reachAC = (b * c) / (b + c);
- if (reachAC > UINT32_MAX) { return UINT32_MAX; }
- return reachAC;
- }
- /** Subtracts the reach of path A->B from path A->B->C, to get reach of B->C. */
- static uint32_t subReach(uint32_t reachAB, uint32_t reachAC)
- {
- if (reachAB <= reachAC) { return UINT32_MAX; }
- uint64_t b = reachAB;
- uint64_t c = reachAC;
- uint64_t reachBC = (b * c) / (b - c);
- if (reachBC > UINT32_MAX) { return UINT32_MAX; }
- return reachBC;
- }
- /**
- * This is called when we have no idea what the reach should be for the next hop
- * because the path we previously used to get to it is broken and we need to use
- * a different one. Take a somewhat educated guess as to what it might be in a way
- * that will make the reach non-zero.
- */
- static uint32_t guessReachOfChild(struct Node_Link* link)
- {
- uint32_t r;
- if (Node_isOneHopLink(link)) {
- // Single-hop link, so guess that it's 3/4 the parent's reach
- r = (Node_getReach(link->parent) * 3) / 4;
- }
- else {
- // Multi-hop link, so let's assume 1/2 the parent's reach.
- r = Node_getReach(link->parent) / 2;
- }
- if (r < (1<<12)) {
- if (Node_getReach(link->parent) == 1) {
- r = 1;
- } else {
- r = Node_getReach(link->parent) - 1;
- }
- } else if (r < (1<<16)) {
- r = Node_getReach(link->parent) - Bits_log2x64(link->cannonicalLabel);
- }
- // Educated guess, parent's latency + link's latency (neither of which is known perfectly).
- uint32_t guess = addReach(Node_getReach(link->parent), link->linkState);
- if (guess < Node_getReach(link->parent) && guess > r) {
- // Our guess is sensible, so use it.
- r = guess;
- }
- // Try to reduce oscillation based on guesses.
- struct Node_Link* bp = Node_getBestParent(link->child);
- if (bp && bp != link) {
- uint32_t bpGuess = guessReachOfChild(bp);
- if (r > bpGuess) { r = bpGuess; }
- }
- Assert_true(r <= Node_getReach(link->parent));
- Assert_true(r);
- return r;
- }
- // Must always return 0 for null link or link which is disconnected from the tree.
- static uint32_t pathQuality(struct Node_Link* link)
- {
- if (!link || !Node_getBestParent(link->parent)) { return 0; }
- uint32_t out = 0;
- out |= (Node_isOneHopLink(link) << 31);
- out |= (Node_getReach(link->parent) & 0x7fffffff);
- return out;
- }
- static int updateBestParentCycle(struct Node_Link* newBestLink,
- int cycle,
- int limit,
- uint32_t nextReach,
- struct NodeStore_pvt* store)
- {
- Assert_true(cycle < 1000);
- struct Node_Two* node = newBestLink->child;
- if (cycle < limit) {
- int total = 0;
- struct Node_Link* next = NULL;
- RB_FOREACH_REVERSE(next, PeerRBTree, &node->peerTree) {
- if (Node_getBestParent(next->child) == next && next->child != node) {
- total += updateBestParentCycle(next, cycle+1, limit, nextReach, store);
- }
- }
- return total;
- }
- struct Node_Two* newBest = newBestLink->parent;
- Assert_true(Node_getBestParent(newBest));
- uint64_t bestPath = extendRoute(newBest->address.path,
- newBest->encodingScheme,
- newBestLink->cannonicalLabel,
- Node_getBestParent(newBest)->inverseLinkEncodingFormNumber);
- if (bestPath == extendRoute_TOOLONG) {
- // too long to splice.
- unreachable(node, store);
- return 1;
- }
- Assert_true(bestPath != extendRoute_INVALID);
- /*if (Defined(Log_DEBUG)) {
- if (node->address.path != bestPath) {
- uint8_t pathStr[20];
- AddrTools_printPath(pathStr, bestPath);
- uint8_t addrStr[40];
- AddrTools_printIp(addrStr, node->address.ip6.bytes);
- Log_debug(store->logger, "New best path [%s@%s]", addrStr, pathStr);
- }
- }*/
- if (limit) {
- // We're only altering the reach of the top node in the chain.
- // If we want to deduce reach of further nodes along the path, here's the place.
- nextReach = Node_getReach(node);
- Assert_true(Node_getBestParent(node) == newBestLink);
- }
- if (!Node_getBestParent(node)) { store->pub.linkedNodes++; }
- setParentReachAndPath(node, newBestLink, nextReach, bestPath, store);
- checkNode(node, store);
- return 1;
- }
- /**
- * Update the best parent of this node.
- * propigating path changes out through the tree.
- *
- * @param newBestParent the new best link to the node. The affected node is newBestParent->child.
- * @param nextReach the reach to set the node to.
- * @param store the nodestore.
- */
- static void updateBestParent(struct Node_Link* newBestParent,
- uint32_t nextReach,
- struct NodeStore_pvt* store)
- {
- check(store);
- Assert_true(newBestParent);
- for (int i = 0; i < 10000; i++) {
- if (!updateBestParentCycle(newBestParent, 0, i, nextReach, store)) {
- check(store);
- return;
- }
- }
- Assert_true(0);
- }
- static void handleGoodNews(struct Node_Two* node,
- uint32_t newReach,
- struct NodeStore_pvt* store)
- {
- // TODO(cjd): Paths longer than 1024 will blow up, handle more gracefully
- Assert_true(newReach != UINT32_MAX);
- Assert_true(newReach > Node_getReach(node));
- // The nodestore thinks it's unreachable, we can't very well update the reach.
- if (Node_getBestParent(node) == NULL) { return; }
- struct Node_Two* bp = Node_getBestParent(node)->parent;
- if (newReach+1 > Node_getReach(bp)) {
- handleGoodNews(bp, newReach+1, store);
- }
- Node_setReach(node, newReach);
- struct Node_Link* link = NULL;
- RB_FOREACH_REVERSE(link, PeerRBTree, &node->peerTree) {
- Identity_check(link);
- struct Node_Two* child = link->child;
- struct Node_Link* childBestParent = Node_getBestParent(child);
- if (!childBestParent || pathQuality(childBestParent) < pathQuality(link)) {
- uint32_t nextReach = guessReachOfChild(link);
- if (Node_getReach(child) > nextReach) { continue; }
- updateBestParent(link, nextReach, store);
- }
- }
- }
- /**
- * The news has hit (in handleBadNewsOne) and now all of the nodes in the affected zone have
- * been knocked down. Now lets see if there's a better path for any of them.
- */
- static int handleBadNewsTwoCycle(struct Node_Two* node,
- int cycle,
- int limit,
- struct NodeStore_pvt* store)
- {
- Assert_true(cycle < 1000);
- if (cycle < limit) {
- int total = 0;
- struct Node_Link* next = NULL;
- RB_FOREACH_REVERSE(next, PeerRBTree, &node->peerTree) {
- if (Node_getBestParent(next->child) == next && next->child != node) {
- total += handleBadNewsTwoCycle(next->child, cycle+1, limit, store);
- }
- }
- return total;
- }
- struct Node_Link* rp = node->reversePeers;
- struct Node_Link* best = Node_getBestParent(node);
- uint32_t bq = pathQuality(best);
- while (rp) {
- if (!Node_isAncestorOf(node, rp->parent) && pathQuality(rp) > bq) {
- best = rp;
- bq = pathQuality(best);
- }
- rp = rp->nextPeer;
- }
- if (best == Node_getBestParent(node)) { return 1; }
- if (!Node_getBestParent(best->parent)) { return 1; }
- if (Node_getBestParent(node) == store->selfLink) { return 1; }
- uint32_t nextReach = guessReachOfChild(best);
- if (nextReach < Node_getReach(node)) {
- // We've already knocked down the reach of this node in handleBadNewsOne
- // now we have determined that link quality of the other parent is better
- // so reach should be the greater of guessReachOfChild and current reach.
- nextReach = Node_getReach(node);
- }
- check(store);
- updateBestParent(best, nextReach, store);
- check(store);
- return 1;
- }
- /**
- * First thing we do is knock down everybody's reach.
- * This way they don't all cling to eachother for safety making
- * endless routing loops and stupid processing.
- */
- static void handleBadNewsOne(struct Node_Two* node,
- uint32_t newReach,
- struct NodeStore_pvt* store)
- {
- struct Node_Link* next = NULL;
- RB_FOREACH_REVERSE(next, PeerRBTree, &node->peerTree) {
- if (Node_getBestParent(next->child) != next) { continue; }
- if (next == store->selfLink) { continue; }
- if (Node_getReach(next->child) < newReach) { continue; }
- handleBadNewsOne(next->child, newReach, store);
- }
- Assert_true(node != store->pub.selfNode);
- if (!newReach) {
- unreachable(node, store);
- } else {
- Node_setReach(node, newReach);
- }
- }
- static void handleBadNews(struct Node_Two* node,
- uint32_t newReach,
- struct NodeStore_pvt* store)
- {
- Assert_true(newReach < Node_getReach(node));
- Assert_true(Node_getBestParent(node) && node != store->pub.selfNode);
- handleBadNewsOne(node, newReach, store);
- check(store);
- for (int i = 0; ; i++) {
- if (!handleBadNewsTwoCycle(node, 0, i, store)) {
- check(store);
- return;
- }
- }
- }
- static void handleNews(struct Node_Two* node, uint32_t newReach, struct NodeStore_pvt* store)
- {
- // This is because reach is used to prevent loops so it must be 1 more for each hop closer
- // to the root.
- if (newReach > (UINT32_MAX - 1024)) { newReach = (UINT32_MAX - 1024); }
- check(store);
- if (newReach < Node_getReach(node)) {
- handleBadNews(node, newReach, store);
- check(store);
- } else if (newReach > Node_getReach(node)) {
- handleGoodNews(node, newReach, store);
- check(store);
- }
- }
- void NodeStore_unlinkNodes(struct NodeStore* nodeStore, struct Node_Link* link)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*) nodeStore);
- struct Node_Two* child = Identity_check(link->child);
- struct Node_Two* parent = Identity_check(link->parent);
- check(store);
- if (parent == store->pub.selfNode) {
- // yuh ok
- if (link == store->selfLink) { return; }
- Assert_true(Node_isOneHopLink(link));
- store->pub.peerCount--;
- if (Defined(Log_INFO)) {
- uint8_t addr[60];
- Address_print(addr, &child->address);
- Log_info(store->logger, "Direct peer [%s] has been unlinked", addr);
- }
- }
- // Change the best parent and path if necessary
- if (Node_getBestParent(child) == link) {
- handleBadNews(child, 0, store);
- }
- if (Node_getBestParent(child) == link) {
- unreachable(child, store);
- }
- check(store);
- // Remove the entry from the reversePeers
- struct Node_Link* current = child->reversePeers;
- struct Node_Link** currentP = &child->reversePeers;
- while (current) {
- if (current == link) {
- *currentP = current->nextPeer;
- break;
- }
- currentP = &(current->nextPeer);
- current = *currentP;
- }
- Assert_true(current);
- // Remove the RBTree entry
- Assert_ifParanoid(link == RB_FIND(PeerRBTree, &parent->peerTree, link));
- RB_REMOVE(PeerRBTree, &parent->peerTree, link);
- link->nextPeer = store->linksToFree;
- store->linksToFree = link;
- // prevent double-free of link.
- link->parent = NULL;
- link->child = NULL;
- check(store);
- }
- /**
- * Link two nodes in the graph together.
- * If a parent of the child node is also a parent of the parent node, they are
- * unlinked (the link is split and the child is inserted in the middle).
- *
- * @param parent the current end of the graph
- * @param child the new node to extend the graph
- * @param cannonicalLabel the label for getting from the parent to the child.
- * @param linkStateDiff how much to change the link state for this link.
- * @param store
- */
- static struct Node_Link* linkNodes(struct Node_Two* parent,
- struct Node_Two* child,
- uint64_t cannonicalLabel,
- int64_t linkStateDiff,
- int inverseLinkEncodingFormNumber,
- uint64_t discoveredPath,
- struct NodeStore_pvt* store)
- {
- check(store);
- if (Defined(Log_DEBUG)) {
- uint8_t parentIp[40];
- uint8_t childIp[40];
- AddrTools_printIp(parentIp, parent->address.ip6.bytes);
- AddrTools_printIp(childIp, child->address.ip6.bytes);
- uint8_t printedLabel[20];
- AddrTools_printPath(printedLabel, cannonicalLabel);
- Log_debug(store->logger, "Linking [%s] with [%s] with label fragment [%s]",
- parentIp, childIp, printedLabel);
- }
- // It's ok to link a node with itself via some loopey route.
- // in practice it should never actually be used and it might yield some interesting
- // information when the link is split, self-routes are not allowed unless the self
- // link is being set up :)
- Assert_true(cannonicalLabel != 1 || store->selfLink == NULL);
- if (Defined(PARANOIA)) {
- uint64_t definitelyCannonical =
- EncodingScheme_convertLabel(parent->encodingScheme,
- cannonicalLabel,
- EncodingScheme_convertLabel_convertTo_CANNONICAL);
- Assert_true(definitelyCannonical == cannonicalLabel);
- }
- {
- struct Node_Link* link;
- RB_FOREACH_REVERSE(link, PeerRBTree, &parent->peerTree) {
- Identity_check(link);
- if (link->child == child) {
- if (link->cannonicalLabel != cannonicalLabel) {
- // multiple paths between A and B are ok because they
- // will have divergent paths following the first director.
- continue;
- } else if (link->inverseLinkEncodingFormNumber != inverseLinkEncodingFormNumber) {
- logLink(store, link, "Relinking nodes with different encoding form");
- // This can happen when C renumbers but B->C is the same because B did
- // not renumber, EG: if C restarts.
- link->inverseLinkEncodingFormNumber = inverseLinkEncodingFormNumber;
- }
- update(link, linkStateDiff, store);
- return link;
- }
- }
- }
- if (Defined(PARANOIA)) {
- struct Node_Link dummy = { .cannonicalLabel = cannonicalLabel };
- struct Node_Link* link = Identity_ncheck(RB_FIND(PeerRBTree, &parent->peerTree, &dummy));
- if (link) {
- logLink(store, link, "Attempted to create alternate link with same label!");
- Assert_true(0);
- return link;
- }
- }
- Assert_true(cannonicalLabel <= discoveredPath);
- struct Node_Link* link = getLink(store);
- // set it up
- link->cannonicalLabel = cannonicalLabel;
- link->inverseLinkEncodingFormNumber = inverseLinkEncodingFormNumber;
- link->child = child;
- link->parent = parent;
- link->discoveredPath = discoveredPath;
- link->linkState = 0;
- link->timeLastSeen = Time_currentTimeMilliseconds(store->eventBase);
- Identity_set(link);
- // reverse link
- link->nextPeer = child->reversePeers;
- child->reversePeers = link;
- // forward link
- Assert_ifParanoid(!RB_FIND(PeerRBTree, &parent->peerTree, link));
- RB_INSERT(PeerRBTree, &parent->peerTree, link);
- if (!Node_getBestParent(child)) {
- if (Node_getBestParent(parent)) {
- updateBestParent(link, guessReachOfChild(link), store);
- } else {
- unreachable(child, store);
- }
- }
- // update the child's link state and possibly change it's preferred path
- update(link, linkStateDiff, store);
- if (parent == store->pub.selfNode && child != store->pub.selfNode) {
- Assert_true(Node_isOneHopLink(link));
- store->pub.peerCount++;
- if (Defined(Log_DEBUG)) {
- uint8_t addr[60];
- Address_print(addr, &child->address);
- Log_info(store->logger, "Direct peer [%s] has been linked", addr);
- }
- }
- check(store);
- return link;
- }
- #define removeLinkFromLabel_IMPOSSIBLE UINT64_MAX
- #define removeLinkFromLabel_OVERSIZE (UINT64_MAX-1)
- #define removeLinkFromLabel_ERR(x) (((uint64_t)x) >> 63)
- // TODO(cjd): This does not depend on nodeStore or alter the link, consider moving to Node.c
- static uint64_t removeLinkFromLabel(struct Node_Link* link, uint64_t label)
- {
- // First we splice off the parent's Director leaving the child's Director.
- uint64_t unspliced = LabelSplicer_unsplice(label, link->cannonicalLabel);
- int formNum = EncodingScheme_getFormNum(link->child->encodingScheme, unspliced);
- if (formNum < link->inverseLinkEncodingFormNumber) {
- // Can't get there from here.
- return removeLinkFromLabel_IMPOSSIBLE;
- }
- uint64_t cannonical =
- EncodingScheme_convertLabel(link->child->encodingScheme,
- unspliced,
- EncodingScheme_convertLabel_convertTo_CANNONICAL);
- // Check that they didn't waste space by sending an oversize encoding form.
- if (formNum > link->inverseLinkEncodingFormNumber && cannonical != unspliced) {
- return removeLinkFromLabel_OVERSIZE;
- }
- Assert_true(cannonical != EncodingScheme_convertLabel_INVALID);
- return cannonical;
- }
- /**
- * Find the next hop on a given path.
- * Given a label representing a path from parentLink to some destination, set
- * outLink to the first link along that journey and return the path from outLink
- * to the original destination.
- * Feeding outLink back in to parentLink and the return value back into label argument
- * will allow you to iteratively walk a path.
- *
- * @param label the path from parentLink to some unspecified destination.
- * @param outLink a pointer to a location which will receive the first link in the path.
- * @param parentLink the link where to begin the trek.
- * @param store
- * @return a label which would take you from the node in memory location outLink to the
- * destination provided by the label argument. OR: firstHopInPath_INVALID if the
- * label argument traverces a node whose encoding scheme is inconsistent with
- * the label. OR: firstHopInPath_NO_NEXT_LINK if there are no *known* further
- * links along the path. If the result is firstHopInPath_INVALID, outLink will
- * still be set to the node. Use firstHopInPath_ERR() to check if the return
- * is an error code.
- */
- #define firstHopInPath_INVALID UINT64_MAX
- #define firstHopInPath_NO_NEXT_LINK (UINT64_MAX-1)
- #define firstHopInPath_ERR(path) (path >= firstHopInPath_NO_NEXT_LINK)
- static uint64_t firstHopInPath(uint64_t label,
- struct Node_Link** outLink,
- struct Node_Link* parentLink,
- struct NodeStore_pvt* store)
- {
- // Then we search for the next peer in the path
- // RB_NFIND will find a link for which we know that no link before it is in the path.
- // Unfortunately I have not found a way to store links in a tree where the search time
- // is less than O(n) where n = peers of a given node.
- struct Node_Link tmpl = { .cannonicalLabel = label };
- struct Node_Link* nextLink =
- Identity_ncheck(RB_NFIND(PeerRBTree, &parentLink->child->peerTree, &tmpl));
- // Now we walk back through the potential candidates looking for a path which it routes though.
- while (nextLink && !LabelSplicer_routesThrough(label, nextLink->cannonicalLabel)) {
- nextLink = Identity_ncheck(RB_NEXT(PeerRBTree, NULL, nextLink));
- }
- // This node has no peers, if it's us then it always has a peer (which is the selfLink)
- if (!nextLink || nextLink == store->selfLink) {
- return firstHopInPath_NO_NEXT_LINK;
- }
- // check for a looping link, this should never happen but adding the assert helps me
- // refactor this function a little more agressively.
- Assert_true(nextLink != parentLink);
- if (label == nextLink->cannonicalLabel) {
- //logLink(store, nextLink, "Exact match");
- *outLink = nextLink;
- return 1;
- }
- if (!LabelSplicer_routesThrough(label, nextLink->cannonicalLabel)) {
- // child of next link is not in the path, we reached the end.
- return firstHopInPath_NO_NEXT_LINK;
- }
- *outLink = nextLink;
- // Cannoicalize the child's Director
- label = removeLinkFromLabel(nextLink, label);
- if (removeLinkFromLabel_ERR(label)) {
- return firstHopInPath_INVALID;
- }
- return label;
- }
- #define findClosest_INVALID (~((uint64_t)0))
- static uint64_t findClosest(uint64_t path,
- struct Node_Link** output,
- struct Node_Link* parentLink,
- struct NodeStore_pvt* store)
- {
- for (;;) {
- struct Node_Link* nextLink = NULL;
- uint64_t nextPath = firstHopInPath(path, &nextLink, parentLink, store);
- if (nextPath == firstHopInPath_NO_NEXT_LINK) {
- *output = parentLink;
- return path;
- }
- if (firstHopInPath_INVALID == nextPath) {
- return findClosest_INVALID;
- }
- Assert_true(nextLink);
- path = nextPath;
- parentLink = nextLink;
- }
- }
- static struct Node_Two* nodeForIp(struct NodeStore_pvt* store, uint8_t ip[16])
- {
- struct Node_Two fakeNode;
- Identity_set(&fakeNode);
- Bits_memcpyConst(fakeNode.address.ip6.bytes, ip, 16);
- return Identity_ncheck(RB_FIND(NodeRBTree, &store->nodeTree, &fakeNode));
- }
- static void freePendingLinks(struct NodeStore_pvt* store)
- {
- struct Node_Link* link;
- while ((link = store->linksToFree)) {
- store->linksToFree = link->nextPeer;
- freeLink(link, store);
- }
- }
- static struct Node_Link* discoverLinkC(struct NodeStore_pvt* store,
- struct Node_Link* closestKnown,
- uint64_t pathKnownParentChild,
- struct Node_Two* child,
- uint64_t discoveredPath,
- int inverseLinkEncodingFormNumber)
- {
- // Make sure this link cannot be split before beginning.
- struct Node_Link* closest = NULL;
- uint64_t pathParentChild = findClosest(pathKnownParentChild, &closest, closestKnown, store);
- if (pathParentChild == findClosest_INVALID) {
- return NULL;
- }
- struct Node_Two* parent = closest->child;
- if (Defined(Log_DEBUG)) {
- uint8_t parentStr[40];
- uint8_t childStr[40];
- uint8_t pathStr[20];
- AddrTools_printIp(parentStr, parent->address.ip6.bytes);
- AddrTools_printIp(childStr, child->address.ip6.bytes);
- AddrTools_printPath(pathStr, pathParentChild);
- Log_debug(store->logger, "discoverLinkC( [%s]->[%s] [%s] )", parentStr, childStr, pathStr);
- }
- if (closest == store->selfLink &&
- !EncodingScheme_isOneHop(parent->encodingScheme, pathParentChild))
- {
- Log_debug(store->logger, "Attempting to create a link with no parent peer");
- return NULL;
- }
- if (parent == child) {
- if (pathParentChild == 1) {
- // Link is already known.
- update(closest, 0, store);
- //Log_debug(store->logger, "Already known");
- return closest;
- }
- Log_debug(store->logger, "Loopey route");
- // lets not bother storing this link, a link with the same parent and child is
- // invalid according to verify() and it's just going to take up space in the store
- // we'll return closest which is a perfectly valid path to the same node.
- // We could reasonably return the closest since it is the same node but it causes
- // problems with an assertion in discoverLink.
- return NULL;
- }
- if (EncodingScheme_isSelfRoute(parent->encodingScheme, pathParentChild)) {
- logLink(store, closest, "Node at end of path appears to have changed");
- // This should never happen for a direct peer or for a direct decendent in a split link.
- // This sometimes triggers because a link is split which contains an invalid encoding
- // somewhere in the middle.
- // It is not harmful to remove it becaue the route is not re-added.
- Assert_ifTesting(closestKnown != closest);
- // This probably means the parent node has renumbered it's switch...
- RumorMill_addNode(store->renumberMill, &closest->parent->address);
- check(store);
- // But it's possible someone is just lieing to us.
- return NULL;
- }
- // link parent to child
- //
- // ACKTUNG: From this point forward, the nodeStore is in an invalid state, calls to _verify()
- // will fail (calls to _check() will still succeed). We have linked parent with child
- // but we have not split all of the splitLinks from parent.
- //
- // TODO(cjd): linking every node with 0 link state, this can't be right.
- struct Node_Link* parentLink = linkNodes(parent,
- child,
- pathParentChild,
- 0,
- inverseLinkEncodingFormNumber,
- discoveredPath,
- store);
- if (!RB_FIND(NodeRBTree, &store->nodeTree, child)) {
- checkNode(child, store);
- RB_INSERT(NodeRBTree, &store->nodeTree, child);
- store->pub.nodeCount++;
- }
- check(store);
- return parentLink;
- }
- static void fixLink(struct Node_Link* parentLink,
- struct Node_Link** outLinks,
- struct NodeStore_pvt* store)
- {
- int verifyOrder = 0;
- // Check whether the parent is already linked with a node which is "behind" the child.
- // splitLink appears to be a "sibling link" to the closest->node link but in reality the
- // splitLink link should be split and node should be inserted in the middle.
- struct Node_Link* splitLink = RB_MIN(PeerRBTree, &parentLink->parent->peerTree);
- while (splitLink) {
- if (splitLink == parentLink) {
- if (Defined(PARANOIA)) {
- verifyOrder = 1;
- splitLink = PeerRBTree_RB_NEXT(splitLink);
- continue;
- } else {
- // Since they're in order, definitely not found.
- break;
- }
- }
- if (!LabelSplicer_routesThrough(splitLink->cannonicalLabel, parentLink->cannonicalLabel)) {
- splitLink = PeerRBTree_RB_NEXT(splitLink);
- continue;
- }
- if (Defined(PARANOIA)) {
- Assert_true(!verifyOrder);
- }
- struct Node_Two* grandChild = splitLink->child;
- if (parentLink->child == grandChild) {
- // loopey route, kill it and let the bestParent pivit over to parentLink
- } else {
- logLink(store, splitLink, "Splitting link");
- // unsplice and cannonicalize so we now have a path from child to grandchild
- uint64_t childToGrandchild =
- LabelSplicer_unsplice(splitLink->cannonicalLabel, parentLink->cannonicalLabel);
- childToGrandchild =
- EncodingScheme_convertLabel(parentLink->child->encodingScheme,
- childToGrandchild,
- EncodingScheme_convertLabel_convertTo_CANNONICAL);
- Assert_true(childToGrandchild < UINT64_MAX);
- Assert_true(childToGrandchild != 1);
- Assert_true(splitLink->cannonicalLabel != parentLink->cannonicalLabel);
- // We forgot what was the discovered path for the link when we split (destroyed)
- // it so we'll just assume the worst among these two possibilities.
- // There is an assertion that discoveredPath is never < cannonicalLabel so we must.
- uint64_t discoveredPath = parentLink->discoveredPath;
- if (childToGrandchild > discoveredPath) { discoveredPath = childToGrandchild; }
- struct Node_Link* childLink =
- discoverLinkC(store, parentLink, childToGrandchild, grandChild,
- discoveredPath, splitLink->inverseLinkEncodingFormNumber);
- // Three possibilities:
- // 1. discoverLinkC returned NULL for whatever reason, skip this routine.
- // 2. discoverLinkC determined that childLink already exists and returned it, this
- // routine added it in a previous iteration so
- // childLink->nextInSplitList is not NULL so we should skip this
- // routine as splitLinks will already attempt to split childLink.
- // 3. childLink is new or has existed since before this discoverNode, we will add it
- // to the splitList so that splitLinks will attempt to split it.
- if (childLink && !childLink->nextInSplitList) {
- // Order the list so that the next set of links will be split from
- // smallest to largest and nothing will ever be split twice.
- for (struct Node_Link** x = outLinks;; x = &(*x)->nextInSplitList) {
- if (*x == childLink) { break; }
- if (*x && (*x)->cannonicalLabel <= childLink->cannonicalLabel) { continue; }
- childLink->nextInSplitList = *x;
- *x = childLink;
- break;
- }
- }
- }
- check(store);
- struct Node_Link* next = PeerRBTree_RB_NEXT(splitLink);
- NodeStore_unlinkNodes(&store->pub, splitLink);
- splitLink = next;
- }
- }
- static void fixLinks(struct Node_Link* parentLinkList,
- struct Node_Link** outLinks,
- struct NodeStore_pvt* store)
- {
- while (parentLinkList) {
- struct Node_Link* next = parentLinkList->nextInSplitList;
- parentLinkList->nextInSplitList = NULL;
- // else the parent link has been trashed by splitting another link.
- if (parentLinkList->child) {
- fixLink(parentLinkList, outLinks, store);
- }
- parentLinkList = next;
- }
- }
- static struct Node_Link* discoverLink(struct NodeStore_pvt* store,
- uint64_t path,
- struct Node_Two* child,
- int inverseLinkEncodingFormNumber)
- {
- struct Node_Link* link =
- discoverLinkC(store, store->selfLink, path, child, path, inverseLinkEncodingFormNumber);
- if (!link) { return NULL; }
- uint64_t pathParentChild = findClosest(path, &link, store->selfLink, store);
- // This should always be 1 because the link is gone only because it was just split!
- Assert_true(pathParentChild == 1);
- struct Node_Link* ol = NULL;
- struct Node_Link* nl = NULL;
- fixLinks(link, &ol, store);
- for (;;) {
- if (ol) {
- fixLinks(ol, &nl, store);
- ol = NULL;
- } else if (nl) {
- fixLinks(nl, &ol, store);
- nl = NULL;
- } else {
- break;
- }
- }
- verify(store);
- return link;
- }
- static struct Node_Two* whichIsWorse(struct Node_Two* one,
- struct Node_Two* two,
- struct NodeStore_pvt* store)
- {
- // a peer is nevar worse
- int worse = isPeer(one, store) - isPeer(two, store);
- if (worse) {
- return (worse > 0) ? two : one;
- }
- worse = (one->address.path == UINT64_MAX) - (two->address.path == UINT64_MAX);
- if (worse) {
- return (worse > 0) ? one : two;
- }
- if (one->address.protocolVersion != two->address.protocolVersion) {
- if (one->address.protocolVersion < Version_CURRENT_PROTOCOL) {
- if (two->address.protocolVersion >= Version_CURRENT_PROTOCOL) {
- return one;
- }
- } else if (two->address.protocolVersion < Version_CURRENT_PROTOCOL) {
- if (one->address.protocolVersion >= Version_CURRENT_PROTOCOL) {
- return two;
- }
- }
- }
- uint32_t selfPrefix = Address_getPrefix(&store->pub.selfNode->address);
- uint64_t distOne = Address_getPrefix(&one->address) ^ selfPrefix;
- uint64_t distTwo = Address_getPrefix(&two->address) ^ selfPrefix;
- distOne += 0xffffffff - Node_getReach(one);
- distTwo += 0xffffffff - Node_getReach(two);
- if (Defined(NodeStore_whichIsWorse_PATHCOUNTS)) {
- distOne += Bits_log2x64(one->address.path) << 26;
- distTwo += Bits_log2x64(two->address.path) << 26;
- }
- if (distOne < distTwo) { return two; }
- return one;
- }
- struct NodeList* NodeStore_getNodesForBucket(struct NodeStore* nodeStore,
- struct Allocator* allocator,
- uint16_t bucket,
- const uint32_t count)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct NodeList* nodeList = Allocator_malloc(allocator, sizeof(struct NodeList));
- nodeList->nodes = Allocator_calloc(allocator, count, sizeof(char*));
- nodeList->size = 0;
- struct Node_Two* nn = NULL;
- RB_FOREACH(nn, NodeRBTree, &store->nodeTree) {
- if (!Node_getReach(nn)) { continue; }
- if (NodeStore_bucketForAddr(store->pub.selfAddress, &nn->address) == bucket) {
- struct Node_Two* newNode = nn;
- struct Node_Two* tempNode = NULL;
- for (uint32_t i = 0 ; i < count ; i++) {
- if (nodeList->size < i+1) {
- // The list isn't full yet, so insert at the end.
- nodeList->size = i+1;
- nodeList->nodes[i] = newNode;
- break;
- }
- if ( (newNode->marked && !nodeList->nodes[i]->marked) ||
- whichIsWorse(nodeList->nodes[i], newNode, store) == nodeList->nodes[i] ) {
- // If we've already marked nodes because they're a bestParent,
- // lets give them priority in the bucket since we need to keep
- // them either way.
- // Otherwise, decide based on whichIsWorse().
- // Insertion sorted list.
- tempNode = nodeList->nodes[i];
- nodeList->nodes[i] = newNode;
- newNode = tempNode;
- }
- }
- }
- }
- return nodeList;
- }
- static bool markNodesForBucket(struct NodeStore_pvt* store,
- uint16_t bucket,
- const uint32_t count)
- {
- struct Allocator* nodeListAlloc = Allocator_child(store->alloc);
- struct NodeList* nodeList = NodeStore_getNodesForBucket(&store->pub,
- nodeListAlloc,
- bucket,
- count);
- bool retVal = false;
- if (nodeList->size > 0) { retVal = true; }
- for (uint32_t i = 0; i < nodeList->size; i++) {
- // Now mark the nodes in the list to protect them.
- Identity_check(nodeList->nodes[i]);
- nodeList->nodes[i]->marked = 1;
- }
- // Cleanup
- Allocator_free(nodeListAlloc);
- return retVal;
- }
- static void markKeyspaceNodes(struct NodeStore_pvt* store)
- {
- for (uint16_t bucket = 0; bucket < NodeStore_bucketNumber ; bucket++) {
- markNodesForBucket(store, bucket, NodeStore_bucketSize);
- }
- }
- /**
- * We define the worst node the node with the lowest reach, excluding nodes which are required for
- * the DHT, and nodes which are somebody's bestParent (only relevant if they're the bestParent of
- * a DHT-required node, as otherwise their child would always be lower reach).
- * If two nodes tie (e.g. two unreachable nodes with 0 reach) then the node which is
- * further from us in keyspace is worse.
- */
- static struct Node_Two* getWorstNode(struct NodeStore_pvt* store)
- {
- struct Node_Two* worst = NULL;
- struct Node_Two* nn = NULL;
- RB_FOREACH(nn, NodeRBTree, &store->nodeTree) {
- // first cycle we set markings so markings remain if they are behind us
- struct Node_Link* parentLink = Node_getBestParent(nn);
- if (parentLink) {
- parentLink->parent->marked = 1;
- } else if (!worst || whichIsWorse(nn, worst, store) == nn) {
- // this time around we're only addressing nodes which are unreachable.
- worst = nn;
- }
- }
- if (worst) {
- RB_FOREACH(nn, NodeRBTree, &store->nodeTree) {
- if (nn->marked) { nn->marked = false; }
- }
- return worst;
- }
- // Mark the nodes that we need to protect for keyspace reasons.
- markKeyspaceNodes(store);
- RB_FOREACH(nn, NodeRBTree, &store->nodeTree) {
- if (nn->marked) {
- nn->marked = false;
- } else if (!worst || whichIsWorse(nn, worst, store) == nn) {
- worst = nn;
- }
- }
- if (worst) { return worst; }
- RB_FOREACH(nn, NodeRBTree, &store->nodeTree) {
- // third cycle, every node is apparently important but we need to get rid of someone
- // get whoever is worst if we ignore markings
- // by definition, this shouldn't be a bestParent, because their children have lower reach
- // so we're potentially creating a keyspace hole (routing blackhole) when we do this.
- // TODO(arceliar): protect keyspace, evict the worst bestParent instead?
- // Would require something like a forgetNode() to splice links together between
- // that node's bestParent and all its children, before we kill it.
- if (!worst || whichIsWorse(nn, worst, store) == nn) {
- worst = nn;
- }
- }
- // somebody has to be at the end of the line, not *everyone* can be someone's best parent!
- Assert_true(worst);
- return worst;
- }
- static void destroyNode(struct Node_Two* node, struct NodeStore_pvt* store)
- {
- // careful, undefined unless debug is enabled...
- uint8_t address_debug[60];
- if (Defined(Log_DEBUG)) {
- Address_print(address_debug, &node->address);
- }
- struct Node_Link* link;
- RB_FOREACH(link, PeerRBTree, &node->peerTree) {
- Identity_check(link);
- NodeStore_unlinkNodes(&store->pub, link);
- }
- // If the node has a bestParent, it will be changed a number
- // of times as we kill off all of it's parent links.
- // This is an optimization:
- if (!Defined(PARANOIA)) {
- store->pub.linkedNodes--;
- setParentReachAndPath(node, NULL, 0, UINT64_MAX, store);
- }
- link = node->reversePeers;
- while (link) {
- struct Node_Link* nextLink = link->nextPeer;
- NodeStore_unlinkNodes(&store->pub, link);
- link = nextLink;
- }
- Assert_true(!Node_getBestParent(node));
- Assert_ifParanoid(node == RB_FIND(NodeRBTree, &store->nodeTree, node));
- RB_REMOVE(NodeRBTree, &store->nodeTree, node);
- store->pub.nodeCount--;
- Allocator_free(node->alloc);
- }
- // Must be at least 2 to avoid multiplying by 0.
- // If too large, path choice may become unstable due to a guess we make in calcNextReach.
- // This is fixable by storing reach based on links. A lot of work.
- // In the mean time, just don't use a large value.
- #define NodeStore_latencyWindow 8
- static uint32_t reachAfterDecay(const uint32_t oldReach)
- {
- // Reduce the reach by 1/Xth where X = NodeStore_latencyWindow
- // This is used to keep a weighted rolling average
- return (uint64_t)oldReach * (NodeStore_latencyWindow - 1) / (NodeStore_latencyWindow);
- }
- static uint32_t reachAfterTimeout(const uint32_t oldReach)
- {
- return reachAfterDecay(oldReach);
- }
- static uint32_t calcNextReach(const uint32_t oldReach, const uint32_t millisecondsLag)
- {
- int64_t out = reachAfterDecay(oldReach) +
- ((UINT32_MAX / NodeStore_latencyWindow) / (millisecondsLag + 1));
- if (!oldReach) {
- // We don't know the old reach for this path.
- // If every response comes in after same millisecondsLag, then we expect that the
- // reach will stabilize to a value of (out * NodeStoare_latencyWindow).
- // Lets guess what the reach will stabilize to, but try to be a little conservative,
- // so we don't cause bestParents to switch unless the new route is appreciably better.
- out = out * (NodeStore_latencyWindow - 1);
- }
- // TODO(arceliar): is this safe?
- Assert_true(out < (UINT32_MAX - 1024) && out > 0);
- return out;
- }
- struct Node_Link* NodeStore_discoverNode(struct NodeStore* nodeStore,
- struct Address* addr,
- struct EncodingScheme* scheme,
- int inverseLinkEncodingFormNumber,
- uint64_t milliseconds)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- verify(store);
- // conservative guess of what the reach would stabilize to
- uint32_t reach = calcNextReach(0, milliseconds);
- struct Node_Two* child = nodeForIp(store, addr->ip6.bytes);
- if (Defined(Log_DEBUG)) {
- uint8_t printedAddr[60];
- Address_print(printedAddr, addr);
- Log_debug(store->logger, "Discover node [%s]", printedAddr);
- }
- if (child && child == store->selfLink->child) {
- return NULL;
- }
- if (child && EncodingScheme_compare(child->encodingScheme, scheme)) {
- // Shit.
- // Box reset *and* they just updated and changed their encoding scheme.
- RumorMill_addNode(store->renumberMill, &child->address);
- if (addr->path > (child->address.path | (child->address.path << 3))) {
- Log_debug(store->logger, "Node appears to have changed it's encoding scheme "
- "but the message came from far away and we will not trust it");
- return NULL;
- } else {
- Log_debug(store->logger, "Node appears to have changed it's encoding scheme "
- "dropping him from the table and re-inserting");
- destroyNode(child, store);
- child = NULL;
- }
- } else if (child && child->address.protocolVersion != addr->protocolVersion) {
- child->address.protocolVersion = addr->protocolVersion;
- }
- struct Allocator* alloc = NULL;
- if (!child) {
- alloc = Allocator_child(store->alloc);
- child = Allocator_calloc(alloc, sizeof(struct Node_Two), 1);
- child->alloc = alloc;
- Bits_memcpyConst(&child->address, addr, sizeof(struct Address));
- child->encodingScheme = EncodingScheme_clone(scheme, child->alloc);
- child->timeLastPinged = Time_currentTimeMilliseconds(store->eventBase);
- Identity_set(child);
- }
- struct Node_Link* link = NULL;
- for (;;) {
- link = discoverLink(store,
- addr->path,
- child,
- inverseLinkEncodingFormNumber);
- if (link) { break; }
- // We might have a broken link in the store which is causing new links to be rejected.
- // On the other hand, this path might actually be garbage :)
- // There's a DoS risk in that someone might use garbage paths to evict all of the
- // existing good paths.
- // While an attacker can send in a packet, it will necessarily follow a ridiculous path
- // in order that the path contains one of their nodes.
- // To resolve this, we'll walk the path looking for the "bad" link, then we'll check that
- // node to see if the path we took to reach it is actually the *best* path to that node.
- uint64_t path = addr->path;
- struct Node_Link* lastLink = store->selfLink;
- do {
- struct Node_Link* nextLink = NULL;
- path = firstHopInPath(path, &nextLink, lastLink, store);
- lastLink = nextLink;
- if (path == firstHopInPath_NO_NEXT_LINK) {
- // discoverNode() failed for some other reason.
- lastLink = NULL;
- break;
- }
- } while (firstHopInPath_INVALID != path);
- if (lastLink && LabelSplicer_routesThrough(addr->path, lastLink->child->address.path)) {
- // checking for sillyness...
- Assert_true(lastLink != store->selfLink);
- NodeStore_unlinkNodes(&store->pub, lastLink);
- continue;
- }
- if (alloc) {
- Allocator_free(alloc);
- }
- verify(store);
- Log_debug(store->logger, "Invalid path");
- return NULL;
- }
- if (link->parent == store->pub.selfNode && !Node_getBestParent(link->child)) {
- updateBestParent(link, reach, store);
- }
- #ifdef PARANOIA
- struct Node_Two* parent = link->parent;
- #endif
- handleNews(link->child, reach, store);
- freePendingLinks(store);
- while ((store->pub.nodeCount - store->pub.peerCount) >
- store->pub.nodeCapacity
- || store->pub.linkCount > store->pub.linkCapacity)
- {
- struct Node_Two* worst = getWorstNode(store);
- if (Defined(Log_DEBUG)) {
- uint8_t worstAddr[60];
- Address_print(worstAddr, &worst->address);
- Log_debug(store->logger, "store full, removing worst node: [%s] nodes [%d] links [%d]",
- worstAddr, store->pub.nodeCount, store->pub.linkCount);
- }
- Assert_true(!isPeer(worst, store));
- if (link && (worst == link->parent || worst == link->child)) { link = NULL; }
- destroyNode(worst, store);
- freePendingLinks(store);
- }
- verify(store);
- // This should test that link == NodeStore_linkForPath(path) but that is not guaranteed
- // to work because links are not healed up when a node is removed from the store
- Assert_ifParanoid(!link || RB_FIND(PeerRBTree, &parent->peerTree, link) == link);
- return link;
- }
- struct Node_Two* NodeStore_nodeForAddr(struct NodeStore* nodeStore, uint8_t addr[16])
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Two* n = nodeForIp(store, addr);
- if (n && n->address.path == UINT64_MAX) {
- if (Defined(Log_DEBUG)) {
- uint8_t addrStr[40];
- AddrTools_printIp(addrStr, n->address.ip6.bytes);
- Log_debug(store->logger, "No way to represent path to [%s]", addrStr);
- }
- return NULL;
- }
- return n;
- }
- struct Node_Two* NodeStore_closestNode(struct NodeStore* nodeStore, uint64_t path)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Link* out = NULL;
- findClosest(path, &out, store->selfLink, store);
- if (!out) { return NULL; }
- return Identity_check(out->child);
- }
- struct Node_Link* NodeStore_linkForPath(struct NodeStore* nodeStore, uint64_t path)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Link* out = NULL;
- uint64_t pathParentChild = findClosest(path, &out, store->selfLink, store);
- if (pathParentChild != 1) { return NULL; }
- return Identity_check(out);
- }
- struct Node_Link* NodeStore_firstHopInPath(struct NodeStore* nodeStore,
- uint64_t path,
- uint64_t* correctedPath,
- struct Node_Link* startingPoint)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- if (!startingPoint) { startingPoint = store->selfLink; }
- if (!Node_getBestParent(startingPoint->parent)) { return NULL; }
- struct Node_Link* out = NULL;
- path = firstHopInPath(path, &out, startingPoint, store);
- if (firstHopInPath_ERR(path)) { return NULL; }
- if (correctedPath) { *correctedPath = path; }
- return out;
- }
- char* NodeStore_getRouteLabel_strerror(uint64_t returnVal)
- {
- switch (returnVal) {
- case NodeStore_getRouteLabel_PARENT_NOT_FOUND:
- return "NodeStore_getRouteLabel_PARENT_NOT_FOUND";
- case NodeStore_getRouteLabel_CHILD_NOT_FOUND:
- return "NodeStore_getRouteLabel_CHILD_NOT_FOUND";
- default: return NULL;
- }
- }
- uint64_t NodeStore_getRouteLabel(struct NodeStore* nodeStore,
- uint64_t pathToParent,
- uint64_t pathParentToChild)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Link* linkToParent;
- if (findClosest(pathToParent, &linkToParent, store->selfLink, store) != 1) {
- return NodeStore_getRouteLabel_PARENT_NOT_FOUND;
- }
- //logLink(store, linkToParent, "NodeStore_getRouteLabel() PARENT");
- struct Node_Link* linkToChild = NULL;
- RB_FOREACH_REVERSE(linkToChild, PeerRBTree, &linkToParent->child->peerTree) {
- if (pathParentToChild == linkToChild->cannonicalLabel) {
- if (linkToParent == store->selfLink) {
- return linkToChild->cannonicalLabel;
- }
- // TODO(cjd): this could return ~0
- return extendRoute(pathToParent,
- linkToChild->parent->encodingScheme,
- linkToChild->cannonicalLabel,
- linkToParent->inverseLinkEncodingFormNumber);
- }
- }
- return NodeStore_getRouteLabel_CHILD_NOT_FOUND;
- }
- uint64_t NodeStore_optimizePath(struct NodeStore* nodeStore, uint64_t path)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Link* linkToParent;
- uint64_t next = findClosest(path, &linkToParent, store->selfLink, store);
- if (next == findClosest_INVALID) {
- return NodeStore_optimizePath_INVALID;
- }
- if (EncodingScheme_isSelfRoute(linkToParent->child->encodingScheme, next)) {
- // cannoicalize all the other wild ways that they can represent self routes.
- // TODO(cjd): this has been the source of assert failures and we might be sweeping
- // a significant bug under the carpet.
- next = 1;
- }
- if (linkToParent == store->selfLink) {
- if (next == 1) { return 1; }
- return path;
- }
- if (next == 1) { return linkToParent->child->address.path; }
- struct Node_Link* childBestParent = Node_getBestParent(linkToParent->child);
- if (childBestParent) {
- linkToParent = childBestParent;
- }
- uint64_t optimized = extendRoute(linkToParent->child->address.path,
- linkToParent->child->encodingScheme,
- next,
- linkToParent->inverseLinkEncodingFormNumber);
- if (optimized != UINT64_MAX) {
- return optimized;
- }
- if (optimized == extendRoute_INVALID) {
- if (Defined(Log_DEBUG)) {
- do {
- uint8_t pathStr[20];
- uint8_t nextStr[20];
- uint8_t bestPathStr[20];
- AddrTools_printPath(pathStr, path);
- AddrTools_printPath(nextStr, next);
- AddrTools_printPath(bestPathStr, linkToParent->child->address.path);
- Log_debug(store->logger, "Failed to optimize path [%s] with closest known [%s] and "
- "best path to closest known [%s]",
- pathStr, nextStr, bestPathStr);
- } while (0);
- }
- return path;
- }
- // path is too long...
- /*if (Defined(Log_DEBUG)) {
- do {
- uint8_t pathStr[20];
- uint8_t nextStr[20];
- uint8_t bestPathStr[20];
- AddrTools_printPath(pathStr, path);
- AddrTools_printPath(nextStr, next);
- AddrTools_printPath(bestPathStr, linkToParent->child->address.path);
- Log_debug(store->logger, "Failed to optimize path [%s] with closest known [%s] and best "
- "path to closest known [%s]", pathStr, nextStr, bestPathStr);
- } while (0);
- }*/
- return path;
- }
- struct Node_Link* NodeStore_nextLink(struct Node_Two* parent, struct Node_Link* startLink)
- {
- if (!startLink) {
- return RB_MIN(PeerRBTree, &parent->peerTree);
- }
- return PeerRBTree_RB_NEXT(startLink);
- }
- /** See: NodeStore.h */
- struct NodeStore* NodeStore_new(struct Address* myAddress,
- struct Allocator* allocator,
- struct EventBase* eventBase,
- struct Log* logger,
- struct RumorMill* renumberMill)
- {
- struct Allocator* alloc = Allocator_child(allocator);
- struct NodeStore_pvt* out = Allocator_clone(alloc, (&(struct NodeStore_pvt) {
- .pub = {
- .nodeCapacity = NodeStore_DEFAULT_NODE_CAPACITY,
- .linkCapacity = NodeStore_DEFAULT_LINK_CAPACITY
- },
- .renumberMill = renumberMill,
- .logger = logger,
- .eventBase = eventBase,
- .alloc = alloc
- }));
- Identity_set(out);
- // Create the self node
- struct Node_Two* selfNode = Allocator_calloc(alloc, sizeof(struct Node_Two), 1);
- Bits_memcpyConst(&selfNode->address, myAddress, sizeof(struct Address));
- selfNode->encodingScheme = NumberCompress_defineScheme(alloc);
- selfNode->alloc = alloc;
- Identity_set(selfNode);
- out->pub.linkedNodes = 1;
- out->pub.selfNode = selfNode;
- struct Node_Link* selfLink = linkNodes(selfNode, selfNode, 1, 0xffffffffu, 0, 1, out);
- Node_setParentReachAndPath(selfNode, selfLink, UINT32_MAX, 1);
- selfNode->timeLastPinged = Time_currentTimeMilliseconds(out->eventBase);
- out->selfLink = selfLink;
- RB_INSERT(NodeRBTree, &out->nodeTree, selfNode);
- out->pub.selfAddress = &out->selfLink->child->address;
- out->pub.selfAddress->protocolVersion = Version_CURRENT_PROTOCOL;
- return &out->pub;
- }
- //////////////////////////////////////////////////////////////////////////////////////////////
- //////////////////////////////////////////////////////////////////////////////////////////////
- //////////////////////////////////////////////////////////////////////////////////////////////
- /**
- * Dump the table, one node at a time.
- */
- struct Node_Two* NodeStore_dumpTable(struct NodeStore* nodeStore, uint32_t index)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- // TODO(cjd): Schlameil the painter
- uint32_t i = 0;
- struct Node_Two* nn = NULL;
- RB_FOREACH(nn, NodeRBTree, &store->nodeTree) {
- if (i++ == index) { return nn; }
- }
- return NULL;
- }
- struct Node_Link* NodeStore_getNextLink(struct NodeStore* nodeStore, struct Node_Link* last)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Two* nn;
- struct Node_Link* next;
- // NULL input, take first link of first node in store
- if (!last) {
- nn = Identity_ncheck(RB_MIN(NodeRBTree, &store->nodeTree));
- next = NULL;
- } else {
- next = Identity_ncheck(PeerRBTree_RB_NEXT(last));
- if (next) { return next; }
- nn = Identity_ncheck(NodeRBTree_RB_NEXT(last->parent));
- }
- while (!next) {
- if (!nn) { return NULL; }
- next = Identity_ncheck(RB_MIN(PeerRBTree, &nn->peerTree));
- nn = Identity_ncheck(NodeRBTree_RB_NEXT(nn));
- }
- return next;
- }
- struct Node_Two* NodeStore_getNextNode(struct NodeStore* nodeStore, struct Node_Two* lastNode)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- if (!lastNode) {
- return Identity_ncheck(RB_MIN(NodeRBTree, &store->nodeTree));
- }
- return Identity_ncheck(NodeRBTree_RB_NEXT(lastNode));
- }
- static struct Node_Two* getBestCycleB(struct Node_Two* node,
- uint8_t target[16],
- struct NodeStore_pvt* store)
- {
- uint32_t targetPfx = Address_prefixForIp6(target);
- uint32_t ourDistance = Address_getPrefix(store->pub.selfAddress) ^ targetPfx;
- struct Node_Link* next = NULL;
- RB_FOREACH_REVERSE(next, PeerRBTree, &node->peerTree) {
- if (Node_getBestParent(next->child) != next || next == store->selfLink) { continue; }
- if (next->child->address.path == UINT64_MAX) { continue; }
- if ((Address_getPrefix(&next->child->address) ^ targetPfx) >= ourDistance) { continue; }
- return next->child;
- }
- return NULL;
- }
- static int getBestCycle(struct Node_Two* node,
- uint8_t target[16],
- struct Node_Two** output,
- int limit,
- int cycle,
- struct NodeStore_pvt* store)
- {
- Assert_true(cycle < 1000);
- if (cycle < limit) {
- int total = 0;
- struct Node_Link* next = NULL;
- RB_FOREACH_REVERSE(next, PeerRBTree, &node->peerTree) {
- if (*output) { return total; }
- if (Node_getBestParent(next->child) != next || next == store->selfLink) { continue; }
- total += getBestCycle(next->child, target, output, limit, cycle+1, store);
- }
- return total;
- }
- *output = getBestCycleB(node, target, store);
- return 1;
- }
- struct Node_Two* NodeStore_getBest(struct NodeStore* nodeStore, uint8_t targetAddress[16])
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- // First try to find the node directly
- struct Node_Two* n = NodeStore_nodeForAddr(nodeStore, targetAddress);
- if (n && Node_getBestParent(n)) { return n; }
- /**
- * The network is small enough that a per-bucket lookup is inefficient
- * Basically, the first bucket is likely to route through an "edge" node
- * In theory, it scales better if the network is large.
- // Next try to find the best node in the correct bucket
- struct Address fakeAddr;
- Bits_memcpyConst(fakeAddr.ip6.bytes, targetAddress, 16);
- uint16_t bucket = NodeStore_bucketForAddr(&store->pub.selfNode->address, &fakeAddr);
- struct Allocator* nodeListAlloc = Allocator_child(store->alloc);
- struct NodeList* nodeList = NodeStore_getNodesForBucket(&store->pub,
- nodeListAlloc,
- bucket,
- NodeStore_bucketSize);
- for (uint32_t i = 0 ; i < nodeList->size ; i++) {
- if (Node_getBestParent(nodeList->nodes[i])) {
- n = nodeList->nodes[i];
- break;
- }
- }
- Allocator_free(nodeListAlloc);
- if (n && Node_getBestParent(n)) { return n; }
- */
- // Finally try to find the best node that is a valid next hop (closer in keyspace)
- for (int i = 0; i < 10000; i++) {
- int ret = getBestCycle(store->pub.selfNode, targetAddress, &n, i, 0, store);
- if (n || !ret) {
- if (n) { Assert_true(Node_getBestParent(n)); }
- return n;
- }
- }
- // Apparently there are no valid next hops
- return NULL;
- }
- struct NodeList* NodeStore_getPeers(uint64_t label,
- const uint32_t max,
- struct Allocator* allocator,
- struct NodeStore* nodeStore)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- Log_debug(store->logger, "getPeers request for [%llx]", (unsigned long long) label);
- // truncate the label to the part which this node uses PLUS
- // the self-interface bit for the next hop
- if (label > 1) {
- int bitsUsed = NumberCompress_bitsUsedForLabel(label);
- label = (label & Bits_maxBits64(bitsUsed)) | 1 << bitsUsed;
- }
- struct NodeList* out = Allocator_calloc(allocator, sizeof(struct NodeList), 1);
- out->nodes = Allocator_calloc(allocator, sizeof(char*), max);
- struct Node_Link* next = NULL;
- RB_FOREACH(next, PeerRBTree, &store->pub.selfNode->peerTree) {
- uint64_t p = next->child->address.path;
- if (!Node_isOneHopLink(next) && p != 1) { continue; }
- if (p < label) { continue; }
- int j;
- for (j = 0; j < (int)max; j++) {
- if (!out->nodes[j]) { continue; }
- if ((out->nodes[j]->address.path - label) > (p - label)) { continue; }
- break;
- }
- switch (j) {
- default: Bits_memmove(out->nodes, &out->nodes[1], (j - 1) * sizeof(char*));
- case 1: out->nodes[j - 1] = next->child;
- case 0:;
- }
- }
- out->size = 0;
- for (int i = 0; i < (int)max; i++) {
- if (out->nodes[i]) {
- out->nodes = &out->nodes[i];
- out->size = max - i;
- break;
- }
- }
- for (int i = 0; i < (int)out->size; i++) {
- Identity_check(out->nodes[i]);
- checkNode(out->nodes[i], store);
- Assert_true(out->nodes[i]->address.path);
- Assert_true(out->nodes[i]->address.path < (((uint64_t)1)<<63));
- out->nodes[i] = Allocator_clone(allocator, out->nodes[i]);
- }
- return out;
- }
- static bool isOkAnswer(struct Node_Two* node,
- uint32_t compatVer,
- struct NodeStore_pvt* store)
- {
- if (node->address.path == UINT64_MAX) {
- // (very) unreachable
- return false;
- }
- if (!Version_isCompatible(compatVer, node->address.protocolVersion)) {
- return false;
- }
- if (node == store->pub.selfNode) {
- return false;
- }
- return true;
- }
- /** See: NodeStore.h */
- struct NodeList* NodeStore_getClosestNodes(struct NodeStore* nodeStore,
- struct Address* targetAddress,
- const uint32_t count,
- uint32_t compatVer,
- struct Allocator* allocator)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct NodeList* out = Allocator_malloc(allocator, sizeof(struct NodeList));
- out->nodes = Allocator_calloc(allocator, count, sizeof(char*));
- out->size = count;
- struct Node_Two fakeNode = { .marked = 0 };
- Bits_memcpyConst(&fakeNode.address, targetAddress, sizeof(struct Address));
- struct Node_Two* next = Identity_ncheck(RB_NFIND(NodeRBTree, &store->nodeTree, &fakeNode));
- if (!next) {
- next = Identity_ncheck(RB_MAX(NodeRBTree, &store->nodeTree));
- }
- if (!next) {
- out->size = 0;
- return out;
- }
- struct Node_Two* prev = Identity_ncheck(NodeRBTree_RB_PREV(next));
- int idx = out->size-1;
- while (idx > -1) {
- if (prev && (!next || Address_closest(targetAddress, &next->address, &prev->address) > 0)) {
- if (isOkAnswer(prev, compatVer, store)) { out->nodes[idx--] = prev; }
- prev = Identity_ncheck(NodeRBTree_RB_PREV(prev));
- continue;
- }
- if (next && (!prev || Address_closest(targetAddress, &next->address, &prev->address) < 0)) {
- if (isOkAnswer(next, compatVer, store)) { out->nodes[idx--] = next; }
- next = Identity_ncheck(NodeRBTree_RB_NEXT(next));
- continue;
- }
- break;
- }
- out->nodes = &out->nodes[idx+1];
- out->size -= idx+1;
- for (int i = 0; i < (int)out->size; i++) {
- Identity_check(out->nodes[i]);
- Assert_true(out->nodes[i]->address.path);
- Assert_true(out->nodes[i]->address.path < (((uint64_t)1)<<63));
- out->nodes[i] = Allocator_clone(allocator, out->nodes[i]);
- }
- return out;
- }
- void NodeStore_disconnectedPeer(struct NodeStore* nodeStore, uint64_t path)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Link* nl = NodeStore_linkForPath(nodeStore, path);
- if (!nl) { return; }
- if (Defined(Log_DEBUG)) {
- uint8_t pathStr[20];
- AddrTools_printPath(pathStr, path);
- Log_debug(store->logger, "NodeStore_disconnectedPeer(%s)", pathStr);
- }
- NodeStore_unlinkNodes(&store->pub, nl);
- }
- static void brokenLink(struct NodeStore_pvt* store, struct Node_Link* brokenLink)
- {
- NodeStore_unlinkNodes(&store->pub, brokenLink);
- }
- static void addLinkToMill(struct NodeStore_pvt* store, struct Node_Link* link)
- {
- struct Address addr;
- Bits_memcpyConst(&addr, &link->child->address, sizeof(struct Address));
- addr.path =
- NodeStore_getRouteLabel(&store->pub, link->parent->address.path, link->cannonicalLabel);
- Assert_true(!NodeStore_getRouteLabel_ERR(addr.path));
- RumorMill_addNode(store->renumberMill, &addr);
- }
- void NodeStore_brokenLink(struct NodeStore* nodeStore, uint64_t path, uint64_t pathAtErrorHop)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- if (Defined(Log_DEBUG)) {
- uint8_t pathStr[20];
- uint8_t pathAtErrorHopStr[20];
- AddrTools_printPath(pathStr, path);
- AddrTools_printPath(pathAtErrorHopStr, pathAtErrorHop);
- Log_debug(store->logger, "NodeStore_brokenLink(%s, %s)", pathStr, pathAtErrorHopStr);
- }
- struct Node_Link* link = store->selfLink;
- uint64_t thisPath = path;
- for (;;) {
- uint64_t nextPath = firstHopInPath(thisPath, &link, link, store);
- uint64_t mask = (((uint64_t)1) << (Bits_log2x64(thisPath) + 1)) - 1;
- if (Defined(Log_DEBUG)) {
- uint8_t maskStr[20];
- uint8_t pathStr[20];
- AddrTools_printPath(pathStr, nextPath);
- AddrTools_printPath(maskStr, mask);
- Log_debug(store->logger, "NodeStore_brokenLink() nextPath = [%s] mask = [%s]",
- pathStr, maskStr);
- }
- uint64_t cannonicalPath =
- NodeStore_getRouteLabel(&store->pub, link->parent->address.path, link->cannonicalLabel);
- Assert_true(!NodeStore_getRouteLabel_ERR(cannonicalPath) ||
- cannonicalPath == UINT64_MAX ||
- link->parent->address.path == UINT64_MAX);
- if ((pathAtErrorHop & mask) >= nextPath) {
- uint64_t cannPathAtErrorHop =
- EncodingScheme_convertLabel(link->child->encodingScheme,
- (pathAtErrorHop & mask),
- EncodingScheme_convertLabel_convertTo_CANNONICAL);
- uint8_t cannPathAtErrorHopStr[20];
- AddrTools_printPath(cannPathAtErrorHopStr, cannPathAtErrorHop);
- Log_debug(store->logger, "NodeStore_brokenLink() converted pathAtErrorHop to [%s]",
- cannPathAtErrorHopStr);
- if (cannPathAtErrorHop == UINT64_MAX) {
- // error
- } else if ((cannPathAtErrorHop & mask) != thisPath) {
- // wrong path
- } else if (path != cannonicalPath && !NodeStore_getRouteLabel_ERR(cannonicalPath)) {
- logLink(store, link, "NodeStore_brokenLink() not cannonucal, sending ping");
- addLinkToMill(store, link);
- return;
- } else {
- logLink(store, link, "NodeStore_brokenLink() removing");
- brokenLink(store, link);
- return;
- }
- } else if (firstHopInPath_NO_NEXT_LINK == nextPath && thisPath == 1) {
- Assert_ifParanoid(NodeStore_linkForPath(nodeStore, path) == link);
- if (path >> 56) {
- logLink(store, link, "NodeStore_brokenLink() probably caused by long path");
- } else if (path != cannonicalPath && !NodeStore_getRouteLabel_ERR(cannonicalPath)) {
- logLink(store, link, "NodeStore_brokenLink() not cannonical, sending ping (1link)");
- addLinkToMill(store, link);
- return;
- } else {
- logLink(store, link, "NodeStore_brokenLink() removing (1link)");
- brokenLink(store, link);
- }
- return;
- }
- if (firstHopInPath_NO_NEXT_LINK == nextPath) {
- Log_debug(store->logger, "NodeStore_brokenLink() firstHopInPath_NO_NEXT_LINK");
- // fails if pathAtErrorHop is garbage.
- Assert_ifTesting(!NodeStore_linkForPath(nodeStore, path));
- return;
- }
- if (firstHopInPath_INVALID == nextPath) {
- Log_debug(store->logger, "NodeStore_brokenLink() firstHopInPath_INVALID");
- return;
- }
- Assert_true(link);
- thisPath = nextPath;
- }
- }
- // When a response comes in, we need to pay attention to the path used.
- static void updatePathReach(struct NodeStore_pvt* store, const uint64_t path, uint32_t newReach)
- {
- struct Node_Link* link = store->selfLink;
- uint64_t pathFrag = path;
- uint64_t now = Time_currentTimeMilliseconds(store->eventBase);
- for (;;) {
- struct Node_Link* nextLink = NULL;
- uint64_t nextPath = firstHopInPath(pathFrag, &nextLink, link, store);
- if (firstHopInPath_ERR(nextPath)) {
- break;
- }
- // expecting behavior of nextLinkOnPath()
- Assert_ifParanoid(nextLink->parent == link->child);
- if (Node_getBestParent(nextLink->child) == nextLink) {
- // the packet came in along the bestParent link to the child so don't bother changing it
- } else if (pathQuality(Node_getBestParent(nextLink->child)) >= pathQuality(nextLink)) {
- // this path is not obviously better better than the bestParent link
- } else if (Node_isAncestorOf(nextLink->child, nextLink->parent)) {
- // loop route
- } else {
- // This path apparently gives us a better route than our current bestParent.
- updateBestParent(nextLink, newReach, store);
- }
- if (Node_getReach(link->child) >= newReach) {
- // Node already has enough reach...
- // selfNode reach == UINT32_MAX so this case handles it.
- } else if (!LabelSplicer_routesThrough(path, link->child->address.path)) {
- // The path the packet came in on is not actually the best known path to the node.
- } else {
- handleNews(link->child, newReach, store);
- }
- if (Node_getBestParent(link->child) == link) {
- // Update linkState.
- uint32_t guessedLinkState = subReach(Node_getReach(link->parent), newReach);
- uint32_t linkStateDiff = (guessedLinkState > link->linkState)
- ? (guessedLinkState - link->linkState)
- : 1;
- update(link, linkStateDiff, store);
- } else {
- // Well we at least know it's not dead.
- update(link, 1, store);
- }
- nextLink->timeLastSeen = now;
- pathFrag = nextPath;
- link = nextLink;
- newReach--;
- }
- // Now we have to unconditionally update the reach for the last link in the chain.
- if (link->child && link->child->address.path == path) {
- // Behavior of nextLinkOnPath()
- Assert_ifParanoid(pathFrag == 1);
- handleNews(link->child, newReach, store);
- uint32_t newLinkState = subReach(Node_getReach(link->parent), newReach);
- update(link, newLinkState - link->linkState, store);
- }
- link->child->timeLastPinged = Time_currentTimeMilliseconds(store->eventBase);
- }
- void NodeStore_pathResponse(struct NodeStore* nodeStore, uint64_t path, uint64_t milliseconds)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Link* link = NodeStore_linkForPath(nodeStore, path);
- if (!link || link == store->selfLink) { return; }
- struct Node_Two* node = link->child;
- uint32_t newReach;
- if (node->address.path == path) {
- // Use old reach value to calculate new reach.
- newReach = calcNextReach(Node_getReach(node), milliseconds);
- }
- else {
- // Old reach value doesn't relate to this path, so we should do something different
- // FIXME(arceliar): calcNextReach is guessing what the reach would stabilize to
- // I think actually fixing this would require storing reach (or latency?) per link,
- // so we can calculate the expected reach for an arbitrary path
- newReach = calcNextReach(0, milliseconds);
- }
- updatePathReach(store, path, newReach);
- }
- void NodeStore_pathTimeout(struct NodeStore* nodeStore, uint64_t path)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- struct Node_Link* link = store->selfLink;
- uint64_t pathFrag = path;
- for (;;) {
- struct Node_Link* nextLink = NULL;
- uint64_t nextPath = firstHopInPath(pathFrag, &nextLink, link, store);
- if (firstHopInPath_ERR(nextPath)) {
- break;
- }
- // expecting behavior of nextLinkOnPath()
- Assert_true(nextLink->parent == link->child);
- if (link != store->selfLink) {
- // TODO(arceliar): Something sane. We don't know which link on the path is bad.
- // For now, just penalize them all.
- // The good ones will be rewarded again when they relay another ping.
- update(link, reachAfterTimeout(link->linkState)-link->linkState, store);
- }
- pathFrag = nextPath;
- link = nextLink;
- }
- link = NodeStore_linkForPath(nodeStore, path);
- if (!link || link->child->address.path != path) { return; }
- struct Node_Two* node = link->child;
- uint32_t newReach = reachAfterTimeout(Node_getReach(node));
- if (!newReach) {
- // The node hasn't responded in a really long time.
- // Possible causes:
- // 1) The node is offline, and for some reason we're not getting an error packet back.
- // 2) The node is behind a node that's offline, and for some reason we're not getting error.
- // 3) The node is online, but in a bad state, where it cannot respond to pings.
- // (E.g. Our CA session broke and it refuses to reset, known bug in old versions.)
- // If we don't do something, we'll guessReachOfChild to re-discover a path through the link.
- // Doing that can get the node store stuck in a bad state where this node is blackholed.
- // As a workaround, break the link. That prevents re-discovering the same broken path.
- // If 2), we might accidentally break a valid link, but we should re-discover it the
- // next time we successfully contact link->child (via another path).
- brokenLink(store, link);
- return;
- }
- if (Defined(Log_DEBUG)) {
- uint8_t addr[60];
- Address_print(addr, &node->address);
- Log_debug(store->logger,
- "Ping timeout for %s. changing reach from %u to %u\n",
- addr,
- Node_getReach(node),
- newReach);
- }
- handleNews(node, newReach, store);
- if (node->address.path != path) { return; }
- // TODO(cjd): What we really should be doing here is storing this link in a
- // potentially-down-list, after pinging the parent, if the parent does not respond
- // and then we replace the link with the parent's link and walk backwards up
- // the tree. If the parent does respond then we keep pinging the child of the path
- // hoping it will respond or die and as it's link-state is destroyed by subsequent
- // lost packets, children will be re-parented to other paths.
- // Keep checking until we're sure it's either OK or down.
- RumorMill_addNode(store->renumberMill, &node->address);
- if (link->parent != store->pub.selfNode) {
- // All we know for sure is that link->child didn't respond.
- // That could be because an earlier link is down.
- // Same idea as the workaround in NodeStore_brokenPath();
- RumorMill_addNode(store->renumberMill, &link->parent->address);
- }
- }
- /* Find the address that describes the source's Nth (furthest-away) bucket. */
- /*
- struct Address NodeStore_addrForBucket(struct Address* source, uint16_t bucket)
- {
- if (bucket >= NodeStore_bucketNumber) {
- // This does not exist.
- return *source;
- } else {
- struct Address addr = *source;
- // Figure out which bits of our address to flip for this step in keyspace.
- // Note: This assumes NodeStore_bucketNumber == 512
- // (Some of those, the fc and every 16th bucket, won't actually have nodes)
- Assert_compileTime(NodeStore_bucketNumber == 512);
- uint64_t extras = 15 - ((bucket % 256)/16);
- uint64_t prefix = 0x0F - (bucket % 16);
- uint64_t bitmask = prefix << (4*extras);
- // We have the bitmask for this bucket, now we need to apply it.
- uint64_t* addrPart = (bucket < 256) ? &addr.ip6.longs.one_be : &addr.ip6.longs.two_be;
- *addrPart = Endian_bigEndianToHost64(*addrPart);
- *addrPart ^= bitmask;
- *addrPart = Endian_hostToBigEndian64(*addrPart);
- // Just to be sure...
- Assert_ifParanoid((bucket % 16) == 15 || NodeStore_bucketForAddr(source, &addr) == bucket);
- return addr;
- }
- }
- uint16_t NodeStore_bucketForAddr(struct Address* source, struct Address* dest)
- {
- uint16_t retVal = 0;
- // This is a place where the implementation depends on how buckets work.
- Assert_compileTime(NodeStore_bucketNumber == 512);
- uint64_t addrPart = source->ip6.longs.one_be ^ dest->ip6.longs.one_be;
- if (!addrPart) {
- // We're apparently close enough in keyspace to use two_be instead.
- addrPart = source->ip6.longs.two_be ^ dest->ip6.longs.two_be;
- retVal += 256;
- }
- addrPart = Endian_bigEndianToHost64(addrPart);
- uint64_t extras = Bits_log2x64(addrPart)/4;
- uint64_t prefix = addrPart >> (4*extras);
- retVal += (15 - extras)*16;
- retVal += 0x0F - prefix;
- return retVal;
- }
- */
- struct Address NodeStore_addrForBucket(struct Address* source, uint16_t bucket)
- {
- Assert_compileTime(NodeStore_bucketNumber == 128);
- struct Address addr = *source;
- uint64_t* addrPart = (bucket < 64) ? &addr.ip6.longs.one_be : &addr.ip6.longs.two_be;
- uint64_t bitmask = (uint64_t)1 << (63 - (bucket % 64));
- *addrPart ^= Endian_hostToBigEndian64(bitmask);
- Assert_ifParanoid(bucket == NodeStore_bucketForAddr(source, &addr));
- return addr;
- }
- uint16_t NodeStore_bucketForAddr(struct Address* source, struct Address* dest)
- {
- Assert_compileTime(NodeStore_bucketNumber == 128);
- uint16_t bucket = 0;
- uint64_t addrPart = source->ip6.longs.one_be ^ dest->ip6.longs.one_be;
- if (!addrPart) {
- addrPart = source->ip6.longs.two_be ^ dest->ip6.longs.two_be;
- bucket += 64;
- }
- addrPart = Endian_bigEndianToHost64(addrPart);
- bucket += 63 - Bits_log2x64(addrPart);
- return bucket;
- }
- uint64_t NodeStore_timeSinceLastPing(struct NodeStore* nodeStore, struct Node_Two* node)
- {
- struct NodeStore_pvt* store = Identity_check((struct NodeStore_pvt*)nodeStore);
- uint64_t now = Time_currentTimeMilliseconds(store->eventBase);
- uint64_t lastSeen = node->timeLastPinged;
- struct Node_Link* link = Node_getBestParent(node);
- while (link && link != store->selfLink) {
- lastSeen = (link->timeLastSeen < lastSeen) ? link->timeLastSeen : lastSeen;
- link = Node_getBestParent(link->parent);
- }
- return now - lastSeen;
- }
|