/* vim: set expandtab ts=4 sw=4: */ /* * You may redistribute this program and/or modify it under the terms of * the GNU General Public License as published by the Free Software Foundation, * either version 3 of the License, or (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see . */ #include "crypto/AddressCalc.h" #include "dht/dhtcore/ReplySerializer.h" #include "net/SwitchPinger.h" #include "subnode/ReachabilityCollector.h" #include "util/log/Log.h" #include "util/Identity.h" #include "util/events/Timeout.h" #include "util/AddrTools.h" #include "util/events/Time.h" #include #include #define TIMEOUT_MILLISECONDS 10000 struct ReachabilityCollector_pvt; struct PeerInfo_pvt { struct ReachabilityCollector_PeerInfo pub; struct ReachabilityCollector_pvt* rcp; // Next path to check when sending getPeers requests to our peer looking for ourselves. uint64_t pathToCheck; // For this 10 second period uint32_t sumOfLag; uint32_t lagSamples; uint32_t timeOfLastLagUpdate; uint64_t sumOfDropsLastSlot; uint64_t sumOfPacketsLastSlot; uint64_t sumOfKbLastSlot; uint64_t sumOfDrops; uint64_t sumOfPackets; uint64_t sumOfKb; // We have an outstanding query and we are waiting for a response from this peer. bool waitForResponse; struct Allocator* alloc; Identity }; #define ArrayList_NAME OfPeerInfo_pvt #define ArrayList_TYPE struct PeerInfo_pvt #include "util/ArrayList.h" struct ReachabilityCollector_pvt { struct ReachabilityCollector pub; struct MsgCore* msgCore; struct Allocator* alloc; struct Log* log; struct BoilerplateResponder* br; struct Address* myAddr; EventBase_t* base; struct EncodingScheme* myScheme; struct SwitchPinger* sp; uint32_t resampleCycle; uint32_t linkStateSamples; struct ArrayList_OfPeerInfo_pvt* piList; Identity }; static struct PeerInfo_pvt* piForLabel(struct ReachabilityCollector_pvt* rcp, uint64_t label) { for (int j = 0; j < rcp->piList->length; j++) { struct PeerInfo_pvt* pi0 = ArrayList_OfPeerInfo_pvt_get(rcp->piList, j); if (pi0->pub.addr.path == label) { return pi0; } } return NULL; } struct ReachabilityCollector_PeerInfo* ReachabilityCollector_piForLabel(struct ReachabilityCollector* rc, uint64_t label) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) rc); struct PeerInfo_pvt* out = piForLabel(rcp, label); return out ? &out->pub : NULL; } static struct PeerInfo_pvt* piForAddr(struct ReachabilityCollector_pvt* rcp, struct Address* addr) { struct PeerInfo_pvt* pi = piForLabel(rcp, addr->path); if (pi && Address_isSame(&pi->pub.addr, addr)) { return pi; } return NULL; } static void piOnFree(struct Allocator_OnFreeJob* j) { struct PeerInfo_pvt* pi = Identity_check((struct PeerInfo_pvt*) j->userData); struct ReachabilityCollector_pvt* rcp = Identity_check(pi->rcp); for (int j = 0; j < rcp->piList->length; j++) { struct PeerInfo_pvt* pi0 = ArrayList_OfPeerInfo_pvt_get(rcp->piList, j); if (pi0 != pi) { continue; } ArrayList_OfPeerInfo_pvt_remove(rcp->piList, j); } } static void mkNextRequest(struct ReachabilityCollector_pvt* rcp); void ReachabilityCollector_unreachable(struct ReachabilityCollector* rc, struct Address* nodeAddr) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) rc); struct PeerInfo_pvt* pi = piForAddr(rcp, nodeAddr); if (pi) { Log_debug(rcp->log, "Peer [%s] dropped", Address_toString(&pi->pub.addr, pi->alloc)->bytes); rcp->pub.onChange(&rcp->pub, &pi->pub.addr, NULL); Allocator_free(pi->alloc); return; } uint8_t buf[60]; Address_print(buf, nodeAddr); Log_debug(rcp->log, "Nonexistant peer [%s] dropped", buf); return; } static void change0(struct ReachabilityCollector_pvt* rcp, struct Address* nodeAddr, struct Allocator* tempAlloc) { struct PeerInfo_pvt* oldPi = piForLabel(rcp, nodeAddr->path); if (oldPi) { if (Address_isSame(&oldPi->pub.addr, nodeAddr)) { // Log_debug(rcp->log, "Peer [%s] message, peer already registered", // Address_toString(nodeAddr, tempAlloc)->bytes); return; } Log_debug(rcp->log, "Dropping ghost peer [%s] to add peer [%s]", Address_toString(&oldPi->pub.addr, tempAlloc)->bytes, Address_toString(nodeAddr, tempAlloc)->bytes); ReachabilityCollector_unreachable(&rcp->pub, &oldPi->pub.addr); } struct Allocator* piAlloc = Allocator_child(rcp->alloc); struct PeerInfo_pvt* pi = Allocator_calloc(piAlloc, sizeof(struct PeerInfo_pvt), 1); Identity_set(pi); pi->rcp = rcp; Bits_memcpy(&pi->pub.addr, nodeAddr, Address_SIZE); pi->alloc = piAlloc; pi->pub.isQuerying = true; pi->pathToCheck = 1; Allocator_onFree(piAlloc, piOnFree, pi); ArrayList_OfPeerInfo_pvt_add(rcp->piList, pi); Log_debug(rcp->log, "Peer [%s] added", Address_toString(&pi->pub.addr, tempAlloc)->bytes); mkNextRequest(rcp); } void ReachabilityCollector_change(struct ReachabilityCollector* rc, struct Address* nodeAddr) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) rc); struct Allocator* tempAlloc = Allocator_child(rcp->alloc); change0(rcp, nodeAddr, tempAlloc); Allocator_free(tempAlloc); } struct Query { struct ReachabilityCollector_pvt* rcp; uint8_t targetPath[20]; Identity }; static void onReplyTimeout(struct MsgCore_Promise* prom) { struct Query* q = Identity_check((struct Query*) prom->userData); struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) q->rcp); Log_debug(rcp->log, "Timeout querying [%s]", Address_toString(prom->target, prom->alloc)->bytes); struct PeerInfo_pvt* pi = piForAddr(rcp, prom->target); if (pi) { pi->waitForResponse = false; } } static void latencyUpdate( struct ReachabilityCollector_pvt* rcp, struct PeerInfo_pvt* pip, uint32_t lag) { //Log_debug(rcp->log, "Latency update for [%" PRIx64 "] [%u]ms", pip->pub.addr.path, lag); pip->sumOfLag += lag; pip->lagSamples++; pip->timeOfLastLagUpdate = Time_currentTimeMilliseconds(); } static void onReplyOld(Dict* msg, struct Address* src, struct MsgCore_Promise* prom) { struct Query* q = Identity_check((struct Query*) prom->userData); struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) q->rcp); if (!src) { onReplyTimeout(prom); mkNextRequest(rcp); return; } Log_debug(rcp->log, "Got response from peer [%s]", Address_toString(src, prom->alloc)->bytes); struct PeerInfo_pvt* pi = piForAddr(rcp, src); if (!pi) { Log_debug(rcp->log, "Got message from peer [%s] which is gone from list", Address_toString(src, prom->alloc)->bytes); return; } pi->waitForResponse = false; latencyUpdate(rcp, pi, prom->lag); struct Address_List* results = ReplySerializer_parse(src, msg, rcp->log, false, prom->alloc); uint64_t path = 1; if (!results) { Log_debug(rcp->log, "Got invalid getPeers reply from [%s]", Address_toString(src, prom->alloc)->bytes); return; } for (int i = results->length - 1; i >= 0; i--) { path = results->elems[i].path; if (Bits_memcmp(results->elems[i].ip6.bytes, rcp->myAddr->ip6.bytes, 16)) { continue; } // We're going to get one or more paths from them to us // We don't have a clue which one is correct, but we'll try to reduce // flap by sticking to one after we've adopted it. if (pi->pub.pathThemToUs == path) { Log_debug(rcp->log, "Found back-route for [%s] (exact match)", Address_toString(src, prom->alloc)->bytes); pi->pub.isQuerying = false; mkNextRequest(rcp); return; } } // Ok, no matches, if any of them mismatch then we're going to change for (int i = results->length - 1; i >= 0; i--) { path = results->elems[i].path; if (Bits_memcmp(results->elems[i].ip6.bytes, rcp->myAddr->ip6.bytes, 16)) { continue; } Log_debug(rcp->log, "Found back-route for [%s]", Address_toString(src, prom->alloc)->bytes); pi->pub.pathThemToUs = path; rcp->pub.onChange(&rcp->pub, src, &pi->pub); pi->pub.isQuerying = false; mkNextRequest(rcp); return; } if (results->length < 8) { // Peer's gp response does not include my addr, meaning the peer might not know us yet. // should wait peer sendPing (see InterfaceControl.c). Log_debug(rcp->log, "No back-route found for peer [%s]", Address_toString(src, prom->alloc)->bytes); pi->pathToCheck = 1; return; } else { pi->pathToCheck = path; } mkNextRequest(rcp); } static void queryOldPeer(struct ReachabilityCollector_pvt* rcp, struct PeerInfo_pvt* pi) { struct MsgCore_Promise* query = MsgCore_createQuery(rcp->msgCore, TIMEOUT_MILLISECONDS, rcp->alloc); struct Query* q = Allocator_calloc(query->alloc, sizeof(struct Query), 1); Identity_set(q); q->rcp = rcp; query->userData = q; query->cb = onReplyOld; Assert_true(AddressCalc_validAddress(pi->pub.addr.ip6.bytes)); query->target = Address_clone(&pi->pub.addr, query->alloc); Assert_true(pi->pub.addr.path); Dict* d = query->msg = Dict_new(query->alloc); Dict_putStringCC(d, "q", "gp", query->alloc); // getpeers (if < v21) uint64_t label_be = Endian_hostToBigEndian64(pi->pathToCheck); uint8_t nearbyLabelBytes[8]; Bits_memcpy(nearbyLabelBytes, &label_be, 8); AddrTools_printPath(q->targetPath, pi->pathToCheck); Log_debug(rcp->log, "Getting reverse path for old peer [%s] tar [%s]", Address_toString(&pi->pub.addr, query->alloc)->bytes, q->targetPath); Dict_putStringC(d, "tar", String_newBinary(nearbyLabelBytes, 8, query->alloc), query->alloc); BoilerplateResponder_addBoilerplate(rcp->br, d, &pi->pub.addr, query->alloc); pi->waitForResponse = true; } static void pingReply(Dict* msg, struct Address* src, struct MsgCore_Promise* prom) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) prom->userData); struct PeerInfo_pvt* pi = piForAddr(rcp, prom->target); if (!pi) { if (src) { Log_debug(rcp->log, "Got message from peer [%s] which is gone from list", Address_toString(src, prom->alloc)->bytes); } return; } pi->waitForResponse = false; if (!src) { //Log_debug(pf->log, "Ping timeout"); return; } Log_debug(rcp->log, "Ping reply from [%s]", Address_toString(src, prom->alloc)->bytes); latencyUpdate(rcp, pi, prom->lag); } static void pingPeer(struct ReachabilityCollector_pvt* rcp, struct PeerInfo_pvt* pi) { struct MsgCore_Promise* qp = MsgCore_createQuery(rcp->msgCore, 0, rcp->alloc); Dict* dict = qp->msg = Dict_new(qp->alloc); qp->cb = pingReply; qp->userData = rcp; Assert_true(AddressCalc_validAddress(pi->pub.addr.ip6.bytes)); Assert_true(pi->pub.addr.path); qp->target = Address_clone(&pi->pub.addr, qp->alloc); Log_debug(rcp->log, "Pinging [%s] to determine latency", Address_toString(qp->target, qp->alloc)->bytes); Dict_putStringCC(dict, "q", "pn", qp->alloc); BoilerplateResponder_addBoilerplate(rcp->br, dict, qp->target, qp->alloc); } static void peerResponseOK( struct ReachabilityCollector_pvt* rcp, struct PeerInfo_pvt* pi, struct SwitchPinger_Response* resp) { ReachabilityCollector_lagSample(&rcp->pub, resp->label, resp->milliseconds); Log_debug(rcp->log, "Found back-route for [%s] (sp)", Address_toString(&pi->pub.addr, resp->ping->pingAlloc)->bytes); pi->pub.pathThemToUs = resp->rpath; rcp->pub.onChange(&rcp->pub, &pi->pub.addr, &pi->pub); pi->pub.isQuerying = false; pingPeer(rcp, pi); mkNextRequest(rcp); } static void peerResponse(struct SwitchPinger_Response* resp, void* userData) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) userData); struct PeerInfo_pvt* pi = piForLabel(rcp, resp->label); if (!pi) { Log_debug(rcp->log, "Response from [%" PRIx64 "] with no peer info", resp->label); mkNextRequest(rcp); return; } Log_debug(rcp->log, "Response from [%" PRIx64 "] [%d]", resp->label, pi->waitForResponse); pi->waitForResponse = false; char* err = ""; switch (resp->res) { case SwitchPinger_Result_OK: peerResponseOK(rcp, pi, resp); return; case SwitchPinger_Result_LABEL_MISMATCH: err = "LABEL_MISMATCH"; break; case SwitchPinger_Result_WRONG_DATA: err = "WRONG_DATA"; break; case SwitchPinger_Result_ERROR_RESPONSE: err = "ERROR_RESPONSE"; break; case SwitchPinger_Result_LOOP_ROUTE: err = "LOOP_ROUTE"; break; case SwitchPinger_Result_TIMEOUT: err = "TIMEOUT"; break; default: err = "unknown error"; break; } // We don't want to unreachable the peer here because this could be spurious packet loss Log_debug(rcp->log, "Error sending rpath query to peer [%s]", err); mkNextRequest(rcp); } static void queryBackroute(struct ReachabilityCollector_pvt* rcp, struct PeerInfo_pvt* pi) { if (pi->pub.addr.protocolVersion == 0) { // We don't know the version yet, we don't need to explicitly message the peer // here, we're going to discover it one way or another from talking to them. return; } else if (pi->pub.addr.protocolVersion < 21) { queryOldPeer(rcp, pi); return; } struct SwitchPinger_Ping* p = SwitchPinger_newPing( pi->pub.addr.path, String_CONST(""), 3000, peerResponse, rcp->alloc, rcp->sp); Assert_true(p); Log_debug(rcp->log, "Getting reverse path for new peer [%s]", Address_toString(&pi->pub.addr, p->pingAlloc)->bytes); p->type = SwitchPinger_Type_RPATH; p->onResponseContext = rcp; pi->waitForResponse = true; } static void mkNextRequest(struct ReachabilityCollector_pvt* rcp) { struct PeerInfo_pvt* pi = NULL; for (int i = 0; i < rcp->piList->length; i++) { pi = ArrayList_OfPeerInfo_pvt_get(rcp->piList, i); if (pi->pub.addr.protocolVersion == 0) { continue; } if (pi->pub.isQuerying && !pi->waitForResponse) { break; } } if (!pi || !pi->pub.isQuerying) { // if (rcp->piList->length > 0) { // Log_debug(rcp->log, "All [%u] peers have been queried", rcp->piList->length); // } return; } if (pi->waitForResponse) { Log_debug(rcp->log, "Message outstanding, waiting for peer to respond"); return; } queryBackroute(rcp, pi); } static void cycle(void* vrc) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) vrc); mkNextRequest(rcp); // 10 second window is cut into 5 intervals // second 0, 2, 4, 6, 8 // number 1, 2, 3, 4, 5 // in number 4, we will ping any peer who has not received one yet to get latency // in number 5, we will collect everything back rcp->resampleCycle++; if (rcp->resampleCycle < 4) { return; } for (int j = 0; j < rcp->piList->length; j++) { struct PeerInfo_pvt* pi = ArrayList_OfPeerInfo_pvt_get(rcp->piList, j); Log_debug(rcp->log, "Visiting peer [%" PRIx64 "] samples [%u]", pi->pub.addr.path, pi->lagSamples); if (pi->lagSamples == 0 && !pi->waitForResponse) { pingPeer(rcp, pi); } if (rcp->resampleCycle < 5) { continue; } int sampleNum = rcp->linkStateSamples % LinkState_SLOTS; uint64_t drops = pi->sumOfDrops - pi->sumOfDropsLastSlot; // uint64 rollover, will "never" happen //if (drops < pi->sumOfDrops) { drops = pi->sumOfDrops; } uint64_t packets = pi->sumOfPackets - pi->sumOfPacketsLastSlot; //if (packets < pi->sumOfPackets) { drops = pi->sumOfPackets; } uint64_t dropRateShl18 = packets ? (drops << 18) / packets : 0; pi->pub.linkState.dropSlots[sampleNum] = dropRateShl18 > 0xfffe ? 0xfffe : dropRateShl18; pi->sumOfDropsLastSlot = pi->sumOfDrops; Log_debug(rcp->log, "[%" PRIx64 "] has sumOfDrops [%" PRIu64 "] sumOfDropsLastSlot [%" PRIu64 "]", pi->pub.addr.path, pi->sumOfDrops, pi->sumOfDropsLastSlot); pi->pub.linkState.kbRecvSlots[sampleNum] = pi->sumOfKb - pi->sumOfKbLastSlot; pi->sumOfKbLastSlot = pi->sumOfKb; pi->pub.linkState.lagSlots[sampleNum] = pi->lagSamples ? pi->sumOfLag / pi->lagSamples : 0; pi->sumOfLag = 0; pi->lagSamples = 0; pi->pub.linkState.samples = rcp->linkStateSamples + 1; } if (rcp->resampleCycle >= 5) { rcp->resampleCycle = 0; rcp->linkStateSamples++; } } struct ReachabilityCollector_PeerInfo* ReachabilityCollector_getPeerInfo(struct ReachabilityCollector* rc, int peerNum) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) rc); struct PeerInfo_pvt* pi = ArrayList_OfPeerInfo_pvt_get(rcp->piList, peerNum); return pi ? &pi->pub : NULL; } int ReachabilityCollector_peerCount(struct ReachabilityCollector* rc) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) rc); return rcp->piList->length; } void ReachabilityCollector_lagSample( struct ReachabilityCollector* rc, uint64_t label, uint32_t milliseconds) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) rc); struct PeerInfo_pvt* pi = piForLabel(rcp, label); if (!pi) { return; } latencyUpdate(rcp, pi, milliseconds); } void ReachabilityCollector_updateBandwidthAndDrops( struct ReachabilityCollector* rc, uint64_t label, uint64_t sumOfPackets, uint64_t sumOfDrops, uint64_t sumOfKb) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) rc); struct PeerInfo_pvt* pi = piForLabel(rcp, label); if (!pi) { return; } pi->sumOfPackets = sumOfPackets; pi->sumOfDrops = sumOfDrops; pi->sumOfKb = sumOfKb; } static void dummyOnChange( struct ReachabilityCollector* rc, struct Address* addr, struct ReachabilityCollector_PeerInfo* pi) { struct ReachabilityCollector_pvt* rcp = Identity_check((struct ReachabilityCollector_pvt*) rc); Log_debug(rcp->log, "dummyOnChange called, onChange unassigned"); } struct ReachabilityCollector* ReachabilityCollector_new(struct Allocator* allocator, struct MsgCore* msgCore, struct Log* log, EventBase_t* base, struct BoilerplateResponder* br, struct Address* myAddr, struct EncodingScheme* myScheme, struct SwitchPinger* sp) { struct Allocator* alloc = Allocator_child(allocator); struct ReachabilityCollector_pvt* rcp = Allocator_calloc(alloc, sizeof(struct ReachabilityCollector_pvt), 1); rcp->myAddr = myAddr; rcp->msgCore = msgCore; rcp->alloc = alloc; rcp->piList = ArrayList_OfPeerInfo_pvt_new(alloc); rcp->log = log; rcp->br = br; rcp->base = base; rcp->pub.onChange = dummyOnChange; rcp->myScheme = myScheme; rcp->sp = sp; Identity_set(rcp); Timeout_setInterval(cycle, rcp, 2000, base, alloc); return &rcp->pub; }