More multicast work...
This commit is contained in:
parent
592e743349
commit
bccb86a401
7 changed files with 410 additions and 230 deletions
|
@ -17,6 +17,7 @@
|
|||
#include "RuntimeEnvironment.hpp"
|
||||
#include "Multicaster.hpp"
|
||||
#include "Network.hpp"
|
||||
#include "Membership.hpp"
|
||||
#include "Topology.hpp"
|
||||
#include "Switch.hpp"
|
||||
|
||||
|
@ -28,7 +29,7 @@ Multicaster::Multicaster(const RuntimeEnvironment *renv) :
|
|||
|
||||
Multicaster::~Multicaster() {}
|
||||
|
||||
void Multicaster::send(
|
||||
unsigned int Multicaster::send(
|
||||
void *tPtr,
|
||||
int64_t now,
|
||||
const SharedPtr<Network> &network,
|
||||
|
@ -40,104 +41,218 @@ void Multicaster::send(
|
|||
const void *const data,
|
||||
unsigned int len)
|
||||
{
|
||||
static const unsigned int PRIMES[16] = { 2,3,5,7,11,13,17,19,23,29,31,37,41,43,47,53 };
|
||||
static const unsigned int PRIMES[16] = { 3,5,7,11,13,17,19,23,29,31,37,41,43,47,53,59 }; // 2 is skipped as it's even
|
||||
|
||||
if (unlikely(len > ZT_MAX_MTU)) return; // sanity check
|
||||
std::vector< std::pair<int64_t,Address> > recipients;
|
||||
|
||||
const NetworkConfig &config = network->config();
|
||||
if (config.multicastLimit == 0) return; // multicast disabled
|
||||
Address bridges[ZT_MAX_NETWORK_SPECIALISTS],multicastReplicators[ZT_MAX_NETWORK_SPECIALISTS];
|
||||
unsigned int bridgeCount = 0,multicastReplicatorCount = 0;
|
||||
|
||||
Address specialists[ZT_MAX_NETWORK_SPECIALISTS],multicastReplicators[ZT_MAX_NETWORK_SPECIALISTS];
|
||||
unsigned int specialistCount = 0,multicastReplicatorCount = 0,bridgeCount = 0;
|
||||
bool amMulticastReplicator = false;
|
||||
for(unsigned int i=0;i<config.specialistCount;++i) {
|
||||
if ((config.specialists[i] & ZT_NETWORKCONFIG_SPECIALIST_TYPE_ACTIVE_BRIDGE) != 0)
|
||||
bridges[bridgeCount++] = config.specialists[i];
|
||||
if ((config.specialists[i] & ZT_NETWORKCONFIG_SPECIALIST_TYPE_MULTICAST_REPLICATOR) != 0)
|
||||
multicastReplicators[multicastReplicatorCount++] = config.specialists[i];
|
||||
if (RR->identity.address() == config.specialists[i]) {
|
||||
amMulticastReplicator |= ((config.specialists[i] & ZT_NETWORKCONFIG_SPECIALIST_TYPE_MULTICAST_REPLICATOR) != 0);
|
||||
} else {
|
||||
specialists[specialistCount++] = config.specialists[i];
|
||||
if ((config.specialists[i] & ZT_NETWORKCONFIG_SPECIALIST_TYPE_ACTIVE_BRIDGE) != 0) {
|
||||
recipients.push_back(std::pair<int64_t,Address>(0,config.specialists[i]));
|
||||
++bridgeCount;
|
||||
} if ((config.specialists[i] & ZT_NETWORKCONFIG_SPECIALIST_TYPE_MULTICAST_REPLICATOR) != 0) {
|
||||
multicastReplicators[multicastReplicatorCount++] = config.specialists[i];
|
||||
}
|
||||
}
|
||||
}
|
||||
std::sort(&(specialists[0]),&(specialists[specialistCount])); // for binary search
|
||||
|
||||
std::vector< std::pair<int64_t,Address> > recipients;
|
||||
bool needMoar = false;
|
||||
for(unsigned int i=0;i<bridgeCount;++i)
|
||||
recipients.push_back(std::pair<int64_t,Address>(9223372036854775807LL,bridges[i]));
|
||||
int64_t lastGather = 0;
|
||||
_K groupKey(network->id(),mg);
|
||||
{
|
||||
Mutex::Lock l2(_groups_l);
|
||||
_getMembersByTime(network->id(),mg,recipients);
|
||||
}
|
||||
std::sort(recipients.begin() + bridgeCount,recipients.end(),std::greater< std::pair<int64_t,Address> >());
|
||||
recipients.erase(std::unique(recipients.begin(),recipients.end()),recipients.end());
|
||||
if (recipients.size() > config.multicastLimit) {
|
||||
recipients.resize(config.multicastLimit);
|
||||
} else if (recipients.size() < config.multicastLimit) {
|
||||
needMoar = true;
|
||||
}
|
||||
|
||||
_txQueue_l.lock();
|
||||
_OM *om = &(_txQueue[_txQueuePtr++ % ZT_TX_QUEUE_SIZE]);
|
||||
Mutex::Lock ql(om->lock);
|
||||
_txQueue_l.unlock();
|
||||
|
||||
om->nwid = network->id();
|
||||
om->src = src;
|
||||
om->mg = mg;
|
||||
om->etherType = etherType;
|
||||
om->dataSize = len;
|
||||
memcpy(om->data,data,len);
|
||||
|
||||
if (existingBloom) {
|
||||
om->bloomFilterMultiplier = existingBloomMultiplier;
|
||||
memcpy(om->bloomFilter,existingBloom,sizeof(om->bloomFilter));
|
||||
} else {
|
||||
om->bloomFilterMultiplier = 1;
|
||||
memset(om->bloomFilter,0,sizeof(om->bloomFilter));
|
||||
|
||||
if (recipients.size() > 1) {
|
||||
unsigned int mult = 1;
|
||||
unsigned int bestMultColl = 0xffffffff;
|
||||
for(int k=0;k<16;++k) { // 16 == arbitrary limit on iterations for this search, also must be <= size of PRIMES
|
||||
unsigned int coll = 0;
|
||||
for(std::vector< std::pair<int64_t,Address> >::const_iterator r(recipients.begin());r!=recipients.end();++r) {
|
||||
const unsigned int bfi = mult * (unsigned int)r->second.toInt();
|
||||
const unsigned int byte = (bfi >> 3) % sizeof(om->bloomFilter);
|
||||
const uint8_t bit = 1 << (bfi & 7);
|
||||
coll += ((om->bloomFilter[byte] & bit) != 0);
|
||||
om->bloomFilter[byte] |= bit;
|
||||
}
|
||||
memset(om->bloomFilter,0,sizeof(om->bloomFilter));
|
||||
|
||||
if (coll <= bestMultColl) {
|
||||
om->bloomFilterMultiplier = mult;
|
||||
if (coll == 0) // perfect score, no need to continue searching
|
||||
break;
|
||||
bestMultColl = coll;
|
||||
}
|
||||
|
||||
mult = PRIMES[k];
|
||||
Mutex::Lock l(_groups_l);
|
||||
const _G *const g = _groups.get(groupKey);
|
||||
if (g) {
|
||||
lastGather = g->lastGather;
|
||||
recipients.reserve(recipients.size() + g->members.size());
|
||||
Hashtable< Address,int64_t >::Iterator mi(const_cast<_G *>(g)->members);
|
||||
Address *mik = nullptr;
|
||||
int64_t *miv = nullptr;
|
||||
while (mi.next(mik,miv)) {
|
||||
if (!std::binary_search(&(specialists[0]),&(specialists[specialistCount]),*mik))
|
||||
recipients.push_back(std::pair<int64_t,Address>(*miv,*mik));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (multicastReplicatorCount > 0) {
|
||||
// SEND
|
||||
return;
|
||||
// Sort recipients, maintaining bridges first in list
|
||||
std::sort(recipients.begin() + bridgeCount,recipients.end(),std::greater< std::pair<int64_t,Address> >());
|
||||
|
||||
// Gather new recipients periodically, being more aggressive if we have none.
|
||||
if ((now - lastGather) > (recipients.empty() ? 5000 : ZT_MULTICAST_GATHER_PERIOD)) {
|
||||
{
|
||||
Mutex::Lock l(_groups_l);
|
||||
_groups[groupKey].lastGather = now;
|
||||
}
|
||||
|
||||
Packet outp(network->controller(),RR->identity.address(),Packet::VERB_MULTICAST_GATHER);
|
||||
outp.append(network->id());
|
||||
outp.append((uint8_t)0);
|
||||
mg.mac().appendTo(outp);
|
||||
outp.append(mg.adi());
|
||||
outp.append((uint32_t)0xffffffff);
|
||||
RR->sw->send(tPtr,outp,true);
|
||||
|
||||
for(unsigned int i=0;i<specialistCount;++i) {
|
||||
outp.newInitializationVector();
|
||||
outp.setDestination(specialists[i]);
|
||||
RR->sw->send(tPtr,outp,true);
|
||||
}
|
||||
|
||||
// LEGACY: roots may know about older versions' multicast subscriptions but
|
||||
// the root's role here is being phased out.
|
||||
SharedPtr<Peer> root(RR->topology->root(now));
|
||||
if (root) {
|
||||
outp.newInitializationVector();
|
||||
outp.setDestination(root->address());
|
||||
outp.armor(root->key(),true);
|
||||
root->sendDirect(tPtr,outp.data(),outp.size(),now,true);
|
||||
}
|
||||
}
|
||||
|
||||
SharedPtr<Peer> nextHops[2]; // these by definition are protocol version >= 11
|
||||
unsigned int nextHopsBestLatency[2] = { 0xffff,0xffff };
|
||||
for(std::vector< std::pair<int64_t,Address> >::const_iterator r(recipients.begin());r!=recipients.end();++r) {
|
||||
const unsigned int bfi = om->bloomFilterMultiplier * (unsigned int)r->second.toInt();
|
||||
const unsigned int bfbyte = (bfi >> 3) % sizeof(om->bloomFilter);
|
||||
const uint8_t bfbit = 1 << (bfi & 7);
|
||||
if ((om->bloomFilter[bfbyte] & bfbit) != 0) {
|
||||
continue;
|
||||
} else {
|
||||
SharedPtr<Peer> peer(RR->topology->get(r->second));
|
||||
if (peer) {
|
||||
if (peer->remoteVersionProtocol() < 11) {
|
||||
// SEND
|
||||
if (recipients.empty())
|
||||
return 0;
|
||||
|
||||
om->bloomFilter[bfbyte] |= bfbit;
|
||||
continue;
|
||||
} else {
|
||||
unsigned int sentCount = 0;
|
||||
|
||||
uint64_t bloomFilter[ZT_MULTICAST_BLOOM_FILTER_SIZE_BITS / 64];
|
||||
unsigned int bloomMultiplier;
|
||||
if (existingBloom) {
|
||||
memcpy(bloomFilter,existingBloom,sizeof(bloomFilter));
|
||||
bloomMultiplier = existingBloomMultiplier;
|
||||
} else {
|
||||
memset(bloomFilter,0,sizeof(bloomFilter));
|
||||
bloomMultiplier = 1;
|
||||
|
||||
// Iteratively search for a bloom multiplier that results in no collisions
|
||||
// among known recipients. Usually the first iteration is good unless
|
||||
// the recipient set is quite large.
|
||||
if (recipients.size() > 1) {
|
||||
unsigned long bestMultColl = 0xffffffff;
|
||||
for(int k=0;k<16;++k) { // 16 == arbitrary limit on iterations for this search, also must be <= size of PRIMES
|
||||
const unsigned int mult = PRIMES[k];
|
||||
unsigned long coll = 0;
|
||||
for(std::vector< std::pair<int64_t,Address> >::const_iterator r(recipients.begin());r!=recipients.end();++r) {
|
||||
const unsigned int bfi = mult * (unsigned int)r->second.toInt();
|
||||
const unsigned int byte = (bfi >> 3) % sizeof(bloomFilter);
|
||||
const uint8_t bit = 1 << (bfi & 7);
|
||||
coll += ((((uint8_t *)bloomFilter)[byte] & bit) != 0);
|
||||
((uint8_t *)bloomFilter)[byte] |= bit;
|
||||
}
|
||||
memset(bloomFilter,0,sizeof(bloomFilter));
|
||||
|
||||
if (coll <= bestMultColl) {
|
||||
bloomMultiplier = mult;
|
||||
if (coll == 0) // perfect score, no need to continue searching
|
||||
break;
|
||||
bestMultColl = coll;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// See if there is a multicast replicator, trying to pick the fastest/best one.
|
||||
Address bestReplicator;
|
||||
if (multicastReplicatorCount > 0) {
|
||||
unsigned int bestReplicatorLatency = 0xffff;
|
||||
for(unsigned int i=0;i<multicastReplicatorCount;++i) {
|
||||
const unsigned int bfi = bloomMultiplier * (unsigned int)multicastReplicators[i].toInt();
|
||||
if ((((uint8_t *)bloomFilter)[(bfi >> 3) % sizeof(bloomFilter)] & (1 << (bfi & 7))) == 0) {
|
||||
SharedPtr<Peer> peer(RR->topology->get(multicastReplicators[i]));
|
||||
if (peer) {
|
||||
const unsigned int lat = peer->latency(now);
|
||||
if (lat <= bestReplicatorLatency) {
|
||||
bestReplicator = peer->address();
|
||||
bestReplicatorLatency = lat;
|
||||
}
|
||||
} else if (!bestReplicator) {
|
||||
bestReplicator = multicastReplicators[i];
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// If this is a multicast replicator, aggressively replicate. Multicast
|
||||
// replicators are not subject to send count limits.
|
||||
if (amMulticastReplicator) {
|
||||
std::vector< std::pair< int,Address > > byLatency;
|
||||
for(std::vector< std::pair<int64_t,Address> >::const_iterator r(recipients.begin());r!=recipients.end();++r) {
|
||||
const unsigned int bfi = bloomMultiplier * (unsigned int)r->second.toInt();
|
||||
if ((((uint8_t *)bloomFilter)[(bfi >> 3) % sizeof(bloomFilter)] & (1 << (bfi & 7))) == 0) {
|
||||
SharedPtr<Peer> peer(RR->topology->get(r->second));
|
||||
byLatency.push_back(std::pair< int,Address >((peer) ? (int)peer->latency(now) : 0xffff,r->second));
|
||||
}
|
||||
}
|
||||
std::sort(byLatency.begin(),byLatency.end());
|
||||
|
||||
unsigned long cnt = byLatency.size();
|
||||
if (bestReplicator)
|
||||
cnt /= 2; // send to only the best half of the latency-sorted population if there are more replicators
|
||||
for(unsigned long i=0;i<cnt;++i) {
|
||||
const unsigned int bfi = bloomMultiplier * (unsigned int)byLatency[i].second.toInt();
|
||||
((uint8_t *)bloomFilter)[(bfi >> 3) % sizeof(bloomFilter)] |= 1 << (bfi & 7);
|
||||
|
||||
Packet outp(byLatency[i].second,RR->identity.address(),Packet::VERB_MULTICAST_FRAME);
|
||||
outp.append(network->id());
|
||||
outp.append((uint8_t)0x04);
|
||||
src.appendTo(outp);
|
||||
mg.mac().appendTo(outp);
|
||||
outp.append(mg.adi());
|
||||
outp.append((uint16_t)etherType);
|
||||
outp.append(data,len);
|
||||
outp.compress();
|
||||
RR->sw->send(tPtr,outp,true);
|
||||
|
||||
++sentCount;
|
||||
}
|
||||
}
|
||||
|
||||
// Forward to the next multicast replicator, if any.
|
||||
if (bestReplicator) {
|
||||
const unsigned int bfi = bloomMultiplier * (unsigned int)bestReplicator.toInt();
|
||||
((uint8_t *)bloomFilter)[(bfi >> 3) % sizeof(bloomFilter)] |= 1 << (bfi & 7);
|
||||
|
||||
Packet outp(bestReplicator,RR->identity.address(),Packet::VERB_MULTICAST_FRAME);
|
||||
outp.append((uint8_t)(0x04 | 0x08));
|
||||
RR->identity.address().appendTo(outp);
|
||||
outp.append((uint16_t)bloomMultiplier);
|
||||
outp.append((uint16_t)sizeof(bloomFilter));
|
||||
outp.append(((uint8_t *)bloomFilter),sizeof(bloomFilter));
|
||||
src.appendTo(outp);
|
||||
mg.mac().appendTo(outp);
|
||||
outp.append(mg.adi());
|
||||
outp.append((uint16_t)etherType);
|
||||
outp.append(data,len);
|
||||
outp.compress();
|
||||
RR->sw->send(tPtr,outp,true);
|
||||
|
||||
++sentCount;
|
||||
}
|
||||
|
||||
// If this is a multicast replicator, we've already replicated.
|
||||
if (amMulticastReplicator)
|
||||
return (unsigned int)recipients.size();
|
||||
|
||||
// Find the two best next hops (that have never seen this multicast)
|
||||
// that are newer version nodes.
|
||||
SharedPtr<Peer> nextHops[2];
|
||||
unsigned int nextHopsBestLatency[2] = { 0xffff,0xffff };
|
||||
for(std::vector< std::pair<int64_t,Address> >::iterator r(recipients.begin());r!=recipients.end();++r) {
|
||||
if (r->first >= 0) {
|
||||
const unsigned int bfi = bloomMultiplier * (unsigned int)r->second.toInt();
|
||||
if ((((uint8_t *)bloomFilter)[(bfi >> 3) % sizeof(bloomFilter)] & (1 << (bfi & 7))) == 0) {
|
||||
const SharedPtr<Peer> peer(RR->topology->get(r->second));
|
||||
if ((peer)&&(peer->remoteVersionProtocol() >= 11)) {
|
||||
r->first = -1; // use this field now to flag as non-legacy
|
||||
const unsigned int lat = peer->latency(now);
|
||||
for(unsigned int nh=0;nh<2;++nh) {
|
||||
if (lat <= nextHopsBestLatency[nh]) {
|
||||
|
@ -151,17 +266,57 @@ void Multicaster::send(
|
|||
}
|
||||
}
|
||||
|
||||
// Set bits for next hops in bloom filter
|
||||
for(unsigned int nh=0;nh<2;++nh) {
|
||||
if (nextHops[nh]) {
|
||||
const unsigned int bfi = om->bloomFilterMultiplier * (unsigned int)nextHops[nh]->address().toInt();
|
||||
om->bloomFilter[(bfi >> 3) % sizeof(om->bloomFilter)] |= 1 << (bfi & 7);
|
||||
const unsigned int bfi = bloomMultiplier * (unsigned int)nextHops[nh]->address().toInt();
|
||||
((uint8_t *)bloomFilter)[(bfi >> 3) % sizeof(bloomFilter)] |= 1 << (bfi & 7);
|
||||
++sentCount;
|
||||
}
|
||||
}
|
||||
|
||||
for(unsigned int nh=0;nh<2;++nh) {
|
||||
if (nextHops[nh]) {
|
||||
// Send to legacy peers and flag these in bloom filter
|
||||
const unsigned int limit = config.multicastLimit + bridgeCount;
|
||||
for(std::vector< std::pair<int64_t,Address> >::const_iterator r(recipients.begin());(r!=recipients.end())&&(sentCount<limit);++r) {
|
||||
if (r->first >= 0) {
|
||||
const unsigned int bfi = bloomMultiplier * (unsigned int)r->second.toInt();
|
||||
((uint8_t *)bloomFilter)[(bfi >> 3) % sizeof(bloomFilter)] |= 1 << (bfi & 7);
|
||||
|
||||
Packet outp(r->second,RR->identity.address(),Packet::VERB_MULTICAST_FRAME);
|
||||
outp.append(network->id());
|
||||
outp.append((uint8_t)0x04);
|
||||
src.appendTo(outp);
|
||||
mg.mac().appendTo(outp);
|
||||
outp.append(mg.adi());
|
||||
outp.append((uint16_t)etherType);
|
||||
outp.append(data,len);
|
||||
outp.compress();
|
||||
RR->sw->send(tPtr,outp,true);
|
||||
|
||||
++sentCount;
|
||||
}
|
||||
}
|
||||
|
||||
// Send to next hops for P2P propagation
|
||||
for(unsigned int nh=0;nh<2;++nh) {
|
||||
if (nextHops[nh]) {
|
||||
Packet outp(nextHops[nh]->address(),RR->identity.address(),Packet::VERB_MULTICAST_FRAME);
|
||||
outp.append((uint8_t)(0x04 | 0x08));
|
||||
RR->identity.address().appendTo(outp);
|
||||
outp.append((uint16_t)bloomMultiplier);
|
||||
outp.append((uint16_t)sizeof(bloomFilter));
|
||||
outp.append(((uint8_t *)bloomFilter),sizeof(bloomFilter));
|
||||
src.appendTo(outp);
|
||||
mg.mac().appendTo(outp);
|
||||
outp.append(mg.adi());
|
||||
outp.append((uint16_t)etherType);
|
||||
outp.append(data,len);
|
||||
outp.compress();
|
||||
RR->sw->send(tPtr,outp,true);
|
||||
}
|
||||
}
|
||||
|
||||
return (unsigned int)recipients.size();
|
||||
}
|
||||
|
||||
void Multicaster::clean(int64_t now)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue