package yggdrasil
// This part constructs a spanning tree of the network
// It routes packets based on distance on the spanning tree
// In general, this is *not* equivalent to routing on the tree
// It falls back to the tree in the worst case, but it can take shortcuts too
// This is the part that makes routing reasonably efficient on scale-free graphs
// TODO document/comment everything in a lot more detail
// TODO? use a pre-computed lookup table (python version had this)
// A little annoying to do with constant changes from bandwidth estimates
import "time"
2018-05-27 21:37:35 +03:00
import "sort"
2017-12-29 07:16:20 +03:00
import "sync"
import "sync/atomic"
//import "fmt"
const switch_timeout = time . Minute
2018-02-18 08:57:24 +03:00
const switch_updateInterval = switch_timeout / 2
const switch_throttle = switch_updateInterval / 2
2017-12-29 07:16:20 +03:00

// You should be able to provide crypto signatures for this
// 1 signature per coord, from the *sender* to that coord
// E.g. A->B->C has sigA(A->B) and sigB(A->B->C)
type switchLocator struct {
	root   sigPubKey
	tstamp int64
	coords []switchPort
}
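
// firstIsBetter compares two keys as candidates for tree root. A higher
// TreeID (derived from the key via getTreeID) wins, giving a consistent,
// essentially arbitrary total order over distinct keys.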
func firstIsBetter(first, second *sigPubKey) bool {
	// Higher TreeID is better
	ftid := getTreeID(first)
	stid := getTreeID(second)
	for idx := 0; idx < len(ftid); idx++ {
		if ftid[idx] == stid[idx] {
			continue
		}
		return ftid[idx] > stid[idx]
	}
	// Edge case, when comparing identical IDs
	return false
}

func (l *switchLocator) clone() switchLocator {
	// Used to create a deep copy for use in messages
	// Copy required because we need to mutate coords before sending
	// (By appending the port from us to the destination)
	loc := *l
	loc.coords = make([]switchPort, len(l.coords), len(l.coords)+1)
	copy(loc.coords, l.coords)
	return loc
}
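
// dist returns the tree distance between this locator and the wire-encoded
// coords in dest: the hops from us up to the closest common ancestor, plus
// the hops from there down to the destination. For example, from coords
// [1,2,3] to a dest decoding to [1,2,4,5], the shared prefix is [1,2], so the
// distance is 1 (up past 3) + 2 (down through 4 and 5) = 3.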
func (l *switchLocator) dist(dest []byte) int {
	// Returns distance (on the tree) from these coords
	offset := 0
	fdc := 0
	for {
		if fdc >= len(l.coords) {
			break
		}
		coord, length := wire_decode_uint64(dest[offset:])
		if length == 0 {
			break
		}
		if l.coords[fdc] != switchPort(coord) {
			break
		}
		fdc++
		offset += length
	}
	dist := len(l.coords[fdc:])
	for {
		_, length := wire_decode_uint64(dest[offset:])
		if length == 0 {
			break
		}
		dist++
		offset += length
	}
	return dist
}
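
// getCoords serializes the locator's coords into the variable-length wire
// format used by dist above, one encoded uint64 per port on the path.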
func (l *switchLocator) getCoords() []byte {
	bs := make([]byte, 0, len(l.coords))
	for _, coord := range l.coords {
		c := wire_encode_uint64(uint64(coord))
		bs = append(bs, c...)
	}
	return bs
}
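
// isAncestorOf returns true if x is an ancestor of (or equal to) y in the
// tree: both share a root and x's coords are a prefix of y's.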
func (x *switchLocator) isAncestorOf(y *switchLocator) bool {
	if x.root != y.root {
		return false
	}
	if len(x.coords) > len(y.coords) {
		return false
	}
	for idx := range x.coords {
		if x.coords[idx] != y.coords[idx] {
			return false
		}
	}
	return true
}

type peerInfo struct {
	key       sigPubKey     // ID of this peer
	locator   switchLocator // Should be able to respond with signatures upon request
	degree    uint64        // Self-reported degree
	coords    []switchPort  // Coords of this peer (taken from coords of the sent locator)
	time      time.Time     // Time this node was last seen
	firstSeen time.Time
	port      switchPort // Interface number of this peer
	seq       uint64     // Seq number we last saw this peer advertise
}

type switchMessage struct {
	from    sigPubKey     // key of the sender
	locator switchLocator // Locator advertised for the receiver, not the sender's loc!
	seq     uint64
}

type switchPort uint64

type tableElem struct {
	port    switchPort
	locator switchLocator
}

type lookupTable struct {
	self  switchLocator
	elems []tableElem
}

type switchData struct {
	// All data that's mutable and used by exported Table methods
	// To be read/written with atomic.Value Store/Load calls
	locator switchLocator
	seq     uint64 // Sequence number, reported to peers, so they know about changes
	peers   map[switchPort]peerInfo
	sigs    []sigInfo
}

type switchTable struct {
	core    *Core
	key     sigPubKey           // Our own key
	time    time.Time           // Time when locator.tstamp was last updated
	parent  switchPort          // Port of whatever peer is our parent, or self if we're root
	drop    map[sigPubKey]int64 // Tstamp associated with a dropped root
	mutex   sync.RWMutex        // Lock for reads/writes of switchData
	data    switchData
	updater atomic.Value // *sync.Once
	table   atomic.Value // lookupTable
}

func (t *switchTable) init(core *Core, key sigPubKey) {
	now := time.Now()
	t.core = core
	t.key = key
	locator := switchLocator{root: key, tstamp: now.Unix()}
	peers := make(map[switchPort]peerInfo)
	t.data = switchData{locator: locator, peers: peers}
	t.updater.Store(&sync.Once{})
	t.table.Store(lookupTable{})
	t.drop = make(map[sigPubKey]int64)
}

func (t *switchTable) getLocator() switchLocator {
	t.mutex.RLock()
	defer t.mutex.RUnlock()
	return t.data.locator.clone()
}

func (t *switchTable) doMaintenance() {
	// Periodic maintenance work to keep things internally consistent
	t.mutex.Lock()         // Write lock
	defer t.mutex.Unlock() // Release lock when we're done
	t.cleanRoot()
	t.cleanDropped()
}
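
// cleanRoot drops the current root if it looks timed out, roots us instead if
// our own key beats the current root, and refreshes our timestamp while we
// are the root, notifying peers whenever anything changes.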
func (t *switchTable) cleanRoot() {
	// TODO rethink how this is done?...
	// Get rid of the root if it looks like it's timed out
	now := time.Now()
	doUpdate := false
	//fmt.Println("DEBUG clean root:", now.Sub(t.time))
	if now.Sub(t.time) > switch_timeout {
		//fmt.Println("root timed out", t.data.locator)
		dropped := t.data.peers[t.parent]
		dropped.time = t.time
		t.drop[t.data.locator.root] = t.data.locator.tstamp
		doUpdate = true
		//t.core.log.Println("DEBUG: switch root timeout", len(t.drop))
	}
	// Or, if we're better than our root, root ourself
	if firstIsBetter(&t.key, &t.data.locator.root) {
		//fmt.Println("root is worse than us", t.data.locator.Root)
		doUpdate = true
		//t.core.log.Println("DEBUG: switch root replace with self", t.data.locator.Root)
	}
	// Or, if we are the root, possibly update our timestamp
	if t.data.locator.root == t.key &&
		now.Sub(t.time) > switch_updateInterval {
		//fmt.Println("root is self and old, updating", t.data.locator.Root)
		doUpdate = true
	}
	if doUpdate {
		t.parent = switchPort(0)
		t.time = now
		if t.data.locator.root != t.key {
			t.data.seq++
			t.updater.Store(&sync.Once{})
			select {
			case t.core.router.reset <- struct{}{}:
			default:
			}
		}
		t.data.locator = switchLocator{root: t.key, tstamp: now.Unix()}
		t.data.sigs = nil
		t.core.peers.sendSwitchMsgs()
	}
}
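
// removePeer forgets the peer on the given port and invalidates the cached
// lookup table. It mutates t.data without taking the lock, so it presumably
// expects the caller to already hold the write lock.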
func (t *switchTable) removePeer(port switchPort) {
	delete(t.data.peers, port)
	t.updater.Store(&sync.Once{})
	// TODO if parent, find a new peer to use as parent instead
}

func (t *switchTable) cleanDropped() {
	// TODO? only call this after root changes, not periodically
	for root := range t.drop {
		if !firstIsBetter(&root, &t.data.locator.root) {
			delete(t.drop, root)
		}
	}
}
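
// createMessage builds the switch message advertised to the peer on the given
// port: a copy of our locator with that port appended to the coords, along
// with the signatures we have stored for the path.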
func (t *switchTable) createMessage(port switchPort) (*switchMessage, []sigInfo) {
	t.mutex.RLock()
	defer t.mutex.RUnlock()
	msg := switchMessage{from: t.key, locator: t.data.locator.clone()}
	msg.locator.coords = append(msg.locator.coords, port)
	msg.seq = t.data.seq
	return &msg, t.data.sigs
}
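
// handleMessage processes a switch message received from the peer on
// fromPort, refreshing our stored info about that peer and deciding, via the
// switch statement below, whether to adopt the sender as our parent.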
func (t *switchTable) handleMessage(msg *switchMessage, fromPort switchPort, sigs []sigInfo) {
	// TODO directly use a switchMsg instead of switchMessage + sigs
	t.mutex.Lock()
	defer t.mutex.Unlock()
	now := time.Now()
	if len(msg.locator.coords) == 0 {
		return
	} // Should always have >=1 links
	oldSender, isIn := t.data.peers[fromPort]
	if !isIn {
		oldSender.firstSeen = now
	}
	sender := peerInfo{
		key:       msg.from,
		locator:   msg.locator,
		coords:    msg.locator.coords[:len(msg.locator.coords)-1],
		time:      now,
		firstSeen: oldSender.firstSeen,
		port:      fromPort,
		seq:       msg.seq,
	}
	equiv := func(x *switchLocator, y *switchLocator) bool {
		if x.root != y.root {
			return false
		}
		if len(x.coords) != len(y.coords) {
			return false
		}
		for idx := range x.coords {
			if x.coords[idx] != y.coords[idx] {
				return false
			}
		}
		return true
	}
	doUpdate := false
	if !equiv(&msg.locator, &oldSender.locator) {
		doUpdate = true
		//sender.firstSeen = now // TODO? uncomment to prevent flapping?
	}
	t.data.peers[fromPort] = sender
	updateRoot := false
	oldParent, isIn := t.data.peers[t.parent]
	noParent := !isIn
	noLoop := func() bool {
		for idx := 0; idx < len(sigs)-1; idx++ {
			if sigs[idx].next == t.core.sigPub {
				return false
			}
		}
		if msg.locator.root == t.core.sigPub {
			return false
		}
		return true
	}()
	sTime := now.Sub(sender.firstSeen)
	pTime := oldParent.time.Sub(oldParent.firstSeen) + switch_timeout
	// Really want to compare the ratios sLen/sTime and pLen/pTime (path
	// length per unit of peer uptime), preferring the lower ratio.
	// Cross-multiplied to avoid a divide-by-zero when a peer is brand new.
	cost := len(msg.locator.coords) * int(pTime.Seconds())
	pCost := len(t.data.locator.coords) * int(sTime.Seconds())
	dropTstamp, isIn := t.drop[msg.locator.root]
	// Here be dragons
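	// A rough summary of the cases below, in order (hedged, since the original
	// leaves them undocumented): never use a path that loops through us;
	// ignore dropped roots unless they advertise a newer timestamp; always
	// take a strictly better root; skip worse roots and stale timestamps; take
	// anything if we have no parent; switch parents when the cost ratio favors
	// the sender; otherwise only accept updates from the current parent,
	// throttled, to pick up new coords or a fresher root timestamp.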
	switch {
	case !noLoop: // do nothing
	case isIn && dropTstamp >= msg.locator.tstamp: // do nothing
	case firstIsBetter(&msg.locator.root, &t.data.locator.root):
		updateRoot = true
	case t.data.locator.root != msg.locator.root: // do nothing
	case t.data.locator.tstamp > msg.locator.tstamp: // do nothing
	case noParent:
		updateRoot = true
	case cost < pCost:
		updateRoot = true
	case sender.port != t.parent: // do nothing
	case !equiv(&msg.locator, &t.data.locator):
		updateRoot = true
	case now.Sub(t.time) < switch_throttle: // do nothing
	case msg.locator.tstamp > t.data.locator.tstamp:
		updateRoot = true
	}
	if updateRoot {
		if !equiv(&msg.locator, &t.data.locator) {
			doUpdate = true
			t.data.seq++
			select {
			case t.core.router.reset <- struct{}{}:
			default:
			}
			//t.core.log.Println("Switch update:", msg.locator.root, msg.locator.tstamp, msg.locator.coords)
			//fmt.Println("Switch update:", msg.Locator.Root, msg.Locator.Tstamp, msg.Locator.Coords)
		}
		if t.data.locator.tstamp != msg.locator.tstamp {
			t.time = now
		}
		t.data.locator = msg.locator
		t.parent = sender.port
		t.data.sigs = sigs
		//t.core.log.Println("Switch update:", msg.Locator.Root, msg.Locator.Tstamp, msg.Locator.Coords)
		t.core.peers.sendSwitchMsgs()
	}
	if doUpdate {
		t.updater.Store(&sync.Once{})
	}
	return
}
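
// updateTable rebuilds the cached lookup table from the current peer set,
// keeping only peers that agree with us about who the root is.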
func (t *switchTable) updateTable() {
	// WARNING this should only be called from within t.data.updater.Do()
	// It relies on the sync.Once for synchronization with messages and lookups
	// TODO use a pre-computed faster lookup table
	// Instead of checking distance for every destination every time
	// Array of structs, indexed by first coord that differs from self
	// Each struct stores the best port to forward to, and a next coord map
	// Move to struct, then iterate over coord maps until you dead end
	// The last port before the dead end should be the closest
	t.mutex.RLock()
	defer t.mutex.RUnlock()
	newTable := lookupTable{
		self:  t.data.locator.clone(),
		elems: make([]tableElem, 0, len(t.data.peers)),
	}
	for _, pinfo := range t.data.peers {
		//if !pinfo.forward { continue }
		if pinfo.locator.root != newTable.self.root {
			continue
		}
		loc := pinfo.locator.clone()
		loc.coords = loc.coords[:len(loc.coords)-1] // Remove the them->self link
		newTable.elems = append(newTable.elems, tableElem{
			locator: loc,
			port:    pinfo.port,
		})
	}
	sort.SliceStable(newTable.elems, func(i, j int) bool {
		return t.data.peers[newTable.elems[i].port].firstSeen.Before(t.data.peers[newTable.elems[j].port].firstSeen)
	})
	t.table.Store(newTable)
}
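
// lookup returns the best next-hop port for a packet with the given
// wire-encoded destination coords, along with our own tree distance to that
// destination. It returns 0, 0 when our distance doesn't fit under ttl.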
func (t *switchTable) lookup(dest []byte, ttl uint64) (switchPort, uint64) {
	t.updater.Load().(*sync.Once).Do(t.updateTable)
	table := t.table.Load().(lookupTable)
	myDist := table.self.dist(dest) //getDist(table.self.coords)
	if !(uint64(myDist) < ttl) {
		return 0, 0
	}
	// Cost is in units of (expected distance) + (expected queue size), where
	// the expected distance approximates the minimum backpressure gradient
	// needed for packets to flow
	ports := t.core.peers.getPorts()
	var best switchPort
	bestCost := int64(^uint64(0) >> 1)
	for _, info := range table.elems {
		dist := info.locator.dist(dest) //getDist(info.locator.coords)
		if !(dist < myDist) {
			continue
		}
		p, isIn := ports[info.port]
		if !isIn {
			continue
		}
		cost := int64(dist) + p.getQueueSize()
		if cost < bestCost {
			best = info.port
			bestCost = cost
		}
	}
	//t.core.log.Println("DEBUG: sending to", best, "bandwidth", getBandwidth(best))
	return best, uint64(myDist)
}

////////////////////////////////////////////////////////////////////////////////
// Signature stuff

type sigInfo struct {
	next sigPubKey
	sig  sigBytes
}

////////////////////////////////////////////////////////////////////////////////