package dht

import (
	"bytes"
	"encoding/json"
	"errors"
	"math/rand"
	"sync"
	"time"

	proto "code.google.com/p/goprotobuf/proto"

	ma "github.com/jbenet/go-multiaddr"

	peer "github.com/jbenet/go-ipfs/peer"
	kb "github.com/jbenet/go-ipfs/routing/kbucket"
	swarm "github.com/jbenet/go-ipfs/swarm"
	u "github.com/jbenet/go-ipfs/util"
)

// PoolSize is the number of nodes used for group find/set RPC calls
var PoolSize = 6

// GenerateMessageID returns a random message ID, used to match requests
// with their responses.
// TODO: determine a way of creating and managing message IDs
func GenerateMessageID() uint64 {
	//return (uint64(rand.Uint32()) << 32) & uint64(rand.Uint32())
	return uint64(rand.Uint32())
}
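
// A message ID ties a request to its response stream. The pattern used by
// Ping and GetDiagnostic below is roughly:
//
//	pmes := DHTMessage{Id: GenerateMessageID(), Type: PBDHTMessage_PING}
//	respChan := dht.ListenFor(pmes.Id, 1, time.Minute)
//	dht.network.Send(swarm.NewMessage(p, pmes.ToProtobuf()))
//	// ...receive on respChan, or call dht.Unlisten(pmes.Id) on timeout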

// This file implements the Routing interface for the IpfsDHT struct.

// Basic Put/Get

// PutValue adds value corresponding to given Key.
// This is the top level "Store" operation of the DHT
func (s *IpfsDHT) PutValue(key u.Key, value []byte) {
	complete := make(chan struct{})
	for _, route := range s.routes {
		p := route.NearestPeer(kb.ConvertKey(key))
		if p == nil {
			s.network.Error(kb.ErrLookupFailure)
			go func() {
				complete <- struct{}{}
			}()
			continue
		}
		go func() {
			err := s.putValueToNetwork(p, string(key), value)
			if err != nil {
				s.network.Error(err)
			}
			complete <- struct{}{}
		}()
	}
	// Wait for one completion signal per routing table before returning.
	for range s.routes {
		<-complete
	}
}
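
// Note: the complete channel above is a hand-rolled fan-out/join. A
// sync.WaitGroup (the sync package is already imported for counter below)
// would express the same shape; a minimal sketch, not what this function
// currently does:
//
//	var wg sync.WaitGroup
//	for _, route := range s.routes {
//		route := route // shadow for the closure
//		wg.Add(1)
//		go func() {
//			defer wg.Done()
//			// ...resolve the nearest peer via route and put the value...
//		}()
//	}
//	wg.Wait()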

// counter is an int guarded by a read/write mutex. GetValue uses it to
// track how many peer queries are currently in flight.
type counter struct {
	n   int
	mut sync.RWMutex
}

func (c *counter) Increment() {
	c.mut.Lock()
	c.n++
	c.mut.Unlock()
}

func (c *counter) Decrement() {
	c.mut.Lock()
	c.n--
	c.mut.Unlock()
}

func (c *counter) Size() int {
	c.mut.RLock()
	defer c.mut.RUnlock()
	return c.n
}
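
// Note: counter amounts to a mutex-guarded int. The sync/atomic package
// could do the same bookkeeping without a lock; a sketch of the equivalent
// (would require importing "sync/atomic"):
//
//	var n int32
//	atomic.AddInt32(&n, 1)       // Increment
//	atomic.AddInt32(&n, -1)      // Decrement
//	size := atomic.LoadInt32(&n) // Size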

// GetValue searches for the value corresponding to given Key.
// On failure the error is kb.ErrLookupFailure (no peers to ask),
// u.ErrNotFound (the candidate peers were exhausted), or u.ErrTimeout.
func (s *IpfsDHT) GetValue(key u.Key, timeout time.Duration) ([]byte, error) {
	ll := startNewRpc("GET")
	defer func() {
		ll.EndLog()
		ll.Print()
	}()

	// If we have it locally, don't bother doing an RPC!
	// NOTE: this might not be what we want to do...
	val, err := s.GetLocal(key)
	if err == nil {
		ll.Success = true
		u.DOut("Found local, returning.")
		return val, nil
	}

	routeLevel := 0
	closest := s.routes[routeLevel].NearestPeers(kb.ConvertKey(key), PoolSize)
	if len(closest) == 0 {
		return nil, kb.ErrLookupFailure
	}

	// limit is referred to as k in the kademlia paper, and concurFactor
	// as alpha: at most limit peers are queried in total, and at most
	// concurFactor of them concurrently.
	limit := 20
	concurFactor := 3
	count := 0

	valChan := make(chan []byte, concurFactor)
	npeerChan := make(chan *peer.Peer, 30)
	procPeer := make(chan *peer.Peer, 30)
	errChan := make(chan error, 1)
	done := make(chan struct{})
	after := time.After(timeout)

	for _, p := range closest {
		npeerChan <- p
	}

	c := counter{}

	// Dispatcher: hand newly discovered peers to the workers until the
	// query limit is reached, and report failure once no peers are
	// queued and no queries are in flight.
	go func() {
		for {
			select {
			case <-done:
				return
			case p := <-npeerChan:
				count++
				if count >= limit {
					// Hit the query limit; stop dispatching.
					return
				}
				c.Increment()
				procPeer <- p
			default:
				if c.Size() == 0 {
					errChan <- u.ErrNotFound
					return
				}
				// Queries are still in flight; don't spin at
				// full speed while waiting on their results.
				time.Sleep(time.Millisecond)
			}
		}
	}()

	// Workers: query one peer at a time, feeding any closer peers they
	// learn about back to the dispatcher.
	process := func() {
		for {
			select {
			case <-done:
				return
			case p := <-procPeer:
				if p == nil {
					return
				}
				val, peers, err := s.getValueOrPeers(p, key, timeout/4, routeLevel)
				if err != nil {
					u.DErr(err.Error())
					c.Decrement()
					continue
				}
				if val != nil {
					// Deliberately leave the in-flight count
					// elevated: it keeps the dispatcher from
					// racing a spurious ErrNotFound against
					// the value we just found.
					valChan <- val
					return
				}
				for _, np := range peers {
					// TODO: filter out peers that arent closer
					select {
					case npeerChan <- np:
					case <-done:
						return
					}
				}
				c.Decrement()
			}
		}
	}
	for i := 0; i < concurFactor; i++ {
		go process()
	}

	select {
	case val := <-valChan:
		close(done)
		return val, nil
	case err := <-errChan:
		close(done)
		return nil, err
	case <-after:
		close(done)
		return nil, u.ErrTimeout
	}
}
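
// A usage sketch for the lookup above (the dht value and the key are
// assumed, not defined in this file):
//
//	val, err := dht.GetValue(u.Key("<some key>"), time.Second*10)
//	switch err {
//	case nil:
//		// use val
//	case u.ErrNotFound:
//		// candidate peers were exhausted without finding the value
//	case u.ErrTimeout:
//		// no answer within the deadline
//	}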

// Value provider layer of indirection.
// This is what DSHTs (Coral and MainlineDHT) do to store large values in a DHT.

// Provide announces that this node can provide the value for given key
func (s *IpfsDHT) Provide(key u.Key) error {
	peers := s.routes[0].NearestPeers(kb.ConvertKey(key), PoolSize)
	if len(peers) == 0 {
		return kb.ErrLookupFailure
	}

	pmes := DHTMessage{
		Type: PBDHTMessage_ADD_PROVIDER,
		Key:  string(key),
	}
	pbmes := pmes.ToProtobuf()

	for _, p := range peers {
		mes := swarm.NewMessage(p, pbmes)
		s.network.Send(mes)
	}
	return nil
}
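
// Note that Provide is fire-and-forget: no message ID is registered with
// ListenFor, so no acknowledgement from the receiving peers is awaited.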

// FindProviders searches for peers who can provide the value for given key.
func (s *IpfsDHT) FindProviders(key u.Key, timeout time.Duration) ([]*peer.Peer, error) {
	ll := startNewRpc("FindProviders")
	defer func() {
		ll.EndLog()
		ll.Print()
	}()
	u.DOut("Find providers for: '%s'", key)

	p := s.routes[0].NearestPeer(kb.ConvertKey(key))
	if p == nil {
		return nil, kb.ErrLookupFailure
	}

	for level := 0; level < len(s.routes); {
		pmes, err := s.findProvidersSingle(p, key, level, timeout)
		if err != nil {
			return nil, err
		}

		if pmes.GetSuccess() {
			provs := s.addPeerList(key, pmes.GetPeers())
			ll.Success = true
			return provs, nil
		}

		// No provider records yet; follow the closer peer we were
		// given, or move up a routing level if we got none back.
		closer := pmes.GetPeers()
		if len(closer) == 0 {
			level++
			continue
		}
		if peer.ID(closer[0].GetId()).Equal(s.self.ID) {
			u.DOut("Got myself back as a closer peer.")
			return nil, u.ErrNotFound
		}

		maddr, err := ma.NewMultiaddr(closer[0].GetAddr())
		if err != nil {
			// ??? Move up route level???
			panic("not yet implemented")
		}

		np, err := s.network.GetConnection(peer.ID(closer[0].GetId()), maddr)
		if err != nil {
			u.PErr("[%s] Failed to connect to: %s", s.self.ID.Pretty(), closer[0].GetAddr())
			level++
			continue
		}
		p = np
	}
	return nil, u.ErrNotFound
}

// Find specific Peer

// FindPeer searches for a peer with given ID.
func (s *IpfsDHT) FindPeer(id peer.ID, timeout time.Duration) (*peer.Peer, error) {
	// Check if we're already connected to them
	p, _ := s.Find(id)
	if p != nil {
		return p, nil
	}

	routeLevel := 0
	p = s.routes[routeLevel].NearestPeer(kb.ConvertPeerID(id))
	if p == nil {
		return nil, kb.ErrLookupFailure
	}
	if p.ID.Equal(id) {
		return p, nil
	}

	for routeLevel < len(s.routes) {
		pmes, err := s.findPeerSingle(p, id, timeout, routeLevel)
		if err != nil {
			return nil, u.WrapError(err, "FindPeer query failed")
		}

		plist := pmes.GetPeers()
		if len(plist) == 0 {
			// No closer peers at this level; try the next routing table.
			routeLevel++
			continue
		}
		found := plist[0]

		addr, err := ma.NewMultiaddr(found.GetAddr())
		if err != nil {
			return nil, u.WrapError(err, "FindPeer received bad info")
		}

		nxtPeer, err := s.network.GetConnection(peer.ID(found.GetId()), addr)
		if err != nil {
			return nil, u.WrapError(err, "FindPeer failed to connect to new peer.")
		}

		if pmes.GetSuccess() {
			if !id.Equal(nxtPeer.ID) {
				return nil, errors.New("got back invalid peer from 'successful' response")
			}
			return nxtPeer, nil
		}
		p = nxtPeer
	}
	return nil, u.ErrNotFound
}
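
// FindProviders and FindPeer walk the same escalation pattern: query the
// nearest known peer, follow the closer peers it returns, and move to the
// next routing table in s.routes once a level stops yielding progress.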

// Ping a peer, log the time it took
func (dht *IpfsDHT) Ping(p *peer.Peer, timeout time.Duration) error {
	// Thoughts: maybe this should accept an ID and do a peer lookup?
	u.DOut("Enter Ping.")

	pmes := DHTMessage{Id: GenerateMessageID(), Type: PBDHTMessage_PING}
	mes := swarm.NewMessage(p, pmes.ToProtobuf())

	before := time.Now()
	responseChan := dht.ListenFor(pmes.Id, 1, time.Minute)
	dht.network.Send(mes)

	tout := time.After(timeout)
	select {
	case <-responseChan:
		roundtrip := time.Since(before)
		p.SetLatency(roundtrip)
		u.DOut("Ping took %s.", roundtrip.String())
		return nil
	case <-tout:
		// Timed out, think about removing peer from network
		u.DOut("Ping peer timed out.")
		dht.Unlisten(pmes.Id)
		return u.ErrTimeout
	}
}
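
// Usage sketch (p is an already-known *peer.Peer; the setup is assumed):
//
//	if err := dht.Ping(p, time.Second*5); err == u.ErrTimeout {
//		// peer is unresponsive; a caller might drop it from its
//		// routing table, as the timeout comment above suggests
//	}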

// GetDiagnostic sends a diagnostic request to the closest peers and
// collects their replies until all have answered or the timeout expires.
func (dht *IpfsDHT) GetDiagnostic(timeout time.Duration) ([]*diagInfo, error) {
	u.DOut("Begin Diagnostic")
	// Send to N closest peers
	targets := dht.routes[0].NearestPeers(kb.ConvertPeerID(dht.self.ID), 10)

	// TODO: Add timeout to this struct so nodes know when to return
	pmes := DHTMessage{
		Type: PBDHTMessage_DIAGNOSTIC,
		Id:   GenerateMessageID(),
	}

	listenChan := dht.ListenFor(pmes.Id, len(targets), time.Minute*2)
	pbmes := pmes.ToProtobuf()
	for _, p := range targets {
		mes := swarm.NewMessage(p, pbmes)
		dht.network.Send(mes)
	}

	var out []*diagInfo
	after := time.After(timeout)
	for count := len(targets); count > 0; {
		select {
		case <-after:
			u.DOut("Diagnostic request timed out.")
			return out, u.ErrTimeout
		case resp := <-listenChan:
			pmesOut := new(PBDHTMessage)
			err := proto.Unmarshal(resp.Data, pmesOut)
			if err != nil {
				// NOTE: here and elsewhere, need to audit error handling,
				// some errors should be continued on from
				return out, err
			}

			// Each response carries zero or more JSON-encoded diagInfo
			// records back to back; decode until the buffer runs out.
			dec := json.NewDecoder(bytes.NewBuffer(pmesOut.GetValue()))
			for {
				di := new(diagInfo)
				err := dec.Decode(di)
				if err != nil {
					break
				}
				out = append(out, di)
			}
			count--
		}
	}
	return out, nil
}
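
// Note: json.Decoder consumes a stream of concatenated JSON values, which
// is why the loop above can pull several diagInfo records out of a single
// response without any extra framing; io.EOF (or any decode error) ends it.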