rust-libp2p/protocols/kad/src/behaviour.rs

// Copyright 2018 Parity Technologies (UK) Ltd.
//
// Permission is hereby granted, free of charge, to any person obtaining a
// copy of this software and associated documentation files (the "Software"),
// to deal in the Software without restriction, including without limitation
// the rights to use, copy, modify, merge, publish, distribute, sublicense,
// and/or sell copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
// OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
// DEALINGS IN THE SOFTWARE.

use crate::addresses::Addresses;
use crate::handler::{KademliaHandler, KademliaHandlerEvent, KademliaHandlerIn};
use crate::kbucket::{self, KBucketsTable};
use crate::protocol::{KadConnectionType, KadPeer};
use crate::query::{QueryConfig, QueryState, QueryStatePollOut};
use fnv::{FnvHashMap, FnvHashSet};
use futures::{prelude::*, stream};
use libp2p_core::swarm::{ConnectedPoint, NetworkBehaviour, NetworkBehaviourAction, PollParameters};
use libp2p_core::{protocols_handler::ProtocolsHandler, Multiaddr, PeerId};
use multihash::Multihash;
use smallvec::SmallVec;
use std::{borrow::Cow, error, marker::PhantomData, time::Duration};
use tokio_io::{AsyncRead, AsyncWrite};
use wasm_timer::{Instant, Interval};

mod test;

/// Network behaviour that handles Kademlia.
///
/// Holds the routing table (k-buckets), the iterative queries in progress, the provider
/// records known locally, and the queue of actions handed back to the swarm from `poll()`.
pub struct Kademlia<TSubstream> {
    /// Routing table. Maps each known peer to the multiaddresses we know for it.
    kbuckets: KBucketsTable<PeerId, Addresses>,

    /// If `Some`, we overwrite the Kademlia protocol name with this one.
    protocol_name_override: Option<Cow<'static, [u8]>>,

    /// All the iterative queries we are currently performing, indexed by their ID.
    ///
    /// For `GET_PROVIDERS` queries, the providers accumulated so far are stored in the
    /// `pending_results` field of `QueryInfoInner::GetProviders`.
    active_queries: FnvHashMap<QueryId, QueryState<QueryInfo, PeerId>>,

    /// List of peers the swarm is connected to. Updated in `inject_connected` and
    /// `inject_disconnected`.
    connected_peers: FnvHashSet<PeerId>,

    /// Contains a list of peer IDs which we are not connected to, and an RPC query to send to them
    /// once they connect. Filled by `poll()` and flushed by `inject_connected`.
    pending_rpcs: SmallVec<[(PeerId, KademliaHandlerIn<QueryId>); 8]>,

    /// Identifier for the next query that we start.
    next_query_id: QueryId,

    /// List of values and peers that are providing them.
    ///
    /// Our local peer ID can be in this container.
    // TODO: Note that in reality the value is a SHA-256 of the actual value (https://github.com/libp2p/rust-libp2p/issues/694)
    values_providers: FnvHashMap<Multihash, SmallVec<[PeerId; 20]>>,

    /// List of values that we are providing ourselves. Must be kept in sync with
    /// `values_providers`.
    providing_keys: FnvHashSet<Multihash>,

    /// Interval at which an `AddProvider` query is started for every key in `providing_keys`.
    refresh_add_providers: stream::Fuse<Interval>,

    /// `α` in the Kademlia reference papers. Designates the maximum number of queries that we
    /// perform in parallel. Passed to every query through its `QueryConfig`.
    parallelism: usize,

    /// `k` in the Kademlia reference papers. Number of results in a find node query. Also used to
    /// cap the number of closer peers we return when answering remote requests.
    num_results: usize,

    /// Timeout for each individual RPC query.
    rpc_timeout: Duration,

    /// Events to return when polling.
    queued_events: SmallVec<[NetworkBehaviourAction<KademliaHandlerIn<QueryId>, KademliaOut>; 32]>,

    /// `(key, provider)` pairs received through `AddProvider` messages. They are merged into
    /// `values_providers` at the beginning of the next `poll()`.
    add_provider: SmallVec<[(Multihash, PeerId); 32]>,

    /// Marker to pin the generics.
    marker: PhantomData<TSubstream>,
}

/// Opaque type. Each query that we start gets a unique number.
///
/// Identifiers are allocated sequentially by `Kademlia::start_query` and are also used as the
/// user data attached to outgoing RPC requests, so that responses can be matched to their query.
#[derive(Debug, Copy, Clone, Hash, PartialEq, Eq)]
pub struct QueryId(usize);

/// Information about a query.
///
/// This is the "target" type of the query state machine: its bytes (see the `AsRef<[u8]>`
/// implementation) are those of the peer ID or hash being searched for.
#[derive(Debug, Clone, PartialEq, Eq)]
struct QueryInfo {
    /// What we are querying and why.
    inner: QueryInfoInner,
    /// Temporary addresses used when trying to reach nodes.
    ///
    /// Filled with the addresses reported by remotes in query responses, and returned (after
    /// the k-bucket addresses) by `addresses_of_peer`.
    untrusted_addresses: FnvHashMap<PeerId, SmallVec<[Multiaddr; 8]>>,
}

/// Additional information about the query: its purpose and its target.
#[derive(Debug, Clone, PartialEq, Eq)]
enum QueryInfoInner {
    /// The query was created for the Kademlia initialization process.
    Initialization {
        /// Hash we're targeting to insert ourselves in the k-buckets.
        target: PeerId,
    },

    /// The user requested a `FIND_PEER` query to be performed. It should be reported when finished.
    FindPeer(PeerId),

    /// The user requested a `GET_PROVIDERS` query to be performed. It should be reported when
    /// finished.
    GetProviders {
        /// Target we are searching the providers of.
        target: Multihash,
        /// Results to return. Filled over time, as `GetProvidersRes` responses arrive.
        pending_results: Vec<PeerId>,
    },

    /// We are traversing towards `target` and should add an `ADD_PROVIDER` message to the peers
    /// of the outcome with our own identity.
    AddProvider {
        /// Which hash we're targeting.
        target: Multihash,
    },
}

/// Lets a `QueryInfo` be turned into a k-bucket key, so that it can serve as the target of a
/// closest-peers lookup.
impl Into<kbucket::Key<QueryInfo>> for QueryInfo {
    fn into(self) -> kbucket::Key<QueryInfo> {
        let info = self;
        kbucket::Key::new(info)
    }
}

/// Exposes the raw bytes of the query target: the bytes of the peer ID for peer-oriented
/// queries, the bytes of the multihash for provider-oriented queries.
impl AsRef<[u8]> for QueryInfo {
    fn as_ref(&self) -> &[u8] {
        match &self.inner {
            // Targets that are peer IDs.
            QueryInfoInner::Initialization { target }
            | QueryInfoInner::FindPeer(target) => target.as_ref(),
            // Targets that are multihashes.
            QueryInfoInner::GetProviders { target, .. }
            | QueryInfoInner::AddProvider { target } => target.as_bytes(),
        }
    }
}

impl QueryInfo {
    /// Creates the corresponding RPC request to send to remote.
    ///
    /// `user_data` is stored in the request as-is; callers in this file pass the `QueryId` of
    /// the query so that the response can be routed back to it.
    ///
    /// `Initialization`, `FindPeer` and `AddProvider` queries map to a `FindNodeReq`, while
    /// `GetProviders` queries map to a `GetProvidersReq`.
    ///
    /// # Panics
    ///
    /// Panics if `self.inner` is `QueryInfoInner::AddProvider`: the request key for that variant
    /// is still `unimplemented!()`.
    // NOTE(review): `poll()` calls this method for every `SendRpc` produced by a query, and
    // `poll()` itself starts `AddProvider` queries when `refresh_add_providers` fires, so this
    // panic looks reachable as soon as a key is being provided — confirm and fix.
    fn to_rpc_request<TUserData>(&self, user_data: TUserData) -> KademliaHandlerIn<TUserData> {
        match &self.inner {
            QueryInfoInner::Initialization { target } => KademliaHandlerIn::FindNodeReq {
                key: target.clone(),
                user_data,
            },
            QueryInfoInner::FindPeer(key) => KademliaHandlerIn::FindNodeReq {
                key: key.clone(),
                user_data,
            },
            QueryInfoInner::GetProviders { target, .. } => KademliaHandlerIn::GetProvidersReq {
                key: target.clone(),
                user_data,
            },
            // The target here is a `Multihash` whereas the other `FindNodeReq` arms use a
            // `PeerId` as key, hence the placeholder.
            QueryInfoInner::AddProvider { .. } => KademliaHandlerIn::FindNodeReq {
                key: unimplemented!(), // TODO: target.clone(),
                user_data,
            },
        }
    }
}

impl<TSubstream> Kademlia<TSubstream> {
    /// Creates a `Kademlia`.
    #[inline]
    pub fn new(local_peer_id: PeerId) -> Self {
        Self::new_inner(local_peer_id)
    }

    /// The same as `new`, but using a custom protocol name.
    ///
    /// Kademlia nodes only communicate with other nodes using the same protocol name. Using a
    /// custom name therefore allows to segregate the DHT from others, if that is desired.
    pub fn with_protocol_name(local_peer_id: PeerId, name: impl Into<Cow<'static, [u8]>>) -> Self {
        let mut me = Kademlia::new_inner(local_peer_id);
        me.protocol_name_override = Some(name.into());
        me
    }

    /// Creates a `Kademlia`.
    ///
    /// Contrary to `new`, doesn't perform the initialization queries that store our local ID into
    /// the DHT and fill our buckets.
    #[inline]
    #[deprecated(note="this function is now equivalent to new() and will be removed in the future")]
    pub fn without_init(local_peer_id: PeerId) -> Self {
        Self::new_inner(local_peer_id)
    }

    /// Registers `address` as a known address of `peer_id`, for an address we are connected to.
    // TODO: report if the address was inserted? also, semantics unclear
    pub fn add_connected_address(&mut self, peer_id: &PeerId, address: Multiaddr) {
        let connected = true;
        self.add_address(peer_id, address, connected)
    }

    /// Registers `address` as a known address of `peer_id`, for an address we are not connected
    /// to, or for which we don't know whether we are connected.
    // TODO: report if the address was inserted? also, semantics unclear
    pub fn add_not_connected_address(&mut self, peer_id: &PeerId, address: Multiaddr) {
        let connected = false;
        self.add_address(peer_id, address, connected)
    }

    /// Underlying implementation for `add_connected_address` and `add_not_connected_address`.
    fn add_address(&mut self, peer_id: &PeerId, address: Multiaddr, _connected: bool) {
        let key = kbucket::Key::new(peer_id.clone());
        match self.kbuckets.entry(&key) {
            kbucket::Entry::InKbucketConnected(mut entry) => entry.value().insert(address),
            kbucket::Entry::InKbucketConnectedPending(mut entry) => entry.value().insert(address),
            kbucket::Entry::InKbucketDisconnected(mut entry) => entry.value().insert(address),
            kbucket::Entry::InKbucketDisconnectedPending(mut entry) => entry.value().insert(address),
            kbucket::Entry::NotInKbucket(entry) => {
                let mut addresses = Addresses::new();
                addresses.insert(address);
                match entry.insert_disconnected(addresses) {
                    kbucket::InsertOutcome::Inserted => {
                        let event = KademliaOut::KBucketAdded {
                            peer_id: peer_id.clone(),
                            replaced: None,
                        };
                        self.queued_events.push(NetworkBehaviourAction::GenerateEvent(event));
                    },
                    kbucket::InsertOutcome::Full => (),
                    kbucket::InsertOutcome::Pending { to_ping } => {
                        self.queued_events.push(NetworkBehaviourAction::DialPeer {
                            peer_id: to_ping.into_preimage(),
                        })
                    },
                }
                return;
            },
            kbucket::Entry::SelfEntry => return,
        };
    }

    /// Common code of all the constructors: builds a behaviour with the default settings.
    fn new_inner(local_peer_id: PeerId) -> Self {
        let parallelism = 3;

        // TODO: constant
        let kbuckets_duration = Duration::from_secs(60);
        let local_key = kbucket::Key::new(local_peer_id);
        let kbuckets = KBucketsTable::new(local_key, kbuckets_duration);

        // TODO: constant
        let refresh_period = Duration::from_secs(60);
        let refresh_add_providers = Interval::new_interval(refresh_period).fuse();

        Kademlia {
            kbuckets,
            protocol_name_override: None,
            active_queries: Default::default(),
            connected_peers: Default::default(),
            pending_rpcs: SmallVec::with_capacity(parallelism),
            next_query_id: QueryId(0),
            values_providers: FnvHashMap::default(),
            providing_keys: FnvHashSet::default(),
            refresh_add_providers,
            parallelism,
            num_results: 20,
            rpc_timeout: Duration::from_secs(8),
            queued_events: SmallVec::new(),
            add_provider: SmallVec::new(),
            marker: PhantomData,
        }
    }

    /// Iterates over the peer IDs stored in the k-buckets, pending nodes excluded.
    pub fn kbuckets_entries(&self) -> impl Iterator<Item = &PeerId> {
        let entries = self.kbuckets.entries_not_pending();
        entries.map(|(key, _)| key.preimage())
    }

    /// Launches an iterative `FIND_NODE` query towards `peer_id`.
    ///
    /// Once the query is over, an event listing the DHT nodes closest to `peer_id` is produced.
    pub fn find_node(&mut self, peer_id: PeerId) {
        let query = QueryInfoInner::FindPeer(peer_id);
        self.start_query(query);
    }

    /// Launches an iterative `GET_PROVIDERS` query for `target`. The list of providers found
    /// starts empty and grows as responses come in.
    pub fn get_providers(&mut self, target: Multihash) {
        let pending_results = Vec::new();
        let query = QueryInfoInner::GetProviders { target, pending_results };
        self.start_query(query);
    }

    /// Declares the local node as a provider of `key`.
    ///
    /// `ADD_PROVIDER` messages are then periodically sent to the nodes closest to the key, so
    /// that anyone running an iterative `GET_PROVIDERS` request on the DHT gets our local node
    /// among the results.
    ///
    /// What *providing* a key actually means is left undefined here: it depends on the value
    /// that the key is the hash of.
    pub fn add_providing(&mut self, key: Multihash) {
        self.providing_keys.insert(key.clone());

        // Record ourselves among the providers of the key, at most once.
        let local_id = self.kbuckets.local_key().preimage();
        let providers = self.values_providers.entry(key).or_insert_with(Default::default);
        if providers.iter().all(|known| known != local_id) {
            providers.push(local_id.clone());
        }

        // Restart the interval from now so that the next refresh happens right away.
        let first_tick = Instant::now();
        self.refresh_add_providers = Interval::new(first_tick, Duration::from_secs(60)).fuse();
    }

    /// Cancels a registration done with `add_providing`.
    ///
    /// The key is removed from the set of keys we provide, and the local peer ID is removed from
    /// the locally-known providers of that key. Calling this for a key that was never registered
    /// is a no-op.
    ///
    /// There doesn't exist any "remove provider" message to broadcast on the network, therefore we
    /// will still be registered as a provider in the DHT for as long as the timeout doesn't expire.
    pub fn remove_providing(&mut self, key: &Multihash) {
        self.providing_keys.remove(key);

        let providers = match self.values_providers.get_mut(key) {
            Some(p) => p,
            None => return,
        };

        // `add_providing` stored our own peer ID in the list of providers, so that is the entry
        // to look for. (The list holds peer IDs; comparing its items against the key itself
        // never matches and would leave us registered as a provider forever.)
        let local_id = self.kbuckets.local_key().preimage();
        if let Some(position) = providers.iter().position(|peer_id| peer_id == local_id) {
            providers.remove(position);
            providers.shrink_to_fit();
        }
    }

    /// Internal function that starts a query.
    fn start_query(&mut self, target: QueryInfoInner) {
        let query_id = self.next_query_id;
        self.next_query_id.0 += 1;

        let target = QueryInfo {
            inner: target,
            untrusted_addresses: Default::default(),
        };

        let known_closest_peers = self.kbuckets
            .find_closest(&kbucket::Key::new(target.clone()))
            .take(self.num_results);

        self.active_queries.insert(
            query_id,
            QueryState::new(QueryConfig {
                target,
                parallelism: self.parallelism,
                num_results: self.num_results,
                rpc_timeout: self.rpc_timeout,
                known_closest_peers,
            })
        );
    }

    /// Handles the list of peers that `source` reported in response to query `query_id`.
    ///
    /// Every reported peer other than the local node produces a `KademliaOut::Discovered`
    /// event. If the query is still active, the reported addresses are remembered as untrusted
    /// addresses of the query and the peers are injected into it as the result of the RPC.
    fn discovered<'a, I>(&'a mut self, query_id: &QueryId, source: &PeerId, peers: I)
    where
        I: Iterator<Item=&'a KadPeer> + Clone
    {
        // The local node is never reported nor fed back into the query.
        let local_id = self.kbuckets.local_key().preimage().clone();
        let remote_peers = peers.filter(|candidate| candidate.node_id != local_id);

        self.queued_events.extend(remote_peers.clone().map(|peer| {
            NetworkBehaviourAction::GenerateEvent(KademliaOut::Discovered {
                peer_id: peer.node_id.clone(),
                addresses: peer.multiaddrs.clone(),
                ty: peer.connection_ty,
            })
        }));

        // The response may belong to a query that has finished in the meantime.
        let query = match self.active_queries.get_mut(query_id) {
            Some(query) => query,
            None => return,
        };

        for peer in remote_peers.clone() {
            let addresses = peer.multiaddrs.iter().cloned().collect();
            query.target_mut().untrusted_addresses.insert(peer.node_id.clone(), addresses);
        }

        query.inject_rpc_result(source, remote_peers.map(|peer| peer.node_id.clone()));
    }
}

impl<TSubstream> NetworkBehaviour for Kademlia<TSubstream>
where
    TSubstream: AsyncRead + AsyncWrite,
{
    type ProtocolsHandler = KademliaHandler<TSubstream, QueryId>;
    type OutEvent = KademliaOut;

    /// Creates the handler for a new connection: it both dials and listens, and uses the custom
    /// protocol name if one has been configured.
    fn new_handler(&mut self) -> Self::ProtocolsHandler {
        let handler = KademliaHandler::dial_and_listen();
        match self.protocol_name_override.as_ref() {
            Some(name) => handler.with_protocol_name(name.clone()),
            None => handler,
        }
    }

    /// Returns the addresses we know for `peer_id`.
    ///
    /// Addresses are meant to be ordered by decreasing likelihood of connectivity: the ones
    /// stored in the k-buckets come first, followed by the untrusted addresses gathered by the
    /// queries in progress.
    fn addresses_of_peer(&mut self, peer_id: &PeerId) -> Vec<Multiaddr> {
        let key = kbucket::Key::new(peer_id.clone());

        // Most reliable source: the k-buckets entry of that peer, if it is not pending.
        let mut out_list = match self.kbuckets.entry(&key).value_not_pending() {
            Some(known) => known.iter().cloned().collect::<Vec<_>>(),
            None => Vec::new(),
        };

        // Then the temporary addresses reported to us during the ongoing queries.
        let temporary = self.active_queries
            .values()
            .filter_map(|query| query.target().untrusted_addresses.get(peer_id))
            .flat_map(|addrs| addrs.iter().cloned());
        out_list.extend(temporary);

        out_list
    }

    /// Called when a connection with `id` has been established.
    ///
    /// Sends every RPC that was waiting for this peer to connect, then marks the peer as
    /// connected in the k-buckets (inserting it if it was unknown) and in `connected_peers`.
    /// When we are the dialer, the dialed address is recorded as an address of the peer.
    ///
    /// # Panics
    ///
    /// Panics if the k-buckets already consider the peer as connected, or if `id` is the local
    /// peer ID, as both situations violate the invariants of this behaviour.
    fn inject_connected(&mut self, id: PeerId, endpoint: ConnectedPoint) {
        // Several queries can have queued an RPC for the same peer while it was being dialed.
        // All of them must be sent now: an RPC left behind would stay in `pending_rpcs` with
        // nothing to trigger it anymore.
        while let Some(pos) = self.pending_rpcs.iter().position(|(p, _)| p == &id) {
            let (_, rpc) = self.pending_rpcs.remove(pos);
            self.queued_events.push(NetworkBehaviourAction::SendEvent {
                peer_id: id.clone(),
                event: rpc,
            });
        }

        // We only learn an address of the remote when we are the one who dialed it.
        let address = match endpoint {
            ConnectedPoint::Dialer { address } => Some(address),
            ConnectedPoint::Listener { .. } => None,
        };

        let key = kbucket::Key::new(id.clone());

        match self.kbuckets.entry(&key) {
            kbucket::Entry::InKbucketConnected(_) => {
                unreachable!("Kbuckets are always kept in sync with the connection state; QED")
            },
            kbucket::Entry::InKbucketConnectedPending(_) => {
                unreachable!("Kbuckets are always kept in sync with the connection state; QED")
            },

            kbucket::Entry::InKbucketDisconnected(mut entry) => {
                if let Some(address) = address {
                    entry.value().insert(address);
                }
                entry.set_connected();
            },

            kbucket::Entry::InKbucketDisconnectedPending(mut entry) => {
                if let Some(address) = address {
                    entry.value().insert(address);
                }
                entry.set_connected();
            },

            kbucket::Entry::NotInKbucket(entry) => {
                let mut addresses = Addresses::new();
                if let Some(address) = address {
                    addresses.insert(address);
                }
                match entry.insert_connected(addresses) {
                    kbucket::InsertOutcome::Inserted => {
                        let event = KademliaOut::KBucketAdded {
                            peer_id: id.clone(),
                            replaced: None,
                        };
                        self.queued_events.push(NetworkBehaviourAction::GenerateEvent(event));
                    },
                    kbucket::InsertOutcome::Full => (),
                    // The insertion is pending on another node: dial that node.
                    kbucket::InsertOutcome::Pending { to_ping } => {
                        self.queued_events.push(NetworkBehaviourAction::DialPeer {
                            peer_id: to_ping.into_preimage(),
                        })
                    },
                }
            },

            kbucket::Entry::SelfEntry => {
                unreachable!("Guaranteed to never receive disconnected even for self; QED")
            },
        }

        self.connected_peers.insert(id);
    }

    /// Called when dialing `addr` has failed.
    ///
    /// If the peer we were trying to reach is known, the address is forgotten: it is removed
    /// from the k-buckets entry of the peer and from the untrusted addresses of every active
    /// query. Nothing happens when the peer is unknown.
    fn inject_addr_reach_failure(&mut self, peer_id: Option<&PeerId>, addr: &Multiaddr, _: &dyn error::Error) {
        let peer_id = match peer_id {
            Some(peer_id) => peer_id,
            None => return,
        };

        let key = kbucket::Key::new(peer_id.clone());
        if let Some(list) = self.kbuckets.entry(&key).value() {
            // TODO: don't remove the address if the error is that we are already connected
            //       to this peer
            list.remove(addr);
        }

        for query in self.active_queries.values_mut() {
            let untrusted = &mut query.target_mut().untrusted_addresses;
            if let Some(addrs) = untrusted.get_mut(&peer_id) {
                addrs.retain(|a| a != addr);
            }
        }
    }

    /// Called when `peer_id` could not be dialed: every active query is told that its RPC to
    /// this peer has failed.
    fn inject_dial_failure(&mut self, peer_id: &PeerId) {
        self.active_queries
            .values_mut()
            .for_each(|query| query.inject_rpc_error(peer_id));
    }

    /// Called when the connection with `id` has been closed.
    ///
    /// The peer is removed from `connected_peers`, every active query is told that its RPC to
    /// this peer has failed, and the k-buckets entry of the peer is marked as disconnected. If
    /// that makes another node take its place in the bucket, a `KademliaOut::KBucketAdded`
    /// event is produced.
    fn inject_disconnected(&mut self, id: &PeerId, _old_endpoint: ConnectedPoint) {
        let was_in = self.connected_peers.remove(id);
        debug_assert!(was_in);

        self.active_queries
            .values_mut()
            .for_each(|query| query.inject_rpc_error(id));

        let key = kbucket::Key::new(id.clone());
        match self.kbuckets.entry(&key) {
            kbucket::Entry::SelfEntry => {
                unreachable!("Guaranteed to never receive disconnected even for self; QED")
            },
            kbucket::Entry::InKbucketDisconnected(_)
            | kbucket::Entry::InKbucketDisconnectedPending(_) => {
                unreachable!("Kbuckets are always kept in sync with the connection state; QED")
            },
            kbucket::Entry::NotInKbucket(_) => {},
            kbucket::Entry::InKbucketConnectedPending(entry) => {
                entry.set_disconnected();
            },
            kbucket::Entry::InKbucketConnected(entry) => {
                // Only a replacement is worth reporting; a kept entry requires no action.
                if let kbucket::SetDisconnectedOutcome::Replaced { replacement, .. } =
                    entry.set_disconnected()
                {
                    let event = KademliaOut::KBucketAdded {
                        peer_id: replacement.into_preimage(),
                        replaced: Some(id.clone()),
                    };
                    self.queued_events.push(NetworkBehaviourAction::GenerateEvent(event));
                }
            },
        }
    }

    /// Called when the connection with `peer_id` has been replaced with a new one.
    ///
    /// The requests of all the queries that are waiting for an answer from this peer are sent
    /// again. If the peer has a k-buckets entry and we dialed the new connection, the dialed
    /// address is added to that entry.
    fn inject_replaced(&mut self, peer_id: PeerId, _old: ConnectedPoint, new_endpoint: ConnectedPoint) {
        // Requests in flight on the old connection have to be re-sent on the new one.
        let resent = self.active_queries
            .iter()
            .filter(|(_, query)| query.is_waiting(&peer_id))
            .map(|(query_id, query)| NetworkBehaviourAction::SendEvent {
                peer_id: peer_id.clone(),
                event: query.target().to_rpc_request(*query_id),
            });
        self.queued_events.extend(resent);

        let key = kbucket::Key::new(peer_id);
        if let Some(list) = self.kbuckets.entry(&key).value() {
            match new_endpoint {
                ConnectedPoint::Dialer { address } => {
                    list.insert(address);
                },
                ConnectedPoint::Listener { .. } => {},
            }
        }
    }

    /// Handles an event produced by the handler of the connection with `source`.
    ///
    /// Requests coming from the remote (`FindNodeReq`, `GetProvidersReq`) are answered from the
    /// local k-buckets and provider records. Responses and errors to our own requests are routed
    /// to the query identified by their `user_data`. `AddProvider` messages are queued in
    /// `add_provider` and processed on the next `poll()`.
    fn inject_node_event(&mut self, source: PeerId, event: KademliaHandlerEvent<QueryId>) {
        match event {
            KademliaHandlerEvent::FindNodeReq { key, request_id } => {
                // Answer with the closest peers we know of, never reporting the requester
                // itself, capped at `num_results` entries.
                let closer_peers = self.kbuckets
                    .find_closest(&kbucket::Key::new(key))
                    .filter(|p| p.preimage() != &source)
                    .take(self.num_results)
                    .map(|key| build_kad_peer(&key, &mut self.kbuckets))
                    .collect();

                self.queued_events.push(NetworkBehaviourAction::SendEvent {
                    peer_id: source,
                    event: KademliaHandlerIn::FindNodeRes {
                        closer_peers,
                        request_id,
                    },
                });
            }
            KademliaHandlerEvent::FindNodeRes {
                closer_peers,
                user_data,
            } => {
                // `user_data` is the ID of the query this response belongs to.
                self.discovered(&user_data, &source, closer_peers.iter());
            }
            KademliaHandlerEvent::GetProvidersReq { key, request_id } => {
                // Providers of the key that we know of locally, the requester excluded.
                // NOTE(review): `values_providers` can contain the local peer ID, whereas the
                // documentation of `build_kad_peer` says it must not be called with the local
                // one — confirm how that case is handled.
                let provider_peers = {
                    let kbuckets = &mut self.kbuckets;
                    self.values_providers
                        .get(&key)
                        .into_iter()
                        .flat_map(|peers| peers)
                        .filter(|p| *p != &source)
                        .map(move |peer_id| build_kad_peer(&kbucket::Key::new(peer_id.clone()), kbuckets))
                        .collect()
                };

                // Contrary to `FindNodeReq`, the requester is not filtered out of this list.
                let closer_peers = self.kbuckets
                    .find_closest(&kbucket::Key::from(key))
                    .take(self.num_results)
                    .map(|key| build_kad_peer(&key, &mut self.kbuckets))
                    .collect();

                self.queued_events.push(NetworkBehaviourAction::SendEvent {
                    peer_id: source,
                    event: KademliaHandlerIn::GetProvidersRes {
                        closer_peers,
                        provider_peers,
                        request_id,
                    },
                });
            }
            KademliaHandlerEvent::GetProvidersRes {
                closer_peers,
                provider_peers,
                user_data,
            } => {
                // Both the closer peers and the providers count as discovered peers and are
                // fed into the query.
                let peers = closer_peers.iter().chain(provider_peers.iter());
                self.discovered(&user_data, &source, peers);
                // The providers are additionally accumulated as results of the query, if it is
                // still active and is indeed a `GetProviders` query.
                if let Some(query) = self.active_queries.get_mut(&user_data) {
                    if let QueryInfoInner::GetProviders {
                        pending_results, ..
                    } = &mut query.target_mut().inner {
                        for peer in provider_peers {
                            pending_results.push(peer.node_id);
                        }
                    }
                }
            }
            KademliaHandlerEvent::QueryError { user_data, .. } => {
                // It is possible that we obtain a response for a query that has finished, which is
                // why we may not find an entry in `self.active_queries`.
                if let Some(query) = self.active_queries.get_mut(&user_data) {
                    query.inject_rpc_error(&source)
                }
            }
            KademliaHandlerEvent::AddProvider { key, provider_peer } => {
                // Report the provider as a discovered peer, and remember the record so that it
                // gets merged into `values_providers` at the beginning of the next `poll()`.
                self.queued_events.push(NetworkBehaviourAction::GenerateEvent(KademliaOut::Discovered {
                    peer_id: provider_peer.node_id.clone(),
                    addresses: provider_peer.multiaddrs.clone(),
                    ty: provider_peer.connection_ty,
                }));
                self.add_provider.push((key, provider_peer.node_id));
                return;
            }
        };
    }

    /// Drives the behaviour forward and returns the next action for the swarm, if any.
    ///
    /// In order, this:
    ///
    /// 1. merges the provider records received since the last call into `values_providers`;
    /// 2. starts an `AddProvider` query for every provided key if the refresh interval fired;
    /// 3. returns the queued events one at a time;
    /// 4. polls the active queries, turning their output into RPCs to send or peers to dial, and
    ///    turning finished queries into result events.
    ///
    /// Returns `Async::NotReady` once there is no queued event and no query is finished.
    fn poll(
        &mut self,
        parameters: &mut PollParameters<'_>,
    ) -> Async<
        NetworkBehaviourAction<
            <Self::ProtocolsHandler as ProtocolsHandler>::InEvent,
            Self::OutEvent,
        >,
    > {
        // Flush the changes to the topology that we want to make.
        for (key, provider) in self.add_provider.drain() {
            // Don't add ourselves to the providers.
            if provider == *self.kbuckets.local_key().preimage() {
                continue;
            }
            // Each provider is recorded at most once per key.
            let providers = self.values_providers.entry(key).or_insert_with(Default::default);
            if !providers.iter().any(|peer_id| peer_id == &provider) {
                providers.push(provider);
            }
        }
        self.add_provider.shrink_to_fit();

        // Handle `refresh_add_providers`.
        match self.refresh_add_providers.poll() {
            Ok(Async::NotReady) => {},
            Ok(Async::Ready(Some(_))) => {
                // The set is cloned because `start_query` needs `&mut self`.
                for target in self.providing_keys.clone().into_iter() {
                    self.start_query(QueryInfoInner::AddProvider { target });
                }
            },
            // Ignore errors.
            Ok(Async::Ready(None)) | Err(_) => {},
        }

        loop {
            // Handle events queued by other parts of this struct
            if !self.queued_events.is_empty() {
                return Async::Ready(self.queued_events.remove(0));
            }
            self.queued_events.shrink_to_fit();

            // If iterating finds a query that is finished, stores it here and stops looping.
            let mut finished_query = None;

            'queries_iter: for (&query_id, query) in self.active_queries.iter_mut() {
                // Poll this query until it has nothing more to report for now.
                loop {
                    match query.poll() {
                        Async::Ready(QueryStatePollOut::Finished) => {
                            // The query can't be removed from the map while iterating over it;
                            // this is done after the loop.
                            finished_query = Some(query_id);
                            break 'queries_iter;
                        }
                        Async::Ready(QueryStatePollOut::SendRpc {
                            peer_id,
                            query_target,
                        }) => {
                            // NOTE(review): `to_rpc_request` contains an `unimplemented!()` for
                            // `AddProvider` queries, so reaching this point with such a query
                            // looks like it panics — confirm.
                            let rpc = query_target.to_rpc_request(query_id);
                            if self.connected_peers.contains(peer_id) {
                                return Async::Ready(NetworkBehaviourAction::SendEvent {
                                    peer_id: peer_id.clone(),
                                    event: rpc,
                                });
                            } else if peer_id != self.kbuckets.local_key().preimage() {
                                // Not connected yet: keep the RPC aside until `inject_connected`
                                // is called, and ask the swarm to dial the peer.
                                self.pending_rpcs.push((peer_id.clone(), rpc));
                                return Async::Ready(NetworkBehaviourAction::DialPeer {
                                    peer_id: peer_id.clone(),
                                });
                            }
                            // An RPC targeting the local node is silently dropped.
                        }
                        Async::Ready(QueryStatePollOut::CancelRpc { peer_id }) => {
                            // We don't cancel if the RPC has already been sent out.
                            // Note that this discards all the pending RPCs for that peer,
                            // whichever query queued them.
                            self.pending_rpcs.retain(|(id, _)| id != peer_id);
                        }
                        Async::NotReady => break,
                    }
                }
            }

            if let Some(finished_query) = finished_query {
                let (query_info, closer_peers) = self
                    .active_queries
                    .remove(&finished_query)
                    .expect("finished_query was gathered when iterating active_queries; QED.")
                    .into_target_and_closest_peers();

                match query_info.inner {
                    // Nothing to report; go through the outer loop again.
                    QueryInfoInner::Initialization { .. } => {},
                    QueryInfoInner::FindPeer(target) => {
                        let event = KademliaOut::FindNodeResult {
                            key: target,
                            closer_peers: closer_peers.collect(),
                        };
                        break Async::Ready(NetworkBehaviourAction::GenerateEvent(event));
                    },
                    QueryInfoInner::GetProviders { target, pending_results } => {
                        let event = KademliaOut::GetProvidersResult {
                            key: target,
                            closer_peers: closer_peers.collect(),
                            provider_peers: pending_results,
                        };

                        break Async::Ready(NetworkBehaviourAction::GenerateEvent(event));
                    },
                    QueryInfoInner::AddProvider { target } => {
                        // Queue one `AddProvider` message, advertising the local node, for each
                        // of the closest peers found. They are returned by the next iterations
                        // of the outer loop.
                        // NOTE(review): the documentation of `build_kad_peer` says it must not
                        // be called with the local peer ID, which is what happens here —
                        // confirm how that case is handled.
                        let local_key = kbucket::Key::new(parameters.local_peer_id().clone());
                        for closest in closer_peers {
                            let event = NetworkBehaviourAction::SendEvent {
                                peer_id: closest,
                                event: KademliaHandlerIn::AddProvider {
                                    key: target.clone(),
                                    provider_peer: build_kad_peer(&local_key, &mut self.kbuckets),
                                },
                            };

                            self.queued_events.push(event);
                        }
                    },
                }
            } else {
                break Async::NotReady;
            }
        }
    }
}

/// Output event of the `Kademlia` behaviour.
///
/// The query-result variants (`FindNodeResult`, `GetProvidersResult`) are produced by the
/// behaviour's polling loop once the corresponding iterative query has finished, and are handed
/// to the swarm wrapped in `NetworkBehaviourAction::GenerateEvent`.
#[derive(Debug, Clone)]
pub enum KademliaOut {
    /// We have discovered a node.
    ///
    /// > **Note**: The Kademlia behaviour doesn't store the addresses of this node, and therefore
    /// >           attempting to connect to this node may or may not work.
    Discovered {
        /// Id of the node that was discovered.
        peer_id: PeerId,
        /// Addresses of the node.
        addresses: Vec<Multiaddr>,
        /// How the reporter is connected to the reported.
        ty: KadConnectionType,
    },

    /// A node has been added to a k-bucket.
    KBucketAdded {
        /// Id of the node that was added.
        peer_id: PeerId,
        /// If `Some`, this addition replaced the value that is inside the option.
        replaced: Option<PeerId>,
    },

    /// Result of a `FIND_NODE` iterative query.
    ///
    /// Generated when a query started for a `FindPeer` request has finished.
    FindNodeResult {
        /// The key that we looked for in the query.
        key: PeerId,
        /// List of peers ordered from closest to furthest away.
        ///
        /// Collected from the closest peers reported by the finished query.
        closer_peers: Vec<PeerId>,
    },

    /// Result of a `GET_PROVIDERS` iterative query.
    ///
    /// Generated when a query started for a `GetProviders` request has finished.
    GetProvidersResult {
        /// The key that we looked for in the query.
        key: Multihash,
        /// The peers that are providing the requested key.
        ///
        /// These are the results that were accumulated over the lifetime of the query.
        provider_peers: Vec<PeerId>,
        /// List of peers ordered from closest to furthest away.
        ///
        /// Collected from the closest peers reported by the finished query.
        closer_peers: Vec<PeerId>,
    },
}

/// Builds a `KadPeer` struct describing the node identified by `key`.
///
/// The addresses and the connection type are read from the node's entry in `kbuckets`:
///
/// - a node that is not in any k-bucket is reported with no addresses and as `NotConnected`;
/// - a node in a k-bucket (pending or not) is reported with the addresses stored for it, and as
///   `Connected` or `NotConnected` depending on the state of its entry;
/// - the local node itself (`SelfEntry`) is reported with no addresses and as `Connected`.
///
/// The returned `KadPeer` always carries the `PeerId` that `key` was built from.
///
/// > **Note**: The k-buckets never contain an entry for the local node, which is why no address
/// >           can be reported for it from here.
fn build_kad_peer(
    key: &kbucket::Key<PeerId>,
    kbuckets: &mut KBucketsTable<PeerId, Addresses>
) -> KadPeer {
    let (multiaddrs, connection_ty) = match kbuckets.entry(key) {
        // TODO: pending connection?
        kbucket::Entry::NotInKbucket(_) => (Vec::new(), KadConnectionType::NotConnected),
        kbucket::Entry::InKbucketConnected(mut entry) => {
            (entry.value().iter().cloned().collect(), KadConnectionType::Connected)
        },
        kbucket::Entry::InKbucketDisconnected(mut entry) => {
            (entry.value().iter().cloned().collect(), KadConnectionType::NotConnected)
        },
        kbucket::Entry::InKbucketConnectedPending(mut entry) => {
            (entry.value().iter().cloned().collect(), KadConnectionType::Connected)
        },
        kbucket::Entry::InKbucketDisconnectedPending(mut entry) => {
            (entry.value().iter().cloned().collect(), KadConnectionType::NotConnected)
        },
        // The `AddProvider` branch of `poll()` builds the `KadPeer` of the local node in order
        // to advertise ourselves as a provider. Panicking here would therefore bring down the
        // behaviour every time such a query finishes, so we describe the local node instead.
        kbucket::Entry::SelfEntry => (Vec::new(), KadConnectionType::Connected),
    };

    KadPeer {
        node_id: key.preimage().clone(),
        multiaddrs,
        connection_ty,
    }
}
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								// Copyright 2018 Parity Technologies (UK) Ltd.
 								//
 								// Permission is hereby granted, free of charge, to any person obtaining a
 								// copy of this software and associated documentation files (the "Software"),
 								// to deal in the Software without restriction, including without limitation
 								// the rights to use, copy, modify, merge, publish, distribute, sublicense,
 								// and/or sell copies of the Software, and to permit persons to whom the
 								// Software is furnished to do so, subject to the following conditions:
 								//
 								// The above copyright notice and this permission notice shall be included in
 								// all copies or substantial portions of the Software.
 								//
 								// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 								// OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 								// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 								// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 								// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 								// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 								// DEALINGS IN THE SOFTWARE.
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustments

											
										
										
											2019-02-12 12:56:39 +01:00
+								use crate::addresses::Addresses;
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								use crate::handler::{KademliaHandler, KademliaHandlerEvent, KademliaHandlerIn};
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								use crate::kbucket::{self, KBucketsTable};
-												Update protocols and transport to 2018 edition (#875)

Update the protocols and transport subdirectories to the 2018 edition.

NB: The websocket transport cannot be moved to 2018 edition due to
websocket-rs's use of the keyword async as the name of a module.
											
										
										
											2019-01-21 10:33:51 +00:00
+								use crate::protocol::{KadConnectionType, KadPeer};
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								use crate::query::{QueryConfig, QueryState, QueryStatePollOut};
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								use fnv::{FnvHashMap, FnvHashSet};
 								use futures::{prelude::*, stream};
-												Enhance the swarm a bit (#711)

* Replace the &mut TTopology with a &mut PollParameters

* Add supported_protocols

* Add external_addresses

* Report out addresses in Kademlia

* Fix the custom derive

* Some comments

* Fix compilation on stable

											
										
										
											2018-12-01 13:34:57 +01:00
+								use libp2p_core::swarm::{ConnectedPoint, NetworkBehaviour, NetworkBehaviourAction, PollParameters};
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								use libp2p_core::{protocols_handler::ProtocolsHandler, Multiaddr, PeerId};
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								use multihash::Multihash;
 								use smallvec::SmallVec;
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								use std::{borrow::Cow, error, marker::PhantomData, time::Duration};
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								use tokio_io::{AsyncRead, AsyncWrite};
-												Switch to wasm-timer (#1071)


											
										
										
											2019-04-25 15:08:06 +02:00
+								use wasm_timer::{Instant, Interval};
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								mod test;
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								/// Network behaviour that handles Kademlia.
 								pub struct Kademlia<TSubstream> {
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								    /// Storage for the nodes. Contains the known multiaddresses for this node.
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								    kbuckets: KBucketsTable<PeerId, Addresses>,
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
-												Allow changing the Kademlia protocol name (#1118)

* Allow changing the Kademlia protocol name

* Expose the method to the behaviour

* Address review

											
										
										
											2019-05-15 15:44:51 +02:00
+								    /// If `Some`, we overwrite the Kademlia protocol name with this one.
 								    protocol_name_override: Option<Cow<'static, [u8]>>,
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    /// All the iterative queries we are currently performing, with their ID. The last parameter
 								    /// is the list of accumulated providers for `GET_PROVIDERS` queries.
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								    active_queries: FnvHashMap<QueryId, QueryState<QueryInfo, PeerId>>,
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
 								    /// List of peers the swarm is connected to.
 								    connected_peers: FnvHashSet<PeerId>,
 								    /// Contains a list of peer IDs which we are not connected to, and an RPC query to send to them
 								    /// once they connect.
 								    pending_rpcs: SmallVec<[(PeerId, KademliaHandlerIn<QueryId>); 8]>,
 								    /// Identifier for the next query that we start.
 								    next_query_id: QueryId,
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								    /// List of values and peers that are providing them.
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    ///
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								    /// Our local peer ID can be in this container.
 								    // TODO: Note that in reality the value is a SHA-256 of the actual value (https://github.com/libp2p/rust-libp2p/issues/694)
 								    values_providers: FnvHashMap<Multihash, SmallVec<[PeerId; 20]>>,
 								    /// List of values that we are providing ourselves. Must be kept in sync with
 								    /// `values_providers`.
 								    providing_keys: FnvHashSet<Multihash>,
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
 								    /// Interval to send `ADD_PROVIDER` messages to everyone.
 								    refresh_add_providers: stream::Fuse<Interval>,
 								    /// `α` in the Kademlia reference papers. Designates the maximum number of queries that we
 								    /// perform in parallel.
 								    parallelism: usize,
 								    /// `k` in the Kademlia reference papers. Number of results in a find node query.
 								    num_results: usize,
 								    /// Timeout for each individual RPC query.
 								    rpc_timeout: Duration,
 								    /// Events to return when polling.
 								    queued_events: SmallVec<[NetworkBehaviourAction<KademliaHandlerIn<QueryId>, KademliaOut>; 32]>,
 								    /// List of providers to add to the topology as soon as we are in `poll()`.
 								    add_provider: SmallVec<[(Multihash, PeerId); 32]>,
 								    /// Marker to pin the generics.
 								    marker: PhantomData<TSubstream>,
 								}
 								/// Opaque type. Each query that we start gets a unique number.
 								#[derive(Debug, Copy, Clone, Hash, PartialEq, Eq)]
 								pub struct QueryId(usize);
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								/// Information about a query.
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								#[derive(Debug, Clone, PartialEq, Eq)]
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								struct QueryInfo {
 								    /// What we are querying and why.
 								    inner: QueryInfoInner,
 								    /// Temporary addresses used when trying to reach nodes.
 								    untrusted_addresses: FnvHashMap<PeerId, SmallVec<[Multiaddr; 8]>>,
 								}
 								/// Additional information about the query.
 								#[derive(Debug, Clone, PartialEq, Eq)]
 								enum QueryInfoInner {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    /// The query was created for the Kademlia initialization process.
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								    Initialization {
 								        /// Hash we're targeting to insert ourselves in the k-buckets.
 								        target: PeerId,
 								    },
 								    /// The user requested a `FIND_PEER` query to be performed. It should be reported when finished.
 								    FindPeer(PeerId),
 								    /// The user requested a `GET_PROVIDERS` query to be performed. It should be reported when
 								    /// finished.
 								    GetProviders {
 								        /// Target we are searching the providers of.
 								        target: Multihash,
 								        /// Results to return. Filled over time.
 								        pending_results: Vec<PeerId>,
 								    },
 								    /// We are traversing towards `target` and should add an `ADD_PROVIDER` message to the peers
 								    /// of the outcome with our own identity.
 								    AddProvider {
 								        /// Which hash we're targeting.
 								        target: Multihash,
 								    },
 								}
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								impl Into<kbucket::Key<QueryInfo>> for QueryInfo {
 								    fn into(self) -> kbucket::Key<QueryInfo> {
 								        kbucket::Key::new(self)
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								    }
 								}
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								impl AsRef<[u8]> for QueryInfo {
 								    fn as_ref(&self) -> &[u8] {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								        match &self.inner {
 								            QueryInfoInner::Initialization { target } => target.as_ref(),
 								            QueryInfoInner::FindPeer(peer) => peer.as_ref(),
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								            QueryInfoInner::GetProviders { target, .. } => target.as_bytes(),
 								            QueryInfoInner::AddProvider { target } => target.as_bytes(),
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								        }
 								    }
 								}
 								impl QueryInfo {
 								    /// Creates the corresponding RPC request to send to remote.
 								    fn to_rpc_request<TUserData>(&self, user_data: TUserData) -> KademliaHandlerIn<TUserData> {
 								        match &self.inner {
 								            QueryInfoInner::Initialization { target } => KademliaHandlerIn::FindNodeReq {
 								                key: target.clone(),
 								                user_data,
 								            },
 								            QueryInfoInner::FindPeer(key) => KademliaHandlerIn::FindNodeReq {
 								                key: key.clone(),
 								                user_data,
 								            },
 								            QueryInfoInner::GetProviders { target, .. } => KademliaHandlerIn::GetProvidersReq {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                key: target.clone(),
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                user_data,
 								            },
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								            QueryInfoInner::AddProvider { .. } => KademliaHandlerIn::FindNodeReq {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                key: unimplemented!(), // TODO: target.clone(),
 								                user_data,
 								            },
 								        }
 								    }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								}
 								impl<TSubstream> Kademlia<TSubstream> {
 								    /// Creates a `Kademlia`.
 								    #[inline]
 								    pub fn new(local_peer_id: PeerId) -> Self {
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								        Self::new_inner(local_peer_id)
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    }
-												Allow changing the Kademlia protocol name (#1118)

* Allow changing the Kademlia protocol name

* Expose the method to the behaviour

* Address review

											
										
										
											2019-05-15 15:44:51 +02:00
+								    /// Builds a `Kademlia` the same way `new` does, but with a custom protocol name.
 								    ///
 								    /// Only nodes that use the same protocol name communicate with each other, so picking a
 								    /// custom name keeps this DHT segregated from others, if that is desired.
 								    pub fn with_protocol_name(local_peer_id: PeerId, name: impl Into<Cow<'static, [u8]>>) -> Self {
 								        let mut behaviour = Self::new_inner(local_peer_id);
 								        behaviour.protocol_name_override = Some(name.into());
 								        behaviour
 								    }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    /// Creates a `Kademlia`.
 								    ///
 								    /// Contrary to `new`, doesn't perform the initialization queries that store our local ID into
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								    /// the DHT and fill our buckets.
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    #[inline]
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								    #[deprecated(note="this function is now equivalent to new() and will be removed in the future")]
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    pub fn without_init(local_peer_id: PeerId) -> Self {
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								        Self::new_inner(local_peer_id)
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    }
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustments

											
										
										
											2019-02-12 12:56:39 +01:00
+								    /// Adds a known address for the given `PeerId`. We are connected to this address.
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								    // TODO: report if the address was inserted? also, semantics unclear
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustments

											
										
										
											2019-02-12 12:56:39 +01:00
+								    pub fn add_connected_address(&mut self, peer_id: &PeerId, address: Multiaddr) {
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								        self.add_address(peer_id, address, true)
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustments

											
										
										
											2019-02-12 12:56:39 +01:00
+								    }
 								    /// Adds a known address for the given `PeerId`. We are not connected or don't know whether we
 								    /// are connected to this address.
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								    // TODO: report if the address was inserted? also, semantics unclear
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustments

											
										
										
											2019-02-12 12:56:39 +01:00
+								    pub fn add_not_connected_address(&mut self, peer_id: &PeerId, address: Multiaddr) {
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								        self.add_address(peer_id, address, false)
 								    }
 								    /// Underlying implementation for `add_connected_address` and `add_not_connected_address`.
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								    fn add_address(&mut self, peer_id: &PeerId, address: Multiaddr, _connected: bool) {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        let key = kbucket::Key::new(peer_id.clone());
 								        match self.kbuckets.entry(&key) {
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
+								            kbucket::Entry::InKbucketConnected(mut entry) => entry.value().insert(address),
 								            kbucket::Entry::InKbucketConnectedPending(mut entry) => entry.value().insert(address),
 								            kbucket::Entry::InKbucketDisconnected(mut entry) => entry.value().insert(address),
 								            kbucket::Entry::InKbucketDisconnectedPending(mut entry) => entry.value().insert(address),
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								            kbucket::Entry::NotInKbucket(entry) => {
 								                let mut addresses = Addresses::new();
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
+								                addresses.insert(address);
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								                match entry.insert_disconnected(addresses) {
 								                    kbucket::InsertOutcome::Inserted => {
 								                        let event = KademliaOut::KBucketAdded {
 								                            peer_id: peer_id.clone(),
 								                            replaced: None,
 								                        };
 								                        self.queued_events.push(NetworkBehaviourAction::GenerateEvent(event));
 								                    },
 								                    kbucket::InsertOutcome::Full => (),
 								                    kbucket::InsertOutcome::Pending { to_ping } => {
 								                        self.queued_events.push(NetworkBehaviourAction::DialPeer {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                            peer_id: to_ping.into_preimage(),
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								                        })
 								                    },
 								                }
 								                return;
 								            },
 								            kbucket::Entry::SelfEntry => return,
 								        };
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								    }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    /// Inner implementation of the constructors.
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								    fn new_inner(local_peer_id: PeerId) -> Self {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        let parallelism = 3;
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								        Kademlia {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								            kbuckets: KBucketsTable::new(kbucket::Key::new(local_peer_id), Duration::from_secs(60)),   // TODO: constant
-												Allow changing the Kademlia protocol name (#1118)

* Allow changing the Kademlia protocol name

* Expose the method to the behaviour

* Address review

											
										
										
											2019-05-15 15:44:51 +02:00
+								            protocol_name_override: None,
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								            queued_events: SmallVec::new(),
 								            active_queries: Default::default(),
 								            connected_peers: Default::default(),
 								            pending_rpcs: SmallVec::with_capacity(parallelism),
 								            next_query_id: QueryId(0),
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								            values_providers: FnvHashMap::default(),
 								            providing_keys: FnvHashSet::default(),
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								            refresh_add_providers: Interval::new_interval(Duration::from_secs(60)).fuse(),     // TODO: constant
 								            parallelism,
 								            num_results: 20,
 								            rpc_timeout: Duration::from_secs(8),
 								            add_provider: SmallVec::new(),
 								            marker: PhantomData,
 								        }
 								    }
-												Add kbuckets_entries (#1016)


											
										
										
											2019-03-20 18:36:01 +01:00
+								    /// Returns an iterator to all the peer IDs in the bucket, without the pending nodes.
 								    pub fn kbuckets_entries(&self) -> impl Iterator<Item = &PeerId> {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        self.kbuckets.entries_not_pending().map(|(key, _)| key.preimage())
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								    }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    /// Starts an iterative `FIND_NODE` request.
 								    ///
 								    /// This will eventually produce an event containing the nodes of the DHT closest to the
 								    /// requested `PeerId`.
 								    pub fn find_node(&mut self, peer_id: PeerId) {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								        self.start_query(QueryInfoInner::FindPeer(peer_id));
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    }
 								    /// Starts an iterative `GET_PROVIDERS` request.
 								    ///
 								    /// The query is registered through `start_query` as a `QueryInfoInner::GetProviders`
 								    /// query for `target`, with an initially empty `pending_results` list.
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								    pub fn get_providers(&mut self, target: Multihash) {
 								        self.start_query(QueryInfoInner::GetProviders { target, pending_results: Vec::new() });
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    }
 								    /// Register the local node as the provider for the given key.
 								    ///
 								    /// This will periodically send `ADD_PROVIDER` messages to the nodes closest to the key. When
 								    /// someone performs a `GET_PROVIDERS` iterative request on the DHT, our local node will be
 								    /// returned as part of the results.
 								    ///
 								    /// The actual meaning of *providing* the value of a key is not defined, and is specific to
 								    /// the value whose key is the hash.
 								    ///
 								    /// Locally, the key is added to `providing_keys`, and the local peer id is appended to the
 								    /// provider list kept for that key in `values_providers` unless it is already present.
-												Replace PeerId with Multihash for interface consistency (#1095)

* Change a PeerId for a Multihash

* Update protocols/kad/src/behaviour.rs

Co-Authored-By: elferdo <elferdo@gmail.com>

* Update protocols/kad/src/behaviour.rs

Co-Authored-By: elferdo <elferdo@gmail.com>

											
										
										
											2019-04-30 19:39:26 +02:00
+								    pub fn add_providing(&mut self, key: Multihash) {
 								        self.providing_keys.insert(key.clone());
 								        let providers = self.values_providers.entry(key).or_insert_with(Default::default);
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        let local_id = self.kbuckets.local_key().preimage();
 								        // Only record the local peer once per key.
 								        if !providers.iter().any(|peer_id| peer_id == local_id) {
 								            providers.push(local_id.clone());
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        }
 								        // Trigger the next refresh now.
 								        // The interval is rebuilt from `Instant::now()` and a 60-second `Duration`.
 								        self.refresh_add_providers = Interval::new(Instant::now(), Duration::from_secs(60)).fuse();
 								    }
 								    /// Cancels a registration done with `add_providing`.
 								    ///
 								    /// There doesn't exist any "remove provider" message to broadcast on the network, therefore we
 								    /// will still be registered as a provider in the DHT for as long as the timeout doesn't expire.
 								    ///
 								    /// Locally, `key` is removed from `providing_keys` and the local peer id is removed from the
 								    /// provider list stored for `key` in `values_providers`. Other entries of that list are kept.
 								    /// Nothing happens to `values_providers` if no provider list exists for `key`.
 								    pub fn remove_providing(&mut self, key: &Multihash) {
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								        self.providing_keys.remove(key);
 								        let providers = match self.values_providers.get_mut(key) {
 								            Some(p) => p,
 								            None => return,
 								        };
 								        // The provider list holds peer ids; `add_providing` pushes the local peer id into it,
 								        // so that is the entry to drop again (comparing against `key` would not find it).
 								        let local_id = self.kbuckets.local_key().preimage();
 								        if let Some(position) = providers.iter().position(|peer_id| peer_id == local_id) {
 								            providers.remove(position);
 								            providers.shrink_to_fit();
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        }
 								    }
 								    /// Internal function that starts a query.
 								    ///
 								    /// Takes the current `next_query_id` as the id of the new query and increments the counter.
 								    /// `target` is wrapped in a `QueryInfo` with default-initialised `untrusted_addresses`, and a
 								    /// new `QueryState` is inserted into `active_queries`, configured with the behaviour's
 								    /// `parallelism`, `num_results` and `rpc_timeout` and seeded with at most `num_results`
 								    /// entries returned by `find_closest` on the k-buckets.
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								    fn start_query(&mut self, target: QueryInfoInner) {
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								        let query_id = self.next_query_id;
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        self.next_query_id.0 += 1;
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
 								        let target = QueryInfo {
 								            inner: target,
 								            untrusted_addresses: Default::default(),
 								        };
 								        // Seed the query with the closest entries we already know about.
 								        let known_closest_peers = self.kbuckets
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								            .find_closest(&kbucket::Key::new(target.clone()))
 								            .take(self.num_results);
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
 								        self.active_queries.insert(
 								            query_id,
 								            QueryState::new(QueryConfig {
 								                target,
 								                parallelism: self.parallelism,
 								                num_results: self.num_results,
 								                rpc_timeout: self.rpc_timeout,
 								                known_closest_peers,
 								            })
 								        );
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    }
-												Fix self-dialing in Kademlia. (#1097)

* Fix self-dialing in Kademlia.

Addresses https://github.com/libp2p/rust-libp2p/issues/341 which is the cause
for one of the observations made in https://github.com/libp2p/rust-libp2p/issues/1053.
However, the latter is not assumed to be fully addressed by these changes and
needs further investigation.

Currently, whenever a search for a key yields a response containing the initiating
peer as one of the closest peers known to the remote, the local node
would attempt to dial itself. That attempt is ignored by the Swarm, but
the Kademlia behaviour now believes it still has a query ongoing which is
always doomed to time out. That timeout delays successful completion of the query.
Hence, any query where a remote responds with the ID of the local node takes at
least as long as the `rpc_timeout` to complete, which possibly affects almost
all queries in smaller clusters where every node knows about every other.

This problem is fixed here by ensuring that Kademlia never tries to dial the local node.
Furthermore, `Discovered` events are no longer emitted for the local node
and it is not inserted into the `untrusted_addresses` from discovery, as described
in #341.

This commit also includes a change to the condition for freezing / terminating
a Kademlia query upon receiving a response. Specifically, the condition is
tightened such that it only applies if in addition to `parallelism`
consecutive responses that failed to yield a peer closer to the target, the
last response must also either not have reported any new peer or the
number of collected peers has already reached the number of desired results.
In effect, a Kademlia query now tries harder to actually return `k`
closest peers.

Tests have been refactored and expanded.

* Add another comment.

											
										
										
											2019-05-02 21:43:29 +02:00
 								    /// Processes discovered peers from a query.
 								    ///
 								    /// Peers whose `node_id` equals the local node's id are filtered out first. For every
 								    /// remaining peer a `KademliaOut::Discovered` event is queued. If `query_id` refers to an
 								    /// entry in `active_queries`, the peers' addresses are stored in that query's
 								    /// `untrusted_addresses` and their ids are passed to the query as the RPC result received
 								    /// from `source`.
 								    fn discovered<'a, I>(&'a mut self, query_id: &QueryId, source: &PeerId, peers: I)
 								    where
 								        I: Iterator<Item=&'a KadPeer> + Clone
 								    {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        let local_id = self.kbuckets.local_key().preimage().clone();
-												Fix self-dialing in Kademlia. (#1097)

* Fix self-dialing in Kademlia.

Addresses https://github.com/libp2p/rust-libp2p/issues/341 which is the cause
for one of the observations made in https://github.com/libp2p/rust-libp2p/issues/1053.
However, the latter is not assumed to be fully addressed by these changes and
needs further investigation.

Currently, whenever a search for a key yields a response containing the initiating
peer as one of the closest peers known to the remote, the local node
would attempt to dial itself. That attempt is ignored by the Swarm, but
the Kademlia behaviour now believes it still has a query ongoing which is
always doomed to time out. That timeout delays successful completion of the query.
Hence, any query where a remote responds with the ID of the local node takes at
least as long as the `rpc_timeout` to complete, which possibly affects almost
all queries in smaller clusters where every node knows about every other.

This problem is fixed here by ensuring that Kademlia never tries to dial the local node.
Furthermore, `Discovered` events are no longer emitted for the local node
and it is not inserted into the `untrusted_addresses` from discovery, as described
in #341.

This commit also includes a change to the condition for freezing / terminating
a Kademlia query upon receiving a response. Specifically, the condition is
tightened such that it only applies if in addition to `parallelism`
consecutive responses that failed to yield a peer closer to the target, the
last response must also either not have reported any new peer or the
number of collected peers has already reached the number of desired results.
In effect, a Kademlia query now tries harder to actually return `k`
closest peers.

Tests have been refactored and expanded.

* Add another comment.

											
										
										
											2019-05-02 21:43:29 +02:00
+								        let others_iter = peers.filter(|p| p.node_id != local_id);
 								        // The filtered iterator is cloned so that it can be walked once per step below.
 								        for peer in others_iter.clone() {
 								            self.queued_events.push(NetworkBehaviourAction::GenerateEvent(
 								                KademliaOut::Discovered {
 								                    peer_id: peer.node_id.clone(),
 								                    addresses: peer.multiaddrs.clone(),
 								                    ty: peer.connection_ty,
 								                }
 								            ));
 								        }
 								        // Nothing more is done if the query is no longer in `active_queries`.
 								        if let Some(query) = self.active_queries.get_mut(query_id) {
 								            for peer in others_iter.clone() {
 								                query.target_mut().untrusted_addresses
 								                    .insert(peer.node_id.clone(), peer.multiaddrs.iter().cloned().collect());
 								            }
 								            query.inject_rpc_result(source, others_iter.cloned().map(|kp| kp.node_id))
 								        }
 								    }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								}
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								impl<TSubstream> NetworkBehaviour for Kademlia<TSubstream>
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								where
 								    TSubstream: AsyncRead + AsyncWrite,
 								{
 								    type ProtocolsHandler = KademliaHandler<TSubstream, QueryId>;
 								    type OutEvent = KademliaOut;
 								    /// Builds the handler via `KademliaHandler::dial_and_listen`, applying
 								    /// `protocol_name_override` to it when one is set.
 								    fn new_handler(&mut self) -> Self::ProtocolsHandler {
-												Allow changing the Kademlia protocol name (#1118)

* Allow changing the Kademlia protocol name

* Expose the method to the behaviour

* Address review

											
										
										
											2019-05-15 15:44:51 +02:00
+								        let mut handler = KademliaHandler::dial_and_listen();
 								        if let Some(name) = self.protocol_name_override.as_ref() {
 								            handler = handler.with_protocol_name(name.clone());
 								        }
 								        handler
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    }
-												Add inject_dial_failure and make addresses_of_peer mut (#901)

* Add inject_dial_failure and make addresses_of_peer mut

* Fix tests

											
										
										
											2019-01-30 14:55:39 +01:00
+								    fn addresses_of_peer(&mut self, peer_id: &PeerId) -> Vec<Multiaddr> {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								        // We should order addresses by decreasing likelihood of connectivity, so start with
 								        // the addresses of that peer in the k-buckets.
 								        // If `value_not_pending` yields nothing for this peer, the list starts out empty.
 								        let mut out_list = self.kbuckets
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								            .entry(&kbucket::Key::new(peer_id.clone()))
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								            .value_not_pending()
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								            .map(|l| l.iter().cloned().collect::<Vec<_>>())
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								            .unwrap_or_else(Vec::new);
 								        // We add to that a temporary list of addresses from the ongoing queries.
 								        // Addresses are appended as-is; no de-duplication is performed here.
 								        for query in self.active_queries.values() {
 								            if let Some(addrs) = query.target().untrusted_addresses.get(peer_id) {
 								                for addr in addrs {
 								                    out_list.push(addr.clone());
 								                }
 								            }
 								        }
 								        out_list
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								    }
-												Add NetworkBehaviour::inject_replaced (#914)

* Add NetworkBehaviour::inject_replaced

* Address style

* Forgot to call set_disconnected

* Also add incoming addresses to kbuckets

											
										
										
											2019-02-04 15:21:50 +01:00
+								    fn inject_connected(&mut self, id: PeerId, endpoint: ConnectedPoint) {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        if let Some(pos) = self.pending_rpcs.iter().position(|(p, _)| p == &id) {
 								            let (_, rpc) = self.pending_rpcs.remove(pos);
 								            self.queued_events.push(NetworkBehaviourAction::SendEvent {
 								                peer_id: id.clone(),
 								                event: rpc,
 								            });
 								        }
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								        let address = match endpoint {
 								            ConnectedPoint::Dialer { address } => Some(address),
 								            ConnectedPoint::Listener { .. } => None,
 								        };
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        let key = kbucket::Key::new(id.clone());
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        match self.kbuckets.entry(&key) {
-												Bugfix in Kademlia disconnected (#1017)


											
										
										
											2019-03-20 17:52:35 +01:00
+								            kbucket::Entry::InKbucketConnected(_) => {
-												Revert accidental change in Kademlia (#1018)


											
										
										
											2019-03-20 18:55:09 +01:00
+								                unreachable!("Kbuckets are always kept in sync with the connection state; QED")
-												Bugfix in Kademlia disconnected (#1017)


											
										
										
											2019-03-20 17:52:35 +01:00
+								            },
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								            kbucket::Entry::InKbucketConnectedPending(_) => {
-												Revert accidental change in Kademlia (#1018)


											
										
										
											2019-03-20 18:55:09 +01:00
+								                unreachable!("Kbuckets are always kept in sync with the connection state; QED")
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								            },
 								            kbucket::Entry::InKbucketDisconnected(mut entry) => {
 								                if let Some(address) = address {
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
+								                    entry.value().insert(address);
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								                }
 								                entry.set_connected();
 								            },
 								            kbucket::Entry::InKbucketDisconnectedPending(mut entry) => {
 								                if let Some(address) = address {
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
+								                    entry.value().insert(address);
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								                }
 								                entry.set_connected();
 								            },
 								            kbucket::Entry::NotInKbucket(entry) => {
 								                let mut addresses = Addresses::new();
 								                if let Some(address) = address {
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
+								                    addresses.insert(address);
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								                }
 								                match entry.insert_connected(addresses) {
 								                    kbucket::InsertOutcome::Inserted => {
 								                        let event = KademliaOut::KBucketAdded {
 								                            peer_id: id.clone(),
 								                            replaced: None,
 								                        };
 								                        self.queued_events.push(NetworkBehaviourAction::GenerateEvent(event));
 								                    },
 								                    kbucket::InsertOutcome::Full => (),
 								                    kbucket::InsertOutcome::Pending { to_ping } => {
 								                        self.queued_events.push(NetworkBehaviourAction::DialPeer {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                            peer_id: to_ping.into_preimage(),
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								                        })
 								                    },
 								                }
 								            },
 								            kbucket::Entry::SelfEntry => {
 								                unreachable!("Guaranteed to never receive disconnected even for self; QED")
 								            },
-												Add NetworkBehaviour::inject_replaced (#914)

* Add NetworkBehaviour::inject_replaced

* Address style

* Forgot to call set_disconnected

* Also add incoming addresses to kbuckets

											
										
										
											2019-02-04 15:21:50 +01:00
+								        }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        self.connected_peers.insert(id);
 								    }
-												Split address reach error and node reach error (#1013)

* Split address reach error and node reach error

* Small comments about order of operatoins

* Minor doc change

											
										
										
											2019-03-20 20:28:55 +01:00
+								    fn inject_addr_reach_failure(&mut self, peer_id: Option<&PeerId>, addr: &Multiaddr, _: &dyn error::Error) {
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustements

											
										
										
											2019-02-12 12:56:39 +01:00
+								        if let Some(peer_id) = peer_id {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								            let key = kbucket::Key::new(peer_id.clone());
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								            if let Some(list) = self.kbuckets.entry(&key).value() {
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustements

											
										
										
											2019-02-12 12:56:39 +01:00
+								                // TODO: don't remove the address if the error is that we are already connected
 								                //       to this peer
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
+								                list.remove(addr);
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustements

											
										
										
											2019-02-12 12:56:39 +01:00
+								            }
-												Split address reach error and node reach error (#1013)

* Split address reach error and node reach error

* Small comments about order of operatoins

* Minor doc change

											
										
										
											2019-03-20 20:28:55 +01:00
 								            for query in self.active_queries.values_mut() {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                if let Some(addrs) = query.target_mut().untrusted_addresses.get_mut(&peer_id) {
-												Split address reach error and node reach error (#1013)

* Split address reach error and node reach error

* Small comments about order of operatoins

* Minor doc change

											
										
										
											2019-03-20 20:28:55 +01:00
+								                    addrs.retain(|a| a != addr);
 								                }
 								            }
 								        }
 								    }
 								    fn inject_dial_failure(&mut self, peer_id: &PeerId) {
 								        for query in self.active_queries.values_mut() {
 								            query.inject_rpc_error(peer_id);
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustements

											
										
										
											2019-02-12 12:56:39 +01:00
+								        }
 								    }
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								    fn inject_disconnected(&mut self, id: &PeerId, _old_endpoint: ConnectedPoint) {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        let was_in = self.connected_peers.remove(id);
 								        debug_assert!(was_in);
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								        for query in self.active_queries.values_mut() {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								            query.inject_rpc_error(id);
 								        }
-												Add NetworkBehaviour::inject_replaced (#914)

* Add NetworkBehaviour::inject_replaced

* Address style

* Forgot to call set_disconnected

* Also add incoming addresses to kbuckets

											
										
										
											2019-02-04 15:21:50 +01:00
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        match self.kbuckets.entry(&kbucket::Key::new(id.clone())) {
-												Bugfix in Kademlia disconnected (#1017)


											
										
										
											2019-03-20 17:52:35 +01:00
+								            kbucket::Entry::InKbucketConnected(entry) => {
 								                match entry.set_disconnected() {
 								                    kbucket::SetDisconnectedOutcome::Kept(_) => {},
 								                    kbucket::SetDisconnectedOutcome::Replaced { replacement, .. } => {
 								                        let event = KademliaOut::KBucketAdded {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                            peer_id: replacement.into_preimage(),
-												Bugfix in Kademlia disconnected (#1017)


											
										
										
											2019-03-20 17:52:35 +01:00
+								                            replaced: Some(id.clone()),
 								                        };
 								                        self.queued_events.push(NetworkBehaviourAction::GenerateEvent(event));
 								                    },
 								                }
 								            },
 								            kbucket::Entry::InKbucketConnectedPending(entry) => {
 								                entry.set_disconnected();
 								            },
 								            kbucket::Entry::InKbucketDisconnected(_) => {
 								                unreachable!("Kbuckets are always kept in sync with the connection state; QED")
 								            },
 								            kbucket::Entry::InKbucketDisconnectedPending(_) => {
 								                unreachable!("Kbuckets are always kept in sync with the connection state; QED")
 								            },
 								            kbucket::Entry::NotInKbucket(_) => {},
 								            kbucket::Entry::SelfEntry => {
 								                unreachable!("Guaranteed to never receive disconnected even for self; QED")
 								            },
-												Add a proper list of addresses type for Kademlia (#928)

* Add a proper list of addresses type for Kademlia

* Some adjustements

											
										
										
											2019-02-12 12:56:39 +01:00
+								        }
-												Add NetworkBehaviour::inject_replaced (#914)

* Add NetworkBehaviour::inject_replaced

* Address style

* Forgot to call set_disconnected

* Also add incoming addresses to kbuckets

											
										
										
											2019-02-04 15:21:50 +01:00
+								    }
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
+								    fn inject_replaced(&mut self, peer_id: PeerId, _old: ConnectedPoint, new_endpoint: ConnectedPoint) {
-												Add NetworkBehaviour::inject_replaced (#914)

* Add NetworkBehaviour::inject_replaced

* Address style

* Forgot to call set_disconnected

* Also add incoming addresses to kbuckets

											
										
										
											2019-02-04 15:21:50 +01:00
+								        // We need to re-send the active queries.
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								        for (query_id, query) in self.active_queries.iter() {
-												Add NetworkBehaviour::inject_replaced (#914)

* Add NetworkBehaviour::inject_replaced

* Address style

* Forgot to call set_disconnected

* Also add incoming addresses to kbuckets

											
										
										
											2019-02-04 15:21:50 +01:00
+								            if query.is_waiting(&peer_id) {
 								                self.queued_events.push(NetworkBehaviourAction::SendEvent {
 								                    peer_id: peer_id.clone(),
 								                    event: query.target().to_rpc_request(*query_id),
 								                });
 								            }
 								        }
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        if let Some(list) = self.kbuckets.entry(&kbucket::Key::new(peer_id)).value() {
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								            if let ConnectedPoint::Dialer { address } = new_endpoint {
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
+								                list.insert(address);
-												Add NetworkBehaviour::inject_replaced (#914)

* Add NetworkBehaviour::inject_replaced

* Address style

* Forgot to call set_disconnected

* Also add incoming addresses to kbuckets

											
										
										
											2019-02-04 15:21:50 +01:00
+								            }
 								        }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    }
 								    fn inject_node_event(&mut self, source: PeerId, event: KademliaHandlerEvent<QueryId>) {
 								        match event {
 								            KademliaHandlerEvent::FindNodeReq { key, request_id } => {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                let closer_peers = self.kbuckets
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                    .find_closest(&kbucket::Key::new(key))
 								                    .filter(|p| p.preimage() != &source)
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                    .take(self.num_results)
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                    .map(|key| build_kad_peer(&key, &mut self.kbuckets))
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                    .collect();
 								                self.queued_events.push(NetworkBehaviourAction::SendEvent {
 								                    peer_id: source,
 								                    event: KademliaHandlerIn::FindNodeRes {
 								                        closer_peers,
 								                        request_id,
 								                    },
 								                });
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								            }
 								            KademliaHandlerEvent::FindNodeRes {
 								                closer_peers,
 								                user_data,
 								            } => {
-												Fix self-dialing in Kademlia. (#1097)

* Fix self-dialing in Kademlia.

Addresses https://github.com/libp2p/rust-libp2p/issues/341 which is the cause
for one of the observations made in https://github.com/libp2p/rust-libp2p/issues/1053.
However, the latter is not assumed to be fully addressed by these changes and
needs further investigation.

Currently, whenever a search for a key yields a response containing the initiating
peer as one of the closest peers known to the remote, the local node
would attempt to dial itself. That attempt is ignored by the Swarm, but
the Kademlia behaviour now believes it still has a query ongoing which is
always doomed to time out. That timeout delays successful completion of the query.
Hence, any query where a remote responds with the ID of the local node takes at
least as long as the `rpc_timeout` to complete, which possibly affects almost
all queries in smaller clusters where every node knows about every other.

This problem is fixed here by ensuring that Kademlia never tries to dial the local node.
Furthermore, `Discovered` events are no longer emitted for the local node
and it is not inserted into the `untrusted_addresses` from discovery, as described
in #341.

This commit also includes a change to the condition for freezing / terminating
a Kademlia query upon receiving a response. Specifically, the condition is
tightened such that it only applies if in addition to `parallelism`
consecutive responses that failed to yield a peer closer to the target, the
last response must also either not have reported any new peer or the
number of collected peers has already reached the number of desired results.
In effect, a Kademlia query now tries harder to actually return `k`
closest peers.

Tests have been refactored and expanded.

* Add another comment.

											
										
										
											2019-05-02 21:43:29 +02:00
+								                self.discovered(&user_data, &source, closer_peers.iter());
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								            }
 								            KademliaHandlerEvent::GetProvidersReq { key, request_id } => {
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								                let provider_peers = {
 								                    let kbuckets = &mut self.kbuckets;
 								                    self.values_providers
 								                        .get(&key)
 								                        .into_iter()
 								                        .flat_map(|peers| peers)
-												Filter requesting peer from results. (#1102)

Although not explicitly mentioned in the paper, it seems clear that
including an entry for the requesting peer in a FIND_NODE response
never gives useful information and just occupies a result slot that may
have been better filled with another peer that the requestor may not
know about.

There is one explicit mention that this is the desired behavior
in a somewhat dated design document of another p2p framework [1]:

"The recipient of a FIND_NODE should never return a triple containing
the nodeID of the requestor."

The same reasoning supposedly applies to the libp2p-specific `GET_PROVIDERS`
request.

[1] http://xlattice.sourceforge.net/components/protocol/kademlia/specs.html#FIND_NODE
											
										
										
											2019-05-06 11:40:13 +02:00
+								                        .filter(|p| *p != &source)
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                        .map(move |peer_id| build_kad_peer(&kbucket::Key::new(peer_id.clone()), kbuckets))
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								                        .collect()
 								                };
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                let closer_peers = self.kbuckets
 								                    .find_closest(&kbucket::Key::from(key))
 								                    .take(self.num_results)
 								                    .map(|key| build_kad_peer(&key, &mut self.kbuckets))
 								                    .collect();
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                self.queued_events.push(NetworkBehaviourAction::SendEvent {
 								                    peer_id: source,
 								                    event: KademliaHandlerIn::GetProvidersRes {
 								                        closer_peers,
 								                        provider_peers,
 								                        request_id,
 								                    },
 								                });
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								            }
 								            KademliaHandlerEvent::GetProvidersRes {
 								                closer_peers,
 								                provider_peers,
 								                user_data,
 								            } => {
-												Fix self-dialing in Kademlia. (#1097)

* Fix self-dialing in Kademlia.

Addresses https://github.com/libp2p/rust-libp2p/issues/341 which is the cause
for one of the observations made in https://github.com/libp2p/rust-libp2p/issues/1053.
However, the latter is not assumed to be fully addressed by these changes and
needs further investigation.

Currently, whenever a search for a key yields a response containing the initiating
peer as one of the closest peers known to the remote, the local node
would attempt to dial itself. That attempt is ignored by the Swarm, but
the Kademlia behaviour now believes it still has a query ongoing which is
always doomed to time out. That timeout delays successful completion of the query.
Hence, any query where a remote responds with the ID of the local node takes at
least as long as the `rpc_timeout` to complete, which possibly affects almost
all queries in smaller clusters where every node knows about every other.

This problem is fixed here by ensuring that Kademlia never tries to dial the local node.
Furthermore, `Discovered` events are no longer emitted for the local node
and it is not inserted into the `untrusted_addresses` from discovery, as described
in #341.

This commit also includes a change to the condition for freezing / terminating
a Kademlia query upon receiving a response. Specifically, the condition is
tightened such that it only applies if in addition to `parallelism`
consecutive responses that failed to yield a peer closer to the target, the
last response must also either not have reported any new peer or the
number of collected peers has already reached the number of desired results.
In effect, a Kademlia query now tries harder to actually return `k`
closest peers.

Tests have been refactored and expanded.

* Add another comment.

											
										
										
											2019-05-02 21:43:29 +02:00
+								                let peers = closer_peers.iter().chain(provider_peers.iter());
 								                self.discovered(&user_data, &source, peers);
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                if let Some(query) = self.active_queries.get_mut(&user_data) {
-												Fix self-dialing in Kademlia. (#1097)

* Fix self-dialing in Kademlia.

Addresses https://github.com/libp2p/rust-libp2p/issues/341 which is the cause
for one of the observations made in https://github.com/libp2p/rust-libp2p/issues/1053.
However, the latter is not assumed to be fully addressed by these changes and
needs further investigation.

Currently, whenever a search for a key yields a response containing the initiating
peer as one of the closest peers known to the remote, the local node
would attempt to dial itself. That attempt is ignored by the Swarm, but
the Kademlia behaviour now believes it still has a query ongoing which is
always doomed to time out. That timeout delays successful completion of the query.
Hence, any query where a remote responds with the ID of the local node takes at
least as long as the `rpc_timeout` to complete, which possibly affects almost
all queries in smaller clusters where every node knows about every other.

This problem is fixed here by ensuring that Kademlia never tries to dial the local node.
Furthermore, `Discovered` events are no longer emitted for the local node
and it is not inserted into the `untrusted_addresses` from discovery, as described
in #341.

This commit also includes a change to the condition for freezing / terminating
a Kademlia query upon receiving a response. Specifically, the condition is
tightened such that it only applies if in addition to `parallelism`
consecutive responses that failed to yield a peer closer to the target, the
last response must also either not have reported any new peer or the
number of collected peers has already reached the number of desired results.
In effect, a Kademlia query now tries harder to actually return `k`
closest peers.

Tests have been refactored and expanded.

* Add another comment.

											
										
										
											2019-05-02 21:43:29 +02:00
+								                    if let QueryInfoInner::GetProviders {
 								                        pending_results, ..
 								                    } = &mut query.target_mut().inner {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                        for peer in provider_peers {
 								                            pending_results.push(peer.node_id);
 								                        }
 								                    }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                }
 								            }
 								            KademliaHandlerEvent::QueryError { user_data, .. } => {
 								                // It is possible that we obtain a response for a query that has finished, which is
 								                // why we may not find an entry in `self.active_queries`.
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                if let Some(query) = self.active_queries.get_mut(&user_data) {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                    query.inject_rpc_error(&source)
 								                }
 								            }
 								            KademliaHandlerEvent::AddProvider { key, provider_peer } => {
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								                self.queued_events.push(NetworkBehaviourAction::GenerateEvent(KademliaOut::Discovered {
 								                    peer_id: provider_peer.node_id.clone(),
 								                    addresses: provider_peer.multiaddrs.clone(),
 								                    ty: provider_peer.connection_ty,
 								                }));
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                self.add_provider.push((key, provider_peer.node_id));
 								                return;
 								            }
 								        };
 								    }
 								    fn poll(
 								        &mut self,
-												Address edition-2018 idioms. (#929)


											
										
										
											2019-02-11 14:58:15 +01:00
+								        parameters: &mut PollParameters<'_>,
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    ) -> Async<
 								        NetworkBehaviourAction<
 								            <Self::ProtocolsHandler as ProtocolsHandler>::InEvent,
 								            Self::OutEvent,
 								        >,
 								    > {
 								        // Flush the changes to the topology that we want to make.
 								        for (key, provider) in self.add_provider.drain() {
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								            // Don't add ourselves to the providers.
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								            if provider == *self.kbuckets.local_key().preimage() {
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								                continue;
 								            }
 								            let providers = self.values_providers.entry(key).or_insert_with(Default::default);
-												[Kademlia] Rehash PeerId before inserting in a KBucketsTable (#1025)

Add KadHash as the type to be used as key within KBuckets and replace PeerId.
											
										
										
											2019-03-26 16:17:34 +01:00
+								            if !providers.iter().any(|peer_id| peer_id == &provider) {
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								                providers.push(provider);
 								            }
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        }
 								        self.add_provider.shrink_to_fit();
 								        // Handle `refresh_add_providers`.
 								        match self.refresh_add_providers.poll() {
 								            Ok(Async::NotReady) => {},
 								            Ok(Async::Ready(Some(_))) => {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                for target in self.providing_keys.clone().into_iter() {
 								                    self.start_query(QueryInfoInner::AddProvider { target });
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                }
 								            },
 								            // Ignore errors.
 								            Ok(Async::Ready(None)) | Err(_) => {},
 								        }
 								        loop {
 								            // Handle events queued by other parts of this struct
 								            if !self.queued_events.is_empty() {
 								                return Async::Ready(self.queued_events.remove(0));
 								            }
 								            self.queued_events.shrink_to_fit();
 								            // If iterating finds a query that is finished, stores it here and stops looping.
 								            let mut finished_query = None;
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								            'queries_iter: for (&query_id, query) in self.active_queries.iter_mut() {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                loop {
 								                    match query.poll() {
 								                        Async::Ready(QueryStatePollOut::Finished) => {
 								                            finished_query = Some(query_id);
 								                            break 'queries_iter;
 								                        }
 								                        Async::Ready(QueryStatePollOut::SendRpc {
 								                            peer_id,
 								                            query_target,
 								                        }) => {
 								                            let rpc = query_target.to_rpc_request(query_id);
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                            if self.connected_peers.contains(peer_id) {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                                return Async::Ready(NetworkBehaviourAction::SendEvent {
 								                                    peer_id: peer_id.clone(),
 								                                    event: rpc,
 								                                });
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                            } else if peer_id != self.kbuckets.local_key().preimage() {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                                self.pending_rpcs.push((peer_id.clone(), rpc));
 								                                return Async::Ready(NetworkBehaviourAction::DialPeer {
 								                                    peer_id: peer_id.clone(),
 								                                });
 								                            }
 								                        }
 								                        Async::Ready(QueryStatePollOut::CancelRpc { peer_id }) => {
 								                            // We don't cancel if the RPC has already been sent out.
 								                            self.pending_rpcs.retain(|(id, _)| id != peer_id);
 								                        }
 								                        Async::NotReady => break,
 								                    }
 								                }
 								            }
 								            if let Some(finished_query) = finished_query {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                let (query_info, closer_peers) = self
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                    .active_queries
 								                    .remove(&finished_query)
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                    .expect("finished_query was gathered when iterating active_queries; QED.")
 								                    .into_target_and_closest_peers();
 								                match query_info.inner {
 								                    QueryInfoInner::Initialization { .. } => {},
 								                    QueryInfoInner::FindPeer(target) => {
 								                        let event = KademliaOut::FindNodeResult {
 								                            key: target,
 								                            closer_peers: closer_peers.collect(),
 								                        };
 								                        break Async::Ready(NetworkBehaviourAction::GenerateEvent(event));
 								                    },
 								                    QueryInfoInner::GetProviders { target, pending_results } => {
 								                        let event = KademliaOut::GetProvidersResult {
 								                            key: target,
 								                            closer_peers: closer_peers.collect(),
 								                            provider_peers: pending_results,
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                        };
 								                        break Async::Ready(NetworkBehaviourAction::GenerateEvent(event));
 								                    },
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                    QueryInfoInner::AddProvider { target } => {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                        let local_key = kbucket::Key::new(parameters.local_peer_id().clone());
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                        for closest in closer_peers {
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                            let event = NetworkBehaviourAction::SendEvent {
 								                                peer_id: closest,
 								                                event: KademliaHandlerIn::AddProvider {
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								                                    key: target.clone(),
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								                                    provider_peer: build_kad_peer(&local_key, &mut self.kbuckets),
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								                                },
 								                            };
 								                            self.queued_events.push(event);
 								                        }
 								                    },
 								                }
 								            } else {
 								                break Async::NotReady;
 								            }
 								        }
 								    }
 								}
 								/// Output event of the `Kademlia` behaviour.
 								///
 								/// `FindNodeResult` and `GetProvidersResult` are generated once the corresponding
 								/// iterative query (`QueryInfoInner::FindPeer` / `QueryInfoInner::GetProviders`)
 								/// has finished.
 								#[derive(Debug, Clone)]
 								pub enum KademliaOut {
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								    /// We have discovered a node.
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								    ///
 								    /// > **Note**: The Kademlia behaviour doesn't store the addresses of this node, and therefore
 								    /// >           attempting to connect to this node may or may not work.
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								    Discovered {
 								        /// Id of the node that was discovered.
 								        peer_id: PeerId,
 								        /// Addresses of the node.
 								        addresses: Vec<Multiaddr>,
 								        /// How the peer that reported this node is connected to it.
 								        ty: KadConnectionType,
 								    },
-												Rewrite the Kademlia k-buckets to be more explicit (#996)

* Some k-buckets improvements

* Apply suggestions from code review

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Use NonZeroUsize for the distance

* Update TODO comment

											
										
										
											2019-03-20 17:09:48 +01:00
+								    /// A node has been added to a k-bucket.
 								    KBucketAdded {
 								        /// Id of the node that was added.
 								        peer_id: PeerId,
 								        /// If `Some`, the node that this addition replaced.
 								        replaced: Option<PeerId>,
 								    },
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    /// Result of a `FIND_NODE` iterative query.
 								    FindNodeResult {
 								        /// The key that we looked for in the query.
 								        key: PeerId,
 								        /// List of peers ordered from closest to furthest away.
 								        closer_peers: Vec<PeerId>,
 								    },
 								    /// Result of a `GET_PROVIDERS` iterative query.
 								    GetProvidersResult {
 								        /// The key that we looked for in the query.
 								        key: Multihash,
 								        /// The peers that are providing the requested key.
 								        provider_peers: Vec<PeerId>,
 								        /// List of peers ordered from closest to furthest away.
 								        closer_peers: Vec<PeerId>,
 								    },
 								}
 								/// Builds a `KadPeer` struct corresponding to the given `PeerId`.
-												Some Kademlia improvements (#994)

* Move QueryTarget to the behaviour

* Rework query system

* Add a few tests

* Add some Kademlia tests

* More tests

* Don't return self entry

* Fix tests

											
										
										
											2019-03-18 18:20:57 +01:00
+								/// The `PeerId` cannot be the same as the local one (see "Panics" below).
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								///
 								/// > **Note**: This is just a convenience function that doesn't do anything noteworthy.
 								///
 								/// The addresses and connection type are taken from the entry that `kbuckets` holds
 								/// for `key`; the returned `node_id` is a clone of `key.preimage()`.
 								///
 								/// # Panics
 								///
 								/// Panics if `kbuckets.entry(key)` yields `kbucket::Entry::SelfEntry`.
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								fn build_kad_peer(
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								    key: &kbucket::Key<PeerId>,
 								    kbuckets: &mut KBucketsTable<PeerId, Addresses>
-												Embed the topology in the NetworkBehaviour  (#889)

* Embed the topology in the NetworkBehaviour

* Put topologies inside of Floodsub and Kad

* Fix core tests

* Fix chat example

* More work

* Some cleanup

* Restore external addresses system

											
										
										
											2019-01-26 23:57:53 +01:00
+								) -> KadPeer {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
 								    // Derive the address list and connection type from the k-bucket entry for `key`.
+								    let (multiaddrs, connection_ty) = match kbuckets.entry(key) {
-												Simplify the Addresses (#1012)

* Simplify the Addresses

* Remove println

											
										
										
											2019-03-20 17:30:00 +01:00
 								        // A peer without an entry is reported with no addresses and as not connected.
+								        kbucket::Entry::NotInKbucket(_) => (Vec::new(), KadConnectionType::NotConnected),       // TODO: pending connection?
 								        // For peers with an entry, the stored addresses are cloned. The `...Pending`
 								        // variants are mapped to the same connection type as their non-pending counterparts.
 								        kbucket::Entry::InKbucketConnected(mut entry) => (entry.value().iter().cloned().collect(), KadConnectionType::Connected),
 								        kbucket::Entry::InKbucketDisconnected(mut entry) => (entry.value().iter().cloned().collect(), KadConnectionType::NotConnected),
 								        kbucket::Entry::InKbucketConnectedPending(mut entry) => (entry.value().iter().cloned().collect(), KadConnectionType::Connected),
 								        kbucket::Entry::InKbucketDisconnectedPending(mut entry) => (entry.value().iter().cloned().collect(), KadConnectionType::NotConnected),
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
 								        // NOTE(review): the `QueryInfoInner::AddProvider` handling earlier in this file calls
 								        // this function with a key built from `parameters.local_peer_id()`. Presumably
 								        // `entry` returns `SelfEntry` for that key, in which case this arm panics — confirm.
+								        kbucket::Entry::SelfEntry => panic!("build_kad_peer expects not to be called with the kbucket::Key of the local ID"),
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								    };
 								    KadPeer {
-												Improve XOR metric. (#1108)

There are two issues with the current definition and use of Kademlia's
XOR metric:

  1. The distance is currently equated with the bucket index, i.e.
     `distance(a,b) - 1` is the index of the bucket into which either
     peer is put by the other. The result is a metric that is not
     unidirectional, as defined in the Kademlia paper and as implemented
     in e.g. libp2p-go and libp2p-js, which is to interpret the result
     of the XOR as an integer in its entirety.

  2. The current `KBucketsPeerId` trait and its instances allow computing
     distances between types with differing bit lengths as well as between
     types that hash all inputs again (i.e. `KadHash`) and "plain" `PeerId`s
     or `Multihash`es. This can result in computed distances that are either
     incorrect as per the requirement of the libp2p specs that all distances
     are to be computed from the XOR of the SHA256 of the input keys, or
     even fall outside of the image of the metric used for the `KBucketsTable`.
     In the latter case, such distances are not currently used as a bucket index
     - they can only occur in the context of comparing distances for the purpose
     of sorting peers - but that still seems undesirable.

These issues are addressed here as follows:

  * Unidirectionality of the XOR metric is restored by keeping the "full"
    integer representation of the bitwise XOR. The result is an XOR metric
    as defined in the paper. This also opens the door to avoiding the
    "full table scan" when searching for the keys closest to a given key -
    the ideal order in which to visit the buckets can be computed with the
    help of the distance bit string.

  * As a simplification and to make it easy to "do the right thing", the
    XOR metric is only defined on an opaque `kbucket::Key` type, partially
    derived from the current `KadHash`. `KadHash` and `KBucketsPeerId`
    are removed.
											
										
										
											2019-05-17 17:27:57 +02:00
+								        node_id: key.preimage().clone(),
-												Add a KademliaHandler (#580)

* Rework Kademlia for the new design

* Minor work on protocol.rs

* More work

* Remove QueryTarget::FindValue

* Finish work on query

* Query timeout test

* Work on topology

* More work

* Update protocols/kad/src/topology.rs

Co-Authored-By: tomaka <pierre.krieger1708@gmail.com>

* Fix trailing whitespaces

* Use if let

											
										
										
											2018-11-29 12:11:35 +01:00
+								        multiaddrs,
 								        connection_ty,
 								    }
 								}