zolfa
/
tendermint


								package p2p


								import (

									"context"

									"errors"

									"fmt"

									"io"

									"math"

									"math/rand"

									"net"

									"net/url"

									"runtime/debug"

									"sort"

									"strconv"

									"sync"

									"time"


									"github.com/tendermint/tendermint/libs/cmap"

									"github.com/tendermint/tendermint/libs/log"

									"github.com/tendermint/tendermint/libs/service"

									tmconn "github.com/tendermint/tendermint/p2p/conn"

								)


								// PeerAddress is a peer address URL. It embeds *url.URL, so the URL's fields
								// and methods (Scheme, User, Host, Hostname(), Port(), ...) are promoted and
								// can be used directly on a PeerAddress.
								//
								// NOTE: The zero value holds a nil *url.URL; accessing promoted fields or
								// methods that dereference it on a zero PeerAddress will panic.
								type PeerAddress struct {
									*url.URL
								}


								// ParsePeerAddress parses a peer address URL into a PeerAddress.
								//
								// If the address has no scheme, the default protocol is used. Scheme-less
								// addresses of the form "id@host:port" are rejected by url.Parse ("first path
								// segment in URL cannot contain colon"), and "id@host" is parsed as a bare
								// path without user info. In both cases the address is re-parsed with the
								// default protocol prepended, and that result is used if it carries user info
								// (i.e. a node ID). Otherwise the outcome of the initial parse stands.
								//
								// It returns an error if the address cannot be parsed or fails Validate().
								func ParsePeerAddress(address string) (PeerAddress, error) {
									u, err := url.Parse(address)
									if err != nil || u == nil || (u.Scheme == "" && u.User == nil) {
										// Retry as a scheme-less address. Only adopt the retry when it
										// produced a node ID, so that genuinely malformed addresses keep
										// reporting the original parse error.
										retry, retryErr := url.Parse(string(defaultProtocol) + "://" + address)
										if retryErr == nil && retry != nil && retry.User != nil {
											u, err = retry, nil
										}
									}
									if err != nil {
										return PeerAddress{}, fmt.Errorf("unable to parse peer address %q: %w", address, err)
									}
									if u == nil {
										// Defensive: never wrap a nil error with %w.
										return PeerAddress{}, fmt.Errorf("unable to parse peer address %q", address)
									}
									if u.Scheme == "" {
										u.Scheme = string(defaultProtocol)
									}
									pa := PeerAddress{URL: u}
									if err = pa.Validate(); err != nil {
										return PeerAddress{}, err
									}
									return pa, nil
								}


								// NodeID returns the node ID of the address, which is carried in the
								// username part of the URL's user info.
								func (a PeerAddress) NodeID() NodeID {
									username := a.User.Username()
									return NodeID(username)
								}


								// Resolve resolves a PeerAddress into a set of Endpoints, by expanding
								// out a DNS name in Host to its IP addresses. Field mapping:
								//
								//   Scheme → Endpoint.Protocol
								//   Host   → Endpoint.IP
								//   User   → Endpoint.PeerID
								//   Port   → Endpoint.Port
								//   Path+Query+Fragment,Opaque → Endpoint.Path
								//
								// The lookup uses the bare hostname (without port or IPv6 brackets). If the
								// address has no hostname at all (which Validate permits for path-style
								// addresses), no lookup is performed and a single Endpoint without an IP is
								// returned. Errors from the resolver or from port parsing are returned as-is.
								func (a PeerAddress) Resolve(ctx context.Context) ([]Endpoint, error) {
									// a.Host may include a ":port" suffix, which is not a resolvable
									// name, so we must look up Hostname() instead.
									host := a.Hostname()
									var ips []net.IP
									if host != "" {
										var err error
										ips, err = net.DefaultResolver.LookupIP(ctx, "ip", host)
										if err != nil {
											return nil, err
										}
									}
									port, err := a.parsePort()
									if err != nil {
										return nil, err
									}

									path := a.Path
									if a.RawPath != "" {
										path = a.RawPath
									}
									if a.Opaque != "" { // used for e.g. "about:blank" style URLs
										path = a.Opaque
									}
									if a.RawQuery != "" {
										path += "?" + a.RawQuery
									}
									if a.RawFragment != "" {
										path += "#" + a.RawFragment
									}

									if host == "" {
										// Nothing to resolve: the endpoint is identified by its path only.
										return []Endpoint{{
											PeerID:   a.NodeID(),
											Protocol: Protocol(a.Scheme),
											Port:     port,
											Path:     path,
										}}, nil
									}

									endpoints := make([]Endpoint, len(ips))
									for i, ip := range ips {
										endpoints[i] = Endpoint{
											PeerID:   a.NodeID(),
											Protocol: Protocol(a.Scheme),
											IP:       ip,
											Port:     port,
											Path:     path,
										}
									}
									return endpoints, nil
								}


								// Validate validates a PeerAddress. It returns an error if:
								//
								//   - the address is the zero value (no underlying URL),
								//   - the scheme (protocol) is empty,
								//   - the peer ID (URL username) is empty or fails NodeID validation,
								//   - neither a hostname, a query, nor an opaque part is given,
								//   - the port is not a valid 16-bit number, or is given without a host.
								func (a PeerAddress) Validate() error {
									// Guard against the zero value: promoted field access on a nil
									// *url.URL would otherwise panic.
									if a.URL == nil {
										return errors.New("no address")
									}
									if a.Scheme == "" {
										return errors.New("no protocol")
									}
									id := a.User.Username()
									if id == "" {
										return errors.New("no peer ID")
									}
									if err := NodeID(id).Validate(); err != nil {
										return fmt.Errorf("invalid peer ID: %w", err)
									}
									if a.Hostname() == "" && len(a.Query()) == 0 && a.Opaque == "" {
										return errors.New("no host or path given")
									}
									port, err := a.parsePort()
									if err != nil {
										return err
									}
									if port > 0 && a.Hostname() == "" {
										return errors.New("cannot specify port without host")
									}
									return nil
								}


								// parsePort extracts the URL port as a uint16. An address without a port
								// yields 0 and no error; a port that is not a valid base-10 16-bit unsigned
								// number yields an error.
								func (a PeerAddress) parsePort() (uint16, error) {
									raw := a.Port()
									if raw == "" {
										return 0, nil
									}
									parsed, err := strconv.ParseUint(raw, 10, 16)
									if err != nil {
										return 0, fmt.Errorf("invalid port %q: %w", raw, err)
									}
									return uint16(parsed), nil
								}


								// PeerStatus describes the lifecycle status of a peer, as reported in peer
								// updates.
								type PeerStatus string

								// The known peer statuses.
								const (
									// PeerStatusNew is a new peer which we haven't tried to contact yet.
									PeerStatusNew PeerStatus = "new"
									// PeerStatusUp is a peer which we have an active connection to.
									PeerStatusUp PeerStatus = "up"
									// PeerStatusDown is a peer which we're temporarily disconnected from.
									PeerStatusDown PeerStatus = "down"
									// PeerStatusRemoved is a peer which has been removed.
									PeerStatusRemoved PeerStatus = "removed"
									// PeerStatusBanned is a peer which is banned for misbehavior.
									PeerStatusBanned PeerStatus = "banned"
								)


								// PeerError is a peer error reported by a reactor via the Error channel. The
								// severity may cause the peer to be disconnected or banned depending on policy.
								type PeerError struct {
									// PeerID identifies the peer the error is reported for.
									PeerID NodeID
									// Err is the underlying error.
									Err error
									// Severity classifies the error; see the PeerErrorSeverity constants.
									Severity PeerErrorSeverity
								}


								// PeerErrorSeverity classifies how severe a reported peer error is.
								type PeerErrorSeverity string

								// The known peer error severities.
								const (
									// PeerErrorSeverityLow errors are mostly ignored.
									PeerErrorSeverityLow = PeerErrorSeverity("low")
									// PeerErrorSeverityHigh errors may cause a disconnect.
									PeerErrorSeverityHigh = PeerErrorSeverity("high")
									// PeerErrorSeverityCritical errors cause a ban.
									PeerErrorSeverityCritical = PeerErrorSeverity("critical")
								)


								// PeerUpdatesCh defines a wrapper around a PeerUpdate go channel that allows
								// a reactor to listen for peer updates and safely close it when stopping.
								type PeerUpdatesCh struct {
									// closeOnce ensures doneCh is closed at most once, so Close may be
									// called repeatedly.
									closeOnce sync.Once

									// updatesCh defines the go channel in which the router sends peer updates to
									// reactors. Each reactor will have its own PeerUpdatesCh to listen for updates
									// from.
									updatesCh chan PeerUpdate

									// doneCh is used to signal that a PeerUpdatesCh is closed. It is the
									// reactor's responsibility to invoke Close.
									doneCh chan struct{}
								}


								// NewPeerUpdates wraps the given updates channel in a new PeerUpdatesCh with a
								// freshly allocated done channel, and returns a pointer to it.
								func NewPeerUpdates(updatesCh chan PeerUpdate) *PeerUpdatesCh {
									wrapper := new(PeerUpdatesCh)
									wrapper.updatesCh = updatesCh
									wrapper.doneCh = make(chan struct{})
									return wrapper
								}


								// Updates exposes the internal updates channel as receive-only, so that a
								// consuming reactor can listen for peer updates sent from the router.
								func (puc *PeerUpdatesCh) Updates() <-chan PeerUpdate {
									var updates <-chan PeerUpdate = puc.updatesCh
									return updates
								}


								// Close marks the PeerUpdatesCh as closed by closing its done channel. It is
								// meant to be called only by the owning reactor when it stops, once nothing is
								// listening for updates anymore. Repeated calls are no-ops.
								//
								// NOTE: Once a PeerUpdatesCh is closed the router may safely assume it can no
								// longer send on the internal updatesCh. The router should however NEVER close
								// updatesCh itself, since that could cause panics from sending on a closed
								// channel.
								func (puc *PeerUpdatesCh) Close() {
									signalDone := func() {
										close(puc.doneCh)
									}
									puc.closeOnce.Do(signalDone)
								}


								// Done exposes the internal done channel as receive-only. The channel is
								// closed by Close, which tells the router that it should no longer send any
								// peer updates to this PeerUpdatesCh.
								func (puc *PeerUpdatesCh) Done() <-chan struct{} {
									var done <-chan struct{} = puc.doneCh
									return done
								}


								// PeerUpdate is a peer status update for reactors.
								type PeerUpdate struct {
									// PeerID identifies the peer whose status changed.
									PeerID NodeID
									// Status is the peer's new status.
									Status PeerStatus
								}


								// PeerScore is a numeric peer score, where a higher score is better.
								type PeerScore uint16

								// PeerScorePersistent is the score added for persistent peers.
								const PeerScorePersistent PeerScore = 100


								// PeerManager manages peer lifecycle information, using a peerStore for
								// underlying storage. Its primary purpose is to determine which peers to
								// connect to next, make sure a peer only has a single active connection (either
								// inbound or outbound), and evict peers to make room for higher-scored peers.
								// It does not manage actual connections (this is handled by the Router),
								// only the peer lifecycle state.
								//
								// We track dialing and connected states independently. This allows us to accept
								// an inbound connection from a peer while the router is also dialing an
								// outbound connection to that same peer, which will cause the dialer to
								// eventually error when attempting to mark the peer as connected. This also
								// avoids race conditions where multiple goroutines may end up dialing a peer if
								// an incoming connection was briefly accepted and disconnected while we were
								// also dialing.
								//
								// For an outbound connection, the flow is as follows:
								// - DialNext: returns a peer address to dial, marking the peer as dialing.
								// - DialFailed: reports a dial failure, unmarking the peer as dialing.
								// - Dialed: successfully dialed, unmarking as dialing and marking as connected
								//   (or erroring if already connected).
								// - Ready: routing is up, broadcasts a PeerStatusUp peer update to subscribers.
								// - Disconnected: peer disconnects, unmarking as connected and broadcasts a
								//   PeerStatusDown peer update.
								//
								// For an inbound connection, the flow is as follows:
								// - Accepted: successfully accepted connection, marking as connected (or erroring
								//   if already connected).
								// - Ready: routing is up, broadcasts a PeerStatusUp peer update to subscribers.
								// - Disconnected: peer disconnects, unmarking as connected and broadcasts a
								//   PeerStatusDown peer update.
								//
								// If we are connected to too many peers (more than MaxConnected), typically
								// because we have upgraded to higher-scored peers and need to shed lower-scored
								// ones, the flow is as follows:
								// - EvictNext: returns a peer ID to evict, marking peer as evicting.
								// - Disconnected: peer was disconnected, unmarking as connected and evicting,
								//   and broadcasts a PeerStatusDown peer update.
								//
								// If all connection slots are full (at MaxConnected), we can use up to
								// MaxConnectedUpgrade additional connections to probe any higher-scored
								// unconnected peers, and if we reach them (or they reach us) we allow the
								// connection and evict lower-scored peers. We mark the lower-scored peer as
								// upgrading[from]=to to make sure no other higher-scored peers can claim the
								// same one for an upgrade. The flow is as follows:
								// - Accepted: if upgrade is possible, mark upgrading[from]=to and connected.
								// - DialNext: if upgrade is possible, mark upgrading[from]=to and dialing.
								// - DialFailed: unmark upgrading[from]=to and dialing.
								// - Dialed: unmark dialing, mark as connected.
								// - EvictNext: unmark upgrading[from]=to, then if over MaxConnected
								//   either the upgraded peer or an even lower-scored one (if found)
								//   is marked as evicting and returned.
								// - Disconnected: unmark connected and evicting, also upgrading[from]=to
								//   both from and to (in case either disconnected before eviction).
								type PeerManager struct {
									options     PeerManagerOptions
									wakeDialCh  chan struct{} // wakes up DialNext() on relevant peer changes
									wakeEvictCh chan struct{} // wakes up EvictNext() on relevant peer changes
									closeCh     chan struct{} // signal channel for Close()
									closeOnce   sync.Once     // ensures closeCh is closed only once

									// mtx guards the store and all of the state maps below.
									mtx           sync.Mutex
									store         *peerStore
									dialing       map[NodeID]bool                   // peers being dialed (DialNext -> Dialed/DialFailed)
									connected     map[NodeID]bool                   // connected peers (Dialed/Accepted -> Disconnected)
									upgrading     map[NodeID]NodeID                 // peers claimed for upgrading (key is lower-scored peer)
									evicting      map[NodeID]bool                   // peers being evicted (EvictNext -> Disconnected)
									subscriptions map[*PeerUpdatesCh]*PeerUpdatesCh // keyed by struct identity (address)
								}


								// PeerManagerOptions specifies options for a PeerManager.
								type PeerManagerOptions struct {
									// PersistentPeers are peers that we want to maintain persistent connections
									// to. These will be scored higher than other peers, and if
									// MaxConnectedUpgrade is non-zero any lower-scored peers will be evicted if
									// necessary to make room for these.
									PersistentPeers []NodeID

									// MaxConnected is the maximum number of connected peers (inbound and
									// outbound). 0 means no limit.
									MaxConnected uint16

									// MaxConnectedUpgrade is the maximum number of additional connections to
									// use for probing any better-scored peers to upgrade to when all connection
									// slots are full. 0 disables peer upgrading.
									//
									// For example, if we are already connected to MaxConnected peers, but we
									// know or learn about better-scored peers (e.g. configured persistent
									// peers) that we are not connected to, then we can probe these peers by
									// using up to MaxConnectedUpgrade connections, and once connected evict the
									// lowest-scored connected peers. This also works for inbound connections,
									// i.e. if a higher-scored peer attempts to connect to us, we can accept
									// the connection and evict a lower-scored peer.
									MaxConnectedUpgrade uint16

									// MinRetryTime is the minimum time to wait between retries. Retry times
									// double for each retry, up to MaxRetryTime. 0 disables retries.
									MinRetryTime time.Duration

									// MaxRetryTime is the maximum time to wait between retries. 0 means
									// no maximum, in which case the retry time will keep doubling.
									MaxRetryTime time.Duration

									// MaxRetryTimePersistent is the maximum time to wait between retries for
									// peers listed in PersistentPeers. 0 uses MaxRetryTime instead.
									MaxRetryTimePersistent time.Duration

									// RetryTimeJitter is the upper bound of a random interval added to
									// retry times, to avoid thundering herds. 0 disables jitter.
									RetryTimeJitter time.Duration
								}


								// isPersistent reports whether the given peer ID is listed in
								// PersistentPeers. The list is scanned linearly, since it is expected to be
								// small.
								func (o PeerManagerOptions) isPersistent(id NodeID) bool {
									for i := range o.PersistentPeers {
										if o.PersistentPeers[i] == id {
											return true
										}
									}
									return false
								}


								// NewPeerManager creates a new peer manager with the given options, an empty
								// peer store and empty lifecycle state.
								func NewPeerManager(options PeerManagerOptions) *PeerManager {
									manager := new(PeerManager)
									manager.options = options
									manager.closeCh = make(chan struct{})

									// The wake-up channels are buffered with size 1 and are only ever sent
									// to without blocking. That way, if e.g. wakeDial() fires several times
									// before the pending trigger has been consumed, the trigger is still
									// processed just once.
									//
									// FIXME: This should maybe be a libs/sync type.
									manager.wakeDialCh = make(chan struct{}, 1)
									manager.wakeEvictCh = make(chan struct{}, 1)

									// FIXME: Once the store persists data, we need to update existing
									// peers in the store with any new information, e.g. changes to
									// PersistentPeers configuration.
									manager.store = newPeerStore()

									manager.dialing = make(map[NodeID]bool)
									manager.connected = make(map[NodeID]bool)
									manager.upgrading = make(map[NodeID]NodeID)
									manager.evicting = make(map[NodeID]bool)
									manager.subscriptions = make(map[*PeerUpdatesCh]*PeerUpdatesCh)
									return manager
								}


								// Close shuts down the peer manager by closing its close channel, which
								// releases resources tied to it (specifically any running goroutines).
								// Repeated calls are no-ops.
								func (m *PeerManager) Close() {
									shutdown := func() {
										close(m.closeCh)
									}
									m.closeOnce.Do(shutdown)
								}


								// Add registers a peer with the manager, identified by the given address. If
								// the peer is already known, the address is added to the existing peer. On
								// success, DialNext() is woken up since a new dial candidate may exist.
								//
								// It returns an error if the address is invalid or the peer store fails.
								func (m *PeerManager) Add(address PeerAddress) error {
									if err := address.Validate(); err != nil {
										return err
									}
									nodeID := address.NodeID()

									m.mtx.Lock()
									defer m.mtx.Unlock()

									info, err := m.store.Get(nodeID)
									switch {
									case err != nil:
										return err
									case info == nil:
										// First time we see this peer: start a fresh record.
										info = &peerInfo{
											ID:         nodeID,
											Persistent: m.options.isPersistent(nodeID),
										}
									}
									info.AddAddress(address)
									if err := m.store.Set(info); err != nil {
										return err
									}
									m.wakeDial()
									return nil
								}


								// Subscribe subscribes to peer updates. The caller must consume the peer
								// updates in a timely fashion and close the subscription when done, since
								// delivery is guaranteed and will block peer connection/disconnection
								// otherwise.
								//
								// A background goroutine removes the subscription from the manager once the
								// returned PeerUpdatesCh is closed. The goroutine also exits when the manager
								// itself is closed, so that it does not leak if the subscriber never closes
								// its subscription.
								func (m *PeerManager) Subscribe() *PeerUpdatesCh {
									// FIXME: We may want to use a size 1 buffer here. When the router
									// broadcasts a peer update it has to loop over all of the
									// subscriptions, and we want to avoid blocking and waiting for a
									// context switch before continuing to the next subscription. This also
									// prevents tail latencies from compounding across updates. We also want
									// to make sure the subscribers are reasonably in sync, so it should be
									// kept at 1. However, this should be benchmarked first.
									peerUpdates := NewPeerUpdates(make(chan PeerUpdate))
									m.mtx.Lock()
									m.subscriptions[peerUpdates] = peerUpdates
									m.mtx.Unlock()

									go func() {
										select {
										case <-peerUpdates.Done():
											m.mtx.Lock()
											delete(m.subscriptions, peerUpdates)
											m.mtx.Unlock()
										case <-m.closeCh:
											// The manager was closed: stop waiting, per the
											// contract of PeerManager.Close().
										}
									}()
									return peerUpdates
								}


								// broadcast delivers a peer update to every subscription, skipping
								// subscriptions that have been closed. The caller must already hold the
								// mutex lock; it is thus held for the entire broadcast, which ensures that
								// all subscriptions receive all updates in the same order.
								//
								// FIXME: Consider using more fine-grained mutexes here, and/or a channel to
								// enforce ordering of updates.
								func (m *PeerManager) broadcast(peerUpdate PeerUpdate) {
									for _, subscription := range m.subscriptions {
										select {
										case <-subscription.doneCh:
											// Subscription was closed, nothing to deliver.
										case subscription.updatesCh <- peerUpdate:
											// Delivered.
										}
									}
								}


								// DialNext returns the next peer address that should be dialed, marking the
								// peer as dialing. When no peer is eligible, or all connection slots are
								// taken, it blocks until woken up to try again. The caller must report the
								// outcome for the returned peer via Dialed() or DialFailed(). Cancelling the
								// context aborts the call with the context's error.
								func (m *PeerManager) DialNext(ctx context.Context) (NodeID, PeerAddress, error) {
									for {
										peerID, peerAddress, err := m.TryDialNext()
										switch {
										case err != nil, peerID != "":
											return peerID, peerAddress, err
										}

										// Nothing to dial right now: wait for a wake-up or cancellation.
										select {
										case <-ctx.Done():
											return "", PeerAddress{}, ctx.Err()
										case <-m.wakeDialCh:
										}
									}
								}


								// TryDialNext is equivalent to DialNext(), but immediately returns an empty
								// peer ID if no peers or connection slots are available.
								//
								// On success the returned peer is marked as dialing, and, if the dial is an
								// upgrade attempt, a lower-scored connected peer is marked as upgrading to it.
								// An error is only returned if the peer store fails to rank peers.
								func (m *PeerManager) TryDialNext() (NodeID, PeerAddress, error) {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									// We allow dialing MaxConnected+MaxConnectedUpgrade peers. Including
									// MaxConnectedUpgrade allows us to probe additional peers that have a
									// higher score than a connected peer, and if successful evict the
									// lower-scored peer via EvictNext().
									if m.options.MaxConnected > 0 &&
										len(m.connected)+len(m.dialing) >= int(m.options.MaxConnected)+int(m.options.MaxConnectedUpgrade) {
										return "", PeerAddress{}, nil
									}

									ranked, err := m.store.Ranked()
									if err != nil {
										return "", PeerAddress{}, err
									}
									for _, peer := range ranked {
										// Skip peers we are already dialing or connected to.
										if m.dialing[peer.ID] || m.connected[peer.ID] {
											continue
										}

										for _, addressInfo := range peer.AddressInfo {
											// Skip addresses that are still within their retry backoff
											// window after a failed dial.
											if time.Since(addressInfo.LastDialFailure) < m.retryDelay(peer, addressInfo.DialFailures) {
												continue
											}

											// At this point we have an eligible address to dial. If we're full
											// but have peer upgrade capacity (as checked above), we need to
											// make sure there exists an evictable peer of a lower score that we
											// can replace. If so, we mark the lower-scored peer as upgrading so
											// no one else can claim it, and EvictNext() will evict it later.
											//
											// If we don't find one, there is no point in trying additional
											// peers, since they will all have the same or lower score than this
											// peer (since they're ordered by score via peerStore.Ranked).
											if m.options.MaxConnected > 0 && len(m.connected) >= int(m.options.MaxConnected) {
												upgradePeer := m.findUpgradeCandidate(peer, ranked)
												if upgradePeer == "" {
													return "", PeerAddress{}, nil
												}
												m.upgrading[upgradePeer] = peer.ID
											}

											m.dialing[peer.ID] = true
											return peer.ID, addressInfo.Address, nil
										}
									}
									// No eligible peer address was found.
									return "", PeerAddress{}, nil
								}


								// wakeDial signals DialNext that something changed which *may* have made new
								// peers eligible for dialing, e.g. a peer disconnection or an elapsed retry
								// timeout. It never blocks.
								func (m *PeerManager) wakeDial() {
									var trigger struct{}
									select {
									case m.wakeDialCh <- trigger:
										// Trigger queued for the next DialNext() iteration.
									default:
										// The send would block, which with the 1-size buffer means a
										// trigger is already pending; dropping this one keeps at most 1
										// trigger queued between each DialNext().
									}
								}


								// wakeEvict signals EvictNext that something changed which *may* have made
								// peers eligible for eviction, e.g. a peer upgrade. It never blocks.
								func (m *PeerManager) wakeEvict() {
									var trigger struct{}
									select {
									case m.wakeEvictCh <- trigger:
										// Trigger queued for the next EvictNext() iteration.
									default:
										// The send would block, which with the 1-size buffer means a
										// trigger is already pending; dropping this one keeps at most 1
										// trigger queued between each EvictNext().
									}
								}


								// retryDelay calculates a dial retry delay using exponential backoff, based on
								// retry settings in PeerManagerOptions. If MinRetryTime is 0, this returns
								// MaxInt64 (i.e. an infinite retry delay, effectively disabling retries).
								//
								// The delay is MinRetryTime * 2^failures, capped at MaxRetryTime (or
								// MaxRetryTimePersistent for persistent peers, when set), plus a random jitter
								// in [0, RetryTimeJitter) when RetryTimeJitter is positive. Zero failures
								// always yield a zero delay. The computation saturates at MaxInt64 rather
								// than overflowing.
								func (m *PeerManager) retryDelay(peer *peerInfo, failures uint32) time.Duration {
									const maxDuration = time.Duration(math.MaxInt64)

									if failures == 0 {
										return 0
									}
									if m.options.MinRetryTime == 0 {
										return maxDuration
									}
									maxDelay := m.options.MaxRetryTime
									if peer.Persistent && m.options.MaxRetryTimePersistent > 0 {
										maxDelay = m.options.MaxRetryTimePersistent
									}

									// Compute MinRetryTime * 2^failures with integer arithmetic, saturating
									// at the maximum duration if the result would overflow int64 (which
									// would otherwise yield bogus, possibly negative, delays for peers
									// with many consecutive failures).
									delay := maxDuration
									if failures < 63 && m.options.MinRetryTime <= maxDuration>>failures {
										delay = m.options.MinRetryTime << failures
									}
									if maxDelay > 0 && delay > maxDelay {
										delay = maxDelay
									}

									// rand.Int63n panics for n <= 0, so jitter must only be applied when
									// it is enabled (0 disables jitter).
									//
									// FIXME: This should use a PeerManager-scoped RNG.
									if jitter := m.options.RetryTimeJitter; jitter > 0 {
										extra := time.Duration(rand.Int63n(int64(jitter))) // nolint:gosec
										if delay > maxDuration-extra {
											delay = maxDuration
										} else {
											delay += extra
										}
									}
									return delay
								}


								// DialFailed reports a failed dial attempt. This will make the peer available
								// for dialing again when appropriate.
								//
								// The peer is unmarked as dialing, any upgrade claims made on its behalf are
								// released, and the failure is recorded on the matching address (if the peer
								// and address are still in the store). An error is returned only if the peer
								// store fails.
								//
								// FIXME: This should probably delete or mark bad addresses/peers after some time.
								func (m *PeerManager) DialFailed(peerID NodeID, address PeerAddress) error {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									delete(m.dialing, peerID)
									for from, to := range m.upgrading {
										if to == peerID {
											// Unmark failed upgrade attempt.
											delete(m.upgrading, from)
										}
									}

									peer, err := m.store.Get(peerID)
									if err != nil || peer == nil { // Peer may have been removed while dialing, ignore.
										return err
									}
									addressInfo := peer.LookupAddressInfo(address)
									if addressInfo == nil {
										return nil // Assume the address has been removed, ignore.
									}
									// Record the failure, which drives the retry backoff in retryDelay().
									addressInfo.LastDialFailure = time.Now().UTC()
									addressInfo.DialFailures++
									if err = m.store.Set(peer); err != nil {
										return err
									}

									// We spawn a goroutine that notifies DialNext() again when the retry
									// timeout has elapsed, so that we can consider dialing it again.
									//
									// FIXME: We need to calculate the retry delay outside of the goroutine,
									// since the arguments are currently pointers to structs shared in the
									// peerStore. The peerStore should probably return struct copies instead,
									// to avoid these sorts of issues.
									//
									// A delay of MaxInt64 means retries are disabled, so no wake-up is
									// scheduled in that case.
									if retryDelay := m.retryDelay(peer, addressInfo.DialFailures); retryDelay != time.Duration(math.MaxInt64) {
										go func() {
											// Use an explicit timer with deferred cleanup instead of
											// time.After(), to avoid leaking goroutines on PeerManager.Close().
											timer := time.NewTimer(retryDelay)
											defer timer.Stop()
											select {
											case <-timer.C:
												m.wakeDial()
											case <-m.closeCh:
											}
										}()
									}

									// Wake DialNext() right away as well, since other peers or addresses
									// may be eligible for dialing now that this peer is no longer dialing.
									m.wakeDial()
									return nil
								}


								// Dialed records that a peer was successfully dialed: the peer is unmarked as
								// dialing and marked as connected. Any further incoming connections from it
								// will be rejected, and once disconnected the peer may be dialed again.
								//
								// It returns an error if the peer is already connected, if the maximum
								// number of connections (including upgrade slots) is reached, if the peer was
								// removed from the store while dialing, or if the peer store fails.
								func (m *PeerManager) Dialed(peerID NodeID, address PeerAddress) error {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									delete(m.dialing, peerID)

									hardLimit := int(m.options.MaxConnected) + int(m.options.MaxConnectedUpgrade)
									switch {
									case m.connected[peerID]:
										return fmt.Errorf("peer %v is already connected", peerID)
									case m.options.MaxConnected > 0 && len(m.connected) >= hardLimit:
										return fmt.Errorf("already connected to maximum number of peers")
									}

									peer, err := m.store.Get(peerID)
									switch {
									case err != nil:
										return err
									case peer == nil:
										return fmt.Errorf("peer %q was removed while dialing", peerID)
									}

									// Record the successful connection on the peer and, if the address is
									// still known, reset its failure tracking.
									connectedAt := time.Now().UTC()
									peer.LastConnected = connectedAt
									addressInfo := peer.LookupAddressInfo(address)
									if addressInfo != nil {
										addressInfo.DialFailures = 0
										addressInfo.LastDialSuccess = connectedAt
									}
									if err := m.store.Set(peer); err != nil {
										return err
									}

									m.connected[peerID] = true
									m.wakeEvict()
									return nil
								}


								// Accepted records that an incoming peer connection was successfully accepted,
								// marking the peer as connected. It returns an error if the peer is already
								// connected, if no additional connections are allowed, or if the peer store
								// fails.
								//
								// When all regular slots are taken but MaxConnectedUpgrade leaves room (i.e.
								// fewer than MaxConnected + MaxConnectedUpgrade connections), the connection
								// is still accepted if a lower-scored connected peer can be claimed as an
								// upgrade candidate; EvictNext() is then relied upon to evict lower-scored
								// peers.
								//
								// NOTE: We can't take an address here, since e.g. TCP uses a different port
								// number for outbound traffic than inbound traffic, so the peer's endpoint
								// wouldn't necessarily be an appropriate address to dial.
								func (m *PeerManager) Accepted(peerID NodeID) error {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									limited := m.options.MaxConnected > 0
									softLimit := int(m.options.MaxConnected)
									hardLimit := softLimit + int(m.options.MaxConnectedUpgrade)

									switch {
									case m.connected[peerID]:
										return fmt.Errorf("peer %q is already connected", peerID)
									case limited && len(m.connected) >= hardLimit:
										return fmt.Errorf("already connected to maximum number of peers")
									}

									peer, err := m.store.Get(peerID)
									if err != nil {
										return err
									}
									if peer == nil {
										// Unknown peer: start a fresh record for it.
										peer = &peerInfo{
											ID:         peerID,
											Persistent: m.options.isPersistent(peerID),
										}
									}

									// All regular slots are taken, but the check above established that
									// there is still upgrade capacity. Try to claim a lower-scored
									// evictable peer; if there is one we accept this connection anyway and
									// leave it to EvictNext() to evict a lower-scored peer.
									if limited && len(m.connected) >= softLimit {
										ranked, err := m.store.Ranked()
										if err != nil {
											return err
										}
										candidate := m.findUpgradeCandidate(peer, ranked)
										if candidate == "" {
											return fmt.Errorf("already connected to maximum number of peers")
										}
										m.upgrading[candidate] = peerID
									}

									peer.LastConnected = time.Now().UTC()
									if err := m.store.Set(peer); err != nil {
										return err
									}

									m.connected[peerID] = true
									m.wakeEvict()
									return nil
								}


								// Ready marks a peer as ready by broadcasting a PeerStatusUp update to
								// subscribers. Nothing happens unless the peer is already marked as
								// connected. This is kept separate from Dialed() and Accepted() so that the
								// router can set up its internal queues before reactors start sending
								// messages.
								func (m *PeerManager) Ready(peerID NodeID) {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									if !m.connected[peerID] {
										return
									}
									update := PeerUpdate{
										PeerID: peerID,
										Status: PeerStatusUp,
									}
									m.broadcast(update)
								}


								// Disconnected unmarks a peer as connected, allowing new connections to be
								// established. It also clears the peer's evicting and upgrading markers,
								// broadcasts a PeerStatusDown update, and wakes up DialNext(). It always
								// returns nil.
								func (m *PeerManager) Disconnected(peerID NodeID) error {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									// Drop every upgrade marker that involves this peer, in either role.
									// In particular, the peer we upgraded to may disconnect before
									// EvictNext() has gotten around to evicting the lower-scored peer,
									// which would otherwise leave a stale marker behind.
									for from, to := range m.upgrading {
										if from == peerID || to == peerID {
											delete(m.upgrading, from)
										}
									}
									delete(m.connected, peerID)
									delete(m.evicting, peerID)

									update := PeerUpdate{
										PeerID: peerID,
										Status: PeerStatusDown,
									}
									m.broadcast(update)
									m.wakeDial()
									return nil
								}


								// EvictNext returns the ID of the next peer to evict (i.e. disconnect). When
								// there is no evictable peer it blocks until woken up to try again, or until
								// the context is cancelled, in which case the context's error is returned.
								func (m *PeerManager) EvictNext(ctx context.Context) (NodeID, error) {
									for {
										peerID, err := m.TryEvictNext()
										switch {
										case err != nil, peerID != "":
											return peerID, err
										}

										// Nothing to evict right now: wait for a wake-up or cancellation.
										select {
										case <-ctx.Done():
											return "", ctx.Err()
										case <-m.wakeEvictCh:
										}
									}
								}


								// TryEvictNext is equivalent to EvictNext, but immediately returns an empty
								// node ID if no evictable peers are found.
								//
								// A returned peer is recorded in m.evicting before the call returns. Errors
								// from the peer store are returned unchanged together with an empty ID.
								func (m *PeerManager) TryEvictNext() (NodeID, error) {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									// We first prune the upgrade list. All connection slots were full when the
									// upgrades began, but we may have disconnected other peers in the meanwhile
									// and thus don't have to evict the upgraded peers after all.
									//
									// In m.upgrading, the key (from) is the peer being replaced and the value
									// (to) is the peer replacing it.
									for from, to := range m.upgrading {
										// Stop pruning when the upgrade slots are only for connections
										// exceeding MaxConnected.
										if m.options.MaxConnected == 0 ||
											len(m.upgrading) <= len(m.connected)-len(m.evicting)-int(m.options.MaxConnected) {
											break
										}
										// Only completed upgrades (the replacement is connected) are pruned.
										if m.connected[to] {
											delete(m.upgrading, from)
										}
									}

									// If we're at or below capacity, we don't need to evict anything. Peers
									// already marked as evicting are not counted, and a MaxConnected of 0
									// means nothing is ever evicted here.
									if m.options.MaxConnected == 0 ||
										len(m.connected)-len(m.evicting) <= int(m.options.MaxConnected) {
										return "", nil
									}

									ranked, err := m.store.Ranked()
									if err != nil {
										return "", err
									}

									// Look for any upgraded peers that we can evict.
									for from, to := range m.upgrading {
										if m.connected[to] {
											// The upgrade marker is consumed here, before the store lookup.
											delete(m.upgrading, from)
											// We may have connected to even lower-scored peers that we can
											// evict since we started upgrading this one, in which case we can
											// evict one of those.
											fromPeer, err := m.store.Get(from)
											if err != nil {
												return "", err
											} else if fromPeer == nil {
												// The replaced peer is unknown to the store; try the next marker.
												continue
											} else if evictPeer := m.findUpgradeCandidate(fromPeer, ranked); evictPeer != "" {
												m.evicting[evictPeer] = true
												return evictPeer, nil
											} else {
												m.evicting[from] = true
												return from, nil
											}
										}
									}

									// If we didn't find any upgraded peers to evict, we just pick a low-ranked one.
									// ranked is walked from the end, i.e. from the lowest-scored peer upwards.
									for i := len(ranked) - 1; i >= 0; i-- {
										peer := ranked[i]
										if m.connected[peer.ID] && !m.evicting[peer.ID] {
											m.evicting[peer.ID] = true
											return peer.ID, nil
										}
									}

									return "", nil
								}


								// findUpgradeCandidate searches for a connected peer with a strictly lower
								// score than the given peer that could be evicted to make room for it. It
								// returns an empty ID when there is no such peer. ranked must be sorted with
								// the best peers first. The caller must hold the mutex lock.
								func (m *PeerManager) findUpgradeCandidate(peer *peerInfo, ranked []*peerInfo) NodeID {
									// An existing upgrade claim for this peer takes precedence. Returning it
									// matters because a peer that we are concurrently dialing for an upgrade
									// may connect to us first, and that inbound connection should then be
									// accepted.
									for source, target := range m.upgrading {
										if target == peer.ID {
											return source
										}
									}

									// Walk the ranking from the worst peer towards the best one.
									for idx := len(ranked); idx > 0; idx-- {
										other := ranked[idx-1]
										if other.Score() >= peer.Score() {
											// The list is sorted, so no remaining peer can score lower.
											return ""
										}
										if !m.connected[other.ID] || m.evicting[other.ID] || m.upgrading[other.ID] != "" {
											continue
										}
										return other.ID
									}
									return ""
								}


								// GetHeight looks up the height stored for a peer via SetHeight. It returns 0
								// when the peer is not in the store, and 0 together with the error when the
								// store lookup fails.
								//
								// FIXME: This is a temporary workaround for the peer state stored via the
								// legacy Peer.Set() and Peer.Get() APIs, used to share height state between the
								// consensus and mempool reactors. These dependencies should be removed from the
								// reactors, and instead query this information independently via new P2P
								// protocol additions.
								func (m *PeerManager) GetHeight(peerID NodeID) (int64, error) {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									info, err := m.store.Get(peerID)
									switch {
									case err != nil:
										return 0, err
									case info == nil:
										return 0, nil
									default:
										return info.Height, nil
									}
								}


								// SetHeight records the height of a peer so that GetHeight can return it. A
								// peer that is not yet in the store is created, with its Persistent flag taken
								// from the manager options.
								//
								// FIXME: This is a temporary workaround for the peer state stored via the
								// legacy Peer.Set() and Peer.Get() APIs, used to share height state between the
								// consensus and mempool reactors. These dependencies should be removed from the
								// reactors, and instead query this information independently via new P2P
								// protocol additions.
								func (m *PeerManager) SetHeight(peerID NodeID, height int64) error {
									m.mtx.Lock()
									defer m.mtx.Unlock()

									info, err := m.store.Get(peerID)
									switch {
									case err != nil:
										return err
									case info == nil:
										// Unknown peer: start a fresh record for it.
										info = &peerInfo{
											ID:         peerID,
											Persistent: m.options.isPersistent(peerID),
										}
									}

									info.Height = height
									return m.store.Set(info)
								}


								// peerStore stores information about peers. It is currently a bare-bones
								// in-memory store, and will be fleshed out later.
								//
								// peerStore is not thread-safe, since it assumes it is only used by PeerManager
								// which handles concurrency control. This allows the manager to execute multiple
								// operations atomically while it holds the mutex.
								type peerStore struct {
									// peers holds peer records by value, keyed by node ID. Get and List hand
									// out pointers to copies, so changes must be written back with Set.
									peers map[NodeID]peerInfo
								}


								// newPeerStore returns an empty, ready-to-use peer store.
								func newPeerStore() *peerStore {
									store := new(peerStore)
									store.peers = make(map[NodeID]peerInfo)
									return store
								}


								// Get looks up a peer by ID. It returns a pointer to a copy of the stored
								// record, or nil if the peer is unknown. The error is always nil.
								func (s *peerStore) Get(id NodeID) (*peerInfo, error) {
									if info, found := s.peers[id]; found {
										return &info, nil
									}
									return nil, nil
								}


								// Set stores a copy of the given peer record under its ID, replacing any
								// existing record. It returns an error if peer is nil.
								func (s *peerStore) Set(peer *peerInfo) error {
									if peer != nil {
										s.peers[peer.ID] = *peer
										return nil
									}
									return errors.New("peer cannot be nil")
								}


								// List retrieves all peers, in no particular order. Each element points to
								// a copy of the stored record. The returned slice is never nil and the error
								// is always nil.
								func (s *peerStore) List() ([]*peerInfo, error) {
									// The final length is known up front, so size the slice once instead of
									// growing it repeatedly while appending.
									peers := make([]*peerInfo, 0, len(s.peers))
									for _, peer := range s.peers {
										// Copy the loop variable so that every element gets its own address
										// (required before Go 1.22).
										peer := peer
										peers = append(peers, &peer)
									}
									return peers, nil
								}


								// Ranked lists all peers sorted by descending score, i.e. with the best peers
								// first. The relative order of peers with equal scores is arbitrary.
								//
								// The ranking decides which peers to connect to and which peers to evict in
								// order to make room for better ones.
								//
								// FIXME: For now, we simply generate the list on every call, but this can get
								// expensive since it's called fairly frequently. We may want to either cache
								// this, or store peers in a data structure that maintains order (e.g. a heap or
								// ordered map).
								func (s *peerStore) Ranked() ([]*peerInfo, error) {
									ranked, err := s.List()
									if err != nil {
										return nil, err
									}

									// FIXME: If necessary, consider precomputing scores before sorting,
									// to reduce the number of Score() calls.
									higherFirst := func(a, b int) bool {
										return ranked[a].Score() > ranked[b].Score()
									}
									sort.Slice(ranked, higherFirst)
									return ranked, nil
								}


								// peerInfo contains peer information stored in a peerStore.
								type peerInfo struct {
									// ID identifies the peer and is the key it is stored under.
									ID            NodeID
									// AddressInfo lists the known addresses of the peer; see AddAddress.
									AddressInfo   []*addressInfo
									// Persistent adds PeerScorePersistent to the peer's Score().
									Persistent    bool
									// Height is the height recorded via PeerManager.SetHeight.
									Height        int64
									// LastConnected is a UTC timestamp set by the peer manager when the
									// peer is marked as connected.
									LastConnected time.Time
								}


								// AddAddress appends an address to the peer's address list if it is not
								// already present, and reports whether it was added. The address is not
								// validated.
								func (p *peerInfo) AddAddress(address PeerAddress) bool {
									if known := p.LookupAddressInfo(address); known != nil {
										return false
									}
									entry := &addressInfo{Address: address}
									p.AddressInfo = append(p.AddressInfo, entry)
									return true
								}


								// LookupAddressInfo finds the address info whose address has the same string
								// form as the given address. It returns nil if there is no such entry.
								func (p *peerInfo) LookupAddressInfo(address PeerAddress) *addressInfo {
									// A linear scan is good enough for now.
									want := address.String()
									for i := range p.AddressInfo {
										if candidate := p.AddressInfo[i]; candidate.Address.String() == want {
											return candidate
										}
									}
									return nil
								}


								// Score computes the peer's score; peers with higher scores are preferred
								// over peers with lower ones. Currently only the Persistent flag contributes.
								func (p *peerInfo) Score() PeerScore {
									var total PeerScore
									if !p.Persistent {
										return total
									}
									total += PeerScorePersistent
									return total
								}


								// addressInfo contains information and statistics about an address.
								type addressInfo struct {
									// Address is the peer address these statistics belong to.
									Address         PeerAddress
									// LastDialSuccess and LastDialFailure are presumably the times of the most
									// recent successful and failed dial of this address. NOTE(review): they
									// are not written in this part of the file; confirm against the dial code.
									LastDialSuccess time.Time
									LastDialFailure time.Time
									DialFailures    uint32 // since last successful dial
								}


								// ============================================================================

								// Types and business logic below may be deprecated.

								//

								// TODO: Rename once legacy p2p types are removed.

								// ref: https://github.com/tendermint/tendermint/issues/5670

								// ============================================================================


								//go:generate mockery --case underscore --name Peer


								// metricsTickerDuration is the period of the ticker that newPeer creates to
								// drive each peer's metricsReporter.
								const metricsTickerDuration = 10 * time.Second


								// Peer is an interface representing a peer connected on a reactor.
								type Peer interface {
									service.Service
									// FlushStop stops the peer like OnStop, but closes the connection with
									// a flush so that successfully queued sends are delivered first.
									FlushStop()

									ID() NodeID           // peer's cryptographic ID
									RemoteIP() net.IP     // remote IP of the connection
									RemoteAddr() net.Addr // remote address of the connection

									IsOutbound() bool   // did we dial the peer
									IsPersistent() bool // do we redial this peer when we disconnect

									CloseConn() error // close original connection

									NodeInfo() NodeInfo // peer's info
									// Status reports the status of the underlying connection.
									Status() tmconn.ConnectionStatus
									SocketAddr() *NetAddress // actual address of the socket

									// Send and TrySend queue message bytes on the channel with the given
									// ID and report whether the message was queued. Send may wait for room
									// in the send queue; TrySend returns immediately if the queue is full.
									Send(byte, []byte) bool
									TrySend(byte, []byte) bool

									// Set and Get store and retrieve user data by key.
									Set(string, interface{})
									Get(string) interface{}
								}


								//----------------------------------------------------------


								// peerConn contains the raw connection and its config.
								type peerConn struct {
									// outbound and persistent are reported by IsOutbound and IsPersistent.
									outbound   bool
									persistent bool
									// conn is the underlying connection to the peer.
									conn       Connection
									// NOTE(review): RemoteIP has a value receiver, so its write to ip never
									// persists; ip is only non-nil if it is set elsewhere.
									ip         net.IP // cached RemoteIP()
								}


								// newPeerConn bundles a connection with its outbound and persistent flags.
								// The ip field is left unset.
								func newPeerConn(outbound, persistent bool, conn Connection) peerConn {
									var pc peerConn
									pc.outbound = outbound
									pc.persistent = persistent
									pc.conn = conn
									return pc
								}


								// ID derives the node ID from the public key of the underlying connection.
								// ID only exists for SecretConnection.
								func (pc peerConn) ID() NodeID {
									pubKey := pc.conn.PubKey()
									return NodeIDFromPubKey(pubKey)
								}


								// RemoteIP returns the remote IP of the connection. If the ip field is set it
								// is returned as is; otherwise the IP is read from the connection's remote
								// endpoint.
								//
								// The method has a value receiver, so it cannot fill the ip cache itself: an
								// assignment to pc.ip would only change the local copy and be lost on return.
								// That ineffective write has been removed; results are unchanged.
								func (pc peerConn) RemoteIP() net.IP {
									if pc.ip != nil {
										return pc.ip
									}
									return pc.conn.RemoteEndpoint().IP
								}


								// peer implements Peer.
								//
								// Before using a peer, you will need to perform a handshake on connection.
								type peer struct {
									service.BaseService

									// raw peerConn and the multiplex connection
									peerConn

									// peer's node info and the channel it knows about
									// channels = nodeInfo.Channels
									// cached to avoid copying nodeInfo in hasChannel
									nodeInfo    NodeInfo
									channels    []byte
									// reactors maps a channel ID to the reactor that processMessages
									// delivers messages received on that channel to.
									reactors    map[byte]Reactor
									// onPeerError is the callback invoked by onError.
									onPeerError func(Peer, interface{})

									// User data
									Data *cmap.CMap

									// metrics receives the send counters and pending-bytes gauge; newPeer
									// defaults it to NopMetrics() and the PeerMetrics option replaces it.
									metrics       *Metrics
									// metricsTicker triggers metricsReporter and is stopped in OnStop and
									// FlushStop.
									metricsTicker *time.Ticker
								}


								// PeerOption customizes a peer. newPeer applies the given options in order
								// after the peer has been constructed.
								type PeerOption func(*peer)


								// newPeer builds a peer around the given connection. reactorsByCh maps channel
								// IDs to the reactors that handle them, onPeerError is invoked when the peer
								// hits an error, and options are applied last, in the order given. The peer
								// starts out with no-op metrics and a metrics ticker that is already running.
								func newPeer(
									pc peerConn,
									reactorsByCh map[byte]Reactor,
									onPeerError func(Peer, interface{}),
									options ...PeerOption,
								) *peer {
									info := pc.conn.NodeInfo()
									created := &peer{
										peerConn:      pc,
										nodeInfo:      info,
										channels:      info.Channels, // TODO
										reactors:      reactorsByCh,
										onPeerError:   onPeerError,
										Data:          cmap.NewCMap(),
										metricsTicker: time.NewTicker(metricsTickerDuration),
										metrics:       NopMetrics(),
									}
									created.BaseService = *service.NewBaseService(nil, "Peer", created)

									for i := range options {
										options[i](created)
									}
									return created
								}


								// onError reports err for this peer through the configured error callback.
								func (p *peer) onError(err interface{}) {
									report := p.onPeerError
									report(p, err)
								}


								// String formats the peer as its connection and ID, followed by "out" for
								// outbound peers or "in" for inbound ones.
								func (p *peer) String() string {
									format := "Peer{%v %v in}"
									if p.outbound {
										format = "Peer{%v %v out}"
									}
									return fmt.Sprintf(format, p.conn, p.ID())
								}


								//---------------------------------------------------

								// Implements service.Service


								// SetLogger implements BaseService by replacing the peer's logger.
								func (p *peer) SetLogger(l log.Logger) {
									p.BaseService.Logger = l
								}


								// OnStart implements BaseService. Once the base service has started, it
								// launches the message-processing and metrics-reporting goroutines.
								func (p *peer) OnStart() error {
									err := p.BaseService.OnStart()
									if err != nil {
										return err
									}

									go p.processMessages()
									go p.metricsReporter()
									return nil
								}


								// processMessages reads messages from the connection and passes each one to
								// the reactor registered for its channel. The loop ends, after reporting via
								// onError, on the first receive error or message on an unknown channel. A
								// panic during processing is recovered, logged and reported the same way.
								func (p *peer) processMessages() {
									defer func() {
										r := recover()
										if r == nil {
											return
										}
										p.Logger.Error("peer message processing panic", "err", r, "stack", string(debug.Stack()))
										p.onError(fmt.Errorf("panic during peer message processing: %v", r))
									}()

									for {
										channelID, payload, err := p.conn.ReceiveMessage()
										if err != nil {
											p.onError(err)
											return
										}

										handler, known := p.reactors[channelID]
										if !known {
											p.onError(fmt.Errorf("unknown channel %v", channelID))
											return
										}
										handler.Receive(channelID, p, payload)
									}
								}


								// FlushStop behaves like OnStop, except that the connection is closed with
								// FlushClose so that all successful .Send() calls get flushed before the
								// connection goes away. A close error is only logged.
								// NOTE: it is not safe to call this method more than once.
								func (p *peer) FlushStop() {
									p.metricsTicker.Stop()
									p.BaseService.OnStop()

									err := p.conn.FlushClose()
									if err == nil {
										return
									}
									p.Logger.Debug("error while stopping peer", "err", err)
								}


								// OnStop implements BaseService. It stops the metrics ticker, stops the base
								// service and closes the connection. A close error is only logged.
								func (p *peer) OnStop() {
									p.metricsTicker.Stop()
									p.BaseService.OnStop()

									err := p.conn.Close()
									if err == nil {
										return
									}
									p.Logger.Debug("error while stopping peer", "err", err)
								}


								//---------------------------------------------------

								// Implements Peer


								// ID returns the node ID from the peer's NodeInfo - the hex encoded hash of
								// its pubkey.
								func (p *peer) ID() NodeID {
									id := p.nodeInfo.ID()
									return id
								}


								// IsOutbound reports whether the connection to the peer is outbound.
								func (p *peer) IsOutbound() bool {
									return p.outbound
								}


								// IsPersistent reports whether the peer is persistent.
								func (p *peer) IsPersistent() bool {
									return p.persistent
								}


								// NodeInfo returns the peer's NodeInfo by value, as obtained from the
								// connection when the peer was created.
								func (p *peer) NodeInfo() NodeInfo {
									info := p.nodeInfo
									return info
								}


								// SocketAddr returns the address of the socket, taken from the connection's
								// remote endpoint.
								// For outbound peers, it's the address dialed (after DNS resolution).
								// For inbound peers, it's the address returned by the underlying connection
								// (not what's reported in the peer's NodeInfo).
								func (p *peer) SocketAddr() *NetAddress {
									remote := p.conn.RemoteEndpoint()
									return remote.NetAddress()
								}


								// Status returns the ConnectionStatus reported by the peer's connection.
								func (p *peer) Status() tmconn.ConnectionStatus {
									return p.peerConn.conn.Status()
								}


								// Send msg bytes to the channel identified by chID byte. Returns false if the
								// send queue is full after timeout, specified by MConnection.
								//
								// It also returns false, without sending, if the peer is not running or did
								// not advertise chID. An io.EOF from the connection, including a wrapped one,
								// yields false without reporting an error; any other error is reported via
								// onError. On success the sent byte count is added to the
								// PeerSendBytesTotal metric.
								func (p *peer) Send(chID byte, msgBytes []byte) bool {
									// See Switch#Broadcast, where we fetch the list of peers and loop over
									// them - while we're looping, one peer may be removed and stopped.
									if !p.IsRunning() || !p.hasChannel(chID) {
										return false
									}

									res, err := p.conn.SendMessage(chID, msgBytes)
									switch {
									case errors.Is(err, io.EOF):
										// errors.Is also matches an EOF that has been wrapped with context.
										return false
									case err != nil:
										p.onError(err)
										return false
									}

									if res {
										labels := []string{
											"peer_id", string(p.ID()),
											"chID", fmt.Sprintf("%#x", chID),
										}
										p.metrics.PeerSendBytesTotal.With(labels...).Add(float64(len(msgBytes)))
									}
									return res
								}


								// TrySend msg bytes to the channel identified by chID byte. Immediately returns
								// false if the send queue is full.
								//
								// It also returns false, without sending, if the peer is not running or did
								// not advertise chID. An io.EOF from the connection, including a wrapped one,
								// yields false without reporting an error; any other error is reported via
								// onError. On success the sent byte count is added to the
								// PeerSendBytesTotal metric.
								func (p *peer) TrySend(chID byte, msgBytes []byte) bool {
									if !p.IsRunning() || !p.hasChannel(chID) {
										return false
									}

									res, err := p.conn.TrySendMessage(chID, msgBytes)
									switch {
									case errors.Is(err, io.EOF):
										// errors.Is also matches an EOF that has been wrapped with context.
										return false
									case err != nil:
										p.onError(err)
										return false
									}

									if res {
										labels := []string{
											"peer_id", string(p.ID()),
											"chID", fmt.Sprintf("%#x", chID),
										}
										p.metrics.PeerSendBytesTotal.With(labels...).Add(float64(len(msgBytes)))
									}
									return res
								}


								// Get returns the user data stored under the given key.
								func (p *peer) Get(key string) interface{} {
									value := p.Data.Get(key)
									return value
								}


								// Set stores user data under the given key.
								func (p *peer) Set(key string, data interface{}) {
									store := p.Data
									store.Set(key, data)
								}


								// hasChannel reports whether chID is among the channels the peer advertised.
								// A miss is logged at debug level.
								func (p *peer) hasChannel(chID byte) bool {
									for i := 0; i < len(p.channels); i++ {
										if p.channels[i] == chID {
											return true
										}
									}

									// NOTE: probably will want to remove this
									// but could be helpful while the feature is new
									p.Logger.Debug("Unknown channel for peer", "channel", chID, "channels", p.channels)
									return false
								}


								// CloseConn closes the original connection and returns the close error. It is
								// used for cleaning up in cases where the peer had not been started at all.
								func (p *peer) CloseConn() error {
									return p.conn.Close()
								}


								//---------------------------------------------------

								// methods only used for testing

								// TODO: can we remove these?


								// CloseConn closes the underlying connection. Any error from Close is
								// discarded, since this method has no way to return it.
								func (pc *peerConn) CloseConn() {
									// Explicitly ignore the error: the signature cannot change without
									// breaking callers, and this is a best-effort close used by tests.
									_ = pc.conn.Close()
								}


								// RemoteAddr returns the peer's remote network address as a *net.TCPAddr,
								// built from the IP and port of the connection's remote endpoint.
								func (p *peer) RemoteAddr() net.Addr {
									remote := p.conn.RemoteEndpoint()
									addr := new(net.TCPAddr)
									addr.IP = remote.IP
									addr.Port = int(remote.Port)
									return addr
								}


								//---------------------------------------------------


								// PeerMetrics returns a PeerOption that makes the peer report to the given
								// metrics instead of the no-op default.
								func PeerMetrics(metrics *Metrics) PeerOption {
									apply := func(p *peer) {
										p.metrics = metrics
									}
									return apply
								}


								// metricsReporter publishes, on every tick of metricsTicker, the sum of the
								// send queue sizes over all channels of the connection as the
								// PeerPendingSendBytes metric. It returns when the peer's Quit channel fires.
								func (p *peer) metricsReporter() {
									for {
										select {
										case <-p.metricsTicker.C:
											var pending float64
											for _, ch := range p.conn.Status().Channels {
												pending += float64(ch.SendQueueSize)
											}
											gauge := p.metrics.PeerPendingSendBytes.With("peer_id", string(p.ID()))
											gauge.Set(pending)
										case <-p.Quit():
											return
										}
									}
								}