zolfa
/
tendermint


								package pex


								import (

									"context"

									"fmt"

									"sync"

									"time"


									"github.com/tendermint/tendermint/internal/p2p"

									"github.com/tendermint/tendermint/internal/p2p/conn"

									"github.com/tendermint/tendermint/libs/log"

									tmmath "github.com/tendermint/tendermint/libs/math"

									"github.com/tendermint/tendermint/libs/service"

									protop2p "github.com/tendermint/tendermint/proto/tendermint/p2p"

									"github.com/tendermint/tendermint/types"

								)


								var (

									_ service.Service = (*ReactorV2)(nil)

									_ p2p.Wrapper     = (*protop2p.PexMessage)(nil)

								)


								// TODO: Consolidate with params file.

								// See https://github.com/tendermint/tendermint/issues/6371

								const (

									// the minimum time one peer can send another request to the same peer

									minReceiveRequestInterval = 100 * time.Millisecond


									// the maximum amount of addresses that can be included in a response

									maxAddresses uint16 = 100


									// allocated time to resolve a node address into a set of endpoints

									resolveTimeout = 3 * time.Second


									// How long to wait when there are no peers available before trying again

									noAvailablePeersWaitPeriod = 1 * time.Second


									// indicates the ping rate of the pex reactor when the peer store is full.

									// The reactor should still look to add new peers in order to flush out low

									// scoring peers that are still in the peer store

									fullCapacityInterval = 10 * time.Minute

								)


								// TODO: We should decide whether we want channel descriptors to be housed

								// within each reactor (as they are now) or, considering that the reactor doesn't

								// really need to care about the channel descriptors, if they should be housed

								// in the node module.

								func ChannelDescriptor() conn.ChannelDescriptor {

									return conn.ChannelDescriptor{

										ID:                  PexChannel,

										Priority:            1,

										SendQueueCapacity:   10,

										RecvMessageCapacity: maxMsgSize,

										RecvBufferCapacity:  32,

										MaxSendBytes:        200,

									}

								}


								// ReactorV2 is a PEX reactor for the new P2P stack. The legacy reactor

								// is Reactor.

								//

								// FIXME: Rename this when Reactor is removed, and consider moving to p2p/.

								//

								// The peer exchange or PEX reactor supports the peer manager by sending

								// requests to other peers for addresses that can be given to the peer manager

								// and at the same time advertises addresses to peers that need more.

								//

								// The reactor is able to tweak the intensity of it's search by decreasing or

								// increasing the interval between each request. It tracks connected peers via

								// a linked list, sending a request to the node at the front of the list and

								// adding it to the back of the list once a response is received.

								type ReactorV2 struct {

									service.BaseService


									peerManager *p2p.PeerManager

									pexCh       *p2p.Channel

									peerUpdates *p2p.PeerUpdates

									closeCh     chan struct{}


									// list of available peers to loop through and send peer requests to

									availablePeers map[types.NodeID]struct{}


									mtx sync.RWMutex


									// requestsSent keeps track of which peers the PEX reactor has sent requests

									// to. This prevents the sending of spurious responses.

									// NOTE: If a node never responds, they will remain in this map until a

									// peer down status update is sent

									requestsSent map[types.NodeID]struct{}


									// lastReceivedRequests keeps track of when peers send a request to prevent

									// peers from sending requests too often (as defined by

									// minReceiveRequestInterval).

									lastReceivedRequests map[types.NodeID]time.Time


									// the time when another request will be sent

									nextRequestTime time.Time


									// keep track of how many new peers to existing peers we have received to

									// extrapolate the size of the network

									newPeers   uint32

									totalPeers uint32


									// discoveryRatio is the inverse ratio of new peers to old peers squared.

									// This is multiplied by the minimum duration to calculate how long to wait

									// between each request.

									discoveryRatio float32

								}


								// NewReactor returns a reference to a new reactor.

								func NewReactorV2(

									logger log.Logger,

									peerManager *p2p.PeerManager,

									pexCh *p2p.Channel,

									peerUpdates *p2p.PeerUpdates,

								) *ReactorV2 {


									r := &ReactorV2{

										peerManager:          peerManager,

										pexCh:                pexCh,

										peerUpdates:          peerUpdates,

										closeCh:              make(chan struct{}),

										availablePeers:       make(map[types.NodeID]struct{}),

										requestsSent:         make(map[types.NodeID]struct{}),

										lastReceivedRequests: make(map[types.NodeID]time.Time),

									}


									r.BaseService = *service.NewBaseService(logger, "PEX", r)

									return r

								}


								// OnStart starts separate go routines for each p2p Channel and listens for

								// envelopes on each. In addition, it also listens for peer updates and handles

								// messages on that p2p channel accordingly. The caller must be sure to execute

								// OnStop to ensure the outbound p2p Channels are closed.

								func (r *ReactorV2) OnStart() error {

									go r.processPexCh()

									go r.processPeerUpdates()

									return nil

								}


								// OnStop stops the reactor by signaling to all spawned goroutines to exit and

								// blocking until they all exit.

								func (r *ReactorV2) OnStop() {

									// Close closeCh to signal to all spawned goroutines to gracefully exit. All

									// p2p Channels should execute Close().

									close(r.closeCh)


									// Wait for all p2p Channels to be closed before returning. This ensures we

									// can easily reason about synchronization of all p2p Channels and ensure no

									// panics will occur.

									<-r.pexCh.Done()

									<-r.peerUpdates.Done()

								}


								// processPexCh implements a blocking event loop where we listen for p2p

								// Envelope messages from the pexCh.

								func (r *ReactorV2) processPexCh() {

									defer r.pexCh.Close()


									for {

										select {

										case <-r.closeCh:

											r.Logger.Debug("stopped listening on PEX channel; closing...")

											return


										// outbound requests for new peers

										case <-r.waitUntilNextRequest():

											r.sendRequestForPeers()


										// inbound requests for new peers or responses to requests sent by this

										// reactor

										case envelope := <-r.pexCh.In:

											if err := r.handleMessage(r.pexCh.ID, envelope); err != nil {

												r.Logger.Error("failed to process message", "ch_id", r.pexCh.ID, "envelope", envelope, "err", err)

												r.pexCh.Error <- p2p.PeerError{

													NodeID: envelope.From,

													Err:    err,

												}

											}

										}

									}

								}


								// processPeerUpdates initiates a blocking process where we listen for and handle

								// PeerUpdate messages. When the reactor is stopped, we will catch the signal and

								// close the p2p PeerUpdatesCh gracefully.

								func (r *ReactorV2) processPeerUpdates() {

									defer r.peerUpdates.Close()


									for {

										select {

										case peerUpdate := <-r.peerUpdates.Updates():

											r.processPeerUpdate(peerUpdate)


										case <-r.closeCh:

											r.Logger.Debug("stopped listening on peer updates channel; closing...")

											return

										}

									}

								}


								// handlePexMessage handles envelopes sent from peers on the PexChannel.

								func (r *ReactorV2) handlePexMessage(envelope p2p.Envelope) error {

									logger := r.Logger.With("peer", envelope.From)


									switch msg := envelope.Message.(type) {


									case *protop2p.PexRequest:

										// Check if the peer hasn't sent a prior request too close to this one

										// in time.

										if err := r.markPeerRequest(envelope.From); err != nil {

											return err

										}


										// parse and send the legacy PEX addresses

										pexAddresses := r.resolve(r.peerManager.Advertise(envelope.From, maxAddresses))

										r.pexCh.Out <- p2p.Envelope{

											To:      envelope.From,

											Message: &protop2p.PexResponse{Addresses: pexAddresses},

										}


									case *protop2p.PexResponse:

										// check if the response matches a request that was made to that peer

										if err := r.markPeerResponse(envelope.From); err != nil {

											return err

										}


										// check the size of the response

										if len(msg.Addresses) > int(maxAddresses) {

											return fmt.Errorf("peer sent too many addresses (max: %d, got: %d)",

												maxAddresses,

												len(msg.Addresses),

											)

										}


										for _, pexAddress := range msg.Addresses {

											// no protocol is prefixed so we assume the default (mconn)

											peerAddress, err := p2p.ParseNodeAddress(

												fmt.Sprintf("%s@%s:%d", pexAddress.ID, pexAddress.IP, pexAddress.Port))

											if err != nil {

												continue

											}

											added, err := r.peerManager.Add(peerAddress)

											if err != nil {

												logger.Error("failed to add PEX address", "address", peerAddress, "err", err)

											}

											if added {

												r.newPeers++

												logger.Debug("added PEX address", "address", peerAddress)

											}

											r.totalPeers++

										}


									// V2 PEX MESSAGES

									case *protop2p.PexRequestV2:

										// check if the peer hasn't sent a prior request too close to this one

										// in time

										if err := r.markPeerRequest(envelope.From); err != nil {

											return err

										}


										// request peers from the peer manager and parse the NodeAddresses into

										// URL strings

										nodeAddresses := r.peerManager.Advertise(envelope.From, maxAddresses)

										pexAddressesV2 := make([]protop2p.PexAddressV2, len(nodeAddresses))

										for idx, addr := range nodeAddresses {

											pexAddressesV2[idx] = protop2p.PexAddressV2{

												URL: addr.String(),

											}

										}

										r.pexCh.Out <- p2p.Envelope{

											To:      envelope.From,

											Message: &protop2p.PexResponseV2{Addresses: pexAddressesV2},

										}


									case *protop2p.PexResponseV2:

										// check if the response matches a request that was made to that peer

										if err := r.markPeerResponse(envelope.From); err != nil {

											return err

										}


										// check the size of the response

										if len(msg.Addresses) > int(maxAddresses) {

											return fmt.Errorf("peer sent too many addresses (max: %d, got: %d)",

												maxAddresses,

												len(msg.Addresses),

											)

										}


										for _, pexAddress := range msg.Addresses {

											peerAddress, err := p2p.ParseNodeAddress(pexAddress.URL)

											if err != nil {

												continue

											}

											added, err := r.peerManager.Add(peerAddress)

											if err != nil {

												logger.Error("failed to add V2 PEX address", "address", peerAddress, "err", err)

											}

											if added {

												r.newPeers++

												logger.Debug("added V2 PEX address", "address", peerAddress)

											}

											r.totalPeers++

										}


									default:

										return fmt.Errorf("received unknown message: %T", msg)

									}


									return nil

								}


								// resolve resolves a set of peer addresses into PEX addresses.

								//

								// FIXME: This is necessary because the current PEX protocol only supports

								// IP/port pairs, while the P2P stack uses NodeAddress URLs. The PEX protocol

								// should really use URLs too, to exchange DNS names instead of IPs and allow

								// different transport protocols (e.g. QUIC and MemoryTransport).

								//

								// FIXME: We may want to cache and parallelize this, but for now we'll just rely

								// on the operating system to cache it for us.

								func (r *ReactorV2) resolve(addresses []p2p.NodeAddress) []protop2p.PexAddress {

									limit := len(addresses)

									pexAddresses := make([]protop2p.PexAddress, 0, limit)


									for _, address := range addresses {

										ctx, cancel := context.WithTimeout(context.Background(), resolveTimeout)

										endpoints, err := address.Resolve(ctx)

										r.Logger.Debug("resolved node address", "endpoints", endpoints)

										cancel()


										if err != nil {

											r.Logger.Debug("failed to resolve address", "address", address, "err", err)

											continue

										}


										for _, endpoint := range endpoints {

											r.Logger.Debug("checking endpint", "IP", endpoint.IP, "Port", endpoint.Port)

											if len(pexAddresses) >= limit {

												return pexAddresses


											} else if endpoint.IP != nil {

												r.Logger.Debug("appending pex address")

												// PEX currently only supports IP-networked transports (as

												// opposed to e.g. p2p.MemoryTransport).

												//

												// FIXME: as the PEX address contains no information about the

												// protocol, we jam this into the ID. We won't need to this once

												// we support URLs

												pexAddresses = append(pexAddresses, protop2p.PexAddress{

													ID:   string(address.NodeID),

													IP:   endpoint.IP.String(),

													Port: uint32(endpoint.Port),

												})

											}

										}

									}


									return pexAddresses

								}


								// handleMessage handles an Envelope sent from a peer on a specific p2p Channel.

								// It will handle errors and any possible panics gracefully. A caller can handle

								// any error returned by sending a PeerError on the respective channel.

								func (r *ReactorV2) handleMessage(chID p2p.ChannelID, envelope p2p.Envelope) (err error) {

									defer func() {

										if e := recover(); e != nil {

											err = fmt.Errorf("panic in processing message: %v", e)

										}

									}()


									r.Logger.Debug("received PEX message", "peer", envelope.From)


									switch chID {

									case p2p.ChannelID(PexChannel):

										err = r.handlePexMessage(envelope)


									default:

										err = fmt.Errorf("unknown channel ID (%d) for envelope (%v)", chID, envelope)

									}


									return err

								}


								// processPeerUpdate processes a PeerUpdate. For added peers, PeerStatusUp, we

								// send a request for addresses.

								func (r *ReactorV2) processPeerUpdate(peerUpdate p2p.PeerUpdate) {

									r.Logger.Debug("received PEX peer update", "peer", peerUpdate.NodeID, "status", peerUpdate.Status)


									r.mtx.Lock()

									defer r.mtx.Unlock()


									switch peerUpdate.Status {

									case p2p.PeerStatusUp:

										r.availablePeers[peerUpdate.NodeID] = struct{}{}

									case p2p.PeerStatusDown:

										delete(r.availablePeers, peerUpdate.NodeID)

										delete(r.requestsSent, peerUpdate.NodeID)

										delete(r.lastReceivedRequests, peerUpdate.NodeID)

									default:

									}

								}


								func (r *ReactorV2) waitUntilNextRequest() <-chan time.Time {

									return time.After(time.Until(r.nextRequestTime))

								}


								// sendRequestForPeers pops the first peerID off the list and sends the

								// peer a request for more peer addresses. The function then moves the

								// peer into the requestsSent bucket and calculates when the next request

								// time should be

								func (r *ReactorV2) sendRequestForPeers() {

									r.mtx.Lock()

									defer r.mtx.Unlock()

									if len(r.availablePeers) == 0 {

										// no peers are available

										r.Logger.Debug("no available peers to send request to, waiting...")

										r.nextRequestTime = time.Now().Add(noAvailablePeersWaitPeriod)


										return

									}

									var peerID types.NodeID


									// use range to get a random peer.

									for peerID = range r.availablePeers {

										break

									}


									// The node accommodates for both pex systems

									if r.isLegacyPeer(peerID) {

										r.pexCh.Out <- p2p.Envelope{

											To:      peerID,

											Message: &protop2p.PexRequest{},

										}

									} else {

										r.pexCh.Out <- p2p.Envelope{

											To:      peerID,

											Message: &protop2p.PexRequestV2{},

										}

									}


									// remove the peer from the abvailable peers list and mark it in the requestsSent map

									delete(r.availablePeers, peerID)

									r.requestsSent[peerID] = struct{}{}


									r.calculateNextRequestTime()

									r.Logger.Debug("peer request sent", "next_request_time", r.nextRequestTime)

								}


								// calculateNextRequestTime implements something of a proportional controller

								// to estimate how often the reactor should be requesting new peer addresses.

								// The dependent variable in this calculation is the ratio of new peers to

								// all peers that the reactor receives. The interval is thus calculated as the

								// inverse squared. In the beginning, all peers should be new peers.

								// We  expect this ratio to be near 1 and thus the interval to be as short

								// as possible. As the node becomes more familiar with the network the ratio of

								// new nodes will plummet to a very small number, meaning the interval expands

								// to its upper bound.

								// CONTRACT: Must use a write lock as nextRequestTime is updated

								func (r *ReactorV2) calculateNextRequestTime() {

									// check if the peer store is full. If so then there is no need

									// to send peer requests too often

									if ratio := r.peerManager.PeerRatio(); ratio >= 0.95 {

										r.Logger.Debug("peer manager near full ratio, sleeping...",

											"sleep_period", fullCapacityInterval, "ratio", ratio)

										r.nextRequestTime = time.Now().Add(fullCapacityInterval)

										return

									}


									// baseTime represents the shortest interval that we can send peer requests

									// in. For example if we have 10 peers and we can't send a message to the

									// same peer every 500ms, then we can send a request every 50ms. In practice

									// we use a safety margin of 2, ergo 100ms

									peers := tmmath.MinInt(len(r.availablePeers), 50)

									baseTime := minReceiveRequestInterval

									if peers > 0 {

										baseTime = minReceiveRequestInterval * 2 / time.Duration(peers)

									}


									if r.totalPeers > 0 || r.discoveryRatio == 0 {

										// find the ratio of new peers. NOTE: We add 1 to both sides to avoid

										// divide by zero problems

										ratio := float32(r.totalPeers+1) / float32(r.newPeers+1)

										// square the ratio in order to get non linear time intervals

										// NOTE: The longest possible interval for a network with 100 or more peers

										// where a node is connected to 50 of them is 2 minutes.

										r.discoveryRatio = ratio * ratio

										r.newPeers = 0

										r.totalPeers = 0

									}

									// NOTE: As ratio is always >= 1, discovery ratio is >= 1. Therefore we don't need to worry

									// about the next request time being less than the minimum time

									r.nextRequestTime = time.Now().Add(baseTime * time.Duration(r.discoveryRatio))

								}


								func (r *ReactorV2) markPeerRequest(peer types.NodeID) error {

									r.mtx.Lock()

									defer r.mtx.Unlock()

									if lastRequestTime, ok := r.lastReceivedRequests[peer]; ok {

										if time.Now().Before(lastRequestTime.Add(minReceiveRequestInterval)) {

											return fmt.Errorf("peer sent a request too close after a prior one. Minimum interval: %v",

												minReceiveRequestInterval)

										}

									}

									r.lastReceivedRequests[peer] = time.Now()

									return nil

								}


								func (r *ReactorV2) markPeerResponse(peer types.NodeID) error {

									r.mtx.Lock()

									defer r.mtx.Unlock()

									// check if a request to this peer was sent

									if _, ok := r.requestsSent[peer]; !ok {

										return fmt.Errorf("peer sent a PEX response when none was requested (%v)", peer)

									}

									delete(r.requestsSent, peer)

									// attach to the back of the list so that the peer can be used again for

									// future requests


									r.availablePeers[peer] = struct{}{}

									return nil

								}


								// all addresses must use a MCONN protocol for the peer to be considered part of the

								// legacy p2p pex system

								func (r *ReactorV2) isLegacyPeer(peer types.NodeID) bool {

									for _, addr := range r.peerManager.Addresses(peer) {

										if addr.Protocol != p2p.MConnProtocol {

											return false

										}

									}

									return true

								}