2019-03-26 09:58:30 +01:00
|
|
|
package blockchain_new
|
|
|
|
|
|
|
|
import (
|
|
|
|
"errors"
|
|
|
|
"fmt"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/tendermint/tendermint/libs/log"
|
|
|
|
"github.com/tendermint/tendermint/p2p"
|
|
|
|
"github.com/tendermint/tendermint/types"
|
|
|
|
)
|
|
|
|
|
|
|
|
// Blockchain Reactor State
|
|
|
|
type bReactorFSMState struct {
|
|
|
|
name string
|
2019-04-04 00:13:32 +02:00
|
|
|
|
2019-03-26 09:58:30 +01:00
|
|
|
// called when transitioning out of current state
|
|
|
|
handle func(*bReactorFSM, bReactorEvent, bReactorEventData) (next *bReactorFSMState, err error)
|
|
|
|
// called when entering the state
|
|
|
|
enter func(fsm *bReactorFSM)
|
|
|
|
|
|
|
|
// timer to ensure FSM is not stuck in a state forever
|
|
|
|
timer *time.Timer
|
|
|
|
timeout time.Duration
|
|
|
|
}
|
|
|
|
|
|
|
|
func (s *bReactorFSMState) String() string {
|
|
|
|
return s.name
|
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
// Interface used by FSM for sending Block and Status requests,
|
|
|
|
// informing of peer errors and state timeouts
|
|
|
|
// Implemented by BlockchainReactor and tests
|
|
|
|
type bcRMessageInterface interface {
|
|
|
|
sendStatusRequest()
|
|
|
|
sendBlockRequest(peerID p2p.ID, height int64) error
|
|
|
|
sendPeerError(err error, peerID p2p.ID)
|
|
|
|
resetStateTimer(name string, timer *time.Timer, timeout time.Duration, f func())
|
|
|
|
switchToConsensus()
|
|
|
|
}
|
|
|
|
|
2019-03-26 09:58:30 +01:00
|
|
|
// Blockchain Reactor State Machine
|
|
|
|
type bReactorFSM struct {
|
|
|
|
logger log.Logger
|
|
|
|
startTime time.Time
|
|
|
|
|
|
|
|
state *bReactorFSMState
|
2019-04-04 00:13:32 +02:00
|
|
|
pool *blockPool
|
2019-03-26 09:58:30 +01:00
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
// interface used to call the Blockchain reactor to send StatusRequest, BlockRequest, reporting errors, etc.
|
|
|
|
toBcR bcRMessageInterface
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
// bReactorEventData is part of the message sent by the reactor to the FSM and used by the state handlers.
|
2019-03-26 09:58:30 +01:00
|
|
|
type bReactorEventData struct {
|
2019-04-04 00:13:32 +02:00
|
|
|
peerId p2p.ID
|
|
|
|
err error // for peer error: timeout, slow; for processed block event if error occurred
|
|
|
|
height int64 // for status response; for processed block event
|
|
|
|
block *types.Block // for block response
|
|
|
|
stateName string // for state timeout events
|
|
|
|
length int // for block response event, length of received block, used to detect slow peers
|
|
|
|
maxNumRequests int32 // for request needed event, maximum number of pending requests
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
// Blockchain Reactor Events (the input to the state machine)
|
|
|
|
type bReactorEvent uint
|
|
|
|
|
|
|
|
const (
|
|
|
|
// message type events
|
|
|
|
startFSMEv = iota + 1
|
|
|
|
statusResponseEv
|
|
|
|
blockResponseEv
|
|
|
|
processedBlockEv
|
|
|
|
makeRequestsEv
|
|
|
|
stopFSMEv
|
|
|
|
|
|
|
|
// other events
|
|
|
|
peerRemoveEv = iota + 256
|
|
|
|
stateTimeoutEv
|
|
|
|
)
|
2019-03-26 09:58:30 +01:00
|
|
|
|
|
|
|
func (msg *bReactorMessageData) String() string {
|
|
|
|
var dataStr string
|
|
|
|
|
|
|
|
switch msg.event {
|
|
|
|
case startFSMEv:
|
|
|
|
dataStr = ""
|
|
|
|
case statusResponseEv:
|
|
|
|
dataStr = fmt.Sprintf("peer: %v height: %v", msg.data.peerId, msg.data.height)
|
|
|
|
case blockResponseEv:
|
|
|
|
dataStr = fmt.Sprintf("peer: %v block.height: %v lenght: %v", msg.data.peerId, msg.data.block.Height, msg.data.length)
|
2019-04-04 00:13:32 +02:00
|
|
|
case processedBlockEv:
|
|
|
|
dataStr = fmt.Sprintf("block processing returned following error: %v", msg.data.err)
|
|
|
|
case makeRequestsEv:
|
|
|
|
dataStr = fmt.Sprintf("new requests needed")
|
2019-03-26 09:58:30 +01:00
|
|
|
case stopFSMEv:
|
|
|
|
dataStr = ""
|
2019-04-04 00:13:32 +02:00
|
|
|
case peerRemoveEv:
|
|
|
|
dataStr = fmt.Sprintf("peer: %v is being removed by the switch", msg.data.peerId)
|
2019-03-26 09:58:30 +01:00
|
|
|
case stateTimeoutEv:
|
|
|
|
dataStr = fmt.Sprintf("state: %v", msg.data.stateName)
|
2019-04-04 00:13:32 +02:00
|
|
|
|
2019-03-26 09:58:30 +01:00
|
|
|
default:
|
|
|
|
dataStr = fmt.Sprintf("cannot interpret message data")
|
|
|
|
return "event unknown"
|
|
|
|
}
|
|
|
|
|
|
|
|
return fmt.Sprintf("event: %v %v", msg.event, dataStr)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (ev bReactorEvent) String() string {
|
|
|
|
switch ev {
|
|
|
|
case startFSMEv:
|
|
|
|
return "startFSMEv"
|
|
|
|
case statusResponseEv:
|
|
|
|
return "statusResponseEv"
|
|
|
|
case blockResponseEv:
|
|
|
|
return "blockResponseEv"
|
2019-04-04 00:13:32 +02:00
|
|
|
case processedBlockEv:
|
|
|
|
return "processedBlockEv"
|
|
|
|
case makeRequestsEv:
|
|
|
|
return "makeRequestsEv"
|
2019-03-26 09:58:30 +01:00
|
|
|
case stopFSMEv:
|
|
|
|
return "stopFSMEv"
|
2019-04-04 00:13:32 +02:00
|
|
|
case peerRemoveEv:
|
|
|
|
return "peerRemoveEv"
|
2019-03-26 09:58:30 +01:00
|
|
|
case stateTimeoutEv:
|
|
|
|
return "stateTimeoutEv"
|
|
|
|
default:
|
|
|
|
return "event unknown"
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
// states
|
|
|
|
var (
|
|
|
|
unknown *bReactorFSMState
|
|
|
|
waitForPeer *bReactorFSMState
|
|
|
|
waitForBlock *bReactorFSMState
|
|
|
|
finished *bReactorFSMState
|
|
|
|
)
|
|
|
|
|
|
|
|
// state timers
|
|
|
|
var (
|
2019-04-04 00:13:32 +02:00
|
|
|
waitForPeerTimeout = 2 * time.Second
|
2019-03-26 09:58:30 +01:00
|
|
|
)
|
|
|
|
|
|
|
|
// errors
|
|
|
|
var (
|
|
|
|
errNoErrorFinished = errors.New("FSM is finished")
|
2019-04-04 00:13:32 +02:00
|
|
|
errInvalidEvent = errors.New("invalid event in current state")
|
2019-03-26 09:58:30 +01:00
|
|
|
errNoPeerResponse = errors.New("FSM timed out on peer response")
|
|
|
|
errBadDataFromPeer = errors.New("received from wrong peer or bad block")
|
|
|
|
errMissingBlocks = errors.New("missing blocks")
|
|
|
|
errBlockVerificationFailure = errors.New("block verification failure, redo")
|
|
|
|
errNilPeerForBlockRequest = errors.New("nil peer for block request")
|
|
|
|
errSendQueueFull = errors.New("block request not made, send-queue is full")
|
2019-04-04 00:13:32 +02:00
|
|
|
errPeerTooShort = errors.New("peer height too low, old peer removed/ new peer not added")
|
|
|
|
errSlowPeer = errors.New("peer is not sending us data fast enough")
|
2019-04-12 22:02:30 -04:00
|
|
|
errNoPeerFoundForHeight = errors.New("could not find peer for block request")
|
2019-04-12 23:32:21 -04:00
|
|
|
errSwitchRemovesPeer = errors.New("switch is removing peer")
|
2019-03-26 09:58:30 +01:00
|
|
|
)
|
|
|
|
|
|
|
|
func init() {
|
|
|
|
unknown = &bReactorFSMState{
|
|
|
|
name: "unknown",
|
|
|
|
handle: func(fsm *bReactorFSM, ev bReactorEvent, data bReactorEventData) (*bReactorFSMState, error) {
|
|
|
|
switch ev {
|
|
|
|
case startFSMEv:
|
|
|
|
// Broadcast Status message. Currently doesn't return non-nil error.
|
2019-04-04 00:13:32 +02:00
|
|
|
fsm.toBcR.sendStatusRequest()
|
2019-03-26 09:58:30 +01:00
|
|
|
if fsm.state.timer != nil {
|
|
|
|
fsm.state.timer.Stop()
|
|
|
|
}
|
|
|
|
return waitForPeer, nil
|
|
|
|
|
|
|
|
case stopFSMEv:
|
|
|
|
return finished, errNoErrorFinished
|
|
|
|
|
|
|
|
default:
|
|
|
|
return unknown, errInvalidEvent
|
|
|
|
}
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
waitForPeer = &bReactorFSMState{
|
|
|
|
name: "waitForPeer",
|
|
|
|
timeout: waitForPeerTimeout,
|
|
|
|
enter: func(fsm *bReactorFSM) {
|
2019-04-04 00:13:32 +02:00
|
|
|
// Stop when leaving the state.
|
2019-03-26 09:58:30 +01:00
|
|
|
fsm.resetStateTimer(waitForPeer)
|
|
|
|
},
|
|
|
|
handle: func(fsm *bReactorFSM, ev bReactorEvent, data bReactorEventData) (*bReactorFSMState, error) {
|
|
|
|
switch ev {
|
|
|
|
case stateTimeoutEv:
|
2019-04-04 00:13:32 +02:00
|
|
|
// There was no statusResponse received from any peer.
|
2019-03-26 09:58:30 +01:00
|
|
|
// Should we send status request again?
|
|
|
|
if fsm.state.timer != nil {
|
|
|
|
fsm.state.timer.Stop()
|
|
|
|
}
|
|
|
|
return finished, errNoPeerResponse
|
|
|
|
|
|
|
|
case statusResponseEv:
|
2019-04-04 00:13:32 +02:00
|
|
|
if err := fsm.pool.updatePeer(data.peerId, data.height); err != nil {
|
2019-03-27 14:33:11 +01:00
|
|
|
if len(fsm.pool.peers) == 0 {
|
2019-03-26 09:58:30 +01:00
|
|
|
return waitForPeer, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return waitForBlock, nil
|
|
|
|
|
|
|
|
case stopFSMEv:
|
|
|
|
return finished, errNoErrorFinished
|
|
|
|
|
|
|
|
default:
|
|
|
|
return waitForPeer, errInvalidEvent
|
|
|
|
}
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
waitForBlock = &bReactorFSMState{
|
2019-04-04 00:13:32 +02:00
|
|
|
name: "waitForBlock",
|
2019-03-26 09:58:30 +01:00
|
|
|
handle: func(fsm *bReactorFSM, ev bReactorEvent, data bReactorEventData) (*bReactorFSMState, error) {
|
|
|
|
switch ev {
|
|
|
|
|
|
|
|
case statusResponseEv:
|
2019-04-04 00:13:32 +02:00
|
|
|
err := fsm.pool.updatePeer(data.peerId, data.height)
|
2019-03-27 19:54:08 +01:00
|
|
|
if len(fsm.pool.peers) == 0 {
|
2019-04-04 00:13:32 +02:00
|
|
|
fsm.toBcR.sendStatusRequest()
|
2019-03-27 19:54:08 +01:00
|
|
|
if fsm.state.timer != nil {
|
|
|
|
fsm.state.timer.Stop()
|
|
|
|
}
|
|
|
|
return waitForPeer, err
|
|
|
|
}
|
2019-03-26 09:58:30 +01:00
|
|
|
return waitForBlock, err
|
|
|
|
|
|
|
|
case blockResponseEv:
|
2019-03-26 14:51:37 +01:00
|
|
|
fsm.logger.Debug("blockResponseEv", "H", data.block.Height)
|
2019-03-27 14:33:11 +01:00
|
|
|
err := fsm.pool.addBlock(data.peerId, data.block, data.length)
|
2019-03-26 09:58:30 +01:00
|
|
|
if err != nil {
|
2019-04-04 00:13:32 +02:00
|
|
|
// A block was received that was unsolicited, from unexpected peer, or that we already have it.
|
|
|
|
// Ignore block, remove peer and send error to switch.
|
2019-03-27 14:33:11 +01:00
|
|
|
fsm.pool.removePeer(data.peerId, err)
|
2019-04-12 22:02:30 -04:00
|
|
|
fsm.toBcR.sendPeerError(err, data.peerId)
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
return waitForBlock, err
|
2019-03-27 14:33:11 +01:00
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
case processedBlockEv:
|
|
|
|
fsm.logger.Debug("processedBlockEv", "err", data.err)
|
|
|
|
first, second, _ := fsm.pool.getNextTwoBlocks()
|
|
|
|
if data.err != nil {
|
|
|
|
fsm.logger.Error("process blocks returned error", "err", data.err, "first", first.block.Height, "second", second.block.Height)
|
|
|
|
fsm.logger.Error("send peer error for", "peer", first.peer.id)
|
|
|
|
fsm.toBcR.sendPeerError(data.err, first.peer.id)
|
|
|
|
fsm.logger.Error("send peer error for", "peer", second.peer.id)
|
|
|
|
fsm.toBcR.sendPeerError(data.err, second.peer.id)
|
2019-04-12 22:02:30 -04:00
|
|
|
// Remove the first two blocks. This will also remove the peers
|
2019-04-04 00:13:32 +02:00
|
|
|
fsm.pool.invalidateFirstTwoBlocks(data.err)
|
|
|
|
} else {
|
|
|
|
fsm.pool.processedCurrentHeightBlock()
|
|
|
|
if fsm.pool.reachedMaxHeight() {
|
|
|
|
fsm.stop()
|
|
|
|
return finished, nil
|
|
|
|
}
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
return waitForBlock, data.err
|
2019-03-26 09:58:30 +01:00
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
case peerRemoveEv:
|
|
|
|
// This event is sent by the switch to remove disconnected and errored peers.
|
2019-03-27 14:33:11 +01:00
|
|
|
fsm.pool.removePeer(data.peerId, data.err)
|
2019-04-04 00:13:32 +02:00
|
|
|
return waitForBlock, nil
|
|
|
|
|
|
|
|
case makeRequestsEv:
|
2019-04-12 22:02:30 -04:00
|
|
|
fsm.makeNextRequests(data.maxNumRequests)
|
|
|
|
return waitForBlock, nil
|
2019-03-26 09:58:30 +01:00
|
|
|
|
|
|
|
case stopFSMEv:
|
|
|
|
return finished, errNoErrorFinished
|
|
|
|
|
|
|
|
default:
|
|
|
|
return waitForBlock, errInvalidEvent
|
|
|
|
}
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
finished = &bReactorFSMState{
|
|
|
|
name: "finished",
|
|
|
|
enter: func(fsm *bReactorFSM) {
|
2019-04-04 00:13:32 +02:00
|
|
|
fsm.cleanup()
|
2019-03-26 09:58:30 +01:00
|
|
|
},
|
|
|
|
handle: func(fsm *bReactorFSM, ev bReactorEvent, data bReactorEventData) (*bReactorFSMState, error) {
|
|
|
|
return nil, nil
|
|
|
|
},
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
func NewFSM(height int64, toBcR bcRMessageInterface) *bReactorFSM {
|
2019-03-26 09:58:30 +01:00
|
|
|
return &bReactorFSM{
|
2019-03-27 14:33:11 +01:00
|
|
|
state: unknown,
|
2019-04-04 00:13:32 +02:00
|
|
|
startTime: time.Now(),
|
|
|
|
pool: newBlockPool(height, toBcR),
|
|
|
|
toBcR: toBcR,
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (fsm *bReactorFSM) setLogger(l log.Logger) {
|
|
|
|
fsm.logger = l
|
2019-03-27 14:33:11 +01:00
|
|
|
fsm.pool.setLogger(l)
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
func sendMessageToFSMSync(fsm *bReactorFSM, msg bReactorMessageData) error {
|
|
|
|
err := fsm.handle(&msg)
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Starts the FSM goroutine.
|
2019-03-26 09:58:30 +01:00
|
|
|
func (fsm *bReactorFSM) start() {
|
2019-04-04 00:13:32 +02:00
|
|
|
_ = sendMessageToFSMSync(fsm, bReactorMessageData{
|
|
|
|
event: startFSMEv,
|
|
|
|
})
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
// Stops the FSM goroutine.
|
2019-03-26 09:58:30 +01:00
|
|
|
func (fsm *bReactorFSM) stop() {
|
2019-04-04 00:13:32 +02:00
|
|
|
_ = sendMessageToFSMSync(fsm, bReactorMessageData{
|
2019-03-26 09:58:30 +01:00
|
|
|
event: stopFSMEv,
|
2019-04-04 00:13:32 +02:00
|
|
|
})
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// handle processes messages and events sent to the FSM.
|
|
|
|
func (fsm *bReactorFSM) handle(msg *bReactorMessageData) error {
|
2019-03-26 14:51:37 +01:00
|
|
|
fsm.logger.Debug("FSM received event", "event", msg.event, "state", fsm.state.name)
|
2019-03-26 09:58:30 +01:00
|
|
|
|
|
|
|
if fsm.state == nil {
|
|
|
|
fsm.state = unknown
|
|
|
|
}
|
|
|
|
next, err := fsm.state.handle(fsm, msg.event, msg.data)
|
|
|
|
if err != nil {
|
2019-03-26 14:51:37 +01:00
|
|
|
fsm.logger.Error("FSM event handler returned", "err", err, "state", fsm.state.name, "event", msg.event)
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
2019-03-26 14:51:37 +01:00
|
|
|
oldState := fsm.state.name
|
2019-03-26 09:58:30 +01:00
|
|
|
fsm.transition(next)
|
2019-03-26 14:51:37 +01:00
|
|
|
if oldState != fsm.state.name {
|
|
|
|
fsm.logger.Info("FSM changed state", "old_state", oldState, "event", msg.event, "new_state", fsm.state.name)
|
|
|
|
}
|
2019-03-26 09:58:30 +01:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
func (fsm *bReactorFSM) transition(next *bReactorFSMState) {
|
|
|
|
if next == nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if fsm.state != next {
|
|
|
|
fsm.state = next
|
|
|
|
if next.enter != nil {
|
|
|
|
next.enter(fsm)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// FSM state timeout handler
|
|
|
|
func (fsm *bReactorFSM) sendStateTimeoutEvent(stateName string) {
|
|
|
|
// Check that the timeout is for the state we are currently in to prevent wrong transitions.
|
|
|
|
if stateName == fsm.state.name {
|
|
|
|
msg := bReactorMessageData{
|
|
|
|
event: stateTimeoutEv,
|
|
|
|
data: bReactorEventData{
|
|
|
|
stateName: stateName,
|
|
|
|
},
|
|
|
|
}
|
2019-04-04 00:13:32 +02:00
|
|
|
_ = sendMessageToFSMSync(fsm, msg)
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
// Called when entering an FSM state in order to detect lack of progress in the state machine.
|
|
|
|
// Note the use of the 'bcr' interface to facilitate testing without timer expiring.
|
2019-03-26 09:58:30 +01:00
|
|
|
func (fsm *bReactorFSM) resetStateTimer(state *bReactorFSMState) {
|
2019-04-04 00:13:32 +02:00
|
|
|
fsm.toBcR.resetStateTimer(state.name, state.timer, state.timeout, func() {
|
2019-03-26 09:58:30 +01:00
|
|
|
fsm.sendStateTimeoutEvent(state.name)
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
func (fsm *bReactorFSM) isCaughtUp() bool {
|
|
|
|
// Some conditions to determine if we're caught up.
|
|
|
|
// Ensures we've either received a block or waited some amount of time,
|
|
|
|
// and that we're synced to the highest known height.
|
|
|
|
// Note we use maxPeerHeight - 1 because to sync block H requires block H+1
|
|
|
|
// to verify the LastCommit.
|
|
|
|
receivedBlockOrTimedOut := fsm.pool.height > 0 || time.Since(fsm.startTime) > 5*time.Second
|
|
|
|
ourChainIsLongestAmongPeers := fsm.pool.maxPeerHeight == 0 || fsm.pool.height >= (fsm.pool.maxPeerHeight-1) || fsm.state == finished
|
|
|
|
isCaughtUp := receivedBlockOrTimedOut && ourChainIsLongestAmongPeers
|
|
|
|
|
|
|
|
return isCaughtUp
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
|
|
|
|
2019-04-04 00:13:32 +02:00
|
|
|
func (fsm *bReactorFSM) cleanup() {
|
|
|
|
// TODO
|
2019-03-26 09:58:30 +01:00
|
|
|
}
|
2019-03-27 19:54:08 +01:00
|
|
|
|
2019-04-12 22:02:30 -04:00
|
|
|
func (fsm *bReactorFSM) makeNextRequests(maxNumPendingRequests int32) {
|
|
|
|
fsm.pool.makeNextRequests(maxNumPendingRequests)
|
2019-03-27 19:54:08 +01:00
|
|
|
}
|