You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1503 lines
52 KiB

10 years ago
7 years ago
8 years ago
7 years ago
10 years ago
10 years ago
9 years ago
9 years ago
9 years ago
9 years ago
9 years ago
10 years ago
8 years ago
8 years ago
10 years ago
10 years ago
8 years ago
10 years ago
9 years ago
9 years ago
8 years ago
10 years ago
10 years ago
10 years ago
8 years ago
9 years ago
9 years ago
8 years ago
9 years ago
8 years ago
8 years ago
8 years ago
7 years ago
8 years ago
8 years ago
8 years ago
8 years ago
10 years ago
8 years ago
10 years ago
8 years ago
9 years ago
9 years ago
7 years ago
7 years ago
7 years ago
7 years ago
7 years ago
7 years ago
7 years ago
7 years ago
7 years ago
7 years ago
10 years ago
8 years ago
8 years ago
10 years ago
8 years ago
8 years ago
10 years ago
10 years ago
10 years ago
8 years ago
9 years ago
9 years ago
9 years ago
8 years ago
10 years ago
8 years ago
8 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
7 years ago
8 years ago
8 years ago
8 years ago
10 years ago
8 years ago
10 years ago
10 years ago
8 years ago
8 years ago
10 years ago
10 years ago
8 years ago
8 years ago
10 years ago
10 years ago
8 years ago
10 years ago
10 years ago
8 years ago
10 years ago
10 years ago
9 years ago
8 years ago
8 years ago
9 years ago
8 years ago
10 years ago
8 years ago
9 years ago
9 years ago
10 years ago
10 years ago
10 years ago
10 years ago
10 years ago
9 years ago
9 years ago
9 years ago
8 years ago
9 years ago
9 years ago
8 years ago
10 years ago
10 years ago
8 years ago
8 years ago
8 years ago
8 years ago
9 years ago
9 years ago
10 years ago
10 years ago
9 years ago
10 years ago
9 years ago
8 years ago
9 years ago
8 years ago
9 years ago
8 years ago
9 years ago
9 years ago
8 years ago
8 years ago
10 years ago
8 years ago
10 years ago
  1. package consensus
  2. import (
  3. "bytes"
  4. "errors"
  5. "fmt"
  6. "path/filepath"
  7. "reflect"
  8. "runtime/debug"
  9. "sync"
  10. "time"
  11. fail "github.com/ebuchman/fail-test"
  12. wire "github.com/tendermint/go-wire"
  13. cmn "github.com/tendermint/tmlibs/common"
  14. "github.com/tendermint/tmlibs/log"
  15. cfg "github.com/tendermint/tendermint/config"
  16. cstypes "github.com/tendermint/tendermint/consensus/types"
  17. "github.com/tendermint/tendermint/proxy"
  18. sm "github.com/tendermint/tendermint/state"
  19. "github.com/tendermint/tendermint/types"
  20. )
  21. //-----------------------------------------------------------------------------
  22. // Config
  // proposalHeartbeatIntervalSeconds is the number of seconds proposalHeartbeat
  // sleeps between two consecutive heartbeats.
  const proposalHeartbeatIntervalSeconds = 2
  26. //-----------------------------------------------------------------------------
  27. // Errors
  // Sentinel errors of the consensus state machine.
  var (
  	// ErrInvalidProposalSignature reports an invalid proposal signature.
  	ErrInvalidProposalSignature = errors.New("Error invalid proposal signature")

  	// ErrInvalidProposalPOLRound reports an invalid proposal POL round.
  	ErrInvalidProposalPOLRound = errors.New("Error invalid proposal POL round")

  	// ErrAddingVote reports a failure to add a vote; handleMsg compares the
  	// result of tryAddVote against it.
  	ErrAddingVote = errors.New("Error adding vote")

  	// ErrVoteHeightMismatch reports a vote whose height does not match.
  	ErrVoteHeightMismatch = errors.New("Error vote height mismatch")
  )
  34. //-----------------------------------------------------------------------------
  // msgQueueSize is the buffer capacity given to both the peer and the
  // internal message queues in NewConsensusState.
  var msgQueueSize = 1000
  38. // msgs from the reactor which may update the state
  39. type msgInfo struct {
  40. Msg ConsensusMessage `json:"msg"`
  41. PeerKey string `json:"peer_key"`
  42. }
  43. // internally generated messages which may update the state
  44. type timeoutInfo struct {
  45. Duration time.Duration `json:"duration"`
  46. Height int `json:"height"`
  47. Round int `json:"round"`
  48. Step cstypes.RoundStepType `json:"step"`
  49. }
  50. func (ti *timeoutInfo) String() string {
  51. return fmt.Sprintf("%v ; %d/%d %v", ti.Duration, ti.Height, ti.Round, ti.Step)
  52. }
  53. // ConsensusState handles execution of the consensus algorithm.
  54. // It processes votes and proposals, and upon reaching agreement,
  55. // commits blocks to the chain and executes them against the application.
  56. // The internal state machine receives input from peers, the internal validator, and from a timer.
  57. type ConsensusState struct {
  58. cmn.BaseService
  59. // config details
  60. config *cfg.ConsensusConfig
  61. privValidator types.PrivValidator // for signing votes
  62. // services for creating and executing blocks
  63. proxyAppConn proxy.AppConnConsensus
  64. blockStore types.BlockStore
  65. mempool types.Mempool
  66. // internal state
  67. mtx sync.Mutex
  68. cstypes.RoundState
  69. state *sm.State // State until height-1.
  70. // state changes may be triggered by msgs from peers,
  71. // msgs from ourself, or by timeouts
  72. peerMsgQueue chan msgInfo
  73. internalMsgQueue chan msgInfo
  74. timeoutTicker TimeoutTicker
  75. // we use PubSub to trigger msg broadcasts in the reactor,
  76. // and to notify external subscribers, eg. through a websocket
  77. evsw types.EventSwitch
  78. // a Write-Ahead Log ensures we can recover from any kind of crash
  79. // and helps us avoid signing conflicting votes
  80. wal *WAL
  81. replayMode bool // so we don't log signing errors during replay
  82. // for tests where we want to limit the number of transitions the state makes
  83. nSteps int
  84. // some functions can be overwritten for testing
  85. decideProposal func(height, round int)
  86. doPrevote func(height, round int)
  87. setProposal func(proposal *types.Proposal) error
  88. // closed when we finish shutting down
  89. done chan struct{}
  90. }
  91. // NewConsensusState returns a new ConsensusState.
  92. func NewConsensusState(config *cfg.ConsensusConfig, state *sm.State, proxyAppConn proxy.AppConnConsensus, blockStore types.BlockStore, mempool types.Mempool) *ConsensusState {
  93. cs := &ConsensusState{
  94. config: config,
  95. proxyAppConn: proxyAppConn,
  96. blockStore: blockStore,
  97. mempool: mempool,
  98. peerMsgQueue: make(chan msgInfo, msgQueueSize),
  99. internalMsgQueue: make(chan msgInfo, msgQueueSize),
  100. timeoutTicker: NewTimeoutTicker(),
  101. done: make(chan struct{}),
  102. }
  103. // set function defaults (may be overwritten before calling Start)
  104. cs.decideProposal = cs.defaultDecideProposal
  105. cs.doPrevote = cs.defaultDoPrevote
  106. cs.setProposal = cs.defaultSetProposal
  107. cs.updateToState(state)
  108. // Don't call scheduleRound0 yet.
  109. // We do that upon Start().
  110. cs.reconstructLastCommit(state)
  111. cs.BaseService = *cmn.NewBaseService(nil, "ConsensusState", cs)
  112. return cs
  113. }
  114. //----------------------------------------
  115. // Public interface
  116. // SetLogger implements Service.
  117. func (cs *ConsensusState) SetLogger(l log.Logger) {
  118. cs.BaseService.Logger = l
  119. cs.timeoutTicker.SetLogger(l)
  120. }
  121. // SetEventSwitch implements events.Eventable
  122. func (cs *ConsensusState) SetEventSwitch(evsw types.EventSwitch) {
  123. cs.evsw = evsw
  124. }
  125. // String returns a string.
  126. func (cs *ConsensusState) String() string {
  127. // better not to access shared variables
  128. return cmn.Fmt("ConsensusState") //(H:%v R:%v S:%v", cs.Height, cs.Round, cs.Step)
  129. }
  130. // GetState returns a copy of the chain state.
  131. func (cs *ConsensusState) GetState() *sm.State {
  132. cs.mtx.Lock()
  133. defer cs.mtx.Unlock()
  134. return cs.state.Copy()
  135. }
  136. // GetRoundState returns a copy of the internal consensus state.
  137. func (cs *ConsensusState) GetRoundState() *cstypes.RoundState {
  138. cs.mtx.Lock()
  139. defer cs.mtx.Unlock()
  140. return cs.getRoundState()
  141. }
  142. func (cs *ConsensusState) getRoundState() *cstypes.RoundState {
  143. rs := cs.RoundState // copy
  144. return &rs
  145. }
  146. // GetValidators returns a copy of the current validators.
  147. func (cs *ConsensusState) GetValidators() (int, []*types.Validator) {
  148. cs.mtx.Lock()
  149. defer cs.mtx.Unlock()
  150. return cs.state.LastBlockHeight, cs.state.Validators.Copy().Validators
  151. }
  152. // SetPrivValidator sets the private validator account for signing votes.
  153. func (cs *ConsensusState) SetPrivValidator(priv types.PrivValidator) {
  154. cs.mtx.Lock()
  155. defer cs.mtx.Unlock()
  156. cs.privValidator = priv
  157. }
  158. // SetTimeoutTicker sets the local timer. It may be useful to overwrite for testing.
  159. func (cs *ConsensusState) SetTimeoutTicker(timeoutTicker TimeoutTicker) {
  160. cs.mtx.Lock()
  161. defer cs.mtx.Unlock()
  162. cs.timeoutTicker = timeoutTicker
  163. }
  164. // LoadCommit loads the commit for a given height.
  165. func (cs *ConsensusState) LoadCommit(height int) *types.Commit {
  166. cs.mtx.Lock()
  167. defer cs.mtx.Unlock()
  168. if height == cs.blockStore.Height() {
  169. return cs.blockStore.LoadSeenCommit(height)
  170. }
  171. return cs.blockStore.LoadBlockCommit(height)
  172. }
  173. // OnStart implements cmn.Service.
  174. // It loads the latest state via the WAL, and starts the timeout and receive routines.
  175. func (cs *ConsensusState) OnStart() error {
  176. walFile := cs.config.WalFile()
  177. if err := cs.OpenWAL(walFile); err != nil {
  178. cs.Logger.Error("Error loading ConsensusState wal", "err", err.Error())
  179. return err
  180. }
  181. // we need the timeoutRoutine for replay so
  182. // we don't block on the tick chan.
  183. // NOTE: we will get a build up of garbage go routines
  184. // firing on the tockChan until the receiveRoutine is started
  185. // to deal with them (by that point, at most one will be valid)
  186. cs.timeoutTicker.Start()
  187. // we may have lost some votes if the process crashed
  188. // reload from consensus log to catchup
  189. if err := cs.catchupReplay(cs.Height); err != nil {
  190. cs.Logger.Error("Error on catchup replay. Proceeding to start ConsensusState anyway", "err", err.Error())
  191. // NOTE: if we ever do return an error here,
  192. // make sure to stop the timeoutTicker
  193. }
  194. // now start the receiveRoutine
  195. go cs.receiveRoutine(0)
  196. // schedule the first round!
  197. // use GetRoundState so we don't race the receiveRoutine for access
  198. cs.scheduleRound0(cs.GetRoundState())
  199. return nil
  200. }
  201. // timeoutRoutine: receive requests for timeouts on tickChan and fire timeouts on tockChan
  202. // receiveRoutine: serializes processing of proposoals, block parts, votes; coordinates state transitions
  203. func (cs *ConsensusState) startRoutines(maxSteps int) {
  204. cs.timeoutTicker.Start()
  205. go cs.receiveRoutine(maxSteps)
  206. }
  207. // OnStop implements cmn.Service. It stops all routines and waits for the WAL to finish.
  208. func (cs *ConsensusState) OnStop() {
  209. cs.BaseService.OnStop()
  210. cs.timeoutTicker.Stop()
  211. // Make BaseService.Wait() wait until cs.wal.Wait()
  212. if cs.wal != nil && cs.IsRunning() {
  213. cs.wal.Wait()
  214. }
  215. }
  216. // Wait waits for the the main routine to return.
  217. // NOTE: be sure to Stop() the event switch and drain
  218. // any event channels or this may deadlock
  219. func (cs *ConsensusState) Wait() {
  220. <-cs.done
  221. }
  222. // OpenWAL opens a file to log all consensus messages and timeouts for deterministic accountability
  223. func (cs *ConsensusState) OpenWAL(walFile string) (err error) {
  224. err = cmn.EnsureDir(filepath.Dir(walFile), 0700)
  225. if err != nil {
  226. cs.Logger.Error("Error ensuring ConsensusState wal dir", "err", err.Error())
  227. return err
  228. }
  229. cs.mtx.Lock()
  230. defer cs.mtx.Unlock()
  231. wal, err := NewWAL(walFile, cs.config.WalLight)
  232. if err != nil {
  233. return err
  234. }
  235. wal.SetLogger(cs.Logger.With("wal", walFile))
  236. if _, err := wal.Start(); err != nil {
  237. return err
  238. }
  239. cs.wal = wal
  240. return nil
  241. }
  242. //------------------------------------------------------------
  243. // Public interface for passing messages into the consensus state, possibly causing a state transition.
  244. // If peerKey == "", the msg is considered internal.
  245. // Messages are added to the appropriate queue (peer or internal).
  246. // If the queue is full, the function may block.
  247. // TODO: should these return anything or let callers just use events?
  248. // AddVote inputs a vote.
  249. func (cs *ConsensusState) AddVote(vote *types.Vote, peerKey string) (added bool, err error) {
  250. if peerKey == "" {
  251. cs.internalMsgQueue <- msgInfo{&VoteMessage{vote}, ""}
  252. } else {
  253. cs.peerMsgQueue <- msgInfo{&VoteMessage{vote}, peerKey}
  254. }
  255. // TODO: wait for event?!
  256. return false, nil
  257. }
  258. // SetProposal inputs a proposal.
  259. func (cs *ConsensusState) SetProposal(proposal *types.Proposal, peerKey string) error {
  260. if peerKey == "" {
  261. cs.internalMsgQueue <- msgInfo{&ProposalMessage{proposal}, ""}
  262. } else {
  263. cs.peerMsgQueue <- msgInfo{&ProposalMessage{proposal}, peerKey}
  264. }
  265. // TODO: wait for event?!
  266. return nil
  267. }
  268. // AddProposalBlockPart inputs a part of the proposal block.
  269. func (cs *ConsensusState) AddProposalBlockPart(height, round int, part *types.Part, peerKey string) error {
  270. if peerKey == "" {
  271. cs.internalMsgQueue <- msgInfo{&BlockPartMessage{height, round, part}, ""}
  272. } else {
  273. cs.peerMsgQueue <- msgInfo{&BlockPartMessage{height, round, part}, peerKey}
  274. }
  275. // TODO: wait for event?!
  276. return nil
  277. }
  278. // SetProposalAndBlock inputs the proposal and all block parts.
  279. func (cs *ConsensusState) SetProposalAndBlock(proposal *types.Proposal, block *types.Block, parts *types.PartSet, peerKey string) error {
  280. cs.SetProposal(proposal, peerKey)
  281. for i := 0; i < parts.Total(); i++ {
  282. part := parts.GetPart(i)
  283. cs.AddProposalBlockPart(proposal.Height, proposal.Round, part, peerKey)
  284. }
  285. return nil // TODO errors
  286. }
  287. //------------------------------------------------------------
  288. // internal functions for managing the state
  289. func (cs *ConsensusState) updateHeight(height int) {
  290. cs.Height = height
  291. }
  292. func (cs *ConsensusState) updateRoundStep(round int, step cstypes.RoundStepType) {
  293. cs.Round = round
  294. cs.Step = step
  295. }
  296. // enterNewRound(height, 0) at cs.StartTime.
  297. func (cs *ConsensusState) scheduleRound0(rs *cstypes.RoundState) {
  298. //cs.Logger.Info("scheduleRound0", "now", time.Now(), "startTime", cs.StartTime)
  299. sleepDuration := rs.StartTime.Sub(time.Now())
  300. cs.scheduleTimeout(sleepDuration, rs.Height, 0, cstypes.RoundStepNewHeight)
  301. }
  302. // Attempt to schedule a timeout (by sending timeoutInfo on the tickChan)
  303. func (cs *ConsensusState) scheduleTimeout(duration time.Duration, height, round int, step cstypes.RoundStepType) {
  304. cs.timeoutTicker.ScheduleTimeout(timeoutInfo{duration, height, round, step})
  305. }
  306. // send a msg into the receiveRoutine regarding our own proposal, block part, or vote
  307. func (cs *ConsensusState) sendInternalMessage(mi msgInfo) {
  308. select {
  309. case cs.internalMsgQueue <- mi:
  310. default:
  311. // NOTE: using the go-routine means our votes can
  312. // be processed out of order.
  313. // TODO: use CList here for strict determinism and
  314. // attempt push to internalMsgQueue in receiveRoutine
  315. cs.Logger.Info("Internal msg queue is full. Using a go-routine")
  316. go func() { cs.internalMsgQueue <- mi }()
  317. }
  318. }
  319. // Reconstruct LastCommit from SeenCommit, which we saved along with the block,
  320. // (which happens even before saving the state)
  321. func (cs *ConsensusState) reconstructLastCommit(state *sm.State) {
  322. if state.LastBlockHeight == 0 {
  323. return
  324. }
  325. seenCommit := cs.blockStore.LoadSeenCommit(state.LastBlockHeight)
  326. lastPrecommits := types.NewVoteSet(state.ChainID, state.LastBlockHeight, seenCommit.Round(), types.VoteTypePrecommit, state.LastValidators)
  327. for _, precommit := range seenCommit.Precommits {
  328. if precommit == nil {
  329. continue
  330. }
  331. added, err := lastPrecommits.AddVote(precommit)
  332. if !added || err != nil {
  333. cmn.PanicCrisis(cmn.Fmt("Failed to reconstruct LastCommit: %v", err))
  334. }
  335. }
  336. if !lastPrecommits.HasTwoThirdsMajority() {
  337. cmn.PanicSanity("Failed to reconstruct LastCommit: Does not have +2/3 maj")
  338. }
  339. cs.LastCommit = lastPrecommits
  340. }
  341. // Updates ConsensusState and increments height to match that of state.
  342. // The round becomes 0 and cs.Step becomes cstypes.RoundStepNewHeight.
  343. func (cs *ConsensusState) updateToState(state *sm.State) {
  344. if cs.CommitRound > -1 && 0 < cs.Height && cs.Height != state.LastBlockHeight {
  345. cmn.PanicSanity(cmn.Fmt("updateToState() expected state height of %v but found %v",
  346. cs.Height, state.LastBlockHeight))
  347. }
  348. if cs.state != nil && cs.state.LastBlockHeight+1 != cs.Height {
  349. // This might happen when someone else is mutating cs.state.
  350. // Someone forgot to pass in state.Copy() somewhere?!
  351. cmn.PanicSanity(cmn.Fmt("Inconsistent cs.state.LastBlockHeight+1 %v vs cs.Height %v",
  352. cs.state.LastBlockHeight+1, cs.Height))
  353. }
  354. // If state isn't further out than cs.state, just ignore.
  355. // This happens when SwitchToConsensus() is called in the reactor.
  356. // We don't want to reset e.g. the Votes.
  357. if cs.state != nil && (state.LastBlockHeight <= cs.state.LastBlockHeight) {
  358. cs.Logger.Info("Ignoring updateToState()", "newHeight", state.LastBlockHeight+1, "oldHeight", cs.state.LastBlockHeight+1)
  359. return
  360. }
  361. // Reset fields based on state.
  362. validators := state.Validators
  363. lastPrecommits := (*types.VoteSet)(nil)
  364. if cs.CommitRound > -1 && cs.Votes != nil {
  365. if !cs.Votes.Precommits(cs.CommitRound).HasTwoThirdsMajority() {
  366. cmn.PanicSanity("updateToState(state) called but last Precommit round didn't have +2/3")
  367. }
  368. lastPrecommits = cs.Votes.Precommits(cs.CommitRound)
  369. }
  370. // Next desired block height
  371. height := state.LastBlockHeight + 1
  372. // RoundState fields
  373. cs.updateHeight(height)
  374. cs.updateRoundStep(0, cstypes.RoundStepNewHeight)
  375. if cs.CommitTime.IsZero() {
  376. // "Now" makes it easier to sync up dev nodes.
  377. // We add timeoutCommit to allow transactions
  378. // to be gathered for the first block.
  379. // And alternative solution that relies on clocks:
  380. // cs.StartTime = state.LastBlockTime.Add(timeoutCommit)
  381. cs.StartTime = cs.config.Commit(time.Now())
  382. } else {
  383. cs.StartTime = cs.config.Commit(cs.CommitTime)
  384. }
  385. cs.Validators = validators
  386. cs.Proposal = nil
  387. cs.ProposalBlock = nil
  388. cs.ProposalBlockParts = nil
  389. cs.LockedRound = 0
  390. cs.LockedBlock = nil
  391. cs.LockedBlockParts = nil
  392. cs.Votes = cstypes.NewHeightVoteSet(state.ChainID, height, validators)
  393. cs.CommitRound = -1
  394. cs.LastCommit = lastPrecommits
  395. cs.LastValidators = state.LastValidators
  396. cs.state = state
  397. // Finally, broadcast RoundState
  398. cs.newStep()
  399. }
  400. func (cs *ConsensusState) newStep() {
  401. rs := cs.RoundStateEvent()
  402. cs.wal.Save(rs)
  403. cs.nSteps += 1
  404. // newStep is called by updateToStep in NewConsensusState before the evsw is set!
  405. if cs.evsw != nil {
  406. types.FireEventNewRoundStep(cs.evsw, rs)
  407. }
  408. }
  409. //-----------------------------------------
  410. // the main go routines
  411. // receiveRoutine handles messages which may cause state transitions.
  412. // it's argument (n) is the number of messages to process before exiting - use 0 to run forever
  413. // It keeps the RoundState and is the only thing that updates it.
  414. // Updates (state transitions) happen on timeouts, complete proposals, and 2/3 majorities.
  415. // ConsensusState must be locked before any internal state is updated.
  416. func (cs *ConsensusState) receiveRoutine(maxSteps int) {
  417. defer func() {
  418. if r := recover(); r != nil {
  419. cs.Logger.Error("CONSENSUS FAILURE!!!", "err", r, "stack", string(debug.Stack()))
  420. }
  421. }()
  422. for {
  423. if maxSteps > 0 {
  424. if cs.nSteps >= maxSteps {
  425. cs.Logger.Info("reached max steps. exiting receive routine")
  426. cs.nSteps = 0
  427. return
  428. }
  429. }
  430. rs := cs.RoundState
  431. var mi msgInfo
  432. select {
  433. case height := <-cs.mempool.TxsAvailable():
  434. cs.handleTxsAvailable(height)
  435. case mi = <-cs.peerMsgQueue:
  436. cs.wal.Save(mi)
  437. // handles proposals, block parts, votes
  438. // may generate internal events (votes, complete proposals, 2/3 majorities)
  439. cs.handleMsg(mi)
  440. case mi = <-cs.internalMsgQueue:
  441. cs.wal.Save(mi)
  442. // handles proposals, block parts, votes
  443. cs.handleMsg(mi)
  444. case ti := <-cs.timeoutTicker.Chan(): // tockChan:
  445. cs.wal.Save(ti)
  446. // if the timeout is relevant to the rs
  447. // go to the next step
  448. cs.handleTimeout(ti, rs)
  449. case <-cs.Quit:
  450. // NOTE: the internalMsgQueue may have signed messages from our
  451. // priv_val that haven't hit the WAL, but its ok because
  452. // priv_val tracks LastSig
  453. // close wal now that we're done writing to it
  454. if cs.wal != nil {
  455. cs.wal.Stop()
  456. }
  457. close(cs.done)
  458. return
  459. }
  460. }
  461. }
  462. // state transitions on complete-proposal, 2/3-any, 2/3-one
  463. func (cs *ConsensusState) handleMsg(mi msgInfo) {
  464. cs.mtx.Lock()
  465. defer cs.mtx.Unlock()
  466. var err error
  467. msg, peerKey := mi.Msg, mi.PeerKey
  468. switch msg := msg.(type) {
  469. case *ProposalMessage:
  470. // will not cause transition.
  471. // once proposal is set, we can receive block parts
  472. err = cs.setProposal(msg.Proposal)
  473. case *BlockPartMessage:
  474. // if the proposal is complete, we'll enterPrevote or tryFinalizeCommit
  475. _, err = cs.addProposalBlockPart(msg.Height, msg.Part, peerKey != "")
  476. if err != nil && msg.Round != cs.Round {
  477. err = nil
  478. }
  479. case *VoteMessage:
  480. // attempt to add the vote and dupeout the validator if its a duplicate signature
  481. // if the vote gives us a 2/3-any or 2/3-one, we transition
  482. err := cs.tryAddVote(msg.Vote, peerKey)
  483. if err == ErrAddingVote {
  484. // TODO: punish peer
  485. }
  486. // NOTE: the vote is broadcast to peers by the reactor listening
  487. // for vote events
  488. // TODO: If rs.Height == vote.Height && rs.Round < vote.Round,
  489. // the peer is sending us CatchupCommit precommits.
  490. // We could make note of this and help filter in broadcastHasVoteMessage().
  491. default:
  492. cs.Logger.Error("Unknown msg type", reflect.TypeOf(msg))
  493. }
  494. if err != nil {
  495. cs.Logger.Error("Error with msg", "type", reflect.TypeOf(msg), "peer", peerKey, "err", err, "msg", msg)
  496. }
  497. }
  498. func (cs *ConsensusState) handleTimeout(ti timeoutInfo, rs cstypes.RoundState) {
  499. cs.Logger.Debug("Received tock", "timeout", ti.Duration, "height", ti.Height, "round", ti.Round, "step", ti.Step)
  500. // timeouts must be for current height, round, step
  501. if ti.Height != rs.Height || ti.Round < rs.Round || (ti.Round == rs.Round && ti.Step < rs.Step) {
  502. cs.Logger.Debug("Ignoring tock because we're ahead", "height", rs.Height, "round", rs.Round, "step", rs.Step)
  503. return
  504. }
  505. // the timeout will now cause a state transition
  506. cs.mtx.Lock()
  507. defer cs.mtx.Unlock()
  508. switch ti.Step {
  509. case cstypes.RoundStepNewHeight:
  510. // NewRound event fired from enterNewRound.
  511. // XXX: should we fire timeout here (for timeout commit)?
  512. cs.enterNewRound(ti.Height, 0)
  513. case cstypes.RoundStepNewRound:
  514. cs.enterPropose(ti.Height, 0)
  515. case cstypes.RoundStepPropose:
  516. types.FireEventTimeoutPropose(cs.evsw, cs.RoundStateEvent())
  517. cs.enterPrevote(ti.Height, ti.Round)
  518. case cstypes.RoundStepPrevoteWait:
  519. types.FireEventTimeoutWait(cs.evsw, cs.RoundStateEvent())
  520. cs.enterPrecommit(ti.Height, ti.Round)
  521. case cstypes.RoundStepPrecommitWait:
  522. types.FireEventTimeoutWait(cs.evsw, cs.RoundStateEvent())
  523. cs.enterNewRound(ti.Height, ti.Round+1)
  524. default:
  525. panic(cmn.Fmt("Invalid timeout step: %v", ti.Step))
  526. }
  527. }
  528. func (cs *ConsensusState) handleTxsAvailable(height int) {
  529. cs.mtx.Lock()
  530. defer cs.mtx.Unlock()
  531. // we only need to do this for round 0
  532. cs.enterPropose(height, 0)
  533. }
  534. //-----------------------------------------------------------------------------
  535. // State functions
  536. // Used internally by handleTimeout and handleMsg to make state transitions
  537. // Enter: `timeoutNewHeight` by startTime (commitTime+timeoutCommit),
  538. // or, if SkipTimeout==true, after receiving all precommits from (height,round-1)
  539. // Enter: `timeoutPrecommits` after any +2/3 precommits from (height,round-1)
  540. // Enter: +2/3 precommits for nil at (height,round-1)
  541. // Enter: +2/3 prevotes any or +2/3 precommits for block or any from (height, round)
  542. // NOTE: cs.StartTime was already set for height.
  543. func (cs *ConsensusState) enterNewRound(height int, round int) {
  544. if cs.Height != height || round < cs.Round || (cs.Round == round && cs.Step != cstypes.RoundStepNewHeight) {
  545. cs.Logger.Debug(cmn.Fmt("enterNewRound(%v/%v): Invalid args. Current step: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  546. return
  547. }
  548. if now := time.Now(); cs.StartTime.After(now) {
  549. cs.Logger.Info("Need to set a buffer and log message here for sanity.", "startTime", cs.StartTime, "now", now)
  550. }
  551. cs.Logger.Info(cmn.Fmt("enterNewRound(%v/%v). Current: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  552. // Increment validators if necessary
  553. validators := cs.Validators
  554. if cs.Round < round {
  555. validators = validators.Copy()
  556. validators.IncrementAccum(round - cs.Round)
  557. }
  558. // Setup new round
  559. // we don't fire newStep for this step,
  560. // but we fire an event, so update the round step first
  561. cs.updateRoundStep(round, cstypes.RoundStepNewRound)
  562. cs.Validators = validators
  563. if round == 0 {
  564. // We've already reset these upon new height,
  565. // and meanwhile we might have received a proposal
  566. // for round 0.
  567. } else {
  568. cs.Proposal = nil
  569. cs.ProposalBlock = nil
  570. cs.ProposalBlockParts = nil
  571. }
  572. cs.Votes.SetRound(round + 1) // also track next round (round+1) to allow round-skipping
  573. types.FireEventNewRound(cs.evsw, cs.RoundStateEvent())
  574. // Wait for txs to be available in the mempool
  575. // before we enterPropose in round 0. If the last block changed the app hash,
  576. // we may need an empty "proof" block, and enterPropose immediately.
  577. waitForTxs := cs.config.WaitForTxs() && round == 0 && !cs.needProofBlock(height)
  578. if waitForTxs {
  579. if cs.config.CreateEmptyBlocksInterval > 0 {
  580. cs.scheduleTimeout(cs.config.EmptyBlocksInterval(), height, round, cstypes.RoundStepNewRound)
  581. }
  582. go cs.proposalHeartbeat(height, round)
  583. } else {
  584. cs.enterPropose(height, round)
  585. }
  586. }
  587. // needProofBlock returns true on the first height (so the genesis app hash is signed right away)
  588. // and where the last block (height-1) caused the app hash to change
  589. func (cs *ConsensusState) needProofBlock(height int) bool {
  590. if height == 1 {
  591. return true
  592. }
  593. lastBlockMeta := cs.blockStore.LoadBlockMeta(height - 1)
  594. if !bytes.Equal(cs.state.AppHash, lastBlockMeta.Header.AppHash) {
  595. return true
  596. }
  597. return false
  598. }
  599. func (cs *ConsensusState) proposalHeartbeat(height, round int) {
  600. counter := 0
  601. addr := cs.privValidator.GetAddress()
  602. valIndex, v := cs.Validators.GetByAddress(addr)
  603. if v == nil {
  604. // not a validator
  605. valIndex = -1
  606. }
  607. chainID := cs.state.ChainID
  608. for {
  609. rs := cs.GetRoundState()
  610. // if we've already moved on, no need to send more heartbeats
  611. if rs.Step > cstypes.RoundStepNewRound || rs.Round > round || rs.Height > height {
  612. return
  613. }
  614. heartbeat := &types.Heartbeat{
  615. Height: rs.Height,
  616. Round: rs.Round,
  617. Sequence: counter,
  618. ValidatorAddress: addr,
  619. ValidatorIndex: valIndex,
  620. }
  621. cs.privValidator.SignHeartbeat(chainID, heartbeat)
  622. heartbeatEvent := types.EventDataProposalHeartbeat{heartbeat}
  623. types.FireEventProposalHeartbeat(cs.evsw, heartbeatEvent)
  624. counter += 1
  625. time.Sleep(proposalHeartbeatIntervalSeconds * time.Second)
  626. }
  627. }
  628. // Enter (CreateEmptyBlocks): from enterNewRound(height,round)
  629. // Enter (CreateEmptyBlocks, CreateEmptyBlocksInterval > 0 ): after enterNewRound(height,round), after timeout of CreateEmptyBlocksInterval
  630. // Enter (!CreateEmptyBlocks) : after enterNewRound(height,round), once txs are in the mempool
  631. func (cs *ConsensusState) enterPropose(height int, round int) {
  632. if cs.Height != height || round < cs.Round || (cs.Round == round && cstypes.RoundStepPropose <= cs.Step) {
  633. cs.Logger.Debug(cmn.Fmt("enterPropose(%v/%v): Invalid args. Current step: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  634. return
  635. }
  636. cs.Logger.Info(cmn.Fmt("enterPropose(%v/%v). Current: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  637. defer func() {
  638. // Done enterPropose:
  639. cs.updateRoundStep(round, cstypes.RoundStepPropose)
  640. cs.newStep()
  641. // If we have the whole proposal + POL, then goto Prevote now.
  642. // else, we'll enterPrevote when the rest of the proposal is received (in AddProposalBlockPart),
  643. // or else after timeoutPropose
  644. if cs.isProposalComplete() {
  645. cs.enterPrevote(height, cs.Round)
  646. }
  647. }()
  648. // If we don't get the proposal and all block parts quick enough, enterPrevote
  649. cs.scheduleTimeout(cs.config.Propose(round), height, round, cstypes.RoundStepPropose)
  650. // Nothing more to do if we're not a validator
  651. if cs.privValidator == nil {
  652. cs.Logger.Debug("This node is not a validator")
  653. return
  654. }
  655. if !cs.isProposer() {
  656. cs.Logger.Info("enterPropose: Not our turn to propose", "proposer", cs.Validators.GetProposer().Address, "privValidator", cs.privValidator)
  657. if cs.Validators.HasAddress(cs.privValidator.GetAddress()) {
  658. cs.Logger.Debug("This node is a validator")
  659. } else {
  660. cs.Logger.Debug("This node is not a validator")
  661. }
  662. } else {
  663. cs.Logger.Info("enterPropose: Our turn to propose", "proposer", cs.Validators.GetProposer().Address, "privValidator", cs.privValidator)
  664. cs.Logger.Debug("This node is a validator")
  665. cs.decideProposal(height, round)
  666. }
  667. }
  668. func (cs *ConsensusState) isProposer() bool {
  669. return bytes.Equal(cs.Validators.GetProposer().Address, cs.privValidator.GetAddress())
  670. }
  671. func (cs *ConsensusState) defaultDecideProposal(height, round int) {
  672. var block *types.Block
  673. var blockParts *types.PartSet
  674. // Decide on block
  675. if cs.LockedBlock != nil {
  676. // If we're locked onto a block, just choose that.
  677. block, blockParts = cs.LockedBlock, cs.LockedBlockParts
  678. } else {
  679. // Create a new proposal block from state/txs from the mempool.
  680. block, blockParts = cs.createProposalBlock()
  681. if block == nil { // on error
  682. return
  683. }
  684. }
  685. // Make proposal
  686. polRound, polBlockID := cs.Votes.POLInfo()
  687. proposal := types.NewProposal(height, round, blockParts.Header(), polRound, polBlockID)
  688. if err := cs.privValidator.SignProposal(cs.state.ChainID, proposal); err == nil {
  689. // Set fields
  690. /* fields set by setProposal and addBlockPart
  691. cs.Proposal = proposal
  692. cs.ProposalBlock = block
  693. cs.ProposalBlockParts = blockParts
  694. */
  695. // send proposal and block parts on internal msg queue
  696. cs.sendInternalMessage(msgInfo{&ProposalMessage{proposal}, ""})
  697. for i := 0; i < blockParts.Total(); i++ {
  698. part := blockParts.GetPart(i)
  699. cs.sendInternalMessage(msgInfo{&BlockPartMessage{cs.Height, cs.Round, part}, ""})
  700. }
  701. cs.Logger.Info("Signed proposal", "height", height, "round", round, "proposal", proposal)
  702. cs.Logger.Debug(cmn.Fmt("Signed proposal block: %v", block))
  703. } else {
  704. if !cs.replayMode {
  705. cs.Logger.Error("enterPropose: Error signing proposal", "height", height, "round", round, "err", err)
  706. }
  707. }
  708. }
  709. // Returns true if the proposal block is complete &&
  710. // (if POLRound was proposed, we have +2/3 prevotes from there).
  711. func (cs *ConsensusState) isProposalComplete() bool {
  712. if cs.Proposal == nil || cs.ProposalBlock == nil {
  713. return false
  714. }
  715. // we have the proposal. if there's a POLRound,
  716. // make sure we have the prevotes from it too
  717. if cs.Proposal.POLRound < 0 {
  718. return true
  719. } else {
  720. // if this is false the proposer is lying or we haven't received the POL yet
  721. return cs.Votes.Prevotes(cs.Proposal.POLRound).HasTwoThirdsMajority()
  722. }
  723. }
  724. // Create the next block to propose and return it.
  725. // Returns nil block upon error.
  726. // NOTE: keep it side-effect free for clarity.
  727. func (cs *ConsensusState) createProposalBlock() (block *types.Block, blockParts *types.PartSet) {
  728. var commit *types.Commit
  729. if cs.Height == 1 {
  730. // We're creating a proposal for the first block.
  731. // The commit is empty, but not nil.
  732. commit = &types.Commit{}
  733. } else if cs.LastCommit.HasTwoThirdsMajority() {
  734. // Make the commit from LastCommit
  735. commit = cs.LastCommit.MakeCommit()
  736. } else {
  737. // This shouldn't happen.
  738. cs.Logger.Error("enterPropose: Cannot propose anything: No commit for the previous block.")
  739. return
  740. }
  741. // Mempool validated transactions
  742. txs := cs.mempool.Reap(cs.config.MaxBlockSizeTxs)
  743. return types.MakeBlock(cs.Height, cs.state.ChainID, txs, commit,
  744. cs.state.LastBlockID, cs.state.Validators.Hash(),
  745. cs.state.AppHash, cs.state.Params.BlockPartSizeBytes)
  746. }
  747. // Enter: `timeoutPropose` after entering Propose.
  748. // Enter: proposal block and POL is ready.
  749. // Enter: any +2/3 prevotes for future round.
  750. // Prevote for LockedBlock if we're locked, or ProposalBlock if valid.
  751. // Otherwise vote nil.
  752. func (cs *ConsensusState) enterPrevote(height int, round int) {
  753. if cs.Height != height || round < cs.Round || (cs.Round == round && cstypes.RoundStepPrevote <= cs.Step) {
  754. cs.Logger.Debug(cmn.Fmt("enterPrevote(%v/%v): Invalid args. Current step: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  755. return
  756. }
  757. defer func() {
  758. // Done enterPrevote:
  759. cs.updateRoundStep(round, cstypes.RoundStepPrevote)
  760. cs.newStep()
  761. }()
  762. // fire event for how we got here
  763. if cs.isProposalComplete() {
  764. types.FireEventCompleteProposal(cs.evsw, cs.RoundStateEvent())
  765. } else {
  766. // we received +2/3 prevotes for a future round
  767. // TODO: catchup event?
  768. }
  769. cs.Logger.Info(cmn.Fmt("enterPrevote(%v/%v). Current: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  770. // Sign and broadcast vote as necessary
  771. cs.doPrevote(height, round)
  772. // Once `addVote` hits any +2/3 prevotes, we will go to PrevoteWait
  773. // (so we have more time to try and collect +2/3 prevotes for a single block)
  774. }
  775. func (cs *ConsensusState) defaultDoPrevote(height int, round int) {
  776. logger := cs.Logger.With("height", height, "round", round)
  777. // If a block is locked, prevote that.
  778. if cs.LockedBlock != nil {
  779. logger.Info("enterPrevote: Block was locked")
  780. cs.signAddVote(types.VoteTypePrevote, cs.LockedBlock.Hash(), cs.LockedBlockParts.Header())
  781. return
  782. }
  783. // If ProposalBlock is nil, prevote nil.
  784. if cs.ProposalBlock == nil {
  785. logger.Info("enterPrevote: ProposalBlock is nil")
  786. cs.signAddVote(types.VoteTypePrevote, nil, types.PartSetHeader{})
  787. return
  788. }
  789. // Validate proposal block
  790. err := cs.state.ValidateBlock(cs.ProposalBlock)
  791. if err != nil {
  792. // ProposalBlock is invalid, prevote nil.
  793. logger.Error("enterPrevote: ProposalBlock is invalid", "err", err)
  794. cs.signAddVote(types.VoteTypePrevote, nil, types.PartSetHeader{})
  795. return
  796. }
  797. // Prevote cs.ProposalBlock
  798. // NOTE: the proposal signature is validated when it is received,
  799. // and the proposal block parts are validated as they are received (against the merkle hash in the proposal)
  800. logger.Info("enterPrevote: ProposalBlock is valid")
  801. cs.signAddVote(types.VoteTypePrevote, cs.ProposalBlock.Hash(), cs.ProposalBlockParts.Header())
  802. }
  803. // Enter: any +2/3 prevotes at next round.
  804. func (cs *ConsensusState) enterPrevoteWait(height int, round int) {
  805. if cs.Height != height || round < cs.Round || (cs.Round == round && cstypes.RoundStepPrevoteWait <= cs.Step) {
  806. cs.Logger.Debug(cmn.Fmt("enterPrevoteWait(%v/%v): Invalid args. Current step: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  807. return
  808. }
  809. if !cs.Votes.Prevotes(round).HasTwoThirdsAny() {
  810. cmn.PanicSanity(cmn.Fmt("enterPrevoteWait(%v/%v), but Prevotes does not have any +2/3 votes", height, round))
  811. }
  812. cs.Logger.Info(cmn.Fmt("enterPrevoteWait(%v/%v). Current: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  813. defer func() {
  814. // Done enterPrevoteWait:
  815. cs.updateRoundStep(round, cstypes.RoundStepPrevoteWait)
  816. cs.newStep()
  817. }()
  818. // Wait for some more prevotes; enterPrecommit
  819. cs.scheduleTimeout(cs.config.Prevote(round), height, round, cstypes.RoundStepPrevoteWait)
  820. }
  821. // Enter: `timeoutPrevote` after any +2/3 prevotes.
  822. // Enter: +2/3 precomits for block or nil.
  823. // Enter: any +2/3 precommits for next round.
  824. // Lock & precommit the ProposalBlock if we have enough prevotes for it (a POL in this round)
  825. // else, unlock an existing lock and precommit nil if +2/3 of prevotes were nil,
  826. // else, precommit nil otherwise.
  827. func (cs *ConsensusState) enterPrecommit(height int, round int) {
  828. if cs.Height != height || round < cs.Round || (cs.Round == round && cstypes.RoundStepPrecommit <= cs.Step) {
  829. cs.Logger.Debug(cmn.Fmt("enterPrecommit(%v/%v): Invalid args. Current step: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  830. return
  831. }
  832. cs.Logger.Info(cmn.Fmt("enterPrecommit(%v/%v). Current: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  833. defer func() {
  834. // Done enterPrecommit:
  835. cs.updateRoundStep(round, cstypes.RoundStepPrecommit)
  836. cs.newStep()
  837. }()
  838. blockID, ok := cs.Votes.Prevotes(round).TwoThirdsMajority()
  839. // If we don't have a polka, we must precommit nil
  840. if !ok {
  841. if cs.LockedBlock != nil {
  842. cs.Logger.Info("enterPrecommit: No +2/3 prevotes during enterPrecommit while we're locked. Precommitting nil")
  843. } else {
  844. cs.Logger.Info("enterPrecommit: No +2/3 prevotes during enterPrecommit. Precommitting nil.")
  845. }
  846. cs.signAddVote(types.VoteTypePrecommit, nil, types.PartSetHeader{})
  847. return
  848. }
  849. // At this point +2/3 prevoted for a particular block or nil
  850. types.FireEventPolka(cs.evsw, cs.RoundStateEvent())
  851. // the latest POLRound should be this round
  852. polRound, _ := cs.Votes.POLInfo()
  853. if polRound < round {
  854. cmn.PanicSanity(cmn.Fmt("This POLRound should be %v but got %", round, polRound))
  855. }
  856. // +2/3 prevoted nil. Unlock and precommit nil.
  857. if len(blockID.Hash) == 0 {
  858. if cs.LockedBlock == nil {
  859. cs.Logger.Info("enterPrecommit: +2/3 prevoted for nil.")
  860. } else {
  861. cs.Logger.Info("enterPrecommit: +2/3 prevoted for nil. Unlocking")
  862. cs.LockedRound = 0
  863. cs.LockedBlock = nil
  864. cs.LockedBlockParts = nil
  865. types.FireEventUnlock(cs.evsw, cs.RoundStateEvent())
  866. }
  867. cs.signAddVote(types.VoteTypePrecommit, nil, types.PartSetHeader{})
  868. return
  869. }
  870. // At this point, +2/3 prevoted for a particular block.
  871. // If we're already locked on that block, precommit it, and update the LockedRound
  872. if cs.LockedBlock.HashesTo(blockID.Hash) {
  873. cs.Logger.Info("enterPrecommit: +2/3 prevoted locked block. Relocking")
  874. cs.LockedRound = round
  875. types.FireEventRelock(cs.evsw, cs.RoundStateEvent())
  876. cs.signAddVote(types.VoteTypePrecommit, blockID.Hash, blockID.PartsHeader)
  877. return
  878. }
  879. // If +2/3 prevoted for proposal block, stage and precommit it
  880. if cs.ProposalBlock.HashesTo(blockID.Hash) {
  881. cs.Logger.Info("enterPrecommit: +2/3 prevoted proposal block. Locking", "hash", blockID.Hash)
  882. // Validate the block.
  883. if err := cs.state.ValidateBlock(cs.ProposalBlock); err != nil {
  884. cmn.PanicConsensus(cmn.Fmt("enterPrecommit: +2/3 prevoted for an invalid block: %v", err))
  885. }
  886. cs.LockedRound = round
  887. cs.LockedBlock = cs.ProposalBlock
  888. cs.LockedBlockParts = cs.ProposalBlockParts
  889. types.FireEventLock(cs.evsw, cs.RoundStateEvent())
  890. cs.signAddVote(types.VoteTypePrecommit, blockID.Hash, blockID.PartsHeader)
  891. return
  892. }
  893. // There was a polka in this round for a block we don't have.
  894. // Fetch that block, unlock, and precommit nil.
  895. // The +2/3 prevotes for this round is the POL for our unlock.
  896. // TODO: In the future save the POL prevotes for justification.
  897. cs.LockedRound = 0
  898. cs.LockedBlock = nil
  899. cs.LockedBlockParts = nil
  900. if !cs.ProposalBlockParts.HasHeader(blockID.PartsHeader) {
  901. cs.ProposalBlock = nil
  902. cs.ProposalBlockParts = types.NewPartSetFromHeader(blockID.PartsHeader)
  903. }
  904. types.FireEventUnlock(cs.evsw, cs.RoundStateEvent())
  905. cs.signAddVote(types.VoteTypePrecommit, nil, types.PartSetHeader{})
  906. }
  907. // Enter: any +2/3 precommits for next round.
  908. func (cs *ConsensusState) enterPrecommitWait(height int, round int) {
  909. if cs.Height != height || round < cs.Round || (cs.Round == round && cstypes.RoundStepPrecommitWait <= cs.Step) {
  910. cs.Logger.Debug(cmn.Fmt("enterPrecommitWait(%v/%v): Invalid args. Current step: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  911. return
  912. }
  913. if !cs.Votes.Precommits(round).HasTwoThirdsAny() {
  914. cmn.PanicSanity(cmn.Fmt("enterPrecommitWait(%v/%v), but Precommits does not have any +2/3 votes", height, round))
  915. }
  916. cs.Logger.Info(cmn.Fmt("enterPrecommitWait(%v/%v). Current: %v/%v/%v", height, round, cs.Height, cs.Round, cs.Step))
  917. defer func() {
  918. // Done enterPrecommitWait:
  919. cs.updateRoundStep(round, cstypes.RoundStepPrecommitWait)
  920. cs.newStep()
  921. }()
  922. // Wait for some more precommits; enterNewRound
  923. cs.scheduleTimeout(cs.config.Precommit(round), height, round, cstypes.RoundStepPrecommitWait)
  924. }
  925. // Enter: +2/3 precommits for block
  926. func (cs *ConsensusState) enterCommit(height int, commitRound int) {
  927. if cs.Height != height || cstypes.RoundStepCommit <= cs.Step {
  928. cs.Logger.Debug(cmn.Fmt("enterCommit(%v/%v): Invalid args. Current step: %v/%v/%v", height, commitRound, cs.Height, cs.Round, cs.Step))
  929. return
  930. }
  931. cs.Logger.Info(cmn.Fmt("enterCommit(%v/%v). Current: %v/%v/%v", height, commitRound, cs.Height, cs.Round, cs.Step))
  932. defer func() {
  933. // Done enterCommit:
  934. // keep cs.Round the same, commitRound points to the right Precommits set.
  935. cs.updateRoundStep(cs.Round, cstypes.RoundStepCommit)
  936. cs.CommitRound = commitRound
  937. cs.CommitTime = time.Now()
  938. cs.newStep()
  939. // Maybe finalize immediately.
  940. cs.tryFinalizeCommit(height)
  941. }()
  942. blockID, ok := cs.Votes.Precommits(commitRound).TwoThirdsMajority()
  943. if !ok {
  944. cmn.PanicSanity("RunActionCommit() expects +2/3 precommits")
  945. }
  946. // The Locked* fields no longer matter.
  947. // Move them over to ProposalBlock if they match the commit hash,
  948. // otherwise they'll be cleared in updateToState.
  949. if cs.LockedBlock.HashesTo(blockID.Hash) {
  950. cs.ProposalBlock = cs.LockedBlock
  951. cs.ProposalBlockParts = cs.LockedBlockParts
  952. }
  953. // If we don't have the block being committed, set up to get it.
  954. if !cs.ProposalBlock.HashesTo(blockID.Hash) {
  955. if !cs.ProposalBlockParts.HasHeader(blockID.PartsHeader) {
  956. // We're getting the wrong block.
  957. // Set up ProposalBlockParts and keep waiting.
  958. cs.ProposalBlock = nil
  959. cs.ProposalBlockParts = types.NewPartSetFromHeader(blockID.PartsHeader)
  960. } else {
  961. // We just need to keep waiting.
  962. }
  963. }
  964. }
  965. // If we have the block AND +2/3 commits for it, finalize.
  966. func (cs *ConsensusState) tryFinalizeCommit(height int) {
  967. if cs.Height != height {
  968. cmn.PanicSanity(cmn.Fmt("tryFinalizeCommit() cs.Height: %v vs height: %v", cs.Height, height))
  969. }
  970. blockID, ok := cs.Votes.Precommits(cs.CommitRound).TwoThirdsMajority()
  971. if !ok || len(blockID.Hash) == 0 {
  972. cs.Logger.Error("Attempt to finalize failed. There was no +2/3 majority, or +2/3 was for <nil>.", "height", height)
  973. return
  974. }
  975. if !cs.ProposalBlock.HashesTo(blockID.Hash) {
  976. // TODO: this happens every time if we're not a validator (ugly logs)
  977. // TODO: ^^ wait, why does it matter that we're a validator?
  978. cs.Logger.Info("Attempt to finalize failed. We don't have the commit block.", "height", height, "proposal-block", cs.ProposalBlock.Hash(), "commit-block", blockID.Hash)
  979. return
  980. }
  981. // go
  982. cs.finalizeCommit(height)
  983. }
  984. // Increment height and goto cstypes.RoundStepNewHeight
  985. func (cs *ConsensusState) finalizeCommit(height int) {
  986. if cs.Height != height || cs.Step != cstypes.RoundStepCommit {
  987. cs.Logger.Debug(cmn.Fmt("finalizeCommit(%v): Invalid args. Current step: %v/%v/%v", height, cs.Height, cs.Round, cs.Step))
  988. return
  989. }
  990. blockID, ok := cs.Votes.Precommits(cs.CommitRound).TwoThirdsMajority()
  991. block, blockParts := cs.ProposalBlock, cs.ProposalBlockParts
  992. if !ok {
  993. cmn.PanicSanity(cmn.Fmt("Cannot finalizeCommit, commit does not have two thirds majority"))
  994. }
  995. if !blockParts.HasHeader(blockID.PartsHeader) {
  996. cmn.PanicSanity(cmn.Fmt("Expected ProposalBlockParts header to be commit header"))
  997. }
  998. if !block.HashesTo(blockID.Hash) {
  999. cmn.PanicSanity(cmn.Fmt("Cannot finalizeCommit, ProposalBlock does not hash to commit hash"))
  1000. }
  1001. if err := cs.state.ValidateBlock(block); err != nil {
  1002. cmn.PanicConsensus(cmn.Fmt("+2/3 committed an invalid block: %v", err))
  1003. }
  1004. cs.Logger.Info(cmn.Fmt("Finalizing commit of block with %d txs", block.NumTxs),
  1005. "height", block.Height, "hash", block.Hash(), "root", block.AppHash)
  1006. cs.Logger.Info(cmn.Fmt("%v", block))
  1007. fail.Fail() // XXX
  1008. // Save to blockStore.
  1009. if cs.blockStore.Height() < block.Height {
  1010. // NOTE: the seenCommit is local justification to commit this block,
  1011. // but may differ from the LastCommit included in the next block
  1012. precommits := cs.Votes.Precommits(cs.CommitRound)
  1013. seenCommit := precommits.MakeCommit()
  1014. cs.blockStore.SaveBlock(block, blockParts, seenCommit)
  1015. } else {
  1016. // Happens during replay if we already saved the block but didn't commit
  1017. cs.Logger.Info("Calling finalizeCommit on already stored block", "height", block.Height)
  1018. }
  1019. fail.Fail() // XXX
  1020. // Finish writing to the WAL for this height.
  1021. // NOTE: If we fail before writing this, we'll never write it,
  1022. // and just recover by running ApplyBlock in the Handshake.
  1023. // If we moved it before persisting the block, we'd have to allow
  1024. // WAL replay for blocks with an #ENDHEIGHT
  1025. // As is, ConsensusState should not be started again
  1026. // until we successfully call ApplyBlock (ie. here or in Handshake after restart)
  1027. if cs.wal != nil {
  1028. cs.wal.writeEndHeight(height)
  1029. }
  1030. fail.Fail() // XXX
  1031. // Create a copy of the state for staging
  1032. // and an event cache for txs
  1033. stateCopy := cs.state.Copy()
  1034. eventCache := types.NewEventCache(cs.evsw)
  1035. // Execute and commit the block, update and save the state, and update the mempool.
  1036. // All calls to the proxyAppConn come here.
  1037. // NOTE: the block.AppHash wont reflect these txs until the next block
  1038. err := stateCopy.ApplyBlock(eventCache, cs.proxyAppConn, block, blockParts.Header(), cs.mempool)
  1039. if err != nil {
  1040. cs.Logger.Error("Error on ApplyBlock. Did the application crash? Please restart tendermint", "err", err)
  1041. return
  1042. }
  1043. fail.Fail() // XXX
  1044. // Fire event for new block.
  1045. // NOTE: If we fail before firing, these events will never fire
  1046. //
  1047. // TODO: Either
  1048. // * Fire before persisting state, in ApplyBlock
  1049. // * Fire on start up if we haven't written any new WAL msgs
  1050. // Both options mean we may fire more than once. Is that fine ?
  1051. types.FireEventNewBlock(cs.evsw, types.EventDataNewBlock{block})
  1052. types.FireEventNewBlockHeader(cs.evsw, types.EventDataNewBlockHeader{block.Header})
  1053. eventCache.Flush()
  1054. fail.Fail() // XXX
  1055. // NewHeightStep!
  1056. cs.updateToState(stateCopy)
  1057. fail.Fail() // XXX
  1058. // cs.StartTime is already set.
  1059. // Schedule Round0 to start soon.
  1060. cs.scheduleRound0(&cs.RoundState)
  1061. // By here,
  1062. // * cs.Height has been increment to height+1
  1063. // * cs.Step is now cstypes.RoundStepNewHeight
  1064. // * cs.StartTime is set to when we will start round0.
  1065. }
  1066. //-----------------------------------------------------------------------------
  1067. func (cs *ConsensusState) defaultSetProposal(proposal *types.Proposal) error {
  1068. // Already have one
  1069. // TODO: possibly catch double proposals
  1070. if cs.Proposal != nil {
  1071. return nil
  1072. }
  1073. // Does not apply
  1074. if proposal.Height != cs.Height || proposal.Round != cs.Round {
  1075. return nil
  1076. }
  1077. // We don't care about the proposal if we're already in cstypes.RoundStepCommit.
  1078. if cstypes.RoundStepCommit <= cs.Step {
  1079. return nil
  1080. }
  1081. // Verify POLRound, which must be -1 or between 0 and proposal.Round exclusive.
  1082. if proposal.POLRound != -1 &&
  1083. (proposal.POLRound < 0 || proposal.Round <= proposal.POLRound) {
  1084. return ErrInvalidProposalPOLRound
  1085. }
  1086. // Verify signature
  1087. if !cs.Validators.GetProposer().PubKey.VerifyBytes(types.SignBytes(cs.state.ChainID, proposal), proposal.Signature) {
  1088. return ErrInvalidProposalSignature
  1089. }
  1090. cs.Proposal = proposal
  1091. cs.ProposalBlockParts = types.NewPartSetFromHeader(proposal.BlockPartsHeader)
  1092. return nil
  1093. }
  1094. // NOTE: block is not necessarily valid.
  1095. // Asynchronously triggers either enterPrevote (before we timeout of propose) or tryFinalizeCommit, once we have the full block.
  1096. func (cs *ConsensusState) addProposalBlockPart(height int, part *types.Part, verify bool) (added bool, err error) {
  1097. // Blocks might be reused, so round mismatch is OK
  1098. if cs.Height != height {
  1099. return false, nil
  1100. }
  1101. // We're not expecting a block part.
  1102. if cs.ProposalBlockParts == nil {
  1103. return false, nil // TODO: bad peer? Return error?
  1104. }
  1105. added, err = cs.ProposalBlockParts.AddPart(part, verify)
  1106. if err != nil {
  1107. return added, err
  1108. }
  1109. if added && cs.ProposalBlockParts.IsComplete() {
  1110. // Added and completed!
  1111. var n int
  1112. var err error
  1113. cs.ProposalBlock = wire.ReadBinary(&types.Block{}, cs.ProposalBlockParts.GetReader(),
  1114. cs.state.Params.BlockSizeParams.MaxBytes, &n, &err).(*types.Block)
  1115. // NOTE: it's possible to receive complete proposal blocks for future rounds without having the proposal
  1116. cs.Logger.Info("Received complete proposal block", "height", cs.ProposalBlock.Height, "hash", cs.ProposalBlock.Hash())
  1117. if cs.Step == cstypes.RoundStepPropose && cs.isProposalComplete() {
  1118. // Move onto the next step
  1119. cs.enterPrevote(height, cs.Round)
  1120. } else if cs.Step == cstypes.RoundStepCommit {
  1121. // If we're waiting on the proposal block...
  1122. cs.tryFinalizeCommit(height)
  1123. }
  1124. return true, err
  1125. }
  1126. return added, nil
  1127. }
  1128. // Attempt to add the vote. if its a duplicate signature, dupeout the validator
  1129. func (cs *ConsensusState) tryAddVote(vote *types.Vote, peerKey string) error {
  1130. _, err := cs.addVote(vote, peerKey)
  1131. if err != nil {
  1132. // If the vote height is off, we'll just ignore it,
  1133. // But if it's a conflicting sig, broadcast evidence tx for slashing.
  1134. // If it's otherwise invalid, punish peer.
  1135. if err == ErrVoteHeightMismatch {
  1136. return err
  1137. } else if _, ok := err.(*types.ErrVoteConflictingVotes); ok {
  1138. if bytes.Equal(vote.ValidatorAddress, cs.privValidator.GetAddress()) {
  1139. cs.Logger.Error("Found conflicting vote from ourselves. Did you unsafe_reset a validator?", "height", vote.Height, "round", vote.Round, "type", vote.Type)
  1140. return err
  1141. }
  1142. cs.Logger.Error("Found conflicting vote. Publish evidence (TODO)", "height", vote.Height, "round", vote.Round, "type", vote.Type, "valAddr", vote.ValidatorAddress, "valIndex", vote.ValidatorIndex)
  1143. // TODO: track evidence for inclusion in a block
  1144. return err
  1145. } else {
  1146. // Probably an invalid signature. Bad peer.
  1147. cs.Logger.Error("Error attempting to add vote", "err", err)
  1148. return ErrAddingVote
  1149. }
  1150. }
  1151. return nil
  1152. }
  1153. //-----------------------------------------------------------------------------
  1154. func (cs *ConsensusState) addVote(vote *types.Vote, peerKey string) (added bool, err error) {
  1155. cs.Logger.Debug("addVote", "voteHeight", vote.Height, "voteType", vote.Type, "valIndex", vote.ValidatorIndex, "csHeight", cs.Height)
  1156. // A precommit for the previous height?
  1157. // These come in while we wait timeoutCommit
  1158. if vote.Height+1 == cs.Height {
  1159. if !(cs.Step == cstypes.RoundStepNewHeight && vote.Type == types.VoteTypePrecommit) {
  1160. // TODO: give the reason ..
  1161. // fmt.Errorf("tryAddVote: Wrong height, not a LastCommit straggler commit.")
  1162. return added, ErrVoteHeightMismatch
  1163. }
  1164. added, err = cs.LastCommit.AddVote(vote)
  1165. if added {
  1166. cs.Logger.Info(cmn.Fmt("Added to lastPrecommits: %v", cs.LastCommit.StringShort()))
  1167. types.FireEventVote(cs.evsw, types.EventDataVote{vote})
  1168. // if we can skip timeoutCommit and have all the votes now,
  1169. if cs.config.SkipTimeoutCommit && cs.LastCommit.HasAll() {
  1170. // go straight to new round (skip timeout commit)
  1171. // cs.scheduleTimeout(time.Duration(0), cs.Height, 0, cstypes.RoundStepNewHeight)
  1172. cs.enterNewRound(cs.Height, 0)
  1173. }
  1174. }
  1175. return
  1176. }
  1177. // A prevote/precommit for this height?
  1178. if vote.Height == cs.Height {
  1179. height := cs.Height
  1180. added, err = cs.Votes.AddVote(vote, peerKey)
  1181. if added {
  1182. types.FireEventVote(cs.evsw, types.EventDataVote{vote})
  1183. switch vote.Type {
  1184. case types.VoteTypePrevote:
  1185. prevotes := cs.Votes.Prevotes(vote.Round)
  1186. cs.Logger.Info("Added to prevote", "vote", vote, "prevotes", prevotes.StringShort())
  1187. // First, unlock if prevotes is a valid POL.
  1188. // >> lockRound < POLRound <= unlockOrChangeLockRound (see spec)
  1189. // NOTE: If (lockRound < POLRound) but !(POLRound <= unlockOrChangeLockRound),
  1190. // we'll still enterNewRound(H,vote.R) and enterPrecommit(H,vote.R) to process it
  1191. // there.
  1192. if (cs.LockedBlock != nil) && (cs.LockedRound < vote.Round) && (vote.Round <= cs.Round) {
  1193. blockID, ok := prevotes.TwoThirdsMajority()
  1194. if ok && !cs.LockedBlock.HashesTo(blockID.Hash) {
  1195. cs.Logger.Info("Unlocking because of POL.", "lockedRound", cs.LockedRound, "POLRound", vote.Round)
  1196. cs.LockedRound = 0
  1197. cs.LockedBlock = nil
  1198. cs.LockedBlockParts = nil
  1199. types.FireEventUnlock(cs.evsw, cs.RoundStateEvent())
  1200. }
  1201. }
  1202. if cs.Round <= vote.Round && prevotes.HasTwoThirdsAny() {
  1203. // Round-skip over to PrevoteWait or goto Precommit.
  1204. cs.enterNewRound(height, vote.Round) // if the vote is ahead of us
  1205. if prevotes.HasTwoThirdsMajority() {
  1206. cs.enterPrecommit(height, vote.Round)
  1207. } else {
  1208. cs.enterPrevote(height, vote.Round) // if the vote is ahead of us
  1209. cs.enterPrevoteWait(height, vote.Round)
  1210. }
  1211. } else if cs.Proposal != nil && 0 <= cs.Proposal.POLRound && cs.Proposal.POLRound == vote.Round {
  1212. // If the proposal is now complete, enter prevote of cs.Round.
  1213. if cs.isProposalComplete() {
  1214. cs.enterPrevote(height, cs.Round)
  1215. }
  1216. }
  1217. case types.VoteTypePrecommit:
  1218. precommits := cs.Votes.Precommits(vote.Round)
  1219. cs.Logger.Info("Added to precommit", "vote", vote, "precommits", precommits.StringShort())
  1220. blockID, ok := precommits.TwoThirdsMajority()
  1221. if ok {
  1222. if len(blockID.Hash) == 0 {
  1223. cs.enterNewRound(height, vote.Round+1)
  1224. } else {
  1225. cs.enterNewRound(height, vote.Round)
  1226. cs.enterPrecommit(height, vote.Round)
  1227. cs.enterCommit(height, vote.Round)
  1228. if cs.config.SkipTimeoutCommit && precommits.HasAll() {
  1229. // if we have all the votes now,
  1230. // go straight to new round (skip timeout commit)
  1231. // cs.scheduleTimeout(time.Duration(0), cs.Height, 0, cstypes.RoundStepNewHeight)
  1232. cs.enterNewRound(cs.Height, 0)
  1233. }
  1234. }
  1235. } else if cs.Round <= vote.Round && precommits.HasTwoThirdsAny() {
  1236. cs.enterNewRound(height, vote.Round)
  1237. cs.enterPrecommit(height, vote.Round)
  1238. cs.enterPrecommitWait(height, vote.Round)
  1239. }
  1240. default:
  1241. cmn.PanicSanity(cmn.Fmt("Unexpected vote type %X", vote.Type)) // Should not happen.
  1242. }
  1243. }
  1244. // Either duplicate, or error upon cs.Votes.AddByIndex()
  1245. return
  1246. } else {
  1247. err = ErrVoteHeightMismatch
  1248. }
  1249. // Height mismatch, bad peer?
  1250. cs.Logger.Info("Vote ignored and not added", "voteHeight", vote.Height, "csHeight", cs.Height, "err", err)
  1251. return
  1252. }
  1253. func (cs *ConsensusState) signVote(type_ byte, hash []byte, header types.PartSetHeader) (*types.Vote, error) {
  1254. addr := cs.privValidator.GetAddress()
  1255. valIndex, _ := cs.Validators.GetByAddress(addr)
  1256. vote := &types.Vote{
  1257. ValidatorAddress: addr,
  1258. ValidatorIndex: valIndex,
  1259. Height: cs.Height,
  1260. Round: cs.Round,
  1261. Type: type_,
  1262. BlockID: types.BlockID{hash, header},
  1263. }
  1264. err := cs.privValidator.SignVote(cs.state.ChainID, vote)
  1265. return vote, err
  1266. }
  1267. // sign the vote and publish on internalMsgQueue
  1268. func (cs *ConsensusState) signAddVote(type_ byte, hash []byte, header types.PartSetHeader) *types.Vote {
  1269. // if we don't have a key or we're not in the validator set, do nothing
  1270. if cs.privValidator == nil || !cs.Validators.HasAddress(cs.privValidator.GetAddress()) {
  1271. return nil
  1272. }
  1273. vote, err := cs.signVote(type_, hash, header)
  1274. if err == nil {
  1275. cs.sendInternalMessage(msgInfo{&VoteMessage{vote}, ""})
  1276. cs.Logger.Info("Signed and pushed vote", "height", cs.Height, "round", cs.Round, "vote", vote, "err", err)
  1277. return vote
  1278. } else {
  1279. //if !cs.replayMode {
  1280. cs.Logger.Error("Error signing vote", "height", cs.Height, "round", cs.Round, "vote", vote, "err", err)
  1281. //}
  1282. return nil
  1283. }
  1284. }
  1285. //---------------------------------------------------------
  1286. func CompareHRS(h1, r1 int, s1 cstypes.RoundStepType, h2, r2 int, s2 cstypes.RoundStepType) int {
  1287. if h1 < h2 {
  1288. return -1
  1289. } else if h1 > h2 {
  1290. return 1
  1291. }
  1292. if r1 < r2 {
  1293. return -1
  1294. } else if r1 > r2 {
  1295. return 1
  1296. }
  1297. if s1 < s2 {
  1298. return -1
  1299. } else if s1 > s2 {
  1300. return 1
  1301. }
  1302. return 0
  1303. }