Skip to content

Commit

Permalink
Add more tendermint metrics for block processing (#223)
Browse files Browse the repository at this point in the history
* Add more tendermint metrics for block processing

* Fix

* Fix metric
  • Loading branch information
yzang2019 authored Apr 2, 2024
1 parent e250648 commit 124468c
Show file tree
Hide file tree
Showing 6 changed files with 90 additions and 10 deletions.
9 changes: 9 additions & 0 deletions internal/consensus/metrics.gen.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

3 changes: 3 additions & 0 deletions internal/consensus/metrics.go
Original file line number Diff line number Diff line change
Expand Up @@ -170,6 +170,9 @@ type Metrics struct {
// processing all of its parts. Note that this means it also includes network latency from
// block parts gossip
CompleteProposalTime metrics.Histogram

// ApplyBlockLatency measures how long it takes to execute ApplyBlock in finalize commit step
ApplyBlockLatency metrics.Histogram `metrics_labels:"apply_block_ms" metrics_buckettype:"exprange" metrics_bucketsizes:"0.01, 10, 10"`
}

// RecordConsMetrics uses for recording the block related metrics during fast-sync.
Expand Down
3 changes: 2 additions & 1 deletion internal/consensus/state.go
Original file line number Diff line number Diff line change
Expand Up @@ -2184,7 +2184,7 @@ func (cs *State) finalizeCommit(ctx context.Context, height int64) {

// Execute and commit the block, update and save the state, and update the mempool.
// NOTE The block.AppHash won't reflect these txs until the next block.

startTime := time.Now()
stateCopy, err := cs.blockExec.ApplyBlock(spanCtx,
stateCopy,
types.BlockID{
Expand All @@ -2194,6 +2194,7 @@ func (cs *State) finalizeCommit(ctx context.Context, height int64) {
block,
cs.tracer,
)
cs.metrics.ApplyBlockLatency.Observe(float64(time.Since(startTime).Milliseconds()))
if err != nil {
logger.Error("failed to apply block", "err", err)
return
Expand Down
13 changes: 10 additions & 3 deletions internal/state/execution.go
Original file line number Diff line number Diff line change
Expand Up @@ -246,6 +246,7 @@ func (blockExec *BlockExecutor) ApplyBlock(
defer finalizeBlockSpan.End()
}
txs := block.Data.Txs.ToSliceOfBytes()
finalizeBlockStartTime := time.Now()
fBlockRes, err := blockExec.appClient.FinalizeBlock(
ctx,
&abci.RequestFinalizeBlock{
Expand All @@ -269,6 +270,7 @@ func (blockExec *BlockExecutor) ApplyBlock(
LastResultsHash: block.LastResultsHash,
},
)
blockExec.metrics.FinalizeBlockLatency.Observe(float64(time.Since(finalizeBlockStartTime).Milliseconds()))
if finalizeBlockSpan != nil {
finalizeBlockSpan.End()
}
Expand All @@ -286,7 +288,9 @@ func (blockExec *BlockExecutor) ApplyBlock(
)

// Save the results before we commit.
saveBlockResponseTime := time.Now()
err = blockExec.store.SaveFinalizeBlockResponses(block.Height, fBlockRes)
blockExec.metrics.SaveBlockResponseLatency.Observe(float64(time.Since(saveBlockResponseTime).Milliseconds()))
if err != nil && !errors.Is(err, ErrNoFinalizeBlockResponsesForHeight{block.Height}) {
// It is correct to have an empty ResponseFinalizeBlock for ApplyBlock,
// but not for saving it to the state store
Expand Down Expand Up @@ -340,12 +344,14 @@ func (blockExec *BlockExecutor) ApplyBlock(
blockExec.evpool.Update(ctx, state, block.Evidence)

// Update the app hash and save the state.
saveBlockTime := time.Now()
state.AppHash = fBlockRes.AppHash
if err := blockExec.store.Save(state); err != nil {
return state, err
}

blockExec.metrics.SaveBlockLatency.Observe(float64(time.Since(saveBlockTime).Milliseconds()))
// Prune old heights, if requested by ABCI app.
pruneBlockTime := time.Now()
if retainHeight > 0 {
pruned, err := blockExec.pruneBlocks(retainHeight)
if err != nil {
Expand All @@ -354,14 +360,15 @@ func (blockExec *BlockExecutor) ApplyBlock(
blockExec.logger.Debug("pruned blocks", "pruned", pruned, "retain_height", retainHeight)
}
}

blockExec.metrics.PruneBlockLatency.Observe(float64(time.Since(pruneBlockTime).Milliseconds()))
// reset the verification cache
blockExec.cache = make(map[string]struct{})

// Events are fired after everything else.
// NOTE: if we crash between Commit and Save, events wont be fired during replay
fireEventsStartTime := time.Now()
FireEvents(blockExec.logger, blockExec.eventBus, block, blockID, fBlockRes, validatorUpdates)

blockExec.metrics.FireEventsLatency.Observe(float64(time.Since(fireEventsStartTime).Milliseconds()))
return state, nil
}

Expand Down
57 changes: 51 additions & 6 deletions internal/state/metrics.gen.go

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

15 changes: 15 additions & 0 deletions internal/state/metrics.go
Original file line number Diff line number Diff line change
Expand Up @@ -37,4 +37,19 @@ type Metrics struct {
// UpdateMempoolTime meaures how long it takes to update mempool after commiting, including
// reCheckTx
UpdateMempoolTime metrics.Histogram

// FinalizeBlockLatency measures how long it takes to run abci FinalizeBlock
FinalizeBlockLatency metrics.Histogram `metrics_labels:"finalize_blocks_ms" metrics_buckettype:"exprange" metrics_bucketsizes:"0.01, 10, 10"`

// SaveBlockResponseLatency measures how long it takes to run save the FinalizeBlockRes
SaveBlockResponseLatency metrics.Histogram `metrics_labels:"save_block_response_ms" metrics_buckettype:"exprange" metrics_bucketsizes:"0.01, 10, 10"`

// SaveBlockLatency measure how long it takes to save the block
SaveBlockLatency metrics.Histogram `metrics_labels:"save_block_ms" metrics_buckettype:"exprange" metrics_bucketsizes:"0.01, 10, 10"`

// PruneBlockLatency measures how long it takes to prune block from blockstore
PruneBlockLatency metrics.Histogram `metrics_labels:"prune_block_ms" metrics_buckettype:"exprange" metrics_bucketsizes:"0.01, 10, 10"`

// FireEventsLatency measures how long it takes to fire events for indexing
FireEventsLatency metrics.Histogram `metrics_labels:"prune_block_ms" metrics_buckettype:"exprange" metrics_bucketsizes:"0.01, 10, 10"`
}

0 comments on commit 124468c

Please sign in to comment.