186 changes: 186 additions & 0 deletions engine/access/ingestion2/engine.go
@@ -0,0 +1,186 @@
package ingestion2

import (
	"fmt"

	"github.com/rs/zerolog"

	"github.com/onflow/flow-go/consensus/hotstuff"
	"github.com/onflow/flow-go/consensus/hotstuff/model"
	"github.com/onflow/flow-go/engine"
	"github.com/onflow/flow-go/model/flow"
	"github.com/onflow/flow-go/module"
	"github.com/onflow/flow-go/module/component"
	"github.com/onflow/flow-go/module/counters"
	"github.com/onflow/flow-go/module/irrecoverable"
	"github.com/onflow/flow-go/module/jobqueue"
	"github.com/onflow/flow-go/state/protocol"
	"github.com/onflow/flow-go/storage"
)

// Engine ingests finalized and certified blocks from the consensus follower and
// feeds their execution results into the ResultsForest for indexing.
type Engine struct {
	component.Component
	cm *component.ComponentManager

	log   zerolog.Logger
	state protocol.State // used to access the protocol state

	blocks            storage.Blocks
	headers           storage.Headers
	executionReceipts storage.ExecutionReceipts
	executionResults  storage.ExecutionResults

	lastFullBlockHeight *counters.PersistentStrictMonotonicCounter

	// job queue consumer for finalized blocks
	finalizedBlockConsumer *jobqueue.ComponentConsumer
	// notifier for the queue consumer
	finalizedBlockNotifier engine.Notifier

	resultsForest *ResultsForest
	maxForestSize uint

	collectionExecutedMetric module.CollectionExecutedMetric

	latestPersistedSealedResult *LatestPersistedSealedResult
}

var _ hotstuff.FinalizationConsumer = (*Engine)(nil)

// New constructs the ingestion engine and its component workers.
func New(
	log zerolog.Logger,
	latestPersistedSealedResult *LatestPersistedSealedResult,
) *Engine {
	resultsForest := NewResultsForest(log, latestPersistedSealedResult)

	e := &Engine{
		log:                         log.With().Str("component", "ingestion").Logger(),
		resultsForest:               resultsForest,
		latestPersistedSealedResult: latestPersistedSealedResult,
		finalizedBlockNotifier:      engine.NewNotifier(),
	}

	cm := component.NewComponentManagerBuilder().
		AddWorker(e.runForest).
		AddWorker(e.runForestLoader).
		Build()

	e.cm = cm
	e.Component = cm

	return e
}

// runForest is a component worker that starts the ResultsForest and signals
// readiness once the forest is ready.
func (e *Engine) runForest(ctx irrecoverable.SignalerContext, ready component.ReadyFunc) {
	e.resultsForest.Start(ctx)

	select {
	case <-ctx.Done():
	case <-e.resultsForest.Ready():
		ready()
	}

	<-e.resultsForest.Done()
}

// runForestLoader is a component worker that runs the ForestLoader once on
// startup to backfill the ResultsForest, after the forest is ready.
func (e *Engine) runForestLoader(ctx irrecoverable.SignalerContext, ready component.ReadyFunc) {
	loader := NewForestLoader(e.resultsForest, e.latestPersistedSealedResult.ResultID(), e.maxForestSize)

	select {
	case <-ctx.Done():
		return
	case <-e.resultsForest.Ready():
	}

	ready()
	if err := loader.Run(ctx); err != nil {
		ctx.Throw(err)
		return
	}
Comment on lines +94 to +97

Member:
don't we need to run this repeatedly?

Contributor Author (@peterargue), May 29, 2025:

no. the approach I took was to run the loader once on startup with these steps:

  1. Add sealed results up to a limit and continue adding until we reach the latest sealed
  2. Add all unsealed results at once.

Then it exits and results are added by the ingestion engine directly in real time.

We don't really need to continuously run the loader since we can just add all results into the forest and only start a subset to manage resources.
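
For illustration, a minimal sketch of that one-shot flow. The types and helper fields below (sketchForest, sealedBatches, unsealedResults) are assumptions made for this sketch, not the ForestLoader's actual API:

```go
// Hypothetical sketch of a one-shot loader run, per the approach described above.
package ingestion2

import (
	"context"
	"fmt"
)

// sketchEntry stands in for a (result, header) pair.
type sketchEntry struct{ id string }

// sketchForest stands in for the ResultsForest API used by the loader.
type sketchForest interface {
	AddResult(e sketchEntry, sealed bool) error
}

type sketchLoader struct {
	forest sketchForest

	// hypothetical data sources, injected so the sketch is self-contained
	sealedBatches   func() ([]sketchEntry, bool, error) // returns batch, done, error
	unsealedResults func() ([]sketchEntry, error)
}

// Run backfills the forest once at startup: sealed results in bounded batches
// until the latest seal is reached, then all unsealed results in a single pass.
// Afterwards it returns; new results arrive via the ingestion engine directly.
func (l *sketchLoader) Run(ctx context.Context) error {
	for {
		if err := ctx.Err(); err != nil {
			return err
		}
		batch, done, err := l.sealedBatches()
		if err != nil {
			return fmt.Errorf("could not load sealed results: %w", err)
		}
		for _, e := range batch {
			if err := l.forest.AddResult(e, true); err != nil {
				return fmt.Errorf("could not add sealed result %s: %w", e.id, err)
			}
		}
		if done {
			break
		}
	}

	unsealed, err := l.unsealedResults()
	if err != nil {
		return fmt.Errorf("could not load unsealed results: %w", err)
	}
	for _, e := range unsealed {
		if err := l.forest.AddResult(e, false); err != nil {
			return fmt.Errorf("could not add unsealed result %s: %w", e.id, err)
		}
	}
	return nil
}
```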

Member:

👍 happy with the ForestLoader not needing to run regularly in the background.

A couple follow-up comments regarding the scenario you are describing above:

"a node that's been online for a while and decides to enable indexing"

  • In this case, I am worried there might be too many results to load all unsealed blocks into memory in one go (we produce about 100k blocks a day). When we talked about it earlier, I probably advocated for loading all blocks into memory ... but didn't think about your scenario. Sorry. I think the scenario you are bringing up is very valid. So what happens if not all results fit into the ResultsForest? I assume we would need to run the ForestLoader repeatedly, and then we would need a stopping criterion. You have something like that here, but I don't think we realistically can (or should, even if we could) add back-pressure on the consensus follower.
  • Furthermore, I am worried that this scenario might occur without the node being rebooted. Imagine the node operator messing up the networking configuration and the node not getting the newest blocks for a couple of days. Or the node being under-provisioned and falling progressively behind during periods with high execution load.

Overall, the following suggested approach is starting to manifest in my brain, which would address this larger class of problems in its entirety:

  • The ResultsForest has a capacity limit in a very specific way:
    • For now, I use height. (While I prefer view as an indicator, height is more illustrative for explaining this, I think. In addition, height creates less variability in the max size that the ResultsForest could grow to. Anyway.)
    • The ResultsForest already remembers the lowest view at which results can be added. Let's denote that "cut-off view" with κ. Results for blocks with smaller views are rejected. Pruning can only increase κ, never decrease it.
    • In various places, we use the axiom that the protocol will finalize at least one block every FinalizationSafetyThreshold views. Note that this is not guaranteed by the consensus protocol (formally, there is no upper bound), but in practice we assume that there will be human intervention. We could use a similar argument here and say that the ResultsForest accepts additions of results for blocks with view v if and only if κ ≤ v ≤ κ + ψ.
    • Here, ψ would play a similar role to the FinalizationSafetyThreshold. However, FinalizationSafetyThreshold is a protocol parameter which must be identical for all nodes; in contrast, ψ can be set by each AN operator independently. Anyway, let's say we set ψ = 250,000 views. This means that result indexing for an AN with this ψ value is only guaranteed to be live if the protocol always creates the next finalized seal within 250k views. That is 2 days of views, so I think that will hold in practice ... and if not, AN operators could reboot their nodes with larger values as a temporary emergency measure.
  • I completely agree with you that during normal operations, ResultsForest would always have capacity.
  • While new results are being added at the top of the tree, pruning at the bottom of indexed results with a finalized seal frees capacity.
  • Now imagine that the node progressively falls behind with indexing by more than ψ views.
    • ResultsForest would start rejecting results for block views beyond its horizon of κ + ψ.
    • When it rejects an addition, AddResult would return a sentinel error of a dedicated type. Let's denote this error as ForestHorizonExceededError.
    • When receiving newly incorporated blocks from the consensus follower, the Engine would try to add them to the ResultsForest and check for ForestHorizonExceededError (this code would need a minor extension).
    • In case of a ForestHorizonExceededError, the Engine knows that there could be gaps in the ResultsForest: incorporated blocks with higher views might be added again once indexing progresses and the ResultsForest is pruned, i.e. κ increases. But the results that were just rejected will need to be added later via the ForestLoader. We use an atomic Boolean NeedBackfilling to remember this.
    • As long as NeedBackfilling is true, we run the ForestLoader regularly (e.g. every 5 minutes).
    • Once the ForestLoader successfully executes this code, we know that the ForestLoader has added all remaining results into the ResultsForest and caught up with the consensus follower (caution: subtle happens-before requirement - I'll discuss that below). It sets NeedBackfilling to false, which means that the ForestLoader is not run anymore -- until the ResultsForest horizon is exceeded the next time (error ForestHorizonExceededError).

This is a lot of text explaining what the algorithm does. Sorry about this wall of text. Though, the algorithm is very simple to implement.
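
For illustration, a minimal sketch of the horizon check and backfill trigger described above. ForestHorizonExceededError, κ, ψ, and NeedBackfilling come from this proposal; all names and signatures here are assumptions, not code from this PR:

```go
// Hypothetical sketch of the κ/ψ horizon rule and the backfill flag.
package ingestion2

import (
	"errors"
	"fmt"
	"sync"
	"sync/atomic"
)

// ForestHorizonExceededError signals that a result's block view is beyond κ + ψ.
type ForestHorizonExceededError struct {
	View, Horizon uint64
}

func (e ForestHorizonExceededError) Error() string {
	return fmt.Sprintf("view %d exceeds forest horizon %d", e.View, e.Horizon)
}

func IsForestHorizonExceededError(err error) bool {
	var target ForestHorizonExceededError
	return errors.As(err, &target)
}

// horizonForest sketches the capacity rule: accept results only for κ ≤ view ≤ κ + ψ.
type horizonForest struct {
	mu      sync.Mutex
	cutoff  uint64 // κ: lowest view still accepted; pruning only increases it
	horizon uint64 // ψ: operator-configurable window, e.g. 250,000 views
}

func (f *horizonForest) AddResultAtView(view uint64) error {
	f.mu.Lock()
	defer f.mu.Unlock()
	if view < f.cutoff {
		// below the cut-off: the result is rejected (already pruned); a dedicated
		// sentinel could be returned here, omitted in this sketch
		return nil
	}
	if view > f.cutoff+f.horizon {
		return ForestHorizonExceededError{View: view, Horizon: f.cutoff + f.horizon}
	}
	// ... insert into the levelled forest ...
	return nil
}

// onBlockIncorporated shows how the engine could flag backfilling when the
// horizon is exceeded; the ForestLoader is then re-run periodically until it
// succeeds and clears the flag.
func onBlockIncorporated(f *horizonForest, needBackfilling *atomic.Bool, view uint64) error {
	err := f.AddResultAtView(view)
	if IsForestHorizonExceededError(err) {
		needBackfilling.Store(true)
		return nil // not fatal: the loader will backfill the gap later
	}
	return err
}
```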

Member:

What remains is to prove that this algorithm will always make progress (liveness proof), I'll provide a sketch:

Liveness Proof 🚧 under construction 🚧

The current implementation of the consensus follower guarantees the following happens-before relation (in more intuitive terms: causality):

  1. First, incorporated blocks are persisted into the database.
  2. The database write happens before the OnBlockIncorporated consumers are called.

Prerequisite:

  • (a) The ForestLoader progresses up to a view x in line 103:

        entries, err := l.getUnsealedResults(previousHeader, finalizedHeader)
        if err != nil {
            return fmt.Errorf("could not get unsealed results: %w", err)
        }
        for _, re := range entries {
            err := l.forest.AddResult(re.result, re.header, false)
            if err != nil {
                return fmt.Errorf("could not add result %s to forest: %w", re.result.ID(), err)
            }
        }

    [diagram: Access Node ResultForest Proof]

🚧 continue this later 🚧

}

// OnFinalizedBlock is called by the follower engine after a block has been finalized and
// the state has been updated. Receives events from the finalization distributor.
func (e *Engine) OnFinalizedBlock(*model.Block) {
	// Per the specification of `hotstuff.FinalizationConsumer`, consumers of the `OnFinalizedBlock` notification must
	// be non-blocking. This code runs on the hot path of consensus and should induce as little overhead as possible.
	//
	// The input is coming from the node-internal consensus follower, which is a trusted component. Hence, we don't
	// need to verify the inputs and can queue them directly for processing by one of the engine's workers.
	e.finalizedBlockNotifier.Notify()
}

// OnBlockIncorporated is called by the follower engine after a block has been certified and the state has been updated.
// Receives block incorporated events from the finalization distributor.
func (e *Engine) OnBlockIncorporated(hotstuffBlock *model.Block) {
	// Per the specification of `hotstuff.FinalizationConsumer`, consumers of the `OnBlockIncorporated` notification must
	// be non-blocking. This code runs on the hot path of consensus and should induce as little overhead as possible.
	//
	// The input is coming from the node-internal consensus follower, which is a trusted component. Hence, we don't
	// need to verify the inputs and can queue them directly for processing by one of the engine's workers.

	// TODO: queue the incoming incorporated hotstuffBlock for processing in a dedicated pipeline.
	// The thread picking up the hotstuffBlock would then convert it to a `flow.Block` and process it further:
	//
	//   block, err := e.blocks.ByID(hotstuffBlock.BlockID)
	//   if err != nil {
	//       return irrecoverable.NewExceptionf("received incorporated block %s from consensus follower, but failed to retrieve full block: %w", hotstuffBlock.BlockID, err)
	//   }
	//   err = e.processCertifiedBlock(block)
	//   ...
}

// processCertifiedBlock adds results from the certified block to the results forest.
// No errors are expected during normal operation.
func (e *Engine) processCertifiedBlock(block *flow.Block) error {
	for _, result := range block.Payload.Results {
		if err := e.resultsForest.AddResult(result, block.Header, false); err != nil {
			return fmt.Errorf("could not add result %s to forest: %w", result.ID(), err)
		}
	}
	return nil
}

// processFinalizedBlock handles an incoming finalized block.
// It processes the block, indexes it for further processing, and requests missing collections if necessary.
//
// Expected errors during normal operation:
//   - storage.ErrNotFound - if the last full block height does not exist in the database.
//   - storage.ErrAlreadyExists - if a collection within the block or an execution result ID already exists in the database.
//   - generic error in case of unexpected failure from the database layer, or failure
//     to decode an existing database value.
func (e *Engine) processFinalizedBlock(block *flow.Block) error {
	// index the block for each of its collection guarantees
	err := e.blocks.IndexBlockForCollections(block.Header.ID(), flow.GetIDs(block.Payload.Guarantees))
	if err != nil {
		return fmt.Errorf("could not index block for collections: %w", err)
	}

	// index sealed results and notify the results forest
	for _, seal := range block.Payload.Seals {
		if err := e.executionResults.Index(seal.BlockID, seal.ResultID); err != nil {
			return fmt.Errorf("could not index block for execution result (id: %s): %w", seal.ResultID, err)
		}

		if err := e.resultsForest.OnResultSealed(seal.ResultID); err != nil {
			return fmt.Errorf("could not notify results forest of newly sealed result (id: %s): %w", seal.ResultID, err)
		}
	}
Comment on lines +163 to +166

Member:

I like that you have worker threads in the Engine, I think it would be good to have them serve the resultsForest.


	e.collectionExecutedMetric.BlockFinalized(block)

	return nil
}

// handleExecutionReceipt persists the execution receipt locally.
// It stores the execution receipt and updates the collection executed metric.
//
// No errors are expected during normal operation.
func (e *Engine) handleExecutionReceipt(receipt *flow.ExecutionReceipt) error {
	// persist the execution receipt locally; storing will also index the receipt
	err := e.executionReceipts.Store(receipt)
Comment on lines +178 to +179

Member:
I think execution receipts are already persisted and indexed by the consensus follower. Is the AN doing extra stuff when storing the receipt?

Contributor Author:
this is copied from the existing ingestion engine and needs to be updated.

currently, we just store all receipts received from ENs immediately. This will be skipped for now and eventually we could use the size limited cache.
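
For illustration, a minimal sketch of what a size-limited receipt cache could look like. This is a hand-rolled FIFO for clarity; the real change would more likely reuse an existing bounded cache in flow-go:

```go
// Hypothetical sketch of a size-limited execution receipt cache.
package ingestion2

import (
	"container/list"
	"sync"

	"github.com/onflow/flow-go/model/flow"
)

// receiptCache keeps at most capacity receipts, evicting the oldest first.
type receiptCache struct {
	mu       sync.Mutex
	capacity int
	order    *list.List // of flow.Identifier, front = oldest
	byID     map[flow.Identifier]*flow.ExecutionReceipt
}

func newReceiptCache(capacity int) *receiptCache {
	return &receiptCache{
		capacity: capacity,
		order:    list.New(),
		byID:     make(map[flow.Identifier]*flow.ExecutionReceipt, capacity),
	}
}

// Add inserts the receipt, evicting the oldest entry when the cache is full.
func (c *receiptCache) Add(receipt *flow.ExecutionReceipt) {
	c.mu.Lock()
	defer c.mu.Unlock()

	id := receipt.ID()
	if _, ok := c.byID[id]; ok {
		return // already cached
	}
	if c.order.Len() >= c.capacity {
		oldest := c.order.Remove(c.order.Front()).(flow.Identifier)
		delete(c.byID, oldest)
	}
	c.order.PushBack(id)
	c.byID[id] = receipt
}
```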

	if err != nil {
		return fmt.Errorf("failed to store execution receipt: %w", err)
	}

	e.collectionExecutedMetric.ExecutionReceiptReceived(receipt)
	return nil
}
52 changes: 52 additions & 0 deletions engine/access/ingestion2/execution_result_container.go
@@ -0,0 +1,52 @@
package ingestion2

import (
	"fmt"

	"github.com/onflow/flow-go/model/flow"
	pipeline "github.com/onflow/flow-go/module/executiondatasync/optimistic_syncing"
	"github.com/onflow/flow-go/module/forest"
)

var _ forest.Vertex = (*ExecutionResultContainer)(nil)

// ExecutionResultContainer represents an ExecutionResult within the LevelledForest.
// Implements LevelledForest's Vertex interface.
type ExecutionResultContainer struct {
	result      *flow.ExecutionResult
	resultID    flow.Identifier // precomputed ID of result to avoid expensive hashing on each call
	blockHeader *flow.Header    // header of the block which the result is for
	pipeline    pipeline.Pipeline
}

// NewExecutionResultContainer instantiates an ExecutionResultContainer for the given
// result, block header, and pipeline.
// No errors are expected during normal operation.
func NewExecutionResultContainer(
	result *flow.ExecutionResult,
	header *flow.Header,
	pipeline pipeline.Pipeline,
) (*ExecutionResultContainer, error) {
	// sanity check: the result must be for the given block
	if header.ID() != result.BlockID {
		return nil, fmt.Errorf("result is for a different block than the provided header")
	}

	return &ExecutionResultContainer{
		result:      result,
		resultID:    result.ID(),
		blockHeader: header,
		pipeline:    pipeline,
	}, nil
}

// VertexID returns the ExecutionResult ID of the ExecutionResultContainer.
func (c *ExecutionResultContainer) VertexID() flow.Identifier { return c.resultID }

// Level returns the View of the block the ExecutionResult is associated with.
func (c *ExecutionResultContainer) Level() uint64 { return c.blockHeader.View }

// Parent returns the ID and view of the parent result.
func (c *ExecutionResultContainer) Parent() (flow.Identifier, uint64) {
	return c.result.PreviousResultID, c.blockHeader.ParentView
}