From c9666ece4f1a983de8e36d0947d737958429405c Mon Sep 17 00:00:00 2001 From: Peter Argue <89119817+peterargue@users.noreply.github.com> Date: Wed, 16 Oct 2024 16:12:26 -0700 Subject: [PATCH 1/5] Add traces backfill option --- api/profiler.go | 4 +-- bootstrap/bootstrap.go | 12 +++++++++ config/config.go | 6 ++++- services/traces/engine.go | 53 +++++++++++++++++++++++++++++++++++++-- 4 files changed, 70 insertions(+), 5 deletions(-) diff --git a/api/profiler.go b/api/profiler.go index 683a7884a..cda1b8b89 100644 --- a/api/profiler.go +++ b/api/profiler.go @@ -30,8 +30,8 @@ func NewProfileServer( } } -func (h *ProfileServer) ListenAddr() string { - return h.endpoint +func (s *ProfileServer) ListenAddr() string { + return s.endpoint } func (s *ProfileServer) Start() { diff --git a/bootstrap/bootstrap.go b/bootstrap/bootstrap.go index c524fb1c7..54dbcc2a2 100644 --- a/bootstrap/bootstrap.go +++ b/bootstrap/bootstrap.go @@ -163,6 +163,18 @@ func (b *Bootstrap) StartTraceDownloader(ctx context.Context) error { ) StartEngine(ctx, b.traces, l) + + if b.config.TracesBackfillStartHeight > 0 { + endHeight := b.config.TracesBackfillEndHeight + if endHeight == 0 { + endHeight, err = b.storages.Blocks.LatestEVMHeight() + if err != nil { + return fmt.Errorf("failed to get latest EVM height: %w", err) + } + } + go b.traces.Backfill(b.config.TracesBackfillStartHeight, endHeight) + } + return nil } diff --git a/config/config.go b/config/config.go index 4fec57842..95066fcad 100644 --- a/config/config.go +++ b/config/config.go @@ -86,7 +86,9 @@ type Config struct { // TracesBucketName sets the GCP bucket name where transaction traces are being stored. TracesBucketName string // TracesEnabled sets whether the node is supporting transaction traces. - TracesEnabled bool + TracesEnabled bool + TracesBackfillStartHeight uint64 + TracesBackfillEndHeight uint64 // WalletEnabled sets whether wallet APIs are enabled WalletEnabled bool // WalletKey used for signing transactions @@ -158,6 +160,8 @@ func FromFlags() (*Config, error) { flag.Uint64Var(&forceStartHeight, "force-start-height", 0, "Force set starting Cadence height. WARNING: This should only be used locally or for testing, never in production.") flag.StringVar(&filterExpiry, "filter-expiry", "5m", "Filter defines the time it takes for an idle filter to expire") flag.StringVar(&cfg.TracesBucketName, "traces-gcp-bucket", "", "GCP bucket name where transaction traces are stored") + flag.Uint64Var(&cfg.TracesBackfillStartHeight, "traces-backfill-start-height", 0, "evm block height from which to start backfilling missing traces.") + flag.Uint64Var(&cfg.TracesBackfillEndHeight, "traces-backfill-end-height", 0, "evm block height until which to backfill missing traces. If 0, backfill until the latest block") flag.StringVar(&cloudKMSProjectID, "coa-cloud-kms-project-id", "", "The project ID containing the KMS keys, e.g. 'flow-evm-gateway'") flag.StringVar(&cloudKMSLocationID, "coa-cloud-kms-location-id", "", "The location ID where the key ring is grouped into, e.g. 'global'") flag.StringVar(&cloudKMSKeyRingID, "coa-cloud-kms-key-ring-id", "", "The key ring ID where the KMS keys exist, e.g. 'tx-signing'") diff --git a/services/traces/engine.go b/services/traces/engine.go index 0f089f0ed..1cbc99192 100644 --- a/services/traces/engine.go +++ b/services/traces/engine.go @@ -84,11 +84,11 @@ func (e *Engine) Notify(block *models.Block) { return } - go e.indexBlockTraces(block, cadenceID) + go e.indexBlockTraces(block, cadenceID, false) } // indexBlockTraces iterates the block transaction hashes and tries to download the traces -func (e *Engine) indexBlockTraces(evmBlock *models.Block, cadenceBlockID flow.Identifier) { +func (e *Engine) indexBlockTraces(evmBlock *models.Block, cadenceBlockID flow.Identifier, skipExisting bool) { ctx, cancel := context.WithTimeout(context.Background(), downloadTimeout) defer cancel() @@ -107,9 +107,17 @@ func (e *Engine) indexBlockTraces(evmBlock *models.Block, cadenceBlockID flow.Id l := e.logger.With(). Str("tx-id", h.String()). + Uint64("evm-height", evmBlock.Height). Str("cadence-block-id", cadenceBlockID.String()). Logger() + if skipExisting { + if _, err := e.traces.GetTransaction(h); err == nil { + l.Debug().Msg("trace already downloaded") + return + } + } + err := retry.Fibonacci(ctx, time.Second*1, func(ctx context.Context) error { trace, err := e.downloader.Download(h, cadenceBlockID) if err != nil { @@ -140,3 +148,44 @@ func (e *Engine) Error() <-chan error { func (e *Engine) Stop() { e.MarkStopped() } + +// Backfill redownloads traces for blocks from EVM start to end height. +func (e *Engine) Backfill(start uint64, end uint64) { + select { + case <-e.Ready(): + case <-e.Done(): + return + } + + e.logger.Info().Uint64("start", start).Uint64("end", end).Msg("backfilling traces") + for height := start; height <= end; height++ { + select { + case <-e.Done(): + return + case <-e.Stopped(): + return + default: + } + + l := e.logger.With().Uint64("evm-height", height).Logger() + + block, err := e.blocks.GetByHeight(height) + if err != nil { + l.Error().Err(err).Msg("failed to get block by height") + return + } + + if len(block.TransactionHashes) == 0 { + continue + } + + cadenceID, err := e.blocks.GetCadenceID(block.Height) + if err != nil { + l.Error().Err(err).Msg("failed to get cadence block ID") + return + } + + e.indexBlockTraces(block, cadenceID, true) + } + e.logger.Info().Uint64("start", start).Uint64("end", end).Msg("done backfilling traces") +} From 45d2dd8c632504ddd17f055a5c50bf1c862d10a2 Mon Sep 17 00:00:00 2001 From: Peter Argue <89119817+peterargue@users.noreply.github.com> Date: Wed, 16 Oct 2024 16:23:39 -0700 Subject: [PATCH 2/5] Add comments and update readme --- README.md | 72 +++++++++++++++++++++++++----------------------- config/config.go | 6 ++-- 2 files changed, 41 insertions(+), 37 deletions(-) diff --git a/README.md b/README.md index c3a3299b1..7932687de 100644 --- a/README.md +++ b/README.md @@ -172,41 +172,43 @@ Running the EVM gateway for mainnet requires additional security and stability m The application can be configured using the following flags at runtime: -| Flag | Default Value | Description | -|------------------------------|---------------------------------|------------------------------------------------------------------------------------------| -| `database-dir` | `./db` | Path to the directory for the database | -| `rpc-host` | `""` | Host for the RPC API server | -| `rpc-port` | `8545` | Port for the RPC API server | -| `ws-enabled` | `false` | Enable websocket connections | -| `access-node-grpc-host` | `localhost:3569` | Host to the flow access node gRPC API | -| `access-node-spork-hosts` | `""` | Previous spork AN hosts, defined as a comma-separated list (e.g. `"host-1.com,host2.com"`) | -| `flow-network-id` | `flow-emulator` | Flow network ID (options: `flow-emulator`, `flow-testnet`, `flow-mainnet`) | -| `coinbase` | `""` | Coinbase address to use for fee collection | -| `init-cadence-height` | `0` | Cadence block height to start indexing; avoid using on a new network | -| `gas-price` | `1` | Static gas price for EVM transactions | -| `coa-address` | `""` | Flow address holding COA account for submitting transactions | -| `coa-key` | `""` | Private key for the COA address used for transactions | -| `coa-key-file` | `""` | Path to a JSON file of COA keys for key-rotation (exclusive with `coa-key` flag) | -| `coa-resource-create` | `false` | Auto-create the COA resource if it doesn't exist in the Flow COA account | -| `coa-cloud-kms-project-id` | `""` | Project ID for KMS keys (e.g. `flow-evm-gateway`) | -| `coa-cloud-kms-location-id` | `""` | Location ID for KMS key ring (e.g. 'global') | -| `coa-cloud-kms-key-ring-id` | `""` | Key ring ID for KMS keys (e.g. 'tx-signing') | -| `coa-cloud-kms-keys` | `""` | KMS keys and versions, comma-separated (e.g. `"gw-key-6@1,gw-key-7@1"`) | -| `log-level` | `debug` | Log verbosity level (`debug`, `info`, `warn`, `error`, `fatal`, `panic`) | -| `log-writer` | `stderr` | Output method for logs (`stderr`, `console`) | -| `stream-limit` | `10` | Rate-limit for client events sent per second | -| `rate-limit` | `50` | Requests per second limit for clients over any protocol (ws/http) | -| `address-header` | `""` | Header for client IP when server is behind a proxy | -| `heartbeat-interval` | `100` | Interval for AN event subscription heartbeats | -| `stream-timeout` | `3` | Timeout in seconds for sending events to clients | -| `force-start-height` | `0` | Force-set starting Cadence height (local/testing use only) | -| `wallet-api-key` | `""` | ECDSA private key for wallet APIs (local/testing use only) | -| `filter-expiry` | `5m` | Expiry time for idle filters | -| `traces-gcp-bucket` | `""` | GCP bucket name for transaction traces | -| `index-only` | `false` | Run in index-only mode, allowing state queries and indexing but no transaction sending | -| `profiler-enabled` | `false` | Enable the pprof profiler server | -| `profiler-host` | `localhost` | Host for the pprof profiler | -| `profiler-port` | `6060` | Port for the pprof profiler | +| Flag | Default Value | Description | +|--------------------------------|-------------------------------|------------------------------------------------------------------------------------------| +| `database-dir` | `./db` | Path to the directory for the database | +| `rpc-host` | `""` | Host for the RPC API server | +| `rpc-port` | `8545` | Port for the RPC API server | +| `ws-enabled` | `false` | Enable websocket connections | +| `access-node-grpc-host` | `localhost:3569` | Host to the flow access node gRPC API | +| `access-node-spork-hosts` | `""` | Previous spork AN hosts, defined as a comma-separated list (e.g. `"host-1.com,host2.com"`) | +| `flow-network-id` | `flow-emulator` | Flow network ID (options: `flow-emulator`, `flow-testnet`, `flow-mainnet`) | +| `coinbase` | `""` | Coinbase address to use for fee collection | +| `init-cadence-height` | `0` | Cadence block height to start indexing; avoid using on a new network | +| `gas-price` | `1` | Static gas price for EVM transactions | +| `coa-address` | `""` | Flow address holding COA account for submitting transactions | +| `coa-key` | `""` | Private key for the COA address used for transactions | +| `coa-key-file` | `""` | Path to a JSON file of COA keys for key-rotation (exclusive with `coa-key` flag) | +| `coa-resource-create` | `false` | Auto-create the COA resource if it doesn't exist in the Flow COA account | +| `coa-cloud-kms-project-id` | `""` | Project ID for KMS keys (e.g. `flow-evm-gateway`) | +| `coa-cloud-kms-location-id` | `""` | Location ID for KMS key ring (e.g. 'global') | +| `coa-cloud-kms-key-ring-id` | `""` | Key ring ID for KMS keys (e.g. 'tx-signing') | +| `coa-cloud-kms-keys` | `""` | KMS keys and versions, comma-separated (e.g. `"gw-key-6@1,gw-key-7@1"`) | +| `log-level` | `debug` | Log verbosity level (`debug`, `info`, `warn`, `error`, `fatal`, `panic`) | +| `log-writer` | `stderr` | Output method for logs (`stderr`, `console`) | +| `stream-limit` | `10` | Rate-limit for client events sent per second | +| `rate-limit` | `50` | Requests per second limit for clients over any protocol (ws/http) | +| `address-header` | `""` | Header for client IP when server is behind a proxy | +| `heartbeat-interval` | `100` | Interval for AN event subscription heartbeats | +| `stream-timeout` | `3` | Timeout in seconds for sending events to clients | +| `force-start-height` | `0` | Force-set starting Cadence height (local/testing use only) | +| `wallet-api-key` | `""` | ECDSA private key for wallet APIs (local/testing use only) | +| `filter-expiry` | `5m` | Expiry time for idle filters | +| `traces-gcp-bucket` | `""` | GCP bucket name for transaction traces | +| `traces-backfill-start-height` | `0` | Start height for backfilling transaction traces | +| `traces-backfill-end-height` | `0` | End height for backfilling transaction traces | +| `index-only` | `false` | Run in index-only mode, allowing state queries and indexing but no transaction sending | +| `profiler-enabled` | `false` | Enable the pprof profiler server | +| `profiler-host` | `localhost` | Host for the pprof profiler | +| `profiler-port` | `6060` | Port for the pprof profiler | # Deploying Deploying the EVM Gateway node comes with some prerequisites as well as expectations and they are best explained in the WIP document: https://flowfoundation.notion.site/EVM-Gateway-Deployment-3c41da6710af40acbaf971e22ce0a9fd diff --git a/config/config.go b/config/config.go index 95066fcad..0f6c75b26 100644 --- a/config/config.go +++ b/config/config.go @@ -86,9 +86,11 @@ type Config struct { // TracesBucketName sets the GCP bucket name where transaction traces are being stored. TracesBucketName string // TracesEnabled sets whether the node is supporting transaction traces. - TracesEnabled bool + TracesEnabled bool + // TracesBackfillStartHeight sets the starting block height for backfilling missing traces. TracesBackfillStartHeight uint64 - TracesBackfillEndHeight uint64 + // TracesBackfillEndHeight sets the ending block height for backfilling missing traces. + TracesBackfillEndHeight uint64 // WalletEnabled sets whether wallet APIs are enabled WalletEnabled bool // WalletKey used for signing transactions From 9232c44e8c5a0a2b1df57dc000da9b31bca19751 Mon Sep 17 00:00:00 2001 From: Peter Argue <89119817+peterargue@users.noreply.github.com> Date: Wed, 16 Oct 2024 16:34:21 -0700 Subject: [PATCH 3/5] validate range --- bootstrap/bootstrap.go | 10 +++++++++- config/config.go | 4 ++++ 2 files changed, 13 insertions(+), 1 deletion(-) diff --git a/bootstrap/bootstrap.go b/bootstrap/bootstrap.go index 54dbcc2a2..478f86a95 100644 --- a/bootstrap/bootstrap.go +++ b/bootstrap/bootstrap.go @@ -165,14 +165,22 @@ func (b *Bootstrap) StartTraceDownloader(ctx context.Context) error { StartEngine(ctx, b.traces, l) if b.config.TracesBackfillStartHeight > 0 { + startHeight := b.config.TracesBackfillStartHeight + if _, err := b.storages.Blocks.GetByHeight(startHeight); err != nil { + return fmt.Errorf("failed to get provided start height %d in db: %w", startHeight, err) + } + endHeight := b.config.TracesBackfillEndHeight if endHeight == 0 { endHeight, err = b.storages.Blocks.LatestEVMHeight() if err != nil { return fmt.Errorf("failed to get latest EVM height: %w", err) } + } else if _, err := b.storages.Blocks.GetByHeight(endHeight); err != nil { + return fmt.Errorf("failed to get provided end height %d in db: %w", endHeight, err) } - go b.traces.Backfill(b.config.TracesBackfillStartHeight, endHeight) + + go b.traces.Backfill(startHeight, endHeight) } return nil diff --git a/config/config.go b/config/config.go index 0f6c75b26..b51308a43 100644 --- a/config/config.go +++ b/config/config.go @@ -316,6 +316,10 @@ func FromFlags() (*Config, error) { cfg.TracesEnabled = cfg.TracesBucketName != "" + if cfg.TracesBackfillStartHeight > 0 && cfg.TracesBackfillEndHeight > 0 && cfg.TracesBackfillStartHeight > cfg.TracesBackfillEndHeight { + return nil, fmt.Errorf("traces backfill start height must be less than the end height") + } + if walletKey != "" { k, err := gethCrypto.HexToECDSA(walletKey) if err != nil { From 378e60f86d834fba4bced1f3496cd310cbcef52b Mon Sep 17 00:00:00 2001 From: Peter Argue <89119817+peterargue@users.noreply.github.com> Date: Thu, 17 Oct 2024 08:28:42 -0700 Subject: [PATCH 4/5] add check that backfill start height is after init height --- bootstrap/bootstrap.go | 13 +++++++++++++ services/traces/engine.go | 8 +++++--- 2 files changed, 18 insertions(+), 3 deletions(-) diff --git a/bootstrap/bootstrap.go b/bootstrap/bootstrap.go index 478f86a95..dbed6f484 100644 --- a/bootstrap/bootstrap.go +++ b/bootstrap/bootstrap.go @@ -170,6 +170,19 @@ func (b *Bootstrap) StartTraceDownloader(ctx context.Context) error { return fmt.Errorf("failed to get provided start height %d in db: %w", startHeight, err) } + cadenceStartHeight, err := b.storages.Blocks.GetCadenceHeight(startHeight) + if err != nil { + return fmt.Errorf("failed to get cadence height for backfill start height %d: %w", startHeight, err) + } + + if cadenceStartHeight < b.config.InitCadenceHeight { + b.logger.Warn(). + Uint64("evm-start-height", startHeight). + Uint64("cadence-start-height", cadenceStartHeight). + Uint64("init-cadence-height", b.config.InitCadenceHeight). + Msg("backfill start height is before initial cadence height. data may be missing from configured traces bucket") + } + endHeight := b.config.TracesBackfillEndHeight if endHeight == 0 { endHeight, err = b.storages.Blocks.LatestEVMHeight() diff --git a/services/traces/engine.go b/services/traces/engine.go index 1cbc99192..a76830c01 100644 --- a/services/traces/engine.go +++ b/services/traces/engine.go @@ -157,7 +157,9 @@ func (e *Engine) Backfill(start uint64, end uint64) { return } - e.logger.Info().Uint64("start", start).Uint64("end", end).Msg("backfilling traces") + lg := e.logger.With().Uint64("start", start).Uint64("end", end).Logger() + + lg.Info().Msg("backfilling traces") for height := start; height <= end; height++ { select { case <-e.Done(): @@ -167,7 +169,7 @@ func (e *Engine) Backfill(start uint64, end uint64) { default: } - l := e.logger.With().Uint64("evm-height", height).Logger() + l := lg.With().Uint64("evm-height", height).Logger() block, err := e.blocks.GetByHeight(height) if err != nil { @@ -187,5 +189,5 @@ func (e *Engine) Backfill(start uint64, end uint64) { e.indexBlockTraces(block, cadenceID, true) } - e.logger.Info().Uint64("start", start).Uint64("end", end).Msg("done backfilling traces") + lg.Info().Msg("done backfilling traces") } From 03d06c53f9aea0c0e930c3982e193ebbd5951619 Mon Sep 17 00:00:00 2001 From: Peter Argue <89119817+peterargue@users.noreply.github.com> Date: Thu, 17 Oct 2024 11:33:08 -0700 Subject: [PATCH 5/5] remove unused map that caused concurrent write in test --- services/traces/engine_test.go | 2 -- 1 file changed, 2 deletions(-) diff --git a/services/traces/engine_test.go b/services/traces/engine_test.go index 89473afcb..028309918 100644 --- a/services/traces/engine_test.go +++ b/services/traces/engine_test.go @@ -62,12 +62,10 @@ func TestTraceIngestion(t *testing.T) { return blockID, nil }) - downloadedHashes := make(map[gethCommon.Hash]struct{}) downloader. On("Download", mock.Anything, mock.Anything). Return(func(txID gethCommon.Hash, blkID flow.Identifier) (json.RawMessage, error) { require.Equal(t, blockID, blkID) - downloadedHashes[txID] = struct{}{} time.Sleep(time.Millisecond * 200) // simulate download delay return txTrace(txID), nil })