Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Migrate Events Processor to Use New Version Tracker Impl #560

Merged
merged 5 commits into from
Oct 23, 2024
Merged
Show file tree
Hide file tree
Changes from 4 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions rust/Cargo.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

2 changes: 1 addition & 1 deletion rust/integration-tests/src/models/queryable_models.rs
Original file line number Diff line number Diff line change
Expand Up @@ -149,8 +149,8 @@ pub struct FungibleAssetMetadataModel {
pub supply_aggregator_table_handle_v1: Option<String>,
pub supply_aggregator_table_key_v1: Option<String>,
pub token_standard: String,
pub is_token_v2: Option<bool>,
pub inserted_at: chrono::NaiveDateTime,
pub is_token_v2: Option<bool>,
pub supply_v2: Option<BigDecimal>,
pub maximum_v2: Option<BigDecimal>,
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -34,6 +34,7 @@ pub async fn setup_events_processor_config(
processor_config,
transaction_stream_config,
db_config,
backfill_config: None,
},
processor_name,
)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,7 @@ pub fn setup_fa_processor_config(
processor_config,
transaction_stream_config,
db_config,
backfill_config: None,
},
processor_name,
)
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
-- This file should undo anything in `up.sql`
DROP TABLE IF EXISTS backfill_processor_status;
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
-- Your SQL goes here
-- Tracks the progress of a backfill; the primary key allows at most one row per alias.
CREATE TABLE backfill_processor_status (
-- Identifier of the backfill (primary key).
backfill_alias VARCHAR(50) NOT NULL,
-- Status text; the Rust `BackfillStatus` enum serializes to `in_progress` or `complete`.
backfill_status VARCHAR(50) NOT NULL,
-- NOTE(review): presumably the highest version processed so far; confirm against the writer.
last_success_version BIGINT NOT NULL,
-- Defaults to the insert time; this migration defines no trigger to refresh it on update.
last_updated TIMESTAMP NOT NULL DEFAULT NOW(),
-- Nullable: a row may exist before any transaction timestamp is known.
last_transaction_timestamp TIMESTAMP NULL,
-- Version bounds of the backfill. NOTE(review): inclusivity of the end bound is not
-- specified here; confirm against the code that writes these rows.
backfill_start_version BIGINT NOT NULL,
backfill_end_version BIGINT NOT NULL,
PRIMARY KEY (backfill_alias)
);
17 changes: 16 additions & 1 deletion rust/processor/src/db/postgres/schema.rs
Original file line number Diff line number Diff line change
Expand Up @@ -84,6 +84,20 @@ diesel::table! {
}
}

// Diesel schema for the `backfill_processor_status` table, keyed by `backfill_alias`.
// The column order mirrors the CREATE TABLE statement in the migration; keep the two in
// sync, because `Queryable` structs load columns by position.
diesel::table! {
backfill_processor_status (backfill_alias) {
#[max_length = 50]
backfill_alias -> Varchar,
#[max_length = 50]
backfill_status -> Varchar,
last_success_version -> Int8,
last_updated -> Timestamp,
last_transaction_timestamp -> Nullable<Timestamp>,
backfill_start_version -> Int8,
backfill_end_version -> Int8,
}
}

diesel::table! {
block_metadata_transactions (version) {
version -> Int8,
Expand Down Expand Up @@ -837,8 +851,8 @@ diesel::table! {
supply_aggregator_table_key_v1 -> Nullable<Text>,
#[max_length = 10]
token_standard -> Varchar,
is_token_v2 -> Nullable<Bool>,
inserted_at -> Timestamp,
is_token_v2 -> Nullable<Bool>,
Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This needed to be reordered; otherwise, whenever the migrations are re-run, the field ordering of the generated struct's constructor changes, which causes some issues.

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

To add a bit of context: this reverts the change I made manually. The order should always stay the same unless we change it in the SQL file.

supply_v2 -> Nullable<Numeric>,
maximum_v2 -> Nullable<Numeric>,
}
Expand Down Expand Up @@ -1285,6 +1299,7 @@ diesel::allow_tables_to_appear_in_same_query!(
ans_lookup_v2,
ans_primary_name,
ans_primary_name_v2,
backfill_processor_status,
block_metadata_transactions,
coin_activities,
coin_balances,
Expand Down
1 change: 1 addition & 0 deletions rust/sdk-processor/Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@ ahash = { workspace = true }
anyhow = { workspace = true }
aptos-indexer-processor-sdk = { workspace = true }
aptos-indexer-processor-sdk-server-framework = { workspace = true }
aptos-indexer-testing-framework = { workspace = true }
async-trait = { workspace = true }
bcs = { workspace = true }
bigdecimal = { workspace = true }
Expand Down
7 changes: 7 additions & 0 deletions rust/sdk-processor/src/config/indexer_processor_config.rs
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,7 @@ pub struct IndexerProcessorConfig {
pub processor_config: ProcessorConfig,
pub transaction_stream_config: TransactionStreamConfig,
pub db_config: DbConfig,
pub backfill_config: Option<BackfillConfig>,
}

#[async_trait::async_trait]
Expand Down Expand Up @@ -47,3 +48,9 @@ impl RunnableConfig for IndexerProcessorConfig {
before_underscore[..before_underscore.len().min(12)].to_string()
}
}

/// Backfill settings carried by `IndexerProcessorConfig::backfill_config`, where they are
/// optional.
///
/// `deny_unknown_fields` makes deserialization fail on any key other than the fields
/// declared below.
#[derive(Clone, Debug, Deserialize, Serialize)]
#[serde(deny_unknown_fields)]
pub struct BackfillConfig {
/// Alias naming this backfill.
/// NOTE(review): presumably matches `backfill_processor_status.backfill_alias`; confirm
/// against the status saver.
pub backfill_alias: String,
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,86 @@
// Copyright © Aptos Foundation
// SPDX-License-Identifier: Apache-2.0

#![allow(clippy::extra_unused_lifetimes)]

use crate::utils::database::DbPoolConnection;
use diesel::{
deserialize,
deserialize::{FromSql, FromSqlRow},
expression::AsExpression,
pg::{Pg, PgValue},
serialize,
serialize::{IsNull, Output, ToSql},
sql_types::Text,
AsChangeset, ExpressionMethods, Insertable, OptionalExtension, QueryDsl, Queryable,
};
use diesel_async::RunQueryDsl;
use processor::schema::backfill_processor_status;
use std::io::Write;

/// State of a backfill, mapped to the SQL `Text` type.
///
/// The manual `ToSql`/`FromSql` impls in this file convert the variants to and from the
/// strings `in_progress` and `complete`.
#[derive(Debug, PartialEq, FromSqlRow, AsExpression, Eq)]
#[diesel(sql_type = Text)]
pub enum BackfillStatus {
/// Serialized as `in_progress`.
InProgress,
/// Serialized as `complete`.
Complete,
}

impl ToSql<Text, Pg> for BackfillStatus {
fn to_sql<'b>(&'b self, out: &mut Output<'b, '_, Pg>) -> serialize::Result {
match *self {
BackfillStatus::InProgress => out.write_all(b"in_progress")?,
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

nit: should we have the bytes in a constant var?

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

done

BackfillStatus::Complete => out.write_all(b"complete")?,
}
Ok(IsNull::No)
}
}

impl FromSql<Text, Pg> for BackfillStatus {
    /// Decodes a Postgres text value into a [`BackfillStatus`].
    ///
    /// # Errors
    ///
    /// Returns an error that names the offending value when the bytes are neither
    /// `in_progress` nor `complete`.
    fn from_sql(bytes: PgValue<'_>) -> deserialize::Result<Self> {
        match bytes.as_bytes() {
            b"in_progress" => Ok(BackfillStatus::InProgress),
            b"complete" => Ok(BackfillStatus::Complete),
            // Include the raw value so a bad row can be identified from the error alone;
            // lossy decoding keeps this safe even if the bytes are not valid UTF-8.
            unknown => Err(format!(
                "Unrecognized BackfillStatus value: {:?}",
                String::from_utf8_lossy(unknown)
            )
            .into()),
        }
    }
}

#[derive(AsChangeset, Debug, Insertable)]
#[diesel(table_name = backfill_processor_status)]
/// Write model for the `backfill_processor_status` table (usable as an insert or a changeset).
///
/// `last_updated` is deliberately absent from this struct, so an insert falls back to the
/// column's database default and a changeset built from this struct leaves it untouched.
pub struct BackfillProcessorStatus {
/// Primary key of the row.
pub backfill_alias: String,
/// Stored as text via the `ToSql` impl on `BackfillStatus`.
pub backfill_status: BackfillStatus,
/// NOTE(review): presumably the latest version successfully processed; confirm against the
/// code that builds this struct.
pub last_success_version: i64,
/// `None` maps to SQL NULL.
pub last_transaction_timestamp: Option<chrono::NaiveDateTime>,
pub backfill_start_version: i64,
pub backfill_end_version: i64,
}

#[derive(AsChangeset, Debug, Queryable)]
#[diesel(table_name = backfill_processor_status)]
/// Read model for a full row of the `backfill_processor_status` table.
///
/// The fields are declared in the same order as the columns in the diesel schema;
/// `Queryable` loads columns by position, so keep the two in sync.
/// NOTE(review): `AsChangeset` is derived here as well; confirm whether this read model is
/// ever used for updates.
pub struct BackfillProcessorStatusQuery {
pub backfill_alias: String,
pub backfill_status: BackfillStatus,
pub last_success_version: i64,
/// Unlike the write model, the read model includes the `last_updated` column.
pub last_updated: chrono::NaiveDateTime,
pub last_transaction_timestamp: Option<chrono::NaiveDateTime>,
pub backfill_start_version: i64,
pub backfill_end_version: i64,
}

impl BackfillProcessorStatusQuery {
    /// Looks up the status row whose `backfill_alias` column equals `backfill_alias`.
    ///
    /// Returns `Ok(Some(row))` for a match and `Ok(None)` when no row exists; any other
    /// database error is passed through unchanged.
    pub async fn get_by_processor(
        backfill_alias: &str,
        conn: &mut DbPoolConnection<'_>,
    ) -> diesel::QueryResult<Option<Self>> {
        // Build the query in named steps: predicate first, then the filtered table.
        let alias_matches = backfill_processor_status::backfill_alias.eq(backfill_alias);
        let lookup = backfill_processor_status::table.filter(alias_matches);

        // `optional()` turns the "not found" error from `first` into `Ok(None)`.
        let fetched = lookup.first::<Self>(conn).await;
        fetched.optional()
    }
}
1 change: 1 addition & 0 deletions rust/sdk-processor/src/db/common/models/mod.rs
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
pub mod backfill_processor_status;
pub mod events_models;
pub mod processor_status;
19 changes: 10 additions & 9 deletions rust/sdk-processor/src/processors/events_processor.rs
Original file line number Diff line number Diff line change
Expand Up @@ -4,9 +4,7 @@ use crate::{
processor_config::ProcessorConfig,
},
steps::{
common::latest_processed_version_tracker::{
LatestVersionProcessedTracker, UPDATE_PROCESSOR_STATUS_SECS,
},
common::get_processor_status_saver,
events_processor::{EventsExtractor, EventsStorer},
},
utils::{
Expand All @@ -19,7 +17,10 @@ use anyhow::Result;
use aptos_indexer_processor_sdk::{
aptos_indexer_transaction_stream::{TransactionStream, TransactionStreamConfig},
builder::ProcessorBuilder,
common_steps::{OrderByVersionStep, TransactionStreamStep},
common_steps::{
OrderByVersionStep, TransactionStreamStep, VersionTrackerStep,
DEFAULT_UPDATE_PROCESSOR_STATUS_SECS,
},
traits::{processor_trait::ProcessorTrait, IntoRunnableStep},
};
use std::time::Duration;
Expand Down Expand Up @@ -62,8 +63,6 @@ impl ProcessorTrait for EventsProcessor {
}

async fn run_processor(&self) -> Result<()> {
let processor_name = self.config.processor_config.name();

// Run migrations
match self.config.db_config {
DbConfig::PostgresConfig(ref postgres_config) => {
Expand Down Expand Up @@ -106,10 +105,12 @@ impl ProcessorTrait for EventsProcessor {
let events_storer = EventsStorer::new(self.db_pool.clone(), processor_config);
let order_step = OrderByVersionStep::new(
starting_version,
Duration::from_secs(UPDATE_PROCESSOR_STATUS_SECS),
Duration::from_secs(DEFAULT_UPDATE_PROCESSOR_STATUS_SECS),
);
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Could we actually remove the OrderByVersionStep for the events and fa processor? They're not needed since there's no parallel processing.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

removed.

let version_tracker = VersionTrackerStep::new(
get_processor_status_saver(self.db_pool.clone(), self.config.clone()),
DEFAULT_UPDATE_PROCESSOR_STATUS_SECS,
);
let version_tracker =
LatestVersionProcessedTracker::new(self.db_pool.clone(), processor_name.to_string());

// Connect processor steps together
let (_, buffer_receiver) = ProcessorBuilder::new_with_inputless_first_step(
Expand Down
3 changes: 3 additions & 0 deletions rust/sdk-processor/src/steps/common/mod.rs
Original file line number Diff line number Diff line change
@@ -1 +1,4 @@
pub mod latest_processed_version_tracker;
pub mod processor_status_saver;

pub use processor_status_saver::get_processor_status_saver;
Loading
Loading