Skip to content

Commit

Permalink
feat(torii): add a script to verify data
Browse files Browse the repository at this point in the history
commit-id:c6195721
  • Loading branch information
lambda-0x committed Sep 24, 2024
1 parent 7757619 commit 3cc4907
Showing 1 changed file with 87 additions and 0 deletions.
87 changes: 87 additions & 0 deletions scripts/compare-torii-data.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,87 @@
# This script compares data across 'events', 'entities', and 'transactions' tables between two SQLite databases.
# Useful for making sure that changes made to torii don't affect the resulting data.

import sqlite3
import argparse

def fetch_table_data(db_path, table_name, columns):
    """Load the selected columns of a table, keyed by the first column.

    Args:
        db_path: Path of the SQLite database to open.
        table_name: Name of the table to read. It is interpolated into the
            SQL text as-is, so it must come from trusted code.
        columns: Column names to select (also interpolated as-is). The
            first column is used as the key of the returned mapping.

    Returns:
        A dict mapping each row's first selected value to a tuple holding
        the remaining selected values of that row. If the key value occurs
        in more than one row, the last row fetched wins.

    Raises:
        sqlite3.Error: If the database cannot be opened or queried (for
            example when the table or a column does not exist).
    """
    conn = sqlite3.connect(db_path)
    try:
        cursor = conn.cursor()
        cursor.execute(f"SELECT {', '.join(columns)} FROM {table_name}")
        return {row[0]: row[1:] for row in cursor.fetchall()}
    finally:
        # Close even when the query fails so the handle is never leaked.
        conn.close()

def get_table_row_count(db_path, table_name):
    """Return the number of rows stored in a table.

    Args:
        db_path: Path of the SQLite database to open.
        table_name: Name of the table to count. It is interpolated into
            the SQL text as-is, so it must come from trusted code.

    Returns:
        The value of ``SELECT COUNT(*)`` for the table.

    Raises:
        sqlite3.Error: If the database cannot be opened or queried (for
            example when the table does not exist).
    """
    conn = sqlite3.connect(db_path)
    try:
        cursor = conn.cursor()
        cursor.execute(f"SELECT COUNT(*) FROM {table_name}")
        return cursor.fetchone()[0]
    finally:
        # Close even when the query fails so the handle is never leaked.
        conn.close()

def compare_data(data1, data2, table_name):
    """Print every difference between two keyed row mappings.

    Args:
        data1: Mapping of row ID to row values taken from Database 1.
        data2: Mapping of row ID to row values taken from Database 2.
        table_name: Table name, used only in the printed messages.

    Returns:
        True if at least one difference was reported, False otherwise.
    """
    differences_found = False

    # Pass 1: rows of Database 1 that are missing from, or differ in, Database 2.
    for row_id, values in data1.items():
        if row_id not in data2:
            print(f"ID {row_id} found in {table_name} of Database 1 but not in Database 2")
            differences_found = True
        elif values != data2[row_id]:
            print(f"Mismatch found in {table_name} for ID {row_id}:")
            print(f" Database 1: {values}")
            print(f" Database 2: {data2[row_id]}")
            differences_found = True

    # Pass 2: rows that exist only in Database 2.
    for row_id in data2:
        if row_id not in data1:
            print(f"ID {row_id} found in {table_name} of Database 2 but not in Database 1")
            differences_found = True

    if not differences_found:
        print(f"No differences found in {table_name}")

    return differences_found

def compare_databases(db_path1, db_path2):
    """Compare the events, entities and transactions tables of two databases.

    Prints the row count of each table in both databases, then prints the
    per-row differences found in each table.

    Args:
        db_path1: Path of the first SQLite database ("Database 1").
        db_path2: Path of the second SQLite database ("Database 2").
    """
    # Columns to compare per table; time-dependent and event_id columns
    # are deliberately left out.
    table_columns = {
        "events": ["id", "keys", "data", "transaction_hash"],
        "entities": ["id", "keys"],
        "transactions": [
            "id",
            "transaction_hash",
            "sender_address",
            "calldata",
            "max_fee",
            "signature",
            "nonce",
            "transaction_type",
        ],
    }
    db_paths = (db_path1, db_path2)

    # Load the rows of every table from both databases.
    rows_by_table = {
        table: [fetch_table_data(path, table, columns) for path in db_paths]
        for table, columns in table_columns.items()
    }

    # Query the row counts separately from the fetched rows.
    counts_by_table = {
        table: [get_table_row_count(path, table) for path in db_paths]
        for table in table_columns
    }

    for table, (count1, count2) in counts_by_table.items():
        print(f"Number of rows in {table} table: Database 1 = {count1}, Database 2 = {count2}")

    for table, (rows1, rows2) in rows_by_table.items():
        print(f"\nComparing {table} table:")
        compare_data(rows1, rows2, table)

# Command-line entry point: takes the two database paths as positional arguments.
if __name__ == "__main__":
    cli = argparse.ArgumentParser(
        description="Compare data in events, entities, and transactions tables between two SQLite databases.",
    )
    for dest, ordinal in (("db_path1", "first"), ("db_path2", "second")):
        cli.add_argument(dest, help=f"Path to the {ordinal} SQLite database")
    options = cli.parse_args()

    compare_databases(options.db_path1, options.db_path2)

0 comments on commit 3cc4907

Please sign in to comment.