| |
|
|
| import torch |
| import traceback |
| import time |
|
|
| |
| from models.model import Oracle |
| from data.data_collator import MemecoinCollator |
| from models.multi_modal_processor import MultiModalEncoder |
| from data.data_loader import OracleDataset |
| from data.data_fetcher import DataFetcher |
| from models.helper_encoders import ContextualTimeEncoder |
| from models.token_encoder import TokenEncoder |
| from models.wallet_encoder import WalletEncoder |
| from models.graph_updater import GraphUpdater |
| from models.ohlc_embedder import OHLCEmbedder |
| from models.quant_ohlc_embedder import QuantOHLCEmbedder |
| import models.vocabulary as vocab |
| from data.quant_ohlc_feature_schema import NUM_QUANT_OHLC_FEATURES, TOKENS_PER_SEGMENT |
|
|
| |
| from clickhouse_driver import Client as ClickHouseClient |
| from neo4j import GraphDatabase |
|
|
| |
| |
| |
| |
def _select_device_and_dtype():
    """Pick the compute device and a matching floating-point dtype.

    Prefers CUDA with bfloat16 (falling back to float16 when bf16 kernels are
    unsupported); forces float32 on CPU where half precision is impractical.

    Returns:
        (torch.device, torch.dtype) tuple.
    """
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    if device.type == "cuda":
        dtype = torch.bfloat16 if torch.cuda.is_bf16_supported() else torch.float16
    else:
        dtype = torch.float32
    return device, dtype


def _build_encoders(dtype):
    """Instantiate every encoder module the Oracle pipeline needs, with defaults.

    Exits with a non-zero status if any constructor fails, since nothing
    downstream can run without them.

    Returns:
        Tuple of (multi_modal_encoder, time_enc, token_enc, wallet_enc,
        graph_upd, ohlc_emb, quant_ohlc_emb).
    """
    print("Instantiating encoders (using defaults)...")
    try:
        multi_modal_encoder = MultiModalEncoder(dtype=dtype)
        real_time_enc = ContextualTimeEncoder(dtype=dtype)
        # TokenEncoder consumes the multi-modal embedding, so its input dim
        # must track the encoder's embedding_dim.
        real_token_enc = TokenEncoder(
            multi_dim=multi_modal_encoder.embedding_dim,
            dtype=dtype,
        )
        real_wallet_enc = WalletEncoder(encoder=multi_modal_encoder, dtype=dtype)
        real_graph_upd = GraphUpdater(time_encoder=real_time_enc, dtype=dtype)
        real_ohlc_emb = OHLCEmbedder(
            num_intervals=vocab.NUM_OHLC_INTERVALS,
            dtype=dtype,
        )
        real_quant_ohlc_emb = QuantOHLCEmbedder(
            num_features=NUM_QUANT_OHLC_FEATURES,
            sequence_length=TOKENS_PER_SEGMENT,
            dtype=dtype,
        )
        print(f"TokenEncoder default output_dim: {real_token_enc.output_dim}")
        print(f"WalletEncoder default d_model: {real_wallet_enc.d_model}")
        print(f"OHLCEmbedder default output_dim: {real_ohlc_emb.output_dim}")
        print("Encoders instantiated.")
    except Exception as e:
        print(f"Failed to instantiate encoders: {e}")
        traceback.print_exc()
        # Was bare exit() (status 0) — exit non-zero so callers see the failure.
        raise SystemExit(1)
    return (
        multi_modal_encoder,
        real_time_enc,
        real_token_enc,
        real_wallet_enc,
        real_graph_upd,
        real_ohlc_emb,
        real_quant_ohlc_emb,
    )


def _build_dataset(horizons_seconds, quantiles):
    """Connect to ClickHouse + Neo4j and build an OracleDataset.

    Args:
        horizons_seconds: prediction horizons forwarded to the dataset.
        quantiles: quantile levels forwarded to the dataset.

    Returns:
        An OracleDataset capped at 57 samples.

    Exits non-zero when the databases are unreachable or contain no mints.
    """
    try:
        print("Connecting to databases...")
        # Local dev defaults; no auth on either store — TODO confirm for prod.
        clickhouse_client = ClickHouseClient(host='localhost', port=9000)
        neo4j_driver = GraphDatabase.driver("bolt://localhost:7687", auth=None)
        data_fetcher = DataFetcher(clickhouse_client=clickhouse_client, neo4j_driver=neo4j_driver)
        print("Database clients and DataFetcher initialized.")

        all_mints = data_fetcher.get_all_mints()
        if not all_mints:
            print("\n❌ No mints found in the database. Exiting test.")
            raise SystemExit(1)

        return OracleDataset(
            data_fetcher=data_fetcher,
            horizons_seconds=horizons_seconds,
            quantiles=quantiles,
            max_samples=57,
        )
    except Exception as e:
        # SystemExit is a BaseException and passes through this handler.
        print(f"FATAL: Could not initialize database connections or dataset: {e}")
        traceback.print_exc()
        raise SystemExit(1)


def _collect_batch(dataset):
    """Fetch every dataset sample, keeping the ones that load successfully.

    Returns:
        Non-empty list of samples; exits non-zero if none could be fetched.
    """
    print(f"\n--- Processing a batch of up to {len(dataset)} items from the dataset ---")
    batch_items = []
    for i in range(len(dataset)):
        token_addr = dataset.sampled_mints[i].get('mint_address', 'unknown')
        print(f" - Attempting to process sample {i+1}/{len(dataset)} ({token_addr})...")
        fetch_start = time.time()
        sample = dataset[i]
        fetch_elapsed = time.time() - fetch_start
        print(f" ... fetch completed in {fetch_elapsed:.2f}s")
        if sample is not None:
            batch_items.append(sample)
            print(f" ... Success! Sample added to batch.")
    if not batch_items:
        print("\n❌ No valid samples could be generated from the dataset. Exiting.")
        raise SystemExit(1)
    return batch_items


# Per-event numerical feature tensors produced by the collator, mapped to the
# trailing feature width expected for each (B, L, width) tensor.
_EVENT_FEATURE_WIDTHS = {
    'transfer_numerical_features': 4,
    'trade_numerical_features': 8,
    'deployer_trade_numerical_features': 8,
    'smart_wallet_trade_numerical_features': 8,
    'pool_created_numerical_features': 2,
    'liquidity_change_numerical_features': 1,
    'fee_collected_numerical_features': 1,
    'token_burn_numerical_features': 2,
    'supply_lock_numerical_features': 2,
    'onchain_snapshot_numerical_features': 14,
    'trending_token_numerical_features': 1,
    'boosted_token_numerical_features': 2,
    'dexboost_paid_numerical_features': 2,
}


def _run_pipeline_test(model, collator, batch_items, dtype, quantiles, horizons, ohlc_seq_len):
    """Collate the batch, sanity-check every tensor, and run a forward pass.

    Args:
        model: the Oracle model (already on device, eval mode).
        collator: MemecoinCollator used to batch the raw samples.
        batch_items: non-empty list of dataset samples.
        dtype: expected floating dtype of collated tensors.
        quantiles / horizons: grids used to interpret the quantile logits.
        ohlc_seq_len: expected OHLC sequence length from the collator.
    """
    print("\n--- Testing Pipeline (Collator + Model.forward) ---")
    try:
        collate_start = time.time()
        collated_batch = collator(batch_items)
        collate_elapsed = time.time() - collate_start
        print("Collation successful!")
        print(f"Collation time for batch of {len(batch_items)} tokens: {collate_elapsed:.2f}s")

        B = len(batch_items)
        L = collated_batch['attention_mask'].shape[1]

        # --- OHLC segment checks ---
        assert 'ohlc_price_tensors' in collated_batch
        ohlc_price_tensors = collated_batch['ohlc_price_tensors']
        assert ohlc_price_tensors.dim() == 3, f"Expected 3D OHLC tensor, got shape {tuple(ohlc_price_tensors.shape)}"
        assert ohlc_price_tensors.shape[1] == 2, f"Expected OHLC tensor with 2 rows (open/close), got {ohlc_price_tensors.shape[1]}"
        assert ohlc_price_tensors.shape[2] == ohlc_seq_len, f"Expected OHLC seq len {ohlc_seq_len}, got {ohlc_price_tensors.shape[2]}"
        assert collated_batch['ohlc_interval_ids'].shape[0] == ohlc_price_tensors.shape[0], "Interval ids must align with OHLC segments"
        assert ohlc_price_tensors.dtype == dtype, f"OHLC tensor dtype {ohlc_price_tensors.dtype} != expected {dtype}"
        print(f"Collator produced {ohlc_price_tensors.shape[0]} OHLC segment(s).")

        # --- Event-specific numerical feature checks (data-driven) ---
        assert collated_batch['dest_wallet_indices'].shape == (B, L)
        for name, width in _EVENT_FEATURE_WIDTHS.items():
            assert collated_batch[name].shape == (B, L, width), name
        print("Collator correctly processed all event-specific numerical data into their respective tensors.")

        # --- Debug output ---
        print("\n--- Collated Batch Debug Output ---")
        print(f"Batch Size: {B}, Max Sequence Length: {L}")

        print("\n[Core Tensors]")
        print(f" event_type_ids: {collated_batch['event_type_ids'].shape}")
        print(f" attention_mask: {collated_batch['attention_mask'].shape}")
        print(f" timestamps_float: {collated_batch['timestamps_float'].shape}")

        print("\n[Pointer Tensors]")
        print(f" wallet_indices: {collated_batch['wallet_indices'].shape}")
        print(f" token_indices: {collated_batch['token_indices'].shape}")

        print("\n[Encoder Inputs]")
        print(f" embedding_pool: {collated_batch['embedding_pool'].shape}")

        if collated_batch['token_encoder_inputs']['name_embed_indices'].numel() > 0:
            print(f" token_encoder_inputs contains {collated_batch['token_encoder_inputs']['name_embed_indices'].shape[0]} tokens.")
        else:
            print(" token_encoder_inputs is empty.")
        if collated_batch['wallet_encoder_inputs']['profile_rows']:
            print(f" wallet_encoder_inputs contains {len(collated_batch['wallet_encoder_inputs']['profile_rows'])} wallets.")
        else:
            print(" wallet_encoder_inputs is empty.")

        print("\n[Graph Links]")
        if collated_batch['graph_updater_links']:
            for link_name, data in collated_batch['graph_updater_links'].items():
                print(f" - {link_name}: {data['edge_index'].shape[1]} edges")
        else:
            print(" No graph links in this batch.")
        print("--- End Debug Output ---\n")

        print("Embedding pool size:", collated_batch["embedding_pool"].shape[0])
        print("Max name_emb_idx:", collated_batch["token_encoder_inputs"]["name_embed_indices"].max().item())

        # --- Forward pass ---
        with torch.no_grad():
            model_outputs = model(collated_batch)
        quantile_logits = model_outputs["quantile_logits"]
        hidden_states = model_outputs["hidden_states"]
        attention_mask = model_outputs["attention_mask"]
        pooled_states = model_outputs["pooled_states"]
        print("Model forward pass successful!")

        # --- Result checks ---
        print("\n--- Test Results ---")
        D_MODEL = model.d_model

        print(f"Final hidden_states shape: {hidden_states.shape}")
        print(f"Final attention_mask shape: {attention_mask.shape}")

        assert hidden_states.shape == (B, L, D_MODEL)
        assert attention_mask.shape == (B, L)
        assert hidden_states.dtype == dtype

        print(f"Output mean (sanity check): {hidden_states.mean().item()}")
        print(f"Pooled state shape: {pooled_states.shape}")
        print(f"Quantile logits shape: {quantile_logits.shape}")

        # Logits are laid out horizon-major: (B, horizons * quantiles).
        quantile_grid = quantile_logits.view(B, len(horizons), len(quantiles))
        print("\n[Quantile Predictions]")
        for b_idx in range(B):
            print(f" Sample {b_idx}:")
            for h_idx, horizon in enumerate(horizons):
                row = quantile_grid[b_idx, h_idx]
                print(f" Horizon {horizon}s -> " + ", ".join(
                    f"q={q:.2f}: {row[q_idx].item():.6f}"
                    for q_idx, q in enumerate(quantiles)
                ))

        print("\n✅ **Test Passed!** Full ENCODING pipeline is working.")

    except Exception as e:
        # Best-effort test harness: report and fall through (original behavior).
        print(f"\n❌ Error during pipeline test: {e}")
        traceback.print_exc()


def main():
    """End-to-end smoke test: build encoders + Oracle, fetch real data, collate, forward."""
    print("--- Oracle Inference Script (Full Pipeline Test) ---")

    OHLC_SEQ_LEN = 300
    print(f"Using {vocab.NUM_EVENT_TYPES} event types from vocabulary.")

    device, dtype = _select_device_and_dtype()
    print(f"Using device: {device}, dtype: {dtype}")

    # Quantile/horizon grids shared by the model and the dataset labels.
    _test_quantiles = [0.1, 0.5, 0.9]
    _test_horizons = [30, 60, 120, 240, 420]

    (
        multi_modal_encoder,
        real_time_enc,
        real_token_enc,
        real_wallet_enc,
        real_graph_upd,
        real_ohlc_emb,
        real_quant_ohlc_emb,
    ) = _build_encoders(dtype)

    collator = MemecoinCollator(
        event_type_to_id=vocab.EVENT_TO_ID,
        device=device,
        multi_modal_encoder=multi_modal_encoder,
        dtype=dtype,
        ohlc_seq_len=OHLC_SEQ_LEN,
        max_seq_len=50,
    )
    print("MemecoinCollator (fast batcher) instantiated.")

    print("Instantiating Oracle (full pipeline)...")
    model = Oracle(
        token_encoder=real_token_enc,
        wallet_encoder=real_wallet_enc,
        graph_updater=real_graph_upd,
        time_encoder=real_time_enc,
        multi_modal_dim=multi_modal_encoder.embedding_dim,
        num_event_types=vocab.NUM_EVENT_TYPES,
        event_pad_id=vocab.EVENT_TO_ID['__PAD__'],
        event_type_to_id=vocab.EVENT_TO_ID,
        model_config_name="Qwen/Qwen3-0.6B",
        quantiles=_test_quantiles,
        horizons_seconds=_test_horizons,
        dtype=dtype,
        ohlc_embedder=real_ohlc_emb,
        quant_ohlc_embedder=real_quant_ohlc_emb,
    ).to(device)
    model.eval()
    print(f"Oracle d_model: {model.d_model}")

    print("Creating Dataset...")
    dataset = _build_dataset(_test_horizons, _test_quantiles)
    batch_items = _collect_batch(dataset)
    _run_pipeline_test(model, collator, batch_items, dtype, _test_quantiles, _test_horizons, OHLC_SEQ_LEN)


if __name__ == "__main__":
    main()
|