Spaces:

LeoWalker
/

todo-agent

Sleeping

App Files Files Community

todo-agent / tests /test_web_search_brainstorming.py

LeoWalker

Clean repository with latest todo-agent code and article

2c060c5 about 1 month ago

raw

history blame contribute delete

6.82 kB

	"""
	Web Search Platform Research Test
	Tutorial: Research observability platforms and convert findings into writing tasks.
	"""

	import os
	import sys
	import asyncio
	import json
	from pathlib import Path
	from datetime import datetime
	from dotenv import load_dotenv
	from phoenix.otel import register
	import weave
	from agents import Runner, Agent

	sys.path.insert(0, str(Path(__file__).parent.parent))
	from agent.todo_agent import create_agent
	from agent.storage import JsonTodoStorage


	def reset_test_data():
	    """Wipe persisted state so every tutorial run starts from scratch.

	    Makes sure a ``data`` directory exists relative to the current working
	    directory, then overwrites ``todos.json`` with an empty list and
	    ``session_default.json`` with an empty history.
	    """
	    os.makedirs("data", exist_ok=True)

	    # (file to overwrite, fresh contents) pairs, written in this order.
	    blank_files = (
	        ("data/todos.json", []),
	        ("data/session_default.json", {"history": []}),
	    )
	    for target, payload in blank_files:
	        with open(target, "w") as handle:
	            json.dump(payload, handle)

	    print("🔄 Data reset - starting with clean slate")




	def initialize_tracing(project_name: str):
	    """Switch on Phoenix and Weave tracing without letting either abort the run.

	    Sets the tracing-related environment variables, registers Phoenix under
	    ``project_name``, and initialises Weave only when ``weave.get_client()``
	    reports no existing client. Exceptions raised by ``register`` or
	    ``weave.init`` are reported on stdout rather than propagated.
	    """
	    # Phoenix: minimal custom resource attributes, supplied via environment variable
	    resource_attrs = f"tutorial.name={project_name},tutorial.type=web_search,environment=test,app.name=todo-agent"
	    os.environ.update({
	        "OPENAI_TRACING_ENABLED": "1",
	        "WEAVE_PRINT_CALL_LINK": "false",
	        "OTEL_RESOURCE_ATTRIBUTES": resource_attrs,
	    })

	    try:
	        register(project_name=project_name, auto_instrument=True)
	        print(f"✅ Phoenix tracing initialized for: {project_name}")
	    except Exception as phoenix_error:
	        print(f"⚠️ Phoenix tracing failed: {phoenix_error}")

	    # A Weave client already exists; nothing more to set up.
	    if weave.get_client():
	        return

	    try:
	        weave.init(project_name)
	        print(f"✅ Weave tracing initialized for: {project_name}")
	    except Exception as weave_error:
	        print(f"⚠️ Weave tracing failed (continuing without Weave): {weave_error}")


	async def _run_research_conversation(agent, messages):
	    """Send each message to the agent in order, carrying the history forward."""
	    history = []

	    # Weave: Add minimal context attributes for this tutorial session
	    with weave.attributes({
	        'tutorial_type': 'web_search',
	        'environment': 'test',
	        'app_name': 'todo-agent',
	        'tutorial_name': 'platform-research-tutorial',
	    }):
	        for step, message in enumerate(messages, 1):
	            print(f"\n--- Research Step {step} ---")
	            print(f"User: {message}")

	            history.append({"role": "user", "content": message})
	            result = await Runner.run(agent, input=history)

	            print(f"Agent: {result.final_output}")
	            # The run's own input list becomes the starting point of the next turn.
	            history = result.to_input_list()

	            # Brief pause between turns.
	            await asyncio.sleep(0.5)


	def _validate_created_todos(minimum_tasks=3):
	    """Check ``data/todos.json`` and list its tasks; return the error messages found."""
	    try:
	        with open("data/todos.json", "r") as f:
	            todos = json.load(f)
	    except FileNotFoundError:
	        error_msg = "No todos.json file found"
	        print(f"❌ {error_msg}")
	        return [error_msg]

	    errors = []
	    total_todos = len(todos)

	    # Research tutorial should create at least `minimum_tasks` writing tasks
	    if total_todos < minimum_tasks:
	        error_msg = f"Expected at least {minimum_tasks} writing tasks from research, got {total_todos}"
	        errors.append(error_msg)
	        print(f"❌ {error_msg}")

	    print(f"\n📊 Research Results: {total_todos} writing tasks created from platform research")

	    for position, todo in enumerate(todos, 1):
	        # Skip empty or non-dict entries; they still count towards the total above.
	        if not todo or not isinstance(todo, dict):
	            continue
	        print(f"{position}. {todo.get('name', 'Unnamed Task')}")
	        if todo.get('description'):
	            print(f" Description: {todo['description']}")
	        if todo.get('project'):
	            print(f" Project: {todo['project']}")

	    return errors


	def _print_lessons():
	    """Print the closing summary of what the tutorial covered."""
	    print("\n🎓 What You Learned:")
	    print("• Web search integration for research workflows")
	    print("• Converting research findings into structured writing tasks")
	    print("• Multi-platform comparison methodology")
	    print("• Research stays in chat history, todos are actionable tasks")
	    print("🚀 Next: Try the natural language tutorial for project finishing touches!")


	async def run_web_search_test():
	    """Tutorial: Research platforms and create structured writing tasks.

	    Resets the data files, loads environment variables, initialises tracing,
	    then walks the agent through three web-search prompts followed by a
	    request to turn the findings into todos. Afterwards the todo file is
	    checked for at least three entries.

	    Returns:
	        True when validation produced no errors; False when validation
	        failed or any exception was raised along the way (the exception
	        message is printed, not re-raised).
	    """
	    start_time = datetime.now()

	    try:
	        reset_test_data()

	        load_dotenv()

	        initialize_tracing("observability-platform-research")

	        agent = create_agent(storage=JsonTodoStorage(), agent_name="To-Do Agent (Platform Research)")

	        print("🧪 Starting Web Search Platform Research Tutorial")
	        print("=" * 50)
	        print("🎯 Learn: Research workflow → structured task creation")
	        print("📚 Goal: Compare observability platforms for AI agents")

	        test_messages = [
	            # === Platform Research (3 searches with guided responses) ===
	            "Search for 'Arize Phoenix Cloud main benefits agent observability' and give me a brief 2 paragraph summary",

	            "Search for 'Weights & Biases Weave main benefits agent tracing' and give me a brief 2 paragraph summary",

	            "Search for 'OpenAI platform observability features benefits' and give me a brief 2 paragraph summary",

	            # === Convert Research to Tasks ===
	            "Based on this research, please add writing tasks to my 'Platform Comparison' project for comparing these platforms - I need specific tasks I can work on",
	        ]

	        await _run_research_conversation(agent, test_messages)

	        print("\n" + "=" * 50)
	        print("🎓 Platform Research Tutorial Complete")

	        # The run passes exactly when validation reported no errors.
	        overall_success = not _validate_created_todos()

	        _print_lessons()

	        duration = (datetime.now() - start_time).total_seconds()

	        if overall_success:
	            print(f"\n✅ TUTORIAL PASSED: Platform research complete! ({duration:.1f}s)")
	        else:
	            print(f"\n❌ TUTORIAL FAILED: Research workflow needs attention ({duration:.1f}s)")

	        return overall_success

	    except Exception as e:
	        # Top-level boundary: report any failure as a failed tutorial instead of crashing.
	        duration = (datetime.now() - start_time).total_seconds()
	        print(f"\n❌ TUTORIAL FAILED: {str(e)} ({duration:.1f}s)")
	        return False


	if __name__ == "__main__":
	    # Run the tutorial and report the outcome as the process exit status
	    # (0 = passed, 1 = failed). sys.exit is used instead of the bare
	    # ``exit`` helper, which is injected by the ``site`` module and is not
	    # available when the interpreter starts without it (e.g. ``python -S``).
	    success = asyncio.run(run_web_search_test())
	    sys.exit(0 if success else 1)