Spaces:

Zok213
/

ADY201M

Sleeping

Zok213 committed 8 days ago

Commit

f2826d8

1 Parent(s): a705291

fix

Files changed (3) hide show

__init__.py ADDED Viewed

File without changes

app.py CHANGED Viewed

@@ -1,19 +1,42 @@
-from fastapi import FastAPI, Query
 from typing import Optional
 from datetime import date
 import psycopg2
 import os
 from dotenv import load_dotenv
 # Load environment variables from .env file (optional, for local development)
 load_dotenv()
 app = FastAPI()
 def get_db_connection():
     conn = psycopg2.connect(os.getenv('DB_CONNECTION_STRING'))
     return conn
 @app.get("/data")
 def get_data(
     start_date: Optional[date] = Query(None),

+from fastapi import FastAPI, Query, BackgroundTasks
 from typing import Optional
 from datetime import date
 import psycopg2
 import os
 from dotenv import load_dotenv
+# Import your scraper function
+from scraper import get_china_cpi
 # Load environment variables from .env file (optional, for local development)
 load_dotenv()
 app = FastAPI()
 def get_db_connection():
     conn = psycopg2.connect(os.getenv('DB_CONNECTION_STRING'))
     return conn
+# Add a new endpoint to run the scraper
+@app.get("/run-scraper")
+async def run_scraper(background_tasks: BackgroundTasks):
+    """Run the China CPI scraper in the background"""
+    background_tasks.add_task(get_china_cpi)
+    return {"message": "Scraper started in background"}
+# Add a root endpoint
+@app.get("/")
+def root():
+    """Root endpoint with API information"""
+    return {
+        "message": "China CPI API",
+        "endpoints": [
+            {"path": "/", "method": "GET", "description": "This information"},
+            {"path": "/run-scraper", "method": "GET", "description": "Trigger the data scraper"},
+            {"path": "/data", "method": "GET", "description": "Get CPI data with optional filters"},
+            {"path": "/latest", "method": "GET", "description": "Get the latest CPI data"}
+        ]
+    }
+# Your existing endpoints
 @app.get("/data")
 def get_data(
     start_date: Optional[date] = Query(None),

scraper.py CHANGED Viewed

@@ -1,3 +1,4 @@
 from playwright.sync_api import sync_playwright
 import pandas as pd
 from datetime import datetime
@@ -50,6 +51,7 @@ def get_china_cpi(output_dir='data/raw/'):
             current_row_count = len(page.query_selector_all('#eventHistoryTable459 tbody tr'))
             if current_row_count == previous_row_count:
                 break
             page.evaluate('document.querySelector("#showMoreHistory459 a").click()')
             page.wait_for_function(
                 f"document.querySelectorAll('#eventHistoryTable459 tbody tr').length > {current_row_count}",

+# Ensure scraper.py contains a complete function that can be imported
 from playwright.sync_api import sync_playwright
 import pandas as pd
 from datetime import datetime
             current_row_count = len(page.query_selector_all('#eventHistoryTable459 tbody tr'))
             if current_row_count == previous_row_count:
                 break
+            # Fix the JavaScript method name
             page.evaluate('document.querySelector("#showMoreHistory459 a").click()')
             page.wait_for_function(
                 f"document.querySelectorAll('#eventHistoryTable459 tbody tr').length > {current_row_count}",