Spaces:

fireworks-ai
/

search-alchemy

Running

App Files Files Community

RobertoBarrosoLuque committed 22 days ago

Commit

03263ac

1 Parent(s): f9c74bd

Frontend V1

Browse files

Files changed (4) hide show

assets/fireworks_logo.png +0 -0
requirements.txt +5 -8
src/app.py +426 -0
src/config.py +194 -0

assets/fireworks_logo.png ADDED Viewed

requirements.txt CHANGED Viewed

@@ -1,11 +1,8 @@
-huggingface_hub
-openai
 gradio==5.42.0
 python-dotenv==1.0.0
-ipython
-scikit-learn
-jupyter
-altair
-matplotlib
-pandas
 numpy

 gradio==5.42.0
+openai
 python-dotenv==1.0.0
 numpy
+pandas
+scikit-learn
+rank-bm25
+faiss-cpu

src/app.py CHANGED Viewed

	@@ -0,0 +1,426 @@

+import gradio as gr
+import time
+from typing import List, Dict, Tuple
+from pathlib import Path
+import os
+from config import GRADIO_THEME, CUSTOM_CSS, EXAMPLE_QUERIES
+# Two directory levels above this file; used further down to locate the
+# "assets" folder that holds the logo image.
+_FILE_PATH = Path(__file__).parents[1]
+# Placeholder data for demo
+# Each record has "id", "title", "description" and "category". There is no
+# "score" key here: the stage functions add one when they build their results.
+SAMPLE_PRODUCTS = [
+    {
+        "id": 1,
+        "title": "Wireless Bluetooth Headphones",
+        "description": "High-quality wireless headphones with 30-hour battery life and noise cancellation.",
+        "category": "Electronics",
+    },
+    {
+        "id": 2,
+        "title": "Science Kit for Kids",
+        "description": "Educational science experiments kit perfect for children ages 5-10.",
+        "category": "Toys",
+    },
+    {
+        "id": 3,
+        "title": "Running Shoes - Men's",
+        "description": "Lightweight running shoes with cushioned soles and breathable mesh.",
+        "category": "Sports",
+    },
+    {
+        "id": 4,
+        "title": "Portable Bluetooth Speaker",
+        "description": "Waterproof speaker with 12-hour battery life and deep bass.",
+        "category": "Electronics",
+    },
+    {
+        "id": 5,
+        "title": "Ergonomic Office Chair",
+        "description": "Adjustable office chair with lumbar support and breathable fabric.",
+        "category": "Furniture",
+    },
+]
+def format_results(results: List[Dict], stage_name: str, metrics: Dict) -> str:
+    """Format search results as HTML."""
+    html_parts = [f"### {stage_name} Results\n\n"]
+    for idx, result in enumerate(results, 1):
+        html_parts.append(
+            f"""
+<div class="result-card">
+<strong>{idx}. {result['title']}</strong><br/>
+<span style="color: #64748B; font-size: 0.9em;">{result['description']}</span><br/>
+<span style="color: #94A3B8; font-size: 0.85em;">Category: {result['category']}</span><br/>
+<span style="color: #6720FF; font-weight: 600;">Score: {result['score']:.3f}</span>
+</div>
+"""
+        )
+    html_parts.append("\n### Metrics\n\n")
+    html_parts.append(
+        f"""
+<div class="metric-box">
+" <strong>Semantic Match:</strong> {metrics['semantic_match']:.3f}<br/>
+" <strong>Diversity:</strong> {metrics['diversity']:.3f}<br/>
+" <strong>Latency:</strong> {metrics['latency_ms']}ms
+</div>
+"""
+    )
+    return "".join(html_parts)
+def search_stage_1(query: str) -> Tuple[str, Dict]:
+    """Stage 1: Baseline BM25 keyword search."""
+    start_time = time.time()
+    # Placeholder: Simple keyword matching
+    results = []
+    for product in SAMPLE_PRODUCTS[:3]:
+        results.append({**product, "score": 0.65 + (len(results) * 0.05)})
+    latency = int((time.time() - start_time) * 1000)
+    metrics = {
+        "semantic_match": 0.58,
+        "diversity": 0.60,
+        "latency_ms": max(50, latency),
+    }
+    return format_results(results, "Stage 1: BM25 Baseline", metrics), metrics
+def search_stage_2(query: str) -> Tuple[str, Dict]:
+    """Stage 2: BM25 + Vector Embeddings."""
+    start_time = time.time()
+    # Placeholder: Simulated embedding search
+    results = []
+    for product in SAMPLE_PRODUCTS[:4]:
+        results.append({**product, "score": 0.72 + (len(results) * 0.04)})
+    latency = int((time.time() - start_time) * 1000)
+    metrics = {
+        "semantic_match": 0.72,
+        "diversity": 0.70,
+        "latency_ms": max(100, latency),
+    }
+    return format_results(results, "Stage 2: + Vector Embeddings", metrics), metrics
+def search_stage_3(query: str) -> Tuple[str, Dict]:
+    """Stage 3: BM25 + Embeddings + Query Expansion."""
+    start_time = time.time()
+    # Placeholder: Simulated query expansion
+    results = []
+    for product in SAMPLE_PRODUCTS[:5]:
+        results.append({**product, "score": 0.78 + (len(results) * 0.03)})
+    latency = int((time.time() - start_time) * 1000)
+    metrics = {
+        "semantic_match": 0.81,
+        "diversity": 0.75,
+        "latency_ms": max(150, latency),
+    }
+    return format_results(results, "Stage 3: + Query Expansion", metrics), metrics
+def search_stage_4(query: str) -> Tuple[str, Dict]:
+    """Stage 4: BM25 + Embeddings + Query Expansion + LLM Reranking."""
+    start_time = time.time()
+    # Placeholder: Simulated reranking
+    results = []
+    for product in SAMPLE_PRODUCTS[:5]:
+        results.append({**product, "score": 0.85 + (len(results) * 0.025)})
+    latency = int((time.time() - start_time) * 1000)
+    metrics = {
+        "semantic_match": 0.88,
+        "diversity": 0.80,
+        "latency_ms": max(200, latency),
+    }
+    return format_results(results, "Stage 4: + LLM Reranking", metrics), metrics
+def search_all_stages(query: str) -> Tuple[str, str, str, str, str]:
+    """Run search across all stages and return comparison."""
+    if not query.strip():
+        empty_msg = "Please enter a search query."
+        return empty_msg, empty_msg, empty_msg, empty_msg, empty_msg
+    results_1, metrics_1 = search_stage_1(query)
+    results_2, metrics_2 = search_stage_2(query)
+    results_3, metrics_3 = search_stage_3(query)
+    results_4, metrics_4 = search_stage_4(query)
+    comparison = generate_comparison_table([metrics_1, metrics_2, metrics_3, metrics_4])
+    return results_1, results_2, results_3, results_4, comparison
+def generate_comparison_table(all_metrics: List[Dict]) -> str:
+    """Generate comparison table for all stages."""
+    stage_names = [
+        "Stage 1: BM25",
+        "Stage 2: + Embeddings",
+        "Stage 3: + Query Expansion",
+        "Stage 4: + Reranking",
+    ]
+    html = """
+### Comparison Across All Stages
+<table class="comparison-table">
+<tr>
+    <th>Stage</th>
+    <th>Semantic Match</th>
+    <th>Diversity</th>
+    <th>Latency (ms)</th>
+</tr>
+"""
+    for idx, (name, metrics) in enumerate(zip(stage_names, all_metrics)):
+        html += f"""
+<tr>
+    <td><strong>{name}</strong></td>
+    <td>{metrics['semantic_match']:.3f}</td>
+    <td>{metrics['diversity']:.3f}</td>
+    <td>{metrics['latency_ms']}ms</td>
+</tr>
+"""
+    html += "</table>"
+    html += """
+### Key Insights
+<div class="metric-box">
+" <strong>Semantic Match improves by 52%</strong> from Stage 1 to Stage 4<br/>
+" <strong>Diversity increases by 33%</strong> showing more varied results<br/>
+" <strong>Latency stays under 200ms</strong> maintaining fast performance<br/>
+" Each stage adds incremental value to search quality
+</div>
+"""
+    return html
+def set_example(example: str) -> str:
+    """Set an example query."""
+    return example
+# Code snippets for each stage
+# Each CODE_STAGE_* constant is a Markdown fenced ``python`` block rendered in
+# a "Show Code" accordion. The snippets are display text; nothing in this file
+# executes them.
+# Stage 1 snippet: whitespace-tokenised BM25 ranking with rank_bm25. It expects
+# `documents` and `query` to be defined by the reader.
+CODE_STAGE_1 = """
+```python
+from rank_bm25 import BM25Okapi
+# Tokenize documents
+tokenized_docs = [doc.split() for doc in documents]
+# Create BM25 index
+bm25 = BM25Okapi(tokenized_docs)
+# Search
+query_tokens = query.split()
+scores = bm25.get_scores(query_tokens)
+# Get top results
+top_indices = scores.argsort()[-5:][::-1]
+results = [documents[i] for i in top_indices]
+```
+"""
+CODE_STAGE_2 = """
+```python
+from openai import OpenAI
+import faiss
+import numpy as np
+client = OpenAI(
+    base_url="https://api.fireworks.ai/inference/v1"
+)
+# Generate embeddings
+response = client.embeddings.create(
+    model="accounts/fireworks/models/qwen3-embedding-8b",
+    input=[query] + documents
+)
+# Extract embeddings
+query_emb = np.array(response.data[0].embedding)
+doc_embs = np.array([d.embedding for d in response.data[1:]])
+# FAISS search
+index = faiss.IndexFlatIP(doc_embs.shape[1])
+index.add(doc_embs)
+scores, indices = index.search(query_emb.reshape(1, -1), k=5)
+```
+"""
+# Stage 3 snippet (display text only): ask a chat model for key search
+# concepts, then embed that expanded query together with the documents.
+# The snippet is not self-contained: it uses `client`, `query` and `documents`
+# without defining them.
+CODE_STAGE_3 = """
+```python
+# Query expansion with LLM
+response = client.chat.completions.create(
+    model="accounts/fireworks/models/llama-v3p1-8b-instruct",
+    messages=[{
+        "role": "user",
+        "content": f"Extract 2-3 key search concepts from: {query}"
+    }]
+)
+expanded_query = response.choices[0].message.content
+# Search with expanded query
+response = client.embeddings.create(
+    model="accounts/fireworks/models/qwen3-embedding-8b",
+    input=[expanded_query] + documents
+)
+# Continue with embedding search...
+```
+"""
+# Stage 4 snippet (display text only): take 20 candidates from Stage 3 and
+# rerank them down to 5 through a rerank endpoint.
+# NOTE(review): `client.post(url, json=...)` followed by `.json()` looks like
+# an HTTP-client call (requests/httpx style), not the OpenAI SDK `client`
+# created in the Stage 2 snippet. Confirm which client is intended and whether
+# an Authorization header is needed.
+# NOTE(review): `get_stage_3_results` is not defined in any snippet here, and
+# the model id has no "accounts/" prefix unlike the other model ids. Verify
+# both against the Fireworks API before presenting this as runnable.
+CODE_STAGE_4 = """
+```python
+# First get top 20 candidates from Stage 3
+top_20_results = get_stage_3_results(query, k=20)
+# Rerank with Fireworks reranker
+rerank_response = client.post(
+    "https://api.fireworks.ai/inference/v1/rerank",
+    json={
+        "model": "fireworks/qwen3-reranker-8b",
+        "query": query,
+        "documents": [r["text"] for r in top_20_results],
+        "top_n": 5
+    }
+)
+# Get final ranked results
+final_results = [
+    top_20_results[r["index"]]
+    for r in rerank_response.json()["results"]
+]
+```
+"""
+# Build Gradio Interface
+with gr.Blocks(
+    css=CUSTOM_CSS, theme=GRADIO_THEME, title="Search Alchemy - Fireworks AI"
+) as demo:
+    # Header
+    with gr.Row():
+        with gr.Column(scale=3):
+            gr.Markdown(
+                """
+            <h1 class="header-title" style="font-size: 2.5em; text-align: left;">Search Alchemy</h1>
+            <p style="color: #64748B; font-size: 1.1em; margin-top: 0; text-align: left;">Building Production Search Pipelines with Fireworks AI</p>
+            """
+            )
+        with gr.Row(elem_classes="compact-header"):
+            with gr.Column(scale=1, min_width=150):
+                gr.Markdown(
+                    "<p style='margin: 0; padding: 0; font-size: 0.85em; color: #64748B;'>Powered by</p>"
+                )
+                gr.Image(
+                    value=str(_FILE_PATH / "assets" / "fireworks_logo.png"),
+                    height=35,
+                    width=140,
+                    show_label=False,
+                    show_download_button=False,
+                    container=False,
+                    show_fullscreen_button=False,
+                    show_share_button=False,
+                )
+    with gr.Row():
+        with gr.Column(scale=4):
+            query_input = gr.Textbox(
+                label="Search Query",
+                placeholder="Enter your search query...",
+                scale=3,
+                elem_classes="search-box",
+            )
+        with gr.Column(scale=1):
+            val = os.getenv("FIREWORKS_API_KEY", "")  # pragma: allowlist secret
+            api_key_value = gr.Textbox(  # pragma: allowlist secret
+                label="API Key",
+                type="password",
+                placeholder="Enter your Fireworks AI API key",
+                value=val,
+                container=True,
+                elem_classes="compact-input",
+            )
+    with gr.Row():
+        search_btn = gr.Button("Search", variant="primary", scale=1)
+    # Example queries
+    with gr.Row():
+        gr.Markdown("**Quick Examples:**")
+    with gr.Row():
+        example_buttons = []
+        for example in EXAMPLE_QUERIES:
+            btn = gr.Button(example, size="sm", variant="secondary")
+            example_buttons.append(btn)
+            btn.click(fn=set_example, inputs=[gr.State(example)], outputs=[query_input])
+    # Tabs for each stage
+    with gr.Tabs() as tabs:
+        # Stage 1 Tab
+        with gr.Tab("Stage 1: BM25 Baseline"):
+            stage1_output = gr.Markdown(label="Results")
+            with gr.Accordion("Show Code", open=False):
+                gr.Markdown(CODE_STAGE_1)
+        # Stage 2 Tab
+        with gr.Tab("Stage 2: + Vector Embeddings"):
+            stage2_output = gr.Markdown(label="Results")
+            with gr.Accordion("Show Code", open=False):
+                gr.Markdown(CODE_STAGE_2)
+        # Stage 3 Tab
+        with gr.Tab("Stage 3: + Query Expansion"):
+            stage3_output = gr.Markdown(label="Results")
+            with gr.Accordion("Show Code", open=False):
+                gr.Markdown(CODE_STAGE_3)
+        # Stage 4 Tab
+        with gr.Tab("Stage 4: + LLM Reranking"):
+            stage4_output = gr.Markdown(label="Results")
+            with gr.Accordion("Show Code", open=False):
+                gr.Markdown(CODE_STAGE_4)
+        # Comparison Tab
+        with gr.Tab("Compare All Stages"):
+            comparison_output = gr.Markdown(label="Comparison")
+    # Search button click handler
+    search_btn.click(
+        fn=search_all_stages,
+        inputs=[query_input],
+        outputs=[
+            stage1_output,
+            stage2_output,
+            stage3_output,
+            stage4_output,
+            comparison_output,
+        ],
+    )
+if __name__ == "__main__":
+    demo.launch()

src/config.py ADDED Viewed

	@@ -0,0 +1,194 @@

+import gradio as gr
+# Fireworks AI Model Configuration
+# Model identifiers for the embedding, chat and reranking stages. The same ids
+# appear as string literals in the code snippets shown by the app.
+EMBEDDING_MODEL = "accounts/fireworks/models/qwen3-embedding-8b"
+LLM_MODEL = "accounts/fireworks/models/llama-v3p1-8b-instruct"
+# NOTE(review): unlike the two ids above, this one has no "accounts/" prefix.
+# Confirm this is the form the rerank endpoint expects.
+RERANKER_MODEL = "fireworks/qwen3-reranker-8b"
+# Gradio Theme Configuration
+# Base theme with purple/violet/slate hues, then explicit overrides so buttons,
+# sliders and links use the #6720FF purple family on light backgrounds.
+GRADIO_THEME = gr.themes.Base(
+    primary_hue=gr.themes.colors.purple,
+    secondary_hue=gr.themes.colors.violet,
+    neutral_hue=gr.themes.colors.slate,
+    spacing_size=gr.themes.sizes.spacing_lg,
+    radius_size=gr.themes.sizes.radius_md,
+    text_size=gr.themes.sizes.text_md,
+    # Font stacks: a Google font first, then generic fallbacks.
+    font=[gr.themes.GoogleFont("Inter"), "ui-sans-serif", "system-ui", "sans-serif"],
+    font_mono=[gr.themes.GoogleFont("JetBrains Mono"), "monospace"],
+).set(
+    button_primary_background_fill="#6720FF",
+    button_primary_background_fill_hover="#7B2FFF",
+    button_primary_text_color="#FFFFFF",
+    button_secondary_background_fill="#F3F0FF",
+    button_secondary_background_fill_hover="#EDE9FE",
+    button_secondary_text_color="#6720FF",
+    slider_color="#6720FF",
+    link_text_color="#6720FF",
+    link_text_color_hover="#7B2FFF",
+    link_text_color_visited="#8B5CF6",
+    body_background_fill="#FAFBFC",
+    block_background_fill="#FFFFFF",
+    input_background_fill="#FFFFFF",
+    border_color_primary="#E6EAF4",
+)
+# Custom CSS
+# Stylesheet string for the Gradio app. The .result-card, .metric-box and
+# .comparison-table rules style HTML that the app generates at runtime;
+# .header-title and .search-box are attached to components in the layout.
+# The search-box focus rule also matches :focus-within, because the class is
+# set on the component wrapper while focus lands on the input inside it.
+CUSTOM_CSS = """
+.gradio-container {
+    font-family: 'Inter', 'Segoe UI', system-ui, sans-serif;
+    background: linear-gradient(135deg, #FAFBFC 0%, #F3F0FF 100%);
+}
+.header-title {
+    background: linear-gradient(135deg, #6720FF 0%, #8B5CF6 100%);
+    -webkit-background-clip: text;
+    -webkit-text-fill-color: transparent;
+    background-clip: text;
+    font-weight: 700;
+    text-align: center;
+    margin-bottom: 0.5em;
+}
+.subtitle {
+    color: #64748B;
+    text-align: center;
+    font-size: 1.1em;
+    margin-top: 0;
+}
+.search-box {
+    border: 2px solid #E6EAF4;
+    border-radius: 10px;
+    transition: all 0.2s ease;
+}
+.search-box:focus,
+.search-box:focus-within {
+    border-color: #6720FF;
+    box-shadow: 0 0 0 3px rgba(103, 32, 255, 0.1);
+}
+.result-card {
+    background: white;
+    border-radius: 12px;
+    padding: 16px;
+    margin: 8px 0;
+    box-shadow: 0 2px 4px rgba(103, 32, 255, 0.08);
+    border: 1px solid #E6EAF4;
+    transition: all 0.2s ease;
+}
+.result-card:hover {
+    box-shadow: 0 4px 12px rgba(103, 32, 255, 0.12);
+    border-color: #C4B5FD;
+}
+.metric-box {
+    background: linear-gradient(to right, #F3F0FF, #FFFFFF);
+    border-left: 3px solid #6720FF;
+    padding: 12px;
+    margin: 8px 0;
+    border-radius: 8px;
+    font-size: 0.9em;
+}
+.code-section {
+    background: linear-gradient(to right, #F3F0FF, #FFFFFF);
+    border-left: 3px solid #6720FF;
+    padding: 16px;
+    margin: 12px 0;
+    border-radius: 8px;
+    font-family: 'JetBrains Mono', monospace;
+    font-size: 0.9em;
+}
+.comparison-table {
+    width: 100%;
+    border-collapse: collapse;
+    margin: 20px 0;
+}
+.comparison-table th {
+    background: #6720FF;
+    color: white;
+    padding: 12px;
+    text-align: left;
+    font-weight: 600;
+}
+.comparison-table td {
+    padding: 12px;
+    border-bottom: 1px solid #E6EAF4;
+}
+.comparison-table tr:hover {
+    background: #F3F0FF;
+}
+::-webkit-scrollbar {
+    width: 8px;
+    height: 8px;
+}
+::-webkit-scrollbar-track {
+    background: #F3F0FF;
+    border-radius: 4px;
+}
+::-webkit-scrollbar-thumb {
+    background: #C4B5FD;
+    border-radius: 4px;
+}
+::-webkit-scrollbar-thumb:hover {
+    background: #A78BFA;
+}
+details {
+    border: 1px solid #E6EAF4;
+    border-radius: 10px;
+    padding: 12px;
+    margin: 10px 0;
+    background: white;
+}
+details[open] {
+    border-color: #6720FF;
+    box-shadow: 0 4px 12px rgba(103, 32, 255, 0.15);
+}
+summary {
+    font-weight: 600;
+    color: #6720FF;
+    cursor: pointer;
+    padding: 4px;
+}
+summary:hover {
+    color: #7B2FFF;
+}
+.logo-image {
+    display: flex;
+    justify-content: flex-end;
+    align-items: center;
+}
+.api-config-accordion {
+    margin: 10px 0;
+    padding: 0;
+}
+.api-config-accordion > .label-wrap {
+    font-size: 0.85em;
+    padding: 8px 12px;
+}
+"""
+# Example queries
+# One quick-example button is created per entry; clicking a button copies its
+# text into the search box.
+EXAMPLE_QUERIES = [
+    "gift for 5 year old who likes science",
+    "cheap wireless headphones good battery",
+    "running shoes",
+    "waterproof bluetooth speaker",
+    "ergonomic office chair under 200",
+]