# app.py — Groq-powered Gradio chat interface
# (from the Hugging Face Space "api-deepseek" by adikwok)
import gradio as gr
import requests
import os
from typing import List, Tuple
# Groq API Configuration (OpenAI-compatible chat-completions endpoint).
API_URL = "https://api.groq.com/openai/v1/chat/completions"
API_KEY = os.getenv("GROQ_API_KEY")  # This will read from HF Secrets; None when the secret is unset
# Debug info (will show in HF Spaces logs)
print(f"πŸ”‘ Groq API Key Status: {'βœ… Found' if API_KEY else '❌ Missing'}")
if API_KEY:
    # Only a short prefix is printed so the key never appears fully in logs.
    print(f"πŸ”‘ API Key Preview: {API_KEY[:8]}...")

# NOTE(review): when API_KEY is None this header reads "Bearer None"; both
# query_groq() and test_api_connection() check API_KEY before sending a
# request, so no unauthenticated call is actually made.
headers = {
    "Authorization": f"Bearer {API_KEY}",
    "Content-Type": "application/json"
}

# Groq models: model id (sent to the API) -> human-readable description.
MODELS = {
    "llama3-8b-8192": "Llama 3 8B ⚑ (Fastest)",
    "llama3-70b-8192": "Llama 3 70B 🧠 (Smartest)",
    "mixtral-8x7b-32768": "Mixtral 8x7B βš–οΈ (Balanced)",
    "gemma-7b-it": "Gemma 7B πŸ” (Google)"
}
def query_groq(message: str, history: List[Tuple[str, str]], model: str) -> str:
    """Send the conversation to Groq's chat-completions API and return the reply.

    Args:
        message: The new user message to send.
        history: Prior (user, assistant) turns; incomplete pairs are skipped.
        model: Groq model id to query (a key of ``MODELS``).

    Returns:
        The assistant's reply text, or a markdown-formatted error message —
        this function never raises; every failure mode is folded into a string.
    """
    # Without a key there is nothing to call — return setup instructions.
    if not API_KEY:
        return """❌ **API Key Not Found**
Please set up your API key in Hugging Face Spaces:
1. Go to your Space's **Settings**
2. Click **Repository secrets**
3. Add new secret:
- Name: `GROQ_API_KEY`
- Value: Your Groq API key
4. Restart the Space
Get your free API key at: [console.groq.com](https://console.groq.com)"""

    # User-facing explanations for the well-known HTTP failure codes.
    status_messages = {
        401: "❌ **Authentication Failed**\nInvalid API key. Please check your GROQ_API_KEY secret.",
        403: "❌ **Access Forbidden**\nAPI key doesn't have permission.",
        429: "❌ **Rate Limited**\nToo many requests. Groq has generous limits, this should be rare.",
        500: "❌ **Server Error**\nGroq server issue. Please try again.",
        503: "❌ **Service Unavailable**\nGroq is temporarily down. Try again in a moment.",
    }

    try:
        # Assemble the full conversation: system prompt, past turns, new message.
        conversation = [{
            "role": "system",
            "content": "You are a helpful AI assistant powered by Groq's lightning-fast inference.",
        }]
        for user_turn, assistant_turn in history:
            if user_turn and assistant_turn:
                conversation.append({"role": "user", "content": user_turn})
                conversation.append({"role": "assistant", "content": assistant_turn})
        conversation.append({"role": "user", "content": message})

        payload = {
            "model": model,
            "messages": conversation,
            "temperature": 0.7,
            "max_tokens": 2048,
            "stream": False,
            "stop": None,
        }
        response = requests.post(API_URL, headers=headers, json=payload, timeout=30)

        # Translate known failure codes; anything else unexpected raises below.
        friendly = status_messages.get(response.status_code)
        if friendly is not None:
            return friendly
        response.raise_for_status()

        result = response.json()
        choices = result.get("choices")
        if choices:
            return choices[0]["message"]["content"].strip()
        return f"❌ **Unexpected Response Format**\n```json\n{result}\n```"
    except requests.exceptions.Timeout:
        return "❌ **Timeout**\nRequest took too long (>30s). Try again."
    except requests.exceptions.ConnectionError:
        return "❌ **Connection Error**\nCannot connect to Groq API. Check internet connection."
    except requests.exceptions.RequestException as e:
        return f"❌ **Request Error**\n{str(e)}"
    except Exception as e:
        # Catch-all so the chat UI always gets a string back instead of a traceback.
        return f"❌ **Unexpected Error**\n{str(e)}"
def test_api_connection() -> str:
    """Probe the Groq API with a tiny request and return a status string.

    Returns a short emoji-prefixed status for display in the UI; never raises.
    """
    # No key means no point in probing the network at all.
    if not API_KEY:
        return "πŸ”΄ API Key Missing"

    # Minimal 5-token request against the cheapest/fastest model.
    probe_payload = {
        "model": "llama3-8b-8192",
        "messages": [{"role": "user", "content": "test"}],
        "max_tokens": 5,
    }
    try:
        reply = requests.post(API_URL, headers=headers, json=probe_payload, timeout=10)
        if reply.status_code == 200:
            return "🟒 Connected Successfully"
        return f"πŸ”΄ HTTP {reply.status_code}"
    except Exception as e:
        # Truncate the error so the status line stays compact in the UI.
        return f"πŸ”΄ Connection Failed: {str(e)[:50]}"
def create_gradio_interface():
    """Build and return the Gradio Blocks UI for the Groq chat app.

    Wires together a model selector, a chatbot panel, input controls,
    example prompts, and informational panels. Returns the (unlaunched)
    ``gr.Blocks`` demo so the caller decides how to serve it.
    """
    # Probe the API once at startup so the UI can show connectivity state.
    connection_status = test_api_connection()

    # Custom CSS for better UI: keep the app centered and comfortably narrow.
    css = """
    .gradio-container {
        max-width: 800px !important;
        margin: auto !important;
    }
    .chat-message {
        padding: 10px !important;
    }
    """

    with gr.Blocks(
        title="⚑ Groq AI Chat",
        theme=gr.themes.Soft(primary_hue="blue"),
        css=css
    ) as demo:
        # Header
        gr.Markdown("""
        # ⚑ Groq AI Chat
        ### Lightning-fast AI responses powered by Groq's LPUβ„’
        """)

        # Status indicator
        with gr.Row():
            gr.Markdown(f"**Connection Status:** {connection_status}")

        # Model selector. FIX: the original passed list(MODELS.keys()), which
        # showed raw model ids and left the friendly descriptions in MODELS
        # unused. (label, value) tuples display the description while still
        # submitting the model id to the API.
        with gr.Row():
            model_dropdown = gr.Dropdown(
                choices=[(desc, model_id) for model_id, desc in MODELS.items()],
                value="llama3-8b-8192",
                label="πŸ€– Select AI Model",
                info="Choose the model that best fits your needs"
            )

        # Chat interface
        chatbot = gr.Chatbot(
            label="πŸ’¬ Chat History",
            height=500,
            bubble_full_width=False,
            show_copy_button=True
        )

        # Input area: textbox plus explicit send button.
        with gr.Row():
            msg_textbox = gr.Textbox(
                label="✍️ Your Message",
                placeholder="Ask me anything... Groq responses are incredibly fast!",
                scale=4,
                lines=2,
                max_lines=5
            )
            send_button = gr.Button("Send ⚑", variant="primary", scale=1)

        # Control buttons
        with gr.Row():
            clear_button = gr.Button("πŸ—‘οΈ Clear Chat", variant="secondary")

        def respond(message: str, chat_history: List[List[str]], model: str):
            """Handle one chat turn: query the API and append to history.

            Returns ("", updated_history) so the textbox clears after sending.
            """
            if not message.strip():
                return "", chat_history
            # Convert gradio's [[user, bot], ...] format to (user, bot) tuples.
            history_tuples = [(h[0], h[1]) for h in chat_history if len(h) >= 2]
            bot_message = query_groq(message.strip(), history_tuples, model)
            chat_history.append([message, bot_message])
            return "", chat_history

        # Both Enter-in-textbox and the Send button trigger the same handler.
        msg_textbox.submit(
            respond,
            inputs=[msg_textbox, chatbot, model_dropdown],
            outputs=[msg_textbox, chatbot]
        )
        send_button.click(
            respond,
            inputs=[msg_textbox, chatbot, model_dropdown],
            outputs=[msg_textbox, chatbot]
        )
        clear_button.click(
            lambda: [],
            outputs=chatbot
        )

        # Example prompts
        gr.Examples(
            examples=[
                ["Hello! What makes Groq special?"],
                ["Explain quantum computing in simple terms"],
                ["Write a Python function to find prime numbers"],
                ["What's the difference between AI, ML, and Deep Learning?"],
                ["Help me debug this error: 'TypeError: 'str' object is not callable'"],
                ["Create a simple REST API with FastAPI"],
                ["Explain the concept of recursion with examples"],
                ["What are the latest trends in web development?"]
            ],
            inputs=msg_textbox,
            label="πŸ’‘ Try these examples:"
        )

        # Information accordion
        with gr.Accordion("ℹ️ About Groq & Models", open=False):
            gr.Markdown(f"""
            **πŸš€ Why Groq is Amazing:**
            - ⚑ **Fastest AI inference** in the world (500+ tokens/second)
            - πŸ†“ **Generous free tier** with high rate limits
            - πŸ”„ **Real-time responses** feel like magic
            - 🎯 **Consistent quality** across all models
            **πŸ€– Available Models:**
            {chr(10).join([f"- **{model}**: {desc}" for model, desc in MODELS.items()])}
            **πŸ”§ Technical Details:**
            - Powered by Groq's custom LPUβ„’ (Language Processing Unit)
            - Optimized for transformer model inference
            - Supports context windows up to 32K tokens
            - Enterprise-grade reliability and security
            """)

        # Footer
        gr.Markdown("""
        ---
        **πŸ”‘ Setup Instructions:**
        1. Get free API key: [console.groq.com](https://console.groq.com)
        2. Add to HF Spaces: Settings β†’ Repository secrets β†’ `GROQ_API_KEY`
        3. Restart your Space and enjoy lightning-fast AI!
        **πŸ’‘ Tips:**
        - Groq excels at coding, explanations, and creative tasks
        - Try different models to see which fits your use case
        - The speed difference is immediately noticeable!
        """)

    return demo
# Create and launch the interface (script entry point; does nothing on import).
if __name__ == "__main__":
    # Startup diagnostics mirror the module-level key check, visible in Space logs.
    print("πŸš€ Initializing Groq Chat Interface...")
    print(f"πŸ”‘ API Key Status: {'βœ… Ready' if API_KEY else '❌ Please add GROQ_API_KEY to secrets'}")
    demo = create_gradio_interface()
    # Bind on all interfaces at port 7860 — the standard address for an
    # HF Spaces web app.
    demo.launch(
        server_name="0.0.0.0",
        server_port=7860,
        show_error=True,
        show_api=False,  # Hide API docs for cleaner interface
        favicon_path=None
    )