import os import gradio as gr from huggingface_hub import InferenceClient import time client = InferenceClient("lambdaindie/lambda-1v-1B", token = os.getenv("HF_TOKEN")) css = """ @import url('https://fonts.googleapis.com/css2?family=JetBrains+Mono&display=swap'); * { font-family: 'JetBrains Mono', monospace !important; } html, body, .gradio-container { font-family: 'JetBrains Mono', monospace !important; background-color: #111 !important; color: #e0e0e0 !important; } textarea, input, button, select{ background-color: transparent !important; color: #e0e0e0 !important; border: 1px solid #444 !important; } .markdown-think { background-color: #1e1e1e; border-left: 4px solid #555; padding: 10px; margin-bottom: 8px; font-style: italic; white-space: pre-wrap; animation: pulse 1.5s infinite ease-in-out; } @keyframes pulse { 0% { opacity: 0.6; } 50% { opacity: 1.0; } 100% { opacity: 0.6; } } """ theme = gr.themes.Base( primary_hue="gray", font=[ gr.themes.GoogleFont("JetBrains Mono"), "monospace" ] ).set( body_background_fill="#111", body_text_color="#e0e0e0", button_primary_background_fill="#333", button_primary_text_color="#e0e0e0", input_background_fill="#222", input_border_color="#444", block_title_text_color="#fff" ) def respond(message, history, system_message, max_tokens, temperature, top_p): messages = [{"role": "system", "content": system_message}] if system_message else [] for user, assistant in history: if user: messages.append({"role": "user", "content": user}) if assistant: messages.append({"role": "assistant", "content": assistant}) thinking_prompt = messages + [{ "role": "user", "content": f"{message}\n\nThink a bit step-by-step before answering." }] reasoning = "" yield '