Spaces:

philschmid
/

Can-i-run-tgi

Sleeping

philschmid HF staff committed on Mar 14

Commit

d521aaf

•

1 Parent(s): 65db30c

Create app.py

Files changed (1) hide show

app.py ADDED Viewed

+#### INSTALL LIB
+import subprocess
+import os
+token = os.environ.get("GITHUB_TOKEN", None)
+if not token:
+    raise ValueError("Token not found")
+# Build the install command
+command = f"pip install git+https://x-access-token:{token}:x-oauth-basic@github.com/philschmid/model-recommender.git"
+subprocess.run(command, shell=True, check=True)
+#### INSTALL LIB
+import json
+import gradio as gr
+from recommender.main import get_tgi_config
+def greet(model_id, gpu_memory):
+    config = get_tgi_config(model_id, gpu_memory)
+    return json.dumps(config)
+demo = gr.Interface(
+    fn=greet,
+    inputs=[
+        gr.Textbox(label="Model ID", placeholder="meta-llama/Llama-2-7b-chat-hf"),
+        gr.Slider(
+            step=4000,
+            minimum=16_000,
+            maximum=640_000,
+            value=24_000,
+            label="GPU memory",
+            info="Select how much GPU memory you have available",
+        ),
+    ],
+    outputs=[gr.JSON()],
+)
+demo.launch()