Quanttum committed
Commit 99281ee · verified · 1 Parent(s): 8cc9472

Update app.py

Files changed (1)
  1. app.py +28 -11
app.py CHANGED
@@ -4,23 +4,29 @@ from peft import PeftModel
 import torch
 import re
 
-# THIS LINE IS THE ONLY CHANGE — un-gated, public, works instantly
-model_name = "unsloth/Meta-Llama-3.1-8B-Instruct-bnb-4bit"
+# Public, ungated base model + your LoRA (works 100% in Spaces)
+base_name = "unsloth/Meta-Llama-3.1-8B-Instruct-bnb-4bit"
+lora_name = "Quanttum/crypto-llama-lora-final"
 
-tokenizer = AutoTokenizer.from_pretrained(model_name)
+# Load base model (no auth needed)
+tokenizer = AutoTokenizer.from_pretrained(base_name)
 base_model = AutoModelForCausalLM.from_pretrained(
-    model_name,
+    base_name,
     torch_dtype=torch.float16,
     device_map="auto"
 )
-model = PeftModel.from_pretrained(base_model, "Quanttum/crypto-llama-lora-final")
 
+# Load your LoRA on top (your fine-tuning!)
+model = PeftModel.from_pretrained(base_model, lora_name)
+
+# Pipeline for generation
 pipe = pipeline(
     "text-generation",
     model=model,
     tokenizer=tokenizer,
     max_new_tokens=512,
     temperature=0.3,
+    top_p=0.9,
     repetition_penalty=1.15,
 )
 
@@ -35,17 +41,28 @@ TL;DR:"""
 
     output = pipe(prompt)[0]["generated_text"]
     response = output[len(prompt):].strip()
-    return response
 
-with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown("# 🚀 Crypto News Summarizer + Sentiment Analyzer\nFine-tuned Llama 3.1 8B")
-    gr.ChatInterface(
+    # Simple score extraction
+    score_match = re.search(r"[-+]?\d*\.\d+", response[-20:])
+    score = score_match.group(0) if score_match else "N/A"
+
+    full_response = response + f"\n\nSentiment Score: {score}"
+    return full_response
+
+# ChatGPT-style UI
+with gr.Blocks(theme=gr.themes.Soft(), title="Crypto News Summarizer") as demo:
+    gr.Markdown("# 🚀 Crypto News Summarizer + Sentiment Analyzer\nFine-tuned Llama 3.1 8B by @Quanttum")
+
+    chatbot = gr.ChatInterface(
         chat,
         examples=[
-            ["Bitcoin ETF inflows hit $1.5B this week!"],
+            ["Bitcoin ETF inflows hit $1.5B this week as institutional adoption surges."],
+            ["Mt. Gox starts repaying creditors in BTC — 140k coins incoming."],
             ["SEC approves spot Ethereum ETF!"],
-            ["Mt. Gox starts repaying creditors in BTC."],
+            ["China just banned all crypto trading again."],
         ],
+        title=None,
+        description="Paste any crypto news or tweet → get instant TL;DR + sentiment score (-1.0 to +1.0)",
         cache_examples=True,
     )
 
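A note on the new score extraction: the pattern r"[-+]?\d*\.\d+" only matches numbers that contain a decimal point, and it is searched over just the last 20 characters of the reply. A minimal stdlib sketch of that behavior (the helper name extract_score and the sample replies are ours, invented for illustration):

import re

PATTERN = r"[-+]?\d*\.\d+"

def extract_score(response: str) -> str:
    # Same logic as chat() above: search only the tail of the reply
    match = re.search(PATTERN, response[-20:])
    return match.group(0) if match else "N/A"

print(extract_score("TL;DR: ETF inflows surge. Sentiment: +0.8"))  # +0.8
print(extract_score("TL;DR: Bearish for miners. Score: -0.65"))    # -0.65
# An integer score has no decimal point, so the pattern misses it
print(extract_score("TL;DR: Mixed news. Sentiment: 1"))            # N/A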
 
 
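Two details of the generation call are worth noting. chat() strips the echoed prompt manually with output[len(prompt):]; the text-generation pipeline can instead return only the newly generated text. And temperature/top_p only apply when sampling is enabled, so passing do_sample=True makes that explicit rather than relying on the model's generation_config. A sketch of the equivalent call, assuming the pipe and prompt objects from the diff:

# Same result as output[len(prompt):].strip(), without the manual slice
result = pipe(
    prompt,
    return_full_text=False,  # pipeline drops the echoed prompt itself
    do_sample=True,          # required for temperature/top_p to take effect
)
response = result[0]["generated_text"].strip()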
 
 
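Finally, gr.ChatInterface always calls its function with the user message plus the running chat history, even when the history goes unused, and cache_examples=True runs that function on every example at startup, so this Space performs several 8B-model generations before the UI appears. A self-contained stub of the expected callback shape (the canned reply is a placeholder, not the Space's real output):

import gradio as gr

def chat(message, history):
    # ChatInterface passes (message, history); this app ignores history
    return f"TL;DR: {message}\n\nSentiment Score: 0.0"

demo = gr.ChatInterface(chat, examples=[["SEC approves spot Ethereum ETF!"]])

if __name__ == "__main__":
    demo.launch()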