willsh1997 committed on
Commit ed57b89 · 1 Parent(s): c396a2f

:sparkles: initial commit

Files changed (3)
  1. README.md +14 -2
  2. moral_compass_demo.py +132 -0
  3. requirements.txt +87 -0
README.md CHANGED
@@ -1,2 +1,14 @@
- # widget-moral-compass
- widget comparing moral compass of several models
+ ---
+ title: Moral Compass Gradio
+ emoji: 🏆
+ colorFrom: pink
+ colorTo: yellow
+ sdk: gradio
+ sdk_version: 5.23.3
+ app_file: moral_compass_demo.py
+ pinned: false
+ license: apache-2.0
+ short_description: compare different models and their moral compass
+ ---
+
+ Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
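The front matter above tells Spaces to run `moral_compass_demo.py` with the Gradio SDK. To try the same entry point locally, a minimal sketch (an assumption-laden example, not part of the Space config: it assumes the pinned dependencies from requirements.txt below are installed, a CUDA GPU is available, and the `spaces` package is importable outside Spaces):

    # Sketch: execute the Space's app_file locally, roughly what the Spaces runner does.
    import runpy

    runpy.run_path("moral_compass_demo.py", run_name="__main__")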
moral_compass_demo.py ADDED
@@ -0,0 +1,132 @@
+ import spaces
+ import torch
+ import pandas as pd
+ import gradio as gr
+ from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig, GenerationConfig, pipeline
+
+ quantization_config = BitsAndBytesConfig(load_in_4bit=True)
+
+ qwen_model_name = "Qwen/Qwen3-0.6B"
+
+ # load the tokenizer and the model
+ tokenizer = AutoTokenizer.from_pretrained(qwen_model_name)
+ qwen_model = AutoModelForCausalLM.from_pretrained(
+     qwen_model_name,
+     torch_dtype="auto",
+     device_map="auto",
+     quantization_config=quantization_config,
+ )
+
+ qwen_generationconfig = GenerationConfig(
+     max_new_tokens=512,
+     do_sample=True,  # temperature/top_p/min_p below only take effect when sampling is enabled
+     temperature=0.7,
+     top_p=0.8,  # was `top_k = 0.8`; top_k must be an int, and 0.8 matches Qwen3's recommended top_p
+     min_p=0,
+ )
+
+ def qwen_generate(input_question):
+     # prepare the model input
+     messages = [
+         {"role": "user", "content": input_question}
+     ]
+     text = tokenizer.apply_chat_template(
+         messages,
+         tokenize=False,
+         add_generation_prompt=True,
+         enable_thinking=False,  # Switches between thinking and non-thinking modes. Default is True.
+     )
+     model_inputs = tokenizer([text], return_tensors="pt").to(qwen_model.device)
+     print("tokenized")
+     # conduct text completion
+     generated_ids = qwen_model.generate(
+         **model_inputs,
+         generation_config=qwen_generationconfig,
+     )
+     print("outputs generated")
+     output_ids = generated_ids[0][len(model_inputs.input_ids[0]):].tolist()
+
+     content = tokenizer.decode(output_ids, skip_special_tokens=True).strip("\n")
+     return content
+
+ # Gemma 3 1B setup (originally labelled "Llama 2 7b chat"; the llama2_* names are kept for consistency with the rest of the file)
+ llama2_model_id = "unsloth/gemma-3-1b-it-bnb-4bit"
+ llama2_pipe = pipeline(
+     "text-generation",
+     model=llama2_model_id,
+     torch_dtype=torch.bfloat16,
+     device_map="auto",
+     # quantization_config=quantization_config,  # not needed: this checkpoint is already bnb-4bit quantized
+ )
+
+ # Llama 3.2 3B setup
+ llama3_model_id = "meta-llama/Llama-3.2-3B-Instruct"
+ llama3_pipe = pipeline(
+     "text-generation",
+     model=llama3_model_id,
+     torch_dtype=torch.bfloat16,
+     device_map="auto",
+     model_kwargs={"quantization_config": quantization_config},
+ )
+
+ @spaces.GPU
+ def llama_QA(input_question, pipe):
+     """
+     Ask a chat model a question via a text-generation pipeline and return its answer.
+     inputs:
+     - input_question [str]: question for the model to answer
+     - pipe [transformers.Pipeline]: text-generation pipeline to query
+     outputs:
+     - response [str]: the model's response
+     """
+     messages = [
+         {"role": "system", "content": "You are a helpful chatbot assistant. Answer all questions in the language they are asked in. Do not refuse to answer just because you lack real-time information; answer with the information you have."},
+         {"role": "user", "content": input_question},
+     ]
+
+     outputs = pipe(
+         messages,
+         max_new_tokens=512,
+     )
+     response = outputs[0]["generated_text"][-1]["content"]
+     return response
+
+
+ @spaces.GPU
+ def gradio_func(input_question):
+     """
+     Wrapper that runs the question through all three models so the Gradio button can call a single function.
+     """
+     output1 = qwen_generate(input_question)
+     output2 = llama_QA(input_question, llama2_pipe)
+     output3 = llama_QA(input_question, llama3_pipe)
+     # output4 = llama4_generate(input_question)
+     return output1, output2, output3  # , output4
+
+ # Create the Gradio interface
+ def create_interface():
+     with gr.Blocks() as demo:
+         with gr.Row():
+             question_input = gr.Textbox(
+                 label="Enter your question",
+                 interactive=True,
+                 value="""You are at a train track junction, with a lever in front of you that changes the active track. On one track, one of your loved ones is tied to the track; on the other, there are 5 strangers tied up, one after the other. If you do not use the lever in front of you to change the active track, then the 5 strangers die. If you do pull the lever, your loved one dies. What do you do?""",
+             )
+         with gr.Row():
+             submit_btn = gr.Button("Ask")
+         with gr.Row():
+             output1 = gr.Textbox(label="Qwen 3 output", interactive=False)
+             output2 = gr.Textbox(label="Gemma 3 output", interactive=False)
+             output3 = gr.Textbox(label="Llama 3.2 output", interactive=False)
+
+         submit_btn.click(
+             fn=gradio_func,
+             inputs=[question_input],
+             outputs=[
+                 output1,
+                 output2,
+                 output3,
+             ],
+         )
+
+     return demo
+
+
+ # Launch the app
+ demo = create_interface()
+ demo.launch()
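The Gradio wiring above sends one question to all three models through gradio_func. For a quick check without the UI, a minimal sketch of calling the wrapper directly (hypothetical usage, e.g. from an interactive session in the same environment; it assumes the models above loaded successfully, a GPU is available, and the sample question is only an illustration):

    # Sketch: call the wrapper directly instead of clicking the "Ask" button.
    sample_question = "Is it ever acceptable to lie to protect someone's feelings?"
    qwen_answer, gemma_answer, llama_answer = gradio_func(sample_question)
    print(qwen_answer, gemma_answer, llama_answer, sep="\n---\n")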
requirements.txt ADDED
@@ -0,0 +1,87 @@
+ accelerate==1.4.0
+ aiofiles==23.2.1
+ annotated-types==0.7.0
+ anyio==4.8.0
+ asttokens==3.0.0
+ bitsandbytes==0.45.4
+ certifi==2025.1.31
+ charset-normalizer==3.4.1
+ click==8.1.8
+ comm==0.2.2
+ debugpy==1.8.12
+ decorator==5.1.1
+ exceptiongroup==1.2.2
+ executing==2.2.0
+ fastapi==0.115.8
+ ffmpy==0.5.0
+ filelock==3.17.0
+ fsspec==2025.2.0
+ gradio==5.16.1
+ gradio_client==1.7.0
+ h11==0.14.0
+ httpcore==1.0.7
+ httpx==0.28.1
+ huggingface-hub
+ idna==3.10
+ ipykernel==6.29.5
+ ipython==8.32.0
+ jedi==0.19.2
+ Jinja2==3.1.5
+ jupyter_client==8.6.3
+ jupyter_core==5.7.2
+ markdown-it-py==3.0.0
+ MarkupSafe==2.1.5
+ matplotlib-inline==0.1.7
+ mdurl==0.1.2
+ mpmath==1.3.0
+ nest-asyncio==1.6.0
+ networkx==3.4.2
+ numpy==2.2.3
+ orjson==3.10.15
+ packaging==24.2
+ pandas==2.2.3
+ parso==0.8.4
+ pexpect==4.9.0
+ pillow==11.1.0
+ platformdirs==4.3.6
+ prompt_toolkit==3.0.50
+ psutil==7.0.0
+ ptyprocess==0.7.0
+ pure_eval==0.2.3
+ pydantic==2.10.6
+ pydantic_core==2.27.2
+ pydub==0.25.1
+ Pygments==2.19.1
+ python-dateutil==2.9.0.post0
+ python-multipart==0.0.20
+ pytz==2025.1
+ PyYAML==6.0.2
+ pyzmq==26.2.1
+ regex==2024.11.6
+ requests==2.32.3
+ rich==13.9.4
+ ruff==0.9.6
+ safehttpx==0.1.6
+ safetensors==0.5.2
+ semantic-version==2.10.0
+ shellingham==1.5.4
+ six==1.17.0
+ sniffio==1.3.1
+ stack-data==0.6.3
+ starlette==0.45.3
+ sympy==1.13.1
+ tokenizers==0.21.0
+ tomlkit==0.13.2
+ torch==2.4.0
+ tornado==6.4.2
+ tqdm==4.67.1
+ traitlets==5.14.3
+ transformers==4.51.0
+ typer==0.15.1
+ typing_extensions==4.12.2
+ tzdata==2025.1
+ urllib3==2.3.0
+ uvicorn==0.34.0
+ wcwidth==0.2.13
+ websockets==14.2
+