Dimitre committed on
Commit 1fd4dc6
1 Parent(s): f8817da

App final update

Files changed (2)
  1. app.py +2 -3
  2. requirements.txt +0 -1
app.py CHANGED
@@ -4,7 +4,7 @@ import os
 import streamlit as st
 import torch
 from dotenv import load_dotenv
-from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig
+from transformers import AutoModelForCausalLM, AutoTokenizer
 
 from hangman import guess_letter
 from hf_utils import query_hint, query_word
@@ -34,7 +34,6 @@ def setup(model_id: str, device: str) -> None:
         model_id (str): Model ID used to load the tokenizer and model.
     """
     logger.info(f"Loading model and tokenizer from model: '{model_id}'")
-    quantization_config = BitsAndBytesConfig(load_in_4bit=True)
 
     tokenizer = AutoTokenizer.from_pretrained(
         model_id,
@@ -44,7 +43,7 @@ def setup(model_id: str, device: str) -> None:
         model_id,
         torch_dtype=torch.float16,
         token=os.environ["HF_ACCESS_TOKEN"],
-        quantization_config=quantization_config,
+        device_map="auto",
     ).to(device)
     logger.info("Setup finished")
     return {"tokenizer": tokenizer, "model": model}
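Net effect on the model-loading call, assembled from the hunks above for readability: the 4-bit BitsAndBytesConfig path is dropped in favor of plain float16 weights placed by accelerate via device_map="auto". The assignment line model = AutoModelForCausalLM.from_pretrained( sits just above the last hunk and is not shown in the diff, so its exact spelling here is an assumption.

Before this commit (sketch):

    # 4-bit quantization via bitsandbytes
    quantization_config = BitsAndBytesConfig(load_in_4bit=True)
    model = AutoModelForCausalLM.from_pretrained(
        model_id,
        torch_dtype=torch.float16,
        token=os.environ["HF_ACCESS_TOKEN"],
        quantization_config=quantization_config,
    ).to(device)

After this commit (sketch):

    # full float16 weights, device placement handled by accelerate
    model = AutoModelForCausalLM.from_pretrained(
        model_id,
        torch_dtype=torch.float16,
        token=os.environ["HF_ACCESS_TOKEN"],
        device_map="auto",
    ).to(device)

Since device_map="auto" is implemented through accelerate, that package stays in requirements.txt while bitsandbytes is removed below.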
requirements.txt CHANGED
@@ -2,5 +2,4 @@ streamlit
 python-dotenv
 torch
 transformers
-bitsandbytes
 accelerate
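Only bitsandbytes is dropped; the other five packages are unchanged. A throwaway sanity check (not part of the repo, shown only as an illustration) that the trimmed environment still covers what the app imports:

import importlib.util

# python-dotenv installs as the importable module "dotenv";
# accelerate stays because transformers needs it for device_map="auto".
for pkg in ("streamlit", "dotenv", "torch", "transformers", "accelerate"):
    assert importlib.util.find_spec(pkg) is not None, f"missing dependency: {pkg}"
print("all requirements importable; bitsandbytes no longer needed")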