thomasabebe
/

mistralSun11

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

thomasabebe committed on May 23

Commit

7b7297d

•

1 Parent(s): c75004b

Create handler.py

Files changed (1) hide show

handler.py +30 -0

handler.py ADDED Viewed

	@@ -0,0 +1,30 @@

+import torch
+import bitsandbytes as bnb
+from transformers import AutoTokenizer, AutoModelForCausalLM  # Adjusted import for the correct model type
+import os
+from typing import Dict, List, Any
+# NOTE: no Hugging Face token is set in this file; if the model repo is private, supply the token through the endpoint's environment (e.g. HF_TOKEN).
+class EndpointHandler:
+    def __init__(self, model_path="thomasabebe/coolmodel"):
+        self.tokenizer = AutoTokenizer.from_pretrained(model_path)
+        self.model = AutoModelForCausalLM.from_pretrained(model_path, torch_dtype=torch.float32)  # Adjusted model class
+    def __call__(self, data):
+        # Extract inputs from the data
+        inputs = data.get("inputs", "")
+        # Preprocess the inputs
+        encoded_input = self.tokenizer(inputs, return_tensors='pt', padding=True, truncation=True)
+        # Get predictions
+        output = self.model(**encoded_input)
+        # Postprocess the outputs
+        prediction = output.logits.argmax(-1).tolist()  # Convert the tensor to a list
+        # Return the result
+        return {"label": prediction}