samsonsbike committed
Commit 99557a7
1 Parent(s): 084a6a5

Update handler.py

Files changed (1)
  1. handler.py +35 -27
handler.py CHANGED
@@ -1,38 +1,46 @@
-from typing import Dict, List, Any
-from transformers import AutoProcessor, MusicgenForConditionalGeneration
 import torch
+import logging
+from transformers import AutoProcessor, MusicgenForConditionalGeneration
+from typing import Dict, Any

 class EndpointHandler:
     def __init__(self, path=""):
-        # load model and processor from path
-        self.processor = AutoProcessor.from_pretrained(path)
-        self.model = MusicgenForConditionalGeneration.from_pretrained(path, torch_dtype=torch.float16).to("cuda")
+        logging.basicConfig(level=logging.INFO)
+        try:
+            # load model and processor from path
+            self.processor = AutoProcessor.from_pretrained(path)
+            self.model = MusicgenForConditionalGeneration.from_pretrained(path, torch_dtype=torch.float16).to("cuda")
+        except Exception as e:
+            logging.error(f"Error loading model or processor: {e}")
+            raise

     def __call__(self, data: Dict[str, Any]) -> Dict[str, str]:
-        """
-        Args:
-            data (:dict:):
-                The payload with the text prompt and generation parameters.
-        """
-        # process input
-        inputs = data.pop("inputs", data)
-        parameters = data.pop("parameters", None)
+        try:
+            # validate and process input
+            inputs = data.get("inputs")
+            if not inputs:
+                raise ValueError("No inputs provided")
+
+            parameters = data.get("parameters", {})

-        # preprocess
-        inputs = self.processor(
-            text=[inputs],
-            padding=True,
-            return_tensors="pt",).to("cuda")
+            # preprocess
+            processed_inputs = self.processor(
+                text=[inputs],
+                padding=True,
+                return_tensors="pt"
+            ).to("cuda")

-        # pass inputs with all kwargs in data
-        if parameters is not None:
-            with torch.autocast("cuda"):
-                outputs = self.model.generate(**inputs, **parameters)
-        else:
+            # generate outputs
             with torch.autocast("cuda"):
-                outputs = self.model.generate(**inputs,)
+                outputs = self.model.generate(**processed_inputs, **parameters)

-        # postprocess the prediction
-        prediction = outputs[0].cpu().numpy().tolist()
+            # postprocess the prediction
+            prediction = outputs[0].cpu().numpy().tolist()
+            return [{"generated_audio": prediction}]
+        except Exception as e:
+            logging.error(f"Error during model inference: {e}")
+            return {"error": str(e)}

-        return [{"generated_audio": prediction}]
+# Example usage:
+# handler = EndpointHandler(path="your_model_path")
+# result = handler({"inputs": "your input text"})
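
For reference, a minimal client-side sketch of how the updated handler might be exercised and its output saved to disk. It is not part of the commit: the model path, prompt, generation parameters, and the 32 kHz sampling rate (MusicGen's default audio-encoder rate, which the handler does not return) are assumptions, and a CUDA device is required since the handler loads the model on GPU.

import numpy as np
import scipy.io.wavfile
from handler import EndpointHandler

# Hypothetical model path and prompt; substitute your own.
handler = EndpointHandler(path="facebook/musicgen-small")
result = handler({"inputs": "lo-fi beat with mellow piano",
                  "parameters": {"max_new_tokens": 256}})

# The handler returns a dict with an "error" key on failure.
if isinstance(result, dict) and "error" in result:
    raise RuntimeError(result["error"])

# "generated_audio" is a nested list of shape (num_channels, num_samples).
audio = np.array(result[0]["generated_audio"], dtype=np.float32)

# Assumed sampling rate: MusicGen's audio encoder defaults to 32 kHz.
scipy.io.wavfile.write("musicgen_out.wav", rate=32000, data=audio[0])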