chiliu committed on
Commit
faed5af
1 Parent(s): e54792e
Files changed (2)
  1. README.md +1 -1
  2. mamba_gpt_pipeline.py +42 -0
README.md CHANGED
@@ -83,7 +83,7 @@ Alternatively, you can download the mamba_gpt_pipeline.py, store it alongside yo
 
 ```python
 import torch
-from mamba_gpt_pipeline.py import MambaGPTTextGenerationPipeline
+from mamba_gpt_pipeline import MambaGPTTextGenerationPipeline
 from transformers import AutoModelForCausalLM, AutoTokenizer
 
 tokenizer = AutoTokenizer.from_pretrained(
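
For reference, a minimal sketch of how the corrected import is meant to be used; the model id below is a placeholder, since the actual `from_pretrained` argument is truncated in the hunk above:

```python
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

from mamba_gpt_pipeline import MambaGPTTextGenerationPipeline

# Placeholder repo id; the real one is truncated in the README hunk above.
model_id = "your-org/your-mamba-gpt-model"

tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id)

# Construct the custom pipeline directly with the loaded model and tokenizer.
pipe = MambaGPTTextGenerationPipeline(model=model, tokenizer=tokenizer)
result = pipe("Why is drinking water so healthy?", max_new_tokens=128)
print(result[0]["generated_text"])
```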
mamba_gpt_pipeline.py ADDED
@@ -0,0 +1,42 @@
+from transformers import TextGenerationPipeline
+from transformers.pipelines.text_generation import ReturnType
+
+STYLE = "<|prompt|>{instruction}</s><|answer|>"
+
+
+class MambaGPTTextGenerationPipeline(TextGenerationPipeline):
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        self.prompt = STYLE
+
+    def preprocess(
+        self, prompt_text, prefix="", handle_long_generation=None, **generate_kwargs
+    ):
+        prompt_text = self.prompt.format(instruction=prompt_text)
+        return super().preprocess(
+            prompt_text,
+            prefix=prefix,
+            handle_long_generation=handle_long_generation,
+            **generate_kwargs,
+        )
+
+    def postprocess(
+        self,
+        model_outputs,
+        return_type=ReturnType.FULL_TEXT,
+        clean_up_tokenization_spaces=True,
+    ):
+        records = super().postprocess(
+            model_outputs,
+            return_type=return_type,
+            clean_up_tokenization_spaces=clean_up_tokenization_spaces,
+        )
+        for rec in records:
+            rec["generated_text"] = (
+                rec["generated_text"]
+                .split("<|answer|>")[1]
+                .strip()
+                .split("<|prompt|>")[0]
+                .strip()
+            )
+        return records
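
Both overrides are pure string handling around the base `TextGenerationPipeline`: `preprocess` wraps the user instruction in the `STYLE` template before tokenization, and `postprocess` keeps only the text between the `<|answer|>` marker and any following `<|prompt|>`. A minimal, model-free sketch of that string logic (the generated answer here is invented for illustration):

```python
STYLE = "<|prompt|>{instruction}</s><|answer|>"

# preprocess: wrap the raw instruction in the prompt template
full_prompt = STYLE.format(instruction="What does this pipeline do?")
# -> "<|prompt|>What does this pipeline do?</s><|answer|>"

# postprocess: keep only what falls between <|answer|> and any later <|prompt|>
generated = full_prompt + " It wraps prompts and trims answers. <|prompt|>next turn"
answer = generated.split("<|answer|>")[1].strip().split("<|prompt|>")[0].strip()
print(answer)  # It wraps prompts and trims answers.
```

Note that the `split("<|answer|>")[1]` indexing is safe only because the default `return_type` is `ReturnType.FULL_TEXT`, so the wrapped prompt (which contains `<|answer|>`) is always part of `generated_text`; with `ReturnType.NEW_TEXT` the marker could be absent and the split would raise an `IndexError`.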