Update README.md
README.md CHANGED
@@ -4,6 +4,9 @@ base_model: shpotes/codegen-350M-mono
 datasets:
 - flytech/python-codes-25k
 pipeline_tag: text-generation
+tags:
+- code
+- text-generation-inference
 ---
 
 # Model Card for Model ID
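For reference, the metadata block this hunk produces would read roughly as below. This is a sketch: the opening `---` and any fields above `base_model` sit outside the diff and are assumed here.

```yaml
---
base_model: shpotes/codegen-350M-mono
datasets:
- flytech/python-codes-25k
pipeline_tag: text-generation
tags:
- code
- text-generation-inference
---
```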
@@ -72,34 +75,34 @@ Users (both direct and downstream) should be made aware of the risks, biases and
 
 ## How to Get Started with the Model
 
-import torch
-from transformers import AutoModelForCausalLM, AutoTokenizer
-
-tokenizer = AutoTokenizer.from_pretrained("shpotes/codegen-350M-mono")
-model = AutoModelForCausalLM.from_pretrained("shpotes/codegen-350M-mono", trust_remote_code=True)
-
-input_ids = tokenizer(
-
-
-
-
-
-).input_ids
-
-input_ids_len = input_ids.shape[1]
-
-with torch.no_grad():
-
-
-
-
-
-
-
-
-
-
-
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+tokenizer = AutoTokenizer.from_pretrained("shpotes/codegen-350M-mono")
+model = AutoModelForCausalLM.from_pretrained("shpotes/codegen-350M-mono", trust_remote_code=True)
+
+input_ids = tokenizer(
+    context,
+    truncation=True,
+    padding=True,
+    return_tensors='pt',
+    pad_token_id=pad_token_id,
+).input_ids
+
+input_ids_len = input_ids.shape[1]
+
+with torch.no_grad():
+    input_ids = input_ids
+    tokens = model.generate(
+        input_ids,
+        do_sample=True,
+        num_return_sequences=num_return_sequences,
+        temperature=temp,
+        max_length=input_ids_len + max_length_sample,
+        top_p=top_p,
+        use_cache=True,
+    )
+    text = tokenizer.batch_decode(tokens[:, input_ids_len:, ...])
 
 
 [More Information Needed]
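Note that the snippet this commit adds is not self-contained: `context`, `pad_token_id`, `num_return_sequences`, `temp`, `max_length_sample`, and `top_p` are never defined, `pad_token_id` is passed to the tokenizer call (it is a `generate()` argument, not a tokenizer one), and `input_ids = input_ids` is a no-op. A minimal runnable version might look like the sketch below; the prompt and sampling values are placeholder assumptions, not values from the commit.

```python
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("shpotes/codegen-350M-mono")
model = AutoModelForCausalLM.from_pretrained("shpotes/codegen-350M-mono", trust_remote_code=True)

# Placeholder values for the names the commit leaves undefined (assumptions).
context = "def fibonacci(n):"  # prompt to complete
num_return_sequences = 1
temp = 0.2
top_p = 0.95
max_length_sample = 128

# The CodeGen tokenizer has no pad token by default; reuse EOS so padding works.
if tokenizer.pad_token is None:
    tokenizer.pad_token = tokenizer.eos_token

input_ids = tokenizer(
    context,
    truncation=True,
    padding=True,
    return_tensors="pt",
).input_ids

input_ids_len = input_ids.shape[1]

with torch.no_grad():
    tokens = model.generate(
        input_ids,
        do_sample=True,
        num_return_sequences=num_return_sequences,
        temperature=temp,
        max_length=input_ids_len + max_length_sample,
        top_p=top_p,
        use_cache=True,
        pad_token_id=tokenizer.pad_token_id,  # belongs here, not in the tokenizer call
    )
    # Slice off the prompt tokens so only the generated completion is decoded.
    text = tokenizer.batch_decode(tokens[:, input_ids_len:], skip_special_tokens=True)

print(text[0])
```

Slicing `tokens[:, input_ids_len:]` before decoding returns only the model's completion rather than echoing the prompt back.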