robowaifudev committed
Commit 5ee52db
1 Parent(s): c0fd3c3

Update README.md

Files changed (1)
  1. README.md +25 -5
README.md CHANGED
@@ -1,3 +1,19 @@
+---
+language:
+- en
+tags:
+- gpt2
+license: apache-2.0
+datasets:
+- wikitext
+- openwebtext
+- cc-stories
+metrics:
+- type: wikitext
+  value: 19.31
+  name: WikiText-103
+---
+
 <!---
 # ##############################################################################################
 #
@@ -48,29 +64,33 @@ model = GPT2LMHeadModel.from_pretrained("robowaifudev/megatron-gpt2-345m")
 
 if torch.cuda.is_available():
     device = torch.device("cuda")
-    model.to(device)
     model.half()
 else:
     device = torch.device("cpu")
+model.to(device)
 model.eval()
 
 # Generate
-text = "Hello world!"
-input_ids = tokenizer.encode(text, return_tensors="pt")
+prompt = "It was a bright cold day in April, and the clocks were striking thirteen. Winston Smith,"
+input_ids = tokenizer.encode(prompt, return_tensors="pt").to(device)
 output = model.generate(
     input_ids=input_ids,
-    max_length=len(input_ids) + 32,
+    max_length=len(input_ids) + 128,
     do_sample=True,
     top_k=64,
     top_p=0.9,
     temperature=0.8,
-    num_return_sequences=1
+    num_return_sequences=2,
+    repetition_penalty=1.025
 )
 
 # Output the text.
+print("Prompt:", prompt)
+print("*" * 3)
 for i, sentence in enumerate(output):
     text = tokenizer.decode(sentence, clean_up_tokenization_spaces=True)
     print(f"{i}:", text)
+print("*" * 3)
 ```
 
 # Original code
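
For reference, the usage snippet after this commit can be assembled from the hunks above. Below is a minimal, self-contained sketch; the import and tokenizer-loading lines fall outside the diff context, so loading `GPT2Tokenizer` from the same repository is an assumption, and `input_ids.shape[1]` is used in place of `len(input_ids)` so that `max_length` counts prompt tokens rather than the batch dimension.

```python
import torch
from transformers import GPT2Tokenizer, GPT2LMHeadModel

# Assumption: the tokenizer files live in the same repo as the weights.
tokenizer = GPT2Tokenizer.from_pretrained("robowaifudev/megatron-gpt2-345m")
model = GPT2LMHeadModel.from_pretrained("robowaifudev/megatron-gpt2-345m")

if torch.cuda.is_available():
    device = torch.device("cuda")
    model.half()  # fp16 only when running on GPU
else:
    device = torch.device("cpu")
model.to(device)
model.eval()

# Sample two continuations of the prompt, as in the updated README.
prompt = "It was a bright cold day in April, and the clocks were striking thirteen. Winston Smith,"
input_ids = tokenizer.encode(prompt, return_tensors="pt").to(device)
output = model.generate(
    input_ids=input_ids,
    max_length=input_ids.shape[1] + 128,  # prompt length + 128 new tokens
    do_sample=True,
    top_k=64,
    top_p=0.9,
    temperature=0.8,
    num_return_sequences=2,
    repetition_penalty=1.025,
)

# Print the prompt and each generated continuation.
print("Prompt:", prompt)
print("*" * 3)
for i, sentence in enumerate(output):
    text = tokenizer.decode(sentence, clean_up_tokenization_spaces=True)
    print(f"{i}:", text)
    print("*" * 3)
```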