Update generation_test_hf_script.py
generation_test_hf_script.py
@@ -13,7 +13,7 @@ def load_rag_benchmark_tester_ds():
 
     dataset = load_dataset(ds_name)
 
-    print("update: loading test dataset - ", dataset)
+    print("update: loading RAG Benchmark test dataset - ", dataset)
 
     test_set = []
     for i, samples in enumerate(dataset["train"]):
@@ -29,7 +29,9 @@ def run_test(model_name, test_ds):
 
     device = "cuda" if torch.cuda.is_available() else "cpu"
 
-    print("
+    print("\nRAG Performance Test - 200 questions")
+    print("update: model - ", model_name)
+    print("update: device - ", device)
 
     model = AutoModelForCausalLM.from_pretrained(model_name, trust_remote_code=True)
     model.to(device)
@@ -39,6 +41,7 @@ def run_test(model_name, test_ds):
     for i, entries in enumerate(test_ds):
 
         # prepare prompt packaging used in fine-tuning process
+        # note: in our testing, Yi model performed better with trailing "\n" at end of prompt
         new_prompt = "<human>: " + entries["context"] + "\n" + entries["query"] + "\n" + "<bot>:" + "\n"
 
         inputs = tokenizer(new_prompt, return_tensors="pt")
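For reference, the pieces touched by this commit fit together roughly as sketched below. This is a hedged reconstruction, not the repo's verbatim script: the dataset name passed as ds_name, the AutoTokenizer loading step, and the generate() parameters are assumptions filled in so the sketch is self-contained and runnable; only the lines shown in the diff above are confirmed.

# Hedged sketch of the full test flow around the changed lines.
# Assumptions (not confirmed by the diff): the default ds_name value,
# the AutoTokenizer loading step, and the generation parameters.

import torch
from datasets import load_dataset
from transformers import AutoModelForCausalLM, AutoTokenizer

def load_rag_benchmark_tester_ds(ds_name="llmware/rag_instruct_benchmark_tester"):
    # ds_name default above is an assumed placeholder for the benchmark dataset
    dataset = load_dataset(ds_name)
    print("update: loading RAG Benchmark test dataset - ", dataset)

    test_set = []
    for i, samples in enumerate(dataset["train"]):
        test_set.append(samples)
    return test_set

def run_test(model_name, test_ds):
    device = "cuda" if torch.cuda.is_available() else "cpu"
    print("\nRAG Performance Test - 200 questions")
    print("update: model - ", model_name)
    print("update: device - ", device)

    model = AutoModelForCausalLM.from_pretrained(model_name, trust_remote_code=True)
    model.to(device)
    tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)  # assumed step

    for i, entries in enumerate(test_ds):
        # prompt packaging used in fine-tuning; per the diff's note, the
        # trailing "\n" helped the Yi model
        new_prompt = "<human>: " + entries["context"] + "\n" + entries["query"] + "\n" + "<bot>:" + "\n"
        inputs = tokenizer(new_prompt, return_tensors="pt").to(device)

        with torch.no_grad():
            # max_new_tokens is an illustrative choice, not from the diff
            outputs = model.generate(**inputs, max_new_tokens=100)

        # decode only the tokens generated after the prompt
        answer = tokenizer.decode(outputs[0][inputs["input_ids"].shape[1]:], skip_special_tokens=True)
        print("update: answer - ", i, answer)

A call such as run_test("01-ai/Yi-6B", load_rag_benchmark_tester_ds()) would exercise the flow end to end; the model name here is only an example consistent with the Yi note in the diff.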