Zhiyu Wu committed on
Commit
4fc7206
1 Parent(s): f5248c1

t5 use hf-seq2seq

Browse files
Files changed (1) hide show
  1. pegasus/nlp-eval.yaml +5 -3
pegasus/nlp-eval.yaml CHANGED
@@ -12,7 +12,6 @@
12
  - databricks/dolly-v2-12b
13
  - FreedomIntelligence/phoenix-inst-chat-7b
14
  - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
15
- - lmsys/fastchat-t5-3b-v1.0
16
  - Neutralzz/BiLLa-7B-SFT
17
  - nomic-ai/gpt4all-13b-snoozy
18
  - openaccess-ai-collective/manticore-13b-chat-pyg
@@ -35,7 +34,6 @@
35
  - databricks/dolly-v2-12b
36
  - FreedomIntelligence/phoenix-inst-chat-7b
37
  - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
38
- - lmsys/fastchat-t5-3b-v1.0
39
  - Neutralzz/BiLLa-7B-SFT
40
  - nomic-ai/gpt4all-13b-snoozy
41
  - openaccess-ai-collective/manticore-13b-chat-pyg
@@ -58,7 +56,6 @@
58
  - databricks/dolly-v2-12b
59
  - FreedomIntelligence/phoenix-inst-chat-7b
60
  - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
61
- - lmsys/fastchat-t5-3b-v1.0
62
  - Neutralzz/BiLLa-7B-SFT
63
  - nomic-ai/gpt4all-13b-snoozy
64
  - openaccess-ai-collective/manticore-13b-chat-pyg
@@ -66,3 +63,8 @@
66
  - project-baize/baize-v2-7B
67
  - StabilityAI/stablelm-tuned-alpha-7b
68
  - togethercomputer/RedPajama-INCITE-7B-Chat
 
 
 
 
 
 
12
  - databricks/dolly-v2-12b
13
  - FreedomIntelligence/phoenix-inst-chat-7b
14
  - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
 
15
  - Neutralzz/BiLLa-7B-SFT
16
  - nomic-ai/gpt4all-13b-snoozy
17
  - openaccess-ai-collective/manticore-13b-chat-pyg
 
34
  - databricks/dolly-v2-12b
35
  - FreedomIntelligence/phoenix-inst-chat-7b
36
  - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
 
37
  - Neutralzz/BiLLa-7B-SFT
38
  - nomic-ai/gpt4all-13b-snoozy
39
  - openaccess-ai-collective/manticore-13b-chat-pyg
 
56
  - databricks/dolly-v2-12b
57
  - FreedomIntelligence/phoenix-inst-chat-7b
58
  - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
 
59
  - Neutralzz/BiLLa-7B-SFT
60
  - nomic-ai/gpt4all-13b-snoozy
61
  - openaccess-ai-collective/manticore-13b-chat-pyg
 
63
  - project-baize/baize-v2-7B
64
  - StabilityAI/stablelm-tuned-alpha-7b
65
  - togethercomputer/RedPajama-INCITE-7B-Chat
66
+
67
+ - command:
68
+ - docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks arc_challenge --num_fewshot 25
69
+ - docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks hellaswag --num_fewshot 10
70
+ - docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks truthfulqa_mc --num_fewshot 0