Spaces:
Running
Running
Zhiyu Wu
committed on
Commit
·
4fc7206
1
Parent(s):
f5248c1
t5 use hf-seq2seq
Browse files
- pegasus/nlp-eval.yaml +5 -3
pegasus/nlp-eval.yaml
CHANGED
@@ -12,7 +12,6 @@
|
|
12 |
- databricks/dolly-v2-12b
|
13 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
14 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
15 |
-
- lmsys/fastchat-t5-3b-v1.0
|
16 |
- Neutralzz/BiLLa-7B-SFT
|
17 |
- nomic-ai/gpt4all-13b-snoozy
|
18 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
@@ -35,7 +34,6 @@
|
|
35 |
- databricks/dolly-v2-12b
|
36 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
37 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
38 |
-
- lmsys/fastchat-t5-3b-v1.0
|
39 |
- Neutralzz/BiLLa-7B-SFT
|
40 |
- nomic-ai/gpt4all-13b-snoozy
|
41 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
@@ -58,7 +56,6 @@
|
|
58 |
- databricks/dolly-v2-12b
|
59 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
60 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
61 |
-
- lmsys/fastchat-t5-3b-v1.0
|
62 |
- Neutralzz/BiLLa-7B-SFT
|
63 |
- nomic-ai/gpt4all-13b-snoozy
|
64 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
@@ -66,3 +63,8 @@
|
|
66 |
- project-baize/baize-v2-7B
|
67 |
- StabilityAI/stablelm-tuned-alpha-7b
|
68 |
- togethercomputer/RedPajama-INCITE-7B-Chat
|
|
|
|
|
|
|
|
|
|
|
|
12 |
- databricks/dolly-v2-12b
|
13 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
14 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
|
|
15 |
- Neutralzz/BiLLa-7B-SFT
|
16 |
- nomic-ai/gpt4all-13b-snoozy
|
17 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
|
34 |
- databricks/dolly-v2-12b
|
35 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
36 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
|
|
37 |
- Neutralzz/BiLLa-7B-SFT
|
38 |
- nomic-ai/gpt4all-13b-snoozy
|
39 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
|
56 |
- databricks/dolly-v2-12b
|
57 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
58 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
|
|
59 |
- Neutralzz/BiLLa-7B-SFT
|
60 |
- nomic-ai/gpt4all-13b-snoozy
|
61 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
|
63 |
- project-baize/baize-v2-7B
|
64 |
- StabilityAI/stablelm-tuned-alpha-7b
|
65 |
- togethercomputer/RedPajama-INCITE-7B-Chat
|
66 |
+
|
67 |
+
- command:
|
68 |
+
- docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks arc_challenge --num_fewshot 25
|
69 |
+
- docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks hellaswag --num_fewshot 10
|
70 |
+
- docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks truthfulqa_mc --num_fewshot 0
|