Spaces:
Running
Running
Zhiyu Wu
committed on
Commit
·
4fc7206
1
Parent(s):
f5248c1
t5 use hf-seq2seq
Browse files
- pegasus/nlp-eval.yaml +5 -3
pegasus/nlp-eval.yaml
CHANGED
|
@@ -12,7 +12,6 @@
|
|
| 12 |
- databricks/dolly-v2-12b
|
| 13 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
| 14 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
| 15 |
-
- lmsys/fastchat-t5-3b-v1.0
|
| 16 |
- Neutralzz/BiLLa-7B-SFT
|
| 17 |
- nomic-ai/gpt4all-13b-snoozy
|
| 18 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
@@ -35,7 +34,6 @@
|
|
| 35 |
- databricks/dolly-v2-12b
|
| 36 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
| 37 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
| 38 |
-
- lmsys/fastchat-t5-3b-v1.0
|
| 39 |
- Neutralzz/BiLLa-7B-SFT
|
| 40 |
- nomic-ai/gpt4all-13b-snoozy
|
| 41 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
@@ -58,7 +56,6 @@
|
|
| 58 |
- databricks/dolly-v2-12b
|
| 59 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
| 60 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
| 61 |
-
- lmsys/fastchat-t5-3b-v1.0
|
| 62 |
- Neutralzz/BiLLa-7B-SFT
|
| 63 |
- nomic-ai/gpt4all-13b-snoozy
|
| 64 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
@@ -66,3 +63,8 @@
|
|
| 66 |
- project-baize/baize-v2-7B
|
| 67 |
- StabilityAI/stablelm-tuned-alpha-7b
|
| 68 |
- togethercomputer/RedPajama-INCITE-7B-Chat
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12 |
- databricks/dolly-v2-12b
|
| 13 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
| 14 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
|
|
|
| 15 |
- Neutralzz/BiLLa-7B-SFT
|
| 16 |
- nomic-ai/gpt4all-13b-snoozy
|
| 17 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
|
|
| 34 |
- databricks/dolly-v2-12b
|
| 35 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
| 36 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
|
|
|
| 37 |
- Neutralzz/BiLLa-7B-SFT
|
| 38 |
- nomic-ai/gpt4all-13b-snoozy
|
| 39 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
|
|
| 56 |
- databricks/dolly-v2-12b
|
| 57 |
- FreedomIntelligence/phoenix-inst-chat-7b
|
| 58 |
- h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
|
|
|
|
| 59 |
- Neutralzz/BiLLa-7B-SFT
|
| 60 |
- nomic-ai/gpt4all-13b-snoozy
|
| 61 |
- openaccess-ai-collective/manticore-13b-chat-pyg
|
|
|
|
| 63 |
- project-baize/baize-v2-7B
|
| 64 |
- StabilityAI/stablelm-tuned-alpha-7b
|
| 65 |
- togethercomputer/RedPajama-INCITE-7B-Chat
|
| 66 |
+
|
| 67 |
+
- command:
|
| 68 |
+
- docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks arc_challenge --num_fewshot 25
|
| 69 |
+
- docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks hellaswag --num_fewshot 10
|
| 70 |
+
- docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks truthfulqa_mc --num_fewshot 0
|