Spaces:

ml-energy
/

leaderboard

Running

App Files Community

Zhiyu Wu committed on Jul 6, 2023

Commit

4fc7206

1 Parent(s): f5248c1

t5 use hf-seq2seq

Browse files

Files changed (1) hide show

pegasus/nlp-eval.yaml +5 -3

pegasus/nlp-eval.yaml CHANGED Viewed

@@ -12,7 +12,6 @@
     - databricks/dolly-v2-12b
     - FreedomIntelligence/phoenix-inst-chat-7b
     - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
-    - lmsys/fastchat-t5-3b-v1.0
     - Neutralzz/BiLLa-7B-SFT
     - nomic-ai/gpt4all-13b-snoozy
     - openaccess-ai-collective/manticore-13b-chat-pyg
@@ -35,7 +34,6 @@
     - databricks/dolly-v2-12b
     - FreedomIntelligence/phoenix-inst-chat-7b
     - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
-    - lmsys/fastchat-t5-3b-v1.0
     - Neutralzz/BiLLa-7B-SFT
     - nomic-ai/gpt4all-13b-snoozy
     - openaccess-ai-collective/manticore-13b-chat-pyg
@@ -58,7 +56,6 @@
     - databricks/dolly-v2-12b
     - FreedomIntelligence/phoenix-inst-chat-7b
     - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
-    - lmsys/fastchat-t5-3b-v1.0
     - Neutralzz/BiLLa-7B-SFT
     - nomic-ai/gpt4all-13b-snoozy
     - openaccess-ai-collective/manticore-13b-chat-pyg
@@ -66,3 +63,8 @@
     - project-baize/baize-v2-7B
     - StabilityAI/stablelm-tuned-alpha-7b
     - togethercomputer/RedPajama-INCITE-7B-Chat

     - databricks/dolly-v2-12b
     - FreedomIntelligence/phoenix-inst-chat-7b
     - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
     - Neutralzz/BiLLa-7B-SFT
     - nomic-ai/gpt4all-13b-snoozy
     - openaccess-ai-collective/manticore-13b-chat-pyg
     - databricks/dolly-v2-12b
     - FreedomIntelligence/phoenix-inst-chat-7b
     - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
     - Neutralzz/BiLLa-7B-SFT
     - nomic-ai/gpt4all-13b-snoozy
     - openaccess-ai-collective/manticore-13b-chat-pyg
     - databricks/dolly-v2-12b
     - FreedomIntelligence/phoenix-inst-chat-7b
     - h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2
     - Neutralzz/BiLLa-7B-SFT
     - nomic-ai/gpt4all-13b-snoozy
     - openaccess-ai-collective/manticore-13b-chat-pyg
     - project-baize/baize-v2-7B
     - StabilityAI/stablelm-tuned-alpha-7b
     - togethercomputer/RedPajama-INCITE-7B-Chat
+- command:
+    - docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks arc_challenge --num_fewshot 25
+    - docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks hellaswag --num_fewshot 10
+    - docker exec leaderboard{{ gpu }} python lm-evaluation-harness/main.py --device cuda --no_cache --model hf-seq2seq --model_args pretrained=lmsys/fastchat-t5-3b-v1.0,trust_remote_code=True,use_accelerate=True --tasks truthfulqa_mc --num_fewshot 0