Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
pminervini
committed on
Commit
•
1591f9d
1
Parent(s):
ecd0860
update
Browse files
- plots/clustermap_all.pdf +0 -0
- plots/clustermap_all.png +2 -2
- plots/clustermap_det.pdf +0 -0
- plots/clustermap_det.png +2 -2
- plots/clustermap_instr.pdf +0 -0
- plots/clustermap_instr.png +2 -2
- plots/clustermap_qa.pdf +0 -0
- plots/clustermap_qa.png +2 -2
- plots/clustermap_summ.pdf +0 -0
- plots/clustermap_summ.png +2 -2
- src/backend/envs.py +1 -0
- src/backend/tasks/memo-trap/memo-trap_v2.yaml +20 -0
plots/clustermap_all.pdf
CHANGED
Binary files a/plots/clustermap_all.pdf and b/plots/clustermap_all.pdf differ
|
|
plots/clustermap_all.png
CHANGED
Git LFS Details
|
Git LFS Details
|
plots/clustermap_det.pdf
CHANGED
Binary files a/plots/clustermap_det.pdf and b/plots/clustermap_det.pdf differ
|
|
plots/clustermap_det.png
CHANGED
Git LFS Details
|
Git LFS Details
|
plots/clustermap_instr.pdf
CHANGED
Binary files a/plots/clustermap_instr.pdf and b/plots/clustermap_instr.pdf differ
|
|
plots/clustermap_instr.png
CHANGED
Git LFS Details
|
Git LFS Details
|
plots/clustermap_qa.pdf
CHANGED
Binary files a/plots/clustermap_qa.pdf and b/plots/clustermap_qa.pdf differ
|
|
plots/clustermap_qa.png
CHANGED
Git LFS Details
|
Git LFS Details
|
plots/clustermap_summ.pdf
CHANGED
Binary files a/plots/clustermap_summ.pdf and b/plots/clustermap_summ.pdf differ
|
|
plots/clustermap_summ.png
CHANGED
Git LFS Details
|
Git LFS Details
|
src/backend/envs.py
CHANGED
@@ -33,6 +33,7 @@ class Tasks(Enum):
|
|
33 |
task9 = Task("cnndm", "rougeL", "CNN/DM", 2)
|
34 |
|
35 |
task10 = Task("memo-trap", "acc", "memo-trap", 0)
|
|
|
36 |
|
37 |
task11 = Task("nq8", "em", "NQ Open 8", 8)
|
38 |
task12 = Task("tqa8", "em", "TriviaQA 8", 8)
|
|
|
33 |
task9 = Task("cnndm", "rougeL", "CNN/DM", 2)
|
34 |
|
35 |
task10 = Task("memo-trap", "acc", "memo-trap", 0)
|
36 |
+
task10_2 = Task("memo-trap_v2", "acc", "memo-trap", 0)
|
37 |
|
38 |
task11 = Task("nq8", "em", "NQ Open 8", 8)
|
39 |
task12 = Task("tqa8", "em", "TriviaQA 8", 8)
|
src/backend/tasks/memo-trap/memo-trap_v2.yaml
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
task: memo-trap_v2
|
2 |
+
dataset_path: pminervini/inverse-scaling
|
3 |
+
dataset_name: memo-trap
|
4 |
+
output_type: multiple_choice
|
5 |
+
training_split: null
|
6 |
+
validation_split: data
|
7 |
+
test_split: null
|
8 |
+
num_fewshot: 0
|
9 |
+
doc_to_text: "{{prompt}}"
|
10 |
+
doc_to_target: answer_index
|
11 |
+
doc_to_choice: "{{classes}}"
|
12 |
+
target_delimiter: ""
|
13 |
+
should_decontaminate: False
|
14 |
+
doc_to_decontamination_query: prompt
|
15 |
+
metric_list:
|
16 |
+
- metric: acc
|
17 |
+
aggregation: mean
|
18 |
+
higher_is_better: true
|
19 |
+
metadata:
|
20 |
+
- version: 0.0
|