init
- ckpt/MrcGlobalPointerModel.best.pth +3 -0
- task_params.yaml +50 -0
ckpt/MrcGlobalPointerModel.best.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c9b75816657a9b40ee8c2a6a1073f320e30f068998a05a5c9a267c42bead1e3f
+size 414414660
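The checkpoint is stored as a Git LFS pointer rather than raw bytes: the three lines above record the LFS spec version, the sha256 oid of the real object, and its size (414414660 bytes, roughly 395 MB). As a minimal sketch, one way to check that a fetched checkpoint matches this pointer is to recompute both values; the local path below assumes `git lfs pull` has materialized the file in place:

```python
import hashlib

# Values copied from the LFS pointer above.
EXPECTED_OID = "c9b75816657a9b40ee8c2a6a1073f320e30f068998a05a5c9a267c42bead1e3f"
EXPECTED_SIZE = 414414660

def verify_lfs_object(path: str) -> bool:
    """Compare a downloaded file against the pointer's sha256 oid and size."""
    h = hashlib.sha256()
    size = 0
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):  # 1 MiB chunks
            h.update(chunk)
            size += len(chunk)
    return h.hexdigest() == EXPECTED_OID and size == EXPECTED_SIZE

# Path taken from this commit; adjust if the file lives elsewhere locally.
print(verify_lfs_object("ckpt/MrcGlobalPointerModel.best.pth"))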
task_params.yaml
ADDED
@@ -0,0 +1,50 @@
+_config_info:
+  create_time: '2023-03-14 23:35:21'
+  use_default_base_config: true
+config_filepath:
+- /data/tzhu/MRC4IE/conf/mrc.yaml
+task_type: MrcQaTask
+task_name: RobertaBase_data20230314v2
+comment: GlobalPointer with RoPE
+output_dir: outputs
+task_dir: outputs/RobertaBase_data20230314v2
+dump_cache_dir: outputs/RobertaBase_data20230314v2/cache
+regenerate_cache: true
+data_dir: resources/Merged/20230314-v2
+train_filepath: resources/Merged/20230314-v2/train.jsonl
+dev_filepath: resources/Merged/20230314-v2/dev.jsonl
+test_filepath: resources/Merged/20230314-v2/test.jsonl
+random_seed: 1227
+num_epochs: 20
+num_steps: -1
+warmup_proportion: 0.1
+epoch_patience: 10
+step_patience: 5000
+batch_size: 64
+learning_rate: 2.0e-05
+max_grad_norm: -1.0
+skip_train: false
+debug_mode: false
+grad_accum_steps: 1
+resumed_training_path: null
+step_eval_interval: 20000
+epoch_eval_interval: 1
+eval_on_data:
+- dev
+select_best_on_data: dev
+select_best_by_key: metric
+best_metric_field: micro.f1
+save_every_ckpt: false
+save_best_ckpt: true
+final_eval_on_test: true
+main_process_logging: true
+max_seq_len: 512
+plm_dir: hfl/chinese-roberta-wwm-ext
+train_batch_size: 16
+eval_batch_size: 32
+other_learning_rate: 2.0e-05
+dropout: 0.3
+biaffine_size: 512
+include_package:
+- src.task
+use_default_base_config: true
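The config is plain YAML, so it can be inspected without any project code. A minimal sketch, assuming PyYAML is installed and the file sits at the repo root:

```python
import yaml

# Load the training config committed above.
with open("task_params.yaml", "r", encoding="utf-8") as f:
    params = yaml.safe_load(f)

# A few fields that pin down the run: backbone, sequence length, batch sizes.
print(params["plm_dir"])            # hfl/chinese-roberta-wwm-ext
print(params["max_seq_len"])        # 512
print(params["train_batch_size"])   # 16
print(params["best_metric_field"])  # micro.f1
```

Note that the file carries both a top-level `batch_size: 64` and separate `train_batch_size: 16` / `eval_batch_size: 32`; which of these the trainer actually consumes presumably depends on the task code registered via `include_package` (`src.task`).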