Spico committed on
Commit 5968071 · 1 Parent(s): b3e11d2
ckpt/MrcGlobalPointerModel.best.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:c9b75816657a9b40ee8c2a6a1073f320e30f068998a05a5c9a267c42bead1e3f
+ size 414414660
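
The .pth checkpoint is tracked with Git LFS, so this commit only adds a pointer file carrying the object's sha256 oid and byte size. As a minimal, hypothetical sketch (Python, not part of this repository), a downloaded copy of the checkpoint could be checked against those pointer values; the local path and function name below are illustrative:

```python
import hashlib
from pathlib import Path

# Values taken from the LFS pointer file above.
EXPECTED_OID = "c9b75816657a9b40ee8c2a6a1073f320e30f068998a05a5c9a267c42bead1e3f"
EXPECTED_SIZE = 414414660  # bytes

def matches_lfs_pointer(path: str) -> bool:
    """Return True if the file's size and sha256 match the LFS pointer."""
    p = Path(path)
    if p.stat().st_size != EXPECTED_SIZE:
        return False
    digest = hashlib.sha256()
    with p.open("rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):  # read in 1 MiB chunks
            digest.update(chunk)
    return digest.hexdigest() == EXPECTED_OID

# Example (hypothetical local path):
# print(matches_lfs_pointer("ckpt/MrcGlobalPointerModel.best.pth"))
```
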
task_params.yaml ADDED
@@ -0,0 +1,50 @@
+ _config_info:
+ create_time: '2023-03-14 23:35:21'
+ use_default_base_config: true
+ config_filepath:
+ - /data/tzhu/MRC4IE/conf/mrc.yaml
+ task_type: MrcQaTask
+ task_name: RobertaBase_data20230314v2
+ comment: GlobalPointer with RoPE
+ output_dir: outputs
+ task_dir: outputs/RobertaBase_data20230314v2
+ dump_cache_dir: outputs/RobertaBase_data20230314v2/cache
+ regenerate_cache: true
+ data_dir: resources/Merged/20230314-v2
+ train_filepath: resources/Merged/20230314-v2/train.jsonl
+ dev_filepath: resources/Merged/20230314-v2/dev.jsonl
+ test_filepath: resources/Merged/20230314-v2/test.jsonl
+ random_seed: 1227
+ num_epochs: 20
+ num_steps: -1
+ warmup_proportion: 0.1
+ epoch_patience: 10
+ step_patience: 5000
+ batch_size: 64
+ learning_rate: 2.0e-05
+ max_grad_norm: -1.0
+ skip_train: false
+ debug_mode: false
+ grad_accum_steps: 1
+ resumed_training_path: null
+ step_eval_interval: 20000
+ epoch_eval_interval: 1
+ eval_on_data:
+ - dev
+ select_best_on_data: dev
+ select_best_by_key: metric
+ best_metric_field: micro.f1
+ save_every_ckpt: false
+ save_best_ckpt: true
+ final_eval_on_test: true
+ main_process_logging: true
+ max_seq_len: 512
+ plm_dir: hfl/chinese-roberta-wwm-ext
+ train_batch_size: 16
+ eval_batch_size: 32
+ other_learning_rate: 2.0e-05
+ dropout: 0.3
+ biaffine_size: 512
+ include_package:
+ - src.task
+ use_default_base_config: true
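
task_params.yaml captures the full run configuration for this MrcQaTask training job: data locations under resources/Merged/20230314-v2, optimization settings, and the hfl/chinese-roberta-wwm-ext backbone. A minimal sketch of reading the dumped parameters back, assuming plain PyYAML; the loader function below is illustrative and not part of the MRC4IE code:

```python
import yaml  # PyYAML

def load_task_params(path: str = "task_params.yaml") -> dict:
    """Parse the dumped task parameters into a plain dict."""
    with open(path, "r", encoding="utf-8") as f:
        return yaml.safe_load(f)

params = load_task_params()
# A few fields from the dump above:
#   params["task_type"]  -> "MrcQaTask"
#   params["plm_dir"]    -> "hfl/chinese-roberta-wwm-ext"
#   params["num_epochs"] -> 20
```
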