mt5-base-jaquad-qg-ae / trainer_config.json
asahi417's picture
add model
9830bbb
raw
history blame
392 Bytes
{"dataset_path": "lmqg/qg_jaquad", "dataset_name": "default", "input_types": ["paragraph_answer", "paragraph_sentence"], "output_types": ["question", "answer"], "prefix_types": ["qg", "ae"], "model": "google/mt5-base", "max_length": 512, "max_length_output": 32, "epoch": 9, "batch": 32, "lr": 0.001, "fp16": false, "random_seed": 1, "gradient_accumulation_steps": 2, "label_smoothing": 0.15}