secometo's picture
Upload model_args.json
eaf3978
raw
history blame
499 Bytes
{'adam_epsilon': 1e-08,
'data_dir': '',
'early_stop_callback': False,
'eval_batch_size': 4,
'fp_16': False,
'gradient_accumulation_steps': 16,
'learning_rate': 0.0003,
'max_grad_norm': 1.0,
'max_seq_length': 150,
'model_name_or_path': 'google/mt5-base',
'n_gpu': 1,
'num_train_epochs': 2,
'opt_level': 'O1',
'output_dir': 'mt5model_dh_small/',
'seed': 42,
'tokenizer_name_or_path': 'google/mt5-base',
'train_batch_size': 4,
'warmup_steps': 0,
'weight_decay': 0.0}