File size: 527 Bytes
724ad08 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 |
{
"project": "iterative preference learning",
"exp_name": "mistral-sft_iter4",
"cache_dir": ".cache",
"result_dir": "results",
"data": null,
"prompt_max_length": 1024,
"max_length": 2048,
"model_name_or_path": ".cache/mistral-sft_iter3",
"ref_model_name_or_path": ".cache/mistral-sft_iter1/",
"beta": 0.1,
"n_epochs": 1,
"per_device_batch_size": 1,
"gradient_accumulation_steps": 32,
"lr": 5e-07,
"warmup_ratio": 0.03,
"max_grad_norm": 1,
"open_port": 57423
}