opt-125m-squad / args.txt
Anas Awadalla
Add model
f070e65
raw
history blame contribute delete
732 Bytes
model_name_or_path: facebook/opt-125m
config_name: None
tokenizer_name: None
use_slow_tokenizer: False
per_device_train_batch_size: 32
per_device_eval_batch_size: 32
learning_rate: 5e-05
weight_decay: 0.1
num_train_epochs: 5
patience: 100
max_train_steps: None
gradient_accumulation_steps: 1
lr_scheduler_type: SchedulerType.LINEAR
num_warmup_steps: 0
output_dir: opt_125m_squad_decay_0.1
seed: None
finetune_type: vanilla
beta: 0.1
model_type: None
max_seq_length: 384
max_context_length: 600
num_beams: 1
preprocessing_num_workers: 16
overwrite_cache: False
no_keep_linebreaks: False
push_to_hub: False
hub_model_id: None
hub_token: None
checkpointing_steps: epoch
resume_from_checkpoint: None
with_tracking: False
local_rank: -1