---
# Training run configuration: a flat mapping with one option per line.
# The grouping comments below are derived from the key names only; the exact
# meaning of each option is defined by the script that loads this file.
# NOTE(review): confirm semantics against the consuming training code.

# Experiment tracking
wandb_project: joy-caption-1

# Batch sizes, learning rate and run length
# NOTE(review): batch_size is much larger than device_batch_size, so the
# consumer presumably accumulates gradients and/or spans devices - confirm.
device_batch_size: 2
batch_size: 256
learning_rate: 0.0002
warmup_samples: 18000
max_samples: 500000
save_every: 50000
test_every: 50000

# Mixed precision, LR schedule and runtime
use_amp: true
grad_scaler: true
lr_scheduler_type: cosine
min_lr_ratio: 0.0
allow_tf32: true
seed: 69
num_workers: 8

# Optimizer
optimizer_type: adamw
adam_beta1: 0.9
adam_beta2: 0.999
adam_eps: 1.0e-08
adam_weight_decay: 0.0
clip_grad_norm: 1.0

# Dataset and base models (identifiers look like Hugging Face Hub repo ids -
# TODO confirm how the loader resolves them)
dataset: fancyfeast/joy-captioning-20240917a
clip_model: google/siglip-so400m-patch14-384
text_model: meta-llama/Meta-Llama-3.1-8B

# Checkpointing, evaluation and sequence settings
resume: null
gradient_checkpointing: false
test_size: 2048
grad_scaler_init: 65536.0
max_caption_length: 257
num_image_tokens: 32
adapter_type: mlp
text_model_dtype: bfloat16
pre_test: false

# Image model training
# NOTE(review): image_model_lr is null; presumably the consumer falls back to
# learning_rate in that case - verify.
train_image_model: true
image_model_lr: null

# LoRA
train_lora: true
lora_r: 64
lora_alpha: 16
lora_dropout: 0.1