---
# Flat hyperparameter mapping for the run named by `filename`.
# One key per line; key order is kept as in the original file.
# NOTE(review): section headings below are grouped by key name/prefix only;
# confirm the exact meaning of each key against the consuming script.

# Run identity and mode
filename: stage3_test
seed: 0
mode: eval

# Strategy / hardware / trainer-level keys
strategy_name: deepspeed
use_3d: true
accelerator: gpu
# Quoted so the comma-separated value is unambiguously a string.
devices: '0,1'
precision: bf16-mixed
max_steps: 40000
accumulate_grad_batches: 8
enable_flash: true

# gin_* keys and neighbouring keys
gin_hidden_dim: 300
gin_num_layers: 5
drop_ratio: 0.0
tune_gnn: false

# bert_* keys and query-token keys
bert_hidden_dim: 768
bert_name: scibert
cross_attention_freq: 2
num_query_token: 8

# LLM name and generation keys
llm_model: llama-2-hf-7b
num_beams: 5
do_sample: false
max_len: 64
min_len: 4

# LLM tuning keys (peft_* / lora_*) and checkpoint-interval key
llm_tune: lora
peft_config: null
peft_dir: ''
every_n_train_steps: 5000
load_in_8bit: false
lora_r: 8
lora_alpha: 32
lora_dropout: 0.1

# Weight decay, learning-rate values, and scheduler name
weight_decay: 0.05
init_lr: 1.0e-05
min_lr: 1.0e-08
warmup_lr: 1.0e-06
warmup_steps: 1000
scheduler: linear_warmup_cosine_lr

# Checkpoint paths; empty strings are explicit '' values, not null
stage2_path: ''
stage3_path: all_checkpoints/stage3/step=40000.ckpt
init_checkpoint: ''

# Data-loading keys
num_workers: 8
batch_size: 8
inference_batch_size: 8
root: data/3d-mol-dataset
text_max_len: 384

# unimol_* keys
unimol_encoder_layers: 15
unimol_encoder_embed_dim: 512
unimol_encoder_ffn_embed_dim: 2048
unimol_encoder_attention_heads: 64
unimol_activation_fn: gelu
unimol_emb_dropout: 0.1
unimol_dropout: 0.1
unimol_attention_dropout: 0.1
unimol_activation_dropout: 0.0
unimol_max_seq_len: 512
unimol_delta_pair_repr_norm_loss: -1.0
unimol_max_atoms: 256