{
  "model_type": "llama",
  "model_name": "SiddharthShukla48/Mental_Health_Counseling",
  "peft_config": {
    "lora_r": 64,
    "lora_alpha": 16,
    "lora_dropout": 0.1,
    "task_type": "CAUSAL_LM"
  },
  "bnb_config": {
    "use_4bit": true,
    "bnb_4bit_compute_dtype": "float16",
    "bnb_4bit_quant_type": "nf4",
    "use_nested_quant": false
  },
  "training_arguments": {
    "output_dir": "SiddharthShukla48/llama_mental_health",
    "num_train_epochs": 1,
    "fp16": false,
    "bf16": false,
    "per_device_train_batch_size": 4,
    "per_device_eval_batch_size": 4,
    "gradient_accumulation_steps": 1,
    "gradient_checkpointing": true,
    "max_grad_norm": 0.3,
    "learning_rate": 2e-4,
    "weight_decay": 0.001,
    "optim": "paged_adamw_32bit",
    "lr_scheduler_type": "cosine",
    "max_steps": -1,
    "warmup_ratio": 0.03,
    "group_by_length": true,
    "save_steps": 0,
    "logging_steps": 25
  },
  "max_seq_length": 1024,
  "tokenizer_name": "NousResearch/Llama-2-7b-chat-hf",
  "pad_token": "",
  "padding_side": "right",
  "use_cache": false,
  "pretraining_tp": 1
}