Text Generation
PEFT
Safetensors
Muhammad7865253 committed on
Commit
9078c5e
1 Parent(s): 1391b6f

Create model_config.json

Browse files
Files changed (1) hide show
  1. model_config.json +57 -0
model_config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "unsloth/gemma-2-2b",
3
+ "max_seq_length": 2048,
4
+ "dtype": null,
5
+ "load_in_4bit": false,
6
+ "lora_params": {
7
+ "r": 16,
8
+ "target_modules": [
9
+ "q_proj",
10
+ "k_proj",
11
+ "v_proj",
12
+ "o_proj",
13
+ "gate_proj",
14
+ "up_proj",
15
+ "down_proj"
16
+ ],
17
+ "lora_alpha": 16,
18
+ "lora_dropout": 0,
19
+ "bias": "none",
20
+ "use_gradient_checkpointing": "unsloth",
21
+ "random_state": 3407,
22
+ "use_rslora": false
23
+ },
24
+ "training_args": {
25
+ "per_device_train_batch_size": 4,
26
+ "gradient_accumulation_steps": 4,
27
+ "warmup_steps": 5,
28
+ "num_train_epochs": 1,
29
+ "learning_rate": 0.0002,
30
+ "fp16": true,
31
+ "bf16": false,
32
+ "logging_steps": 1,
33
+ "optim": "adamw_8bit",
34
+ "weight_decay": 0.01,
35
+ "lr_scheduler_type": "linear",
36
+ "seed": 3407,
37
+ "output_dir": "outputs",
38
+ "report_to": "none"
39
+ },
40
+ "data_config": {
41
+ "dataset_name": "marmikpandya/mental-health",
42
+ "dataset_split": "train",
43
+ "dataset_rows": null,
44
+ "conversation_format": null,
45
+ "max_seq_length": 2048,
46
+ "train_on_responses_only": false
47
+ },
48
+ "inference_config": {
49
+ "temperature": null,
50
+ "min_p": null,
51
+ "max_new_tokens": null
52
+ },
53
+ "alpaca_prompt": {
54
+ "template": "Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.\n\n### Instruction:\n{}\n\n### Input:\n{}\n\n### Response:\n{}",
55
+ "eos_token": true
56
+ }
57
+ }