GOODYEONSU committed on
Commit
70d59b6
1 Parent(s): 137ef2c

Model save

Browse files
README.md CHANGED
@@ -1,4 +1,5 @@
1
  ---
 
2
  license: apache-2.0
3
  base_model: Qwen/Qwen2.5-0.5B-Instruct
4
  tags:
@@ -38,8 +39,8 @@ The following hyperparameters were used during training:
38
  - train_batch_size: 16
39
  - eval_batch_size: 8
40
  - seed: 42
41
- - gradient_accumulation_steps: 4
42
- - total_train_batch_size: 64
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: constant
45
  - lr_scheduler_warmup_ratio: 0.03
@@ -51,7 +52,7 @@ The following hyperparameters were used during training:
51
 
52
  ### Framework versions
53
 
54
- - Transformers 4.43.3
55
  - Pytorch 2.4.0+cu121
56
  - Datasets 2.20.0
57
  - Tokenizers 0.19.1
 
1
  ---
2
+ library_name: transformers
3
  license: apache-2.0
4
  base_model: Qwen/Qwen2.5-0.5B-Instruct
5
  tags:
 
39
  - train_batch_size: 16
40
  - eval_batch_size: 8
41
  - seed: 42
42
+ - gradient_accumulation_steps: 2
43
+ - total_train_batch_size: 32
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: constant
46
  - lr_scheduler_warmup_ratio: 0.03
 
52
 
53
  ### Framework versions
54
 
55
+ - Transformers 4.44.2
56
  - Pytorch 2.4.0+cu121
57
  - Datasets 2.20.0
58
  - Tokenizers 0.19.1
generation_config.json CHANGED
@@ -10,5 +10,5 @@
10
  "temperature": 0.7,
11
  "top_k": 20,
12
  "top_p": 0.8,
13
- "transformers_version": "4.43.3"
14
  }
 
10
  "temperature": 0.7,
11
  "top_k": 20,
12
  "top_p": 0.8,
13
+ "transformers_version": "4.44.2"
14
  }
runs/Sep26_13-33-55_nlu12a2/events.out.tfevents.1727325250.nlu12a2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30e9d8d5e569327673a0dbc525fa917c67f53fea5c0bb8b2dbefaeafe34c7559
3
- size 11661
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff38e1605b5a22b7e53586038a6e9c32731a6dabc5b60e1087c7095ea5ddf24a
3
+ size 12226