Minbyul committed on
Commit
21bcd26
1 Parent(s): 7722e13

Model save

Browse files
README.md CHANGED
@@ -1,15 +1,12 @@
1
  ---
2
  base_model: dmis-lab/selfbiorag_7b
3
  tags:
4
- - alignment-handbook
5
- - trl
6
- - sft
7
- - generated_from_trainer
8
  - trl
9
  - sft
 
10
  - generated_from_trainer
11
  datasets:
12
- - HuggingFaceH4/deita-10k-v0-sft
13
  model-index:
14
  - name: selfbiorag-7b-1e-6-wo-kqa_silver_wogold-iter-sft-step1_lr
15
  results: []
@@ -20,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  # selfbiorag-7b-1e-6-wo-kqa_silver_wogold-iter-sft-step1_lr
22
 
23
- This model is a fine-tuned version of [dmis-lab/selfbiorag_7b](https://huggingface.co/dmis-lab/selfbiorag_7b) on the HuggingFaceH4/deita-10k-v0-sft dataset.
24
  It achieves the following results on the evaluation set:
25
  - Loss: 1.5166
26
 
@@ -60,7 +57,7 @@ The following hyperparameters were used during training:
60
  | Training Loss | Epoch | Step | Validation Loss |
61
  |:-------------:|:-----:|:----:|:---------------:|
62
  | 1.4116 | 0.84 | 4 | 1.5586 |
63
- | 1.4074 | 1.89 | 9 | 1.5178 |
64
  | 1.3759 | 2.53 | 12 | 1.5166 |
65
 
66
 
 
1
  ---
2
  base_model: dmis-lab/selfbiorag_7b
3
  tags:
 
 
 
 
4
  - trl
5
  - sft
6
+ - alignment-handbook
7
  - generated_from_trainer
8
  datasets:
9
+ - generator
10
  model-index:
11
  - name: selfbiorag-7b-1e-6-wo-kqa_silver_wogold-iter-sft-step1_lr
12
  results: []
 
17
 
18
  # selfbiorag-7b-1e-6-wo-kqa_silver_wogold-iter-sft-step1_lr
19
 
20
+ This model is a fine-tuned version of [dmis-lab/selfbiorag_7b](https://huggingface.co/dmis-lab/selfbiorag_7b) on the generator dataset.
21
  It achieves the following results on the evaluation set:
22
  - Loss: 1.5166
23
 
 
57
  | Training Loss | Epoch | Step | Validation Loss |
58
  |:-------------:|:-----:|:----:|:---------------:|
59
  | 1.4116 | 0.84 | 4 | 1.5586 |
60
+ | 1.4074 | 1.89 | 9 | 1.5179 |
61
  | 1.3759 | 2.53 | 12 | 1.5166 |
62
 
63
 
all_results.json CHANGED
@@ -5,9 +5,9 @@
5
  "eval_samples": 904,
6
  "eval_samples_per_second": 11.691,
7
  "eval_steps_per_second": 0.731,
8
- "train_loss": 1.3832212686538696,
9
- "train_runtime": 213.2984,
10
  "train_samples": 4047,
11
- "train_samples_per_second": 4.149,
12
  "train_steps_per_second": 0.056
13
  }
 
5
  "eval_samples": 904,
6
  "eval_samples_per_second": 11.691,
7
  "eval_steps_per_second": 0.731,
8
+ "train_loss": 1.3832024335861206,
9
+ "train_runtime": 214.4516,
10
  "train_samples": 4047,
11
+ "train_samples_per_second": 4.127,
12
  "train_steps_per_second": 0.056
13
  }
config.json CHANGED
@@ -23,6 +23,6 @@
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.39.0.dev0",
26
- "use_cache": true,
27
  "vocab_size": 32016
28
  }
 
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.39.0.dev0",
26
+ "use_cache": false,
27
  "vocab_size": 32016
28
  }
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ccd8d7f35387a07dd8ec4da89373d40065ed3ecd311977490c9fa0d60f720adb
3
  size 4939116424
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca43263c29a0922d70b08411b028441d6c37b20e150bb5bcd853e9ce909e6734
3
  size 4939116424
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44053789dfd074c0517b18c79011576790733a3685edc86b502a86bdac548288
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dba6ba75d061f07091c1b50e7052a032d2156d7229baf786c41631ee338ba81
3
  size 4947390880
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd84089f0e9f263832d03370ae2102ae69a6a193bd63b29d91e71428f453669a
3
  size 3590619888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6648322215c3d7128e74635f14576d4140b3903e75a0f6e3f4a7416c9728a1c5
3
  size 3590619888
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 2.53,
3
- "train_loss": 1.3832212686538696,
4
- "train_runtime": 213.2984,
5
  "train_samples": 4047,
6
- "train_samples_per_second": 4.149,
7
  "train_steps_per_second": 0.056
8
  }
 
1
  {
2
  "epoch": 2.53,
3
+ "train_loss": 1.3832024335861206,
4
+ "train_runtime": 214.4516,
5
  "train_samples": 4047,
6
+ "train_samples_per_second": 4.127,
7
  "train_steps_per_second": 0.056
8
  }
trainer_state.json CHANGED
@@ -10,56 +10,56 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.21,
13
- "grad_norm": 7.686335725067591,
14
  "learning_rate": 5e-07,
15
  "loss": 1.4116,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.84,
20
- "eval_loss": 1.558627963066101,
21
- "eval_runtime": 5.3458,
22
- "eval_samples_per_second": 11.972,
23
- "eval_steps_per_second": 0.748,
24
  "step": 4
25
  },
26
  {
27
  "epoch": 1.05,
28
- "grad_norm": 7.287253588921336,
29
  "learning_rate": 7.938926261462365e-07,
30
  "loss": 1.4074,
31
  "step": 5
32
  },
33
  {
34
  "epoch": 1.89,
35
- "eval_loss": 1.517771601676941,
36
- "eval_runtime": 5.2983,
37
- "eval_samples_per_second": 12.079,
38
- "eval_steps_per_second": 0.755,
39
  "step": 9
40
  },
41
  {
42
  "epoch": 2.11,
43
- "grad_norm": 6.50356839675754,
44
  "learning_rate": 9.549150281252632e-08,
45
  "loss": 1.3759,
46
  "step": 10
47
  },
48
  {
49
  "epoch": 2.53,
50
- "eval_loss": 1.5166064500808716,
51
- "eval_runtime": 5.4659,
52
- "eval_samples_per_second": 11.709,
53
- "eval_steps_per_second": 0.732,
54
  "step": 12
55
  },
56
  {
57
  "epoch": 2.53,
58
  "step": 12,
59
  "total_flos": 2460210954240.0,
60
- "train_loss": 1.3832212686538696,
61
- "train_runtime": 213.2984,
62
- "train_samples_per_second": 4.149,
63
  "train_steps_per_second": 0.056
64
  }
65
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.21,
13
+ "grad_norm": 7.686098770544664,
14
  "learning_rate": 5e-07,
15
  "loss": 1.4116,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.84,
20
+ "eval_loss": 1.558640480041504,
21
+ "eval_runtime": 5.3808,
22
+ "eval_samples_per_second": 11.894,
23
+ "eval_steps_per_second": 0.743,
24
  "step": 4
25
  },
26
  {
27
  "epoch": 1.05,
28
+ "grad_norm": 7.297067521077281,
29
  "learning_rate": 7.938926261462365e-07,
30
  "loss": 1.4074,
31
  "step": 5
32
  },
33
  {
34
  "epoch": 1.89,
35
+ "eval_loss": 1.5179415941238403,
36
+ "eval_runtime": 5.36,
37
+ "eval_samples_per_second": 11.94,
38
+ "eval_steps_per_second": 0.746,
39
  "step": 9
40
  },
41
  {
42
  "epoch": 2.11,
43
+ "grad_norm": 6.501168641091188,
44
  "learning_rate": 9.549150281252632e-08,
45
  "loss": 1.3759,
46
  "step": 10
47
  },
48
  {
49
  "epoch": 2.53,
50
+ "eval_loss": 1.5165581703186035,
51
+ "eval_runtime": 5.5377,
52
+ "eval_samples_per_second": 11.557,
53
+ "eval_steps_per_second": 0.722,
54
  "step": 12
55
  },
56
  {
57
  "epoch": 2.53,
58
  "step": 12,
59
  "total_flos": 2460210954240.0,
60
+ "train_loss": 1.3832024335861206,
61
+ "train_runtime": 214.4516,
62
+ "train_samples_per_second": 4.127,
63
  "train_steps_per_second": 0.056
64
  }
65
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c8448a03507536af581e7bf3b53c51acba34e5bb187dc044363d746e4c62c01
3
  size 6328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5c8ca7d7552547f12da429ee06c65d0ad820ab247016bf754ddb1a20f47479
3
  size 6328