Update README.md
Browse files
README.md
CHANGED
@@ -8,11 +8,11 @@ tags:
|
|
8 |
- trl
|
9 |
- dpo
|
10 |
- generated_from_trainer
|
11 |
-
datasets:
|
12 |
-
- HuggingFaceH4/ultrafeedback_binarized
|
13 |
model-index:
|
14 |
- name: selfbiorag-7b-wo-kqa_golden-iter-dpo-step4-filtered
|
15 |
results: []
|
|
|
|
|
16 |
---
|
17 |
|
18 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
@@ -72,4 +72,4 @@ The following hyperparameters were used during training:
|
|
72 |
- Transformers 4.39.0.dev0
|
73 |
- Pytorch 2.1.2
|
74 |
- Datasets 2.14.6
|
75 |
-
- Tokenizers 0.15.2
|
|
|
8 |
- trl
|
9 |
- dpo
|
10 |
- generated_from_trainer
|
|
|
|
|
11 |
model-index:
|
12 |
- name: selfbiorag-7b-wo-kqa_golden-iter-dpo-step4-filtered
|
13 |
results: []
|
14 |
+
language:
|
15 |
+
- en
|
16 |
---
|
17 |
|
18 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
|
|
72 |
- Transformers 4.39.0.dev0
|
73 |
- Pytorch 2.1.2
|
74 |
- Datasets 2.14.6
|
75 |
+
- Tokenizers 0.15.2
|