Update README.md
Browse files
README.md
CHANGED
@@ -1,10 +1,12 @@
|
|
1 |
---
|
|
|
2 |
license: gemma
|
3 |
datasets:
|
4 |
- openbmb/UltraFeedback
|
5 |
language:
|
6 |
- en
|
7 |
pipeline_tag: text-generation
|
|
|
8 |
---
|
9 |
Self-Play Preference Optimization for Language Model Alignment (https://arxiv.org/abs/2405.00675)
|
10 |
|
|
|
1 |
---
|
2 |
+
base_model: UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3
|
3 |
license: gemma
|
4 |
datasets:
|
5 |
- openbmb/UltraFeedback
|
6 |
language:
|
7 |
- en
|
8 |
pipeline_tag: text-generation
|
9 |
+
quantized_by: Apel-sin
|
10 |
---
|
11 |
Self-Play Preference Optimization for Language Model Alignment (https://arxiv.org/abs/2405.00675)
|
12 |
|