|
--- |
|
license: apache-2.0 |
|
tags: |
|
- generated_from_trainer |
|
base_model: yanolja/EEVE-Korean-10.8B-v1.0 |
|
model-index: |
|
- name: yanolja/EEVE-Korean-Instruct-10.8B-v1.0 |
|
results: [] |
|
--- |
|
|
|
|
|
- Original model is [yanolja/EEVE-Korean-Instruct-10.8B-v1.0](https://huggingface.co/yanolja/EEVE-Korean-Instruct-10.8B-v1.0) |
|
- Quantized to GGUF format using [llama.cpp](https://github.com/ggerganov/llama.cpp) |
|
|
|
|
|
## Ollama |
|
|
|
Example `Modelfile`: |
|
|
|
``` |
|
FROM EEVE-Korean-Instruct-10.8B-v1.0-Q8_0.gguf |
|
|
|
TEMPLATE """{{- if .System }} |
|
<s>{{ .System }}</s> |
|
{{- end }} |
|
<s>Human: |
|
{{ .Prompt }}</s> |
|
<s>Assistant: |
|
""" |
|
|
|
SYSTEM """A chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user's questions.""" |
|
|
|
PARAMETER temperature 0 |
|
PARAMETER num_predict 3000 |
|
PARAMETER num_ctx 4096 |
|
PARAMETER stop <s> |
|
PARAMETER stop </s> |
|
``` |
|
|
|
|
|
|
|
## Training Data |
|
- Korean-translated version of [Open-Orca/SlimOrca-Dedup](https://huggingface.co/datasets/Open-Orca/SlimOrca-Dedup) |
|
- Korean-translated version of [argilla/ultrafeedback-binarized-preferences-cleaned](https://huggingface.co/datasets/argilla/ultrafeedback-binarized-preferences-cleaned) |
|
- No other dataset was used |
|
|
|
## Citation |
|
|
|
``` |
|
@misc{kim2024efficient, |
|
title={Efficient and Effective Vocabulary Expansion Towards Multilingual Large Language Models}, |
|
author={Seungduk Kim and Seungtaek Choi and Myeongho Jeong}, |
|
year={2024}, |
|
eprint={2402.14714}, |
|
archivePrefix={arXiv}, |
|
primaryClass={cs.CL} |
|
} |
|
``` |
|
``` |
|
@misc{cui2023ultrafeedback, |
|
title={UltraFeedback: Boosting Language Models with High-quality Feedback}, |
|
author={Ganqu Cui and Lifan Yuan and Ning Ding and Guanming Yao and Wei Zhu and Yuan Ni and Guotong Xie and Zhiyuan Liu and Maosong Sun}, |
|
year={2023}, |
|
eprint={2310.01377}, |
|
archivePrefix={arXiv}, |
|
primaryClass={cs.CL} |
|
} |
|
``` |
|
``` |
|
@misc{SlimOrcaDedup, |
|
title = {SlimOrca Dedup: A Deduplicated Subset of SlimOrca}, |
|
author = {Wing Lian and Guan Wang and Bleys Goodson and Eugene Pentland and Austin Cook and Chanvichet Vong and "Teknium" and Nathan Hoos}, |
|
year = {2023}, |
|
publisher = {HuggingFace}, |
|
url = {https://huggingface.co/datasets/Open-Orca/SlimOrca-Dedup/} |
|
} |
|
``` |
|
``` |
|
@misc{mukherjee2023orca, |
|
title={Orca: Progressive Learning from Complex Explanation Traces of GPT-4}, |
|
author={Subhabrata Mukherjee and Arindam Mitra and Ganesh Jawahar and Sahaj Agarwal and Hamid Palangi and Ahmed Awadallah}, |
|
year={2023}, |
|
eprint={2306.02707}, |
|
archivePrefix={arXiv}, |
|
primaryClass={cs.CL} |
|
} |
|
``` |
|
|