Update README.md
Browse files
README.md
CHANGED
@@ -13,11 +13,11 @@ tags:
|
|
13 |
base_model:
|
14 |
- Qwen/Qwen2.5-72B-Instruct
|
15 |
---
|
16 |
-
# BigQwen2.5-
|
17 |
|
18 |

|
19 |
|
20 |
-
BigQwen2.5-
|
21 |
|
22 |
It applies the [mlabonne/Meta-Llama-3-120B-Instruct](https://huggingface.co/mlabonne/Meta-Llama-3-120B-Instruct/) recipe.
|
23 |
|
@@ -68,7 +68,7 @@ from transformers import AutoTokenizer
|
|
68 |
import transformers
|
69 |
import torch
|
70 |
|
71 |
-
model = "mlabonne/BigQwen2.5-
|
72 |
messages = [{"role": "user", "content": "What is a large language model?"}]
|
73 |
|
74 |
tokenizer = AutoTokenizer.from_pretrained(model)
|
|
|
13 |
base_model:
|
14 |
- Qwen/Qwen2.5-72B-Instruct
|
15 |
---
|
16 |
+
# BigQwen2.5-125B-Instruct
|
17 |
|
18 |

|
19 |
|
20 |
+
BigQwen2.5-125B-Instruct is a [Qwen/Qwen2.5-72B-Instruct](https://huggingface.co/Qwen/Qwen2.5-72B-Instruct) self-merge made with [MergeKit](https://github.com/arcee-ai/mergekit/tree/main).
|
21 |
|
22 |
It applies the [mlabonne/Meta-Llama-3-120B-Instruct](https://huggingface.co/mlabonne/Meta-Llama-3-120B-Instruct/) recipe.
|
23 |
|
|
|
68 |
import transformers
|
69 |
import torch
|
70 |
|
71 |
+
model = "mlabonne/BigQwen2.5-125B-Instruct"
|
72 |
messages = [{"role": "user", "content": "What is a large language model?"}]
|
73 |
|
74 |
tokenizer = AutoTokenizer.from_pretrained(model)
|