knifeayumu
committed on
Commit
•
a189b60
1
Parent(s):
2423a56
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +39 -0
- config.json +27 -0
- mergekit_config.yml +8 -0
- model-00001-of-00051.safetensors +3 -0
- model-00002-of-00051.safetensors +3 -0
- model-00003-of-00051.safetensors +3 -0
- model-00004-of-00051.safetensors +3 -0
- model-00005-of-00051.safetensors +3 -0
- model-00006-of-00051.safetensors +3 -0
- model-00007-of-00051.safetensors +3 -0
- model-00008-of-00051.safetensors +3 -0
- model-00009-of-00051.safetensors +3 -0
- model-00010-of-00051.safetensors +3 -0
- model-00011-of-00051.safetensors +3 -0
- model-00012-of-00051.safetensors +3 -0
- model-00013-of-00051.safetensors +3 -0
- model-00014-of-00051.safetensors +3 -0
- model-00015-of-00051.safetensors +3 -0
- model-00016-of-00051.safetensors +3 -0
- model-00017-of-00051.safetensors +3 -0
- model-00018-of-00051.safetensors +3 -0
- model-00019-of-00051.safetensors +3 -0
- model-00020-of-00051.safetensors +3 -0
- model-00021-of-00051.safetensors +3 -0
- model-00022-of-00051.safetensors +3 -0
- model-00023-of-00051.safetensors +3 -0
- model-00024-of-00051.safetensors +3 -0
- model-00025-of-00051.safetensors +3 -0
- model-00026-of-00051.safetensors +3 -0
- model-00027-of-00051.safetensors +3 -0
- model-00028-of-00051.safetensors +3 -0
- model-00029-of-00051.safetensors +3 -0
- model-00030-of-00051.safetensors +3 -0
- model-00031-of-00051.safetensors +3 -0
- model-00032-of-00051.safetensors +3 -0
- model-00033-of-00051.safetensors +3 -0
- model-00034-of-00051.safetensors +3 -0
- model-00035-of-00051.safetensors +3 -0
- model-00036-of-00051.safetensors +3 -0
- model-00037-of-00051.safetensors +3 -0
- model-00038-of-00051.safetensors +3 -0
- model-00039-of-00051.safetensors +3 -0
- model-00040-of-00051.safetensors +3 -0
- model-00041-of-00051.safetensors +3 -0
- model-00042-of-00051.safetensors +3 -0
- model-00043-of-00051.safetensors +3 -0
- model-00044-of-00051.safetensors +3 -0
- model-00045-of-00051.safetensors +3 -0
- model-00046-of-00051.safetensors +3 -0
- model-00047-of-00051.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model:
|
3 |
+
- anthracite-org/magnum-v4-123b
|
4 |
+
- TheDrummer/Behemoth-123B-v1.1
|
5 |
+
library_name: transformers
|
6 |
+
tags:
|
7 |
+
- mergekit
|
8 |
+
- merge
|
9 |
+
|
10 |
+
---
|
11 |
+
# merge
|
12 |
+
|
13 |
+
This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
|
14 |
+
|
15 |
+
## Merge Details
|
16 |
+
### Merge Method
|
17 |
+
|
18 |
+
This model was merged using the SLERP merge method.
|
19 |
+
|
20 |
+
### Models Merged
|
21 |
+
|
22 |
+
The following models were included in the merge:
|
23 |
+
* [anthracite-org/magnum-v4-123b](https://huggingface.co/anthracite-org/magnum-v4-123b)
|
24 |
+
* [TheDrummer/Behemoth-123B-v1.1](https://huggingface.co/TheDrummer/Behemoth-123B-v1.1)
|
25 |
+
|
26 |
+
### Configuration
|
27 |
+
|
28 |
+
The following YAML configuration was used to produce this model:
|
29 |
+
|
30 |
+
```yaml
|
31 |
+
models:
|
32 |
+
- model: TheDrummer/Behemoth-123B-v1.1
|
33 |
+
- model: anthracite-org/magnum-v4-123b
|
34 |
+
merge_method: slerp
|
35 |
+
base_model: TheDrummer/Behemoth-123B-v1.1
|
36 |
+
parameters:
|
37 |
+
t: [0.1, 0.3, 0.6, 0.3, 0.1]
|
38 |
+
dtype: float16
|
39 |
+
```
|
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "TheDrummer/Behemoth-123B-v1.1",
|
3 |
+
"architectures": [
|
4 |
+
"MistralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"head_dim": 128,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 12288,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 131072,
|
15 |
+
"model_type": "mistral",
|
16 |
+
"num_attention_heads": 96,
|
17 |
+
"num_hidden_layers": 88,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"rms_norm_eps": 1e-05,
|
20 |
+
"rope_theta": 1000000.0,
|
21 |
+
"sliding_window": null,
|
22 |
+
"tie_word_embeddings": false,
|
23 |
+
"torch_dtype": "float16",
|
24 |
+
"transformers_version": "4.45.1",
|
25 |
+
"use_cache": true,
|
26 |
+
"vocab_size": 32768
|
27 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
models:
|
2 |
+
- model: TheDrummer/Behemoth-123B-v1.1
|
3 |
+
- model: anthracite-org/magnum-v4-123b
|
4 |
+
merge_method: slerp
|
5 |
+
base_model: TheDrummer/Behemoth-123B-v1.1
|
6 |
+
parameters:
|
7 |
+
t: [0.1, 0.3, 0.6, 0.3, 0.1]
|
8 |
+
dtype: float16
|
model-00001-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b9c67dd7122db0b16b0b8cc9d4c51501ca05a37ca91609ca735866050780ac5
|
3 |
+
size 4378928488
|
model-00002-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82c517c0ec0d2715936a1fd9de2845253fa1dec2975c83abc9be6d1ac77c4eff
|
3 |
+
size 4907411072
|
model-00003-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23487baa212737849c143959c49b297ce7bacef2367fa672d2dc0a52b04e5e5b
|
3 |
+
size 4806747888
|
model-00004-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c26ccd18499ffb3ff0eb2104b997d9c0a3826000eb0b9cff91f6c1974a97636c
|
3 |
+
size 4831938528
|
model-00005-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17a8c889158afb91de383876df4377e919323081d0fd8af419da6ecff21eff1d
|
3 |
+
size 4831938536
|
model-00006-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b34d65a618104b7fc06eb90e47c9596ee147270e4e4325029483580c57f36603
|
3 |
+
size 4907411080
|
model-00007-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca62bc87e09c18c86937e28a47a8469e5ab5e4a0f7e693bc45868458a82e9df9
|
3 |
+
size 4806747888
|
model-00008-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22cfc848f83ae5c5e68d2055e14f1127e074f25fc9671d6c8dccd1d08875a10e
|
3 |
+
size 4831938520
|
model-00009-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1820fa12192bd7c560a6c6341183bd1504e6703085ebb57fc94189dd22c13fe7
|
3 |
+
size 4831938536
|
model-00010-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1cc7b5a52c118ab995da22385feeedd9c5d13c158aca3ca76f3705c3c6472f5
|
3 |
+
size 4907411080
|
model-00011-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95cbcf86e72a64ef75bb9a45e845121b625a8fabfd47eb5f04cbaff3984bafb8
|
3 |
+
size 4806747888
|
model-00012-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2db092e7829bf5ba1b279f88541dec48ec39d2866786bcfa935ae51575eedb00
|
3 |
+
size 4831938528
|
model-00013-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9756ba28898ff82beb78ec0ccaec5af874cd3eaf9dc12740f0c58d2e328f6467
|
3 |
+
size 4831938536
|
model-00014-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d617f305ea83b86a4e725bae4a84212942575bb1214c7b1a150fff755bd2ffeb
|
3 |
+
size 4907411072
|
model-00015-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbda6c2fbd9627a612039e5db63bc16b60f1a7bd256ec0fc637d24ca6c6fdb83
|
3 |
+
size 4806747888
|
model-00016-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2fac2af0ffd12363faa5b0a74ed17994538a8a2e9d9def582e113d53c05a1b9
|
3 |
+
size 4831938528
|
model-00017-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee742ed2abc929026bdcec8c2f6a73eed49aa2c6611e32760f7b32f377b5b2c4
|
3 |
+
size 4831938536
|
model-00018-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72d8d7fd283367e738319aef5daca11a561a50bbfec27da29493d3779394cf00
|
3 |
+
size 4907411080
|
model-00019-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e2e50c673f53672c07901e7fb0ae3ef80290224869a43e3591a48521f83ac1a
|
3 |
+
size 4806747888
|
model-00020-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66482d882bc1b3a7e17384b65e85f1246d85da1c7aedac0de41f0a90089666b8
|
3 |
+
size 4831938528
|
model-00021-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ac7fc109f8fbe7fd62b7d4828e0d354ba0502dce6d0bb26252959c21b7ae4ca
|
3 |
+
size 4831938528
|
model-00022-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60367a5b237bf7a86ae35442381ad19f1b1ca33586553e38a4732edc34e08419
|
3 |
+
size 4907411080
|
model-00023-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bda2d0b0978a48c6866bae30e831b874762622bb6c675b23459d27c6fa55096f
|
3 |
+
size 4806747888
|
model-00024-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea2cddd4bb712dc0b3192daae2a0d11b01db9b8f678a7ac35dba9f95b7b9384a
|
3 |
+
size 4831938528
|
model-00025-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a74a489aa29c4c705108def46dfe5e1c0e3ed28edd3c8853c8022506520665e
|
3 |
+
size 4831938536
|
model-00026-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bd9eedd9ec1b65940e439e1c33aaa40cdd07958d3537dfbf489dbbf95294802
|
3 |
+
size 4907411080
|
model-00027-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2b4b78b3291bb1a78ce84ac0e416c109a85548f4b503e39b8d6934406ccf116
|
3 |
+
size 4806747880
|
model-00028-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9811b27823a6a7388cef7435bee26a6e082f983f99428ce2907884657ea97d3e
|
3 |
+
size 4831938528
|
model-00029-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:251963e2666050f6d757518d1e360bee2a18a7495f1b2ad649593db99cc29b89
|
3 |
+
size 4831938536
|
model-00030-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a493a9dabcd7df8a475b393c86647fb237360ed929bd2078083bc41e1d45437a
|
3 |
+
size 4907411080
|
model-00031-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49bd96c00cb74eb10bbcdc82137bb16be9bcfb8df97cf9489c65aae16b5f017f
|
3 |
+
size 4806747888
|
model-00032-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e43965a93e33119e0869ff15dd66e9f3ec3caeacc97a7dcccf5bdbb355e7e49
|
3 |
+
size 4831938528
|
model-00033-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6cfc0dcb11a99e77dcf5f0ff44965fa39a20f8b7b296235925548ac7a80758a
|
3 |
+
size 4831938528
|
model-00034-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b58fc61fd2f4ae449f90d03cbab69293739ce21ec71b5a5bf122e33e54c3e92e
|
3 |
+
size 4907411080
|
model-00035-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cc9de2da23517f35f01d5c8160334c65ceb67f4b41ba1b05160339765546beb
|
3 |
+
size 4806747888
|
model-00036-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29c0f382e6fb159c4a3e5b9bbdc8c6f82153c7d930a7b931756388c41b8b58c1
|
3 |
+
size 4831938528
|
model-00037-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b679e2a79378066fee777033609a828199e2171c1dfd8502be91f83455d96ac9
|
3 |
+
size 4831938536
|
model-00038-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd02cdf9bc09935bd985693d6f4e574ccbfab5490be148dcbcb404a0a8ae2083
|
3 |
+
size 4907411080
|
model-00039-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40d5f40fc5662c16990ba6221d3c0da9e31e286712cf66ec6c475148c8c062cf
|
3 |
+
size 4806747888
|
model-00040-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4e664b8c40069e04ef58f619dc0d7fe67cd373cefbfd2832661332b3737b597
|
3 |
+
size 4831938528
|
model-00041-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba345b6f2fd34245814f4f00bb5c3554c843bb6c6f338a512b896f0647ba40b0
|
3 |
+
size 4831938536
|
model-00042-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:610857d0068536623f6d4f55673c6c6728910aa364ef479db7dfb1ce677a40c6
|
3 |
+
size 4907411080
|
model-00043-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2dc72050121a4cf54e57a469ca94613ad317b9df6b3cb92e3ab9ef2cabb7a693
|
3 |
+
size 4806747888
|
model-00044-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2e7351828b7c222b83306c7ea1dd49465a6bca22f1c76422f3af1e7f6a8eb46
|
3 |
+
size 4831938528
|
model-00045-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49d47ccf9976ad2215e204223dccd8d82c3e99f93d3b8294555f577cec938a45
|
3 |
+
size 4831938536
|
model-00046-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:786cbac6c4907ef0f5ea109dcf5bda9c4c1900724b8f0a0dca3a40c0c3c29f7f
|
3 |
+
size 4907411072
|
model-00047-of-00051.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12beaee752b784fd60bf617fff0fc92e9f0671b5e2609dc0830e5a4851c87079
|
3 |
+
size 4806747888
|