danielhanchen
committed on
Commit
•
6868cf2
1
Parent(s):
86c587c
Upload LlamaForCausalLM
Browse files
- config.json +1 -3
- generation_config.json +0 -2
- model-00001-of-00044.safetensors +3 -0
- model-00002-of-00044.safetensors +3 -0
- model-00003-of-00044.safetensors +3 -0
- model-00004-of-00044.safetensors +3 -0
- model-00005-of-00044.safetensors +3 -0
- model-00006-of-00044.safetensors +3 -0
- model-00007-of-00044.safetensors +3 -0
- model-00008-of-00044.safetensors +3 -0
- model-00009-of-00044.safetensors +3 -0
- model-00010-of-00044.safetensors +3 -0
- model-00011-of-00044.safetensors +3 -0
- model-00012-of-00044.safetensors +3 -0
- model-00013-of-00044.safetensors +3 -0
- model-00014-of-00044.safetensors +3 -0
- model-00015-of-00044.safetensors +3 -0
- model-00016-of-00044.safetensors +3 -0
- model-00017-of-00044.safetensors +3 -0
- model-00018-of-00044.safetensors +3 -0
- model-00019-of-00044.safetensors +3 -0
- model-00020-of-00044.safetensors +3 -0
- model-00021-of-00044.safetensors +3 -0
- model-00022-of-00044.safetensors +3 -0
- model-00023-of-00044.safetensors +3 -0
- model-00024-of-00044.safetensors +3 -0
- model-00025-of-00044.safetensors +3 -0
- model-00026-of-00044.safetensors +3 -0
- model-00027-of-00044.safetensors +3 -0
- model-00028-of-00044.safetensors +3 -0
- model-00029-of-00044.safetensors +3 -0
- model-00030-of-00044.safetensors +3 -0
- model-00031-of-00044.safetensors +3 -0
- model-00032-of-00044.safetensors +3 -0
- model-00033-of-00044.safetensors +3 -0
- model-00034-of-00044.safetensors +3 -0
- model-00035-of-00044.safetensors +3 -0
- model-00036-of-00044.safetensors +3 -0
- model-00037-of-00044.safetensors +3 -0
- model-00038-of-00044.safetensors +3 -0
- model-00039-of-00044.safetensors +3 -0
- model-00040-of-00044.safetensors +3 -0
- model-00041-of-00044.safetensors +3 -0
- model-00042-of-00044.safetensors +3 -0
- model-00043-of-00044.safetensors +3 -0
- model-00044-of-00044.safetensors +3 -0
- model.safetensors.index.json +0 -0
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
@@ -17,7 +17,6 @@
|
|
17 |
"num_attention_heads": 128,
|
18 |
"num_hidden_layers": 126,
|
19 |
"num_key_value_heads": 8,
|
20 |
-
"pad_token_id": 128004,
|
21 |
"pretraining_tp": 1,
|
22 |
"quantization_config": {
|
23 |
"_load_in_4bit": true,
|
@@ -46,7 +45,6 @@
|
|
46 |
"tie_word_embeddings": false,
|
47 |
"torch_dtype": "bfloat16",
|
48 |
"transformers_version": "4.44.2",
|
49 |
-
"unsloth_version": "2024.9",
|
50 |
"use_cache": true,
|
51 |
"vocab_size": 128256
|
52 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "meta-llama/Meta-Llama-3.1-405B",
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
|
|
17 |
"num_attention_heads": 128,
|
18 |
"num_hidden_layers": 126,
|
19 |
"num_key_value_heads": 8,
|
|
|
20 |
"pretraining_tp": 1,
|
21 |
"quantization_config": {
|
22 |
"_load_in_4bit": true,
|
|
|
45 |
"tie_word_embeddings": false,
|
46 |
"torch_dtype": "bfloat16",
|
47 |
"transformers_version": "4.44.2",
|
|
|
48 |
"use_cache": true,
|
49 |
"vocab_size": 128256
|
50 |
}
|
generation_config.json
CHANGED
@@ -3,8 +3,6 @@
|
|
3 |
"bos_token_id": 128000,
|
4 |
"do_sample": true,
|
5 |
"eos_token_id": 128001,
|
6 |
-
"max_length": 131072,
|
7 |
-
"pad_token_id": 128004,
|
8 |
"temperature": 0.6,
|
9 |
"top_p": 0.9,
|
10 |
"transformers_version": "4.44.2"
|
|
|
3 |
"bos_token_id": 128000,
|
4 |
"do_sample": true,
|
5 |
"eos_token_id": 128001,
|
|
|
|
|
6 |
"temperature": 0.6,
|
7 |
"top_p": 0.9,
|
8 |
"transformers_version": "4.44.2"
|
model-00001-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94cb37dbb5f7c756f8fe94b9de244d2db18ea8f4f86ded646c1ba9868eadf9d1
|
3 |
+
size 4947019582
|
model-00002-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0223d0bb178a982153a7e905066d498dac06c175c991244c4ddcb41331d88ca8
|
3 |
+
size 4933502252
|
model-00003-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a312d1a09677592c87d0a983bed404fad9f85db0a5ee944a03ac94d586d0fc0d
|
3 |
+
size 4933502250
|
model-00004-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b77a4927f431105935169c509580c0702c0a61cc1454def926b9a6de9b7735d
|
3 |
+
size 4933502251
|
model-00005-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9175deab6aaa82721c67749c8e22ad281321686155764e4712836b5e8cd48124
|
3 |
+
size 4933502348
|
model-00006-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c305ef7ea3eb453d61a45ff37391d0dba389efb75afa1a6fe2e2c489f7c2b28
|
3 |
+
size 4933502387
|
model-00007-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51beb88c5811647c05e7a1fa957a918671b2c9f3c113f3f85c918f4cd861adf4
|
3 |
+
size 4933502390
|
model-00008-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd7b24bb3f0e623bdc799735389d9a89004aa45c2cee5cb4eafbbb9a3119cd3f
|
3 |
+
size 4933502390
|
model-00009-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23dab6f1c7ac6a4780944c27a96fb545acd9203487cd028b60e392a8eeb467f1
|
3 |
+
size 4933502388
|
model-00010-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d8a8368513b66ba7e495d598dc20a679b368ac5ac028eac32ba6ead4e7c73a7
|
3 |
+
size 4933502385
|
model-00011-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e86fbf3906a5a20f2f7d40b71f19d1dab1c211759d482530ae2f042ec890b328
|
3 |
+
size 4933502390
|
model-00012-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa0a2bb8724cd009caa0ab84fac493e8003b85cadaacf513e429345290319d2a
|
3 |
+
size 4933502382
|
model-00013-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17cc17377bb8f9a2ad19bf654a91957ba5d4056708af5b589325ef539f6c2ab2
|
3 |
+
size 4933502386
|
model-00014-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b77662d4d9f8c61c2e6e6e7973ca10bc35e559d837c2871a2279eb8cbbccb5c
|
3 |
+
size 4933502387
|
model-00015-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7780c50e2c4c00fe0150e7c6400fd8706775277e8ce4e803b0c9f70a0061afce
|
3 |
+
size 4933502387
|
model-00016-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6af36a43efc2bd20c8a70cfe549b919dd8df5b1f508ab42d23a91d6876bc52eb
|
3 |
+
size 4933502382
|
model-00017-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a7b6a38befa67094a8705e730e8cc139db91265bb7f3f32628abb0e8261db62
|
3 |
+
size 4933502385
|
model-00018-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20e0d6efa2022afa1842236c41f25bb962cee5077dfc7b54553aff3187a168d0
|
3 |
+
size 4933502389
|
model-00019-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8b98346ec0651f050036faa57a8ff3065a5573d63bbba178b6ba87ec51b2fe1
|
3 |
+
size 4933502384
|
model-00020-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a90269648c0b4979ebb5a95dab776aeb473d6722c68ed93c3792cc33cedc86b1
|
3 |
+
size 4933502389
|
model-00021-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:191f3442eba5052cf01f45c54562aa397d38496deaf6124c20c1c57b432a31da
|
3 |
+
size 4933502388
|
model-00022-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7dd73d573f84091d31ef1afe6274feaaa91429f153fb38bd6a73d6f3ae2a83b
|
3 |
+
size 4933502388
|
model-00023-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7480ff2098ea16b76120cc8cfc22e663f346a96d0d723e4b59742e26cd3d3caa
|
3 |
+
size 4933502383
|
model-00024-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8b8a62005d62d37a94e29a4206f4e85978f6049faf83ccad649a5b758b4ce80
|
3 |
+
size 4933502385
|
model-00025-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b737efdfea1b699e30cdcaa5e68b164ab3798f4e70065dcb0a4e27618e54f97
|
3 |
+
size 4933502386
|
model-00026-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbf458e61393e8029417070d0056789bc85b43d2a25912962c8da9d0a23e7345
|
3 |
+
size 4933502388
|
model-00027-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ee14c28ecf23443765d8ba956948a9bbf2d34b9ef549749e1e193990d6c8e4a
|
3 |
+
size 4933502387
|
model-00028-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a2a4f3e05b31740768432ee73d5f423fbd020054f1c114dee96319ec06dc835
|
3 |
+
size 4933502387
|
model-00029-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1691cab0756e0c942159054eec547b37e39281470e5de052acfc0a9f55cc553a
|
3 |
+
size 4933502386
|
model-00030-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:398e090dabd847d59652f8e919a05e88fb1b6ee13ef627c0b882977f61c3c235
|
3 |
+
size 4933502391
|
model-00031-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5bbff0c977edcf2c3be2262a894e11a8e4383f44a60d19b3db13fe7f691f7a1
|
3 |
+
size 4933502389
|
model-00032-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86b900809f71220de786b24f98901b52e203a1bda3a879b78d198cff697c327a
|
3 |
+
size 4933502389
|
model-00033-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0de8e9fa44104372f2c1689a702546fbe8790f2d9578699e5f8b7664ce27eba
|
3 |
+
size 4933502388
|
model-00034-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20540e4bb34fe00cc0560e097425aa560f298e9a2de2545a52c9cd3e22ab457f
|
3 |
+
size 4933502390
|
model-00035-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6517c2c7e65a4e58410068dad6320d712c934046a2f2e6fe907973946bb4f550
|
3 |
+
size 4933502486
|
model-00036-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07554b7370f6dcf268abfb2e4bf2a9189021a455ab7480801d3b61cfe91377eb
|
3 |
+
size 4933502519
|
model-00037-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:187b68ea1ddc0b760fb338f66d4ab69e04bbbaa53b968859b8f630fadba7d28c
|
3 |
+
size 4933502515
|
model-00038-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96af7fc711f8e60f465813b7f9e36c3393523dd4ac05c3177a3ee17cb2a9eaba
|
3 |
+
size 4933502518
|
model-00039-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab221e030982ec9c605425af92d2129b478b58adf38b01456309bc7a163a01bf
|
3 |
+
size 4933502513
|
model-00040-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a30307fba3f4872e3347d8bc3b428d238e51cc8b67fe322c52b990e4995a93be
|
3 |
+
size 4933502517
|
model-00041-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7b1ad47f8d28bb0a5b95db27a878556f6aed167b4da791756789f2b50044a05
|
3 |
+
size 4933502512
|
model-00042-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f52725f959f2ce437cfc89aa993b5a573048f191fb804de20fc996c2371f8100
|
3 |
+
size 4933502514
|
model-00043-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:026b2bb50e06f859180872ef455b662a86bc890cbc01f66213008c3b18a1581d
|
3 |
+
size 4189208444
|
model-00044-of-00044.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c19b417dcc7fd337f97811ce0cd49f33750240019dc873802e7e15b6ee63b428
|
3 |
+
size 4202692736
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|