Upload folder using huggingface_hub
Browse files
- config.json +2 -1
- model-00001-of-00029.safetensors +2 -2
- model.safetensors.index.json +1 -2
config.json
CHANGED
@@ -12,6 +12,7 @@
|
|
12 |
"hidden_size": 8192,
|
13 |
"initializer_range": 0.02,
|
14 |
"intermediate_size": 28672,
|
|
|
15 |
"max_position_embeddings": 4096,
|
16 |
"mlp_bias": false,
|
17 |
"model_type": "llama",
|
@@ -23,7 +24,7 @@
|
|
23 |
"rope_scaling": null,
|
24 |
"rope_theta": 10000.0,
|
25 |
"tie_word_embeddings": false,
|
26 |
-
"torch_dtype": "
|
27 |
"training_pipeline_parallel": 1,
|
28 |
"training_tensor_parallel": 1,
|
29 |
"transformers_version": "4.41.0.dev0",
|
|
|
12 |
"hidden_size": 8192,
|
13 |
"initializer_range": 0.02,
|
14 |
"intermediate_size": 28672,
|
15 |
+
"kv_cache_torch_dtype": "float8_e4m3fn",
|
16 |
"max_position_embeddings": 4096,
|
17 |
"mlp_bias": false,
|
18 |
"model_type": "llama",
|
|
|
24 |
"rope_scaling": null,
|
25 |
"rope_theta": 10000.0,
|
26 |
"tie_word_embeddings": false,
|
27 |
+
"torch_dtype": "float16",
|
28 |
"training_pipeline_parallel": 1,
|
29 |
"training_tensor_parallel": 1,
|
30 |
"transformers_version": "4.41.0.dev0",
|
model-00001-of-00029.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6905b9fd4c8c73b2463d2bb557d7cf4bcc0c2bebdc169abb8590556615f33f55
|
3 |
+
size 4718660580
|
model.safetensors.index.json
CHANGED
@@ -1,11 +1,10 @@
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
-
"total_size":
|
4 |
},
|
5 |
"weight_map": {
|
6 |
"lm_head.weight": "model-00029-of-00029.safetensors",
|
7 |
"model.embed_tokens.weight": "model-00001-of-00029.safetensors",
|
8 |
-
"model.kv_cache_dtype": "model-00001-of-00029.safetensors",
|
9 |
"model.layers.0.input_layernorm.weight": "model-00001-of-00029.safetensors",
|
10 |
"model.layers.0.mlp.down_proj.weight": "model-00001-of-00029.safetensors",
|
11 |
"model.layers.0.mlp.gate_proj.weight": "model-00001-of-00029.safetensors",
|
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
+
"total_size": 137953296704
|
4 |
},
|
5 |
"weight_map": {
|
6 |
"lm_head.weight": "model-00029-of-00029.safetensors",
|
7 |
"model.embed_tokens.weight": "model-00001-of-00029.safetensors",
|
|
|
8 |
"model.layers.0.input_layernorm.weight": "model-00001-of-00029.safetensors",
|
9 |
"model.layers.0.mlp.down_proj.weight": "model-00001-of-00029.safetensors",
|
10 |
"model.layers.0.mlp.gate_proj.weight": "model-00001-of-00029.safetensors",
|