mohitsha HF staff committed on
Commit
21f0e66
1 Parent(s): f119ab9

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -12,6 +12,7 @@
12
  "hidden_size": 8192,
13
  "initializer_range": 0.02,
14
  "intermediate_size": 28672,
 
15
  "max_position_embeddings": 4096,
16
  "mlp_bias": false,
17
  "model_type": "llama",
@@ -23,7 +24,7 @@
23
  "rope_scaling": null,
24
  "rope_theta": 10000.0,
25
  "tie_word_embeddings": false,
26
- "torch_dtype": "float8_e4m3fn",
27
  "training_pipeline_parallel": 1,
28
  "training_tensor_parallel": 1,
29
  "transformers_version": "4.41.0.dev0",
 
12
  "hidden_size": 8192,
13
  "initializer_range": 0.02,
14
  "intermediate_size": 28672,
15
+ "kv_cache_torch_dtype": "float8_e4m3fn",
16
  "max_position_embeddings": 4096,
17
  "mlp_bias": false,
18
  "model_type": "llama",
 
24
  "rope_scaling": null,
25
  "rope_theta": 10000.0,
26
  "tie_word_embeddings": false,
27
+ "torch_dtype": "float16",
28
  "training_pipeline_parallel": 1,
29
  "training_tensor_parallel": 1,
30
  "transformers_version": "4.41.0.dev0",
model-00001-of-00029.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b7a773e6539ff6286f191598136e72fffd6109e87d3587e4f8d569fd3c3cb82
3
- size 4718660669
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6905b9fd4c8c73b2463d2bb557d7cf4bcc0c2bebdc169abb8590556615f33f55
3
+ size 4718660580
model.safetensors.index.json CHANGED
@@ -1,11 +1,10 @@
1
  {
2
  "metadata": {
3
- "total_size": 137953296705
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model-00029-of-00029.safetensors",
7
  "model.embed_tokens.weight": "model-00001-of-00029.safetensors",
8
- "model.kv_cache_dtype": "model-00001-of-00029.safetensors",
9
  "model.layers.0.input_layernorm.weight": "model-00001-of-00029.safetensors",
10
  "model.layers.0.mlp.down_proj.weight": "model-00001-of-00029.safetensors",
11
  "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00029.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 137953296704
4
  },
5
  "weight_map": {
6
  "lm_head.weight": "model-00029-of-00029.safetensors",
7
  "model.embed_tokens.weight": "model-00001-of-00029.safetensors",
 
8
  "model.layers.0.input_layernorm.weight": "model-00001-of-00029.safetensors",
9
  "model.layers.0.mlp.down_proj.weight": "model-00001-of-00029.safetensors",
10
  "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00029.safetensors",