Lin-K76 committed on
Commit
6fb669f
1 Parent(s): 30fa5d4

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +68 -0
  2. generation_config.json +9 -0
  3. model-00001-of-00048.safetensors +3 -0
  4. model-00002-of-00048.safetensors +3 -0
  5. model-00003-of-00048.safetensors +3 -0
  6. model-00004-of-00048.safetensors +3 -0
  7. model-00005-of-00048.safetensors +3 -0
  8. model-00006-of-00048.safetensors +3 -0
  9. model-00007-of-00048.safetensors +3 -0
  10. model-00008-of-00048.safetensors +3 -0
  11. model-00009-of-00048.safetensors +3 -0
  12. model-00010-of-00048.safetensors +3 -0
  13. model-00011-of-00048.safetensors +3 -0
  14. model-00012-of-00048.safetensors +3 -0
  15. model-00013-of-00048.safetensors +3 -0
  16. model-00014-of-00048.safetensors +3 -0
  17. model-00015-of-00048.safetensors +3 -0
  18. model-00016-of-00048.safetensors +3 -0
  19. model-00017-of-00048.safetensors +3 -0
  20. model-00018-of-00048.safetensors +3 -0
  21. model-00019-of-00048.safetensors +3 -0
  22. model-00020-of-00048.safetensors +3 -0
  23. model-00021-of-00048.safetensors +3 -0
  24. model-00022-of-00048.safetensors +3 -0
  25. model-00023-of-00048.safetensors +3 -0
  26. model-00024-of-00048.safetensors +3 -0
  27. model-00025-of-00048.safetensors +3 -0
  28. model-00026-of-00048.safetensors +3 -0
  29. model-00027-of-00048.safetensors +3 -0
  30. model-00028-of-00048.safetensors +3 -0
  31. model-00029-of-00048.safetensors +3 -0
  32. model-00030-of-00048.safetensors +3 -0
  33. model-00031-of-00048.safetensors +3 -0
  34. model-00032-of-00048.safetensors +3 -0
  35. model-00033-of-00048.safetensors +3 -0
  36. model-00034-of-00048.safetensors +3 -0
  37. model-00035-of-00048.safetensors +3 -0
  38. model-00036-of-00048.safetensors +3 -0
  39. model-00037-of-00048.safetensors +3 -0
  40. model-00038-of-00048.safetensors +3 -0
  41. model-00039-of-00048.safetensors +3 -0
  42. model-00040-of-00048.safetensors +3 -0
  43. model-00041-of-00048.safetensors +3 -0
  44. model-00042-of-00048.safetensors +3 -0
  45. model-00043-of-00048.safetensors +3 -0
  46. model-00044-of-00048.safetensors +3 -0
  47. model-00045-of-00048.safetensors +3 -0
  48. model-00046-of-00048.safetensors +3 -0
  49. model-00047-of-00048.safetensors +3 -0
  50. model-00048-of-00048.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "deepseek-ai/DeepSeek-Coder-V2-Base",
3
+ "architectures": [
4
+ "DeepseekV2ForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "auto_map": {
9
+ "AutoConfig": "deepseek-ai/DeepSeek-Coder-V2-Base--configuration_deepseek.DeepseekV2Config",
10
+ "AutoModel": "deepseek-ai/DeepSeek-Coder-V2-Base--modeling_deepseek.DeepseekV2Model",
11
+ "AutoModelForCausalLM": "deepseek-ai/DeepSeek-Coder-V2-Base--modeling_deepseek.DeepseekV2ForCausalLM"
12
+ },
13
+ "aux_loss_alpha": 0.001,
14
+ "bos_token_id": 100000,
15
+ "eos_token_id": 100001,
16
+ "ep_size": 1,
17
+ "first_k_dense_replace": 1,
18
+ "hidden_act": "silu",
19
+ "hidden_size": 5120,
20
+ "initializer_range": 0.02,
21
+ "intermediate_size": 12288,
22
+ "kv_lora_rank": 512,
23
+ "max_position_embeddings": 163840,
24
+ "model_type": "deepseek_v2",
25
+ "moe_intermediate_size": 1536,
26
+ "moe_layer_freq": 1,
27
+ "n_group": 8,
28
+ "n_routed_experts": 160,
29
+ "n_shared_experts": 2,
30
+ "norm_topk_prob": false,
31
+ "num_attention_heads": 128,
32
+ "num_experts_per_tok": 6,
33
+ "num_hidden_layers": 60,
34
+ "num_key_value_heads": 128,
35
+ "pretraining_tp": 1,
36
+ "q_lora_rank": 1536,
37
+ "qk_nope_head_dim": 128,
38
+ "qk_rope_head_dim": 64,
39
+ "quantization_config": {
40
+ "activation_scheme": "static",
41
+ "ignored_layers": [
42
+ "lm_head"
43
+ ],
44
+ "quant_method": "fp8"
45
+ },
46
+ "rms_norm_eps": 1e-06,
47
+ "rope_scaling": {
48
+ "beta_fast": 32,
49
+ "beta_slow": 1,
50
+ "factor": 40,
51
+ "mscale": 1.0,
52
+ "mscale_all_dim": 1.0,
53
+ "original_max_position_embeddings": 4096,
54
+ "type": "yarn"
55
+ },
56
+ "rope_theta": 10000,
57
+ "routed_scaling_factor": 16.0,
58
+ "scoring_func": "softmax",
59
+ "seq_aux": true,
60
+ "tie_word_embeddings": false,
61
+ "topk_group": 3,
62
+ "topk_method": "group_limited_greedy",
63
+ "torch_dtype": "bfloat16",
64
+ "transformers_version": "4.42.4",
65
+ "use_cache": true,
66
+ "v_head_dim": 128,
67
+ "vocab_size": 102400
68
+ }
generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 100000,
4
+ "do_sample": true,
5
+ "eos_token_id": 100001,
6
+ "temperature": 0.3,
7
+ "top_p": 0.95,
8
+ "transformers_version": "4.42.4"
9
+ }
model-00001-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50b88c568fde1c4dd6b48783c556797e94a9ebb243c10c7a54e865a054d5f562
3
+ size 4996259528
model-00002-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89f46ab8b32f869ff374f533a5945c37d0c656f7bb8f610e5fa8f91c2bde49c8
3
+ size 4996987640
model-00003-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3caf3d12bd2396f49af10e719dd6063a6bec88301e17dd3e4ef87881dcffe6c9
3
+ size 4995526672
model-00004-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdf015f5c33909e02cd68af0bdfbe9900d363162b417720831ff2523465ad817
3
+ size 4995526744
model-00005-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec42b35a58d432ca9267d4fbc599d4213240bfc22b7eea884cd1c16eb5c3e42d
3
+ size 4995527056
model-00006-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b4b844df5daf120a3b8cd1114409a56cbbf8b26a378d943df375fc00565ca73
3
+ size 4996987592
model-00007-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d633a243a339da1579eb3fb6e20a475a4fbcaa789c6d68035878533c305bcca
3
+ size 4995526672
model-00008-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c46f4435f22d6cfa0875bd44e4c0aa094323c3ccf8985cfeea96041e94e7de06
3
+ size 4995527816
model-00009-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20ccf6879d95b5e5e97f54cf6070ec2705504a6313df3c2abe465937de859113
3
+ size 4995528912
model-00010-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa147d9334fbd914bb209f0bd63a6ced90acef9bcaff56e57486fe018fc81e39
3
+ size 4996989368
model-00011-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db3ca10560a28e66710fb26bd6093fe23d279be1187bb2e3d5232c4973bc8bc2
3
+ size 4995528528
model-00012-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:052f886aa7efc874d1422613b29c8e38c8d6733e767a6019c3bc6fbb7ce65245
3
+ size 4995528696
model-00013-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8d1d05c769be0f2467eb8f4b493980d120f87648a44e9658fe353730b55baed
3
+ size 4989302048
model-00014-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3764f33ac4637e79c21387f4f5181c8bfd52170cd5109175a183ab3bc73c504
3
+ size 4995351504
model-00015-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e5d5eb34d0756d47b8ef6e45a35d285be68e5fbc3ecceed6104a33392b77871
3
+ size 4995528528
model-00016-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ea4504dae11c8484433f41eb570309f8c43ac46449f8143da64d458c2a2288b
3
+ size 4995528736
model-00017-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e306d2d9a715c27ab793970bbe660e55d71988b4a0951174e3c9e64fdea11672
3
+ size 4960291384
model-00018-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0e812044d474710f4845ccb9814220308e2cd13d15360916f74a0a56c46b7f7
3
+ size 4992903432
model-00019-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9279e4faafccbc6d25c6a669e771ca35af76cbb337db29828ccbcc287d6d0e3
3
+ size 4995528528
model-00020-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6422fae9eb8f3de8f1975266cc5d12003f1ffe9ed230bdace3e3e2ff9ed120d
3
+ size 4995528768
model-00021-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:244c05fb0811c1704b12d6d5a78e4827d8799f7a78f682520ace4c040cd8b73a
3
+ size 4996989712
model-00022-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0066660206cfa4174b7a61810245b3579a8eb7d024ece8406d411755c77e80ad
3
+ size 4995528448
model-00023-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bff7a9a322276d1e3a459f3da3386be8e3c5667168bf7438998d5682f22cc5bc
3
+ size 4995528528
model-00024-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:401544805c2373ea0f153afd95416c9b10e31e6573464abf0807b31797fd9461
3
+ size 4995528816
model-00025-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e65663f955cf00afe00304e5165ccd8adfa63a4d557d373a3ea79d47e1937838
3
+ size 4996989624
model-00026-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c117a693afc4122fb3b725ab9a77ca74e4f866339f4159c6c967ea2caa85c089
3
+ size 4995528488
model-00027-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce51d3e24b81f4ed9cd837b51cf07fc1972dc14f397c56ca07b947f81da2f0a8
3
+ size 4995528528
model-00028-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:440cca97ac9b41f28a4b2deef2410036ee7ac74a52d4b77ce645c57592f45c1e
3
+ size 4995528856
model-00029-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c932ec9d7b8cc1bdc7b89fba9f98f8373d54f0b6583c376bbbf932279c8ba9a
3
+ size 4996989544
model-00030-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c1e81bd4ec1b3915c3028f70e0f43b2c0993327d2f40726052f609b01fd223e
3
+ size 4995528528
model-00031-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b83b1e65acaa9699993c2843f5947dcf8494f47e9921a591fd5cec64fe539577
3
+ size 4995528528
model-00032-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:123fc3da66ffd49f43964601958273d7c4c4b7e72607f4763b93dd7ee1f05cbc
3
+ size 4995528904
model-00033-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89a1ba22d405685d9e6f16ce58bc38755622b2460134b01bde5a2a27f92b4f89
3
+ size 4996989504
model-00034-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29e0b1e0fcd81f05bff0a0d5cbb3bdde1aa6afa6e32cd260a07e0710f8902a27
3
+ size 4995528528
model-00035-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef6a843dc62ae99db78afeb5e4676921013a23fcaa899bb56e9e5e24f5393fd2
3
+ size 4995528560
model-00036-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:325c7be21530a7fc43b9d325c4260ccada9efd0a24e974729543b1c6ead616e4
3
+ size 4995528920
model-00037-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab35c820136ff23cd165c8aa788fd5542b83198b8864c54fa90c82f042ae413f
3
+ size 4996989456
model-00038-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7180f8c53653f076486c64f80f3af9ecead629fd03954d2388fa3b3c6fd0c35c
3
+ size 4995528528
model-00039-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8c053bbbeed259a5da6d10c2010c0b39d7502dc79acea333f42d53d50aeb032
3
+ size 4995528600
model-00040-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a01f9c3838a6345d19007a9f3a4523345a1baa8e4ed68d1da7607c24de8ae59b
3
+ size 4995528920
model-00041-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97f644b8325b6e0383545a89beec27f06f5e6dce120377c93e4d0271a543678c
3
+ size 4996989408
model-00042-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c94fd2d3fcef7bed2dfd58d11e96cf4293699192e04000d6ded5fc8a26a73977
3
+ size 4995528528
model-00043-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60bebe8f9653f2dc504ef2b5b45ef51a158304ccae375093efffcd8ca16f6b62
3
+ size 4995528648
model-00044-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a96815b8384b871074ed25564ebf399f756f839de5b296b52195fc9c30f55ddd
3
+ size 4995528920
model-00045-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2dabf10837e7c240945a8dd3ae3ea21d5656205d350130d9e5d43a658e30102
3
+ size 4996989368
model-00046-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7783cdd823d28b6ede934214150f1498c3012eb0b4ef5df407be6d3eb285e670
3
+ size 4995528528
model-00047-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d09a5b9307ee2b2543ca418ab609e7061aac0d34d8c1776c3ea018eaf5a4fbf
3
+ size 4995528696
model-00048-of-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f71aa6b780ade9f22ad78253c7eabe1db7b8e27f5c79dbab6a1afc999f8a526
3
+ size 2088381456