CharlieFRuan
committed on
Commit
•
ede4506
1
Parent(s):
aa34bcf
Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +80 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"context_window_size": 131072,
|
15 |
+
"prefill_chunk_size": 2048,
|
16 |
+
"num_key_value_heads": 8,
|
17 |
+
"head_dim": 128,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"max_batch_size": 80
|
20 |
+
},
|
21 |
+
"vocab_size": 128256,
|
22 |
+
"context_window_size": 131072,
|
23 |
+
"sliding_window_size": -1,
|
24 |
+
"prefill_chunk_size": 2048,
|
25 |
+
"attention_sink_size": -1,
|
26 |
+
"tensor_parallel_shards": 1,
|
27 |
+
"temperature": 0.6,
|
28 |
+
"presence_penalty": 0.0,
|
29 |
+
"frequency_penalty": 0.0,
|
30 |
+
"repetition_penalty": 1.0,
|
31 |
+
"top_p": 0.9,
|
32 |
+
"tokenizer_files": [
|
33 |
+
"tokenizer.json",
|
34 |
+
"tokenizer_config.json"
|
35 |
+
],
|
36 |
+
"tokenizer_info": {
|
37 |
+
"token_postproc_method": "byte_level",
|
38 |
+
"prepend_space_in_encode": false,
|
39 |
+
"strip_space_in_decode": false
|
40 |
+
},
|
41 |
+
"conv_template": {
|
42 |
+
"name": "llama-3_1",
|
43 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
|
44 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
45 |
+
"system_prefix_token_ids": [
|
46 |
+
128000
|
47 |
+
],
|
48 |
+
"add_role_after_system_message": true,
|
49 |
+
"roles": {
|
50 |
+
"user": "<|start_header_id|>user",
|
51 |
+
"assistant": "<|start_header_id|>assistant"
|
52 |
+
},
|
53 |
+
"role_templates": {
|
54 |
+
"user": "{user_message}",
|
55 |
+
"assistant": "{assistant_message}",
|
56 |
+
"tool": "{tool_message}"
|
57 |
+
},
|
58 |
+
"messages": [],
|
59 |
+
"seps": [
|
60 |
+
"<|eot_id|>"
|
61 |
+
],
|
62 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
63 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
64 |
+
"stop_str": [],
|
65 |
+
"stop_token_ids": [
|
66 |
+
128001,
|
67 |
+
128008,
|
68 |
+
128009
|
69 |
+
],
|
70 |
+
"function_string": "",
|
71 |
+
"use_function_calling": false
|
72 |
+
},
|
73 |
+
"pad_token_id": 0,
|
74 |
+
"bos_token_id": 128000,
|
75 |
+
"eos_token_id": [
|
76 |
+
128001,
|
77 |
+
128008,
|
78 |
+
128009
|
79 |
+
]
|
80 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a702ce2a3bb10a354a832af235be6c94e01e18bdd93fc9bfafed035d28db3da4
|
3 |
+
size 262668288
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:507fd6047da32e799139c5a08b0f974c8671dd0128571fcc622617152b574985
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1d44e54c531ecf154226b410a0addc7e20755d1e58a07f21dd2b308a2e78569
|
3 |
+
size 33046528
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55e79d6f681ea0e32b1943714623d55949e22175c529083d9c165a0c71912b0e
|
3 |
+
size 58720256
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35fc7065303fe79a82caec95272856ff80f2543906355d94685cc97e2d5ed406
|
3 |
+
size 25174016
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd3cbfe6fe8a94bead2315a43280634f42086b5f66eaf79305feec74dd556d13
|
3 |
+
size 29360128
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0070bbbd6a91f5b36c787993f8a278de7eaef9051006a845af616d15fec7b92
|
3 |
+
size 58720256
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bedd47e32ffff14e7cac974ce857a36a659e94c107037e95e09d6bc6ce257e50
|
3 |
+
size 33046528
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d09e1a2ed348f86b2085a53682385ad88d9e1eb0341909272830e96ae7f9f96
|
3 |
+
size 58720256
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08c26adb8c1a561c3ced51cc5f3530d384ff6ce036ff7b92c34448ed0176f1d3
|
3 |
+
size 32505856
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2aeb3f09991d64f683455d5b0bea997813566dc89ae7b4e3bc7427f1254715b
|
3 |
+
size 9437184
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0775dda4aeea98208ad8dab51c70e1d728ca214d0e6dcc414a329a447262c11
|
3 |
+
size 29360128
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcfde7f6b3cbd22e4578e33eb3288cfb34b6cc9a61aabb91dd9bb3ebdcd064fe
|
3 |
+
size 58720256
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62aadcc83ffa149a3393cb5fb7296957da1dbb96b5809304ebbe662fa9fab67e
|
3 |
+
size 22036480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d90c89def84b8b985b3a60f5c5e0363345437543d9cc83b60aa5ea649b500343
|
3 |
+
size 29360128
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06669b4a3dab5ee9036ebf42f69432119d116cc1489f400d3e65b4272a6fef99
|
3 |
+
size 58720256
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee7ae7d554057bd264d3f192880ddf13dbdd10b7a522017a541ff70e286d3e76
|
3 |
+
size 27271168
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17ad18a1ec995151d6a9c42ca22553fcf453c4dedb86a999dd6e1c2125cffe1d
|
3 |
+
size 29360128
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65a9a667ebf342f936116d179a931c94cd3f5be01f5389467d45fd63cbe1cc11
|
3 |
+
size 30949376
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e3d7a1a16a356b3184f28889cb091fff11f766319087d90c59df5dc6578a091
|
3 |
+
size 58720256
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32a53926ed395eaea0209e115852f89bcc941794857f098d652f30ff48c4d522
|
3 |
+
size 32841728
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:303b8265ae466127673e4b941b7d16060abf163ef803d9905aedd05aceb92d7f
|
3 |
+
size 25174016
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:388fc1e4fead684a549f2e4c24fd07e1ab73637032deb7519668a807a954225d
|
3 |
+
size 29360128
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:647952e017f491576607db4c26135ee0d957f095ce5ca727e04c8b1067d4fff0
|
3 |
+
size 58720256
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:075d3be0e4c382ad5dcb158e23a54d0fa3f27de5bd35161314633a0206482066
|
3 |
+
size 33046528
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddf5df4995614cca80aa34573ed7f106464a881d3136d9e4210b9f77d04f5cc3
|
3 |
+
size 29360128
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7634cd664888c00b446423da1b05b23b09b2864ae3786d05fe4ff31f60cd0a85
|
3 |
+
size 58720256
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8937dd0b857ae2324e9f1d872b29b3d344b4cc0030b3617d1a8aae027c9f942
|
3 |
+
size 22036480
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:571ddf10381c3b190bd45f2aabf5d4d2f29c509e8300d424b89dc7b67169455b
|
3 |
+
size 29360128
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6d1e5dda992c2b2d739f4c468e5ea8c8d3a4299c4a956996566d2bcde7205ce
|
3 |
+
size 58720256
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfb16834df0c67ba4698e70df1b22ec792997b8fa6e13c4d4e57af42f4a0731e
|
3 |
+
size 27271168
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24db9f4de65eda45fc6f31dbf044b0d43ac2edd116dd270cf09a1ae32954576d
|
3 |
+
size 262668288
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3502be120c62bc2e01aa062de8f19d3ba419763b840e98ad0fb4ac3e60e6380
|
3 |
+
size 29360128
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bcf32b08072cfb1767d12ce1c2c1294cb5fb8895dc7d42be0712da8c64b545b
|
3 |
+
size 30949376
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d6f2794fd13eb69c73e6ea997c23550c824748772a3c1a026bc6757fe56eb90
|
3 |
+
size 58720256
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66a330c444f53a6be5c6cc0cfc511bd2cafbc58fe37ec6b83fb61719d74b2456
|
3 |
+
size 25174016
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67fc40b821f9f44785d9709d5d320d4de23dd8fbc9afdc8622bbd40f70bb0fea
|
3 |
+
size 29360128
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08960c28ed83e4dc702f124bc32d2e39fb5c1f1b9deb2ac3ec7d7facba4cd527
|
3 |
+
size 58720256
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab4d0ac972c72856ee0f6afd6edf071aa41be87253a517834191b0b3d081ae38
|
3 |
+
size 33046528
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7ee379f3f595ce06c6b832b7a6b3a494d05001265b70efe47ff7acd6345eb87
|
3 |
+
size 29360128
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85121c10ce2944a3db5834351e721b6fcf90fef46f135b6b7d1da93bb9775495
|
3 |
+
size 58720256
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:309ce35550499fcaa20d20f1c816c7f433ff6637eb05997d0c2499108920da58
|
3 |
+
size 22036480
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dca91ba58bcc470314014b4b954668b54b9a70c338528bff54acf0185e793ba4
|
3 |
+
size 32833536
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fd1d6c11f9f8510b115d9f045ca9f0b4e710e40a3a1089966056f236218007b
|
3 |
+
size 29360128
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6d9022a8403102a8354d5939c8a04622f8e4e2367bad723698a090833487352
|
3 |
+
size 58720256
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7416f5c0b19adecef69db329df822dd74cc789bf852f708c76f63a581d222a3
|
3 |
+
size 27271168
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:997c02fb965c16dae73f0013df60ea6be0dae6dc1a964d7481528f5f4e9db28c
|
3 |
+
size 29360128
|