CharlieFRuan
committed on
Commit
•
d7e1d18
1
Parent(s):
8844a7d
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- mlc-chat-config.json +83 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,83 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "gemma2",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4608,
|
7 |
+
"intermediate_size": 36864,
|
8 |
+
"attention_bias": false,
|
9 |
+
"num_attention_heads": 32,
|
10 |
+
"num_key_value_heads": 16,
|
11 |
+
"head_dim": 128,
|
12 |
+
"num_hidden_layers": 46,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"vocab_size": 256000,
|
15 |
+
"hidden_activation": "gelu_pytorch_tanh",
|
16 |
+
"position_embedding_base": 10000.0,
|
17 |
+
"context_window_size": 4096,
|
18 |
+
"prefill_chunk_size": 2048,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 80,
|
21 |
+
"attn_logit_softcapping": 50.0,
|
22 |
+
"final_logit_softcapping": 30.0,
|
23 |
+
"query_pre_attn_scalar": 144,
|
24 |
+
"sliding_window": 4096
|
25 |
+
},
|
26 |
+
"vocab_size": 256000,
|
27 |
+
"context_window_size": 4096,
|
28 |
+
"sliding_window_size": -1,
|
29 |
+
"prefill_chunk_size": 2048,
|
30 |
+
"attention_sink_size": -1,
|
31 |
+
"tensor_parallel_shards": 1,
|
32 |
+
"temperature": 1.0,
|
33 |
+
"presence_penalty": 0.0,
|
34 |
+
"frequency_penalty": 0.0,
|
35 |
+
"repetition_penalty": 1.0,
|
36 |
+
"top_p": 1.0,
|
37 |
+
"tokenizer_files": [
|
38 |
+
"tokenizer.model",
|
39 |
+
"tokenizer.json",
|
40 |
+
"tokenizer_config.json"
|
41 |
+
],
|
42 |
+
"tokenizer_info": {
|
43 |
+
"token_postproc_method": "byte_fallback",
|
44 |
+
"prepend_space_in_encode": false,
|
45 |
+
"strip_space_in_decode": false
|
46 |
+
},
|
47 |
+
"conv_template": {
|
48 |
+
"name": "gemma_instruction",
|
49 |
+
"system_template": "{system_message}",
|
50 |
+
"system_message": "",
|
51 |
+
"system_prefix_token_ids": [
|
52 |
+
2
|
53 |
+
],
|
54 |
+
"add_role_after_system_message": true,
|
55 |
+
"roles": {
|
56 |
+
"user": "<start_of_turn>user",
|
57 |
+
"assistant": "<start_of_turn>model"
|
58 |
+
},
|
59 |
+
"role_templates": {
|
60 |
+
"user": "{user_message}",
|
61 |
+
"assistant": "{assistant_message}",
|
62 |
+
"tool": "{tool_message}"
|
63 |
+
},
|
64 |
+
"messages": [],
|
65 |
+
"seps": [
|
66 |
+
"<end_of_turn>\n"
|
67 |
+
],
|
68 |
+
"role_content_sep": "\n",
|
69 |
+
"role_empty_sep": "\n",
|
70 |
+
"stop_str": [
|
71 |
+
"<end_of_turn>"
|
72 |
+
],
|
73 |
+
"stop_token_ids": [
|
74 |
+
1,
|
75 |
+
107
|
76 |
+
],
|
77 |
+
"function_string": "",
|
78 |
+
"use_function_calling": false
|
79 |
+
},
|
80 |
+
"pad_token_id": 0,
|
81 |
+
"bos_token_id": 2,
|
82 |
+
"eos_token_id": 1
|
83 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88ba5b3f5497ccfe0b22d6ad859d45a9dee692740cc60841039520cbae4861b0
|
3 |
+
size 589824000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a81dbd770fa4949994f9013bb9ffe49482a390ab1317cbd84129ce186693491a
|
3 |
+
size 73728000
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8cb8fc89f471905d2c5f91f0b203ff12da01d5971618bf13b5815911d857f15
|
3 |
+
size 25989120
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01d98a54c97db67a88c5616af9f915512f2514bf1dd69f81ef3cf0d108496c27
|
3 |
+
size 31924224
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11ee833f6e5b11da2cb0090e824805186288e2e40d951a5e6e5382de50620015
|
3 |
+
size 84934656
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7273c4bb91f92f260eb22b6351dbde7a92e76b662bc81addf0f2ce156daefee5
|
3 |
+
size 169869312
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beaa98086cdcb0dc66d40320c7d2882384a7d154f2c4dd4e024a020c2352fb51
|
3 |
+
size 21233664
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:927112c1a90b737a621a79931f85d4953cc3370ffd987c9fca0bffae66cd51a1
|
3 |
+
size 18874368
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e34f3d5b530927e8cd62bd3826499642f4c2d7e37145f6f0c3be3332fa3e82d
|
3 |
+
size 25989120
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4d9faaf23689992f4404fa0348f8cffb5d62f7bfb99a0fe6669a40cb50af3e1
|
3 |
+
size 84934656
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1eb5f6ebb49b10f729b6d19318d54e00dbb3e98e8ce7e5791ede4b2d7ed2ba93
|
3 |
+
size 169869312
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1d63587f07f527b3a7587d0d876e162ab0de72cc161f2449ff75013565b7ec9
|
3 |
+
size 21233664
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77ca5cbe8d9b534c994948bc70fdcd248935db5cf4028ba945820e8b97a49a97
|
3 |
+
size 18874368
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b45cb46ad952a6b34f385b2935bf891460b730cb261b7015778c2a31335227dc
|
3 |
+
size 31850496
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:482e48a3077de86e6e3ca511a1b7b7e22ebe66eb87a3d54f071e86b6a99d06ea
|
3 |
+
size 33067008
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:889258fa192789016dde1b320b1bc3f2954e91cd89a098336e75546837f927a8
|
3 |
+
size 84934656
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f00c9824d54a4a80b41d3f4f9a2a80e2801fabee1c4638d09af2c7951d42a5fa
|
3 |
+
size 33039360
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ccd2a002d50be13e5d03dad9997831d64fdc4bdb23c2f5afa70abb981c58963
|
3 |
+
size 84934656
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:609328b523a629ff353de7424ed1b5905210a6a7c73f18ae3faa3e57ba1ef8ca
|
3 |
+
size 169869312
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe8dd351613f592b4ef8522985bdbb14c22ac433930119ed356b1e8706c9d67c
|
3 |
+
size 21233664
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:512e5f39b3e926d005bab637ab471bfa3e6f7eaa42aa6aac28bb285d5432ac58
|
3 |
+
size 18874368
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce703cbe22eb917addd1b2c789c857237f56168edd7de1196f1189a3fe8bb51a
|
3 |
+
size 33094656
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b21f563bb7d7abe56ffaed3165a6359bcd8bc3ba705b8d0472e39b637930f51
|
3 |
+
size 84934656
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56232e123eefbe5ca697a8e9dffc36549e21a2b923c4c5d27d33329b1695d629
|
3 |
+
size 169869312
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df4515d65f7798113e5b13a846085a6a2f69b56ba1d8dba45c9b495091fd6867
|
3 |
+
size 84934656
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7570d783519b583ab488d51556f004703c97e7c19c659a41f92ec243089e5462
|
3 |
+
size 18874368
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5340934dd3abf76e8a72397eedf80cf4b09b6d8e25f64fa952745ec2ed32853
|
3 |
+
size 33067008
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5aa3e2358376700ac3d36aceb447b778bbed3459c664707b784ff1b8f396c2f5
|
3 |
+
size 84934656
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3d4a164a79f1bfbce13748270e8b1eee9689b52c39aeb261fb973cccb99fd9a
|
3 |
+
size 169869312
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:174e8cf2e9dd43ef1bf0ece984fb22bf259fa9d7705a80635412bea60d9fa528
|
3 |
+
size 21233664
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a704a630773a4cc5f74628818c91f3e729cc5eb81362b551c1c522236a300520
|
3 |
+
size 18874368
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9f1e583a01aa3dbaa5a931bb4d561c7b44e2ced322230c9df2459da4a147701
|
3 |
+
size 25989120
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ddb82f5c951757cf66c5f4ee6b79396880f1c522fe4e03f08b6db44e017cb95
|
3 |
+
size 84934656
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:858505a52b9d6c21a57074ed42ed21a8630c6124e966c3c8260d60205fc4bf06
|
3 |
+
size 169869312
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ebb6d2ffa41c3293e2da47177a6c93aa9a97e20c24e490deb58791acec68219
|
3 |
+
size 21233664
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5508e9eef5dc05d64b7c868d236fef4c1561d32f146eca06fe7e924715d7705b
|
3 |
+
size 84934656
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb52db2d624ad7f9445a0e90888a9117acf2573ab2ceae0438a3e5766beb7842
|
3 |
+
size 18874368
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9379749efecbf402f8a731d8263f580a315d1bb88f36663a4b3d34d75de22a1
|
3 |
+
size 33067008
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e44a2ed1206be94bcdd2987349e70fd04aa2f39ee9b25a0cfc238d05624031ec
|
3 |
+
size 84934656
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84dba5f6a01394207c377acc27403dc54a80df8960c8a9a19325d72bac499a1c
|
3 |
+
size 33039360
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7b783fa34dbf52ad93b9caa9f73b9c6311f4a1f267da9ad88d376daf2cc1671
|
3 |
+
size 169869312
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:063da113c47dc030085633520110848045597d149047b08df5fa6443690e74ba
|
3 |
+
size 84934656
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f94df20dabf5113b10f7cd698ff8ee8c0b24d9bd8b019043c3e6b75e83b2e86
|
3 |
+
size 31887360
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4ed261c7009da1a24d405afc4e71cea20f1996eeeb9b0f7bb62bc6668f8cd4c
|
3 |
+
size 169869312
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97d9bc2cf86945cf793e54f03a69e19ef6c49b127b8dec37fd976f45649d6013
|
3 |
+
size 18874368
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0653523f9d72f1678fea7a8fd112a6e6303939c87fe04ee56c14c9ab727f8b7
|
3 |
+
size 31878144
|