CharlieFRuan committed on
Commit
d7e1d18
1 Parent(s): 8844a7d

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because the commit contains too many changes. See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
mlc-chat-config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "gemma2",
4
+ "quantization": "q4f32_1",
5
+ "model_config": {
6
+ "hidden_size": 4608,
7
+ "intermediate_size": 36864,
8
+ "attention_bias": false,
9
+ "num_attention_heads": 32,
10
+ "num_key_value_heads": 16,
11
+ "head_dim": 128,
12
+ "num_hidden_layers": 46,
13
+ "rms_norm_eps": 1e-06,
14
+ "vocab_size": 256000,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "position_embedding_base": 10000.0,
17
+ "context_window_size": 4096,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "max_batch_size": 80,
21
+ "attn_logit_softcapping": 50.0,
22
+ "final_logit_softcapping": 30.0,
23
+ "query_pre_attn_scalar": 144,
24
+ "sliding_window": 4096
25
+ },
26
+ "vocab_size": 256000,
27
+ "context_window_size": 4096,
28
+ "sliding_window_size": -1,
29
+ "prefill_chunk_size": 2048,
30
+ "attention_sink_size": -1,
31
+ "tensor_parallel_shards": 1,
32
+ "temperature": 1.0,
33
+ "presence_penalty": 0.0,
34
+ "frequency_penalty": 0.0,
35
+ "repetition_penalty": 1.0,
36
+ "top_p": 1.0,
37
+ "tokenizer_files": [
38
+ "tokenizer.model",
39
+ "tokenizer.json",
40
+ "tokenizer_config.json"
41
+ ],
42
+ "tokenizer_info": {
43
+ "token_postproc_method": "byte_fallback",
44
+ "prepend_space_in_encode": false,
45
+ "strip_space_in_decode": false
46
+ },
47
+ "conv_template": {
48
+ "name": "gemma_instruction",
49
+ "system_template": "{system_message}",
50
+ "system_message": "",
51
+ "system_prefix_token_ids": [
52
+ 2
53
+ ],
54
+ "add_role_after_system_message": true,
55
+ "roles": {
56
+ "user": "<start_of_turn>user",
57
+ "assistant": "<start_of_turn>model"
58
+ },
59
+ "role_templates": {
60
+ "user": "{user_message}",
61
+ "assistant": "{assistant_message}",
62
+ "tool": "{tool_message}"
63
+ },
64
+ "messages": [],
65
+ "seps": [
66
+ "<end_of_turn>\n"
67
+ ],
68
+ "role_content_sep": "\n",
69
+ "role_empty_sep": "\n",
70
+ "stop_str": [
71
+ "<end_of_turn>"
72
+ ],
73
+ "stop_token_ids": [
74
+ 1,
75
+ 107
76
+ ],
77
+ "function_string": "",
78
+ "use_function_calling": false
79
+ },
80
+ "pad_token_id": 0,
81
+ "bos_token_id": 2,
82
+ "eos_token_id": 1
83
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88ba5b3f5497ccfe0b22d6ad859d45a9dee692740cc60841039520cbae4861b0
3
+ size 589824000
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a81dbd770fa4949994f9013bb9ffe49482a390ab1317cbd84129ce186693491a
3
+ size 73728000
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8cb8fc89f471905d2c5f91f0b203ff12da01d5971618bf13b5815911d857f15
3
+ size 25989120
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01d98a54c97db67a88c5616af9f915512f2514bf1dd69f81ef3cf0d108496c27
3
+ size 31924224
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11ee833f6e5b11da2cb0090e824805186288e2e40d951a5e6e5382de50620015
3
+ size 84934656
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7273c4bb91f92f260eb22b6351dbde7a92e76b662bc81addf0f2ce156daefee5
3
+ size 169869312
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beaa98086cdcb0dc66d40320c7d2882384a7d154f2c4dd4e024a020c2352fb51
3
+ size 21233664
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:927112c1a90b737a621a79931f85d4953cc3370ffd987c9fca0bffae66cd51a1
3
+ size 18874368
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e34f3d5b530927e8cd62bd3826499642f4c2d7e37145f6f0c3be3332fa3e82d
3
+ size 25989120
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4d9faaf23689992f4404fa0348f8cffb5d62f7bfb99a0fe6669a40cb50af3e1
3
+ size 84934656
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eb5f6ebb49b10f729b6d19318d54e00dbb3e98e8ce7e5791ede4b2d7ed2ba93
3
+ size 169869312
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1d63587f07f527b3a7587d0d876e162ab0de72cc161f2449ff75013565b7ec9
3
+ size 21233664
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77ca5cbe8d9b534c994948bc70fdcd248935db5cf4028ba945820e8b97a49a97
3
+ size 18874368
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b45cb46ad952a6b34f385b2935bf891460b730cb261b7015778c2a31335227dc
3
+ size 31850496
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:482e48a3077de86e6e3ca511a1b7b7e22ebe66eb87a3d54f071e86b6a99d06ea
3
+ size 33067008
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:889258fa192789016dde1b320b1bc3f2954e91cd89a098336e75546837f927a8
3
+ size 84934656
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f00c9824d54a4a80b41d3f4f9a2a80e2801fabee1c4638d09af2c7951d42a5fa
3
+ size 33039360
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ccd2a002d50be13e5d03dad9997831d64fdc4bdb23c2f5afa70abb981c58963
3
+ size 84934656
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:609328b523a629ff353de7424ed1b5905210a6a7c73f18ae3faa3e57ba1ef8ca
3
+ size 169869312
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe8dd351613f592b4ef8522985bdbb14c22ac433930119ed356b1e8706c9d67c
3
+ size 21233664
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:512e5f39b3e926d005bab637ab471bfa3e6f7eaa42aa6aac28bb285d5432ac58
3
+ size 18874368
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce703cbe22eb917addd1b2c789c857237f56168edd7de1196f1189a3fe8bb51a
3
+ size 33094656
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b21f563bb7d7abe56ffaed3165a6359bcd8bc3ba705b8d0472e39b637930f51
3
+ size 84934656
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56232e123eefbe5ca697a8e9dffc36549e21a2b923c4c5d27d33329b1695d629
3
+ size 169869312
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df4515d65f7798113e5b13a846085a6a2f69b56ba1d8dba45c9b495091fd6867
3
+ size 84934656
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7570d783519b583ab488d51556f004703c97e7c19c659a41f92ec243089e5462
3
+ size 18874368
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5340934dd3abf76e8a72397eedf80cf4b09b6d8e25f64fa952745ec2ed32853
3
+ size 33067008
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5aa3e2358376700ac3d36aceb447b778bbed3459c664707b784ff1b8f396c2f5
3
+ size 84934656
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3d4a164a79f1bfbce13748270e8b1eee9689b52c39aeb261fb973cccb99fd9a
3
+ size 169869312
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:174e8cf2e9dd43ef1bf0ece984fb22bf259fa9d7705a80635412bea60d9fa528
3
+ size 21233664
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a704a630773a4cc5f74628818c91f3e729cc5eb81362b551c1c522236a300520
3
+ size 18874368
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9f1e583a01aa3dbaa5a931bb4d561c7b44e2ced322230c9df2459da4a147701
3
+ size 25989120
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ddb82f5c951757cf66c5f4ee6b79396880f1c522fe4e03f08b6db44e017cb95
3
+ size 84934656
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:858505a52b9d6c21a57074ed42ed21a8630c6124e966c3c8260d60205fc4bf06
3
+ size 169869312
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ebb6d2ffa41c3293e2da47177a6c93aa9a97e20c24e490deb58791acec68219
3
+ size 21233664
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5508e9eef5dc05d64b7c868d236fef4c1561d32f146eca06fe7e924715d7705b
3
+ size 84934656
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb52db2d624ad7f9445a0e90888a9117acf2573ab2ceae0438a3e5766beb7842
3
+ size 18874368
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9379749efecbf402f8a731d8263f580a315d1bb88f36663a4b3d34d75de22a1
3
+ size 33067008
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e44a2ed1206be94bcdd2987349e70fd04aa2f39ee9b25a0cfc238d05624031ec
3
+ size 84934656
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84dba5f6a01394207c377acc27403dc54a80df8960c8a9a19325d72bac499a1c
3
+ size 33039360
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7b783fa34dbf52ad93b9caa9f73b9c6311f4a1f267da9ad88d376daf2cc1671
3
+ size 169869312
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:063da113c47dc030085633520110848045597d149047b08df5fa6443690e74ba
3
+ size 84934656
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f94df20dabf5113b10f7cd698ff8ee8c0b24d9bd8b019043c3e6b75e83b2e86
3
+ size 31887360
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4ed261c7009da1a24d405afc4e71cea20f1996eeeb9b0f7bb62bc6668f8cd4c
3
+ size 169869312
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97d9bc2cf86945cf793e54f03a69e19ef6c49b127b8dec37fd976f45649d6013
3
+ size 18874368
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0653523f9d72f1678fea7a8fd112a6e6303939c87fe04ee56c14c9ab727f8b7
3
+ size 31878144