Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +83 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,83 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"position_embedding_base": 500000.0,
|
13 |
+
"context_window_size": 8192,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 8,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80
|
19 |
+
},
|
20 |
+
"vocab_size": 128256,
|
21 |
+
"context_window_size": 8192,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"temperature": 0.6,
|
27 |
+
"presence_penalty": 0.0,
|
28 |
+
"frequency_penalty": 0.0,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 0.9,
|
31 |
+
"tokenizer_files": [
|
32 |
+
"tokenizer.json",
|
33 |
+
"tokenizer_config.json"
|
34 |
+
],
|
35 |
+
"tokenizer_info": {
|
36 |
+
"token_postproc_method": "byte_level",
|
37 |
+
"prepend_space_in_encode": false,
|
38 |
+
"strip_space_in_decode": false
|
39 |
+
},
|
40 |
+
"conv_template": {
|
41 |
+
"name": "llama-3",
|
42 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>\n",
|
43 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
44 |
+
"system_prefix_token_ids": [
|
45 |
+
128000
|
46 |
+
],
|
47 |
+
"add_role_after_system_message": true,
|
48 |
+
"roles": {
|
49 |
+
"user": "<|start_header_id|>user",
|
50 |
+
"assistant": "<|start_header_id|>assistant"
|
51 |
+
},
|
52 |
+
"role_templates": {
|
53 |
+
"user": "{user_message}",
|
54 |
+
"assistant": "{assistant_message}",
|
55 |
+
"tool": "{tool_message}"
|
56 |
+
},
|
57 |
+
"messages": [],
|
58 |
+
"seps": [
|
59 |
+
"<|eot_id|>"
|
60 |
+
],
|
61 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
62 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
63 |
+
"stop_str": [
|
64 |
+
"<|end_of_text|>",
|
65 |
+
"<|eot_id|>"
|
66 |
+
],
|
67 |
+
"stop_token_ids": [
|
68 |
+
128001,
|
69 |
+
128009
|
70 |
+
],
|
71 |
+
"function_string": "",
|
72 |
+
"use_function_calling": false
|
73 |
+
},
|
74 |
+
"pad_token_id": 0,
|
75 |
+
"bos_token_id": 128000,
|
76 |
+
"eos_token_id": [
|
77 |
+
128001,
|
78 |
+
128009
|
79 |
+
],
|
80 |
+
"mean_gen_len": 128,
|
81 |
+
"max_gen_len": 512,
|
82 |
+
"shift_fill_factor": 0.3
|
83 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9f235668b5d95068f789df61b90f587957396b2652948f46d875be35b8abe0d
|
3 |
+
size 262668288
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8697075c7ed95287ce3200558af0d7bdbfba8c6ad3d33d0eba24e3656475ae07
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65f29d51d96e394ea3b7da7a162b8f800798dd0655e6f93c389342fa09e02fd7
|
3 |
+
size 33046528
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d018e31cfb4e7eff5acb80bfe957d96a984839f3e3f826f3f8ac1d12c76fb25
|
3 |
+
size 58720256
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8736ae6a8f9a62008a99850b7d13b84d966cbc9b47bbdbddc26c406d2790686a
|
3 |
+
size 25174016
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23b0e6749c12447b6848f32ca657d4c70c3dd4da9200ddfb5f01b96638221bef
|
3 |
+
size 29360128
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e68d2b037b578364aeffa1c84d49acb683f0b1670883fa69e69935294e4c1358
|
3 |
+
size 58720256
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da0b8714effc74d2312cfd9ad41df9b781885326b66a5fd67f6453db37db4fb4
|
3 |
+
size 33046528
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5328a7d08c95f7bed4fb10e67e06df292018c41e43a1818802fc98fdf533a04e
|
3 |
+
size 58720256
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65207cd36333c80418bd017249224594c241c3b30aac1a18a595f903f8c489c9
|
3 |
+
size 32505856
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e970c1a904651ba06581e357a1bfa753101bab89b84e6bb0de7e44ce9efc3ebc
|
3 |
+
size 9437184
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47fb57e8ec2666db2d019d70b48ec7078f5880b49610321f85c11b02258a69db
|
3 |
+
size 29360128
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9813e94cc6ff515eddf33eb861c01516d6dc71ee478dba60d45d09543b5dfb0
|
3 |
+
size 58720256
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55bc8366f2cde77d04866bf1185f4c1e0291998565128cd06ad82b0d8d679b70
|
3 |
+
size 22036480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3a386bca3bd3e73a94364c7a77b852a3c4e73193ffbf12ddcb7d53406827687
|
3 |
+
size 29360128
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1a963a80d350e8b1efbbe8d8c31c72285581735e595c51459473cc582d6b48a
|
3 |
+
size 58720256
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5271e2135f6fba2c029c0b9efa3862827fe0d2b63aedd5db629304b0eaacfffd
|
3 |
+
size 27271168
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a70f8ff2d4804a77a46f7695cee72765c640e40368eac5be1f553c611431330
|
3 |
+
size 29360128
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9993f5fb04e7c0f14bf071d0adb96212eb061842f0a37d713c2bdaeb9ebf963
|
3 |
+
size 30949376
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4646de43c62c19ec63f673234e2dad3016d01bde518e44f59f3f2a1d39d607ef
|
3 |
+
size 58720256
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c40bb09ff2f604f8dd17712e574c10ab897aff66c437e716be1792209eb7229
|
3 |
+
size 32841728
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7992a42e2db8e699e6eeac87e4c597081e47391695cc614c1a3c25d22fb5fe9
|
3 |
+
size 25174016
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae7ce09657ea87844544abbbc281af56015a5f72ac32a512e7effbcb3b3c1b32
|
3 |
+
size 29360128
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d2802415dd3d0a9f622cd38a921a5672136a6292659859eeabeb4f5f1669c05
|
3 |
+
size 58720256
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e01e5b3d73b2b280f3f7cf0ae724b50f661d931d458c711212db30c895413d2f
|
3 |
+
size 33046528
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab56032ba4f2359ecef272454b56840fa86957bf011ffb5ce75198b5380cde69
|
3 |
+
size 29360128
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8d6112e0641eacf886732d563a060dab38986cf3e6172413a35a1189a67f1cf
|
3 |
+
size 58720256
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4eb5a2b03ce080dda25c64c42933f85c98b89a155659144497d47a0f3950127a
|
3 |
+
size 22036480
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0468b3ab5dde35bf8ef603ca43a593e702e61834d25d077c624a51123bac708f
|
3 |
+
size 29360128
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:007232352f3f26e01ff423f7d9e4de2096c214dcef87ace26cc1eeebb12a9e42
|
3 |
+
size 58720256
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:301a443d660266d8abe596f3567c806b0461a9d8637d261fb2037a77b51205e1
|
3 |
+
size 27271168
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63094c7b5530f553ac31b83fb1c45911643bf6a9f9a8da4b3439af66061ca9dc
|
3 |
+
size 262668288
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d1df10274ae63f992bbede03e14c8b7b3b359aada82e8f6646630dfeb226d7a
|
3 |
+
size 29360128
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36483734bca2fd5844cef2f18d807fc99ac2bfeee429bddde241c2cd3f75947e
|
3 |
+
size 30949376
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ba51e2ecb73ff2b9c7c5ad2b13f01d5d60a069d6a33358ac943d32f1128a925
|
3 |
+
size 58720256
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0084c3ecbba81070b900b65f718c8c8227bcd3cf7434bab0e11f84b23f0d0888
|
3 |
+
size 25174016
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4760b363d07765caec77497f0501259df8fa945ad70490998da29c774cdeb919
|
3 |
+
size 29360128
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ff44b10555929bf92c9b2a4366d2c046c2c0f3e317c691558bb78ea23ba6823
|
3 |
+
size 58720256
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bc1d901b1ce51f15d9b1120c967409ef3d311f3ef16706911e1494388459834
|
3 |
+
size 33046528
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f3df11a7ebd6071dd92790977017c37730bdd885510e6f7576cc890578161d3
|
3 |
+
size 29360128
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46c92cb41bba9d28aa7f3555209bc9c6a63a3c9b8f932e2d907f02788e82974e
|
3 |
+
size 58720256
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad1674f934b530056d00808c2cfe684a7c71beeebb4b3c0de61cdb11564f85dd
|
3 |
+
size 22036480
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92e2b9fd9e84658a91488199af395902921ce4a849f459cc3a24f00104f5b299
|
3 |
+
size 32833536
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8426596a9bd35038625cc37e5cbda6eb2729ca2169b9d5080de982a5e9a77d22
|
3 |
+
size 29360128
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac9dc9ab1afb53b538b141f5fc779e8887806832b984a855e8c328c7728285f3
|
3 |
+
size 58720256
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4d0919b4d55014abf5ef184daed1a2e8aaf4ea5aca94726ebde076a18dee4f1
|
3 |
+
size 27271168
|