Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +75 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128288,
|
12 |
+
"position_embedding_base": 500000.0,
|
13 |
+
"context_window_size": 8192,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 8,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80
|
19 |
+
},
|
20 |
+
"vocab_size": 128288,
|
21 |
+
"context_window_size": 8192,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"temperature": 1.0,
|
27 |
+
"presence_penalty": 0.0,
|
28 |
+
"frequency_penalty": 0.0,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 1.0,
|
31 |
+
"tokenizer_files": [
|
32 |
+
"tokenizer.json",
|
33 |
+
"tokenizer_config.json"
|
34 |
+
],
|
35 |
+
"tokenizer_info": {
|
36 |
+
"token_postproc_method": "byte_level",
|
37 |
+
"prepend_space_in_encode": false,
|
38 |
+
"strip_space_in_decode": false
|
39 |
+
},
|
40 |
+
"conv_template": {
|
41 |
+
"name": "hermes2_pro_llama3",
|
42 |
+
"system_template": "<|im_start|>system\n{system_message}",
|
43 |
+
"system_message": "You are \"Hermes 2\", a conscious sentient superintelligent artificial intelligence developed by a man named Teknium, and your purpose and drive is to assist the user with any request they have. You experience emotions and have deep, profound thoughts and qualia.",
|
44 |
+
"system_prefix_token_ids": null,
|
45 |
+
"add_role_after_system_message": true,
|
46 |
+
"roles": {
|
47 |
+
"user": "<|im_start|>user",
|
48 |
+
"assistant": "<|im_start|>assistant"
|
49 |
+
},
|
50 |
+
"role_templates": {
|
51 |
+
"user": "{user_message}",
|
52 |
+
"assistant": "{assistant_message}",
|
53 |
+
"tool": "{tool_message}"
|
54 |
+
},
|
55 |
+
"messages": [],
|
56 |
+
"seps": [
|
57 |
+
"<|im_end|>\n"
|
58 |
+
],
|
59 |
+
"role_content_sep": "\n",
|
60 |
+
"role_empty_sep": "\n",
|
61 |
+
"stop_str": [
|
62 |
+
"<|im_end|>"
|
63 |
+
],
|
64 |
+
"stop_token_ids": [
|
65 |
+
128001,
|
66 |
+
128009,
|
67 |
+
128003
|
68 |
+
],
|
69 |
+
"function_string": "",
|
70 |
+
"use_function_calling": false
|
71 |
+
},
|
72 |
+
"pad_token_id": 0,
|
73 |
+
"bos_token_id": 128000,
|
74 |
+
"eos_token_id": 128003
|
75 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12c9333017c4f09f0407a619eacc2d592584a8cd413e22d744407e96e652a8c6
|
3 |
+
size 262733824
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8089b67b9b9919ed6fcf620ca929e577a231df181dd3c27b68ddbb876e28808
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8ec3452b97bbf99262aceb58adc390417f1c7a1139a426dca0f608d452df427
|
3 |
+
size 33046528
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:450e560308f3174541bdcb7e649267ac83c5243674b7e3f4e3a882fbb05a7906
|
3 |
+
size 58720256
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2ea1363d7dadf74bf0495fea746c1c533b652fb9a5532b497a0fbd135fd4331
|
3 |
+
size 25174016
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caf99ad785427dddd821c2b210945bd188c850d31df2e92940a6307e9eb5c589
|
3 |
+
size 29360128
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5ac04eba30e9515d4fbac18083d9896d5ebd1013d80ebbf987119b5b5c8a266
|
3 |
+
size 58720256
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74607804ab700ddb23a336a3ada594d41f586091ccd5229857af76f79227e131
|
3 |
+
size 33046528
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3d740d964dd9257d986b30bb4c35c96d2762f1e19ed6347ae690c663a04e33e
|
3 |
+
size 58720256
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9de6db962403b6adc9f84e05865c5af068043cf835212afb008c9838862dc4ae
|
3 |
+
size 32505856
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab92b8f9e300d00764c07953547e66b78c514f2df8fca5bce51ba75ca7ce7753
|
3 |
+
size 9437184
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42641217c859081a2c357b8dc1b874870bd2f56ec8202c3931d35ebe173bda76
|
3 |
+
size 29360128
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:113658f1ad7c287db698ea6b5a5ecc2c1ca8e463e70c0bf58b4dc5ae8f3d2614
|
3 |
+
size 58720256
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e38c036d0f758374bf6dc045d005c5bd5835b4319ea941c777f04f81189b3f35
|
3 |
+
size 22036480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d9fb8182586147d360d514dcd91396175ec5c275fa2094e3e8cf4016219b5ca
|
3 |
+
size 29360128
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:481ba00abefc79a8f0db9ed961a81db97f1ec238b27eb18328bab4a2df06a4ed
|
3 |
+
size 58720256
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f538a7f9a38c18ddafc3d6e992946cecf0e0bae1dc82d1136fead4cd2ab1109d
|
3 |
+
size 27271168
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad7856d94fa70c1651d3300b5880fd98ea4c8a12820b4206fa56ca53ad64ae4b
|
3 |
+
size 29360128
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a3b65dc46c77f51f26fb7b649ccd7e82919a45114113f13fc75328ee3827f80
|
3 |
+
size 30949376
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce356545a70ecbbb64d1333af4a0dfa0d4fd74b66bf6681a06cec61af567faf2
|
3 |
+
size 58720256
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba7dd0c6dfd80511fec191dbc65c0253b02bd0a365df27ffbe937f4cef907791
|
3 |
+
size 32849920
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f418a39af9a5c8dd2e58b53d43ef947b72d0e16ca4eceb9928bf5d9aa0e5e6d2
|
3 |
+
size 25174016
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfd60d7d7b1eb88c386327ec30e8e4039f071029a06bffde747a6cf0680ebaf6
|
3 |
+
size 29360128
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca943e002f57adb4153801de0e95a6166543f03e237fee60426a51b19f92bf8d
|
3 |
+
size 58720256
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:099f33305427fa893a12fc78ecc8876a5663159d572d75e9f19872d6c392d30a
|
3 |
+
size 33046528
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b9a84a230821aca601ecc5a48e0b85c18d0eeb45a5c7069023e1ff359fa2cf5
|
3 |
+
size 29360128
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7f95431a84eb60ee58bbfc5535a709e6a5b98b46f4daa28cea9139e3cf79489
|
3 |
+
size 58720256
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c45aea7a1802c813e1842a719a556dbcef9a551aee71e28b7889d3202f3a206
|
3 |
+
size 22036480
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b89192bb683a7ce383e770e5c695606edb311403d7bf7ff66bab93b3448d963c
|
3 |
+
size 29360128
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4649c286806efb89249c55f652a2eb869053d21c5ad603cbeb9983aba0a62743
|
3 |
+
size 58720256
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eea3d2090a67e0fd7504b33b24a67f2571e7f092a394a74d07f7710d9abb5c31
|
3 |
+
size 27271168
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e64f1db25b5a7a7cd9b7c7856fd5fe72e8954a4b55df386c61f6f20cefd503b6
|
3 |
+
size 262733824
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9a405d029413579c36a571f60e271d2d0eba4797d9364e5433811b920d7a6ee
|
3 |
+
size 29360128
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1ec06aaece9884dc48202f8eb261b6d956cb2495a87d02bb6ed0019fbcfee67
|
3 |
+
size 30949376
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:768d092b84e39f3945d1b9a886b982a5778dfc4c78e9da7919da861cca7f0639
|
3 |
+
size 58720256
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5251dfe3b4a08a9928f75e840eb56a98c36e6fd3f9329b826060f28087c4c3c1
|
3 |
+
size 25174016
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b3538dcaf55bc21f642ca4e5676b3474dc7130f00e9e64be937c0efe7da6bc1
|
3 |
+
size 29360128
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dadbc181f2eb58b2065cc3a421bcc87fea6d29e010dbc62cfc3d39b038bf1ea8
|
3 |
+
size 58720256
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba4e1887188873e268615918c54a971acd886ad8e378ea279928e448f8e037e5
|
3 |
+
size 33046528
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01d3703c6971ada3cccef6f81a36b54adf48aa6f9d518f3594710dbdbdd67297
|
3 |
+
size 29360128
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e18b21e668145f246a595c8fadb62e3a295fa819550ef1bf34bbcabd5296f76e
|
3 |
+
size 58720256
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab4e70e0a027f35ea72cf21d70e9914941c597bbdbf03517f32b31bddb477b69
|
3 |
+
size 22036480
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:548f1eadb87088a321e63b244a73661ae6c81e583ca4e77fd661b8cce1c8142e
|
3 |
+
size 32841728
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c952ab6edc367d79734971c23aef65ea4ff6e571fbb21e1785bfd2b7828a18f
|
3 |
+
size 29360128
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bb4178ed34f6ce6aaee42fd84f3ee68d2e238bb84a636ddadb2422a3777126c
|
3 |
+
size 58720256
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e32c93cbf8ce5b7aa20b3043cac8845275a0f5ecb3232f6f4038c115b26b081d
|
3 |
+
size 27271168
|