Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +79 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "mixtral",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"position_embedding_base": 1000000.0,
|
13 |
+
"context_window_size": 32768,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 8,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80,
|
19 |
+
"num_local_experts": 8,
|
20 |
+
"num_experts_per_tok": 2
|
21 |
+
},
|
22 |
+
"vocab_size": 32000,
|
23 |
+
"context_window_size": 32768,
|
24 |
+
"sliding_window_size": -1,
|
25 |
+
"prefill_chunk_size": 2048,
|
26 |
+
"attention_sink_size": -1,
|
27 |
+
"tensor_parallel_shards": 1,
|
28 |
+
"temperature": 1.0,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 1.0,
|
33 |
+
"tokenizer_files": [
|
34 |
+
"tokenizer.model",
|
35 |
+
"tokenizer.json",
|
36 |
+
"tokenizer_config.json"
|
37 |
+
],
|
38 |
+
"tokenizer_info": {
|
39 |
+
"token_postproc_method": "byte_fallback",
|
40 |
+
"prepend_space_in_encode": true,
|
41 |
+
"strip_space_in_decode": true
|
42 |
+
},
|
43 |
+
"conv_template": {
|
44 |
+
"name": "mistral_default",
|
45 |
+
"system_template": "[INST] {system_message}",
|
46 |
+
"system_message": "Always assist with care, respect, and truth. Respond with utmost utility yet securely. Avoid harmful, unethical, prejudiced, or negative content. Ensure replies promote fairness and positivity.",
|
47 |
+
"system_prefix_token_ids": [
|
48 |
+
1
|
49 |
+
],
|
50 |
+
"add_role_after_system_message": false,
|
51 |
+
"roles": {
|
52 |
+
"user": "[INST]",
|
53 |
+
"assistant": "[/INST]",
|
54 |
+
"tool": "[INST]"
|
55 |
+
},
|
56 |
+
"role_templates": {
|
57 |
+
"user": "{user_message}",
|
58 |
+
"assistant": "{assistant_message}",
|
59 |
+
"tool": "{tool_message}"
|
60 |
+
},
|
61 |
+
"messages": [],
|
62 |
+
"seps": [
|
63 |
+
" "
|
64 |
+
],
|
65 |
+
"role_content_sep": " ",
|
66 |
+
"role_empty_sep": "",
|
67 |
+
"stop_str": [
|
68 |
+
"</s>"
|
69 |
+
],
|
70 |
+
"stop_token_ids": [
|
71 |
+
2
|
72 |
+
],
|
73 |
+
"function_string": "",
|
74 |
+
"use_function_calling": false
|
75 |
+
},
|
76 |
+
"pad_token_id": 0,
|
77 |
+
"bos_token_id": 1,
|
78 |
+
"eos_token_id": 2
|
79 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bac77a17e8e0ab177f3011efe61fddb3aaa5f287ad2fa44ce31aba838c30597
|
3 |
+
size 65536000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9980cdaafd38e1d27e95fed728d661d628dd71e91b4fdb613b36591027775219
|
3 |
+
size 469762048
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d039670c5ccb5aa943e1db95a649087b7f14dc035263dd969f359a25bced658
|
3 |
+
size 31891456
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a295fb80b2207f4e4cad8f93c5305bdefd281a142902a3b4c9d943e8f88728d1
|
3 |
+
size 58720256
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26c36a422597e1994a59a9b1ab8cd269b7314f66242a77fcc1cf10217b7e4280
|
3 |
+
size 234881024
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01cf5e49621ca42c3d9a5577c361a8d2d10aa1966ad81bd0d95ca8925874d6bb
|
3 |
+
size 29360128
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cca612d9b7ac36983d711f951c1abe575fbf6132fa9836421c5642d0ff552100
|
3 |
+
size 23658496
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5efa0d2793697de9294ffddc4b565db8e9b50e75aaf677ced4b5039bf48f5db
|
3 |
+
size 469762048
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:486762fc5b1bb9246685ae05cc43f39fcdbe49118375aed7bc62ef2be5f73436
|
3 |
+
size 58720256
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9f85a957cb250d37e08befae14f46317339833952604fa5fd5f52db729614c6
|
3 |
+
size 234881024
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5fa1ab4160e1666b8765a3b2c9d3fdffe000d152c47486d310518504f39438d
|
3 |
+
size 29360128
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b1ce2cb32d36331913b5496461c790773ec0330b8dede52f0c1ae8a2cf3da13
|
3 |
+
size 23674880
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d10c70eb0f93fba6a201d53035bfe879511975d02890ca6559ae421c45a60bc8
|
3 |
+
size 469762048
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:793c022d24bdc76e30e7ba48fb73cc49ab2aa3ff0e1f0b815b0ca3e9d02be7e0
|
3 |
+
size 469762048
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:947b50c9d362d339b32f05435d4f2269f9c98941cbfb8f1b47285dbfbc609ac3
|
3 |
+
size 58720256
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:634a569c8801545caac560ed1ed22162d377c604e10ff609c4d85debeb9a6e9a
|
3 |
+
size 234881024
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0b5f80c03ffdfa60495f268b28c8586d2b28f7ffb6da20a816321e1cc91f83c
|
3 |
+
size 29360128
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d20d34a6440315d09d00fafe1bdda580166409101467a3aebab3b4c779cbe063
|
3 |
+
size 23691264
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e209b13d279556f51e006c522356bc2618b63c84ba593a9eb4693b28b78e9af9
|
3 |
+
size 469762048
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4495fceb4e18a005aa46d2c76e2e5966411502c3af3ead16fa0c397d3fb319e
|
3 |
+
size 58720256
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6af5012e64703353cc0b4d85fe76955041e16f0afef45f05eb6de5eea5d888d9
|
3 |
+
size 234881024
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:018fd541f8527e54b44f5137cc115a1f62b1feb37426c6b4a8cce18c57f07fad
|
3 |
+
size 29360128
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:524e6563958ee67b4b1a741a168b77306f2de7eacfc735b39694bf791d630159
|
3 |
+
size 23658496
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51c136bbe648ed3aabd29ce971f1068ffe61aa412faf9592c5c7448b1c272ce1
|
3 |
+
size 469762048
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf473009279a505b9a7466a14bced629fd5c3f4955e7eb1f49ba92caa4ed71d9
|
3 |
+
size 58720256
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab27b2671e3bf45009f3a093971a395edbf4f2bcf8f540d5007148014fea09c6
|
3 |
+
size 58720256
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adc356789b9bcfa06753ea36cd0fbca02ab050e71654cac5f62ce1dfb51aed17
|
3 |
+
size 234881024
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48b827a45cf2e3b505fa74ce88e426e4afc124553d6f1c6aa516b41c212687cc
|
3 |
+
size 29360128
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c348e86124d35f117b16885e7373a9c442bea23ec5fbc6dc8ea66c68a674bfe
|
3 |
+
size 23691264
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6a5cc7c7ffd112e2e0df402e20fa7d5471d8a91a6acb4cdf7530019d4e25e53
|
3 |
+
size 469762048
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24e05b58c890c3a85cdc94c30025d96cfbe9f8c758ef9e7fad8db70374e5562f
|
3 |
+
size 58720256
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43f9ec2227973edc0e983c85e9666ad365e636ab65a9cf9402cbc52208e7b144
|
3 |
+
size 234881024
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78dd5e42fa8195f295a55204682be31491dba4396f5572834f35dbc92d21de0d
|
3 |
+
size 29360128
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8af3ed1df5ee3d3d59edeefec362fc919d5f257e2684c3ddb6a57da5b3ca93c1
|
3 |
+
size 23658496
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ddeb45a120c16387c5d59eee280ec2ccc056e7b714fc084af34599b9a75ec1e
|
3 |
+
size 469762048
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ff4850db89d02fab7fee99b60ad69c99150158b466aff2da5153e26f5b67869
|
3 |
+
size 234881024
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5135991d06c3020324037306edcbea41fd969fc37d0509843705aa672f11084a
|
3 |
+
size 58720256
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95e7eca8b4f540bd050893d3bcf9af32205ad22a05485ed3ea4118ba19b8d2e4
|
3 |
+
size 234881024
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6ff103ec0ed0c5671a775f2a201844647c6110298effaa640f4e2e124582bbe
|
3 |
+
size 29360128
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dc69c23bc7d41bd2a3f9408086cb7d9bdb469b32403620fb918bc4e00d15939
|
3 |
+
size 23674880
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c2d1225960e801531c85e89c87f33dffe3b2e54b958378a8ac3c3f1c1616d61
|
3 |
+
size 469762048
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37f1000bdfeaafaac1fe216e6f171b343a229f98f66ba282a8fd246dcf863d92
|
3 |
+
size 58720256
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d88492ea4d31d213bc1e67c67efeac020f4f7c5a3854cdaa71ec9201aea9147a
|
3 |
+
size 234881024
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f08a637391524b2f816df11511a63421c6d3fc7ac55351629e40324acac9574e
|
3 |
+
size 29360128
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fa2367c8eb4b1cd2442cbff83f5dbbf93f03811c45e0f74f92987b51a65ec7f
|
3 |
+
size 23691264
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef2e015e28dcb52a52b65f9c3b14a06753ddc26aaa05f6c04a2c6915ad9c18fe
|
3 |
+
size 23658496
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63d7c1c18c26a024ea45a193041b9ebae5cf8aca81c1590b4fb882cd87bd5c45
|
3 |
+
size 29360128
|