siddartha-abacus
committed on
Commit
•
e19fd5e
1
Parent(s):
fc2c5bb
Upload Qwen2ForCausalLM
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +27 -0
- generation_config.json +7 -0
- model-00001-of-00063.safetensors +3 -0
- model-00002-of-00063.safetensors +3 -0
- model-00003-of-00063.safetensors +3 -0
- model-00004-of-00063.safetensors +3 -0
- model-00005-of-00063.safetensors +3 -0
- model-00006-of-00063.safetensors +3 -0
- model-00007-of-00063.safetensors +3 -0
- model-00008-of-00063.safetensors +3 -0
- model-00009-of-00063.safetensors +3 -0
- model-00010-of-00063.safetensors +3 -0
- model-00011-of-00063.safetensors +3 -0
- model-00012-of-00063.safetensors +3 -0
- model-00013-of-00063.safetensors +3 -0
- model-00014-of-00063.safetensors +3 -0
- model-00015-of-00063.safetensors +3 -0
- model-00016-of-00063.safetensors +3 -0
- model-00017-of-00063.safetensors +3 -0
- model-00018-of-00063.safetensors +3 -0
- model-00019-of-00063.safetensors +3 -0
- model-00020-of-00063.safetensors +3 -0
- model-00021-of-00063.safetensors +3 -0
- model-00022-of-00063.safetensors +3 -0
- model-00023-of-00063.safetensors +3 -0
- model-00024-of-00063.safetensors +3 -0
- model-00025-of-00063.safetensors +3 -0
- model-00026-of-00063.safetensors +3 -0
- model-00027-of-00063.safetensors +3 -0
- model-00028-of-00063.safetensors +3 -0
- model-00029-of-00063.safetensors +3 -0
- model-00030-of-00063.safetensors +3 -0
- model-00031-of-00063.safetensors +3 -0
- model-00032-of-00063.safetensors +3 -0
- model-00033-of-00063.safetensors +3 -0
- model-00034-of-00063.safetensors +3 -0
- model-00035-of-00063.safetensors +3 -0
- model-00036-of-00063.safetensors +3 -0
- model-00037-of-00063.safetensors +3 -0
- model-00038-of-00063.safetensors +3 -0
- model-00039-of-00063.safetensors +3 -0
- model-00040-of-00063.safetensors +3 -0
- model-00041-of-00063.safetensors +3 -0
- model-00042-of-00063.safetensors +3 -0
- model-00043-of-00063.safetensors +3 -0
- model-00044-of-00063.safetensors +3 -0
- model-00045-of-00063.safetensors +3 -0
- model-00046-of-00063.safetensors +3 -0
- model-00047-of-00063.safetensors +3 -0
- model-00048-of-00063.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": ".",
|
3 |
+
"architectures": [
|
4 |
+
"Qwen2ForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"eos_token_id": 151645,
|
8 |
+
"hidden_act": "silu",
|
9 |
+
"hidden_size": 8192,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_size": 24576,
|
12 |
+
"max_position_embeddings": 32768,
|
13 |
+
"max_window_layers": 28,
|
14 |
+
"model_type": "qwen2",
|
15 |
+
"num_attention_heads": 64,
|
16 |
+
"num_hidden_layers": 80,
|
17 |
+
"num_key_value_heads": 64,
|
18 |
+
"rms_norm_eps": 1e-05,
|
19 |
+
"rope_theta": 1000000.0,
|
20 |
+
"sliding_window": 32768,
|
21 |
+
"tie_word_embeddings": false,
|
22 |
+
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.37.2",
|
24 |
+
"use_cache": false,
|
25 |
+
"use_sliding_window": false,
|
26 |
+
"vocab_size": 152064
|
27 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151644,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"max_new_tokens": 2048,
|
6 |
+
"transformers_version": "4.37.2"
|
7 |
+
}
|
model-00001-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acccd2158300774c94db715aa61c266a601ed864c2858e90b401cae7979a1c96
|
3 |
+
size 4982833288
|
model-00002-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e38f6f6e2b1686a69d0d8163e624b492dc8c1c974917f4210205708ec22b0c84
|
3 |
+
size 4563667072
|
model-00003-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63d9b7734f9876b2bdf108bca5ebb67b55c1043e642d9b7588a3b32fa8e0afa5
|
3 |
+
size 4295132632
|
model-00004-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d1433fb9524a406d4e7576b4e0bf3690b18d9e49d8e108c08c5c9d3693ed1b3
|
3 |
+
size 4295132632
|
model-00005-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f139ede515f5f6ba1c4ad82e4c00b1c5f01b46db92f964202861affe9a36c66
|
3 |
+
size 4832135288
|
model-00006-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b24e3f97958053b683b79fd0e73e148b3cfe6e948e43512f8db48e4a8e05f592
|
3 |
+
size 4832036656
|
model-00007-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6695940df7a810b72b7f93ac9a23970d015335d3a6a1f5db6e21d97cdecab59
|
3 |
+
size 4295132632
|
model-00008-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be660444edd459e04bb5bcbc46feb44670bcbf4ced2efb97e5b2d7fdac1e4e50
|
3 |
+
size 4832135288
|
model-00009-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea649dfb0fcdb6bf57d41d03ea88e48bfbc433f948cff20f653e16e6a3eb1700
|
3 |
+
size 4832036672
|
model-00010-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9bab17a643499fb5b44c9e5cf2b18d5b7d8d85df7f54d6e14cea4cdbf09ef47
|
3 |
+
size 4295132640
|
model-00011-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be9529e6d40a4e3da086b43c9b2e19da8f0774145cc949e24bf8621a358d2090
|
3 |
+
size 4832135312
|
model-00012-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f0307453a0553d8f78b8a72656e02ffdcbe176cb871f88cac9a6da6e70cd173
|
3 |
+
size 4832036672
|
model-00013-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9e389e0ad4cabaaf5edb18fc7d80d205f6fca5f560862a2292fb0c475a2d54a
|
3 |
+
size 4295132640
|
model-00014-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d82bd3a9ff4683856d8b9b260372a8696ed38704a8d145185e33fa893d6a52f2
|
3 |
+
size 4832135312
|
model-00015-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d03b79a2a5ee055c5aad168ca107e46b7681335785b6a76581145a1c7bf2271b
|
3 |
+
size 4832036672
|
model-00016-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63a13704103d3cda1f6707c9e52d2d2d6fd27acc39acb23852fcc5e01cc0dedd
|
3 |
+
size 4295132640
|
model-00017-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:918cdbd486b051df26d28fe4225baff3b4328472a5ce35d11f3a0ce6dabf8299
|
3 |
+
size 4832135312
|
model-00018-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23ed293bd1f5898e66acd50bcd4d03f1aea5b831cbe516132de2244dcbec4768
|
3 |
+
size 4832036672
|
model-00019-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1706fd1d4ac47182ed2c6409deedfcdb1bdfacaf464dacd7f1b800011ef3db8b
|
3 |
+
size 4295132640
|
model-00020-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4832f5514a2f22422f84552e60bc373d167137f97521e196360d0114ce579f4
|
3 |
+
size 4832135312
|
model-00021-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:383915a5323a3453c94f0dbf7861d75b92f485eac346a7f9049cf7da28d05ab2
|
3 |
+
size 4832036672
|
model-00022-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb885b65e06b4ad43c248d00e8a989477a2f1f7f13d79ac771c065572106846d
|
3 |
+
size 4295132640
|
model-00023-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a87a8522fb3a3ebb62a33f5ef73841bb45987e59029c93c7cd4e94e002f79e4
|
3 |
+
size 4832135312
|
model-00024-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62cc63c5523d24d4d165ee205c5d3c18c9d2f4bb7819faf682b5d3f28f3155ed
|
3 |
+
size 4832036672
|
model-00025-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd6d61314bfcec194cc6aede78337f0a898973b38c60d1ee1aee6e7ec9d86e4f
|
3 |
+
size 4295132640
|
model-00026-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6dbfca645db1dacf4a5736ca7ea9ea2803770c9141d9c21b779c2ca31a43896
|
3 |
+
size 4832135312
|
model-00027-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68e9768bdf01a0dddeb97bb058d34c474caebb3c10b188fbfaa2efef64223da7
|
3 |
+
size 4832036672
|
model-00028-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9caf90e7138c169cf0be804d8aac8c621d7e85f0f3f5c754fa5af8fd40af27c
|
3 |
+
size 4295132640
|
model-00029-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91dedf5693253877f2ad587ec81b5dc40781752327bbafcdae0ecc018ced2671
|
3 |
+
size 4832135312
|
model-00030-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:032d5d7e08f2240229b94ed0d99daa2124eedad8b9fcfe1d1a46dca675d1db28
|
3 |
+
size 4832036672
|
model-00031-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ca2a2be18f3235197fd941694c4fcf4092c6c725762e63291d604d8e0d2a991
|
3 |
+
size 4295132640
|
model-00032-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a483848832f6a31976c1acba2425e95b01a83bdd4755317a0ddafa2aea992b2a
|
3 |
+
size 4832135312
|
model-00033-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f04c029b52afed6d70ce5b635854eb716fc7c43cc8465c032ed2012bec1aff1
|
3 |
+
size 4832036672
|
model-00034-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c77cb928c54414331275fdb42fcd39a5d098b59e22d6b57ec0cbce4de2604cd
|
3 |
+
size 4295132640
|
model-00035-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0107caaac168e435a9b265c7594fddb33a8272db0ce4241b4861aa0f660b2040
|
3 |
+
size 4832135312
|
model-00036-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abc1bc4835ecc4e0f243d813dee7915fb9e91a26d792db62fa5cda53de6fdce4
|
3 |
+
size 4832036672
|
model-00037-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11f47bee7a2bb05b120a328057a21fbe6e69831ab53fceaaf3535c3d13ecb0f0
|
3 |
+
size 4295132640
|
model-00038-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9988436ccd2bec881b7652c63e9816e999e97c6bab048e9f4a6999fe75ba303b
|
3 |
+
size 4832135312
|
model-00039-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c40bf9ef0b51c99f13dc2a746b36f548a3848cc71f99ed3c0f47ac9936b9d0b
|
3 |
+
size 4832036672
|
model-00040-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbf1a7469d59e3a32cae58c2394f132c407e54a3f60065e2c055f98ea7ab9a04
|
3 |
+
size 4295132640
|
model-00041-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f8c9919d6148707ed3a49a8e51c99c2d24b47885fa5f9b6e91b86f443f5d421
|
3 |
+
size 4832135312
|
model-00042-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e967742dfab0c959e27d657947004d12d919427859ccaf8d1af425cbbdc16877
|
3 |
+
size 4832036672
|
model-00043-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db2c2592ba1390380c2836d6d7a1d06c7a9c245820751bc4ce16ddd858693da9
|
3 |
+
size 4295132640
|
model-00044-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdbd234aa0d32be71fb9cb61813be9ec606cefdff8dc5d891fffdc6a289b2321
|
3 |
+
size 4832135312
|
model-00045-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a623f9d940bad8d1345569dfd5302d531e30dceb99a713a686b9256532ff243e
|
3 |
+
size 4832036672
|
model-00046-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d6e1bca38153123fda6c0be181b0337d68155ae296ba617c365e500fe66c326
|
3 |
+
size 4295132640
|
model-00047-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc47f4ac851abf42703e5e9c0f812f9a25848478c15a1f08443bb83e91d60145
|
3 |
+
size 4832135312
|
model-00048-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e0c04190e90606beb8b0ad235454df11ab1050323c7a3e55c3c05fa76ffe99d
|
3 |
+
size 4832036672
|