Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +61 -0
- generation_config.json +10 -0
- latest +1 -0
- model-00001-of-00006.safetensors +3 -0
- model-00002-of-00006.safetensors +3 -0
- model-00003-of-00006.safetensors +3 -0
- model-00004-of-00006.safetensors +3 -0
- model-00005-of-00006.safetensors +3 -0
- model-00006-of-00006.safetensors +3 -0
- model.safetensors.index.json +0 -0
- rng_state_0.pth +3 -0
- rng_state_1.pth +3 -0
- rng_state_10.pth +3 -0
- rng_state_100.pth +3 -0
- rng_state_101.pth +3 -0
- rng_state_102.pth +3 -0
- rng_state_103.pth +3 -0
- rng_state_104.pth +3 -0
- rng_state_105.pth +3 -0
- rng_state_106.pth +3 -0
- rng_state_107.pth +3 -0
- rng_state_108.pth +3 -0
- rng_state_109.pth +3 -0
- rng_state_11.pth +3 -0
- rng_state_110.pth +3 -0
- rng_state_111.pth +3 -0
- rng_state_112.pth +3 -0
- rng_state_113.pth +3 -0
- rng_state_114.pth +3 -0
- rng_state_115.pth +3 -0
- rng_state_116.pth +3 -0
- rng_state_117.pth +3 -0
- rng_state_118.pth +3 -0
- rng_state_119.pth +3 -0
- rng_state_12.pth +3 -0
- rng_state_120.pth +3 -0
- rng_state_121.pth +3 -0
- rng_state_122.pth +3 -0
- rng_state_123.pth +3 -0
- rng_state_124.pth +3 -0
- rng_state_125.pth +3 -0
- rng_state_126.pth +3 -0
- rng_state_127.pth +3 -0
- rng_state_128.pth +3 -0
- rng_state_129.pth +3 -0
- rng_state_13.pth +3 -0
- rng_state_130.pth +3 -0
- rng_state_131.pth +3 -0
- rng_state_132.pth +3 -0
- rng_state_133.pth +3 -0
config.json
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/fsx_0/user/zhaojiang/models/llava-clip-gen-und-2",
|
3 |
+
"architectures": [
|
4 |
+
"LlavaLlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"freeze_mm_mlp_adapter": false,
|
15 |
+
"gen_hidden_size": 1792,
|
16 |
+
"gen_pooling": "early_pool2d_4",
|
17 |
+
"gen_projector_type": "mlp2x_gelu",
|
18 |
+
"gen_vision_tower": "eva-clip-E-14-plus",
|
19 |
+
"hidden_act": "silu",
|
20 |
+
"hidden_size": 4096,
|
21 |
+
"image_aspect_ratio": "square",
|
22 |
+
"initializer_range": 0.02,
|
23 |
+
"intermediate_size": 14336,
|
24 |
+
"max_position_embeddings": 131072,
|
25 |
+
"mlp_bias": false,
|
26 |
+
"mm_hidden_size": 1152,
|
27 |
+
"mm_patch_merge_type": "flat",
|
28 |
+
"mm_projector_lr": null,
|
29 |
+
"mm_projector_type": "mlp2x_gelu",
|
30 |
+
"mm_use_im_patch_token": false,
|
31 |
+
"mm_use_im_start_end": false,
|
32 |
+
"mm_vision_select_feature": "patch",
|
33 |
+
"mm_vision_select_layer": -2,
|
34 |
+
"mm_vision_tower": "google/siglip-so400m-patch14-384",
|
35 |
+
"model_type": "llava_llama",
|
36 |
+
"n_query": 64,
|
37 |
+
"num_attention_heads": 32,
|
38 |
+
"num_hidden_layers": 32,
|
39 |
+
"num_key_value_heads": 8,
|
40 |
+
"pad_token_id": 128256,
|
41 |
+
"pretraining_tp": 1,
|
42 |
+
"rms_norm_eps": 1e-05,
|
43 |
+
"rope_scaling": {
|
44 |
+
"factor": 8.0,
|
45 |
+
"high_freq_factor": 4.0,
|
46 |
+
"low_freq_factor": 1.0,
|
47 |
+
"original_max_position_embeddings": 8192,
|
48 |
+
"rope_type": "llama3"
|
49 |
+
},
|
50 |
+
"rope_theta": 500000.0,
|
51 |
+
"tie_word_embeddings": false,
|
52 |
+
"tokenizer_model_max_length": 2048,
|
53 |
+
"tokenizer_padding_side": "right",
|
54 |
+
"torch_dtype": "bfloat16",
|
55 |
+
"transformers_version": "4.43.1",
|
56 |
+
"tune_mm_mlp_adapter": false,
|
57 |
+
"use_cache": false,
|
58 |
+
"use_mm_proj": true,
|
59 |
+
"vision_tower_pretrained": null,
|
60 |
+
"vocab_size": 128260
|
61 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"transformers_version": "4.43.1"
|
10 |
+
}
|
latest
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
global_step41000
|
model-00001-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:239b6add0830f2e1e4c9515698172b8884be00dcfcc22bd50df99f61c40a5641
|
3 |
+
size 4976731440
|
model-00002-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c0c87fdcbde831157a4df42a479b985c7277854b4bd8e7bf4ed786eeb7a16a0
|
3 |
+
size 4999802720
|
model-00003-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63a88a22a688ee99d1abf2b7e4520516056a2f1e902747f2ed93de62707ebdd3
|
3 |
+
size 4915916176
|
model-00004-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0852b987b56e849ea85a42aa3c569851090afe8cfcf8dd12d585634ed6329063
|
3 |
+
size 4999640736
|
model-00005-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9676009c052cac264d63ce39ede976f95e079ee904b1eba2277fed16ab758f9
|
3 |
+
size 4783899064
|
model-00006-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:737096912d89174e59818ff3c5e0317ae2f4e6ae976463719aa145b2a09f4d72
|
3 |
+
size 1050706048
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:575119a228f98110923ffa2dedcb50e3317251b26054355d015e0b2240d566f2
|
3 |
+
size 15984
|
rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0728b56dab7abb5ef8a0d4bae3519c5767c97467bdd886d26bf19cc8599d0312
|
3 |
+
size 15984
|
rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:532d1ab071177c2e9d0cc3435d6314c1777a0356f9ce1a5d8f10fbe5f8fd8926
|
3 |
+
size 15997
|
rng_state_100.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fa975ad1ae1661ad3fad17a3236db26af34e8ef6d31163115c4ea9193f8cc9b
|
3 |
+
size 16010
|
rng_state_101.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1dd4d3adaf131e6bc615713b1b85352706739e9bd041e2f2453163158c76041
|
3 |
+
size 16010
|
rng_state_102.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd8d1031750457f476c119e61c92286e09098d6eb3a186beaeb238524b064f6c
|
3 |
+
size 16010
|
rng_state_103.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6eb1d2fb1d84fdc1d312f44402c52cbfa549a77a96f807f13cd33cf982bb6921
|
3 |
+
size 16010
|
rng_state_104.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56406f9b17c9e552e8472412f20edb77fefcfff7d40c5361900b1d44ae113b1e
|
3 |
+
size 16010
|
rng_state_105.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d99e4f2dafa6da591ecb28e6b27663b19be38cdffb64ea5103b9608ed013f2d5
|
3 |
+
size 16010
|
rng_state_106.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4396f2abc7146eaab891842bee3f3fca8861a4ca28dc287f50b28fb8bba1157d
|
3 |
+
size 16010
|
rng_state_107.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4df99104a39734765569cc6338ec86ce6587577b660b84f4e1c981a52b68ac7
|
3 |
+
size 16010
|
rng_state_108.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38500ce7f14d8cf9ed2af440919cd8d250391488cfb930ac10431753932298b6
|
3 |
+
size 16010
|
rng_state_109.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fbf960d9c47707308c58a88774c121140e3fde5a62b1d795c2a185544ce50f5
|
3 |
+
size 16010
|
rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a089513416d3ed447265187782ec1194ac2303155b941284463976c62bf3d9b
|
3 |
+
size 15997
|
rng_state_110.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fb01852b12e0be001519c78dcc2a41f254b84c77ce7cdb3d1d6ed16e0736c7d
|
3 |
+
size 16010
|
rng_state_111.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0f7d5868c459ecaa83cd25b056151a3171cc4177f83f66052cb2e84ce389064
|
3 |
+
size 16010
|
rng_state_112.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:498b797cba9e6a827502a14f7447f43350e3975a2e8f12b22fc0fa076b823c93
|
3 |
+
size 16010
|
rng_state_113.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ddf6538f7f6d2d4fad9224ea8c5146bb7f9b3f39c780b3caecf1155726a6c41
|
3 |
+
size 16010
|
rng_state_114.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acc943595efd95e8dca91b42b2543a2ca69a02be62b76327da2cdec1d8e606f3
|
3 |
+
size 16010
|
rng_state_115.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02494715083e15ad0b5344aeed6203e438a1e7cbe50657cfe755ed90376a883c
|
3 |
+
size 16010
|
rng_state_116.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:628cd5da4b7bf94c341d16092c6b9864b66775c192af33615e49c74686504386
|
3 |
+
size 16010
|
rng_state_117.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8849f23daa03e12c031d7954e658fc62707e033ec7204df54126bc8f2909e79
|
3 |
+
size 16010
|
rng_state_118.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fc01f47f0176a79e02ffd0049a4a436ef8189e7d57503817130add2aed9f84a
|
3 |
+
size 16010
|
rng_state_119.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f7208ad1ca7a9f2d64785f3b264a6f183c85145181ac12be6e17a1baeb7ec10
|
3 |
+
size 16010
|
rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a87db6b16c9956496c45bf5c81750dc2349e157e60e544e5d256bb957be1243
|
3 |
+
size 15997
|
rng_state_120.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43f14521187a9902a83c87350207be91c3ee42812ee0e92848f715ff933b91bf
|
3 |
+
size 16010
|
rng_state_121.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f01b8000da78f19cd38830be9b7012b7c402af04e8d5a46949b35ddabe345352
|
3 |
+
size 16010
|
rng_state_122.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be4fb5d3f179f7b8d1cc98c7f8d19a1048b074733adea33ef45c3759171ea4ea
|
3 |
+
size 16010
|
rng_state_123.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d0dab661e20f3369af9ccb2d6f749c24e406a62ec71d278394f4e1fe9095109
|
3 |
+
size 16010
|
rng_state_124.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0290e3295ebcaaebb42a70479bbec724bc19724d4082e5a2ca5e315eed776750
|
3 |
+
size 16010
|
rng_state_125.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35cbcddd7e8e4c53d1a4fa102aa056f49ffa3067ef648f5425f50e76e0ecd8f9
|
3 |
+
size 16010
|
rng_state_126.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c6263895a67c040d499ac194cc55d7a7db1088fdb871004833c6f04efef10a4
|
3 |
+
size 16010
|
rng_state_127.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8267d587b2ecc104da53614606d9fea8b1cee1f9879919cc411f658f1d085568
|
3 |
+
size 16010
|
rng_state_128.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fe9d1033254128c292e9fb051dbbbbf380c4b6e58b1e2a038b81a11fc83c886
|
3 |
+
size 16010
|
rng_state_129.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45f42e81714b374062f598a1c0bb6ff86f4843398405566c1e8fc9c81d6288f8
|
3 |
+
size 16010
|
rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36d5fe5d1b92643a3c3dd35cf2f0cbfa4a92599fe3ccbd8941395c1550f088aa
|
3 |
+
size 15997
|
rng_state_130.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddd2120819f0058690374e5ff3b0daf44e57cdbeabd399a644523028451a7e45
|
3 |
+
size 16010
|
rng_state_131.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a52298e871bcfe55f9ef6d3d6a1de4a2c5cd37ec216810cd297b2dfde5012bc
|
3 |
+
size 16010
|
rng_state_132.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a173ddc90d555a18cb3a412aa950b2c70e7b9e59874093676b39d2f809749cbd
|
3 |
+
size 16010
|
rng_state_133.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af6be4eed09303e45cd5743a710810b2a9a5a66e0ce1a942e15670162e71a994
|
3 |
+
size 16010
|