Upload 22 files (#1)
Browse files- Upload 22 files (ef5d074bb947a1e8d486681de3e613438303edf8)
Co-authored-by: Daniel Gu <dg845@users.noreply.huggingface.co>
- clip_image_processor/preprocessor_config.json +27 -0
- clip_tokenizer/tokenizer_config.json +1 -2
- image_encoder/config.json +1 -1
- model_index.json +5 -5
- scheduler/scheduler_config.json +3 -1
- text_decoder/config.json +1 -2
- text_decoder/diffusion_pytorch_model.bin +1 -1
- text_encoder/config.json +1 -2
- text_tokenizer/tokenizer_config.json +1 -2
- unet/config.json +1 -1
- unet/diffusion_pytorch_model.bin +2 -2
- vae/config.json +2 -2
- vae/diffusion_pytorch_model.bin +2 -2
clip_image_processor/preprocessor_config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"crop_size": {
|
3 |
+
"height": 32,
|
4 |
+
"width": 32
|
5 |
+
},
|
6 |
+
"do_center_crop": true,
|
7 |
+
"do_convert_rgb": true,
|
8 |
+
"do_normalize": true,
|
9 |
+
"do_rescale": true,
|
10 |
+
"do_resize": true,
|
11 |
+
"image_mean": [
|
12 |
+
0.48145466,
|
13 |
+
0.4578275,
|
14 |
+
0.40821073
|
15 |
+
],
|
16 |
+
"image_processor_type": "CLIPImageProcessor",
|
17 |
+
"image_std": [
|
18 |
+
0.26862954,
|
19 |
+
0.26130258,
|
20 |
+
0.27577711
|
21 |
+
],
|
22 |
+
"resample": 3,
|
23 |
+
"rescale_factor": 0.00392156862745098,
|
24 |
+
"size": {
|
25 |
+
"shortest_edge": 32
|
26 |
+
}
|
27 |
+
}
|
clip_tokenizer/tokenizer_config.json
CHANGED
@@ -8,6 +8,7 @@
|
|
8 |
"rstrip": false,
|
9 |
"single_word": false
|
10 |
},
|
|
|
11 |
"do_lower_case": true,
|
12 |
"eos_token": {
|
13 |
"__type": "AddedToken",
|
@@ -19,9 +20,7 @@
|
|
19 |
},
|
20 |
"errors": "replace",
|
21 |
"model_max_length": 77,
|
22 |
-
"name_or_path": "hf-internal-testing/tiny-random-clip",
|
23 |
"pad_token": "<|endoftext|>",
|
24 |
-
"special_tokens_map_file": "/home/lysandre/.cache/huggingface/transformers/18a566598f286c9139f88160c99f84eec492a26bd22738fa9cb44d5b7e0a5c76.cce1206abbad28826f000510f22f354e53e66a97f7c23745a7dfe27609cc07f5",
|
25 |
"tokenizer_class": "CLIPTokenizer",
|
26 |
"unk_token": {
|
27 |
"__type": "AddedToken",
|
|
|
8 |
"rstrip": false,
|
9 |
"single_word": false
|
10 |
},
|
11 |
+
"clean_up_tokenization_spaces": true,
|
12 |
"do_lower_case": true,
|
13 |
"eos_token": {
|
14 |
"__type": "AddedToken",
|
|
|
20 |
},
|
21 |
"errors": "replace",
|
22 |
"model_max_length": 77,
|
|
|
23 |
"pad_token": "<|endoftext|>",
|
|
|
24 |
"tokenizer_class": "CLIPTokenizer",
|
25 |
"unk_token": {
|
26 |
"__type": "AddedToken",
|
image_encoder/config.json
CHANGED
@@ -18,5 +18,5 @@
|
|
18 |
"patch_size": 2,
|
19 |
"projection_dim": 32,
|
20 |
"torch_dtype": "float32",
|
21 |
-
"transformers_version": "4.
|
22 |
}
|
|
|
18 |
"patch_size": 2,
|
19 |
"projection_dim": 32,
|
20 |
"torch_dtype": "float32",
|
21 |
+
"transformers_version": "4.29.1"
|
22 |
}
|
model_index.json
CHANGED
@@ -1,6 +1,10 @@
|
|
1 |
{
|
2 |
"_class_name": "UniDiffuserPipeline",
|
3 |
-
"_diffusers_version": "0.
|
|
|
|
|
|
|
|
|
4 |
"clip_tokenizer": [
|
5 |
"transformers",
|
6 |
"CLIPTokenizer"
|
@@ -9,10 +13,6 @@
|
|
9 |
"transformers",
|
10 |
"CLIPVisionModelWithProjection"
|
11 |
],
|
12 |
-
"image_processor": [
|
13 |
-
"transformers",
|
14 |
-
"CLIPImageProcessor"
|
15 |
-
],
|
16 |
"scheduler": [
|
17 |
"diffusers",
|
18 |
"DPMSolverMultistepScheduler"
|
|
|
1 |
{
|
2 |
"_class_name": "UniDiffuserPipeline",
|
3 |
+
"_diffusers_version": "0.21.0.dev0",
|
4 |
+
"clip_image_processor": [
|
5 |
+
"transformers",
|
6 |
+
"CLIPImageProcessor"
|
7 |
+
],
|
8 |
"clip_tokenizer": [
|
9 |
"transformers",
|
10 |
"CLIPTokenizer"
|
|
|
13 |
"transformers",
|
14 |
"CLIPVisionModelWithProjection"
|
15 |
],
|
|
|
|
|
|
|
|
|
16 |
"scheduler": [
|
17 |
"diffusers",
|
18 |
"DPMSolverMultistepScheduler"
|
scheduler/scheduler_config.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"_class_name": "DPMSolverMultistepScheduler",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"algorithm_type": "dpmsolver++",
|
5 |
"beta_end": 0.012,
|
6 |
"beta_schedule": "scaled_linear",
|
@@ -13,7 +13,9 @@
|
|
13 |
"sample_max_value": 1.0,
|
14 |
"solver_order": 3,
|
15 |
"solver_type": "midpoint",
|
|
|
16 |
"thresholding": false,
|
|
|
17 |
"trained_betas": null,
|
18 |
"use_karras_sigmas": false,
|
19 |
"variance_type": null
|
|
|
1 |
{
|
2 |
"_class_name": "DPMSolverMultistepScheduler",
|
3 |
+
"_diffusers_version": "0.21.0.dev0",
|
4 |
"algorithm_type": "dpmsolver++",
|
5 |
"beta_end": 0.012,
|
6 |
"beta_schedule": "scaled_linear",
|
|
|
13 |
"sample_max_value": 1.0,
|
14 |
"solver_order": 3,
|
15 |
"solver_type": "midpoint",
|
16 |
+
"steps_offset": 0,
|
17 |
"thresholding": false,
|
18 |
+
"timestep_spacing": "linspace",
|
19 |
"trained_betas": null,
|
20 |
"use_karras_sigmas": false,
|
21 |
"variance_type": null
|
text_decoder/config.json
CHANGED
@@ -1,7 +1,6 @@
|
|
1 |
{
|
2 |
"_class_name": "UniDiffuserTextDecoder",
|
3 |
-
"_diffusers_version": "0.
|
4 |
-
"_name_or_path": "/home/tamamo/scratch/unidiffuser_test/text_decoder",
|
5 |
"activation_function": "gelu",
|
6 |
"attn_pdrop": 0.1,
|
7 |
"embd_pdrop": 0.1,
|
|
|
1 |
{
|
2 |
"_class_name": "UniDiffuserTextDecoder",
|
3 |
+
"_diffusers_version": "0.21.0.dev0",
|
|
|
4 |
"activation_function": "gelu",
|
5 |
"attn_pdrop": 0.1,
|
6 |
"embd_pdrop": 0.1,
|
text_decoder/diffusion_pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5679611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45fc49f24560aab4103739b7d196548121f1a91f9ecaa603d6a97afb6bcc1bbc
|
3 |
size 5679611
|
text_encoder/config.json
CHANGED
@@ -4,7 +4,6 @@
|
|
4 |
],
|
5 |
"attention_dropout": 0.0,
|
6 |
"bos_token_id": 0,
|
7 |
-
"dropout": 0.0,
|
8 |
"eos_token_id": 2,
|
9 |
"hidden_act": "quick_gelu",
|
10 |
"hidden_size": 32,
|
@@ -19,6 +18,6 @@
|
|
19 |
"pad_token_id": 1,
|
20 |
"projection_dim": 512,
|
21 |
"torch_dtype": "float32",
|
22 |
-
"transformers_version": "4.
|
23 |
"vocab_size": 1000
|
24 |
}
|
|
|
4 |
],
|
5 |
"attention_dropout": 0.0,
|
6 |
"bos_token_id": 0,
|
|
|
7 |
"eos_token_id": 2,
|
8 |
"hidden_act": "quick_gelu",
|
9 |
"hidden_size": 32,
|
|
|
18 |
"pad_token_id": 1,
|
19 |
"projection_dim": 512,
|
20 |
"torch_dtype": "float32",
|
21 |
+
"transformers_version": "4.29.1",
|
22 |
"vocab_size": 1000
|
23 |
}
|
text_tokenizer/tokenizer_config.json
CHANGED
@@ -9,6 +9,7 @@
|
|
9 |
"rstrip": false,
|
10 |
"single_word": false
|
11 |
},
|
|
|
12 |
"eos_token": {
|
13 |
"__type": "AddedToken",
|
14 |
"content": "<|endoftext|>",
|
@@ -19,9 +20,7 @@
|
|
19 |
},
|
20 |
"errors": "replace",
|
21 |
"model_max_length": 512,
|
22 |
-
"name_or_path": "/home/tamamo/code/unidiffuser/models/new_gpt_tokenizer",
|
23 |
"pad_token": null,
|
24 |
-
"special_tokens_map_file": null,
|
25 |
"tokenizer_class": "GPT2Tokenizer",
|
26 |
"unk_token": {
|
27 |
"__type": "AddedToken",
|
|
|
9 |
"rstrip": false,
|
10 |
"single_word": false
|
11 |
},
|
12 |
+
"clean_up_tokenization_spaces": true,
|
13 |
"eos_token": {
|
14 |
"__type": "AddedToken",
|
15 |
"content": "<|endoftext|>",
|
|
|
20 |
},
|
21 |
"errors": "replace",
|
22 |
"model_max_length": 512,
|
|
|
23 |
"pad_token": null,
|
|
|
24 |
"tokenizer_class": "GPT2Tokenizer",
|
25 |
"unk_token": {
|
26 |
"__type": "AddedToken",
|
unet/config.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"_class_name": "UniDiffuserModel",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"activation_fn": "gelu",
|
5 |
"attention_bias": false,
|
6 |
"attention_head_dim": 8,
|
|
|
1 |
{
|
2 |
"_class_name": "UniDiffuserModel",
|
3 |
+
"_diffusers_version": "0.21.0.dev0",
|
4 |
"activation_fn": "gelu",
|
5 |
"attention_bias": false,
|
6 |
"attention_head_dim": 8,
|
unet/diffusion_pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff85fcccea0e13b2091802eb2f1fab9828cdb8580c346822c020a1c3765b1078
|
3 |
+
size 87531
|
vae/config.json
CHANGED
@@ -1,7 +1,6 @@
|
|
1 |
{
|
2 |
"_class_name": "AutoencoderKL",
|
3 |
-
"_diffusers_version": "0.
|
4 |
-
"_name_or_path": "/home/tamamo/scratch/unidiffuser_test/vae",
|
5 |
"act_fn": "silu",
|
6 |
"block_out_channels": [
|
7 |
32,
|
@@ -11,6 +10,7 @@
|
|
11 |
"DownEncoderBlock2D",
|
12 |
"DownEncoderBlock2D"
|
13 |
],
|
|
|
14 |
"in_channels": 3,
|
15 |
"latent_channels": 4,
|
16 |
"layers_per_block": 1,
|
|
|
1 |
{
|
2 |
"_class_name": "AutoencoderKL",
|
3 |
+
"_diffusers_version": "0.21.0.dev0",
|
|
|
4 |
"act_fn": "silu",
|
5 |
"block_out_channels": [
|
6 |
32,
|
|
|
10 |
"DownEncoderBlock2D",
|
11 |
"DownEncoderBlock2D"
|
12 |
],
|
13 |
+
"force_upcast": true,
|
14 |
"in_channels": 3,
|
15 |
"latent_channels": 4,
|
16 |
"layers_per_block": 1,
|
vae/diffusion_pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e84bb0d30f9de5f723541259119fa2702639a8c73465fe8263085739154eff9f
|
3 |
+
size 2681001
|