Upload decoder/decoder_config.json with huggingface_hub
Browse files
decoder/decoder_config.json
CHANGED
@@ -3,13 +3,13 @@
|
|
3 |
"decoder": {
|
4 |
"unets": [
|
5 |
{
|
6 |
-
"dim":
|
7 |
"cond_dim": 512,
|
8 |
"image_embed_dim": 1024,
|
9 |
"text_embed_dim": 1024,
|
10 |
"cond_on_text_encodings": true,
|
11 |
"channels": 3,
|
12 |
-
"dim_mults": [1, 2,
|
13 |
"num_resnet_blocks": 4,
|
14 |
"attn_heads": 8,
|
15 |
"attn_dim_head": 64,
|
@@ -33,9 +33,8 @@
|
|
33 |
},
|
34 |
"data": {
|
35 |
"webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion5b/laion2B-data/{}.tar -",
|
36 |
-
"img_embeddings_url": "s3://s-laion/vit-h-14-embeddings/img_emb/",
|
37 |
"num_workers": 6,
|
38 |
-
"batch_size":
|
39 |
"start_shard": 0,
|
40 |
"end_shard": 231349,
|
41 |
"shard_width": 6,
|
|
|
3 |
"decoder": {
|
4 |
"unets": [
|
5 |
{
|
6 |
+
"dim": 320,
|
7 |
"cond_dim": 512,
|
8 |
"image_embed_dim": 1024,
|
9 |
"text_embed_dim": 1024,
|
10 |
"cond_on_text_encodings": true,
|
11 |
"channels": 3,
|
12 |
+
"dim_mults": [1, 2, 3, 4],
|
13 |
"num_resnet_blocks": 4,
|
14 |
"attn_heads": 8,
|
15 |
"attn_dim_head": 64,
|
|
|
33 |
},
|
34 |
"data": {
|
35 |
"webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion5b/laion2B-data/{}.tar -",
|
|
|
36 |
"num_workers": 6,
|
37 |
+
"batch_size": 16,
|
38 |
"start_shard": 0,
|
39 |
"end_shard": 231349,
|
40 |
"shard_width": 6,
|