Upload autocap-full.yaml with huggingface_hub
Browse files- autocap-full.yaml +4 -2
autocap-full.yaml
CHANGED
@@ -47,6 +47,7 @@ model:
|
|
47 |
use_clap_embeds: true
|
48 |
meta_input: true
|
49 |
add_special_tokens: True # If not, then the metadata will start with Title:, Caption:, etc.
|
|
|
50 |
meta_keys: ['video_caption', 'title']
|
51 |
# meta_keys: ['video_caption', 'videollama_caption', 'title', 'description', 'subtitle', 'labels']
|
52 |
|
@@ -100,8 +101,8 @@ data_args:
|
|
100 |
data:
|
101 |
metadata_root: "../dataset_preperation/data/metadata/dataset_root.json"
|
102 |
train: ['32k_captioned_audiocaps', 'caption_audioset', 'wavcaps_audioset_strong', 'wavcaps_bbcsound', 'wavcaps_freesound', 'wavcaps_soundbible', 'clotho', 'fsd50k']
|
103 |
-
val: ['
|
104 |
-
test: ['
|
105 |
|
106 |
keys_synonyms:
|
107 |
gt_audio_caption:
|
@@ -110,6 +111,7 @@ data_args:
|
|
110 |
- gt_caption
|
111 |
- caption
|
112 |
- gt_audio_caption
|
|
|
113 |
- wavcaps_caption
|
114 |
tags:
|
115 |
- keywords
|
|
|
47 |
use_clap_embeds: true
|
48 |
meta_input: true
|
49 |
add_special_tokens: True # If not, then the metadata will start with Title:, Caption:, etc.
|
50 |
+
resize_token_embeds: True
|
51 |
meta_keys: ['video_caption', 'title']
|
52 |
# meta_keys: ['video_caption', 'videollama_caption', 'title', 'description', 'subtitle', 'labels']
|
53 |
|
|
|
101 |
data:
|
102 |
metadata_root: "../dataset_preperation/data/metadata/dataset_root.json"
|
103 |
train: ['32k_captioned_audiocaps', 'caption_audioset', 'wavcaps_audioset_strong', 'wavcaps_bbcsound', 'wavcaps_freesound', 'wavcaps_soundbible', 'clotho', 'fsd50k']
|
104 |
+
val: ['autocap']
|
105 |
+
test: ['autocap']
|
106 |
|
107 |
keys_synonyms:
|
108 |
gt_audio_caption:
|
|
|
111 |
- gt_caption
|
112 |
- caption
|
113 |
- gt_audio_caption
|
114 |
+
- autocap_caption
|
115 |
- wavcaps_caption
|
116 |
tags:
|
117 |
- keywords
|