fancyfeast committed on
Commit
ded47d2
•
1 Parent(s): e354e97

Update to latest training run; fix return

Browse files
app.py CHANGED
@@ -13,7 +13,7 @@ import os
13
  CLIP_PATH = "google/siglip-so400m-patch14-384"
14
  VLM_PROMPT = "A descriptive caption for this image:\n"
15
  MODEL_PATH = "meta-llama/Meta-Llama-3.1-8B"
16
- CHECKPOINT_PATH = Path("h2vtfhad")
17
  TITLE = "<h1><center>Foo</center></h1>"
18
  HF_TOKEN = os.environ.get("HF_TOKEN", None)
19
 
@@ -108,7 +108,7 @@ def stream_chat(input_image: Image.Image):
108
 
109
  caption = tokenizer.batch_decode(generate_ids, skip_special_tokens=False, clean_up_tokenization_spaces=False)[0]
110
 
111
- return [caption]
112
 
113
 
114
  with gr.Blocks() as demo:
 
13
  CLIP_PATH = "google/siglip-so400m-patch14-384"
14
  VLM_PROMPT = "A descriptive caption for this image:\n"
15
  MODEL_PATH = "meta-llama/Meta-Llama-3.1-8B"
16
+ CHECKPOINT_PATH = Path("wpkklhc6")
17
  TITLE = "<h1><center>Foo</center></h1>"
18
  HF_TOKEN = os.environ.get("HF_TOKEN", None)
19
 
 
108
 
109
  caption = tokenizer.batch_decode(generate_ids, skip_special_tokens=False, clean_up_tokenization_spaces=False)[0]
110
 
111
+ return caption.strip()
112
 
113
 
114
  with gr.Blocks() as demo:
{h2vtfhad → wpkklhc6}/config.yaml RENAMED
@@ -3,7 +3,7 @@ device_batch_size: 2
3
  batch_size: 256
4
  learning_rate: 0.001
5
  warmup_samples: 18000
6
- max_samples: 500000
7
  save_every: 50000
8
  test_every: 50000
9
  use_amp: true
@@ -19,7 +19,7 @@ adam_beta2: 0.999
19
  adam_eps: 1.0e-08
20
  adam_weight_decay: 0.0
21
  clip_grad_norm: 1.0
22
- dataset: fancyfeast/joy-captioning-20240720a
23
  clip_model: google/siglip-so400m-patch14-384
24
  text_model: meta-llama/Meta-Llama-3.1-8B
25
  resume: null
 
3
  batch_size: 256
4
  learning_rate: 0.001
5
  warmup_samples: 18000
6
+ max_samples: 600000
7
  save_every: 50000
8
  test_every: 50000
9
  use_amp: true
 
19
  adam_eps: 1.0e-08
20
  adam_weight_decay: 0.0
21
  clip_grad_norm: 1.0
22
+ dataset: fancyfeast/joy-captioning-20240729a
23
  clip_model: google/siglip-so400m-patch14-384
24
  text_model: meta-llama/Meta-Llama-3.1-8B
25
  resume: null
{h2vtfhad → wpkklhc6}/image_adapter.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b06f70ede9f072d92855f91458a3ec09fdc27a3fddf859a4b1381cccff730fea
3
  size 86018240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ebb1d1437bbb3264a6f25a896b25a7c7dd06c570c5de909dc2f19d3a5c5c110
3
  size 86018240