File size: 1,370 Bytes
2a5ac63
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
{
  "auto_map": {
    "AutoImageProcessor": "image_preprocessing_molmo.MolmoImageProcessor",
    "AutoProcessor": "preprocessing_molmo.MolmoProcessor"
  },
  "base_image_input_size": [
    336,
    336
  ],
  "crop_patches": 24,
  "crop_size": 336,
  "crop_window_patches": 16,
  "crop_window_size": 224,
  "do_convert_rgb": true,
  "do_normalize": true,
  "do_pad": true,
  "do_rescale": true,
  "do_resize": true,
  "do_split_into_crops": true,
  "image_column_token": "<im_col>",
  "image_end_token": "<im_end>",
  "image_mean": [
    0.48145466,
    0.4578275,
    0.40821073
  ],
  "image_padding_mask": true,
  "image_patch_size": 14,
  "image_patch_token": "<im_patch>",
  "image_processor_type": "MolmoImageProcessor",
  "image_start_token": "<im_start>",
  "image_std": [
    0.26862954,
    0.26130258,
    0.27577711
  ],
  "image_token_length_h": 12,
  "image_token_length_w": 12,
  "max_crops": 12,
  "max_num_crops": 12,
  "overlap_margins": [
    4,
    4
  ],
  "padding_mode": "constant",
  "padding_value": 1.0,
  "patches_per_image_height": 24,
  "patches_per_image_width": 24,
  "processor_class": "MolmoProcessor",
  "resample": 2,
  "rescale_factor": 0.00392156862745098,
  "size": {
    "height": 336,
    "width": 336
  },
  "tokens_per_image": 144,
  "tokens_per_image_height": 12,
  "tokens_per_image_width": 12,
  "total_margin_pixels": 112
}