File size: 1,370 Bytes
2a5ac63 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 |
{
"auto_map": {
"AutoImageProcessor": "image_preprocessing_molmo.MolmoImageProcessor",
"AutoProcessor": "preprocessing_molmo.MolmoProcessor"
},
"base_image_input_size": [
336,
336
],
"crop_patches": 24,
"crop_size": 336,
"crop_window_patches": 16,
"crop_window_size": 224,
"do_convert_rgb": true,
"do_normalize": true,
"do_pad": true,
"do_rescale": true,
"do_resize": true,
"do_split_into_crops": true,
"image_column_token": "<im_col>",
"image_end_token": "<im_end>",
"image_mean": [
0.48145466,
0.4578275,
0.40821073
],
"image_padding_mask": true,
"image_patch_size": 14,
"image_patch_token": "<im_patch>",
"image_processor_type": "MolmoImageProcessor",
"image_start_token": "<im_start>",
"image_std": [
0.26862954,
0.26130258,
0.27577711
],
"image_token_length_h": 12,
"image_token_length_w": 12,
"max_crops": 12,
"max_num_crops": 12,
"overlap_margins": [
4,
4
],
"padding_mode": "constant",
"padding_value": 1.0,
"patches_per_image_height": 24,
"patches_per_image_width": 24,
"processor_class": "MolmoProcessor",
"resample": 2,
"rescale_factor": 0.00392156862745098,
"size": {
"height": 336,
"width": 336
},
"tokens_per_image": 144,
"tokens_per_image_height": 12,
"tokens_per_image_width": 12,
"total_margin_pixels": 112
}
|