| { |
| "auto_map": { |
| "AutoProcessor": "processing_nvila.NVILAProcessor" |
| }, |
| "do_convert_rgb": null, |
| "do_normalize": true, |
| "do_rescale": true, |
| "do_resize": true, |
| "image_mean": [ |
| 0.5, |
| 0.5, |
| 0.5 |
| ], |
| "image_processor_type": "SiglipImageProcessor", |
| "image_std": [ |
| 0.5, |
| 0.5, |
| 0.5 |
| ], |
| "processor_class": "NVILAProcessor", |
| "resample": 3, |
| "rescale_factor": 0.00392156862745098, |
| "size": { |
| "height": 392, |
| "width": 392 |
| }, |
| "autogaze_model_id": "bfshi/AutoGaze", |
| "gazing_ratio_tile": 0.75, |
| "gazing_ratio_thumbnail": 0.75, |
| "task_loss_requirement_tile": 0.7, |
| "task_loss_requirement_thumbnail": 0.7, |
| "target_scales": [56, 112, 196, 392], |
| "target_patch_size": 16, |
| "num_video_frames": 8, |
| "max_tiles_video": 8, |
| "num_video_frames_thumbnail": 8, |
| "mm_projector_shuffle_num": 9, |
| "max_batch_size_autogaze": 32 |
| } |
|
|