{
  "auto_map": {
    "AutoFeatureExtractor": "feature_extraction_avhubert.AVHubertFeatureExtractor",
    "AutoProcessor": "processing_avhubert.AVHubertProcessor"
  },
  "feature_extractor_type": "AVHubertFeatureExtractor",
  "image_crop_size": 88,
  "landmark_indices": [
    5,
    411,
    199,
    187
  ],
  "max_sample_size": null,
  "min_detection_confidence": 0.5,
  "min_tracking_confidence": 0.5,
  "normalize": true,
  "processor_class": "AVHubertProcessor",
  "refine_landmarks": false,
  "sr": 16000,
  "stack_order_audio": 4,
  "static_image_mode": false,
  "transforms": [
    {
      "training": "True",
      "transforms_type": "ToImage"
    },
    {
      "size": "(88, 88)",
      "training": "True",
      "transforms_type": "CenterCrop"
    },
    {
      "dtype": "torch.float32",
      "scale": "True",
      "training": "True",
      "transforms_type": "ToDtype"
    },
    {
      "inplace": "False",
      "mean": "[0.421]",
      "std": "[0.165]",
      "training": "True",
      "transforms_type": "Normalize"
    }
  ]
}
|