{ "chunk_length": 300, "crop_size": null, "data_format": "channels_first", "default_to_square": true, "device": null, "dither": 0.0, "do_center_crop": null, "do_convert_rgb": true, "do_normalize": true, "do_pad": null, "do_rescale": true, "do_resize": true, "do_sample_frames": false, "feature_extractor_type": "WhisperFeatureExtractor", "feature_size": 128, "fps": null, "hop_length": 160, "image_mean": [ 0.48145466, 0.4578275, 0.40821073 ], "image_std": [ 0.26862954, 0.26130258, 0.27577711 ], "input_data_format": null, "max_frames": 768, "max_pixels": 12845056, "merge_size": 2, "min_frames": 4, "min_pixels": 3136, "n_fft": 400, "n_samples": 4800000, "nb_max_frames": 30000, "num_frames": null, "padding_side": "right", "padding_value": 0.0, "patch_size": 14, "processor_class": "Qwen2_5OmniProcessor", "resample": 3, "rescale_factor": 0.00392156862745098, "return_attention_mask": true, "return_metadata": false, "sampling_rate": 16000, "size": { "longest_edge": 12845056, "shortest_edge": 3136 }, "size_divisor": null, "temporal_patch_size": 2, "video_metadata": null, "video_processor_type": "Qwen2VLVideoProcessor" }