{
  "auto_map": {
    "AutoImageProcessor": "image_processing_sfl.SFLImageProcessor",
    "AutoProcessor": "processing_videollama3_qwen3.Videollama3Qwen3Processor"
  },
  "chunk_length": 30,
  "dither": 0.0,
  "feature_extractor_type": "Qwen2AudioEncoderProcessor",
  "feature_size": 128,
  "hop_length": 160,
  "n_fft": 400,
  "n_samples": 480000,
  "nb_max_frames": 3000,
  "padding_side": "right",
  "padding_value": 0.0,
  "processor_class": "Videollama3Qwen3Processor",
  "return_attention_mask": true,
  "sampling_rate": 16000,
  "do_convert_rgb": true,
  "do_normalize": true,
  "do_rescale": true,
  "do_resize": true,
  "image_mean": [
    0.5,
    0.5,
    0.5
  ],
  "image_processor_type": "SFLImageProcessor",
  "image_std": [
    0.5,
    0.5,
    0.5
  ],
  "max_tokens": 10240,
  "min_tokens": 16,
  "patch_size": 14,
  "resample": 3,
  "rescale_factor": 0.00392156862745098
}