v1

Files changed (4) hide show

OmniCodec.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:30b4850299bd00a00e71c01aa73cadb01776731d6e45a0699a9062f99d866b63
+size 627755403

Qwen3AuTEncoder/config.json ADDED Viewed

+{
+  "activation_dropout": 0,
+  "activation_function": "gelu",
+  "architectures": [
+    "Qwen3OmniMoeAudioEncoder"
+  ],
+  "attention_dropout": 0,
+  "conv_chunksize": 500,
+  "d_model": 1280,
+  "downsample_hidden_size": 480,
+  "dropout": 0,
+  "dtype": "bfloat16",
+  "encoder_attention_heads": 20,
+  "encoder_ffn_dim": 5120,
+  "encoder_layers": 32,
+  "initializer_range": 0.02,
+  "max_source_positions": 1500,
+  "model_type": "qwen3_omni_moe_audio_encoder",
+  "n_window": 50,
+  "n_window_infer": 800,
+  "num_hidden_layers": 32,
+  "num_mel_bins": 128,
+  "output_dim": 2048,
+  "scale_embedding": false,
+  "tf_legacy_loss": false,
+  "transformers_version": "4.57.0.dev0",
+  "use_bfloat16": false
+}

Qwen3AuTEncoder/model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:72229aa6fc359722c76c3627a56357e805f8c675a23487c0f827c0fc83e3f77a
+size 1295908432

Qwen3AuTEncoder/preprocessor_config.json ADDED Viewed

+{
+  "dither": 0.0,
+  "feature_extractor_type": "WhisperFeatureExtractor",
+  "feature_size": 128,
+  "hop_length": 160,
+  "image_mean": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "image_processor_type": "Qwen2VLImageProcessor",
+  "image_std": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "max_pixels": 12845056,
+  "merge_size": 2,
+  "min_pixels": 3136,
+  "n_fft": 400,
+  "n_samples": 4800000,
+  "nb_max_frames": 30000,
+  "padding_side": "right",
+  "padding_value": 0.0,
+  "patch_size": 16,
+  "processor_class": "Qwen3OmniMoeProcessor",
+  "return_attention_mask": true,
+  "sampling_rate": 16000,
+  "temporal_patch_size": 2
+}