{ "architectures": [ "UpstreamFinetune" ], "classifier_output_dim": 6, "dropout": 0.2, "finetune_layers": 3, "hidden_dim": 64, "model_type": "wav2vec2-emodualhead", "num_layers": 3, "origin_upstream_url": "facebook/wav2vec2-base", "regressor_output_dim": 2, "torch_dtype": "float32", "transformers_version": "4.52.4", "upstream_model": "wav2vec2-base" }