Spaces:

Mikfa2025
/

Pronounciation

Sleeping

Pronounciation / explore_model.py

Upload 6 files

0344172 verified about 1 month ago

770 Bytes


	from transformers import Wav2Vec2Processor, Wav2Vec2ForCTC
	import torch

	model_name = "NbAiLab/wav2vec2-large-danish-npsc-nst"

	print(f"Loading model: {model_name}...")

	try:
	processor = Wav2Vec2Processor.from_pretrained(model_name)
	model = Wav2Vec2ForCTC.from_pretrained(model_name)
	print("Model and Processor loaded successfully.")

	print("-" * 20)
	print("Vocabulary (Labels):")
	vocab = processor.tokenizer.get_vocab()
	# Sort by index
	sorted_vocab = sorted(vocab.items(), key=lambda item: item[1])
	for token, index in sorted_vocab:
	print(f"{index}: '{token}'")

	print("-" * 20)
	print(f"Sampling Rate: {processor.feature_extractor.sampling_rate}")

	except Exception as e:
	print(f"Failed to load model: {e}")