Updated README
Browse files
README.md
CHANGED
|
@@ -50,7 +50,7 @@ audio_array, sr = librosa.load("path_to_audio.wav", sr=16000)
|
|
| 50 |
|
| 51 |
## Load model and feature extractor
|
| 52 |
model = AutoModelForAudioClassification.from_pretrained("alkiskoudounas/hubert-base-slurp")
|
| 53 |
-
feature_extractor = AutoFeatureExtractor.from_pretrained("
|
| 54 |
|
| 55 |
## Extract features
|
| 56 |
inputs = feature_extractor(audio_array.squeeze(), sampling_rate=feature_extractor.sampling_rate, padding=True, return_tensors="pt")
|
|
@@ -68,7 +68,7 @@ The following hyperparameters were used during training:
|
|
| 68 |
- seed: 42
|
| 69 |
- gradient_accumulation_steps: 4
|
| 70 |
- total_train_batch_size: 128
|
| 71 |
-
- optimizer:
|
| 72 |
- lr_scheduler_type: linear
|
| 73 |
- lr_scheduler_warmup_ratio: 0.1
|
| 74 |
- warmup_steps: 3000
|
|
@@ -77,7 +77,7 @@ The following hyperparameters were used during training:
|
|
| 77 |
## Framework versions
|
| 78 |
|
| 79 |
- Datasets 3.2.0
|
| 80 |
-
- Pytorch 2.1.2
|
| 81 |
- Tokenizers 0.20.3
|
| 82 |
- Transformers 4.45.2
|
| 83 |
|
|
|
|
| 50 |
|
| 51 |
## Load model and feature extractor
|
| 52 |
model = AutoModelForAudioClassification.from_pretrained("alkiskoudounas/hubert-base-slurp")
|
| 53 |
+
feature_extractor = AutoFeatureExtractor.from_pretrained("facebook/hubert-base-ls960")
|
| 54 |
|
| 55 |
## Extract features
|
| 56 |
inputs = feature_extractor(audio_array.squeeze(), sampling_rate=feature_extractor.sampling_rate, padding=True, return_tensors="pt")
|
|
|
|
| 68 |
- seed: 42
|
| 69 |
- gradient_accumulation_steps: 4
|
| 70 |
- total_train_batch_size: 128
|
| 71 |
+
- optimizer: AdamW with betas=(0.9,0.999) and epsilon=1e-08
|
| 72 |
- lr_scheduler_type: linear
|
| 73 |
- lr_scheduler_warmup_ratio: 0.1
|
| 74 |
- warmup_steps: 3000
|
|
|
|
| 77 |
## Framework versions
|
| 78 |
|
| 79 |
- Datasets 3.2.0
|
| 80 |
+
- Pytorch 2.1.2
|
| 81 |
- Tokenizers 0.20.3
|
| 82 |
- Transformers 4.45.2
|
| 83 |
|