Create README.md
Browse files
README.md
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- pyannote
|
| 4 |
+
- audio
|
| 5 |
+
- voice-activity-detection
|
| 6 |
+
datasets:
|
| 7 |
+
- dihard
|
| 8 |
+
license: mit
|
| 9 |
+
inference: false
|
| 10 |
+
---
|
| 11 |
+
|
| 12 |
+
## Example pyannote-audio Voice Activity Detection model
|
| 13 |
+
|
| 14 |
+
### `pyannote.audio.models.segmentation.PyanNet`
|
| 15 |
+
|
| 16 |
+
♻️ Imported from https://github.com/pyannote/pyannote-audio-hub
|
| 17 |
+
|
| 18 |
+
This model was trained by @hbredin.
|
| 19 |
+
|
| 20 |
+
|
| 21 |
+
### Demo: How to use in pyannote-audio
|
| 22 |
+
|
| 23 |
+
```python
|
| 24 |
+
from pyannote.audio.core.inference import Inference
|
| 25 |
+
|
| 26 |
+
model = Inference('julien-c/voice-activity-detection', device='cuda')
|
| 27 |
+
model({
|
| 28 |
+
"audio": "TheBigBangTheory.wav"
|
| 29 |
+
})
|
| 30 |
+
```
|
| 31 |
+
|
| 32 |
+
### Citing pyannote-audio
|
| 33 |
+
|
| 34 |
+
```bibtex
|
| 35 |
+
@inproceedings{Bredin2020,
|
| 36 |
+
Title = {{pyannote.audio: neural building blocks for speaker diarization}},
|
| 37 |
+
Author = {{Bredin}, Herv{\'e} and {Yin}, Ruiqing and {Coria}, Juan Manuel and {Gelly}, Gregory and {Korshunov}, Pavel and {Lavechin}, Marvin and {Fustes}, Diego and {Titeux}, Hadrien and {Bouaziz}, Wassim and {Gill}, Marie-Philippe},
|
| 38 |
+
Booktitle = {ICASSP 2020, IEEE International Conference on Acoustics, Speech, and Signal Processing},
|
| 39 |
+
Address = {Barcelona, Spain},
|
| 40 |
+
Month = {May},
|
| 41 |
+
Year = {2020},
|
| 42 |
+
}
|
| 43 |
+
```
|
| 44 |
+
|
| 45 |
+
|
| 46 |
+
```bibtex
|
| 47 |
+
@inproceedings{Lavechin2020,
|
| 48 |
+
author = {Marvin Lavechin and Marie-Philippe Gill and Ruben Bousbib and Herv\'{e} Bredin and Leibny Paola Garcia-Perera},
|
| 49 |
+
title = {{End-to-end Domain-Adversarial Voice Activity Detection}},
|
| 50 |
+
year = {2020},
|
| 51 |
+
url = {https://arxiv.org/abs/1910.10655},
|
| 52 |
+
}
```
|
| 53 |
+
|