Merge branch 'main' of https://huggingface.co/pyannote/segmentation into main
Browse files
README.md
CHANGED
@@ -21,7 +21,7 @@ inference: false
|
|
21 |
|
22 |

|
23 |
|
24 |
-
Model from *[End-to-end speaker segmentation for overlap-aware resegmentation](http://arxiv.org/abs/2104.04045)*,
|
25 |
by Hervé Bredin and Antoine Laurent.
|
26 |
|
27 |
Relies on pyannote.audio 2.0, currently in development: see [installation instructions](https://github.com/pyannote/pyannote-audio/tree/develop#installation).
|
@@ -100,7 +100,7 @@ AMI Mix-Headset | 0.552 | 0.311 | 0.131 | 0.180
|
|
100 |
DIHARD3 | 0.564 | 0.264 | 0.158 | 0.080
|
101 |
VoxConverse | 0.617 | 0.387 | 0.367 | 0.334
|
102 |
|
103 |
-
VBx
|
104 |
----------------|---------|----------|-------------------|-------------------
|
105 |
AMI Mix-Headset | 0.542 | 0.527 | 0.044 | 0.705
|
106 |
DIHARD3 | 0.592 | 0.489 | 0.163 | 0.182
|
@@ -123,7 +123,7 @@ Expected outputs (and VBx baseline) are also provided in the `/reproducible_rese
|
|
123 |
```bibtex
|
124 |
@inproceedings{Bredin2020,
|
125 |
Title = {{pyannote.audio: neural building blocks for speaker diarization}},
|
126 |
-
Author = {{Bredin}, Herv{
|
127 |
Booktitle = {ICASSP 2020, IEEE International Conference on Acoustics, Speech, and Signal Processing},
|
128 |
Address = {Barcelona, Spain},
|
129 |
Month = {May},
|
|
|
21 |
|
22 |

|
23 |
|
24 |
+
Model from *[End-to-end speaker segmentation for overlap-aware resegmentation](http://arxiv.org/abs/2104.04045)*,
|
25 |
by Hervé Bredin and Antoine Laurent.
|
26 |
|
27 |
Relies on pyannote.audio 2.0, currently in development: see [installation instructions](https://github.com/pyannote/pyannote-audio/tree/develop#installation).
|
|
|
100 |
DIHARD3 | 0.564 | 0.264 | 0.158 | 0.080
|
101 |
VoxConverse | 0.617 | 0.387 | 0.367 | 0.334
|
102 |
|
103 |
+
Resegmentation of VBx | `onset` | `offset` | `min_duration_on` | `min_duration_off`
|
104 |
----------------|---------|----------|-------------------|-------------------
|
105 |
AMI Mix-Headset | 0.542 | 0.527 | 0.044 | 0.705
|
106 |
DIHARD3 | 0.592 | 0.489 | 0.163 | 0.182
|
|
|
123 |
```bibtex
|
124 |
@inproceedings{Bredin2020,
|
125 |
Title = {{pyannote.audio: neural building blocks for speaker diarization}},
|
126 |
+
Author = {{Bredin}, Herv{\'e} and {Yin}, Ruiqing and {Coria}, Juan Manuel and {Gelly}, Gregory and {Korshunov}, Pavel and {Lavechin}, Marvin and {Fustes}, Diego and {Titeux}, Hadrien and {Bouaziz}, Wassim and {Gill}, Marie-Philippe},
|
127 |
Booktitle = {ICASSP 2020, IEEE International Conference on Acoustics, Speech, and Signal Processing},
|
128 |
Address = {Barcelona, Spain},
|
129 |
Month = {May},
|