al8n committed on 22 days ago

Commit

8ecadc1

verified ·

1 Parent(s): ae53fc3

initial bundle: segmentation-3.0 + wespeaker_resnet34_lm (3 forms) + PLDA weights, with attribution

Browse files

Files changed (21) hide show

.gitattributes +1 -0
LICENSE +22 -0
LICENSE.APACHE-2.0 +201 -0
LICENSE.CC-BY-4.0 +52 -0
LICENSE.MIT +27 -0
README.md +210 -0
plda/eigenvectors_desc.bin +3 -0
plda/lda.bin +3 -0
plda/mean1.bin +3 -0
plda/mean2.bin +3 -0
plda/mu.bin +3 -0
plda/phi_desc.bin +3 -0
plda/plda.npz +3 -0
plda/psi.bin +3 -0
plda/tr.bin +3 -0
plda/xvec_transform.npz +3 -0
segmentation-3.0.onnx +3 -0
wespeaker_resnet34_lm.onnx +3 -0
wespeaker_resnet34_lm.onnx.data +3 -0
wespeaker_resnet34_lm.pt +3 -0
wespeaker_resnet34_lm_packed.onnx +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+wespeaker_resnet34_lm.onnx.data filter=lfs diff=lfs merge=lfs -text

LICENSE ADDED Viewed

	@@ -0,0 +1,22 @@

+This bundle redistributes model artifacts under three different upstream
+licenses. `LICENSE.MIT` and `LICENSE.APACHE-2.0` contain the full license
+texts; `LICENSE.CC-BY-4.0` contains the required attribution, a summary,
+and a link to the full CC-BY-4.0 legal code. Each artifact retains its
+upstream license; using the bundle obligates the user to comply with all three.
+  segmentation-3.0.onnx                   — MIT (Copyright © 2023 CNRS,
+                                            Hervé Bredin / pyannote.audio)
+  wespeaker_resnet34_lm.onnx (+ .data)    — Apache-2.0 (WeSpeaker / wenet-e2e)
+  wespeaker_resnet34_lm_packed.onnx       — Apache-2.0 (derivative of above:
+                                            same weights repacked into a
+                                            single file)
+  wespeaker_resnet34_lm.pt                — Apache-2.0 (TorchScript export)
+  plda/*                                  — CC-BY-4.0 (BUT Speech@FIT,
+                                            redistributed via pyannote/
+                                            speaker-diarization-community-1)
+CC-BY-4.0 attribution for plda/* (required by upstream):
+  PLDA model trained by BUT Speech@FIT (https://speech.fit.vut.cz/).
+  Integration of VBx in pyannote.audio by Jiangyu Han and Petr Pálka.
+See README.md for upstream sources and snapshot revisions.

LICENSE.APACHE-2.0 ADDED Viewed

	@@ -0,0 +1,201 @@

+                              Apache License
+                        Version 2.0, January 2004
+                     http://www.apache.org/licenses/
+TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+1. Definitions.
+   "License" shall mean the terms and conditions for use, reproduction,
+   and distribution as defined by Sections 1 through 9 of this document.
+   "Licensor" shall mean the copyright owner or entity authorized by
+   the copyright owner that is granting the License.
+   "Legal Entity" shall mean the union of the acting entity and all
+   other entities that control, are controlled by, or are under common
+   control with that entity. For the purposes of this definition,
+   "control" means (i) the power, direct or indirect, to cause the
+   direction or management of such entity, whether by contract or
+   otherwise, or (ii) ownership of fifty percent (50%) or more of the
+   outstanding shares, or (iii) beneficial ownership of such entity.
+   "You" (or "Your") shall mean an individual or Legal Entity
+   exercising permissions granted by this License.
+   "Source" form shall mean the preferred form for making modifications,
+   including but not limited to software source code, documentation
+   source, and configuration files.
+   "Object" form shall mean any form resulting from mechanical
+   transformation or translation of a Source form, including but
+   not limited to compiled object code, generated documentation,
+   and conversions to other media types.
+   "Work" shall mean the work of authorship, whether in Source or
+   Object form, made available under the License, as indicated by a
+   copyright notice that is included in or attached to the work
+   (an example is provided in the Appendix below).
+   "Derivative Works" shall mean any work, whether in Source or Object
+   form, that is based on (or derived from) the Work and for which the
+   editorial revisions, annotations, elaborations, or other modifications
+   represent, as a whole, an original work of authorship. For the purposes
+   of this License, Derivative Works shall not include works that remain
+   separable from, or merely link (or bind by name) to the interfaces of,
+   the Work and Derivative Works thereof.
+   "Contribution" shall mean any work of authorship, including
+   the original version of the Work and any modifications or additions
+   to that Work or Derivative Works thereof, that is intentionally
+   submitted to Licensor for inclusion in the Work by the copyright owner
+   or by an individual or Legal Entity authorized to submit on behalf of
+   the copyright owner. For the purposes of this definition, "submitted"
+   means any form of electronic, verbal, or written communication sent
+   to the Licensor or its representatives, including but not limited to
+   communication on electronic mailing lists, source code control systems,
+   and issue tracking systems that are managed by, or on behalf of, the
+   Licensor for the purpose of discussing and improving the Work, but
+   excluding communication that is conspicuously marked or otherwise
+   designated in writing by the copyright owner as "Not a Contribution."
+   "Contributor" shall mean Licensor and any individual or Legal Entity
+   on behalf of whom a Contribution has been received by Licensor and
+   subsequently incorporated within the Work.
+2. Grant of Copyright License. Subject to the terms and conditions of
+   this License, each Contributor hereby grants to You a perpetual,
+   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+   copyright license to reproduce, prepare Derivative Works of,
+   publicly display, publicly perform, sublicense, and distribute the
+   Work and such Derivative Works in Source or Object form.
+3. Grant of Patent License. Subject to the terms and conditions of
+   this License, each Contributor hereby grants to You a perpetual,
+   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+   (except as stated in this section) patent license to make, have made,
+   use, offer to sell, sell, import, and otherwise transfer the Work,
+   where such license applies only to those patent claims licensable
+   by such Contributor that are necessarily infringed by their
+   Contribution(s) alone or by combination of their Contribution(s)
+   with the Work to which such Contribution(s) was submitted. If You
+   institute patent litigation against any entity (including a
+   cross-claim or counterclaim in a lawsuit) alleging that the Work
+   or a Contribution incorporated within the Work constitutes direct
+   or contributory patent infringement, then any patent licenses
+   granted to You under this License for that Work shall terminate
+   as of the date such litigation is filed.
+4. Redistribution. You may reproduce and distribute copies of the
+   Work or Derivative Works thereof in any medium, with or without
+   modifications, and in Source or Object form, provided that You
+   meet the following conditions:
+   (a) You must give any other recipients of the Work or
+       Derivative Works a copy of this License; and
+   (b) You must cause any modified files to carry prominent notices
+       stating that You changed the files; and
+   (c) You must retain, in the Source form of any Derivative Works
+       that You distribute, all copyright, patent, trademark, and
+       attribution notices from the Source form of the Work,
+       excluding those notices that do not pertain to any part of
+       the Derivative Works; and
+   (d) If the Work includes a "NOTICE" text file as part of its
+       distribution, then any Derivative Works that You distribute must
+       include a readable copy of the attribution notices contained
+       within such NOTICE file, excluding those notices that do not
+       pertain to any part of the Derivative Works, in at least one
+       of the following places: within a NOTICE text file distributed
+       as part of the Derivative Works; within the Source form or
+       documentation, if provided along with the Derivative Works; or,
+       within a display generated by the Derivative Works, if and
+       wherever such third-party notices normally appear. The contents
+       of the NOTICE file are for informational purposes only and
+       do not modify the License. You may add Your own attribution
+       notices within Derivative Works that You distribute, alongside
+       or as an addendum to the NOTICE text from the Work, provided
+       that such additional attribution notices cannot be construed
+       as modifying the License.
+   You may add Your own copyright statement to Your modifications and
+   may provide additional or different license terms and conditions
+   for use, reproduction, or distribution of Your modifications, or
+   for any such Derivative Works as a whole, provided Your use,
+   reproduction, and distribution of the Work otherwise complies with
+   the conditions stated in this License.
+5. Submission of Contributions. Unless You explicitly state otherwise,
+   any Contribution intentionally submitted for inclusion in the Work
+   by You to the Licensor shall be under the terms and conditions of
+   this License, without any additional terms or conditions.
+   Notwithstanding the above, nothing herein shall supersede or modify
+   the terms of any separate license agreement you may have executed
+   with Licensor regarding such Contributions.
+6. Trademarks. This License does not grant permission to use the trade
+   names, trademarks, service marks, or product names of the Licensor,
+   except as required for reasonable and customary use in describing the
+   origin of the Work and reproducing the content of the NOTICE file.
+7. Disclaimer of Warranty. Unless required by applicable law or
+   agreed to in writing, Licensor provides the Work (and each
+   Contributor provides its Contributions) on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+   implied, including, without limitation, any warranties or conditions
+   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+   PARTICULAR PURPOSE. You are solely responsible for determining the
+   appropriateness of using or redistributing the Work and assume any
+   risks associated with Your exercise of permissions under this License.
+8. Limitation of Liability. In no event and under no legal theory,
+   whether in tort (including negligence), contract, or otherwise,
+   unless required by applicable law (such as deliberate and grossly
+   negligent acts) or agreed to in writing, shall any Contributor be
+   liable to You for damages, including any direct, indirect, special,
+   incidental, or consequential damages of any character arising as a
+   result of this License or out of the use or inability to use the
+   Work (including but not limited to damages for loss of goodwill,
+   work stoppage, computer failure or malfunction, or any and all
+   other commercial damages or losses), even if such Contributor
+   has been advised of the possibility of such damages.
+9. Accepting Warranty or Additional Liability. While redistributing
+   the Work or Derivative Works thereof, You may choose to offer,
+   and charge a fee for, acceptance of support, warranty, indemnity,
+   or other liability obligations and/or rights consistent with this
+   License. However, in accepting such obligations, You may act only
+   on Your own behalf and on Your sole responsibility, not on behalf
+   of any other Contributor, and only if You agree to indemnify,
+   defend, and hold each Contributor harmless for any liability
+   incurred by, or claims asserted against, such Contributor by reason
+   of your accepting any such warranty or additional liability.
+END OF TERMS AND CONDITIONS
+APPENDIX: How to apply the Apache License to your work.
+   To apply the Apache License to your work, attach the following
+   boilerplate notice, with the fields enclosed by brackets "[]"
+   replaced with your own identifying information. (Don't include
+   the brackets!)  The text should be enclosed in the appropriate
+   comment syntax for the file format. We also recommend that a
+   file or class name and description of purpose be included on the
+   same "printed page" as the copyright notice for easier
+   identification within third-party archives.
+Copyright [yyyy] [name of copyright owner]
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+	http://www.apache.org/licenses/LICENSE-2.0
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.

LICENSE.CC-BY-4.0 ADDED Viewed

	@@ -0,0 +1,52 @@

+Creative Commons Attribution 4.0 International (CC-BY-4.0)
+This CC-BY-4.0 license applies to:
+  plda/eigenvectors_desc.bin
+  plda/lda.bin
+  plda/mean1.bin
+  plda/mean2.bin
+  plda/mu.bin
+  plda/phi_desc.bin
+  plda/psi.bin
+  plda/tr.bin
+  plda/plda.npz
+  plda/xvec_transform.npz
+Required attribution (per upstream `plda/README.md` in the
+`pyannote/speaker-diarization-community-1` HuggingFace snapshot at
+revision 3533c8cf8e369892e6b79ff1bf80f7b0286a54ee):
+  PLDA model trained by BUT Speech@FIT (https://speech.fit.vut.cz/).
+  Integration of VBx in pyannote.audio by Jiangyu Han and Petr Pálka.
+The full text of the CC-BY-4.0 license is available at:
+  https://creativecommons.org/licenses/by/4.0/legalcode
+Summary of permissions granted (not a substitute for the legal text):
+You are free to:
+  Share — copy and redistribute the material in any medium or format
+  Adapt — remix, transform, and build upon the material
+  for any purpose, even commercially.
+The licensor cannot revoke these freedoms as long as you follow the
+license terms.
+Under the following terms:
+  Attribution — You must give appropriate credit, provide a link to the
+  license, and indicate if changes were made. You may do so in any
+  reasonable manner, but not in any way that suggests the licensor
+  endorses you or your use.
+  No additional restrictions — You may not apply legal terms or
+  technological measures that legally restrict others from doing
+  anything the license permits.
+Notices:
+  You do not have to comply with the license for elements of the
+  material in the public domain or where your use is permitted by an
+  applicable exception or limitation.
+  No warranties are given. The license may not give you all of the
+  permissions necessary for your intended use. For example, other
+  rights such as publicity, privacy, or moral rights may limit how you
+  use the material.

LICENSE.MIT ADDED Viewed

	@@ -0,0 +1,27 @@

+MIT License
+Copyright (c) 2023 CNRS
+This MIT license applies to:
+  segmentation-3.0.onnx
+Author: Hervé Bredin (CNRS / IRIT) — pyannote.audio author and lead trainer.
+Source: https://huggingface.co/pyannote/segmentation-3.0
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

README.md ADDED Viewed

	@@ -0,0 +1,210 @@

+---
+license: other
+license_name: mixed-mit-cc-by-4-apache-2
+license_link: LICENSE
+language:
+- en
+- multilingual
+library_name: onnx
+tags:
+- speaker-diarization
+- diarization
+- pyannote
+- speaker-embedding
+- wespeaker
+- segmentation
+pipeline_tag: voice-activity-detection
+---
+# dia-models — pyannote community-1 model bundle for the `dia` Rust crate
+A single-repo distribution of every model artifact the
+[`dia`](https://github.com/al8n/diarization) Rust crate needs to run
+end-to-end speaker diarization with **pyannote-community-1** parity:
+- The **segmentation-3.0** powerset speaker network (16 kHz audio →
+  per-frame speaker activations).
+- The **WeSpeaker ResNet34-LM** speaker-embedding network, in three
+  forms (external-data ONNX, single-file ONNX, TorchScript).
+- The **PLDA** whitening + LDA weights from the
+  [`pyannote/speaker-diarization-community-1`](https://huggingface.co/pyannote/speaker-diarization-community-1)
+  pipeline, in both `.npz` (build-time) and raw little-endian f64
+  `.bin` (runtime) form.
+`dia` already embeds the segmentation model and the PLDA weights into
+the compiled binary via `include_bytes!`; the **WeSpeaker** ONNX is
+the only artifact callers must download separately. This repo lets
+callers grab any individual model — or the whole bundle — without
+spelunking through the upstream pyannote / WeSpeaker repos.
+> **Attribution: this is a redistribution, not new model training.**
+> All weights come from upstream pyannote / WeSpeaker / BUT Speech@FIT.
+> The licenses below MUST be preserved by anyone redistributing.
+## Files
+| File | Size | Format | License |
+|---|---:|---|---|
+| `segmentation-3.0.onnx` | 5.71 MiB | ONNX (single file) | MIT |
+| `wespeaker_resnet34_lm.onnx` | 256 KiB | ONNX header (external data) | Apache-2.0 |
+| `wespeaker_resnet34_lm.onnx.data` | 25.3 MiB | external-data weights | Apache-2.0 |
+| `wespeaker_resnet34_lm_packed.onnx` | 25.5 MiB | ONNX (single file, repacked) | Apache-2.0 |
+| `wespeaker_resnet34_lm.pt` | 25.6 MiB | TorchScript | Apache-2.0 |
+| `plda/eigenvectors_desc.bin` | 128 KiB | f64 (128×128 row-major) | CC-BY-4.0 |
+| `plda/lda.bin` | 256 KiB | f64 (256×128 row-major) | CC-BY-4.0 |
+| `plda/mean1.bin` | 2 KiB | f64 (256,) | CC-BY-4.0 |
+| `plda/mean2.bin` | 1 KiB | f64 (128,) | CC-BY-4.0 |
+| `plda/mu.bin` | 1 KiB | f64 (128,) | CC-BY-4.0 |
+| `plda/phi_desc.bin` | 1 KiB | f64 (128,) | CC-BY-4.0 |
+| `plda/psi.bin` | 1 KiB | f64 (128,) | CC-BY-4.0 |
+| `plda/tr.bin` | 128 KiB | f64 (128×128 row-major) | CC-BY-4.0 |
+| `plda/plda.npz` | 131 KiB | numpy (`mu`, `tr`, `psi`) | CC-BY-4.0 |
+| `plda/xvec_transform.npz` | 131 KiB | numpy (`mean1`, `mean2`, `lda`) | CC-BY-4.0 |
+## Which file do I want?
+### Segmentation
+Use `segmentation-3.0.onnx`. It feeds `diarization::segment::SegmentModel`
+(or any pyannote-segmentation-compatible runtime). Single file, no
+external data, works on every ORT execution provider.
+### Embedding (WeSpeaker)
+Three forms, same weights, pick by use case:
+- **`wespeaker_resnet34_lm.onnx` + `wespeaker_resnet34_lm.onnx.data`**
+  — the default ONNX layout. Loads on CPU / TensorRT / CUDA / OpenVINO
+  / DirectML. The `.onnx` and `.onnx.data` files MUST sit next to
+  each other on disk; ORT resolves the external pointer by relative
+  path.
+- **`wespeaker_resnet34_lm_packed.onnx`** — same model with all
+  weights inlined into one file. Use this if you want a single-file
+  artifact, or if the runtime is **CoreML** (Apple Silicon — Apple's
+  graph optimizer chokes on external initializers and reports
+  `model_path must not be empty`; the packed form sidesteps it).
+  Otherwise functionally identical.
+- **`wespeaker_resnet34_lm.pt`** — TorchScript export for the
+  `tch` backend. Bit-exact to upstream PyTorch on hard cases
+  (heavy-overlap fixtures where the ONNX→ORT path can drift by O(1)
+  per element). Pulls in libtorch (~600 MB shared library).
+### PLDA
+The eight `.bin` files are the runtime data — raw little-endian f64
+blobs that `diarization::plda` embeds via `include_bytes!`. The two `.npz`
+files are the build-time sources (`xvec_transform.npz` exposes
+`mean1` / `mean2` / `lda`; `plda.npz` exposes `mu` / `tr` /
+`psi`); they are mirrored from the upstream pyannote-community-1
+snapshot for traceability and so the `.bin` extraction can be
+re-run via `scripts/extract-plda-blobs.sh` in the dia repo.
+`eigenvectors_desc.bin` and `phi_desc.bin` hold the scipy-derived
+eigenvectors (128×128) and eigenvalues (128,) of the PLDA generalized
+eigenproblem `(B, W)` — pinned to avoid LAPACK eigenvector-sign
+indeterminacy (which produced a 38% DER divergence on three-speaker
+fixtures when nalgebra and scipy disagreed on 67 of 128 column signs). See
+[`models/plda/SOURCE.md`](https://github.com/al8n/diarization/blob/main/models/plda/SOURCE.md)
+in the dia repo for the regeneration procedure.
+## Provenance
+### segmentation-3.0.onnx
+- **Upstream:** [`pyannote/segmentation-3.0`](https://huggingface.co/pyannote/segmentation-3.0)
+- **Original layout:** `pytorch_model.onnx` in the upstream HF repo.
+- **License:** MIT — Copyright (c) 2023 CNRS
+- **Author:** Hervé Bredin (CNRS / IRIT), pyannote.audio author and
+  lead trainer.
+- **SHA-256:** `057ee564753071c0b09b5b611648b50ac188d50846bff5f01e9f7bbf1591ea25`
+### wespeaker_resnet34_lm.onnx (+ .data) / .pt / _packed.onnx
+- **Upstream model architecture:** WeSpeaker ResNet34 with
+  large-margin (LM) angular fine-tuning, trained on VoxCeleb-2.
+- **Upstream sources:**
+  - [WeSpeaker project](https://github.com/wenet-e2e/wespeaker) (Apache-2.0)
+  - [`onnx-community/wespeaker_resnet34_lm`](https://huggingface.co/onnx-community/wespeaker_resnet34_lm)
+    for the ONNX export.
+- **License:** Apache-2.0.
+- **`_packed.onnx` derivative:** produced by loading
+  `wespeaker_resnet34_lm.onnx` + `.onnx.data` via the `onnx` Python
+  library (`onnx.load(path, load_external_data=True)`) and re-saving
+  with `save_as_external_data=False`. Same weights, no external file.
+### plda/
+- **Upstream:** [`pyannote/speaker-diarization-community-1`](https://huggingface.co/pyannote/speaker-diarization-community-1)
+- **License:** CC-BY-4.0
+- **Snapshot revision:** `3533c8cf8e369892e6b79ff1bf80f7b0286a54ee`
+- **Original layout in the upstream HF repo:**
+  `plda/xvec_transform.npz` and `plda/plda.npz`.
+- **Attribution (per upstream `plda/README.md`):**
+  PLDA model trained by [BUT Speech@FIT](https://speech.fit.vut.cz/);
+  integration of VBx in pyannote.audio by Jiangyu Han and Petr Pálka.
+## Usage
+### From `dia` (Rust)
+```rust
+use diarization::{
+  embed::EmbedModel,
+  plda::PldaTransform,
+  segment::SegmentModel,
+};
+// Segmentation + PLDA are bundled by default — no download needed.
+let mut seg = SegmentModel::bundled()?;
+let plda = PldaTransform::new()?;
+// WeSpeaker is BYO; download from this repo.
+let mut emb = EmbedModel::from_file("wespeaker_resnet34_lm.onnx")?;
+# Ok::<(), Box<dyn std::error::Error>>(())
+```
+### Direct download
+```bash
+# whole bundle
+hf download FinDIT-Studio/dia-models --local-dir ./dia-models
+# just the embedding model (default ONNX form)
+hf download FinDIT-Studio/dia-models \
+  wespeaker_resnet34_lm.onnx wespeaker_resnet34_lm.onnx.data \
+  --local-dir ./models
+# CoreML-friendly single-file form
+hf download FinDIT-Studio/dia-models \
+  wespeaker_resnet34_lm_packed.onnx --local-dir ./models
+```
+## Licenses
+This repository **redistributes** model artifacts under three different
+licenses. Each artifact retains its upstream license. By using this
+bundle you agree to comply with **all three**:
+- **MIT** for `segmentation-3.0.onnx` (Copyright © 2023 CNRS, Hervé Bredin).
+  See `LICENSE.MIT`.
+- **Apache-2.0** for the WeSpeaker artifacts. See `LICENSE.APACHE-2.0`.
+- **CC-BY-4.0** for everything under `plda/`. See `LICENSE.CC-BY-4.0`.
+  Required attribution: *PLDA model trained by BUT Speech@FIT;
+  integration of VBx in pyannote.audio by Jiangyu Han and Petr Pálka.*
+The `dia` Rust crate that consumes these models is itself dual-licensed
+MIT OR Apache-2.0; that licensing applies to the source code, not to the
+model weights bundled here.
+## Citation
+If you use these weights in academic work, please cite the upstream
+papers / model cards:
+- **Segmentation-3.0:** Hervé Bredin, *pyannote.audio 2.1 speaker
+  diarization pipeline: principle, benchmark, and recipe*, Interspeech
+  2023.
+- **WeSpeaker:** Wang et al., *WeSpeaker: A research and production
+  oriented speaker embedding learning toolkit*, ICASSP 2023.
+- **PLDA / VBx:** Landini et al., *Bayesian HMM clustering of x-vector
+  sequences (VBx) in speaker diarization: theory, implementation and
+  analysis on standard tasks*, Computer Speech & Language, 2022.
+## Issues / questions
+This repo is a **redistribution** of upstream artifacts. Please file
+issues against:
+- The dia Rust crate: <https://github.com/al8n/diarization/issues>
+- The pyannote.audio project: <https://github.com/pyannote/pyannote-audio/issues>
+- The WeSpeaker project: <https://github.com/wenet-e2e/wespeaker/issues>

plda/eigenvectors_desc.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:caaa0425dc9cc73ffe559f5abe0b8010e31792050f6bd5922eb15ddb84b4f5ee
+size 131072

plda/lda.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3497ba2d97beaa73b310e34a0f4ccc0648a0ca48069699c225063f0d972ba91d
+size 262144

plda/mean1.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ff32f244658ff69c12b11c19e0f95e4ef8d33f22781f0e2821c4ac986941487
+size 2048

plda/mean2.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1858e57f04937fbb89726ac09c98e9905d182eb6fe7c6aff2b5bdb0fd30564c3
+size 1024

plda/mu.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d67b1d54babdfd8c2547b9e5ba96abb30079b5bcc6b4aaa5985e77571537c798
+size 1024

plda/phi_desc.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1193f733a91d72f4080993471b5971fa555dd9bdf425766fabef835bf73df541
+size 1024

plda/plda.npz ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9b77bcd840692710dd3496f62ecfeed8d8e5f002fd991b785079b244eab7d255
+size 133852

plda/psi.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:72c17389945e40565bd3e07cf529dad328e4f28649b5c286dee92348f623b76b
+size 1024

plda/tr.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7acd9020ace3908b7ba37c04091fe0555fff4ed0678647866ce2c67208b76f6
+size 131072

plda/xvec_transform.npz ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:325f1ce8e48f7e55e9c8aa47e05d2766b7c48c4b25b8de8dd751e7a4cc5fbe8f
+size 134376

segmentation-3.0.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:057ee564753071c0b09b5b611648b50ac188d50846bff5f01e9f7bbf1591ea25
+size 5986908

wespeaker_resnet34_lm.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b058ea970bc4c713e4afe0b3d8fe1c2b6439ba94fd912368cd954039deb2cfa5
+size 262499

wespeaker_resnet34_lm.onnx.data ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0590f068ff1ba0f6718a735a3c71fbd8b0ac41fbac4569654707977eb9a4394e
+size 26542080

wespeaker_resnet34_lm.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8bd868195ea0e672fb44999bfd10fa6110e688c7de9e3584583dad2da30ef501
+size 26816730

wespeaker_resnet34_lm_packed.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4c15c6be4235318d092c9d347e00c68ba476136d6172f675f76ad6b0c2661f01
+size 26775311