jungjee committed on
Commit
c354ac2
·
verified ·
1 Parent(s): b33d1e3

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +13 -20
README.md CHANGED
@@ -27,6 +27,18 @@ pip install -e .
27
  cd egs2/voxceleb/spk1
28
  ./run.sh --skip_data_prep false --skip_train true --download_model espnet/voxcelebs12_ecapa_wavlm_joint
29
  ```
 
 
 
 
 
 
 
 
 
 
 
 
30
 
31
  <!-- Generated by scripts/utils/show_spk_result.py -->
32
  # RESULTS
@@ -263,28 +275,9 @@ distributed: true
263
  author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
264
  title={{ESPnet}: End-to-End Speech Processing Toolkit},
265
  year={2018},
266
- booktitle={Proceedings of Interspeech},
267
  pages={2207--2211},
268
  doi={10.21437/Interspeech.2018-1456},
269
  url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
270
  }
271
-
272
-
273
-
274
-
275
-
276
-
277
- ```
278
-
279
- or arXiv:
280
-
281
- ```bibtex
282
- @misc{watanabe2018espnet,
283
- title={ESPnet: End-to-End Speech Processing Toolkit},
284
- author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
285
- year={2018},
286
- eprint={1804.00015},
287
- archivePrefix={arXiv},
288
- primaryClass={cs.CL}
289
- }
290
  ```
 
27
  cd egs2/voxceleb/spk1
28
  ./run.sh --skip_data_prep false --skip_train true --download_model espnet/voxcelebs12_ecapa_wavlm_joint
29
  ```
30
+ ```python
31
+ import numpy as np
32
+ from espnet2.bin.spk_inference import Speech2Embedding
33
+
34
+ # from uploaded models
35
+ speech2spk_embed = Speech2Embedding.from_pretrained(model_tag="espnet/voxcelebs12_rawnet3")
36
+ embedding = speech2spk_embed(np.zeros(16500))
37
+
38
+ # from checkpoints trained by oneself
39
+ speech2spk_embed = Speech2Embedding(model_file="model.pth", train_config="config.yaml")
40
+ embedding = speech2spk_embed(np.zeros(32000))
41
+ ```
42
 
43
  <!-- Generated by scripts/utils/show_spk_result.py -->
44
  # RESULTS
 
275
  author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
276
  title={{ESPnet}: End-to-End Speech Processing Toolkit},
277
  year={2018},
278
+ booktitle={Proc. Interspeech},
279
  pages={2207--2211},
280
  doi={10.21437/Interspeech.2018-1456},
281
  url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
282
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
283
  ```