Update README.md
Browse files
README.md
CHANGED
@@ -2,14 +2,14 @@
|
|
2 |
tags:
|
3 |
- espnet
|
4 |
- audio
|
5 |
-
-
|
6 |
language: en
|
7 |
datasets:
|
8 |
- slue-ted
|
9 |
license: cc-by-4.0
|
10 |
---
|
11 |
|
12 |
-
## ESPnet2
|
13 |
|
14 |
### `espnet/slueted_whisper_summ`
|
15 |
|
@@ -31,7 +31,7 @@ cd egs2/slue-ted/slu1
|
|
31 |
{'rouge1': 0.2255418629519756, 'rouge2': 0.0485061537185737, 'rougeL': 0.1596465851004139, 'rougeLsum': 0.15968116069467322, 'meteor': 0.2129616261465529}
|
32 |
RESULT 22.55418629519756 3.799127541421444e-132 15.96465851004139 21.29616261465529 83.78519008627457
|
33 |
|
34 |
-
##
|
35 |
|
36 |
<details><summary>expand</summary>
|
37 |
|
@@ -772,6 +772,15 @@ distributed: true
|
|
772 |
### Citing ESPnet
|
773 |
|
774 |
```BibTex
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
775 |
@inproceedings{watanabe2018espnet,
|
776 |
author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
|
777 |
title={{ESPnet}: End-to-End Speech Processing Toolkit},
|
@@ -782,11 +791,6 @@ distributed: true
|
|
782 |
url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
|
783 |
}
|
784 |
|
785 |
-
|
786 |
-
|
787 |
-
|
788 |
-
|
789 |
-
|
790 |
```
|
791 |
|
792 |
or arXiv:
|
|
|
2 |
tags:
|
3 |
- espnet
|
4 |
- audio
|
5 |
+
- spoken-language-understanding
|
6 |
language: en
|
7 |
datasets:
|
8 |
- slue-ted
|
9 |
license: cc-by-4.0
|
10 |
---
|
11 |
|
12 |
+
## ESPnet2 SLU model
|
13 |
|
14 |
### `espnet/slueted_whisper_summ`
|
15 |
|
|
|
31 |
{'rouge1': 0.2255418629519756, 'rouge2': 0.0485061537185737, 'rougeL': 0.1596465851004139, 'rougeLsum': 0.15968116069467322, 'meteor': 0.2129616261465529}
|
32 |
RESULT 22.55418629519756 3.799127541421444e-132 15.96465851004139 21.29616261465529 83.78519008627457
|
33 |
|
34 |
+
## SLU config
|
35 |
|
36 |
<details><summary>expand</summary>
|
37 |
|
|
|
772 |
### Citing ESPnet
|
773 |
|
774 |
```BibTex
|
775 |
+
@inproceedings{ESPnet-SLU,
|
776 |
+
title={{ESPnet-SLU}: Advancing Spoken Language Understanding through {ESPnet}},
|
777 |
+
author={Arora, Siddhant and Dalmia, Siddharth and Denisov, Pavel and Chang, Xuankai and Ueda, Yushi and Peng, Yifan and Zhang, Yuekai and Kumar, Sujay and Ganesan, Karthik and Yan, Brian and others},
|
778 |
+
booktitle={ICASSP 2022-2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
|
779 |
+
pages={7167--7171},
|
780 |
+
year={2022},
|
781 |
+
organization={IEEE}
|
782 |
+
}
|
783 |
+
|
784 |
@inproceedings{watanabe2018espnet,
|
785 |
author={Shinji Watanabe and Takaaki Hori and Shigeki Karita and Tomoki Hayashi and Jiro Nishitoba and Yuya Unno and Nelson Yalta and Jahn Heymann and Matthew Wiesner and Nanxin Chen and Adithya Renduchintala and Tsubasa Ochiai},
|
786 |
title={{ESPnet}: End-to-End Speech Processing Toolkit},
|
|
|
791 |
url={http://dx.doi.org/10.21437/Interspeech.2018-1456}
|
792 |
}
|
793 |
|
|
|
|
|
|
|
|
|
|
|
794 |
```
|
795 |
|
796 |
or arXiv:
|