qgyd2021 commited on
Commit
d9b0161
1 Parent(s): 3e60665

Upload 61 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. data/test_wavs/aidatatang_200zh/README.md +2 -0
  2. data/test_wavs/aidatatang_200zh/T0055G0036S0002.wav +3 -0
  3. data/test_wavs/aidatatang_200zh/T0055G0036S0003.wav +3 -0
  4. data/test_wavs/aidatatang_200zh/T0055G0036S0004.wav +3 -0
  5. data/test_wavs/aishell2/ID0012W0030.wav +3 -0
  6. data/test_wavs/aishell2/ID0012W0162.wav +3 -0
  7. data/test_wavs/aishell2/ID0012W0215.wav +3 -0
  8. data/test_wavs/aishell2/README.md +2 -0
  9. data/test_wavs/aishell2/trans.txt +3 -0
  10. data/test_wavs/alimeeting/165.wav +3 -0
  11. data/test_wavs/alimeeting/209.wav +3 -0
  12. data/test_wavs/alimeeting/74.wav +3 -0
  13. data/test_wavs/alimeeting/R8003_M8001-8004-165.wav +3 -0
  14. data/test_wavs/alimeeting/R8008_M8013-8049-74.wav +3 -0
  15. data/test_wavs/alimeeting/R8009_M8020_N_SPK8026-8026-209.wav +3 -0
  16. data/test_wavs/alimeeting/trans.txt +3 -0
  17. data/test_wavs/arabic/a.wav +3 -0
  18. data/test_wavs/arabic/b.wav +3 -0
  19. data/test_wavs/arabic/c.wav +3 -0
  20. data/test_wavs/arabic/trans.txt +3 -0
  21. data/test_wavs/cantonese/1.wav +3 -0
  22. data/test_wavs/cantonese/2.wav +3 -0
  23. data/test_wavs/french/common_voice_fr_19364697.wav +3 -0
  24. data/test_wavs/french/common_voice_fr_19738183.wav +3 -0
  25. data/test_wavs/french/common_voice_fr_27024649.wav +3 -0
  26. data/test_wavs/french/trans.txt +3 -0
  27. data/test_wavs/german/20120315-0900-PLENARY-14-de_20120315.wav +3 -0
  28. data/test_wavs/german/20170517-0900-PLENARY-16-de_20170517.wav +3 -0
  29. data/test_wavs/gigaspeech/1-minute-audiobook.opus +0 -0
  30. data/test_wavs/gigaspeech/100-seconds-podcast.opus +0 -0
  31. data/test_wavs/gigaspeech/100-seconds-youtube.opus +0 -0
  32. data/test_wavs/librispeech/1089-134686-0001.wav +3 -0
  33. data/test_wavs/librispeech/1221-135766-0001.wav +3 -0
  34. data/test_wavs/librispeech/1221-135766-0002.wav +3 -0
  35. data/test_wavs/librispeech/README.md +2 -0
  36. data/test_wavs/librispeech/trans.txt +3 -0
  37. data/test_wavs/paraformer-zh/si_chuan_hua.wav +3 -0
  38. data/test_wavs/paraformer-zh/tian_jin_hua.wav +3 -0
  39. data/test_wavs/paraformer-zh/zheng_zhou_hua.wav +3 -0
  40. data/test_wavs/russian/russian-i-love-you.wav +3 -0
  41. data/test_wavs/russian/test.wav +3 -0
  42. data/test_wavs/tal_csasr/0.wav +3 -0
  43. data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_132.wav +3 -0
  44. data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_138.wav +3 -0
  45. data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_145.wav +3 -0
  46. data/test_wavs/tal_csasr/README.md +2 -0
  47. data/test_wavs/tedlium3/DanBarber_2010-219.wav +3 -0
  48. data/test_wavs/tedlium3/DanielKahneman_2010-157.wav +3 -0
  49. data/test_wavs/tedlium3/RobertGupta_2010U-15.wav +3 -0
  50. data/test_wavs/tedlium3/trans.txt +3 -0
data/test_wavs/aidatatang_200zh/README.md ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Files are downloaded from
2
+ https://huggingface.co/luomingshuang/icefall_asr_aidatatang-200zh_pruned_transducer_stateless2/tree/main/test_wavs
data/test_wavs/aidatatang_200zh/T0055G0036S0002.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c7bf25a97de0819064c05952d40d93047da474d1e927424b3f27fb71bca403e
3
+ size 67630
data/test_wavs/aidatatang_200zh/T0055G0036S0003.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88e2e8ef9cc009305e3cb42ddd806c757a7ffc1b85a4402c39e2b59e81ab9ec8
3
+ size 94174
data/test_wavs/aidatatang_200zh/T0055G0036S0004.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea822f7873b89443191e4a3b4b08c62b81de3a0a4a7b806d273da975a0b9e9fc
3
+ size 70460
data/test_wavs/aishell2/ID0012W0030.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f042c6cd8cb7fc745f37805565b5ce41b9a4f38a54b267e1a9afd806d5216a38
3
+ size 112878
data/test_wavs/aishell2/ID0012W0162.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aacdc76fc8b37bc2bdd1c05a4bfd42a5ac3333a53c06088abe9814fb1e5e0912
3
+ size 114124
data/test_wavs/aishell2/ID0012W0215.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f48eb860503ec691d7d6b99dfc1491a88f30a0930676b3c5dc9170edce041c46
3
+ size 104368
data/test_wavs/aishell2/README.md ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Files are downloaded from
2
+ https://huggingface.co/yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12/tree/main/test_wavs
data/test_wavs/aishell2/trans.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ ID0012W0162 立法机关采纳了第二种意见
2
+ ID0012W0215 大家都愿意牺牲自己的生命
3
+ ID0012W0030 完全是典型的军事侵略
data/test_wavs/alimeeting/165.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48c131d205a0d93acdcdfc0d81e2ee839f4f3261ca7654e3e3ce175a0ec6098d
3
+ size 262764
data/test_wavs/alimeeting/209.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9374efff5517fd624ceee8551cd8cd3680fc3ed8ff964fe5f17c1064f05ebfb
3
+ size 154604
data/test_wavs/alimeeting/74.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c371dd14ff73d7128e1508c71dd6eef934f91c082e5946bf4bdd87761ae44a13
3
+ size 120364
data/test_wavs/alimeeting/R8003_M8001-8004-165.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b10ddaddabeb905a7915f670502773328d3321beda436907fb0f36c52b2d04e
3
+ size 525498
data/test_wavs/alimeeting/R8008_M8013-8049-74.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cc97f90e46825e8d6783ea0d41112165c5fffb33d5519fd0d3c6860a43cac70
3
+ size 240698
data/test_wavs/alimeeting/R8009_M8020_N_SPK8026-8026-209.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f825ce6a99b00ec30cb276ee821099b63b1594a6782b88aa5117bd578b61f5a
3
+ size 309178
data/test_wavs/alimeeting/trans.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ R8009_M8020_N_SPK8026-8026-209 并不是说一天的话就一定要对一个人进行一个了解这样的话
2
+ R8003_M8001-8004-165 如果他要是不愿意提供地址也不愿意接收礼物那么第二个这个分支可能就省省下了
3
+ R8008_M8013-8049-74 面试的话五月五号到五月十号吧面试
data/test_wavs/arabic/a.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09d4ef01e713b5ea57459dcb8e31631816bc8acdc0833dc41ad3b1ff000a4da5
3
+ size 252846
data/test_wavs/arabic/b.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faecc4e69fb4a1b64b47edada3a6a84c8ff7216027c2490b105b4481bef4b12c
3
+ size 243244
data/test_wavs/arabic/c.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62f08f3c5148e8c69c1607cb067e66034820c4a4322c80e7b396b1bd4360de8b
3
+ size 149804
data/test_wavs/arabic/trans.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ 94D37D38-B203-4FC0-9F3A-538F5C174920_spk-0001_seg-0053813:0054281 بعد أن عجز وبدأ يصدر مشكلات شعبه ومشكلات مصر
2
+ 94D37D38-B203-4FC0-9F3A-538F5C174920_spk-0001_seg-0051454:0052244 وهؤلاء أولياء الشيطان ها هو ذا أحدهم الآن ضيفا عليكم على قناة الجزيرة ولا يستحي في ذلك
3
+ 94D37D38-B203-4FC0-9F3A-538F5C174920_spk-0001_seg-0052244:0053004 عندما استغاث الليبيون بالعالم استغاثوا لرفع الظلم وليس لقهر إرادة الأمة ومصادرة الحياة الدستورية
data/test_wavs/cantonese/1.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22568f57d298bea915f263dea7f41d628eea096e80a85b81ce88b7689ef3eee4
3
+ size 191276
data/test_wavs/cantonese/2.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d75fcd99f9693e91ce3303c97d312594a2a95659db5d43bdcefa87e2256e0de
3
+ size 139052
data/test_wavs/french/common_voice_fr_19364697.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b057a0b3badb2b5e1352b6b058726dc03a063e74794232ed266d5b3ad573f9ca
3
+ size 228174
data/test_wavs/french/common_voice_fr_19738183.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af7487e23134c3fcc6d74627dcefb5c3c45a2bfa24b4290758efd89139a43884
3
+ size 122190
data/test_wavs/french/common_voice_fr_27024649.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76021a91ebbe9110d8cbd19a091cea4c305c417ba0c25f32d6f995c362b0b9f2
3
+ size 202830
data/test_wavs/french/trans.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ common_voice_fr_19738183 CE DERNIER A ÉVOLUÉ TOUT AU LONG DE L'HISTOIRE ROMAINE
2
+ common_voice_fr_27024649 SON ACTIONNAIRE MAJORITAIRE EST LE CONSEIL TERRITORIAL DE SAINT PIERRE ET MIQUELON
3
+ common_voice_fr_19364697 CE SITE CONTIENT QUATRE TOMBEAUX DE LA DYNASTIE ACHÉMÉNIDE ET SEPT DES SASSANIDES
data/test_wavs/german/20120315-0900-PLENARY-14-de_20120315.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edc4f5a2c3e4f6ce99d11490087ef23fa55806a5e32575d3528bf599e0deb711
3
+ size 381356
data/test_wavs/german/20170517-0900-PLENARY-16-de_20170517.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c3b63669e92c6df5bfa3aae0843c64f9eef1be2e85e652b0991a25ebc4e30bb
3
+ size 282284
data/test_wavs/gigaspeech/1-minute-audiobook.opus ADDED
Binary file (580 kB). View file
 
data/test_wavs/gigaspeech/100-seconds-podcast.opus ADDED
Binary file (955 kB). View file
 
data/test_wavs/gigaspeech/100-seconds-youtube.opus ADDED
Binary file (948 kB). View file
 
data/test_wavs/librispeech/1089-134686-0001.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bc58a4efdf20daac252b6b1502632601a71efe0308f6757dc1eda34891a7e4f
3
+ size 212044
data/test_wavs/librispeech/1221-135766-0001.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5143a6ba93c4b274e2c4ac22deb75c2c48936c853f0519add1de828b6c79cc5a
3
+ size 534924
data/test_wavs/librispeech/1221-135766-0002.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65b222837919ccbb924a4e1077413ea7cc6af3e68b663b012a9539d5c05850f0
3
+ size 154444
data/test_wavs/librispeech/README.md ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Files are downloaded from
2
+ https://huggingface.co/csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless5-2022-05-13/tree/main/test_wavs
data/test_wavs/librispeech/trans.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ 1089-134686-0001 AFTER EARLY NIGHTFALL THE YELLOW LAMPS WOULD LIGHT UP HERE AND THERE THE SQUALID QUARTER OF THE BROTHELS
2
+ 1221-135766-0001 GOD AS A DIRECT CONSEQUENCE OF THE SIN WHICH MAN THUS PUNISHED HAD GIVEN HER A LOVELY CHILD WHOSE PLACE WAS ON THAT SAME DISHONOURED BOSOM TO CONNECT HER PARENT FOR EVER WITH THE RACE AND DESCENT OF MORTALS AND TO BE FINALLY A BLESSED SOUL IN HEAVEN
3
+ 1221-135766-0002 YET THESE THOUGHTS AFFECTED HESTER PRYNNE LESS WITH HOPE THAN APPREHENSION
data/test_wavs/paraformer-zh/si_chuan_hua.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:150b75ada9f5b4011018e961e56427e4af6849fcc69764321556586bc4790c49
3
+ size 250764
data/test_wavs/paraformer-zh/tian_jin_hua.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1127451bad4c45953a5b788ab4977170388e91454ef90fee55754c4587628782
3
+ size 249932
data/test_wavs/paraformer-zh/zheng_zhou_hua.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed767dc9a89489888060c65bc246e702b2ab25e16977998be10edc459c9e4397
3
+ size 255724
data/test_wavs/russian/russian-i-love-you.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3ac4f6e5b818ec89bdd884f60637daa32ef0ed19a11981b7e02e3e7799dfd79
3
+ size 295758
data/test_wavs/russian/test.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6e768803b3bc3afcb08326677f3bb872c9beeed29af40d3579bcc14e74484f8
3
+ size 226604
data/test_wavs/tal_csasr/0.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eddf384a906bd6d905c9d9d652d614def1857608b88c2eee663ceeccbb31f7a3
3
+ size 259278
data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_132.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bfb42c963e623ebab31b81ff4404867d07d3102507c87ac14577c4c61663b8c
3
+ size 163244
data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_138.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20805bcc696b9b65f3357a2508a419d4f33b81006d47e1312e219b0fad934d1d
3
+ size 150124
data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_145.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5851e31f3e8e5f741635da9466e19fccfbabd117ebcdc92db242c92483aee064
3
+ size 282604
data/test_wavs/tal_csasr/README.md ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ Files are downloaded from
2
+ https://huggingface.co/luomingshuang/icefall_asr_tal-csasr_pruned_transducer_stateless5/tree/main/test_wavs
data/test_wavs/tedlium3/DanBarber_2010-219.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:667b031ad4f6ca87c00a152fe8d0005f6e703465662ed87815cb53d2e74a9bb1
3
+ size 116908
data/test_wavs/tedlium3/DanielKahneman_2010-157.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38adf05dc46341aac948d7d43f5dfc9d8a3627989dbe9d43ab8548fa060612d9
3
+ size 403564
data/test_wavs/tedlium3/RobertGupta_2010U-15.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abadb1c7a252fd1c5781f8ee0a4378db9ec99924048b594b30b416dd2cf2013a
3
+ size 554604
data/test_wavs/tedlium3/trans.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ DanBarber_2010-219 well the last year this property had six hundred thousand birds on it
2
+ RobertGupta_2010U-15 and he was talking about invisible demons and smoke and how someone was poisoning him in his sleep and i was afraid not for myself but i was afraid that i was going to lose him that he was going to sink into one of his states
3
+ DanielKahneman_2010-157 goes very different ways depending on how you think and whether you think of the remembering self or you think of the experiencing self this is going to influence policy i think in years to come in the united states efforts are being made