diff --git a/data/test_wavs/aidatatang_200zh/README.md b/data/test_wavs/aidatatang_200zh/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c379b5b859bf71723dc384ba14cf5789de85ce1b --- /dev/null +++ b/data/test_wavs/aidatatang_200zh/README.md @@ -0,0 +1,2 @@ +Files are downloaded from +https://huggingface.co/luomingshuang/icefall_asr_aidatatang-200zh_pruned_transducer_stateless2/tree/main/test_wavs diff --git a/data/test_wavs/aidatatang_200zh/T0055G0036S0002.wav b/data/test_wavs/aidatatang_200zh/T0055G0036S0002.wav new file mode 100644 index 0000000000000000000000000000000000000000..b446cef1f96a4dc9f48bccb327e6fd50e2aac26b --- /dev/null +++ b/data/test_wavs/aidatatang_200zh/T0055G0036S0002.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c7bf25a97de0819064c05952d40d93047da474d1e927424b3f27fb71bca403e +size 67630 diff --git a/data/test_wavs/aidatatang_200zh/T0055G0036S0003.wav b/data/test_wavs/aidatatang_200zh/T0055G0036S0003.wav new file mode 100644 index 0000000000000000000000000000000000000000..194a1b1d612dbd6d0c560216d4797b05e533759d --- /dev/null +++ b/data/test_wavs/aidatatang_200zh/T0055G0036S0003.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88e2e8ef9cc009305e3cb42ddd806c757a7ffc1b85a4402c39e2b59e81ab9ec8 +size 94174 diff --git a/data/test_wavs/aidatatang_200zh/T0055G0036S0004.wav b/data/test_wavs/aidatatang_200zh/T0055G0036S0004.wav new file mode 100644 index 0000000000000000000000000000000000000000..2c1bb29488f0b63dbb021cf11f0903fd2378589f --- /dev/null +++ b/data/test_wavs/aidatatang_200zh/T0055G0036S0004.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea822f7873b89443191e4a3b4b08c62b81de3a0a4a7b806d273da975a0b9e9fc +size 70460 diff --git a/data/test_wavs/aishell2/ID0012W0030.wav b/data/test_wavs/aishell2/ID0012W0030.wav new file mode 100644 index 0000000000000000000000000000000000000000..0113391a8fc0096c10ac9a5a3382889b9c8e9ffd --- /dev/null +++ b/data/test_wavs/aishell2/ID0012W0030.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f042c6cd8cb7fc745f37805565b5ce41b9a4f38a54b267e1a9afd806d5216a38 +size 112878 diff --git a/data/test_wavs/aishell2/ID0012W0162.wav b/data/test_wavs/aishell2/ID0012W0162.wav new file mode 100644 index 0000000000000000000000000000000000000000..9908691638b238131edf10ccc8ea57952a0b6699 --- /dev/null +++ b/data/test_wavs/aishell2/ID0012W0162.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aacdc76fc8b37bc2bdd1c05a4bfd42a5ac3333a53c06088abe9814fb1e5e0912 +size 114124 diff --git a/data/test_wavs/aishell2/ID0012W0215.wav b/data/test_wavs/aishell2/ID0012W0215.wav new file mode 100644 index 0000000000000000000000000000000000000000..c241b6ea30f4d5a25475049b60f083e283160467 --- /dev/null +++ b/data/test_wavs/aishell2/ID0012W0215.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48eb860503ec691d7d6b99dfc1491a88f30a0930676b3c5dc9170edce041c46 +size 104368 diff --git a/data/test_wavs/aishell2/README.md b/data/test_wavs/aishell2/README.md new file mode 100644 index 0000000000000000000000000000000000000000..f6882a5d84cde0915ce2dd6297487d3a959000bb --- /dev/null +++ b/data/test_wavs/aishell2/README.md @@ -0,0 +1,2 @@ +Files are downloaded from +https://huggingface.co/yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12/tree/main/test_wavs diff --git a/data/test_wavs/aishell2/trans.txt b/data/test_wavs/aishell2/trans.txt new file mode 100644 index 0000000000000000000000000000000000000000..7746e18a1236742b0b68a588fd63bf0e2465f281 --- /dev/null +++ b/data/test_wavs/aishell2/trans.txt @@ -0,0 +1,3 @@ +ID0012W0162 立法机关采纳了第二种意见 +ID0012W0215 大家都愿意牺牲自己的生命 +ID0012W0030 完全是典型的军事侵略 \ No newline at end of file diff --git a/data/test_wavs/alimeeting/165.wav b/data/test_wavs/alimeeting/165.wav new file mode 100644 index 0000000000000000000000000000000000000000..b9a004b21005393b548d83f24eb3e91dc0810cb6 --- /dev/null +++ b/data/test_wavs/alimeeting/165.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48c131d205a0d93acdcdfc0d81e2ee839f4f3261ca7654e3e3ce175a0ec6098d +size 262764 diff --git a/data/test_wavs/alimeeting/209.wav b/data/test_wavs/alimeeting/209.wav new file mode 100644 index 0000000000000000000000000000000000000000..6bf339fdb1fb572a68a342e294f2b46e961d2900 --- /dev/null +++ b/data/test_wavs/alimeeting/209.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9374efff5517fd624ceee8551cd8cd3680fc3ed8ff964fe5f17c1064f05ebfb +size 154604 diff --git a/data/test_wavs/alimeeting/74.wav b/data/test_wavs/alimeeting/74.wav new file mode 100644 index 0000000000000000000000000000000000000000..1bf165f1ca563f5ce58a09bfac0cffffa130fd83 --- /dev/null +++ b/data/test_wavs/alimeeting/74.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c371dd14ff73d7128e1508c71dd6eef934f91c082e5946bf4bdd87761ae44a13 +size 120364 diff --git a/data/test_wavs/alimeeting/R8003_M8001-8004-165.wav b/data/test_wavs/alimeeting/R8003_M8001-8004-165.wav new file mode 100644 index 0000000000000000000000000000000000000000..dda41565dff7bcb0ecb68023a75959eff972a95f --- /dev/null +++ b/data/test_wavs/alimeeting/R8003_M8001-8004-165.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b10ddaddabeb905a7915f670502773328d3321beda436907fb0f36c52b2d04e +size 525498 diff --git a/data/test_wavs/alimeeting/R8008_M8013-8049-74.wav b/data/test_wavs/alimeeting/R8008_M8013-8049-74.wav new file mode 100644 index 0000000000000000000000000000000000000000..a52c668e006bc60469988a8aa1c502c0cd23bc3f --- /dev/null +++ b/data/test_wavs/alimeeting/R8008_M8013-8049-74.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc97f90e46825e8d6783ea0d41112165c5fffb33d5519fd0d3c6860a43cac70 +size 240698 diff --git a/data/test_wavs/alimeeting/R8009_M8020_N_SPK8026-8026-209.wav b/data/test_wavs/alimeeting/R8009_M8020_N_SPK8026-8026-209.wav new file mode 100644 index 0000000000000000000000000000000000000000..797d31d4007b1f9bb143713f18769a866ae0c179 --- /dev/null +++ b/data/test_wavs/alimeeting/R8009_M8020_N_SPK8026-8026-209.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f825ce6a99b00ec30cb276ee821099b63b1594a6782b88aa5117bd578b61f5a +size 309178 diff --git a/data/test_wavs/alimeeting/trans.txt b/data/test_wavs/alimeeting/trans.txt new file mode 100644 index 0000000000000000000000000000000000000000..b9342b75b63b6fccea2841ea782f35bd75787d1b --- /dev/null +++ b/data/test_wavs/alimeeting/trans.txt @@ -0,0 +1,3 @@ +R8009_M8020_N_SPK8026-8026-209 并不是说一天的话就一定要对一个人进行一个了解这样的话 +R8003_M8001-8004-165 如果他要是不愿意提供地址也不愿意接收礼物那么第二个这个分支可能就省省下了 +R8008_M8013-8049-74 面试的话五月五号到五月十号吧面试 diff --git a/data/test_wavs/arabic/a.wav b/data/test_wavs/arabic/a.wav new file mode 100644 index 0000000000000000000000000000000000000000..68bb32af5660a709a66847de91d475cf8f9bf95d --- /dev/null +++ b/data/test_wavs/arabic/a.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d4ef01e713b5ea57459dcb8e31631816bc8acdc0833dc41ad3b1ff000a4da5 +size 252846 diff --git a/data/test_wavs/arabic/b.wav b/data/test_wavs/arabic/b.wav new file mode 100644 index 0000000000000000000000000000000000000000..67ba665347811dfe2ae9810748069c842826870d --- /dev/null +++ b/data/test_wavs/arabic/b.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faecc4e69fb4a1b64b47edada3a6a84c8ff7216027c2490b105b4481bef4b12c +size 243244 diff --git a/data/test_wavs/arabic/c.wav b/data/test_wavs/arabic/c.wav new file mode 100644 index 0000000000000000000000000000000000000000..4817939203c5aa447649cab7d7bf24ab2b2f3a09 --- /dev/null +++ b/data/test_wavs/arabic/c.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62f08f3c5148e8c69c1607cb067e66034820c4a4322c80e7b396b1bd4360de8b +size 149804 diff --git a/data/test_wavs/arabic/trans.txt b/data/test_wavs/arabic/trans.txt new file mode 100644 index 0000000000000000000000000000000000000000..87b0af7fece1658d2ea8e9d6ad94dab9e7b01a0a --- /dev/null +++ b/data/test_wavs/arabic/trans.txt @@ -0,0 +1,3 @@ +94D37D38-B203-4FC0-9F3A-538F5C174920_spk-0001_seg-0053813:0054281 بعد أن عجز وبدأ يصدر مشكلات شعبه ومشكلات مصر +94D37D38-B203-4FC0-9F3A-538F5C174920_spk-0001_seg-0051454:0052244 وهؤلاء أولياء الشيطان ها هو ذا أحدهم الآن ضيفا عليكم على قناة الجزيرة ولا يستحي في ذلك +94D37D38-B203-4FC0-9F3A-538F5C174920_spk-0001_seg-0052244:0053004 عندما استغاث الليبيون بالعالم استغاثوا لرفع الظلم وليس لقهر إرادة الأمة ومصادرة الحياة الدستورية diff --git a/data/test_wavs/cantonese/1.wav b/data/test_wavs/cantonese/1.wav new file mode 100644 index 0000000000000000000000000000000000000000..8fb8573fc2429890daf90ff1527e7103a624ad59 --- /dev/null +++ b/data/test_wavs/cantonese/1.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22568f57d298bea915f263dea7f41d628eea096e80a85b81ce88b7689ef3eee4 +size 191276 diff --git a/data/test_wavs/cantonese/2.wav b/data/test_wavs/cantonese/2.wav new file mode 100644 index 0000000000000000000000000000000000000000..9f5c30894c7c250f221a90ce83bb6f4d09e1269d --- /dev/null +++ b/data/test_wavs/cantonese/2.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d75fcd99f9693e91ce3303c97d312594a2a95659db5d43bdcefa87e2256e0de +size 139052 diff --git a/data/test_wavs/french/common_voice_fr_19364697.wav b/data/test_wavs/french/common_voice_fr_19364697.wav new file mode 100644 index 0000000000000000000000000000000000000000..f7aa0bb86010fe026bf1a564c6af0e1ac1cad5c6 --- /dev/null +++ b/data/test_wavs/french/common_voice_fr_19364697.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b057a0b3badb2b5e1352b6b058726dc03a063e74794232ed266d5b3ad573f9ca +size 228174 diff --git a/data/test_wavs/french/common_voice_fr_19738183.wav b/data/test_wavs/french/common_voice_fr_19738183.wav new file mode 100644 index 0000000000000000000000000000000000000000..2d6aa7e54984a20671ad160081df9549f5eee416 --- /dev/null +++ b/data/test_wavs/french/common_voice_fr_19738183.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af7487e23134c3fcc6d74627dcefb5c3c45a2bfa24b4290758efd89139a43884 +size 122190 diff --git a/data/test_wavs/french/common_voice_fr_27024649.wav b/data/test_wavs/french/common_voice_fr_27024649.wav new file mode 100644 index 0000000000000000000000000000000000000000..f67bbaceb4c34dc01f1ef1d17b6a8fcba0d947c9 --- /dev/null +++ b/data/test_wavs/french/common_voice_fr_27024649.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76021a91ebbe9110d8cbd19a091cea4c305c417ba0c25f32d6f995c362b0b9f2 +size 202830 diff --git a/data/test_wavs/french/trans.txt b/data/test_wavs/french/trans.txt new file mode 100644 index 0000000000000000000000000000000000000000..f5db679745acf4b98a203fe5e87d6c562f752f34 --- /dev/null +++ b/data/test_wavs/french/trans.txt @@ -0,0 +1,3 @@ +common_voice_fr_19738183 CE DERNIER A ÉVOLUÉ TOUT AU LONG DE L'HISTOIRE ROMAINE +common_voice_fr_27024649 SON ACTIONNAIRE MAJORITAIRE EST LE CONSEIL TERRITORIAL DE SAINT PIERRE ET MIQUELON +common_voice_fr_19364697 CE SITE CONTIENT QUATRE TOMBEAUX DE LA DYNASTIE ACHÉMÉNIDE ET SEPT DES SASSANIDES diff --git a/data/test_wavs/german/20120315-0900-PLENARY-14-de_20120315.wav b/data/test_wavs/german/20120315-0900-PLENARY-14-de_20120315.wav new file mode 100644 index 0000000000000000000000000000000000000000..6fddecfb7317ea4b18fdabf40d310f5768900fc5 --- /dev/null +++ b/data/test_wavs/german/20120315-0900-PLENARY-14-de_20120315.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc4f5a2c3e4f6ce99d11490087ef23fa55806a5e32575d3528bf599e0deb711 +size 381356 diff --git a/data/test_wavs/german/20170517-0900-PLENARY-16-de_20170517.wav b/data/test_wavs/german/20170517-0900-PLENARY-16-de_20170517.wav new file mode 100644 index 0000000000000000000000000000000000000000..d91c7394eb1473ba673807d1693db33a58b08f88 --- /dev/null +++ b/data/test_wavs/german/20170517-0900-PLENARY-16-de_20170517.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c3b63669e92c6df5bfa3aae0843c64f9eef1be2e85e652b0991a25ebc4e30bb +size 282284 diff --git a/data/test_wavs/gigaspeech/1-minute-audiobook.opus b/data/test_wavs/gigaspeech/1-minute-audiobook.opus new file mode 100644 index 0000000000000000000000000000000000000000..eda5173b6c85e0e3294385058e8b55d65bb5d8ba Binary files /dev/null and b/data/test_wavs/gigaspeech/1-minute-audiobook.opus differ diff --git a/data/test_wavs/gigaspeech/100-seconds-podcast.opus b/data/test_wavs/gigaspeech/100-seconds-podcast.opus new file mode 100644 index 0000000000000000000000000000000000000000..f8796c931fe20872d003779c8057b027cfebf06c Binary files /dev/null and b/data/test_wavs/gigaspeech/100-seconds-podcast.opus differ diff --git a/data/test_wavs/gigaspeech/100-seconds-youtube.opus b/data/test_wavs/gigaspeech/100-seconds-youtube.opus new file mode 100644 index 0000000000000000000000000000000000000000..f1888a09c5f3b51fac9c4e79c4334f952ecde110 Binary files /dev/null and b/data/test_wavs/gigaspeech/100-seconds-youtube.opus differ diff --git a/data/test_wavs/librispeech/1089-134686-0001.wav b/data/test_wavs/librispeech/1089-134686-0001.wav new file mode 100644 index 0000000000000000000000000000000000000000..f58b5dd584aceb425bb6c46e62d434a5e5a171eb --- /dev/null +++ b/data/test_wavs/librispeech/1089-134686-0001.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc58a4efdf20daac252b6b1502632601a71efe0308f6757dc1eda34891a7e4f +size 212044 diff --git a/data/test_wavs/librispeech/1221-135766-0001.wav b/data/test_wavs/librispeech/1221-135766-0001.wav new file mode 100644 index 0000000000000000000000000000000000000000..32f8e24ed1c40a1ea1039728b40742541b37716f --- /dev/null +++ b/data/test_wavs/librispeech/1221-135766-0001.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5143a6ba93c4b274e2c4ac22deb75c2c48936c853f0519add1de828b6c79cc5a +size 534924 diff --git a/data/test_wavs/librispeech/1221-135766-0002.wav b/data/test_wavs/librispeech/1221-135766-0002.wav new file mode 100644 index 0000000000000000000000000000000000000000..0f4ab4796500e2a529063deb400e32adea91f1f0 --- /dev/null +++ b/data/test_wavs/librispeech/1221-135766-0002.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65b222837919ccbb924a4e1077413ea7cc6af3e68b663b012a9539d5c05850f0 +size 154444 diff --git a/data/test_wavs/librispeech/README.md b/data/test_wavs/librispeech/README.md new file mode 100644 index 0000000000000000000000000000000000000000..742b4ce2095a2f0088388c69a70691de91db49b9 --- /dev/null +++ b/data/test_wavs/librispeech/README.md @@ -0,0 +1,2 @@ +Files are downloaded from +https://huggingface.co/csukuangfj/icefall-asr-librispeech-pruned-transducer-stateless5-2022-05-13/tree/main/test_wavs diff --git a/data/test_wavs/librispeech/trans.txt b/data/test_wavs/librispeech/trans.txt new file mode 100644 index 0000000000000000000000000000000000000000..989b907e299fbc3a4523e3485c07580428ffac50 --- /dev/null +++ b/data/test_wavs/librispeech/trans.txt @@ -0,0 +1,3 @@ +1089-134686-0001 AFTER EARLY NIGHTFALL THE YELLOW LAMPS WOULD LIGHT UP HERE AND THERE THE SQUALID QUARTER OF THE BROTHELS +1221-135766-0001 GOD AS A DIRECT CONSEQUENCE OF THE SIN WHICH MAN THUS PUNISHED HAD GIVEN HER A LOVELY CHILD WHOSE PLACE WAS ON THAT SAME DISHONOURED BOSOM TO CONNECT HER PARENT FOR EVER WITH THE RACE AND DESCENT OF MORTALS AND TO BE FINALLY A BLESSED SOUL IN HEAVEN +1221-135766-0002 YET THESE THOUGHTS AFFECTED HESTER PRYNNE LESS WITH HOPE THAN APPREHENSION diff --git a/data/test_wavs/paraformer-zh/si_chuan_hua.wav b/data/test_wavs/paraformer-zh/si_chuan_hua.wav new file mode 100644 index 0000000000000000000000000000000000000000..bef94074c0a92f5885684ef4db9bb2f5c5402f35 --- /dev/null +++ b/data/test_wavs/paraformer-zh/si_chuan_hua.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150b75ada9f5b4011018e961e56427e4af6849fcc69764321556586bc4790c49 +size 250764 diff --git a/data/test_wavs/paraformer-zh/tian_jin_hua.wav b/data/test_wavs/paraformer-zh/tian_jin_hua.wav new file mode 100644 index 0000000000000000000000000000000000000000..63f7275d942967d9db5c77d760989ea177980a2a --- /dev/null +++ b/data/test_wavs/paraformer-zh/tian_jin_hua.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1127451bad4c45953a5b788ab4977170388e91454ef90fee55754c4587628782 +size 249932 diff --git a/data/test_wavs/paraformer-zh/zheng_zhou_hua.wav b/data/test_wavs/paraformer-zh/zheng_zhou_hua.wav new file mode 100644 index 0000000000000000000000000000000000000000..378c56dc3acedaca363c493ff48f5cb3ef334036 --- /dev/null +++ b/data/test_wavs/paraformer-zh/zheng_zhou_hua.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed767dc9a89489888060c65bc246e702b2ab25e16977998be10edc459c9e4397 +size 255724 diff --git a/data/test_wavs/russian/russian-i-love-you.wav b/data/test_wavs/russian/russian-i-love-you.wav new file mode 100644 index 0000000000000000000000000000000000000000..cbc1722c5c48ab647cb9212aa9a3fc0bb806296e --- /dev/null +++ b/data/test_wavs/russian/russian-i-love-you.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ac4f6e5b818ec89bdd884f60637daa32ef0ed19a11981b7e02e3e7799dfd79 +size 295758 diff --git a/data/test_wavs/russian/test.wav b/data/test_wavs/russian/test.wav new file mode 100644 index 0000000000000000000000000000000000000000..d2ca4aba0268846f57bed312d9068485386611e1 --- /dev/null +++ b/data/test_wavs/russian/test.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e768803b3bc3afcb08326677f3bb872c9beeed29af40d3579bcc14e74484f8 +size 226604 diff --git a/data/test_wavs/tal_csasr/0.wav b/data/test_wavs/tal_csasr/0.wav new file mode 100644 index 0000000000000000000000000000000000000000..1d9c8972ae4f8245d819146fafb501f3be41f3bd --- /dev/null +++ b/data/test_wavs/tal_csasr/0.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eddf384a906bd6d905c9d9d652d614def1857608b88c2eee663ceeccbb31f7a3 +size 259278 diff --git a/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_132.wav b/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_132.wav new file mode 100644 index 0000000000000000000000000000000000000000..6a72a4d7d33d069c8b858047964402c0bfb26a6e --- /dev/null +++ b/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_132.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfb42c963e623ebab31b81ff4404867d07d3102507c87ac14577c4c61663b8c +size 163244 diff --git a/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_138.wav b/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_138.wav new file mode 100644 index 0000000000000000000000000000000000000000..96c6d818f4936e39e5d11485afd441fb949fd114 --- /dev/null +++ b/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_138.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20805bcc696b9b65f3357a2508a419d4f33b81006d47e1312e219b0fad934d1d +size 150124 diff --git a/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_145.wav b/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_145.wav new file mode 100644 index 0000000000000000000000000000000000000000..9a4fa6b2c8786388906257d56aa64b9db4e38653 --- /dev/null +++ b/data/test_wavs/tal_csasr/210_36476_210_8341_1_1533271973_7057520_145.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5851e31f3e8e5f741635da9466e19fccfbabd117ebcdc92db242c92483aee064 +size 282604 diff --git a/data/test_wavs/tal_csasr/README.md b/data/test_wavs/tal_csasr/README.md new file mode 100644 index 0000000000000000000000000000000000000000..db5ddd2a6a60da4a0780c5634aa9c0b1cea16c62 --- /dev/null +++ b/data/test_wavs/tal_csasr/README.md @@ -0,0 +1,2 @@ +Files are downloaded from +https://huggingface.co/luomingshuang/icefall_asr_tal-csasr_pruned_transducer_stateless5/tree/main/test_wavs diff --git a/data/test_wavs/tedlium3/DanBarber_2010-219.wav b/data/test_wavs/tedlium3/DanBarber_2010-219.wav new file mode 100644 index 0000000000000000000000000000000000000000..a86439e1a6d3215829cbe0c3b4d904c86e20c8c6 --- /dev/null +++ b/data/test_wavs/tedlium3/DanBarber_2010-219.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:667b031ad4f6ca87c00a152fe8d0005f6e703465662ed87815cb53d2e74a9bb1 +size 116908 diff --git a/data/test_wavs/tedlium3/DanielKahneman_2010-157.wav b/data/test_wavs/tedlium3/DanielKahneman_2010-157.wav new file mode 100644 index 0000000000000000000000000000000000000000..bc5ce7e4294292817fbc5f0f9b42d10ed2192a2b --- /dev/null +++ b/data/test_wavs/tedlium3/DanielKahneman_2010-157.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38adf05dc46341aac948d7d43f5dfc9d8a3627989dbe9d43ab8548fa060612d9 +size 403564 diff --git a/data/test_wavs/tedlium3/RobertGupta_2010U-15.wav b/data/test_wavs/tedlium3/RobertGupta_2010U-15.wav new file mode 100644 index 0000000000000000000000000000000000000000..fba230219ebcbb680809b672e6de7085f03468dc --- /dev/null +++ b/data/test_wavs/tedlium3/RobertGupta_2010U-15.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abadb1c7a252fd1c5781f8ee0a4378db9ec99924048b594b30b416dd2cf2013a +size 554604 diff --git a/data/test_wavs/tedlium3/trans.txt b/data/test_wavs/tedlium3/trans.txt new file mode 100644 index 0000000000000000000000000000000000000000..8304a08e4b93bc00828f35749fd6fa40c7f0ff39 --- /dev/null +++ b/data/test_wavs/tedlium3/trans.txt @@ -0,0 +1,3 @@ +DanBarber_2010-219 well the last year this property had six hundred thousand birds on it +RobertGupta_2010U-15 and he was talking about invisible demons and smoke and how someone was poisoning him in his sleep and i was afraid not for myself but i was afraid that i was going to lose him that he was going to sink into one of his states +DanielKahneman_2010-157 goes very different ways depending on how you think and whether you think of the remembering self or you think of the experiencing self this is going to influence policy i think in years to come in the united states efforts are being made diff --git a/data/test_wavs/tibetan/a_0_cacm-A70_31116.wav b/data/test_wavs/tibetan/a_0_cacm-A70_31116.wav new file mode 100644 index 0000000000000000000000000000000000000000..49fc3f50fe282ed973ddd5f2da0a9f6a16340025 --- /dev/null +++ b/data/test_wavs/tibetan/a_0_cacm-A70_31116.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4887c92e193a422cdb44306d807b7cfb5077bb4474e1449342974a9510f9549e +size 97358 diff --git a/data/test_wavs/tibetan/a_0_cacm-A70_31117.wav b/data/test_wavs/tibetan/a_0_cacm-A70_31117.wav new file mode 100644 index 0000000000000000000000000000000000000000..a982875c3adc8fc76fabd7a07f2d12c2ed5c5285 --- /dev/null +++ b/data/test_wavs/tibetan/a_0_cacm-A70_31117.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d335c49df8536f106c062e3b9a44da9085f02da76fdebee784e261eb0097d94c +size 128078 diff --git a/data/test_wavs/tibetan/a_0_cacm-A70_31118.wav b/data/test_wavs/tibetan/a_0_cacm-A70_31118.wav new file mode 100644 index 0000000000000000000000000000000000000000..9a9175dcff98f19a572e842b9a3479c4840cdf6d --- /dev/null +++ b/data/test_wavs/tibetan/a_0_cacm-A70_31118.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a15845fba46c12d8afca1203ad0a66f29e2a614bfe555ec8d1807b0eaddbfd30 +size 87118 diff --git a/data/test_wavs/tibetan/trans.txt b/data/test_wavs/tibetan/trans.txt new file mode 100644 index 0000000000000000000000000000000000000000..f18de4e19029cf8986f448c8662fb410d274c3b1 --- /dev/null +++ b/data/test_wavs/tibetan/trans.txt @@ -0,0 +1,3 @@ +a_0_cacm-A70_31116.wav ལོ བཅུ ཙམ མ འདང བའི དུས སྐབས ནང +a_0_cacm-A70_31117.wav དྲག པོའི ངོ ལོག ཟིང འཁྲུག སྒྲིག འཛུགས དང ངན བཀོད བྱས ཡོད +a_0_cacm-A70_31118.wav གནས བབ འདིའི རིགས གང མགྱོགས འགྱུར བ གཏོང དགོས diff --git a/data/test_wavs/wenetspeech/DEV_T0000000000.opus b/data/test_wavs/wenetspeech/DEV_T0000000000.opus new file mode 100644 index 0000000000000000000000000000000000000000..ee3daf1d6d01806a3c7174ddb1fab6118d968c39 Binary files /dev/null and b/data/test_wavs/wenetspeech/DEV_T0000000000.opus differ diff --git a/data/test_wavs/wenetspeech/DEV_T0000000001.opus b/data/test_wavs/wenetspeech/DEV_T0000000001.opus new file mode 100644 index 0000000000000000000000000000000000000000..bfc1918ab32efb8a6ade1f011819b550ade9d20c Binary files /dev/null and b/data/test_wavs/wenetspeech/DEV_T0000000001.opus differ diff --git a/data/test_wavs/wenetspeech/DEV_T0000000002.opus b/data/test_wavs/wenetspeech/DEV_T0000000002.opus new file mode 100644 index 0000000000000000000000000000000000000000..91633d8604f276048f7af56f31484e881eb913d4 Binary files /dev/null and b/data/test_wavs/wenetspeech/DEV_T0000000002.opus differ diff --git a/data/test_wavs/wenetspeech/README.md b/data/test_wavs/wenetspeech/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0b30e3076a22a71cd4d216649170f2b0af3e2415 --- /dev/null +++ b/data/test_wavs/wenetspeech/README.md @@ -0,0 +1,2 @@ +Files are downloaded from +https://huggingface.co/luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2/tree/main/test_wavs diff --git a/data/wheels/k2-1.23.4.dev20230130+cpu.torch1.13.1-cp38-cp38-linux_x86_64.whl b/data/wheels/k2-1.23.4.dev20230130+cpu.torch1.13.1-cp38-cp38-linux_x86_64.whl new file mode 100644 index 0000000000000000000000000000000000000000..177d8ca9a31311f8fa176e5de09b5dfe165a1065 --- /dev/null +++ b/data/wheels/k2-1.23.4.dev20230130+cpu.torch1.13.1-cp38-cp38-linux_x86_64.whl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeaf1478d432d93b05f033239c35d9ce2560586afc50ba2360224a4cd672d8a6 +size 2548838 diff --git a/data/wheels/k2_sherpa-1.1-cp38-cp38-linux_x86_64.whl b/data/wheels/k2_sherpa-1.1-cp38-cp38-linux_x86_64.whl new file mode 100644 index 0000000000000000000000000000000000000000..f1a4d5ea6f4681750b87461ba29a481dfd5340a8 --- /dev/null +++ b/data/wheels/k2_sherpa-1.1-cp38-cp38-linux_x86_64.whl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f45aa154c3488377853d1e5ed844287e04db6037bd5d1954a11521e3498a2d4 +size 3593277 diff --git a/data/wheels/kaldifeat-1.22-cp38-cp38-linux_x86_64.whl b/data/wheels/kaldifeat-1.22-cp38-cp38-linux_x86_64.whl new file mode 100644 index 0000000000000000000000000000000000000000..aa9af5c912a31d23d27e865c1326c8d2709b2eff --- /dev/null +++ b/data/wheels/kaldifeat-1.22-cp38-cp38-linux_x86_64.whl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef6fcda05193072b861dc657e4157a3ae74b191ead2b394c86895dc51ae38206 +size 268297