|   | Model | Size |
|---|---|---|
| 1 | OpenAI Whisper API | API |
| 2 | OpenAI Large-V2 | 2.67GB |
| 3 | OpenAI Large | 2.67GB |
| 4 | OpenAI Medium | 1.42GB |
| 5 | OpenAI Small | 461MB |
| 6 | wav2vec2-large-xlsr-53-english | 1.26GB |
|   | Model | Audio1(storybook 27s) | Audio2(recording myself 27s) | Audio3(interview 27s) |
|---|---|---|---|---|
| 1 | OpenAI Whisper API | 2.087933 | 3.922523 | 5.703697 |
| 2 | OpenAI Large-V2 | 7.058776 | 5.123279 | 5.159456 |
| 3 | OpenAI Large | 7.487110 | 5.103006 | 5.136639 |
| 4 | OpenAI Medium | 4.867929 | 3.682481 | 4.072536 |
| 5 | OpenAI Small | 2.767450 | 1.943316 | 2.037943 |
| 6 | wav2vec2-large-xlsr-53-english | 10.434880 | 9.464190 | 9.232625 |
|   | Model | Audio1(storybook 27s) | Audio2(recording myself 27s) | Audio3(interview 27s) |
|---|---|---|---|---|
| 1 | OpenAI Whisper API | 0.0000 | 0.36 | 0.808333 |
| 2 | OpenAI Large-V2 | 0.0125 | 0.36 | 0.808333 |
| 3 | OpenAI Large | 0.0125 | 0.36 | 0.808333 |
| 4 | OpenAI Medium | 0.0125 | 0.38 | 0.829167 |
| 5 | OpenAI Small | 0.0375 | 0.37 | 0.829167 |
| 6 | wav2vec2-large-xlsr-53-english | 0.3250 | 0.53 | 0.933333 |