jaekookang committed on
Commit
9cec2f1
1 Parent(s): 63da1fa

updated logging

Browse files
gradio_asr_en_libri100_word_vs_bpe.py CHANGED
@@ -9,7 +9,6 @@ from difflib import Differ
9
  from glob import glob
10
  from loguru import logger
11
  import librosa
12
- import scipy.signal as sps
13
  import gradio as gr
14
 
15
  from espnet2.bin.asr_inference import Speech2Text
@@ -45,20 +44,10 @@ def predict(wav_file):
45
  logger.info('wav file loaded')
46
  # Load audio
47
  speech, rate = librosa.load(wav_file, sr=16000)
48
- # rate, speech = wav_file
49
- # if len(speech.shape) == 2:
50
- # speech = speech.T[0]
51
- # wav = wavio.read(wav_file)
52
- # speech = wav.data
53
- # rate = wav.rate
54
- logger.info(f'speech.shape: {speech.shape}')
55
- logger.info(f'speech.dtype: {speech.dtype}')
56
- logger.info(f'speech rate: {rate}')
57
- # speech = speech.astype('float32')
58
-
59
- # number_of_samples = round(len(speech_raw) * float(16000) / rate)
60
- # speech = sps.resample(speech_raw, number_of_samples)
61
- # speech = speech_raw.astype('float32')
62
 
63
  # Run inference
64
  W = model_word(speech)[0]
 
9
  from glob import glob
10
  from loguru import logger
11
  import librosa
 
12
  import gradio as gr
13
 
14
  from espnet2.bin.asr_inference import Speech2Text
 
44
  logger.info('wav file loaded')
45
  # Load audio
46
  speech, rate = librosa.load(wav_file, sr=16000)
47
+
48
+ logger.info(f'--- speech.shape: {speech.shape}')
49
+ logger.info(f'--- speech.dtype: {speech.dtype}')
50
+ logger.info(f'--- speech rate: {rate}')
 
 
 
 
 
 
 
 
 
 
51
 
52
  # Run inference
53
  W = model_word(speech)[0]