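# Spaces: Runtime error
# (The line above appears to be a status banner captured from the hosting
# page together with the source; it is not part of the program.)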
import gradio as gr | |
import numpy as np | |
import pandas as pd | |
import csv | |
import librosa | |
import tensorflow as tf | |
# Leftover notebook shell command; presumably how TTM_model.h5 was originally
# downloaded -- TODO confirm the file is shipped next to this script.
#!gdown https://drive.google.com/uc?id=1hKQdsTZ35KQmNV9Zrqg-ksTLSmPapR53
# Loaded once at import time; predict_audio reads this module-level instance.
model = tf.keras.models.load_model('TTM_model.h5')
def config_audio(audio):
    """Build the one-row feature table for a single audio recording.

    At most the first 30 seconds of ``audio`` are loaded as mono. Each
    librosa feature is then reduced to its mean over the clip: chroma STFT,
    RMS, spectral centroid, spectral bandwidth, spectral roll-off,
    zero-crossing rate, and each of 20 MFCC coefficients.

    Args:
        audio: Audio source accepted by ``librosa.load`` (the caller passes
            a file path).

    Returns:
        A ``pandas.DataFrame`` with exactly one row and 26 float columns:
        ``ChromaSTFT``, ``RMS``, ``SpectralCentroid``, ``SpectralBandwidth``,
        ``Rolloff``, ``ZeroCrossingRate`` and ``mfcc1`` .. ``mfcc20``.
    """
    print('enter2')

    n_mfcc = 20
    columns = [
        'ChromaSTFT',
        'RMS',
        'SpectralCentroid',
        'SpectralBandwidth',
        'Rolloff',
        'ZeroCrossingRate',
    ]
    columns += [f'mfcc{i}' for i in range(1, n_mfcc + 1)]

    y, sr = librosa.load(audio, mono=True, duration=30)

    # Listed in the same order as the first six entries of ``columns``.
    clip_features = [
        librosa.feature.chroma_stft(y=y, sr=sr),
        librosa.feature.rms(y=y),
        librosa.feature.spectral_centroid(y=y, sr=sr),
        librosa.feature.spectral_bandwidth(y=y, sr=sr),
        librosa.feature.spectral_rolloff(y=y, sr=sr),
        librosa.feature.zero_crossing_rate(y),
    ]
    # n_mfcc is passed explicitly so the number of coefficient rows always
    # matches the mfcc1..mfcc20 column names.
    mfcc = librosa.feature.mfcc(y=y, sr=sr, n_mfcc=n_mfcc)

    values = [float(np.mean(feature)) for feature in clip_features]
    values += [float(np.mean(coefficient)) for coefficient in mfcc]

    # The table is assembled in memory rather than through a scratch CSV at a
    # fixed path, so overlapping requests cannot overwrite each other's row.
    X_predict = pd.DataFrame([values], columns=columns)

    print('exit2')
    return X_predict
def predict_audio(audiox):
    """Score an uploaded recording against every known taal.

    Args:
        audiox: Uploaded-file object. Only its ``name`` attribute is read;
            that value is handed to ``config_audio`` as the audio source.

    Returns:
        A ``(scores, audio)`` tuple. ``scores`` maps each taal name to the
        corresponding model output as a plain ``float``; ``audio`` is the
        ``audiox.name`` value, returned unchanged.
    """
    audio = audiox.name
    print('enter1')
    X_predict = config_audio(audio)

    # NOTE(review): this order is assumed to match the order of the model's
    # outputs -- confirm against the training label encoding.
    taals = [
        'addhatrital',
        'bhajani',
        'dadra',
        'deepchandi',
        'ektal',
        'jhaptal',
        'rupak',
        'trital',
    ]
    pred = model.predict(X_predict).flatten()
    print('exit1')

    # zip pairs every label with its score by position, so all eight taals
    # (including the last one, 'trital') are reported when the model emits
    # eight values.
    scores = {taal: float(score) for taal, score in zip(taals, pred)}
    return scores, audio
# NOTE(review): neither of these component instances is passed to the
# Interface below (it uses a generic "file" input and constructs its own
# outputs). They are kept, built once each, so the module-level names stay
# defined -- confirm whether anything still needs them.
audio = gr.inputs.Audio(source="upload", optional=False)
label = gr.outputs.Label()

# predict_audio reads `.name` from its argument and returns a
# (scores, audio) pair, which feeds the Label and Audio outputs in that order.
gr.Interface(
    predict_audio,
    ["file"],
    [gr.outputs.Label(), gr.outputs.Audio()],
    description="",
    examples=[
        ["Addhatrital_Sample1.wav"], ["Addhatrital_Sample2.wav"],
        ["Bhajani_Sample1.wav"], ["Bhajani_Sample2.wav"],
        ["Dadra_Sample1.wav"], ["Dadra_Sample2.wav"],
        ["Deepchandi_Sample1.wav"], ["Deepchandi_Sample2.wav"],
        ["Ektal_Sample1.wav"], ["Ektal_Sample2.wav"],
        ["Jhaptal_Sample1.wav"], ["Jhaptal_Sample2.wav"],
        ["Rupak_Sample1.wav"], ["Rupak_Sample2.wav"],
        ["Trital_Sample1.wav"], ["Trital_Sample2.wav"],
    ],
).launch()