|
import ffmpeg |
|
import numpy as np |
|
import re |
|
import unicodedata |
|
|
|
|
|
def load_audio(file, sampling_rate):
    """Decode an audio file into a flat float32 NumPy array using ffmpeg.

    Args:
        file: Path of the audio file. Leading/trailing spaces, double quotes
            and newlines are stripped before the path is handed to ffmpeg.
        sampling_rate: Output sample rate, forwarded to ffmpeg as ``ar``.

    Returns:
        A one-dimensional ``np.float32`` array built from ffmpeg's raw
        ``f32le`` output (ffmpeg is asked for a single channel, ``ac=1``).

    Raises:
        RuntimeError: If cleaning the path or running ffmpeg fails. The
            original exception is attached as ``__cause__``.
    """
    try:
        # Kept inside the ``try`` on purpose: a non-string ``file`` must keep
        # surfacing as RuntimeError, which is what callers already catch.
        file = file.strip(" ").strip('"').strip("\n").strip('"').strip(" ")
        out, _ = (
            ffmpeg.input(file, threads=0)
            .output("-", format="f32le", acodec="pcm_f32le", ac=1, ar=sampling_rate)
            .run(cmd=["ffmpeg", "-nostdin"], capture_stdout=True, capture_stderr=True)
        )
    except Exception as error:
        # Chain explicitly so the underlying exception (and whatever
        # attributes it carries) stays reachable through ``__cause__``.
        raise RuntimeError(f"Failed to load audio: {error}") from error

    return np.frombuffer(out, np.float32).flatten()
|
|
|
|
|
def format_title(title):
    """Turn a title into an ASCII-only, underscore-separated string.

    Steps, in order:
      1. NFKD-normalise and drop every character that cannot be encoded as
         ASCII (accented letters keep their base letter, other non-ASCII
         symbols disappear).
      2. Remove every character that is not a word character, whitespace,
         a dot or a hyphen.
      3. Replace each run of whitespace with a single underscore.

    Leading and trailing whitespace is not trimmed, so it becomes an
    underscore as well.

    Args:
        title: The text to sanitise.

    Returns:
        The sanitised string; empty input yields an empty string.
    """
    ascii_title = (
        unicodedata.normalize('NFKD', title)
        .encode('ascii', 'ignore')
        .decode('utf-8')
    )
    # No separate pass for box-drawing characters (U+2500-U+257F) is needed:
    # the ASCII round-trip above has already discarded every non-ASCII code
    # point, so such a pattern could never match here.
    ascii_title = re.sub(r'[^\w\s.-]', '', ascii_title)
    return re.sub(r'\s+', '_', ascii_title)