subtify / concat_transcriptions.py
Maximofn's picture
Add progress bar to concatenate transcriptions script
96bc450
raw
history blame
3.89 kB
import argparse
import re
from tqdm import tqdm
def sum_seconds(time, seconds):
    """Shift an SRT timestamp forward by a number of seconds.

    The arithmetic is done in integer milliseconds so that the result never
    suffers from float formatting artifacts and the millisecond field is
    always emitted with exactly three digits.

    Args:
        time: Timestamp in ``hh:mm:ss,mmm`` format.
        seconds: Offset to add, in seconds. May be fractional; the fractional
            part is rounded to the nearest millisecond.

    Returns:
        The shifted timestamp in ``hh:mm:ss,mmm`` format.

    Raises:
        IndexError: If ``time`` lacks the ``,`` separator or one of the
            ``:`` separated fields.
        ValueError: If a field of ``time`` is not an integer.
    """
    # Parse the timestamp into a total number of milliseconds
    parts = time.split(",")
    millis_field = int(parts[1])
    clock_fields = parts[0].split(":")
    base_seconds = (
        int(clock_fields[0]) * 3600
        + int(clock_fields[1]) * 60
        + int(clock_fields[2])
    )
    base_ms = base_seconds * 1000 + millis_field

    # Split the offset into whole seconds and a millisecond remainder
    whole, fraction = divmod(seconds, 1)
    offset_ms = int(whole) * 1000 + round(fraction * 1000)

    # Re-split the total into hh:mm:ss,mmm fields
    total_seconds, millis = divmod(base_ms + offset_ms, 1000)
    hours, remainder = divmod(total_seconds, 3600)
    minutes, secs = divmod(remainder, 60)

    # ":03d" keeps leading/trailing zeros (e.g. 500 ms -> "500", 5 ms -> "005")
    return f"{hours:02d}:{minutes:02d}:{secs:02d},{millis:03d}"
def hmsms_to_seconds(time):
    """Convert an ``hh:mm:ss,mmm`` timestamp into seconds.

    Args:
        time: Timestamp string whose clock part and millisecond part are
            separated by a comma.

    Returns:
        The timestamp expressed in seconds, as a float.
    """
    pieces = time.split(",")
    clock_fields = pieces[0].split(":")
    millis_text = pieces[1]

    # Whole seconds contributed by the hours, minutes and seconds fields
    whole_seconds = (
        int(clock_fields[0]) * 3600
        + int(clock_fields[1]) * 60
        + int(clock_fields[2])
    )

    # Milliseconds become the fractional part
    return whole_seconds + int(millis_text) / 1000
def concatenate_transcriptions(chunk_files, seconds):
    """Merge the per-chunk SRT transcriptions into one SRT file.

    For every chunk path listed in ``chunk_files`` the matching
    ``transcriptions/<chunk name>.srt`` file is read. Timing lines are shifted
    by ``index * seconds`` (``index`` being the chunk's position in the list)
    and cue numbers are rewritten so they run consecutively across chunks.
    The result is written to ``concatenated_transcriptions/<name>.srt``, where
    ``<name>`` is the last chunk's name without its final ``_<suffix>`` part.

    Args:
        chunk_files: Path to a text file with one chunk path per line.
            Blank lines are ignored.
        seconds: Duration of each chunk in seconds.

    Raises:
        ValueError: If ``chunk_files`` lists no chunk paths.
        OSError: If a transcription file cannot be read or the output file
            cannot be written.
    """
    chunk_folder = "transcriptions"
    output_folder = "concatenated_transcriptions"
    transcription_extension = "srt"

    # Compiled once; the groups capture the start and end timestamps
    timing_pattern = re.compile(
        r"(\d\d:\d\d:\d\d,\d\d\d) --> (\d\d:\d\d:\d\d,\d\d\d)"
    )
    index_pattern = re.compile(r"\d+$")

    # Read chunk files, skipping blank lines (e.g. a trailing empty line)
    with open(chunk_files, "r") as f:
        files = [entry for entry in f.read().splitlines() if entry.strip()]
    if not files:
        raise ValueError(f"No chunk files listed in {chunk_files!r}")

    # Concatenate transcriptions
    output_lines = []
    num_transcriptions = 1
    file = ""
    # The context manager guarantees the progress bar is closed, even on error
    with tqdm(total=len(files), desc='Concatenating transcriptions progress') as progress_bar:
        for i, chunk in enumerate(files):
            # Keep only the file name, without directories or extension
            file = chunk.rsplit("/", 1)[-1].rsplit(".", 1)[0]
            transcription_chunk_file = f"{chunk_folder}/{file}.{transcription_extension}"
            with open(transcription_chunk_file, "r") as f:
                transcription_chunk = f.read().splitlines()

            offset = i * seconds
            for position, line in enumerate(transcription_chunk):
                timing = timing_pattern.match(line)
                if timing:
                    # Shift start and end time; keep anything after them as is
                    start = sum_seconds(timing.group(1), offset)
                    end = sum_seconds(timing.group(2), offset)
                    output_lines.append(f"{start} --> {end}{line[timing.end():]}\n")
                    continue

                # A numeric line is a cue number only when the timing line
                # follows it; otherwise it is subtitle text that happens to be
                # a number and must be kept untouched.
                next_is_timing = (
                    position + 1 < len(transcription_chunk)
                    and timing_pattern.match(transcription_chunk[position + 1])
                )
                if index_pattern.match(line) and next_is_timing:
                    output_lines.append(f"{num_transcriptions}\n")
                    num_transcriptions += 1
                else:
                    output_lines.append(f"{line}\n")
            progress_bar.update(1)

    # Write transcription, named after the last chunk minus its "_<suffix>"
    file_split = file.split("_")[:-1]
    file = "_".join(file_split)
    output_file = f"{output_folder}/{file}.{transcription_extension}"
    with open(output_file, "w") as f:
        f.writelines(output_lines)
if __name__ == "__main__":
    # Command line: <chunk_files> <seconds> <speakers_file>
    cli = argparse.ArgumentParser()
    cli.add_argument("chunk_files", help="Path to the file containing the paths to the chunk files")
    cli.add_argument("seconds", help="Duration of each chunk in seconds")
    cli.add_argument('speakers_file', help='File with the number of speakers')
    parsed = cli.parse_args()

    chunk_files = parsed.chunk_files
    seconds = int(parsed.seconds)

    # The first line of the speakers file holds the number of speakers
    with open(parsed.speakers_file, 'r') as f:
        speaker_lines = f.read().splitlines()
    speakers = int(speaker_lines[0])

    if not speakers > 0:
        # No speaker separation: concatenate the chunk transcriptions
        concatenate_transcriptions(chunk_files, seconds)
    else:
        # Placeholder: nothing is done per speaker
        for speaker in range(speakers):
            pass