Spaces:

Maximofn
/

subtify

Runtime error

App Files Files Community

subtify / concat_transcriptions.py

Maximofn

Add progress bar to concatenate transcriptions script

96bc450 about 1 year ago

raw

history blame

3.89 kB

	import argparse
	import re
	from tqdm import tqdm

	def sum_seconds(time, seconds):
	    """Shift an SRT timestamp forward by a number of seconds.

	    Args:
	        time: Timestamp string in ``hh:mm:ss,mmm`` form.
	        seconds: Offset to add, in seconds (int or float). Fractions are
	            rounded to the nearest millisecond.

	    Returns:
	        The shifted timestamp as ``hh:mm:ss,mmm``; the millisecond field is
	        always zero-padded to three digits.
	    """
	    clock, millis = time.split(",")
	    hours, minutes, secs = (int(part) for part in clock.split(":"))

	    # Work in whole milliseconds: float arithmetic followed by str() drops
	    # the zero padding of the millisecond field (e.g. 0.5 -> "5").
	    total_ms = (hours * 3600 + minutes * 60 + secs) * 1000 + int(millis)
	    total_ms += round(seconds * 1000)

	    hours, remainder = divmod(total_ms, 3_600_000)
	    minutes, remainder = divmod(remainder, 60_000)
	    secs, millis = divmod(remainder, 1000)
	    return f"{hours:02d}:{minutes:02d}:{secs:02d},{millis:03d}"

	def hmsms_to_seconds(time):
	    """Convert an ``hh:mm:ss,mmm`` timestamp to a number of seconds.

	    Args:
	        time: Timestamp string in ``hh:mm:ss,mmm`` form.

	    Returns:
	        The timestamp as seconds (float), including the millisecond part.
	    """
	    clock, millis = time.split(",")
	    hours, minutes, secs = (int(part) for part in clock.split(":"))
	    whole_seconds = hours * 3600 + minutes * 60 + secs
	    return whole_seconds + int(millis) / 1000

	def concatenate_transcriptions(chunk_files, seconds):
	    """Merge per-chunk SRT transcriptions into a single subtitle file.

	    For every chunk path listed in ``chunk_files`` the matching
	    ``transcriptions/<chunk name>.srt`` file is read, its timestamps are
	    shifted by ``chunk index * seconds`` and its subtitle indices are
	    renumbered consecutively. The result is written to
	    ``concatenated_transcriptions/<name>.srt``, where ``<name>`` is the last
	    chunk's file name without its final ``_``-separated part.

	    Args:
	        chunk_files: Path to a text file with one chunk path per line.
	        seconds: Duration of each chunk in seconds.

	    Raises:
	        ValueError: If ``chunk_files`` lists no chunk paths.
	    """
	    chunk_folder = "transcriptions"
	    output_folder = "concatenated_transcriptions"
	    transcription_extension = "srt"

	    # Compiled once; both patterns are applied to every subtitle line.
	    timestamp_pattern = re.compile(r"\d\d:\d\d:\d\d,\d\d\d --> \d\d:\d\d:\d\d,\d\d\d")
	    index_pattern = re.compile(r"\d+$")

	    # Read chunk files, ignoring blank lines in the list
	    with open(chunk_files, "r") as f:
	        files = [path for path in f.read().splitlines() if path.strip()]
	    if not files:
	        raise ValueError(f"No chunk paths found in {chunk_files!r}")

	    # Concatenate transcriptions
	    pieces = []
	    num_transcriptions = 1
	    file = ""
	    # The context manager closes the progress bar even if a chunk fails.
	    with tqdm(total=len(files), desc='Concatenating transcriptions progress') as progress_bar:
	        for i, chunk in enumerate(files):
	            # Keep only the base name without its last extension; rsplit
	            # tolerates nested directories, bare names and extra dots.
	            file = chunk.rsplit("/", 1)[-1].rsplit(".", 1)[0]
	            transcription_chunk_file = f"{chunk_folder}/{file}.{transcription_extension}"
	            with open(transcription_chunk_file, "r") as f:
	                transcription_chunk = f.read().splitlines()

	            offset = i * seconds
	            for line in transcription_chunk:
	                if timestamp_pattern.match(line):
	                    # "start --> end": shift both ends by the chunk offset
	                    start, end = line.split(" --> ")
	                    start = sum_seconds(start, offset)
	                    end = sum_seconds(end, offset)
	                    pieces.append(f"{start} --> {end}\n")
	                elif index_pattern.match(line):
	                    # Subtitle index: renumber across all chunks
	                    pieces.append(f"{num_transcriptions}\n")
	                    num_transcriptions += 1
	                else:
	                    pieces.append(f"{line}\n")
	            progress_bar.update(1)

	    # Write transcription, named after the last chunk minus its trailing
	    # "_<part>" segment
	    file = "_".join(file.split("_")[:-1])
	    output_file = f"{output_folder}/{file}.{transcription_extension}"
	    with open(output_file, "w") as f:
	        f.write("".join(pieces))

	if __name__ == "__main__":
	    # Command-line entry point: three positional arguments.
	    cli = argparse.ArgumentParser()
	    cli.add_argument("chunk_files", help="Path to the file containing the paths to the chunk files")
	    cli.add_argument("seconds", help="Duration of each chunk in seconds")
	    cli.add_argument('speakers_file', help='File with the number of speakers')
	    options = cli.parse_args()

	    chunk_files = options.chunk_files
	    seconds = int(options.seconds)

	    # The first line of the speakers file holds the speaker count.
	    with open(options.speakers_file, 'r') as f:
	        first_line = f.read().splitlines()[0]
	    speakers = int(first_line)

	    # NOTE(review): `else` is assumed to pair with `if`, not `for` - confirm.
	    if not speakers > 0:
	        concatenate_transcriptions(chunk_files, seconds)
	    else:
	        # Positive speaker count: the loop body is empty, so nothing is
	        # concatenated in this case.
	        for speaker in range(speakers):
	            pass