Spaces:

StarPigeon
/

ViDove

Sleeping

App Files Files Community

JiaenLiu committed on Mar 29, 2023

Commit

ff51822

1 Parent(s): 08c7492

output fixed

Browse files

Former-commit-id: 25a186c46fc6829e3f0d708612f710324154c258

Files changed (2) hide show

SRT.py +6 -6
pipeline.py +22 -7

SRT.py CHANGED Viewed

@@ -421,7 +421,7 @@ class SRT_script():
             n = 0
         return real_word, len(word)+n
-    def realtime_write_srt(self,path,range,length,idx):
         start_seg_id = range[0]
         end_seg_id = range[1]
         with open(path, "a", encoding='utf-8') as f:
@@ -429,19 +429,19 @@ class SRT_script():
             #     f.write(f'{i+idx}\n')
             #     f.write(seg.get_trans_str())
             for i, seg in enumerate(self.segments):
-                if i<range[0]-1: continue
-                if i>=range[1] + length:break
                 f.write(f'{i+idx}\n')
                 f.write(seg.get_trans_str())
         pass
-    def realtime_bilingual_write_srt(self,path,range,length,idx):
         start_seg_id = range[0]
         end_seg_id = range[1]
         with open(path, "a", encoding='utf-8') as f:
             for i, seg in enumerate(self.segments):
-                if i<range[0]-1: continue
-                if i>=range[1] + length:break
                 f.write(f'{i+idx}\n')
                 f.write(seg.get_bilingual_str())
         pass

             n = 0
         return real_word, len(word)+n
+    def realtime_write_srt(self,path,range,length, idx):
         start_seg_id = range[0]
         end_seg_id = range[1]
         with open(path, "a", encoding='utf-8') as f:
             #     f.write(f'{i+idx}\n')
             #     f.write(seg.get_trans_str())
             for i, seg in enumerate(self.segments):
+                if i<range[0]-1 : continue
+                if i>=range[1] + length :break
                 f.write(f'{i+idx}\n')
                 f.write(seg.get_trans_str())
         pass
+    def realtime_bilingual_write_srt(self,path,range, length,idx):
         start_seg_id = range[0]
         end_seg_id = range[1]
         with open(path, "a", encoding='utf-8') as f:
             for i, seg in enumerate(self.segments):
+                if i<range[0]-1 : continue
+                if i>=range[1] + length :break
                 f.write(f'{i+idx}\n')
                 f.write(seg.get_bilingual_str())
         pass

pipeline.py CHANGED Viewed

@@ -5,6 +5,7 @@ import os
 from tqdm import tqdm
 from SRT import SRT_script
 import stable_whisper
 import time
@@ -94,9 +95,17 @@ elif args.video_file is not None:
         audio_file= open(args.audio_file, "rb")
         audio_path = args.audio_file
     else:
-        os.system(f'ffmpeg -i {args.video_file} -f mp3 -ab 192000 -vn {DOWNLOAD_PATH}/audio/{VIDEO_NAME}.mp3')
-        audio_file= open(f'{DOWNLOAD_PATH}/audio/{VIDEO_NAME}.mp3', "rb")
-        audio_path = f'{DOWNLOAD_PATH}/audio/{VIDEO_NAME}.mp3'
 if not os.path.exists(f'{RESULT_PATH}/{VIDEO_NAME}'):
     os.mkdir(f'{RESULT_PATH}/{VIDEO_NAME}')
@@ -250,7 +259,11 @@ def get_response(model_name, sentence):
 # Translate and save
 for sentence, range in tqdm(zip(script_arr, range_arr)):
     # using chatgpt model
     print(f"now translating sentences {range}")
     flag = True
@@ -265,12 +278,14 @@ for sentence, range in tqdm(zip(script_arr, range_arr)):
             flag = True
     # add real-time output back and modify the post-processing by using one batch as a unit.
     srt.set_translation(translate, range, model_name)
-    add_length = srt.check_len_and_split_range(range, threshold)
-    srt.realtime_write_srt(f"{RESULT_PATH}/{VIDEO_NAME}/{VIDEO_NAME}_zh.srt",range, add_length,segidx)
     # srt.realtime_bilingual_write_srt(f"{RESULT_PATH}/{VIDEO_NAME}/{VIDEO_NAME}_bi.srt",range, add_length,segidx)
-# srt.check_len_and_split()
-# srt.write_srt_file_translate(f"{RESULT_PATH}/{VIDEO_NAME}/{VIDEO_NAME}_zh.srt")
 # srt.write_srt_file_bilingual(f"{RESULT_PATH}/{VIDEO_NAME}/{VIDEO_NAME}_bi.srt")
 if not args.only_srt:

 from tqdm import tqdm
 from SRT import SRT_script
 import stable_whisper
+import subprocess
 import time
         audio_file= open(args.audio_file, "rb")
         audio_path = args.audio_file
     else:
+        # escaped_video_path = args.video_file.replace('(', '\(').replace(')', '\)').replace(' ', '\ ')
+        # print(escaped_video_path)
+        # os.system(f'ffmpeg -i {escaped_video_path} -f mp3 -ab 192000 -vn {DOWNLOAD_PATH}/audio/{VIDEO_NAME}.mp3')
+        # audio_file= open(f'{DOWNLOAD_PATH}/audio/{VIDEO_NAME}.mp3', "rb")
+        # audio_path = f'{DOWNLOAD_PATH}/audio/{VIDEO_NAME}.mp3'
+        output_audio_path = f'{DOWNLOAD_PATH}/audio/{VIDEO_NAME}.mp3'
+        # print(video_path)
+        # print(output_audio_path)
+        subprocess.run(['ffmpeg', '-i', video_path, '-f', 'mp3', '-ab', '192000', '-vn', output_audio_path])
+        audio_file = open(output_audio_path, "rb")
+        audio_path = output_audio_path
 if not os.path.exists(f'{RESULT_PATH}/{VIDEO_NAME}'):
     os.mkdir(f'{RESULT_PATH}/{VIDEO_NAME}')
 # Translate and save
+previous_length = 0
 for sentence, range in tqdm(zip(script_arr, range_arr)):
+    # update the range based on previous length
+    range = (range[0]+previous_length, range[1]+previous_length)
     # using chatgpt model
     print(f"now translating sentences {range}")
     flag = True
             flag = True
     # add real-time output back and modify the post-processing by using one batch as a unit.
     srt.set_translation(translate, range, model_name)
+    # add_length = srt.check_len_and_split_range(range, threshold)
+    # srt.realtime_write_srt(f"{RESULT_PATH}/{VIDEO_NAME}/{VIDEO_NAME}_zh.srt",range, add_length ,segidx)
+    # # save current length as previous length
+    # previous_length = add_length
     # srt.realtime_bilingual_write_srt(f"{RESULT_PATH}/{VIDEO_NAME}/{VIDEO_NAME}_bi.srt",range, add_length,segidx)
+srt.check_len_and_split()
+srt.write_srt_file_translate(f"{RESULT_PATH}/{VIDEO_NAME}/{VIDEO_NAME}_zh.srt")
 # srt.write_srt_file_bilingual(f"{RESULT_PATH}/{VIDEO_NAME}/{VIDEO_NAME}_bi.srt")
 if not args.only_srt: