Spaces:

latuan
/

SRT-to-Audio

Running

App Files Files Community

latuan committed on Aug 21

Commit

fd0629f

•

1 Parent(s): e9c562f

ver 1.4

Browse files

Files changed (1) hide show

app.py +34 -5

app.py CHANGED Viewed

@@ -145,12 +145,21 @@ def read_srt(file_path):
         for i in range(0, len(lines), 4):
             if i+2 < len(lines):
-                start_time, end_time = lines[i+1].strip().split(' --> ')
                 text = lines[i+2].strip()
                 subtitles.append((start_time, end_time, text))
     return subtitles
 def time_to_seconds(time_str):
     h, m, s = time_str.split(':')
     seconds = int(h) * 3600 + int(m) * 60 + float(s.replace(',', '.'))
@@ -179,8 +188,12 @@ def generate_audio_with_pause(srt_file_path):
 def srt_to_audio_multi(srt_files):
     output_paths = []
     def process_file(srt_file):
         audio_data = generate_audio_with_pause(srt_file.name)
         output_path = os.path.join(cache_dir, f'output_{os.path.basename(srt_file.name)}.wav')
         torchaudio.save(output_path, torch.tensor(audio_data).unsqueeze(0), 16000)
@@ -189,23 +202,39 @@ def srt_to_audio_multi(srt_files):
     with concurrent.futures.ThreadPoolExecutor() as executor:
         futures = [executor.submit(process_file, srt_file) for srt_file in srt_files]
         for future in concurrent.futures.as_completed(futures):
-            output_paths.append(future.result())
     return output_paths
 # UI display
 css = '''
 #title{text-align: center}
 '''
 with gr.Blocks(css=css) as demo:
     title = gr.HTML(
         """<h1>SRT to Audio Tool</h1>""",
         elem_id="title",
     )
-    inp = gr.File(label="Upload SRT files", file_count="multiple", type="filepath")
-    out = gr.File(label="Generated Audio Files", file_count="multiple", type="filepath")
-    inp.change(fn=srt_to_audio_multi, inputs=inp, outputs=out)
 if __name__ == "__main__":
     demo.launch()

         for i in range(0, len(lines), 4):
             if i+2 < len(lines):
+                start_time, end_time = lines[i+1].strip().split('-->')
+                start_time = start_time.strip()
+                end_time = end_time.strip()
                 text = lines[i+2].strip()
                 subtitles.append((start_time, end_time, text))
     return subtitles
+def is_valid_srt(file_path):
+    try:
+        read_srt(file_path)
+        return True
+    except:
+        return False
 def time_to_seconds(time_str):
     h, m, s = time_str.split(':')
     seconds = int(h) * 3600 + int(m) * 60 + float(s.replace(',', '.'))
 def srt_to_audio_multi(srt_files):
     output_paths = []
+    invalid_files = []
     def process_file(srt_file):
+        if not is_valid_srt(srt_file.name):
+            invalid_files.append(srt_file.name)
+            return None
         audio_data = generate_audio_with_pause(srt_file.name)
         output_path = os.path.join(cache_dir, f'output_{os.path.basename(srt_file.name)}.wav')
         torchaudio.save(output_path, torch.tensor(audio_data).unsqueeze(0), 16000)
     with concurrent.futures.ThreadPoolExecutor() as executor:
         futures = [executor.submit(process_file, srt_file) for srt_file in srt_files]
         for future in concurrent.futures.as_completed(futures):
+            result = future.result()
+            if result:
+                output_paths.append(result)
+    if invalid_files:
+        raise ValueError(f"Invalid SRT files: {', '.join(invalid_files)}")
     return output_paths
+# Initialize model
+model = Model(
+    model_name=default_model_name,
+    speaker_url=""
+)
 # UI display
 css = '''
 #title{text-align: center}
+#container{display: flex; justify-content: space-between; align-items: center;}
 '''
 with gr.Blocks(css=css) as demo:
     title = gr.HTML(
         """<h1>SRT to Audio Tool</h1>""",
         elem_id="title",
     )
+    with gr.Row(elem_id="container"):
+        inp = gr.File(label="Upload SRT files", file_count="multiple", type="filepath")
+        out = gr.File(label="Generated Audio Files", file_count="multiple", type="filepath")
+    btn = gr.Button("Generate")
+    btn.click(fn=srt_to_audio_multi, inputs=inp, outputs=out)
 if __name__ == "__main__":
     demo.launch()