text-to-video

Running

App Files Files Community

bestoai committed on Nov 15, 2024

Commit

bee386d

verified ·

1 Parent(s): 80226aa

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -12

app.py CHANGED Viewed

@@ -44,22 +44,19 @@ async def text_to_speech(text, voice, rate, pitch, output_path):
 # Generate SRT file with specified lines of subtitles
 def generate_srt(words, audio_duration, srt_path, num_lines):
     with open(srt_path, 'w', encoding='utf-8') as srt_file:
-        segment_duration = audio_duration / (len(words) // (5 * num_lines))  # Average duration for each segment
-        current_time = 0
-        divisor = len(words) // (5 * num_lines)
-        if divisor == 0:
-            segment_duration = audio_duration  # Use full duration as fallback
-        else:
-            segment_duration = audio_duration / divisor  # Calculate duration per segment
         for i in range(0, len(words), 5 * num_lines):
             lines = []
             for j in range(num_lines):
-                line = ' '.join(words[i + j * 5:i + (j + 1) * 5])  # 5 words per line
                 if line:
                     lines.append(line)
             start_time = current_time
             end_time = start_time + segment_duration
@@ -70,6 +67,7 @@ def generate_srt(words, audio_duration, srt_path, num_lines):
             current_time += segment_duration
     return srt_path
 # def generate_srt(words, audio_duration, srt_path, num_lines):
 #     with open(srt_path, 'w', encoding='utf-8') as srt_file:
 #         divisor = len(words) // (5 * num_lines)
@@ -138,8 +136,19 @@ async def text_to_audio_and_srt(text, voice, rate, pitch, num_lines, output_audi
 # Gradio interface function
 def tts_interface(text, voice, rate, pitch, num_lines, output_audio_path="output_audio.mp3", output_srt_path="output_subtitle.srt"):
-    audio_path, srt_path, warning = asyncio.run(text_to_audio_and_srt(text, voice, rate, pitch, num_lines, output_audio_path, output_srt_path))
-    return audio_path, srt_path, warning
 # def tts_interface(text, voice, rate, pitch, num_lines):
 #     audio_path, srt_path, warning = asyncio.run(text_to_audio_and_srt(text, voice, rate, pitch, num_lines))
 #     return audio_path, srt_path, warning

 # Generate SRT file with specified lines of subtitles
 def generate_srt(words, audio_duration, srt_path, num_lines):
     with open(srt_path, 'w', encoding='utf-8') as srt_file:
+        total_segments = max(len(words) // (5 * num_lines), 1)  # Ensure at least one segment
+        segment_duration = audio_duration / total_segments
+        current_time = 0
         for i in range(0, len(words), 5 * num_lines):
             lines = []
             for j in range(num_lines):
+                line_start = i + j * 5
+                line_end = line_start + 5
+                line = ' '.join(words[line_start:line_end])
                 if line:
                     lines.append(line)
             start_time = current_time
             end_time = start_time + segment_duration
             current_time += segment_duration
     return srt_path
 # def generate_srt(words, audio_duration, srt_path, num_lines):
 #     with open(srt_path, 'w', encoding='utf-8') as srt_file:
 #         divisor = len(words) // (5 * num_lines)
 # Gradio interface function
 def tts_interface(text, voice, rate, pitch, num_lines, output_audio_path="output_audio.mp3", output_srt_path="output_subtitle.srt"):
+    if not text.strip():
+        return None, None, gr.Warning("Text input cannot be empty.")
+    if num_lines <= 0:
+        return None, None, gr.Warning("Number of SRT lines must be greater than zero.")
+    try:
+        audio_path, srt_path, warning = asyncio.run(
+            text_to_audio_and_srt(text, voice, rate, pitch, num_lines, output_audio_path, output_srt_path)
+        )
+        return audio_path, srt_path, warning
+    except Exception as e:
+        return None, None, gr.Warning(f"An error occurred: {e}")
 # def tts_interface(text, voice, rate, pitch, num_lines):
 #     audio_path, srt_path, warning = asyncio.run(text_to_audio_and_srt(text, voice, rate, pitch, num_lines))
 #     return audio_path, srt_path, warning