show ffmpeg command in case of error

#6
by Aivo - opened
Files changed (2)
  1. app.py +28 -67
  2. requirements.txt +1 -1
app.py CHANGED
@@ -12,28 +12,13 @@ import tempfile
 import shlex
 import shutil
 
-# Supported models configuration
-MODELS = {
-    "deepseek-ai/DeepSeek-V3": {
-        "base_url": "https://api.deepseek.com/v1",
-        "env_key": "DEEPSEEK_API_KEY",
-    },
-    "Qwen/Qwen2.5-Coder-32B-Instruct": {
-        "base_url": "https://api-inference.huggingface.co/v1/",
-        "env_key": "HF_TOKEN",
-    },
-}
-
-# Initialize client with first available model
-client = OpenAI(
-    base_url=next(iter(MODELS.values()))["base_url"],
-    api_key=os.environ[next(iter(MODELS.values()))["env_key"]],
-)
+HF_API_KEY = os.environ["HF_TOKEN"]
+
+client = OpenAI(base_url="https://api-inference.huggingface.co/v1/", api_key=HF_API_KEY)
 
 allowed_medias = [
     ".png",
     ".jpg",
-    ".webp",
     ".jpeg",
     ".tiff",
     ".bmp",
@@ -99,7 +84,7 @@ def get_files_infos(files):
     return results
 
 
-def get_completion(prompt, files_info, top_p, temperature, model_choice):
+def get_completion(prompt, files_info, top_p, temperature):
     # Create table header
     files_info_string = "| Type | Name | Dimensions | Duration | Audio Channels |\n"
     files_info_string += "|------|------|------------|-----------|--------|\n"
@@ -167,16 +152,8 @@ YOUR FFMPEG COMMAND:
         print(msg["content"])
     print("=====================\n")
 
-    if model_choice not in MODELS:
-        raise ValueError(f"Model {model_choice} is not supported")
-
-    model_config = MODELS[model_choice]
-    client.base_url = model_config["base_url"]
-    client.api_key = os.environ[model_config["env_key"]]
-    model = "deepseek-chat" if "deepseek" in model_choice.lower() else model_choice
-
     completion = client.chat.completions.create(
-        model=model,
+        model="Qwen/Qwen2.5-Coder-32B-Instruct",
         messages=messages,
         temperature=temperature,
         top_p=top_p,
@@ -204,13 +181,7 @@ YOUR FFMPEG COMMAND:
         raise Exception("API Error")
 
 
-def update(
-    files,
-    prompt,
-    top_p=1,
-    temperature=1,
-    model_choice="Qwen/Qwen2.5-Coder-32B-Instruct",
-):
+def update(files, prompt, top_p=1, temperature=1):
     if prompt == "":
         raise gr.Error("Please enter a prompt.")
 
@@ -222,16 +193,14 @@ def update(
             raise gr.Error(
                 "Please make sure all videos are less than 2 minute long."
             )
-        if file_info["size"] > 100000000:
-            raise gr.Error("Please make sure all files are less than 100MB in size.")
+        if file_info["size"] > 10000000:
+            raise gr.Error("Please make sure all files are less than 10MB in size.")
 
     attempts = 0
     while attempts < 2:
        print("ATTEMPT", attempts)
        try:
-            command_string = get_completion(
-                prompt, files_info, top_p, temperature, model_choice
-            )
+            command_string = get_completion(prompt, files_info, top_p, temperature)
            print(
                f"""///PROMTP {prompt} \n\n/// START OF COMMAND ///:\n\n{command_string}\n\n/// END OF COMMAND ///\n\n"""
            )
@@ -283,7 +252,7 @@ with gr.Blocks() as demo:
     gr.Markdown(
         """
         # 🏞 AI Video Composer
-        Compose new videos from your assets using natural language. Add video, image and audio assets and let [Qwen2.5-Coder](https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct) or [DeepSeek-V3](https://huggingface.co/deepseek-ai/DeepSeek-V3-Base) generate a new video for you (using FFMPEG).
+        Compose new videos from your assets using natural language. Add video, image and audio assets and let [Qwen2.5-Coder](https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct) generate a new video for you (using FFMPEG).
         """,
         elem_id="header",
     )
@@ -295,16 +264,11 @@ with gr.Blocks() as demo:
                 file_types=allowed_medias,
             )
             user_prompt = gr.Textbox(
-                placeholder="eg: Remove the 3 first seconds of the video",
+                placeholder="I want to convert to a gif under 15mb",
                 label="Instructions",
             )
             btn = gr.Button("Run")
             with gr.Accordion("Parameters", open=False):
-                model_choice = gr.Radio(
-                    choices=list(MODELS.keys()),
-                    value=list(MODELS.keys())[0],
-                    label="Model",
-                )
                 top_p = gr.Slider(
                     minimum=-0,
                     maximum=1.0,
@@ -329,7 +293,7 @@ with gr.Blocks() as demo:
 
     btn.click(
         fn=update,
-        inputs=[user_files, user_prompt, top_p, temperature, model_choice],
+        inputs=[user_files, user_prompt, top_p, temperature],
         outputs=[generated_video, generated_command],
     )
     with gr.Row():
@@ -340,40 +304,37 @@ with gr.Blocks() as demo:
                     "Use the image as the background with a waveform visualization for the audio positioned in center of the video.",
                     0.7,
                     0.1,
-                    (
-                        list(MODELS.keys())[1]
-                        if len(MODELS) > 1
-                        else list(MODELS.keys())[0]
-                    ),
-                ],
-                [
-                    ["./examples/ai_talk.wav", "./examples/bg-image.png"],
-                    "Use the image as the background with a waveform visualization for the audio positioned in center of the video. Make sure the waveform has a max height of 250 pixels.",
-                    0.7,
-                    0.1,
-                    list(MODELS.keys())[0],
                 ],
                 [
                     [
+                        "./examples/cat8.jpeg",
                         "./examples/cat1.jpeg",
                         "./examples/cat2.jpeg",
                         "./examples/cat3.jpeg",
                         "./examples/cat4.jpeg",
                         "./examples/cat5.jpeg",
                         "./examples/cat6.jpeg",
+                        "./examples/cat7.jpeg",
                         "./examples/heat-wave.mp3",
                     ],
-                    "Create a 3x2 grid of the cat images with the audio as background music. Make the video duration match the audio duration.",
+                    "Generate an MP4 slideshow where each photo appears for 2 seconds, using the provided audio as soundtrack.",
+                    0.7,
+                    0.1,
+                ],
+                [
+                    ["./examples/waterfall-overlay.png", "./examples/waterfall.mp4"],
+                    "Add the overlay to the video.",
+                    0.7,
+                    0.1,
+                ],
+                [
+                    ["./examples/example.mp4"],
+                    "Make this video 10 times faster",
                     0.7,
                     0.1,
-                    (
-                        list(MODELS.keys())[1]
-                        if len(MODELS) > 1
-                        else list(MODELS.keys())[0]
-                    ),
                 ],
             ],
-            inputs=[user_files, user_prompt, top_p, temperature, model_choice],
+            inputs=[user_files, user_prompt, top_p, temperature],
             outputs=[generated_video, generated_command],
             fn=update,
             run_on_click=True,
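
For reference, the simplified client wiring this diff converges on can be exercised standalone. A minimal sketch, assuming `HF_TOKEN` is exported and `openai>=1.55.0` (per requirements.txt) is installed; the prompt below is illustrative and not taken from the app:

```python
import os

from openai import OpenAI

# OpenAI-compatible client pointed at Hugging Face's inference endpoint,
# matching the configuration in app.py after this change.
client = OpenAI(
    base_url="https://api-inference.huggingface.co/v1/",
    api_key=os.environ["HF_TOKEN"],  # assumes HF_TOKEN is set in the environment
)

# Ask Qwen2.5-Coder for a single FFmpeg command (illustrative prompt).
completion = client.chat.completions.create(
    model="Qwen/Qwen2.5-Coder-32B-Instruct",
    messages=[
        {
            "role": "user",
            "content": "Write one ffmpeg command that trims input.mp4 to its first 10 seconds.",
        }
    ],
    temperature=0.1,
    top_p=0.7,
)
print(completion.choices[0].message.content)
```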
requirements.txt CHANGED
@@ -1,3 +1,3 @@
 openai>=1.55.0
-gradio==5.9.1
+gradio==5.6.0
 moviepy==1