Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -88,8 +88,19 @@ def image_vision(image_input_path, prompt):
|
|
88 |
else:
|
89 |
return answer, None
|
90 |
|
91 |
-
def video_vision(video_input_path, prompt):
|
92 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
93 |
# create a question (<image> is a placeholder for the video frames)
|
94 |
question = f"<image>{prompt}"
|
95 |
result = model.predict_forward(
|
@@ -179,6 +190,7 @@ with gr.Blocks(analytics_enabled=False) as demo:
|
|
179 |
with gr.Row():
|
180 |
with gr.Column():
|
181 |
video_input = gr.Video(label="Video IN")
|
|
|
182 |
with gr.Row():
|
183 |
vid_instruction = gr.Textbox(label="Instruction", scale=4)
|
184 |
submit_video_btn = gr.Button("Submit", scale=1)
|
@@ -188,7 +200,7 @@ with gr.Blocks(analytics_enabled=False) as demo:
|
|
188 |
|
189 |
submit_video_btn.click(
|
190 |
fn = video_vision,
|
191 |
-
inputs = [video_input, vid_instruction],
|
192 |
outputs = [vid_output_res, output_video]
|
193 |
)
|
194 |
|
|
|
88 |
else:
|
89 |
return answer, None
|
90 |
|
91 |
+
def video_vision(video_input_path, prompt, video_interval):
|
92 |
+
# Open the original video
|
93 |
+
cap = cv2.VideoCapture(input_video_path)
|
94 |
+
|
95 |
+
# Get original video properties
|
96 |
+
original_fps = cap.get(cv2.CAP_PROP_FPS)
|
97 |
+
|
98 |
+
frame_skip_factor = video_interval
|
99 |
+
|
100 |
+
# Calculate new FPS
|
101 |
+
new_fps = original_fps / frame_skip_factor
|
102 |
+
|
103 |
+
vid_frames, image_paths = read_video(video_input_path, video_interval)
|
104 |
# create a question (<image> is a placeholder for the video frames)
|
105 |
question = f"<image>{prompt}"
|
106 |
result = model.predict_forward(
|
|
|
190 |
with gr.Row():
|
191 |
with gr.Column():
|
192 |
video_input = gr.Video(label="Video IN")
|
193 |
+
frame_interval = gr.Slider(label="Frame interval", minimum=1, maximum=12, value=6)
|
194 |
with gr.Row():
|
195 |
vid_instruction = gr.Textbox(label="Instruction", scale=4)
|
196 |
submit_video_btn = gr.Button("Submit", scale=1)
|
|
|
200 |
|
201 |
submit_video_btn.click(
|
202 |
fn = video_vision,
|
203 |
+
inputs = [video_input, vid_instruction, frame_interval],
|
204 |
outputs = [vid_output_res, output_video]
|
205 |
)
|
206 |
|