fffiloni committed on
Commit
a945d67
·
verified ·
1 Parent(s): 13d4a9a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +17 -1
app.py CHANGED
@@ -123,6 +123,22 @@ def video_vision(video_input_path, prompt):
123
  with gr.Blocks() as demo:
124
  with gr.Column():
125
  gr.Markdown("# Sa2VA: Marrying SAM2 with LLaVA for Dense Grounded Understanding of Images and Videos")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
126
  with gr.Tab("Single Image"):
127
  with gr.Row():
128
  with gr.Column():
@@ -148,7 +164,7 @@ with gr.Blocks() as demo:
148
  submit_video_btn = gr.Button("Submit", scale=1)
149
  with gr.Column():
150
  vid_output_res = gr.Textbox(label="Response")
151
- output_video = gr.Video(label="Segmentation")
152
 
153
  submit_video_btn.click(
154
  fn = video_vision,
 
123
  with gr.Blocks() as demo:
124
  with gr.Column():
125
  gr.Markdown("# Sa2VA: Marrying SAM2 with LLaVA for Dense Grounded Understanding of Images and Videos")
126
+ gr.HTML("""
127
+ <div style="display:flex;column-gap:4px;">
128
+ <a href="https://github.com/magic-research/Sa2VA">
129
+ <img src='https://img.shields.io/badge/GitHub-Repo-blue'>
130
+ </a>
131
+ <a href="https://arxiv.org/abs/2501.04001">
132
+ <img src='https://img.shields.io/badge/ArXiv-Paper-red'>
133
+ </a>
134
+ <a href="https://huggingface.co/spaces/fffiloni/Sa2VA-simple-demo?duplicate=true">
135
+ <img src="https://huggingface.co/datasets/huggingface/badges/resolve/main/duplicate-this-space-sm.svg" alt="Duplicate this Space">
136
+ </a>
137
+ <a href="https://huggingface.co/fffiloni">
138
+ <img src="https://huggingface.co/datasets/huggingface/badges/resolve/main/follow-me-on-HF-sm-dark.svg" alt="Follow me on HF">
139
+ </a>
140
+ </div>
141
+ """)
142
  with gr.Tab("Single Image"):
143
  with gr.Row():
144
  with gr.Column():
 
164
  submit_video_btn = gr.Button("Submit", scale=1)
165
  with gr.Column():
166
  vid_output_res = gr.Textbox(label="Response")
167
+ output_video = gr.Gallery(label="Segmentation")
168
 
169
  submit_video_btn.click(
170
  fn = video_vision,