Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
|
@@ -123,6 +123,22 @@ def video_vision(video_input_path, prompt):
|
|
| 123 |
with gr.Blocks() as demo:
|
| 124 |
with gr.Column():
|
| 125 |
gr.Markdown("# Sa2VA: Marrying SAM2 with LLaVA for Dense Grounded Understanding of Images and Videos")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 126 |
with gr.Tab("Single Image"):
|
| 127 |
with gr.Row():
|
| 128 |
with gr.Column():
|
|
@@ -148,7 +164,7 @@ with gr.Blocks() as demo:
|
|
| 148 |
submit_video_btn = gr.Button("Submit", scale=1)
|
| 149 |
with gr.Column():
|
| 150 |
vid_output_res = gr.Textbox(label="Response")
|
| 151 |
-
output_video = gr.
|
| 152 |
|
| 153 |
submit_video_btn.click(
|
| 154 |
fn = video_vision,
|
|
|
|
| 123 |
with gr.Blocks() as demo:
|
| 124 |
with gr.Column():
|
| 125 |
gr.Markdown("# Sa2VA: Marrying SAM2 with LLaVA for Dense Grounded Understanding of Images and Videos")
|
| 126 |
+
gr.HTML("""
|
| 127 |
+
<div style="display:flex;column-gap:4px;">
|
| 128 |
+
<a href="https://github.com/magic-research/Sa2VA">
|
| 129 |
+
<img src='https://img.shields.io/badge/GitHub-Repo-blue'>
|
| 130 |
+
</a>
|
| 131 |
+
<a href="https://arxiv.org/abs/2501.04001">
|
| 132 |
+
<img src='https://img.shields.io/badge/ArXiv-Paper-red'>
|
| 133 |
+
</a>
|
| 134 |
+
<a href="https://huggingface.co/spaces/fffiloni/Sa2VA-simple-demo?duplicate=true">
|
| 135 |
+
<img src="https://huggingface.co/datasets/huggingface/badges/resolve/main/duplicate-this-space-sm.svg" alt="Duplicate this Space">
|
| 136 |
+
</a>
|
| 137 |
+
<a href="https://huggingface.co/fffiloni">
|
| 138 |
+
<img src="https://huggingface.co/datasets/huggingface/badges/resolve/main/follow-me-on-HF-sm-dark.svg" alt="Follow me on HF">
|
| 139 |
+
</a>
|
| 140 |
+
</div>
|
| 141 |
+
""")
|
| 142 |
with gr.Tab("Single Image"):
|
| 143 |
with gr.Row():
|
| 144 |
with gr.Column():
|
|
|
|
| 164 |
submit_video_btn = gr.Button("Submit", scale=1)
|
| 165 |
with gr.Column():
|
| 166 |
vid_output_res = gr.Textbox(label="Response")
|
| 167 |
+
output_video = gr.Gallery(label="Segmentation")
|
| 168 |
|
| 169 |
submit_video_btn.click(
|
| 170 |
fn = video_vision,
|