Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -5,7 +5,7 @@ import requests
|
|
5 |
import spaces
|
6 |
from transformers import AutoProcessor, Idefics3ForConditionalGeneration, TextIteratorStreamer, StoppingCriteria, StoppingCriteriaList
|
7 |
|
8 |
-
base_model_id = "Andres77872/SmolVLM-500M-anime-caption-v0.
|
9 |
|
10 |
processor = AutoProcessor.from_pretrained(base_model_id)
|
11 |
model = Idefics3ForConditionalGeneration.from_pretrained(
|
@@ -50,7 +50,7 @@ def caption_anime_image_stream(image):
|
|
50 |
inputs = processor(text=[prompt], images=[[image]], return_tensors='pt', padding=True, size=size)
|
51 |
inputs = {k: v.to(model.device) for k, v in inputs.items()}
|
52 |
|
53 |
-
stop_sequence = "</
|
54 |
streamer = TextIteratorStreamer(
|
55 |
processor.tokenizer,
|
56 |
skip_prompt=True,
|
@@ -64,7 +64,7 @@ def caption_anime_image_stream(image):
|
|
64 |
**inputs,
|
65 |
streamer=streamer,
|
66 |
do_sample=False,
|
67 |
-
max_new_tokens=
|
68 |
pad_token_id=processor.tokenizer.pad_token_id,
|
69 |
stopping_criteria=custom_stopping_criteria,
|
70 |
)
|
@@ -81,7 +81,7 @@ demo = gr.Interface(
|
|
81 |
caption_anime_image_stream,
|
82 |
inputs=gr.Image(type="pil", label="Anime Image"),
|
83 |
outputs=gr.Textbox(lines=8, label="Caption"),
|
84 |
-
title="SmolVLM-500M-
|
85 |
description="Upload an anime-style image to generate a caption.",
|
86 |
# Enable live streaming:
|
87 |
allow_flagging="auto",
|
|
|
5 |
import spaces
|
6 |
from transformers import AutoProcessor, Idefics3ForConditionalGeneration, TextIteratorStreamer, StoppingCriteria, StoppingCriteriaList
|
7 |
|
8 |
+
base_model_id = "Andres77872/SmolVLM-500M-anime-caption-v0.2"
|
9 |
|
10 |
processor = AutoProcessor.from_pretrained(base_model_id)
|
11 |
model = Idefics3ForConditionalGeneration.from_pretrained(
|
|
|
50 |
inputs = processor(text=[prompt], images=[[image]], return_tensors='pt', padding=True, size=size)
|
51 |
inputs = {k: v.to(model.device) for k, v in inputs.items()}
|
52 |
|
53 |
+
stop_sequence = "</RATING>"
|
54 |
streamer = TextIteratorStreamer(
|
55 |
processor.tokenizer,
|
56 |
skip_prompt=True,
|
|
|
64 |
**inputs,
|
65 |
streamer=streamer,
|
66 |
do_sample=False,
|
67 |
+
max_new_tokens=1024,
|
68 |
pad_token_id=processor.tokenizer.pad_token_id,
|
69 |
stopping_criteria=custom_stopping_criteria,
|
70 |
)
|
|
|
81 |
caption_anime_image_stream,
|
82 |
inputs=gr.Image(type="pil", label="Anime Image"),
|
83 |
outputs=gr.Textbox(lines=8, label="Caption"),
|
84 |
+
title="SmolVLM-500M-anime-caption-v0.2 Demo",
|
85 |
description="Upload an anime-style image to generate a caption.",
|
86 |
# Enable live streaming:
|
87 |
allow_flagging="auto",
|