dung-vpt-uney committed
Commit 799282e · 1 Parent(s): 51b978b

Deploy latest CoRGI Gradio demo

PROGRESS_LOG.md CHANGED
@@ -11,6 +11,7 @@
 - Authored a metadata-rich `README.md` (with Hugging Face Space front matter) so the deployed Space renders without configuration errors.
 - Updated `app.py` to fall back to `demo.queue()` when `concurrency_count` is unsupported, fixing the runtime error seen on Spaces.
 - Added ZeroGPU support: cached model/processor globals live on CUDA when available, a `@spaces.GPU`-decorated executor handles pipeline runs, and requirements now include the `spaces` SDK.
+- Introduced structured logging for the app (`app.py`) and pipeline execution to trace model loads, cache hits, and Gradio lifecycle events on Spaces.
 
 ## 2024-10-21
 - Updated default checkpoints to `Qwen/Qwen3-VL-8B-Thinking` and verified CLI/Gradio/test coverage.
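
The ZeroGPU log entry above describes a caching-plus-decorator pattern. The sketch below is a minimal illustration of that idea only; the `run_inference`/`_load` names and the exact `transformers` classes are assumptions for the example, not the repository's actual code.

```python
# Minimal sketch of the ZeroGPU pattern described in the log entry above.
# Names (_MODEL, _PROCESSOR, run_inference) and the model class are illustrative
# assumptions, not the repository's real identifiers.
import torch
import spaces
from transformers import AutoModelForVision2Seq, AutoProcessor

_MODEL = None
_PROCESSOR = None


def _load(model_id: str):
    """Cache model/processor globals; move the model to CUDA when available."""
    global _MODEL, _PROCESSOR
    if _MODEL is None:
        _PROCESSOR = AutoProcessor.from_pretrained(model_id)
        _MODEL = AutoModelForVision2Seq.from_pretrained(model_id)
        if torch.cuda.is_available():
            _MODEL = _MODEL.to("cuda")
    return _MODEL, _PROCESSOR


@spaces.GPU  # on ZeroGPU Spaces, a GPU is attached only for the duration of this call
def run_inference(image, question: str, model_id: str) -> str:
    model, processor = _load(model_id)
    inputs = processor(images=image, text=question, return_tensors="pt").to(model.device)
    output_ids = model.generate(**inputs, max_new_tokens=256)
    return processor.batch_decode(output_ids, skip_special_tokens=True)[0]
```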
app.py CHANGED
@@ -1,13 +1,34 @@
 """Hugging Face Spaces entrypoint for the CoRGI Qwen3-VL demo."""
 
+from __future__ import annotations
+
+import logging
+import os
+
 from corgi.gradio_app import build_demo
 
 
+def _configure_logging() -> logging.Logger:
+    level = os.getenv("CORGI_LOG_LEVEL", "INFO").upper()
+    logging.basicConfig(
+        level=getattr(logging, level, logging.INFO),
+        format="%(asctime)s | %(levelname)s | %(name)s | %(message)s",
+    )
+    return logging.getLogger("corgi.app")
+
+
+logger = _configure_logging()
+logger.info("Initializing Gradio demo build.")
+
 demo = build_demo()
+logger.info("Gradio Blocks created; configuring queue.")
 try: # Gradio >=4.29 supports concurrency_count
     demo = demo.queue(concurrency_count=1)
+    logger.info("Queue configured with concurrency_count=1.")
 except TypeError:
+    logger.warning("concurrency_count unsupported; falling back to default queue().")
     demo = demo.queue()
 
 if __name__ == "__main__":
+    logger.info("Launching Gradio demo.")
     demo.launch()
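
As a side note on the logging setup added above: the level is read from the `CORGI_LOG_LEVEL` environment variable and silently falls back to `INFO` for unknown names. A standalone snippet (not part of the commit) showing that behaviour:

```python
# Standalone check of the CORGI_LOG_LEVEL fallback used in _configure_logging above.
import logging
import os

os.environ["CORGI_LOG_LEVEL"] = "debug"    # any case works: .upper() is applied
print(getattr(logging, os.environ["CORGI_LOG_LEVEL"].upper(), logging.INFO))  # 10 == logging.DEBUG

os.environ["CORGI_LOG_LEVEL"] = "verbose"  # not a standard logging level name
print(getattr(logging, os.environ["CORGI_LOG_LEVEL"].upper(), logging.INFO))  # 20 == logging.INFO fallback
```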
corgi/__pycache__/gradio_app.cpython-313.pyc CHANGED
Binary files a/corgi/__pycache__/gradio_app.cpython-313.pyc and b/corgi/__pycache__/gradio_app.cpython-313.pyc differ
 
corgi/gradio_app.py CHANGED
@@ -1,5 +1,6 @@
 from __future__ import annotations
 
+import logging
 from dataclasses import dataclass
 from typing import Callable, Optional
 
@@ -23,6 +24,7 @@ class PipelineState:
 
 _PIPELINE_CACHE: dict[str, CoRGIPipeline] = {}
 _GLOBAL_FACTORY: Callable[[Optional[str]], CoRGIPipeline] | None = None
+logger = logging.getLogger("corgi.gradio_app")
 
 
 def _default_factory(model_id: Optional[str]) -> CoRGIPipeline:
@@ -33,8 +35,11 @@ def _default_factory(model_id: Optional[str]) -> CoRGIPipeline:
 def _get_pipeline(model_id: str, factory: Callable[[Optional[str]], CoRGIPipeline]) -> CoRGIPipeline:
     pipeline = _PIPELINE_CACHE.get(model_id)
     if pipeline is None:
+        logger.info("Creating new pipeline for model_id=%s", model_id)
         pipeline = factory(model_id)
         _PIPELINE_CACHE[model_id] = pipeline
+    else:
+        logger.debug("Reusing cached pipeline for model_id=%s", model_id)
     return pipeline
 
 
@@ -47,6 +52,12 @@ def _execute_pipeline(
 ) -> PipelineResult:
     factory = _GLOBAL_FACTORY or _default_factory
     pipeline = _get_pipeline(model_id, factory)
+    logger.info(
+        "Executing pipeline for model_id=%s | max_steps=%s | max_regions=%s",
+        model_id,
+        max_steps,
+        max_regions,
+    )
     return pipeline.run(
         image=image.convert("RGB"),
         question=question,
@@ -65,6 +76,7 @@ if spaces is not None:
         max_regions: int,
         model_id: str,
     ) -> PipelineResult:
+        logger.debug("Running GPU-decorated pipeline.")
         return _execute_pipeline(image, question, max_steps, max_regions, model_id)
 
 else:
@@ -131,6 +143,7 @@ def _run_pipeline(
     if not question.strip():
         return state or PipelineState(model_id=model_id or DEFAULT_MODEL_ID, pipeline=None), "Please enter a question before running the demo."
     target_model = (model_id or DEFAULT_MODEL_ID).strip() or DEFAULT_MODEL_ID
+    logger.info("Received request for model_id=%s", target_model)
     result = _execute_pipeline_gpu(
         image=image.convert("RGB"),
         question=question.strip(),
@@ -154,6 +167,7 @@ def build_demo(
     factory = pipeline_factory or _default_factory
     global _GLOBAL_FACTORY
     _GLOBAL_FACTORY = factory
+    logger.info("Registering pipeline factory %s", factory)
 
     with gr.Blocks(title="CoRGI Qwen3-VL Demo") as demo:
         state = gr.State() # stores PipelineState
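
The cache and factory hooks touched in this diff can be exercised without loading a real model. The snippet below is a hypothetical illustration that injects a stub factory and triggers the new "Creating"/"Reusing" log lines; the stub classes are invented for the example, and it relies on the `corgi.gradio_app` internals shown above.

```python
# Hypothetical snippet exercising the cache-hit logging added in this diff.
# _StubPipeline and stub_factory are invented for illustration; _get_pipeline and
# _PIPELINE_CACHE are the module internals shown above.
import logging
from corgi.gradio_app import _PIPELINE_CACHE, _get_pipeline

logging.basicConfig(level=logging.DEBUG)


class _StubPipeline:
    def run(self, **kwargs):
        return None


def stub_factory(model_id):
    return _StubPipeline()


_get_pipeline("stub-model", stub_factory)  # logs "Creating new pipeline for model_id=stub-model"
_get_pipeline("stub-model", stub_factory)  # logs "Reusing cached pipeline for model_id=stub-model" (DEBUG)
assert len(_PIPELINE_CACHE) == 1
```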