Spaces:
Running
on
Zero
Running
on
Zero
Darius Morawiec
committed on
Commit
·
449fa2a
1
Parent(s):
3d8d21b
Add download notification
Browse files
app.py
CHANGED
|
@@ -217,7 +217,9 @@ with gr.Blocks() as demo:
|
|
| 217 |
with gr.Row():
|
| 218 |
run_button = gr.Button("Run")
|
| 219 |
|
| 220 |
-
def load_model(
|
|
|
|
|
|
|
| 221 |
global current_model, current_processor, current_model_id
|
| 222 |
|
| 223 |
# Only load model if it's different from the currently loaded one
|
|
@@ -237,11 +239,17 @@ with gr.Blocks() as demo:
|
|
| 237 |
torch.cuda.empty_cache()
|
| 238 |
torch.cuda.synchronize()
|
| 239 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 240 |
current_model = AutoModel.from_pretrained(
|
| 241 |
model_id, dtype="auto", device_map="cpu"
|
| 242 |
)
|
| 243 |
current_processor = AutoProcessor.from_pretrained(model_id)
|
| 244 |
current_model_id = model_id
|
|
|
|
| 245 |
return current_model, current_processor
|
| 246 |
|
| 247 |
@spaces.GPU
|
|
@@ -342,10 +350,10 @@ with gr.Blocks() as demo:
|
|
| 342 |
image_resize: str = "Yes",
|
| 343 |
image_target_size: int | None = None,
|
| 344 |
):
|
| 345 |
-
# Load the model and processor on CPU
|
| 346 |
model, processor = load_model(model_id)
|
| 347 |
|
| 348 |
-
# Run inference on GPU
|
| 349 |
return generate(
|
| 350 |
model,
|
| 351 |
processor,
|
|
|
|
| 217 |
with gr.Row():
|
| 218 |
run_button = gr.Button("Run")
|
| 219 |
|
| 220 |
+
def load_model(
|
| 221 |
+
model_id: str,
|
| 222 |
+
):
|
| 223 |
global current_model, current_processor, current_model_id
|
| 224 |
|
| 225 |
# Only load model if it's different from the currently loaded one
|
|
|
|
| 239 |
torch.cuda.empty_cache()
|
| 240 |
torch.cuda.synchronize()
|
| 241 |
|
| 242 |
+
gr.Info(
|
| 243 |
+
f"Downloading and loading <strong>{model_id.removeprefix('Qwen/')}</strong> model files ...",
|
| 244 |
+
duration=10,
|
| 245 |
+
)
|
| 246 |
+
|
| 247 |
current_model = AutoModel.from_pretrained(
|
| 248 |
model_id, dtype="auto", device_map="cpu"
|
| 249 |
)
|
| 250 |
current_processor = AutoProcessor.from_pretrained(model_id)
|
| 251 |
current_model_id = model_id
|
| 252 |
+
|
| 253 |
return current_model, current_processor
|
| 254 |
|
| 255 |
@spaces.GPU
|
|
|
|
| 350 |
image_resize: str = "Yes",
|
| 351 |
image_target_size: int | None = None,
|
| 352 |
):
|
| 353 |
+
# Load the model and processor (on CPU)
|
| 354 |
model, processor = load_model(model_id)
|
| 355 |
|
| 356 |
+
# Run inference (on GPU *if available)
|
| 357 |
return generate(
|
| 358 |
model,
|
| 359 |
processor,
|