Spaces:

prithivMLmods
/

Qwen3-VL-Outpost

Running on Zero

App Files Community

prithivMLmods committed on Oct 24

Commit

e84ad0c

verified ·

1 Parent(s): 9bd8809

update app

Browse files

Files changed (1) hide show

app.py +1 -27

app.py CHANGED Viewed

@@ -147,24 +147,6 @@ model_l = Qwen3VLForConditionalGeneration.from_pretrained(
     torch_dtype=torch.float16
 ).to(device).eval()
-# Load Qwen3-VL-2B-Thinking
-MODEL_ID_J = "Qwen/Qwen3-VL-2B-Thinking"
-processor_j = AutoProcessor.from_pretrained(MODEL_ID_J, trust_remote_code=True)
-model_j = Qwen3VLForConditionalGeneration.from_pretrained(
-    MODEL_ID_J,
-    trust_remote_code=True,
-    torch_dtype=torch.float16
-).to(device).eval()
-# Load Qwen3-VL-4B-Thinking
-MODEL_ID_T = "Qwen/Qwen3-VL-4B-Thinking"
-processor_t = AutoProcessor.from_pretrained(MODEL_ID_T, trust_remote_code=True)
-model_t = Qwen3VLForConditionalGeneration.from_pretrained(
-    MODEL_ID_T,
-    trust_remote_code=True,
-    torch_dtype=torch.float16
-).to(device).eval()
 def downsample_video(video_path):
     """
     Downsamples the video to evenly spaced frames.
@@ -205,12 +187,8 @@ def generate_image(model_name: str, text: str, image: Image.Image,
         processor, model = processor_q, model_q
     elif model_name == "Qwen3-VL-8B-Instruct":
         processor, model = processor_y, model_y
-    elif model_name == "Qwen3-VL-4B-Thinking":
-        processor, model = processor_t, model_t
     elif model_name == "Qwen3-VL-2B-Instruct":
         processor, model = processor_l, model_l
-    elif model_name == "Qwen3-VL-2B-Thinking":
-        processor, model = processor_j, model_j
     else:
         yield "Invalid model selected.", "Invalid model selected."
         return
@@ -251,12 +229,8 @@ def generate_video(model_name: str, text: str, video_path: str,
         processor, model = processor_q, model_q
     elif model_name == "Qwen3-VL-8B-Instruct":
         processor, model = processor_y, model_y
-    elif model_name == "Qwen3-VL-4B-Thinking":
-        processor, model = processor_t, model_t
     elif model_name == "Qwen3-VL-2B-Instruct":
         processor, model = processor_l, model_l
-    elif model_name == "Qwen3-VL-2B-Thinking":
-        processor, model = processor_j, model_j
     else:
         yield "Invalid model selected.", "Invalid model selected."
         return
@@ -351,7 +325,7 @@ with gr.Blocks(css=css, theme=steel_blue_theme) as demo:
                 markdown_output = gr.Markdown()
             model_choice = gr.Radio(
-                choices=["Qwen3-VL-4B-Instruct", "Qwen3-VL-8B-Instruct",  "Qwen3-VL-2B-Instruct", "Qwen3-VL-2B-Thinking", "Qwen3-VL-4B-Thinking", "Qwen2.5-VL-3B-Instruct", "Qwen2.5-VL-7B-Instruct"],
                 label="Select Model",
                 value="Qwen3-VL-4B-Instruct"
             )

     torch_dtype=torch.float16
 ).to(device).eval()
 def downsample_video(video_path):
     """
     Downsamples the video to evenly spaced frames.
         processor, model = processor_q, model_q
     elif model_name == "Qwen3-VL-8B-Instruct":
         processor, model = processor_y, model_y
     elif model_name == "Qwen3-VL-2B-Instruct":
         processor, model = processor_l, model_l
     else:
         yield "Invalid model selected.", "Invalid model selected."
         return
         processor, model = processor_q, model_q
     elif model_name == "Qwen3-VL-8B-Instruct":
         processor, model = processor_y, model_y
     elif model_name == "Qwen3-VL-2B-Instruct":
         processor, model = processor_l, model_l
     else:
         yield "Invalid model selected.", "Invalid model selected."
         return
                 markdown_output = gr.Markdown()
             model_choice = gr.Radio(
+                choices=["Qwen3-VL-4B-Instruct", "Qwen3-VL-8B-Instruct",  "Qwen3-VL-2B-Instruct", "Qwen2.5-VL-3B-Instruct", "Qwen2.5-VL-7B-Instruct"],
                 label="Select Model",
                 value="Qwen3-VL-4B-Instruct"
             )