Update app.py
Browse files
app.py
CHANGED
|
@@ -504,7 +504,7 @@ def load_llama_model(model_path, enable_thinking):
|
|
| 504 |
mul_mat_q=True,
|
| 505 |
use_mmap=True,
|
| 506 |
chat_handler=Qwen35ChatHandler(
|
| 507 |
-
clip_model_path=f"models/mmproj-
|
| 508 |
# force_reasoning=True,
|
| 509 |
enable_thinking=enable_thinking ,
|
| 510 |
image_min_tokens=1024, # Note: Qwen-VL models require at minimum 1024 image tokens to function correctly on bbox grounding tasks
|
|
|
|
| 504 |
mul_mat_q=True,
|
| 505 |
use_mmap=True,
|
| 506 |
chat_handler=Qwen35ChatHandler(
|
| 507 |
+
clip_model_path=f"models/mmproj-F32.gguf",
|
| 508 |
# force_reasoning=True,
|
| 509 |
enable_thinking=enable_thinking ,
|
| 510 |
image_min_tokens=1024, # Note: Qwen-VL models require at minimum 1024 image tokens to function correctly on bbox grounding tasks
|