diff --git a/tools/mtmd/tests.sh b/tools/mtmd/tests.sh index 80db07837a..ed9d592e6a 100755 --- a/tools/mtmd/tests.sh +++ b/tools/mtmd/tests.sh @@ -108,6 +108,7 @@ if [ "$RUN_BIG_TESTS" = true ]; then # add_test_vision "ggml-org/Qwen2.5-VL-32B-Instruct-GGUF:Q4_K_M" # does not work on my mac M3 Ultra # add_test_vision "ggml-org/Kimi-VL-A3B-Thinking-2506-GGUF:Q4_K_M" # not always working add_test_vision "sabafallah/DeepSeek-OCR-GGUF:q8_0" -p "Free OCR." --chat-template deepseek-ocr + add_test_vision "ggml-org/GLM-4.6V-Flash-GGUF:Q4_K_M" -p "extract all texts from this image" add_test_audio "ggml-org/ultravox-v0_5-llama-3_1-8b-GGUF:Q4_K_M" add_test_audio "ggml-org/Qwen2.5-Omni-7B-GGUF:Q4_K_M" diff --git a/tools/mtmd/tests/tests-requirements.txt b/tools/mtmd/tests/tests-requirements.txt index aad4e10ae5..3134d098d6 100644 --- a/tools/mtmd/tests/tests-requirements.txt +++ b/tools/mtmd/tests/tests-requirements.txt @@ -1,3 +1,5 @@ sentence-transformers transformers tokenizers +torch +torchvision