From 3979f2bb08dd003fd979549600b835dc00a56e50 Mon Sep 17 00:00:00 2001 From: Xuan-Son Nguyen Date: Mon, 6 Apr 2026 14:02:37 +0200 Subject: [PATCH] docs: add hunyuan-ocr gguf, also add test [no ci] (#21490) --- docs/multimodal.md | 1 + tools/mtmd/tests.sh | 1 + 2 files changed, 2 insertions(+) diff --git a/docs/multimodal.md b/docs/multimodal.md index f2fc1510cf..744347f626 100644 --- a/docs/multimodal.md +++ b/docs/multimodal.md @@ -37,6 +37,7 @@ llama-server -hf ggml-org/gemma-3-4b-it-GGUF --no-mmproj-offload > - PaddleOCR-VL: https://github.com/ggml-org/llama.cpp/pull/18825 > - GLM-OCR: https://github.com/ggml-org/llama.cpp/pull/19677 > - Deepseek-OCR: https://github.com/ggml-org/llama.cpp/pull/17400 +> - HunyuanOCR: https://github.com/ggml-org/llama.cpp/pull/21395 ## Pre-quantized models diff --git a/tools/mtmd/tests.sh b/tools/mtmd/tests.sh index e081bde875..d6a6b03c85 100755 --- a/tools/mtmd/tests.sh +++ b/tools/mtmd/tests.sh @@ -89,6 +89,7 @@ add_test_vision "ggml-org/LFM2-VL-450M-GGUF:Q8_0" add_test_vision "ggml-org/granite-docling-258M-GGUF:Q8_0" add_test_vision "ggml-org/LightOnOCR-1B-1025-GGUF:Q8_0" add_test_vision "ggml-org/DeepSeek-OCR-GGUF:Q8_0" -p "Free OCR." --chat-template deepseek-ocr +add_test_vision "ggml-org/HunyuanOCR-GGUF:Q8_0" -p "OCR" add_test_audio "ggml-org/ultravox-v0_5-llama-3_2-1b-GGUF:Q8_0" add_test_audio "ggml-org/Qwen2.5-Omni-3B-GGUF:Q4_K_M"