1
0
mirror of https://github.com/containers/ramalama.git synced 2026-02-05 15:47:26 +01:00

granite-code models in Ollama are malformed

To the extent that they work in Ollama but not in vanilla llama.cpp.

This is sort of a workaround: pull the hf versions instead.

Signed-off-by: Eric Curtin <ecurtin@redhat.com>
This commit is contained in:
Eric Curtin
2025-01-13 17:13:54 +00:00
parent cc1db3c5ed
commit da7eb54046

View File

@@ -1,8 +1,13 @@
[shortnames]
# Each entry maps a short model alias (the quoted key) to the full model
# reference it stands for. Keys stay quoted because several of them contain
# ':' or '/', which are not allowed in bare TOML keys.
"granite" = "ollama://granite3.1-dense"
# A key may be defined only once per table; only the code-base target is kept
# for this alias.
"granite-lab-8b" = "huggingface://ibm-granite/granite-8b-code-base-GGUF/granite-8b-code-base.Q4_K_M.gguf"
"granite:2b" = "ollama://granite3.1-dense:2b"
"granite:8b" = "ollama://granite3.1-dense:8b"
# The granite-code aliases deliberately point at the Hugging Face GGUF builds
# instead of Ollama: the Ollama granite-code models are malformed (they load
# in Ollama but not in vanilla llama.cpp), so this is a workaround.
# The bare "granite-code" alias resolves to the same file as "granite-code:3b".
"granite-code" = "hf://ibm-granite/granite-3b-code-base-2k-GGUF/granite-3b-code-base.Q4_K_M.gguf"
"granite-code:3b" = "hf://ibm-granite/granite-3b-code-base-2k-GGUF/granite-3b-code-base.Q4_K_M.gguf"
"granite-code:8b" = "hf://ibm-granite/granite-8b-code-base-4k-GGUF/granite-8b-code-base.Q4_K_M.gguf"
"granite-code:20b" = "hf://ibm-granite/granite-20b-code-base-8k-GGUF/granite-20b-code-base.Q4_K_M.gguf"
"granite-code:34b" = "hf://ibm-granite/granite-34b-code-base-8k-GGUF/granite-34b-code-base.Q4_K_M.gguf"
# Note: unlike "granite" (no size tag), "ibm/granite" is pinned to the 8b tag.
"ibm/granite" = "ollama://granite3.1-dense:8b"
"ibm/granite:2b" = "ollama://granite3.1-dense:2b"
"smollm:135m" = "ollama://smollm:135m"