mirror of
https://github.com/containers/ramalama.git
synced 2026-02-05 15:47:26 +01:00
granite-code models in Ollama are malformed
To the extent that they work in Ollama but not in vanilla llama.cpp. This is sort of a workaround: pull the hf (Hugging Face) versions instead. Signed-off-by: Eric Curtin <ecurtin@redhat.com>
This commit is contained in:
@@ -1,8 +1,13 @@
|
||||
# Maps a short model name to the full, transport-prefixed model reference
# (ollama://, hf://, huggingface://) it stands for.
[shortnames]
"granite" = "ollama://granite3.1-dense"
# TOML rejects a key that is defined twice, so only one "granite-lab-8b"
# mapping may be active.
# NOTE(review): the instruct mapping below was listed first and looks like the
# superseded one; confirm, then delete this commented-out line.
# "granite-lab-8b" = "huggingface://ibm-granite/granite-8b-code-instruct-GGUF/granite-8b-code-instruct.Q4_K_M.gguf"
"granite-lab-8b" = "huggingface://ibm-granite/granite-8b-code-base-GGUF/granite-8b-code-base.Q4_K_M.gguf"
"granite:2b" = "ollama://granite3.1-dense:2b"
"granite:8b" = "ollama://granite3.1-dense:8b"
# The granite-code aliases point at Hugging Face GGUF files instead of Ollama:
# the Ollama granite-code models are reported as malformed (they load in Ollama
# but not in vanilla llama.cpp).
"granite-code" = "hf://ibm-granite/granite-3b-code-base-2k-GGUF/granite-3b-code-base.Q4_K_M.gguf"
"granite-code:3b" = "hf://ibm-granite/granite-3b-code-base-2k-GGUF/granite-3b-code-base.Q4_K_M.gguf"
"granite-code:8b" = "hf://ibm-granite/granite-8b-code-base-4k-GGUF/granite-8b-code-base.Q4_K_M.gguf"
"granite-code:20b" = "hf://ibm-granite/granite-20b-code-base-8k-GGUF/granite-20b-code-base.Q4_K_M.gguf"
"granite-code:34b" = "hf://ibm-granite/granite-34b-code-base-8k-GGUF/granite-34b-code-base.Q4_K_M.gguf"
"ibm/granite" = "ollama://granite3.1-dense:8b"
"ibm/granite:2b" = "ollama://granite3.1-dense:2b"
"smollm:135m" = "ollama://smollm:135m"
|
||||
|
||||
Reference in New Issue
Block a user