llama-cpp: fix model name
All checks were successful
Build and Deploy / deploy (push) Successful in 1m18s
All checks were successful
Build and Deploy / deploy (push) Successful in 1m18s
This commit is contained in:
@@ -9,13 +9,15 @@
|
||||
}:
|
||||
let
|
||||
cfg = config.services.llama-cpp;
|
||||
+ modelUrl = "https://huggingface.co/unsloth/gemma-4-E4B-it-GGUF/resolve/main/gemma-4-E4B-it-Q4_K_M.gguf";
|
||||
+ modelAlias = lib.removeSuffix ".gguf" (builtins.baseNameOf modelUrl);
|
||||
in
|
||||
{
|
||||
services.llama-cpp = {
|
||||
enable = true;
|
||||
model = toString (
|
||||
pkgs.fetchurl {
|
||||
- url = "https://huggingface.co/unsloth/gemma-4-E4B-it-GGUF/resolve/main/gemma-4-E4B-it-Q4_K_M.gguf";
|
||||
+ url = modelUrl;
|
||||
sha256 = "sha256-4bxEJwn+eAqksuybIsFqf83/VC8X8B7Q4yAxFNKPnzQ=";
|
||||
}
|
||||
);
|
||||
@@ -36,6 +38,8 @@ in
|
||||
"--api-key-file"
|
||||
config.age.secrets.llama-cpp-api-key.path
|
||||
"--metrics"
|
||||
+ "--alias"
|
||||
+ modelAlias
|
||||
];
|
||||
};
|
||||
|
||||
|
||||
Reference in New Issue
Block a user