llama-cpp: update + re-enable + gemma 4 E4B
Some checks failed
Build and Deploy / deploy (push) Failing after 20m16s
Some checks failed
Build and Deploy / deploy (push) Failing after 20m16s
This commit is contained in:
6
flake.lock
generated
6
flake.lock
generated
@@ -302,11 +302,11 @@
|
|||||||
]
|
]
|
||||||
},
|
},
|
||||||
"locked": {
|
"locked": {
|
||||||
"lastModified": 1775161985,
|
"lastModified": 1775236905,
|
||||||
"narHash": "sha256-CahR+F3hF7C5IYWooVblvlzHf2eDST0Eagu59xdY37g=",
|
"narHash": "sha256-tHshzR/k6D/r5UhJCfJ9b/mJgsbn7ODtnZrDlimhOOI=",
|
||||||
"owner": "TheTom",
|
"owner": "TheTom",
|
||||||
"repo": "llama-cpp-turboquant",
|
"repo": "llama-cpp-turboquant",
|
||||||
"rev": "63b832bc0799ba7270e695e0987d0bd2272bdc7e",
|
"rev": "bc05a6803e48f17e0f2c7a99fce9b50d03882de7",
|
||||||
"type": "github"
|
"type": "github"
|
||||||
},
|
},
|
||||||
"original": {
|
"original": {
|
||||||
|
|||||||
@@ -8,11 +8,11 @@
|
|||||||
}:
|
}:
|
||||||
{
|
{
|
||||||
services.llama-cpp = {
|
services.llama-cpp = {
|
||||||
enable = false;
|
enable = true;
|
||||||
model = toString (
|
model = toString (
|
||||||
pkgs.fetchurl {
|
pkgs.fetchurl {
|
||||||
url = "https://huggingface.co/unsloth/Qwen3.5-9B-GGUF/resolve/main/Qwen3.5-9B-Q4_K_M.gguf";
|
url = "https://huggingface.co/unsloth/gemma-4-E4B-it-GGUF/resolve/main/gemma-4-E4B-it-Q4_K_M.gguf";
|
||||||
sha256 = "03b74727a860a56338e042c4420bb3f04b2fec5734175f4cb9fa853daf52b7e8";
|
sha256 = "ced37f54b80068fe65e95c6dd79ac88cddc227e179fd1040b8f751b1e5bdf849";
|
||||||
}
|
}
|
||||||
);
|
);
|
||||||
port = service_configs.ports.private.llama_cpp.port;
|
port = service_configs.ports.private.llama_cpp.port;
|
||||||
|
|||||||
Reference in New Issue
Block a user