From d4d01d63f15e96a4fe15f637e91e6c6d4b57a8ab Mon Sep 17 00:00:00 2001 From: Simon Gardling Date: Fri, 3 Apr 2026 14:06:35 -0400 Subject: [PATCH] llama-cpp: update + re-enable + gemma 4 E4B --- flake.lock | 6 +++--- services/llama-cpp/llama-cpp.nix | 6 +++--- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/flake.lock b/flake.lock index 5e712a4..81bc859 100644 --- a/flake.lock +++ b/flake.lock @@ -302,11 +302,11 @@ ] }, "locked": { - "lastModified": 1775161985, - "narHash": "sha256-CahR+F3hF7C5IYWooVblvlzHf2eDST0Eagu59xdY37g=", + "lastModified": 1775236905, + "narHash": "sha256-tHshzR/k6D/r5UhJCfJ9b/mJgsbn7ODtnZrDlimhOOI=", "owner": "TheTom", "repo": "llama-cpp-turboquant", - "rev": "63b832bc0799ba7270e695e0987d0bd2272bdc7e", + "rev": "bc05a6803e48f17e0f2c7a99fce9b50d03882de7", "type": "github" }, "original": { diff --git a/services/llama-cpp/llama-cpp.nix b/services/llama-cpp/llama-cpp.nix index 23dee04..7cd002b 100644 --- a/services/llama-cpp/llama-cpp.nix +++ b/services/llama-cpp/llama-cpp.nix @@ -8,11 +8,11 @@ }: { services.llama-cpp = { - enable = false; + enable = true; model = toString ( pkgs.fetchurl { - url = "https://huggingface.co/unsloth/Qwen3.5-9B-GGUF/resolve/main/Qwen3.5-9B-Q4_K_M.gguf"; - sha256 = "03b74727a860a56338e042c4420bb3f04b2fec5734175f4cb9fa853daf52b7e8"; + url = "https://huggingface.co/unsloth/gemma-4-E4B-it-GGUF/resolve/main/gemma-4-E4B-it-Q4_K_M.gguf"; + sha256 = "ced37f54b80068fe65e95c6dd79ac88cddc227e179fd1040b8f751b1e5bdf849"; } ); port = service_configs.ports.private.llama_cpp.port;