diff --git a/services/llama-cpp/llama-cpp.nix b/services/llama-cpp/llama-cpp.nix index df27025..1691d35 100644 --- a/services/llama-cpp/llama-cpp.nix +++ b/services/llama-cpp/llama-cpp.nix @@ -30,9 +30,9 @@ in "-c" "65536" "-ctk" - "q8_0" + "turbo3" "-ctv" - "turbo4" + "turbo3" "-fa" "on" "--api-key-file"