diff --git a/services/llama-cpp.nix b/services/llama-cpp.nix index c3b782a..22a766e 100644 --- a/services/llama-cpp.nix +++ b/services/llama-cpp.nix @@ -22,11 +22,13 @@ # "-ngl" # "12" "-c" - "16384" + "32768" "-ctk" "q8_0" "-ctv" - "turbo3" + "turbo4" + "-fa" + "on" ]; };