diff --git a/configuration.nix b/configuration.nix index e944a61..34e811c 100644 --- a/configuration.nix +++ b/configuration.nix @@ -30,7 +30,7 @@ # ./services/owntracks.nix ./services/soulseek.nix - # ./services/llama-cpp.nix + ./services/llama-cpp.nix ./services/ups.nix diff --git a/services/llama-cpp.nix b/services/llama-cpp.nix index dc7a368..4301bd9 100644 --- a/services/llama-cpp.nix +++ b/services/llama-cpp.nix @@ -11,8 +11,8 @@ enable = true; model = builtins.toString ( pkgs.fetchurl { - url = "https://huggingface.co/ggml-org/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-mxfp4.gguf"; - sha256 = "be37a636aca0fc1aae0d32325f82f6b4d21495f06823b5fbc1898ae0303e9935"; + url = "https://huggingface.co/unsloth/Apriel-1.5-15b-Thinker-GGUF/resolve/main/Apriel-1.5-15b-Thinker-Q4_0.gguf"; + sha256 = "4d9439b76b6f4380ab5205617c1ef3d10b0e8897146a0a7ccb7155bca1771df7"; } ); port = service_configs.ports.llama_cpp; @@ -27,7 +27,7 @@ ); extraFlags = [ "-ngl" - "5" + "8" "-c" "16384" ];