Compare commits

..

3 Commits

Author SHA1 Message Date
207722acb2 llama-cpp: update 2025-08-05 20:26:17 -07:00
80afe19a43 llama-cpp: re-enable 2025-08-05 19:56:59 -07:00
ffc079fb21 llama-cpp: use gpt-oss-20b-mxfp4 2025-08-05 19:53:20 -07:00
3 changed files with 6 additions and 6 deletions

View File

@@ -29,7 +29,7 @@
# ./services/owntracks.nix
./services/soulseek.nix
- # ./services/llama-cpp.nix
+ ./services/llama-cpp.nix
];
systemd.targets = {

6
flake.lock generated
View File

@@ -238,11 +238,11 @@
]
},
"locked": {
- "lastModified": 1754348736,
- "narHash": "sha256-rNJpXydIdOtVdbtN0A8XCgcR2+s8JP5IznEp34gy68s=",
+ "lastModified": 1754436398,
+ "narHash": "sha256-VhIDk/csS3dt2gF2iFtXe4hKZWiKzNfYwvPN2aghTOI=",
"owner": "ggml-org",
"repo": "llama.cpp",
- "rev": "ec428b02c347767f24c78111309e3f30d2ada289",
+ "rev": "9515c6131aecaccc955fdedcfe16c3e030aaefcb",
"type": "github"
},
"original": {

View File

@@ -11,8 +11,8 @@
enable = true;
model = builtins.toString (
pkgs.fetchurl {
- url = "https://huggingface.co/bartowski/deepseek-ai_DeepSeek-R1-0528-Qwen3-8B-GGUF/resolve/main/deepseek-ai_DeepSeek-R1-0528-Qwen3-8B-Q4_0.gguf";
- sha256 = "a71a983c64eb72a2b4a885993cd0675474afe7e92d72b051ab8716b23157daa0";
+ url = "https://huggingface.co/ggml-org/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-mxfp4.gguf";
+ sha256 = "52f57ab7d3df3ba9173827c1c6832e73375553a846f3e32b49f1ae2daad688d4";
}
);
port = service_configs.ports.llama_cpp;