Compare commits
2 Commits
6cc3d96362
...
d8ab4ef59c
| Author | SHA1 | Date | |
|---|---|---|---|
|
d8ab4ef59c
|
|||
|
1482429a00
|
12
flake.lock
generated
12
flake.lock
generated
@@ -200,11 +200,11 @@
|
|||||||
]
|
]
|
||||||
},
|
},
|
||||||
"locked": {
|
"locked": {
|
||||||
"lastModified": 1743424621,
|
"lastModified": 1743439256,
|
||||||
"narHash": "sha256-M4dHt10aGASKjoRtafFMJfewANh/7+O6t+ITb9oPsNY=",
|
"narHash": "sha256-eVxyPbpJuQV3qShmoerj6xzjUsB/UmNGbqP0cNBv42g=",
|
||||||
"owner": "ggml-org",
|
"owner": "ggml-org",
|
||||||
"repo": "llama.cpp",
|
"repo": "llama.cpp",
|
||||||
"rev": "a8a1f3356786cbf8bcc3422e3c8737fc33b453e7",
|
"rev": "c80a7759dab10657b9b6c3e87eef988a133b9b6a",
|
||||||
"type": "github"
|
"type": "github"
|
||||||
},
|
},
|
||||||
"original": {
|
"original": {
|
||||||
@@ -253,11 +253,11 @@
|
|||||||
},
|
},
|
||||||
"nixpkgs": {
|
"nixpkgs": {
|
||||||
"locked": {
|
"locked": {
|
||||||
"lastModified": 1743398199,
|
"lastModified": 1743445058,
|
||||||
"narHash": "sha256-Zy9o4AiBVjmswfXtw5l0YTUSEp676YKAqC9Z2d6MvI0=",
|
"narHash": "sha256-jayDP/dth0BdbFGM2C0Ny7uRHwwA0ppbB+2s23QG9Vk=",
|
||||||
"owner": "NixOS",
|
"owner": "NixOS",
|
||||||
"repo": "nixpkgs",
|
"repo": "nixpkgs",
|
||||||
"rev": "e9549075069ef5e68ddf29cb07c0e38e2a915242",
|
"rev": "e4a74fd10b211a6d8f5575a85154aac0209a8e55",
|
||||||
"type": "github"
|
"type": "github"
|
||||||
},
|
},
|
||||||
"original": {
|
"original": {
|
||||||
|
|||||||
@@ -34,14 +34,20 @@ in
|
|||||||
port = service_configs.ports.llama_cpp;
|
port = service_configs.ports.llama_cpp;
|
||||||
host = "0.0.0.0";
|
host = "0.0.0.0";
|
||||||
package = (
|
package = (
|
||||||
optimizeWithFlags inputs.llamacpp.packages.${pkgs.system}.default [
|
optimizeWithFlags
|
||||||
"-O3"
|
(inputs.llamacpp.packages.${pkgs.system}.default.overrideAttrs (old: {
|
||||||
"-march=znver2"
|
cmakeFlags = old.cmakeFlags ++ [
|
||||||
"-mtune=znver2"
|
"-DGGML_AVX2=ON"
|
||||||
]
|
];
|
||||||
|
}))
|
||||||
|
[
|
||||||
|
"-O3"
|
||||||
|
"-march=znver2"
|
||||||
|
"-mtune=znver2"
|
||||||
|
]
|
||||||
);
|
);
|
||||||
extraFlags = [
|
extraFlags = [
|
||||||
|
"--flash-attn"
|
||||||
];
|
];
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user