llm: enable AVX2

This commit is contained in:
Simon Gardling 2025-03-31 12:02:38 -04:00
parent 6cc3d96362
commit 1482429a00
Signed by: titaniumtown
GPG Key ID: 9AB28AC10ECE533D

View File

@@ -34,14 +34,20 @@ in
port = service_configs.ports.llama_cpp;
host = "0.0.0.0";
package = (
optimizeWithFlags inputs.llamacpp.packages.${pkgs.system}.default [
"-O3"
"-march=znver2"
"-mtune=znver2"
]
optimizeWithFlags
(inputs.llamacpp.packages.${pkgs.system}.default.overrideAttrs (old: {
cmakeFlags = old.cmakeFlags ++ [
"-DGGML_AVX2=ON"
];
}))
[
"-O3"
"-march=znver2"
"-mtune=znver2"
]
);
extraFlags = [
"--flash-attn"
];
};