Create a single function to optimize for the system
This commit is contained in:
@@ -3,7 +3,7 @@
|
||||
service_configs,
|
||||
config,
|
||||
inputs,
|
||||
optimizeWithFlags,
|
||||
optimizePackage,
|
||||
...
|
||||
}:
|
||||
{
|
||||
@@ -22,17 +22,13 @@
|
||||
port = service_configs.ports.llama_cpp;
|
||||
host = "0.0.0.0";
|
||||
package = (
|
||||
optimizeWithFlags
|
||||
(inputs.llamacpp.packages.${pkgs.system}.default.overrideAttrs (old: {
|
||||
optimizePackage (
|
||||
inputs.llamacpp.packages.${pkgs.system}.default.overrideAttrs (old: {
|
||||
cmakeFlags = old.cmakeFlags ++ [
|
||||
"-DGGML_AVX2=ON"
|
||||
];
|
||||
}))
|
||||
[
|
||||
"-O3"
|
||||
"-march=znver2"
|
||||
"-mtune=znver2"
|
||||
]
|
||||
})
|
||||
)
|
||||
);
|
||||
extraFlags = [
|
||||
"--flash-attn"
|
||||
|
||||
Reference in New Issue
Block a user