llm: enable AVX2
This commit is contained in:
parent
6cc3d96362
commit
1482429a00
@ -34,14 +34,20 @@ in
|
||||
port = service_configs.ports.llama_cpp;
|
||||
host = "0.0.0.0";
|
||||
package = (
|
||||
optimizeWithFlags inputs.llamacpp.packages.${pkgs.system}.default [
|
||||
"-O3"
|
||||
"-march=znver2"
|
||||
"-mtune=znver2"
|
||||
]
|
||||
optimizeWithFlags
|
||||
(inputs.llamacpp.packages.${pkgs.system}.default.overrideAttrs (old: {
|
||||
cmakeFlags = old.cmakeFlags ++ [
|
||||
"-DGGML_AVX2=ON"
|
||||
];
|
||||
}))
|
||||
[
|
||||
"-O3"
|
||||
"-march=znver2"
|
||||
"-mtune=znver2"
|
||||
]
|
||||
);
|
||||
extraFlags = [
|
||||
|
||||
"--flash-attn"
|
||||
];
|
||||
};
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user