llm: enable AVX2
This commit is contained in:
parent
6cc3d96362
commit
1482429a00
@ -34,14 +34,20 @@ in
|
|||||||
port = service_configs.ports.llama_cpp;
|
port = service_configs.ports.llama_cpp;
|
||||||
host = "0.0.0.0";
|
host = "0.0.0.0";
|
||||||
package = (
|
package = (
|
||||||
optimizeWithFlags inputs.llamacpp.packages.${pkgs.system}.default [
|
optimizeWithFlags
|
||||||
"-O3"
|
(inputs.llamacpp.packages.${pkgs.system}.default.overrideAttrs (old: {
|
||||||
"-march=znver2"
|
cmakeFlags = old.cmakeFlags ++ [
|
||||||
"-mtune=znver2"
|
"-DGGML_AVX2=ON"
|
||||||
]
|
];
|
||||||
|
}))
|
||||||
|
[
|
||||||
|
"-O3"
|
||||||
|
"-march=znver2"
|
||||||
|
"-mtune=znver2"
|
||||||
|
]
|
||||||
);
|
);
|
||||||
extraFlags = [
|
extraFlags = [
|
||||||
|
"--flash-attn"
|
||||||
];
|
];
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user