gpt4all: use qwen 2.5 14B IQ4_XS instead

This commit is contained in:
2024-10-06 23:03:44 -04:00
parent a869b33aad
commit a78d333f96
3 changed files with 40 additions and 67 deletions

View File

@@ -1,42 +1,15 @@
{ pkgs, lib, ... }:
let
# Model list for the gpt4all setup.  Exactly one entry is active; the
# commented-out entries are alternatives kept for reference.
# Every `source` is a `pkgs.fetchurl` download pinned by its sha256, so a
# changed upstream file fails the hash check instead of being picked up.
# NOTE(review): context_length / gen_length are passed as strings here;
# presumably they are interpolated into a config file further down — confirm.
models = [
  # {
  # name = "Qwen2.5-14B-Instruct-Q4_K_S.gguf";
  # context_length = "32768";
  # gen_length = "8192";
  # source = pkgs.fetchurl {
  # url = "https://huggingface.co/bartowski/Qwen2.5-14B-Instruct-GGUF/resolve/main/Qwen2.5-14B-Instruct-Q4_K_S.gguf?download=true";
  # sha256 = "E1CmWUhMMbTXEjIRczzA3rSrVuR8qOL8BLagw7LiyZk=";
  # };
  # }
  # Previously active entry, superseded by the IQ4_XS build below.  Kept
  # commented out because an attribute set may define each attribute only
  # once: leaving both name/url/sha256 pairs live is an evaluation error.
  # {
  # name = "Replete-LLM-V2.5-Qwen-14b-Q4_K_S.gguf";
  # context_length = "32768";
  # gen_length = "8192";
  # source = pkgs.fetchurl {
  # url = "https://huggingface.co/bartowski/Replete-LLM-V2.5-Qwen-14b-GGUF/resolve/main/Replete-LLM-V2.5-Qwen-14b-Q4_K_S.gguf?download=true";
  # sha256 = "/Oa1y4WVRGQkLEt5Sxxyt5plN5+tDFblLShPhMtzs7k=";
  # };
  # }
  {
    # Active model: Qwen 2.5 14B Instruct, IQ4_XS quantization.
    name = "Qwen2.5-14B-Instruct-IQ4_XS.gguf";
    context_length = "32768";
    gen_length = "8192";
    source = pkgs.fetchurl {
      url = "https://huggingface.co/bartowski/Qwen2.5-14B-Instruct-GGUF/resolve/main/Qwen2.5-14B-Instruct-IQ4_XS.gguf?download=true";
      sha256 = "+AHt49no0qQ48MoNsqGJV4FeJ3Cf2hSZqTMjNUIHaO4=";
    };
  }
  # {
  # name = "Qwen2.5-7B-Instruct-Q6_K_L.gguf";
  # context_length = "32768";
  # gen_length = "8192";
  # source = pkgs.fetchurl {
  # url = "https://huggingface.co/bartowski/Qwen2.5-7B-Instruct-GGUF/resolve/main/Qwen2.5-7B-Instruct-Q6_K_L.gguf?download=true";
  # sha256 = "thEXN06T/UVGfzdB83jlgpG7kuTzZtz1ZUAdupAnErM=";
  # };
  # }
  # {
  # name = "Replete-LLM-V2.5-Qwen-7b-Q6_K_L.gguf";
  # context_length = "32768";
  # gen_length = "8192";
  # source = pkgs.fetchurl {
  # url = "https://huggingface.co/bartowski/Replete-LLM-V2.5-Qwen-7b-GGUF/resolve/main/Replete-LLM-V2.5-Qwen-7b-Q6_K_L.gguf?download=true";
  # sha256 = "dR7M5GKfGdiPI9mqBSH6naVr8XzuCjLLv514VYXSikg=";
  # };
  # }
];
# stolen from: https://stackoverflow.com/a/42398526
@@ -70,7 +43,7 @@ let
owner = "nomic-ai";
repo = "gpt4all";
rev = "HEAD";
sha256 = "7pUgCZJC5goMvpUNBQ3ssmwdWt3TnaQQ7RF98VdYzM8=";
sha256 = "YM/RdxklwIsTjD6xahZIcQoMnoabsmpQwDPEihm+h8A=";
};
patches = old.patches ++ [