This commit is contained in:
Tristan D. 2025-04-29 09:35:03 +02:00
parent 410edddef6
commit bd572a0ccd
Signed by: tristan
SSH key fingerprint: SHA256:3RU4RLOoM8oAjFU19f1W6t8uouZbA7GWkaSW6rjp1k8
4 changed files with 12 additions and 12 deletions

4
Cargo.lock generated
View file

@ -215,7 +215,7 @@ dependencies = [
[[package]]
name = "axum-controller"
version = "0.2.2"
version = "0.2.1"
dependencies = [
"axum-controller-macros",
"axum-typed-routing",
@ -223,7 +223,7 @@ dependencies = [
[[package]]
name = "axum-controller-macros"
version = "0.2.2"
version = "0.2.1"
dependencies = [
"prettyplease",
"proc-macro2",

8
flake.lock generated
View file

@ -64,16 +64,16 @@
]
},
"locked": {
"lastModified": 1744745160,
"narHash": "sha256-tTfodLDvQslNA5irDmavbOnHsCyaQ3uQKxmsoKtrKdU=",
"lastModified": 1745868199,
"narHash": "sha256-kTy1oNcN4bNHDV7yqIOSTo/JUN4enHeqyUeVE/q4iHg=",
"owner": "ggerganov",
"repo": "llama.cpp",
"rev": "80f19b41869728eeb6a26569957b92a773a2b2c6",
"rev": "eaea3253244dc4bbe07f6cd81325847ccc6cf93e",
"type": "github"
},
"original": {
"owner": "ggerganov",
"ref": "b5142",
"ref": "b5214",
"repo": "llama.cpp",
"type": "github"
}

View file

@ -19,7 +19,7 @@
flake-parts.url = "github:hercules-ci/flake-parts";
devshell.url = "github:numtide/devshell";
llama-cpp = {
url = "github:ggerganov/llama.cpp/b5142";
url = "github:ggerganov/llama.cpp/b5214";
inputs.nixpkgs.follows = "nixpkgs";
inputs.flake-parts.follows = "flake-parts";
};

View file

@ -48,12 +48,12 @@ model_specs:
args:
ctx-size: 16384
flash-attn: true
model: /media/SanDisk/ai/models_live/mistralai_Mistral-Small-3.1-24B-Instruct-2503-IQ4_XS
model: /media/SanDisk/ai/models_live/Qwen_Qwen3-30B-A3B-Q5_K_S.gguf
gpu-layers: 9999
model-draft: /media/SanDisk/ai/models_live/Mistral-Small-3.1-DRAFT-0.5B.Q8_0.gguf
gpu-layers-draft: 9999
draft-max: 16
draft-min: 4
# model-draft: /media/SanDisk/ai/models_live/Qwen_Qwen3-0.6B-Q6_K.gguf
# gpu-layers-draft: 9999
# draft-max: 16
# draft-min: 4
# - name: "big-chat"
# port: 18082
# vram_usage: 26.5G