From 54808ceee4b5c5dba6578ea965e2dac196dfeaa6 Mon Sep 17 00:00:00 2001
From: Your Name
Date: Mon, 2 Mar 2026 23:59:02 +0100
Subject: [PATCH] updated models

---
Reviewer notes. This text sits after the three-dash separator, so it is
commentary only and is not part of the commit message.

What the hunks below change in modules/llama-swap.nix:
  * services.llama-swap.port goes from 8085 to 11111.
  * Model entry with alias "qwen3.5": the two dotted `macros.*` assignments
    become a single `macros = { ... }` attrset, and the hf_repo quant tag
    changes from Q2_K_L to Q2_K_XL. ngl stays 40.
  * New model entry "qwen3.5-9b": same cmd shape as its neighbours but
    without the kv_cache macro, with no aliases, and with an hf_repo that
    carries no quant tag.
  * Model entry "ministal-3-8b-reasonning": the kv_cache macro is dropped
    from cmd and the ":Q4_K_M" tag is dropped from hf_repo. The blank line
    in front of this entry is removed.

NOTE(review): "qwen3.5-9b" and the ministral entry use the ctx and ngl
macros without defining them locally; presumably they are defined at a
wider scope outside these hunks. Confirm before merging.
NOTE(review): the key "ministal-3-8b-reasonning" looks misspelled compared
with its alias "ministral" and the repo name. It is an unchanged context
line here, and presumably the name clients request, so it is left as is.
NOTE(review): author "Your Name" looks like a placeholder git identity.
Confirm user.name / user.email.
NOTE(review): leading indentation and whitespace-only lines inside the
hunks are reconstructed. If the context does not match the target file,
apply with `git apply --ignore-whitespace`.

 modules/llama-swap.nix | 18 ++++++++++++------
 1 file changed, 12 insertions(+), 6 deletions(-)

diff --git a/modules/llama-swap.nix b/modules/llama-swap.nix
index fdb142d..1218fbb 100644
--- a/modules/llama-swap.nix
+++ b/modules/llama-swap.nix
@@ -10,7 +10,7 @@
   services.llama-swap = {
     enable = true;
     package = pkgs.unstable.llama-swap;
-    port = 8085;
+    port = 11111;
     openFirewall = true;
 
     settings =
@@ -36,15 +36,21 @@
             cmd = "${llama-server} --port $\{PORT\} --host 0.0.0.0 --ctx-size $\{ctx\} -ngl $\{ngl\} $\{kv_cache\} --hf-repo $\{hf_repo\}";
             aliases = [ "qwen3.5" ];
             ttl = 900;
-            macros.hf_repo = "unsloth/Qwen3.5-35B-A3B-GGUF:Q2_K_L";
-            macros.ngl = 40;
+            macros = {
+              hf_repo = "unsloth/Qwen3.5-35B-A3B-GGUF:Q2_K_XL";
+              ngl = 40;
+            };
+          };
+          "qwen3.5-9b" = {
+            cmd = "${llama-server} --port $\{PORT\} --host 0.0.0.0 --ctx-size $\{ctx\} -ngl $\{ngl\} --hf-repo $\{hf_repo\}";
+            ttl = 900;
+            macros.hf_repo = "unsloth/Qwen3.5-9B-GGUF";
           };
-
           "ministal-3-8b-reasonning" = {
-            cmd = "${llama-server} --port $\{PORT\} --host 0.0.0.0 --ctx-size $\{ctx\} -ngl $\{ngl\} $\{kv_cache\} --hf-repo $\{hf_repo\}";
+            cmd = "${llama-server} --port $\{PORT\} --host 0.0.0.0 --ctx-size $\{ctx\} -ngl $\{ngl\} --hf-repo $\{hf_repo\}";
             aliases = [ "ministral" ];
             ttl = 900;
-            macros.hf_repo = "mistralai/Ministral-3-8B-Reasoning-2512-GGUF:Q4_K_M";
+            macros.hf_repo = "mistralai/Ministral-3-8B-Reasoning-2512-GGUF";
           };
         };
