Move the Ollama environment variables from environment.variables to
services.ollama.environmentVariables; OLLAMA_NUM_PARALLEL changes from "3" to "2".

diff --git a/hosts/architect/llm.nix b/hosts/architect/llm.nix
index f337704..4e5a3c4 100644
--- a/hosts/architect/llm.nix
+++ b/hosts/architect/llm.nix
@@ -11,11 +11,6 @@ in
 {
   environment = {
     systemPackages = [ ollamaPkg ];
-    variables = {
-      OLLAMA_ORIGINS = "*";
-      OLLAMA_FLASH_ATTENTION = "1";
-      OLLAMA_NUM_PARALLEL = "3";
-    };
   };
 
   services.ollama = {
@@ -24,6 +19,11 @@ in
     enable = true;
     acceleration = "cuda";
     package = ollamaPkg;
+    environmentVariables = {
+      OLLAMA_ORIGINS = "*";
+      OLLAMA_FLASH_ATTENTION = "1";
+      OLLAMA_NUM_PARALLEL = "2";
+    };
   };
 
   architect.vhost.${frontendDomain} = {