From d76ccbe5645eb71e3ee40ec6ec02d35b519944ea Mon Sep 17 00:00:00 2001
From: Giulio De Pasquale
Date: Tue, 4 Jun 2024 22:50:49 +0100
Subject: [PATCH] feat(ollama): configure environment variables for ollama service

- Updated `services.ollama` to include `environmentVariables` object
- Configured `OLLAMA_ORIGINS`, `OLLAMA_FLASH_ATTENTION`, and `OLLAMA_NUM_PARALLEL` variables
- Changed the value of `OLLAMA_NUM_PARALLEL` to "2" from "3"
---
Note (review): this patch was recovered from a copy in which all line breaks
and leading whitespace had been collapsed onto one line. Line structure was
rebuilt from the hunk headers (-11,11 +11,6 and -24,6 +19,11); indentation of
the hunk lines and the position of the blank context lines are reconstructed
and should be confirmed against hosts/architect/llm.nix. If context fails to
match, try `git apply --ignore-whitespace`.

 hosts/architect/llm.nix | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/hosts/architect/llm.nix b/hosts/architect/llm.nix
index f337704..4e5a3c4 100644
--- a/hosts/architect/llm.nix
+++ b/hosts/architect/llm.nix
@@ -11,11 +11,6 @@ in
 {
   environment = {
     systemPackages = [ ollamaPkg ];
-    variables = {
-      OLLAMA_ORIGINS = "*";
-      OLLAMA_FLASH_ATTENTION = "1";
-      OLLAMA_NUM_PARALLEL = "3";
-    };
   };
 
   services.ollama = {
@@ -24,6 +19,11 @@ in
     enable = true;
     acceleration = "cuda";
     package = ollamaPkg;
+    environmentVariables = {
+      OLLAMA_ORIGINS = "*";
+      OLLAMA_FLASH_ATTENTION = "1";
+      OLLAMA_NUM_PARALLEL = "2";
+    };
   };
 
   architect.vhost.${frontendDomain} = {