nixos/hosts/architect/llm.nix

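# LLM stack for this host: a GPU-backed Ollama container plus the Open WebUI
# chat frontend, both published through the local `architect.vhost`
# reverse-proxy options (assumed to be defined elsewhere in this repo).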

{ config, pkgs, ... }:

let
  domain = "pino.giugl.io";
  backendPort = 8080;
  frontendPort = 3030;
  # llama-cpp = pkgs.unstablePkgs.llama-cpp.override { cudaSupport = true; };
  # ollama = pkgs.unstablePkgs.ollama.override { inherit llama-cpp; };
in
{
  # environment.systemPackages = [ ollama ];
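
  # Reverse proxy for the chat frontend: requests to this vhost are
  # forwarded to the Open WebUI container on the Docker bridge address.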
  architect.vhost.${domain} = {
    dnsInterfaces = [ "tailscale" ];

    locations."/" = {
      host = "172.17.0.1";
      port = frontendPort;
      allowLan = true;
      allowWAN = true;
      # allow = [ config.architect.networks."tailscale".net ];
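      # Generations can run for minutes, well past nginx's default 60s
      # read timeout, so allow long upstream reads.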
      extraConfig = ''
        proxy_read_timeout 600s;
      '';
    };
  };
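
  # The raw Ollama API gets the same treatment on its own hostname.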
  architect.vhost."ollama.giugl.io" = {
    dnsInterfaces = [ "tailscale" ];

    locations."/" = {
      host = "172.17.0.1";
      port = 11434;
      allowLan = true;
      allowWAN = true;
      # allow = [ config.architect.networks."tailscale".net ];
      extraConfig = ''
        proxy_read_timeout 600s;
      '';
    };
  };
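
  # Both services run as OCI (Docker) containers rather than as native
  # NixOS services.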
  virtualisation.oci-containers = {
    containers = {
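      # Open WebUI serves the chat frontend and reaches the Ollama API
      # over the Docker bridge (172.17.0.1).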
      ollama-webui = {
        image = "ghcr.io/open-webui/open-webui:main";
        autoStart = true;

        ports = [
          "172.17.0.1:${toString frontendPort}:${toString backendPort}"
        ];

        environment = {
          PORT = toString backendPort;
          OLLAMA_API_BASE_URL = "http://172.17.0.1:11434/api";
        };
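
        # Pull the latest image on every container start so the UI keeps
        # tracking upstream's `main` tag.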
        extraOptions = [
          "--pull=always"
        ];

        volumes = [
          "/var/lib/ollama-webui:/app/backend/data"
        ];
      };
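
      # Ollama itself. Model data lives on the host under /ollama so it
      # survives image upgrades.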
      ollama = {
        image = "ollama/ollama:latest";
        autoStart = true;

        extraOptions = [
          "--pull=always"
"--gpus=all"
];
environment = {
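          # Permissive CORS: accept API requests from any Origin.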
          OLLAMA_ORIGINS = "*";
        };

        volumes = [
          "/ollama:/root/.ollama"
        ];

        ports = [
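          # Bind on loopback and on the Docker bridge so both the host and
          # other containers (the web UI) can reach the API.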
"127.0.0.1:11434:11434"
"172.17.0.1:11434:11434"
        ];
      };
    };
  };
}