nixpkgs/nixos/modules/services/misc/ollama.nix

{ config, lib, pkgs, ... }:
let
  inherit (lib) types;

  cfg = config.services.ollama;
  # Rebuild ollama with the requested acceleration backend. The kernel
  # package set is extended so a CUDA build links against the same
  # nvidia_x11 driver the running system uses.
  ollamaPackage = cfg.package.override {
    inherit (cfg) acceleration;
    linuxPackages = config.boot.kernelPackages // {
      nvidia_x11 = config.hardware.nvidia.package;
    };
  };
in
{
  options = {
    services.ollama = {
      enable = lib.mkEnableOption (
        lib.mdDoc "Server for local large language models"
      );

      listenAddress = lib.mkOption {
        type = types.str;
        default = "127.0.0.1:11434";
        description = lib.mdDoc ''
          Specifies the bind address on which the ollama server HTTP interface listens.
        '';
      };

      acceleration = lib.mkOption {
        type = types.nullOr (types.enum [ "rocm" "cuda" ]);
        default = null;
        example = "rocm";
        description = lib.mdDoc ''
          Specifies the interface to use for hardware acceleration.

          - `rocm`: supported by modern AMD GPUs
          - `cuda`: supported by modern NVIDIA GPUs
        '';
      };

      package = lib.mkPackageOption pkgs "ollama" { };
    };
  };

  config = lib.mkIf cfg.enable {
    systemd = {
      services.ollama = {
        wantedBy = [ "multi-user.target" ];
        description = "Server for local large language models";
        after = [ "network.target" ];
        environment = {
          # %S is the systemd state directory root (/var/lib), so the
          # service's home and downloaded models live under /var/lib/ollama.
          HOME = "%S/ollama";
          OLLAMA_MODELS = "%S/ollama/models";
          OLLAMA_HOST = cfg.listenAddress;
        };
        serviceConfig = {
          ExecStart = "${lib.getExe ollamaPackage} serve";
          WorkingDirectory = "/var/lib/ollama";
          StateDirectory = [ "ollama" ];
          # Run as a transient, unprivileged user allocated by systemd.
          DynamicUser = true;
        };
      };
    };

    environment.systemPackages = [ ollamaPackage ];
  };

  meta.maintainers = with lib.maintainers; [ abysssol onny ];
}
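
For context, a minimal sketch of how this module might be consumed from a system configuration. The option names match those defined above; the values (and the choice of an AMD GPU host) are illustrative assumptions, not part of the module itself:

{
  # Hypothetical configuration.nix fragment enabling the service above.
  services.ollama = {
    enable = true;
    # Bind only to localhost on the default port (same as the module default).
    listenAddress = "127.0.0.1:11434";
    # Assumed AMD GPU here; use "cuda" for NVIDIA GPUs, or leave the
    # option at its null default for CPU-only inference.
    acceleration = "rocm";
  };
}

Because the module sets DynamicUser and StateDirectory, no manual user or /var/lib/ollama setup should be needed; models are fetched into the state directory on first use.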