nixos/ollama: add option for hardware acceleration

2024-02-22 23:41:25 -05:00 · 2024-02-22 23:41:25 -05:00 · b8d8c1f207
commit b8d8c1f207
parent 70e834c19b
1 changed file with 23 additions and 10 deletions
--- a/nixos/modules/services/misc/ollama.nix
+++ b/nixos/modules/services/misc/ollama.nix
@@ -1,9 +1,14 @@
-{ config, lib, pkgs, ... }: let
+{ config, lib, pkgs, ... }:
 let
  inherit (lib.types) nullOr enum;
  cfg = config.services.ollama;
-
+  ollamaPackage = cfg.package.override {
-in {
+    inherit (cfg) acceleration;
-
+    linuxPackages.nvidia_x11 = config.hardware.nvidia.package;
  };
 in
 {
  options = {
    services.ollama = {
      enable = lib.mkEnableOption (
@@ -16,12 +21,22 @@ in {
          Specifies the bind address on which the ollama server HTTP interface listens.
        '';
      };
      acceleration = lib.mkOption {
        type = nullOr (enum [ "rocm" "cuda" ]);
        default = null;
        example = "rocm";
        description = lib.mdDoc ''
          Specifies the interface to use for hardware acceleration.
          - `rocm`: supported by modern AMD GPUs
          - `cuda`: supported by modern NVIDIA GPUs
        '';
      };
      package = lib.mkPackageOption pkgs "ollama" { };
    };
  };
  config = lib.mkIf cfg.enable {
    systemd = {
      services.ollama = {
        wantedBy = [ "multi-user.target" ];
@@ -33,7 +48,7 @@ in {
          OLLAMA_HOST = cfg.listenAddress;
        };
        serviceConfig = {
-          ExecStart = "${lib.getExe cfg.package} serve";
+          ExecStart = "${lib.getExe ollamaPackage} serve";
          WorkingDirectory = "/var/lib/ollama";
          StateDirectory = [ "ollama" ];
          DynamicUser = true;
@@ -41,10 +56,8 @@ in {
      };
    };
-    environment.systemPackages = [ cfg.package ];
+    environment.systemPackages = [ ollamaPackage ];
  };
-  meta.maintainers = with lib.maintainers; [ onny ];
+  meta.maintainers = with lib.maintainers; [ abysssol onny ];
 }