From dc3eebb7420cdcc32479de48d64502de900bd31f Mon Sep 17 00:00:00 2001
From: ediblerope
Date: Wed, 13 May 2026 09:25:39 +0100
Subject: [PATCH] =?UTF-8?q?ollama:=20revert=20to=20CPU=20inference=20?=
 =?UTF-8?q?=E2=80=94=20M2000=20CUDA=20incompatible=20with=20nixpkgs?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

CUDA ≤12.5 removed from nixpkgs as unmaintained; CUDA 12.6+ requires driver
≥560 but legacy_535 (Maxwell's last supported branch) caps out at 12.2.
No compatible CUDA path exists for the Quadro M2000.

Co-Authored-By: Claude Sonnet 4.6
---
 services/ollama.nix | 11 +++--------
 1 file changed, 3 insertions(+), 8 deletions(-)

diff --git a/services/ollama.nix b/services/ollama.nix
index e946ac8..a8bc4ea 100644
--- a/services/ollama.nix
+++ b/services/ollama.nix
@@ -3,14 +3,9 @@
   config = lib.mkIf (config.networking.hostName == "FredOS-Mediaserver") {
     services.ollama.enable = true;
 
-    # nixpkgs ollama-cuda builds against CUDA 12.8, which requires driver ≥570.
-    # The Quadro M2000's legacy_535 driver only supports up to CUDA 12.2,
-    # so we override cudaPackages to build against 12.2 instead.
-    services.ollama.package = pkgs.ollama.override {
-      acceleration = "cuda";
-      cudaPackages = pkgs.cudaPackages_12_2;
-      cudaArches = [ "sm_52" ]; # Maxwell GM206 compute capability
-    };
+    # Quadro M2000 (Maxwell/GM206) uses legacy_535 driver which caps CUDA
+    # at 12.2. nixpkgs has removed all CUDA versions ≤12.5 as unmaintained,
+    # and 12.6+ requires driver ≥560. CPU inference is the only option.
 
     services.open-webui.enable = true;
     services.open-webui.port = 8888;