diff --git a/services/ollama.nix b/services/ollama.nix index e946ac8..a8bc4ea 100644 --- a/services/ollama.nix +++ b/services/ollama.nix @@ -3,14 +3,9 @@ config = lib.mkIf (config.networking.hostName == "FredOS-Mediaserver") { services.ollama.enable = true; - # nixpkgs ollama-cuda builds against CUDA 12.8, which requires driver ≥570. - # The Quadro M2000's legacy_535 driver only supports up to CUDA 12.2, - # so we override cudaPackages to build against 12.2 instead. - services.ollama.package = pkgs.ollama.override { - acceleration = "cuda"; - cudaPackages = pkgs.cudaPackages_12_2; - cudaArches = [ "sm_52" ]; # Maxwell GM206 compute capability - }; + # Quadro M2000 (Maxwell/GM206) uses the legacy_535 driver, which caps CUDA + # at 12.2. nixpkgs has removed all CUDA versions ≤12.5 as unmaintained, + # and 12.6+ requires driver ≥560, so CPU inference is the only option. services.open-webui.enable = true; services.open-webui.port = 8888;