nixos/services/ollama.nix
ediblerope dc3eebb742 ollama: revert to CPU inference — M2000 CUDA incompatible with nixpkgs
CUDA ≤12.5 removed from nixpkgs as unmaintained; CUDA 12.6+ requires
driver ≥560 but legacy_535 (Maxwell's last supported branch) caps out
at 12.2. No compatible CUDA path exists for the Quadro M2000.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-05-13 09:25:39 +01:00

32 lines
No EOL
1.3 KiB
Nix

# Ollama + Open WebUI for the media server.
#
# Everything in this module is gated on the host name, so importing it on
# any other machine contributes no configuration.
{ config, pkgs, lib, ... }:
let
  # True only when this configuration is being built for the media server.
  onMediaserver = config.networking.hostName == "FredOS-Mediaserver";

  # Extension applied to the Python package sets: build langchain with its
  # check phase disabled.
  langchainWithoutChecks = pySelf: pySuper: {
    langchain = pySuper.langchain.overridePythonAttrs (_: {
      doCheck = false;
    });
  };

  # Package-set overlay carrying the two check-phase overrides below.
  skipChecksOverlay = self: super: {
    # The override has to be registered as a Python package-set extension
    # so it lands inside the Python package set itself.
    pythonPackagesExtensions =
      super.pythonPackagesExtensions ++ [ langchainWithoutChecks ];

    # valkey 8.1.x ships a replication integration test that fails
    # non-deterministically; disabling checks unblocks open-webui.
    valkey = super.valkey.overrideAttrs (_: {
      doCheck = false;
    });
  };
in
{
  config = lib.mkIf onMediaserver {
    services = {
      # CPU inference only: the Quadro M2000 (Maxwell/GM206) runs the
      # legacy_535 driver, which caps CUDA at 12.2. nixpkgs has removed all
      # CUDA versions ≤12.5 as unmaintained and 12.6+ requires driver ≥560,
      # so no CUDA acceleration is configured here.
      ollama.enable = true;

      open-webui = {
        enable = true;
        port = 8888;
        # Authentication is handled by Authelia upstream, so the built-in
        # login is switched off.
        environment.WEBUI_AUTH = "False";
      };
    };

    nixpkgs.overlays = [ skipChecksOverlay ];
  };
}