43 lines
942 B
Nix
43 lines
942 B
Nix
{self, ...}: let
|
|
tailscaleIP = "100.64.0.4";
|
|
in {
|
|
imports = [self.nixosModules.wyoming-plus];
|
|
|
|
# In case tailscale is down
|
|
boot.kernel.sysctl."net.ipv4.ip_nonlocal_bind" = 1;
|
|
|
|
nixpkgs.overlays = [
|
|
# We can get rid of this once full CUDA support works
|
|
(final: prev: {
|
|
ctranslate2 = prev.ctranslate2.override {
|
|
withCUDA = true;
|
|
withCuDNN = true;
|
|
};
|
|
})
|
|
];
|
|
|
|
services = {
|
|
# Speech-to-Text
|
|
wyoming.faster-whisper.servers."en" = {
|
|
enable = true;
|
|
uri = "tcp://${tailscaleIP}:10300";
|
|
|
|
# see https://github.com/rhasspy/wyoming-faster-whisper/releases/tag/v2.0.0
|
|
model = "medium";
|
|
language = "en";
|
|
device = "cuda";
|
|
};
|
|
|
|
# Text-to-Intent
|
|
ollama = {
|
|
enable = true;
|
|
acceleration = "cuda";
|
|
|
|
host = tailscaleIP;
|
|
port = 11434;
|
|
|
|
loadModels = ["mistral-nemo"];
|
|
environmentVariables.OLLAMA_DEBUG = "1";
|
|
};
|
|
};
|
|
}
|