aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--machines/rivendell.nix1
-rw-r--r--profiles/llm.nix18
2 files changed, 0 insertions, 19 deletions
diff --git a/machines/rivendell.nix b/machines/rivendell.nix
index 7d51604..99b03a5 100644
--- a/machines/rivendell.nix
+++ b/machines/rivendell.nix
@@ -13,7 +13,6 @@
../profiles/git-server.nix
../profiles/hardware/framework-desktop.nix
../profiles/home-manager.nix
- ../profiles/llm.nix
../profiles/miniflux.nix
../profiles/monitoring.nix
../profiles/remote-unlock.nix
diff --git a/profiles/llm.nix b/profiles/llm.nix
deleted file mode 100644
index d5d02f4..0000000
--- a/profiles/llm.nix
+++ /dev/null
@@ -1,18 +0,0 @@
-{ ... }:
-{
- services.ollama = {
- enable = true;
- acceleration = "rocm";
- host = "0.0.0.0";
- openFirewall = true;
- environmentVariables = {
- # Flash Attention: Improves memory efficiency and speeds up long context
- OLLAMA_FLASH_ATTENTION = "1";
- # KV cache quantization: Reduces VRAM footprint (q8_0 = 8-bit quantization)
- OLLAMA_KV_CACHE_TYPE = "q8_0";
- };
- loadModels = [
- "qwen3:8b" # https://ollama.com/library/qwen3
- ];
- };
-}