diff options
Diffstat (limited to 'profiles/llm.nix')
| -rw-r--r-- | profiles/llm.nix | 18 |
1 files changed, 18 insertions, 0 deletions
diff --git a/profiles/llm.nix b/profiles/llm.nix
new file mode 100644
index 0000000..d5d02f4
--- /dev/null
+++ b/profiles/llm.nix
@@ -0,0 +1,18 @@
+{ ... }:
+{
+  services.ollama = {
+    enable = true;
+    acceleration = "rocm";
+    host = "0.0.0.0";
+    openFirewall = true;
+    environmentVariables = {
+      # Flash Attention: Improves memory efficiency and speeds up long context
+      OLLAMA_FLASH_ATTENTION = "1";
+      # KV cache quantization: Reduces VRAM footprint (q8_0 = 8-bit quantization)
+      OLLAMA_KV_CACHE_TYPE = "q8_0";
+    };
+    loadModels = [
+      "qwen3:8b" # https://ollama.com/library/qwen3
+    ];
+  };
+}
