add ollama back to artemision
All checks were successful
Check flake.lock / Check health of `flake.lock` (pull_request) Successful in 6s
Check Nix flake / Perform Nix flake checks (pull_request) Successful in 15m11s

This commit is contained in:
2026-03-26 21:40:12 -04:00
parent b5e45398d8
commit 802bf1ca4c
4 changed files with 45 additions and 27 deletions

View File

@@ -46,33 +46,33 @@
kubernetes kubernetes
]; ];
# Enable containerd for Kubernetes ## Enable containerd for Kubernetes
virtualisation.containerd.enable = true; #virtualisation.containerd.enable = true;
# Enable kubelet ## Enable kubelet
services.kubelet = { #services.kubelet = {
enable = true; # enable = true;
extraFlags = { # extraFlags = {
"pod-infra-container-image" = "registry.k8s.io/pause:3.9"; # "pod-infra-container-image" = "registry.k8s.io/pause:3.9";
}; # };
}; #};
# Enable kubeadm for cluster initialization ## Enable kubeadm for cluster initialization
environment.etc."kubeadm.yaml".text = '' #environment.etc."kubeadm.yaml".text = ''
apiVersion: kubeadm.k8s.io/v1beta3 # apiVersion: kubeadm.k8s.io/v1beta3
kind: InitConfiguration # kind: InitConfiguration
localAPIEndpoint: # localAPIEndpoint:
advertiseAddress: 127.0.0.1 # advertiseAddress: 127.0.0.1
bindPort: 6443 # bindPort: 6443
--- # ---
apiVersion: kubeadm.k8s.io/v1beta3 # apiVersion: kubeadm.k8s.io/v1beta3
kind: ClusterConfiguration # kind: ClusterConfiguration
clusterName: ${config.services.kubernetes.clusterName} # clusterName: ${config.services.kubernetes.clusterName}
controlPlaneEndpoint: ${config.services.kubernetes.controlPlaneEndpoint} # controlPlaneEndpoint: ${config.services.kubernetes.controlPlaneEndpoint}
networking: # networking:
serviceSubnet: 10.96.0.0/12 # serviceSubnet: 10.96.0.0/12
podSubnet: 10.244.0.0/16 # podSubnet: 10.244.0.0/16
dnsDomain: cluster.local # dnsDomain: cluster.local
''; #'';
}; };
} }

View File

@@ -1,6 +1,7 @@
{ {
lib, lib,
pkgs, pkgs,
config,
... ...
}: }:
{ {
@@ -17,6 +18,7 @@
./stylix.nix ./stylix.nix
./wifi.nix ./wifi.nix
./zerotier.nix ./zerotier.nix
../palatine-hill/ollama.nix
]; ];
time.timeZone = "America/New_York"; time.timeZone = "America/New_York";
@@ -39,6 +41,20 @@
sops.age.sshKeyPaths = [ "/etc/ssh/ssh_host_ed25519_key" ]; sops.age.sshKeyPaths = [ "/etc/ssh/ssh_host_ed25519_key" ];
services = { services = {
# Host-level overrides for the Ollama service. Every value is wrapped in
# lib.mkForce so that it takes priority over other definitions of the same
# option.
# NOTE(review): presumably the competing definitions come from the imported
# ../palatine-hill/ollama.nix module — confirm against that file.
ollama = {
# Select the `ollama-rocm` package from pkgs for this host.
package = lib.mkForce pkgs.ollama-rocm;
# Point the model store at "models" under the service's configured home
# directory (read from config.services.ollama.home).
models = lib.mkForce "${config.services.ollama.home}/models";
# Forced model list for this host; with mkForce this list is used instead
# of being merged with lower-priority definitions of loadModels.
loadModels = lib.mkForce [
"deepseek-r1:1.5b"
"qwen3-coder-next"
"lennyerik/zeta"
"nomic-embed-text:latest"
"glm-4.7-flash"
"magistral"
"devstral-small-2"
"starcoder2:7b"
];
};
flatpak.enable = true; flatpak.enable = true;
calibre-web = { calibre-web = {
# temp disable this # temp disable this

View File

@@ -25,11 +25,12 @@ in
"nemotron-cascade-2:30b" "nemotron-cascade-2:30b"
"magistral" "magistral"
"devstral-small-2" "devstral-small-2"
"starcoder2:15b"
]; ];
models = vars.primary_ollama; models = vars.primary_ollama;
environmentVariables = { environmentVariables = {
FLASH_ATTENTION = "1"; FLASH_ATTENTION = "1";
OLLAMA_KV_CACHE_TYPE = "q8_0"; OLLAMA_KV_CACHE_TYPE = "q4_0";
# Ollama memory configuration # Ollama memory configuration
OLLAMA_MAX_LOADED_MODELS = "3"; OLLAMA_MAX_LOADED_MODELS = "3";
OLLAMA_MAX_QUEUE = "512"; OLLAMA_MAX_QUEUE = "512";

View File

@@ -134,6 +134,7 @@
max_tokens = 128000; max_tokens = 128000;
keep_alive = "15m"; keep_alive = "15m";
} }
]; ];
}; };
}; };