Fix edge1 Ollama IP (.15->.17), add monitoring ingress, add init container
This commit is contained in:
@@ -2,7 +2,7 @@
|
|||||||
# Agent Zero AI Stack — NUC Deployment (RKE2 Bare-Metal)
|
# Agent Zero AI Stack — NUC Deployment (RKE2 Bare-Metal)
|
||||||
# =============================================================================
|
# =============================================================================
|
||||||
# Deploys: AgentZero (agent UI) on RKE2 cluster
|
# Deploys: AgentZero (agent UI) on RKE2 cluster
|
||||||
# Ollama: edge1 Pi 5 at 10.0.57.15:11434 (qwen2.5-coder:7b, CPU)
|
# Ollama: edge1 Pi 5 at 10.0.57.17:11434 (qwen2.5-coder:7b, CPU)
|
||||||
# Target: RKE2 bare-metal cluster, namespace: agent-zero
|
# Target: RKE2 bare-metal cluster, namespace: agent-zero
|
||||||
#
|
#
|
||||||
# Differences from LOCAL (WSL K3s):
|
# Differences from LOCAL (WSL K3s):
|
||||||
@@ -99,7 +99,7 @@ metadata:
|
|||||||
app: agent-zero
|
app: agent-zero
|
||||||
annotations:
|
annotations:
|
||||||
agent-zero/deployment: "nuc"
|
agent-zero/deployment: "nuc"
|
||||||
agent-zero/ollama: "edge1 Pi 5 (10.0.57.15:11434)"
|
agent-zero/ollama: "edge1 Pi 5 (10.0.57.17:11434)"
|
||||||
spec:
|
spec:
|
||||||
replicas: 1
|
replicas: 1
|
||||||
selector:
|
selector:
|
||||||
@@ -113,6 +113,21 @@ spec:
|
|||||||
app: agent-zero
|
app: agent-zero
|
||||||
spec:
|
spec:
|
||||||
serviceAccountName: agent-zero
|
serviceAccountName: agent-zero
|
||||||
|
initContainers:
|
||||||
|
# Wait for edge1 Pi 5 Ollama to be reachable before starting Agent Zero.
|
||||||
|
# Without this, the FAISS memory system crashes on embed_query()
|
||||||
|
# and Agent Zero enters a broken state on every message.
|
||||||
|
- name: wait-for-ollama
|
||||||
|
image: busybox:1.37
|
||||||
|
command: ["sh", "-c"]
|
||||||
|
args:
|
||||||
|
- |
|
||||||
|
echo "Waiting for Ollama at edge1 (10.0.57.17:11434)..."
|
||||||
|
until wget -qO- --timeout=2 http://10.0.57.17:11434/api/tags >/dev/null 2>&1; do
|
||||||
|
echo "edge1 Ollama not ready, retrying in 5s..."
|
||||||
|
sleep 5
|
||||||
|
done
|
||||||
|
echo "edge1 Ollama is reachable!"
|
||||||
containers:
|
containers:
|
||||||
- name: agent-zero
|
- name: agent-zero
|
||||||
image: agent0ai/agent-zero:latest
|
image: agent0ai/agent-zero:latest
|
||||||
@@ -141,7 +156,7 @@ spec:
|
|||||||
- name: A0_SET_chat_model_name
|
- name: A0_SET_chat_model_name
|
||||||
value: "qwen2.5-coder:7b"
|
value: "qwen2.5-coder:7b"
|
||||||
- name: A0_SET_chat_model_api_base
|
- name: A0_SET_chat_model_api_base
|
||||||
value: "http://10.0.57.15:11434"
|
value: "http://10.0.57.17:11434"
|
||||||
- name: A0_SET_chat_model_ctx_length
|
- name: A0_SET_chat_model_ctx_length
|
||||||
value: "32768"
|
value: "32768"
|
||||||
- name: A0_SET_chat_model_kwargs
|
- name: A0_SET_chat_model_kwargs
|
||||||
@@ -152,7 +167,7 @@ spec:
|
|||||||
- name: A0_SET_util_model_name
|
- name: A0_SET_util_model_name
|
||||||
value: "qwen2.5-coder:7b"
|
value: "qwen2.5-coder:7b"
|
||||||
- name: A0_SET_util_model_api_base
|
- name: A0_SET_util_model_api_base
|
||||||
value: "http://10.0.57.15:11434"
|
value: "http://10.0.57.17:11434"
|
||||||
- name: A0_SET_util_model_kwargs
|
- name: A0_SET_util_model_kwargs
|
||||||
value: '{"num_ctx": 8192}'
|
value: '{"num_ctx": 8192}'
|
||||||
# Embedding model — nomic on edge1 (if installed, fallback to none)
|
# Embedding model — nomic on edge1 (if installed, fallback to none)
|
||||||
@@ -161,14 +176,14 @@ spec:
|
|||||||
- name: A0_SET_embed_model_name
|
- name: A0_SET_embed_model_name
|
||||||
value: "nomic-embed-text"
|
value: "nomic-embed-text"
|
||||||
- name: A0_SET_embed_model_api_base
|
- name: A0_SET_embed_model_api_base
|
||||||
value: "http://10.0.57.15:11434"
|
value: "http://10.0.57.17:11434"
|
||||||
# Browser model — disabled (no vision model on Pi)
|
# Browser model — disabled (no vision model on Pi)
|
||||||
- name: A0_SET_browser_model_provider
|
- name: A0_SET_browser_model_provider
|
||||||
value: "ollama"
|
value: "ollama"
|
||||||
- name: A0_SET_browser_model_name
|
- name: A0_SET_browser_model_name
|
||||||
value: "qwen2.5-coder:7b"
|
value: "qwen2.5-coder:7b"
|
||||||
- name: A0_SET_browser_model_api_base
|
- name: A0_SET_browser_model_api_base
|
||||||
value: "http://10.0.57.15:11434"
|
value: "http://10.0.57.17:11434"
|
||||||
- name: A0_SET_browser_model_vision
|
- name: A0_SET_browser_model_vision
|
||||||
value: "false"
|
value: "false"
|
||||||
# Agent profile
|
# Agent profile
|
||||||
@@ -196,6 +211,27 @@ spec:
|
|||||||
mountPath: /a0/work
|
mountPath: /a0/work
|
||||||
- name: knowledge
|
- name: knowledge
|
||||||
mountPath: /a0/knowledge/custom/main
|
mountPath: /a0/knowledge/custom/main
|
||||||
|
startupProbe:
|
||||||
|
httpGet:
|
||||||
|
path: /
|
||||||
|
port: 80
|
||||||
|
initialDelaySeconds: 15
|
||||||
|
periodSeconds: 10
|
||||||
|
failureThreshold: 18
|
||||||
|
livenessProbe:
|
||||||
|
httpGet:
|
||||||
|
path: /
|
||||||
|
port: 80
|
||||||
|
periodSeconds: 30
|
||||||
|
failureThreshold: 3
|
||||||
|
readinessProbe:
|
||||||
|
exec:
|
||||||
|
command:
|
||||||
|
- /bin/bash
|
||||||
|
- -c
|
||||||
|
- "curl -sf http://localhost:80/ > /dev/null && curl -sf --connect-timeout 3 http://10.0.57.17:11434/api/tags > /dev/null"
|
||||||
|
periodSeconds: 30
|
||||||
|
failureThreshold: 2
|
||||||
resources:
|
resources:
|
||||||
requests:
|
requests:
|
||||||
memory: "2Gi"
|
memory: "2Gi"
|
||||||
@@ -292,6 +328,13 @@ spec:
|
|||||||
kubernetes.io/metadata.name: traefik-system
|
kubernetes.io/metadata.name: traefik-system
|
||||||
ports:
|
ports:
|
||||||
- port: 80
|
- port: 80
|
||||||
|
# Allow from monitoring (blackbox probe)
|
||||||
|
- from:
|
||||||
|
- namespaceSelector:
|
||||||
|
matchLabels:
|
||||||
|
kubernetes.io/metadata.name: monitoring
|
||||||
|
ports:
|
||||||
|
- port: 80
|
||||||
egress:
|
egress:
|
||||||
# DNS
|
# DNS
|
||||||
- to:
|
- to:
|
||||||
@@ -306,7 +349,7 @@ spec:
|
|||||||
# Ollama on edge1
|
# Ollama on edge1
|
||||||
- to:
|
- to:
|
||||||
- ipBlock:
|
- ipBlock:
|
||||||
cidr: 10.0.57.15/32
|
cidr: 10.0.57.17/32
|
||||||
ports:
|
ports:
|
||||||
- port: 11434
|
- port: 11434
|
||||||
# K8s API
|
# K8s API
|
||||||
|
|||||||
Reference in New Issue
Block a user