Files
klaster/apps/llama/kokoro.yaml
T
Lumpiasty 989732e1b5
ci/woodpecker/push/flux-reconcile-source Pipeline was successful
move kokoro to separate deployment
2026-05-21 21:34:33 +02:00

66 lines
1.6 KiB
YAML

---
apiVersion: apps/v1
kind: Deployment
metadata:
name: kokoro
namespace: llama
spec:
replicas: 1
strategy:
type: Recreate
selector:
matchLabels:
app: kokoro
template:
metadata:
labels:
app: kokoro
spec:
# Prevent Kubernetes from auto-injecting KOKORO_PORT=tcp://... (legacy
# Docker-link-style env vars from same-namespace Services), which Kokoro
# tries to parse as an integer and fails.
enableServiceLinks: false
containers:
- name: kokoro
# OpenAI-compatible Kokoro TTS server, CPU-only PyTorch backend
# Exposes POST /v1/audio/speech with multiple voices and streaming
image: hwdsl2/kokoro-server:latest@sha256:42886b8720e901f7e31aba2050cd03867767eb9f609bbc38fe93852e72f0feeb
ports:
- containerPort: 8880
name: http
protocol: TCP
env:
# Default voice (can be overridden per-request)
- name: KOKORO_VOICE
value: "af_heart"
volumeMounts:
# Persistent cache for the ~320MB Kokoro model
- name: cache
mountPath: /var/lib/kokoro
resources:
requests:
memory: "2Gi"
cpu: "500m"
limits:
memory: "6Gi"
volumes:
- name: cache
persistentVolumeClaim:
claimName: kokoro-cache-lvmssd
---
apiVersion: v1
kind: Service
metadata:
name: kokoro
namespace: llama
spec:
type: ClusterIP
ports:
- name: http
port: 8880
targetPort: 8880
protocol: TCP
selector:
app: kokoro