Files
klaster/apps/llama/kokoro.yaml
T
Lumpiasty e3348dc02b
ci/woodpecker/push/flux-reconcile-source Pipeline was successful
move kokoro to separate deployment
2026-05-21 21:23:36 +02:00

62 lines
1.4 KiB
YAML

---
# Deployment running a single Kokoro TTS server pod in the llama namespace.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: kokoro
  namespace: llama
spec:
  replicas: 1
  strategy:
    # Recreate terminates the old pod before the new one is created.
    # NOTE(review): presumably required because the cache PVC can only be
    # attached to one pod at a time — confirm against the PVC access mode.
    type: Recreate
  selector:
    matchLabels:
      app: kokoro
  template:
    metadata:
      labels:
        app: kokoro
    spec:
      containers:
        - name: kokoro
          # OpenAI-compatible Kokoro TTS server, CPU-only PyTorch backend
          # Exposes POST /v1/audio/speech with multiple voices and streaming
          # The image is pinned by digest; when a tag and a digest are both
          # given, the digest decides what is pulled and the tag is informational.
          image: hwdsl2/kokoro-server:latest@sha256:42886b8720e901f7e31aba2050cd03867767eb9f609bbc38fe93852e72f0feeb
          ports:
            - containerPort: 8880
              name: http
              protocol: TCP
          env:
            # Default voice (can be overridden per-request)
            - name: KOKORO_VOICE
              value: "af_heart"
          volumeMounts:
            # Persistent cache for the ~320MB Kokoro model
            - name: cache
              mountPath: /var/lib/kokoro
          resources:
            requests:
              memory: "1Gi"
              cpu: "500m"
            # Only memory is capped; no CPU limit is set.
            limits:
              memory: "3Gi"
      volumes:
        # Backs the "cache" volumeMount above with an existing claim.
        - name: cache
          persistentVolumeClaim:
            claimName: kokoro-cache-lvmssd
---
# ClusterIP Service exposing the Kokoro pods inside the cluster on port 8880.
apiVersion: v1
kind: Service
metadata:
  name: kokoro
  namespace: llama
spec:
  type: ClusterIP
  ports:
    - name: http
      port: 8880
      # Forwards to the same port number on the selected pods.
      targetPort: 8880
      protocol: TCP
  # Routes traffic to pods carrying the label app=kokoro.
  selector:
    app: kokoro