switch kokoro to remsky/Kokoro-FastAPI

This commit is contained in:
2026-05-21 21:51:40 +02:00
parent 989732e1b5
commit 02b3ec13b4
3 changed files with 4 additions and 66 deletions
+4 -19
View File
@@ -16,37 +16,22 @@ spec:
labels:
app: kokoro
spec:
# Prevent Kubernetes from auto-injecting KOKORO_PORT=tcp://... (legacy
# Docker-link-style env vars from same-namespace Services), which Kokoro
# tries to parse as an integer and fails.
enableServiceLinks: false
containers:
- name: kokoro
# OpenAI-compatible Kokoro TTS server, CPU-only PyTorch backend
# Exposes POST /v1/audio/speech with multiple voices and streaming
image: hwdsl2/kokoro-server:latest@sha256:42886b8720e901f7e31aba2050cd03867767eb9f609bbc38fe93852e72f0feeb
# OpenAI-compatible Kokoro-FastAPI TTS server, CPU PyTorch backend.
# Models baked into the image (no PVC needed).
# v0.3.0 includes fix for per-request voice tensor memory leak (#459).
image: ghcr.io/remsky/kokoro-fastapi-cpu:v0.3.0
ports:
- containerPort: 8880
name: http
protocol: TCP
env:
# Default voice (can be overridden per-request)
- name: KOKORO_VOICE
value: "af_heart"
volumeMounts:
# Persistent cache for the ~320MB Kokoro model
- name: cache
mountPath: /var/lib/kokoro
resources:
requests:
memory: "2Gi"
cpu: "500m"
limits:
memory: "6Gi"
volumes:
- name: cache
persistentVolumeClaim:
claimName: kokoro-cache-lvmssd
---
apiVersion: v1
kind: Service