Switch the Kokoro TTS deployment to ghcr.io/remsky/kokoro-fastapi-cpu:v0.3.0,
drop its env/volume wiring, and delete the kokoro-cache-lvmssd volume manifests.

NOTE(review): leading whitespace inside the hunks below was reconstructed from
a whitespace-collapsed copy of this patch (2-space YAML indent, indented
sequences assumed) -- verify against the target files before applying.
NOTE(review): the replacement image is referenced by tag only, whereas the
removed image was pinned by sha256 digest -- consider pinning the new one too.

diff --git a/apps/llama/kokoro.yaml b/apps/llama/kokoro.yaml
index 71e3fc2..5e31306 100644
--- a/apps/llama/kokoro.yaml
+++ b/apps/llama/kokoro.yaml
@@ -16,37 +16,22 @@ spec:
       labels:
         app: kokoro
     spec:
-      # Prevent Kubernetes from auto-injecting KOKORO_PORT=tcp://... (legacy
-      # Docker-link-style env vars from same-namespace Services), which Kokoro
-      # tries to parse as an integer and fails.
-      enableServiceLinks: false
       containers:
         - name: kokoro
-          # OpenAI-compatible Kokoro TTS server, CPU-only PyTorch backend
-          # Exposes POST /v1/audio/speech with multiple voices and streaming
-          image: hwdsl2/kokoro-server:latest@sha256:42886b8720e901f7e31aba2050cd03867767eb9f609bbc38fe93852e72f0feeb
+          # OpenAI-compatible Kokoro-FastAPI TTS server, CPU PyTorch backend.
+          # Models baked into the image (no PVC needed).
+          # v0.3.0 includes fix for per-request voice tensor memory leak (#459).
+          image: ghcr.io/remsky/kokoro-fastapi-cpu:v0.3.0
           ports:
             - containerPort: 8880
               name: http
               protocol: TCP
-          env:
-            # Default voice (can be overridden per-request)
-            - name: KOKORO_VOICE
-              value: "af_heart"
-          volumeMounts:
-            # Persistent cache for the ~320MB Kokoro model
-            - name: cache
-              mountPath: /var/lib/kokoro
           resources:
             requests:
               memory: "2Gi"
               cpu: "500m"
             limits:
               memory: "6Gi"
-      volumes:
-        - name: cache
-          persistentVolumeClaim:
-            claimName: kokoro-cache-lvmssd
 ---
 apiVersion: v1
 kind: Service
diff --git a/apps/llama/kustomization.yaml b/apps/llama/kustomization.yaml
index 74cbd37..4dbd947 100644
--- a/apps/llama/kustomization.yaml
+++ b/apps/llama/kustomization.yaml
@@ -6,7 +6,6 @@ resources:
   - auth-proxy.yaml
   - ingress.yaml
   - pvc-ssd.yaml
-  - pvc-kokoro-ssd.yaml
   - deployment.yaml
   - kokoro.yaml
 configMapGenerator:
diff --git a/apps/llama/pvc-kokoro-ssd.yaml b/apps/llama/pvc-kokoro-ssd.yaml
deleted file mode 100644
index 643bf76..0000000
--- a/apps/llama/pvc-kokoro-ssd.yaml
+++ /dev/null
@@ -1,46 +0,0 @@
----
-apiVersion: local.openebs.io/v1alpha1
-kind: LVMVolume
-metadata:
-  labels:
-    kubernetes.io/nodename: anapistula-delrosalae
-  name: kokoro-cache-lvmssd
-  namespace: openebs
-spec:
-  capacity: "2147483648"
-  ownerNodeID: anapistula-delrosalae
-  shared: "yes"
-  thinProvision: "no"
-  vgPattern: ^openebs-ssd$
-  volGroup: openebs-ssd
----
-kind: PersistentVolume
-apiVersion: v1
-metadata:
-  name: kokoro-cache-lvmssd
-spec:
-  capacity:
-    storage: 2Gi
-  accessModes:
-    - ReadWriteOnce
-  persistentVolumeReclaimPolicy: Retain
-  storageClassName: ssd-lvmpv
-  volumeMode: Filesystem
-  csi:
-    driver: local.csi.openebs.io
-    fsType: btrfs
-    volumeHandle: kokoro-cache-lvmssd
----
-kind: PersistentVolumeClaim
-apiVersion: v1
-metadata:
-  name: kokoro-cache-lvmssd
-  namespace: llama
-spec:
-  accessModes:
-    - ReadWriteOnce
-  resources:
-    requests:
-      storage: 2Gi
-  storageClassName: ssd-lvmpv
-  volumeName: kokoro-cache-lvmssd