diff --git a/apps/llama/kokoro.yaml b/apps/llama/kokoro.yaml
index 71e3fc2..5e31306 100644
--- a/apps/llama/kokoro.yaml
+++ b/apps/llama/kokoro.yaml
@@ -16,37 +16,29 @@ spec:
       labels:
         app: kokoro
     spec:
-      # Prevent Kubernetes from auto-injecting KOKORO_PORT=tcp://... (legacy
-      # Docker-link-style env vars from same-namespace Services), which Kokoro
-      # tries to parse as an integer and fails.
+      # Keep legacy Docker-link-style env vars from same-namespace Services
+      # (e.g. KOKORO_PORT=tcp://...) out of the pod. The previous image failed
+      # when parsing KOKORO_PORT as an integer.
+      # NOTE(review): confirm the new image ignores these before removing this.
       enableServiceLinks: false
       containers:
         - name: kokoro
-          # OpenAI-compatible Kokoro TTS server, CPU-only PyTorch backend
-          # Exposes POST /v1/audio/speech with multiple voices and streaming
-          image: hwdsl2/kokoro-server:latest@sha256:42886b8720e901f7e31aba2050cd03867767eb9f609bbc38fe93852e72f0feeb
+          # OpenAI-compatible Kokoro-FastAPI TTS server, CPU PyTorch backend.
+          # Models baked into the image (no PVC needed).
+          # v0.3.0 includes fix for per-request voice tensor memory leak (#459).
+          # NOTE(review): tag-only reference; the old image was digest-pinned.
+          # Consider appending @sha256:<digest> for reproducible rollouts.
+          image: ghcr.io/remsky/kokoro-fastapi-cpu:v0.3.0
           ports:
             - containerPort: 8880
               name: http
               protocol: TCP
-          env:
-            # Default voice (can be overridden per-request)
-            - name: KOKORO_VOICE
-              value: "af_heart"
-          volumeMounts:
-            # Persistent cache for the ~320MB Kokoro model
-            - name: cache
-              mountPath: /var/lib/kokoro
           resources:
             requests:
               memory: "2Gi"
               cpu: "500m"
             limits:
               memory: "6Gi"
-      volumes:
-        - name: cache
-          persistentVolumeClaim:
-            claimName: kokoro-cache-lvmssd
 ---
 apiVersion: v1
 kind: Service
diff --git a/apps/llama/kustomization.yaml b/apps/llama/kustomization.yaml
index 74cbd37..4dbd947 100644
--- a/apps/llama/kustomization.yaml
+++ b/apps/llama/kustomization.yaml
@@ -6,7 +6,6 @@ resources:
   - auth-proxy.yaml
   - ingress.yaml
   - pvc-ssd.yaml
-  - pvc-kokoro-ssd.yaml
   - deployment.yaml
   - kokoro.yaml
 configMapGenerator:
diff --git a/apps/llama/pvc-kokoro-ssd.yaml b/apps/llama/pvc-kokoro-ssd.yaml
deleted file mode 100644
index 643bf76..0000000
--- a/apps/llama/pvc-kokoro-ssd.yaml
+++ /dev/null
@@ -1,46 +0,0 @@
----
-apiVersion: local.openebs.io/v1alpha1
-kind: LVMVolume
-metadata:
-  labels:
-    kubernetes.io/nodename: anapistula-delrosalae
-  name: kokoro-cache-lvmssd
-  namespace: openebs
-spec:
-  capacity: "2147483648"
-  ownerNodeID: anapistula-delrosalae
-  shared: "yes"
-  thinProvision: "no"
-  vgPattern: ^openebs-ssd$
-  volGroup: openebs-ssd
----
-kind: PersistentVolume
-apiVersion: v1
-metadata:
-  name: kokoro-cache-lvmssd
-spec:
-  capacity:
-    storage: 2Gi
-  accessModes:
-    - ReadWriteOnce
-  persistentVolumeReclaimPolicy: Retain
-  storageClassName: ssd-lvmpv
-  volumeMode: Filesystem
-  csi:
-    driver: local.csi.openebs.io
-    fsType: btrfs
-    volumeHandle: kokoro-cache-lvmssd
----
-kind: PersistentVolumeClaim
-apiVersion: v1
-metadata:
-  name: kokoro-cache-lvmssd
-  namespace: llama
-spec:
-  accessModes:
-    - ReadWriteOnce
-  resources:
-    requests:
-      storage: 2Gi
-  storageClassName: ssd-lvmpv
-  volumeName: kokoro-cache-lvmssd