# Tortoise-TTS sidecar: 25+ named voices, no voice cloning required.
# Apache 2.0 top to bottom.
#
# Speed: roughly 10x kokoro's wall-clock time at the 'standard' preset.
# The quality bar justifies the cost, and runs are batched.
#
# GPU memory: co-resides with kokoro on an 8GB card
# (tortoise ~5GB + kokoro ~1GB). If a render hits OOM, add a coordinator
# that pauses kokoro first.
#
# Configure via .env (or override in the environment):
#   TORTOISE_HOST_PORT=7795
#   TORTOISE_DATA=./data             # holds ${TORTOISE_DATA}/{hf-cache,models}
#   AUDIO_DIR=../f5-tts/data/audio   # output dir shared across engines

# Compose project name.
name: tortoise

services:
  tortoise:
    # Built from the Dockerfile in this directory and tagged locally.
    build: .
    image: "tortoise:0.1"
    container_name: tortoise
    restart: unless-stopped

    # Reserve every NVIDIA GPU for this container.
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities:
                - gpu

    # Host port is configurable (default 7795); container port is 7860.
    ports:
      - "${TORTOISE_HOST_PORT:-7795}:7860"

    # Host paths fall back to ./data/... when the variables are unset.
    volumes:
      # Backs HF_HOME (see environment below).
      - "${TORTOISE_DATA:-./data}/hf-cache:/cache/hf"
      # Backs TORTOISE_MODELS_DIR (see environment below).
      - "${TORTOISE_DATA:-./data}/models:/cache/tortoise-models"
      # Audio directory; AUDIO_DIR defaults to ./data/audio when unset.
      - "${AUDIO_DIR:-./data/audio}:/audio"

    # Cache locations match the container side of the mounts above.
    environment:
      HF_HOME: "/cache/hf"
      HF_HUB_DISABLE_TELEMETRY: "1"
      TORTOISE_MODELS_DIR: "/cache/tortoise-models"