# Mirror of https://github.com/remsky/Kokoro-FastAPI.git
# Synced 2025-04-13 09:39:17 +00:00
# Original file: 37 lines, 1.4 KiB, YAML
# Docker Compose definition for the CPU build of the Kokoro TTS API service.
# By default Compose resolves the relative paths below from this file's
# directory.
name: kokoro-fastapi-cpu

services:
  kokoro-tts:
    build:
      # The build context is two directories above this file; the Dockerfile
      # path is given relative to that context.
      context: ../..
      dockerfile: docker/cpu/Dockerfile
    volumes:
      # Bind-mount the host's api directory over /app/api in the container.
      - ../../api:/app/api
    ports:
      # host:container
      - "8880:8880"
    environment:
      - PYTHONPATH=/app:/app/api
      # ONNX Optimization Settings for vectorized operations
      - ONNX_NUM_THREADS=8  # Maximize core usage for vectorized ops
      - ONNX_INTER_OP_THREADS=4  # Higher inter-op for parallel matrix operations
      - ONNX_EXECUTION_MODE=parallel
      - ONNX_OPTIMIZATION_LEVEL=all
      - ONNX_MEMORY_PATTERN=true
      - ONNX_ARENA_EXTEND_STRATEGY=kNextPowerOfTwo

  # Optional Gradio UI service, currently disabled. Strip one leading "# "
  # from each line below to enable it.
  # # Gradio UI service [Comment out everything below if you don't need it]
  # gradio-ui:
  #   image: ghcr.io/remsky/kokoro-fastapi-ui:v${VERSION}
  #   # Uncomment below (and comment out above) to build from source instead of using the released image
  #   build:
  #     context: ../../ui
  #   ports:
  #     - "7860:7860"
  #   volumes:
  #     - ../../ui/data:/app/ui/data
  #     - ../../ui/app.py:/app/app.py  # Mount app.py for hot reload
  #   environment:
  #     - GRADIO_WATCH=True  # Enable hot reloading
  #     - PYTHONUNBUFFERED=1  # Ensure Python output is not buffered
  #     - DISABLE_LOCAL_SAVING=false  # Set to 'true' to disable local saving and hide file view
  #     - API_HOST=kokoro-tts  # Set TTS service URL
  #     - API_PORT=8880  # Set TTS service PORT