# CUDA 11.8 runtime image that serves a Coqui TTS application through uvicorn
# on port 5002.
#
# NOTE(review): nothing here copies tts_server.py into the image, yet the
# ENTRYPOINT loads `tts_server:app` with /app as the working directory.
# Presumably the module is bind-mounted into /app at runtime - confirm, or add
# a COPY step for it.
# NOTE(review): there is no USER instruction, so the server runs as root.
# Switching to a non-root user also requires /models and /voices (and any
# host directories mounted over them) to be writable by that user.

FROM nvidia/cuda:11.8.0-runtime-ubuntu22.04

# Build-time only: stops apt/dpkg from prompting during `docker build`.
# Declared as ARG (not ENV) so it is not baked into the running container.
ARG DEBIAN_FRONTEND=noninteractive

# PYTHONUNBUFFERED: flush Python stdout/stderr immediately so logs show up in
# `docker logs` without delay.
# TORCH_HOME / COQUI_TTS_CACHE: point caches at the /models volume.
# NOTE(review): confirm COQUI_TTS_CACHE is actually read by tts_server or the
# TTS library; the library may expect a different variable (e.g. TTS_HOME).
ENV PYTHONUNBUFFERED=1 \
    COQUI_TTS_CACHE=/models \
    TORCH_HOME=/models

WORKDIR /app

# Overwrite /etc/apt/sources.list with the jammy, jammy-updates and
# jammy-security pockets (main + universe only). One printf argument per line
# keeps stray indentation out of the generated file.
RUN printf '%s\n' \
      'deb http://archive.ubuntu.com/ubuntu jammy main universe' \
      'deb http://archive.ubuntu.com/ubuntu jammy-updates main universe' \
      'deb http://archive.ubuntu.com/ubuntu jammy-security main universe' \
      > /etc/apt/sources.list

# OS-level dependencies. update + install + list cleanup stay in one layer so
# the package index is never stale and never shipped in the image.
# NOTE(review): --no-install-recommends is deliberately not added; recommended
# packages may be needed by pip source builds or git over HTTPS - verify
# before slimming.
RUN apt-get update && apt-get install -y \
      espeak-ng \
      ffmpeg \
      git \
      libsndfile1 \
      python3 \
      python3-pip \
    && rm -rf /var/lib/apt/lists/*

RUN pip3 install --no-cache-dir --upgrade pip

# CUDA Torch (PINNED): cu118 wheels come from the PyTorch index, matching the
# CUDA 11.8 base image.
RUN pip3 install --no-cache-dir \
      torch==2.5.1+cu118 \
      torchvision==0.20.1+cu118 \
      torchaudio==2.5.1+cu118 \
      --index-url https://download.pytorch.org/whl/cu118

# Coqui TTS plus the web stack. The requirement is quoted because `[all]` is a
# glob pattern to the shell.
# NOTE(review): fastapi and uvicorn are unpinned, so rebuilds are not
# reproducible - pin them once known-good versions are confirmed.
RUN pip3 install --no-cache-dir \
      "TTS[all]==0.22.0" \
      fastapi \
      uvicorn

# Transformers version compatible with XTTS. Installed in its own step, after
# TTS, so this range overrides whatever the TTS install pulled in.
# NOTE(review): check this range against the transformers requirement that
# TTS 0.22.0 itself declares; a mismatch would only surface as a pip warning.
RUN pip3 install --no-cache-dir "transformers>=4.30.0,<4.32.0"

# Create the mount points before declaring them as volumes.
RUN mkdir -p /models /voices

EXPOSE 5002

VOLUME ["/models", "/voices"]

ENTRYPOINT ["python3", "-m", "uvicorn", "tts_server:app", "--host", "0.0.0.0", "--port", "5002"]