diff --git a/Dockerfile.rocm b/Dockerfile.rocm
index 30ba3b2..49db5e9 100644
--- a/Dockerfile.rocm
+++ b/Dockerfile.rocm
@@ -1,4 +1,4 @@
-FROM rocm/dev-ubuntu-22.04:6.1
+FROM rocm/dev-ubuntu-22.04:7.2
 
 ENV DEBIAN_FRONTEND=noninteractive \
     PYTHONDONTWRITEBYTECODE=1 \
@@ -7,27 +7,41 @@ ENV DEBIAN_FRONTEND=noninteractive \
     PIP_NO_CACHE_DIR=1
 
+# Python 3.11 comes from the deadsnakes PPA; -y keeps add-apt-repository from waiting for confirmation.
 RUN apt-get update && apt-get install -y --no-install-recommends \
-    python3 \
-    python3-pip \
-    python3-dev \
+    software-properties-common \
+    && add-apt-repository -y ppa:deadsnakes/ppa \
+    && apt-get update && apt-get install -y --no-install-recommends \
+    curl \
+    python3.11 \
+    python3.11-dev \
+    python3.11-distutils \
     git \
     ffmpeg \
     libsndfile1 \
     && rm -rf /var/lib/apt/lists/*
 
+# Install pip for Python 3.11. Download to a file (curl --fail) so a failed fetch aborts the build.
+RUN curl -fsSL -o /tmp/get-pip.py https://bootstrap.pypa.io/get-pip.py \
+    && python3.11 /tmp/get-pip.py \
+    && rm -f /tmp/get-pip.py
+
+# Make python3.11 the default python3
+RUN update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.11 1 \
+    && update-alternatives --install /usr/bin/python python /usr/bin/python3.11 1
+
 WORKDIR /app
 
 # Step 1: Install ROCm-compatible PyTorch stack first.
 # This must happen before anything else to prevent pip from pulling CPU wheels.
 COPY requirements-rocm-init.txt .
-RUN pip3 install -r requirements-rocm-init.txt
+RUN python3 -m pip install -r requirements-rocm-init.txt
 
 # Step 2: Install remaining dependencies (pinned to avoid overwriting torch).
 COPY requirements-rocm.txt .
-RUN pip3 install -r requirements-rocm.txt
+RUN python3 -m pip install -r requirements-rocm.txt
 
 # Step 3: Install chatterbox with --no-deps so pip cannot replace ROCm torch.
-RUN pip3 install --no-deps chatterbox-tts
+RUN python3 -m pip install --no-deps chatterbox-tts
 
 # Application source
 COPY engine.py config.py wyoming_handler.py wyoming_voices.py main.py ./
diff --git a/config.yaml b/config.yaml
index ff9812e..7d0291b 100644
--- a/config.yaml
+++ b/config.yaml
@@ -13,11 +13,11 @@ tts_engine:
 generation_defaults:
   # Turbo model: uses temperature only (exaggeration/cfg_weight ignored)
   # Standard model: uses exaggeration and cfg_weight (temperature ignored)
-  temperature: 0.8
+  temperature: 0.9
   exaggeration: 0.5
   cfg_weight: 0.5
   # seed: 0 = random each call, >0 = reproducible output
-  seed: 0
+  seed: 1960
 
 wyoming:
   host: "0.0.0.0"
diff --git a/requirements-rocm-init.txt b/requirements-rocm-init.txt
index 44a44f9..8627435 100644
--- a/requirements-rocm-init.txt
+++ b/requirements-rocm-init.txt
@@ -1,5 +1,5 @@
---index-url https://download.pytorch.org/whl/rocm6.1
-torch==2.5.1
-torchaudio==2.5.1
-torchvision==0.20.1
-pytorch_triton_rocm==3.1.0
+--index-url https://download.pytorch.org/whl/rocm7.2
+torch==2.11.0
+torchaudio==2.11.0
+torchvision==0.26.0
+pytorch_triton_rocm==3.3.0
diff --git a/requirements-rocm.txt b/requirements-rocm.txt
index 8ce84d8..0c76489 100644
--- a/requirements-rocm.txt
+++ b/requirements-rocm.txt
@@ -5,9 +5,9 @@ librosa==0.11.0
 pyloudnorm
 
 # ML dependencies (pinned to match chatterbox without overwriting ROCm torch)
-transformers==4.46.3
-diffusers==0.29.0
-safetensors>=0.4.1
+transformers>=4.50.0
+diffusers>=0.32.0
+safetensors>=0.4.5
 huggingface-hub
 omegaconf
 