Remove the MIOpen cache plumbing from the ROCm image and compose file:
the miopen_cache directory and named volume, and the MIOPEN_* environment
settings. HSA_OVERRIDE_GFX_VERSION is kept as-is.

diff --git a/Dockerfile.rocm b/Dockerfile.rocm
index 13d06f9..9411eef 100644
--- a/Dockerfile.rocm
+++ b/Dockerfile.rocm
@@ -41,10 +41,8 @@ COPY engine.py config.py wyoming_handler.py wyoming_voices.py main.py ./
 # Default config (can be overridden by volume mount)
 COPY config.yaml .
 
-# Create default directories (miopen_cache must exist before the volume mounts
-# so MIOpen can open its SQLite benchmark database without crashing)
-RUN mkdir -p voices reference_audio hf_cache miopen_cache && \
-    chmod 777 miopen_cache
+# Create default directories
+RUN mkdir -p voices reference_audio hf_cache
 
 EXPOSE 10200
 
diff --git a/docker-compose.yml b/docker-compose.yml
index 66b1877..5e27032 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -22,22 +22,11 @@ services:
       - ./voices:/app/voices
       - ./reference_audio:/app/reference_audio
       - hf_cache:/app/hf_cache
-      - miopen_cache:/app/miopen_cache
     environment:
       - HF_HUB_ENABLE_HF_TRANSFER=1
-      # Disable MIOpen's GEMM convolution solver. PyTorch passes a null workspace
-      # pointer (ptr=0, size=0) which causes GemmFwdRest to warn and fall back on
-      # every conv op. Disabling it makes MIOpen go straight to Direct/Winograd
-      # solvers that don't require workspace allocation.
-      - MIOPEN_DEBUG_CONV_GEMM=0
-      # Persist MIOpen's kernel cache so it doesn't recompile on every start.
-      - MIOPEN_USER_DB_PATH=/app/miopen_cache
-      - MIOPEN_CUSTOM_CACHE_DIR=/app/miopen_cache
       # Required for RX 6700 XT (gfx1031) - not natively supported in ROCm 7.2.
-      # Without this the GPU runs in software emulation and synthesis takes 40+ seconds.
       - HSA_OVERRIDE_GFX_VERSION=10.3.0
       # - HF_TOKEN=your_token_here
 
 volumes:
   hf_cache:
-  miopen_cache: