- Base image: rocm/dev-ubuntu-22.04:6.1 → 7.2
- Python 3.10 → 3.11 via deadsnakes PPA
- torch/torchaudio: 2.5.1 → 2.11.0
- torchvision: 0.20.1 → 0.26.0
- pytorch_triton_rocm: 3.1.0 → 3.3.0
- transformers: 4.46.3 → >=4.50.0
- diffusers: 0.29.0 → >=0.32.0
- safetensors: >=0.4.1 → >=0.4.5
- config: temperature 0.8 → 0.9, seed 0 → 1960

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
26 lines
478 B
Plaintext
26 lines
478 B
Plaintext
# Audio processing
|
|
numpy>=1.24.0,<2.0.0
|
|
soundfile
|
|
librosa==0.11.0
|
|
pyloudnorm
|
|
|
|
# ML dependencies (minimum versions kept compatible with chatterbox; must not overwrite the ROCm torch build)
|
|
transformers>=4.50.0
|
|
diffusers>=0.32.0
|
|
safetensors>=0.4.5
|
|
huggingface-hub
|
|
omegaconf
|
|
|
|
# Chatterbox dependencies (installed separately because chatterbox itself is installed with --no-deps)
|
|
conformer==0.3.2
|
|
s3tokenizer==0.3.0
|
|
spacy-pkuseg
|
|
pykakasi==2.3.0
|
|
resemble-perth==1.0.1
|
|
|
|
# Wyoming protocol
|
|
wyoming>=1.5.4
|
|
|
|
# Config / utilities
|
|
PyYAML>=6.0
|