-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathenv.yml
27 lines (27 loc) · 866 Bytes
/
env.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# Conda environment definition for the "speech2text" environment.
# Create it with: conda env create -f env.yml
name: speech2text

# Channels are listed in priority order; packages written as `channel::pkg`
# below are requested from that specific channel.
channels:
  - conda-forge
  - pytorch
  - nvidia

dependencies:
  # Command-line tools and native libraries.
  - git
  - ffmpeg
  - libsndfile
  # Python runtime and conda-installed Python packages.
  - numpy=1.26.4
  - python=3.10
  - pydub
  - pytorch-lightning=2.2.5
  # CUDA 12.1 stack; the pytorch build string below pins the
  # Python 3.10 / CUDA 12.1 / cuDNN 8.9.2 build.
  - nvidia::cuda-libraries-dev
  - pytorch::pytorch=2.3.1=py3.10_cuda12.1_cudnn8.9.2_0
  - pytorch::torchvision
  - pytorch::torchaudio
  - pytorch::pytorch-cuda=12.1
  # `pip` itself must be a conda dependency so that the nested `pip:`
  # requirement list below can be installed into this environment.
  - pip
  - pip:
      - pyannote.audio
      # ctranslate2 and faster-whisper are pinned to 4.4.0 and 1.0.3 because of
      # the whisperX issue: https://github.com/m-bain/whisperX/issues/901
      # whisperX commits referenced by the original note (one or the other):
      #   https://github.com/m-bain/whisperX/commit/caa7121064c1bb406be30c50891a9b8217252592
      #   https://github.com/m-bain/whisperX/commit/5080b7188c3666b5d8648346c0c12599a58bd695
      - ctranslate2==4.4.0
      - faster-whisper==1.0.3
      # whisperx is installed from the BetterWhisperX fork at a fixed commit.
      - whisperx @ git+https://github.com/federicotorrielli/BetterWhisperX@bd9b897cd3fdb8c23863cbf9f6517640b5c6bf50