liuyang committed on
Commit
289ed4b
·
1 Parent(s): b628d00
Files changed (1) hide show
  1. requirements.txt +16 -18
requirements.txt CHANGED
@@ -1,29 +1,24 @@
1
- # Pull CUDA 12.1 wheels for Torch
2
- --extra-index-url https://download.pytorch.org/whl/cu121
3
 
4
- ######## Core DL stack (Torch must match torchaudio)
5
- torch==2.5.1+cu121
6
- torchaudio==2.5.1+cu121
7
- # Provide NVIDIA runtime libs expected by recent Torch wheels
8
- nvidia-cudnn-cu12==9.1.0.70
9
- nvidia-cublas-cu12>=12.1.3
10
 
11
- ######## ASR stacks
12
- # Newer WhisperX works with newer faster-whisper and requires CT2>=4.5
13
  whisperx==3.7.0
14
  faster-whisper==1.2.0
15
  ctranslate2==4.5.0
 
 
16
 
17
- ######## Transformers & validation
18
- transformers==4.48.0
19
- pydantic==2.10.6
20
-
21
- ######## Diarization (optional)
22
- pyannote.audio>=3.3.1
23
 
24
- ######## App + utils
25
  gradio==5.0.1
26
  spaces>=0.19.0
 
27
  pandas>=1.5.0
28
  numpy>=1.24.0
29
  librosa>=0.10.0
@@ -31,4 +26,7 @@ soundfile>=0.12.0
31
  ffmpeg-python>=0.2.0
32
  requests>=2.28.0
33
  webrtcvad>=2.0.10
34
- boto3
 
 
 
 
1
+ # 1) Do NOT pin torch/torchaudio here — use the CUDA builds that come with the image
 
2
 
3
+ transformers==4.48.0
4
+ # Removed flash-attention since faster-whisper handles this internally
5
+ # https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.0.8/flash_attn-2.7.4.post1+cu126torch2.4-cp310-cp310-linux_x86_64.whl
6
+ pydantic==2.10.6
 
 
7
 
8
+ # 2) Main whisper stack — WhisperX with a compatible faster-whisper/CTranslate2 pair (CTranslate2 4.5.0 needs cuDNN 9, pinned below)
 
9
  whisperx==3.7.0
10
  faster-whisper==1.2.0
11
  ctranslate2==4.5.0
12
+ nvidia-cudnn-cu12==9.1.0.70
13
+ # (no 'torch' line — keep the image’s CUDA wheel)
14
 
15
+ # Optional: stable-ts for regroup/edit post-processing
16
+ stable-ts>=2.13.3
 
 
 
 
17
 
18
+ # 3) Extra libs your app really needs
19
  gradio==5.0.1
20
  spaces>=0.19.0
21
+ pyannote.audio>=3.3.1
22
  pandas>=1.5.0
23
  numpy>=1.24.0
24
  librosa>=0.10.0
 
26
  ffmpeg-python>=0.2.0
27
  requests>=2.28.0
28
  webrtcvad>=2.0.10
29
+ boto3
30
+
31
+ # Provide the NVIDIA cuBLAS runtime library expected by the image’s Torch
32
+ nvidia-cublas-cu12>=12.1.3