Skip to content

Commit 1caddfb

Browse files
authored
Merge pull request #225 from m-bain/v3
V3
2 parents b666523 + 7ad554c commit 1caddfb

File tree

12 files changed

+1222
-1249
lines changed

12 files changed

+1222
-1249
lines changed

README.md

Lines changed: 123 additions & 67 deletions
Large diffs are not rendered by default.

requirements.txt

Lines changed: 7 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -1,10 +1,8 @@
1-
numpy
2-
pandas
3-
torch >=1.9
4-
torchaudio >=0.10,<1.0
5-
tqdm
6-
more-itertools
7-
transformers>=4.19.0
1+
torch==2.0.0
2+
torchaudio==2.0.1
3+
faster-whisper
4+
transformers
85
ffmpeg-python==0.2.0
9-
pyannote.audio
10-
openai-whisper==20230314
6+
pandas
7+
setuptools==65.6.3
8+
nltk

setup.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -6,8 +6,8 @@
66
setup(
77
name="whisperx",
88
py_modules=["whisperx"],
9-
version="2.0.1",
10-
description="Time-Accurate Automatic Speech Recognition using Whisper.",
9+
version="3.1.0",
10+
description="Time-Accurate Automatic Speech Recognition.",
1111
readme="README.md",
1212
python_requires=">=3.8",
1313
author="Max Bain",
@@ -19,7 +19,7 @@
1919
for r in pkg_resources.parse_requirements(
2020
open(os.path.join(os.path.dirname(__file__), "requirements.txt"))
2121
)
22-
],
22+
] + ["pyannote.audio @ git+https://github.com/pyannote/pyannote-audio@11b56a137a578db9335efc00298f6ec1932e6317"],
2323
entry_points = {
2424
'console_scripts': ['whisperx=whisperx.transcribe:cli'],
2525
},

whisperx/__init__.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,4 @@
1-
from .transcribe import transcribe, transcribe_with_vad
1+
from .transcribe import load_model
22
from .alignment import load_align_model, align
3-
from .vad import load_vad_model
3+
from .audio import load_audio
4+
from .diarize import assign_word_speakers, DiarizationPipeline

0 commit comments

Comments
 (0)