# transcribe_recordings.py
# Forked from MahmoudAshraf97/whisper-diarization.
import os
import subprocess
# Folder that is searched recursively for MP3 recordings. It is a relative
# path, so it is resolved against the current working directory.
root_dir = r"recordings"


def find_mp3_files(search_root):
    """Yield ``(mp3_path, wav_path)`` for every MP3 file under *search_root*.

    The tree is traversed with ``os.walk``. ``wav_path`` is the MP3 path with
    its extension replaced by ``.wav`` (same directory, same base name).

    The extension comparison is case-insensitive so that files named
    ``*.MP3`` are picked up as well.
    """
    for dirpath, _dirnames, filenames in os.walk(search_root):
        for file_name in filenames:
            base, ext = os.path.splitext(file_name)
            if ext.lower() != ".mp3":
                continue
            yield (
                os.path.join(dirpath, file_name),
                os.path.join(dirpath, f"{base}.wav"),
            )


def ffmpeg_command(mp3_path, wav_path):
    """Return the ffmpeg argument list that converts *mp3_path* to *wav_path*.

    The output is encoded with the ``pcm_u8`` codec at a 22050 Hz sample rate.
    """
    return [
        r"ffmpeg.exe",
        # Overwrite an existing output file instead of stopping at ffmpeg's
        # interactive "Overwrite? [y/N]" prompt, which would stall the batch
        # whenever the script is re-run.
        "-y",
        "-i",
        mp3_path,
        "-acodec",
        "pcm_u8",
        "-ar",
        "22050",
        wav_path,
    ]


def diarize_command(wav_path):
    """Return the argument list that runs ``diarize.py`` on *wav_path*.

    ``diarize.py`` is given as a relative path, so it must be reachable from
    the current working directory. It is started through the ``py`` launcher.
    """
    return [
        "py",
        "diarize.py",
        "-a",
        wav_path,
        "--no-stem",
        "--whisper-model",
        "large-v3",
        "--language",
        "en",
        "--device",
        "cuda",
    ]


def main():
    """Convert every MP3 under ``root_dir`` to WAV and run diarization on it.

    Processing is best-effort: a failure on one recording is reported and the
    loop moves on to the next file instead of aborting the whole batch.
    """
    for mp3_path, wav_path in find_mp3_files(root_dir):
        print(wav_path)

        conversion = subprocess.run(ffmpeg_command(mp3_path, wav_path))
        if conversion.returncode != 0:
            # Without a fresh WAV file there is nothing valid to diarize.
            print(
                f"ffmpeg failed (exit code {conversion.returncode}) for "
                f"{mp3_path}; skipping diarization"
            )
            continue

        diarization = subprocess.run(diarize_command(wav_path))
        if diarization.returncode != 0:
            print(
                f"diarize.py failed (exit code {diarization.returncode}) "
                f"for {wav_path}"
            )


if __name__ == "__main__":
    main()