Merge pull request #107 from tillhanke/main
Add `--num-speakers` as a command-line option to scraibe
This commit is contained in:
+9
-2
@@ -79,6 +79,8 @@ def cli():
|
|||||||
choices=sorted(
|
choices=sorted(
|
||||||
LANGUAGES.keys()) + sorted([k.title() for k in TO_LANGUAGE_CODE.keys()]),
|
LANGUAGES.keys()) + sorted([k.title() for k in TO_LANGUAGE_CODE.keys()]),
|
||||||
help="Language spoken in the audio. Specify None to perform language detection.")
|
help="Language spoken in the audio. Specify None to perform language detection.")
|
||||||
|
parser.add_argument("--num-speakers", type=int, default=2,
|
||||||
|
help="Number of speakers in the audio.")
|
||||||
|
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
|
|
||||||
@@ -117,8 +119,13 @@ def cli():
|
|||||||
else:
|
else:
|
||||||
task = "transcribe"
|
task = "transcribe"
|
||||||
|
|
||||||
out = model.autotranscribe(audio, task=task, language=arg_dict.pop(
|
out = model.autotranscribe(
|
||||||
"language"), verbose=arg_dict.pop("verbose_output"))
|
audio,
|
||||||
|
task=task,
|
||||||
|
language=arg_dict.pop("language"),
|
||||||
|
verbose=arg_dict.pop("verbose_output"),
|
||||||
|
num_speakers=arg_dict.pop("num_speakers")
|
||||||
|
)
|
||||||
basename = audio.split("/")[-1].split(".")[0]
|
basename = audio.split("/")[-1].split(".")[0]
|
||||||
print(f'Saving {basename}.{out_format} to {out_folder}')
|
print(f'Saving {basename}.{out_format} to {out_folder}')
|
||||||
out.save(os.path.join(
|
out.save(os.path.join(
|
||||||
|
|||||||
Reference in New Issue
Block a user