|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
import argparse |
|
import random |
|
|
|
from nemo.collections.asr.parts.utils.manifest_utils import create_manifest |
|
|
|
random.seed(42) |
|
|
|
""" |
|
This script creates manifest file for speaker diarization inference purposes. |
|
Useful to get manifest when you have list of audio files and optionally rttm and uem files for evaluation |
|
|
|
Note: make sure basename for each file is unique and rttm files also has the corresponding base name for mapping |
|
""" |
|
|
|
|
|
def main( |
|
wav_path, text_path=None, rttm_path=None, uem_path=None, ctm_path=None, manifest_filepath=None, add_duration=False |
|
): |
|
create_manifest( |
|
wav_path, |
|
manifest_filepath, |
|
text_path=text_path, |
|
rttm_path=rttm_path, |
|
uem_path=uem_path, |
|
ctm_path=ctm_path, |
|
add_duration=add_duration, |
|
) |
|
|
|
|
|
if __name__ == "__main__": |
|
parser = argparse.ArgumentParser() |
|
parser.add_argument( |
|
"--paths2audio_files", help="path to text file containing list of audio files", type=str, required=True |
|
) |
|
parser.add_argument("--paths2txt_files", help="path to text file containing list of transcription files", type=str) |
|
parser.add_argument("--paths2rttm_files", help="path to text file containing list of rttm files", type=str) |
|
parser.add_argument("--paths2uem_files", help="path to uem files", type=str) |
|
parser.add_argument("--paths2ctm_files", help="path to ctm files", type=str) |
|
parser.add_argument("--manifest_filepath", help="path to output manifest file", type=str, required=True) |
|
parser.add_argument( |
|
"--add_duration", help="add duration of audio files to output manifest files.", action='store_true', |
|
) |
|
args = parser.parse_args() |
|
|
|
main( |
|
args.paths2audio_files, |
|
args.paths2txt_files, |
|
args.paths2rttm_files, |
|
args.paths2uem_files, |
|
args.paths2ctm_files, |
|
args.manifest_filepath, |
|
args.add_duration, |
|
) |
|
|