|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  | import argparse | 
					
						
						|  | import random | 
					
						
						|  |  | 
					
						
						|  | from nemo.collections.asr.parts.utils.manifest_utils import create_manifest | 
					
						
						|  |  | 
					
						
						|  | random.seed(42) | 
					
						
						|  |  | 
					
						
						|  | """ | 
					
						
						|  | This script creates a manifest file for speaker diarization inference. | 
					
						
						|  | It is useful when you have a list of audio files and, optionally, rttm and uem files for evaluation. | 
					
						
						|  |  | 
					
						
						|  | Note: make sure the basename of each file is unique and that the rttm files also have the corresponding basenames for mapping. | 
					
						
						|  | """ | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  | def main( | 
					
						
						|  | wav_path, text_path=None, rttm_path=None, uem_path=None, ctm_path=None, manifest_filepath=None, add_duration=False | 
					
						
						|  | ): | 
					
						
						|  | create_manifest( | 
					
						
						|  | wav_path, | 
					
						
						|  | manifest_filepath, | 
					
						
						|  | text_path=text_path, | 
					
						
						|  | rttm_path=rttm_path, | 
					
						
						|  | uem_path=uem_path, | 
					
						
						|  | ctm_path=ctm_path, | 
					
						
						|  | add_duration=add_duration, | 
					
						
						|  | ) | 
					
						
						|  |  | 
					
						
						|  |  | 
					
						
						|  | if __name__ == "__main__": | 
					
						
						|  | parser = argparse.ArgumentParser() | 
					
						
						|  | parser.add_argument( | 
					
						
						|  | "--paths2audio_files", help="path to text file containing list of audio files", type=str, required=True | 
					
						
						|  | ) | 
					
						
						|  | parser.add_argument("--paths2txt_files", help="path to text file containing list of transcription files", type=str) | 
					
						
						|  | parser.add_argument("--paths2rttm_files", help="path to text file containing list of rttm files", type=str) | 
					
						
						|  | parser.add_argument("--paths2uem_files", help="path to uem files", type=str) | 
					
						
						|  | parser.add_argument("--paths2ctm_files", help="path to ctm files", type=str) | 
					
						
						|  | parser.add_argument("--manifest_filepath", help="path to output manifest file", type=str, required=True) | 
					
						
						|  | parser.add_argument( | 
					
						
						|  | "--add_duration", help="add duration of audio files to output manifest files.", action='store_true', | 
					
						
						|  | ) | 
					
						
						|  | args = parser.parse_args() | 
					
						
						|  |  | 
					
						
						|  | main( | 
					
						
						|  | args.paths2audio_files, | 
					
						
						|  | args.paths2txt_files, | 
					
						
						|  | args.paths2rttm_files, | 
					
						
						|  | args.paths2uem_files, | 
					
						
						|  | args.paths2ctm_files, | 
					
						
						|  | args.manifest_filepath, | 
					
						
						|  | args.add_duration, | 
					
						
						|  | ) | 
					
						
						|  |  |