""" Example use of the scorer utility to inspect data. (pre-trained models and already cache files with extracted features are required.)""" from Utility.Scorer import TTSScorer from Utility.path_to_transcript_dicts import * from Utility.storage_config import MODELS_DIR from Utility.storage_config import PREPROCESSING_DIR exec_device = "cuda:8" lang_id = "fon" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join(PREPROCESSING_DIR, "african_voices_fon_alf"), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "hau" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_hausa_cmv" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "lbb" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_ibibio_lst" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "kik" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_kikuyu_opb" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "lin" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_lingala_opb" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "lug" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_ganda_cmv" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "luo" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join(PREPROCESSING_DIR, "african_voices_luo_afv"), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "luo" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join(PREPROCESSING_DIR, "african_voices_luo_opb"), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "swh" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_swahili_llsti" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "sxb" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_suba_afv" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "wol" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_wolof_alf" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "yor" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join( PREPROCESSING_DIR, "african_voices_yoruba_opb" ), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "nya" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join(PREPROCESSING_DIR, "zambezi_voice_nyanja"), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "loz" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join(PREPROCESSING_DIR, "zambezi_voice_lozi"), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "toi" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Massive", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join(PREPROCESSING_DIR, "zambezi_voice_tonga"), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5) lang_id = "shn" tts_scorer = TTSScorer( path_to_model=os.path.join(MODELS_DIR, "ToucanTTS_Finetuning_Shan", "best.pt"), device=exec_device, ) tts_scorer.score( path_to_toucantts_dataset=os.path.join(PREPROCESSING_DIR, "integration_shan"), lang_id=lang_id, ) tts_scorer.show_samples_with_highest_loss(20) tts_scorer.remove_samples_with_highest_loss(5)