def run_train_lm(args, download_dictionaries=None): if not args.dictionary_path: args.dictionary_path = None if download_dictionaries is None: download_dictionaries = get_available_dict_languages() args.source_path = args.source_path.rstrip('/').rstrip('\\') validate_args(args, download_dictionaries) train_lm(args)
def run_validate_corpus(args, download_dictionaries=None): if download_dictionaries is None: download_dictionaries = get_available_dict_languages() try: args.speaker_characters = int(args.speaker_characters) except ValueError: pass validate_args(args, download_dictionaries) validate_corpus(args)
def run_train_ivector_extractor(args, download_dictionaries=None): if download_dictionaries is None: download_dictionaries = get_available_dict_languages() try: args.speaker_characters = int(args.speaker_characters) except ValueError: pass args.corpus_directory = args.corpus_directory.rstrip('/').rstrip('\\') validate_args(args, download_dictionaries) train_ivector(args)
def run_train_dictionary(args, downloaded_acoustic_models=None, download_dictionaries=None): if downloaded_acoustic_models is None: downloaded_acoustic_models = get_available_acoustic_languages() if download_dictionaries is None: download_dictionaries = get_available_dict_languages() try: args.speaker_characters = int(args.speaker_characters) except ValueError: pass args.output_directory = args.output_directory.rstrip('/').rstrip('\\') args.corpus_directory = args.corpus_directory.rstrip('/').rstrip('\\') validate_args(args, downloaded_acoustic_models, download_dictionaries) train_dictionary(args)
def run_train_corpus(args, unknown_args=None, download_dictionaries=None): if download_dictionaries is None: download_dictionaries = get_available_dict_languages() try: args.speaker_characters = int(args.speaker_characters) except ValueError: pass if not args.output_model_path: args.output_model_path = None args.output_directory = args.output_directory.rstrip('/').rstrip('\\') args.corpus_directory = args.corpus_directory.rstrip('/').rstrip('\\') validate_args(args, download_dictionaries) align_corpus(args, unknown_args)
def unfix_path(): if sys.platform == 'win32': sep = ';' os.environ['PATH'] = sep.join(os.environ['PATH'].split(sep)[1:]) else: sep = ':' os.environ['PATH'] = sep.join(os.environ['PATH'].split(sep)[1:]) os.environ['LD_LIBRARY_PATH'] = sep.join(os.environ['PATH'].split(sep)[1:]) acoustic_languages = get_available_acoustic_languages() lm_languages = get_available_lm_languages() g2p_languages = get_available_g2p_languages() dict_languages = get_available_dict_languages() parser = argparse.ArgumentParser() subparsers = parser.add_subparsers(dest="subcommand") subparsers.required = True align_parser = subparsers.add_parser('align') align_parser.add_argument('corpus_directory', help='Full path to the directory to align') align_parser.add_argument('dictionary_path', help='Full path to the pronunciation dictionary to use') align_parser.add_argument('acoustic_model_path', help='Full path to the archive containing pre-trained model or language ({})'.format( ', '.join(acoustic_languages))) align_parser.add_argument('output_directory', help="Full path to output directory, will be created if it doesn't exist") align_parser.add_argument('--config_path', type=str, default='',
def run_train_g2p(args, download_dictionaries=None): if download_dictionaries is None: download_dictionaries = get_available_dict_languages() validate(args, download_dictionaries) train_g2p(args)