def main():
    """Run the phonetic feature pipeline over an audio corpus.

    Parses the command-line arguments, validates the audio corpus path,
    processes the corpus into a phonetic matrix, wraps it in a DataFrame
    whose columns are ``PHONETIC_FEATURES``, prints the results and exports
    them to ``args.features_output_path`` (or to
    ``PHONETIC_FEATURES_EXPORT_PATH`` when that argument is empty).

    Exits with status 1 when the corpus path is missing or is not a
    directory.
    """
    args = parse_args()

    # Existence has to be tested first: os.path.isdir() is also False for a
    # missing path, which would make the "doesn't exist" message unreachable.
    if not os.path.exists(args.audio_corpus_path):
        print("Given audio corpus path doesn't exist.")
        sys.exit(1)
    if not os.path.isdir(args.audio_corpus_path):
        print("Given audio corpus path is not a directory")
        sys.exit(1)

    corpus_classes = obtain_corpus_classes(args.audio_corpus_path)

    if args.is_verbose:
        print("CORPUS CLASSES")
        print("------------------------")
        print(corpus_classes)

    phonetic_matrix = process_corpus(args.audio_corpus_path, is_verbose=args.is_verbose)

    df_phonetic_results = pd.DataFrame(phonetic_matrix, columns=PHONETIC_FEATURES)

    print_results(df_phonetic_results)

    # Fall back to the default export path when no output path was given.
    output_path = args.features_output_path or PHONETIC_FEATURES_EXPORT_PATH
    export_dataframe(df_phonetic_results, output_path)
def main():
    """Run the corpus processing step that produces the markers results.

    Parses the command-line arguments, validates the corpus path and the
    optional interjections/expressions configuration paths, processes the
    corpus, prints the results as a DataFrame and exports them to
    ``args.features_output_path`` (or to ``MARKERS_DISTRIBUTION_PATH`` when
    that argument is empty).

    Exits with status 1 when the corpus path is missing or is not a
    directory, or when a given configuration path does not exist.
    """
    args = parse_args()

    # Existence has to be tested first: os.path.isdir() is also False for a
    # missing path, which would make the "doesn't exist" message unreachable.
    if not os.path.exists(args.corpus_path):
        print("Given corpus path doesn't exist.")
        sys.exit(1)
    if not os.path.isdir(args.corpus_path):
        print("Given corpus path is not a directory")
        sys.exit(1)
    # Configuration paths are only validated when they were provided.
    # NOTE(review): args.synonyms_conf_path is passed to process_corpus below
    # but is not validated here like the other two - confirm this is intended.
    if args.interjections_conf_path and not os.path.exists(args.interjections_conf_path):
        print("Given interjections config file path doesn't exist.")
        sys.exit(1)
    if args.expressions_conf_path and not os.path.exists(args.expressions_conf_path):
        print("Given expressions config file path doesn't exist.")
        sys.exit(1)

    corpus_classes = obtain_corpus_classes(args.corpus_path)

    if args.is_verbose:
        print("CORPUS CLASSES")
        print("------------------------")
        print(corpus_classes)

    cleaning_results = process_corpus(args.corpus_path, args.synonyms_conf_path,
                                      args.interjections_conf_path, args.expressions_conf_path, args.is_verbose)

    df_cleaning_results = pd.DataFrame(cleaning_results)

    print_results(df_cleaning_results)

    # Fall back to the default export path when no output path was given.
    output_path = args.features_output_path or MARKERS_DISTRIBUTION_PATH
    export_dataframe(df_cleaning_results, output_path)
def main():
    """Run the POS distribution step over a corpus.

    Parses the command-line arguments, validates the corpus path, processes
    the corpus, prints the results as a DataFrame and exports them to
    ``args.features_output_path`` (or to ``POS_DISTRIBUTION_FEATURES_PATH``
    when that argument is empty).

    Exits with status 1 when the corpus path is missing or is not a
    directory.
    """
    args = parse_args()

    # Existence has to be tested first: os.path.isdir() is also False for a
    # missing path, which would make the "doesn't exist" message unreachable.
    if not os.path.exists(args.corpus_path):
        print("Given corpus path doesn't exist.")
        sys.exit(1)
    if not os.path.isdir(args.corpus_path):
        print("Given corpus path is not a directory")
        sys.exit(1)

    corpus_classes = obtain_corpus_classes(args.corpus_path)

    if args.is_verbose:
        print("CORPUS CLASSES")
        print("------------------------")
        print(corpus_classes)

    pos_distribution = process_corpus(args.corpus_path, args.is_verbose)

    df_pos_distribution = pd.DataFrame(pos_distribution)

    print_results(df_pos_distribution)

    # Fall back to the default export path when no output path was given.
    output_path = args.features_output_path or POS_DISTRIBUTION_FEATURES_PATH
    export_dataframe(df_pos_distribution, output_path)
# Example no. 4
# 0
def main():
    """Run the POS tagging task over a corpus.

    Parses the command-line arguments, validates the corpus path and the
    language code, loads the spaCy model for that language code and
    processes the corpus with it, then prints a completion message.

    Exits with status 1 when the corpus path is missing or is not a
    directory, or when no language code was given.
    """
    args = parse_args()

    # Existence has to be tested first: os.path.isdir() is also False for a
    # missing path, which would make the "doesn't exist" message unreachable.
    if not os.path.exists(args.corpus_path):
        print("Given corpus path doesn't exist.")
        sys.exit(1)
    if not os.path.isdir(args.corpus_path):
        print("Given corpus path is not a directory")
        sys.exit(1)
    if not args.language_code:
        print("Missing language code.")
        sys.exit(1)

    spacy_model = get_spacy_model(language_code=args.language_code)

    corpus_classes = obtain_corpus_classes(args.corpus_path)

    if args.is_verbose:
        print("CORPUS CLASSES")
        print("------------------------")
        print(corpus_classes)

    process_corpus(args.corpus_path,
                   spacy_model,
                   universal_tag=args.universal_tag)

    print("-------------------")
    print("POS tagging task done.")
# Example no. 5
# 0
def main():
    """Process a corpus and print the adjustment results.

    Parses the command-line arguments, validates the corpus path, processes
    the corpus and prints what ``process_corpus`` returns.

    Exits with status 1 when the corpus path is missing or is not a
    directory.
    """
    args = parse_args()

    # Existence has to be tested first: os.path.isdir() is also False for a
    # missing path, which would make the "doesn't exist" message unreachable.
    if not os.path.exists(args.corpus_path):
        print("Given corpus path doesn't exist.")
        sys.exit(1)
    if not os.path.isdir(args.corpus_path):
        print("Given corpus path is not a directory")
        sys.exit(1)

    corpus_classes = obtain_corpus_classes(args.corpus_path)

    if args.is_verbose:
        print("CORPUS CLASSES")
        print("------------------------")
        print(corpus_classes)

    adjustment_results = process_corpus(args.corpus_path, args.is_verbose)

    print_results(adjustment_results)
# Example no. 6
# 0
def main():
    """Process a corpus and print the adjustment results.

    Parses the command-line arguments, validates the corpus path, processes
    the corpus and prints what ``process_corpus`` returns.

    Exits with status 1 when the corpus path is missing or is not a
    directory.
    """
    args = parse_args()

    # Check that the paths are valid. Existence has to be tested first:
    # os.path.isdir() is also False for a missing path, which would make the
    # "doesn't exist" message unreachable.
    if not os.path.exists(args.corpus_path):
        print("Given corpus path doesn't exist.")
        sys.exit(1)
    if not os.path.isdir(args.corpus_path):
        print("Given corpus path is not a directory")
        sys.exit(1)

    # Enumerate the different classes of the dataset (e.g. AD, SD, CTRL, etc.)
    corpus_classes = obtain_corpus_classes(args.corpus_path)

    if args.is_verbose:
        print("CORPUS CLASSES")
        print("------------------------")
        print(corpus_classes)

    adjustment_results = process_corpus(args.corpus_path, args.is_verbose)

    print_results(adjustment_results)