Exemple #1
0
def test_append_uri_2():
    """Check ``append_uri`` when the base URI already ends with a slash.

    The expected value is the plain concatenation of the URI and the file
    name.
    """
    from utilities.utilities import Utilities

    helper = Utilities()
    bucket_uri = 'gs://foo/bar/'
    file_name = 'this.wav'

    # The URI already ends in '/', so plain concatenation is the expectation.
    assert helper.append_uri(bucket_uri, file_name) == bucket_uri + file_name

    if not local_files_path:
        # Get list of all files in google cloud storage (gcs) bucket
        gcs = GCS()
        raw_file_list = gcs.get_file_list(cloud_store_uri)
    else:
        raw_file_list = utilities.local_files(local_files_path)

    logger.debug(f'RAW FILE LIST: {raw_file_list}')

    # Filter file list
    filtered_file_list = utilities.filter_files(raw_file_list, only_transcribe)

    if not local_files_path:
        final_file_list = [utilities.append_uri(cloud_store_uri, file) for file in filtered_file_list]
    else:
        final_file_list = filtered_file_list

    logger.debug(f'FINAL FILE LIST: {final_file_list}')

    # if only doing transcriptions, add diarization and punctuation?
    dia = False
    punct = False
    c = None
    if only_transcribe:
        dia = input('Add Diarization Y/N ')
        if dia.lower() == 'y':
            c = input('How many speakers (int) ')
            configuration.set_diarizationSpeakerCount(int(c))
            configuration.set_enableSpeakerDiarization(bool(dia))