Python Decoder.decodeAudio 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: Decoder

클래스/타입: Decoder

메소드/함수: decodeAudio

hotexamples.com에서의 예제들: 2

Python Decoder.decodeAudio - 2개의 예제를 찾았습니다. 오픈소스 프로젝트에서 추출한, Python의 Decoder.Decoder.decodeAudio에 대한 실제 사용 예제 중 평점이 가장 높은 것들입니다. 예제를 평가해 주시면 예제의 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

Decoder(30)

parameters(13)

decode(11)

load_state_dict(10)

state_dict(8)

decoder(7)

cuda(5)

eval(4)

train(4)

to(3)

beamSearch(3)

generate(3)

DecodeMessage(2)

pretrain(2)

forward(2)

fix_row(2)

inference(2)

save_weights(2)

decode_all_frames(2)

decodeAudio(2)

apply(2)

advance(2)

save(1)

get_sequence_output(1)

show_decoding_table(1)

run_logstash(1)

show_stats(1)

path2ResultWordList(1)

load_weights(1)

vector2state(1)

load_memory(1)

init_decoder_step_input(1)

DecodeAllLevelsString(1)

getJoystickM1(1)

get_most_likely(1)

do_tests(1)

DecodeString(1)

_decode_samples(1)

answer(1)

checkCRC(1)

dcd(1)

decodeWithOracle(1)

decoder_tag(1)

forward_with_action(1)

getStatus(1)

generate_with_action(1)

getData(1)

getJoyStickPB1(1)

getJoystickM2(1)

getJoystickPB2(1)

예제 #1

파일 보기

파일: doitOneChunk.py 프로젝트: xrick/AlignmentDuration

def alignOneChunk(lyrics, withSynthesis, withOracle, lyricsWithModelsORacle, listNonVocalFragments, alpha, usePersistentFiles, tokenLevelAlignedSuffix,  URIrecordingNoExt, currSectionLink, htkParser):
    '''
    Top-most wrapper: align one chunk of a recording, or reload a stored result.

    The chunk is identified by ``URIrecordingNoExt`` plus the begin/end
    timestamps of ``currSectionLink``. If the token-level alignment file for
    that chunk already exists, nothing is decoded and the stored results are
    read back instead.

    Parameters:
        lyrics: forwarded to loadSmallAudioFragment.
        withSynthesis: truthy/falsy flag, forwarded as bool to
            loadSmallAudioFragment. Forced to 1 when withOracle is truthy.
        withOracle: when truthy, decoding uses decoder.decodeWithOracle and the
            stored path file is expected to end in '.path_oracle'.
        lyricsWithModelsORacle: passed to decoder.decodeWithOracle
            (only used when withOracle is truthy).
        listNonVocalFragments: passed to decoder.decodeAudio.
        alpha: passed to the Decoder constructor.
        usePersistentFiles: the string 'True' or 'False', or an actual bool.
            Only inspected when decoding takes place.
        tokenLevelAlignedSuffix: suffix of the token-level alignment file.
        URIrecordingNoExt: URI of the recording, without extension.
        currSectionLink: object providing beginTs and endTs.
        htkParser: forwarded to loadSmallAudioFragment.

    Returns:
        tuple (detectedTokenList, detectedPath, phiOptPath). phiOptPath is 0
        when the result was loaded from files, since it is not stored there.

    Raises:
        SystemExit: via sys.exit, if usePersistentFiles is neither a bool nor
            one of the strings 'True' / 'False' (checked on the decode path only).
    '''
    if withOracle:
        # synthesis is not really needed in this setting. workaround, because
        # without synthesis the whole recording is taken
        withSynthesis = 1

    URIRecordingChunkResynthesizedNoExt = URIrecordingNoExt + "_" + str(currSectionLink.beginTs) + '_' + str(currSectionLink.endTs)
    detectedAlignedfileName = URIRecordingChunkResynthesizedNoExt + tokenLevelAlignedSuffix

    if os.path.isfile(detectedAlignedfileName):
        # Result already on disk: read it back instead of decoding again.
        # Single-argument print(...) emits the same text on Python 2 and 3.
        print("{}\n already exists. No decoding".format(detectedAlignedfileName))
        detectedTokenList = readListOfListTextFile(detectedAlignedfileName)
        if withOracle:
            outputURI = URIRecordingChunkResynthesizedNoExt + '.path_oracle'
        else:
            outputURI = URIRecordingChunkResynthesizedNoExt + '.path'
        detectedPath = readListTextFile(outputURI)

        # TODO: store persistently
        phiOptPath = 0
        return detectedTokenList, detectedPath, phiOptPath

    ###### extract audio features
    # The third returned value (URI of the recording chunk) is not needed here.
    lyricsWithModels, obsFeatures, _ = loadSmallAudioFragment(lyrics, 'dummyExtractedPitchList', URIrecordingNoExt, URIRecordingChunkResynthesizedNoExt, bool(withSynthesis), currSectionLink, htkParser)

    decoder = Decoder(lyricsWithModels, URIRecordingChunkResynthesizedNoExt, alpha)

    #################### decode
    # Accept real booleans as well as their string spellings; previously a
    # genuine True/False was rejected by the very check that asks for them.
    if not isinstance(usePersistentFiles, bool):
        if usePersistentFiles == 'True':
            usePersistentFiles = True
        elif usePersistentFiles == 'False':
            usePersistentFiles = False
        else:
            sys.exit("usePersistentFiles can be only True or False")

    if withOracle:
        detectedTokenList = decoder.decodeWithOracle(lyricsWithModelsORacle, URIRecordingChunkResynthesizedNoExt )
    else:
        detectedTokenList = decoder.decodeAudio(obsFeatures, listNonVocalFragments, usePersistentFiles)

    # Both path attributes are read after decoding, before the result is written out.
    phiOptPath = decoder.path.phiOptPath
    detectedPath = decoder.path.pathRaw
    tokenList2TabFile(detectedTokenList, URIRecordingChunkResynthesizedNoExt, tokenLevelAlignedSuffix, currSectionLink.beginTs)

    return detectedTokenList, detectedPath, phiOptPath

예제 #2

파일 보기

파일: LyricsAligner.py 프로젝트: xrick/AlignmentDuration

    def alignLyricsSection(self, extractedPitchList, listNonVocalFragments,
                           tokenLevelAlignedSuffix, currSectionLink):
        '''
        Align the lyrics of one section, or load a previously stored alignment.

        If the token-level alignment file of the section's recording chunk
        already exists, the stored result is read with self.read_decoded.
        Otherwise features are loaded, note onsets are prepared, the audio is
        decoded, and (if ParametersAlgo.WRITE_TO_FILE) the output is written.

        Returns a tuple (detectedTokenList, detectedPath, phiOptPath). On the
        decoding path phiOptPath is the empty string, as it is never assigned
        there.
        '''
        chunkURINoExt = currSectionLink.URIRecordingChunk
        alignedFileURI = chunkURINoExt + tokenLevelAlignedSuffix

        # Both collaborators are created up front, regardless of whether
        # decoding will actually be needed.
        featureExtractor = FeatureExtractor(self.path_to_hcopy, currSectionLink)
        noteOnsetDetector = OnsetDetector(currSectionLink)

        if os.path.isfile(alignedFileURI):
            # do not decode, read from file
            tokens, phi, rawPath = self.read_decoded(chunkURINoExt,
                                                     alignedFileURI)
            return tokens, rawPath, phi

        textGridStart = -1
        textGridEnd = -1

        if ParametersAlgo.WITH_ORACLE_PHONEMES:
            # oracle phonemes: ask the user to confirm before continuing
            raw_input(
                'implemented only for Kimseye...! Continue only if working with Kimseye'
            )
            if ParametersAlgo.FOR_MAKAM:
                textGridStart = 0
                textGridEnd = 20.88  # for kimseye etmem
            firstSyllable = 0
            lastSyllable = 10
            currSectionLink.loadSmallAudioFragmentOracle(
                self.model, firstSyllable, lastSyllable)
            # featureVectors is an alias for LyricsWithModelsOracle here
            featureExtractor.featureVectors = currSectionLink.lyricsWithModels
        else:
            # extract audio features
            featureExtractor.featureVectors = currSectionLink.loadSmallAudioFragment(
                featureExtractor, extractedPitchList,
                self.recording.recordingNoExtURI, self.model)

        #################### decode
        decoder = Decoder(currSectionLink, currSectionLink.lyricsWithModels,
                          chunkURINoExt)

        # Prepare note onsets; the original comment notes that the result is
        # stored in files which are used in decoding.
        oracleOnsetsMode = ParametersAlgo.WITH_ORACLE_ONSETS
        if oracleOnsetsMode == 1:
            recordingDir = os.path.dirname(self.recording.recordingNoExtURI)
            onsetsURI = os.path.join(
                recordingDir, ParametersAlgo.ANNOTATION_RULES_ONSETS_EXT)
            noteOnsetDetector.parseNoteOnsetsGrTruth(onsetsURI)
        elif oracleOnsetsMode == 0:
            noteOnsetDetector.extractNoteOnsets(chunkURINoExt + '.wav')

        decodedTokens = decoder.decodeAudio(featureExtractor,
                                            noteOnsetDetector,
                                            listNonVocalFragments,
                                            textGridStart, textGridEnd)
        # shift the tokens by the section's begin timestamp
        tokens = addTimeShift(decodedTokens, currSectionLink.beginTs)

        rawPath = decoder.path.pathRaw

        # write all decoded output persistently to files
        if ParametersAlgo.WRITE_TO_FILE:
            self.write_decoded_to_file(tokenLevelAlignedSuffix, chunkURINoExt,
                                       decoder.path.phiPathLikelihood, tokens)

        return tokens, rawPath, ''