def run_query(self):
     config = self.kwargs['config']
     path = self.kwargs['path']
     stop_check = self.kwargs['stop_check']
     call_back = self.kwargs['call_back']
     call_back('Enriching speakers...')
     call_back(0,0)
     with CorpusContext(config) as c:
         enrich_speakers_from_csv(c, path)
         self.actionCompleted.emit('enriching speakers')
         
     return True
예제 #2
0
    def run_query(self):
        config = self.kwargs['config']
        path = self.kwargs['path']
        stop_check = self.kwargs['stop_check']
        call_back = self.kwargs['call_back']
        call_back('Enriching speakers...')
        call_back(0, 0)
        with CorpusContext(config) as c:
            enrich_speakers_from_csv(c, path)
            self.actionCompleted.emit('enriching speakers')

        return True
예제 #3
0
def test_speaker_enrichment_csv(fave_corpus_config, csv_test_dir):
    path = os.path.join(csv_test_dir, 'fave_speaker_info.txt')
    with CorpusContext(fave_corpus_config) as c:
        enrich_speakers_from_csv(c, path)

        q = c.query_graph(c.phone).filter(c.phone.speaker.is_interviewer == True)

        q = q.columns(c.phone.label.column_name('label'),
                      c.phone.speaker.name.column_name('speaker'))

        res = q.all()

        assert (all(x['speaker'] == 'Interviewer' for x in res))
예제 #4
0
def test_speaker_enrichment(fave_corpus_config, csv_test_dir):
    path = os.path.join(csv_test_dir, 'fave_speaker_info.txt')
    with CorpusContext(fave_corpus_config) as c:
        enrich_speakers_from_csv(c, path)

        q = c.query_graph(c.phone).filter(c.phone.speaker.is_interviewer == True)

        q = q.columns(c.phone.label.column_name('label'),
                    c.phone.speaker.name.column_name('speaker'))

        res = q.all()

        assert(all(x['speaker'] == 'Interviewer' for x in res))
예제 #5
0
def speaker_enrichment(config, speaker_file):
    if not os.path.exists(speaker_file):
        print('Could not find {}, skipping speaker enrichment.'.format(speaker_file))
        return
    with CorpusContext(config) as g:
        if not g.hierarchy.has_speaker_property('gender'):
            begin = time.time()
            enrich_speakers_from_csv(g, speaker_file)
            time_taken = time.time() - begin
            print('Speaker enrichment took: {}'.format(time.time() - begin))
            save_performance_benchmark(config, 'speaker_enrichment', time_taken)
        else:
            print('Speaker enrichment already done, skipping.')