Python DataSet.from_filenames 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: DataSet

클래스/타입: DataSet

메소드/함수: from_filenames

hotexamples.com에서의 예제들: 4

Python DataSet.from_filenames - 4개의 예제가 발견되었습니다. 이것들은 오픈소스 프로젝트에서 추출된 Python의 DataSet.DataSet.from_filenames에 대한 실세계 최고 등급의 예제들입니다. 예제들을 평가하여 예제의 품질 향상에 도움을 줄 수 있습니다.

자주 사용되는 메소드들

보기 숨기기

DataSet(30)

add_input(12)

add_raw(12)

add_seg(11)

add_gt(7)

getEmbedding(5)

getTestNeg(5)

getTrainInstance(4)

heart_sound_scoring(4)

getInstances(4)

getTestInstance(4)

__init__(3)

getExamples(3)

add(3)

getInputs(3)

formatToBinary(3)

build_train_data(2)

add_item(2)

discretize_values(2)

attributes(2)

attribute_types(2)

addExpectedMeta(2)

fileName(2)

from_filenames(2)

generateDataBatch(2)

get_test_data_obo(2)

getAttributes(2)

PreparingData(2)

getMaxValue(1)

getMimeType(1)

info(1)

getLabels(1)

getMinValue(1)

getFeatureEmbedding(1)

getExamplesByClass(1)

getGeometryType(1)

getPixelRes(1)

getMissingIndex(1)

get_image(1)

import_from_csv(1)

headers(1)

get_train_dataBatch(1)

get_time_cnt(1)

get_test_RGB_image(1)

get_node_dim(1)

getTrainingAndTestingSets(1)

getNodes(1)

getTrainValidateTestSet(1)

getTrainTestSet(1)

getTrainAll(1)

예제 #1

파일 보기

def per_sentence_bionlp_fscores_nbest(test_filenames, gold_dir):
    import tempfile
    from DataSet import DataSet
    from cStringIO import StringIO

    gold_dir = path(gold_dir)

    sentences = DataSet.from_filenames(*test_filenames)
    for docid, sentences_in_doc in sentences.group_by_metadata('DOC'):
        # if docid != '9361029':
        # continue

        print 'DOC:', docid
        our_total_proposed = 0
        our_total_matched = 0
        for i, sentence in enumerate(sentences_in_doc):
            for j, parse in enumerate(sentence):
                print "DOC:", docid, 'Sentence:', i, 'Parse:', j
                our_score_components = parse.bionlp_fscore_components(sentence)
                matched, gold, proposed = our_score_components
                our_total_proposed += proposed
                our_total_matched += matched

                conll_version = StringIO()
                parse.write_conll(conll_version,
                                  include_metadata=False,
                                  sentence=sentence)
                conll_version.seek(0)
                conll_version = conll_version.read()

                import BioNLPConversionDB
                converter = BioNLPConversionDB.get_converter()
                bionlp_events_string = converter.convert(conll_version)

                if 0:
                    print 'Events ---'
                    print bionlp_events_string
                    print 'Events ---'

                temp_test_dir = path(tempfile.mkdtemp(prefix=docid + '-'))
                temp_test_filename = path(temp_test_dir / docid + '.a2.t1')
                temp_test_file = file(temp_test_filename, 'w')
                temp_test_file.write(bionlp_events_string)
                temp_test_file.close()
                real_score_components = real_evaluation_bionlp_components(
                    temp_test_dir, gold_dir)
                if our_score_components != real_score_components:
                    real_evaluation_bionlp_components(temp_test_dir,
                                                      gold_dir,
                                                      show_output=True)
                temp_test_dir.rmtree()
                if our_score_components != real_score_components:
                    print "Ours:", our_score_components
                    print 'Real:', real_score_components

                    print 'Events ---'
                    print bionlp_events_string
                    print 'Events ---'
                    raise 'mismatch'

예제 #2

파일 보기

파일: BioNLP.py 프로젝트: lazycrazyowl/ucleed

def per_sentence_bionlp_fscores(test_filename, test_dir, gold_dir):
    import tempfile
    from DataSet import DataSet
    from cStringIO import StringIO
    test_dir = path(test_dir)
    gold_dir = path(gold_dir)

    sentences = DataSet.from_filenames(test_filename)
    for docid, sentences_in_doc in sentences.group_by_metadata('DOC'):
        # if docid != '9015187':
        # if docid != '9081693':
        # if docid != '9257843':
        # if docid != '8108127':
        # if docid != '9115366':
        # if docid != '9361029':
            # continue

        print 'DOC:', docid
        our_total_proposed = 0
        our_total_matched = 0
        for sentence in sentences_in_doc:
            parse = sentence.gold_parse
            sentence.parses = [parse]
            our_score_components = parse.bionlp_fscore_components(sentence)
            matched, gold, proposed = our_score_components
            our_total_proposed += proposed
            our_total_matched += matched

            conll_version = StringIO()
            parse.write_conll(conll_version, include_metadata=False, sentence=sentence)
            conll_version.seek(0)
            conll_version = conll_version.read()

            import BioNLPConversionDB
            converter = BioNLPConversionDB.get_converter()
            bionlp_events_string = converter.convert(conll_version)

            if 1:
                print 'Events ---'
                print bionlp_events_string
                print 'Events ---'
            
            print "Ours:", our_score_components

            temp_test_dir = path(tempfile.mkdtemp(prefix=docid + '-'))
            temp_test_filename = path(temp_test_dir/docid + '.a2.t1')
            temp_test_file = file(temp_test_filename, 'w')
            temp_test_file.write(bionlp_events_string)
            temp_test_file.close()
            real_score_components = real_evaluation_bionlp_components(temp_test_dir, gold_dir)
            print 'Real:', real_score_components 
            if our_score_components != real_score_components:
                real_evaluation_bionlp_components(temp_test_dir, gold_dir, show_output=True)
            temp_test_dir.rmtree()
            if our_score_components != real_score_components:
                raise 'mismatch'

예제 #3

파일 보기

파일: BioNLP.py 프로젝트: lazycrazyowl/ucleed

def per_sentence_bionlp_fscores_nbest(test_filenames, gold_dir):
    import tempfile
    from DataSet import DataSet
    from cStringIO import StringIO

    gold_dir = path(gold_dir)

    sentences = DataSet.from_filenames(*test_filenames)
    for docid, sentences_in_doc in sentences.group_by_metadata('DOC'):
        # if docid != '9361029':
            # continue

        print 'DOC:', docid
        our_total_proposed = 0
        our_total_matched = 0
        for i, sentence in enumerate(sentences_in_doc):
            for j, parse in enumerate(sentence):
                print "DOC:", docid, 'Sentence:', i, 'Parse:', j
                our_score_components = parse.bionlp_fscore_components(sentence)
                matched, gold, proposed = our_score_components
                our_total_proposed += proposed
                our_total_matched += matched

                conll_version = StringIO()
                parse.write_conll(conll_version, include_metadata=False, sentence=sentence)
                conll_version.seek(0)
                conll_version = conll_version.read()

                import BioNLPConversionDB
                converter = BioNLPConversionDB.get_converter()
                bionlp_events_string = converter.convert(conll_version)

                if 0:
                    print 'Events ---'
                    print bionlp_events_string
                    print 'Events ---'

                temp_test_dir = path(tempfile.mkdtemp(prefix=docid + '-'))
                temp_test_filename = path(temp_test_dir/docid + '.a2.t1')
                temp_test_file = file(temp_test_filename, 'w')
                temp_test_file.write(bionlp_events_string)
                temp_test_file.close()
                real_score_components = real_evaluation_bionlp_components(temp_test_dir, gold_dir)
                if our_score_components != real_score_components:
                    real_evaluation_bionlp_components(temp_test_dir, gold_dir, show_output=True)
                temp_test_dir.rmtree()
                if our_score_components != real_score_components:
                    print "Ours:", our_score_components
                    print 'Real:', real_score_components 

                    print 'Events ---'
                    print bionlp_events_string
                    print 'Events ---'
                    raise 'mismatch'

예제 #4

파일 보기

def per_sentence_bionlp_fscores(test_filename, test_dir, gold_dir):
    import tempfile
    from DataSet import DataSet
    from cStringIO import StringIO
    test_dir = path(test_dir)
    gold_dir = path(gold_dir)

    sentences = DataSet.from_filenames(test_filename)
    for docid, sentences_in_doc in sentences.group_by_metadata('DOC'):
        # if docid != '9015187':
        # if docid != '9081693':
        # if docid != '9257843':
        # if docid != '8108127':
        # if docid != '9115366':
        # if docid != '9361029':
        # continue

        print 'DOC:', docid
        our_total_proposed = 0
        our_total_matched = 0
        for sentence in sentences_in_doc:
            parse = sentence.gold_parse
            sentence.parses = [parse]
            our_score_components = parse.bionlp_fscore_components(sentence)
            matched, gold, proposed = our_score_components
            our_total_proposed += proposed
            our_total_matched += matched

            conll_version = StringIO()
            parse.write_conll(conll_version,
                              include_metadata=False,
                              sentence=sentence)
            conll_version.seek(0)
            conll_version = conll_version.read()

            import BioNLPConversionDB
            converter = BioNLPConversionDB.get_converter()
            bionlp_events_string = converter.convert(conll_version)

            if 1:
                print 'Events ---'
                print bionlp_events_string
                print 'Events ---'

            print "Ours:", our_score_components

            temp_test_dir = path(tempfile.mkdtemp(prefix=docid + '-'))
            temp_test_filename = path(temp_test_dir / docid + '.a2.t1')
            temp_test_file = file(temp_test_filename, 'w')
            temp_test_file.write(bionlp_events_string)
            temp_test_file.close()
            real_score_components = real_evaluation_bionlp_components(
                temp_test_dir, gold_dir)
            print 'Real:', real_score_components
            if our_score_components != real_score_components:
                real_evaluation_bionlp_components(temp_test_dir,
                                                  gold_dir,
                                                  show_output=True)
            temp_test_dir.rmtree()
            if our_score_components != real_score_components:
                raise 'mismatch'