Пример #1
0
    def test_align_count(self):
        # Extract term_align features for the first graph pair of the corpus,
        # restricted to node pairs accepted by select_visible_node, and
        # spot-check the alignment counts of a few instances.
        extractor = Extractor(
            Descriptor(term_align),
            node_selector=select_visible_node)

        pair = self.corpus[0]
        instances = extractor.extract(pair)
        self.dump(pair, instances)

        # Feature names, in the order in which they are asserted.
        feature_names = (
            "align_inside_count",
            "source_align_outside_count",
            "target_align_outside_count",
            "source_align_none_count",
            "target_align_none_count",
        )

        # A couple of "interesting" instances: (instance index, expected
        # values listed in the same order as feature_names).
        expectations = (
            # source: 0: top: Posters Partij voor de Dieren verwijderd
            # target: 0: top: Zeeland verwijdert posters Partij voor de Dieren
            (0, (6, 0, 0, 0, 1)),
            # source: 0: top: Posters Partij voor de Dieren verwijderd
            # target: 2: name: Zeeland
            (2, (0, 6, 0, 0, 1)),
            # source: 2: noun: Posters
            # target: 3: verb: verwijdert
            (25, (0, 1, 1, 0, 0)),
        )

        for index, expected_values in expectations:
            for name, expected in zip(feature_names, expected_values):
                self.assertEqual(instances[index][name], expected)
Пример #2
0
    def test_align_count(self):
        # Run the term_align feature extraction on the first graph pair of
        # the corpus (visible nodes only) and verify the alignment counts of
        # a few hand-picked instances.
        term_align_descriptor = Descriptor(term_align)
        extractor = Extractor(
            term_align_descriptor,
            node_selector=select_visible_node,
        )

        first_pair = self.corpus[0]
        instances = extractor.extract(first_pair)
        self.dump(first_pair, instances)

        def check_counts(index, inside, source_outside, target_outside,
                         source_none, target_none):
            # Assert all five alignment-count features of instances[index].
            instance_at = lambda: instances[index]
            self.assertEqual(instance_at()["align_inside_count"], inside)
            self.assertEqual(
                instance_at()["source_align_outside_count"], source_outside)
            self.assertEqual(
                instance_at()["target_align_outside_count"], target_outside)
            self.assertEqual(
                instance_at()["source_align_none_count"], source_none)
            self.assertEqual(
                instance_at()["target_align_none_count"], target_none)

        # check for a couple of "interesting" instances

        # instance: 0
        # source: 0: top: Posters Partij voor de Dieren verwijderd
        # target: 0: top: Zeeland verwijdert posters Partij voor de Dieren
        check_counts(0, inside=6, source_outside=0, target_outside=0,
                     source_none=0, target_none=1)

        # instance: 2
        # source: 0: top: Posters Partij voor de Dieren verwijderd
        # target: 2: name: Zeeland
        check_counts(2, inside=0, source_outside=6, target_outside=0,
                     source_none=0, target_none=1)

        # instance: 25
        # source: 2: noun: Posters
        # target: 3: verb: verwijdert
        check_counts(25, inside=0, source_outside=1, target_outside=1,
                     source_none=0, target_none=0)
Пример #3
0
class TestCornetFeatures(unittest.TestCase):
    """Smoke tests for extracting ``cornet_sim`` features.

    Each test prepares a Cornetto backend (a server proxy, or the locally
    loaded database files) and then runs the feature extractor on the first
    graph pair of the corpus. The results are only printed; no values are
    asserted yet.
    """

    def setUp(self):
        # The corpus path is relative, so the tests must be started from a
        # directory where "../exp/corpora/..." resolves.
        corpus = ParallelGraphCorpus(
            inf="../exp/corpora/news/pgc/ma/2006-11/news-2006-11-aligned-part-00.pgc")
        self.graph_pair = corpus[0]

        # Extractor for the cornet_sim features, limited to node pairs
        # accepted by select_visible_node.
        descriptor = Descriptor(cornet_sim)
        self.feat_extr = Extractor(
            descriptor,
            node_selector=select_visible_node)

    def test_cornet_server(self):
        # Set up the Cornetto server proxy for SERVER before extracting.
        create_cornet_server_proxy(SERVER)

        instances = self.feat_extr.extract(self.graph_pair)
        # Parenthesized single-argument print: same output on Python 2,
        # and valid syntax on Python 3 as well.
        print(instances)
        # FIXME add asserts

    def test_cornet_load(self):
        # Load the Cornetto database files directly instead of using a server.
        print("\n(Loading Cornetto database - may take a long time...)")
        load_cornet(CDB_LU_FNAME, CDB_SYN_FNAME)
        instances = self.feat_extr.extract(self.graph_pair)
        print(instances)