Example #1
0
 def setUpClass(self):
     # Fake models! Only made so we can do unittests
     vm = shVM('tests/w2vModels/*.w2v', useCache=False)
     results, links = vm.trackClouds('x')
     agg = shVA(yearsInInterval=1)
     aggResults, aggMetadata = agg.aggregate(results)
     self.embedded = doSpaceEmbedding(vm, results, aggMetadata)
Example #2
0
 def setUpClass(self):
     # Fake models! Only made so we can do unittests
     vm = shVM('tests/w2vModels/*.w2v', useCache=False)
     results, links = vm.trackClouds('x')
     agg = shVA(yearsInInterval=1)
     aggResults, aggMetadata = agg.aggregate(results)
     self.embedded = doSpaceEmbedding(vm, results, aggMetadata)
Example #3
0
 def testWordsPerYear(self):
     '''Test that aggregator produces the correct number of results'''
     nWordsPerYear = 5
     agg = shVA(nWordsPerYear=nWordsPerYear)
     aggData, _ = agg.aggregate(self._data)
     for words in aggData.itervalues():
         self.assertEqual(len(words), nWordsPerYear,
                          'Each year should have %d words ' % nWordsPerYear)
Example #4
0
 def testWordsPerYear(self):
     '''Test that aggregator produces the correct number of results'''
     nWordsPerYear = 5
     agg = shVA(nWordsPerYear=nWordsPerYear)
     aggData, _ = agg.aggregate(self._data)
     for words in aggData.itervalues():
         self.assertEqual(len(words), nWordsPerYear,
                          'Each year should have %d words ' % nWordsPerYear)
Example #5
0
    def testWeightingFunctions(self):
        '''Test that VocabularyAggregator supports weighting functions and fails
        for unsupported ones.'''
        for f in ['Gaussian', 'JSD', 'Linear']:
            try:
                agg = shVA(weighF=f)
                agg.aggregate(self._data)
            except:
                self.fail(f + ' should be a valid function')

        try:
            agg = shVA(weighF=lambda t1, t2: 0)
            agg.aggregate(self._data)
        except:
            self.fail('Lambda function should be a valid function')

        with self.assertRaises(Exception):
            agg = shVA(weighF='Unknown')
            agg.aggregate(self._data)
Example #6
0
    def testWeightingFunctions(self):
        '''Test that VocabularyAggregator supports weighting functions and fails
        for unsupported ones.'''
        for f in ['Gaussian', 'JSD',  'Linear']:
            try:
                agg = shVA(weighF=f)
                agg.aggregate(self._data)
            except:
                self.fail(f + ' should be a valid function')

        try:
            agg = shVA(weighF=lambda t1, t2: 0)
            agg.aggregate(self._data)
        except:
            self.fail('Lambda function should be a valid function')

        with self.assertRaises(Exception):
            agg = shVA(weighF='Unknown')
            agg.aggregate(self._data)
Example #7
0
    def testYearsInInterval(self):
        '''Test aggregator reduces the number of intervals produced when
        such intervals are longer'''
        agg = shVA(yearsInInterval=1)
        aggData, _ = agg.aggregate(self._data)
        self.assertEqual(len(aggData.keys()), len(self._data),
                         'Should have same number of keys as original data')

        agg = shVA(yearsInInterval=2)
        aggData, _ = agg.aggregate(self._data)
        self.assertEqual(len(aggData.keys()), len(self._data)/2,
                         'Should have 1/2 the number of keys as original data')

        agg = shVA(yearsInInterval=len(self._data))
        aggData, _ = agg.aggregate(self._data)
        self.assertEqual(len(aggData.keys()), 1,
                         'Should have only 1 key')

        agg = shVA(yearsInInterval=2 * len(self._data))
        aggData, _ = agg.aggregate(self._data)
        self.assertEqual(len(aggData.keys()), 1,
                         'Should have only 1 key, containing all years')
Example #8
0
    def testTimePeriods(self):
        '''Test aggregator produces metadata'''
        agg = shVA(yearsInInterval=1, yIntervalFreq=1)
        data, times = agg.aggregate(self._data)
        self.assertEqual(len(data), len(times),
                         'Should have same number of keys')
        self.assertTrue(data.keys() == times.keys(), 'Should be the same keys')

        yearsInInterval = 2
        agg = shVA(yearsInInterval=yearsInInterval, yIntervalFreq=1)
        _, times = agg.aggregate(self._data)
        for year, values in times.iteritems():
            self.assertEqual(
                len(values), yearsInInterval,
                'Should have equal number of years in interval '
                'but %s does not' % year)

        agg1 = shVA(yearsInInterval=yearsInInterval, yIntervalFreq=1)
        agg2 = shVA(yearsInInterval=yearsInInterval, yIntervalFreq=2)
        _, times1 = agg1.aggregate(self._data)
        _, times2 = agg2.aggregate(self._data)
        self.assertGreater(len(times1), len(times2),
                           'Should have more intervals')
Example #9
0
    def testYearsInInterval(self):
        '''Test aggregator reduces the number of intervals produced when
        such intervals are longer'''
        agg = shVA(yearsInInterval=1)
        aggData, _ = agg.aggregate(self._data)
        self.assertEqual(len(aggData.keys()), len(self._data),
                         'Should have same number of keys as original data')

        agg = shVA(yearsInInterval=2)
        aggData, _ = agg.aggregate(self._data)
        self.assertEqual(
            len(aggData.keys()),
            len(self._data) / 2,
            'Should have 1/2 the number of keys as original data')

        agg = shVA(yearsInInterval=len(self._data))
        aggData, _ = agg.aggregate(self._data)
        self.assertEqual(len(aggData.keys()), 1, 'Should have only 1 key')

        agg = shVA(yearsInInterval=2 * len(self._data))
        aggData, _ = agg.aggregate(self._data)
        self.assertEqual(len(aggData.keys()), 1,
                         'Should have only 1 key, containing all years')
Example #10
0
    def testTimePeriods(self):
        '''Test aggregator produces metadata'''
        agg = shVA(yearsInInterval=1, yIntervalFreq=1)
        data, times = agg.aggregate(self._data)
        self.assertEqual(len(data), len(times),
                         'Should have same number of keys')
        self.assertTrue(data.keys() == times.keys(),
                        'Should be the same keys')

        yearsInInterval = 2
        agg = shVA(yearsInInterval=yearsInInterval, yIntervalFreq=1)
        _, times = agg.aggregate(self._data)
        for year, values in times.iteritems():
            self.assertEqual(len(values), yearsInInterval,
                             'Should have equal number of years in interval '
                             'but %s does not' % year)

        agg1 = shVA(yearsInInterval=yearsInInterval, yIntervalFreq=1)
        agg2 = shVA(yearsInInterval=yearsInInterval, yIntervalFreq=2)
        _, times1 = agg1.aggregate(self._data)
        _, times2 = agg2.aggregate(self._data)
        self.assertGreater(len(times1), len(times2),
                           'Should have more intervals')