Пример #1
0
 def test_without_spark(self):
     """Merge copied co-occurrence models and validate the merged output.

     ``get_args`` is called with its second argument set to ``True``;
     presumably that flag turns Spark off (per the test name) -- confirm
     against ``get_args``.
     """
     scratch = tempfile.TemporaryDirectory(prefix="merge-coocc-entry-test")
     with scratch as input_dir:
         # Populate the scratch directory with COPIES_NUMBER model copies.
         self.copy_models(models.COOCC, input_dir, COPIES_NUMBER)
         merge_args = get_args(input_dir, True)
         merge_coocc(merge_args)
         self.check_coocc(merge_args.output)
Пример #2
0
    def test_overflow_with_spark(self):
        """Check that merged values stay within ``[0, MAX_INT32]``.

        The first stored value of the first input model is replaced by
        ``MAX_INT32`` minus itself before merging, so the merged result is
        asserted not to exceed ``MAX_INT32`` nor to become negative.
        ``get_args`` is called with its second argument set to ``False``;
        presumably that keeps Spark enabled (per the test name) -- confirm
        against ``get_args``.
        """
        scratch = tempfile.TemporaryDirectory(prefix="merge-coocc-entry-test")
        with scratch as input_dir:
            self.copy_models(models.COOCC, input_dir, COPIES_NUMBER)
            args = get_args(input_dir, False)
            first_input = args.input[0]

            # Push one stored value close to the int32 ceiling and persist
            # the modified model back to the same path.
            inflated = Cooccurrences().load(first_input)
            inflated.matrix.data[0] = MAX_INT32 - inflated.matrix.data[0]
            inflated.save(first_input)

            merge_coocc(args)

            merged_values = Cooccurrences().load(args.output).matrix.data
            self.assertTrue(numpy.all(merged_values <= MAX_INT32))
            self.assertTrue(numpy.all(merged_values >= 0))