def test_without_spark(self):
    """Merge copied co-occurrence models and validate the merged output.

    COPIES_NUMBER copies of ``models.COOCC`` are placed in a temporary
    directory, ``merge_coocc`` is run over them, and the file at
    ``args.output`` is verified with ``self.check_coocc``.
    """
    tmp_prefix = "merge-coocc-entry-test"
    with tempfile.TemporaryDirectory(prefix=tmp_prefix) as workdir:
        self.copy_models(models.COOCC, workdir, COPIES_NUMBER)
        # NOTE(review): the second argument is presumably the "no spark"
        # switch (per the test name) -- confirm against get_args.
        merge_args = get_args(workdir, True)
        merge_coocc(merge_args)
        self.check_coocc(merge_args.output)
def test_overflow_with_spark(self):
    """Check that merged values stay within [0, MAX_INT32].

    The first stored value of the first input model is replaced with
    ``MAX_INT32 - value`` and the model is saved back in place, so the
    merge works with a value close to the int32 limit. After
    ``merge_coocc`` runs, every stored value of the resulting matrix must
    be non-negative and no greater than MAX_INT32.
    """
    tmp_prefix = "merge-coocc-entry-test"
    with tempfile.TemporaryDirectory(prefix=tmp_prefix) as workdir:
        self.copy_models(models.COOCC, workdir, COPIES_NUMBER)
        # NOTE(review): False presumably keeps the Spark code path enabled
        # (per the test name) -- confirm against get_args.
        merge_args = get_args(workdir, False)

        # Rewrite the first input so its first stored value is near the
        # int32 ceiling.
        first_input = merge_args.input[0]
        inflated = Cooccurrences().load(first_input)
        first_value = inflated.matrix.data[0]
        inflated.matrix.data[0] = MAX_INT32 - first_value
        inflated.save(first_input)

        merge_coocc(merge_args)

        merged = Cooccurrences().load(merge_args.output)
        within_upper_bound = numpy.all(merged.matrix.data <= MAX_INT32)
        self.assertTrue(within_upper_bound)
        # A negative entry would mean a value wrapped around.
        non_negative = numpy.all(merged.matrix.data >= 0)
        self.assertTrue(non_negative)