예제 #1
0
def test_check_mostly_same_bad1_ser():
    """Series input: 'b1' of bad_same2 must be flagged by the mostly same check.

    The expected report is a single row with mostly_same=True, the 0.7
    threshold in 'thresh', and a mean of 0.75.
    """
    expected_columns = {
        'mostly_same': (True,),
        'thresh': (0.7,),
        'mean': (0.75,),
    }
    expected = pd.DataFrame.from_dict(expected_columns)
    report = bf.check_mostly_same(bad_same2['b1'], 0.7)
    # the report has to match the expected frame exactly
    assert expected.equals(report)
예제 #2
0
def test_check_mostly_same_bad1_df():
    """DataFrame input: only 'b1' of bad_same2 must be flagged as mostly the same.

    The expected report has one row per column ('b1', 'b2'), the 0.7
    threshold in 'thresh', and means of 0.75 and 0.5 respectively.
    """
    expected_columns = {
        'column': ('b1', 'b2'),
        'mostly_same': (True, False),
        'thresh': (0.7, 0.7),
        'mean': (0.75, 0.5),
    }
    expected = pd.DataFrame.from_dict(expected_columns)
    report = bf.check_mostly_same(bad_same2, 0.7)
    # the report has to match the expected frame exactly
    assert expected.equals(report)
예제 #3
0
def test_check_all_same_good_ser():
    """Series input: 'g1' of good must not be flagged by the all same check."""
    report = bf.check_all_same(good['g1'])
    flags = report.loc[:, 'all_same']
    # no entry of the 'all_same' column may be truthy
    assert not flags.any()
예제 #4
0
def test_validate_dtype_bad_float_ser():
    """Series input: validating 'b1' of bad_type2 must raise a TypeError.

    Per the test name, the series is meant to hold float data. The error
    message must mention the accepted dtypes.
    """
    expected_fragment = 'should be of type bool or int64'
    with pytest.raises(TypeError) as raised:
        bf._validate_binary_dtype(bad_type2['b1'])
    # the message check runs only after the TypeError has been captured
    message = str(raised.value)
    assert expected_fragment in message
예제 #5
0
def test_validate_dtype_bad_str_df():
    """DataFrame input: validating bad_type1 must raise a TypeError.

    Per the test name, the frame is meant to hold object (str) data. The
    error message must mention the accepted dtypes.
    """
    expected_fragment = 'should be of type bool or int64'
    with pytest.raises(TypeError) as raised:
        bf._validate_binary_dtype(bad_type1)
    # the message check runs only after the TypeError has been captured
    message = str(raised.value)
    assert expected_fragment in message
예제 #6
0
def test_validate_dtype_good_ser():
    """Series input: validating 'g1' of good must complete without raising."""
    good_series = good['g1']
    # there is no assertion: the test passes as long as nothing is raised
    bf._validate_binary_dtype(good_series)
예제 #7
0
def test_check_range_bad2_ser():
    """Series input: 'b1' of bad_range2 must be reported as outside the range."""
    expected_columns = {'outside_range': (True,)}
    expected = pd.DataFrame.from_dict(expected_columns)
    report = bf.check_outside_range(bad_range2['b1'])
    # the report has to match the expected single-row frame exactly
    assert expected.equals(report)
예제 #8
0
def test_check_range_bad2_df():
    """DataFrame input: only 'b1' of bad_range2 must be reported as outside the range."""
    expected_columns = {
        'column': ('b1', 'b2'),
        'outside_range': (True, False),
    }
    expected = pd.DataFrame.from_dict(expected_columns)
    report = bf.check_outside_range(bad_range2)
    # the report has to match the expected per-column frame exactly
    assert expected.equals(report)
예제 #9
0
def test_check_range_good_ser():
    """Series input: 'g1' of good must not be reported as outside the range."""
    report = bf.check_outside_range(good['g1'])
    flags = report.loc[:, 'outside_range']
    # no entry of the 'outside_range' column may be truthy
    assert not flags.any()
예제 #10
0
def test_check_outside_range_good_df():
    """DataFrame input: no column of good may be reported as outside the range."""
    report = bf.check_outside_range(good)
    flags = report.loc[:, 'outside_range']
    # reduce over the rows of the report; any truthy flag fails the test
    assert not flags.any(axis=0)
예제 #11
0
def test_check_mostly_same_good_ser():
    """Series input: 'g1' of good must not be flagged by the mostly same check."""
    report = bf.check_mostly_same(good['g1'])
    flags = report.loc[:, 'mostly_same']
    # no entry of the 'mostly_same' column may be truthy
    assert not flags.any()
예제 #12
0
def test_check_mostly_same_good_df():
    """DataFrame input: no column of good may be flagged by the mostly same check."""
    report = bf.check_mostly_same(good)
    flags = report.loc[:, 'mostly_same']
    # reduce over the rows of the report; any truthy flag fails the test
    assert not flags.any(axis=0)
예제 #13
0
def test_check_all_same_bad_ser():
    """Series input: 'b1' of bad_same1 must be flagged by the all same check."""
    expected_columns = {'all_same': (True,)}
    expected = pd.DataFrame.from_dict(expected_columns)
    report = bf.check_all_same(bad_same1['b1'])
    # the report has to match the expected single-row frame exactly
    assert expected.equals(report)
예제 #14
0
def test_check_all_same_bad_df():
    """DataFrame input: only 'b1' of bad_same1 must be flagged by the all same check."""
    expected_columns = {
        'column': ('b1', 'b2'),
        'all_same': (True, False),
    }
    expected = pd.DataFrame.from_dict(expected_columns)
    report = bf.check_all_same(bad_same1)
    # the report has to match the expected per-column frame exactly
    assert expected.equals(report)