def test_HPV_data():
    """Sanity-check the ``HPV_data`` table.

    Verifies that the index has no duplicates, that the frame has the
    expected shape, that the index entries add up to a known checksum, and
    that every index entry passes ``check_CAS`` after ``int_to_CAS``
    conversion.
    """
    index = HPV_data.index
    assert index.is_unique
    assert HPV_data.shape == (5067, 0)

    # Checksum over the integer index guards against silent data changes.
    index_values = list(index)
    assert sum(index_values) == 176952023632

    # Stops at the first entry that fails validation.
    assert all(check_CAS(int_to_CAS(entry)) for entry in index)
def test_TSCA_data():
    """Sanity-check the ``TSCA_data`` table.

    Verifies the per-column sums against known totals, that the index has
    no duplicates, that the frame has the expected shape, and that every
    index entry passes ``check_CAS`` after ``int_to_CAS`` conversion.
    """
    # (column name, expected column sum) pairs, in the order they are checked.
    expected_by_column = (
        ('UV', 16829),
        ('E', 271),
        ('F', 3),
        ('N', 713),
        ('P', 8371),
        ('S', 1173),
        ('R', 13),
        ('T', 151),
        ('XU', 19035),
        ('SP', 74),
        ('TP', 50),
        ('Y1', 352),
        ('Y2', 9),
    )
    computed_totals = [TSCA_data[column].sum() for column, _ in expected_by_column]
    expected_totals = [total for _, total in expected_by_column]
    assert computed_totals == expected_totals

    assert TSCA_data.index.is_unique
    assert TSCA_data.shape == (67635, 13)

    # Validate every index entry before asserting on the combined result.
    validity = [check_CAS(int_to_CAS(entry)) for entry in TSCA_data.index]
    assert all(validity)
def test_NLP_data():
    """Sanity-check the ``NLP_data`` table.

    Verifies that the index has no duplicates, that the frame has the
    expected shape, that the index entries add up to a known checksum, and
    that every index entry passes ``check_CAS`` after ``int_to_CAS``
    conversion.
    """
    index = NLP_data.index
    assert index.is_unique
    assert NLP_data.shape == (698, 0)

    # Checksum over the integer index guards against silent data changes.
    index_values = list(index)
    assert sum(index_values) == 83268755392

    # Validate every index entry before asserting on the combined result.
    validity = [check_CAS(int_to_CAS(entry)) for entry in index]
    assert all(validity)
def test_SPIN_data():
    """Sanity-check the ``SPIN_data`` table.

    Verifies that the index has no duplicates, that the frame has the
    expected shape, that the index entries add up to a known checksum, and
    that every index entry passes ``check_CAS`` after ``int_to_CAS``
    conversion.
    """
    index = SPIN_data.index
    assert index.is_unique
    assert SPIN_data.shape == (26023, 0)

    # Checksum over the integer index guards against silent data changes.
    index_values = list(index)
    assert sum(index_values) == 1666688770043

    # Validate every index entry before asserting on the combined result.
    validity = [check_CAS(int_to_CAS(entry)) for entry in index]
    assert all(validity)
def test_EINECS_data():
    """Sanity-check the ``EINECS_data`` table.

    Verifies that the index has no duplicates, that the frame has the
    expected shape, that the index entries add up to a known checksum, and
    that every index entry passes ``check_CAS`` after ``int_to_CAS``
    conversion.
    """
    index = EINECS_data.index
    assert index.is_unique
    assert EINECS_data.shape == (100203, 0)

    # Checksum over the integer index guards against silent data changes.
    index_values = list(index)
    assert sum(index_values) == 4497611272838

    # Validate every index entry before asserting on the combined result.
    validity = [check_CAS(int_to_CAS(entry)) for entry in index]
    assert all(validity)
def test_DSL_data():
    """Sanity-check the ``DSL_data`` table.

    Verifies that the index has no duplicates, that the ``Registry`` column
    sums to a known total, that the frame has the expected shape, and that
    every index entry passes ``check_CAS`` after ``int_to_CAS`` conversion.
    """
    index = DSL_data.index
    assert index.is_unique

    registry_total = DSL_data['Registry'].sum()
    assert registry_total == 48363

    assert DSL_data.shape == (73036, 1)

    # Validate every index entry before asserting on the combined result.
    validity = [check_CAS(int_to_CAS(entry)) for entry in index]
    assert all(validity)