def similarity_sgs(sgd_results, data, color=True):
    """Build the pairwise overlap matrix of the subgroups in a result list.

    Args:
        sgd_results: Iterable of result entries. The subgroup is read from
            index 1 of each entry (presumably ``(quality, subgroup)``
            pairs -- TODO confirm against the caller).
        data: Dataset handed unchanged to ``ps.overlap`` for every pair.
        color: When true, apply a background gradient to the matrix for
            display instead of returning the plain frame.

    Returns:
        A ``pandas.DataFrame`` whose cell ``[i, j]`` holds
        ``ps.overlap(subgroups[i], subgroups[j], data)``; or, when
        ``color`` is true, the result of ``.style.background_gradient()``
        on that frame.
    """
    subgroups = [result[1] for result in sgd_results]

    # Every ordered pair is evaluated (including i == j and both (i, j) and
    # (j, i)); no symmetry of ps.overlap is assumed here.
    overlap_matrix = [
        [ps.overlap(row_sg, col_sg, data) for col_sg in subgroups]
        for row_sg in subgroups
    ]
    overlap_df = pd.DataFrame(overlap_matrix)

    if color:
        return overlap_df.style.background_gradient()
    return overlap_df
def overlaps_list(sg, list_of_sgs, data, similarity_level=0.9):
    """Return whether ``sg`` overlaps strongly with any subgroup in a list.

    Args:
        sg: The subgroup to compare.
        list_of_sgs: Iterable of subgroups to compare ``sg`` against.
        data: Dataset handed unchanged to ``ps.overlap``.
        similarity_level: Threshold the overlap must strictly exceed for
            two subgroups to count as overlapping.

    Returns:
        ``True`` if ``ps.overlap(sg, other, data)`` is greater than
        ``similarity_level`` for at least one ``other`` in ``list_of_sgs``;
        ``False`` otherwise, including when ``list_of_sgs`` is empty.
    """
    # any() short-circuits on the first match, so no further overlaps are
    # computed once one exceeds the threshold.
    return any(
        ps.overlap(sg, other_sg, data) > similarity_level
        for other_sg in list_of_sgs
    )