def __init__(self, mail_file):
    """Record the mail file and prepare the training module.

    Creates a ``TrainModule`` instance, sets the probability constants
    used by this object, and finally calls
    ``TrainModule.set_dic_word_freq()`` on the new module.

    Args:
        mail_file: Stored unchanged on ``self.mail_file``.
            NOTE(review): presumably a path to the mail to classify --
            confirm against the callers.
    """
    self.mail_file = mail_file
    self.train_module = TrainModule()

    # NOTE(review): the meanings below are inferred from the attribute
    # names only -- confirm against the code that reads them.
    self.P_SPAM = 0.5  # presumably the prior probability of spam
    self.P_NORMAL = 1 - self.P_SPAM  # complement of P_SPAM
    self.P_SPAM_WORD = 0.4  # presumably a per-word default probability
    self.P_IS_SPAM_LIMIT = 0.9  # presumably the spam decision threshold

    # Must run after train_module has been created above.
    self.train_module.set_dic_word_freq()
def __init__(self, mail_file, is_given_mail=False):
    """Record the mail input and train the word-frequency model.

    Creates a ``TrainModule`` instance, sets the probability constants
    used for classification, and calls
    ``TrainModule.set_dic_word_freq()`` to start training the model.

    Args:
        mail_file: Stored unchanged on ``self.mail_content``. The
            original comment describes it as the mail file path.
            NOTE(review): the attribute name suggests it may hold the
            raw mail text when ``is_given_mail`` is true -- confirm
            against the callers.
        is_given_mail: Stored unchanged on ``self.is_given_mail``.
            Defaults to ``False``.
    """
    # Each statement sits on its own line so that an inline comment can
    # no longer swallow the statements that follow it.
    self.mail_content = mail_file  # mail file path
    self.is_given_mail = is_given_mail
    self.train_module = TrainModule()

    self.P_SPAM = 0.5  # prior probability is 0.5
    self.P_NORMAL = 1 - self.P_SPAM
    # Word does not appear in the model: p(s|w) is set to 0.4.
    self.P_SPAM_WORD = 0.4
    self.P_IS_SPAM_LIMIT = 0.9  # decision threshold

    # Start training the model; requires train_module created above.
    self.train_module.set_dic_word_freq()