示例#1
0
    def __init__(self, mail_file):
        """Set up the classifier state and populate the training module.

        Args:
            mail_file: The mail to examine; stored unchanged on the instance.
                NOTE(review): whether this is a path or a file object is not
                visible from here -- confirm against the caller.
        """
        self.mail_file = mail_file

        # Keep a local handle so the same instance is configured and then
        # asked to build its word-frequency dictionary below.
        trainer = TrainModule()
        self.train_module = trainer

        # P_SPAM and P_NORMAL are complementary and always sum to 1.
        # Presumably these are the prior probabilities of the two classes
        # -- TODO confirm against the code that consumes them.
        spam_prior = 0.5
        self.P_SPAM, self.P_NORMAL = spam_prior, 1 - spam_prior

        # NOTE(review): looks like a fallback per-word spam probability and
        # the cut-off above which a mail is reported as spam -- confirm.
        self.P_SPAM_WORD = 0.4
        self.P_IS_SPAM_LIMIT = 0.9

        trainer.set_dic_word_freq()
示例#2
0
	def __init__(self, mail_file, is_given_mail=False):
		"""Record the mail to classify, set the constants and train the model.

		Args:
			mail_file: Path of the mail file; stored as ``self.mail_content``.
			is_given_mail: Flag stored unchanged on the instance.
				NOTE(review): presumably marks that ``mail_file`` already
				holds the mail itself rather than a path -- confirm against
				the methods that read it.
		"""
		self.mail_content = mail_file  # mail file path
		self.is_given_mail = is_given_mail

		# Keep a local handle so the same instance is stored and trained.
		trainer = TrainModule()
		self.train_module = trainer

		# Prior probability of spam is 0.5; the non-spam prior is its
		# complement.
		spam_prior = 0.5
		self.P_SPAM, self.P_NORMAL = spam_prior, 1 - spam_prior

		# For a word that does not appear in the model, p(s|w) is set to 0.4.
		self.P_SPAM_WORD = 0.4

		# Decision threshold.
		self.P_IS_SPAM_LIMIT = 0.9

		# Start training the model.
		trainer.set_dic_word_freq()