Example #1
0
def show_examples():
    """Print a walkthrough of the Censor API for Russian and English text.

    For each language the function obtains a censor via ``Censor.get``,
    checks a sample line with ``check_line``, and cleans it with
    ``clean_line``. The English part additionally demonstrates a bad
    *phrase* and cleaning of an HTML fragment with ``clean_html_line``.
    Everything is reported with ``print``; nothing is returned.
    """
    # Replacement text handed to every clean_* call below.
    beep = '[censored]'

    print('Russian examples:')
    # don't specify do_compile=False unless you want to debug something
    # and see bad words raw (not compiled) patterns
    censor_ru = Censor.get(lang='ru', do_compile=False)
    line = 'ебанамат бляд'
    print('Checking line: "{}"'.format(line))
    line_info = censor_ru.check_line(line)
    # 'is_good' is negated so the printed answer matches the question asked.
    print('Does the line contain obscene words? - {}'.format(not line_info['is_good']))
    print('First bad word: {}, bad word pattern: {}'.format(
        line_info['bad_word_info']['word'], line_info['bad_word_info']['accuse'][0]))

    # The message has a single placeholder for the beep word; pass only
    # `beep` so the checked line is not printed in its place.
    print('Cleaning line with beep word={}'.format(beep))
    cleaned_line, bad_words_count, bad_phrases_count = censor_ru.clean_line(line, beep=beep)
    print('resulted cleaned line: "{}", bad words count: {}, bad phrases count: {}'.format(
        cleaned_line, bad_words_count, bad_phrases_count))
    print('\n')

    print('English examples:')
    # don't specify do_compile=False unless you want to debug something
    # and see bad words raw (not compiled) patterns
    censor_en = Censor.get(lang='en', do_compile=False)
    line = 'fucken shit'
    line_info = censor_en.check_line(line)
    print('Does the line contain obscene words? - {}'.format(not line_info['is_good']))
    print('First bad word: {}, bad word pattern: {}'.format(
        line_info['bad_word_info']['word'], line_info['bad_word_info']['accuse'][0]))

    print('cleaning line: {} with beep word={}'.format(line, beep))
    cleaned_line, bad_words_count, bad_phrases_count = censor_en.clean_line(line, beep=beep)
    print('Resulted cleaned line: "{}", bad words count: {}, bad phrases count: {}'.format(
        cleaned_line, bad_words_count, bad_phrases_count))

    print('\n')
    line = 'camel toe towel'
    print('English bad phrase line example: "{}"'.format(line))
    line_info = censor_en.check_line(line)
    print('Does the line contain obscene words/phrases? - {}'.format(not line_info['is_good']))

    # For this phrase example the pattern is read from the top-level
    # 'accuse' entry rather than from 'bad_word_info'.
    print('First accuse pattern: {}'.format(
        line_info['accuse'][0]))

    print('Cleaning bad phrases line with beep word={}'.format(beep))
    cleaned_line, bad_words_count, bad_phrases_count = censor_en.clean_line(line, beep=beep)
    print('Resulted cleaned line: "{}", bad words count: {}, bad phrases count: {}'.format(
        cleaned_line, bad_words_count, bad_phrases_count))

    html_line = '<b><span>bitch</i> w***e</b>fu<div>ck</li>'
    print('\n')
    print('Cleaning english html line containing bad words: "{}"'.format(html_line))
    # note: no phrases are cleaned atm in html
    # clean_html_line is unpacked into two values (no phrase count).
    cleaned_line, bad_words_count = censor_en.clean_html_line(
        html_line, beep=beep)
    print('Resulted cleaned html line: "{}", bad words count: {}'.format(
        cleaned_line, bad_words_count))
Example #2
0
 def setUpClass(cls):
     """Attach the fixtures used by this class to ``cls``.

     ``cls.censor`` receives the English censor obtained from
     ``Censor.get`` with ``do_compile=False``; ``cls.data`` receives the
     imported ``censure.tests.en.data`` module.
     """
     english_censor = Censor.get(lang='en', do_compile=False)
     cls.censor = english_censor
     data_module = import_module('censure.tests.en.data')
     cls.data = data_module
Example #3
0
 def __init__(self, lang='ru', do_compile=None):
     """Store the language and obtain the matching censor.

     :param lang: language code passed on to ``Censor.get``.
     :param do_compile: forwarded to ``Censor.get``; when ``None`` the
         value of ``self.do_compile`` is used instead.
     """
     # Fall back to the attribute only when the caller passed nothing.
     compile_flag = self.do_compile if do_compile is None else do_compile
     self.lang = lang
     self.c = Censor.get(lang=lang, do_compile=compile_flag)