Example #1
0
 def test_match_case_regexp(self):
     rule_list = ['/com.*FooBar/$match-case']
     rules = AdblockRules(rule_list)
     match_not = rules.match('http://example.com/foobarqux', 'example.org')
     match = rules.match('http://example.com/FooBarqux', 'example.org')
     self.assertFalse(match_not.is_match)
     self.assertTrue(match.is_match)
Example #2
0
 def test_rule_fix_start(self):
     rule_list = ['|javascript:*window.location$popup']
     rules = AdblockRules(rule_list)
     self.assertTrue(
         rules.match('javascript:foo;window.location=bar').is_match)
     self.assertFalse(
         rules.match('script=javascript:foo;window.location=bar').is_match)
Example #3
0
 def _test_load_easylist(self, cache_file):
     rules = AdblockRules(rule_files=[EASYLIST_PATH], cache_file=cache_file)
     urls = [
         'https://imagesrv.adition.com/banners/268/00/86/70/52/images/konfetti.png',
         'https://match.adsrvr.org/track/cmf/generic?ttd_pid=theadex&ttd_puid=1001718401132270252&ttd_tpi=1',
         'https://s.hs-data.com/comon/prj/isdc/v3/default/static/js/lib/hammer.min.js',
         'https://ih.adscale.de/map?ssl=1&format=video',
     ]
     is_matches = [
         rules.match(url, 'www.example.com').is_match for url in urls
     ]
     is_matches_expected = [True, True, False, True]
     self.assertEqual(is_matches, is_matches_expected)
Example #4
0
 def test_domain_option_parsing(self):
     rules = AdblockRules(
         ['ads$domain=example.com|~example.org|example.net'])
     options = rules.rules[0].options
     self.assertEqual(['example.com', 'example.net'],
                      options.include_domains)
     self.assertEqual(['example.org'], options.exclude_domains)
Example #5
0
 def test_ignore_cosmetic(self):
     rule_list = [
         '###ad-lead',
         'cnet.com#@##adboard',
     ]
     rules = AdblockRules(rule_list)
     self.assertEqual(len(rules.rules), 0)
Example #6
0
 def test_comment_rule(self):
     rule_list = [
         '! Some Comment',
         '',
         '/some/rule',
     ]
     rules = AdblockRules(rule_list)
     self.assertEqual(len(rules.rules), 1)
Example #7
0
 def test_rule_formatting(self):
     rule_list = [
         '||adzbazar.com^$script,third-party,domain=example.com|example.org',
         '/adblock/$script,~third-party,domain=example.com|~example.org',
         '/|ads/', 'adbanner.png|'
     ]
     rules = AdblockRules(rule_list)
     for rule in rules.rules:
         self.assertEqual(rule_list[rule.origin.line_no - 1], str(rule))
Example #8
0
 def test_rule_options(self):
     rules = AdblockRules(['foo$script,~stylesheet,domain=*'])
     rule = rules.rules[0]
     self.assertTrue(rule.options.has_included('script'))
     self.assertTrue(rule.options.has_excluded('stylesheet'))
     self.assertIsNone(rule.options.include_domains)
     with self.assertRaises(ValueError):
         rule.options.has_included('nonexistingoption')
     with self.assertRaises(ValueError):
         rule.options.has_excluded('nonexistingoption')
Example #9
0
 def test_rule_repr(self):
     rule_list = [
         '/banners/*$script,domain=example.com',
         r'/ttd_puid=\d+/',
         '||adscale.de',
     ]
     rules = AdblockRules(rule_list)
     rule_reprs = {rule.origin.line_no: repr(rule) for rule in rules.rules}
     self.assertEqual(
         "SubstringRule<'/banners/*$script,domain=example.com'>",
         rule_reprs[1])
     self.assertEqual("RegexpRule<'/ttd_puid=\\\\d+/'>", rule_reprs[2])
     self.assertEqual("DomainRule<'||adscale.de'>", rule_reprs[3])
Example #10
0
 def test_domain_rule_with_path(self):
     rule_list = ['||adzbazar.com^*.js', '||example.com/banner/*.png']
     rules = AdblockRules(rule_list)
     self.assertFalse(rules.match('http://adzbazar.com/').is_match)
     self.assertTrue(
         rules.match('http://adzbazar.com/static/foo.js').is_match)
     self.assertFalse(
         rules.match('http://example.com/no/banner/1.png').is_match)
     self.assertTrue(
         rules.match('http://example.com/banner/1.png').is_match)
Example #11
0
 def test_match_slow_match_fast(self):
     urls = [
         'https://imagesrv.adition.com/banners/268/00/86/70/52/images/konfetti.png',
         'https://match.adsrvr.org/track/cmf/generic?ttd_pid=theadex&ttd_puid=1001718401132270252&ttd_tpi=1',
         'https://s.hs-data.com/comon/prj/isdc/v3/default/static/js/lib/hammer.min.js',
         'https://ih.adscale.de/map?ssl=1&format=video',
     ]
     rules = AdblockRules([
         '/banners/*', '/ttd_puid=\\d+/', '||adscale.de^', 'hammer*',
         '@@https://$domain=hs-data.com'
     ])
     for url in urls:
         self.assertEqual(rules.match(url, 'www.example.com'),
                          rules.match_slow(url, 'www.example.com'))
         self.assertEqual(rules.match(url, 'hs-data.com'),
                          rules.match_slow(url, 'hs-data.com'))
Example #12
0
 def test_standard_rule(self):
     rule_list = ['/ads/*.jpg']
     rules = AdblockRules(rule_list)
Example #13
0
 def test_invalid_regexp(self):
     with self.assertRaises(RuleParsingError):
         AdblockRules(['/[/'])
     AdblockRules(['/[/'], skip_parsing_errors=True)
Example #14
0
 def test_rule_fix_end(self):
     rule_list = ['/ad.php|']
     rules = AdblockRules(rule_list)
     self.assertTrue(rules.match('foo/ad.php').is_match)
     self.assertFalse(rules.match('foo/ad.phps').is_match)
Example #15
0
 def test_domain_rule(self):
     rule_list = ['||adzbazar.com^$third-party']
     rules = AdblockRules(rule_list)
     self.assertTrue(rules.match('http://adzbazar.com/').is_match)
     self.assertTrue(rules.match('http://foo.adzbazar.com/').is_match)
     self.assertTrue(rules.match('http://foo.bar.adzbazar.com/').is_match)
Example #16
0
 def test_regexp_rule(self):
     rule_list = ['/\\.science\\/[0-9]{2,9}\\/$/$script,third-party,']
     rules = AdblockRules(rule_list)
     self.assertTrue(
         rules.match('https://marchfor.science/1337/',
                     origin='script').is_match)
Example #17
0
 def test_exception_rule(self):
     url = 'static/some/exception.jpg'
     rules = AdblockRules(['/some/*.jpg', '@@/some/exception.jpg'])
     self.assertFalse(rules.match(url).is_match)
Example #18
0
 def test_rule_list_cache_file_mutual_exclusive(self):
     with self.assertRaises(ValueError):
         AdblockRules(rule_list=['/some/rule.jpg'],
                      rule_files=['dummy.txt'],
                      cache_file='dummy.cache')
Example #19
0
 def test_rule_no_index(self):
     rules = AdblockRules(['/[Aa](d[bB]lock|ds)/'])
     self.assertTrue(
         rules.match('http://example.com/adBlock/1.png',
                     'example.com').is_match)
Example #20
0
 def test_domain_applicability(self):
     rules = AdblockRules([
         '/foo*$domain=example.com|example.org',
         '||^adscale.de$$domain=example.com|example.org',
         '/[a-f]{3,7}/$domain=example.com|example.org',
         '/foo*$domain=~example.net', '||^adscale.de$$domain=~example.org',
         '/[a-f]{3,7}/$domain=~example.net'
     ])
     self.assertTrue(
         rules.match('http://example.net/foobar', 'example.com').is_match)
     self.assertTrue(
         rules.match('http://example.net/foobar', 'example.org').is_match)
     self.assertFalse(
         rules.match('http://example.net/foobar', 'example.net').is_match)
     self.assertTrue(
         rules.match('http://foo.adscale.de/', 'example.com').is_match)
     self.assertTrue(
         rules.match('http://foo.adscale.de/', 'example.org').is_match)
     self.assertFalse(
         rules.match('http://foo.adscale.de/', 'example.net').is_match)
     self.assertTrue(
         rules.match('http://example.net/afbd', 'example.com').is_match)
     self.assertTrue(
         rules.match('http://example.net/afbd', 'example.org').is_match)
     self.assertFalse(
         rules.match('http://example.net/afbd', 'example.net').is_match)