Exemplo n.º 1
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(
         ur'^http://\w+\.ganji\.com(|/|/fang1/?|/fang1/\d+x\.htm|/fang1/tuiguang[-]\d+.htm|/fang1/f\d+/?)$',
         re.U | re.I)
     self.arch_pattern = re.compile(
         ur'[房户](\s|&nbsp;)*型[^::]*[::]([^\d]*)(\d[^<>\s]+)[\s<]',
         re.U | re.I)
Exemplo n.º 2
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(ur'^http://[\w\d\.]+\.soufun\.com(|/|/house/?|/chuzu/[\d_]+\.htm)$', re.U | re.I)
Exemplo n.º 3
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(ur'http://\w+\.58\.com/zufang/(pn\d+/?|\d+x.shtml)?$', re.U | re.I)
Exemplo n.º 4
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(
         ur'^http://[\w\d\.]+\.soufun\.com(|/|/house/?|/chuzu/[\d_]+\.htm)$',
         re.U | re.I)
Exemplo n.º 5
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(ur'^http://\w+\.ganji\.com(|/|/fang1/?|/fang1/\d+x\.htm|/fang1/tuiguang[-]\d+.htm|/fang1/f\d+/?)$', re.U | re.I)
     self.arch_pattern = re.compile(ur'[房户](\s|&nbsp;)*型[^::]*[::]([^\d]*)(\d[^<>\s]+)[\s<]', re.U | re.I)
Exemplo n.º 6
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(
         ur'^http://\w+.anjuke.com/(rental/(p\d+)?|prop/rent/\d+)/?$')
Exemplo n.º 7
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(ur'http://\w+\.haozu\.com/(listing/(p%d+)?|rental/broker/n/\d+)?/?$')
Exemplo n.º 8
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(
         ur'http://\w+\.haozu\.com/(listing/(p%d+)?|rental/broker/n/\d+)?/?$'
     )
Exemplo n.º 9
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(ur'^http://\w+.anjuke.com/(rental/(p\d+)?|prop/rent/\d+)/?$')
Exemplo n.º 10
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(ur'^(http://\w+\.zufang\.sina\.com\.cn(|/|/detail/\d+/?|/house/(n\d+)?/?)|http://\w+\.esf\.sina\.com\.cn/?)$', re.U | re.I)
Exemplo n.º 11
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.arch_pattern = re.compile(ur'[房户](\s|&nbsp;)*型[^::]*[::]\s*(<b>)(\d[^<\s]+)[<\s]', re.U | re.I)
     self.url_pattern = re.compile(ur'^http://\w+\.esf\.focus\.cn(|/|/zufang/?|/zufang/\d+\.html|/zufang/zj0m0h0jz0zx0zlfs0bq0fbr0p\d+px0t0jd0bx0pic0q0b0xl0zd0xq0st1s0tx1/?)$', re.U | re.I)
Exemplo n.º 12
0
 def __init__(self, root, charset):
     Robot.__init__(self, root, charset)
     self.url_pattern = re.compile(
         ur'^(http://\w+\.zufang\.sina\.com\.cn(|/|/detail/\d+/?|/house/(n\d+)?/?)|http://\w+\.esf\.sina\.com\.cn/?)$',
         re.U | re.I)