예제 #1
0
    def run(self):
        """Fetch the ICP filing page for ``self.domain`` and format a report.

        The page at ``self.site + self.domain + '.html'`` is downloaded with
        ``http_requests_get`` (presumably returning the HTML as text -- the
        result is passed straight to ``re.findall``; confirm against the
        helper). Labelled table rows and the ``title`` attributes of links
        are scraped with regular expressions.

        Returns:
            A newline-separated string of ``label: value`` lines on success.
            If anything raises (request failure, a missing row, fewer than
            eight title matches, ...), the caught exception object itself is
            returned instead of a string.
        """
        print("[*]正在进行备案信息查询[*]")
        target = self.site + self.domain + '.html'
        # Every labelled row shares this markup after its caption text.
        value_suffix = '</div><div class="line-value">(.*?)</div></div><div'
        try:
            page = http_requests_get(url=target)  # issue the request

            def field(label):
                # All values captured for the row whose caption is `label`.
                return re.findall(label + value_suffix, page)

            org_nature = field('主办单位性质')
            site_icp = field('网站备案号')
            home_cell = field('首页网址')
            # The homepage cell wraps the URL in an anchor; keep the link text.
            home_links = re.findall('">(.*?)</a><br>', home_cell[0])

            filed_domain = field('备案域名')
            audit_time = field('审核时间')
            updated_at = field('数据更新于')

            # Organisation name, organisation filing number and site name are
            # read from the 6th-8th link titles found on the page.
            titles = re.findall('html" title="(.*?)">', page)
            print('备案信息查询完成')
            report = [
                "主办单位性质: " + str(org_nature[0]),
                "主办单位名称: " + titles[5],
                "主办单位备案号: " + titles[6],
                "网站名称: " + titles[7],
                "网站备案号: " + str(site_icp[0]),
                "首页网址: " + str(home_links[0]),
                "备案域名: " + str(filed_domain[0]),
                "审核时间: " + str(audit_time[0]),
                "数据更新于: " + str(updated_at[0]),
            ]
            return '\n'.join(report)
        except Exception as err:
            # Callers receive the exception object rather than a raise.
            return err
예제 #2
0
 def run(self):
     """Scrape domain names for ``self.domain`` from an HTML table page.

     Requests ``self.site + self.domain``, extracts the text of the table
     cell matched by the pattern below from the response's ``.text``, and
     appends every value accepted by ``is_domain`` to ``self.result``.

     Returns:
         A de-duplicated list of the collected domains. If any step raises,
         ``self.result`` is returned as-is (best effort, not de-duplicated).
     """
     url = self.site + self.domain
     try:
         r = http_requests_get(url=url)
         # re.S lets `.` span newlines; the literal newlines and spaces in
         # the pattern mirror the page's table layout.
         results = re.findall('</TD>\n    <TD>(.*?)</TD>\n    <TD><A',
                              r.text, re.S)
         for result in results:
             if is_domain(result):
                 self.result.append(result)
         return list(set(self.result))
     except Exception:
         # `except Exception, e` is Python-2-only syntax (a SyntaxError on
         # Python 3); the bound name was unused, so it is dropped entirely.
         return self.result
예제 #3
0
파일: ip138.py 프로젝트: op-hxc0/InfoScan
 def run(self):
     """Collect domains listed for ``self.domain`` on the ip138 lookup page.

     Requests ``self.site + self.domain + "/domain.htm"``, extracts the text
     of links matched by the pattern below, and appends every value accepted
     by ``is_domain`` to ``self.result``.

     Returns:
         A de-duplicated list of the collected domains. If any step raises,
         ``self.result`` is returned as-is (best effort).
     """
     print("[*]正在通过ip138查询域名[*]")
     url = self.site + self.domain + "/domain.htm"
     try:
         res = http_requests_get(url=url)  # issue the request
         # Raw string: the pattern text is unchanged, but `\>` / `\<` are no
         # longer invalid string escapes (a SyntaxWarning on Python 3.12+).
         r1 = re.findall(r'target="_blank"\>(.*?)\</a\>\</p\>', res)
         for result in r1:
             if is_domain(result):  # keep only values that look like domains
                 self.result.append(result)
         print_try("ip138查询完成,共" + str(len(self.result)) + "个域名")
         return list(set(self.result))  # de-duplicate
     except Exception:
         return self.result
예제 #4
0
 def run(self):
     """Collect domains listed for ``self.domain`` on the yumingco page.

     Requests ``self.site + self.domain``, captures the text between
     ``main:`` and the last ``<br>`` on each matching line, splits the joined
     captures on ``<br>``, and appends every piece accepted by ``is_domain``
     to ``self.result``.

     Returns:
         A de-duplicated list of the collected domains. If any step raises,
         ``self.result`` is returned as-is (best effort).
     """
     print("[*]正在通过yumingco查询域名[*]")
     url = self.site + self.domain
     try:
         res = http_requests_get(url=url)  # issue the request
         # Raw strings: the pattern text is unchanged, but `\<` / `\>` are no
         # longer invalid string escapes (a SyntaxWarning on Python 3.12+).
         r1 = re.findall(r'main:(.*)\<br\>', res)
         # NOTE(review): the greedy capture above stops before the final
         # <br>, so the last piece of each capture has no trailing <br> and
         # is not matched here -- confirm against the real page layout.
         r = re.findall(r'(.*?)\<br\>', "".join(r1))
         for result in r:
             if is_domain(result):  # keep only values that look like domains
                 self.result.append(result)
         print_try("yumingco查询完成,共" + str(len(self.result)) + "个域名")
         return list(set(self.result))  # de-duplicate
     except Exception:
         return self.result
예제 #5
0
 def run(self):
     """Harvest subdomains of ``self.domain`` from Bing ``site:`` searches.

     Result pages are requested for page numbers ``1 .. self.pages - 1``
     (the ``first`` offset advances by 10 per page). On each page, the text
     between ``<cite>`` and ``<strong>{domain}</strong>`` is taken as the
     host prefix, any ``https://`` is stripped from it, and
     ``prefix + self.domain`` is appended to ``self.result``.

     Returns:
         A de-duplicated list of everything in ``self.result``.
     """
     # Escape the domain so its dots only match literal dots.
     retext = '<cite>(.*?)<strong>' + re.escape(self.domain) + '</strong>'
     for page_no in range(1, self.pages):
         first = (page_no - 1) * 10
         # Use self.domain: the bare name `domain` is not defined in this
         # method and would raise NameError unless a global happened to exist.
         url = 'http://cn.bing.com/search?q=site:{}&first={}'.format(
             self.domain, first)
         res = http_requests_get(url=url)
         # NOTE(review): if the helper returns a requests.Response on
         # Python 3, `.content` is bytes and a str pattern raises TypeError;
         # `.text` would be needed -- confirm against http_requests_get.
         for prefix in re.findall(retext, res.content):
             # replace() is a no-op when the scheme is absent, so one path
             # covers both of the original (identical) branches.
             prefix = prefix.replace('https://', '')
             self.result.append(prefix + self.domain)
     return list(set(self.result))
예제 #6
0
 def run(self):
     """Harvest subdomains of ``self.domain`` from Baidu ``site:`` searches.

     Result pages are requested for page numbers ``1 .. self.pages - 1``
     (the ``pn`` offset advances by 10 per page). On each page, the text
     between ``:none;">`` and ``.{domain}`` is taken as the host prefix, any
     ``https://`` is stripped from it, and ``prefix + '.' + self.domain`` is
     appended to ``self.result``.

     Returns:
         A de-duplicated list of everything in ``self.result``.
     """
     # Escape the separator dot and the domain so they match literally; an
     # unescaped `.` also matched `/`, yielding junk such as "https:/.<domain>".
     retext = r':none;">(.*?)\.' + re.escape(self.domain)
     for page_no in range(1, self.pages):
         offset = (page_no - 1) * 10
         # Use self.domain: the bare name `domain` is not defined in this
         # method and would raise NameError unless a global happened to exist.
         url = 'http://www.baidu.com/s?wd=site:{}&pn={}'.format(
             self.domain, offset)
         res = http_requests_get(url=url)
         # NOTE(review): if the helper returns a requests.Response on
         # Python 3, `.content` is bytes and a str pattern raises TypeError;
         # `.text` would be needed -- confirm against http_requests_get.
         for prefix in re.findall(retext, res.content):
             # replace() is a no-op when the scheme is absent, so one path
             # covers both of the original (identical) branches.
             prefix = prefix.replace('https://', '')
             self.result.append(prefix + '.' + self.domain)
     return list(set(self.result))