Esempio n. 1
0
 def get_firstpage(self):
     """Issue the "URL 1" request for the current page and return its body.

     Sets ``self.body['pre_page']`` to ``self.body['page'] - 1`` (so
     ``self.body['page']`` must be numeric), appends the URL-encoded
     ``self.body`` to ``self.get_url()``, prints the resulting URL and
     fetches it.  The JSON dump of ``Lweibo.jiexi(text)`` is written via
     ``self.writefile`` to ``<outputFolder>/page<page>-json1.txt``.

     Returns:
         The raw response body exactly as read from the server.

     Any error raised by ``urllib2.urlopen`` or ``read`` propagates to the
     caller; the response is closed either way.
     """
     self.body['pre_page'] = self.body['page'] - 1
     url = self.get_url() + urllib.urlencode(self.body)
     print('URL 1:' + str(url))
     print('')

     response = urllib2.urlopen(urllib2.Request(url))
     try:
         text = response.read()
     finally:
         # urllib2 responses are not context managers in Python 2, so the
         # connection has to be released explicitly.
         response.close()

     json_path = (self.outputFolder + '/page' + str(self.body['page']) +
                  '-json1.txt')
     self.writefile(json_path, json.dumps(Lweibo.jiexi(text)))
     return text
Esempio n. 2
0
    def get_secondpage(self):
        """Issue the "URL 2" request for the current page and return its body.

        Updates ``self.body`` in place (``count='15'``, ``pagebar='0'``,
        ``pre_page`` equal to the current ``page``), appends the URL-encoded
        ``self.body`` to ``self.get_url()``, prints the resulting URL and
        fetches it.  The JSON dump of ``Lweibo.jiexi(text)`` is written via
        ``self.writefile`` to ``<outputFolder>/page<page>-json2.txt``.

        Returns:
            The raw response body exactly as read from the server.

        Any error raised by ``urllib2.urlopen`` or ``read`` propagates to the
        caller; the response is closed either way.
        """
        # 'end_id' and 'max_id' are not set here (earlier hard-coded values
        # for them were disabled).
        self.body['count'] = '15'
        self.body['pagebar'] = '0'
        self.body['pre_page'] = self.body['page']

        url = self.get_url() + urllib.urlencode(self.body)
        print('URL 2:' + str(url))
        print('')

        response = urllib2.urlopen(urllib2.Request(url))
        try:
            text = response.read()
        finally:
            # urllib2 responses are not context managers in Python 2, so the
            # connection has to be released explicitly.
            response.close()

        json_path = (self.outputFolder + '/page' + str(self.body['page']) +
                     '-json2.txt')
        self.writefile(json_path, json.dumps(Lweibo.jiexi(text)))
        return text
Esempio n. 3
0
    def get_thirdpage(self):
        """Issue the "URL 3" request for the current page and return its body.

        Updates ``self.body`` in place (``count='15'``, ``pagebar='1'``,
        ``pre_page`` equal to the current ``page``), appends the URL-encoded
        ``self.body`` to ``self.get_url()``, prints the resulting URL and
        fetches it.  The JSON dump of ``Lweibo.jiexi(text)`` is written via
        ``self.writefile`` to ``<outputFolder>/page<page>-json3.txt``.

        Returns:
            The raw response body exactly as read from the server.

        Any error raised by ``urllib2.urlopen`` or ``read`` propagates to the
        caller; the response is closed either way.
        """
        self.body['count'] = '15'
        self.body['pagebar'] = '1'
        self.body['pre_page'] = self.body['page']

        url = self.get_url() + urllib.urlencode(self.body)
        print('URL 3:' + str(url))
        print('')

        response = urllib2.urlopen(urllib2.Request(url))
        try:
            text = response.read()
        finally:
            # urllib2 responses are not context managers in Python 2, so the
            # connection has to be released explicitly.
            response.close()

        json_path = (self.outputFolder + '/page' + str(self.body['page']) +
                     '-json3.txt')
        self.writefile(json_path, json.dumps(Lweibo.jiexi(text)))
        return text
Esempio n. 4
0
    def get_secondpage(self):
        """Issue the "URL 2" request for the current page and return its body.

        Updates ``self.body`` in place (``count='15'``, ``pagebar='0'``,
        ``pre_page`` equal to the current ``page``), appends the URL-encoded
        ``self.body`` to ``self.get_url()``, prints the resulting URL and
        fetches it.  The JSON dump of ``Lweibo.jiexi(text)`` is written via
        ``self.writefile`` to ``<outputFolder>/page<page>-json2.txt``.

        Returns:
            The raw response body exactly as read from the server.

        Any error raised by ``urllib2.urlopen`` or ``read`` propagates to the
        caller; the response is closed either way.
        """
        # 'end_id' and 'max_id' are not set here (earlier hard-coded values
        # for them were disabled).
        self.body['count'] = '15'
        self.body['pagebar'] = '0'
        self.body['pre_page'] = self.body['page']

        url = self.get_url() + urllib.urlencode(self.body)
        print('URL 2:' + str(url))
        print('')

        response = urllib2.urlopen(urllib2.Request(url))
        try:
            text = response.read()
        finally:
            # urllib2 responses are not context managers in Python 2, so the
            # connection has to be released explicitly.
            response.close()

        json_path = (self.outputFolder + '/page' + str(self.body['page']) +
                     '-json2.txt')
        self.writefile(json_path, json.dumps(Lweibo.jiexi(text)))
        return text