def get(self):
        MEMCACHE_KEY = "yw4ct7ntqzh93ioqaxif"
        path_info = self.request.path_info.split("/")
        debug("PATH_INFO = %s" % path_info)
        client = memcache.Client()
        LIMIT = 100

        if len(self.request.get("clear")) != 0:
            client.delete(MEMCACHE_KEY)

        template_values = {}
        template_values["all_raw_data"] = []

        old_key_list = client.get(MEMCACHE_KEY)
        if old_key_list is None:
            old_key_list = []
            query = Query(RawData, keys_only=True)
            query.order("-rawDataId")
            new_key_list = []
            count = 0
            for key_in_query in query:
                count += 1
                if count >= LIMIT: break
                if key_in_query in old_key_list: break
                new_key_list.append(key_in_query)

            all_key_list = new_key_list + old_key_list
            all_key_list = all_key_list[:LIMIT]
            client.set(MEMCACHE_KEY, all_key_list, 15)
        else:
            all_key_list = old_key_list

        for key_in_list in all_key_list:
            raw_data = client.get(str(key_in_list))
            if not isinstance(raw_data, RawData):
                raw_data_list = RawData.get([key_in_list])
                if len(raw_data_list) != 1: continue
                raw_data = raw_data_list[0]
                if not isinstance(raw_data, RawData): continue
                client.set(str(key_in_list), raw_data)
            if not isinstance(raw_data, RawData): continue

            raw_data_dict = {
                "rawDataId": raw_data.rawDataId,
                "path": raw_data.path,
                "parameters": raw_data.parameters,
                "query": raw_data.query,
                "fragment": raw_data.fragment,
                "body": raw_data.body
            }
            #logging.info(raw_data_dict)
            template_values["all_raw_data"].append(raw_data_dict)

        self.writeWithTemplate(template_values, "RawData")
    def get(self):
        MEMCACHE_KEY = "yw4ct7ntqzh93ioqaxif"
        path_info = self.request.path_info.split("/")
        debug("PATH_INFO = %s" % path_info)
        client = memcache.Client()
        LIMIT = 100

        if len(self.request.get("clear")) != 0:
            client.delete(MEMCACHE_KEY)
            
        template_values = {}
        template_values["all_raw_data"] = []

        
        old_key_list = client.get(MEMCACHE_KEY)
        if old_key_list is None:
            old_key_list = []
            query = Query(RawData, keys_only=True)
            query.order("-rawDataId")
            new_key_list = []
            count = 0
            for key_in_query in query:
                count += 1
                if count >= LIMIT: break
                if key_in_query in old_key_list: break
                new_key_list.append(key_in_query)
            
            all_key_list = new_key_list + old_key_list
            all_key_list = all_key_list[:LIMIT]
            client.set(MEMCACHE_KEY, all_key_list, 15)
        else:
            all_key_list = old_key_list

        for key_in_list in all_key_list:
            raw_data = client.get(str(key_in_list))
            if not isinstance(raw_data, RawData):
                raw_data_list = RawData.get([key_in_list])
                if len(raw_data_list) != 1: continue
                raw_data = raw_data_list[0]
                if not isinstance(raw_data, RawData): continue
                client.set(str(key_in_list), raw_data)
            if not isinstance(raw_data, RawData): continue

            raw_data_dict = {"rawDataId": raw_data.rawDataId,
                            "path":raw_data.path,
                            "parameters": raw_data.parameters,
                            "query": raw_data.query,
                            "fragment":raw_data.fragment,
                            "body": raw_data.body }
            #logging.info(raw_data_dict)
            template_values["all_raw_data"].append(raw_data_dict)
        
        self.writeWithTemplate(template_values, "RawData")
 def get(self):
     gql = RawData.gql("ORDER BY rawDataId DESC LIMIT 5000")
     records = gql.run()
     results = []
     for record in records:
         query_dict = cgi.parse_qs(record.query)
         if query_dict.has_key("arduinoid"):
             try:
                 gen_power = query_dict["gen.power(W)"][0]
                 timestring = query_dict["time"][0]
             except: continue
             results.append([gen_power, timestring[0:4], timestring[4:6], timestring[6:8], timestring[8:10], timestring[10:12], timestring[12:14]])
             #results.append([gen_power])
     self.response.out.write(self.request.get("callback") + "(" + dumps({"timeVsWatt":results}) + ");")
 def get(self):
     template_values = {}
     template_values["all_raw_data"] = []
     gql = RawData.gql("ORDER BY rawDataId DESC LIMIT 100")
     all_raw_data = gql.run()
     #all_raw_data = RawData.all()
     for raw_data in all_raw_data:
         raw_data_dict = {"rawDataId": raw_data.rawDataId,
                         "path":raw_data.path,
                         "parameters": raw_data.parameters,
                         "query": raw_data.query,
                         "fragment":raw_data.fragment,
                         "body": raw_data.body }
         #logging.info(raw_data_dict)
         template_values["all_raw_data"].append(raw_data_dict)
     
     self.writeWithTemplate(template_values, "RawData")
    def get(self):
        template_values = {}
        template_values["all_raw_data"] = []
        gql = RawData.gql("ORDER BY rawDataId DESC LIMIT 100")
        all_raw_data = gql.run()
        #all_raw_data = RawData.all()
        for raw_data in all_raw_data:
            raw_data_dict = {
                "rawDataId": raw_data.rawDataId,
                "path": raw_data.path,
                "parameters": raw_data.parameters,
                "query": raw_data.query,
                "fragment": raw_data.fragment,
                "body": raw_data.body
            }
            #logging.info(raw_data_dict)
            template_values["all_raw_data"].append(raw_data_dict)

        self.writeWithTemplate(template_values, "RawData")
 def get(self):
     gql = RawData.gql("ORDER BY rawDataId DESC LIMIT 5000")
     records = gql.run()
     results = []
     for record in records:
         query_dict = cgi.parse_qs(record.query)
         if query_dict.has_key("arduinoid"):
             try:
                 gen_power = query_dict["gen.power(W)"][0]
                 timestring = query_dict["time"][0]
             except:
                 continue
             results.append([
                 gen_power, timestring[0:4], timestring[4:6],
                 timestring[6:8], timestring[8:10], timestring[10:12],
                 timestring[12:14]
             ])
             #results.append([gen_power])
     self.response.out.write(
         self.request.get("callback") + "(" +
         dumps({"timeVsWatt": results}) + ");")
示例#7
0
    def process_item(self, item, spider):
        if (isinstance(item, Article)):
            content1 = item["content"].encode("utf-8")
            f = Filter()
            text = f.filterResult(item["title"], item["content"])

            if text:
                # print "text:"+text[1]+text[2]+text[3]
                money1 = text[2]
                org1 = text[1]
                date1 = text[3]
                date2 = date(date1[0], date1[1], date1[2])
                a = RawData(title=text[0],
                            content=item["content"].encode("utf-8"),
                            spider=item["spider"].encode("utf-8"),
                            org=org1,
                            money=money1,
                            date=date2)
                self.session.add(a)
                self.session.commit()
            id1 = item["id"]
            name1 = item["spider"].encode("utf-8")
            title1 = item["title"].encode("utf-8")
            currentURL = item["currentURL"].encode("utf-8")
            sql1 = "INSERT INTO `status` (`crawler_id`, `current_title` ,`current_url`, `name`) VALUES (" + str(
                id1
            ) + ",'" + title1 + "','" + currentURL + "','" + name1 + "') ON DUPLICATE KEY UPDATE `current_title`='" + title1 + "',`current_url`='" + currentURL + "',`name`='" + name1 + "',`timestamp`=NOW()"
            engine.execute(sql1)
        else:
            currentPage = item["currentPage"].encode("utf-8")
            id = item["id"]
            name = item["name"].encode("utf-8")
            sql = "INSERT INTO `status` (`crawler_id`, `current_page`) VALUES (" + str(
                id
            ) + ",'" + currentPage + "') ON DUPLICATE KEY UPDATE `current_page`='" + currentPage + "'"
            engine.execute(sql)