# Assumed imports for this view fragment: `request` is Flask's request
# proxy and DataManager comes from the project's data layer.
from flask import request

from data.data import DataManager


def save_order():
    order = request.get_json()['order']
    # Called on the class, as in the original fragment
    DataManager.save_order(order)
    return "1"
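# Usage sketch (not from the original source): exercising the view above,
# assuming it is registered on a local Flask app at a hypothetical
# /save_order route. The payload shape beyond the 'order' key is invented.
import requests

resp = requests.post('http://127.0.0.1:5000/save_order',
                     json={'order': {'id': 1, 'items': []}})
assert resp.text == '1'  # the view returns the literal string "1" on success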
# Created on 2017-01-13 18:27

import time
import shlex
import logging
import subprocess
from random import randint

from config.config import ss_config_list
from data.data import DataManager

# Clean up any ss-local processes left over from a previous run
subprocess.call(('killall', 'ss-local'))

current_ip = ''
local_ip = 'local_ip'
data_manager = DataManager()
ss_process_list = []
ss_proxy_list = []
random_proxy_mute_dict = {}


def create_ss_proxies():
    global ss_process_list, ss_proxy_list
    if ss_process_list:
        return
    for index, config in enumerate(ss_config_list):
        # One ss-local instance per config, each on its own local port
        local_port = 1090 + index
        args = shlex.split('ss-local -s {0} -p {1} -l {local_port} '
                           '-k {3} -m {2} -t 10 -b 0.0.0.0'.format(
                               *config, local_port=local_port))
        # Assumed completion (the original is truncated here): start the
        # process and record its local SOCKS5 endpoint.
        ss_process_list.append(subprocess.Popen(args))
        ss_proxy_list.append('socks5://127.0.0.1:{0}'.format(local_port))
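# Sketch (assumed, not in the original fragment): one way the module's
# globals could be consumed. Picks a random SOCKS5 proxy in the format
# `requests` expects, skipping entries muted until a future timestamp;
# the helper name `random_proxy` and the mute-dict convention (proxy ->
# muted-until timestamp) are assumptions.
def random_proxy():
    candidates = [proxy for proxy in ss_proxy_list
                  if random_proxy_mute_dict.get(proxy, 0) < time.time()]
    if not candidates:
        return None
    proxy = candidates[randint(0, len(candidates) - 1)]
    return {'http': proxy, 'https': proxy}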
import logging
from datetime import datetime

from elasticsearch import ElasticsearchException

from data.data import DataManager
# Assumed import paths for the two helpers below; only the class names
# APIHelper and WebHelper appear in the original fragment.
from api.api import APIHelper
from web.web import WebHelper


class Fetcher(object):
    """API fetcher to complete tasks"""

    def __init__(self):
        self.api = APIHelper()
        self.data = DataManager()
        self.web = WebHelper()

    def fetch_single_topic(self, topic_id):
        topic_info = self.api.get_topic_info(topic_id)
        partial_member = self.data.member_of_topic(topic_info)
        stored_topic = self.data.find_topic(topic_id)
        new_topic = self.data.handle_topic(topic_info, topic_id)
        if stored_topic:
            # Preserve the web-crawl timestamp of the stored copy
            new_topic['web_crawled'] = stored_topic['web_crawled']
        else:
            # Never web-crawled: use the epoch and zeroed counters
            new_topic['web_crawled'] = datetime.fromtimestamp(0)
            new_topic['click'] = 0
            new_topic['favorite'] = 0
            new_topic['thank'] = 0
        self.data.update_topic_synced_state(new_topic['id'], False)
        self.data.upsert_topic(new_topic)
        self.data.upsert_member(partial_member)

    def fetch_new_topics(self):
        max_stored_topic_id = self.data.max_stored_topic_id
        topic_count = self.api.get_topic_count()
        if max_stored_topic_id >= topic_count:
            return
        for topic_id in range(max_stored_topic_id + 1, topic_count + 1):
            self.fetch_single_topic(topic_id)

    def fetch_replies_of_topic(self, topic_id):
        replies = self.api.get_replies(topic_id)
        if replies:
            self.data.update_topic_synced_state(topic_id, False)
            for reply in replies:
                partial_member = self.data.member_of_reply(reply)
                self.data.upsert_reply(self.data.handle_reply(reply, topic_id))
                self.data.upsert_member(partial_member)

    def fetch_new_replies(self):
        max_stored_topic_id = self.data.max_stored_topic_id
        max_stored_topic_id_of_reply = self.data.max_stored_topic_id_of_reply
        if max_stored_topic_id_of_reply == 0:
            need_refetch_max_topic = False
        else:
            # Refetch the newest topic's replies if the stored count lags
            # behind the topic's own reply counter
            topic = self.data.find_topic(max_stored_topic_id_of_reply)
            replies = self.data.find_all_replies(max_stored_topic_id_of_reply)
            need_refetch_max_topic = replies.count() != topic['replies']
        for topic_id in range(
                max_stored_topic_id_of_reply + 1 - int(need_refetch_max_topic),
                max_stored_topic_id + 1):
            if self.data.find_topic(topic_id=topic_id):
                self.fetch_replies_of_topic(topic_id)

    def fetch_single_topic_extras(self, topic_id):
        def upsert_counts(click, favorite, thank):
            self.data.upsert_topic_extras(topic_id, click, favorite, thank)
            self.data.update_topic_synced_state(topic_id, False)
            count = self.data.update_topic_web_crawled(
                topic_id, datetime.utcnow())
            logging.info('Update topic {0} extras, count {1}'.format(
                topic_id, count))

        web_extra = self.web.get_topic_extras(topic_id)
        if not web_extra:
            count = self.data.update_topic_web_crawled(
                topic_id, datetime.utcnow())
            topic = self.data.find_topic(topic_id)
            if (not topic) or ('click' not in topic):
                upsert_counts(0, 0, 0)
            logging.info('Topic {0} extras is None, count {1}'.format(
                topic_id, count))
            return
        for index, postscript in enumerate(web_extra.subtle_list):
            postscript = self.data.handle_postscript(
                postscript, topic_id, index + 1)
            self.data.upsert_postscript(postscript)
        upsert_counts(web_extra.click, web_extra.favorite, web_extra.thank)

    def fetch_all_topic_extras(self):
        while True:
            min_topic_id_need_postscript = self.data.min_topic_id_need_extras
            if min_topic_id_need_postscript > 0:
                try:
                    self.fetch_single_topic_extras(
                        min_topic_id_need_postscript)
                except ElasticsearchException:
                    raise
                except Exception as e:
                    logging.error('Fetch single topic extras error: ' + str(e))
            else:
                break

    def fetch_all_nodes(self):
        nodes = self.api.get_all_nodes()
        if nodes:
            for node in nodes:
                node['crawled'] = datetime.utcnow()
                self.data.upsert_node(node)
            logging.info('Fetched all nodes, count: ' + str(len(nodes)))

    def fetch_new_members(self):
        site_stats = self.api.get_site_stats()
        max_stored_member_id = self.data.max_stored_member_id
        if site_stats:
            member_max = site_stats['member_max']
            for member_id in range(max_stored_member_id + 1, member_max + 1):
                new_member = self.api.get_member_info(member_id=member_id)
                if not new_member:
                    continue
                new_member['crawled'] = datetime.utcnow()
                self.data.upsert_member(new_member)
                logging.info('Upsert member {0}, id {1}'.format(
                    new_member['username'], new_member['id']))
        else:
            # No site stats: walk member ids one past the stored maximum
            # until the API stops returning members
            new_member = self.api.get_member_info(
                member_id=self.data.max_stored_member_id + 1)
            while new_member:
                new_member['crawled'] = datetime.utcnow()
                self.data.upsert_member(new_member)
                logging.info('Upsert member {0}, id {1}'.format(
                    new_member['username'], new_member['id']))
                new_member = self.api.get_member_info(
                    member_id=self.data.max_stored_member_id + 1)

    def fetch_stale_topics(self):
        stale_topics = self.data.stale_topics()
        if not stale_topics:
            return
        for topic in stale_topics:
            topic_id = topic['id']
            self.fetch_single_topic(topic_id)
            if topic['web_crawled'] and topic[
                    'recrawl'] and topic['web_crawled'] < topic['recrawl']:
                self.fetch_single_topic_extras(topic_id)
            self.fetch_replies_of_topic(topic_id)

    def sync_topic_to_es(self):
        waiting_topics = self.data.not_synced_topics()
        if not waiting_topics:
            return
        for topic in waiting_topics:
            self.data.update_topic_synced_state(topic['id'], True)
            self.data.es_update_assembled_topic(topic)
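# Usage sketch (assumed driver, not part of the original source): the
# Fetcher methods compose into a single crawl pass: nodes and new topics
# first, then replies and web-only extras, then stale recrawls, and
# finally the Elasticsearch sync.
if __name__ == '__main__':
    logging.basicConfig(level=logging.INFO)
    fetcher = Fetcher()
    fetcher.fetch_all_nodes()
    fetcher.fetch_new_topics()
    fetcher.fetch_new_replies()
    fetcher.fetch_all_topic_extras()
    fetcher.fetch_stale_topics()
    fetcher.sync_topic_to_es()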
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Author: gexiao
# Created on 2017-09-22 22:53

import sys
sys.path.append('..')

import pymongo
from datetime import timedelta

from data.data import DataManager, RECRAWL_DELTA_DAYS

if __name__ == "__main__":
    data = DataManager()
    cursor = data.topic_collection.find(
        {'id': {'$gt': 0}}).sort('id', pymongo.ASCENDING)
    for topic in cursor:
        if topic['deleted']:
            continue
        created_time = topic['created']
        crawled_time = topic['crawled']
        delta = crawled_time - created_time
        days = delta.days
        for delta_days in RECRAWL_DELTA_DAYS:
            if days < delta_days:
                recrawl = created_time + timedelta(days=delta_days)
                # Assumed completion (the original is truncated here):
                # persist the next recrawl time and move on to the next topic
                data.topic_collection.update_one(
                    {'id': topic['id']},
                    {'$set': {'recrawl': recrawl}})
                break
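# Worked example (illustrative only): a topic crawled 5 days after creation
# gets its recrawl scheduled at the first window larger than 5 days. The
# ladder values below are assumptions; the real RECRAWL_DELTA_DAYS lives in
# data.data.
from datetime import datetime, timedelta

created = datetime(2017, 9, 1)
crawled = created + timedelta(days=5)
for delta_days in (1, 3, 7, 30):  # hypothetical ladder
    if (crawled - created).days < delta_days:
        print(created + timedelta(days=delta_days))  # 2017-09-08 00:00:00
        break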