Python LimitedDictLists.getQueueの例

プログラミング言語: Python

名前空間/パッケージ名: gl.containers

クラス/型: LimitedDictLists

メソッド/関数: getQueue

hotexamples.comのコード掲載数: 3

Python LimitedDictLists.getQueue - 3件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのgl.containers.LimitedDictLists.getQueueの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示非表示

LimitedDictLists(3)

getQueue(2)

insert(2)

よく使われるメソッド

LimitedDictLists (3)

getQueue (2)

insert (2)

コード例 #1

ファイルを表示

def process(dump, page):
    recentRevs = LimitedDictLists(maxsize=15)
    for revision in page.readRevisions():
        checksum = hashlib.md5(revision.getText().encode("utf-8")).hexdigest()
        if checksum in recentRevs:
            #found a revert
            revertedToRev = recentRevs[checksum]

            #get the revisions that were reverted
            revertedRevs = [
                r for (c, r) in reversed(recentRevs.getQueue())
                if r.getId() > revertedToRev.getId()
            ]

            isVandalism = wmf.isVandalismByComment(revision.getComment())

            #write revert row
            yield ('revert', revision.getId(), revertedToRev.getId(),
                   isVandalism, len(revertedRevs))

            for rev in revertedRevs:
                yield ('reverted', rev.getId(), revision.getId(),
                       revertedToRev.getId(), isVandalism, len(revertedRevs))
        else:
            pass

        recentRevs.insert(checksum, revision)

コード例 #2

ファイルを表示

ファイル: persistence_state.py プロジェクト: Kucheriavenko/bachelor-thesis

class PersistenceState:
    """
	Represents the state of word persistence in an article.  When Revisions
	and their content are given to a PersistenceState (via `update()`), 
	PersistenceState keeps track of how words persist as new revisions are 
	made.
	"""

    __slots__ = ("__splitter", "__differ", "__revertLimit", "__lastRevision", "__revisions", "__recentPersistence")

    def __init__(self, splitter, differ, revertLimit=15):
        """
		Constructor
		
		:Parameters:
			splitter : function
				Function to use when splitting revision content into words
			differ : function
				Function to use when generating the difference between two list of words
			revertLimit : int
				The maximum amount of steps backwards a revert can take.
		"""
        self.__splitter = splitter
        self.__differ = differ

        self.__revertLimit = revertLimit
        self.__lastRevision = None
        self.__revisions = 0
        self.__recentPersistence = LimitedDictLists(maxsize=revertLimit)

    def deflate(self):
        """
		Creates a JSONable version of the instance.  This includes a 
		carefully constructed index of Words as they represent the 
		history of revisions.
		
		:Return:
			A JSONable dictionary
		"""
        # create an index of all of the Words we care about.  This is
        # important since we want all of the words to be referenced
        # correctly.
        index = 0
        words = set()
        word2Index = {}
        index2WordJSON = {}
        for (checksum, revision) in self.__recentPersistence.getQueue():
            for word in revision.getWordList().getWords():
                if word not in word2Index:
                    word2Index[word] = index
                    index2WordJSON[index] = word.deflate()
                    index += 1

                    # Create a list of revisions that can be used to reload the
                    # recentPersistence.
        queue = []
        for (checksum, revision) in self.__recentPersistence.getQueue():
            # Ignore checksum.  It is in Revision.
            queue.append(revision.deflate(word2Index))

        json = {
            "revertLimit": self.__revertLimit,
            "revisions": self.__revisions,
            "index2WordJSON": index2WordJSON,
            "recentPersistence": queue,
        }
        return json

    @staticmethod
    def inflate(json, splitter, differ):
        """
		Creates an instance of PersistentState that is identical to the
		one whose deflate() method was called to produce the json.
		
		:Parameters:
			json : dict
				a JSONable version of a PersistenceState
			splitter : function
				Function to use when splitting revision content
				into words
			differ : function
				Function to use when generating the difference
				between two list of words
			
		:Return:
			PersistentState
		"""
        # Create a state and populate fields
        state = PersistenceState(splitter, differ, json["revertLimit"])
        state.__revisions = json["revisions"]

        # Create the word map
        index2Word = {}
        for index in json["index2WordJSON"]:
            index2Word[index] = Word.inflate(json["index2WordJSON"][index])

            # For each thing in the history of persistence, create it using
            # the index2Word we just made and insert it in the right
            # order.
        for revisionJSON in json["recentPersistence"]:
            r = Revision.inflate(revisionJSON, index2Word)
            state.__recentPersistence.insert(r.getChecksum(), r)
            state.__lastRevision = r

        return state

    def getLastRevision(self):
        return self.__lastRevision

    def getRevisions(self):
        return self.__revisions

    def update(self, revision, content):
        """
		Modifies the internal state based a new revision and content.
		
		:Parameters:
			revision : Revision
				The new revision to apply
			content : string
				The content for the new revision
			
		:Return:
			(wordsAdded, wordsRemoved) that resulted from applying
			the revision and content to the previous state.
		"""
        # Check for previous revisions that are identical
        if revision.getChecksum() in self.__recentPersistence:
            # we found a revert or a noop
            wordsAdded = []
            wordsRemoved = []
            revision.setWordList(self.__recentPersistence[revision.getChecksum()].getWordList())
        else:

            # actual change took place
            contents = self.__splitter(content)
            if self.__lastRevision == None:
                # First revision
                wordsRemoved = []
                revision.setWordList(WordList(contents, revision))
                wordsAdded = revision.getWordList().getWords()
            else:
                diff = self.__differ(self.__lastRevision.getContents(), contents)
                (wl, wordsAdded, wordsRemoved) = self.__lastRevision.getWordList().applyDiff(diff, revision)

                revision.setWordList(wl)

        revision.getWordList().increment()
        self.__lastRevision = revision
        self.__recentPersistence.insert(revision.getChecksum(), revision)
        self.__revisions += 1

        return (wordsAdded, wordsRemoved)

    def __eq__(self, other):
        if (
            isinstance(other, self.__class__)
            and self.getLastRevision() == other.getLastRevision()
            and self.getRevisions() == other.getRevisions()
        ):

            selfQueue = self.__recentPersistence.getQueue()
            otherQueue = other.__recentPersistence.getQueue()
            if len(selfQueue) == len(otherQueue):
                for i in range(0, len(selfQueue)):
                    selfRevision = selfQueue[i]
                    otherRevision = otherQueue[i]

                    if selfRevision != otherRevision:
                        return False

                return True
            else:
                return False
        else:
            return False

    def __ne__(self, other):
        return not self == other

コード例 #3

ファイルを表示

def process(dump, page):
	recentRevs = LimitedDictLists(maxsize=15)
	lastTokens = []
	metaHeaders = [
		'rev_id',
		'checksum',
		'tokens',
		'cs_added',
		'cs_removed',
		'ts_added',
		'ts_removed',
		'ws_added',
		'ws_removed',
		'ms_added',
		'ms_removed'
	]
	for revision in page.readRevisions():
		checksum = hashlib.md5(revision.getText().encode("utf-8")).hexdigest()
		if checksum in recentRevs:
			#found a revert
			revertedToRev = recentRevs[checksum]
			
			#get the revisions that were reverted
			revertedRevs = [r for (c,r) in reversed(recentRevs.getQueue()) if r.getId() > revertedToRev.getId()]
			
			#write revert row
			yield (
				'revert',
				revision.getId(), 
				revertedToRev.getId(), 
				len(revertedRevs)
			)
			
			for rev in revertedRevs:
				yield (
					'reverted',
					rev.getId(),
					revision.getId(),
					revertedToRev.getId(), 
					len(revertedRevs)
				)
		else:
			pass
		
		tokens = tokenize(revision.getText())
		
		tokensAdded, tokensRemoved = simpleDiff(lastTokens, tokens)
		
		row = {
			'rev_id':     revision.getId(),
			'checksum':   checksum,
			'tokens':     len(revision.getText()),
			'cs_added':   0,
			'cs_removed': 0,
			'ts_added':   0,
			'ts_removed': 0,
			'ws_added':   0,
			'ws_removed': 0,
			'ms_added':   0,
			'ms_removed': 0
		}
		for token in tokensAdded:
			row['ts_added'] += 1
			row['cs_added'] += len(token)
			if token.strip() == '':       pass
			if token in MARKUP:           row['ms_added'] += 1
			elif token not in STOP_WORDS: row['ws_added'] += 1
		for token in tokensRemoved:
			row['ts_removed'] += 1
			row['cs_removed'] += len(token)
			if token.strip() == '':       pass
			if token in MARKUP:           row['ms_removed'] += 1
			elif token not in STOP_WORDS: row['ws_removed'] += 1
			
		
		yield tuple(['meta']+[row[h] for h in metaHeaders])
		
		lastTokens = tokens
		recentRevs.insert(checksum, revision)