def getData():
    """Build the redirect and gone results from the parser's fallback data.

    The fallback data is fetched from ``subscriptionParser.getFallbackData()``
    and each half is passed through ``processData``. Both calls receive the
    same ``seen`` set, so the redirect pass runs first and whatever it
    records there is visible to the gone pass.

    Returns:
        A ``(redirects, gone)`` tuple holding the two ``processData`` results.
        The redirect pass is seeded with an empty dict, the gone pass with an
        empty set (presumably the accumulators that are returned -- verify
        against ``processData``).
    """
    seen = set()
    redirectSource, goneSource = subscriptionParser.getFallbackData()

    # Order matters: both passes share ``seen``.
    redirectResult = processData(redirectSource, seen, {})
    goneResult = processData(goneSource, seen, set())
    return (redirectResult, goneResult)
def loadSubscriptions(counts):
    """Process the fallback data and report frequently counted URLs.

    Args:
        counts: Mapping from URL to a numeric count. It is handed to
            ``processFile`` for both the redirect and the gone data
            (presumably ``processFile`` updates it -- verify), and is then
            read to build the report.

    Returns:
        A ``(redirects, gone, unaccounted)`` tuple. ``redirects`` and ``gone``
        are the ``processFile`` results. ``unaccounted`` is a list of
        ``'%5i %s%s'``-formatted lines, one per URL whose count is at least
        10, ordered by descending count. A URL that is not a variant URL of
        any subscription returned by ``readSubscriptions()`` is suffixed
        with ``' [?]'``.
    """
    subscriptions = subscriptionParser.readSubscriptions()

    # Only membership is needed, so collect the variant URLs in a set.
    knownURLs = set()
    for subscription in subscriptions.values():
        for _title, url, _complete in subscription.variants:
            knownURLs.add(url)

    (redirectData, goneData) = subscriptionParser.getFallbackData()
    redirects = processFile(redirectData, counts)
    gone = processFile(goneData, counts)

    # sorted() instead of filter(...).sort(): on Python 3 filter() returns an
    # iterator without a sort() method. The sort is stable either way, so
    # ties keep the iteration order of counts.keys().
    frequent = sorted(
        (url for url in counts.keys() if counts[url] >= 10),
        key=lambda url: counts[url],
        reverse=True
    )
    unaccounted = [
        '%5i %s%s' % (counts[url], url, '' if url in knownURLs else ' [?]')
        for url in frequent
    ]
    return (redirects, gone, unaccounted)