def parse_all_hansards():
    """Parse every Hansard that has no statements yet, reporting to stdout.

    Walks, in date order, the Hansard rows whose related ``statement`` count
    is zero and runs ``hans.parseAndSave`` on each one. A failure on one
    Hansard is printed, together with details from its HansardCache row when
    those can be loaded, and the loop then moves on to the next Hansard.

    Returns:
        list: the Hansard objects for which parsing completed without
        raising.
    """
    parsed = []
    unparsed = (
        Hansard.objects.all()
        .annotate(scount=Count('statement'))
        .exclude(scount__gt=0)
        .order_by('date')
    )
    for hansard in unparsed.iterator():
        try:
            print("Trying %d %s... " % (hansard.id, hansard))
            hans.parseAndSave(hansard)
            print("SUCCESS for %s" % hansard)
            parsed.append(hansard)
        except Exception as e:
            print("******* FAILURE **********")
            print("ERROR: %s" % e)
            print("EXCEPTION TYPE: %s" % e.__class__)
            # The cache details are diagnostics only: if they cannot be
            # loaded, say so and carry on instead of letting the lookup
            # error abort the remaining Hansards.
            try:
                cache = HansardCache.objects.get(hansard=hansard.id)
                print("HANSARD %d: %s" % (cache.hansard.id, cache.hansard))
                print("FILE: %s" % cache.filename)
                print("URL: %s" % cache.hansard.url)
            except Exception as cache_error:
                print("CACHE DETAILS UNAVAILABLE: %s" % cache_error)
    return parsed
def hansards_parse():
    """Parse each Hansard that has no statements, then save its activity.

    For every Hansard whose related ``statement`` count is zero (in date
    order):

    * ``hans.parseAndSave`` is run. On failure the transaction is rolled
      back, the admins are mailed, and the loop continues with the next
      Hansard. On success the transaction is committed.
    * The Hansard is reloaded and ``save_activity()`` is called. On failure
      the transaction is rolled back and the exception propagates, ending
      the run.

    Raises:
        Exception: whatever ``save_activity()`` raised, with its original
        traceback.
    """
    # NOTE(review): this file defines hansards_parse a second time further
    # down; the later definition is the one that stays bound to the name.
    unparsed = (
        Hansard.objects.all()
        .annotate(scount=models.Count('statement'))
        .exclude(scount__gt=0)
        .order_by('date')
    )
    for hansard in unparsed.iterator():
        try:
            hans.parseAndSave(hansard)
        except Exception as e:
            transaction.rollback()
            mail_admins(
                "Hansard parse failure on #%s" % hansard.id, unicode(e))
            continue
        else:
            transaction.commit()

        # now reload the Hansard to get the date
        hansard = Hansard.objects.get(pk=hansard.id)
        try:
            hansard.save_activity()
        except Exception:
            transaction.rollback()
            # Bare raise keeps the traceback pointing at the real failure
            # inside save_activity() rather than at this line.
            raise
        # NOTE(review): a successful save_activity() is not followed by an
        # explicit commit here, unlike parseAndSave above - confirm that
        # this is intended.
def hansards_parse():
    """Parse statement-less Hansards in date order and record their activity.

    Each Hansard with a ``statement`` count of zero goes through two steps:

    1. ``hans.parseAndSave(hansard)``. A failure rolls the transaction back,
       mails the admins with the error text, and skips to the next Hansard;
       success commits.
    2. The Hansard is fetched again by primary key and ``save_activity()``
       is called on the fresh object. A failure rolls back and is re-raised,
       which stops the run.

    Raises:
        Exception: the error raised by ``save_activity()``, original
        traceback intact.
    """
    # NOTE(review): an earlier definition of hansards_parse appears above in
    # this file; this later one replaces it when the module is loaded.
    pending = Hansard.objects.all().annotate(
        scount=models.Count('statement')).exclude(
        scount__gt=0).order_by('date')
    for hansard in pending.iterator():
        try:
            hans.parseAndSave(hansard)
        except Exception as e:
            transaction.rollback()
            subject = "Hansard parse failure on #%s" % hansard.id
            mail_admins(subject, unicode(e))
            continue
        else:
            transaction.commit()

        # now reload the Hansard to get the date
        hansard = Hansard.objects.get(pk=hansard.id)
        try:
            hansard.save_activity()
        except Exception:
            transaction.rollback()
            # Re-raise with a bare raise so the traceback of the original
            # failure is not replaced by one starting at this line.
            raise
        # NOTE(review): no explicit commit follows a successful
        # save_activity(), unlike the parse step - confirm that is intended.