if parl: break if not parl: print >> sys.stderr, "WARNING: could not find député", ["%s | %s" % (checker(p["nom"]), p["groupe_sigle"]) for p in circosparls[circo]], "for circo", circo pprint(["%s | %s" % (checker("%s %s" % (p['Prénom candidat'], p['Nom candidat'])), p['Parti rattachement'].decode("utf-8")) for p in candidats], stream=sys.stderr) print >> sys.stderr parl = circosparls[circo][0] line['Nom candidat'] = parl["nom_de_famille"].upper() line['Prénom candidat'] = parl["prenom"] line['Parti rattachement'] = "Non rattaché%s" % ("e" if parl["sexe"] == "F" else "") results.append([ line['Nom candidat'], line['Prénom candidat'], parl['groupe_sigle'], unif_partis(lowerize(line['Parti rattachement'])), parl['sexe'], parl['nom_circo'], parl['slug'], parl['url_an'] ]) del(circosparls[circo]) for circo, parls in circosparls.items(): parl = parls[0] results.append([ parl['nom_de_famille'].upper(), parl['prenom'], parl['groupe_sigle'], "Non rattaché%s" % ("e" if parl["sexe"] == "F" else ""), parl['sexe'],
elif left < l3: if "<b>" in text: a = text.split(' <b>') record[2] = a[0] record[3] = a[1] else: record[2] = clean(text) record[2] = clean_app(record[2]).replace("Rassemblement-", "R").replace("ÉCOL.", 'ECOLO').replace('Ecolo', 'ECOLO') else: record[3] = clean(text) if record[3]: if not "".join(record[:2]): tmp = clean(record[3]) record = results.pop() record[3] = "%s %s" % (clean(record[3]), tmp) record[3] = unif_partis(record[3]) parl = find_parl(record[0], record[1], record[2], parls) if parl: if record[3] == "Aucun rattachement": record[3] = "Non rattaché" if parl['sexe'] == 'F': record[3] += "e" record[4] = parl.get('sexe').encode('utf-8') record[5] = parl.get('nom_circo').encode('utf-8') record[6] = parl.get('slug').encode('utf-8') record[7] = parl.get('url_institution', parl.get('url_an')).encode('utf-8') results.append(record) record = ["", "", "", "", "", "", "", ""] if not drawMap: print ",".join(['"%s"' % h for h in headers])
with open("cache/deputes.json") as f: parls = [p["depute"] for p in json.load(f)['deputes']] for line in csv: for k in line: line[k] = line[k].decode('iso-8859-15').encode('utf-8') groupe = line["Groupe"].replace("app.", "").replace("Écolo", "ECOLO") parl = find_parl(line['Nom'], line['Pr\xe9nom'], groupe, parls) if not parl: print >> sys.stderr, "WARNING: could not process", line continue results.append([ line['Nom'], line['Pr\xe9nom'], line['Groupe'], unif_partis(line['Parti ou groupement politique']), parl['sexe'], parl['nom_circo'], parl['slug'], parl['url_an'] ]) print ",".join(['"%s"' % h for h in headers]) for i in results: for j in range(len(i)): i[j] = clean(i[j]) try: i[j] = i[j].encode('utf-8') except: pass print ",".join([str(i[a]) if isinstance(i[a], int) else "\"%s\"" % i[a].replace('"', '""') for a,_ in enumerate(i)])