def process_csv(filepath, output):
    """Convert a semicolon-delimited CSV file into a comma-joined text file.

    The input is read with ``csv.DictReader`` (``;`` delimiter, ``"`` quote
    character). Every value of each row is passed through ``clean_text``;
    one line per row is then written to ``output``, after a header line
    built from ``AVANTAGES_HEADERS``.

    NOTE(review): a later redefinition of ``process_csv`` in this file
    overrides this one at import time -- confirm which copy should stay.

    Args:
        filepath: Path of the input CSV file.
        output: Path of the file to write. It is opened in ``"w"`` mode, so
            any existing content is replaced.

    Raises:
        KeyError: If a row lacks one of the columns indexed directly here
            (``denomination_sociale``, ``avant_montant_ttc``,
            ``avant_date_signature``, ``benef_codepostal``).
    """
    if sys.version_info[0] < 3:
        # Python 2's csv module expects the file opened in binary mode.
        infile = open(filepath, 'rb')
        # Python 2's built-in open() has no ``encoding`` parameter.
        output_kwargs = {}
    else:
        infile = open(filepath, 'r', newline='', encoding='utf8')
        # Write with the same encoding the input is read with; otherwise the
        # output depends on the platform locale and non-ASCII text can raise
        # UnicodeEncodeError.
        output_kwargs = {'encoding': 'utf8'}

    with infile as csvfile:
        reader = csv.DictReader(csvfile, delimiter=';', quotechar='"')
        with open(output, "w", **output_kwargs) as outputfile:
            outputfile.write(",".join(AVANTAGES_HEADERS) + "\n")
            for row in reader:
                cleaned_row = dict((k, clean_text(v)) for k, v in row.items())
                # Fields are joined with "," without any CSV quoting.
                # NOTE(review): presumably clean_text removes characters
                # that would break the format -- confirm.
                columns = (
                    build_origin(cleaned_row),
                    cleaned_row["denomination_sociale"],
                    build_name(cleaned_row),
                    build_address(cleaned_row),
                    build_qualification(cleaned_row),
                    build_rpps(cleaned_row),
                    cleaned_row["avant_montant_ttc"],
                    str2date(cleaned_row["avant_date_signature"]),
                    build_nature(cleaned_row),
                    build_eta(cleaned_row),
                    cleaned_row["benef_codepostal"],
                )
                outputfile.write(",".join(columns) + "\n")
def process_csv(filepath, output):
    """Convert a semicolon-delimited CSV file into a comma-joined text file.

    The input is read with ``csv.DictReader`` (``;`` delimiter, ``"`` quote
    character). Every value of each row is passed through ``clean_text``;
    one line per row is then written to ``output``, after a header line
    built from ``AVANTAGES_HEADERS``.

    Args:
        filepath: Path of the input CSV file.
        output: Path of the file to write. It is opened in ``"w"`` mode, so
            any existing content is replaced.

    Raises:
        KeyError: If a row lacks one of the columns indexed directly here
            (``denomination_sociale``, ``avant_montant_ttc``,
            ``avant_date_signature``, ``benef_codepostal``).
    """
    if sys.version_info[0] < 3:
        # Python 2's csv module expects the file opened in binary mode.
        infile = open(filepath, 'rb')
        # Python 2's built-in open() has no ``encoding`` parameter.
        output_kwargs = {}
    else:
        infile = open(filepath, 'r', newline='', encoding='utf8')
        # Write with the same encoding the input is read with; otherwise the
        # output depends on the platform locale and non-ASCII text can raise
        # UnicodeEncodeError.
        output_kwargs = {'encoding': 'utf8'}

    with infile as csvfile:
        reader = csv.DictReader(csvfile, delimiter=';', quotechar='"')
        with open(output, "w", **output_kwargs) as outputfile:
            outputfile.write(",".join(AVANTAGES_HEADERS) + "\n")
            for row in reader:
                cleaned_row = dict((k, clean_text(v)) for k, v in row.items())
                # Fields are joined with "," without any CSV quoting.
                # NOTE(review): presumably clean_text removes characters
                # that would break the format -- confirm.
                columns = (
                    build_origin(cleaned_row),
                    cleaned_row["denomination_sociale"],
                    build_name(cleaned_row),
                    build_address(cleaned_row),
                    build_qualification(cleaned_row),
                    build_rpps(cleaned_row),
                    cleaned_row["avant_montant_ttc"],
                    str2date(cleaned_row["avant_date_signature"]),
                    build_nature(cleaned_row),
                    build_eta(cleaned_row),
                    cleaned_row["benef_codepostal"],
                )
                outputfile.write(",".join(columns) + "\n")
def build_nature(row):
    """Build the "nature" field of an output line.

    Joins ``row["avant_nature"]`` and ``row["avant_convention_lie"]`` with a
    single space and returns the result of ``clean_text`` on that string.

    Args:
        row: Mapping that contains both keys above.

    Raises:
        KeyError: If either key is missing from ``row``.
    """
    keys = ("avant_nature", "avant_convention_lie")
    parts = [row[key] for key in keys]
    return clean_text(" ".join(parts))
def build_programme(row):
    """Build the "programme" field from the convention columns of a row.

    Joins, in this order and separated by single spaces,
    ``conv_manifestation_nom``, ``conv_date_debut``, ``conv_date_fin`` and
    ``conv_manifestation_date``, then returns the result of ``clean_text``
    on that string.

    Args:
        row: Mapping that contains the four keys above.

    Raises:
        KeyError: If any of the four keys is missing from ``row``.
    """
    keys = (
        "conv_manifestation_nom",
        "conv_date_debut",
        "conv_date_fin",
        "conv_manifestation_date",
    )
    parts = [row[key] for key in keys]
    programme = " ".join(parts)
    return clean_text(programme)