def process_csv(filepath, output):
    """Convert a semicolon-delimited CSV file into a comma-separated file.

    The input is parsed with ``csv.DictReader`` (``;`` delimiter, ``"`` quote
    character).  The output starts with the ``AVANTAGES_HEADERS`` line and
    then holds one line per input row, assembled from the row after every
    value has been passed through ``clean_text``.

    Args:
        filepath: Path of the CSV file to read (decoded as UTF-8 on Python 3).
        output: Path of the file to write; it is opened in ``"w"`` mode, so
            an existing file is truncated.
    """
    if sys.version_info[0] < 3:
        # Python 2: the csv module expects a binary-mode file, and the
        # builtin open() accepts no encoding argument.
        infile = open(filepath, 'rb')
        output_options = {}
    else:
        infile = open(filepath, 'r', newline='', encoding='utf8')
        # Write UTF-8 explicitly instead of relying on the locale default:
        # the input is decoded as UTF-8, so a narrower default encoding could
        # fail on (or silently re-encode) non-ASCII characters.
        output_options = {'encoding': 'utf8'}

    with infile as csvfile:
        reader = csv.DictReader(csvfile, delimiter=';', quotechar='"')

        with open(output, "w", **output_options) as outputfile:
            outputfile.write(",".join(AVANTAGES_HEADERS) + "\n")

            for row in reader:
                cleaned_row = dict((k, clean_text(v)) for k, v in row.items())
                # NOTE(review): fields are joined with bare commas and never
                # quoted; presumably clean_text() removes commas and quotes
                # from the values -- confirm against its implementation.
                fields = (
                    build_origin(cleaned_row),
                    cleaned_row["denomination_sociale"],
                    build_name(cleaned_row),
                    build_address(cleaned_row),
                    build_qualification(cleaned_row),
                    build_rpps(cleaned_row),
                    cleaned_row["avant_montant_ttc"],
                    str2date(cleaned_row["avant_date_signature"]),
                    build_nature(cleaned_row),
                    build_eta(cleaned_row),
                    cleaned_row["benef_codepostal"],
                )
                outputfile.write(",".join(fields) + "\n")
Пример #2
0
def process_csv(filepath, output):
    """Convert a semicolon-delimited CSV file into a comma-separated file.

    The input is parsed with ``csv.DictReader`` (``;`` delimiter, ``"`` quote
    character).  The output starts with the ``AVANTAGES_HEADERS`` line and
    then holds one line per input row, assembled from the row after every
    value has been passed through ``clean_text``.

    Args:
        filepath: Path of the CSV file to read (decoded as UTF-8 on Python 3).
        output: Path of the file to write; it is opened in ``"w"`` mode, so
            an existing file is truncated.
    """
    if sys.version_info[0] < 3:
        # Python 2: the csv module expects a binary-mode file, and the
        # builtin open() accepts no encoding argument.
        infile = open(filepath, 'rb')
        output_options = {}
    else:
        infile = open(filepath, 'r', newline='', encoding='utf8')
        # Write UTF-8 explicitly instead of relying on the locale default:
        # the input is decoded as UTF-8, so a narrower default encoding could
        # fail on (or silently re-encode) non-ASCII characters.
        output_options = {'encoding': 'utf8'}

    with infile as csvfile:
        reader = csv.DictReader(csvfile, delimiter=';', quotechar='"')

        with open(output, "w", **output_options) as outputfile:
            outputfile.write(",".join(AVANTAGES_HEADERS) + "\n")

            for row in reader:
                cleaned_row = dict((k, clean_text(v)) for k, v in row.items())
                # NOTE(review): fields are joined with bare commas and never
                # quoted; presumably clean_text() removes commas and quotes
                # from the values -- confirm against its implementation.
                fields = (
                    build_origin(cleaned_row),
                    cleaned_row["denomination_sociale"],
                    build_name(cleaned_row),
                    build_address(cleaned_row),
                    build_qualification(cleaned_row),
                    build_rpps(cleaned_row),
                    cleaned_row["avant_montant_ttc"],
                    str2date(cleaned_row["avant_date_signature"]),
                    build_nature(cleaned_row),
                    build_eta(cleaned_row),
                    cleaned_row["benef_codepostal"],
                )
                outputfile.write(",".join(fields) + "\n")
def build_nature(row):
    """Return the "nature" text for a row.

    Joins the ``avant_nature`` and ``avant_convention_lie`` values with a
    single space and passes the result through ``clean_text``.
    """
    parts = [row["avant_nature"], row["avant_convention_lie"]]
    return clean_text(" ".join(parts))
def build_programme(row):
    """Return the "programme" text for a row.

    Joins the ``conv_manifestation_nom``, ``conv_date_debut``,
    ``conv_date_fin`` and ``conv_manifestation_date`` values (in that order)
    with single spaces and passes the result through ``clean_text``.
    """
    columns = ("conv_manifestation_nom", "conv_date_debut",
               "conv_date_fin", "conv_manifestation_date")
    programme = " ".join([row[column] for column in columns])
    return clean_text(programme)
Пример #5
0
def build_nature(row):
    """Return the "nature" text for a row.

    Joins the ``avant_nature`` and ``avant_convention_lie`` values with a
    single space and passes the result through ``clean_text``.
    """
    parts = [row["avant_nature"], row["avant_convention_lie"]]
    return clean_text(" ".join(parts))
Пример #6
0
def build_programme(row):
    """Return the "programme" text for a row.

    Joins the ``conv_manifestation_nom``, ``conv_date_debut``,
    ``conv_date_fin`` and ``conv_manifestation_date`` values (in that order)
    with single spaces and passes the result through ``clean_text``.
    """
    columns = ("conv_manifestation_nom", "conv_date_debut",
               "conv_date_fin", "conv_manifestation_date")
    programme = " ".join([row[column] for column in columns])
    return clean_text(programme)