Python rdcsv_filter Examples

Programming Language: Python

Namespace/Package Name: rdcsv_filter

Method/Function: rdcsv_filter

Examples at hotexamples.com: 2

Python rdcsv_filter - 2 examples found. These are the top-rated real-world Python examples of rdcsv_filter.rdcsv_filter extracted from open-source projects. You can rate examples to help us improve the quality of examples.

Example #1

Show file

File: list_found_doctors.py Project: trender-python/scraper-script

    def find(self):
        """Look up known doctors on each workplace website and write the results.

        For every row yielded by ``self.hitta_eniro_vardcentraler_reader``:

        1. Fetch the ``FULL_NAME`` values for the row's ``SEARCH_NAME`` via
           ``rdcsv_filter.filter_get_col``. Rows with no names are skipped
           entirely and are not written to the summary output.
        2. If the row has a non-blank ``WEBSITE``, prefix it with ``http://``
           when it does not already start with ``http`` and pass it, with the
           names, to ``find_doctor.find``.
        3. Write every match through ``csv_doctor.write_row_h`` and fold it
           into the row: ``FOUND_DOCTOR_TAG`` (first one seen),
           ``FOUND_DOCTORS`` / ``MISSING_DOCTORS`` and ``FOUND_DOCTORS_URL``
           (all '|'-separated), and ``DATE`` (``YYYYMMDD`` of the update).
        4. Write the (possibly enriched) row through
           ``csv_list_found_doctors.write_row_h``.

        The rows are mutated in place; nothing is returned.
        """
        def append_piped(row, key, value):
            """Store *value* in row[key], appending with '|' if the key exists."""
            if key in row:
                row[key] = "%s|%s" % (row[key], value)
            else:
                row[key] = value

        def today_stamp():
            """Return today's date as a YYYYMMDD string."""
            return datetime.datetime.today().strftime('%Y%m%d')

        for row_h in self.hitta_eniro_vardcentraler_reader:
            m_rdcsv_filter = rdcsv_filter()
            names = m_rdcsv_filter.filter_get_col(row_h['SEARCH_NAME'], 'FULL_NAME')
            # Nothing to search for: move on to the next row (the original
            # comment refers to names missing "in 1177"). The row is NOT
            # written to the summary output in this case.
            if len(names) == 0:
                continue

            # Raw string: '\s' in a plain literal is an invalid escape sequence.
            if not re.search(r'^\s*$', row_h['WEBSITE']):
                if not row_h['WEBSITE'].startswith('http'):
                    row_h['WEBSITE'] = "http://" + row_h['WEBSITE']

                m_find_doctor = find_doctor()
                for match in m_find_doctor.find(row_h['WEBSITE'], names):
                    match['SEARCH_PARENT_WORKPLACE_NAME'] = row_h['SEARCH_NAME']
                    match['FOUND_PARENT_WORKPLACE_NAME'] = row_h.get('FOUND_NAME')
                    csv_doctor.write_row_h(match)

                    # Keep only the first tag reported for this row.
                    if 'FOUND_DOCTOR_TAG' not in row_h and 'FOUND_DOCTOR_TAG' in match:
                        row_h['FOUND_DOCTOR_TAG'] = match['FOUND_DOCTOR_TAG']

                    # A searched name counts as found only when the match also
                    # carries FOUND_DOCTOR_NAME; otherwise it is listed as missing.
                    if 'SEARCH_DOCTOR_NAME' in match:
                        if 'FOUND_DOCTOR_NAME' in match:
                            target = 'FOUND_DOCTORS'
                        else:
                            target = 'MISSING_DOCTORS'
                        append_piped(row_h, target, match['SEARCH_DOCTOR_NAME'])
                        row_h['DATE'] = today_stamp()

                    if 'URL' in match:
                        # Compare against whole recorded URLs, not substrings of
                        # the joined string: otherwise a URL that is a prefix of
                        # an already recorded one would be dropped.
                        if 'FOUND_DOCTORS_URL' not in row_h:
                            row_h['FOUND_DOCTORS_URL'] = match['URL']
                        elif match['URL'] not in row_h['FOUND_DOCTORS_URL'].split('|'):
                            append_piped(row_h, 'FOUND_DOCTORS_URL', match['URL'])
                        row_h['DATE'] = today_stamp()

            csv_list_found_doctors.write_row_h(row_h)

Example #2

Show file

File: list_found_doctors.py Project: crazypythonmaster/pythonscript-scrapy

        'MISSING_DOCTORS',
    ]
    # Output for the per-workplace summary rows, written to
    # <directory>/found_doctors_result.csv with the heading list built just above.
    m_csv_list_found_doctors = csv_list_found_doctors(fname = directory + '/found_doctors_result.csv', heading = heading_found_doctors)

    # Column names for the per-doctor output file.
    heading_doctors=[
      'HOME_URL',
      'URL',
      'SEARCH_PARENT_WORKPLACE_NAME',
      'FOUND_PARENT_WORKPLACE_NAME',
      'SEARCH_DOCTOR_NAME',
      'FOUND_DOCTOR_NAME',
      'MATCH?',
    ]
    # Output for the individual doctor matches, written to <directory>/doctors_result.csv.
    m_csv_doctor = csv_doctor(fname = directory + '/doctors_result.csv', heading = heading_doctors)

    # Load the reference records CSV and parse it on the PARENT_WORKPLACE_NAME column.
    # NOTE(review): presumably parse() indexes the records by that column so that later
    # no-argument rdcsv_filter() instances can query them -- confirm in rdcsv_filter.
    m_rdcsv_filter = rdcsv_filter(directory + '/ALL_RECORDS_MATCH_73_273_TO_273_373_SPLIT_ADDRESS.csv')
    m_rdcsv_filter.parse('PARENT_WORKPLACE_NAME')

    # Run the search over all workplace rows.
    m_list_found_doctors = list_found_doctors()
    m_list_found_doctors.find()