Python DictReader.fieldnames 예제들, csv.DictReader.fieldnames Python 예제들

예제 #1

0

파일 보기

파일: data_processor.py 프로젝트: vyacheslav-bezborodov/python

def load_data(uri, dateFormat):
    """Fetch a CSV document from ``uri`` and return its rows as price records.

    The header names are decoded with ``utf-8-sig`` (which drops a leading
    byte-order mark, if any) and re-encoded as UTF-8 before the rows are read.
    The code depends on ``urllib2`` and on byte-string ``decode``, so it is
    written for Python 2.

    :param uri: location handed to ``urlopen``.
    :param dateFormat: ``strptime`` format used to parse the ``Date`` column.
    :return: list of dicts with the keys ``date`` (a ``struct_time``) and
        ``open``, ``close``, ``high``, ``low``, ``volume`` (floats).
    """
    logging.info('loading data; uri: {0}'.format(uri))

    from urllib2 import urlopen
    from csv import DictReader
    from time import strptime

    lines = urlopen(uri).readlines()
    reader = DictReader(lines)

    # Normalise the header so a BOM glued to the first column name is removed.
    reader.fieldnames = [
        name.decode("utf-8-sig").encode("utf-8") for name in reader.fieldnames
    ]

    # (output key, CSV column) pairs, converted to float in this order.
    numeric_columns = (
        ('open', 'Open'),
        ('close', 'Close'),
        ('high', 'High'),
        ('low', 'Low'),
        ('volume', 'Volume'),
    )

    records = []
    for line in reader:
        record = {'date': strptime(line['Date'], dateFormat)}
        for key, column in numeric_columns:
            record[key] = float(line[column])
        records.append(record)

    return records

예제 #2

0

파일 보기

def read_certified_applications(csv_file_path):
    """
    Generator yielding the 'CERTIFIED' application rows of an input CSV file.

    Steps performed:

    1.  The CSV dialect is sniffed from the first 16384 characters of the file, so
        that both comma-separated and semi-colon separated inputs can be read.

    2.  If the header contains 'LCA_CASE_NUMBER' (the previous LCA record layout),
        the field names are replaced with those from get_migrated_fieldnames().

    3.  Only rows whose 'CASE_STATUS' equals 'CERTIFIED' are yielded.

    Keeping the file-format handling here separates it from the analytical code.

    :param csv_file_path: path of the CSV file to read.
    :return: generator of row dictionaries.
    """
    print('Processing input file: {0}'.format(csv_file_path))

    with open(csv_file_path) as source:

        # Detect the dialect from a leading sample, then rewind for the real read
        sample = source.read(16384)
        detected = Sniffer().sniff(sample)
        source.seek(0)

        rows = DictReader(source, dialect=detected)

        # Old LCA layout: swap in the current H1B column names
        if 'LCA_CASE_NUMBER' in rows.fieldnames:
            rows.fieldnames = get_migrated_fieldnames()

        # Pass through certified applications only
        for record in rows:
            if record['CASE_STATUS'] == 'CERTIFIED':
                yield record

예제 #3

0

파일 보기

파일: views.py 프로젝트: thuzarwin/automated-reporting

def upload(request):
    """Build the annual-leave table from an uploaded CSV file and render it.

    The 'school' (list) and 'minimum' (default "0") parameters are read with
    get_variable_with_error(); if either lookup yields a response, that
    response is returned immediately. The uploaded 'datafile' is read as
    ISO-8859-1 CSV with its header names lower-cased and spaces replaced by
    underscores. A row is kept when its 'main_clevel' is one of the requested
    schools, its 'leave_type' is "AL", and the integer part of its actual
    balance (allocated balance minus future bookings) is at least the minimum.
    Any exception while reading is printed to stdout and turned into an error
    response.

    :param request: the incoming request carrying the parameters and the file.
    :return: the rendered 'leave/output.html' response, or an error response.
    """
    # get parameters
    response, schools = get_variable_with_error(request, 'leave', 'school', as_list=True)
    if response is not None:
        return response

    response, minimum_str = get_variable_with_error(request, 'leave', 'minimum', def_value="0")
    if response is not None:
        return response
    minimum = int(minimum_str)

    uploaded = request.FILES['datafile']

    # column order and column captions handed to the template
    order = [
        'school',
        'employee',
        'manager',
        'actual_balance',
        'leave_accrued',
        'future_leave_bookings',
        'current_balance',
        'current_allocated_balance',
    ]
    header = {
        'school': 'Faculty/School',
        'employee': 'Employee',
        'manager': 'Manager',
        'actual_balance': 'Actual balance',
        'leave_accrued': 'Leave accrued',
        'future_leave_bookings': 'Future bookings',
        'current_balance': 'Current balance',
        'current_allocated_balance': 'Current allocated balance',
    }

    result = []
    try:
        with open(uploaded.temporary_file_path(), encoding='ISO-8859-1') as csvfile:
            reader = DictReader(csvfile)
            reader.fieldnames = [name.lower().replace(" ", "_") for name in reader.fieldnames]
            for row in reader:
                school = row['main_clevel']
                # TODO any other types of leave to add/include?
                if school not in schools or row['leave_type'] != "AL":
                    continue
                rrow = {
                    'school': school,
                    'employee': row['employee_name'],
                    'manager': row['manager'],
                    'actual_balance': float(row['current_allocated_balance']) - float(row['future_leave_bookings']),
                    'current_balance': row['current_balance'],
                    'current_allocated_balance': row['current_allocated_balance'],
                    'leave_accrued': row['accrual'],
                    'future_leave_bookings': row['future_leave_bookings'],
                }
                if int(rrow['actual_balance']) >= minimum:
                    result.append(rrow)
    except Exception as ex:
        traceback.print_exc(file=sys.stdout)
        message = 'Failed to read uploaded CSV file: ' + str(ex)
        return create_error_response(request, 'leave', message)

    # sort
    result = sorted(result, key=actual_balance_key, reverse=True)

    # configure template
    context = applist.template_context('leave')
    context['table'] = result
    context['header'] = header
    context['order'] = order
    template = loader.get_template('leave/output.html')
    return HttpResponse(template.render(context, request))

예제 #4

0

파일 보기

파일: flowlogs_reader.py 프로젝트: mdsol/flowlogs-reader

 def _read_file(self, key):
     """Yield the rows of the object stored under ``key`` as dictionaries.

     The object is fetched from ``self.bucket`` through ``self.boto_client``,
     its body is opened in text mode with ``gz_open``, and it is parsed as
     space-delimited records. Hyphens in the header names are replaced with
     underscores before any row is yielded.
     """
     response = self.boto_client.get_object(Bucket=self.bucket, Key=key)
     body = response['Body']
     with gz_open(body, mode='rt') as text_stream:
         rows = DictReader(text_stream, delimiter=' ')
         rows.fieldnames = [name.replace('-', '_') for name in rows.fieldnames]
         yield from rows

예제 #5

0

파일 보기

 def _read_file(self, key):
     """Yield the rows of the object stored under ``key`` and record byte counts.

     The object is fetched from ``self.bucket`` through ``self.boto_client``,
     its body is opened in text mode with ``gz_open``, and it is parsed as
     space-delimited records whose header names have hyphens replaced with
     underscores. After the last row has been yielded, the stream position
     and the response's ``ContentLength`` are added to ``self.bytes_processed``
     and ``self.compressed_bytes_processed`` while holding ``THREAD_LOCK``.
     """
     response = self.boto_client.get_object(Bucket=self.bucket, Key=key)
     body = response['Body']
     with gz_open(body, mode='rt') as text_stream:
         rows = DictReader(text_stream, delimiter=' ')
         rows.fieldnames = [name.replace('-', '_') for name in rows.fieldnames]
         yield from rows
         # Only reached once the consumer has exhausted every row.
         with THREAD_LOCK:
             self.bytes_processed += text_stream.tell()
             self.compressed_bytes_processed += response['ContentLength']

예제 #6

0

파일 보기

def csv2ics(filename, tz=None):
    """Convert the rows of a CSV file into calendar events.

    ``print_field`` is called with BEGIN/VCALENDAR before and END/VCALENDAR
    after the events. The CSV dialect is sniffed from the whole file content,
    every header name is passed through ``transform_fieldname``, and only rows
    accepted by ``row_nonblank`` are handed to ``write_events``.

    :param filename: path of the CSV file to read.
    :param tz: passed through unchanged to ``write_events``.
    """
    print_field("BEGIN", "VCALENDAR")

    with open(filename, "rb") as source:
        # Sniff on the complete content, then rewind for the actual parse.
        content = source.read()
        sniffed = Sniffer().sniff(content)
        source.seek(0)

        reader = DictReader(source, dialect=sniffed)
        reader.fieldnames = list(map(transform_fieldname, reader.fieldnames))

        events = []
        for row in reader:
            if row_nonblank(row):
                events.append(row)
        write_events(events, tz)

    print_field("END", "VCALENDAR")

예제 #7

0

파일 보기

파일: parsingfasta.py 프로젝트: CCOM-4027/Genomics

def csvInput(file,options,dialect='excel'):
    """Read a CSV file into a list of row dicts tagged with their source.

    Runs on both Python 2 and Python 3: the original relied on tuple-parameter
    lambda syntax and on ``map`` being eager, neither of which holds on
    Python 3.

    :param file: path of the CSV file to read.
    :param options: mapping with two entries. ``'header'`` is a
        comma-separated string of column names, or a falsy value to take the
        names from the file's first row. ``'alias'`` is a callable applied to
        every column name; ``None`` leaves the names unchanged, as
        ``map(None, ...)`` did on Python 2.
    :param dialect: csv dialect passed to ``DictReader``.
    :return: list of row dicts, each extended with ``"file"`` (the path) and
        ``"format"`` (the result of ``fileType(file)``).
    """
    from csv import DictReader

    header = options['header']
    with open(file, 'r') as f:
        if header:
            reader = DictReader(f, dialect=dialect, fieldnames=header.split(','))
        else:
            reader = DictReader(f, dialect=dialect)

        alias = options['alias']
        if alias is None:
            reader.fieldnames = list(reader.fieldnames)
        else:
            # Must be a real list: DictReader calls len() on fieldnames.
            reader.fieldnames = [alias(name) for name in reader.fieldnames]

        entries = list(reader)

    # Explicit loop: a bare map() would never run its side effects on Python 3.
    for entry in entries:
        entry.update({"file": file, "format": fileType(file)})
    return entries

예제 #8

0

파일 보기

def startup():
    """Print the API help text and assemble the combined product list.

    When ``products.csv`` is present in the current working directory, the
    JSON products are fetched from the AWS URL and standardised with
    ``parse_json``; the CSV products are then read, standardised with
    ``parse_csv`` and appended.

    If the fetched payload cannot be decoded as JSON, a warning is logged and
    only the CSV products are returned. Previously this case left
    ``product_list`` unbound and crashed with ``NameError``.

    :return: the list of products, or ``None`` (after logging a warning) when
        ``products.csv`` is not in the current working directory.
    """
    help_string = """
        The API is available at:
        http://localhost:5000/api/products/

        Example use:

        A GET request to http://localhost:5000/api/products/1234 would return
        the details of the product with id = 1234 (if it exists) in JSON format
        """
    print(help_string)

    if "products.csv" not in os.listdir(os.getcwd()):
        logging.warning("Please ensure the products.csv file is in the same directory as the app!")
        return None

    # Field names shared by the JSON products and the CSV rows
    expected_fields = ["id", "name", "brand", "retailer", "price", "in_stock"]

    # Fetch json products from aws
    aws_url = "https://s3-eu-west-1.amazonaws.com/pricesearcher-code-tests/python-software-developer/products.json"
    response = requests.get(aws_url)
    try:
        # Read the fetched data as json and call parse function
        # to standardise the data into the form we require
        product_list = parse_json(response.json())
    except decoder.JSONDecodeError:
        logging.warning("Failed to retrieve json products from AWS, could not decode data into JSON")
        # Continue with the CSV products only instead of failing on an
        # unbound name further down.
        product_list = []
    else:
        # Check the json products keys (kept in first-seen order for the log)
        keys = []
        for d in product_list:
            for key in d:
                if key not in keys:
                    keys.append(key)
        if set(keys) != set(expected_fields):
            logging.warning("Json products keys differ from required")
            logging.warning("Json keys: {}".format(list(keys)))

    # Use DictReader from csv module to turn the csv data into a python dictionary
    with open("products.csv") as csvfile:
        dr = DictReader(csvfile, delimiter=",")
        # Reassign the field names to match the json data
        dr.fieldnames = list(expected_fields)
        # Parse the data to fit our expected scheme and add it to the list of products
        product_list.extend(parse_csv(list(dr)))
    return product_list

예제 #9

0

파일 보기