def test():
    """Check the computed IRPP tables against the original reference tables.

    For every table returned by ``build_irpp_tables``, each (year, variable)
    cell with ``2008 <= year <= 2011`` whose variable is not excluded is
    compared with the matching cell of ``build_original_irpp_tables``.
    The computed value is divided by 1e9 before the comparison (presumably a
    unit conversion to match the reference tables -- TODO confirm).

    Cells missing from the reference tables are reported on stdout and
    skipped.  Every cell whose relative difference exceeds 1e-3 is collected,
    and the test fails with the full list of mismatches.

    Raises:
        AssertionError: if at least one compared cell is out of tolerance.
    """
    # Bound locally and reused below: the original read ``fill_value`` in the
    # loop without ever defining it in this scope.
    fill_value = 0
    relative_tolerance = 1e-3

    data_frame_by_irpp_table_name = build_irpp_tables(years = range(2009, 2013), fill_value = fill_value)
    original_data_frame_by_irpp_table_name = build_original_irpp_tables()
    excluded_variables = {
        'salaires_imposables',
        'heures_supplementaires',
        'frais_reels',
        'pensions_alimentaires_percues',
        'plus_values_mobilieres_stock_options',
        'plus_values_mobilieres',
        'plus_values_professionnelles',
        }
    messages = list()
    # ``items()`` and the single-argument ``print(...)`` below behave the same
    # on Python 2 and Python 3.
    for irpp_table_name, data_frame in data_frame_by_irpp_table_name.items():
        # Loop-invariant work: fill missing values once per table and filter
        # the columns once instead of once per cell.
        filled_data_frame = data_frame.fillna(value = fill_value)
        checked_variables = [
            variable for variable in data_frame.columns
            if variable not in excluded_variables
            ]
        for year in data_frame.index:
            if not (2008 <= year <= 2011):
                continue
            for variable in checked_variables:
                try:
                    target = (
                        original_data_frame_by_irpp_table_name[irpp_table_name].loc[year, variable]
                        )
                except KeyError:
                    print('{} not found for {} in table {}'.format(variable, year, irpp_table_name))
                    continue
                actual = filled_data_frame.loc[year, variable] / 1e9
                # Multiplicative form of the relative-error check: no division
                # by a zero target, and a NaN on either side still counts as
                # a mismatch because the comparison is then False.
                if not abs(target - actual) <= relative_tolerance * abs(target):
                    messages.append(error_msg(irpp_table_name, variable, year, target, actual))
    assert not messages, "\nThere are {} errors.".format(len(messages)) + "\n".join(messages)
def test():
    """Check the computed IRPP tables against the original reference tables.

    For every table returned by ``build_irpp_tables``, each (year, variable)
    cell with ``2008 <= year <= 2011`` whose variable is not excluded is
    compared with the matching cell of ``build_original_irpp_tables``.
    The computed value is divided by 1e9 before the comparison (presumably a
    unit conversion to match the reference tables -- TODO confirm).

    Cells missing from the reference tables are reported on stdout and
    skipped.  Every cell whose relative difference exceeds 1e-3 is collected,
    and the test fails with the full list of mismatches.

    Raises:
        AssertionError: if at least one compared cell is out of tolerance.
    """
    # Bound locally and reused below: the original read ``fill_value`` in the
    # loop without ever defining it in this scope.
    fill_value = 0
    relative_tolerance = 1e-3

    data_frame_by_irpp_table_name = build_irpp_tables(
        years=range(2009, 2013), fill_value=fill_value)
    original_data_frame_by_irpp_table_name = build_original_irpp_tables()
    excluded_variables = {
        'salaires_imposables',
        'heures_supplementaires',
        'frais_reels',
        'pensions_alimentaires_percues',
        'plus_values_mobilieres_stock_options',
        'plus_values_mobilieres',
        'plus_values_professionnelles',
    }
    messages = list()
    # ``items()`` and the single-argument ``print(...)`` below behave the same
    # on Python 2 and Python 3.
    for irpp_table_name, data_frame in data_frame_by_irpp_table_name.items():
        # Loop-invariant work: fill missing values once per table and filter
        # the columns once instead of once per cell.
        filled_data_frame = data_frame.fillna(value=fill_value)
        checked_variables = [
            variable for variable in data_frame.columns
            if variable not in excluded_variables
        ]
        for year in data_frame.index:
            if not (2008 <= year <= 2011):
                continue
            for variable in checked_variables:
                try:
                    target = (
                        original_data_frame_by_irpp_table_name[irpp_table_name]
                        .loc[year, variable])
                except KeyError:
                    print('{} not found for {} in table {}'.format(
                        variable, year, irpp_table_name))
                    continue
                actual = filled_data_frame.loc[year, variable] / 1e9
                # Multiplicative form of the relative-error check: no division
                # by a zero target, and a NaN on either side still counts as
                # a mismatch because the comparison is then False.
                if not abs(target - actual) <= relative_tolerance * abs(target):
                    messages.append(
                        error_msg(irpp_table_name, variable, year, target,
                                  actual))
    assert not messages, "\nThere are {} errors.".format(
        len(messages)) + "\n".join(messages)
# u'txabt_micro', # u'txabt_micro_service', # u'txabt_microbnc' } ) irpp_4 = pandas.read_excel(file_path, sheetname, index_col=0, skiprows=108, header=0, parse_cols="A:O").iloc[1:20] irpp_4.rename(columns=slugified_name_by_long_name, inplace=True) irpp_4.index.name = "year" original_data_frame_by_irpp_table_name = dict(irpp_1=irpp_1, irpp_2=irpp_2, irpp_3=irpp_3, irpp_4=irpp_4) return original_data_frame_by_irpp_table_name data_frame_by_irpp_table_name = build_irpp_tables(years=range(2008, 2013), fill_value=0) original_data_frame_by_irpp_table_name = build_original_irpp_tables() excluded_variables = ["plus_values_mobilieres_stock_options", "plus_values_mobilieres"] messages = list() for irpp_table_name, data_frame in data_frame_by_irpp_table_name.iteritems(): for year in data_frame.index: for variable in data_frame.columns: if (year >= 2014) or year <= 2008: continue if variable in excluded_variables: continue try: target = (
header = 0, parse_cols = 'A:O').iloc[1:20] irpp_4.rename(columns = slugified_name_by_long_name, inplace = True) irpp_4.index.name = 'year' original_data_frame_by_irpp_table_name = dict( irpp_1 = irpp_1, irpp_2 = irpp_2, irpp_3 = irpp_3, irpp_4 = irpp_4, ) return original_data_frame_by_irpp_table_name data_frame_by_irpp_table_name = build_irpp_tables(years = range(2008, 2013), fill_value = 0) original_data_frame_by_irpp_table_name = build_original_irpp_tables() excluded_variables = ['plus_values_mobilieres_stock_options', 'plus_values_mobilieres'] messages = list() for irpp_table_name, data_frame in data_frame_by_irpp_table_name.iteritems(): for year in data_frame.index: for variable in data_frame.columns: if (year >= 2014) or year <= 2008: continue if variable in excluded_variables: continue try: target = (