Пример #1
0
 def node2SparkRows(node: GeounitNode):
     """Turn a single geounit node into histogram rows.

     The node is exported with ``toDict`` restricted to the ``SYN``,
     ``INVAR`` and ``GEOCODE`` entries, and that dictionary is handed to
     ``makeHistRowsFromMultiSparse`` together with ``schema``, the
     enclosing object's ``row_recoder`` and ``inverted_geodict`` (all three
     are captured from the enclosing scope).

     Returns whatever ``makeHistRowsFromMultiSparse`` produces --
     presumably one record per person; verify against that helper.
     """
     return makeHistRowsFromMultiSparse(
         node.toDict((SYN, INVAR, GEOCODE)),
         schema,
         row_recoder=self.row_recoder,
         geocode_dict=inverted_geodict,
     )
Пример #2
0
 def node2SparkRows(node: GeounitNode):
     """Turn a single geounit node into unit-level rows.

     Works in two steps on the node's ``toDict`` export (limited to the
     ``SYN``, ``INVAR`` and ``GEOCODE`` entries):

     1. ``makeHistRowsFromMultiSparse`` builds the household rows.
     2. ``addEmptyAndGQ`` receives those rows plus the same export and
        returns the final result, using ``HHGQUnitDemoProductAttr.das2mdf``
        as the group-quarters type recoder and ``inverted_geodict`` as the
        geocode dictionary.

     ``schema``, ``self`` and ``inverted_geodict`` are captured from the
     enclosing scope.
     """
     exported = node.toDict((SYN, INVAR, GEOCODE))
     household_rows = makeHistRowsFromMultiSparse(
         exported,
         schema,
         row_recoder=self.row_recoder,
     )
     # Note: only this second call is given the geocode dictionary.
     return addEmptyAndGQ(
         exported,
         schema,
         household_rows,
         row_recoder=self.row_recoder,
         gqtype_recoder=HHGQUnitDemoProductAttr.das2mdf,
         geocode_dict=inverted_geodict,
     )
Пример #3
0
 def node2SparkRows(node: GeounitNode):
     """Turn a single geounit node into a list of Spark ``Row`` objects.

     Steps, all operating on the node's ``toDict`` export (limited to the
     ``SYN``, ``INVAR`` and ``GEOCODE`` entries):

     1. ``makeHistRowsFromMultiSparse`` builds the household rows
        (called with ``microdata_field=None``).
     2. ``addGroupQuarters`` combines them with the export
        (called with ``to_microdata=False``) to give the units.
     3. Each unit is indexed by column name and packed into a ``Row``
        whose fields are ``self.var_list`` followed by ``'priv'``.

     ``schema``, ``self`` and ``inverted_geodict`` are captured from the
     enclosing scope.

     Returns:
         A list with one ``Row`` per unit, fields in ``ordered_cols`` order.
     """
     nodedict = node.toDict((SYN, INVAR, GEOCODE))
     households = makeHistRowsFromMultiSparse(
         nodedict,
         schema,
         row_recoder=self.row_recoder,
         geocode_dict=inverted_geodict,
         microdata_field=None)
     units = addGroupQuarters(nodedict,
                              schema,
                              households,
                              row_recoder=self.row_recoder,
                              geocode_dict=inverted_geodict,
                              to_microdata=False)
     # 'priv' stands for "protected via the differential privacy routines in
     # this code base"; the variable is to be renamed after the P.L. 94-171
     # production.
     ordered_cols = self.var_list + ['priv']
     # The Row factory depends only on the column names, so build it once
     # instead of re-creating it for every unit.
     make_row = Row(*ordered_cols)
     return [
         make_row(*[unit[col] for col in ordered_cols])
         for unit in units
     ]