def getFormatData(self, filename):
    '''Get the data format directly from the data file (in case we do not have an info file).

    The answer is cached in ``self.info['format']``; if that key is already
    present it is returned without touching the file.

    Args:
        filename: passed unchanged to ``data_converter.read_first_line`` or
            ``data_converter.file_to_array``.

    Returns:
        One of ``'dense'``, ``'sparse'`` or ``'sparse_binary'`` (or whatever
        value was already stored under ``self.info['format']``).

    Side effects:
        Sets ``self.info['format']``. When ``is_sparse`` was not known
        beforehand it is also recorded: 0 for dense, 1 for both sparse flavours.

    NOTE(review): the file is assumed to contain at least one non-empty row;
    an empty result from the readers raises IndexError here -- confirm that
    callers never pass an empty file.
    '''
    if 'format' in self.info:
        return self.info['format']

    if 'is_sparse' in self.info:
        if self.info['is_sparse'] == 0:
            self.info['format'] = 'dense'
        else:
            # Known sparse: a ':' in the first token of the first line
            # separates 'sparse' from 'sparse_binary'.
            first_line = data_converter.read_first_line(filename)
            if ':' in first_line[0]:
                self.info['format'] = 'sparse'
            else:
                self.info['format'] = 'sparse_binary'
        return self.info['format']

    # Nothing known about sparsity: inspect the whole file.
    data = data_converter.file_to_array(filename)
    if ':' in data[0][0]:
        self.info['is_sparse'] = 1
        self.info['format'] = 'sparse'
        return self.info['format']

    # No ':' in the first token: rows of unequal length are treated as
    # sparse_binary, equal-length rows as dense.
    nbr_columns = len(data[0])
    if any(len(row) != nbr_columns for row in data):
        self.info['format'] = 'sparse_binary'
        # Previously left unset on this path, unlike the 'sparse' and
        # 'dense' outcomes; record it so later lookups do not KeyError.
        self.info['is_sparse'] = 1
    else:
        self.info['format'] = 'dense'
        self.info['is_sparse'] = 0
    return self.info['format']
Example #2
0
	def getFormatData(self,filename):
		''' Get the data format directly from the data file (in case we do not have an info file).

		If self.info already holds a 'format' entry it is returned as is.
		Otherwise the format is worked out, stored in self.info['format']
		and returned:
		  - 'is_sparse' known and equal to 0 -> 'dense' (the file is not read)
		  - 'is_sparse' known and non-zero   -> 'sparse' when the first token of
		    the first line contains ':', otherwise 'sparse_binary'
		  - 'is_sparse' unknown              -> the whole file is loaded; a ':' in
		    the first token means 'sparse', rows of differing length mean
		    'sparse_binary', anything else is 'dense'. In this case
		    self.info['is_sparse'] is filled in as well (1 for both sparse
		    formats, 0 for dense).

		filename is handed unchanged to the data_converter reading helpers.

		NOTE(review): an empty file makes the data[0] lookups raise
		IndexError -- presumably callers guarantee non-empty input; confirm.
		'''
		if 'format' not in self.info:
			if 'is_sparse' in self.info:
				if self.info['is_sparse'] == 0:
					self.info['format'] = 'dense'
				else:
					head = data_converter.read_first_line (filename)
					self.info['format'] = 'sparse' if ':' in head[0] else 'sparse_binary'
			else:
				rows = data_converter.file_to_array (filename)
				if ':' in rows[0][0]:
					self.info['is_sparse'] = 1
					self.info['format'] = 'sparse'
				else:
					width = len(rows[0])
					# any() stops at the first row whose length differs.
					ragged = any(len(r) != width for r in rows)
					self.info['format'] = 'sparse_binary' if ragged else 'dense'
					# The sparse_binary outcome used to leave 'is_sparse' unset,
					# unlike every other outcome of this branch.
					self.info['is_sparse'] = 1 if ragged else 0
		return self.info['format']