def get_names(self):
    """Downloads and parses the crinacle.com phone books to get names

    Two phone books are fetched in order: the headphone book, whose entries
    are added with form 'onear', and the IEM book, whose entries are added
    with form 'inear'. Each downloaded JSON document is passed through
    `self.parse_book` and the result is iterated as false name -> true name
    pairs.

    Returns:
        NameIndex

    Raises:
        requests.RequestException: If a download fails, times out or the
            server answers with an HTTP error status
    """
    books = (
        ('https://crinacle.com/graphing/data_hp/phone_book.json', 'onear'),  # Headphone book
        ('https://crinacle.com/graphing/data/phone_book.json', 'inear'),  # IEM book
    )
    names = NameIndex()
    for url, form in books:
        # Without a timeout requests waits forever on an unresponsive server
        res = requests.get(url, timeout=30)
        # Fail on HTTP errors here instead of trying to decode an error page as JSON
        res.raise_for_status()
        for false_name, true_name in self.parse_book(res.json()).items():
            names.add(NameItem(false_name, true_name, form))
    return names
def _read_name_groups(file_path):
    """Reads a tab separated name groups file into a {false name: true name} dict"""
    with open(file_path, 'r', encoding='utf-8') as fh:
        lines = fh.read().strip().split('\n')
    name_map = {}
    for line in lines:
        # First column is always the true name, the remaining columns are its false names.
        # Lines with a single column produce no entries.
        true_name, *false_names = line.split('\t')
        for false_name in false_names:
            name_map[false_name] = true_name
    return name_map


def _form_from_path(path):
    """Finds the innermost 'onear', 'inear' or 'earbud' component of a path

    Raises:
        ValueError: If no component of the path is one of the known forms
    """
    head = path
    while True:
        parent, tail = os.path.split(head)
        if tail in ('onear', 'inear', 'earbud'):
            return tail
        if parent == head:
            # os.path.split() stops making progress at the root (or at an empty path).
            # Bail out instead of looping forever.
            raise ValueError(f'Could not determine headphone form from path "{path}"')
        head = parent


def rename_groups(databases=DBS):
    """Renames headphones in name indexes and data files according to name_groups.tsv

    Reads `name_groups.tsv` from DIR_PATH, where the first column of each line is
    the true name and the other columns are false names to be replaced with it.
    For every database the name index (`name_index.tsv`, or a new empty NameIndex
    if the file doesn't exist) and all CSV files under the `data` directory are
    loaded. Then for each false name -> true name pair:

    - Name index items whose true name is the false name are updated to the new
      true name, or have their form set to 'ignore' if the new name is 'ignore'.
    - Data files named after the false name (case insensitive) are moved to a
      path where every occurrence of the old name is replaced with the new name,
      or their directory is deleted if the new name is 'ignore'.
    - A new name index item is added when no item covered the renamed file.

    Finally every name index is written back to its `name_index.tsv`.

    Args:
        databases: Iterable of database directory names, relative to DIR_PATH

    Returns:
        None

    Raises:
        ValueError: If a form cannot be determined from the path of a moved file
        OSError: If a file operation fails, e.g. the old directory of a moved file
            is not empty
    """
    name_map = _read_name_groups(os.path.join(DIR_PATH, 'name_groups.tsv'))

    # Read name indexes and existing files for all supported measurement databases
    dbs = []
    for db in databases:
        index_path = os.path.join(DIR_PATH, db, 'name_index.tsv')
        if os.path.isfile(index_path):
            # Read name index
            name_index = NameIndex.read_tsv(index_path)
        else:
            # No name index, create one anew
            name_index = NameIndex()
        # Read all the existing files for the database
        csv_paths = glob(os.path.join(DIR_PATH, db, 'data', '**', '*.csv'), recursive=True)
        files = [
            # splitext strips only the extension, unlike replacing every '.csv' in the name
            {'name': os.path.splitext(os.path.basename(csv_path))[0], 'path': csv_path}
            for csv_path in csv_paths
        ]
        # Save both to dbs
        dbs.append({'name': db, 'name_index': name_index, 'files': files})

    for old_name, new_name in name_map.items():
        print(f'"{old_name}" -> "{new_name}"')
        ignore = new_name == 'ignore'
        old_name_lower = old_name.lower()

        for db in dbs:
            name_index = db['name_index']

            # Replace true names in name index with the new name
            updated_item = False
            for item in name_index.find(true_name=old_name).items:
                if ignore:
                    # Ignored items keep their true name, only the form is changed
                    name_index.update(
                        NameItem(false_name=item.false_name, true_name=item.true_name, form='ignore'),
                        true_name=old_name)
                    print(f' Updated item: "{item.false_name}", "{new_name}", "ignore"')
                else:
                    name_index.update(
                        NameItem(false_name=item.false_name, true_name=new_name, form=item.form),
                        true_name=old_name)
                    print(f' Updated item: "{item.false_name}", "{new_name}", "{item.form}"')
                updated_item = True

            # Rename existing files
            matching_files = [
                (f['name'], f['path']) for f in db['files'] if f['name'].lower() == old_name_lower
            ]
            for name, path in matching_files:
                old_dir = os.path.dirname(path)

                if ignore:
                    print(f' Removing "{old_dir}"')
                    shutil.rmtree(old_dir)
                    if not updated_item:
                        name_index.add(NameItem(false_name=old_name, true_name=None, form='ignore'))
                        print(f' Added item: "{old_name}", "", "ignore"')
                    continue

                # Literal replacement: the new name must not be interpreted as a regex
                # replacement template (backslashes, group references)
                new_path = path.replace(name, new_name)
                print(
                    f' Moving "{os.path.relpath(path, DIR_PATH)}" to "{os.path.relpath(new_path, DIR_PATH)}"'
                )
                os.makedirs(os.path.dirname(new_path), exist_ok=True)
                shutil.move(path, new_path)
                # Remove the old directory. dirname is used rather than joining os.pardir
                # onto the old file path, which would go through the file that was just moved.
                os.rmdir(old_dir)

                matches = name_index.find(true_name=new_name)
                if not matches:
                    # Nothing in the index points to the new name yet, add an item with
                    # the form taken from the directory structure of the old path
                    form = _form_from_path(path)
                    name_index.add(NameItem(false_name=old_name, true_name=new_name, form=form))
                    print(f' Added item: "{old_name}", "{new_name}", "{form}"')
        print()

    for db in dbs:
        db['name_index'].write_tsv(os.path.join(DIR_PATH, db['name'], 'name_index.tsv'))