def _write_scp(scp_path, wav_paths, htk_dir):
    # Emit one "<wav path> <htk path>" line per input wav file.
    with open(scp_path, 'w') as scp:
        for wav in wav_paths:
            # File name up to (not including) its first dot.
            stem = basename(wav).partition('.')[0]
            htk_file = join(htk_dir, stem + '.htk')
            scp.write(wav + ' ' + htk_file + '\n')


def main():
    """Save the HTK config and write one wav-to-htk script file per data type.

    Reads the command-line options from the module-level ``parser``, saves
    the feature-extraction settings through ``save_config`` and then, for
    every data type, writes ``./config/wav2htk_<data_type>.scp``. Each line
    of that file pairs a wav path with the ``.htk`` path it maps to under
    ``<htk_save_path>/<data_type>``.
    """
    args = parser.parse_args()
    htk_root = mkdir(args.htk_save_path)
    path = Path(data_path=args.data_path, config_path='./config')

    # HTK settings
    save_config(
        audio_file_type='wav',
        feature_type=args.feature_type,
        channels=args.channels,
        config_save_path='./config',
        sampling_rate=16000,
        window=args.window,
        slide=args.slide,
        energy=bool(args.energy),
        delta=bool(args.delta),
        deltadelta=bool(args.deltadelta),
    )

    # The evaluation sets are always processed; training sets are opt-in.
    data_types = ['eval1', 'eval2', 'eval3']
    if args.subset:
        data_types.append('train_subset')
    if args.fullset:
        data_types.append('train_fullset')

    for data_type in data_types:
        wav_paths = path.wav(data_type=data_type)
        htk_dir = mkdir_join(htk_root, data_type)
        _write_scp('./config/wav2htk_' + data_type + '.scp',
                   wav_paths, htk_dir)
# Feature-extraction and dataset-selection options. The on/off switches are
# declared as integers (0/1) and converted to booleans further down.
parser.add_argument('--slide', type=float,
                    help='extract features per slide')
parser.add_argument('--energy', type=int,
                    help='if 1, add the energy feature')
# The help text previously repeated the --energy description.
parser.add_argument('--delta', type=int,
                    help='if 1, delta features are also extracted')
parser.add_argument('--deltadelta', type=int,
                    help='if 1, double delta features are also extracted')
parser.add_argument('--subset', type=int,
                    help='If True, create small dataset.')
parser.add_argument('--fullset', type=int,
                    help='If True, create full-size dataset.')

args = parser.parse_args()

path = Path(data_path=args.data_path,
            config_path='./config',
            htk_save_path=args.htk_save_path)

# Feature-extraction settings assembled from the parsed options. The sampling
# rate is fixed at 16000; an omitted switch (None) becomes False via bool().
CONFIG = {
    'feature_type': args.feature_type,
    'channels': args.channels,
    'sampling_rate': 16000,
    'window': args.window,
    'slide': args.slide,
    'energy': bool(args.energy),
    'delta': bool(args.delta),
    'deltadelta': bool(args.deltadelta)
}

# Saving in HTK format is only accepted together with the HTK tool.
# NOTE: this is an assert, so the check is skipped when Python runs with -O.
if args.save_format == 'htk':
    assert args.tool == 'htk', (
        "save_format 'htk' requires tool 'htk', got %r" % (args.tool,))
from __future__ import absolute_import from __future__ import division from __future__ import print_function import sys import unittest sys.path.append('../../') from csj.path import Path from csj.input_data import read_audio from csj.labels.transcript import read_sdb from utils.measure_time_func import measure_time path = Path(data_path='/n/sd8/inaguma/corpus/csj/data', config_path='../config', htk_save_path='/n/sd8/inaguma/corpus/csj/htk') htk_paths = { 'train': path.htk(data_type='train_subset'), 'dev': path.htk(data_type='dev'), 'eval1': path.htk(data_type='eval1'), 'eval2': path.htk(data_type='eval2'), 'eval3': path.htk(data_type='eval3'), } wav_paths = { 'train': path.wav(data_type='train_subset'), 'dev': path.wav(data_type='dev'), 'eval1': path.wav(data_type='eval1'), 'eval2': path.wav(data_type='eval2'),
# -*- coding: utf-8 -*- from __future__ import absolute_import from __future__ import division from __future__ import print_function import sys import unittest sys.path.append('../../') from csj.path import Path from csj.labels.transcript import read_sdb from utils.measure_time_func import measure_time from utils.util import mkdir_join path = Path(data_path='/n/sd8/inaguma/corpus/csj/data', config_path='../config') class TestLabel(unittest.TestCase): def test(self): self.check(data_size='subset') self.check(data_size='fullset') @measure_time def check(self, data_size): print('=' * 50) print(' data_size: %s' % str(data_size)) print('=' * 50)