コード例 #1
0
def main():
    """Save the HTK settings and write one wav-to-htk list file per data type.

    Parses the command-line arguments, stores the feature-extraction
    settings under ``./config`` and then, for every data type, writes
    ``./config/wav2htk_<data_type>.scp``.  Each line of that file holds an
    input wav path and the matching output ``.htk`` path, separated by two
    spaces.  (Presumably the list is later fed to an HTK tool; that step is
    not part of this function.)
    """
    args = parser.parse_args()
    htk_root = mkdir(args.htk_save_path)
    path = Path(data_path=args.data_path, config_path='./config')

    # HTK settings
    save_config(
        audio_file_type='wav',
        feature_type=args.feature_type,
        channels=args.channels,
        config_save_path='./config',
        sampling_rate=16000,
        window=args.window,
        slide=args.slide,
        energy=bool(args.energy),
        delta=bool(args.delta),
        deltadelta=bool(args.deltadelta),
    )

    # The evaluation sets are always processed; the training sets are opt-in.
    data_types = ['eval1', 'eval2', 'eval3']
    if args.subset:
        data_types.append('train_subset')
    if args.fullset:
        data_types.append('train_fullset')

    for data_type in data_types:
        wav_paths = path.wav(data_type=data_type)
        output_dir = mkdir_join(htk_root, data_type)
        scp_path = './config/wav2htk_' + data_type + '.scp'

        with open(scp_path, 'w') as scp_file:
            for wav_path in wav_paths:
                # The part of the file name before its first '.' names the
                # output feature file.
                stem = basename(wav_path).split('.', 1)[0]
                htk_path = join(output_dir, stem + '.htk')
                scp_file.write('  '.join((wav_path, htk_path)) + '\n')
コード例 #2
0
# Feature-extraction options.  The on/off switches are parsed as integers
# (0 or 1) and converted to booleans when CONFIG is built below.
parser.add_argument('--slide', type=float, help='extract features per slide')
parser.add_argument('--energy', type=int, help='if 1, add the energy feature')
parser.add_argument('--delta',
                    type=int,
                    help='if 1, delta features are also extracted')
parser.add_argument('--deltadelta',
                    type=int,
                    help='if 1, double delta features are also extracted')
parser.add_argument('--subset',
                    type=int,
                    help='if 1, create small dataset.')
parser.add_argument('--fullset',
                    type=int,
                    help='if 1, create full-size dataset.')

args = parser.parse_args()
path = Path(data_path=args.data_path,
            config_path='./config',
            htk_save_path=args.htk_save_path)

# Settings shared by the feature-extraction steps; the sampling rate is fixed
# at 16000 rather than taken from the command line.
CONFIG = {
    'feature_type': args.feature_type,
    'channels': args.channels,
    'sampling_rate': 16000,
    'window': args.window,
    'slide': args.slide,
    'energy': bool(args.energy),
    'delta': bool(args.delta),
    'deltadelta': bool(args.deltadelta)
}

# Saving in HTK format is only allowed together with the HTK tool.
if args.save_format == 'htk':
    assert args.tool == 'htk', \
        "--save_format 'htk' requires --tool 'htk'"
コード例 #3
0
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import sys
import unittest

sys.path.append('../../')
from csj.path import Path
from csj.input_data import read_audio
from csj.labels.transcript import read_sdb
from utils.measure_time_func import measure_time

# Corpus, config and HTK feature locations are hard-coded absolute/relative
# paths for this test module.
path = Path(
    data_path='/n/sd8/inaguma/corpus/csj/data',
    config_path='../config',
    htk_save_path='/n/sd8/inaguma/corpus/csj/htk',
)

# Map each split name to the result of ``path.htk`` for its data type.
# Only 'train' uses a different data type name ('train_subset').
htk_paths = {
    split: path.htk(data_type=data_type)
    for split, data_type in (
        ('train', 'train_subset'),
        ('dev', 'dev'),
        ('eval1', 'eval1'),
        ('eval2', 'eval2'),
        ('eval3', 'eval3'),
    )
}

wav_paths = {
    'train': path.wav(data_type='train_subset'),
    'dev': path.wav(data_type='dev'),
    'eval1': path.wav(data_type='eval1'),
    'eval2': path.wav(data_type='eval2'),
コード例 #4
0
# -*- coding: utf-8 -*-

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import sys
import unittest

sys.path.append('../../')
from csj.path import Path
from csj.labels.transcript import read_sdb
from utils.measure_time_func import measure_time
from utils.util import mkdir_join

# Shared Path helper for this test module; the corpus location is a
# hard-coded absolute path and the config directory is relative to the
# working directory.
path = Path(data_path='/n/sd8/inaguma/corpus/csj/data',
            config_path='../config')


class TestLabel(unittest.TestCase):
    """Test case that runs ``check`` once per dataset size."""

    def test(self):
        """Run the check for the 'subset' size, then for 'fullset'."""
        for data_size in ('subset', 'fullset'):
            self.check(data_size=data_size)

    @measure_time
    def check(self, data_size):
        """Print a banner naming the dataset size being checked.

        Args:
            data_size: dataset size label; it is converted with ``str``
                before being printed.

        NOTE(review): wrapped by ``measure_time``, which presumably reports
        the elapsed time of the call -- confirm against its definition.
        """
        separator = '=' * 50
        print(separator)
        print('  data_size: %s' % str(data_size))
        print(separator)