def fft_filter(v_frm_short_a, shift_a, v_spec_diff_db_a, fft_len): # dB to absolute: v_spec_diff_a = la.db(v_spec_diff_db_a, b_inv=True) right_a = v_frm_short_a.size - shift_a v_frm_short_a_ext = np.r_[np.zeros(fft_len/2 - shift_a) , v_frm_short_a , np.zeros(fft_len/2 - right_a)] v_fft_frm_short_a_ext = np.fft.fft(v_frm_short_a_ext) * la.add_hermitian_half(v_spec_diff_a[None,:], data_type='mag')[0] # To time domain: v_frm_short_a_ext_filt = np.fft.ifft(v_fft_frm_short_a_ext).real return v_frm_short_a_ext_filt
def plots(m_mag, m_real, m_imag, v_f0): lp.plotm(la.db(m_mag)) # in decibels for better visualisation lp.title('Magnitude Spectrum (dB)') lp.xlabel('Time (frames)') lp.ylabel('Frequency bins') lp.plotm(m_real) lp.title('"R" Feature Phase Spectrum') lp.xlabel('Time (frames)') lp.ylabel('Frequency bins') lp.plotm(m_imag) lp.title('"I" Feature Phase Spectrum') lp.xlabel('Time (frames)') lp.ylabel('Frequency bins') lp.figure() lp.plot(v_f0) lp.title('F0') lp.xlabel('Time (frames)') lp.ylabel('F0') lp.grid() return
def get_formant_locations_from_raw_long_frame(v_sig, v_pm, nx, fft_len): ''' nx: frame index ''' #v_sig, fs = la.read_audio_file(wavfile) # Epoch detection: #v_pm_sec, v_voi = la.reaper_epoch_detection(wavfile) #v_pm = lu.round_to_int(v_pm_sec * fs) # Raw-long Frame extraction: v_frm_long = v_sig[v_pm[nx-2]:v_pm[nx+2]+1] # Win: left_len = v_pm[nx] - v_pm[nx-2] right_len = v_pm[nx+2] - v_pm[nx] v_win = la.gen_non_symmetric_win(left_len, right_len, np.hanning, b_norm=False) v_frm_long_win = v_frm_long * v_win # Spectrum: v_mag = np.absolute(np.fft.fft(v_frm_long_win, n=fft_len)) v_mag_db = la.db(la.remove_hermitian_half(v_mag[None,:])[0]) # Formant extraction -LPC method:-------------------------------------------------- v_lpc, v_e, v_refl = lpc(v_frm_long_win, 120) b_use_lpc_roots = False if b_use_lpc_roots: v_lpc_roots = np.roots(v_lpc) v_lpc_angles = np.angle(v_lpc_roots) v_lpc_angles = v_lpc_angles[v_lpc_angles>=0] v_lpc_angles = np.sort(v_lpc_angles) fft_len_half = 1 + fft_len / 2 v_lpc_roots_bins = v_lpc_angles * fft_len_half / np.pi v_lpc_mag = lpc_to_mag(v_lpc, fft_len=fft_len) v_lpc_mag_db = la.db(v_lpc_mag) v_lpc_mag_db = v_lpc_mag_db - np.mean(v_lpc_mag_db) + np.mean(v_mag_db) v_frmnts_bins, v_frmnts_gains_db = get_formant_locations_from_spec_env(v_lpc_mag_db) # Getting bandwidth: fft_len_half = 1 + fft_len / 2 v_vall_bins = get_formant_locations_from_spec_env(-v_lpc_mag_db)[0] v_vall_bins = np.r_[0, v_vall_bins, fft_len_half-1] nfrmnts = v_frmnts_bins.size v_frmnts_bw = np.zeros(nfrmnts) - 1.0 for nx_f in xrange(nfrmnts): #Left slope: curr_frmnt_bin = v_frmnts_bins[nx_f] curr_vall_l_bin = v_vall_bins[nx_f] curr_vall_r_bin = v_vall_bins[nx_f+1] curr_midp_l = int((curr_frmnt_bin + curr_vall_l_bin) / 2.0) curr_midp_r = int((curr_frmnt_bin + curr_vall_r_bin) / 2.0) # Protection: if curr_midp_l==curr_frmnt_bin: curr_midp_l = curr_vall_l_bin if curr_midp_r==curr_frmnt_bin: curr_midp_r = curr_vall_r_bin #print(nx_f) # 27 y 32 #if ((nx==73) and (nx_f==27)): import ipdb; ipdb.set_trace(context=8) # breakpoint c4f78f1e // slope_l = (v_frmnts_gains_db[nx_f] - v_lpc_mag_db[curr_midp_l]) / (curr_frmnt_bin - curr_midp_l).astype(float) slope_r = (v_frmnts_gains_db[nx_f] - v_lpc_mag_db[curr_midp_r]) / (curr_frmnt_bin - curr_midp_r).astype(float) slope_ave = (slope_l - slope_r) / 2.0 v_frmnts_bw[nx_f] = 1.0 / slope_ave # Filtering by bandwidth: bw_thress = 7.0 v_frmnts_bins = v_frmnts_bins[v_frmnts_bw<bw_thress] v_frmnts_gains_db = v_frmnts_gains_db[v_frmnts_bw<bw_thress] v_frmnts_bw = v_frmnts_bw[v_frmnts_bw<bw_thress] # Computing frame short:-------------------------------- # Win: left_len_short = v_pm[nx] - v_pm[nx-1] right_len_short = v_pm[nx+1] - v_pm[nx] v_win_short = la.gen_non_symmetric_win(left_len_short, right_len_short, np.hanning, b_norm=False) v_frm_short = v_sig[v_pm[nx-1]:v_pm[nx+1]+1] v_frm_short_win = v_frm_short * v_win_short shift = v_pm[nx] - v_pm[nx-1] # Formant extraction - True envelope method:---------------------------------------- # Not finished. #v_true_env_db = la.true_envelope(v_mag_db[None,:], in_type='db', ncoeffs=400, thres_db=0.1)[0] if False: plt.figure(); plt.plot(v_mag_db); plt.plot(v_lpc_mag_db); plt.grid(); plt.show() return v_mag_db, v_lpc_mag_db, v_frmnts_bins, v_frmnts_gains_db, v_frmnts_bw, v_frm_short_win, shift
def speech_interp_with_anchors(wavfile_a, wavfile_b, nx_strt_a, nx_strt_b, nframes, fft_len): # MagPhase analysis: m_mag_a, m_real_a, m_imag_a, v_f0_a, fs, v_shift_a = mp.analysis_lossless( wavfile_a) m_mag_b, m_real_b, m_imag_b, v_f0_b, fs, v_shift_b = mp.analysis_lossless( wavfile_b) v_pm_a = la.shift_to_pm(v_shift_a) v_pm_b = la.shift_to_pm(v_shift_b) v_sig_a, fs = la.read_audio_file(wavfile_a) v_sig_b, fs = la.read_audio_file(wavfile_b) # Get formants: v_mag_db_a, v_lpc_mag_db_a, v_frmnts_bins_a, v_frmnts_gains_db_a, v_frmnts_bw_a, v_frm_short_a, shift_a = get_formant_locations_from_raw_long_frame( v_sig_a, v_pm_a, nx_strt_a, fft_len) v_mag_db_b, v_lpc_mag_db_b, v_frmnts_bins_b, v_frmnts_gains_db_b, v_frmnts_bw_b, v_frm_short_b, shift_b = get_formant_locations_from_raw_long_frame( v_sig_b, v_pm_b, nx_strt_b + nframes - 1, fft_len) # Formant mapping:---------------------------------------------------------------- v_frmnts_bins_a_filt, v_frmnts_bins_b_filt = formant_mapping( v_frmnts_bins_a, v_frmnts_gains_db_a, v_frmnts_bins_b, v_frmnts_gains_db_b, fft_len) # spec envelope anchors:--------------------------------------------------------------------- v_true_env_db_a = la.true_envelope(v_mag_db_a[None, :], in_type='db', ncoeffs=400, thres_db=0.1)[0] v_true_env_db_b = la.true_envelope(v_mag_db_b[None, :], in_type='db', ncoeffs=400, thres_db=0.1)[0] if False: plt.figure() plt.plot(v_mag_db_a) plt.plot(v_true_env_db_a) plt.grid() plt.show() plt.figure() plt.plot(v_mag_db_b) plt.plot(v_true_env_db_b) plt.grid() plt.show() fft_len_half = 1 + fft_len / 2 m_mag_interp = np.zeros((nframes, fft_len_half)) m_real_interp = np.zeros((nframes, fft_len_half)) m_imag_interp = np.zeros((nframes, fft_len_half)) v_shifts_interp = np.zeros(nframes, dtype='int') for nx_frm in xrange(nframes): sp_weight = nx_frm / (nframes - 1.0) nx_a = nx_strt_a + nx_frm nx_b = nx_strt_b + nx_frm # Spectral Warping: v_sp_env_db_curr_a_warp = warp_mag_spec(v_true_env_db_a, v_frmnts_bins_a_filt, v_frmnts_bins_b_filt, fft_len, sp_weight) v_sp_env_db_curr_b_warp = warp_mag_spec(v_true_env_db_b, v_frmnts_bins_b_filt, v_frmnts_bins_a_filt, fft_len, (1 - sp_weight)) #v_sp_env_db_a_warp = warp_mag_spec(v_lpc_mag_db_a, v_frmnts_bins_a_filt, v_frmnts_bins_b_filt, fft_len, sp_weight) #v_sp_env_db_b_warp = warp_mag_spec(v_lpc_mag_db_b, v_frmnts_bins_b_filt, v_frmnts_bins_a_filt, fft_len, (1-sp_weight)) # Spectral envelope mix:------------------------------------------------------- v_sp_env_db_curr_targ = v_sp_env_db_curr_a_warp * ( 1.0 - sp_weight) + v_sp_env_db_curr_b_warp * sp_weight # Whitening:----------------------------------------------------------------------------- # Spectral envelope estimation: # v_mag_db_a, v_lpc_mag_db_a, v_frmnts_bins_a, v_frmnts_gains_db_a, v_frmnts_bw_a, v_frm_short_a, shift_a = get_formant_locations_from_raw_long_frame(v_sig_a, v_pm_a, nx_a, fft_len) v_mag_db_curr_a = get_formant_locations_from_raw_long_frame( v_sig_a, v_pm_a, nx_a, fft_len)[0] v_mag_db_curr_b = get_formant_locations_from_raw_long_frame( v_sig_b, v_pm_b, nx_b, fft_len)[0] v_true_env_db_curr_a = la.true_envelope(v_mag_db_curr_a[None, :], in_type='db', ncoeffs=400, thres_db=0.1)[0] v_true_env_db_curr_b = la.true_envelope(v_mag_db_curr_b[None, :], in_type='db', ncoeffs=400, thres_db=0.1)[0] v_mag_white_a = m_mag_a[nx_a, :] / la.db(v_true_env_db_curr_a, b_inv=True) v_mag_white_b = m_mag_b[nx_b, :] / la.db(v_true_env_db_curr_b, b_inv=True) #if sp_weight>=0.4: import ipdb; ipdb.set_trace(context=8) # breakpoint 6b3a7d8b // if False: plt.figure() plt.plot(v_mag_db_curr_a) plt.plot(v_true_env_db_curr_a) plt.grid() plt.show() plt.figure() plt.plot(v_true_env_db_curr_a) plt.plot(v_true_env_db_curr_b) plt.plot(v_sp_env_db_curr_targ) plt.grid() plt.show() plt.figure() plt.plot(v_mag_db_curr_a) plt.plot(la.db(m_mag_a[nx_a, :])) plt.plot(la.db(v_mag_white_a)) plt.plot(v_true_env_db_curr_a) plt.grid() plt.show() # Impose spectral Env:------------------------------------------------------------------ v_sp_env_targ = la.db(v_sp_env_db_curr_targ, b_inv=True) v_mag_filt_a = v_mag_white_a * v_sp_env_targ v_mag_filt_b = v_mag_white_b * v_sp_env_targ # Mix Sources:------------------------------------------------------------------ v_mag_mix = v_mag_filt_a * (1.0 - sp_weight) + v_mag_filt_b * sp_weight v_real_mix = m_real_a[nx_a, :] * ( 1.0 - sp_weight) + m_real_b[nx_b, :] * sp_weight v_imag_mix = m_imag_a[nx_a, :] * ( 1.0 - sp_weight) + m_imag_b[nx_b, :] * sp_weight # Mix shifts: shift_mix = lu.round_to_int(shift_a * (1.0 - sp_weight) + shift_b * sp_weight) # Save: v_shifts_interp[nx_frm] = shift_mix m_mag_interp[nx_frm, :] = v_mag_mix m_real_interp[nx_frm, :] = v_real_mix m_imag_interp[nx_frm, :] = v_imag_mix if False: plt.figure() plt.plot(v_frm_short_a_ext_filt) plt.plot(v_frm_short_b_ext_filt) plt.grid() plt.show() plt.figure() plt.plot(v_frm_short_a_ext_filt) plt.plot(v_frm_short_b_ext_filt) plt.plot(v_frm_short_ext_filt) plt.grid() plt.show() # Merge: m_mag_merged = np.vstack((m_mag_a[:nx_strt_a, :], m_mag_interp, m_mag_b[(nx_strt_b + nframes):, :])) m_real_merged = np.vstack((m_real_a[:nx_strt_a, :], m_real_interp, m_real_b[(nx_strt_b + nframes):, :])) m_imag_merged = np.vstack((m_imag_a[:nx_strt_a, :], m_imag_interp, m_imag_b[(nx_strt_b + nframes):, :])) v_shift_merged = np.r_[v_shift_a[:nx_strt_a], v_shifts_interp, v_shift_b[(nx_strt_b + nframes):]] v_sig_merged = synthesis_from_lossless(m_mag_merged, m_real_merged, m_imag_merged, v_shift_merged) return v_sig_merged, fs
def speech_interp(wavfile_a, wavfile_b, nx_strt_a, nx_strt_b, nframes, fft_len): # MagPhase analysis: m_mag_a, m_real_a, m_imag_a, v_f0_a, fs, v_shift_a = mp.analysis_lossless( wavfile_a) m_mag_b, m_real_b, m_imag_b, v_f0_b, fs, v_shift_b = mp.analysis_lossless( wavfile_b) v_pm_a = la.shift_to_pm(v_shift_a) v_pm_b = la.shift_to_pm(v_shift_b) v_sig_a, fs = la.read_audio_file(wavfile_a) v_sig_b, fs = la.read_audio_file(wavfile_b) # Epoch detection: #v_pm_sec_a, v_voi_a = la.reaper_epoch_detection(wavfile_a) #v_pm_sec_b, v_voi_b = la.reaper_epoch_detection(wavfile_b) #v_pm_a = lu.round_to_int(v_pm_sec_a * fs) #v_pm_b = lu.round_to_int(v_pm_sec_b * fs) #m_frms_syn = np.zeros((nframes, fft_len)) fft_len_half = 1 + fft_len / 2 m_mag_interp = np.zeros((nframes, fft_len_half)) m_real_interp = np.zeros((nframes, fft_len_half)) m_imag_interp = np.zeros((nframes, fft_len_half)) v_shifts_interp = np.zeros(nframes, dtype='int') for nx_frm in xrange(nframes): sp_weight = nx_frm / (nframes - 1.0) nx_a = nx_strt_a + nx_frm nx_b = nx_strt_b + nx_frm # Get formants: v_mag_db_a, v_lpc_mag_db_a, v_frmnts_bins_a, v_frmnts_gains_db_a, v_frmnts_bw_a, v_frm_short_a, shift_a = get_formant_locations_from_raw_long_frame( v_sig_a, v_pm_a, nx_a, fft_len) v_mag_db_b, v_lpc_mag_db_b, v_frmnts_bins_b, v_frmnts_gains_db_b, v_frmnts_bw_b, v_frm_short_b, shift_b = get_formant_locations_from_raw_long_frame( v_sig_b, v_pm_b, nx_b, fft_len) # Formant mapping:---------------------------------------------------------------- v_frmnts_bins_a_filt, v_frmnts_bins_b_filt = formant_mapping( v_frmnts_bins_a, v_frmnts_gains_db_a, v_frmnts_bins_b, v_frmnts_gains_db_b, fft_len) # Warping:--------------------------------------------------------------------- # True envelope: v_true_env_db_a = la.true_envelope(v_mag_db_a[None, :], in_type='db', ncoeffs=400, thres_db=0.1)[0] v_true_env_db_b = la.true_envelope(v_mag_db_b[None, :], in_type='db', ncoeffs=400, thres_db=0.1)[0] v_sp_env_db_a_warp = warp_mag_spec(v_true_env_db_a, v_frmnts_bins_a_filt, v_frmnts_bins_b_filt, fft_len, sp_weight) v_sp_env_db_b_warp = warp_mag_spec(v_true_env_db_b, v_frmnts_bins_b_filt, v_frmnts_bins_a_filt, fft_len, (1 - sp_weight)) #v_sp_env_db_a_warp = warp_mag_spec(v_lpc_mag_db_a, v_frmnts_bins_a_filt, v_frmnts_bins_b_filt, fft_len, sp_weight) #v_sp_env_db_b_warp = warp_mag_spec(v_lpc_mag_db_b, v_frmnts_bins_b_filt, v_frmnts_bins_a_filt, fft_len, (1-sp_weight)) # Spectral envelope mix:------------------------------------------------------- v_sp_env_db_targ = v_sp_env_db_a_warp * ( 1.0 - sp_weight) + v_sp_env_db_b_warp * sp_weight # Impose spectral Env (FFT filter):------------------------------------------------------ v_sp_env_diff_db_a = v_sp_env_db_targ - v_true_env_db_a v_sp_env_diff_db_b = v_sp_env_db_targ - v_true_env_db_b #v_frm_short_a_ext_filt = fft_filter(v_frm_short_a, shift_a, v_spec_diff_db_a, fft_len) #v_frm_short_b_ext_filt = fft_filter(v_frm_short_b, shift_b, v_spec_diff_db_b, fft_len) #v_sp_env_diff_a = la.db(v_sp_env_diff_db_a, b_inv=True) v_mag_filt_a = m_mag_a[nx_a, :] * la.db(v_sp_env_diff_db_a, b_inv=True) #v_sp_env_diff_b = la.db(v_sp_env_diff_db_b, b_inv=True) v_mag_filt_b = m_mag_b[nx_b, :] * la.db(v_sp_env_diff_db_b, b_inv=True) #fft_filter_magphase_domain(m_mag_a[nx_a,:], m_real_a[nx_a,:], m_imag_a[nx_a,:]) # Mix Sources:------------------------------------------------------------------ v_mag_mix = v_mag_filt_a * (1.0 - sp_weight) + v_mag_filt_b * sp_weight v_real_mix = m_real_a[nx_a, :] * ( 1.0 - sp_weight) + m_real_b[nx_b, :] * sp_weight v_imag_mix = m_imag_a[nx_a, :] * ( 1.0 - sp_weight) + m_imag_b[nx_b, :] * sp_weight # Mix sources: #v_frm_short_ext_filt = v_frm_short_a_ext_filt * (1.0-sp_weight) + v_frm_short_b_ext_filt * sp_weight #v_frm_short_ext_filt = v_frm_short_a_ext_filt # Mix shifts: shift_mix = lu.round_to_int(shift_a * (1.0 - sp_weight) + shift_b * sp_weight) # Save: v_shifts_interp[nx_frm] = shift_mix m_mag_interp[nx_frm, :] = v_mag_mix m_real_interp[nx_frm, :] = v_real_mix m_imag_interp[nx_frm, :] = v_imag_mix #m_frms_syn[nx_frm, :] = v_frm_short_ext_filt if False: plt.figure() plt.plot(v_frm_short_a_ext_filt) plt.plot(v_frm_short_b_ext_filt) plt.grid() plt.show() plt.figure() plt.plot(v_frm_short_a_ext_filt) plt.plot(v_frm_short_b_ext_filt) plt.plot(v_frm_short_ext_filt) plt.grid() plt.show() # Merge: #m_frms_syn_dc = np.fft.fftshift(m_frms_syn, axes=1) #m_fft_syn = la.remove_hermitian_half(np.fft.fft(m_frms_syn_dc)) #m_mag_syn, m_real_syn, m_imag_syn = compute_lossless_spec_feats(m_fft_syn) m_mag_merged = np.vstack((m_mag_a[:nx_strt_a, :], m_mag_interp, m_mag_b[(nx_strt_b + nframes):, :])) m_real_merged = np.vstack((m_real_a[:nx_strt_a, :], m_real_interp, m_real_b[(nx_strt_b + nframes):, :])) m_imag_merged = np.vstack((m_imag_a[:nx_strt_a, :], m_imag_interp, m_imag_b[(nx_strt_b + nframes):, :])) v_shift_merged = np.r_[v_shift_a[:nx_strt_a], v_shifts_interp, v_shift_b[(nx_strt_b + nframes):]] v_sig_merged = synthesis_from_lossless(m_mag_merged, m_real_merged, m_imag_merged, v_shift_merged) return v_sig_merged, fs
# INPUT:==================================================================== magfile_ref = '/home/s1373426/Dropbox/Education/UoE/Projects/fft_feats_DirectFFTWaveformModelling/magphase_proj/merlin/tools/magphase_private/demos/data_48k/wavs_syn/hvd_593_copy_syn_lossless.mag' magfile_a = '/home/s1373426/Dropbox/Education/UoE/Projects/fft_feats_DirectFFTWaveformModelling/magphase_proj/merlin/tools/magphase_private/demos/data_48k/wavs_syn/hvd_593_copy_syn_low_dim.mag' fft_len = 4096 alpha = 0.77 nx = 52 #100 # PLOTS:==================================================================== #lp.close('all') fft_len_half = fft_len / 2 + 1 #m_mag_ref = lu.read_binfile(magfile_ref, dim=60) m_mag_ref = la.db(lu.read_binfile(magfile_ref, dim=fft_len_half)) m_mag_a = la.db( np.exp( la.sp_mel_unwarp(lu.read_binfile(magfile_a, dim=60), fft_len_half, alpha=alpha, in_type='log'))) if False: lp.plotm(m_mag_ref) lp.plotm(m_mag_a) lp.plotm(m_mag_ref - m_mag_a) lp.plotm((m_mag_ref - m_mag_a)[:50, :50]) lp.plotm(np.diff(m_mag_ref, axis=0)) lp.plotm(np.diff(m_mag_a, axis=0))
def get_formant_locations_from_raw_long_frame(v_sig, v_pm, nx, fft_len): ''' nx: frame index ''' #v_sig, fs = la.read_audio_file(wavfile) # Epoch detection: #v_pm_sec, v_voi = la.reaper_epoch_detection(wavfile) #v_pm = lu.round_to_int(v_pm_sec * fs) # Raw-long Frame extraction: v_frm_long = v_sig[v_pm[nx-2]:v_pm[nx+2]+1] # Win: left_len = v_pm[nx] - v_pm[nx-2] right_len = v_pm[nx+2] - v_pm[nx] v_win = la.gen_non_symmetric_win(left_len, right_len, np.hanning, b_norm=False) v_frm_long_win = v_frm_long * v_win # Spectrum: v_mag = la.remove_hermitian_half(np.absolute(np.fft.fft(v_frm_long_win, n=fft_len)[None,:]))[0] v_mag_db = la.db(v_mag) # Mel warping: alpha = 0.50 # 0.55 - 0.60 #ncoeffs = 2048 # must be even v_mag_mel = la.sp_mel_warp(v_mag[None,:], fft_len/2, alpha=alpha, in_type=3)[0] v_sp_cmplx = la.build_min_phase_from_mag_spec(v_mag_mel[None,:])[0] v_sp_cmplx_ext = la.add_hermitian_half(v_sp_cmplx[None,:], data_type='complex')[0] v_frm_long_win_mel = np.fft.ifft(v_sp_cmplx_ext).real if False: plt.close('all') pl(la.db(v_mag)) pl(la.db(np.absolute(v_sp_cmplx))) pl(v_frm_long_win_mel) # Formant extraction -LPC method:-------------------------------------------------- n_lpc_coeffs = 30 # 40 v_lpc_mel, v_e, v_refl = lpc(v_frm_long_win_mel, n_lpc_coeffs) v_lpc_mag_mel = lpc_to_mag(v_lpc_mel, fft_len=fft_len) v_lpc_mag_mel_db = la.db(v_lpc_mag_mel) v_lpc_mag_mel_db = v_lpc_mag_mel_db - np.mean(v_lpc_mag_mel_db) + np.mean(la.db(v_mag_mel)) v_frmnts_bins_mel, v_frmnts_gains_db = get_formant_locations_from_spec_env(v_lpc_mag_mel_db) # Getting bandwidth: fft_len_half = 1 + fft_len / 2 v_vall_bins = get_formant_locations_from_spec_env(-v_lpc_mag_mel_db)[0] v_vall_bins = np.r_[0, v_vall_bins, fft_len_half-1] nfrmnts = v_frmnts_bins_mel.size v_frmnts_bw_mel = np.zeros(nfrmnts) - 1.0 for nx_f in xrange(nfrmnts): #Left slope: curr_frmnt_bin = v_frmnts_bins_mel[nx_f] curr_vall_l_bin = v_vall_bins[nx_f] curr_vall_r_bin = v_vall_bins[nx_f+1] curr_midp_l = int((curr_frmnt_bin + curr_vall_l_bin) / 2.0) curr_midp_r = int((curr_frmnt_bin + curr_vall_r_bin) / 2.0) # Protection: if curr_midp_l==curr_frmnt_bin: curr_midp_l = curr_vall_l_bin if curr_midp_r==curr_frmnt_bin: curr_midp_r = curr_vall_r_bin #print(nx_f) # 27 y 32 slope_l = (v_frmnts_gains_db[nx_f] - v_lpc_mag_mel_db[curr_midp_l]) / (curr_frmnt_bin - curr_midp_l).astype(float) slope_r = (v_frmnts_gains_db[nx_f] - v_lpc_mag_mel_db[curr_midp_r]) / (curr_frmnt_bin - curr_midp_r).astype(float) slope_ave = (slope_l - slope_r) / 2.0 v_frmnts_bw_mel[nx_f] = 1.0 / slope_ave # Filtering by bandwidth: # bw_thress = 7.0 # v_frmnts_bins_mel = v_frmnts_bins_mel[v_frmnts_bw_mel<bw_thress] # v_frmnts_gains_db = v_frmnts_gains_db[v_frmnts_bw_mel<bw_thress] # v_frmnts_bw_mel = v_frmnts_bw_mel[v_frmnts_bw_mel<bw_thress] # Computing frame short:-------------------------------- # Win: left_len_short = v_pm[nx] - v_pm[nx-1] right_len_short = v_pm[nx+1] - v_pm[nx] v_win_short = la.gen_non_symmetric_win(left_len_short, right_len_short, np.hanning, b_norm=False) v_frm_short = v_sig[v_pm[nx-1]:v_pm[nx+1]+1] v_frm_short_win = v_frm_short * v_win_short shift = v_pm[nx] - v_pm[nx-1] # Formant extraction - True envelope method:---------------------------------------- # Not finished. #v_true_env_db = la.true_envelope(v_mag_db[None,:], in_type='db', ncoeffs=400, thres_db=0.1)[0] if True: plt.figure(); plt.plot(la.db(v_mag_mel)); plt.plot(v_lpc_mag_mel_db); plt.grid(); plt.show() #pl(v_mag_db) if True: import ipdb; ipdb.set_trace(context=8) # breakpoint 906d26d6 // return v_mag_db, v_lpc_mag_mel_db, v_frmnts_bins_mel, v_frmnts_gains_db, v_frmnts_bw_mel, v_frm_short_win, shift