import numpy as np
import torch


def embed(self, aud):
    # Preprocess the raw audio into a mel spectrogram.
    mel = mel_spectogram(aud)

    # Slice the spectrogram into overlapping windows along the time axis.
    part_frames = []
    step = int(self.config_yml['SLIDING_WIN_SIZE'] *
               self.config_yml['SLIDING_WIN_OVERLAP'])
    for ix in range(0, mel.shape[1] - self.config_yml['SLIDING_WIN_SIZE'], step):
        part_frame = mel[:, ix:ix + self.config_yml['SLIDING_WIN_SIZE']]
        part_frames.append(part_frame)

    frames = np.stack(part_frames)
    frames = torch.Tensor(frames).view(
        -1,
        self.config_yml['MEL_CHANNELS'],
        self.config_yml['SLIDING_WIN_SIZE'],
    ).to(device=self.device)

    # Restore the checkpoint for the configured epoch before inference.
    model_pickle = torch.load(self.model_save_string.format(self.epoch),
                              map_location=self.device)
    self.load_state_dict(model_pickle['model_state_dict'])

    with torch.no_grad():
        self.eval()
        embeds = self.forward(frames)
        # L2-normalise each window embedding, then average them into a
        # single utterance-level embedding.
        embeds = embeds / torch.norm(embeds, dim=1, keepdim=True)
        embeds = torch.mean(embeds, dim=0)
        embeds = embeds.cpu().data.numpy()
    return embeds
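# Minimal sketch of how the sliding-window slicing above behaves, using
# hypothetical config values (SLIDING_WIN_SIZE=160 frames, overlap 0.5):
# windows start every 80 frames, and any tail shorter than a full window
# is dropped.
def _window_starts(n_frames=500, win_size=160, overlap=0.5):
    # Same range() arithmetic as the loop in embed() above.
    return list(range(0, n_frames - win_size, int(win_size * overlap)))

# _window_starts() -> [0, 80, 160, 240, 320]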
def embed(self, aud, group=True):
    # Compute slice indices over the waveform and the mel spectrogram, and
    # zero-pad the audio so the last slice is full-length. Unlike the
    # variant above, this one assumes model weights are already loaded.
    aud_splits, mel_splits = split_audio_ixs(len(aud))
    max_aud_length = aud_splits[-1].stop
    if max_aud_length >= len(aud):
        aud = np.pad(aud, (0, max_aud_length - len(aud)), "constant")

    mel = mel_spectogram(aud).astype(np.float32).T
    mels = np.array([mel[s] for s in mel_splits])
    mels = torch.from_numpy(mels).to(self.device)

    # Embed the windows in batches of 64 and L2-normalise each embedding.
    embeds_all = []
    with torch.no_grad():
        for i in range(0, mels.shape[0], 64):
            embeds = self.forward(mels[i:i + 64])
            embeds = embeds / torch.norm(embeds, dim=1, keepdim=True)
            embeds_all.append(embeds)
    embeds = torch.cat(embeds_all)

    # Optionally collapse the per-window embeddings into a single
    # unit-norm utterance embedding.
    if group:
        embeds = torch.mean(embeds, dim=0)
        embeds = embeds / torch.norm(embeds)
    embeds = embeds.cpu().data.numpy()
    return embeds, (aud_splits, mel_splits)
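# Usage sketch with hypothetical names: `encoder` stands for an instance of
# the class defining embed() above, with weights already loaded. Because
# grouped embeddings are unit-norm, a dot product gives cosine similarity.
def _usage_example(encoder):
    wav_a = np.random.randn(32000).astype(np.float32)  # stand-in for real audio
    wav_b = np.random.randn(32000).astype(np.float32)

    emb_a, (aud_splits, mel_splits) = encoder.embed(wav_a)  # single unit-norm vector
    emb_b, _ = encoder.embed(wav_b)

    similarity = float(np.dot(emb_a, emb_b))  # cosine similarity of utterances
    return similarity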