mirror of
https://github.com/Anjok07/ultimatevocalremovergui.git
synced 2024-11-28 01:10:56 +01:00
42 lines
1.3 KiB
Python
42 lines
1.3 KiB
Python
|
# Copyright (c) Facebook, Inc. and its affiliates.
|
||
|
# All rights reserved.
|
||
|
#
|
||
|
# This source code is licensed under the license found in the
|
||
|
# LICENSE file in the root directory of this source tree.
|
||
|
"""Conveniance wrapper to perform STFT and iSTFT"""
|
||
|
|
||
|
import torch as th
|
||
|
|
||
|
|
||
|
def spectro(x, n_fft=512, hop_length=None, pad=0):
    """Compute a complex, one-sided STFT over the last dimension of `x`.

    All leading dimensions of `x` are flattened into a single batch dimension
    for the call to `torch.stft` and restored on the result.

    Args:
        x: tensor shaped `[*, length]`.
        n_fft: length of the Hann analysis window (passed as `win_length`).
        hop_length: stride between frames; a falsy value (`None` or 0)
            selects `n_fft // 4`.
        pad: zero-padding factor; the FFT size handed to `torch.stft` is
            `n_fft * (1 + pad)`.

    Returns:
        Complex tensor shaped `[*, freqs, frames]`.
    """
    *batch_dims, n_samples = x.shape
    flat = x.reshape(-1, n_samples)

    fft_size = n_fft * (1 + pad)
    stride = hop_length or n_fft // 4
    # `.to(flat)` moves the window to the dtype and device of the input.
    window = th.hann_window(n_fft).to(flat)

    spec = th.stft(
        flat,
        fft_size,
        stride,
        window=window,
        win_length=n_fft,
        normalized=True,
        center=True,
        return_complex=True,
        pad_mode='reflect',
    )

    _, n_freqs, n_frames = spec.shape
    return spec.view(*batch_dims, n_freqs, n_frames)
|
||
|
|
||
|
|
||
|
def ispectro(z, hop_length=None, length=None, pad=0):
    """Invert a complex, one-sided spectrogram to a waveform via `torch.istft`.

    Intended as the inverse of `spectro` when called with the same
    `hop_length` and `pad`. All leading dimensions of `z` are flattened into
    a single batch dimension for the transform and restored on the result.

    Args:
        z: complex tensor shaped `[*, freqs, frames]`.
        hop_length: stride between frames. A falsy value (`None` or 0)
            selects a quarter of the window length, which is the same default
            `spectro` uses, so the two stay inverse of each other even when
            `pad > 0`.
        length: number of output samples, forwarded to `torch.istft`.
        pad: zero-padding factor used for the forward transform; the window
            length is recovered as `n_fft // (1 + pad)`.

    Returns:
        Tensor shaped `[*, length]`.
    """
    *other, freqs, frames = z.shape
    # One-sided spectrum: freqs == n_fft // 2 + 1.
    n_fft = 2 * freqs - 2
    # reshape (not view) so inputs whose leading dims cannot be merged
    # without a copy, e.g. after a permute, are still accepted.
    z = z.reshape(-1, freqs, frames)
    win_length = n_fft // (1 + pad)
    if not hop_length:
        # torch.istft would default to n_fft // 4 (the padded FFT size),
        # which disagrees with the forward transform as soon as pad > 0.
        hop_length = win_length // 4
    x = th.istft(z,
                 n_fft,
                 hop_length,
                 window=th.hann_window(win_length).to(z.real),
                 win_length=win_length,
                 normalized=True,
                 length=length,
                 center=True)
    _, length = x.shape
    return x.reshape(*other, length)
|