ultimatevocalremovergui/demucs/spec.py

48 lines
1.4 KiB
Python
Raw Normal View History

2023-10-07 06:48:34 +02:00
# Copyright (c) Meta Platforms, Inc. and affiliates.
2022-12-19 04:18:56 +01:00
# All rights reserved.
#
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.
"""Convenience wrapper to perform STFT and iSTFT"""
import torch as th
def spectro(x, n_fft=512, hop_length=None, pad=0):
    """Compute the complex STFT of `x` along its last dimension.

    Args:
        x: tensor whose last dimension is the one being transformed. Any
            leading dimensions are flattened into one batch dimension for
            the transform and restored on the output.
        n_fft: length of the Hann window (passed as `win_length`). The FFT
            size handed to `th.stft` is `n_fft * (1 + pad)`.
        hop_length: hop between frames. A falsy value (`None` or 0) selects
            `n_fft // 4`.
        pad: extra FFT size, expressed as a multiple of `n_fft`.

    Returns:
        Complex tensor of shape `(*leading, freqs, frames)`. When `x` lives
        on an MPS device the computation is done on a CPU copy and the
        result is left on the CPU; it is not moved back here.
    """
    *other, length = x.shape
    x = x.reshape(-1, length)
    # MPS tensors are transformed on the CPU (presumably because the STFT is
    # not usable on that backend -- confirm before removing this fallback).
    if x.device.type == 'mps':
        x = x.cpu()
    z = th.stft(x,
                n_fft * (1 + pad),
                hop_length or n_fft // 4,
                # `.to(x)` matches the window to the input's dtype and device.
                window=th.hann_window(n_fft).to(x),
                win_length=n_fft,
                normalized=True,
                center=True,
                return_complex=True,
                pad_mode='reflect')
    _, freqs, frame = z.shape
    return z.view(*other, freqs, frame)
def ispectro(z, hop_length=None, length=None, pad=0):
    """Invert a complex spectrogram back to a signal with `th.istft`.

    Args:
        z: complex tensor of shape `(*leading, freqs, frames)`. The FFT size
            is recovered as `2 * freqs - 2`.
        hop_length: hop between frames, forwarded to `th.istft` unchanged.
            NOTE: when left as `None`, `th.istft` applies its own default
            (a quarter of the FFT size per the PyTorch documentation), which
            is derived from the padded FFT size. `spectro` instead defaults
            to a quarter of the window length, so the two defaults only
            agree when `pad == 0`; pass `hop_length` explicitly otherwise.
        length: requested output length, forwarded to `th.istft`.
        pad: the `pad` value used for the forward transform. The Hann window
            length is `n_fft // (1 + pad)`.

    Returns:
        Tensor of shape `(*leading, length)`. When `z` lives on an MPS device
        the computation is done on a CPU copy and the result is left on the
        CPU; it is not moved back here.
    """
    *other, freqs, frames = z.shape
    n_fft = 2 * freqs - 2
    # `reshape` (rather than `view`) so that non-contiguous inputs, e.g. a
    # permuted batch, are accepted; it still returns a view when possible.
    z = z.reshape(-1, freqs, frames)
    win_length = n_fft // (1 + pad)
    # MPS tensors are transformed on the CPU (presumably because the iSTFT is
    # not usable on that backend -- confirm before removing this fallback).
    if z.device.type == 'mps':
        z = z.cpu()
    x = th.istft(z,
                 n_fft,
                 hop_length,
                 # `.to(z.real)` matches the window to the real dtype and
                 # device of the spectrogram.
                 window=th.hann_window(win_length).to(z.real),
                 win_length=win_length,
                 normalized=True,
                 length=length,
                 center=True)
    _, length = x.shape
    return x.view(*other, length)