# ultimatevocalremovergui/demucs/spec.py
#
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.
"""Conveniance wrapper to perform STFT and iSTFT"""
import torch as th
def spectro(x, n_fft=512, hop_length=None, pad=0):
    """Compute the STFT of `x` along its last dimension.

    All leading dimensions are flattened into a single batch dimension for
    the call to `torch.stft` and restored on the returned tensor.

    Args:
        x: tensor whose last dimension is the one being transformed.
        n_fft: length of the Hann window; the FFT size passed to
            `torch.stft` is `n_fft * (1 + pad)`.
        hop_length: stride between frames; `n_fft // 4` is used when it is
            `None` (or 0).
        pad: factor by which the FFT size exceeds the window length.

    Returns:
        Complex tensor of shape `(*x.shape[:-1], freqs, frames)`. If `x` is on
        a device other than "cuda" or "cpu", the transform is computed on a
        CPU copy and the result is returned on the CPU.
    """
    *other, length = x.shape
    x = x.reshape(-1, length)

    # Anything that is neither CUDA nor CPU is routed through the CPU
    # (presumably because th.stft is not supported on those backends).
    if x.device.type not in ("cuda", "cpu"):
        x = x.cpu()

    z = th.stft(
        x,
        n_fft * (1 + pad),
        hop_length or n_fft // 4,
        # `.to(x)` matches both the dtype and the device of the input.
        window=th.hann_window(n_fft).to(x),
        win_length=n_fft,
        normalized=True,
        center=True,
        return_complex=True,
        pad_mode='reflect',
    )
    _, freqs, frames = z.shape
    return z.view(*other, freqs, frames)
def ispectro(z, hop_length=None, length=None, pad=0):
    """Compute the inverse STFT of `z` over its last two dimensions.

    All leading dimensions are flattened into a single batch dimension for
    the call to `torch.istft` and restored on the returned tensor.

    Args:
        z: complex tensor of shape `(..., freqs, frames)`; the FFT size is
            derived from it as `2 * freqs - 2`.
        hop_length: stride between frames. When `None`, a quarter of the
            window length is used, which is the same default `spectro`
            applies in the forward direction.
        length: requested length of the output signal, forwarded to
            `torch.istft`.
        pad: factor by which the FFT size exceeds the window length; must be
            the value used for the forward transform.

    Returns:
        Tensor of shape `(*z.shape[:-2], length)`. If `z` is on a device other
        than "cuda" or "cpu", the transform is computed on a CPU copy and the
        result is returned on the CPU.
    """
    *other, freqs, frames = z.shape
    n_fft = 2 * freqs - 2
    z = z.view(-1, freqs, frames)
    win_length = n_fft // (1 + pad)

    # torch.istft would otherwise default to n_fft // 4, i.e. a quarter of the
    # *padded* FFT size, which disagrees with the forward default when pad > 0.
    if hop_length is None:
        hop_length = win_length // 4

    # Anything that is neither CUDA nor CPU is routed through the CPU
    # (presumably because th.istft is not supported on those backends).
    if z.device.type not in ("cuda", "cpu"):
        z = z.cpu()

    x = th.istft(
        z,
        n_fft,
        hop_length,
        # `.to(z.real)` matches the real dtype and the device of the input.
        window=th.hann_window(win_length).to(z.real),
        win_length=win_length,
        normalized=True,
        length=length,
        center=True,
    )
    _, length = x.shape
    return x.view(*other, length)