1
0
mirror of synced 2025-02-25 22:38:07 +01:00

Format code (#1169)

Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
This commit is contained in:
github-actions[bot] 2023-09-02 16:14:32 +08:00 committed by GitHub
parent 0fc160c03e
commit c7bbf0bfd0
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
8 changed files with 136 additions and 69 deletions

View File

@ -19,6 +19,7 @@ version_config_list = [
"v2/32k.json", "v2/32k.json",
] ]
def singleton_variable(func): def singleton_variable(func):
def wrapper(*args, **kwargs): def wrapper(*args, **kwargs):
if not wrapper.instance: if not wrapper.instance:

View File

@ -455,14 +455,17 @@ if __name__ == "__main__":
inp_q, inp_q,
opt_q, opt_q,
device, device,
self.rvc if hasattr(self, "rvc") else None self.rvc if hasattr(self, "rvc") else None,
) )
self.config.samplerate = self.rvc.tgt_sr self.config.samplerate = self.rvc.tgt_sr
self.config.crossfade_time = min( self.config.crossfade_time = min(
self.config.crossfade_time, self.config.block_time self.config.crossfade_time, self.config.block_time
) )
self.zc = self.rvc.tgt_sr // 100 self.zc = self.rvc.tgt_sr // 100
self.block_frame = int(np.round(self.config.block_time * self.config.samplerate / self.zc)) * self.zc self.block_frame = (
int(np.round(self.config.block_time * self.config.samplerate / self.zc))
* self.zc
)
self.block_frame_16k = 160 * self.block_frame // self.zc self.block_frame_16k = 160 * self.block_frame // self.zc
self.crossfade_frame = int( self.crossfade_frame = int(
self.config.crossfade_time * self.config.samplerate self.config.crossfade_time * self.config.samplerate
@ -484,7 +487,9 @@ if __name__ == "__main__":
), ),
dtype="float32", dtype="float32",
) )
self.input_wav_res: torch.Tensor= torch.zeros(160 * len(self.input_wav) // self.zc) self.input_wav_res: torch.Tensor = torch.zeros(
160 * len(self.input_wav) // self.zc
)
self.output_wav_cache: torch.Tensor = torch.zeros( self.output_wav_cache: torch.Tensor = torch.zeros(
int( int(
np.ceil( np.ceil(
@ -577,12 +582,18 @@ if __name__ == "__main__":
if db_threhold[i]: if db_threhold[i]:
indata[i * hop_length : (i + 1) * hop_length] = 0 indata[i * hop_length : (i + 1) * hop_length] = 0
self.input_wav[: -self.block_frame] = self.input_wav[self.block_frame :] self.input_wav[: -self.block_frame] = self.input_wav[self.block_frame :]
self.input_wav[-self.block_frame: ] = indata self.input_wav[-self.block_frame :] = indata
# infer # infer
inp = torch.from_numpy(self.input_wav[-self.block_frame-2*self.zc :]).to(device) inp = torch.from_numpy(
self.input_wav_res[ : -self.block_frame_16k] = self.input_wav_res[self.block_frame_16k :].clone() self.input_wav[-self.block_frame - 2 * self.zc :]
self.input_wav_res[-self.block_frame_16k-160 :] = self.resampler(inp)[160 :] ).to(device)
self.input_wav_res[: -self.block_frame_16k] = self.input_wav_res[
self.block_frame_16k :
].clone()
self.input_wav_res[-self.block_frame_16k - 160 :] = self.resampler(inp)[
160:
]
rate = ( rate = (
self.crossfade_frame + self.sola_search_frame + self.block_frame self.crossfade_frame + self.sola_search_frame + self.block_frame
) / ( ) / (
@ -592,11 +603,11 @@ if __name__ == "__main__":
+ self.block_frame + self.block_frame
) )
f0_extractor_frame = self.block_frame_16k + 800 f0_extractor_frame = self.block_frame_16k + 800
if self.config.f0method == 'rmvpe': if self.config.f0method == "rmvpe":
f0_extractor_frame = 5120 * ((f0_extractor_frame - 1) // 5120 + 1) f0_extractor_frame = 5120 * ((f0_extractor_frame - 1) // 5120 + 1)
res2 = self.rvc.infer( res2 = self.rvc.infer(
self.input_wav_res, self.input_wav_res,
self.input_wav_res[-f0_extractor_frame :].cpu().numpy(), self.input_wav_res[-f0_extractor_frame:].cpu().numpy(),
self.block_frame_16k, self.block_frame_16k,
rate, rate,
self.pitch, self.pitch,
@ -720,9 +731,7 @@ if __name__ == "__main__":
sd.default.device[1] = output_device_indices[ sd.default.device[1] = output_device_indices[
output_devices.index(output_device) output_devices.index(output_device)
] ]
logger.info( logger.info("Input device: %s:%d", str(sd.default.device[0]), input_device)
"Input device: %s:%d", str(sd.default.device[0]), input_device
)
logger.info( logger.info(
"Output device: %s:%d", str(sd.default.device[1]), output_device "Output device: %s:%d", str(sd.default.device[1]), output_device
) )

View File

@ -208,9 +208,15 @@ def preprocess_dataset(trainset_dir, exp_dir, sr, n_p):
f = open("%s/logs/%s/preprocess.log" % (now_dir, exp_dir), "w") f = open("%s/logs/%s/preprocess.log" % (now_dir, exp_dir), "w")
f.close() f.close()
per = 3.0 if config.is_half else 3.7 per = 3.0 if config.is_half else 3.7
cmd = ( cmd = '"%s" infer/modules/train/preprocess.py "%s" %s %s "%s/logs/%s" %s %.1f' % (
'"%s" infer/modules/train/preprocess.py "%s" %s %s "%s/logs/%s" %s %.1f' config.python_cmd,
% (config.python_cmd, trainset_dir, sr, n_p, now_dir, exp_dir, config.noparallel, per) trainset_dir,
sr,
n_p,
now_dir,
exp_dir,
config.noparallel,
per,
) )
logger.info(cmd) logger.info(cmd)
p = Popen(cmd, shell=True) # , stdin=PIPE, stdout=PIPE,stderr=PIPE,cwd=now_dir p = Popen(cmd, shell=True) # , stdin=PIPE, stdout=PIPE,stderr=PIPE,cwd=now_dir
@ -272,14 +278,17 @@ def extract_f0_feature(gpus, n_p, f0method, if_f0, exp_dir, version19, gpus_rmvp
leng = len(gpus_rmvpe) leng = len(gpus_rmvpe)
ps = [] ps = []
for idx, n_g in enumerate(gpus_rmvpe): for idx, n_g in enumerate(gpus_rmvpe):
cmd = '"%s" infer/modules/train/extract/extract_f0_rmvpe.py %s %s %s "%s/logs/%s" %s ' % ( cmd = (
config.python_cmd, '"%s" infer/modules/train/extract/extract_f0_rmvpe.py %s %s %s "%s/logs/%s" %s '
leng, % (
idx, config.python_cmd,
n_g, leng,
now_dir, idx,
exp_dir, n_g,
config.is_half, now_dir,
exp_dir,
config.is_half,
)
) )
logger.info(cmd) logger.info(cmd)
p = Popen( p = Popen(
@ -333,15 +342,18 @@ def extract_f0_feature(gpus, n_p, f0method, if_f0, exp_dir, version19, gpus_rmvp
leng = len(gpus) leng = len(gpus)
ps = [] ps = []
for idx, n_g in enumerate(gpus): for idx, n_g in enumerate(gpus):
cmd = '"%s" infer/modules/train/extract_feature_print.py %s %s %s %s "%s/logs/%s" %s' % ( cmd = (
config.python_cmd, '"%s" infer/modules/train/extract_feature_print.py %s %s %s %s "%s/logs/%s" %s'
config.device, % (
leng, config.python_cmd,
idx, config.device,
n_g, leng,
now_dir, idx,
exp_dir, n_g,
version19, now_dir,
exp_dir,
version19,
)
) )
logger.info(cmd) logger.info(cmd)
p = Popen( p = Popen(
@ -379,12 +391,16 @@ def get_pretrained_models(path_str, f0_str, sr2):
if not if_pretrained_generator_exist: if not if_pretrained_generator_exist:
logger.warn( logger.warn(
"assets/pretrained%s/%sG%s.pth not exist, will not use pretrained model", "assets/pretrained%s/%sG%s.pth not exist, will not use pretrained model",
path_str, f0_str, sr2 path_str,
f0_str,
sr2,
) )
if not if_pretrained_discriminator_exist: if not if_pretrained_discriminator_exist:
logger.warn( logger.warn(
"assets/pretrained%s/%sD%s.pth not exist, will not use pretrained model", "assets/pretrained%s/%sD%s.pth not exist, will not use pretrained model",
path_str, f0_str, sr2 path_str,
f0_str,
sr2,
) )
return ( return (
"assets/pretrained%s/%sG%s.pth" % (path_str, f0_str, sr2) "assets/pretrained%s/%sG%s.pth" % (path_str, f0_str, sr2)
@ -421,9 +437,11 @@ def change_version19(sr2, if_f0_3, version19):
def change_f0(if_f0_3, sr2, version19): # f0method8,pretrained_G14,pretrained_D15 def change_f0(if_f0_3, sr2, version19): # f0method8,pretrained_G14,pretrained_D15
path_str = "" if version19 == "v1" else "_v2" path_str = "" if version19 == "v1" else "_v2"
return ( return (
{"visible": if_f0_3, "__type__": "update"}, *get_pretrained_models(path_str, "f0", sr2) {"visible": if_f0_3, "__type__": "update"},
*get_pretrained_models(path_str, "f0", sr2),
) )
# but3.click(click_train,[exp_dir1,sr2,if_f0_3,save_epoch10,total_epoch11,batch_size12,if_save_latest13,pretrained_G14,pretrained_D15,gpus16]) # but3.click(click_train,[exp_dir1,sr2,if_f0_3,save_epoch10,total_epoch11,batch_size12,if_save_latest13,pretrained_G14,pretrained_D15,gpus16])
def click_train( def click_train(
exp_dir1, exp_dir1,
@ -522,24 +540,33 @@ def click_train(
config_save_path = os.path.join(exp_dir, "config.json") config_save_path = os.path.join(exp_dir, "config.json")
if not pathlib.Path(config_save_path).exists(): if not pathlib.Path(config_save_path).exists():
with open(config_save_path, "w", encoding="utf-8") as f: with open(config_save_path, "w", encoding="utf-8") as f:
json.dump(config.json_config[config_path], f, ensure_ascii=False, indent=4, sort_keys=True) json.dump(
config.json_config[config_path],
f,
ensure_ascii=False,
indent=4,
sort_keys=True,
)
f.write("\n") f.write("\n")
if gpus16: if gpus16:
cmd = '"%s" infer/modules/train/train.py -e "%s" -sr %s -f0 %s -bs %s -g %s -te %s -se %s %s %s -l %s -c %s -sw %s -v %s' % ( cmd = (
config.python_cmd, '"%s" infer/modules/train/train.py -e "%s" -sr %s -f0 %s -bs %s -g %s -te %s -se %s %s %s -l %s -c %s -sw %s -v %s'
exp_dir1, % (
sr2, config.python_cmd,
1 if if_f0_3 else 0, exp_dir1,
batch_size12, sr2,
gpus16, 1 if if_f0_3 else 0,
total_epoch11, batch_size12,
save_epoch10, gpus16,
"-pg %s" % pretrained_G14 if pretrained_G14 != "" else "", total_epoch11,
"-pd %s" % pretrained_D15 if pretrained_D15 != "" else "", save_epoch10,
1 if if_save_latest13 == i18n("") else 0, "-pg %s" % pretrained_G14 if pretrained_G14 != "" else "",
1 if if_cache_gpu17 == i18n("") else 0, "-pd %s" % pretrained_D15 if pretrained_D15 != "" else "",
1 if if_save_every_weights18 == i18n("") else 0, 1 if if_save_latest13 == i18n("") else 0,
version19, 1 if if_cache_gpu17 == i18n("") else 0,
1 if if_save_every_weights18 == i18n("") else 0,
version19,
)
) )
else: else:
cmd = ( cmd = (

View File

@ -617,7 +617,10 @@ class SynthesizerTrnMs256NSFsid(nn.Module):
) )
self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels) self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels)
logger.debug( logger.debug(
"gin_channels: " + str(gin_channels) + ", self.spk_embed_dim: " + str(self.spk_embed_dim) "gin_channels: "
+ str(gin_channels)
+ ", self.spk_embed_dim: "
+ str(self.spk_embed_dim)
) )
def remove_weight_norm(self): def remove_weight_norm(self):
@ -735,7 +738,10 @@ class SynthesizerTrnMs768NSFsid(nn.Module):
) )
self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels) self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels)
logger.debug( logger.debug(
"gin_channels: " + str(gin_channels) + ", self.spk_embed_dim: " + str(self.spk_embed_dim) "gin_channels: "
+ str(gin_channels)
+ ", self.spk_embed_dim: "
+ str(self.spk_embed_dim)
) )
def remove_weight_norm(self): def remove_weight_norm(self):
@ -850,7 +856,10 @@ class SynthesizerTrnMs256NSFsid_nono(nn.Module):
) )
self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels) self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels)
logger.debug( logger.debug(
"gin_channels: " + str(gin_channels) + ", self.spk_embed_dim: " + str(self.spk_embed_dim) "gin_channels: "
+ str(gin_channels)
+ ", self.spk_embed_dim: "
+ str(self.spk_embed_dim)
) )
def remove_weight_norm(self): def remove_weight_norm(self):
@ -958,7 +967,10 @@ class SynthesizerTrnMs768NSFsid_nono(nn.Module):
) )
self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels) self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels)
logger.debug( logger.debug(
"gin_channels: " + str(gin_channels) + ", self.spk_embed_dim: " + str(self.spk_embed_dim) "gin_channels: "
+ str(gin_channels)
+ ", self.spk_embed_dim: "
+ str(self.spk_embed_dim)
) )
def remove_weight_norm(self): def remove_weight_norm(self):

View File

@ -621,7 +621,10 @@ class SynthesizerTrnMsNSFsidM(nn.Module):
self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels) self.emb_g = nn.Embedding(self.spk_embed_dim, gin_channels)
self.speaker_map = None self.speaker_map = None
logger.debug( logger.debug(
"gin_channels: " + gin_channels + ", self.spk_embed_dim: " + self.spk_embed_dim "gin_channels: "
+ gin_channels
+ ", self.spk_embed_dim: "
+ self.spk_embed_dim
) )
def remove_weight_norm(self): def remove_weight_norm(self):

View File

@ -34,8 +34,10 @@ def load_checkpoint_d(checkpoint_path, combd, sbd, optimizer=None, load_opt=1):
new_state_dict[k] = saved_state_dict[k] new_state_dict[k] = saved_state_dict[k]
if saved_state_dict[k].shape != state_dict[k].shape: if saved_state_dict[k].shape != state_dict[k].shape:
logger.warn( logger.warn(
"shape-%s-mismatch. need: %s, get: %s" "shape-%s-mismatch. need: %s, get: %s",
, k, state_dict[k].shape, saved_state_dict[k].shape k,
state_dict[k].shape,
saved_state_dict[k].shape,
) # ) #
raise KeyError raise KeyError
except: except:
@ -110,8 +112,10 @@ def load_checkpoint(checkpoint_path, model, optimizer=None, load_opt=1):
new_state_dict[k] = saved_state_dict[k] new_state_dict[k] = saved_state_dict[k]
if saved_state_dict[k].shape != state_dict[k].shape: if saved_state_dict[k].shape != state_dict[k].shape:
logger.warn( logger.warn(
"shape-%s-mismatch|need-%s|get-%s" "shape-%s-mismatch|need-%s|get-%s",
, k, state_dict[k].shape, saved_state_dict[k].shape k,
state_dict[k].shape,
saved_state_dict[k].shape,
) # ) #
raise KeyError raise KeyError
except: except:

View File

@ -215,7 +215,8 @@ class VC:
else "Index not used." else "Index not used."
) )
return ( return (
"Success.\n%s\nTime:\nnpy: %.2fs, f0: %.2fs, infer: %.2fs." % (index_info, *times), "Success.\n%s\nTime:\nnpy: %.2fs, f0: %.2fs, infer: %.2fs."
% (index_info, *times),
(self.tgt_sr, audio_opt), (self.tgt_sr, audio_opt),
) )
except: except:

View File

@ -2,6 +2,7 @@ import os
import sys import sys
import traceback import traceback
import logging import logging
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
from time import time as ttime from time import time as ttime
@ -47,7 +48,16 @@ if config.dml == True:
# config.is_half=False########强制cpu测试 # config.is_half=False########强制cpu测试
class RVC: class RVC:
def __init__( def __init__(
self, key, pth_path, index_path, index_rate, n_cpu, inp_q, opt_q, device, last_rvc=None, self,
key,
pth_path,
index_path,
index_rate,
n_cpu,
inp_q,
opt_q,
device,
last_rvc=None,
) -> None: ) -> None:
""" """
初始化 初始化
@ -325,9 +335,9 @@ class RVC:
pitch, pitchf = self.get_f0(indata, self.f0_up_key, self.n_cpu, f0method) pitch, pitchf = self.get_f0(indata, self.f0_up_key, self.n_cpu, f0method)
start_frame = block_frame_16k // 160 start_frame = block_frame_16k // 160
end_frame = len(cache_pitch) - (pitch.shape[0] - 4) + start_frame end_frame = len(cache_pitch) - (pitch.shape[0] - 4) + start_frame
cache_pitch[:] = np.append(cache_pitch[start_frame : end_frame], pitch[3:-1]) cache_pitch[:] = np.append(cache_pitch[start_frame:end_frame], pitch[3:-1])
cache_pitchf[:] = np.append( cache_pitchf[:] = np.append(
cache_pitchf[start_frame : end_frame], pitchf[3:-1] cache_pitchf[start_frame:end_frame], pitchf[3:-1]
) )
p_len = min(feats.shape[1], 13000, cache_pitch.shape[0]) p_len = min(feats.shape[1], 13000, cache_pitch.shape[0])
else: else: