|
import torch |
|
import numpy as np |
|
from tqdm import tqdm |
|
|
|
def make_padding(width, cropsize, offset): |
|
left = offset |
|
roi_size = cropsize - left * 2 |
|
if roi_size == 0: |
|
roi_size = cropsize |
|
right = roi_size - (width % roi_size) + left |
|
|
|
return left, right, roi_size |
|
def inference(X_spec, device, model, aggressiveness,data): |
|
''' |
|
data : dic configs |
|
''' |
|
|
|
def _execute(X_mag_pad, roi_size, n_window, device, model, aggressiveness,is_half=True): |
|
model.eval() |
|
with torch.no_grad(): |
|
preds = [] |
|
|
|
iterations = [n_window] |
|
|
|
total_iterations = sum(iterations) |
|
for i in tqdm(range(n_window)): |
|
start = i * roi_size |
|
X_mag_window = X_mag_pad[None, :, :, start:start + data['window_size']] |
|
X_mag_window = torch.from_numpy(X_mag_window) |
|
if(is_half==True):X_mag_window=X_mag_window.half() |
|
X_mag_window=X_mag_window.to(device) |
|
|
|
pred = model.predict(X_mag_window, aggressiveness) |
|
|
|
pred = pred.detach().cpu().numpy() |
|
preds.append(pred[0]) |
|
|
|
pred = np.concatenate(preds, axis=2) |
|
return pred |
|
|
|
def preprocess(X_spec): |
|
X_mag = np.abs(X_spec) |
|
X_phase = np.angle(X_spec) |
|
|
|
return X_mag, X_phase |
|
|
|
X_mag, X_phase = preprocess(X_spec) |
|
|
|
coef = X_mag.max() |
|
X_mag_pre = X_mag / coef |
|
|
|
n_frame = X_mag_pre.shape[2] |
|
pad_l, pad_r, roi_size = make_padding(n_frame, |
|
data['window_size'], model.offset) |
|
n_window = int(np.ceil(n_frame / roi_size)) |
|
|
|
X_mag_pad = np.pad( |
|
X_mag_pre, ((0, 0), (0, 0), (pad_l, pad_r)), mode='constant') |
|
|
|
if(list(model.state_dict().values())[0].dtype==torch.float16):is_half=True |
|
else:is_half=False |
|
pred = _execute(X_mag_pad, roi_size, n_window, |
|
device, model, aggressiveness,is_half) |
|
pred = pred[:, :, :n_frame] |
|
|
|
if data['tta']: |
|
pad_l += roi_size // 2 |
|
pad_r += roi_size // 2 |
|
n_window += 1 |
|
|
|
X_mag_pad = np.pad( |
|
X_mag_pre, ((0, 0), (0, 0), (pad_l, pad_r)), mode='constant') |
|
|
|
pred_tta = _execute(X_mag_pad, roi_size, n_window, |
|
device, model, aggressiveness,is_half) |
|
pred_tta = pred_tta[:, :, roi_size // 2:] |
|
pred_tta = pred_tta[:, :, :n_frame] |
|
|
|
return (pred + pred_tta) * 0.5 * coef, X_mag, np.exp(1.j * X_phase) |
|
else: |
|
return pred * coef, X_mag, np.exp(1.j * X_phase) |
|
|
|
|
|
|
|
def _get_name_params(model_path , model_hash): |
|
ModelName = model_path |
|
if model_hash == '47939caf0cfe52a0e81442b85b971dfd': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100.json') |
|
param_name_auto=str('4band_44100') |
|
if model_hash == '4e4ecb9764c50a8c414fee6e10395bbe': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_v2.json') |
|
param_name_auto=str('4band_v2') |
|
if model_hash == 'ca106edd563e034bde0bdec4bb7a4b36': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_v2.json') |
|
param_name_auto=str('4band_v2') |
|
if model_hash == 'e60a1e84803ce4efc0a6551206cc4b71': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100.json') |
|
param_name_auto=str('4band_44100') |
|
if model_hash == 'a82f14e75892e55e994376edbf0c8435': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100.json') |
|
param_name_auto=str('4band_44100') |
|
if model_hash == '6dd9eaa6f0420af9f1d403aaafa4cc06': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_v2_sn.json') |
|
param_name_auto=str('4band_v2_sn') |
|
if model_hash == '08611fb99bd59eaa79ad27c58d137727': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_v2_sn.json') |
|
param_name_auto=str('4band_v2_sn') |
|
if model_hash == '5c7bbca45a187e81abbbd351606164e5': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/3band_44100_msb2.json') |
|
param_name_auto=str('3band_44100_msb2') |
|
if model_hash == 'd6b2cb685a058a091e5e7098192d3233': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/3band_44100_msb2.json') |
|
param_name_auto=str('3band_44100_msb2') |
|
if model_hash == 'c1b9f38170a7c90e96f027992eb7c62b': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100.json') |
|
param_name_auto=str('4band_44100') |
|
if model_hash == 'c3448ec923fa0edf3d03a19e633faa53': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100.json') |
|
param_name_auto=str('4band_44100') |
|
if model_hash == '68aa2c8093d0080704b200d140f59e54': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/3band_44100.json') |
|
param_name_auto=str('3band_44100.json') |
|
if model_hash == 'fdc83be5b798e4bd29fe00fe6600e147': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/3band_44100_mid.json') |
|
param_name_auto=str('3band_44100_mid.json') |
|
if model_hash == '2ce34bc92fd57f55db16b7a4def3d745': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/3band_44100_mid.json') |
|
param_name_auto=str('3band_44100_mid.json') |
|
if model_hash == '52fdca89576f06cf4340b74a4730ee5f': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100.json') |
|
param_name_auto=str('4band_44100.json') |
|
if model_hash == '41191165b05d38fc77f072fa9e8e8a30': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100.json') |
|
param_name_auto=str('4band_44100.json') |
|
if model_hash == '89e83b511ad474592689e562d5b1f80e': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/2band_32000.json') |
|
param_name_auto=str('2band_32000.json') |
|
if model_hash == '0b954da81d453b716b114d6d7c95177f': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/2band_32000.json') |
|
param_name_auto=str('2band_32000.json') |
|
|
|
|
|
if model_hash == '6a00461c51c2920fd68937d4609ed6c8': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr16000_hl512.json') |
|
param_name_auto=str('1band_sr16000_hl512') |
|
if model_hash == '0ab504864d20f1bd378fe9c81ef37140': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr32000_hl512.json') |
|
param_name_auto=str('1band_sr32000_hl512') |
|
if model_hash == '7dd21065bf91c10f7fccb57d7d83b07f': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr32000_hl512.json') |
|
param_name_auto=str('1band_sr32000_hl512') |
|
if model_hash == '80ab74d65e515caa3622728d2de07d23': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr32000_hl512.json') |
|
param_name_auto=str('1band_sr32000_hl512') |
|
if model_hash == 'edc115e7fc523245062200c00caa847f': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr33075_hl384.json') |
|
param_name_auto=str('1band_sr33075_hl384') |
|
if model_hash == '28063e9f6ab5b341c5f6d3c67f2045b7': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr33075_hl384.json') |
|
param_name_auto=str('1band_sr33075_hl384') |
|
if model_hash == 'b58090534c52cbc3e9b5104bad666ef2': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512.json') |
|
param_name_auto=str('1band_sr44100_hl512') |
|
if model_hash == '0cdab9947f1b0928705f518f3c78ea8f': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512.json') |
|
param_name_auto=str('1band_sr44100_hl512') |
|
if model_hash == 'ae702fed0238afb5346db8356fe25f13': |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl1024.json') |
|
param_name_auto=str('1band_sr44100_hl1024') |
|
|
|
|
|
|
|
if '1band_sr16000_hl512' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr16000_hl512.json') |
|
param_name_auto=str('1band_sr16000_hl512') |
|
if '1band_sr32000_hl512' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr32000_hl512.json') |
|
param_name_auto=str('1band_sr32000_hl512') |
|
if '1band_sr33075_hl384' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr33075_hl384.json') |
|
param_name_auto=str('1band_sr33075_hl384') |
|
if '1band_sr44100_hl256' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl256.json') |
|
param_name_auto=str('1band_sr44100_hl256') |
|
if '1band_sr44100_hl512' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512.json') |
|
param_name_auto=str('1band_sr44100_hl512') |
|
if '1band_sr44100_hl1024' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl1024.json') |
|
param_name_auto=str('1band_sr44100_hl1024') |
|
|
|
|
|
if '2band_44100_lofi' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/2band_44100_lofi.json') |
|
param_name_auto=str('2band_44100_lofi') |
|
if '2band_32000' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/2band_32000.json') |
|
param_name_auto=str('2band_32000') |
|
if '2band_48000' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/2band_48000.json') |
|
param_name_auto=str('2band_48000') |
|
|
|
|
|
if '3band_44100' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/3band_44100.json') |
|
param_name_auto=str('3band_44100') |
|
if '3band_44100_mid' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/3band_44100_mid.json') |
|
param_name_auto=str('3band_44100_mid') |
|
if '3band_44100_msb2' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/3band_44100_msb2.json') |
|
param_name_auto=str('3band_44100_msb2') |
|
|
|
|
|
if '4band_44100' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100.json') |
|
param_name_auto=str('4band_44100') |
|
if '4band_44100_mid' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100_mid.json') |
|
param_name_auto=str('4band_44100_mid') |
|
if '4band_44100_msb' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100_msb.json') |
|
param_name_auto=str('4band_44100_msb') |
|
if '4band_44100_msb2' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100_msb2.json') |
|
param_name_auto=str('4band_44100_msb2') |
|
if '4band_44100_reverse' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100_reverse.json') |
|
param_name_auto=str('4band_44100_reverse') |
|
if '4band_44100_sw' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_44100_sw.json') |
|
param_name_auto=str('4band_44100_sw') |
|
if '4band_v2' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_v2.json') |
|
param_name_auto=str('4band_v2') |
|
if '4band_v2_sn' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/4band_v2_sn.json') |
|
param_name_auto=str('4band_v2_sn') |
|
if 'tmodelparam' in ModelName: |
|
model_params_auto=str('runtime/Lib/site-packages/uvr5_pack/lib_v5/modelparams/tmodelparam.json') |
|
param_name_auto=str('User Model Param Set') |
|
return param_name_auto , model_params_auto |
|
|