Algorithm info:
sampling_rate: 44100
num_channels: 2
n_fft: 4096
window_length: 4096
hop_length: 1024
num_dual_path_blocks: 6
num_time_transfomrer: 1
num_freq_transformer: 1
mix_ln: false
hidden_size_list: [4, 32, 64, 128]
band_SR: [0.225, 0.372, 0.403]
band_strides: [1, 4, 16]
band_kernels: [3, 4, 16]
discriminator_stft_params: [[1024, 256, 1024], [2048, 512, 2048], [4096, 1024, 4096]]
discriminator_periods: [2, 3, 5, 7, 11]
mrd_loss_weight: 1.0
discriminator_activation: leakyrelu
batch_size: 2
patch_len: 66150 # 44100 * 1.5
spec_loss_weight: 2
feature_loss_weight: 2
generator_loss_weight: 1
discriminator_loss_type: "mse"
discriminator_update_prob: 0.33
Metrics:
Metric sdr for piano: 0.7394
Metric si_sdr for piano: -3.8102
Metric l1_freq for piano: 40.0740
Metric log_wmse for piano: 11.7046
Metric aura_stft for piano: 4.9026
Metric aura_mrstft for piano: 5.9312
Metric bleedless for piano: 12.2979
Metric fullness for piano: 15.1994
Metric sdr for other: 12.6939
Metric si_sdr for other: 12.5368
Metric l1_freq for other: 33.5813
Metric log_wmse for other: 11.4578
Metric aura_stft for other: 9.7875
Metric aura_mrstft for other: 18.1022
Metric bleedless for other: 33.8249
Metric fullness for other: 35.6829
Date added: 2025-02-11 |