Algorithm info:
sampling_rate: 44100
num_channels: 2
n_fft: 4096
window_length: 4096
hop_length: 1024
num_dual_path_blocks: 12
num_time_transfomrer: 1
num_freq_transformer: 1
mix_ln: false
hidden_size_list: [4, 32, 64, 128]
band_SR: [0.175, 0.392, 0.433]
band_strides: [1, 4, 16]
band_kernels: [3, 4, 16]
discriminator_stft_params: [[1024, 256, 1024], [2048, 512, 2048], [4096, 1024, 4096]]
discriminator_periods: [2, 3, 5, 7, 11]
mrd_loss_weight: 1.0
discriminator_activation: leakyrelu
batch_size: 2
patch_len: 66150 # 44100 * 1.5
spec_loss_weight: 2
feature_loss_weight: 2
generator_loss_weight: 1
discriminator_loss_type: "mse"
discriminator_update_prob: 0.33
Metrics:
Metric sdr for piano: 1.2623
Metric si_sdr for piano: -3.9742
Metric l1_freq for piano: 40.7182
Metric log_wmse for piano: 12.1095
Metric aura_stft for piano: 4.7100
Metric aura_mrstft for piano: 5.6396
Metric bleedless for piano: 11.5378
Metric fullness for piano: 15.0101
Metric sdr for other: 13.1501
Metric si_sdr for other: 12.9507
Metric l1_freq for other: 34.6559
Metric log_wmse for other: 11.8205
Metric aura_stft for other: 10.5951
Metric aura_mrstft for other: 19.4695
Metric bleedless for other: 33.2298
Metric fullness for other: 36.9717
Date added: 2025-02-11 |