Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
ModelZoo
Retrieval-based-Voice-Conversion-WebUI_pytorch
Commits
9867304a
Commit
9867304a
authored
Jul 23, 2024
by
chenzk
Browse files
v1.0
parents
Pipeline
#1408
canceled with stages
Changes
217
Pipelines
1
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
945 additions
and
0 deletions
+945
-0
infer/lib/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl256.json
...lib/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl256.json
+20
-0
infer/lib/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512.json
...lib/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512.json
+20
-0
infer/lib/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512_cut.json
...uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512_cut.json
+20
-0
infer/lib/uvr5_pack/lib_v5/modelparams/2band_32000.json
infer/lib/uvr5_pack/lib_v5/modelparams/2band_32000.json
+30
-0
infer/lib/uvr5_pack/lib_v5/modelparams/2band_44100_lofi.json
infer/lib/uvr5_pack/lib_v5/modelparams/2band_44100_lofi.json
+30
-0
infer/lib/uvr5_pack/lib_v5/modelparams/2band_48000.json
infer/lib/uvr5_pack/lib_v5/modelparams/2band_48000.json
+31
-0
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100.json
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100.json
+42
-0
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100_mid.json
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100_mid.json
+43
-0
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100_msb2.json
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100_msb2.json
+43
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100.json
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100.json
+54
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_mid.json
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_mid.json
+55
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_msb.json
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_msb.json
+56
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_msb2.json
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_msb2.json
+56
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_reverse.json
...lib/uvr5_pack/lib_v5/modelparams/4band_44100_reverse.json
+56
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_sw.json
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_sw.json
+56
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v2.json
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v2.json
+55
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v2_sn.json
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v2_sn.json
+56
-0
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v3.json
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v3.json
+55
-0
infer/lib/uvr5_pack/lib_v5/modelparams/ensemble.json
infer/lib/uvr5_pack/lib_v5/modelparams/ensemble.json
+44
-0
infer/lib/uvr5_pack/lib_v5/nets.py
infer/lib/uvr5_pack/lib_v5/nets.py
+123
-0
No files found.
infer/lib/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl256.json
0 → 100644
View file @
9867304a
{
"bins"
:
256
,
"unstable_bins"
:
0
,
"reduction_bins"
:
0
,
"band"
:
{
"1"
:
{
"sr"
:
44100
,
"hl"
:
256
,
"n_fft"
:
512
,
"crop_start"
:
0
,
"crop_stop"
:
256
,
"hpf_start"
:
-1
,
"res_type"
:
"sinc_best"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
256
,
"pre_filter_stop"
:
256
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512.json
0 → 100644
View file @
9867304a
{
"bins"
:
1024
,
"unstable_bins"
:
0
,
"reduction_bins"
:
0
,
"band"
:
{
"1"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
2048
,
"crop_start"
:
0
,
"crop_stop"
:
1024
,
"hpf_start"
:
-1
,
"res_type"
:
"sinc_best"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
1023
,
"pre_filter_stop"
:
1024
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/1band_sr44100_hl512_cut.json
0 → 100644
View file @
9867304a
{
"bins"
:
1024
,
"unstable_bins"
:
0
,
"reduction_bins"
:
0
,
"band"
:
{
"1"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
2048
,
"crop_start"
:
0
,
"crop_stop"
:
700
,
"hpf_start"
:
-1
,
"res_type"
:
"sinc_best"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
1023
,
"pre_filter_stop"
:
700
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/2band_32000.json
0 → 100644
View file @
9867304a
{
"bins"
:
768
,
"unstable_bins"
:
7
,
"reduction_bins"
:
705
,
"band"
:
{
"1"
:
{
"sr"
:
6000
,
"hl"
:
66
,
"n_fft"
:
512
,
"crop_start"
:
0
,
"crop_stop"
:
240
,
"lpf_start"
:
60
,
"lpf_stop"
:
118
,
"res_type"
:
"sinc_fastest"
},
"2"
:
{
"sr"
:
32000
,
"hl"
:
352
,
"n_fft"
:
1024
,
"crop_start"
:
22
,
"crop_stop"
:
505
,
"hpf_start"
:
44
,
"hpf_stop"
:
23
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
32000
,
"pre_filter_start"
:
710
,
"pre_filter_stop"
:
731
}
infer/lib/uvr5_pack/lib_v5/modelparams/2band_44100_lofi.json
0 → 100644
View file @
9867304a
{
"bins"
:
512
,
"unstable_bins"
:
7
,
"reduction_bins"
:
510
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
160
,
"n_fft"
:
768
,
"crop_start"
:
0
,
"crop_stop"
:
192
,
"lpf_start"
:
41
,
"lpf_stop"
:
139
,
"res_type"
:
"sinc_fastest"
},
"2"
:
{
"sr"
:
44100
,
"hl"
:
640
,
"n_fft"
:
1024
,
"crop_start"
:
10
,
"crop_stop"
:
320
,
"hpf_start"
:
47
,
"hpf_stop"
:
15
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
510
,
"pre_filter_stop"
:
512
}
infer/lib/uvr5_pack/lib_v5/modelparams/2band_48000.json
0 → 100644
View file @
9867304a
{
"bins"
:
768
,
"unstable_bins"
:
7
,
"reduction_bins"
:
705
,
"band"
:
{
"1"
:
{
"sr"
:
6000
,
"hl"
:
66
,
"n_fft"
:
512
,
"crop_start"
:
0
,
"crop_stop"
:
240
,
"lpf_start"
:
60
,
"lpf_stop"
:
240
,
"res_type"
:
"sinc_fastest"
},
"2"
:
{
"sr"
:
48000
,
"hl"
:
528
,
"n_fft"
:
1536
,
"crop_start"
:
22
,
"crop_stop"
:
505
,
"hpf_start"
:
82
,
"hpf_stop"
:
22
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
48000
,
"pre_filter_start"
:
710
,
"pre_filter_stop"
:
731
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100.json
0 → 100644
View file @
9867304a
{
"bins"
:
768
,
"unstable_bins"
:
5
,
"reduction_bins"
:
733
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
768
,
"crop_start"
:
0
,
"crop_stop"
:
278
,
"lpf_start"
:
28
,
"lpf_stop"
:
140
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
22050
,
"hl"
:
256
,
"n_fft"
:
768
,
"crop_start"
:
14
,
"crop_stop"
:
322
,
"hpf_start"
:
70
,
"hpf_stop"
:
14
,
"lpf_start"
:
283
,
"lpf_stop"
:
314
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
768
,
"crop_start"
:
131
,
"crop_stop"
:
313
,
"hpf_start"
:
154
,
"hpf_stop"
:
141
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
757
,
"pre_filter_stop"
:
768
}
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100_mid.json
0 → 100644
View file @
9867304a
{
"mid_side"
:
true
,
"bins"
:
768
,
"unstable_bins"
:
5
,
"reduction_bins"
:
733
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
768
,
"crop_start"
:
0
,
"crop_stop"
:
278
,
"lpf_start"
:
28
,
"lpf_stop"
:
140
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
22050
,
"hl"
:
256
,
"n_fft"
:
768
,
"crop_start"
:
14
,
"crop_stop"
:
322
,
"hpf_start"
:
70
,
"hpf_stop"
:
14
,
"lpf_start"
:
283
,
"lpf_stop"
:
314
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
768
,
"crop_start"
:
131
,
"crop_stop"
:
313
,
"hpf_start"
:
154
,
"hpf_stop"
:
141
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
757
,
"pre_filter_stop"
:
768
}
infer/lib/uvr5_pack/lib_v5/modelparams/3band_44100_msb2.json
0 → 100644
View file @
9867304a
{
"mid_side_b2"
:
true
,
"bins"
:
640
,
"unstable_bins"
:
7
,
"reduction_bins"
:
565
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
108
,
"n_fft"
:
1024
,
"crop_start"
:
0
,
"crop_stop"
:
187
,
"lpf_start"
:
92
,
"lpf_stop"
:
186
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
22050
,
"hl"
:
216
,
"n_fft"
:
768
,
"crop_start"
:
0
,
"crop_stop"
:
212
,
"hpf_start"
:
68
,
"hpf_stop"
:
34
,
"lpf_start"
:
174
,
"lpf_stop"
:
209
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
44100
,
"hl"
:
432
,
"n_fft"
:
640
,
"crop_start"
:
66
,
"crop_stop"
:
307
,
"hpf_start"
:
86
,
"hpf_stop"
:
72
,
"res_type"
:
"kaiser_fast"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
639
,
"pre_filter_stop"
:
640
}
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100.json
0 → 100644
View file @
9867304a
{
"bins"
:
768
,
"unstable_bins"
:
7
,
"reduction_bins"
:
668
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
1024
,
"crop_start"
:
0
,
"crop_stop"
:
186
,
"lpf_start"
:
37
,
"lpf_stop"
:
73
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
512
,
"crop_start"
:
4
,
"crop_stop"
:
185
,
"hpf_start"
:
36
,
"hpf_stop"
:
18
,
"lpf_start"
:
93
,
"lpf_stop"
:
185
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
22050
,
"hl"
:
256
,
"n_fft"
:
512
,
"crop_start"
:
46
,
"crop_stop"
:
186
,
"hpf_start"
:
93
,
"hpf_stop"
:
46
,
"lpf_start"
:
164
,
"lpf_stop"
:
186
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
768
,
"crop_start"
:
121
,
"crop_stop"
:
382
,
"hpf_start"
:
138
,
"hpf_stop"
:
123
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
740
,
"pre_filter_stop"
:
768
}
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_mid.json
0 → 100644
View file @
9867304a
{
"bins"
:
768
,
"unstable_bins"
:
7
,
"mid_side"
:
true
,
"reduction_bins"
:
668
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
1024
,
"crop_start"
:
0
,
"crop_stop"
:
186
,
"lpf_start"
:
37
,
"lpf_stop"
:
73
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
512
,
"crop_start"
:
4
,
"crop_stop"
:
185
,
"hpf_start"
:
36
,
"hpf_stop"
:
18
,
"lpf_start"
:
93
,
"lpf_stop"
:
185
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
22050
,
"hl"
:
256
,
"n_fft"
:
512
,
"crop_start"
:
46
,
"crop_stop"
:
186
,
"hpf_start"
:
93
,
"hpf_stop"
:
46
,
"lpf_start"
:
164
,
"lpf_stop"
:
186
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
768
,
"crop_start"
:
121
,
"crop_stop"
:
382
,
"hpf_start"
:
138
,
"hpf_stop"
:
123
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
740
,
"pre_filter_stop"
:
768
}
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_msb.json
0 → 100644
View file @
9867304a
{
"mid_side_b"
:
true
,
"bins"
:
768
,
"unstable_bins"
:
7
,
"reduction_bins"
:
668
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
1024
,
"crop_start"
:
0
,
"crop_stop"
:
186
,
"lpf_start"
:
37
,
"lpf_stop"
:
73
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
512
,
"crop_start"
:
4
,
"crop_stop"
:
185
,
"hpf_start"
:
36
,
"hpf_stop"
:
18
,
"lpf_start"
:
93
,
"lpf_stop"
:
185
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
22050
,
"hl"
:
256
,
"n_fft"
:
512
,
"crop_start"
:
46
,
"crop_stop"
:
186
,
"hpf_start"
:
93
,
"hpf_stop"
:
46
,
"lpf_start"
:
164
,
"lpf_stop"
:
186
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
768
,
"crop_start"
:
121
,
"crop_stop"
:
382
,
"hpf_start"
:
138
,
"hpf_stop"
:
123
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
740
,
"pre_filter_stop"
:
768
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_msb2.json
0 → 100644
View file @
9867304a
{
"mid_side_b"
:
true
,
"bins"
:
768
,
"unstable_bins"
:
7
,
"reduction_bins"
:
668
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
1024
,
"crop_start"
:
0
,
"crop_stop"
:
186
,
"lpf_start"
:
37
,
"lpf_stop"
:
73
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
512
,
"crop_start"
:
4
,
"crop_stop"
:
185
,
"hpf_start"
:
36
,
"hpf_stop"
:
18
,
"lpf_start"
:
93
,
"lpf_stop"
:
185
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
22050
,
"hl"
:
256
,
"n_fft"
:
512
,
"crop_start"
:
46
,
"crop_stop"
:
186
,
"hpf_start"
:
93
,
"hpf_stop"
:
46
,
"lpf_start"
:
164
,
"lpf_stop"
:
186
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
768
,
"crop_start"
:
121
,
"crop_stop"
:
382
,
"hpf_start"
:
138
,
"hpf_stop"
:
123
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
740
,
"pre_filter_stop"
:
768
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_reverse.json
0 → 100644
View file @
9867304a
{
"reverse"
:
true
,
"bins"
:
768
,
"unstable_bins"
:
7
,
"reduction_bins"
:
668
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
1024
,
"crop_start"
:
0
,
"crop_stop"
:
186
,
"lpf_start"
:
37
,
"lpf_stop"
:
73
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
512
,
"crop_start"
:
4
,
"crop_stop"
:
185
,
"hpf_start"
:
36
,
"hpf_stop"
:
18
,
"lpf_start"
:
93
,
"lpf_stop"
:
185
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
22050
,
"hl"
:
256
,
"n_fft"
:
512
,
"crop_start"
:
46
,
"crop_stop"
:
186
,
"hpf_start"
:
93
,
"hpf_stop"
:
46
,
"lpf_start"
:
164
,
"lpf_stop"
:
186
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
768
,
"crop_start"
:
121
,
"crop_stop"
:
382
,
"hpf_start"
:
138
,
"hpf_stop"
:
123
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
740
,
"pre_filter_stop"
:
768
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/4band_44100_sw.json
0 → 100644
View file @
9867304a
{
"stereo_w"
:
true
,
"bins"
:
768
,
"unstable_bins"
:
7
,
"reduction_bins"
:
668
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
1024
,
"crop_start"
:
0
,
"crop_stop"
:
186
,
"lpf_start"
:
37
,
"lpf_stop"
:
73
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
11025
,
"hl"
:
128
,
"n_fft"
:
512
,
"crop_start"
:
4
,
"crop_stop"
:
185
,
"hpf_start"
:
36
,
"hpf_stop"
:
18
,
"lpf_start"
:
93
,
"lpf_stop"
:
185
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
22050
,
"hl"
:
256
,
"n_fft"
:
512
,
"crop_start"
:
46
,
"crop_stop"
:
186
,
"hpf_start"
:
93
,
"hpf_stop"
:
46
,
"lpf_start"
:
164
,
"lpf_stop"
:
186
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
512
,
"n_fft"
:
768
,
"crop_start"
:
121
,
"crop_stop"
:
382
,
"hpf_start"
:
138
,
"hpf_stop"
:
123
,
"res_type"
:
"sinc_medium"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
740
,
"pre_filter_stop"
:
768
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v2.json
0 → 100644
View file @
9867304a
{
"bins"
:
672
,
"unstable_bins"
:
8
,
"reduction_bins"
:
637
,
"band"
:
{
"1"
:
{
"sr"
:
7350
,
"hl"
:
80
,
"n_fft"
:
640
,
"crop_start"
:
0
,
"crop_stop"
:
85
,
"lpf_start"
:
25
,
"lpf_stop"
:
53
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
7350
,
"hl"
:
80
,
"n_fft"
:
320
,
"crop_start"
:
4
,
"crop_stop"
:
87
,
"hpf_start"
:
25
,
"hpf_stop"
:
12
,
"lpf_start"
:
31
,
"lpf_stop"
:
62
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
14700
,
"hl"
:
160
,
"n_fft"
:
512
,
"crop_start"
:
17
,
"crop_stop"
:
216
,
"hpf_start"
:
48
,
"hpf_stop"
:
24
,
"lpf_start"
:
139
,
"lpf_stop"
:
210
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
480
,
"n_fft"
:
960
,
"crop_start"
:
78
,
"crop_stop"
:
383
,
"hpf_start"
:
130
,
"hpf_stop"
:
86
,
"res_type"
:
"kaiser_fast"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
668
,
"pre_filter_stop"
:
672
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v2_sn.json
0 → 100644
View file @
9867304a
{
"bins"
:
672
,
"unstable_bins"
:
8
,
"reduction_bins"
:
637
,
"band"
:
{
"1"
:
{
"sr"
:
7350
,
"hl"
:
80
,
"n_fft"
:
640
,
"crop_start"
:
0
,
"crop_stop"
:
85
,
"lpf_start"
:
25
,
"lpf_stop"
:
53
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
7350
,
"hl"
:
80
,
"n_fft"
:
320
,
"crop_start"
:
4
,
"crop_stop"
:
87
,
"hpf_start"
:
25
,
"hpf_stop"
:
12
,
"lpf_start"
:
31
,
"lpf_stop"
:
62
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
14700
,
"hl"
:
160
,
"n_fft"
:
512
,
"crop_start"
:
17
,
"crop_stop"
:
216
,
"hpf_start"
:
48
,
"hpf_stop"
:
24
,
"lpf_start"
:
139
,
"lpf_stop"
:
210
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
480
,
"n_fft"
:
960
,
"crop_start"
:
78
,
"crop_stop"
:
383
,
"hpf_start"
:
130
,
"hpf_stop"
:
86
,
"convert_channels"
:
"stereo_n"
,
"res_type"
:
"kaiser_fast"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
668
,
"pre_filter_stop"
:
672
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/4band_v3.json
0 → 100644
View file @
9867304a
{
"bins"
:
672
,
"unstable_bins"
:
8
,
"reduction_bins"
:
530
,
"band"
:
{
"1"
:
{
"sr"
:
7350
,
"hl"
:
80
,
"n_fft"
:
640
,
"crop_start"
:
0
,
"crop_stop"
:
85
,
"lpf_start"
:
25
,
"lpf_stop"
:
53
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
7350
,
"hl"
:
80
,
"n_fft"
:
320
,
"crop_start"
:
4
,
"crop_stop"
:
87
,
"hpf_start"
:
25
,
"hpf_stop"
:
12
,
"lpf_start"
:
31
,
"lpf_stop"
:
62
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
14700
,
"hl"
:
160
,
"n_fft"
:
512
,
"crop_start"
:
17
,
"crop_stop"
:
216
,
"hpf_start"
:
48
,
"hpf_stop"
:
24
,
"lpf_start"
:
139
,
"lpf_stop"
:
210
,
"res_type"
:
"polyphase"
},
"4"
:
{
"sr"
:
44100
,
"hl"
:
480
,
"n_fft"
:
960
,
"crop_start"
:
78
,
"crop_stop"
:
383
,
"hpf_start"
:
130
,
"hpf_stop"
:
86
,
"res_type"
:
"kaiser_fast"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
668
,
"pre_filter_stop"
:
672
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/modelparams/ensemble.json
0 → 100644
View file @
9867304a
{
"mid_side_b2"
:
true
,
"bins"
:
1280
,
"unstable_bins"
:
7
,
"reduction_bins"
:
565
,
"band"
:
{
"1"
:
{
"sr"
:
11025
,
"hl"
:
108
,
"n_fft"
:
2048
,
"crop_start"
:
0
,
"crop_stop"
:
374
,
"lpf_start"
:
92
,
"lpf_stop"
:
186
,
"res_type"
:
"polyphase"
},
"2"
:
{
"sr"
:
22050
,
"hl"
:
216
,
"n_fft"
:
1536
,
"crop_start"
:
0
,
"crop_stop"
:
424
,
"hpf_start"
:
68
,
"hpf_stop"
:
34
,
"lpf_start"
:
348
,
"lpf_stop"
:
418
,
"res_type"
:
"polyphase"
},
"3"
:
{
"sr"
:
44100
,
"hl"
:
432
,
"n_fft"
:
1280
,
"crop_start"
:
132
,
"crop_stop"
:
614
,
"hpf_start"
:
172
,
"hpf_stop"
:
144
,
"res_type"
:
"polyphase"
}
},
"sr"
:
44100
,
"pre_filter_start"
:
1280
,
"pre_filter_stop"
:
1280
}
\ No newline at end of file
infer/lib/uvr5_pack/lib_v5/nets.py
0 → 100644
View file @
9867304a
import
layers
import
torch
import
torch.nn.functional
as
F
from
torch
import
nn
from
.
import
spec_utils
class
BaseASPPNet
(
nn
.
Module
):
def
__init__
(
self
,
nin
,
ch
,
dilations
=
(
4
,
8
,
16
)):
super
(
BaseASPPNet
,
self
).
__init__
()
self
.
enc1
=
layers
.
Encoder
(
nin
,
ch
,
3
,
2
,
1
)
self
.
enc2
=
layers
.
Encoder
(
ch
,
ch
*
2
,
3
,
2
,
1
)
self
.
enc3
=
layers
.
Encoder
(
ch
*
2
,
ch
*
4
,
3
,
2
,
1
)
self
.
enc4
=
layers
.
Encoder
(
ch
*
4
,
ch
*
8
,
3
,
2
,
1
)
self
.
aspp
=
layers
.
ASPPModule
(
ch
*
8
,
ch
*
16
,
dilations
)
self
.
dec4
=
layers
.
Decoder
(
ch
*
(
8
+
16
),
ch
*
8
,
3
,
1
,
1
)
self
.
dec3
=
layers
.
Decoder
(
ch
*
(
4
+
8
),
ch
*
4
,
3
,
1
,
1
)
self
.
dec2
=
layers
.
Decoder
(
ch
*
(
2
+
4
),
ch
*
2
,
3
,
1
,
1
)
self
.
dec1
=
layers
.
Decoder
(
ch
*
(
1
+
2
),
ch
,
3
,
1
,
1
)
def
__call__
(
self
,
x
):
h
,
e1
=
self
.
enc1
(
x
)
h
,
e2
=
self
.
enc2
(
h
)
h
,
e3
=
self
.
enc3
(
h
)
h
,
e4
=
self
.
enc4
(
h
)
h
=
self
.
aspp
(
h
)
h
=
self
.
dec4
(
h
,
e4
)
h
=
self
.
dec3
(
h
,
e3
)
h
=
self
.
dec2
(
h
,
e2
)
h
=
self
.
dec1
(
h
,
e1
)
return
h
class
CascadedASPPNet
(
nn
.
Module
):
def
__init__
(
self
,
n_fft
):
super
(
CascadedASPPNet
,
self
).
__init__
()
self
.
stg1_low_band_net
=
BaseASPPNet
(
2
,
16
)
self
.
stg1_high_band_net
=
BaseASPPNet
(
2
,
16
)
self
.
stg2_bridge
=
layers
.
Conv2DBNActiv
(
18
,
8
,
1
,
1
,
0
)
self
.
stg2_full_band_net
=
BaseASPPNet
(
8
,
16
)
self
.
stg3_bridge
=
layers
.
Conv2DBNActiv
(
34
,
16
,
1
,
1
,
0
)
self
.
stg3_full_band_net
=
BaseASPPNet
(
16
,
32
)
self
.
out
=
nn
.
Conv2d
(
32
,
2
,
1
,
bias
=
False
)
self
.
aux1_out
=
nn
.
Conv2d
(
16
,
2
,
1
,
bias
=
False
)
self
.
aux2_out
=
nn
.
Conv2d
(
16
,
2
,
1
,
bias
=
False
)
self
.
max_bin
=
n_fft
//
2
self
.
output_bin
=
n_fft
//
2
+
1
self
.
offset
=
128
def
forward
(
self
,
x
,
aggressiveness
=
None
):
mix
=
x
.
detach
()
x
=
x
.
clone
()
x
=
x
[:,
:,
:
self
.
max_bin
]
bandw
=
x
.
size
()[
2
]
//
2
aux1
=
torch
.
cat
(
[
self
.
stg1_low_band_net
(
x
[:,
:,
:
bandw
]),
self
.
stg1_high_band_net
(
x
[:,
:,
bandw
:]),
],
dim
=
2
,
)
h
=
torch
.
cat
([
x
,
aux1
],
dim
=
1
)
aux2
=
self
.
stg2_full_band_net
(
self
.
stg2_bridge
(
h
))
h
=
torch
.
cat
([
x
,
aux1
,
aux2
],
dim
=
1
)
h
=
self
.
stg3_full_band_net
(
self
.
stg3_bridge
(
h
))
mask
=
torch
.
sigmoid
(
self
.
out
(
h
))
mask
=
F
.
pad
(
input
=
mask
,
pad
=
(
0
,
0
,
0
,
self
.
output_bin
-
mask
.
size
()[
2
]),
mode
=
"replicate"
,
)
if
self
.
training
:
aux1
=
torch
.
sigmoid
(
self
.
aux1_out
(
aux1
))
aux1
=
F
.
pad
(
input
=
aux1
,
pad
=
(
0
,
0
,
0
,
self
.
output_bin
-
aux1
.
size
()[
2
]),
mode
=
"replicate"
,
)
aux2
=
torch
.
sigmoid
(
self
.
aux2_out
(
aux2
))
aux2
=
F
.
pad
(
input
=
aux2
,
pad
=
(
0
,
0
,
0
,
self
.
output_bin
-
aux2
.
size
()[
2
]),
mode
=
"replicate"
,
)
return
mask
*
mix
,
aux1
*
mix
,
aux2
*
mix
else
:
if
aggressiveness
:
mask
[:,
:,
:
aggressiveness
[
"split_bin"
]]
=
torch
.
pow
(
mask
[:,
:,
:
aggressiveness
[
"split_bin"
]],
1
+
aggressiveness
[
"value"
]
/
3
,
)
mask
[:,
:,
aggressiveness
[
"split_bin"
]
:]
=
torch
.
pow
(
mask
[:,
:,
aggressiveness
[
"split_bin"
]
:],
1
+
aggressiveness
[
"value"
],
)
return
mask
*
mix
def
predict
(
self
,
x_mag
,
aggressiveness
=
None
):
h
=
self
.
forward
(
x_mag
,
aggressiveness
)
if
self
.
offset
>
0
:
h
=
h
[:,
:,
:,
self
.
offset
:
-
self
.
offset
]
assert
h
.
size
()[
3
]
>
0
return
h
Prev
1
…
4
5
6
7
8
9
10
11
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment