alibabasglab committed on
Commit
5245e8c
·
verified ·
1 Parent(s): 50e06fb

Upload 2 files

Browse files
config/inference/MossFormer2_SR_48K.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "resblock": "1",
3
+ "num_gpus": 1,
4
+ "batch_size": 2,
5
+ "learning_rate": 0.0001,
6
+ "learning_rate_mossformer": 0.0005,
7
+ "adam_b1": 0.8,
8
+ "adam_b2": 0.99,
9
+ "lr_decay": 0.999,
10
+ "seed": 1234,
11
+ "upsample_rates": [8, 8, 2, 2],
12
+ "upsample_kernel_sizes": [16, 16, 4, 4],
13
+ "upsample_initial_channel": 1024,
14
+ "resblock_kernel_sizes": [3, 7, 11],
15
+ "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]],
16
+ "segment_size": 24576,
17
+ "num_mels": 80,
18
+ "num_freq": 1025,
19
+ "n_fft": 1024,
20
+ "hop_size": 256,
21
+ "win_size": 1024,
22
+ "sampling_rate": 48000,
23
+ "fmin": 0,
24
+ "fmax": 8000,
25
+ "fmax_for_loss": null,
26
+ "num_workers": 4,
27
+ "dist_config": {
28
+ "dist_backend": "nccl",
29
+ "dist_url": "tcp://localhost:54321",
30
+ "world_size": 1
31
+ }
32
+ }
config/inference/MossFormer2_SR_48K.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Inference configuration for MossFormer2_SR_48K (YAML; not a shell script)
2
+ mode: 'inference'
3
+ config_json: "config/inference/MossFormer2_SR_48K.json"
4
+ use_cuda: 1 # 1 for True, 0 for False
5
+ num_gpu: 1
6
+ sampling_rate: 48000
7
+ network: "MossFormer2_SR_48K" ##network type
8
+ checkpoint_dir: "checkpoints/MossFormer2_SR_48K"
9
+
10
+ # input_path: accepts a directory of wav files, a wav .scp list file, or a single wav file
11
+ input_path: "samples/scp/cv_demand_testset_16k.scp"
12
+ output_dir: "outputs/MossFormer2_SR_48K"
13
+
14
+ # decode parameters
15
+ one_time_decode_length: 20 # maximum audio length (seconds) for one-pass decoding; longer audio is decoded in segments
16
+ decode_window: 4 # presumably the window length (seconds) of each segment in segmented decoding - TODO confirm against the decoder