Baseline
Python Modules
- Baseline enhancement for CAD2 Task 1.
- Evaluation of the enhanced signals using HAAQI and Whisper.
Configuration Files
config.yaml
# Baseline configuration (Hydra / OmegaConf).
# `${...}` values are interpolations that resolve to other keys in this file.

# Dataset locations; everything is derived from `path.root`.
path:
  # `???` is the OmegaConf marker for a mandatory value: it must be supplied
  # (e.g. as a command-line override) before the config can be used.
  root: ???  # Set to the root of the dataset
  metadata_dir: ${path.root}/metadata
  music_dir: ${path.root}/audio
  musics_file: ${path.metadata_dir}/music.valid.json
  alphas_file: ${path.metadata_dir}/alpha.json
  listeners_file: ${path.metadata_dir}/listeners.valid.json
  enhancer_params_file: ${path.metadata_dir}/compressor_params.valid.json
  scenes_file: ${path.metadata_dir}/scene.valid.json
  scene_listeners_file: ${path.metadata_dir}/scene_listeners.valid.json
  # The folder name depends on the separator variant selected below.
  exp_folder: ./exp_${separator.causality}  # folder to store enhanced signals and final results

input_sample_rate: 44100  # sample rate of the input mixture
remix_sample_rate: 44100  # sample rate for the output remixed signal
HAAQI_sample_rate: 24000  # sample rate for computing HAAQI score

separator:
  causality: causal
  device: null
  separation:
    number_sources: 2
    segment: 6.0
    overlap: 0.1
    sample_rate: ${input_sample_rate}

enhancer:
  # [250, 500, 1000, 2000, 4000] * sqrt(2)
  crossover_frequencies: [353.55, 707.11, 1414.21, 2828.43, 5656.85]
  # NOTE(review): the lists below have six entries, presumably one per band
  # (five crossover frequencies -> six bands); confirm against the enhancer code.
  attack: [11, 11, 14, 13, 11, 11]
  release: [80, 80, 80, 80, 100, 100]
  threshold: [-30, -30, -30, -30, -30, -30]

soft_clip: false

evaluate:
  whisper_version: base.en
  set_random_seed: true
  small_test: false
  save_intermediate: false
  equiv_0db_spl: 100
  batch_size: 1  # Number of batches
  batch: 0  # Batch number to evaluate

# hydra config
hydra:
  run:
    # Hydra's run (output) directory is the experiment folder defined above.
    dir: ${path.exp_folder}
  job:
    chdir: true
48 chdir: True