-
Notifications
You must be signed in to change notification settings - Fork 1
/
config.py
32 lines (32 loc) · 1.63 KB
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Ordered list of per-entry convolution settings. Every entry is a dict with
# the same seven keys, in the same order:
#   filters, repeat, kernel, stride, dilation, residual, separable
# NOTE(review): presumably consumed by the model builder to create one block
# per entry (the run name in `params` suggests QuartzNet) — confirm against
# the model code.
model_config = [
    {'filters': filters, 'repeat': repeat, 'kernel': kernel, 'stride': stride,
     'dilation': dilation, 'residual': residual, 'separable': separable}
    for filters, repeat, kernel, stride, dilation, residual, separable in (
        # filters, repeat, kernel, stride, dilation, residual, separable
        (256, 1, 33, 2, 1, False, True),   # only entry with stride 2
        (256, 5, 33, 1, 1, True, True),
        (256, 5, 39, 1, 1, True, True),
        (512, 5, 51, 1, 1, True, True),
        (512, 5, 63, 1, 1, True, True),
        (512, 5, 75, 1, 1, True, True),
        (512, 1, 87, 1, 2, False, True),   # only entry with dilation 2
        (1024, 1, 1, 1, 1, False, False),  # only non-separable entry
    )
]
# Flat dictionary of run settings, looked up by string key.
# NOTE(review): the grouping comments below are inferred from the key names
# only — confirm each against the code that reads `params`.
params = dict(
    # Audio / feature extraction (presumably sample rates are in Hz).
    num_features=64,
    sample_rate=16000,
    original_sample_rate=22050,
    # Data loading and optimisation.
    batch_size=32,
    num_workers=8,
    lr=0.005,
    num_epochs=100,
    # Augmentation settings (units of the shift bounds are not visible here).
    noise_variance=0.01,
    min_time_stretch=0.9,
    max_time_stretch=1.1,
    min_shift=-3,
    max_shift=3,
    time_masking=1,
    # Experiment tracking name.
    wandb_name="Quartznet_LJSpeech",
    clip_grad_norm=15,
    # Tokenizer settings.
    vocab_size=120,
    bpe_model="bpe_model",
    # Checkpoint / resume settings.
    from_pretrained=False,
    model_path="model90.pth",
    start_epoch=40,
    # Single audio file path; presumably used for a one-off inference check.
    path_to_file="LJ001-0004.wav",
)