-
Notifications
You must be signed in to change notification settings - Fork 39
/
Copy pathhparams.py
79 lines (67 loc) · 1.82 KB
/
hparams.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
from text import symbols
class hparams:
    """Static container for the project's hyperparameters.

    Every setting is a plain class attribute, so values can be read
    directly off the class without creating an instance.  The only
    computed entry is ``n_symbols``, which is taken from the length of
    ``symbols`` imported from the ``text`` module.
    """

    seed = 0

    # ---- Data parameters -------------------------------------------------
    text_cleaners = ["english_cleaners"]

    # ---- Audio -----------------------------------------------------------
    num_mels = 80
    # NOTE(review): 513 equals frame_length // 2 + 1 — presumably these two
    # must be kept in sync; confirm against the audio code.
    num_freq = 513
    sample_rate = 22050
    frame_shift = 256
    frame_length = 1024
    fmin = 0
    fmax = 8000
    power = 1.5
    gl_iters = 30

    # ---- Train -----------------------------------------------------------
    is_cuda = True
    pin_mem = True
    n_workers = 4
    prep = True
    pth = "lj-22k.pkl"
    lr = 2e-3
    betas = (0.9, 0.999)
    eps = 1e-6
    sch = True
    sch_step = 4000
    # Written as a float literal, so this value is 200000.0 (not an int).
    max_iter = 200e3
    batch_size = 16
    iters_per_log = 10
    iters_per_sample = 500
    iters_per_ckpt = 10000
    weight_decay = 1e-6
    grad_clip_thresh = 1.0
    eg_text = "OMAK is a thinking process which considers things always positively."

    # ---- Model parameters ------------------------------------------------
    # Derived from the imported symbol table rather than hard-coded.
    n_symbols = len(symbols)
    symbols_embedding_dim = 512

    # Encoder parameters
    encoder_kernel_size = 5
    encoder_n_convolutions = 3
    encoder_embedding_dim = 512

    # Decoder parameters
    n_frames_per_step = 3
    decoder_rnn_dim = 1024
    prenet_dim = 256
    max_decoder_ratio = 10
    gate_threshold = 0.5
    p_attention_dropout = 0.1
    p_decoder_dropout = 0.1

    # Attention parameters
    attention_rnn_dim = 1024
    attention_dim = 128

    # Location Layer parameters
    attention_location_n_filters = 32
    attention_location_kernel_size = 31

    # Mel-post processing network parameters
    postnet_embedding_dim = 512
    postnet_kernel_size = 5
    postnet_n_convolutions = 5