forked from acids-ircam/RAVE
-
Notifications
You must be signed in to change notification settings - Fork 1
/
defaults.ini
109 lines (71 loc) · 1.38 KB
/
defaults.ini
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
[DEFAULTS]
# Default values for the run options below. Comments marked NOTE(review) are
# reviewer assumptions for keys that were previously undocumented ("IDK");
# confirm them against the code that reads this file before relying on them.

# name of the run. don't leave this blank
# (the default below is the placeholder None, so it is expected to be overridden)
name = None
# batch size
batch = 8
# random seed
seed = 42
# accelerate start method
# NOTE(review): value is written with double quotes; whether the quotes are
# stripped depends on how the consuming script parses this file — confirm
start_method = "forkserver"
# list (w/o brackets) of augmentation transforms (in audiodata.py) to apply
augs = PadCrop(sample_size), PhaseFlipper()
# NOTE(review): undocumented; presumably the number of channels/bands the model
# operates on — confirm
data_size = 16
# NOTE(review): undocumented; presumably the base channel width of the model — confirm
capacity = 32
# NOTE(review): undocumented; presumably the dimensionality of the latent space — confirm
latent_size = 128
# NOTE(review): undocumented; presumably per-layer resampling ratios.
# Unlike augs, this list is written WITH brackets.
ratios = [4, 4, 2, 2, 2]
# NOTE(review): undocumented; purpose not evident from this file — confirm
taylor_degrees = 0
# NOTE(review): undocumented; presumably whether layers use a bias term — confirm
bias = True
# NOTE(review): undocumented; presumably toggles a low-/no-latency model variant — confirm
no_latency = False
# NOTE(review): undocumented; presumably the lower bound of the KL loss weight — confirm
min_kl = 1e-4
# NOTE(review): undocumented; presumably the upper bound of the KL loss weight — confirm
max_kl = 1e-1
# NOTE(review): undocumented; presumably 0 means the latent is not cropped — confirm
cropped_latent_size = 0
# NOTE(review): undocumented; presumably enables a feature-matching loss — confirm
feature_match = True
# NOTE(review): undocumented; presumably a stride used by the loudness computation — confirm
loud_stride = 1
# NOTE(review): undocumented; presumably enables the noise-related part of the
# model configured by noise_ratios / noise_bands — confirm
use_noise = True
# NOTE(review): undocumented; presumably resampling ratios for the noise part
# of the model (list written WITH brackets) — confirm
noise_ratios = [4, 4, 4]
# NOTE(review): undocumented; presumably the number of noise bands — confirm
noise_bands = 5
# NOTE(review): undocumented; the d_ prefix presumably refers to the
# discriminator (here: its base capacity) — confirm
d_capacity = 16
# NOTE(review): undocumented; presumably the discriminator's channel multiplier — confirm
d_multiplier = 4
# NOTE(review): undocumented; presumably the number of discriminator layers — confirm
d_n_layers = 4
# NOTE(review): undocumented; presumably a number of warm-up steps before a
# later training phase starts — confirm
warmup = 1000000
# NOTE(review): undocumented; presumably selects the adversarial loss variant.
# Value is written with double quotes (see start_method) — confirm
mode = "hinge"
# UNUSED NOW. where preprocessed audio is/will be stored (left in so scripts don't break)
preprocessed = None
# where original-audio dataset is stored
wav = None
# sample rate in Hz
sr = 48000
# how long each 'chunk' of audio is
# NOTE(review): presumably measured in samples — confirm
n_signal = 65536
# NOTE(review): undocumented; presumably the maximum number of training steps — confirm
max_steps = 2000000
# how often (in steps) to perform validation measures
val_every = 10000
# how often to save a checkpoint
# NOTE(review): presumably also in steps, like val_every — confirm
checkpoint_every = 25000
# name of checkpoint file
ckpt = None
# list of transformations (as a string)
# The expression references args.n_signal and np, so those names must be
# available wherever the consuming script interprets this string.
transforms = [RandomCrop(args.n_signal), Dequantize(16), lambda x: x.astype(np.float32)]
# fraction of total dataset to use
load_frac = 1.0