-
Notifications
You must be signed in to change notification settings - Fork 0
/
experiment_config.json
194 lines (194 loc) · 6.2 KB
/
experiment_config.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
{
"experiments": [
{
"name": "eo_lm_hu_400_kp_06",
"models": [
"lstm_fast"
],
"learning_technique": "normal",
"hyperparameters": {
"shared_params": {
"create_model": "lstm_fast",
"data": {
"save_path": "results"
},
"train": {
"summary_steps": 100,
"save_checkpoint_steps": 200,
"keep_checkpoint_max": 5,
"multitask": {
"num_multitask_epochs": 1,
"switch_each_epoch": true,
"switch_each_batch": true
},
"early_stopping": {
"threshold": 0.001,
"max_steps_without_improvement": 10000
}
},
"arch": {
"sequence_length": 20,
"num_hidden_layers": 2,
"hidden_layer_size": 400,
"keep_prob": 0.6,
"vocab_size_language_model": 10000,
"vocab_size_pos": 37,
"vocab_size_generated": 3
}
},
"lstm_fast": {
"data": {
"pre_train": false,
"num_shifts_x": 1,
"data_path": "rnnlm/data",
"train_raw_data_file": "train",
"valid_raw_data_file": "valid",
"test_raw_data_file": "test",
"vocab_path_features": "wordlist.rnn.final",
"vocab_path_labels": "wordlist.rnn.final",
"vocab_size_features": 10000,
"vocab_size_labels": 10000,
"shape_size_features": 20,
"shape_size_labels": 20,
"tf_records_path": "tfrecords",
"tf_record_train_file": "train_extreme_overlap.tfrecord",
"tf_record_valid_file": "valid_extreme_overlap.tfrecord",
"tf_record_test_file": "test_extreme_overlap.tfrecord",
"shuffle": false,
"shuffle_buffer_size": 10000
},
"train": {
"w_init_scale": 0.1,
"max_grad_norm": 5,
"learning_rate": {
"type": "decay",
"start_value": 1.0,
"decay": 0.8,
"decay_max_factor": 4
},
"batch_size": 64,
"num_epochs": 20,
"epoch_size_train": 12920,
"epoch_size_valid": 1300,
"epoch_size_test": 1560
}
}
}
},
{
"name": "warn_baseline_multitask_unlearn_lm",
"models": [
"unlearn_gen",
"lstm_fast"
],
"learning_technique": "multitask",
"hyperparameters": {
"shared_params": {
"create_model": "lstm_fast",
"data": {
"save_path": "results"
},
"train": {
"summary_steps": 100,
"save_checkpoint_steps": 200,
"keep_checkpoint_max": 5,
"multitask": {
"num_multitask_epochs": 20,
"switch_each_epoch": true,
"switch_each_batch": false
},
"early_stopping": {
"threshold": 0.001,
"max_steps_without_improvement": 10000
},
"start_from_experiment": "eo_lm_hu_400_kp_06"
},
"arch": {
"sequence_length": 20,
"num_hidden_layers": 2,
"hidden_layer_size": 400,
"keep_prob": 0.6,
"vocab_size_language_model": 10000,
"vocab_size_pos": 37,
"vocab_size_generated": 3
}
},
"lstm_fast": {
"data": {
"pre_train": false,
"data_path": "rnnlm/data",
"train_raw_data_file": "train",
"valid_raw_data_file": "valid",
"test_raw_data_file": "test",
"vocab_path_features": "wordlist.rnn.final",
"vocab_path_labels": "wordlist.rnn.final",
"vocab_size_features": 10000,
"vocab_size_labels": 10000,
"shape_size_features": 20,
"shape_size_labels": 20,
"tf_records_path": "tfrecords",
"tf_record_train_file": "train_extreme_overlap.tfrecord",
"tf_record_valid_file": "valid_extreme_overlap.tfrecord",
"tf_record_test_file": "test_extreme_overlap.tfrecord",
"shuffle": false,
"shuffle_buffer_size": 10000
},
"train": {
"w_init_scale": 0.1,
"max_grad_norm": 5,
"learning_rate": {
"type": "decay",
"start_value": 1.0,
"decay": 0.8,
"decay_max_factor": 10
},
"batch_size": 64,
"num_epochs": 20,
"epoch_size_train": 12920,
"epoch_size_valid": 1300,
"epoch_size_test": 1560
}
},
"unlearn_gen": {
"data": {
"pre_train": false,
"data_path": "rnnlm/data",
"train_raw_data_file": "train",
"valid_raw_data_file": "valid",
"test_raw_data_file": "test",
"train_generated_data_file": "rnnlm/data/generated_train",
"valid_generated_data_file": "rnnlm/data/generated_valid",
"test_generated_data_file": "rnnlm/data/generated_test",
"vocab_path_features": "wordlist.rnn.final",
"vocab_path_labels": "generated_tags",
"vocab_size_features": 10000,
"vocab_size_labels": 3,
"shape_size_features": 20,
"shape_size_labels": 1,
"tf_records_path": "tfrecords",
"tf_record_train_file": "train_gen.tfrecord",
"tf_record_valid_file": "valid_gen.tfrecord",
"tf_record_test_file": "test_gen.tfrecord",
"shuffle": false,
"shuffle_buffer_size": 10000
},
"train": {
"w_init_scale": 0.1,
"max_grad_norm": 5,
"learning_rate": {
"type": "decay",
"start_value": 1.0,
"decay": 0.9,
"decay_max_factor": 10
},
"batch_size": 64,
"num_epochs": 20,
"epoch_size_train": 1291,
"epoch_size_valid": 131,
"epoch_size_test": 163
}
}
}
}
]
}