-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathexperiments.py
166 lines (138 loc) · 7.14 KB
/
experiments.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
import os
import argparse
import logging
import numpy as np
import torch
import matplotlib.pyplot as plt
from sklearn.model_selection import KFold
from mllp.utils import read_csv, DBEncoder
from mllp.models import MLLP
# Directory that holds the `<data_set>.data` and `<data_set>.info` files.
DATA_DIR = 'dataset'

# Run on the first CUDA GPU when one is available, otherwise on the CPU.
if torch.cuda.is_available():
    device = torch.device('cuda:0')
else:
    device = torch.device('cpu')
def plot_loss(args, loss_log, accuracy, accuracy_b, f1_score, f1_score_b):
    """Plot the training curves and save the figure to ``args.plot_file``.

    Three stacked panels are drawn: the total loss, the accuracy of the MLLP
    and CRS models, and the F1 score of the MLLP and CRS models.

    Args:
        args: Parsed command-line namespace. Reads ``use_validation_set``
            (chooses "validation" or "training" in the panel titles),
            ``data_set`` (figure title) and ``plot_file`` (output path).
        loss_log: Sequence of loss values, drawn in the first panel.
        accuracy: Sequence of accuracy values of the MLLP model.
        accuracy_b: Sequence of accuracy values of the CRS model.
        f1_score: Sequence of F1 scores of the MLLP model.
        f1_score_b: Sequence of F1 scores of the CRS model.
    """
    set_name = 'validation' if args.use_validation_set else 'training'

    fig = plt.figure(figsize=(16, 16))
    try:
        fig.suptitle('Dataset: {}'.format(args.data_set), fontsize=16)

        # Panel 1: total training loss.
        plt.subplot(3, 1, 1)
        plt.plot(np.array(loss_log), color='b', label='Total loss')
        plt.xlabel('epoch')
        plt.ylabel('loss')
        plt.title('Loss during the training')
        plt.grid(True)
        plt.legend()

        # Panel 2: accuracy of both models.
        plt.subplot(3, 1, 2)
        plt.plot(np.array(accuracy), color='b', label='MLLP')
        plt.plot(np.array(accuracy_b), color='g', label='CRS')
        plt.xlabel('epoch * 5')
        plt.ylabel('Accuracy')
        plt.title('Accuracy on the {} set'.format(set_name))
        plt.grid(True)
        plt.legend()

        # Panel 3: F1 score of both models.
        plt.subplot(3, 1, 3)
        plt.plot(np.array(f1_score), color='b', label='MLLP')
        plt.plot(np.array(f1_score_b), color='g', label='CRS')
        plt.xlabel('epoch * 5')
        # The y-label used to read "Micro" while the title read "(Macro)";
        # both now agree with the title.
        # NOTE(review): the averaging mode is chosen inside MLLP.train -
        # confirm that it really is macro averaging.
        plt.ylabel('F1 Score (Macro)')
        plt.title('F1 Score (Macro) on the {} set'.format(set_name))
        plt.grid(True)
        plt.legend()

        plt.savefig(args.plot_file)
    finally:
        # pyplot keeps every figure registered until it is closed explicitly;
        # release it even when plotting or saving fails.
        plt.close(fig)
def experiment(args):
    """Train an MLLP on one cross-validation fold, test it and export the results.

    The data set named by ``args.data_set`` is read from ``DATA_DIR``, split
    with K-Fold, encoded with ``DBEncoder`` and used to train an ``MLLP``.
    Afterwards the training curves are plotted, the test metrics are logged,
    the concept rule set is written to ``args.crs_file`` and the model weights
    are saved to ``args.model``.

    Args:
        args: Parsed command-line namespace. Reads ``data_set``, ``kfold``,
            ``ith_kfold``, ``use_validation_set``, ``structure``,
            ``random_binarization_rate``, ``use_not``, ``log``,
            ``learning_rate``, ``batch_size``, ``epoch``, ``lr_decay_rate``,
            ``lr_decay_epoch``, ``weight_decay``, ``plot_file``, ``crs_file``
            and ``model``.

    Raises:
        ValueError: If ``args.ith_kfold`` is outside ``[0, args.kfold)``.
    """
    # Fail fast, before any data is loaded. Without this check a negative
    # index would silently select a fold counted from the end, and a too-large
    # one would only surface later as a bare IndexError.
    if not 0 <= args.ith_kfold < args.kfold:
        raise ValueError(
            'ith_kfold must satisfy 0 <= ith_kfold < kfold, got ith_kfold={} with kfold={}'.format(
                args.ith_kfold, args.kfold))

    dataset = args.data_set
    data_path = os.path.join(DATA_DIR, dataset + '.data')
    info_path = os.path.join(DATA_DIR, dataset + '.info')
    # The fourth value returned by read_csv is not needed here.
    X_df, y_df, f_df, _ = read_csv(data_path, info_path, shuffle=True)

    # Pick the requested train/test split; random_state=0 keeps the folds
    # identical across runs.
    kf = KFold(n_splits=args.kfold, shuffle=True, random_state=0)
    train_index, test_index = list(kf.split(X_df))[args.ith_kfold]
    X_train_df = X_df.iloc[train_index]
    y_train_df = y_df.iloc[train_index]
    X_test_df = X_df.iloc[test_index]
    y_test_df = y_df.iloc[test_index]

    logging.info('Discretizing and binarizing data. Please wait ...')
    db_enc = DBEncoder(f_df, discrete=True)
    # The encoder is fitted on the complete data set, not only on the
    # training part, and then applied to each split.
    db_enc.fit(X_df, y_df)
    X_fname = db_enc.X_fname
    y_fname = db_enc.y_fname
    X_train, y_train = db_enc.transform(X_train_df, y_train_df)
    X_test, y_test = db_enc.transform(X_test_df, y_test_df)
    logging.info('Data discretization and binarization are done.')

    if args.use_validation_set:
        # Use 20% of the training set as the validation set.
        kf = KFold(n_splits=5, shuffle=True, random_state=0)
        train_index, validation_index = next(kf.split(X_train))
        X_validation = X_train[validation_index]
        y_validation = y_train[validation_index]
        X_train = X_train[train_index]
        y_train = y_train[train_index]
    else:
        X_validation = None
        y_validation = None

    # Layer sizes: encoded input features, the middle layers given on the
    # command line ("64_32_16" -> [64, 32, 16]), and the encoded labels.
    net_structure = [len(X_fname)] + list(map(int, args.structure.split('_'))) + [len(y_fname)]
    net = MLLP(net_structure,
               device=device,
               random_binarization_rate=args.random_binarization_rate,
               use_not=args.use_not,
               log_file=args.log)
    net.to(device)

    loss_log, accuracy, accuracy_b, f1_score, f1_score_b = net.train(
        X_train,
        y_train,
        X_validation=X_validation,
        y_validation=y_validation,
        lr=args.learning_rate,
        batch_size=args.batch_size,
        epoch=args.epoch,
        lr_decay_rate=args.lr_decay_rate,
        lr_decay_epoch=args.lr_decay_epoch,
        weight_decay=args.weight_decay)
    plot_loss(args, loss_log, accuracy, accuracy_b, f1_score, f1_score_b)

    acc, acc_b, f1, f1_b = net.test(X_test, y_test, need_transform=True)
    logging.info('=' * 60)
    logging.info('Test:\n\tAccuracy of MLLP Model: {}\n\tAccuracy of CRS Model: {}'.format(acc, acc_b))
    logging.info('Test:\n\tF1 Score of MLLP Model: {}\n\tF1 Score of CRS Model: {}'.format(f1, f1_b))
    logging.info('=' * 60)

    # Export the extracted rule set and the trained weights.
    with open(args.crs_file, 'w') as f:
        net.concept_rule_set_print(X_train, X_fname, y_fname, f)
    torch.save(net.state_dict(), args.model)
if __name__ == '__main__':
    # Command-line entry point: parse the hyper-parameters, prepare a
    # dedicated output folder for this run, configure logging and start the
    # experiment.
    parser = argparse.ArgumentParser(formatter_class=argparse.ArgumentDefaultsHelpFormatter)
    parser.add_argument('-d', '--data_set', type=str, default='tic-tac-toe',
                        help='Set the data set for training. All the data sets in the dataset folder are available.')
    parser.add_argument('-k', '--kfold', type=int, default=5, help='Set the k of K-Folds cross-validation.')
    parser.add_argument('-ki', '--ith_kfold', type=int, default=0, help='Do the i-th validation, 0 <= ki < k.')
    parser.add_argument('--use_validation_set', action="store_true",
                        help='Use the validation set for parameters tuning.')
    parser.add_argument('-e', '--epoch', type=int, default=401, help='Set the total epoch.')
    parser.add_argument('-bs', '--batch_size', type=int, default=64, help='Set the batch size.')
    parser.add_argument('-lr', '--learning_rate', type=float, default=0.01, help='Set the initial learning rate.')
    parser.add_argument('-lrdr', '--lr_decay_rate', type=float, default=0.75, help='Set the learning rate decay rate.')
    parser.add_argument('-lrde', '--lr_decay_epoch', type=int, default=100, help='Set the learning rate decay epoch.')
    parser.add_argument('-wd', '--weight_decay', type=float, default=0.0, help='Set the weight decay (L2 penalty).')
    parser.add_argument('-p', '--random_binarization_rate', type=float, default=0.0,
                        help='Set the rate of random binarization. It is important for CRS extractions from deep MLLPs.')
    parser.add_argument('--use_not', action="store_true",
                        help='Use the NOT (~) operator in logical rules. '
                             'It will enhance model capability but make the CRS more complex.')
    parser.add_argument('-s', '--structure', type=str, default='64',
                        help='Set the structure of network. Only the number of nodes in middle layers are needed. '
                             'E.g., 64, 64_32_16. The total number of middle layers should be odd.')
    args = parser.parse_args()

    # Each run writes into its own folder whose name encodes the
    # hyper-parameters, followed by the network structure.
    args.folder_name = '{}_k{}_ki{}_useValidationSet{}_e{}_bs{}_lr{}_lrdr{}_lrde{}_wd{}_p{}_useNOT{}'.format(
        args.data_set, args.kfold, args.ith_kfold, args.use_validation_set, args.epoch, args.batch_size,
        args.learning_rate, args.lr_decay_rate, args.lr_decay_epoch, args.weight_decay,
        args.random_binarization_rate, args.use_not) + '_L' + args.structure
    args.folder_path = os.path.join('log_folder', args.folder_name)
    # makedirs creates 'log_folder' and the run folder in one call and, with
    # exist_ok=True, does not fail when they already exist (no check-then-create race).
    os.makedirs(args.folder_path, exist_ok=True)

    # Output files of this run.
    args.model = os.path.join(args.folder_path, 'model.pth')
    args.crs_file = os.path.join(args.folder_path, 'crs.txt')
    args.plot_file = os.path.join(args.folder_path, 'plot_file.pdf')
    args.log = os.path.join(args.folder_path, 'log.txt')
    # filemode='w' starts a fresh log file on every run.
    logging.basicConfig(level=logging.INFO, filename=args.log, filemode='w', format='[%(levelname)s] - %(message)s')

    experiment(args)