-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathunit_test.py
executable file
·109 lines (83 loc) · 2.71 KB
/
unit_test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
import math
import torch
import pickle
import itertools
import numpy as np
from tqdm import tqdm
from util.kernel import sanitise, increment_kernel, complexity, invert_bound
from util.data import get_data, normalize_data
from util.trainer import SimpleNet
## Check compositional kernel
a = torch.ones(5,5) * 0.4
b = increment_kernel(a)
print(b) # should be 0.5441
a = torch.zeros(5,5)
b = increment_kernel(a)
print(b) # should be 0.3183
print()
## Check kernel complexity on identity matrix
n = 100
sigma = torch.eye(n)
c = torch.randn(n).sign()
print( complexity(sigma, c, 10000) ) # should be n*ln(2), 7n/10
print()
## Check kernel complexity via non-cholesky approach
n = 10
rand = torch.randn(n, n)
sigma = torch.mm(rand, rand.t()) + torch.eye(n)
sigma = 0.5*(sigma + sigma.t())
assert ( sigma == sigma.t() ).all()
c = torch.randn(n).sign()
det = torch.det(sigma)
inv = torch.inverse(sigma)
tr = torch.trace(inv)
comp_1 = n/5.0 + det ** (1/n) * ( (0.5-1/math.pi)*tr + 1/math.pi*torch.dot(c, torch.matmul(inv, c)) )
comp_1 = comp_1.item()
num_samples = 10**6
ide = torch.eye(n)
estimate = 0
print("running non-parallelised estimation")
for _ in tqdm(range(num_samples)):
z = torch.randn(n).abs()
estimate += math.exp( -0.5 * torch.dot(c*z, torch.matmul(det**(1/n)*inv - ide,c*z)) )
estimate /= num_samples
comp_0 = math.log(2**n / estimate)
print( ("Estimate", "Bound"))
print( "non-cholesky:")
print( (comp_0, comp_1) )
print( "cholesky:")
print( complexity(sigma, c, num_samples) )
print()
## Check kernel compared to random networks
depth = 3
width = 5000
num_train_examples = 5
num_networks = 10**3
_, _, train_loader, _ = get_data( num_train_examples=num_train_examples,
num_test_examples=None,
batch_size=num_train_examples,
random_labels=False,
binary_digits=False )
for data, target in train_loader:
data, target = normalize_data(data, target)
out_matrix = np.zeros((num_train_examples, num_networks))
with torch.no_grad():
print(f"Sampling {num_networks} random networks")
for network_idx in tqdm(range(num_networks)):
model = SimpleNet(depth, width)
for p in model.parameters():
p.data = torch.randn_like(p) / math.sqrt(p.shape[1])
pred = model(data).squeeze()
out_matrix[:, network_idx] = pred.numpy()
sample_mean = np.mean(out_matrix, axis=1)
sample_cov = np.cov(out_matrix)
print()
print("sample mean:\n", sample_mean)
print("sample cov:\n", sample_cov)
sigma = sanitise(torch.mm(data, data.t()) / data.shape[1])
for _ in range(depth-1):
sigma = increment_kernel(sigma)
sigma = sigma.numpy()
diff = np.absolute(sigma - sample_cov).max()
print("analytical cov:\n", sigma)
print("max difference: ", diff)