forked from shawntan/python-crf
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtest.py
168 lines (144 loc) · 4.44 KB
/
test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
import unittest
import numpy as np
import crf
from scipy import misc
from collections import defaultdict
from numpy import empty, zeros, ones, log, exp, sqrt, add, int32, abs
def argmax(X):
"""
Find the most likely assignment to labels given parameters using the
Viterbi algorithm.
"""
N,K,_ = X.shape
g0 = X[0,0]
g = X[1:]
B = ones((N,K), dtype=int32) * -1
# compute max-marginals and backtrace matrix
V = g0
for t in xrange(1,N):
U = empty(K)
for y in xrange(K):
w = V + g[t-1,:,y]
B[t,y] = b = w.argmax()
U[y] = w[b]
V = U
# extract the best path by brack-tracking
y = V.argmax()
trace = []
for t in reversed(xrange(N)):
trace.append(y)
y = B[t, y]
trace.reverse()
return trace
def forward(g0, g, N, K):
"""
Calculate matrix of forward unnormalized log-probabilities.
a[i,y] log of the sum of scores of all sequences from 0 to i where
the label at position i is y.
"""
a = np.zeros((N,K))
a[0,:] = g0
for t in xrange(1,N):
ayp = a[t-1,:]
for y in xrange(K):
a[t,y] = misc.logsumexp(ayp + g[t-1,:,y])
return a
def backward(g, N, K):
""" Calculate matrix of backward unnormalized log-probabilities. """
b = np.zeros((N,K))
for t in reversed(xrange(0,N-1)):
by = b[t+1,:]
for yp in xrange(K):
b[t,yp] = misc.logsumexp(by + g[t,yp,:])
return b
def expectation(N,K,log_M):
"""
Expectation of the sufficient statistics given ``x`` and current
parameter settings.
"""
g0 = log_M[0,0]
g = log_M[1:]
a = forward(g0,g,N,K)
b = backward(g,N,K)
print "Forward:"
print a
print "Backward:"
print b
# log-normalizing constant
logZ = misc.logsumexp(a[N-1,:])
E = defaultdict(float)
# The first factor needs to be special case'd
# E[ f( y_0 ) ] = p(y_0 | y_[1:N], x) * f(y_0)
c = exp(g0 + b[0,:] - logZ).clip(0.0, 1.0)
for y in xrange(K):
p = c[y]
if p < 1e-40: continue # skip really small updates.
for k in f[0, None, y]:
E[k] += p
for t in xrange(1,N):
# vectorized computation of the marginal for this transition factor
c = exp((add.outer(a[t-1,:], b[t,:]) + g[t-1,:,:] - logZ)).clip(0.0, 1.0)
for yp in xrange(K):
for y in xrange(K):
# we can also use the following to compute ``p`` but its quite
# a bit slower than the computation of vectorized quantity ``c``.
#p = exp(a[t-1,yp] + g[t-1,yp,y] + b[t,y] - logZ).clip(0.0, 1.0)
p = c[yp, y]
if p < 1e-40: continue # skip really small updates.
# expectation of this factor is p*f(t, yp, y)
for k in f[t, yp, y]:
E[k] += p
return E
class TestCRF(unittest.TestCase):
def setUp(self):
self.matrix = 0.001 + np.random.poisson(lam=1.5, size=(3,3)).astype(np.float)
self.vector = 0.001 + np.random.poisson(lam=1.5, size=(3,)).astype(np.float)
self.M = 0.001 + np.random.poisson(lam=1.5, size=(10,3,3)).astype(np.float)
labels = ['A','B','C']
obsrvs = ['a','b','c','d','e','f']
lbls = [crf.START] + labels + [crf.END]
transition_functions = [
lambda yp,y,x_v,i,_yp=_yp,_y=_y: 1 if yp==_yp and y==_y else 0
for _yp in lbls[:-1]
for _y in lbls[1:]]
observation_functions = [
lambda yp,y,x_v,i,_y=_y,_x=_x: 1 if i < len(x_v) and y==_y and x_v[i]==_x else 0
for _y in labels
for _x in obsrvs]
self.crf = crf.CRF( labels = labels,
feature_functions = transition_functions + observation_functions )
def test_log_dot_mv(self):
self.assertTrue(
(np.around(np.exp(
crf.log_dot_mv(
np.log(self.matrix),
np.log(self.vector)
)
),10) == np.around(np.dot(self.matrix,self.vector),10)).all()
)
def test_log_dot_vm(self):
self.assertTrue(
(np.around(np.exp(
crf.log_dot_vm(
np.log(self.vector),
np.log(self.matrix)
)
),10) == np.around(np.dot(self.vector,self.matrix),10)).all()
)
def test_forward(self):
M = self.M/self.M.sum(axis=2).reshape(self.M.shape[:-1]+(1,))
res = np.around(np.exp(self.crf.forward(np.log(M))[0]).sum(axis=1),10)
res_true = np.around(np.ones(M.shape[0]),10)
self.assertTrue((res == res_true).all())
def test_predict(self):
label_pred = self.crf.slow_predict(self.M,self.M.shape[0],self.M.shape[1])
label_act = argmax(self.M)
self.assertTrue(label_pred == label_act)
def test_integrated(self):
x_vec = ["a","b","c","d","e","f"]
y_vec = ["A","B","C","A","B","C"]
self.crf.train([x_vec],[y_vec])
l = lambda theta: crf.neg_likelihood_and_deriv(vectorised_x_vecs,vectorised_y_vecs,theta)
self.assertTrue(self.crf.predict(x_vec)==y_vec[1:-1])
if __name__ == '__main__':
unittest.main()