├── 10 Dimension Reduction
│   ├── ecoli.py
│   ├── factoranalysis.py
│   ├── floyd.py
│   ├── iris.py
│   ├── isomap.py
│   ├── kernelpca.py
│   ├── kpcademo.py
│   ├── lda.py
│   ├── lle.py
│   ├── pca.py
│   └── pcademo.py
├── 11 Optimisation
│   ├── CG.py
│   ├── LevenbergMarquardt.py
│   ├── LevenbergMarquardt_leastsq.py
│   ├── Newton.py
│   ├── TSP.py
│   └── steepest.py
├── 12 Evolutionary
│   ├── PBIL.py
│   ├── exhaustiveKnapsack.py
│   ├── fourpeaks.py
│   ├── ga.py
│   ├── greedyKnapsack.py
│   ├── knapsack.py
│   └── run_ga.py
├── 13 Reinforcement
│   ├── SARSA.py
│   ├── SARSA_cliff.py
│   ├── TDZero.py
│   └── TDZero_cliff.py
├── 14 MCMC
│   ├── BoxMuller.py
│   ├── Gibbs.py
│   ├── MH.py
│   ├── SIR.py
│   ├── importancesampling.py
│   ├── lcg.py
│   └── rejectionsampling.py
├── 15 Graphical Models
│   ├── Gibbs.py
│   ├── HMM.py
│   ├── Kalman.py
│   ├── MRF.py
│   ├── graphdemo.py
│   └── world.png
├── 2 Linear
│   ├── auto-mpg.py
│   ├── linreg.py
│   ├── linreg_logic_eg.py
│   ├── logic.py
│   ├── pcn.py
│   ├── pcn_logic_eg.py
│   └── pima.py
├── 3 MLP
│   ├── PNOz.py
│   ├── PNoz.dat
│   ├── iris.py
│   ├── iris_proc.data
│   ├── logic.py
│   ├── mlp.py
│   └── sinewave.py
├── 4 RBF
│   ├── iris.py
│   ├── least_squares.py
│   └── rbf.py
├── 6 Trees
│   ├── dtree.py
│   ├── party.data
│   └── party.py
├── 7 Committee
│   ├── bagging.py
│   ├── boost.py
│   ├── car.data
│   ├── car.py
│   ├── dtw.py
│   └── party.py
├── 8 Probability
│   ├── GMM.py
│   ├── gaussian.py
│   ├── kdtree.py
│   ├── knn.py
│   ├── knnSmoother.py
│   ├── plotGaussian.py
│   └── ruapehu.dat
└── 9 Unsupervised
    ├── iris.py
    ├── kmeans.py
    ├── kmeansnet.py
    ├── moredemos.py
    ├── shortecoli.data
    ├── som.py
    └── somdemo.py
--------------------------------------------------------------------------------
/10 Dimension Reduction/ecoli.py:
--------------------------------------------------------------------------------

# Code from Chapter 10 of Machine Learning: An Algorithmic Perspective
# by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html)

# You are free to use, change, or redistribute the code in any way you wish for
# non-commercial purposes, but please maintain the name of the original author.
# This code comes with no warranty of any kind.
8 | 9 | # Stephen Marsland, 2008 10 | 11 | # Simple example of LDA, PCA, and kernel PCA, on the Wine and e-coli datasets 12 | from pylab import * 13 | from numpy import * 14 | 15 | wine = loadtxt('../9 Unsupervised/wine.data',delimiter=',') 16 | 17 | labels = wine[:,0] 18 | data = wine[:,1:] 19 | data -= mean(data,axis=0) 20 | data /= data.max(axis=0) 21 | 22 | #ecoli = loadtxt('../9 Unsupervised/shortecoli.data') 23 | #labels = ecoli[:,7:] 24 | #data = ecoli[:,:7] 25 | #data -= mean(data,axis=0) 26 | #data /= data.max(axis=0) 27 | 28 | order = range(shape(data)[0]) 29 | random.shuffle(order) 30 | data = data[order] 31 | w0 = where(labels==1) 32 | w1 = where(labels==2) 33 | w2 = where(labels==3) 34 | 35 | import lda 36 | newData,w = lda.lda(data,labels,2) 37 | 38 | plot(data[w0,0],data[w0,1],'ok') 39 | plot(data[w1,0],data[w1,1],'^k') 40 | plot(data[w2,0],data[w2,1],'vk') 41 | axis([-1.5,1.8,-1.5,1.8]) 42 | axis('off') 43 | figure(2) 44 | plot(newData[w0,0],newData[w0,1],'ok') 45 | plot(newData[w1,0],newData[w1,1],'^k') 46 | plot(newData[w2,0],newData[w2,1],'vk') 47 | axis([-1.5,1.8,-1.5,1.8]) 48 | axis('off') 49 | 50 | import pca 51 | x,y,evals,evecs = pca.pca(data,2) 52 | figure(3) 53 | plot(y[w0,0],y[w0,1],'ok') 54 | plot(y[w1,0],y[w1,1],'^k') 55 | plot(y[w2,0],y[w2,1],'vk') 56 | axis('off') 57 | 58 | import kernelpca 59 | newData = kernelpca.kernelpca(data,'gaussian',2) 60 | figure(4) 61 | plot(newData[w0,0],newData[w0,1],'ok') 62 | plot(newData[w1,0],newData[w1,1],'^k') 63 | plot(newData[w2,0],newData[w2,1],'vk') 64 | axis('off') 65 | 66 | show() 67 | -------------------------------------------------------------------------------- /10 Dimension Reduction/factoranalysis.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 
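# A usage sketch for the factoranalysis() function defined below. The toy
# dataset and the choice of two latent factors here are illustrative
# assumptions, not part of the original demo at the bottom of this file:
#
#   data = random.normal(0,1,(200,3))
#   data[:,2] = data[:,0] + 0.1*random.normal(0,1,200)   # a nearly redundant dimension
#   newData = factoranalysis(data,2)
#   print shape(newData)                                 # -> (200, 2)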
8 | 9 | # Stephen Marsland, 2008 10 | 11 | # The Factor Analysis algorithm 12 | from pylab import * 13 | from numpy import * 14 | 15 | def factoranalysis(y,nRedDim): 16 | Ndata = shape(y)[0] 17 | N = shape(y)[1] 18 | 19 | y = y-y.mean(axis=0) 20 | C = cov(transpose(y)) 21 | Cd = C.diagonal() 22 | Psi = Cd 23 | scaling = linalg.det(C)**(1./N) 24 | 25 | W = random.normal(0,sqrt(scaling/nRedDim),(N,nRedDim)) 26 | 27 | nits = 1000 28 | oldL = -inf 29 | 30 | for i in range(nits): 31 | 32 | # E-step 33 | A = dot(W,transpose(W)) + diag(Psi) 34 | logA = log(abs(linalg.det(A))) 35 | A = linalg.inv(A) 36 | 37 | WA = dot(transpose(W),A) 38 | WAC = dot(WA,C) 39 | Exx = eye(nRedDim) - dot(WA,W) + dot(WAC,transpose(WA)) 40 | 41 | # M-step 42 | W = dot(transpose(WAC),linalg.inv(Exx)) 43 | Psi = Cd - (dot(W,WAC)).diagonal() 44 | #Sigma1 = (dot(transpose(y),y) - dot(W,WAC)).diagonal()/Ndata 45 | 46 | tAC = (A*transpose(C)).sum() 47 | 48 | L = -N/2*log(2.*pi) -0.5*logA - 0.5*tAC 49 | if (L-oldL)<(1e-4): 50 | print "Stop",i 51 | break 52 | print L 53 | oldL = L 54 | A = linalg.inv(dot(W,transpose(W))+diag(Psi)) 55 | Ex = dot(transpose(A),W) 56 | 57 | return dot(y,Ex) 58 | 59 | data = array([[0.1,0.1],[0.2,0.2],[0.3,0.3],[0.35,0.3],[0.4,0.4],[0.6,0.4],[0.7,0.45],[0.75,0.4],[0.8,0.35]]) 60 | newData = factoranalysis(data,2) 61 | plot(newData[:,0],newData[:,1],'.') 62 | show() 63 | -------------------------------------------------------------------------------- /10 Dimension Reduction/floyd.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | from numpy import * 12 | import time 13 | 14 | def floyd(): 15 | 16 | ndata = 100 17 | neighbours = zeros((ndata,10)) 18 | g = random.rand(ndata,ndata) 19 | for i in range(ndata): 20 | neighbours[i,:] = random.randint(0,100,10) 21 | 22 | t0 = time.time() 23 | print "Floyd's algorithm" 24 | for k in range(ndata): 25 | for i in range(ndata): 26 | for j in range(ndata): 27 | if g[i,j] > g[i,k] + g[k,j]: 28 | g[i,j] = g[i,k] + g[k,j] 29 | 30 | t1 = time.time() 31 | print "Complete" 32 | print t1-t0 33 | x = g.copy() 34 | 35 | t2 = time.time() 36 | q = g.copy() 37 | for i in range(ndata): 38 | for j in range(ndata): 39 | k = argmin(q[i,:]) 40 | while not(isnan(q[i,k])): 41 | q[i,k] = nan 42 | for l in neighbours[k,:]: 43 | possible = q[i,l] + q[l,k] 44 | if possible < q[i,k]: 45 | g[i,k] = possible 46 | k = argmin(q[i,:]) 47 | t3 = time.time() 48 | y = g 49 | print t3-t2 50 | return x,y 51 | -------------------------------------------------------------------------------- /10 Dimension Reduction/iris.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 
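# A quick standalone check of the all-pairs shortest path update used in
# floyd.py above; the 4-node graph is a made-up example:
from numpy import array, inf
g = array([[0.,1.,inf,10.],[1.,0.,2.,inf],[inf,2.,0.,3.],[10.,inf,3.,0.]])
for k in range(4):
    for i in range(4):
        for j in range(4):
            if g[i,j] > g[i,k] + g[k,j]:
                g[i,j] = g[i,k] + g[k,j]
print g[0,3]   # 6.0 -- the route 0-1-2-3 beats the direct edge of length 10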
8 | 9 | # Stephen Marsland, 2008 10 | 11 | # Various dimensionality reductions running on the Iris dataset 12 | from pylab import * 13 | from numpy import * 14 | 15 | iris = loadtxt('../3 MLP/iris_proc.data',delimiter=',') 16 | iris[:,:4] = iris[:,:4]-iris[:,:4].mean(axis=0) 17 | imax = concatenate((iris.max(axis=0)*ones((1,5)),iris.min(axis=0)*ones((1,5))),axis=0).max(axis=0) 18 | iris[:,:4] = iris[:,:4]/imax[:4] 19 | labels = iris[:,4] 20 | 21 | order = range(shape(iris)[0]) 22 | random.shuffle(order) 23 | iris = iris[order,:] 24 | labels = labels[order,:] 25 | 26 | w0 = where(labels==0) 27 | w1 = where(labels==1) 28 | w2 = where(labels==2) 29 | 30 | #import lda 31 | #newData,w = lda.lda(iris,labels,2) 32 | # 33 | #plot(iris[w0,0],iris[w0,1],'ok') 34 | #plot(iris[w1,0],iris[w1,1],'^k') 35 | #plot(iris[w2,0],iris[w2,1],'vk') 36 | #axis([-1.5,1.8,-1.5,1.8]) 37 | #axis('off') 38 | #figure(2) 39 | #plot(newData[w0,0],newData[w0,1],'ok') 40 | #plot(newData[w1,0],newData[w1,1],'^k') 41 | #plot(newData[w2,0],newData[w2,1],'vk') 42 | #axis([-1.5,1.8,-1.5,1.8]) 43 | #axis('off') 44 | # 45 | #import pca 46 | #x,y,evals,evecs = pca.pca(iris,2) 47 | #figure(3) 48 | #plot(y[w0,0],y[w0,1],'ok') 49 | #plot(y[w1,0],y[w1,1],'^k') 50 | #plot(y[w2,0],y[w2,1],'vk') 51 | #axis('off') 52 | 53 | #import kernelpca 54 | #newData = kernelpca.kernelpca(iris,'gaussian',2) 55 | #figure(4) 56 | #plot(newData[w0,0],newData[w0,1],'ok') 57 | #plot(newData[w1,0],newData[w1,1],'^k') 58 | #plot(newData[w2,0],newData[w2,1],'vk') 59 | #axis('off') 60 | 61 | #import factoranalysis 62 | #newData = factoranalysis.factoranalysis(iris,2) 63 | ##print newData 64 | ##figure(5) 65 | #plot(newData[w0,0],newData[w0,1],'ok') 66 | #plot(newData[w1,0],newData[w1,1],'^k') 67 | #plot(newData[w2,0],newData[w2,1],'vk') 68 | #axis('off') 69 | 70 | #import lle 71 | #print shape(iris) 72 | #a,b,newData = lle.lle(iris,2,12) 73 | #print shape(newData) 74 | #print newData[w0,:] 75 | #print "---" 76 | #print newData[w1,:] 77 | #print "---" 78 | #print newData[w2,:] 79 | # 80 | #plot(newData[w0,0],newData[w0,1],'ok') 81 | #plot(newData[w1,0],newData[w1,1],'^k') 82 | #plot(newData[w2,0],newData[w2,1],'vk') 83 | #axis('off') 84 | 85 | import isomap 86 | print labels 87 | newData,newLabels = isomap.isomap(iris,2,100) 88 | print shape(newData) 89 | print newLabels 90 | w0 = where(newLabels==0) 91 | w1 = where(newLabels==1) 92 | w2 = where(newLabels==2) 93 | plot(newData[w0,0],newData[w0,1],'ok') 94 | plot(newData[w1,0],newData[w1,1],'^k') 95 | plot(newData[w2,0],newData[w2,1],'vk') 96 | axis('off') 97 | 98 | show() 99 | -------------------------------------------------------------------------------- /10 Dimension Reduction/isomap.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | # The Isomap algorithm 12 | from pylab import * 13 | from numpy import * 14 | 15 | def swissroll(): 16 | # Make the swiss roll dataset 17 | N = 1000 18 | noise = 0.05 19 | 20 | t = 3.*math.pi/2 * (1. + 2.*random.rand(1,N)) 21 | h = 21. 
* random.rand(1,N) 22 | data = concatenate((t*cos(t),h,t*sin(t))) + noise*random.randn(3,N) 23 | return transpose(data), squeeze(t) 24 | 25 | def isomap(data,newdim=2,K=12,labels=None): 26 | 27 | ndata = shape(data)[0] 28 | ndim = shape(data)[1] 29 | d = zeros((ndata,ndata),dtype=float) 30 | 31 | # Compute the distance matrix 32 | # Inefficient -- not matrices 33 | for i in range(ndata): 34 | for j in range(i+1,ndata): 35 | for k in range(ndim): 36 | d[i,j] += (data[i,k] - data[j,k])**2 37 | d[i,j] = sqrt(d[i,j]) 38 | d[j,i] = d[i,j] 39 | 40 | # K-nearest neighbours 41 | indices = d.argsort() 42 | #notneighbours = indices[:,K+1:] 43 | neighbours = indices[:,:K+1] 44 | # Alternative: epsilon 45 | # epsilon = 0.1 46 | #neighbours = where(d<=epsilon) 47 | #notneighbours = where(d>epsilon) 48 | 49 | h = ones((ndata,ndata),dtype=float)*inf 50 | for i in range(ndata): 51 | h[i,neighbours[i,:]] = d[i,neighbours[i,:]] 52 | 53 | # Compute the full distance matrix over all paths 54 | print "Floyd's algorithm" 55 | for k in range(ndata): 56 | for i in range(ndata): 57 | for j in range(ndata): 58 | if h[i,j] > h[i,k] + h[k,j]: 59 | h[i,j] = h[i,k] + h[k,j] 60 | 61 | # print "Dijkstra's algorithm" 62 | # q = h.copy() 63 | # for i in range(ndata): 64 | # for j in range(ndata): 65 | # k = argmin(q[i,:]) 66 | # while not(isinf(q[i,k])): 67 | # q[i,k] = inf 68 | # for l in neighbours[k,:]: 69 | # possible = h[i,l] + h[l,k] 70 | # if possible < h[i,k]: 71 | # h[i,k] = possible 72 | # k = argmin(q[i,:]) 73 | # print "Complete" 74 | 75 | # remove lines full of infs 76 | x = isinf(h[:,0]).nonzero() 77 | if size(x)>0: 78 | print x 79 | if x[0][0]>0: 80 | new = h[0:x[0][0],:] 81 | newlabels = labels[0:x[0][0]] 82 | start = 1 83 | else: 84 | new = h[x[0][0]+1,:] 85 | newlabels = labels[x[0][0]+1] 86 | start = 2 87 | for i in range(start,size(x)): 88 | new = concatenate((new,h[x[0][i-1]+1:x[0][i],:]),axis=0) 89 | newlabels = concatenate((newlabels,labels[x[0][i-1]+1:x[0][i]]),axis=0) 90 | new = concatenate((new,h[x[0][i]+1:,:]),axis=0) 91 | newlabels = concatenate((newlabels,labels[x[0][i]+1:]),axis=0) 92 | 93 | new2 = new[:,0:x[0][0]] 94 | if x[0][0]>0: 95 | new2 = new[:,0:x[0][0]] 96 | start = 1 97 | else: 98 | new2 = new[:,x[0][0]+1] 99 | start = 2 100 | for i in range(start,size(x)): 101 | new2 = concatenate((new2,new[:,x[0][i-1]+1:x[0][i]]),axis=1) 102 | new2 = concatenate((new2,new[:,x[0][i]+1:]),axis=1) 103 | 104 | g = new2.copy() 105 | ndata = ndata - size(x) 106 | else: 107 | g = h.copy() 108 | newlabels = labels 109 | 110 | # Map computations, following by the dimensionality reduction 111 | M = -0.5*(g**2 - transpose(sum(g*g,axis=0) * ones((ndata,1))/ndata) - ones((ndata,1))* sum(g*g,axis=0)/ndata + sum(sum(g*g))/ndata**2) 112 | 113 | eval,evec = linalg.eig(M) 114 | eval = real(eval) 115 | ind = argsort(eval) 116 | eval = real(diag(eval[ind[-1::-1]])) 117 | evec = evec[:,ind[-1::-1]] 118 | y = real(dot(evec,transpose((sqrt(eval))))) 119 | print shape(y) 120 | print shape(eval), shape(evec) 121 | return y, newlabels 122 | 123 | data,t = swissroll() 124 | y,u = isomap(data) 125 | 126 | t -= t.min() 127 | t /= t.max() 128 | #scatter(y[:,0],y[:,1],c=t,cmap=cm.jet) 129 | scatter(y[:,1],y[:,2],s=50,c=t,cmap=cm.gray) 130 | #scatter(data[:,0],data[:,1],s=50,c=t,cmap=cm.gray) 131 | 132 | show() 133 | -------------------------------------------------------------------------------- /10 Dimension Reduction/kernelpca.py: -------------------------------------------------------------------------------- 1 | 2 | # Code 
from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | # The Kernel PCA algorithm 12 | 13 | from pylab import * 14 | from numpy import * 15 | 16 | def kernelmatrix(data,kernel,param=array([3,2])): 17 | 18 | if kernel=='linear': 19 | return dot(data,transpose(data)) 20 | elif kernel=='gaussian': 21 | K = zeros((shape(data)[0],shape(data)[0])) 22 | for i in range(shape(data)[0]): 23 | for j in range(i+1,shape(data)[0]): 24 | K[i,j] = sum((data[i,:]-data[j,:])**2) 25 | K[j,i] = K[i,j] 26 | return exp(-K**2/(2*param[0]**2)) 27 | elif kernel=='polynomial': 28 | return (dot(data,transpose(data))+param[0])**param[1] 29 | 30 | def kernelpca(data,kernel,redDim): 31 | 32 | nData = shape(data)[0] 33 | nDim = shape(data)[1] 34 | 35 | K = kernelmatrix(data,kernel) 36 | 37 | # Compute the transformed data 38 | D = sum(K,axis=0)/nData 39 | E = sum(D)/nData 40 | J = ones((nData,1))*D 41 | K = K - J - transpose(J) + E*ones((nData,nData)) 42 | 43 | # Perform the dimensionality reduction 44 | evals,evecs = linalg.eig(K) 45 | indices = argsort(evals) 46 | indices = indices[::-1] 47 | evecs = evecs[:,indices[:redDim]] 48 | evals = evals[indices[:redDim]] 49 | 50 | sqrtE = zeros((len(evals),len(evals))) 51 | for i in range(len(evals)): 52 | sqrtE[i,i] = sqrt(evals[i]) 53 | 54 | #print shape(sqrtE), shape(data) 55 | newData = transpose(dot(sqrtE,transpose(evecs))) 56 | 57 | return newData 58 | 59 | #data = array([[0.1,0.1],[0.2,0.2],[0.3,0.3],[0.35,0.3],[0.4,0.4],[0.6,0.4],[0.7,0.45],[0.75,0.4],[0.8,0.35]]) 60 | #newData = kernelpca(data,'gaussian',2) 61 | #plot(data[:,0],data[:,1],'o',newData[:,0],newData[:,0],'.') 62 | #show() 63 | -------------------------------------------------------------------------------- /10 Dimension Reduction/kpcademo.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 
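# The Gaussian kernel matrix construction used by kernelmatrix() in
# kernelpca.py above, written out for three hand-picked points (sigma=3
# matches the default param there; the points are illustrative):
from numpy import array, zeros, exp, sum
pts = array([[0.,0.],[1.,0.],[0.,2.]])
K = zeros((3,3))
for i in range(3):
    for j in range(i+1,3):
        K[i,j] = sum((pts[i,:]-pts[j,:])**2)
        K[j,i] = K[i,j]
K = exp(-K**2/(2*3.**2))   # same form as kernelpca.py: K holds squared distances
print K                    # symmetric, with ones on the diagonal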
8 | 9 | # Stephen Marsland, 2008 10 | 11 | # Demonstration of PCA and kernel PCA on the circular dataset 12 | from pylab import * 13 | from numpy import * 14 | 15 | import pca 16 | import kernelpca 17 | 18 | data = zeros((150,2)) 19 | 20 | theta = random.normal(0,pi,50) 21 | r = random.normal(0,0.1,50) 22 | data[0:50,0] = r*cos(theta) 23 | data[0:50,1] = r*sin(theta) 24 | 25 | theta = random.normal(0,pi,50) 26 | r = random.normal(2,0.1,50) 27 | data[50:100,0] = r*cos(theta) 28 | data[50:100,1] = r*sin(theta) 29 | 30 | theta = random.normal(0,pi,50) 31 | r = random.normal(5,0.1,50) 32 | data[100:150,0] = r*cos(theta) 33 | data[100:150,1] = r*sin(theta) 34 | 35 | figure() 36 | plot(data[:50,0],data[:50,1],'ok') 37 | plot(data[50:100,0],data[50:100,1],'^k') 38 | plot(data[100:150,0],data[100:150,1],'vk') 39 | title('Original dataset') 40 | 41 | x,y,evals,evecs = pca.pca(data,2) 42 | figure() 43 | plot(x[:50,0],x[:50,1],'ok') 44 | plot(x[50:100,0],x[50:100,1],'^k') 45 | plot(x[100:150,0],x[100:150,1],'vk') 46 | title('Reconstructed points after PCA') 47 | 48 | figure() 49 | y = kernelpca.kernelpca(data,'gaussian',2) 50 | plot(y[:50,0],y[:50,1],'ok') 51 | plot(y[50:100,0],y[50:100,1],'^k') 52 | plot(y[100:150,0],y[100:150,1],'vk') 53 | title('Reconstructed points after kernel PCA') 54 | 55 | show() 56 | -------------------------------------------------------------------------------- /10 Dimension Reduction/lda.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 
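# A usage sketch for lda() below, on two made-up Gaussian classes (the data
# and the one-dimensional projection are illustrative assumptions):
#
#   data = concatenate((random.normal(0,0.5,(20,2)),random.normal(2,0.5,(20,2))))
#   labels = concatenate((zeros(20),ones(20)))
#   newData,w = lda(data,labels,1)   # newData is 40x1, chosen to separate the classes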
8 | 9 | # Stephen Marsland, 2008 10 | 11 | # The LDA algorithm 12 | 13 | from pylab import * 14 | from numpy import * 15 | from scipy import linalg as la 16 | 17 | def lda(data,labels,redDim): 18 | 19 | # Centre data 20 | data -= data.mean(axis=0) 21 | nData = shape(data)[0] 22 | nDim = shape(data)[1] 23 | 24 | Sw = zeros((nDim,nDim)) 25 | Sb = zeros((nDim,nDim)) 26 | 27 | C = cov(transpose(data)) 28 | 29 | # Loop over classes 30 | classes = unique(labels) 31 | for i in range(len(classes)): 32 | # Find relevant datapoints 33 | indices = squeeze(where(labels==classes[i])) 34 | d = squeeze(data[indices,:]) 35 | classcov = cov(transpose(d)) 36 | Sw += float(shape(indices)[0])/nData * classcov 37 | 38 | Sb = C - Sw 39 | # Now solve for W 40 | # Compute eigenvalues, eigenvectors and sort into order 41 | #evals,evecs = linalg.eig(dot(linalg.pinv(Sw),sqrt(Sb))) 42 | evals,evecs = la.eig(Sw,Sb) 43 | indices = argsort(evals) 44 | indices = indices[::-1] 45 | evecs = evecs[:,indices] 46 | evals = evals[indices] 47 | w = evecs[:,:redDim] 48 | #print evals, w 49 | 50 | newData = dot(data,w) 51 | return newData,w 52 | 53 | #data = array([[0.1,0.1],[0.2,0.2],[0.3,0.3],[0.35,0.3],[0.4,0.4],[0.6,0.4],[0.7,0.45],[0.75,0.4],[0.8,0.35]]) 54 | #labels = array([0,0,0,0,0,1,1,1,1]) 55 | #newData,w = lda(data,labels,2) 56 | #print w 57 | #plot(data[:,0],data[:,1],'o',newData[:,0],newData[:,0],'.') 58 | #show() 59 | -------------------------------------------------------------------------------- /10 Dimension Reduction/lle.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 
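# The heart of lda.py above is a generalized eigenproblem A v = lambda B v,
# solved by scipy's two-argument eig. A standalone check on a tiny made-up
# pair of matrices:
from numpy import array, dot, real, allclose
from scipy import linalg as la
A = array([[2.,0.],[0.,1.]])
B = array([[1.,0.],[0.,2.]])
evals,evecs = la.eig(A,B)            # solves A v = lambda B v
v = evecs[:,0]
print allclose(dot(A,v),real(evals[0])*dot(B,v))   # True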
8 | 9 | # Stephen Marsland, 2008 10 | 11 | # The Locally Linear Embedding algorithm, and the swissroll example 12 | from pylab import * 13 | from numpy import * 14 | 15 | def swissroll(): 16 | # Make the swiss roll dataset 17 | N = 1000 18 | noise = 0.05 19 | 20 | t = 3*math.pi/2 * (1 + 2*random.rand(1,N)) 21 | h = 21 * random.rand(1,N) 22 | data = concatenate((t*cos(t),h,t*sin(t))) + noise*random.randn(3,N) 23 | return transpose(data), squeeze(t) 24 | 25 | def lle(data,nRedDim=2,K=12): 26 | 27 | ndata = shape(data)[0] 28 | ndim = shape(data)[1] 29 | d = zeros((ndata,ndata),dtype=float) 30 | 31 | # Inefficient -- not matrices 32 | for i in range(ndata): 33 | for j in range(i+1,ndata): 34 | for k in range(ndim): 35 | d[i,j] += (data[i,k] - data[j,k])**2 36 | d[i,j] = sqrt(d[i,j]) 37 | d[j,i] = d[i,j] 38 | 39 | indices = d.argsort(axis=1) 40 | neighbours = indices[:,1:K+1] 41 | 42 | W = zeros((K,ndata),dtype=float) 43 | 44 | for i in range(ndata): 45 | Z = data[neighbours[i,:],:] - kron(ones((K,1)),data[i,:]) 46 | C = dot(Z,transpose(Z)) 47 | C = C+identity(K)*1e-3*trace(C) 48 | W[:,i] = transpose(linalg.solve(C,ones((K,1)))) 49 | W[:,i] = W[:,i]/sum(W[:,i]) 50 | 51 | M = eye(ndata,dtype=float) 52 | for i in range(ndata): 53 | w = transpose(ones((1,shape(W)[0]))*transpose(W[:,i])) 54 | j = neighbours[i,:] 55 | #print shape(w), shape(dot(w,transpose(w))), shape(M[i,j]) 56 | ww = dot(w,transpose(w)) 57 | for k in range(K): 58 | M[i,j[k]] -= w[k] 59 | M[j[k],i] -= w[k] 60 | for l in range(K): 61 | M[j[k],j[l]] += ww[k,l] 62 | 63 | evals,evecs = linalg.eig(M) 64 | ind = argsort(evals) 65 | y = evecs[:,ind[1:nRedDim+1]]*sqrt(ndata) 66 | return evals,evecs,y 67 | 68 | data,t = swissroll() 69 | evals,evecs,y = lle(data) 70 | 71 | t -= t.min() 72 | t /= t.max() 73 | scatter(y[:,0],y[:,1],s=50,c=t,cmap=cm.gray) 74 | axis('off') 75 | show() 76 | -------------------------------------------------------------------------------- /10 Dimension Reduction/pca.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | # An algorithm to compute PCA. 
Not as fast as the NumPy implementation 12 | from pylab import * 13 | from numpy import * 14 | 15 | def pca(data,nRedDim=0,normalise=1): 16 | 17 | # Centre data 18 | m = mean(data,axis=0) 19 | data -= m 20 | 21 | # Covariance matrix 22 | C = cov(transpose(data)) 23 | 24 | # Compute eigenvalues and sort into descending order 25 | evals,evecs = linalg.eig(C) 26 | indices = argsort(evals) 27 | indices = indices[::-1] 28 | evecs = evecs[:,indices] 29 | evals = evals[indices] 30 | 31 | if nRedDim>0: 32 | evecs = evecs[:,:nRedDim] 33 | 34 | if normalise: 35 | for i in range(shape(evecs)[1]): 36 | evecs[:,i] / linalg.norm(evecs[:,i]) * sqrt(evals[i]) 37 | 38 | # Produce the new data matrix 39 | x = dot(transpose(evecs),transpose(data)) 40 | # Compute the original data again 41 | y=transpose(dot(evecs,x))+m 42 | return x,y,evals,evecs 43 | 44 | -------------------------------------------------------------------------------- /10 Dimension Reduction/pcademo.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 10 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | # A simple example of PCA 12 | from pylab import * 13 | from numpy import * 14 | 15 | import pca 16 | 17 | x = random.normal(5,.5,1000) 18 | y = random.normal(3,1,1000) 19 | a = x*cos(pi/4) + y*sin(pi/4) 20 | b = -x*sin(pi/4) + y*cos(pi/4) 21 | 22 | plot(a,b,'.') 23 | xlabel('x') 24 | ylabel('y') 25 | title('Original dataset') 26 | data = zeros((1000,2)) 27 | data[:,0] = a 28 | data[:,1] = b 29 | 30 | x,y,evals,evecs = pca.pca(data,1) 31 | print y 32 | figure() 33 | plot(y[:,0],y[:,1],'.') 34 | xlabel('x') 35 | ylabel('y') 36 | title('Reconstructed data after PCA') 37 | show() 38 | -------------------------------------------------------------------------------- /11 Optimisation/CG.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 11 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 
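# As the comment in pca.py above notes, the eigendecomposition route is not
# the fastest; an SVD of the centred data gives the same principal components.
# A standalone check of the equivalence (random data, illustrative only):
from numpy import random, mean, cov, transpose, linalg, sort
data = random.normal(0,1,(50,3))
data = data - mean(data,axis=0)
evals,evecs = linalg.eig(cov(transpose(data)))
u,s,vt = linalg.svd(data,full_matrices=False)
# eigenvalues of the covariance are the squared singular values over N-1
print sort(s**2/49.) - sort(evals.real)   # ~zero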
# Stephen Marsland, 2008

# The conjugate gradients algorithm
from numpy import *

def Jacobian(x):
    #return array([.4*x[0],2*x[1]])
    return array([x[0], 0.4*x[1], 1.2*x[2]])

def Hessian(x):
    #return array([[.2,0],[0,1]])
    return array([[1,0,0],[0,0.4,0],[0,0,1.2]])

def CG(x0):

    i=0
    k=0

    r = -Jacobian(x0)
    p=r

    betaTop = dot(r.transpose(),r)
    beta0 = betaTop

    iMax = 3
    epsilon = 10**(-2)
    jMax = 5

    # Restart every nDim iterations
    nRestart = shape(x0)[0]
    x = x0

    while i < iMax and betaTop > epsilon**2*beta0:
        j=0
        dp = dot(p.transpose(),p)
        alpha = (epsilon+1)**2
        # Newton-Raphson iteration
        while j < jMax and alpha**2 * dp > epsilon**2:
            # Line search
            alpha = -dot(Jacobian(x).transpose(),p) / (dot(p.transpose(),dot(Hessian(x),p)))
            print "N-R",x, alpha, p
            x = x + alpha * p
            j += 1
        print x
        # Now construct beta
        r = -Jacobian(x)
        print "r: ", r
        betaBottom = betaTop
        betaTop = dot(r.transpose(),r)
        beta = betaTop/betaBottom
        print "Beta: ",beta
        # Update the estimate
        p = r + beta*p
        print "p: ",p
        print "----"
        k += 1

        if k==nRestart or dot(r.transpose(),p) <= 0:
            p = r
            k = 0
            print "Restarting"
        i +=1

    print x

x0 = array([-2,2,-2])
CG(x0)
--------------------------------------------------------------------------------
/11 Optimisation/LevenbergMarquardt.py:
--------------------------------------------------------------------------------

# Code from Chapter 11 of Machine Learning: An Algorithmic Perspective
# by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html)

# You are free to use, change, or redistribute the code in any way you wish for
# non-commercial purposes, but please maintain the name of the original author.
# This code comes with no warranty of any kind.

# Stephen Marsland, 2008

# The Levenberg Marquardt algorithm
from numpy import *

def function(p):
    r = array([10*(p[1]-p[0]**2),(1-p[0])])
    fp = dot(transpose(r),r) #= 100*(p[1]-p[0]**2)**2 + (1-p[0])**2
    J = (array([[-20*p[0],10],[-1,0]]))
    grad = dot(transpose(J),transpose(r))
    return fp,r,grad,J

def lm(p0,tol=10**(-5),maxits=100):

    nvars=shape(p0)[0]
    nu=0.01
    p = p0
    fp,r,grad,J = function(p)
    e = sum(dot(transpose(r),r))
    nits = 0
    while nits<maxits and e>tol:
        nits += 1
        fp,r,grad,J = function(p)
        H=dot(transpose(J),J) + nu*eye(nvars)

        pnew = zeros(shape(p))
        nits2 = 0
        while (p!=pnew).all() and nits2<maxits:
            nits2 += 1
            # Compute the Levenberg-Marquardt step and evaluate the new estimate
            dp = squeeze(linalg.solve(H,grad))
            pnew = p - dp
            fpnew,rnew,gradnew,Jnew = function(pnew)
            enew = sum(dot(transpose(rnew),rnew))
            # Gain ratio: actual error reduction over the reduction the model predicts
            rho = (e - enew) / (0.5*sum(dp*(nu*dp + squeeze(grad))) + 1e-10)

        if rho>0:
            update = 1
            p = pnew
            e = enew
            if rho>0.25:
                nu=nu/10
        else:
            nu=nu*10
            update = 0
        print fp, p, e, linalg.norm(grad), nu

p0 = array([-1.92,2])
lm(p0)
--------------------------------------------------------------------------------
/11 Optimisation/LevenbergMarquardt_leastsq.py:
--------------------------------------------------------------------------------

# Code from Chapter 11 of Machine Learning: An Algorithmic Perspective
# by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html)

# You are free to use, change, or redistribute the code in any way you wish for
# non-commercial purposes, but please maintain the name of the original author.
# This code comes with no warranty of any kind.

# Stephen Marsland, 2008

# The Levenberg Marquardt algorithm solving a least-squares problem

from pylab import *
from numpy import *

def function(p,x,ydata):
    fp = p[0]*cos(p[1]*x)+ p[1]*sin([p[0]*x])
    r = ydata - fp
    J = transpose([-cos(p[0]*x)-p[1]*cos(p[0]*x)*x, p[0] * sin(p[1]*x)*x-sin(p[0]*x)])
    grad = dot(transpose(J),transpose(r))
    return fp,r,grad,J

def lm(p0,x,f,tol=10**(-5),maxits=100):

    nvars=shape(p0)[0]
    nu=0.01
    p = p0
    fp,r,grad,J = function(p,x,f)
    e = sum(dot(transpose(r),r))
    nits = 0
    while nits<maxits and e>tol:
        nits += 1

        # Compute current Jacobian and approximate Hessian
        fp,r,grad,J = function(p,x,f)
        H=dot(transpose(J),J) + nu*eye(nvars)
        pnew = zeros(shape(p))
        nits2 = 0
        while (p!=pnew).all() and nits2<maxits:
            nits2 += 1
            # Compute the Levenberg-Marquardt step and evaluate the new estimate
            dp = squeeze(linalg.solve(H,grad))
            pnew = p - dp
            fpnew,rnew,gradnew,Jnew = function(pnew,x,f)
            enew = sum(dot(transpose(rnew),rnew))
            # Gain ratio: actual error reduction over the reduction the model predicts
            rho = (e - enew) / (0.5*sum(dp*(nu*dp + squeeze(grad))) + 1e-10)

        if rho>0:
            # Keep new estimate
            p = pnew
            e = enew
            if rho>0.25:
                # Make trust region larger (reduce nu)
                nu=nu/10
        else:
            # Make trust region smaller (increase nu)
            nu=nu*10
        print p, e, linalg.norm(grad), nu
    return p

p0 = array([100.5,102.5]) #[ 100.0001126   101.99969709] 1078.36915936 8.87386341319e-06 1e-10 (8 itns)
#p0 = array([101,101]) #[ 100.88860713  101.12607589] 631.488571159 9.36938417155e-06 1e-67

p = array([100,102])

x = arange(0,2*pi,0.1)
y = p[0]*cos(p[1]*x)+ p[1]*sin([p[0]*x]) + random.rand(len(x))
p = lm(p0,x,y)
y1 = p[0]*cos(p[1]*x)+ p[1]*sin([p[0]*x]) #+ random.rand(len(x))

plot(x,squeeze(y),'-')
plot(x,squeeze(y1),'r--')
legend(['Actual Data','Fitted Data'])
show()
--------------------------------------------------------------------------------
/11 Optimisation/Newton.py:
--------------------------------------------------------------------------------

# Code from Chapter 11 of Machine Learning: An Algorithmic Perspective
# by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html)

# You are free to use, change, or redistribute the code in any way you wish for
# non-commercial purposes, but please maintain the name of the original author.
# This code comes with no warranty of any kind.

# Stephen Marsland, 2008

# Gradient Descent using Newton's method
from numpy import *

def Jacobian(x):
    #return array([.4*x[0],2*x[1]])
    return array([x[0], 0.4*x[1], 1.2*x[2]])

def Hessian(x):
    #return array([[.2,0],[0,1]])
    return array([[1,0,0],[0,0.4,0],[0,0,1.2]])

def Newton(x0):

    i = 0
    iMax = 10
    x = x0
    Delta = 1
    alpha = 1

    while i<iMax and Delta>10**(-5):
        p = -dot(linalg.inv(Hessian(x)),Jacobian(x))
        xOld = x
        x = x + alpha*p
        Delta = sum((x-xOld)**2)
        i += 1
        print x

x0 = array([-2,2,-2])
Newton(x0)
--------------------------------------------------------------------------------
/11 Optimisation/TSP.py:
--------------------------------------------------------------------------------

# Code from Chapter 11 of Machine Learning: An Algorithmic Perspective
# by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html)

# You are free to use, change, or redistribute the code in any way you wish for
# non-commercial purposes, but please maintain the name of the original author.
# This code comes with no warranty of any kind.
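# A check of Newton.py above: for that quadratic cost the gradient is
# J(x) = H x with constant Hessian H, so one full Newton step lands exactly
# on the minimum: x - H^{-1} J(x) = x - x = 0.
from numpy import array, dot, linalg
x0 = array([-2.,2.,-2.])
J = array([x0[0],0.4*x0[1],1.2*x0[2]])     # Jacobian(x0) from Newton.py
H = array([[1,0,0],[0,0.4,0],[0,0,1.2]])   # Hessian from Newton.py
print x0 - dot(linalg.inv(H),J)            # [ 0.  0.  0.]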
# Stephen Marsland, 2008

# A demonstration of four methods of solving the Travelling Salesman Problem
from numpy import *

def makeTSP(nCities):
    positions = 2*random.rand(nCities,2)-1;
    distances = zeros((nCities,nCities))

    for i in range(nCities):
        for j in range(i+1,nCities):
            distances[i,j] = sqrt((positions[i,0] - positions[j,0])**2 + (positions[i,1] - positions[j,1])**2);
            distances[j,i] = distances[i,j];

    return distances

def exhaustive(distances):
    nCities = shape(distances)[0]

    cityOrder = arange(nCities)

    distanceTravelled = 0
    for i in range(nCities-1):
        distanceTravelled += distances[cityOrder[i],cityOrder[i+1]]
    distanceTravelled += distances[cityOrder[nCities-1],0]

    for newOrder in permutation(range(nCities)):
        possibleDistanceTravelled = 0
        for i in range(nCities-1):
            possibleDistanceTravelled += distances[newOrder[i],newOrder[i+1]]
        possibleDistanceTravelled += distances[newOrder[nCities-1],0]

        if possibleDistanceTravelled < distanceTravelled:
            distanceTravelled = possibleDistanceTravelled
            cityOrder = newOrder

    return cityOrder, distanceTravelled

def permutation(order):
    order = tuple(order)
    if len(order)==1:
        yield order
    else:
        for i in range(len(order)):
            rest = order[:i] + order[i+1:]
            move = (order[i],)
            for smaller in permutation(rest):
                yield move + smaller

def greedy(distances):
    nCities = shape(distances)[0]
    distanceTravelled = 0

    # Need a version of the matrix we can trash
    dist = distances.copy()

    # Integer entries, since cityOrder is used to index the distance matrix
    cityOrder = zeros(nCities,dtype=int)
    cityOrder[0] = random.randint(nCities)
    dist[:,cityOrder[0]] = Inf

    for i in range(nCities-1):
        cityOrder[i+1] = argmin(dist[cityOrder[i],:])
        distanceTravelled += dist[cityOrder[i],cityOrder[i+1]]
        # Now exclude the chance of travelling to that city again
        dist[:,cityOrder[i+1]] = Inf

    # Now return to the original city
    distanceTravelled += distances[cityOrder[nCities-1],0]

    return cityOrder, distanceTravelled

def hillClimbing(distances):

    nCities = shape(distances)[0]

    cityOrder = arange(nCities)
    random.shuffle(cityOrder)

    distanceTravelled = 0
    for i in range(nCities-1):
        distanceTravelled += distances[cityOrder[i],cityOrder[i+1]]
    distanceTravelled += distances[cityOrder[nCities-1],0]

    for i in range(1000):
        # Choose cities to swap
        city1 = random.randint(nCities)
        city2 = random.randint(nCities)

        if city1 != city2:
            # Reorder the set of cities
            possibleCityOrder = cityOrder.copy()
            possibleCityOrder = where(possibleCityOrder==city1,-1,possibleCityOrder)
            possibleCityOrder = where(possibleCityOrder==city2,city1,possibleCityOrder)
            possibleCityOrder = where(possibleCityOrder==-1,city2,possibleCityOrder)

            # Work out the new distances
            # This can be done more efficiently
            newDistanceTravelled = 0
            for j in range(nCities-1):
                newDistanceTravelled += distances[possibleCityOrder[j],possibleCityOrder[j+1]]
            # Close the candidate tour (not the current one)
            newDistanceTravelled += distances[possibleCityOrder[nCities-1],0]

            if newDistanceTravelled < distanceTravelled:
                distanceTravelled = newDistanceTravelled
                cityOrder = possibleCityOrder

    return cityOrder, distanceTravelled


def simulatedAnnealing(distances):
    nCities = shape(distances)[0]

    cityOrder = arange(nCities)
    random.shuffle(cityOrder)

    distanceTravelled = 0
    for i in range(nCities-1):
        distanceTravelled += distances[cityOrder[i],cityOrder[i+1]]
    distanceTravelled += distances[cityOrder[nCities-1],0]

    T = 500
    c = 0.8
    nTests = 10

    while T>1:
        for i in range(nTests):
            # Choose cities to swap
            city1 = random.randint(nCities)
            city2 = random.randint(nCities)

            if city1 != city2:
                # Reorder the set of cities
                possibleCityOrder = cityOrder.copy()
                possibleCityOrder = where(possibleCityOrder==city1,-1,possibleCityOrder)
                possibleCityOrder = where(possibleCityOrder==city2,city1,possibleCityOrder)
                possibleCityOrder = where(possibleCityOrder==-1,city2,possibleCityOrder)

                # Work out the new distances
                # This can be done more efficiently
                newDistanceTravelled = 0
                for j in range(nCities-1):
                    newDistanceTravelled += distances[possibleCityOrder[j],possibleCityOrder[j+1]]
                # Close the candidate tour (not the current one)
                newDistanceTravelled += distances[possibleCityOrder[nCities-1],0]

                # Accept a better tour always, a worse one with the Metropolis probability
                if newDistanceTravelled < distanceTravelled or (distanceTravelled - newDistanceTravelled) > T*log(random.rand()):
                    distanceTravelled = newDistanceTravelled
                    cityOrder = possibleCityOrder

        # Annealing schedule
        T = c*T

    return cityOrder, distanceTravelled

def runAll():
    import time

    nCities = 5
    distances = makeTSP(nCities)

    print "Exhaustive search"
    start = time.time()
    print exhaustive(distances)
    finish = time.time()
    print finish-start

    print "Greedy search"
    start = time.time()
    print greedy(distances)
    finish = time.time()
    print finish-start

    print "Hill Climbing"
    start = time.time()
    print hillClimbing(distances)
    finish = time.time()
    print finish-start

    print "Simulated Annealing"
    start = time.time()
    print simulatedAnnealing(distances)
    finish = time.time()
    print finish-start

runAll()
--------------------------------------------------------------------------------
/11 Optimisation/steepest.py:
--------------------------------------------------------------------------------

# Code from Chapter 11 of Machine Learning: An Algorithmic Perspective
# by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html)

# You are free to use, change, or redistribute the code in any way you wish for
# non-commercial purposes, but please maintain the name of the original author.
# This code comes with no warranty of any kind.
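# The simulated annealing acceptance step in TSP.py above follows the
# Metropolis rule: a move that worsens the tour by d > 0 is accepted with
# probability exp(-d/T). A standalone sketch with illustrative numbers:
from numpy import exp, random
T = 500.
d = 20.                          # cost increase of a candidate swap
accept = random.rand() < exp(-d/T)
print accept                     # True about 96% of the time here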
# Stephen Marsland, 2008

# Gradient Descent using steepest descent

from numpy import *

def Jacobian(x):
    #return array([.4*x[0],2*x[1]])
    return array([x[0], 0.4*x[1], 1.2*x[2]])

def steepest(x0):

    i = 0
    iMax = 10
    x = x0
    Delta = 1
    alpha = 1

    while i<iMax and Delta>10**(-5):
        p = -Jacobian(x)
        xOld = x
        x = x + alpha*p
        Delta = sum((x-xOld)**2)
        print x
        i += 1

x0 = array([-2,2,-2])
steepest(x0)
--------------------------------------------------------------------------------
/12 Evolutionary/PBIL.py:
--------------------------------------------------------------------------------

# Code from Chapter 12 of Machine Learning: An Algorithmic Perspective
# by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html)

# You are free to use, change, or redistribute the code in any way you wish for
# non-commercial purposes, but please maintain the name of the original author.
# This code comes with no warranty of any kind.

# Stephen Marsland, 2008

# The Population Based Incremental Learning algorithm
# Comment and uncomment fitness functions as appropriate (as an import and the fitnessFunction variable)

from pylab import *
from numpy import *
#import fourpeaks as fF
import knapsack as fF

def PBIL():
    ion()

    populationSize = 100
    stringLength = 20
    eta = 0.005

    #fitnessFunction = 'fF.fourpeaks'
    fitnessFunction = 'fF.knapsack'
    p = 0.5*ones(stringLength)
    best = zeros(501,dtype=float)

    for count in range(501):
        # Generate samples
        population = random.rand(populationSize,stringLength)
        for i in range(stringLength):
            population[:,i] = where(population[:,i] best and fitness<500:
            best = fitness
            bestString = string
    print best
    print bestString

exhaustive()
--------------------------------------------------------------------------------
/12 Evolutionary/fourpeaks.py:
--------------------------------------------------------------------------------

# Code from Chapter 12 of Machine Learning: An Algorithmic Perspective
# by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html)

# You are free to use, change, or redistribute the code in any way you wish for
# non-commercial purposes, but please maintain the name of the original author.
# This code comes with no warranty of any kind.
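# A worked example of the two quantities measured inside fourpeaks() below:
# "start" is the index of the first 1 and "finish" counts the 1s after the
# last 0. For a 20-bit string of 17 zeros then 3 ones (made up for
# illustration) they are 17 and 3, so with T=15 the fitness is max(17,3)=17
# and the +100 bonus is not awarded:
from numpy import array, where, shape
pop = array([[0]*17 + [1]*3])
s = where(pop[0,:]==1)
f = where(pop[0,:]==0)
print s[0][0], shape(pop)[1] - f[-1][-1] - 1   # 17 3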
8 | 9 | # Stephen Marsland, 2008 10 | 11 | # The four peaks fitness function 12 | from numpy import * 13 | def fourpeaks(population): 14 | 15 | T = 15 16 | start = zeros((shape(population)[0],1)) 17 | finish = zeros((shape(population)[0],1)) 18 | 19 | fitness = zeros((shape(population)[0],1)) 20 | 21 | for i in range(shape(population)[0]): 22 | s = where(population[i,:]==1) 23 | f = where(population[i,:]==0) 24 | if size(s)>0: 25 | start = s[0][0] 26 | else: 27 | start = 0 28 | 29 | if size(f)>0: 30 | finish = shape(population)[1] - f[-1][-1] -1 31 | else: 32 | finish = 0 33 | 34 | if start>T and finish>T: 35 | fitness[i] = maximum(start,finish)+100 36 | else: 37 | fitness[i] = maximum(start,finish) 38 | 39 | fitness = squeeze(fitness) 40 | return fitness 41 | -------------------------------------------------------------------------------- /12 Evolutionary/ga.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 12 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | 12 | # The Genetic algorithm 13 | # Comment and uncomment fitness functions as appropriate (as an import and the fitnessFunction variable) 14 | 15 | from pylab import * 16 | from numpy import * 17 | import knapsack as fF 18 | 19 | class ga: 20 | 21 | def __init__(self,stringLength,fitnessFunction,nEpochs,populationSize=100,mutationProb=-1,crossover='un',nElite=4,tournament=True): 22 | """ Constructor""" 23 | self.stringLength = stringLength 24 | 25 | # Population size should be even 26 | if mod(populationSize,2)==0: 27 | self.populationSize = populationSize 28 | else: 29 | self.populationSize = populationSize+1 30 | 31 | if mutationProb < 0: 32 | self.mutationProb = 1/stringLength 33 | else: 34 | self.mutationProb = mutationProb 35 | 36 | self.nEpochs = nEpochs 37 | 38 | self.fitnessFunction = fitnessFunction 39 | 40 | self.crossover = crossover 41 | self.nElite = nElite 42 | self.tournment = tournament 43 | 44 | self.population = random.rand(self.populationSize,self.stringLength) 45 | self.population = where(self.population<0.5,0,1) 46 | 47 | def runGA(self): 48 | """The basic loop""" 49 | ion() 50 | plotfig = figure 51 | bestfit = zeros(self.nEpochs) 52 | 53 | for i in range(self.nEpochs): 54 | # Compute fitness of the population 55 | fitness = eval(self.fitnessFunction)(self.population) 56 | 57 | # Pick parents -- can do in order since they are randomised 58 | newPopulation = self.fps(self.population,fitness) 59 | 60 | # Apply the genetic operators 61 | if self.crossover == 'sp': 62 | newPopulation = self.spCrossover(newPopulation) 63 | elif self.crossover == 'un': 64 | newPopulation = self.uniformCrossover(newPopulation) 65 | newPopulation = self.mutate(newPopulation) 66 | 67 | # Apply elitism and tournaments if using 68 | if self.nElite>0: 69 | newPopulation = self.elitism(self.population,newPopulation,fitness) 70 | 71 | if self.tournament: 72 | newPopulation = self.tournament(self.population,newPopulation,fitness,self.fitnessFunction) 73 | 74 | self.population = newPopulation 75 | bestfit[i] = fitness.max() 76 | 77 | if (mod(i,100)==0): 78 | print i, fitness.max() 79 | #plot([i],[fitness.max()],'r+') 80 | 
plot(bestfit,'kx-') 81 | show() 82 | 83 | def fps(self,population,fitness): 84 | 85 | # Scale fitness by total fitness 86 | fitness = fitness/sum(fitness) 87 | fitness = 10*fitness/fitness.max() 88 | 89 | # Put repeated copies of each string in according to fitness 90 | # Deal with strings with very low fitness 91 | j=0 92 | while round(fitness[j])<1: 93 | j = j+1 94 | 95 | newPopulation = kron(ones((round(fitness[j]),1)),population[j,:]) 96 | 97 | # Add multiple copies of strings into the newPopulation 98 | for i in range(j+1,self.populationSize): 99 | if round(fitness[i])>=1: 100 | newPopulation = concatenate((newPopulation,kron(ones((round(fitness[i]),1)),population[i,:])),axis=0) 101 | 102 | # Shuffle the order (note that there are still too many) 103 | indices = range(shape(newPopulation)[0]) 104 | random.shuffle(indices) 105 | newPopulation = newPopulation[indices[:self.populationSize],:] 106 | return newPopulation 107 | 108 | def spCrossover(self,population): 109 | # Single point crossover 110 | newPopulation = zeros(shape(population)) 111 | crossoverPoint = random.randint(0,self.stringLength,self.populationSize) 112 | for i in range(0,self.populationSize,2): 113 | newPopulation[i,:crossoverPoint[i]] = population[i,:crossoverPoint[i]] 114 | newPopulation[i+1,:crossoverPoint[i]] = population[i+1,:crossoverPoint[i]] 115 | newPopulation[i,crossoverPoint[i]:] = population[i+1,crossoverPoint[i]:] 116 | newPopulation[i+1,crossoverPoint[i]:] = population[i,crossoverPoint[i]:] 117 | return newPopulation 118 | 119 | def uniformCrossover(self,population): 120 | # Uniform crossover 121 | newPopulation = zeros(shape(population)) 122 | which = random.rand(self.populationSize,self.stringLength) 123 | which1 = which>=0.5 124 | for i in range(0,self.populationSize,2): 125 | newPopulation[i,:] = population[i,:]*which1[i,:] + population[i+1,:]*(1-which1[i,:]) 126 | newPopulation[i+1,:] = population[i,:]*(1-which1[i,:]) + population[i+1,:]*which1[i,:] 127 | return newPopulation 128 | 129 | def mutate(self,population): 130 | # Mutation 131 | whereMutate = random.rand(shape(population)[0],shape(population)[1]) 132 | population[where(whereMutate < self.mutationProb)] = 1 - population[where(whereMutate < self.mutationProb)] 133 | return population 134 | 135 | def elitism(self,oldPopulation,population,fitness): 136 | best = argsort(fitness) 137 | best = squeeze(oldPopulation[best[-self.nElite:],:]) 138 | indices = range(shape(population)[0]) 139 | random.shuffle(indices) 140 | population = population[indices,:] 141 | population[0:self.nElite,:] = best 142 | return population 143 | 144 | def tournament(self,oldPopulation,population,fitness,fitnessFunction): 145 | newFitness = eval(self.fitnessFunction)(population) 146 | for i in range(0,shape(population)[0],2): 147 | f = concatenate((fitness[i:i+2],newFitness[i:i+2]),axis=1) 148 | indices = argsort(f) 149 | if indices[-1]<2 and indices[-2]<2: 150 | population[i,:] = oldPopulation[i,:] 151 | population[i+1,:] = oldPopulation[i+1,:] 152 | elif indices[-1]<2: 153 | if indices[0]>=2: 154 | population[i+indices[0]-2,:] = oldPopulation[i+indices[-1]] 155 | else: 156 | population[i+indices[1]-2,:] = oldPopulation[i+indices[-1]] 157 | elif indices[-2]<2: 158 | if indices[0]>=2: 159 | population[i+indices[0]-2,:] = oldPopulation[i+indices[-2]] 160 | else: 161 | population[i+indices[1]-2,:] = oldPopulation[i+indices[-2]] 162 | return population 163 | 164 | -------------------------------------------------------------------------------- /12 
Evolutionary/greedyKnapsack.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 12 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | # A greedy algorithm to solve the Knapsack problem 12 | from numpy import * 13 | 14 | def greedy(): 15 | maxSize = 500 16 | sizes = array([109.60,125.48,52.16,195.55,58.67,61.87,92.95,93.14,155.05,110.89,13.34,132.49,194.03,121.29,179.33,139.02,198.78,192.57,81.66,128.90]) 17 | 18 | sizes.sort() 19 | newSizes = sizes[-1:0:-1] 20 | space = maxSize 21 | 22 | while len(newSizes)>0 and space>newSizes[-1]: 23 | # Pick largest item that will fit 24 | item = where(space>newSizes)[0][0] 25 | print newSizes[item] 26 | space = space-newSizes[item] 27 | newSizes = concatenate((newSizes[:item],newSizes[item+1:])) 28 | print "Size = ",maxSize-space 29 | 30 | greedy() 31 | -------------------------------------------------------------------------------- /12 Evolutionary/knapsack.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 12 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | # A fitness function for the Knapsack problem 12 | from numpy import * 13 | 14 | def knapsack(pop): 15 | maxSize = 500 16 | #sizes = array([193.71,60.15,89.08,88.98,15.39,238.14,68.78,107.47,119.66,183.70]) 17 | 18 | sizes = array([109.60,125.48,52.16,195.55,58.67,61.87,92.95,93.14,155.05,110.89,13.34,132.49,194.03,121.29,179.33,139.02,198.78,192.57,81.66,128.90]) 19 | 20 | fitness = sum(sizes*pop,axis=1) 21 | fitness = where(fitness>maxSize,500-2*(fitness-maxSize),fitness) 22 | 23 | return fitness 24 | -------------------------------------------------------------------------------- /12 Evolutionary/run_ga.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 12 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 
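# The knapsack fitness defined in knapsack.py above (and used by the GA runner
# below) scores a 20-bit selection by total packed size, with anything over
# the 500 limit penalised to 500 - 2*(total - 500). Two hand-picked
# selections as a standalone check:
from numpy import array, sum, where
sizes = array([109.60,125.48,52.16,195.55,58.67,61.87,92.95,93.14,155.05,110.89,13.34,132.49,194.03,121.29,179.33,139.02,198.78,192.57,81.66,128.90])
pop = array([[1,1,1,0,1,1]+[0]*14,[1]*20])   # one feasible pick, one overfull
fitness = sum(sizes*pop,axis=1)
fitness = where(fitness>500,500-2*(fitness-500),fitness)
print fitness   # first ~407.78 (fits), second heavily penalised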
8 | 9 | # Stephen Marsland, 2008 10 | 11 | # A runner for the Genetic Algorithm 12 | import ga 13 | 14 | ga = ga.ga(20,'fF.knapsack',101,100,-1,'sp',4,True) 15 | ga.runGA() 16 | -------------------------------------------------------------------------------- /13 Reinforcement/SARSA.py: -------------------------------------------------------------------------------- 1 | 2 | # Code from Chapter 13 of Machine Learning: An Algorithmic Perspective 3 | # by Stephen Marsland (http://seat.massey.ac.nz/personal/s.r.marsland/MLBook.html) 4 | 5 | # You are free to use, change, or redistribute the code in any way you wish for 6 | # non-commercial purposes, but please maintain the name of the original author. 7 | # This code comes with no warranty of any kind. 8 | 9 | # Stephen Marsland, 2008 10 | 11 | # The basic SARSA algorithm with the Europe example 12 | 13 | from numpy import * 14 | 15 | def SARSA(): 16 | 17 | R = array([[-5,0,-inf,-inf,-inf,-inf],[0,-5,0,0,-inf,-inf],[-inf,0,-5,0,-inf,100],[-inf,0,0,-5,0,-inf],[-inf,-inf,-inf,0,-5,100],[-inf,-inf,0,-inf,-inf,0]]) 18 | t = array([[1,1,0,0,0,0],[1,1,1,1,0,0],[0,1,1,1,0,1],[0,1,1,1,1,0],[0,0,0,1,1,1],[0,0,1,0,1,1]]) 19 | 20 | 21 | 22 | nStates = shape(R)[0] 23 | nActions = shape(R)[1] 24 | Q = random.rand(nStates,nActions)*0.1-0.05 25 | mu = 0.7 26 | gamma = 0.4 27 | epsilon = 0.1 28 | nits = 0 29 | 30 | while nits < 1000: 31 | # Pick initial state 32 | s = random.randint(nStates) 33 | # epsilon-greedy 34 | if (random.rand()0: 54 | t[i,j,k,0] = i-1 55 | t[i,j,k,1] = j 56 | else: 57 | t[i,j,k,0] = i 58 | t[i,j,k,1] = j 59 | 60 | if i==1 and 1<=j<=5: 61 | t[i,j,k,0] = 0 62 | t[i,j,k,1] = 0 63 | else: 64 | if j>0: 65 | t[i,j,k,0] = i 66 | t[i,j,k,1] = j-1 67 | else: 68 | t[i,j,k,0] = i 69 | t[i,j,k,1] = j 70 | if i==0 and j==6: 71 | t[i,j,k,0] = 0 72 | t[i,j,k,1] = 0 73 | 74 | #print t[:,:,3,0] ,t[:,:,3,1] 75 | 76 | Q = random.random_sample(shape(R))*0.1-0.05 77 | mu = 0.7 78 | gamma = 0.4 79 | epsilon = 0.05 80 | nits = 0 81 | 82 | while nits < 1000: 83 | # Pick initial state 84 | s = array([0,0]) #array([random.randint(4),random.randint(7)]) 85 | 86 | r=-inf 87 | while r==-inf: 88 | # epsilon-greedy 89 | if (random.rand()0: 53 | t[i,j,k,0] = i-1 54 | t[i,j,k,1] = j 55 | else: 56 | t[i,j,k,0] = i 57 | t[i,j,k,1] = j 58 | 59 | if i==1 and 1<=j<=5: 60 | t[i,j,k,0] = 0 61 | t[i,j,k,1] = 0 62 | else: 63 | if j>0: 64 | t[i,j,k,0] = i 65 | t[i,j,k,1] = j-1 66 | else: 67 | t[i,j,k,0] = i 68 | t[i,j,k,1] = j 69 | if i==0 and j==6: 70 | t[i,j,k,0] = 0 71 | t[i,j,k,1] = 0 72 | 73 | #print t[:,:,3,0] ,t[:,:,3,1] 74 | 75 | #Q = random.random_sample(shape(R))*0.1-0.05 76 | Q = zeros(shape(R)) 77 | mu = 0.7 78 | gamma = 0.4 79 | epsilon = 0.05 80 | nits = 0 81 | 82 | while nits < 1000: 83 | # Pick initial state 84 | s = array([0,0]) #array([random.randint(4),random.randint(7)]) 85 | 86 | #print s, shape(s) 87 | #print shape(Q), shape(Q[s[0],s[1],:]) 88 | inEpisode = 1 89 | # Stop when the accepting state is reached 90 | while inEpisode: 91 | r=-inf 92 | while r==-inf: 93 | # epsilon-greedy 94 | if (random.rand()