├── src
    └── main
    │   └── java
    │       └── com
    │           └── github
    │               └── tjake
    │                   ├── rbm
    │                       ├── minst
    │                       │   ├── MinstItem.java
    │                       │   ├── Demo.java
    │                       │   ├── GenerativeMinstDBN.java
    │                       │   ├── MinstDatasetReader.java
    │                       │   ├── BinaryMinstDBN.java
    │                       │   └── BinaryMinstRBM.java
    │                       ├── Tuple.java
    │                       ├── Layer.java
    │                       ├── BinaryLayer.java
    │                       ├── LayerFactory.java
    │                       ├── GaussianLayer.java
    │                       ├── StackedRBMTrainer.java
    │                       ├── SimpleRBMTrainer.java
    │                       ├── StackedRBM.java
    │                       └── SimpleRBM.java
    │                   └── util
    │                       └── Utilities.java
├── LICENSE
├── readme.md
└── pom.xml


/src/main/java/com/github/tjake/rbm/minst/MinstItem.java:
--------------------------------------------------------------------------------
 1 | package com.github.tjake.rbm.minst;
 2 | 
 3 | /**
 4 |  * Plain data holder pairing one Minst image with its label.
 5 |  */
 6 | public class MinstItem {
 7 | 
 8 |     /** Image data of this item. */
 9 |     public int[] data;
10 | 
11 |     /** Label of the image. */
12 |     public String label;
13 | }
14 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/Tuple.java:
--------------------------------------------------------------------------------
 1 | package com.github.tjake.rbm;
 2 | 
 3 | /**
 4 |  * Groups three layers: the input, the visible and the hidden layer.
 5 |  * The references are fixed at construction time.
 6 |  */
 7 | public class Tuple {
 8 | 
 9 |     /** For a DBN this is the initial input layer. */
10 |     public final Layer input;
11 |     public final Layer visible;
12 |     public final Layer hidden;
13 | 
14 |     /**
15 |      * Not public: outside this package tuples are built through {@link Factory}.
16 |      */
17 |     protected Tuple(Layer input, Layer visible, Layer hidden) {
18 |         this.hidden = hidden;
19 |         this.visible = visible;
20 |         this.input = input;
21 |     }
22 | 
23 |     /**
24 |      * Creates tuples that all share the same input layer.
25 |      */
26 |     public static class Factory {
27 | 
28 |         /** Input layer given to every tuple created by this factory. */
29 |         public final Layer input;
30 | 
31 |         public Factory(Layer input) {
32 |             this.input = input;
33 |         }
34 | 
35 |         /**
36 |          * @param visible visible layer of the new tuple
37 |          * @param hidden  hidden layer of the new tuple
38 |          * @return a tuple of this factory's input and the two given layers
39 |          */
40 |         public Tuple create(Layer visible, Layer hidden) {
41 |             Tuple tuple = new Tuple(this.input, visible, hidden);
42 |             return tuple;
43 |         }
44 |     }
45 | }
46 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | Copyright 2013 T Jake Luciani <jake@apache.org>
 2 | 
 3 | Permission is hereby granted, free of charge, to any person obtaining a copy of
 4 | this software and associated documentation files (the 'Software'), to deal in
 5 | the Software without restriction, including without limitation the rights to
 6 | use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
 7 | the Software, and to permit persons to whom the Software is furnished to do so,
 8 | subject to the following conditions:
 9 | 
10 | The above copyright notice and this permission notice shall be included in all
11 | copies or substantial portions of the Software.
12 | 
13 | THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
15 | FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
16 | COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
17 | IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
18 | CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
19 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/util/Utilities.java:
--------------------------------------------------------------------------------
 1 | package com.github.tjake.util;
 2 | 
 3 | 
 4 | import com.github.tjake.rbm.Layer;
 5 | import java.util.Random;
 6 | 
 7 | /**
 8 |  * Static numeric helpers used by the RBM code.
 9 |  */
10 | public class Utilities {
11 | 
12 |     //Shared random source used by bernoulli()
13 |     static final Random staticRand = new Random();
14 | 
15 |     /**
16 |      * Computes the arithmetic mean of the values in a layer.
17 |      *
18 |      * @param input layer to average
19 |      * @return the mean; NaN for an empty layer (float 0/0)
20 |      */
21 |     public static float mean(final Layer input)
22 |     {
23 |         float m = 0.0f;
24 |         for (int i=0; i<input.size(); i++)
25 |             m += input.get(i);
26 | 
27 |         return m/input.size();
28 |     }
29 | 
30 |     /**
31 |      * Computes the sample standard deviation (n - 1 denominator) of a layer.
32 |      *
33 |      * @param input layer whose spread is measured
34 |      * @param mean  mean of the layer, e.g. from {@link #mean(Layer)}
35 |      * @return the standard deviation, or 0 when the layer has fewer than two values
36 |      */
37 |     public static float stddev(final Layer input, float mean)
38 |     {
39 |         int n = input.size();
40 | 
41 |         //A single value gives 0/0 = NaN with the n - 1 denominator, so report no spread instead
42 |         if (n < 2)
43 |             return 0.0f;
44 | 
45 |         double sum = 0.0;
46 |         for (int i=0; i<n; i++)
47 |         {
48 |             double diff = input.get(i) - mean;
49 |             sum += diff * diff;
50 |         }
51 | 
52 |         return (float)Math.sqrt(sum/(n - 1));
53 |     }
54 | 
55 |     /**
56 |      * Logistic function: 1 / (1 + e^-x).
57 |      */
58 |     public static float sigmoid(float x)
59 |     {
60 |         return (float) (1.0f / (1.0f + Math.exp(-x)));
61 |     }
62 | 
63 |     /**
64 |      * Draws a binary sample for every value of a layer.
65 |      *
66 |      * Each input value is used as the probability of producing 1: the output is 1
67 |      * when a uniform random number from [0, 1) is below the value, otherwise 0.
68 |      *
69 |      * @param input layer of probabilities; it is read but not written
70 |      * @return a layer obtained from {@code input.clone()} holding only 0s and 1s
71 |      */
72 |     public static Layer bernoulli(Layer input)
73 |     {
74 |         Layer output = input.clone();
75 |         for (int i=0; i<output.size(); i++)
76 |             output.set(i, staticRand.nextFloat() < input.get(i) ? 1.0f : 0.0f);
77 | 
78 |         return output;
79 |     }
80 | 
81 | }
82 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/Layer.java:
--------------------------------------------------------------------------------
 1 | package com.github.tjake.rbm;
 2 | 
 3 | import java.util.Arrays;
 4 | 
 5 | /**
 6 |  * A layer of nodes in a neural network, stored as a float array, with a few
 7 |  * simple per-element operations.
 8 |  */
 9 | public class Layer {
10 | 
11 |     final float[] layer;
12 | 
13 |     /** Uses the given array as backing storage; the array is not copied. */
14 |     public Layer(float[] layer) {
15 |         this.layer = layer;
16 |     }
17 | 
18 |     /** Creates a layer with {@code size} nodes backed by a fresh array. */
19 |     public Layer(int size) {
20 |         this(new float[size]);
21 |     }
22 | 
23 |     /** @return the value at index {@code i} */
24 |     public float get(int i) {
25 |         return layer[i];
26 |     }
27 | 
28 |     /** Stores {@code f} at index {@code i}. */
29 |     public void set(int i, float f) {
30 |         layer[i] = f;
31 |     }
32 | 
33 |     /** Adds {@code f} to the value at index {@code i}. */
34 |     public void add(int i, float f) {
35 |         layer[i] = layer[i] + f;
36 |     }
37 | 
38 |     /** Multiplies the value at index {@code i} by {@code f}. */
39 |     public void mult(int i, float f) {
40 |         layer[i] = layer[i] * f;
41 |     }
42 | 
43 |     /** Divides the value at index {@code i} by {@code f}. */
44 |     public void div(int i, float f) {
45 |         layer[i] = layer[i] / f;
46 |     }
47 | 
48 |     /** @return the number of nodes in this layer */
49 |     public int size() {
50 |         return layer.length;
51 |     }
52 | 
53 |     /** @return the backing array itself, not a copy */
54 |     public float[] get() {
55 |         return layer;
56 |     }
57 | 
58 |     /** @return a new Layer backed by a copy of this layer's values */
59 |     public Layer clone() {
60 |         return new Layer(Arrays.copyOf(layer, layer.length));
61 |     }
62 | 
63 |     /** Resets every value to 0. */
64 |     public void clear() {
65 |         Arrays.fill(layer, 0, layer.length, 0.0f);
66 |     }
67 | 
68 |     /**
69 |      * Copies all values of this layer into {@code src}, starting at index 0.
70 |      * Despite its name, {@code src} is the destination of the copy.
71 |      */
72 |     public void copy(float[] src) {
73 |         System.arraycopy(this.layer, 0, src, 0, this.layer.length);
74 |     }
75 | }
76 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/minst/Demo.java:
--------------------------------------------------------------------------------
 1 | package com.github.tjake.rbm.minst;
 2 | 
 3 | 
 4 | import java.io.File;
 5 | 
 6 | /**
 7 |  * Command line entry point that dispatches to the rbm, dbn or gen demo.
 8 |  */
 9 | public class Demo {
10 | 
11 |     /**
12 |      * Checks the arguments of the requested mode and starts the matching demo.
13 |      * On invalid arguments the usage text is printed and the JVM exits with -1.
14 |      *
15 |      * @param args the mode (rbm, dbn or gen) followed by that mode's file arguments
16 |      */
17 |     public static void main(String[] args) {
18 | 
19 |         if (args.length < 2)
20 |             usage("");
21 | 
22 |         String mode = args[0];
23 | 
24 |         if (mode.equalsIgnoreCase("rbm")) {
25 |             //rbm needs a labels file and an images file
26 |             if (args.length < 3)
27 |                 usage("rbm requires a labels file and an images file");
28 | 
29 |             File labels = requireFile(args[1], "invalid minst labels file: ");
30 |             File images = requireFile(args[2], "invalid minst images file: ");
31 | 
32 |             BinaryMinstRBM.start(labels,images);
33 |         }
34 |         else if (mode.equalsIgnoreCase("dbn")) {
35 |             //dbn additionally needs the file passed on as the save target
36 |             if (args.length < 4)
37 |                 usage("dbn requires a labels file, an images file and a file to save to");
38 | 
39 |             File labels = requireFile(args[1], "invalid minst labels file: ");
40 |             File images = requireFile(args[2], "invalid minst images file: ");
41 |             File saveto = new File(args[3]);
42 | 
43 |             BinaryMinstDBN.start(labels,images,saveto);
44 |         }
45 |         else if (mode.equalsIgnoreCase("gen")) {
46 |             File load = requireFile(args[1], "invalid dbn file: ");
47 | 
48 |             GenerativeMinstDBN.start(load);
49 |         }
50 |         else {
51 |             //An unrecognised mode is an argument error, not a no-op
52 |             usage("unknown mode: "+mode);
53 |         }
54 |     }
55 | 
56 |     /**
57 |      * Returns the file at {@code path}; when it is not an existing regular file
58 |      * the usage text is printed with {@code err + path} and the JVM exits.
59 |      */
60 |     private static File requireFile(String path, String err) {
61 |         File file = new File(path);
62 |         if (!file.isFile())
63 |             usage(err+path);
64 | 
65 |         return file;
66 |     }
67 | 
68 |     /**
69 |      * Prints the usage text, followed by {@code err} when it is non-empty, to
70 |      * stderr and terminates the JVM with exit status -1.
71 |      */
72 |     private static void usage(String err) {
73 |         System.err.println("Usage: \t[rbm minst-labels.gz minst-images.gz]\n\t [dbn minst-labels.gz minst-images.gz dbn.bin]\n\t [gen dbn.bin]");
74 |         if (err != null && err.length() > 0)
75 |             System.err.println(err);
76 | 
77 |         System.exit(-1);
78 |     }
79 | }
80 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/BinaryLayer.java:
--------------------------------------------------------------------------------
 1 | package com.github.tjake.rbm;
 2 | 
 3 | 
 4 | /**
 5 |  * Converts grayscale intensities to binary values and forwards every layer
 6 |  * operation to the wrapped delegate.
 7 |  */
 8 | public class BinaryLayer extends Layer {
 9 | 
10 |     final Layer delegate;
11 | 
12 |     /**
13 |      * Wraps {@code delegate} and thresholds its values to 0/1 in place.
14 |      */
15 |     public BinaryLayer(Layer delegate)
16 |     {
17 |         //No array of our own: all values live in the delegate
18 |         super(null);
19 |         this.delegate = delegate;
20 | 
21 |         convertToBinary();
22 |     }
23 | 
24 |     //Values above 30 become 1, all others become 0
25 |     private void convertToBinary()
26 |     {
27 |         for (int i=0; i<delegate.size(); i++)
28 |         {
29 |             float v = delegate.get(i);
30 |             delegate.set(i, v > 30 ? 1.0f : 0.0f);
31 |         }
32 |     }
33 | 
34 |     /**
35 |      * Scales the values of {@code delegate} by 255 into a new array.
36 |      */
37 |     public static float[] fromBinary(Layer delegate) {
38 |         float [] output = new float[delegate.size()];
39 |         for (int i = 0; i < output.length; i++) {
40 |             output[i] = delegate.get(i) * 255.0f;
41 |         }
42 |         return output;
43 |     }
44 | 
45 |     @Override
46 |     public void set(int i, float f) {
47 |         delegate.set(i,f);
48 |     }
49 | 
50 |     @Override
51 |     public float get(int i) {
52 |         return delegate.get(i);
53 |     }
54 | 
55 |     @Override
56 |     public void add(int i, float f) {
57 |         delegate.add(i,f);
58 |     }
59 | 
60 |     @Override
61 |     public void div(int i, float f) {
62 |         delegate.div(i,f);
63 |     }
64 | 
65 |     @Override
66 |     public void mult(int i, float f) {
67 |         //Must multiply; forwarding to div here would silently invert the operation
68 |         delegate.mult(i,f);
69 |     }
70 | 
71 |     @Override
72 |     public int size() {
73 |         return delegate.size();
74 |     }
75 | 
76 |     /** @return the delegate's clone, which is not wrapped in a BinaryLayer */
77 |     @Override
78 |     public Layer clone() {
79 |         return delegate.clone();
80 |     }
81 | 
82 |     @Override
83 |     public void clear() {
84 |         delegate.clear();
85 |     }
86 | 
87 |     @Override
88 |     public void copy(float[] src) {
89 |         delegate.copy(src);
90 |     }
91 | 
92 |     @Override
93 |     public float[] get() {
94 |         return delegate.get();
95 |     }
96 | }
97 | 

--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/LayerFactory.java:
--------------------------------------------------------------------------------
 1 | package com.github.tjake.rbm;
 2 | 
 3 | 
 4 | import java.awt.image.BufferedImage;
 5 | import java.io.DataInput;
 6 | import java.io.DataOutput;
 7 | import java.io.IOException;
 8 | import java.util.Arrays;
 9 | 
10 | /**
11 |  * Creates layers and saves/loads them in a simple binary format.
12 |  */
13 | public class LayerFactory {
14 |     //Written at the start of every saved layer and checked on load
15 |     public static final byte[] MAGIC = {(byte) 0xf0, (byte) 0x0d, (byte) 0x00, (byte) 0x0F};
16 | 
17 |     /** Creates a layer with {@code size} nodes. */
18 |     public Layer create(int size) {
19 |         return new Layer(size);
20 |     }
21 | 
22 |     /** Creates a layer that uses {@code start} as its values. */
23 |     public Layer create(float[] start) {
24 |        return new Layer(start);
25 |     }
26 | 
27 |     /**
28 |      * Creates a layer from band 0 of the image, one node per pixel, row by row.
29 |      */
30 |     public Layer create(BufferedImage img) {
31 |         int width = img.getWidth();
32 |         int height = img.getHeight();
33 |         Layer layer = create(width * height);
34 | 
35 |         //getData() returns a copy of the image data, so take it once rather than once per pixel
36 |         java.awt.image.Raster data = img.getData();
37 | 
38 |         int i = 0;
39 |         for (int y = 0; y < height; y++)
40 |             for (int x = 0; x < width; x++)
41 |                 layer.set(i++, data.getSample(x, y, 0));
42 | 
43 |         return layer;
44 |     }
45 | 
46 |     /**
47 |      * Writes MAGIC, then the number of elements as an int, then every value as a float.
48 |      *
49 |      * @throws IOException on write failure or when get().length differs from size()
50 |      */
51 |     public void save(Layer layer, DataOutput dataOutput) throws IOException {
52 |         //First write magic #
53 |         dataOutput.write(MAGIC);
54 | 
55 |         float[] floats = layer.get();
56 |         if (floats.length != layer.size())
57 |             throw new IOException("get().length != size()");
58 | 
59 |         //Number of elements
60 |         dataOutput.writeInt(layer.size());
61 | 
62 |         for (int i = 0; i < floats.length; i++)
63 |             dataOutput.writeFloat(floats[i]);
64 |     }
65 | 
66 |     /**
67 |      * Reads a layer in the format written by {@link #save(Layer, DataOutput)}.
68 |      *
69 |      * @throws IOException on read failure, wrong magic bytes or a negative size
70 |      */
71 |     public Layer load(DataInput dataInput) throws IOException {
72 |         byte[] magic = new byte[4];
73 |         dataInput.readFully(magic);
74 | 
75 |         if (!Arrays.equals(MAGIC, magic))
76 |             throw new IOException("Bad File Format");
77 | 
78 |         int size = dataInput.readInt();
79 | 
80 |         if (size < 0)
81 |             throw new IOException("Invalid size");
82 | 
83 |         float[] input = new float[size];
84 |         for (int i = 0; i < size; i++)
85 |             input[i] = dataInput.readFloat();
86 | 
87 |         return create(input);
88 |     }
89 | 
90 |     /** Creates a GaussianLayer around the layer built from {@code img}. */
91 |     public GaussianLayer createGaussian(BufferedImage img) {
92 |         return new GaussianLayer(create(img));
93 |     }
94 | 
95 | }
96 | 


--------------------------------------------------------------------------------
/readme.md:
--------------------------------------------------------------------------------
 1 | rbm-dbn-mnist
 2 | ==========
 3 | 
 4 | Learn more about this project from this blog post: 
 5 | 
 6 | http://tjake.github.com/blog/2013/02/18/resurgence-in-artificial-intelligence/
 7 | 
 8 | This project provides an implementation of a Restricted Boltzmann Machine and a Deep Belief Network.
 9 | 
10 | It uses the [MNIST handwritten digit dataset](http://yann.lecun.com/exdb/mnist/) to illustrate an example RBM and DBN.
11 | 
12 | Usage
13 | =====
14 | 
15 | Build the project from source with Maven:
16 | 
17 | 1. mvn deploy
18 | 
19 | This will build a single jar and download the mnist dataset.
20 | 
21 | 2. java -jar target/rbm-dbn-mnist-0.0.1.jar 
22 | 
23 | Runs the app and shows the usage screen:
24 | 
25 | ````
26 | Usage: [rbm minst-labels.gz minst-images.gz]
27 | 	   [dbn minst-labels.gz minst-images.gz dbn.bin]
28 | 	   [gen dbn.bin]
29 | ````
30 | 
31 | 3. java -jar target/rbm-dbn-mnist-0.0.1.jar rbm target/minst/train-labels-idx1-ubyte.gz target/minst/train-images-idx3-ubyte.gz
32 | 
33 | Trains a single RBM with 100 hidden nodes.  The weights of each hidden node are rendered alongside the test digit in blue.
34 | 
35 | ![RBM Demo](http://tjake.github.com/images/MinstRBM.png)
36 | 
37 | 
38 | 4. java -jar target/rbm-dbn-mnist-0.0.1.jar dbn target/minst/train-labels-idx1-ubyte.gz target/minst/train-images-idx3-ubyte.gz /tmp/dbn.bin
39 | 
40 | Trains a Deep Belief Network made up of three RBMs.  It learns to match pictures of digits with their corresponding labels. It takes about 10 minutes to train, but once it's done it has a ~95% accuracy rate.  The trained DBN is saved to a file.
41 | 
42 | 5. java -jar target/rbm-dbn-mnist-0.0.1.jar gen /tmp/dbn.bin
43 | 
44 | Takes the trained DBN from step 4 and reverses the flow, generating a visual image of a digit from a digit label.
45 | 
46 | License
47 | =======
48 | 
49 | Copyright 2013 T Jake Luciani <jake@apache.org>
50 | 
51 | Permission is hereby granted, free of charge, to any person obtaining a copy of
52 | this software and associated documentation files (the 'Software'), to deal in
53 | the Software without restriction, including without limitation the rights to
54 | use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
55 | the Software, and to permit persons to whom the Software is furnished to do so,
56 | subject to the following conditions:
57 | 
58 | The above copyright notice and this permission notice shall be included in all
59 | copies or substantial portions of the Software.
60 | 
61 | THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
62 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
63 | FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
64 | COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
65 | IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
66 | CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
67 | 
68 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/GaussianLayer.java:
--------------------------------------------------------------------------------
  1 | package com.github.tjake.rbm;
  2 | 
  3 | 
  4 | import com.github.tjake.util.Utilities;
  5 | 
  6 | /**
  7 |  * Converts raw values to standard deviations
  8 |  */
  9 | public class GaussianLayer extends Layer{
 10 | 
 11 |     final Layer delegate;
 12 |     private float mean;
 13 |     private float stddev;
 14 | 
 15 | 
 16 |     public GaussianLayer(Layer delegate)
 17 |     {
 18 |         super(null);
 19 |         this.delegate = delegate;
 20 | 
 21 |         convertToStddev();
 22 | 
 23 |     }
 24 | 
 25 |     public GaussianLayer(Layer delegate, Layer base)
 26 |     {
 27 |         super(null);
 28 | 
 29 |         GaussianLayer gbase = (GaussianLayer) base;
 30 | 
 31 |         this.delegate = delegate;
 32 |         mean = gbase.mean;
 33 |         stddev = gbase.stddev;
 34 | 
 35 |     }
 36 | 
 37 |     private void convertToStddev()
 38 |     {
 39 |         mean = Utilities.mean(delegate);
 40 |         stddev = Utilities.stddev(delegate, mean);
 41 |         stddev = stddev < 0.1f ? 0.1f : stddev;
 42 | 
 43 |         double min = Double.MAX_VALUE, max = Double.MIN_VALUE;
 44 | 
 45 | 
 46 |         for (int i=0; i<delegate.size(); i++)
 47 |         {
 48 |             double v = (delegate.get(i) - mean)/stddev;
 49 |             if (v > max) max = v;
 50 |             if (v < min) min = v;
 51 | 
 52 |             delegate.set(i, (float)v);
 53 |         }
 54 | 
 55 | 
 56 |     }
 57 | 
 58 |     public float[] fromGaussian() {
 59 |         double min = Double.MAX_VALUE, max = Double.MIN_VALUE;
 60 |         float [] output = new float[delegate.size()];
 61 |         for (int i = 0; i < output.length; i++) {
 62 |             double v =  delegate.get(i);
 63 | 
 64 |             //Squash > 2 sigma
 65 |             if (Math.abs(v) > 2)
 66 |                 v /= 2;
 67 | 
 68 |             v  = v * stddev + mean;
 69 | 
 70 |             if (v > max) max = v;
 71 |             if (v < min) min = v;
 72 | 
 73 |             output[i] = (float)(v < 0 ? 0 : v);
 74 |             output[i] = (float)(v > 255 ? 255 : v);
 75 |         }
 76 | 
 77 | 
 78 |         return output;
 79 |     }
 80 | 
 81 | 
 82 |     @Override
 83 |     public void set(int i, float f) {
 84 |         delegate.set(i,f);
 85 |     }
 86 | 
 87 |     @Override
 88 |     public float get(int i) {
 89 |         return delegate.get(i);
 90 |     }
 91 | 
 92 |     @Override
 93 |     public void add(int i, float f) {
 94 |         delegate.add(i,f);
 95 |     }
 96 | 
 97 |     @Override
 98 |     public void div(int i, float f) {
 99 |         delegate.div(i,f);
100 |     }
101 | 
102 |     @Override
103 |     public void mult(int i, float f) {
104 |         delegate.div(i,f);
105 |     }
106 | 
107 |     @Override
108 |     public int size() {
109 |         return delegate.size();
110 |     }
111 | 
112 |     @Override
113 |     public Layer clone() {
114 |         return delegate.clone();
115 |     }
116 | 
117 |     @Override
118 |     public void clear() {
119 |         delegate.clear();
120 |     }
121 | 
122 |     @Override
123 |     public void copy(float[] src) {
124 |         delegate.copy(src);
125 |     }
126 | 
127 |     @Override
128 |     public float[] get() {
129 |         return delegate.get();
130 |     }
131 | }
132 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/StackedRBMTrainer.java:
--------------------------------------------------------------------------------
 1 | package com.github.tjake.rbm;
 2 | 
 3 | import java.util.ArrayList;
 4 | import java.util.Arrays;
 5 | import java.util.Iterator;
 6 | import java.util.List;
 7 | 
 8 | /**
 9 |  * Trains one RBM of a StackedRBM at a time, feeding it the input as
10 |  * transformed by the RBMs below it.
11 |  */
12 | public class StackedRBMTrainer {
13 | 
14 |     final StackedRBM stackedRBM;
15 |     final SimpleRBMTrainer inputTrainer;
16 |     final float momentum;
17 |     final float l2;
18 |     final Float targetSparsity;
19 |     float learningRate;
20 |     final LayerFactory layerFactory;
21 | 
22 |     public StackedRBMTrainer(StackedRBM stackedRBM, float momentum, float l2, Float targetSparsity, float learningRate, LayerFactory layerFactory )
23 |     {
24 |         this.stackedRBM = stackedRBM;
25 |         this.momentum = momentum;
26 |         this.l2 = l2;
27 |         this.targetSparsity = targetSparsity;
28 |         this.learningRate = learningRate;
29 |         this.layerFactory = layerFactory;
30 | 
31 |         inputTrainer = new SimpleRBMTrainer(momentum, l2, targetSparsity, learningRate, layerFactory );
32 |     }
33 | 
34 |     //Changes the rate here and on the trainer that does the actual learning
35 |     public void  setLearningRate(float newRate){
36 |         learningRate = newRate;
37 |         inputTrainer.learningRate = newRate;
38 |     }
39 | 
40 |     /**
41 |      * Starts at the bottom of the DBN and uses the output of one RBM as the input of
42 |      * the next, until it reaches the RBM selected by stopAt, which is then trained
43 |      * with the transformed batch. A second batch can be appended to that input, so a
44 |      * deep RBM feature can be combined with a second input, for example the features
45 |      * of a digit picture with the digit label.
46 |      *
47 |      * @param bottomBatch inputs for the bottom RBM
48 |      * @param topBatch    layers appended to the input of the trained RBM, or null/empty
49 |      *                    for none; not used when stopAt is 1
50 |      * @param stopAt      which RBM to train, from 1 (bottom) to the number of inner RBMs
51 |      * @return the result of the inner trainer for this batch
52 |      * @throws IllegalArgumentException if topBatch and bottomBatch differ in size or
53 |      *                                  stopAt is out of range
54 |      */
55 |     public double learn(List<Layer> bottomBatch, List<Layer> topBatch, int stopAt)
56 |     {
57 |         boolean hasTop = topBatch != null && !topBatch.isEmpty();
58 | 
59 |         if (hasTop && topBatch.size() != bottomBatch.size())
60 |             throw new IllegalArgumentException("TopBatch != BottomBatch");
61 | 
62 |         //stopAt == 0 selects no RBM at all, so it is rejected like any other out of range value
63 |         if (stopAt < 1 || stopAt > stackedRBM.innerRBMs.size())
64 |             throw new IllegalArgumentException("Invalid stopAt");
65 | 
66 |         int last = stopAt - 1;
67 |         List<Layer> nextInputs = new ArrayList<Layer>(bottomBatch);
68 | 
69 |         //Use the hidden of each lower layer as the inputs of the next layer
70 |         for (int i=0; i<last; i++)
71 |         {
72 |             //The top batch is only joined onto the input of the RBM being trained
73 |             boolean appendTop = hasTop && i == last - 1;
74 | 
75 |             for (int j=0; j<nextInputs.size(); j++)
76 |             {
77 |                 Layer next = stackedRBM.innerRBMs.get(i).activateHidden(nextInputs.get(j),null);
78 | 
79 |                 if (appendTop)
80 |                 {
81 |                     float[] nextConcat = new float[next.size()+topBatch.get(j).size()];
82 |                     System.arraycopy(next.get(),0,nextConcat,0,next.size());
83 |                     System.arraycopy(topBatch.get(j).get(), 0, nextConcat, next.size(), topBatch.get(j).size());
84 | 
85 |                     next = layerFactory.create(nextConcat);
86 |                 }
87 | 
88 |                 nextInputs.set(j,next);
89 |             }
90 |         }
91 | 
92 |         //At stopping point do actual learning
93 |         return inputTrainer.learn(stackedRBM.innerRBMs.get(last), nextInputs, false);
94 |     }
95 | }
96 | 

--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/SimpleRBMTrainer.java:
--------------------------------------------------------------------------------
  1 | package com.github.tjake.rbm;
  2 | 
  3 | import java.util.Iterator;
  4 | import java.util.List;
  5 | /** Trains a SimpleRBM on batches of input layers, updating its weights and biases in place. */
  6 | public class SimpleRBMTrainer
  7 | {
  8 |     public float momentum;
  9 |     final float l2;
 10 |     final Float targetSparsity;
 11 |     public float learningRate;
 12 |     private LayerFactory layerFactory;
 13 |     // Per-batch accumulators kept between calls for reuse: gw (one Layer per hidden unit), gv (visible bias), gh (hidden bias)
 14 |     Layer[] gw;
 15 |     Layer gv;
 16 |     Layer gh;
 17 |     /** Stores the hyperparameters; learningRate is unboxed here, so passing null throws a NullPointerException. */
 18 |     public SimpleRBMTrainer(float momentum, float l2, Float targetSparsity, Float learningRate, LayerFactory layerFactory)
 19 |     {
 20 |         this.momentum = momentum;
 21 |         this.l2 = l2;
 22 |         this.targetSparsity = targetSparsity;
 23 |         this.learningRate = learningRate;
 24 |         this.layerFactory = layerFactory;
 25 |     }
 26 |     /** Applies one update to rbm from inputBatch and returns the root mean square of the batch-averaged visible difference (gv). */
 27 |     public double learn(final SimpleRBM rbm, List<Layer> inputBatch, boolean reverse)
 28 |     {
 29 |         int batchsize = inputBatch.size();
 30 |         // (Re)allocate the accumulators when they are missing or sized for another rbm; otherwise just zero them
 31 |         if (gw == null || gw.length != rbm.biasHidden.size() || gw[0].size() != rbm.biasVisible.size())
 32 |         {
 33 |             gw = new Layer[rbm.biasHidden.size()];
 34 |             for(int i=0; i<gw.length; i++)
 35 |                 gw[i] = layerFactory.create(rbm.biasVisible.size());
 36 | 
 37 |             gv = layerFactory.create(rbm.biasVisible.size());
 38 |             gh = layerFactory.create(rbm.biasHidden.size());
 39 |         }
 40 |         else
 41 |         {
 42 |             for(int i=0; i<gw.length; i++)
 43 |                 gw[i].clear();
 44 | 
 45 |             gv.clear();
 46 |             gh.clear();
 47 |         }
 48 |         
 49 |         // Contrastive Divergence: accumulate the difference between the first and second tuple for every input
 50 |         for (Layer input : inputBatch)
 51 |         {
 52 |             try {
 53 |                 Iterator<Tuple> it = reverse ? rbm.reverseIterator(input) : rbm.iterator(input);
 54 |                 // NOTE(review): t1/t2 are presumably the data-driven pass and its reconstruction — confirm in SimpleRBM
 55 |                 Tuple t1 = it.next();    //UP
 56 |                 Tuple t2 = it.next();    //Down
 57 |                 // Weights: hidden*visible product of t1 minus that of t2
 58 |                 for (int i=0; i< gw.length; i++)
 59 |                     for (int j=0; j<gw[i].size(); j++)
 60 |                         gw[i].add(j, (t1.hidden.get(i) * t1.visible.get(j)) - (t2.hidden.get(i) * t2.visible.get(j)));
 61 |                 // Visible bias: visible of t1 minus visible of t2
 62 |                 for (int i = 0; i < gv.size(); i++)
 63 |                     gv.add(i, t1.visible.get(i) - t2.visible.get(i));
 64 |                 // Hidden bias: hidden of t1 minus t2, or targetSparsity minus hidden of t1 when a target is set
 65 |                 for (int i = 0; i < gh.size(); i++)
 66 |                     gh.add(i,  targetSparsity == null ? t1.hidden.get(i) - t2.hidden.get(i) : targetSparsity - t1.hidden.get(i));
 67 | 
 68 |             } catch (Throwable t) {
 69 |                 t.printStackTrace(); // the failure is only logged; the remaining inputs are still processed
 70 |             }
 71 |         }
 72 | 
 73 | 
 74 |         // Average over the batch, mix in momentum and the l2 term, then apply to the weights
 75 |         for (int i = 0; i < gw.length; i++)
 76 |         {
 77 |             for (int j = 0; j < gw[i].size(); j++)
 78 |             {
 79 |                 gw[i].div(j, batchsize);
 80 |                 // NOTE(review): gw is zeroed on every call, so this momentum blend never sees a previous step — confirm intended
 81 |                 gw[i].mult(j, 1 - momentum);
 82 |                 gw[i].add(j,  momentum * (gw[i].get(j) - l2*rbm.weights[i].get(j)));
 83 |                 
 84 |                 rbm.weights[i].add(j, learningRate * gw[i].get(j));
 85 |             }
 86 |         }
 87 | 
 88 |         double error = 0.0;
 89 | 
 90 |         for (int i = 0; i < gv.size(); i++)
 91 |         {
 92 |             gv.div(i, batchsize);
 93 |             // The error uses the averaged value before momentum is applied
 94 |             error += Math.pow(gv.get(i), 2);
 95 | 
 96 |             gv.mult(i, 1 - momentum);
 97 |             gv.add(i, momentum * (gv.get(i) * rbm.biasVisible.get(i)));
 98 | 
 99 |             rbm.biasVisible.add(i, learningRate * gv.get(i));
100 |         }
101 | 
102 |         error = Math.sqrt(error/gv.size());
103 |         // NOTE(review): with a target sparsity gh is computed but never applied to rbm.biasHidden — confirm intended
104 |         if (targetSparsity != null)
105 |         {
106 |             for (int i=0; i<gh.size(); i++)
107 |             {
108 |                 gh.div(i,batchsize);
109 |                 gh.set(i, targetSparsity - gh.get(i));
110 |             }
111 |         }
112 |         else
113 |         {
114 |             for (int i = 0; i < gh.size(); i++)
115 |             {
116 |                 gh.div(i, batchsize);
117 | 
118 |                 gh.mult(i, 1 - momentum);
119 |                 gh.add(i, momentum * (gh.get(i) * rbm.biasHidden.get(i)));
120 | 
121 |                 rbm.biasHidden.add(i, learningRate * gh.get(i));
122 |             }
123 |         }
124 | 
125 | 
126 |         return error;
127 |     }
128 | }
129 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/minst/GenerativeMinstDBN.java:
--------------------------------------------------------------------------------
  1 | package com.github.tjake.rbm.minst;
  2 | 
  3 | 
  4 | import com.github.tjake.rbm.*;
  5 | 
  6 | import javax.swing.*;
  7 | import java.awt.*;
  8 | import java.awt.image.BufferedImage;
  9 | import java.awt.image.WritableRaster;
 10 | import java.io.*;
 11 | import java.util.Iterator;
 12 | 
 13 | public class GenerativeMinstDBN extends Canvas {
 14 | 
 15 |     final StackedRBM rbm;
 16 | 
 17 |     int count = 0;
 18 |     Layer input;
 19 |     String label;
 20 | 
 21 |     public GenerativeMinstDBN(StackedRBM rbm) {
 22 |         super();
 23 |         this.rbm = rbm;
 24 |     }
 25 | 
 26 |     public void update() {
 27 | 
 28 |         synchronized (rbm) {
 29 | 
 30 |             int current = count++ % 10;
 31 |             label = String.valueOf(current);
 32 | 
 33 | 
 34 |             SimpleRBM r = rbm.getInnerRBMs().get(rbm.getInnerRBMs().size() - 1);
 35 | 
 36 |             input = new Layer(r.biasVisible.size());
 37 | 
 38 |             //setup input
 39 |             for (int i = 0; i < input.size()-10; i++)
 40 |                 input.set(i, 0.0f);
 41 | 
 42 |             //Position == Digit
 43 |             input.set(input.size() - 10 + current, 100000.0f);
 44 | 
 45 | 
 46 |             Iterator<Tuple> it = r.iterator(input);
 47 | 
 48 |             for (int i = 0; i < 1; i++)
 49 |                 it.next();
 50 | 
 51 |             input = it.next().visible;
 52 | 
 53 |             for (int i = rbm.getInnerRBMs().size() - 2; i >= 0; i--) {
 54 |                 SimpleRBM prevRbm = rbm.getInnerRBMs().get(i);
 55 | 
 56 |                 if (input.size() > prevRbm.biasHidden.size()) {
 57 |                     float[] newInput = new float[prevRbm.biasHidden.size()];
 58 |                     System.arraycopy(input.get(), 0, newInput, 0, newInput.length);
 59 |                     input = new Layer(newInput);
 60 |                 }
 61 | 
 62 |                 input = prevRbm.activateVisible(input,null);
 63 |             }
 64 |         }
 65 |         repaint();
 66 |     }
 67 | 
 68 | 
 69 |     /**
 70 |      * Paints the current {@code input} layer: its unit values become the raw pixel data of a
 71 |      * 28x28 image, which is scaled up to 256x256 and captioned with {@code label}.
 72 |      */
 73 |     public void paint(Graphics g) {
 74 |         synchronized (rbm) {
 75 |             // Each unit value is scaled by 255 and stored as one raw pixel value.
 76 |             final int units = input.size();
 77 |             int[] pixels = new int[units];
 78 |             for (int p = 0; p < units; p++) {
 79 |                 pixels[p] = Math.round(input.get(p) * 255f);
 80 |             }
 81 | 
 82 |             BufferedImage small = new BufferedImage(28, 28, BufferedImage.TYPE_INT_RGB);
 83 |             small.getRaster().setDataElements(0, 0, 28, 28, pixels);
 84 | 
 85 |             // Enlarge with bicubic interpolation before drawing onto the component.
 86 |             BufferedImage scaled = new BufferedImage(256, 256, BufferedImage.TYPE_INT_RGB);
 87 |             Graphics2D canvas = scaled.createGraphics();
 88 |             try {
 89 |                 canvas.setRenderingHint(RenderingHints.KEY_INTERPOLATION,
 90 |                         RenderingHints.VALUE_INTERPOLATION_BICUBIC);
 91 |                 canvas.clearRect(0, 0, 256, 256);
 92 |                 canvas.drawImage(small, 0, 0, 256, 256, null);
 93 |             } finally {
 94 |                 canvas.dispose();
 95 |             }
 96 | 
 97 |             g.drawImage(scaled, 10, 10, null);
 98 |             g.drawString("Generative version of: "+label, 10, 300);
 99 |         }
100 |     }
101 | 
102 | 
103 |     /**
104 |      * Loads a saved network from {@code stateFile} and animates it in a window until the
105 |      * calling thread is interrupted. An unreadable file surfaces as a {@link RuntimeException}.
106 |      */
107 |     public static void start(File stateFile) {
108 |         GenerativeMinstDBN m;
109 |         try {
110 |             DataInputStream input = new DataInputStream(new BufferedInputStream(new FileInputStream(stateFile)));
111 |             try {
112 |                 StackedRBM rbm = new StackedRBM();
113 |                 rbm.load(input, new LayerFactory());
114 |                 m = new GenerativeMinstDBN(rbm);
115 |             } finally {
116 |                 input.close(); // the state has been read; do not leak the file handle
117 |             }
118 |         } catch (IOException e) {
119 |             throw new RuntimeException(e);
120 |         }
121 | 
122 |         JFrame frame = new JFrame("MINST Generative Draw");
123 |         frame.setDefaultCloseOperation(JFrame.EXIT_ON_CLOSE);
124 |         frame.setSize(310, 310);
125 |         m.setSize(310, 310);
126 |         frame.add(m);
127 |         frame.pack();
128 |         frame.setLocationRelativeTo(null);
129 |         frame.setVisible(true);
130 | 
131 |         while (true) {
132 |             m.update();
133 |             try {
134 |                 Thread.sleep(2000);
135 |             } catch (InterruptedException e) {
136 |                 Thread.currentThread().interrupt(); // keep the flag set for the caller
137 |                 return;
138 |             }
139 |         }
140 |     }
141 | }


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/minst/MinstDatasetReader.java:
--------------------------------------------------------------------------------
  1 | package com.github.tjake.rbm.minst;
  2 | 
  3 | import java.io.DataInputStream;
  4 | import java.io.File;
  5 | import java.io.FileInputStream;
  6 | import java.io.FileNotFoundException;
  7 | import java.io.IOError;
  8 | import java.io.IOException;
  9 | import java.security.SecureRandom;
 10 | import java.util.*;
 11 | import java.util.zip.GZIPInputStream;
 12 | 
 13 | /**
 14 |  * Reads the gzip-compressed MNIST ("Minst") label and image files and randomly splits the
 15 |  * items it reads into a training set and a test set, each grouped by label.
 16 |  */
 17 | public class MinstDatasetReader implements Enumeration<MinstItem>
 18 | {
 19 |     /** Magic number at the start of an IDX label file. */
 20 |     private static final int LABELS_MAGIC = 2049;
 21 |     /** Magic number at the start of an IDX image file. */
 22 |     private static final int IMAGES_MAGIC = 2051;
 23 |     /** Reading stops once every training label seen so far has this many items. */
 24 |     private static final int MIN_ITEMS_PER_LABEL = 100;
 25 | 
 26 |     final DataInputStream labelsBuf;
 27 |     final DataInputStream imagesBuf;
 28 | 
 29 |     SecureRandom r = new SecureRandom();
 30 | 
 31 |     final Map<String, List<MinstItem>> trainingSet = new HashMap<String, List<MinstItem>>();
 32 |     final Map<String, List<MinstItem>> testSet = new HashMap<String, List<MinstItem>>();
 33 | 
 34 |     int rows = 0;
 35 |     int cols = 0;
 36 |     int count = 0;
 37 |     int current = 0;
 38 | 
 39 |     /**
 40 |      * Opens both files, checks their headers and fills the training and test sets.
 41 |      * The streams stay open afterwards so the remaining items can still be enumerated.
 42 |      *
 43 |      * @throws IOError if a file cannot be opened or read, or its header is not acceptable
 44 |      */
 45 |     public MinstDatasetReader(File labelsFile, File imagesFile)
 46 |     {
 47 |         DataInputStream labels = null;
 48 |         DataInputStream images = null;
 49 |         try
 50 |         {
 51 |             labels = openGzip(labelsFile);
 52 |             images = openGzip(imagesFile);
 53 |         }
 54 |         catch (IOException e)
 55 |         {
 56 |             closeQuietly(labels); // the image stream cannot have been opened at this point
 57 |             throw new IOError(e);
 58 |         }
 59 |         labelsBuf = labels;
 60 |         imagesBuf = images;
 61 | 
 62 |         boolean ready = false;
 63 |         try
 64 |         {
 65 |             verify();
 66 |             createTrainingSet();
 67 |             ready = true;
 68 |         }
 69 |         catch (IOException e)
 70 |         {
 71 |             throw new IOError(e);
 72 |         }
 73 |         finally
 74 |         {
 75 |             // A reader whose constructor failed is unreachable, so release the files here.
 76 |             if (!ready)
 77 |             {
 78 |                 closeQuietly(labelsBuf);
 79 |                 closeQuietly(imagesBuf);
 80 |             }
 81 |         }
 82 |     }
 83 | 
 84 |     /** Opens {@code file} for gzip decoding, releasing the file handle if that fails. */
 85 |     private static DataInputStream openGzip(File file) throws IOException
 86 |     {
 87 |         FileInputStream raw = new FileInputStream(file);
 88 |         try
 89 |         {
 90 |             return new DataInputStream(new GZIPInputStream(raw));
 91 |         }
 92 |         catch (IOException e)
 93 |         {
 94 |             closeQuietly(raw);
 95 |             throw e;
 96 |         }
 97 |     }
 98 | 
 99 |     /** Closes {@code stream} if it is non-null; a failure to close is deliberately ignored. */
100 |     private static void closeQuietly(java.io.Closeable stream)
101 |     {
102 |         if (stream == null)
103 |             return;
104 | 
105 |         try
106 |         {
107 |             stream.close();
108 |         }
109 |         catch (IOException ignored)
110 |         {
111 |             // nothing useful can be done about a failed close
112 |         }
113 |     }
114 | 
115 |     /** Releases both underlying files; no further items can be enumerated afterwards. */
116 |     public void close()
117 |     {
118 |         current = count;
119 |         closeQuietly(labelsBuf);
120 |         closeQuietly(imagesBuf);
121 |     }
122 | 
123 |     /**
124 |      * Reads items, sending each one to the test set when the random draw exceeds 0.3 and to
125 |      * the training set otherwise, until every label present in the training set has
126 |      * {@value #MIN_ITEMS_PER_LABEL} items or the input is exhausted.
127 |      */
128 |     public void createTrainingSet() {
129 |         boolean done = false;
130 | 
131 |         // Both conditions must hold: continuing after the last item would read past the
132 |         // end of the files.
133 |         while (!done && hasMoreElements()) {
134 |             MinstItem item = nextElement();
135 | 
136 |             Map<String, List<MinstItem>> target = r.nextDouble() > 0.3 ? testSet : trainingSet;
137 |             List<MinstItem> bucket = target.get(item.label);
138 |             if (bucket == null) {
139 |                 bucket = new ArrayList<MinstItem>();
140 |                 target.put(item.label, bucket);
141 |             }
142 |             bucket.add(item);
143 | 
144 |             done = trainingSetIsFull();
145 |         }
146 |     }
147 | 
148 |     /** Returns true when the training set is non-empty and none of its labels is short of items. */
149 |     private boolean trainingSetIsFull()
150 |     {
151 |         if (trainingSet.isEmpty())
152 |             return false;
153 | 
154 |         for (List<MinstItem> bucket : trainingSet.values()) {
155 |             if (bucket.size() < MIN_ITEMS_PER_LABEL)
156 |                 return false;
157 |         }
158 |         return true;
159 |     }
160 | 
161 |     /**
162 |      * Returns a random item with the given label from {@code set}.
163 |      *
164 |      * @throws IllegalStateException if the set holds no item with that label
165 |      */
166 |     private MinstItem pick(Map<String, List<MinstItem>> set, int label)
167 |     {
168 |         List<MinstItem> list = set.get(String.valueOf(label));
169 |         if (list == null || list.isEmpty())
170 |             throw new IllegalStateException("No items loaded for label " + label);
171 | 
172 |         return list.get(r.nextInt(list.size()));
173 |     }
174 | 
175 |     /** Returns a random test item whose label is drawn uniformly from 0-9. */
176 |     public MinstItem getTestItem()
177 |     {
178 |         return pick(testSet, r.nextInt(10));
179 |     }
180 | 
181 |     /** Returns a random training item whose label is drawn uniformly from 0-9. */
182 |     public MinstItem getTrainingItem()
183 |     {
184 |         return pick(trainingSet, r.nextInt(10));
185 |     }
186 | 
187 |     /** Returns a random training item labelled {@code i}. */
188 |     public MinstItem getTrainingItem(int i)
189 |     {
190 |         return pick(trainingSet, i);
191 |     }
192 | 
193 |     /**
194 |      * Reads and checks both file headers, then records the image dimensions and item count.
195 |      *
196 |      * @throws IOException if a magic number, a dimension or the two item counts are wrong
197 |      */
198 |     private void verify() throws IOException
199 |     {
200 |         int magic = labelsBuf.readInt();
201 |         int labelCount = labelsBuf.readInt();
202 | 
203 |         System.err.println("Labels magic=" + magic + ", count=" + labelCount);
204 | 
205 |         if (magic != LABELS_MAGIC)
206 |             throw new IOException("Not an IDX label file, magic=" + magic);
207 | 
208 |         magic = imagesBuf.readInt();
209 |         int imageCount = imagesBuf.readInt();
210 |         rows = imagesBuf.readInt();
211 |         cols = imagesBuf.readInt();
212 | 
213 |         System.err.println("Images magic=" + magic + " count=" + imageCount + " rows=" + rows + " cols=" + cols);
214 | 
215 |         if (magic != IMAGES_MAGIC)
216 |             throw new IOException("Not an IDX image file, magic=" + magic);
217 | 
218 |         if (labelCount != imageCount)
219 |             throw new IOException("Label Image count mismatch");
220 | 
221 |         // Negative sizes would otherwise fail later as a NegativeArraySizeException.
222 |         if (imageCount < 0 || rows <= 0 || cols <= 0)
223 |             throw new IOException("Invalid image header: count=" + imageCount + " rows=" + rows + " cols=" + cols);
224 | 
225 |         count = imageCount;
226 |     }
227 | 
228 |     /** Returns true while fewer items have been read than the header announced. */
229 |     public boolean hasMoreElements()
230 |     {
231 |         return current < count;
232 |     }
233 | 
234 |     /**
235 |      * Reads the next label and its image.
236 |      *
237 |      * @throws NoSuchElementException if every item has already been read
238 |      * @throws IOError if the underlying files cannot be read; enumeration ends in that case
239 |      */
240 |     public MinstItem nextElement()
241 |     {
242 |         if (!hasMoreElements())
243 |             throw new NoSuchElementException("All " + count + " items have been read");
244 | 
245 |         MinstItem m = new MinstItem();
246 | 
247 |         try
248 |         {
249 |             m.label = String.valueOf(labelsBuf.readUnsignedByte());
250 |             m.data = new int[rows * cols];
251 | 
252 |             for (int i = 0; i < m.data.length; i++)
253 |             {
254 |                 m.data[i] = imagesBuf.readUnsignedByte();
255 |             }
256 | 
257 |             current++;
258 |             return m;
259 |         }
260 |         catch (IOException e)
261 |         {
262 |             current = count; // the streams are out of step now, so stop enumerating
263 |             throw new IOError(e);
264 |         }
265 |     }
266 | }
171 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/StackedRBM.java:
--------------------------------------------------------------------------------
  1 | package com.github.tjake.rbm;
  2 | 
  3 | import sun.reflect.generics.reflectiveObjects.NotImplementedException;
  4 | 
  5 | import java.io.DataInput;
  6 | import java.io.DataOutput;
  7 | import java.io.IOException;
  8 | import java.util.ArrayList;
  9 | import java.util.Arrays;
 10 | import java.util.Iterator;
 11 | import java.util.List;
 12 | 
 13 | /**
 14 |  * A stack of {@link SimpleRBM}s: {@link #iterator(Layer)} pushes the input up through every
 15 |  * inner machine but the last and iterates on the last one. The stack is either declared
 16 |  * with {@link #addLayer} and created by {@link #build()}, or restored with {@link #load}.
 17 |  */
 18 | public class StackedRBM extends SimpleRBM {
 19 | 
 20 |     private LayerFactory layerFactory;
 21 |     private List<Integer> layerSizes;
 22 |     private List<Integer> customInputSizes;
 23 |     private List<Boolean> gaussianFlag;
 24 |     List<SimpleRBM> innerRBMs;
 25 | 
 26 | 
 27 |     public StackedRBM()
 28 |     {
 29 |         layerSizes = new ArrayList<Integer>();
 30 |         customInputSizes = new ArrayList<Integer>();
 31 |         gaussianFlag = new ArrayList<Boolean>();
 32 | 
 33 |         innerRBMs = new ArrayList<SimpleRBM>();
 34 |     }
 35 | 
 36 |     /** Sets the factory handed to every inner machine created by {@link #build()}. */
 37 |     public StackedRBM setLayerFactory(LayerFactory layerFactory)
 38 |     {
 39 |         this.layerFactory = layerFactory;
 40 |         return this;
 41 |     }
 42 | 
 43 |     /**
 44 |      * Declares the next layer of the stack.
 45 |      *
 46 |      * @param numUnits number of units in the layer
 47 |      * @param gaussian flag passed to the inner machine that takes this layer as its input
 48 |      * @throws RuntimeException if the inner machines already exist
 49 |      */
 50 |     public StackedRBM addLayer(int numUnits, boolean gaussian)
 51 |     {
 52 | 
 53 |         if (!innerRBMs.isEmpty())
 54 |             throw new RuntimeException("Can't add new layers after already built");
 55 | 
 56 |         layerSizes.add(numUnits);
 57 |         gaussianFlag.add(gaussian);
 58 |         return this;
 59 |     }
 60 | 
 61 |     /**
 62 |      * Overrides the input size of the machine whose hidden layer is the most recently
 63 |      * added layer.
 64 |      *
 65 |      * @throws IllegalStateException if no layer has been added yet
 66 |      */
 67 |     public StackedRBM withCustomInput(int numUnits)
 68 |     {
 69 |         if (layerSizes.isEmpty())
 70 |             throw new IllegalStateException("Add a layer before giving it a custom input size");
 71 | 
 72 |         // Pad with "no override" entries so the indexes line up with layerSizes.
 73 |         while (customInputSizes.size() < layerSizes.size())
 74 |             customInputSizes.add(null);
 75 | 
 76 |         customInputSizes.set(customInputSizes.size()-1,numUnits);
 77 | 
 78 |         return this;
 79 |     }
 80 | 
 81 |     /**
 82 |      * Creates one inner machine per pair of adjacent layers; does nothing if they exist already.
 83 |      *
 84 |      * @throws IllegalArgumentException if fewer than two layers were added
 85 |      */
 86 |     public StackedRBM build()
 87 |     {
 88 |         if (!innerRBMs.isEmpty())
 89 |             return this; //already built
 90 | 
 91 |         if (layerSizes.size() <= 1)
 92 |             throw new IllegalArgumentException("Requires at least two layers to build");
 93 | 
 94 | 
 95 |         for (int i=0; i < layerSizes.size()-1; i++)
 96 |         {
 97 |             int inputSize = layerSizes.get(i);
 98 | 
 99 |             // The override list may be shorter than layerSizes when only early layers were
100 |             // customised, so check the bound before looking at entry i+1.
101 |             if (i+1 < customInputSizes.size())
102 |             {
103 |                 Integer custom = customInputSizes.get(i+1);
104 |                 if (custom != null)
105 |                     inputSize = custom;
106 |             }
107 | 
108 |             innerRBMs.add(new SimpleRBM(inputSize, layerSizes.get(i+1), gaussianFlag.get(i), layerFactory));
109 | 
110 |             System.err.println("Added RBM "+inputSize+ " -> "+layerSizes.get(i+1));
111 |         }
112 | 
113 |         return this;
114 |     }
115 | 
116 |     public Layer activateHidden(Layer visible, Layer bias) {
117 |         throw new NotImplementedException();
118 |     }
119 | 
120 |     public Layer activateVisible(Layer hidden, Layer bias) {
121 |         throw new NotImplementedException();
122 |     }
123 | 
124 |     /**
125 |      * Propagates {@code visible} through the hidden activations of all inner machines but the
126 |      * last, then returns the last machine's iterator over the result. The tuple factory is
127 |      * created from the original, unpropagated layer.
128 |      *
129 |      * @throws AssertionError if the stack holds no inner machines
130 |      */
131 |     public Iterator<Tuple> iterator(Layer visible) {
132 |         Layer input = visible;
133 | 
134 |         int stackNum = innerRBMs.size();
135 | 
136 |         for (int i=0; i < stackNum; i++)
137 |         {
138 |             SimpleRBM iRBM = innerRBMs.get(i);
139 | 
140 |             if (i == (stackNum-1))
141 |             {
142 |                 return iRBM.iterator(visible,new Tuple.Factory(input));
143 |             }
144 | 
145 |             visible = iRBM.activateHidden(visible,null);
146 |         }
147 | 
148 |         throw new AssertionError("code bug");
149 |     }
150 | 
151 |     @Override
152 |     public Iterator<Tuple> reverseIterator(Layer visible) {
153 |         throw new NotImplementedException();
154 |     }
155 | 
156 |     @Override
157 |     public Iterator<Tuple> iterator(Layer visible, Tuple.Factory tfactory) {
158 |         throw new NotImplementedException();
159 |     }
160 | 
161 |     @Override
162 |     public Iterator<Tuple> reverseIterator(Layer visible, Tuple.Factory tfactory) {
163 |         throw new NotImplementedException();
164 |     }
165 | 
166 |     /** Writes the magic bytes, the number of inner machines and then each machine in order. */
167 |     @Override
168 |     public void save(DataOutput dataOutput) throws IOException {
169 | 
170 |         dataOutput.write(LayerFactory.MAGIC);
171 | 
172 |         dataOutput.writeInt(innerRBMs.size());
173 | 
174 |         for(SimpleRBM rbm : innerRBMs)
175 |             rbm.save(dataOutput);
176 |     }
177 | 
178 |     /**
179 |      * Replaces the inner machines with those read from {@code dataInput}. If reading fails
180 |      * the machines held before the call are left untouched.
181 |      *
182 |      * @throws IOException if the data is not in the expected format or cannot be read
183 |      */
184 |     @Override
185 |     public void load(DataInput dataInput, LayerFactory layerFactory) throws IOException {
186 | 
187 |         this.layerFactory = layerFactory;
188 | 
189 |         byte[] magic = new byte[4];
190 |         dataInput.readFully(magic);
191 | 
192 |         if (!Arrays.equals(LayerFactory.MAGIC, magic))
193 |             throw new IOException("Bad File Format");
194 | 
195 |         int numInner = dataInput.readInt();
196 | 
197 |         if (numInner < 0)
198 |             throw new IOException("Bad File Format");
199 | 
200 |         // Read into a scratch list first: a truncated file must not leave half a stack
201 |         // behind, and a second load must not append to the first.
202 |         List<SimpleRBM> loadedRBMs = new ArrayList<SimpleRBM>();
203 | 
204 |         for (int i=0; i<numInner; i++)
205 |         {
206 |             System.err.println("Loading rbm "+i);
207 | 
208 |             SimpleRBM loaded = new SimpleRBM();
209 |             loaded.load(dataInput, layerFactory);
210 |             loadedRBMs.add(loaded);
211 |         }
212 | 
213 |         innerRBMs.clear();
214 |         innerRBMs.addAll(loadedRBMs);
215 |     }
216 | 
217 |     public List<SimpleRBM> getInnerRBMs() {
218 |         return innerRBMs;
219 |     }
220 | 
221 |     /** Returns the sum of the free energies of all inner machines. */
222 |     @Override
223 |     public float freeEnergy() {
224 |         float energy = 0.0f;
225 | 
226 |         for(SimpleRBM rbm : innerRBMs)
227 |             energy += rbm.freeEnergy();
228 | 
229 |         return energy;
230 |     }
231 | }
176 | 


--------------------------------------------------------------------------------
/pom.xml:
--------------------------------------------------------------------------------
  1 | <?xml version="1.0" encoding="UTF-8"?>
  2 | <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
  3 |     <modelVersion>4.0.0</modelVersion>
  4 | 
  5 |     <groupId>com.github.tjake</groupId>
  6 |     <artifactId>rbm-dbn-mnist</artifactId>
  7 |     <version>0.0.1</version>
  8 |     <name>Restricted Boltzmann Machine and Deep Belief Network</name>
  9 | 
 10 |     <repositories>
 11 | 
 12 |     </repositories>
 13 | 
 14 |     <dependencies>
 15 |       
 16 |     </dependencies>
 17 | 
 18 |     <properties> 
 19 |         <skip.minst>false</skip.minst> <!-- passed as <skip> to both wagon download executions below -->
 20 |     </properties>
 21 | 
 22 |     <build>
 23 |         <plugins>
 24 |             <plugin>
 25 |                 <groupId>org.apache.maven.plugins</groupId>
 26 |                 <artifactId>maven-compiler-plugin</artifactId>
 27 |                 <version>2.3.2</version>
 28 |                 <configuration>
 29 |                     <source>1.6</source>
 30 |                     <target>1.6</target>
 31 |                     <encoding>UTF-8</encoding>
 32 |                 </configuration>
 33 |             </plugin>
 34 |             <plugin>
 35 |                 <groupId>org.apache.maven.plugins</groupId>
 36 |                 <artifactId>maven-source-plugin</artifactId>
 37 |                 <version>2.1.2</version>
 38 |                 <executions>
 39 |                     <execution>
 40 |                         <id>attach-sources</id>
 41 |                         <goals>
 42 |                             <goal>jar</goal>
 43 |                         </goals>
 44 |                     </execution>
 45 |                 </executions>
 46 |             </plugin>
 47 |             <plugin>
 48 |                 <groupId>org.apache.maven.plugins</groupId>
 49 |                 <artifactId>maven-resources-plugin</artifactId>
 50 |                 <version>2.5</version>
 51 |                 <configuration>
 52 |                     <outputDirectory />
 53 |                     <encoding>UTF-8</encoding>
 54 |                 </configuration>
 55 |             </plugin>
 56 |             <plugin>
 57 |                 <groupId>org.codehaus.mojo</groupId>
 58 |                 <artifactId>wagon-maven-plugin</artifactId>
 59 |                 <version>1.0-beta-4</version>
 60 |                 <executions>
 61 |                     <execution>
 62 |                         <id>download-minst-images</id>
 63 |                         <phase>prepare-package</phase>
 64 |                         <goals>
 65 |                             <goal>download-single</goal>
 66 |                         </goals>
 67 |                         <configuration>
 68 |                             <skip>${skip.minst}</skip>
 69 |                             <url>http://yann.lecun.com</url>
 70 |                             <fromFile>exdb/mnist/train-images-idx3-ubyte.gz</fromFile>
 71 |                             <toDir>${project.build.directory}/minst</toDir>
 72 |                         </configuration>
 73 |                     </execution>
 74 |                     <execution>
 75 |                         <id>download-mist-labels</id>
 76 |                         <phase>prepare-package</phase>
 77 |                         <goals>
 78 |                             <goal>download-single</goal>
 79 |                         </goals>
 80 |                         <configuration>
 81 |                             <skip>${skip.minst}</skip>
 82 |                             <url>http://yann.lecun.com</url>
 83 |                             <fromFile>exdb/mnist/train-labels-idx1-ubyte.gz</fromFile>
 84 |                             <toDir>${project.build.directory}/minst</toDir>
 85 |                         </configuration>
 86 |                     </execution>
 87 |                 </executions>
 88 |             </plugin>
 89 |             <plugin>
 90 |                 <groupId>org.apache.maven.plugins</groupId>
 91 |                 <artifactId>maven-shade-plugin</artifactId>
 92 |                 <version>1.6</version>
 93 |                 <configuration>
 94 |                     <createDependencyReducedPom>true</createDependencyReducedPom>
 95 |                     <filters>
 96 |                         <filter>
 97 |                             <artifact>*:*</artifact>
 98 |                             <excludes>
 99 |                                 <exclude>META-INF/*.SF</exclude>
100 |                                 <exclude>META-INF/*.DSA</exclude>
101 |                                 <exclude>META-INF/*.RSA</exclude>
102 |                             </excludes>
103 |                         </filter>
104 |                     </filters>
105 |                 </configuration>
106 |                 <executions>
107 |                     <execution>
108 |                         <phase>package</phase>
109 |                         <goals>
110 |                             <goal>shade</goal>
111 |                         </goals>
112 |                         <configuration>
113 |                             <transformers>
114 |                                 <transformer implementation="org.apache.maven.plugins.shade.resource.ServicesResourceTransformer" />
115 |                                 <transformer implementation="org.apache.maven.plugins.shade.resource.ManifestResourceTransformer">
116 |                                     <mainClass>com.github.tjake.rbm.minst.Demo</mainClass>
117 |                                 </transformer>
118 |                             </transformers>
119 |                         </configuration>
120 |                     </execution>
121 |                 </executions>
122 |             </plugin>
123 |             <plugin>
124 |                 <groupId>org.apache.maven.plugins</groupId>
125 |                 <artifactId>maven-deploy-plugin</artifactId>
126 |                 <version>2.7</version>
127 |                 <configuration>
128 |                     <skip>true</skip>
129 |                 </configuration>
130 |             </plugin>
131 |             <plugin>
132 |                 <groupId>org.apache.maven.plugins</groupId>
133 |                 <artifactId>maven-site-plugin</artifactId>
134 |                 <version>3.0</version>
135 |                 <configuration>
136 |                     <skip>true</skip>
137 |                     <skipDeploy>true</skipDeploy>
138 |                 </configuration>
139 |             </plugin>
140 |         </plugins>
141 |     </build>
142 | </project>
143 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/minst/BinaryMinstDBN.java:
--------------------------------------------------------------------------------
  1 | package com.github.tjake.rbm.minst;
  2 | 
  3 | 
  4 | import com.github.tjake.rbm.*;
  5 | 
  6 | import java.io.*;
  7 | import java.util.ArrayList;
  8 | import java.util.Iterator;
  9 | import java.util.List;
 10 | 
 11 | /**
 12 |  * Demo that trains a {@link StackedRBM} on MNIST digits, or restores a saved one, and then
 13 |  * classifies random test items in an endless loop while printing a running error rate.
 14 |  */
 15 | public class BinaryMinstDBN {
 16 |     /** Number of tuples taken from the iterator when classifying one item. */
 17 |     private static final int SAMPLES = 2;
 18 |     /** Number of trailing visible units that are read back as label scores. */
 19 |     private static final int LABELS = 10;
 20 | 
 21 |     static MinstDatasetReader dr;
 22 |     StackedRBM rbm;
 23 |     final StackedRBMTrainer trainer;
 24 |     final LayerFactory layerFactory = new LayerFactory();
 25 | 
 26 |     public BinaryMinstDBN(File labels, File images) {
 27 |         dr = new MinstDatasetReader(labels, images);
 28 | 
 29 |         rbm = new StackedRBM();
 30 |         trainer = new StackedRBMTrainer(rbm, 0.5f, 0.001f, 0.2f, 0.2f, layerFactory);
 31 |     }
 32 | 
 33 |     /**
 34 |      * Runs {@code iterations} training steps, each on a fresh batch of 30 random training items.
 35 |      *
 36 |      * @param addLabels whether a one-hot label layer accompanies every item of the batch
 37 |      * @param stopAt    passed through to the trainer unchanged
 38 |      */
 39 |     void learn(int iterations, boolean addLabels, int stopAt) {
 40 | 
 41 |         for (int p = 0; p < iterations; p++) {
 42 | 
 43 |             // Get random input
 44 |             List<Layer> inputBatch = new ArrayList<Layer>();
 45 |             List<Layer> labelBatch = addLabels ? new ArrayList<Layer>() : null;
 46 | 
 47 |             for (int j = 0; j < 30; j++) {
 48 |                 MinstItem trainItem = dr.getTrainingItem();
 49 |                 Layer input = layerFactory.create(trainItem.data.length);
 50 | 
 51 |                 for (int i = 0; i < trainItem.data.length; i++)
 52 |                     input.set(i, trainItem.data[i]);
 53 | 
 54 |                 inputBatch.add(new BinaryLayer(input));
 55 | 
 56 |                 if (addLabels) {
 57 |                     float[] labelInput = new float[LABELS];
 58 |                     labelInput[Integer.parseInt(trainItem.label)] = 1.0f;
 59 |                     labelBatch.add(layerFactory.create(labelInput));
 60 |                 }
 61 |             }
 62 | 
 63 |             double error = trainer.learn(inputBatch, labelBatch, stopAt);
 64 | 
 65 |             if (p % 100 == 0)
 66 |                 System.err.println("Iteration " + p + ", Error = " + error+", Energy = "+rbm.freeEnergy());
 67 |         }
 68 |     }
 69 | 
 70 |     /**
 71 |      * Pushes {@code test} up through the stack and returns the top machine's iterator.
 72 |      * Whenever a machine expects more visible units than the current layer has, the extra
 73 |      * units are filled with 0.1.
 74 |      *
 75 |      * @throws IllegalStateException if the stack holds no machines
 76 |      */
 77 |     Iterator<Tuple> evaluate(MinstItem test) {
 78 | 
 79 |         Layer input = layerFactory.create(test.data.length);
 80 | 
 81 |         for (int i = 0; i < test.data.length; i++)
 82 |             input.set(i, test.data[i]);
 83 | 
 84 |         input = new BinaryLayer(input);
 85 | 
 86 |         int stackNum = rbm.getInnerRBMs().size();
 87 | 
 88 |         for (int i = 0; i < stackNum; i++) {
 89 | 
 90 |             SimpleRBM iRBM = rbm.getInnerRBMs().get(i);
 91 | 
 92 |             if (iRBM.biasVisible.size() > input.size()) {
 93 |                 Layer newInput = new Layer(iRBM.biasVisible.size());
 94 | 
 95 |                 System.arraycopy(input.get(), 0, newInput.get(), 0, input.size());
 96 |                 for (int j = input.size(); j < newInput.size(); j++)
 97 |                     newInput.set(j, 0.1f);
 98 | 
 99 |                 input = newInput;
100 |             }
101 | 
102 |             if (i == (stackNum - 1)) {
103 |                 return iRBM.iterator(input);
104 |             }
105 | 
106 |             input = iRBM.activateHidden(input, null);
107 |         }
108 | 
109 |         throw new IllegalStateException("The network has no layers to evaluate with");
110 |     }
111 | 
112 |     /** Tries to restore the network from {@code saveto}; returns whether that succeeded. */
113 |     private static boolean loadState(BinaryMinstDBN m, File saveto) {
114 |         if (!saveto.exists())
115 |             return false;
116 | 
117 |         try {
118 |             DataInputStream input = new DataInputStream(new BufferedInputStream(new FileInputStream(saveto)));
119 |             try {
120 |                 m.rbm.load(input, m.layerFactory);
121 |             } finally {
122 |                 input.close();
123 |             }
124 |             return true;
125 |         } catch (IOException e) {
126 |             e.printStackTrace();
127 |             // Drop anything read before the failure, otherwise no layers can be added
128 |             // for the training run that follows.
129 |             m.rbm.getInnerRBMs().clear();
130 |             return false;
131 |         }
132 |     }
133 | 
134 |     /** Writes the network to {@code saveto}; a failure is reported but does not stop the demo. */
135 |     private static void saveState(BinaryMinstDBN m, File saveto) {
136 |         try {
137 |             DataOutputStream out = new DataOutputStream(new BufferedOutputStream(new FileOutputStream(saveto)));
138 |             try {
139 |                 m.rbm.save(out);
140 |                 out.flush();
141 |             } finally {
142 |                 out.close();
143 |             }
144 |         } catch (IOException e) {
145 |             e.printStackTrace();
146 |         }
147 |     }
148 | 
149 |     /**
150 |      * Restores the network from {@code saveto} or trains and saves a new one, then classifies
151 |      * random test items forever. This method does not return.
152 |      */
153 |     public static void start(File labels, File images, File saveto) {
154 | 
155 |         BinaryMinstDBN m = new BinaryMinstDBN(labels,images);
156 | 
157 |         if (!loadState(m, saveto)) {
158 |             int numIterations = 1000;
159 | 
160 |             m.rbm.setLayerFactory(m.layerFactory).addLayer(dr.rows * dr.cols, false).addLayer(500, false).addLayer(500, false).addLayer(2000, false).withCustomInput(510).build();
161 | 
162 |             System.err.println("Training level 1");
163 |             m.learn(numIterations, false, 1);
164 |             System.err.println("Training level 2");
165 |             m.learn(numIterations, false, 2);
166 |             System.err.println("Training level 3");
167 |             m.learn(numIterations, true, 3);
168 | 
169 |             saveState(m, saveto);
170 |         }
171 | 
172 |         double numCorrect = 0;
173 |         double numWrong = 0;
174 |         double numAlmost = 0.0;
175 | 
176 |         while (true) {
177 |             MinstItem testCase = dr.getTestItem();
178 |             int expected = Integer.parseInt(testCase.label);
179 | 
180 |             Iterator<Tuple> it = m.evaluate(testCase);
181 | 
182 |             // Sum the trailing label units of the visible layer over a few samples.
183 |             float[] labeld = new float[LABELS];
184 | 
185 |             for (int i = 0; i < SAMPLES; i++) {
186 |                 Tuple t = it.next();
187 | 
188 |                 for (int j = (t.visible.size() - LABELS), k = 0; j < t.visible.size() && k < LABELS; j++, k++) {
189 |                     labeld[k] += t.visible.get(j);
190 |                 }
191 |             }
192 | 
193 |             float max1 = 0.0f;
194 |             float max2 = 0.0f;
195 |             int p1 = -1;
196 |             int p2 = -1;
197 | 
198 |             System.err.print("Label is: " + testCase.label);
199 | 
200 |             for (int i = 0; i < labeld.length; i++) {
201 |                 labeld[i] /= SAMPLES;
202 |                 if (labeld[i] > max1) {
203 |                     max2 = max1;
204 |                     max1 = labeld[i];
205 | 
206 |                     p2 = p1;
207 |                     p1 = i;
208 |                 } else if (labeld[i] > max2) {
209 |                     // A value between the two best so far replaces only the runner-up.
210 |                     max2 = labeld[i];
211 |                     p2 = i;
212 |                 }
213 |             }
214 | 
215 |             System.err.print(", Winner is " + p1 + "(" + max1 + ") second is " + p2 + "(" + max2 + ")");
216 |             if (p1 == expected) {
217 |                 System.err.println(" CORRECT!");
218 |                 numCorrect++;
219 | 
220 |             } else if (p2 == expected) {
221 |                 System.err.println(" Almost!");
222 |                 numAlmost++;
223 |             } else {
224 |                 System.err.println(" wrong :(");
225 |                 numWrong++;
226 |             }
227 | 
228 |             System.err.println("Error Rate = " + ((numWrong / (numAlmost + numCorrect + numWrong)) * 100));
229 | 
230 |         }
231 |     }
232 | }
189 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/minst/BinaryMinstRBM.java:
--------------------------------------------------------------------------------
  1 | package com.github.tjake.rbm.minst;
  2 | 
  3 | import com.github.tjake.rbm.*;
  4 | 
  5 | import javax.swing.*;
  6 | import java.awt.*;
  7 | import java.awt.image.BufferedImage;
  8 | import java.awt.image.WritableRaster;
  9 | import java.io.File;
 10 | import java.util.ArrayList;
 11 | import java.util.Iterator;
 12 | import java.util.List;
 13 | 
 14 | public class BinaryMinstRBM extends Canvas {
 15 |     static int border = 10; // 10px
 16 | 
 17 |     MinstDatasetReader dr;
 18 | 
 19 |     static int count = 0;
 20 | 
 21 |     final SimpleRBM rbm;
 22 |     final LayerFactory layerFactory = new LayerFactory();
 23 | 
 24 |     MinstItem trainItem = null;
 25 |     List<int[]> outputs = new ArrayList<int[]>();
 26 | 
 27 |     final SimpleRBMTrainer trainer;
 28 | 
 29 |     public BinaryMinstRBM(File labels, File images) {
 30 | 
 31 |         dr = new MinstDatasetReader(labels, images);
 32 | 
 33 |         rbm = new SimpleRBM(dr.cols * dr.rows, 10 * 10, false, layerFactory);
 34 |         trainer = new SimpleRBMTrainer(0.2f, 0.001f, 0.2f, 0.1f, layerFactory);
 35 |     }
 36 | 
 37 |     float[] learn() {
 38 |         // Get random input
 39 |         List<Layer> inputBatch = new ArrayList<Layer>();
 40 | 
 41 |         for (int j = 0; j < 30; j++) {
 42 |             trainItem = dr.getTrainingItem();
 43 |             Layer input = layerFactory.create(trainItem.data.length);
 44 | 
 45 |             for (int i = 0; i < trainItem.data.length; i++)
 46 |                 input.set(i, trainItem.data[i]);
 47 | 
 48 |             inputBatch.add(new BinaryLayer(input));
 49 |         }
 50 | 
 51 |         double error = trainer.learn(rbm, inputBatch, false); //up down
 52 | 
 53 | 
 54 |         if (count % 100 == 0)
 55 |             System.err.println("Error = " + error + ", Energy = " + rbm.freeEnergy());
 56 | 
 57 |         return inputBatch.get(inputBatch.size() - 1).get();
 58 |     }
 59 | 
 60 |     Iterator<Tuple> evaluate() {
 61 | 
 62 | 
 63 |         MinstItem test = dr.getTestItem();
 64 | 
 65 |         Layer input = layerFactory.create(test.data.length);
 66 | 
 67 |         for (int i = 0; i < trainItem.data.length; i++)
 68 |             input.set(i, trainItem.data[i]);
 69 | 
 70 |         return rbm.iterator(new BinaryLayer(input));
 71 |     }
 72 | 
 73 |     public void update() {
 74 |         learn();
 75 |         Iterator<Tuple> it = evaluate();
 76 | 
 77 |         synchronized (outputs) {
 78 |             outputs.clear();
 79 |             for (int j = 0; j < 10; j++) {
 80 |                 Tuple t = it.next();
 81 |                 int[] output = new int[t.visible.size()];
 82 |                 float[] visible = BinaryLayer.fromBinary(t.visible);
 83 | 
 84 |                 for (int i = 0; i < visible.length; i++) {
 85 |                     output[i] = Math.round(visible[i]);
 86 |                 }
 87 | 
 88 |                 outputs.add(output);
 89 |             }
 90 |         }
 91 |         repaint();
 92 |     }
 93 | 
 94 |     public void paint(Graphics g) {
 95 | 
 96 |         BufferedImage in = new BufferedImage(dr.cols, dr.rows, BufferedImage.TYPE_INT_RGB);
 97 | 
 98 |         if (trainItem == null)
 99 |             return;
100 | 
101 |         WritableRaster r = in.getRaster();
102 |         r.setDataElements(0, 0, dr.cols, dr.rows, trainItem.data);
103 |         g.drawImage(in, border, border, null);
104 | 
105 |         int offset = border;
106 |         synchronized (outputs) {
107 |             for (int[] output : outputs) {
108 |                 BufferedImage out = new BufferedImage(dr.cols, dr.rows, BufferedImage.TYPE_INT_RGB);
109 | 
110 | 
111 |                 r = out.getRaster();
112 |                 r.setDataElements(0, 0, dr.cols, dr.rows, output);
113 | 
114 |                 //Resize
115 |                 BufferedImage newImage = new BufferedImage(56, 56, BufferedImage.TYPE_INT_RGB);
116 | 
117 |                 Graphics2D g2 = newImage.createGraphics();
118 |                 try {
119 |                     g2.setRenderingHint(RenderingHints.KEY_INTERPOLATION,
120 |                             RenderingHints.VALUE_INTERPOLATION_BICUBIC);
121 |                     g2.clearRect(0, 0, 56, 56);
122 |                     g2.drawImage(out, 0, 0, 56, 56, null);
123 |                 } finally {
124 |                     g2.dispose();
125 |                 }
126 |                 g.drawImage(newImage, border * 2 + 28, offset, null);
127 | 
128 |                 offset += border + dr.rows * 2;
129 |             }
130 | 
131 |             int buf = 28 + border + border;
132 |             for (int i = 0; i < rbm.weights.length; i++) {
133 |                 if (i % 10 == 0) {
134 |                     offset = border;
135 |                     buf += border + 56;
136 |                 }
137 | 
138 |                 int[] start = new int[dr.cols * dr.rows];
139 |                 for (int j = 0; j < start.length; j++)
140 |                     start[j] = rbm.weights[i].get(j) > 0 ? (Math.round(rbm.weights[i].get(j) * 255)) << 8 : ((Math.round(Math.abs(rbm.weights[i].get(j)) * 255)) << 16);
141 | 
142 |                 BufferedImage out = new BufferedImage(dr.cols, dr.rows, BufferedImage.TYPE_INT_RGB);
143 | 
144 |                 r = out.getRaster();
145 |                 r.setDataElements(0, 0, dr.cols, dr.rows, start);
146 | 
147 |                 //Resize
148 |                 BufferedImage newImage = new BufferedImage(56, 56, BufferedImage.TYPE_INT_RGB);
149 | 
150 |                 Graphics2D g2 = newImage.createGraphics();
151 |                 try {
152 |                     g2.setRenderingHint(RenderingHints.KEY_INTERPOLATION,
153 |                             RenderingHints.VALUE_INTERPOLATION_BICUBIC);
154 |                     g2.clearRect(0, 0, 56, 56);
155 |                     g2.drawImage(out, 0, 0, 56, 56, null);
156 |                 } finally {
157 |                     g2.dispose();
158 |                 }
159 |                 g.drawImage(newImage, buf, offset, null);
160 | 
161 |                 offset += border + dr.rows * 2;
162 |             }
163 |         }
164 |     }
165 | 
166 |     /**
167 |      * Shows a "MINST Draw" frame containing a new {@link BinaryMinstRBM} and then calls its
168 |      * {@code update()} in an endless loop; once the class-level {@code count} has passed
169 |      * 1000, each round ends with a 2000 ms sleep. Returns only if that sleep is interrupted.
170 |      * @param labels first constructor argument of the {@link BinaryMinstRBM}
171 |      * @param images second constructor argument of the {@link BinaryMinstRBM}
172 |      */
173 |     public static void start(File labels, File images) {
174 |         JFrame frame = new JFrame("MINST Draw");
175 |         frame.setDefaultCloseOperation(JFrame.EXIT_ON_CLOSE);
176 |         frame.setSize(800, 600);
177 |         BinaryMinstRBM cnvs = new BinaryMinstRBM(labels, images);
178 |         cnvs.setSize(1024, 768);
179 |         frame.add(cnvs);
180 |         frame.pack();
181 |         frame.setLocationRelativeTo(null);
182 |         frame.setVisible(true);
183 |         while (true) {
184 |             cnvs.update();
185 |             try {
186 |                 if (++count > 1000)
187 |                     Thread.sleep(2000);
188 |             } catch (InterruptedException e) {
189 |                 Thread.currentThread().interrupt(); // keep the interrupt visible to the caller
190 |                 return; // stop refreshing instead of ignoring the request
191 |             }
192 |         }
193 |     }
194 | }
195 | 


--------------------------------------------------------------------------------
/src/main/java/com/github/tjake/rbm/SimpleRBM.java:
--------------------------------------------------------------------------------
  1 | package com.github.tjake.rbm;
  2 | 
  3 | import com.github.tjake.util.Utilities;
  4 | 
  5 | import java.io.DataInput;
  6 | import java.io.DataOutput;
  7 | import java.io.IOException;
  8 | import java.util.Arrays;
  9 | import java.util.Iterator;
 10 | import java.util.Random;
 11 | 
 12 | public class SimpleRBM
 13 | {
 14 |     // biases and weights
 15 |     public Layer biasVisible;
 16 |     public Layer biasHidden;
 17 |     public Layer[] weights;
 18 | 
 19 |     public LayerFactory lfactory;
 20 | 
 21 |     Random rand;
 22 |     static Long randomSeed;
 23 | 
 24 |     protected float scale = 0.001f;
 25 |     boolean gaussianVisibles = false;
 26 | 
 27 |     public static void setRandomSeed(long seed)
 28 |     {
 29 |          randomSeed = seed;
 30 |     }
 31 | 
 32 |     public SimpleRBM()
 33 |     {
 34 |     }
 35 | 
 36 |     public SimpleRBM(int numVisible, int numHidden, boolean gaussianVisibles, LayerFactory lfactory)
 37 |     {
 38 |         rand = new Random();
 39 |         if (randomSeed != null)
 40 |             rand.setSeed(randomSeed);
 41 | 
 42 |         this.lfactory = lfactory;
 43 | 
 44 |         this.gaussianVisibles = gaussianVisibles;
 45 | 
 46 |         // initialize nodes
 47 |         biasVisible = lfactory.create(numVisible);
 48 | 
 49 |         for (int i = 0; i < numVisible; i++)
 50 |             biasVisible.set(i, new Float(scale * rand.nextGaussian()));
 51 | 
 52 |         biasHidden = lfactory.create(numHidden);
 53 |         for (int i = 0; i < numHidden; i++)
 54 |             biasHidden.set(i, new Float(scale * rand.nextGaussian()));
 55 | 
 56 |         // initialize weights and weight change matrices
 57 |         weights = new Layer[numHidden];
 58 | 
 59 |         // randomly initialize weights
 60 |         for (int i = 0; i < numHidden; i++) {
 61 |             weights[i] = lfactory.create(numVisible);
 62 |             for (int j = 0; j < numVisible; j++)
 63 |                 weights[i].set(j, new Float(2 * scale * rand.nextGaussian()));
 64 |         }
 65 |     }
 66 | 
 67 | 
 68 |     public void save(DataOutput dataOutput) throws IOException {
 69 |         dataOutput.write(LayerFactory.MAGIC);
 70 | 
 71 |         dataOutput.writeBoolean(gaussianVisibles);
 72 |         lfactory.save(biasVisible, dataOutput);
 73 |         lfactory.save(biasHidden, dataOutput);
 74 | 
 75 |         for (int i=0; i<weights.length; i++)
 76 |             lfactory.save(weights[i],dataOutput);
 77 |     }
 78 | 
 79 |     public void load(DataInput dataInput, LayerFactory lfactory) throws IOException {
 80 | 
 81 |         this.lfactory = lfactory;
 82 | 
 83 |         byte[] magic = new byte[4];
 84 |         dataInput.readFully(magic);
 85 | 
 86 |         if (!Arrays.equals(LayerFactory.MAGIC, magic))
 87 |             throw new IOException("Bad File Format");
 88 | 
 89 |         gaussianVisibles = dataInput.readBoolean();
 90 | 
 91 |         biasVisible = lfactory.load(dataInput);
 92 |         biasHidden = lfactory.load(dataInput);
 93 |         weights = new Layer[biasHidden.size()];
 94 | 
 95 |         for (int i=0; i<weights.length; i++)
 96 |             weights[i] = lfactory.load(dataInput);
 97 |     }
 98 | 
 99 |     // Given visible data, return the expected hidden unit values.
100 |     public Layer activateHidden(final Layer visible, final Layer bias)
101 |     {
102 |         Layer workingHidden = lfactory.create(biasHidden.size());
103 | 
104 |         if (visible.size() != biasVisible.size())
105 |             throw new IllegalArgumentException("Mismatched input "+visible.size()+" != "+biasVisible.size());
106 | 
107 | 
108 |         if (bias != null && workingHidden.size() != bias.size() && bias.size() > 1)
109 |             throw new AssertionError("bias must be 0,1 or hidden length");
110 | 
111 | 
112 |         // dot product of weights and visible
113 |         for (int i = 0; i < weights.length; i++)
114 |             for (int k = 0; k < visible.size(); k++)
115 |                 workingHidden.add(i, weights[i].get(k) * visible.get(k));
116 | 
117 |         //Add hidden bias
118 |         for (int i = 0; i < workingHidden.size(); i++) {
119 |             float inputBias = 0.0f;
120 | 
121 |             if (bias != null && bias.size() != 0)
122 |                 inputBias = bias.size() == 1 ? bias.get(0) : bias.get(i);
123 | 
124 |             workingHidden.set(i, Utilities.sigmoid(workingHidden.get(i) + biasHidden.get(i) + inputBias));
125 |         }
126 | 
127 |         return workingHidden;
128 |     }
129 | 
130 |     // Given hidden states, return the expected visible unit values.
131 |     public Layer activateVisible(final Layer hidden, final Layer bias)
132 |     {
133 |         Layer workingVisible =  lfactory.create(biasVisible.size());
134 | 
135 |         if (bias != null && workingVisible.size() != bias.size() && bias.size() > 1)
136 |             throw new AssertionError("bias must be 0,1 or visible length");
137 | 
138 |         // dot product of weights and hidden
139 |         for (int k = 0; k < weights.length; k++)
140 |             for (int i = 0; i < workingVisible.size(); i++)
141 |                 workingVisible.add(i, weights[k].get(i) * hidden.get(k));
142 | 
143 |         //Add visible bias
144 |         for (int i = 0; i < workingVisible.size(); i++)
145 |         {
146 |             workingVisible.add(i, biasVisible.get(i));
147 | 
148 |             //Add input bias (if any)
149 |             if (bias != null && bias.size() != 0)
150 |                 workingVisible.add(i, bias.size() == 1 ? bias.get(0) : bias.get(i));
151 | 
152 |             if (!gaussianVisibles)
153 |                 workingVisible.set(i, Utilities.sigmoid(workingVisible.get(i)));
154 |         }
155 | 
156 |         return workingVisible;
157 |     }
158 | 
159 |     public Iterator<Tuple> iterator(Layer visible) {
160 |         return iterator(visible, new Tuple.Factory(visible));
161 |     }
162 | 
163 |     public Iterator<Tuple> reverseIterator(Layer visible) {
164 |         return reverseIterator(visible, new Tuple.Factory(visible));
165 |     }
166 | 
167 |     public Iterator<Tuple> iterator(final Layer visible, final Tuple.Factory tfactory)
168 |     {
169 |         return new Iterator<Tuple>()
170 |         {
171 |             Layer v = visible;
172 |             Layer h = activateHidden(v,null);
173 | 
174 |             public boolean hasNext()
175 |             {
176 |                 return true;
177 |             }
178 | 
179 |             public Tuple next()
180 |             {
181 |                 Tuple t = tfactory.create(v, h);
182 | 
183 |                 // Next updown
184 |                 v = activateVisible(Utilities.bernoulli(h),null);
185 |                 h = activateHidden(v,null);
186 | 
187 |                 return t;
188 |             }
189 | 
190 |             public void remove()
191 |             {
192 | 
193 |             }
194 |         };
195 |     }
196 | 
197 |     public Iterator<Tuple> reverseIterator(final Layer hidden, final Tuple.Factory tfactory)
198 |     {
199 |         return new Iterator<Tuple>()
200 |         {
201 |             Layer v = activateVisible(Utilities.bernoulli(hidden),null);
202 |             Layer h = hidden;
203 | 
204 | 
205 |             public boolean hasNext()
206 |             {
207 |                 return true;
208 |             }
209 | 
210 |             public Tuple next()
211 |             {
212 |                 Tuple t = tfactory.create(v, h);
213 | 
214 |                 // Next downup
215 |                 v = activateVisible(Utilities.bernoulli(h),null);
216 |                 h = activateHidden(v,null);
217 | 
218 |                 return t;
219 |             }
220 | 
221 |             public void remove()
222 |             {
223 | 
224 |             }
225 |         };
226 |     }
227 | 
228 |     public float freeEnergy()
229 |     {
230 |         float energy = 0.0f;
231 | 
232 |         for (int j=0; j< biasHidden.size(); j++)
233 |             for (int i=0; i< biasVisible.size(); i++)
234 |                 energy -= biasVisible.get(i) * biasHidden.get(j) * weights[j].get(i);
235 | 
236 |         return energy;
237 |     }
238 | 
239 | }


--------------------------------------------------------------------------------