
Commit 6edd62e

fixed training
Parent: 92a3a2d

5 files changed: 130 additions, 15 deletions

src/main/java/org/aika/Neuron.java

Lines changed: 41 additions & 1 deletion
@@ -58,6 +58,31 @@ public Activation addInput(Document doc, int begin, int end) {
         return addInput(doc, begin, end, null, doc.bottom);
     }
 
+    /**
+     * Propagate an input activation into the network.
+     *
+     * @param doc The current document
+     * @param begin The range begin
+     * @param end The range end
+     * @param value The activation value of this input activation
+     */
+    public Activation addInput(Document doc, int begin, int end, double value) {
+        return addInput(doc, begin, end, null, doc.bottom, value);
+    }
+
+    /**
+     * Propagate an input activation into the network.
+     *
+     * @param doc The current document
+     * @param begin The range begin
+     * @param end The range end
+     * @param value The activation value of this input activation
+     * @param targetValue The target activation value for supervised learning
+     */
+    public Activation addInput(Document doc, int begin, int end, double value, double targetValue) {
+        return addInput(doc, begin, end, null, doc.bottom, value, targetValue);
+    }
+
 
     /**
      * Propagate an input activation into the network.
@@ -110,7 +135,22 @@ public Activation addInput(Document doc, int begin, int end, Integer rid, Interp
      * @param value The activation value of this input activation
      */
     public Activation addInput(Document doc, int begin, int end, Integer rid, InterprNode o, double value) {
-        return get().addInput(doc, begin, end, rid, o, value);
+        return addInput(doc, begin, end, rid, o, value, 0.0);
+    }
+
+    /**
+     * Propagate an input activation into the network.
+     *
+     * @param doc The current document
+     * @param begin The range begin
+     * @param end The range end
+     * @param rid The relational id (e.g. the word position)
+     * @param o The interpretation node
+     * @param value The activation value of this input activation
+     * @param targetValue The target activation value for supervised learning
+     */
+    public Activation addInput(Document doc, int begin, int end, Integer rid, InterprNode o, double value, double targetValue) {
+        return get().addInput(doc, begin, end, rid, o, value, targetValue);
     }
 
 
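For orientation, a minimal usage sketch of the two new convenience overloads (illustrative only, not part of this commit; neuron names and ranges are made up, mirroring TrainingTest below):

    Model m = new Model();
    Neuron in = m.createNeuron("IN");
    Neuron out = m.createNeuron("OUT");

    Document doc = m.createDocument("Bla");

    // Plain input activation with activation value 1.0 (no supervision).
    in.addInput(doc, 0, 3, 1.0);

    // Input activation with value 0.0 and target value 1.0 for supervised learning;
    // a non-zero target value registers the activation in doc.targetActivations.
    out.addInput(doc, 0, 3, 0.0, 1.0);
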
src/main/java/org/aika/corpus/Document.java

Lines changed: 11 additions & 9 deletions
@@ -75,6 +75,9 @@ public class Document implements Comparable<Document> {
     public TreeSet<INeuron> activatedNeurons = new TreeSet<>();
     public TreeSet<INeuron> finallyActivatedNeurons = new TreeSet<>();
     public TreeSet<Activation> inputNeuronActivations = new TreeSet<>();
+    public TreeSet<Activation> targetActivations = new TreeSet<>();
+    public TreeSet<Activation> errorSignalActivations = new TreeSet<>();
+
     public TreeMap<NodeActivation.Key, NodeActivation> activationsByRid = new TreeMap<>(new Comparator<NodeActivation.Key>() {
         @Override
         public int compare(NodeActivation.Key act1, NodeActivation.Key act2) {
@@ -259,18 +262,18 @@ public TrainConfig setPerformBackpropagation(boolean performBackpropagation) {
 
 
     public void train(TrainConfig trainConfig) {
+        for(Activation tAct: targetActivations) {
+            tAct.key.n.neuron.get().computeOutputErrorSignal(this, tAct);
+        }
+
         if(trainConfig.performBackpropagation) {
             bQueue.backpropagtion();
         }
 
-        for (INeuron n : finallyActivatedNeurons) {
-            ThreadState<OrNode, Activation> th = n.node.get().getThreadState(threadId, false);
-            if (th != null) {
-                for (Activation act : th.activations.values()) {
-                    n.train(this, act, trainConfig.learnRate, trainConfig.synapseEvaluation);
-                }
-            }
+        for (Activation act : errorSignalActivations) {
+            act.key.n.neuron.get().train(this, act, trainConfig.learnRate, trainConfig.synapseEvaluation);
         }
+        errorSignalActivations.clear();
     }
 
     /**
@@ -368,7 +371,6 @@ public String neuronActivationsToString(boolean withWeights, boolean withTextSni
             Activation.State s = me.getValue();
             sb.append("[R:" + me.getKey());
             sb.append(" VALUE:" + Utils.round(s.value));
-            sb.append(" F:" + s.fired);
             sb.append(" W:" + Utils.round(s.weight.w));
             sb.append(" N:" + Utils.round(s.weight.n));
             sb.append("]");
@@ -655,7 +657,7 @@ public void backpropagtion() {
             Activation act = queue.pollFirst();
 
             act.isQueued = false;
-            act.key.n.neuron.get().computeErrorSignal(Document.this, act);
+            act.key.n.neuron.get().computeBackpropagationErrorSignal(Document.this, act);
         }
     }
 }
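
A caller-side sketch of the reworked training flow (illustrative, not part of this commit; it reuses the Model and Neurons from the sketch above, and the synapse evaluation lambda is the one from TrainingTest below). train() now computes output error signals for doc.targetActivations, optionally backpropagates them, and then trains only the activations that received a non-zero error signal:

    Document doc = m.createDocument("Bla");
    in.addInput(doc, 0, 3, 1.0);         // regular input activation
    doc.process();

    out.addInput(doc, 0, 3, 0.0, 1.0);   // target value 1.0 -> lands in doc.targetActivations

    doc.train(new Document.TrainConfig()
            .setLearnRate(2.0)
            .setPerformBackpropagation(false)
            .setSynapseEvaluation((iAct, oAct) -> new Synapse.Key(
                    false, 0, null,
                    Range.Operator.EQUALS, Range.Mapping.START, true,
                    Range.Operator.EQUALS, Range.Mapping.END, true)));

    doc.clearActivations();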

src/main/java/org/aika/neuron/Activation.java

Lines changed: 1 addition & 1 deletion
@@ -46,8 +46,8 @@ public final class Activation extends NodeActivation<OrNode> {
     public long currentStateV;
     public StateChange currentStateChange;
 
-    public double initialErrorSignal;
     public double errorSignal;
+    public double targetValue;
 
 
     public Activation(int id, Document doc, Key key) {

src/main/java/org/aika/neuron/INeuron.java

Lines changed: 23 additions & 4 deletions
@@ -121,7 +121,7 @@ public INeuron(Model m, String label, String outputText) {
      * @param o The interpretation node
      * @param value The activation value of this input activation
      */
-    public Activation addInput(Document doc, int begin, int end, Integer rid, InterprNode o, double value) {
+    public Activation addInput(Document doc, int begin, int end, Integer rid, InterprNode o, double value, double targetValue) {
         Node.addActivationAndPropagate(doc, new NodeActivation.Key(node.get(), new Range(begin, end), rid, o), Collections.emptySet());
 
         doc.propagate();
@@ -130,6 +130,7 @@ public Activation addInput(Document doc, int begin, int end, Integer rid, Interp
         State s = new State(value, 0, NormWeight.ZERO_WEIGHT);
         act.rounds.set(0, s);
         act.finalState = s;
+        act.targetValue = targetValue;
         act.upperBound = value;
         act.isInput = true;
 
@@ -138,6 +139,10 @@ public Activation addInput(Document doc, int begin, int end, Integer rid, Interp
 
         doc.ubQueue.add(act);
 
+        if(targetValue != 0.0) {
+            doc.targetActivations.add(act);
+        }
+
         doc.propagate();
 
         return act;
@@ -294,15 +299,29 @@ public InputState(SynapseActivation sa, State s) {
     }
 
 
-    public void computeErrorSignal(Document doc, Activation act) {
-        act.errorSignal = act.initialErrorSignal;
+    public void computeOutputErrorSignal(Document doc, Activation act) {
+        act.errorSignal += act.targetValue - act.finalState.value;
+
+        if(act.errorSignal != 0.0) {
+            doc.errorSignalActivations.add(act);
+        }
+        for (SynapseActivation sa : act.neuronInputs) {
+            doc.bQueue.add(sa.input);
+        }
+    }
+
+
+    public void computeBackpropagationErrorSignal(Document doc, Activation act) {
         for (SynapseActivation sa : act.neuronOutputs) {
             Synapse s = sa.s;
             Activation oAct = sa.output;
 
             act.errorSignal += s.w * oAct.errorSignal * (1.0 - act.finalState.value);
         }
 
+        if(act.errorSignal != 0.0) {
+            doc.errorSignalActivations.add(act);
+        }
         for (SynapseActivation sa : act.neuronInputs) {
             doc.bQueue.add(sa.input);
         }
@@ -315,7 +334,7 @@ public void train(Document doc, Activation targetAct, double learnRate, Document
         long v = doc.visitedCounter++;
 
         double x = learnRate * targetAct.errorSignal;
-        bias += x;
+        bias = Math.min(0.0, bias + x);
         for (INeuron n : doc.finallyActivatedNeurons) {
             for(Activation iAct: n.getFinalActivations(doc)) {
                 Synapse.Key sk = se.evaluate(iAct, targetAct);
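
In compact form (notation mine, not from the source): with final activation value v_i, target value t_i, synapse weight w_{ij} from i to j, and learn rate \eta, the error-signal code above corresponds to

    \delta_i^{\text{out}} = t_i - v_i
    \delta_i^{\text{bp}}  = \sum_{j \in \text{out}(i)} w_{ij}\,\delta_j\,(1 - v_i)
    b_i \leftarrow \min\bigl(0,\; b_i + \eta\,\delta_i\bigr)

where the code accumulates the signals with += rather than assigning them, and the clamp of the bias to non-positive values is new in this commit (bias = Math.min(0.0, bias + x)).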

src/test/java/org/aika/network/TrainingTest.java

Lines changed: 54 additions & 0 deletions
@@ -23,6 +23,7 @@
 import org.aika.neuron.Activation;
 import org.aika.neuron.INeuron;
 import org.aika.neuron.Synapse;
+import org.junit.Assert;
 import org.junit.Test;
 
 /**
@@ -64,6 +65,59 @@ public void testTraining() {
 
         doc = m.createDocument("Bla");
         in.addInput(doc, 0, 3, 0, doc.bottom, 1.0);
+    }
+
+
+    @Test
+    public void testTraining1() {
+        Model m = new Model();
+
+        Neuron inA = m.createNeuron("A");
+        Neuron inB = m.createNeuron("B");
+
+        Neuron outC = m.createNeuron("C");
+
+        {
+            Document doc = m.createDocument("Bla");
+            inA.addInput(doc, 0, 3, 1.0);
+            inB.addInput(doc, 0, 3, 1.0);
+
+            doc.process();
+
+
+            outC.addInput(doc, 0, 3, 0.0, 1.0);
+
+            doc.train(
+                    new Document.TrainConfig()
+                            .setLearnRate(2.0)
+                            .setPerformBackpropagation(false)
+                            .setSynapseEvaluation((iAct, oAct) -> new Synapse.Key(
+                                    false,
+                                    0,
+                                    null,
+                                    Range.Operator.EQUALS,
+                                    Range.Mapping.START,
+                                    true,
+                                    Range.Operator.EQUALS,
+                                    Range.Mapping.END,
+                                    true
+                            ))
+            );
+
+            doc.clearActivations();
+        }
+
+        {
+            Document doc = m.createDocument("Bla");
+            inA.addInput(doc, 0, 3, 1.0);
+            inB.addInput(doc, 0, 3, 1.0);
+
+            doc.process();
+
+            System.out.println(doc.neuronActivationsToString(true, false, true));
+            Assert.assertFalse(outC.getFinalActivations(doc).isEmpty());
 
+            doc.clearActivations();
+        }
     }
 }
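
As a possible follow-up (not part of this commit, and untested here): the same scenario could exercise the new backpropagation path by enabling it in the TrainConfig, which routes the accumulated error signals through computeBackpropagationErrorSignal before the weight update:

    doc.train(new Document.TrainConfig()
            .setLearnRate(2.0)
            .setPerformBackpropagation(true)
            .setSynapseEvaluation((iAct, oAct) -> new Synapse.Key(
                    false, 0, null,
                    Range.Operator.EQUALS, Range.Mapping.START, true,
                    Range.Operator.EQUALS, Range.Mapping.END, true)));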
