Skip to content

Commit fa4d80e

Browse files
author
ctjoreilly
committed
Added
===== *. aima.search.online.LRTAStarAgent - Initial implementation of algorithm in Fig 4.23. *. aima.test.search.online.LRTAStarAgentTest - Test case for LRTAStarAgent - Note: One test currently commented out as algorithm goes into eternal loop based on the condition it is testing. *. aima.search.online.ActionState - Factored out code from OnlineDFSAgent for re-use in LRTAStarAgent Modified ======== *. aima.search.online.OnlineDFSAgent - Factored out ActionState for re-use in LRTAStarAgent. *. aima.test.learningtest.neural.BackPropagationTests - Commented out System.outs *. aima.test.search.SearchTests - Added LRTAStarAgentTest to suite.
1 parent 354e69d commit fa4d80e

File tree

6 files changed

+304
-34
lines changed

6 files changed

+304
-34
lines changed
Lines changed: 40 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,40 @@
1+
package aima.search.online;
2+
3+
import aima.basic.Percept;
4+
5+
public class ActionState {
6+
private final Object action;
7+
private final Percept state;
8+
9+
public ActionState(Object action, Percept state) {
10+
this.action = action;
11+
this.state = state;
12+
}
13+
14+
public Object getAction() {
15+
return action;
16+
}
17+
18+
public Percept getState() {
19+
return state;
20+
}
21+
22+
@Override
23+
public boolean equals(Object o) {
24+
if (o == null || !(o instanceof ActionState)) {
25+
return super.equals(o);
26+
}
27+
return (action.equals(((ActionState) o).action) && state
28+
.equals(((ActionState) o).state));
29+
}
30+
31+
@Override
32+
public int hashCode() {
33+
return action.hashCode() + state.hashCode();
34+
}
35+
36+
@Override
37+
public String toString() {
38+
return "(" + action + ", " + state + ")";
39+
}
40+
}
Lines changed: 170 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,170 @@
1+
package aima.search.online;
2+
3+
import java.util.ArrayList;
4+
import java.util.Hashtable;
5+
import java.util.List;
6+
7+
import aima.basic.Agent;
8+
import aima.basic.Percept;
9+
import aima.search.framework.Problem;
10+
import aima.search.framework.Successor;
11+
12+
/**
 * Artificial Intelligence A Modern Approach (2nd Edition): Figure 4.23, page
 * 128.<br>
 * <code>
 * function LRTA*AGENT(s') returns an action
 *   inputs: s', a percept that identifies the current state
 *   static: result, a table, indexed by action and state, initially empty
 *           H, a table of cost estimates indexed by state, initially empty
 *           s, a, the previous state and action, initially null
 *
 *   if GOAL-TEST(s') then return stop
 *   if s' is new state (not in H) then H[s'] <- h(s')
 *   unless s is null
 *     result[a, s] <- s'
 *     H[s] <- min LRTA*-COST(s, b, result[b, s], H)
 *          b (element of) ACTIONS(s)
 *   a <- an action b in ACTIONS(s') that minimizes LRTA*-COST(s', b, result[b, s'], H)
 *   s <- s'
 *   return a
 *
 *
 * function LRTA*-COST(s, a, s', H) returns a cost estimate
 *   if s' is undefined then return h(s)
 *   else return c(s, a, s') + H[s']
 * </code>
 *
 * Figure 4.23 LRTA*-AGENT selects an action according to the value of
 * neighboring states, which are updated as the agent moves about the state
 * space.<br>
 * Note: This algorithm fails to exit if the goal does not exist (e.g. A<->B Goal=X),
 * this could be an issue with the implementation. Comments welcome.
 */

/**
 * @author Ciaran O'Reilly
 *
 */
public class LRTAStarAgent extends Agent {

	private Problem problem;
	// static: result, a table, indexed by action and state, initially empty
	private final Hashtable<ActionState, Percept> result = new Hashtable<ActionState, Percept>();
	// H, a table of cost estimates indexed by state, initially empty
	private final Hashtable<Percept, Double> H = new Hashtable<Percept, Double>();
	// s, a, the previous state and action, initially null
	private Percept s = null;
	private Object a = null;

	/**
	 * Constructs an LRTA* agent for the given problem. All learned state
	 * (result, H, s, a) starts empty via init().
	 */
	public LRTAStarAgent(Problem problem) {
		setProblem(problem);
	}

	public Problem getProblem() {
		return problem;
	}

	/**
	 * Replaces the problem being solved and resets all learned state, so the
	 * agent can be re-used on a fresh problem.
	 */
	public void setProblem(Problem problem) {
		this.problem = problem;
		init();
	}

	// function LRTA*AGENT(s') returns an action
	// inputs: s', a percept that identifies the current state
	/**
	 * One step of the LRTA* loop (Fig 4.23). Called once per percept; updates
	 * the result/H tables from the previous (s, a) transition, then picks the
	 * action of minimum estimated cost from the current state.
	 *
	 * @param sComma
	 *            s', the percept identifying the current state.
	 * @return the chosen action's string form, or NO_OP when at the goal.
	 */
	@Override
	public String execute(Percept sComma) {

		// if GOAL-TEST(s') then return stop
		if (!goalTest(sComma)) {
			// if s' is new state (not in H) then H[s'] <- h(s')
			if (!H.containsKey(sComma)) {
				H.put(sComma, getProblem().getHeuristicFunction()
						.getHeuristicValue(sComma));
			}
			// unless s is null
			if (null != s) {
				// result[a, s] <- s'
				// (records that doing a in s was observed to lead to s')
				result.put(new ActionState(a, s), sComma);

				// H[s] <- min LRTA*-COST(s, b, result[b, s], H)
				// b (element of) ACTIONS(s)
				double min = Double.MAX_VALUE;
				for (Object b : actions(s)) {
					double cost = lrtaCost(s, b, result.get(new ActionState(b,
							s)));
					if (cost < min) {
						min = cost;
					}
				}
				H.put(s, min);
			}
			// a <- an action b in ACTIONS(s') that minimizes LRTA*-COST(s', b,
			// result[b, s'], H)
			double min = Double.MAX_VALUE;
			// Just in case no actions
			a = Agent.NO_OP;
			for (Object b : actions(sComma)) {
				double cost = lrtaCost(sComma, b, result.get(new ActionState(b,
						sComma)));
				if (cost < min) {
					min = cost;
					a = b;
				}
			}
		} else {
			a = Agent.NO_OP;
		}

		// s <- s'
		s = sComma;

		if (Agent.NO_OP.equals(a)) {
			// I'm either at the Goal or can't get to it,
			// which in either case I'm finished so just die.
			// NOTE(review): die() presumably marks this Agent as finished for
			// the environment's stepUntilNoOp loop - confirm against Agent.
			die();
		}
		// return a
		return a.toString();
	}

	//
	// PRIVATE METHODS
	//
	// Resets all learned state; live() presumably re-activates the agent
	// (the inverse of die()) - confirm against Agent.
	private void init() {
		live();
		result.clear();
		H.clear();
		s = null;
		a = null;
	}

	// GOAL-TEST(s'): delegates to the problem definition.
	private boolean goalTest(Percept state) {
		return getProblem().isGoalState(state);
	}

	// function LRTA*-COST(s, a, s', H) returns a cost estimate
	private double lrtaCost(Percept s, Object action, Percept sComma) {
		// if s' is undefined then return h(s)
		// (i.e. the outcome of action in s has never been observed)
		if (null == sComma) {
			return getProblem().getHeuristicFunction().getHeuristicValue(s);
		}
		// else return c(s, a, s') + H[s']
		// H.get(sComma) is safe here: sComma only appears in result as a
		// previously perceived state, which execute() always enters into H.
		return getProblem().getStepCostFunction().calculateStepCost(s, sComma,
				action.toString())
				+ H.get(sComma);
	}

	// ACTIONS(state): the actions available in state, derived from the
	// problem's successor function.
	private List<Object> actions(Percept state) {
		List<Object> actions = new ArrayList<Object>();

		List<Successor> successors = getProblem().getSuccessorFunction()
				.getSuccessors(state);

		for (Successor s : successors) {
			actions.add(s.getAction());
		}

		return actions;
	}
}

src/aima/search/online/OnlineDFSAgent.java

Lines changed: 4 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@
1919
* unexplored, a table that lists, for each visited state, the actions not yet tried
2020
* unbacktracked, a table that lists, for each visited state, the backtracks not yet tried
2121
* s, a, the previous state and action, initially null
22-
*
22+
*
2323
* if GOAL-TEST(s') then return stop
2424
* if s' is a new state then unexplored[s'] <- ACTIONS(s')
2525
* if s is not null then do
@@ -106,9 +106,9 @@ public String execute(Percept sComma) {
106106
Percept popped = unbacktracked.get(sComma).remove(
107107
unbacktracked.get(sComma).size() - 1);
108108
for (ActionState as : result.keySet()) {
109-
if (as.state.equals(sComma)
109+
if (as.getState().equals(sComma)
110110
&& result.get(as).equals(popped)) {
111-
a = as.action;
111+
a = as.getAction();
112112
break;
113113
}
114114
}
@@ -139,6 +139,7 @@ public String execute(Percept sComma) {
139139
//
140140

141141
private void init() {
142+
live();
142143
result.clear();
143144
unexplored.clear();
144145
unbacktracked.clear();
@@ -162,33 +163,4 @@ private List<Object> actions(Percept state) {
162163

163164
return actions;
164165
}
165-
166-
private class ActionState {
167-
private final Object action;
168-
private final Percept state;
169-
170-
public ActionState(Object action, Percept state) {
171-
this.action = action;
172-
this.state = state;
173-
}
174-
175-
@Override
176-
public boolean equals(Object o) {
177-
if (o == null || !(o instanceof ActionState)) {
178-
return super.equals(o);
179-
}
180-
return (action.equals(((ActionState) o).action) && state
181-
.equals(((ActionState) o).state));
182-
}
183-
184-
@Override
185-
public int hashCode() {
186-
return action.hashCode() + state.hashCode();
187-
}
188-
189-
@Override
190-
public String toString() {
191-
return "(" + action + ", " + state + ")";
192-
}
193-
}
194166
}

src/aima/test/learningtest/neural/BackPropagationTests.java

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -137,7 +137,7 @@ public void xtestDataSetPopulation() throws Exception {
137137

138138
innds.refreshDataset();
139139
int[] result = ffnn.testOnDataSet(innds);
140-
System.out.println(result[0] + " right, " + result[1] + " wrong");
140+
// System.out.println(result[0] + " right, " + result[1] + " wrong");
141141

142142
}
143143

@@ -154,7 +154,7 @@ public void testPerceptron() throws Exception {
154154

155155
innds.refreshDataset();
156156
int[] result = perc.testOnDataSet(innds);
157-
System.out.println(result[0] + " right, " + result[1] + " wrong");
157+
// System.out.println(result[0] + " right, " + result[1] + " wrong");
158158

159159
}
160160
}

src/aima/test/search/SearchTests.java

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,7 @@
1717
import aima.test.search.nqueens.NQueensFitnessFunctionTest;
1818
import aima.test.search.nqueens.NQueensGoalTestTest;
1919
import aima.test.search.nqueens.NQueensSuccessorFunctionTest;
20+
import aima.test.search.online.LRTAStarAgentTest;
2021
import aima.test.search.online.OnlineDFSAgentTest;
2122
import aima.test.search.searches.AStarSearchTest;
2223
import aima.test.search.searches.BidirectionalSearchTest;
@@ -52,6 +53,7 @@ public static Test suite() {
5253
suite.addTest(new TestSuite(GreedyBestFirstSearchTest.class));
5354
suite.addTest(new TestSuite(IterativeDeepeningSearchTest.class));
5455
suite.addTest(new TestSuite(LIFOQueueTest.class));
56+
suite.addTest(new TestSuite(LRTAStarAgentTest.class));
5557
suite.addTest(new TestSuite(MapAgentTest.class));
5658
suite.addTest(new TestSuite(MapCSPTest.class));
5759
suite.addTest(new TestSuite(MapEnvironmentTest.class));
Lines changed: 86 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,86 @@
1+
package aima.test.search.online;
2+
3+
import junit.framework.TestCase;
4+
import aima.basic.BasicEnvironmentView;
5+
import aima.search.framework.HeuristicFunction;
6+
import aima.search.map.BidirectionalMapProblem;
7+
import aima.search.map.Map;
8+
import aima.search.map.MapEnvironment;
9+
import aima.search.online.LRTAStarAgent;
10+
11+
public class LRTAStarAgentTest extends TestCase {
12+
Map aMap;
13+
14+
StringBuffer envChanges;
15+
16+
HeuristicFunction hf;
17+
18+
@Override
19+
public void setUp() {
20+
aMap = new Map(new String[] { "A", "B", "C", "D", "E", "F" });
21+
aMap.addBidirectionalLink("A", "B", 4);
22+
aMap.addBidirectionalLink("B", "C", 4);
23+
aMap.addBidirectionalLink("C", "D", 4);
24+
aMap.addBidirectionalLink("D", "E", 4);
25+
aMap.addBidirectionalLink("E", "F", 4);
26+
hf = new HeuristicFunction() {
27+
public double getHeuristicValue(Object state) {
28+
return 1;
29+
}
30+
};
31+
32+
envChanges = new StringBuffer();
33+
}
34+
35+
public void testAlreadyAtGoal() {
36+
MapEnvironment me = new MapEnvironment(aMap);
37+
LRTAStarAgent agent = new LRTAStarAgent(new BidirectionalMapProblem(me
38+
.getMap(), "A", "A", hf));
39+
me.addAgent(agent, "A");
40+
me.registerView(new BasicEnvironmentView() {
41+
@Override
42+
public void envChanged(String command) {
43+
envChanges.append(command).append("->");
44+
}
45+
});
46+
me.stepUntilNoOp();
47+
48+
assertEquals("NoOP->", envChanges.toString());
49+
}
50+
51+
public void testNormalSearch() {
52+
MapEnvironment me = new MapEnvironment(aMap);
53+
LRTAStarAgent agent = new LRTAStarAgent(new BidirectionalMapProblem(me
54+
.getMap(), "A", "F", hf));
55+
me.addAgent(agent, "A");
56+
me.registerView(new BasicEnvironmentView() {
57+
@Override
58+
public void envChanged(String command) {
59+
envChanges.append(command).append("->");
60+
}
61+
});
62+
me.stepUntilNoOp();
63+
64+
assertEquals("B->A->B->C->B->C->D->C->D->E->D->E->F->NoOP->",
65+
envChanges.toString());
66+
}
67+
68+
public void testNoPath() {
69+
// Note: Will search forever if no path is possible.
70+
// MapEnvironment me = new MapEnvironment(aMap);
71+
// LRTAStarAgent agent = new LRTAStarAgent(new
72+
// BidirectionalMapProblem(me
73+
// .getMap(), "A", "G", hf));
74+
// me.addAgent(agent, "A");
75+
// me.registerView(new BasicEnvironmentView() {
76+
// @Override
77+
// public void envChanged(String command) {
78+
// envChanges.append(command).append("->");
79+
// }
80+
// });
81+
// me.stepUntilNoOp();
82+
//
83+
// assertEquals("B->A->B->C->B->C->D->C->D->E->D->E->F->NoOP->",
84+
// envChanges.toString());
85+
}
86+
}

0 commit comments

Comments
 (0)