Commit 729004e

Merge pull request aimacode#427 from samagra14/information_gathering_agent
Adds information gathering agent
2 parents 856bc7d + d8e59c3 commit 729004e

File tree

3 files changed: +248 -1 lines changed

README.md

Lines changed: 1 addition & 1 deletion

@@ -100,7 +100,7 @@ Java implementation of algorithms from [Russell](http://www.cs.berkeley.edu/~rus
 |15.6|580|Fixed-Lag-Smoothing|[FixedLagSmoothing](/aima-core/src/main/java/aima/core/probability/hmm/exact/FixedLagSmoothing.java)|
 |15|590|Dynamic Bayesian Network|[DynamicBayesianNetwork](/aima-core/src/main/java/aima/core/probability/bayes/DynamicBayesianNetwork.java)|
 |15.17|598|Particle-Filtering|[ParticleFiltering](/aima-core/src/main/java/aima/core/probability/bayes/approx/ParticleFiltering.java)|
-|16.9|632|Information-Gathering-Agent|---|
+|16.9|632|Information-Gathering-Agent|[InformationGatheringAgent](/aima-core/src/main/java/aima/core/probability/InformationGatheringAgent.java)|
 |17|647|Markov Decision Process|[MarkovDecisionProcess](/aima-core/src/main/java/aima/core/probability/mdp/MarkovDecisionProcess.java)|
 |17.4|653|Value-Iteration|[ValueIteration](/aima-core/src/main/java/aima/core/probability/mdp/search/ValueIteration.java)|
 |17.7|657|Policy-Iteration|[PolicyIteration](/aima-core/src/main/java/aima/core/probability/mdp/search/PolicyIteration.java)|
aima-core/src/main/java/aima/core/probability/DecisionNetwork.java

Lines changed: 85 additions & 0 deletions

package aima.core.probability;

import aima.core.probability.bayes.BayesInference;
import aima.core.probability.bayes.BayesianNetwork;
import aima.core.probability.domain.FiniteDomain;
import aima.core.probability.proposition.AssignmentProposition;

import java.util.List;

/**
 * Artificial Intelligence A Modern Approach (3rd Edition): page 626.<br>
 * <br>
 * Decision networks combine Bayesian networks with additional node types for
 * actions and utilities.<br>
 * <p>
 * In its most general form, a decision network represents information about the
 * agent's current state, its possible actions, the state that will result from
 * the agent's action, and the utility of that state.
 *
 * @author samagra
 */
public abstract class DecisionNetwork {

    // The underlying Bayesian network
    private BayesianNetwork network;
    // The single decision node
    private RandomVariable action;
    // To calculate various conditional probabilities
    private BayesInference inferenceProcedure;

    /**
     * Constructor for the decision network.
     *
     * @param network            The underlying Bayesian network.
     * @param action             The decision node.
     * @param inferenceProcedure The inference procedure to be used for probability calculations.
     */
    public DecisionNetwork(BayesianNetwork network,
                           RandomVariable action, BayesInference inferenceProcedure) {
        this.network = network;
        this.action = action;
        this.inferenceProcedure = inferenceProcedure;
    }

    /**
     * Returns the utility of assigning a particular value to the decision node.
     *
     * @param action The decision variable.
     * @param value  The value assigned to the decision variable.
     * @return The utility of the resulting state.
     */
    public abstract double getUtilityForAction(RandomVariable action, Object value);

    /**
     * Calculates the expected utility of an action given the available
     * evidence: the utility of each possible value of the action node,
     * weighted by its posterior probability.
     *
     * @param action   Action for which the utility is to be calculated.
     * @param evidence The available information.
     * @return The expected utility of the action.
     */
    public double getExpectedUtility(RandomVariable action,
                                     List<AssignmentProposition> evidence) {
        double utility = 0;
        // toArray(T[]) is required here; casting the result of the no-arg
        // toArray() to AssignmentProposition[] would throw a ClassCastException.
        CategoricalDistribution distribution = inferenceProcedure.ask(
                new RandomVariable[]{action},
                evidence.toArray(new AssignmentProposition[0]),
                this.getNetwork());
        for (Object value : ((FiniteDomain) action.getDomain()).getPossibleValues()) {
            utility += distribution.getValue(value) * this.getUtilityForAction(action, value);
        }
        return utility;
    }

    /**
     * Currently the decision network supports only a single decision node and
     * hence always returns that node.
     *
     * @return The single decision node of the network.
     */
    public Object getBestAction() {
        return action;
    }

    /**
     * Returns the underlying Bayesian network.
     *
     * @return The underlying Bayesian network.
     */
    public BayesianNetwork getNetwork() {
        return network;
    }
}
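
For orientation, here is a minimal sketch of how DecisionNetwork might be subclassed and exercised. It is not part of this commit: the Party variable, its prior, and the utility values are invented for illustration, and it assumes the existing aima-core classes RandVar, BooleanDomain, FullCPTNode, BayesNet, and EliminationAsk.

package aima.core.probability;

import java.util.ArrayList;

import aima.core.probability.bayes.BayesianNetwork;
import aima.core.probability.bayes.exact.EliminationAsk;
import aima.core.probability.bayes.impl.BayesNet;
import aima.core.probability.bayes.impl.FullCPTNode;
import aima.core.probability.domain.BooleanDomain;
import aima.core.probability.util.RandVar;

public class PartyDecisionNetwork extends DecisionNetwork {

    public PartyDecisionNetwork(BayesianNetwork network, RandomVariable action) {
        super(network, action, new EliminationAsk());
    }

    @Override
    public double getUtilityForAction(RandomVariable action, Object value) {
        // Invented utilities: holding the party is worth 100, not holding it 50.
        return Boolean.TRUE.equals(value) ? 100.0 : 50.0;
    }

    public static void main(String[] args) {
        // A one-node network over the boolean variable "Party", with a prior
        // of 0.6 for true and 0.4 for false.
        RandVar party = new RandVar("Party", new BooleanDomain());
        BayesianNetwork network = new BayesNet(new FullCPTNode(party, new double[]{0.6, 0.4}));
        DecisionNetwork dn = new PartyDecisionNetwork(network, party);
        // With no evidence: 0.6 * 100 + 0.4 * 50 = 80.0
        System.out.println(dn.getExpectedUtility(party, new ArrayList<>()));
    }
}

Note that getExpectedUtility queries the posterior of the decision variable itself, so the sketch models Party as an ordinary chance node of the network.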
aima-core/src/main/java/aima/core/probability/InformationGatheringAgent.java

Lines changed: 162 additions & 0 deletions

package aima.core.probability;

import aima.core.agent.Action;
import aima.core.agent.Agent;
import aima.core.agent.Percept;
import aima.core.probability.bayes.BayesInference;
import aima.core.probability.domain.FiniteDomain;
import aima.core.probability.proposition.AssignmentProposition;

import java.util.ArrayList;
import java.util.Collections;
import java.util.List;

/**
 * Artificial Intelligence A Modern Approach (3rd Edition): Figure 16.9, page 632.<br>
 * <br>
 * <pre>
 * function INFORMATION-GATHERING-AGENT(percept) returns an action
 *   persistent: D, a decision network
 *
 *   integrate percept into D
 *   j ← the value that maximizes VPI(Ej) / Cost(Ej)
 *   if VPI(Ej) > Cost(Ej)
 *     return REQUEST(Ej)
 *   else return the best action from D
 * </pre>
 * <p>
 * Figure 16.9 Design of a simple information-gathering agent. The agent works
 * by repeatedly selecting the observation with the highest information value,
 * until the cost of the next observation is greater than its expected benefit.
 *
 * @author samagra
 */
public abstract class InformationGatheringAgent implements Agent {

    // To carry out conditional probability calculations
    private BayesInference inferenceMethod;
    // persistent: D, a decision network
    private DecisionNetwork decisionNetwork;
    // The information collected so far
    private List<AssignmentProposition> observedEvidence;
    // The variables about which information can be collected
    private List<RandomVariable> randomVars;

    /**
     * Constructor for the agent.
     *
     * @param decisionNetwork The decision network which represents the problem
     *                        for which information is to be collected.
     * @param inferenceMethod To carry out various conditional probability calculations.
     * @param initialEvidence The information available to the agent beforehand.
     */
    public InformationGatheringAgent(DecisionNetwork decisionNetwork,
                                     BayesInference inferenceMethod,
                                     List<AssignmentProposition> initialEvidence) {
        this.decisionNetwork = decisionNetwork;
        this.inferenceMethod = inferenceMethod;
        this.observedEvidence = initialEvidence;
        this.randomVars = this.decisionNetwork.getNetwork().getVariablesInTopologicalOrder();
    }

    public InformationGatheringAgent(DecisionNetwork decisionNetwork,
                                     BayesInference inferenceMethod) {
        this(decisionNetwork, inferenceMethod, new ArrayList<>());
    }

    /**
     * function INFORMATION-GATHERING-AGENT(percept) returns an action
     *
     * @param percept The current percept of a sequence perceived by the agent.
     * @return The action to be executed by the agent.
     */
    @Override
    public Action execute(Percept percept) {
        // integrate percept into D
        observedEvidence = integratePercept(observedEvidence, percept);

        // j ← the value that maximizes VPI(Ej) / Cost(Ej)
        List<Double> vpiPerUnitCosts = this.vpiPerUnitCost(this.randomVars);
        int j = vpiPerUnitCosts.indexOf(Collections.max(vpiPerUnitCosts));
        RandomVariable randomVar = this.randomVars.get(j);

        // if VPI(Ej) > Cost(Ej)
        if (getVpi(randomVar) > getCost(randomVar)) {
            // return REQUEST(Ej)
            return this.request(randomVar);
        }
        // else return the best action from D
        return (Action) decisionNetwork.getBestAction();
    }

    /**
     * We assume that the result of the action REQUEST(Ej) is that the next
     * percept provides the value of Ej.
     *
     * @param randomVar The random variable for which information is needed.
     * @return The action which leads the agent to the value of Ej.
     */
    protected abstract Action request(RandomVariable randomVar);

    /**
     * Calculates the VPI (value of perfect information) per unit cost for all
     * the given random variables.
     *
     * @param variablesInTopologicalOrder The variables for which information is required.
     * @return A list of VPI-per-unit-cost values, in the same order as the input.
     */
    private List<Double> vpiPerUnitCost(List<RandomVariable> variablesInTopologicalOrder) {
        List<Double> vpiPerUnitCost = new ArrayList<>();
        for (RandomVariable var : variablesInTopologicalOrder) {
            vpiPerUnitCost.add(getVpi(var) / getCost(var));
        }
        return vpiPerUnitCost;
    }

    /**
     * Calculates the cost of obtaining information for a particular variable.
     *
     * @param var The variable to be observed.
     * @return The cost of observing var.
     */
    abstract double getCost(RandomVariable var);

    /**
     * Calculates the VPI (value of perfect information) for a particular random
     * variable: the expected utility averaged over the variable's possible
     * values (each taken in turn as additional evidence), minus the expected
     * utility given the current evidence alone.
     *
     * @param var The variable whose value of perfect information is required.
     * @return The value of perfect information for var.
     */
    double getVpi(RandomVariable var) {
        double vpi = 0;
        // toArray(T[]) is required here; casting the result of the no-arg
        // toArray() to AssignmentProposition[] would throw a ClassCastException.
        CategoricalDistribution distribution = inferenceMethod.ask(
                new RandomVariable[]{var},
                observedEvidence.toArray(new AssignmentProposition[0]),
                decisionNetwork.getNetwork());
        for (Object value : ((FiniteDomain) var.getDomain()).getPossibleValues()) {
            double posteriorProb = distribution.getValue(value);
            List<AssignmentProposition> modifiedEvidence = new ArrayList<>(observedEvidence);
            modifiedEvidence.add(new AssignmentProposition(var, value));
            double expectedUtilityForParticularValue = decisionNetwork.getExpectedUtility(var,
                    modifiedEvidence);
            vpi += posteriorProb * expectedUtilityForParticularValue;
        }
        vpi -= decisionNetwork.getExpectedUtility(var, observedEvidence);
        return vpi;
    }

    /**
     * Extracts the information from the percept and adds it to the observed
     * evidence.
     *
     * @param observedEvidence The evidence collected so far.
     * @param percept          The current percept.
     * @return The updated list of observed evidence.
     */
    abstract List<AssignmentProposition> integratePercept(List<AssignmentProposition> observedEvidence, Percept percept);
}
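
To make the abstract agent concrete, here is a minimal sketch under invented assumptions: a flat observation cost, a REQUEST action built on aima-core's DynamicAction, and a hypothetical EvidencePercept interface for delivering observed values. None of these names are part of the commit; the class is placed in aima.core.probability because getCost and integratePercept are package-private.

package aima.core.probability;

import java.util.ArrayList;
import java.util.List;

import aima.core.agent.Action;
import aima.core.agent.Percept;
import aima.core.agent.impl.DynamicAction;
import aima.core.probability.bayes.BayesInference;
import aima.core.probability.proposition.AssignmentProposition;

public class FlatCostGatheringAgent extends InformationGatheringAgent {

    private boolean alive = true;

    public FlatCostGatheringAgent(DecisionNetwork decisionNetwork,
                                  BayesInference inferenceMethod) {
        super(decisionNetwork, inferenceMethod);
    }

    @Override
    protected Action request(RandomVariable randomVar) {
        // REQUEST(Ej): the environment is expected to answer with the value of
        // randomVar in the next percept.
        return new DynamicAction("Request(" + randomVar.getName() + ")");
    }

    @Override
    double getCost(RandomVariable var) {
        // Flat observation cost, invented for the sketch.
        return 1.0;
    }

    @Override
    List<AssignmentProposition> integratePercept(List<AssignmentProposition> observedEvidence, Percept percept) {
        // Assumes a percept type that exposes its content as an AssignmentProposition.
        List<AssignmentProposition> updated = new ArrayList<>(observedEvidence);
        if (percept instanceof EvidencePercept) {
            updated.add(((EvidencePercept) percept).getProposition());
        }
        return updated;
    }

    // The remaining methods of the aima.core.agent.Agent interface.
    @Override
    public boolean isAlive() {
        return alive;
    }

    @Override
    public void setAlive(boolean alive) {
        this.alive = alive;
    }

    // Hypothetical percept carrying a single piece of evidence.
    public interface EvidencePercept extends Percept {
        AssignmentProposition getProposition();
    }
}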
