Added function to simulate iterations

reachtarunhere · reachtarunhere · commit 21d9136f12f9 · 2016-03-30T00:10:20.000+05:30
diff --git a/rl.py b/rl.py
@@ -52,3 +52,32 @@ def __call__(self, percept):
 
     def update_state(self, percept):
         raise NotImplementedError
+
+
+def run_single_trial(agent_program, mdp):
+    ''' Execute trial for given agent_program
+    and mdp. mdp should be an instance of subclass
+    of mdp.MDP '''
+
+    def take_single_action(mdp, s, a):
+        '''
+        Selects outcome of taking action a
+        in state s. Weighted Sampling.
+        '''
+        x = random.uniform(0, 1)
+        cumulative_probability = 0.0
+        for probabilty_state in mdp.T(s, a):
+            probabilty, state = probabilty_state
+            cumulative_probability += probabilty
+            if x < cumulative_probability:
+                break
+        return state
+
+    current_state = mdp.init
+    while True:
+        current_reward = mdp.R(current_state)
+        percept = (current_state, current_reward)
+        next_action = agent_program(percept)
+        if next_action is None:
+            break
+        current_state = take_single_action(mdp, current_state, next_action)