Revert "add advise mode for bot evaluation"

This reverts commit 6cc6f67
mattdeitke · Dec 14, 2018 · 4969fae · 4969fae
1 parent f06ebc0
commit 4969fae
Show file tree

Hide file tree

Showing 14 changed files with 4 additions and 75 deletions.
diff --git a/scripts/compute_possible_instructions.py b/scripts/compute_possible_instructions.py
diff --git a/scripts/enjoy.py b/scripts/enjoy.py
diff --git a/scripts/eval_bot.py b/scripts/eval_bot.py
@@ -3,25 +3,13 @@
 """
 Evaluate the success rate of the bot
 This script is used for testing/debugging purposes
-
-Examples of usage:
-- Run the bot on the GoTo level 10 times (seeds 9 to 18)
-eval_bot.py --level GoTo --num_runs 10 --seed 9
-- for all levels, 100 times, run a Random(seed 0) agent for len(episode)/3 steps before running the bot:
-eval_bot.py --advise_mode --num_runs 100
-- for all levels, 500 times, during the first 10 steps, choose action form a Random(seed 9) agent with proba .9 or
- optimal (from bot) with proba .1, then continue with optimal bot actions:
-eval_boy.py --advise_mode --bad_action_proba .8 --non_optimal_steps 10 --random_agent_seed 9
-
 """
 
 import random
 import time
 from optparse import OptionParser
 from babyai.levels import level_dict
-from babyai.bot import Bot, DisappearedBoxError
-from babyai.utils.agent import ModelAgent, RandomAgent
-import numpy as np
+from babyai.bot import Bot
 
 level_list = [
     'OpenRedDoor',
@@ -51,34 +39,6 @@
     "--level",
     default=None
 )
-parser.add_option(
-    "--advise_mode",
-    action='store_true',
-    default=False,
-    help='If specified, a RandomAgent or ModelAgent will act first, then the bot will take over')
-parser.add_option(
-    "--non_optimal_steps",
-    type=int,
-    default=None,
-    help='Number of non bot steps ModelAgent or RandomAgent takes before letting the bot take over'
-)
-parser.add_option(
-    "--model",
-    default=None,
-    help='Model to use to act for a few steps before letting the bot take over'
-)
-parser.add_option(
-    "--random_agent_seed",
-    type="int",
-    default=1,
-    help='Seed of the random agent that acts a few steps before letting the bot take over'
-)
-parser.add_option(
-    "--bad_action_proba",
-    type="float",
-    default=1.,
-    help='Probability of performing the non-optimal action when the random/model agent is performing'
-)
 parser.add_option(
     "--seed",
     type="int",
@@ -98,21 +58,11 @@
 if options.level:
     level_list = [options.level]
 
-bad_agent = None
-if options.advise_mode:
-    if options.model:
-        bad_agent = ModelAgent(options.model, obss_preprocessor=None,
-                               argmax=True)
-    else:
-        bad_agent = RandomAgent(seed=options.random_agent_seed,
-                                env=level_dict[level_list[0]]())
-
 start_time = time.time()
 
 for level_name in level_list:
 
     num_success = 0
-    num_disappeared_boxes = 0
     total_reward = 0
     total_steps = 0
 
@@ -126,22 +76,10 @@
         if options.verbose:
             print('%s/%s: %s, seed=%d' % (run_no+1, options.num_runs, mission.surface, mission_seed))
 
-        optimal_actions = []
-        before_optimal_actions = []
-        non_optimal_steps = options.non_optimal_steps or int(mission.max_steps // 3)
-        np.random.seed(mission_seed)
-
         try:
             episode_steps = 0
             while True:
                 action = expert.get_action()
-                if options.advise_mode and episode_steps < non_optimal_steps:
-                    if np.random.rand() < options.bad_action_proba:
-                        action = bad_agent.act(mission.gen_obs())['action'].item()
-                    before_optimal_actions.append(action)
-                else:
-                    optimal_actions.append(action)
-
                 expert.take_action(action)
                 obs, reward, done, info = mission.step(action)
 
@@ -156,23 +94,14 @@
                         print('FAILURE on %s, seed %d, reward %.2f' % (level_name, mission_seed, reward))
                     break
         except Exception as e:
-            if isinstance(e, DisappearedBoxError):
-                num_disappeared_boxes += 1
-                if options.verbose:
-                    print('box FAILURE on %s, seed %d' % (level_name, mission_seed))
-            else:
-                print('FAILURE on %s, seed %d' % (level_name, mission_seed))
-                print(e)
-                # Playing these 2 sets of actions should get you to the mission snapshot above
-                print(before_optimal_actions, optimal_actions)
+            print('FAILURE on %s, seed %d' % (level_name, mission_seed))
+            print(e)
 
     success_rate = 100 * num_success / options.num_runs
-    disappeared_boxes_rate = 100 * num_disappeared_boxes / options.num_runs
     mean_reward = total_reward / options.num_runs
     mean_steps = total_steps / options.num_runs
 
-    print('%16s: %.1f%%, box errors %.2f%%, r=%.3f, s=%.2f' % (level_name, success_rate, disappeared_boxes_rate,
-                                                               mean_reward, mean_steps))
+    print('%16s: %.1f%%, r=%.3f, s=%.2f' % (level_name, success_rate, mean_reward, mean_steps))
 
 end_time = time.time()
 total_time = end_time - start_time

diff --git a/scripts/evaluate.py b/scripts/evaluate.py
diff --git a/scripts/evaluate_all_demos.py b/scripts/evaluate_all_demos.py
diff --git a/scripts/evaluate_all_models.py b/scripts/evaluate_all_models.py
diff --git a/scripts/gui.py b/scripts/gui.py
diff --git a/scripts/make_agent_demos.py b/scripts/make_agent_demos.py
diff --git a/scripts/make_human_demos.py b/scripts/make_human_demos.py
diff --git a/scripts/show_level_instructions.py b/scripts/show_level_instructions.py
diff --git a/scripts/test_mission_gen.py b/scripts/test_mission_gen.py
diff --git a/scripts/train_il.py b/scripts/train_il.py
diff --git a/scripts/train_intelligent_expert.py b/scripts/train_intelligent_expert.py
diff --git a/scripts/train_rl.py b/scripts/train_rl.py