Deprecate old models (#8934)

Deprecate old models

Deprecate old models (#8934)
Deprecate old models
a8ba923c · Jaeyoun Kim · GitHub · 5eb294f8 · 5eb294f8 · 5eb294f8
Unverified Commit a8ba923c authored Jul 30, 2020 by Jaeyoun Kim Committed by GitHub Jul 30, 2020
20 changed files
--- a/research/brain_coder/single_task/results_lib.py
+++ b/research/brain_coder/single_task/results_lib.py
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-"""Results object manages distributed reading and writing of results to disk."""
-
-import ast
-from collections import namedtuple
-import os
-import re
-from six.moves import xrange
-import tensorflow as tf
-
-
-ShardStats = namedtuple(
-    'ShardStats',
-    ['num_local_reps_completed', 'max_local_reps', 'finished'])
-
-
-def ge_non_zero(a, b):
-  return a >= b and b > 0
-
-
-def get_shard_id(file_name):
-  assert file_name[-4:].lower() == '.txt'
-  return int(file_name[file_name.rfind('_') + 1: -4])
-
-
-class Results(object):
-  """Manages reading and writing training results to disk asynchronously.
-
-  Each worker writes to its own file, so that there are no race conditions when
-  writing happens. However any worker may read any file, as is the case for
-  `read_all`. Writes are expected to be atomic so that workers will never
-  read incomplete data, and this is likely to be the case on Unix systems.
-  Reading out of date data is fine, as workers calling `read_all` will wait
-  until data from every worker has been written before proceeding.
-  """
-  file_template = 'experiment_results_{0}.txt'
-  search_regex = r'^experiment_results_([0-9])+\.txt$'
-
-  def __init__(self, log_dir, shard_id=0):
-    """Construct `Results` instance.
-
-    Args:
-      log_dir: Where to write results files.
-      shard_id: Unique id for this file (i.e. shard). Each worker that will
-          be writing results should use a different shard id. If there are
-          N shards, each shard should be numbered 0 through N-1.
-    """
-    # Use different files for workers so that they can write to disk async.
-    assert 0 <= shard_id
-    self.file_name = self.file_template.format(shard_id)
-    self.log_dir = log_dir
-    self.results_file = os.path.join(self.log_dir, self.file_name)
-
-  def append(self, metrics):
-    """Append results to results list on disk."""
-    with tf.gfile.FastGFile(self.results_file, 'a') as writer:
-      writer.write(str(metrics) + '\n')
-
-  def read_this_shard(self):
-    """Read only from this shard."""
-    return self._read_shard(self.results_file)
-
-  def _read_shard(self, results_file):
-    """Read only from the given shard file."""
-    try:
-      with tf.gfile.FastGFile(results_file, 'r') as reader:
-        results = [ast.literal_eval(entry) for entry in reader]
-    except tf.errors.NotFoundError:
-      # No results written to disk yet. Return empty list.
-      return []
-    return results
-
-  def _get_max_local_reps(self, shard_results):
-    """Get maximum number of repetitions the given shard needs to complete.
-
-    Worker working on each shard needs to complete a certain number of runs
-    before it finishes. This method will return that number so that we can
-    determine which shards are still not done.
-
-    We assume that workers are including a 'max_local_repetitions' value in
-    their results, which should be the total number of repetitions it needs to
-    run.
-
-    Args:
-      shard_results: Dict mapping metric names to values. This should be read
-          from a shard on disk.
-
-    Returns:
-      Maximum number of repetitions the given shard needs to complete.
-    """
-    mlrs = [r['max_local_repetitions'] for r in shard_results]
-    if not mlrs:
-      return 0
-    for n in mlrs[1:]:
-      assert n == mlrs[0], 'Some reps have different max rep.'
-    return mlrs[0]
-
-  def read_all(self, num_shards=None):
-    """Read results across all shards, i.e. get global results list.
-
-    Args:
-      num_shards: (optional) specifies total number of shards. If the caller
-          wants information about which shards are incomplete, provide this
-          argument (so that shards which have yet to be created are still
-          counted as incomplete shards). Otherwise, no information about
-          incomplete shards will be returned.
-
-    Returns:
-      aggregate: Global list of results (across all shards).
-      shard_stats: List of ShardStats instances, one for each shard. Or None if
-          `num_shards` is None.
-    """
-    try:
-      all_children = tf.gfile.ListDirectory(self.log_dir)
-    except tf.errors.NotFoundError:
-      if num_shards is None:
-        return [], None
-      return [], [[] for _ in xrange(num_shards)]
-    shard_ids = {
-        get_shard_id(fname): fname
-        for fname in all_children if re.search(self.search_regex, fname)}
-
-    if num_shards is None:
-      aggregate = []
-      shard_stats = None
-      for results_file in shard_ids.values():
-        aggregate.extend(self._read_shard(
-            os.path.join(self.log_dir, results_file)))
-    else:
-      results_per_shard = [None] * num_shards
-      for shard_id in xrange(num_shards):
-        if shard_id in shard_ids:
-          results_file = shard_ids[shard_id]
-          results_per_shard[shard_id] = self._read_shard(
-              os.path.join(self.log_dir, results_file))
-        else:
-          results_per_shard[shard_id] = []
-
-      # Compute shard stats.
-      shard_stats = []
-      for shard_results in results_per_shard:
-        max_local_reps = self._get_max_local_reps(shard_results)
-        shard_stats.append(ShardStats(
-            num_local_reps_completed=len(shard_results),
-            max_local_reps=max_local_reps,
-            finished=ge_non_zero(len(shard_results), max_local_reps)))
-
-      # Compute aggregate.
-      aggregate = [
-          r for shard_results in results_per_shard for r in shard_results]
-
-    return aggregate, shard_stats
--- a/research/brain_coder/single_task/results_lib_test.py
+++ b/research/brain_coder/single_task/results_lib_test.py
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-"""Tests for results_lib."""
-
-import contextlib
-import os
-import shutil
-import tempfile
-from six.moves import xrange
-import tensorflow as tf
-
-from single_task import results_lib  # brain coder
-
-
-@contextlib.contextmanager
-def temporary_directory(suffix='', prefix='tmp', base_path=None):
-  """A context manager to create a temporary directory and clean up on exit.
-
-  The parameters are the same ones expected by tempfile.mkdtemp.
-  The directory will be securely and atomically created.
-  Everything under it will be removed when exiting the context.
-
-  Args:
-    suffix: optional suffix.
-    prefix: options prefix.
-    base_path: the base path under which to create the temporary directory.
-  Yields:
-    The absolute path of the new temporary directory.
-  """
-  temp_dir_path = tempfile.mkdtemp(suffix, prefix, base_path)
-  try:
-    yield temp_dir_path
-  finally:
-    try:
-      shutil.rmtree(temp_dir_path)
-    except OSError as e:
-      if e.message == 'Cannot call rmtree on a symbolic link':
-        # Interesting synthetic exception made up by shutil.rmtree.
-        # Means we received a symlink from mkdtemp.
-        # Also means must clean up the symlink instead.
-        os.unlink(temp_dir_path)
-      else:
-        raise
-
-
-def freeze(dictionary):
-  """Convert dict to hashable frozenset."""
-  return frozenset(dictionary.iteritems())
-
-
-class ResultsLibTest(tf.test.TestCase):
-
-  def testResults(self):
-    with temporary_directory() as logdir:
-      results_obj = results_lib.Results(logdir)
-      self.assertEqual(results_obj.read_this_shard(), [])
-      results_obj.append(
-          {'foo': 1.5, 'bar': 2.5, 'baz': 0})
-      results_obj.append(
-          {'foo': 5.5, 'bar': -1, 'baz': 2})
-      self.assertEqual(
-          results_obj.read_this_shard(),
-          [{'foo': 1.5, 'bar': 2.5, 'baz': 0},
-           {'foo': 5.5, 'bar': -1, 'baz': 2}])
-
-  def testShardedResults(self):
-    with temporary_directory() as logdir:
-      n = 4  # Number of shards.
-      results_objs = [
-          results_lib.Results(logdir, shard_id=i) for i in xrange(n)]
-      for i, robj in enumerate(results_objs):
-        robj.append({'foo': i, 'bar': 1 + i * 2})
-      results_list, _ = results_objs[0].read_all()
-
-      # Check results. Order does not matter here.
-      self.assertEqual(
-          set(freeze(r) for r in results_list),
-          set(freeze({'foo': i, 'bar': 1 + i * 2}) for i in xrange(n)))
-
-
-if __name__ == '__main__':
-  tf.test.main()
--- a/research/brain_coder/single_task/run.py
+++ b/research/brain_coder/single_task/run.py
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-r"""Run training.
-
-Choose training algorithm and task(s) and follow these examples.
-
-Run synchronous policy gradient training locally:
-
-CONFIG="agent=c(algorithm='pg'),env=c(task='reverse')"
-OUT_DIR="/tmp/bf_pg_local"
-rm -rf $OUT_DIR
-bazel run -c opt single_task:run -- \
-    --alsologtostderr \
-    --config="$CONFIG" \
-    --max_npe=0 \
-    --logdir="$OUT_DIR" \
-    --summary_interval=1 \
-    --model_v=0
-learning/brain/tensorboard/tensorboard.sh --port 12345 --logdir "$OUT_DIR"
-
-
-Run genetic algorithm locally:
-
-CONFIG="agent=c(algorithm='ga'),env=c(task='reverse')"
-OUT_DIR="/tmp/bf_ga_local"
-rm -rf $OUT_DIR
-bazel run -c opt single_task:run -- \
-    --alsologtostderr \
-    --config="$CONFIG" \
-    --max_npe=0 \
-    --logdir="$OUT_DIR"
-
-
-Run uniform random search locally:
-
-CONFIG="agent=c(algorithm='rand'),env=c(task='reverse')"
-OUT_DIR="/tmp/bf_rand_local"
-rm -rf $OUT_DIR
-bazel run -c opt single_task:run -- \
-    --alsologtostderr \
-    --config="$CONFIG" \
-    --max_npe=0 \
-    --logdir="$OUT_DIR"
-"""
-
-from absl import app
-from absl import flags
-from absl import logging
-
-from single_task import defaults  # brain coder
-from single_task import ga_train  # brain coder
-from single_task import pg_train  # brain coder
-
-FLAGS = flags.FLAGS
-flags.DEFINE_string('config', '', 'Configuration.')
-flags.DEFINE_string(
-    'logdir', None, 'Absolute path where to write results.')
-flags.DEFINE_integer('task_id', 0, 'ID for this worker.')
-flags.DEFINE_integer('num_workers', 1, 'How many workers there are.')
-flags.DEFINE_integer(
-    'max_npe', 0,
-    'NPE = number of programs executed. Maximum number of programs to execute '
-    'in each run. Training will complete when this threshold is reached. Set '
-    'to 0 for unlimited training.')
-flags.DEFINE_integer(
-    'num_repetitions', 1,
-    'Number of times the same experiment will be run (globally across all '
-    'workers). Each run is independent.')
-flags.DEFINE_string(
-    'log_level', 'INFO',
-    'The threshold for what messages will be logged. One of DEBUG, INFO, WARN, '
-    'ERROR, or FATAL.')
-
-
-# To register an algorithm:
-# 1) Add dependency in the BUILD file to this build rule.
-# 2) Import the algorithm's module at the top of this file.
-# 3) Add a new entry in the following dict. The key is the algorithm name
-#    (used to select the algorithm in the config). The value is the module
-#    defining the expected functions for training and tuning. See the docstring
-#    for `get_namespace` for further details.
-ALGORITHM_REGISTRATION = {
-    'pg': pg_train,
-    'ga': ga_train,
-    'rand': ga_train,
-}
-
-
-def get_namespace(config_string):
-  """Get namespace for the selected algorithm.
-
-  Users who want to add additional algorithm types should modify this function.
-  The algorithm's namespace should contain the following functions:
-    run_training: Run the main training loop.
-    define_tuner_hparam_space: Return the hparam tuning space for the algo.
-    write_hparams_to_config: Helper for tuning. Write hparams chosen for tuning
-        to the Config object.
-  Look at pg_train.py and ga_train.py for function signatures and
-  implementations.
-
-  Args:
-    config_string: String representation of a Config object. This will get
-        parsed into a Config in order to determine what algorithm to use.
-
-  Returns:
-    algorithm_namespace: The module corresponding to the algorithm given in the
-        config.
-    config: The Config object resulting from parsing `config_string`.
-
-  Raises:
-    ValueError: If config.agent.algorithm is not one of the registered
-        algorithms.
-  """
-  config = defaults.default_config_with_updates(config_string)
-  if config.agent.algorithm not in ALGORITHM_REGISTRATION:
-    raise ValueError('Unknown algorithm type "%s"' % (config.agent.algorithm,))
-  else:
-    return ALGORITHM_REGISTRATION[config.agent.algorithm], config
-
-
-def main(argv):
-  del argv  # Unused.
-
-  logging.set_verbosity(FLAGS.log_level)
-
-  flags.mark_flag_as_required('logdir')
-  if FLAGS.num_workers <= 0:
-    raise ValueError('num_workers flag must be greater than 0.')
-  if FLAGS.task_id < 0:
-    raise ValueError('task_id flag must be greater than or equal to 0.')
-  if FLAGS.task_id >= FLAGS.num_workers:
-    raise ValueError(
-        'task_id flag must be strictly less than num_workers flag.')
-
-  ns, _ = get_namespace(FLAGS.config)
-  ns.run_training(is_chief=FLAGS.task_id == 0)
-
-
-if __name__ == '__main__':
-  app.run(main)
--- a/research/brain_coder/single_task/run_eval_tasks.py
+++ b/research/brain_coder/single_task/run_eval_tasks.py
-#!/usr/bin/env python
-from __future__ import print_function
-
-r"""This script can launch any eval experiments from the paper.
-
-This is a script. Run with python, not bazel.
-
-Usage:
-./single_task/run_eval_tasks.py \
-    --exp EXP --desc DESC [--tuning_tasks] [--iclr_tasks] [--task TASK] \
-    [--tasks TASK1 TASK2 ...]
-
-where EXP is one of the keys in `experiments`,
-and DESC is a string description of the set of experiments (such as "v0")
-
-Set only one of these flags:
--tuning_tasks flag only runs tuning tasks.
--iclr_tasks flag only runs the tasks included in the paper.
--regression_tests flag runs tasks which function as regression tests.
--task flag manually selects a single task to run.
--tasks flag takes a custom list of tasks.
-
-Other flags:
--reps N specifies N repetitions per experiment, Default is 25.
--training_replicas R specifies that R workers will be launched to train one
-    task (for neural network algorithms). These workers will update a global
-    model stored on a parameter server. Defaults to 1. If R > 1, a parameter
-    server will also be launched.
-
-
-Run everything:
-exps=( pg-20M pg-topk-20M topk-20M ga-20M rand-20M )
-BIN_DIR="single_task"
-for exp in "${exps[@]}"
-do
-  ./$BIN_DIR/run_eval_tasks.py \
-      --exp "$exp" --iclr_tasks
-done
-"""
-
-import argparse
-from collections import namedtuple
-import subprocess
-
-
-S = namedtuple('S', ['length'])
-default_length = 100
-
-
-iclr_tasks = [
-    'reverse', 'remove-char', 'count-char', 'add', 'bool-logic', 'print-hello',
-    'echo-twice', 'echo-thrice', 'copy-reverse', 'zero-cascade', 'cascade',
-    'shift-left', 'shift-right', 'riffle', 'unriffle', 'middle-char',
-    'remove-last', 'remove-last-two', 'echo-alternating', 'echo-half', 'length',
-    'echo-second-seq', 'echo-nth-seq', 'substring', 'divide-2', 'dedup']
-
-
-regression_test_tasks = ['reverse', 'test-hill-climb']
-
-
-E = namedtuple(
-    'E',
-    ['name', 'method_type', 'config', 'simplify', 'batch_size', 'max_npe'])
-
-
-def make_experiment_settings(name, **kwargs):
-  # Unpack experiment info from name.
-  def split_last(string, char):
-    i = string.rindex(char)
-    return string[:i], string[i+1:]
-  def si_to_int(si_string):
-    return int(
-        si_string.upper().replace('K', '0'*3).replace('M', '0'*6)
-        .replace('G', '0'*9))
-  method_type, max_npe = split_last(name, '-')
-  assert method_type
-  assert max_npe
-  return E(
-      name=name, method_type=method_type, max_npe=si_to_int(max_npe), **kwargs)
-
-
-experiments_set = {
-    make_experiment_settings(
-        'pg-20M',
-        config='entropy_beta=0.05,lr=0.0001,topk_loss_hparam=0.0,topk=0,'
-               'pi_loss_hparam=1.0,alpha=0.0',
-        simplify=False,
-        batch_size=64),
-    make_experiment_settings(
-        'pg-topk-20M',
-        config='entropy_beta=0.01,lr=0.0001,topk_loss_hparam=50.0,topk=10,'
-               'pi_loss_hparam=1.0,alpha=0.0',
-        simplify=False,
-        batch_size=64),
-    make_experiment_settings(
-        'topk-20M',
-        config='entropy_beta=0.01,lr=0.0001,topk_loss_hparam=200.0,topk=10,'
-               'pi_loss_hparam=0.0,alpha=0.0',
-        simplify=False,
-        batch_size=64),
-    make_experiment_settings(
-        'topk-0ent-20M',
-        config='entropy_beta=0.000,lr=0.0001,topk_loss_hparam=200.0,topk=10,'
-               'pi_loss_hparam=0.0,alpha=0.0',
-        simplify=False,
-        batch_size=64),
-    make_experiment_settings(
-        'ga-20M',
-        config='crossover_rate=0.95,mutation_rate=0.15',
-        simplify=False,
-        batch_size=100),  # Population size.
-    make_experiment_settings(
-        'rand-20M',
-        config='',
-        simplify=False,
-        batch_size=1),
-    make_experiment_settings(
-        'simpl-500M',
-        config='entropy_beta=0.05,lr=0.0001,topk_loss_hparam=0.5,topk=10,'
-               'pi_loss_hparam=1.0,alpha=0.0',
-        simplify=True,
-        batch_size=64),
-}
-
-experiments = {e.name: e for e in experiments_set}
-
-
-# pylint: disable=redefined-outer-name
-def parse_args(extra_args=()):
-  """Parse arguments and extract task and experiment info."""
-  parser = argparse.ArgumentParser(description='Run all eval tasks.')
-  parser.add_argument('--exp', required=True)
-  parser.add_argument('--tuning_tasks', action='store_true')
-  parser.add_argument('--iclr_tasks', action='store_true')
-  parser.add_argument('--regression_tests', action='store_true')
-  parser.add_argument('--desc', default='v0')
-  parser.add_argument('--reps', default=25)
-  parser.add_argument('--task')
-  parser.add_argument('--tasks', nargs='+')
-  for arg_string, default in extra_args:
-    parser.add_argument(arg_string, default=default)
-  args = parser.parse_args()
-
-  print('Running experiment: %s' % (args.exp,))
-  if args.desc:
-    print('Extra description: "%s"' % (args.desc,))
-  if args.exp not in experiments:
-    raise ValueError('Experiment name is not valid')
-  experiment_name = args.exp
-  experiment_settings = experiments[experiment_name]
-  assert experiment_settings.name == experiment_name
-
-  if args.tasks:
-    print('Launching tasks from args: %s' % (args.tasks,))
-    tasks = {t: S(length=default_length) for t in args.tasks}
-  elif args.task:
-    print('Launching single task "%s"' % args.task)
-    tasks = {args.task: S(length=default_length)}
-  elif args.tuning_tasks:
-    print('Only running tuning tasks')
-    tasks = {name: S(length=default_length)
-             for name in ['reverse-tune', 'remove-char-tune']}
-  elif args.iclr_tasks:
-    print('Running eval tasks from ICLR paper.')
-    tasks = {name: S(length=default_length) for name in iclr_tasks}
-  elif args.regression_tests:
-    tasks = {name: S(length=default_length) for name in regression_test_tasks}
-  print('Tasks: %s' % tasks.keys())
-
-  print('reps = %d' % (int(args.reps),))
-
-  return args, tasks, experiment_settings
-
-
-def run(command_string):
-  subprocess.call(command_string, shell=True)
-
-
-if __name__ == '__main__':
-  LAUNCH_TRAINING_COMMAND = 'single_task/launch_training.sh'
-  COMPILE_COMMAND = 'bazel build -c opt single_task:run.par'
-
-  args, tasks, experiment_settings = parse_args(
-      extra_args=(('--training_replicas', 1),))
-
-  if experiment_settings.method_type in (
-      'pg', 'pg-topk', 'topk', 'topk-0ent', 'simpl'):
-    # Runs PG and TopK.
-
-    def make_run_cmd(job_name, task, max_npe, num_reps, code_length,
-                     batch_size, do_simplify, custom_config_str):
-      """Constructs terminal command for launching NN based algorithms.
-
-      The arguments to this function will be used to create config for the
-      experiment.
-
-      Args:
-        job_name: Name of the job to launch. Should uniquely identify this
-            experiment run.
-        task: Name of the coding task to solve.
-        max_npe: Maximum number of programs executed. An integer.
-        num_reps: Number of times to run the experiment. An integer.
-        code_length: Maximum allowed length of synthesized code.
-        batch_size: Minibatch size for gradient descent.
-        do_simplify: Whether to run the experiment in code simplification mode.
-            A bool.
-        custom_config_str: Additional config for the model config string.
-
-      Returns:
-        The terminal command that launches the specified experiment.
-      """
-      config = """
-        env=c(task='{0}',correct_syntax=False),
-        agent=c(
-          algorithm='pg',
-          policy_lstm_sizes=[35,35],value_lstm_sizes=[35,35],
-          grad_clip_threshold=50.0,param_init_factor=0.5,regularizer=0.0,
-          softmax_tr=1.0,optimizer='rmsprop',ema_baseline_decay=0.99,
-          eos_token={3},{4}),
-        timestep_limit={1},batch_size={2}
-      """.replace(' ', '').replace('\n', '').format(
-          task, code_length, batch_size, do_simplify, custom_config_str)
-      num_ps = 0 if args.training_replicas == 1 else 1
-      return (
-          r'{0} --job_name={1} --config="{2}" --max_npe={3} '
-          '--num_repetitions={4} --num_workers={5} --num_ps={6} '
-          '--stop_on_success={7}'
-          .format(LAUNCH_TRAINING_COMMAND, job_name, config, max_npe, num_reps,
-                  args.training_replicas, num_ps, str(not do_simplify).lower()))
-
-  else:
-    # Runs GA and Rand.
-    assert experiment_settings.method_type in ('ga', 'rand')
-
-    def make_run_cmd(job_name, task, max_npe, num_reps, code_length,
-                     batch_size, do_simplify, custom_config_str):
-      """Constructs terminal command for launching GA or uniform random search.
-
-      The arguments to this function will be used to create config for the
-      experiment.
-
-      Args:
-        job_name: Name of the job to launch. Should uniquely identify this
-            experiment run.
-        task: Name of the coding task to solve.
-        max_npe: Maximum number of programs executed. An integer.
-        num_reps: Number of times to run the experiment. An integer.
-        code_length: Maximum allowed length of synthesized code.
-        batch_size: Minibatch size for gradient descent.
-        do_simplify: Whether to run the experiment in code simplification mode.
-            A bool.
-        custom_config_str: Additional config for the model config string.
-
-      Returns:
-        The terminal command that launches the specified experiment.
-      """
-      assert not do_simplify
-      if custom_config_str:
-        custom_config_str = ',' + custom_config_str
-      config = """
-        env=c(task='{0}',correct_syntax=False),
-        agent=c(
-          algorithm='{4}'
-          {3}),
-        timestep_limit={1},batch_size={2}
-      """.replace(' ', '').replace('\n', '').format(
-          task, code_length, batch_size, custom_config_str,
-          experiment_settings.method_type)
-      num_workers = num_reps  # Do each rep in parallel.
-      return (
-          r'{0} --job_name={1} --config="{2}" --max_npe={3} '
-          '--num_repetitions={4} --num_workers={5} --num_ps={6} '
-          '--stop_on_success={7}'
-          .format(LAUNCH_TRAINING_COMMAND, job_name, config, max_npe, num_reps,
-                  num_workers, 0, str(not do_simplify).lower()))
-
-  print('Compiling...')
-  run(COMPILE_COMMAND)
-
-  print('Launching %d coding tasks...' % len(tasks))
-  for task, task_settings in tasks.iteritems():
-    name = 'bf_rl_iclr'
-    desc = '{0}.{1}_{2}'.format(args.desc, experiment_settings.name, task)
-    job_name = '{}.{}'.format(name, desc)
-    print('Job name: %s' % job_name)
-    reps = int(args.reps) if not experiment_settings.simplify else 1
-    run_cmd = make_run_cmd(
-        job_name, task, experiment_settings.max_npe, reps,
-        task_settings.length, experiment_settings.batch_size,
-        experiment_settings.simplify,
-        experiment_settings.config)
-    print('Running command:\n' + run_cmd)
-    run(run_cmd)
-
-  print('Done.')
-# pylint: enable=redefined-outer-name
--- a/research/brain_coder/single_task/test_tasks.py
+++ b/research/brain_coder/single_task/test_tasks.py
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-"""Tasks that test correctness of algorithms."""
-
-from six.moves import xrange
-from common import reward as reward_lib  # brain coder
-from single_task import misc  # brain coder
-
-
-class BasicTaskManager(object):
-  """Wraps a generic reward function."""
-
-  def __init__(self, reward_fn):
-    self.reward_fn = reward_fn
-    self.good_reward = 1.0
-
-  def _score_string(self, string):
-    actions = misc.bf_string_to_tokens(string)
-    reward, correct = self.reward_fn(actions)
-    return misc.RewardInfo(
-        episode_rewards=[0.0] * (len(string) - 1) + [reward],
-        input_case=None,
-        correct_output=None,
-        code_output=actions,
-        input_type=None,
-        output_type=misc.IOType.integer,
-        reason='correct' if correct else 'wrong')
-
-  def rl_batch(self, batch_size):
-    reward_fns = [self._score_string] * batch_size
-    return reward_fns
-
-
-class Trie(object):
-  """Trie for sequences."""
-  EOS = ()
-
-  def __init__(self):
-    self.trie = {}
-
-  def insert(self, sequence):
-    d = self.trie
-    for e in sequence:
-      if e not in d:
-        d[e] = {}
-      d = d[e]
-    d[self.EOS] = True   # Terminate sequence.
-
-  def prefix_match(self, sequence):
-    """Return prefix of `sequence` which exists in the trie."""
-    d = self.trie
-    index = 0
-    for i, e in enumerate(sequence + [self.EOS]):
-      index = i
-      if e in d:
-        d = d[e]
-        if e == self.EOS:
-          return sequence, True
-      else:
-        break
-    return sequence[:index], False
-
-  def next_choices(self, sequence):
-    d = self.trie
-    for e in sequence:
-      if e in d:
-        d = d[e]
-      else:
-        raise ValueError('Sequence not a prefix: %s' % (sequence,))
-    return d.keys()
-
-
-class HillClimbingTask(object):
-  """Simple task that tests reward hill climbing ability.
-
-  There are a set of paths (sequences of tokens) which are rewarded. The total
-  reward for a path is proportional to its length, so the longest path is the
-  target. Shorter paths can be dead ends.
-  """
-
-  def __init__(self):
-    # Paths are sequences of sub-sequences. Here we form unique sub-sequences
-    # out of 3 arbitrary ints. We use sub-sequences instead of single entities
-    # to make the task harder by making the episodes last longer, i.e. more
-    # for the agent to remember.
-    a = (1, 2, 3)
-    b = (4, 5, 6)
-    c = (7, 8, 7)
-    d = (6, 5, 4)
-    e = (3, 2, 1)
-    f = (8, 5, 1)
-    g = (6, 4, 2)
-    h = (1, 8, 3)
-    self.paths = Trie()
-    self.paths.insert([a, b, h])
-    self.paths.insert([a, b, c, d, e, f, g, h])
-    self.paths.insert([a, b, c, d, e, b, a])
-    self.paths.insert([a, b, g, h])
-    self.paths.insert([a, e, f, g])
-    self.correct_sequence = misc.flatten([a, b, c, d, e, f, g, h])
-
-    def distance_fn(a, b):
-      len_diff = abs(len(a) - len(b))
-      return sum(reward_lib.mod_abs_diff(ai - 1, bi - 1, 8)
-                 for ai, bi in zip(a, b)) + len_diff * 4  # 8 / 2 = 4
-    self.distance_fn = distance_fn
-
-  def __call__(self, actions):
-    # Compute reward for action sequence.
-    actions = [a for a in actions if a > 0]
-    sequence = [tuple(actions[i: i + 3]) for i in xrange(0, len(actions), 3)]
-    prefix, complete = self.paths.prefix_match(sequence)
-    if complete:
-      return float(len(prefix)), actions == self.correct_sequence
-    if len(prefix) == len(sequence):
-      return float(len(prefix)), False
-    next_pred = sequence[len(prefix)]
-    choices = self.paths.next_choices(prefix)
-    if choices == [()]:
-      return (len(prefix) - len(next_pred) / 3.0), False
-    min_dist = min(self.distance_fn(c, next_pred) for c in choices)
-    # +1 reward for each element in the sequence correct, plus fraction torwards
-    # closest next element.
-    # Maximum distance possible is num_actions * base / 2 = 3 * 8 / 2 = 12
-    return (len(prefix) + (1 - min_dist / 12.0)), False
--- a/research/brain_coder/single_task/test_tasks_test.py
+++ b/research/brain_coder/single_task/test_tasks_test.py
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-"""Tests for test_tasks."""
-
-import numpy as np
-import tensorflow as tf
-
-from single_task import misc  # brain coder
-from single_task import test_tasks  # brain coder
-
-
-def get_reward(reward_fn, candidate):
-  return sum(reward_fn(misc.bf_tokens_to_string(candidate)).episode_rewards)
-
-
-class TestTasksTest(tf.test.TestCase):
-
-  def testHillClimbingTask(self):
-    task = test_tasks.BasicTaskManager(test_tasks.HillClimbingTask())
-    reward_fns = task.rl_batch(1)
-    reward_fn = reward_fns[0]
-    self.assertTrue(np.isclose(get_reward(reward_fn, [1, 2, 0]), 8 / 12.))
-    self.assertTrue(np.isclose(get_reward(reward_fn, [1, 2, 2, 0]), 11 / 12.))
-    self.assertTrue(np.isclose(get_reward(reward_fn, [1, 2, 3, 0]), 1.0))
-    self.assertTrue(
-        np.isclose(get_reward(reward_fn, [1, 2, 3, 4, 5, 2, 0]), 1. + 8 / 12.))
-    self.assertTrue(
-        np.isclose(get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 0]), 2.0))
-    self.assertTrue(
-        np.isclose(get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 1, 8, 3, 0]), 3.0))
-    self.assertTrue(
-        np.isclose(get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 7, 8, 7, 0]), 3.0))
-    self.assertTrue(
-        np.isclose(get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 1, 8, 3, 1, 0]),
-                   3.0 - 4 / 12.))
-    self.assertTrue(
-        np.isclose(
-            get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 1, 8, 3, 1, 1, 1, 1, 0]),
-            2.0))
-    self.assertTrue(
-        np.isclose(get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 7, 8, 7, 3, 0]),
-                   3.0 + 1 / 12.))
-    self.assertTrue(
-        np.isclose(
-            get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 7, 8, 7, 6, 5, 4, 3, 2, 1,
-                                   8, 5, 1, 6, 4, 2, 1, 8, 3, 0]),
-            8.0))
-    self.assertTrue(
-        np.isclose(
-            get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 7, 8, 7, 6, 5, 4, 3, 2, 1,
-                                   8, 5, 1, 6, 4, 2, 1, 8, 3, 1, 1, 0]),
-            8.0 - 8 / 12.))
-    self.assertTrue(
-        np.isclose(get_reward(reward_fn, [1, 2, 3, 4, 5, 6, 7, 8, 7, 6, 5, 4, 3,
-                                          2, 1, 8, 5, 1, 6, 4, 2, 1, 8, 3, 1, 1,
-                                          1, 1, 1, 1, 1, 0]),
-                   7.0))
-
-
-if __name__ == '__main__':
-  tf.test.main()
--- a/research/brain_coder/single_task/tune.py
+++ b/research/brain_coder/single_task/tune.py
-from __future__ import absolute_import
-from __future__ import division
-from __future__ import print_function
-
-r"""Run grid search.
-
-Look at launch_tuning.sh for details on how to tune at scale.
-
-Usage example:
-Tune with one worker on the local machine.
-
-CONFIG="agent=c(algorithm='pg'),"
-CONFIG+="env=c(task_cycle=['reverse-tune', 'remove-tune'])"
-HPARAM_SPACE_TYPE="pg"
-OUT_DIR="/tmp/bf_pg_tune"
-MAX_NPE=5000000
-NUM_REPETITIONS=50
-rm -rf $OUT_DIR
-mkdir $OUT_DIR
-bazel run -c opt single_task:tune -- \
-    --alsologtostderr \
-    --config="$CONFIG" \
-    --max_npe="$MAX_NPE" \
-    --num_repetitions="$NUM_REPETITIONS" \
-    --logdir="$OUT_DIR" \
-    --summary_interval=1 \
-    --model_v=0 \
-    --hparam_space="$HPARAM_SPACE_TYPE" \
-    --tuner_id=0 \
-    --num_tuners=1 \
-    2>&1 >"$OUT_DIR/tuner_0.log"
-learning/brain/tensorboard/tensorboard.sh --port 12345 --logdir "$OUT_DIR"
-"""
-
-import ast
-import os
-
-from absl import app
-from absl import flags
-from absl import logging
-import numpy as np
-from six.moves import xrange
-import tensorflow as tf
-
-from single_task import defaults  # brain coder
-from single_task import run as run_lib  # brain coder
-
-FLAGS = flags.FLAGS
-flags.DEFINE_integer(
-    'tuner_id', 0,
-    'The unique ID for this tuning worker.')
-flags.DEFINE_integer(
-    'num_tuners', 1,
-    'How many tuners are there.')
-flags.DEFINE_string(
-    'hparam_space', 'default',
-    'String name which denotes the hparam space to tune over. This is '
-    'algorithm dependent.')
-flags.DEFINE_string(
-    'fixed_hparams', '',
-    'HParams string. Used to fix hparams during tuning.')
-flags.DEFINE_float(
-    'success_rate_objective_weight', 1.0,
-    'How much to weight success rate vs num programs seen. By default, only '
-    'success rate is optimized (this is the setting used in the paper).')
-
-
-def parse_hparams_string(hparams_str):
-  hparams = {}
-  for term in hparams_str.split(','):
-    if not term:
-      continue
-    name, value = term.split('=')
-    hparams[name.strip()] = ast.literal_eval(value)
-  return hparams
-
-
-def int_to_multibase(n, bases):
-  digits = [0] * len(bases)
-  for i, b in enumerate(bases):
-    n, d = divmod(n, b)
-    digits[i] = d
-  return digits
-
-
-def hparams_for_index(index, tuning_space):
-  keys = sorted(tuning_space.keys())
-  indices = int_to_multibase(index, [len(tuning_space[k]) for k in keys])
-  return tf.contrib.training.HParams(
-      **{k: tuning_space[k][i] for k, i in zip(keys, indices)})
-
-
-def run_tuner_loop(ns):
-  """Run tuning loop for this worker."""
-  is_chief = FLAGS.task_id == 0
-  tuning_space = ns.define_tuner_hparam_space(
-      hparam_space_type=FLAGS.hparam_space)
-  fixed_hparams = parse_hparams_string(FLAGS.fixed_hparams)
-  for name, value in fixed_hparams.iteritems():
-    tuning_space[name] = [value]
-  tuning_space_size = np.prod([len(values) for values in tuning_space.values()])
-
-  num_local_trials, remainder = divmod(tuning_space_size, FLAGS.num_tuners)
-  if FLAGS.tuner_id < remainder:
-    num_local_trials += 1
-  starting_trial_id = (
-      num_local_trials * FLAGS.tuner_id + min(remainder, FLAGS.tuner_id))
-
-  logging.info('tuning_space_size: %d', tuning_space_size)
-  logging.info('num_local_trials: %d', num_local_trials)
-  logging.info('starting_trial_id: %d', starting_trial_id)
-
-  for local_trial_index in xrange(num_local_trials):
-    trial_config = defaults.default_config_with_updates(FLAGS.config)
-    global_trial_index = local_trial_index + starting_trial_id
-    trial_name = 'trial_' + str(global_trial_index)
-    trial_dir = os.path.join(FLAGS.logdir, trial_name)
-    hparams = hparams_for_index(global_trial_index, tuning_space)
-    ns.write_hparams_to_config(
-        trial_config, hparams, hparam_space_type=FLAGS.hparam_space)
-
-    results_list = ns.run_training(
-        config=trial_config, tuner=None, logdir=trial_dir, is_chief=is_chief,
-        trial_name=trial_name)
-
-    if not is_chief:
-      # Only chief worker needs to write tuning results to disk.
-      continue
-
-    objective, metrics = compute_tuning_objective(
-        results_list, hparams, trial_name, num_trials=tuning_space_size)
-    logging.info('metrics:\n%s', metrics)
-    logging.info('objective: %s', objective)
-    logging.info('programs_seen_fraction: %s',
-                 metrics['programs_seen_fraction'])
-    logging.info('success_rate: %s', metrics['success_rate'])
-    logging.info('success_rate_objective_weight: %s',
-                 FLAGS.success_rate_objective_weight)
-
-    tuning_results_file = os.path.join(trial_dir, 'tuning_results.txt')
-    with tf.gfile.FastGFile(tuning_results_file, 'a') as writer:
-      writer.write(str(metrics) + '\n')
-
-    logging.info('Trial %s complete.', trial_name)
-
-
-def compute_tuning_objective(results_list, hparams, trial_name, num_trials):
-  """Compute tuning objective and metrics given results and trial information.
-
-  Args:
-    results_list: List of results dicts read from disk. These are written by
-        workers.
-    hparams: tf.contrib.training.HParams instance containing the hparams used
-        in this trial (only the hparams which are being tuned).
-    trial_name: Name of this trial. Used to create a trial directory.
-    num_trials: Total number of trials that need to be run. This is saved in the
-        metrics dict for future reference.
-
-  Returns:
-    objective: The objective computed for this trial. Choose the hparams for the
-        trial with the largest objective value.
-    metrics: Information about this trial. A dict.
-  """
-  found_solution = [r['found_solution'] for r in results_list]
-  successful_program_counts = [
-      r['npe'] for r in results_list if r['found_solution']]
-
-  success_rate = sum(found_solution) / float(len(results_list))
-
-  max_programs = FLAGS.max_npe  # Per run.
-  all_program_counts = [
-      r['npe'] if r['found_solution'] else max_programs
-      for r in results_list]
-  programs_seen_fraction = (
-      float(sum(all_program_counts))
-      / (max_programs * len(all_program_counts)))
-
-  # min/max/avg stats are over successful runs.
-  metrics = {
-      'num_runs': len(results_list),
-      'num_succeeded': sum(found_solution),
-      'success_rate': success_rate,
-      'programs_seen_fraction': programs_seen_fraction,
-      'avg_programs': np.mean(successful_program_counts),
-      'max_possible_programs_per_run': max_programs,
-      'global_step': sum([r['num_batches'] for r in results_list]),
-      'hparams': hparams.values(),
-      'trial_name': trial_name,
-      'num_trials': num_trials}
-
-  # Report stats per tasks.
-  tasks = [r['task'] for r in results_list]
-  for task in set(tasks):
-    task_list = [r for r in results_list if r['task'] == task]
-    found_solution = [r['found_solution'] for r in task_list]
-    successful_rewards = [
-        r['best_reward'] for r in task_list
-        if r['found_solution']]
-    successful_num_batches = [
-        r['num_batches']
-        for r in task_list if r['found_solution']]
-    successful_program_counts = [
-        r['npe'] for r in task_list if r['found_solution']]
-    metrics_append = {
-        task + '__num_runs': len(task_list),
-        task + '__num_succeeded': sum(found_solution),
-        task + '__success_rate': (
-            sum(found_solution) / float(len(task_list)))}
-    metrics.update(metrics_append)
-    if any(found_solution):
-      metrics_append = {
-          task + '__min_reward': min(successful_rewards),
-          task + '__max_reward': max(successful_rewards),
-          task + '__avg_reward': np.median(successful_rewards),
-          task + '__min_programs': min(successful_program_counts),
-          task + '__max_programs': max(successful_program_counts),
-          task + '__avg_programs': np.mean(successful_program_counts),
-          task + '__min_batches': min(successful_num_batches),
-          task + '__max_batches': max(successful_num_batches),
-          task + '__avg_batches': np.mean(successful_num_batches)}
-      metrics.update(metrics_append)
-
-  # Objective will be maximized.
-  # Maximize success rate, minimize num programs seen.
-  # Max objective is always 1.
-  weight = FLAGS.success_rate_objective_weight
-  objective = (
-      weight * success_rate
-      + (1 - weight) * (1 - programs_seen_fraction))
-  metrics['objective'] = objective
-
-  return objective, metrics
-
-
-def main(argv):
-  del argv
-
-  logging.set_verbosity(FLAGS.log_level)
-
-  if not FLAGS.logdir:
-    raise ValueError('logdir flag must be provided.')
-  if FLAGS.num_workers <= 0:
-    raise ValueError('num_workers flag must be greater than 0.')
-  if FLAGS.task_id < 0:
-    raise ValueError('task_id flag must be greater than or equal to 0.')
-  if FLAGS.task_id >= FLAGS.num_workers:
-    raise ValueError(
-        'task_id flag must be strictly less than num_workers flag.')
-  if FLAGS.num_tuners <= 0:
-    raise ValueError('num_tuners flag must be greater than 0.')
-  if FLAGS.tuner_id < 0:
-    raise ValueError('tuner_id flag must be greater than or equal to 0.')
-  if FLAGS.tuner_id >= FLAGS.num_tuners:
-    raise ValueError(
-        'tuner_id flag must be strictly less than num_tuners flag.')
-
-  ns, _ = run_lib.get_namespace(FLAGS.config)
-  run_tuner_loop(ns)
-
-
-if __name__ == '__main__':
-  app.run(main)
--- a/research/cognitive_mapping_and_planning/.gitignore
+++ b/research/cognitive_mapping_and_planning/.gitignore
-deps
-*.pyc
-lib*.so
-lib*.so*
--- a/research/cognitive_mapping_and_planning/README.md
+++ b/research/cognitive_mapping_and_planning/README.md
-![No Maintenance Intended](https://img.shields.io/badge/No%20Maintenance%20Intended-%E2%9C%95-red.svg)
-![TensorFlow Requirement: 1.x](https://img.shields.io/badge/TensorFlow%20Requirement-1.x-brightgreen)
-![TensorFlow 2 Not Supported](https://img.shields.io/badge/TensorFlow%202%20Not%20Supported-%E2%9C%95-red.svg)
-
-# Cognitive Mapping and Planning for Visual Navigation
-**Saurabh Gupta, James Davidson, Sergey Levine, Rahul Sukthankar, Jitendra Malik**
-
-**Computer Vision and Pattern Recognition (CVPR) 2017.**
-
-**[ArXiv](https://arxiv.org/abs/1702.03920), 
-[Project Website](https://sites.google.com/corp/view/cognitive-mapping-and-planning/)**
-
-### Citing
-If you find this code base and models useful in your research, please consider
-citing the following paper:
-  ```
-  @inproceedings{gupta2017cognitive,
-    title={Cognitive Mapping and Planning for Visual Navigation},
-    author={Gupta, Saurabh and Davidson, James and Levine, Sergey and
-      Sukthankar, Rahul and Malik, Jitendra},
-    booktitle={CVPR},
-    year={2017}
-  }
-  ```
-
-### Contents
-1.  [Requirements: software](#requirements-software)
-2.  [Requirements: data](#requirements-data)
-3.  [Test Pre-trained Models](#test-pre-trained-models)
-4.  [Train your Own Models](#train-your-own-models)
-
-### Requirements: software
-1.  Python Virtual Env Setup: All code is implemented in Python but depends on a
-    small number of python packages and a couple of C libraries. We recommend
-    using virtual environment for installing these python packages and python
-    bindings for these C libraries.
-      ```Shell
-      VENV_DIR=venv
-      pip install virtualenv
-      virtualenv $VENV_DIR
-      source $VENV_DIR/bin/activate
-      
-      # You may need to upgrade pip for installing openv-python.
-      pip install --upgrade pip
-      # Install simple dependencies.
-      pip install -r requirements.txt
-
-      # Patch bugs in dependencies.
-      sh patches/apply_patches.sh
-      ```
-
-2.  Install [Tensorflow](https://www.tensorflow.org/) inside this virtual
-    environment. You will need to use one of the latest nightly builds 
-    (see instructions [here](https://github.com/tensorflow/tensorflow#installation)).
-
-3.  Swiftshader: We use
-    [Swiftshader](https://github.com/google/swiftshader.git), a CPU based
-    renderer to render the meshes.  It is possible to use other renderers,
-    replace `SwiftshaderRenderer` in `render/swiftshader_renderer.py` with
-    bindings to your renderer. 
-    ```Shell
-    mkdir -p deps
-    git clone --recursive https://github.com/google/swiftshader.git deps/swiftshader-src
-    cd deps/swiftshader-src && git checkout 91da6b00584afd7dcaed66da88e2b617429b3950
-    git submodule update
-    mkdir build && cd build && cmake .. && make -j 16 libEGL libGLESv2
-    cd ../../../
-    cp deps/swiftshader-src/build/libEGL* libEGL.so.1
-    cp deps/swiftshader-src/build/libGLESv2* libGLESv2.so.2
-    ```
-
-4.  PyAssimp: We use [PyAssimp](https://github.com/assimp/assimp.git) to load
-    meshes.  It is possible to use other libraries to load meshes, replace
-    `Shape` `render/swiftshader_renderer.py` with bindings to your library for
-    loading meshes. 
-    ```Shell
-    mkdir -p deps
-    git clone https://github.com/assimp/assimp.git deps/assimp-src
-    cd deps/assimp-src
-    git checkout 2afeddd5cb63d14bc77b53740b38a54a97d94ee8
-    cmake CMakeLists.txt -G 'Unix Makefiles' && make -j 16
-    cd port/PyAssimp && python setup.py install
-    cd ../../../..
-    cp deps/assimp-src/lib/libassimp* .
-    ```
-
-5.  graph-tool: We use [graph-tool](https://git.skewed.de/count0/graph-tool)
-    library for graph processing.
-    ```Shell
-    mkdir -p deps
-    # If the following git clone command fails, you can also download the source
-    # from https://downloads.skewed.de/graph-tool/graph-tool-2.2.44.tar.bz2
-    git clone https://git.skewed.de/count0/graph-tool deps/graph-tool-src
-    cd deps/graph-tool-src && git checkout 178add3a571feb6666f4f119027705d95d2951ab
-    bash autogen.sh
-    ./configure --disable-cairo --disable-sparsehash --prefix=$HOME/.local
-    make -j 16
-    make install
-    cd ../../
-    ```
-
-### Requirements: data
-1.  Download the Stanford 3D Indoor Spaces Dataset (S3DIS Dataset) and ImageNet
-    Pre-trained models for initializing different models. Follow instructions in
-    `data/README.md`
-
-### Test Pre-trained Models
-1.  Download pre-trained models. See `output/README.md`.
-
-2.  Test models using `scripts/script_test_pretrained_models.sh`.
-
-### Train Your Own Models
-All models were trained asynchronously with 16 workers each worker using data
-from a single floor. The default hyper-parameters correspond to this setting.
-See [distributed training with
-Tensorflow](https://www.tensorflow.org/deploy/distributed) for setting up
-distributed training. Training with a single worker is possible with the current
-code base but will require some minor changes to allow each worker to load all
-training environments.
-
-### Contact
-For questions or issues open an issue on the tensorflow/models [issues
-tracker](https://github.com/tensorflow/models/issues). Please assign issues to
-@s-gupta.
-
-### Credits
-This code was written by Saurabh Gupta (@s-gupta).
--- a/research/cognitive_mapping_and_planning/__init__.py
+++ b/research/cognitive_mapping_and_planning/__init__.py
--- a/research/cognitive_mapping_and_planning/cfgs/__init__.py
+++ b/research/cognitive_mapping_and_planning/cfgs/__init__.py
--- a/research/cognitive_mapping_and_planning/cfgs/config_cmp.py
+++ b/research/cognitive_mapping_and_planning/cfgs/config_cmp.py
-# Copyright 2016 The TensorFlow Authors All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-
-import os, sys
-import numpy as np
-from tensorflow.python.platform import app
-from tensorflow.python.platform import flags
-import logging
-import src.utils as utils
-import cfgs.config_common as cc
-
-
-import tensorflow as tf
-
-
-rgb_resnet_v2_50_path = 'data/init_models/resnet_v2_50/model.ckpt-5136169'
-d_resnet_v2_50_path = 'data/init_models/distill_rgb_to_d_resnet_v2_50/model.ckpt-120002'
-
-def get_default_args():
-  summary_args = utils.Foo(display_interval=1, test_iters=26,
-                           arop_full_summary_iters=14)
-
-  control_args = utils.Foo(train=False, test=False,
-                           force_batchnorm_is_training_at_test=False,
-                           reset_rng_seed=False, only_eval_when_done=False,
-                           test_mode=None)
-  return summary_args, control_args
-
-def get_default_cmp_args():
-  batch_norm_param = {'center': True, 'scale': True,
-                      'activation_fn':tf.nn.relu}
-
-  mapper_arch_args = utils.Foo(
-      dim_reduce_neurons=64,
-      fc_neurons=[1024, 1024],
-      fc_out_size=8,
-      fc_out_neurons=64,
-      encoder='resnet_v2_50',
-      deconv_neurons=[64, 32, 16, 8, 4, 2],
-      deconv_strides=[2, 2, 2, 2, 2, 2],
-      deconv_layers_per_block=2,
-      deconv_kernel_size=4,
-      fc_dropout=0.5,
-      combine_type='wt_avg_logits',
-      batch_norm_param=batch_norm_param)
-
-  readout_maps_arch_args = utils.Foo(
-      num_neurons=[],
-      strides=[],
-      kernel_size=None,
-      layers_per_block=None)
-
-  arch_args = utils.Foo(
-      vin_val_neurons=8, vin_action_neurons=8, vin_ks=3, vin_share_wts=False,
-      pred_neurons=[64, 64], pred_batch_norm_param=batch_norm_param,
-      conv_on_value_map=0, fr_neurons=16, fr_ver='v2', fr_inside_neurons=64,
-      fr_stride=1, crop_remove_each=30, value_crop_size=4,
-      action_sample_type='sample', action_sample_combine_type='one_or_other',
-      sample_gt_prob_type='inverse_sigmoid_decay', dagger_sample_bn_false=True,
-      vin_num_iters=36, isd_k=750., use_agent_loc=False, multi_scale=True,
-      readout_maps=False, rom_arch=readout_maps_arch_args)
-
-  return arch_args, mapper_arch_args
-
-def get_arch_vars(arch_str):
-  if arch_str == '': vals = []
-  else: vals = arch_str.split('_')
-  ks = ['var1', 'var2', 'var3']
-  ks = ks[:len(vals)]
-  
-  # Exp Ver.
-  if len(vals) == 0: ks.append('var1'); vals.append('v0')
-  # custom arch.
-  if len(vals) == 1: ks.append('var2'); vals.append('')
-  # map scape for projection baseline.
-  if len(vals) == 2: ks.append('var3'); vals.append('fr2')
-
-  assert(len(vals) == 3)
-
-  vars = utils.Foo()
-  for k, v in zip(ks, vals):
-    setattr(vars, k, v)
-
-  logging.error('arch_vars: %s', vars)
-  return vars
-
-def process_arch_str(args, arch_str):
-  # This function modifies args.
-  args.arch, args.mapper_arch = get_default_cmp_args()
-
-  arch_vars = get_arch_vars(arch_str)
-
-  args.navtask.task_params.outputs.ego_maps = True
-  args.navtask.task_params.outputs.ego_goal_imgs = True
-  args.navtask.task_params.outputs.egomotion = True
-  args.navtask.task_params.toy_problem = False
-
-  if arch_vars.var1 == 'lmap':
-    args = process_arch_learned_map(args, arch_vars)
-
-  elif arch_vars.var1 == 'pmap':
-    args = process_arch_projected_map(args, arch_vars)
-
-  else:
-    logging.fatal('arch_vars.var1 should be lmap or pmap, but is %s', arch_vars.var1)
-    assert(False)
-
-  return args
-
-def process_arch_learned_map(args, arch_vars):
-  # Multiscale vision based system.
-  args.navtask.task_params.input_type = 'vision'
-  args.navtask.task_params.outputs.images = True
-  
-  if args.navtask.camera_param.modalities[0] == 'rgb':
-    args.solver.pretrained_path = rgb_resnet_v2_50_path
-  elif args.navtask.camera_param.modalities[0] == 'depth':
-    args.solver.pretrained_path = d_resnet_v2_50_path
-
-  if arch_vars.var2 == 'Ssc':
-    sc = 1./args.navtask.task_params.step_size
-    args.arch.vin_num_iters = 40
-    args.navtask.task_params.map_scales = [sc]
-    max_dist = args.navtask.task_params.max_dist * \
-        args.navtask.task_params.num_goals
-    args.navtask.task_params.map_crop_sizes = [2*max_dist]
-
-    args.arch.fr_stride = 1
-    args.arch.vin_action_neurons = 8
-    args.arch.vin_val_neurons = 3
-    args.arch.fr_inside_neurons = 32
-
-    args.mapper_arch.pad_map_with_zeros_each = [24]
-    args.mapper_arch.deconv_neurons = [64, 32, 16]
-    args.mapper_arch.deconv_strides = [1, 2, 1]
-
-  elif (arch_vars.var2 == 'Msc' or arch_vars.var2 == 'MscROMms' or
-        arch_vars.var2 == 'MscROMss' or arch_vars.var2 == 'MscNoVin'):
-    # Code for multi-scale planner.
-    args.arch.vin_num_iters = 8
-    args.arch.crop_remove_each = 4
-    args.arch.value_crop_size = 8
-
-    sc = 1./args.navtask.task_params.step_size
-    max_dist = args.navtask.task_params.max_dist * \
-        args.navtask.task_params.num_goals
-    n_scales = np.log2(float(max_dist) / float(args.arch.vin_num_iters))
-    n_scales = int(np.ceil(n_scales)+1)
-
-    args.navtask.task_params.map_scales = \
-        list(sc*(0.5**(np.arange(n_scales))[::-1]))
-    args.navtask.task_params.map_crop_sizes = [16 for x in range(n_scales)]
-
-    args.arch.fr_stride = 1
-    args.arch.vin_action_neurons = 8
-    args.arch.vin_val_neurons = 3
-    args.arch.fr_inside_neurons = 32
-
-    args.mapper_arch.pad_map_with_zeros_each = [0 for _ in range(n_scales)]
-    args.mapper_arch.deconv_neurons = [64*n_scales, 32*n_scales, 16*n_scales]
-    args.mapper_arch.deconv_strides = [1, 2, 1]
-
-    if arch_vars.var2 == 'MscNoVin':
-      # No planning version.
-      args.arch.fr_stride = [1, 2, 1, 2]
-      args.arch.vin_action_neurons = None
-      args.arch.vin_val_neurons = 16
-      args.arch.fr_inside_neurons = 32
-
-      args.arch.crop_remove_each = 0
-      args.arch.value_crop_size = 4
-      args.arch.vin_num_iters = 0
-
-    elif arch_vars.var2 == 'MscROMms' or arch_vars.var2 == 'MscROMss':
-      # Code with read outs, MscROMms flattens and reads out,
-      # MscROMss does not flatten and produces output at multiple scales.
-      args.navtask.task_params.outputs.readout_maps = True
-      args.navtask.task_params.map_resize_method = 'antialiasing'
-      args.arch.readout_maps = True
-
-      if arch_vars.var2 == 'MscROMms':
-        args.arch.rom_arch.num_neurons = [64, 1]
-        args.arch.rom_arch.kernel_size = 4
-        args.arch.rom_arch.strides = [2,2]
-        args.arch.rom_arch.layers_per_block = 2
-
-        args.navtask.task_params.readout_maps_crop_sizes = [64]
-        args.navtask.task_params.readout_maps_scales = [sc]
-
-      elif arch_vars.var2 == 'MscROMss':
-        args.arch.rom_arch.num_neurons = \
-            [64, len(args.navtask.task_params.map_scales)]
-        args.arch.rom_arch.kernel_size = 4
-        args.arch.rom_arch.strides = [1,1]
-        args.arch.rom_arch.layers_per_block = 1
-
-        args.navtask.task_params.readout_maps_crop_sizes = \
-            args.navtask.task_params.map_crop_sizes
-        args.navtask.task_params.readout_maps_scales = \
-            args.navtask.task_params.map_scales
-
-  else:
-    logging.fatal('arch_vars.var2 not one of Msc, MscROMms, MscROMss, MscNoVin.')
-    assert(False)
-
-  map_channels = args.mapper_arch.deconv_neurons[-1] / \
-    (2*len(args.navtask.task_params.map_scales))
-  args.navtask.task_params.map_channels = map_channels
-  
-  return args
-
-def process_arch_projected_map(args, arch_vars):
-  # Single scale vision based system which does not use a mapper but instead
-  # uses an analytically estimated map.
-  ds = int(arch_vars.var3[2])
-  args.navtask.task_params.input_type = 'analytical_counts'
-  args.navtask.task_params.outputs.analytical_counts = True
-
-  assert(args.navtask.task_params.modalities[0] == 'depth')
-  args.navtask.camera_param.img_channels = None
-
-  analytical_counts = utils.Foo(map_sizes=[512/ds],
-                                xy_resolution=[5.*ds],
-                                z_bins=[[-10, 10, 150, 200]],
-                                non_linearity=[arch_vars.var2])
-  args.navtask.task_params.analytical_counts = analytical_counts
-
-  sc = 1./ds
-  args.arch.vin_num_iters = 36
-  args.navtask.task_params.map_scales = [sc]
-  args.navtask.task_params.map_crop_sizes = [512/ds]
-
-  args.arch.fr_stride = [1,2]
-  args.arch.vin_action_neurons = 8
-  args.arch.vin_val_neurons = 3
-  args.arch.fr_inside_neurons = 32
-
-  map_channels = len(analytical_counts.z_bins[0]) + 1
-  args.navtask.task_params.map_channels = map_channels
-  args.solver.freeze_conv = False
-
-  return args
-
-def get_args_for_config(config_name):
-  args = utils.Foo()
-
-  args.summary, args.control = get_default_args()
-
-  exp_name, mode_str = config_name.split('+')
-  arch_str, solver_str, navtask_str = exp_name.split('.')
-  logging.error('config_name: %s', config_name)
-  logging.error('arch_str: %s', arch_str)
-  logging.error('navtask_str: %s', navtask_str)
-  logging.error('solver_str: %s', solver_str)
-  logging.error('mode_str: %s', mode_str)
-
-  args.solver = cc.process_solver_str(solver_str)
-  args.navtask = cc.process_navtask_str(navtask_str)
-
-  args = process_arch_str(args, arch_str)
-  args.arch.isd_k = args.solver.isd_k
-
-  # Train, test, etc.
-  mode, imset = mode_str.split('_')
-  args = cc.adjust_args_for_mode(args, mode)
-  args.navtask.building_names = args.navtask.dataset.get_split(imset)
-  args.control.test_name = '{:s}_on_{:s}'.format(mode, imset)
-
-  # Log the arguments
-  logging.error('%s', args)
-  return args
--- a/research/cognitive_mapping_and_planning/cfgs/config_common.py
+++ b/research/cognitive_mapping_and_planning/cfgs/config_common.py
-# Copyright 2016 The TensorFlow Authors All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-
-import os
-import numpy as np
-import logging
-import src.utils as utils
-import datasets.nav_env_config as nec
-from datasets import factory
-
-def adjust_args_for_mode(args, mode):
-  if mode == 'train':
-    args.control.train = True
-  
-  elif mode == 'val1':
-    # Same settings as for training, to make sure nothing wonky is happening
-    # there.
-    args.control.test = True
-    args.control.test_mode = 'val'
-    args.navtask.task_params.batch_size = 32
-
-  elif mode == 'val2':
-    # No data augmentation, not sampling but taking the argmax action, not
-    # sampling from the ground truth at all.
-    args.control.test = True
-    args.arch.action_sample_type = 'argmax'
-    args.arch.sample_gt_prob_type = 'zero'
-    args.navtask.task_params.data_augment = \
-      utils.Foo(lr_flip=0, delta_angle=0, delta_xy=0, relight=False,
-                relight_fast=False, structured=False)
-    args.control.test_mode = 'val'
-    args.navtask.task_params.batch_size = 32
-
-  elif mode == 'bench':
-    # Actually testing the agent in settings that are kept same between
-    # different runs.
-    args.navtask.task_params.batch_size = 16
-    args.control.test = True
-    args.arch.action_sample_type = 'argmax'
-    args.arch.sample_gt_prob_type = 'zero'
-    args.navtask.task_params.data_augment = \
-      utils.Foo(lr_flip=0, delta_angle=0, delta_xy=0, relight=False,
-                relight_fast=False, structured=False)
-    args.summary.test_iters = 250
-    args.control.only_eval_when_done = True
-    args.control.reset_rng_seed = True
-    args.control.test_mode = 'test'
-  else:
-    logging.fatal('Unknown mode: %s.', mode)
-    assert(False)
-  return args
-
-def get_solver_vars(solver_str):
-  if solver_str == '': vals = []; 
-  else: vals = solver_str.split('_')
-  ks = ['clip', 'dlw', 'long', 'typ', 'isdk', 'adam_eps', 'init_lr'];
-  ks = ks[:len(vals)]
-
-  # Gradient clipping or not.
-  if len(vals) == 0: ks.append('clip'); vals.append('noclip');
-  # data loss weight.
-  if len(vals) == 1: ks.append('dlw');  vals.append('dlw20')
-  # how long to train for.
-  if len(vals) == 2: ks.append('long');  vals.append('nolong')
-  # Adam
-  if len(vals) == 3: ks.append('typ');  vals.append('adam2')
-  # reg loss wt
-  if len(vals) == 4: ks.append('rlw');  vals.append('rlw1')
-  # isd_k
-  if len(vals) == 5: ks.append('isdk');  vals.append('isdk415') # 415, inflexion at 2.5k.
-  # adam eps
-  if len(vals) == 6: ks.append('adam_eps');  vals.append('aeps1en8')
-  # init lr
-  if len(vals) == 7: ks.append('init_lr');  vals.append('lr1en3')
-
-  assert(len(vals) == 8)
-  
-  vars = utils.Foo()
-  for k, v in zip(ks, vals):
-    setattr(vars, k, v)
-  logging.error('solver_vars: %s', vars)
-  return vars
-
-def process_solver_str(solver_str):
-  solver = utils.Foo(
-      seed=0, learning_rate_decay=None, clip_gradient_norm=None, max_steps=None,
-      initial_learning_rate=None, momentum=None, steps_per_decay=None,
-      logdir=None, sync=False, adjust_lr_sync=True, wt_decay=0.0001,
-      data_loss_wt=None, reg_loss_wt=None, freeze_conv=True, num_workers=1,
-      task=0, ps_tasks=0, master='local', typ=None, momentum2=None,
-      adam_eps=None)
-
-  # Clobber with overrides from solver str.
-  solver_vars = get_solver_vars(solver_str)
-
-  solver.data_loss_wt          = float(solver_vars.dlw[3:].replace('x', '.'))
-  solver.adam_eps              = float(solver_vars.adam_eps[4:].replace('x', '.').replace('n', '-'))
-  solver.initial_learning_rate = float(solver_vars.init_lr[2:].replace('x', '.').replace('n', '-'))
-  solver.reg_loss_wt           = float(solver_vars.rlw[3:].replace('x', '.'))
-  solver.isd_k                 = float(solver_vars.isdk[4:].replace('x', '.'))
-
-  long = solver_vars.long
-  if long == 'long':
-    solver.steps_per_decay = 40000
-    solver.max_steps = 120000
-  elif long == 'long2':
-    solver.steps_per_decay = 80000
-    solver.max_steps = 120000
-  elif long == 'nolong' or long == 'nol':
-    solver.steps_per_decay = 20000
-    solver.max_steps = 60000
-  else:
-    logging.fatal('solver_vars.long should be long, long2, nolong or nol.')
-    assert(False)
-
-  clip = solver_vars.clip
-  if clip == 'noclip' or clip == 'nocl':
-    solver.clip_gradient_norm = 0
-  elif clip[:4] == 'clip':
-    solver.clip_gradient_norm = float(clip[4:].replace('x', '.'))
-  else:
-    logging.fatal('Unknown solver_vars.clip: %s', clip)
-    assert(False)
-
-  typ = solver_vars.typ
-  if typ == 'adam':
-    solver.typ = 'adam'
-    solver.momentum = 0.9
-    solver.momentum2 = 0.999
-    solver.learning_rate_decay = 1.0
-  elif typ == 'adam2':
-    solver.typ = 'adam'
-    solver.momentum = 0.9
-    solver.momentum2 = 0.999
-    solver.learning_rate_decay = 0.1
-  elif typ == 'sgd':
-    solver.typ = 'sgd'
-    solver.momentum = 0.99
-    solver.momentum2 = None
-    solver.learning_rate_decay = 0.1
-  else:
-    logging.fatal('Unknown solver_vars.typ: %s', typ)
-    assert(False)
-
-  logging.error('solver: %s', solver)
-  return solver
-
-def get_navtask_vars(navtask_str):
-  if navtask_str == '': vals = []
-  else: vals = navtask_str.split('_')
-
-  ks_all = ['dataset_name', 'modality', 'task', 'history', 'max_dist',
-            'num_steps', 'step_size', 'n_ori', 'aux_views', 'data_aug']
-  ks = ks_all[:len(vals)]
-
-  # All data or not.
-  if len(vals) == 0: ks.append('dataset_name'); vals.append('sbpd')
-  # modality
-  if len(vals) == 1: ks.append('modality'); vals.append('rgb')
-  # semantic task?
-  if len(vals) == 2: ks.append('task'); vals.append('r2r')
-  # number of history frames.
-  if len(vals) == 3: ks.append('history'); vals.append('h0')
-  # max steps
-  if len(vals) == 4: ks.append('max_dist'); vals.append('32')
-  # num steps
-  if len(vals) == 5: ks.append('num_steps'); vals.append('40')
-  # step size
-  if len(vals) == 6: ks.append('step_size'); vals.append('8')
-  # n_ori
-  if len(vals) == 7: ks.append('n_ori'); vals.append('4')
-  # Auxiliary views.
-  if len(vals) == 8: ks.append('aux_views'); vals.append('nv0')
-  # Normal data augmentation as opposed to structured data augmentation (if set
-  # to straug.
-  if len(vals) == 9: ks.append('data_aug'); vals.append('straug')
-
-  assert(len(vals) == 10)
-  for i in range(len(ks)):
-    assert(ks[i] == ks_all[i])
-
-  vars = utils.Foo()
-  for k, v in zip(ks, vals):
-    setattr(vars, k, v)
-  logging.error('navtask_vars: %s', vals)
-  return vars
-
-def process_navtask_str(navtask_str):
-  navtask = nec.nav_env_base_config()
-  
-  # Clobber with overrides from strings.
-  navtask_vars = get_navtask_vars(navtask_str)
-
-  navtask.task_params.n_ori = int(navtask_vars.n_ori)
-  navtask.task_params.max_dist = int(navtask_vars.max_dist)
-  navtask.task_params.num_steps = int(navtask_vars.num_steps)
-  navtask.task_params.step_size = int(navtask_vars.step_size)
-  navtask.task_params.data_augment.delta_xy = int(navtask_vars.step_size)/2.
-  n_aux_views_each = int(navtask_vars.aux_views[2])
-  aux_delta_thetas = np.concatenate((np.arange(n_aux_views_each) + 1,
-                                     -1 -np.arange(n_aux_views_each)))
-  aux_delta_thetas = aux_delta_thetas*np.deg2rad(navtask.camera_param.fov)
-  navtask.task_params.aux_delta_thetas = aux_delta_thetas
-  
-  if navtask_vars.data_aug == 'aug':
-    navtask.task_params.data_augment.structured = False
-  elif navtask_vars.data_aug == 'straug':
-    navtask.task_params.data_augment.structured = True
-  else:
-    logging.fatal('Unknown navtask_vars.data_aug %s.', navtask_vars.data_aug)
-    assert(False)
-
-  navtask.task_params.num_history_frames = int(navtask_vars.history[1:])
-  navtask.task_params.n_views = 1+navtask.task_params.num_history_frames
-  
-  navtask.task_params.goal_channels = int(navtask_vars.n_ori)
-  
-  if navtask_vars.task == 'hard': 
-    navtask.task_params.type = 'rng_rejection_sampling_many'
-    navtask.task_params.rejection_sampling_M = 2000
-    navtask.task_params.min_dist = 10
-  elif navtask_vars.task == 'r2r':
-    navtask.task_params.type = 'room_to_room_many'
-  elif navtask_vars.task == 'ST':
-    # Semantic task at hand.
-    navtask.task_params.goal_channels = \
-        len(navtask.task_params.semantic_task.class_map_names)
-    navtask.task_params.rel_goal_loc_dim = \
-        len(navtask.task_params.semantic_task.class_map_names)
-    navtask.task_params.type = 'to_nearest_obj_acc'
-  else:
-    logging.fatal('navtask_vars.task: should be hard or r2r, ST')
-    assert(False)
-  
-  if navtask_vars.modality == 'rgb':
-    navtask.camera_param.modalities = ['rgb']
-    navtask.camera_param.img_channels = 3
-  elif navtask_vars.modality == 'd':
-    navtask.camera_param.modalities = ['depth']
-    navtask.camera_param.img_channels = 2
-  
-  navtask.task_params.img_height   = navtask.camera_param.height
-  navtask.task_params.img_width    = navtask.camera_param.width
-  navtask.task_params.modalities   = navtask.camera_param.modalities
-  navtask.task_params.img_channels = navtask.camera_param.img_channels
-  navtask.task_params.img_fov      = navtask.camera_param.fov
-  
-  navtask.dataset = factory.get_dataset(navtask_vars.dataset_name)
-  return navtask
--- a/research/cognitive_mapping_and_planning/cfgs/config_distill.py
+++ b/research/cognitive_mapping_and_planning/cfgs/config_distill.py
-# Copyright 2016 The TensorFlow Authors All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-
-import pprint
-import copy
-import os
-from tensorflow.python.platform import app
-from tensorflow.python.platform import flags
-import logging
-import src.utils as utils
-import cfgs.config_common as cc
-
-
-import tensorflow as tf
-
-rgb_resnet_v2_50_path = 'cache/resnet_v2_50_inception_preprocessed/model.ckpt-5136169'
-
-def get_default_args():
-  robot = utils.Foo(radius=15, base=10, height=140, sensor_height=120,
-                    camera_elevation_degree=-15)
-
-  camera_param = utils.Foo(width=225, height=225, z_near=0.05, z_far=20.0,
-                           fov=60., modalities=['rgb', 'depth'])
-
-  env = utils.Foo(padding=10, resolution=5, num_point_threshold=2,
-                  valid_min=-10, valid_max=200, n_samples_per_face=200)
-
-  data_augment = utils.Foo(lr_flip=0, delta_angle=1, delta_xy=4, relight=False,
-                           relight_fast=False, structured=False)
-
-  task_params = utils.Foo(num_actions=4, step_size=4, num_steps=0,
-                          batch_size=32, room_seed=0, base_class='Building',
-                          task='mapping', n_ori=6, data_augment=data_augment,
-                          output_transform_to_global_map=False,
-                          output_canonical_map=False,
-                          output_incremental_transform=False,
-                          output_free_space=False, move_type='shortest_path',
-                          toy_problem=0)
-
-  buildinger_args = utils.Foo(building_names=['area1_gates_wingA_floor1_westpart'],
-                              env_class=None, robot=robot, 
-                              task_params=task_params, env=env,
-                              camera_param=camera_param)
-
-  solver_args = utils.Foo(seed=0, learning_rate_decay=0.1,
-                          clip_gradient_norm=0, max_steps=120000,
-                          initial_learning_rate=0.001, momentum=0.99,
-                          steps_per_decay=40000, logdir=None, sync=False,
-                          adjust_lr_sync=True, wt_decay=0.0001,
-                          data_loss_wt=1.0, reg_loss_wt=1.0,
-                          num_workers=1, task=0, ps_tasks=0, master='local')
-
-  summary_args = utils.Foo(display_interval=1, test_iters=100)
-
-  control_args = utils.Foo(train=False, test=False,
-                           force_batchnorm_is_training_at_test=False)
-  
-  arch_args = utils.Foo(rgb_encoder='resnet_v2_50', d_encoder='resnet_v2_50')
-
-  return utils.Foo(solver=solver_args,
-                   summary=summary_args, control=control_args, arch=arch_args,
-                   buildinger=buildinger_args)
-
-def get_vars(config_name):
-  vars = config_name.split('_')
-  if len(vars) == 1: # All data or not.
-    vars.append('noall')
-  if len(vars) == 2: # n_ori
-    vars.append('4')
-  logging.error('vars: %s', vars)
-  return vars
-
-def get_args_for_config(config_name):
-  args = get_default_args()
-  config_name, mode = config_name.split('+')
-  vars = get_vars(config_name)
-  
-  logging.info('config_name: %s, mode: %s', config_name, mode)
-  
-  args.buildinger.task_params.n_ori = int(vars[2])
-  args.solver.freeze_conv = True
-  args.solver.pretrained_path = rgb_resnet_v2_50_path
-  args.buildinger.task_params.img_channels = 5
-  args.solver.data_loss_wt = 0.00001
- 
-  if vars[0] == 'v0':
-    None
-  else:
-    logging.error('config_name: %s undefined', config_name)
-
-  args.buildinger.task_params.height = args.buildinger.camera_param.height
-  args.buildinger.task_params.width = args.buildinger.camera_param.width
-  args.buildinger.task_params.modalities = args.buildinger.camera_param.modalities
-  
-  if vars[1] == 'all':
-    args = cc.get_args_for_mode_building_all(args, mode)
-  elif vars[1] == 'noall':
-    args = cc.get_args_for_mode_building(args, mode)
-  
-  # Log the arguments
-  logging.error('%s', args)
-  return args
--- a/research/cognitive_mapping_and_planning/cfgs/config_vision_baseline.py
+++ b/research/cognitive_mapping_and_planning/cfgs/config_vision_baseline.py
-# Copyright 2016 The TensorFlow Authors All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-
-import pprint
-import os
-import numpy as np
-from tensorflow.python.platform import app
-from tensorflow.python.platform import flags
-import logging
-import src.utils as utils
-import cfgs.config_common as cc
-import datasets.nav_env_config as nec
-
-
-import tensorflow as tf
-
-FLAGS = flags.FLAGS
-
-get_solver_vars = cc.get_solver_vars
-get_navtask_vars = cc.get_navtask_vars
-
-
-rgb_resnet_v2_50_path = 'data/init_models/resnet_v2_50/model.ckpt-5136169'
-d_resnet_v2_50_path = 'data/init_models/distill_rgb_to_d_resnet_v2_50/model.ckpt-120002'
-
-def get_default_args():
-  summary_args = utils.Foo(display_interval=1, test_iters=26,
-                           arop_full_summary_iters=14)
-
-  control_args = utils.Foo(train=False, test=False,
-                           force_batchnorm_is_training_at_test=False,
-                           reset_rng_seed=False, only_eval_when_done=False,
-                           test_mode=None)
-  return summary_args, control_args
-
-def get_default_baseline_args():
-  batch_norm_param = {'center': True, 'scale': True,
-                      'activation_fn':tf.nn.relu}
-  arch_args = utils.Foo(
-      pred_neurons=[], goal_embed_neurons=[], img_embed_neurons=[],
-      batch_norm_param=batch_norm_param, dim_reduce_neurons=64, combine_type='',
-      encoder='resnet_v2_50', action_sample_type='sample',
-      action_sample_combine_type='one_or_other',
-      sample_gt_prob_type='inverse_sigmoid_decay', dagger_sample_bn_false=True,
-      isd_k=750., use_visit_count=False, lstm_output=False, lstm_ego=False,
-      lstm_img=False, fc_dropout=0.0, embed_goal_for_state=False,
-      lstm_output_init_state_from_goal=False)
-  return arch_args
-
-def get_arch_vars(arch_str):
-  if arch_str == '': vals = []
-  else: vals = arch_str.split('_')
-  
-  ks = ['ver', 'lstm_dim', 'dropout']
-  
-  # Exp Ver
-  if len(vals) == 0: vals.append('v0')
-  # LSTM dimentsions
-  if len(vals) == 1: vals.append('lstm2048')
-  # Dropout
-  if len(vals) == 2: vals.append('noDO')
-  
-  assert(len(vals) == 3)
-  
-  vars = utils.Foo()
-  for k, v in zip(ks, vals):
-    setattr(vars, k, v)
-  
-  logging.error('arch_vars: %s', vars)
-  return vars
-
-def process_arch_str(args, arch_str):
-  # This function modifies args.
-  args.arch = get_default_baseline_args()
-  arch_vars = get_arch_vars(arch_str)
-
-  args.navtask.task_params.outputs.rel_goal_loc = True
-  args.navtask.task_params.input_type = 'vision'
-  args.navtask.task_params.outputs.images = True
-  
-  if args.navtask.camera_param.modalities[0] == 'rgb':
-    args.solver.pretrained_path = rgb_resnet_v2_50_path
-  elif args.navtask.camera_param.modalities[0] == 'depth':
-    args.solver.pretrained_path = d_resnet_v2_50_path
-  else:
-    logging.fatal('Neither of rgb or d')
-
-  if arch_vars.dropout == 'DO': 
-    args.arch.fc_dropout = 0.5
-
-  args.tfcode = 'B'
-  
-  exp_ver = arch_vars.ver
-  if exp_ver == 'v0':
-    # Multiplicative interaction between goal loc and image features.
-    args.arch.combine_type = 'multiply'
-    args.arch.pred_neurons = [256, 256]
-    args.arch.goal_embed_neurons = [64, 8]
-    args.arch.img_embed_neurons = [1024, 512, 256*8]
-  
-  elif exp_ver == 'v1':
-    # Additive interaction between goal and image features.
-    args.arch.combine_type = 'add'
-    args.arch.pred_neurons = [256, 256]
-    args.arch.goal_embed_neurons = [64, 256]
-    args.arch.img_embed_neurons = [1024, 512, 256]
-  
-  elif exp_ver == 'v2':
-    # LSTM at the output on top of multiple interactions.
-    args.arch.combine_type = 'multiply'
-    args.arch.goal_embed_neurons = [64, 8]
-    args.arch.img_embed_neurons = [1024, 512, 256*8]
-    args.arch.lstm_output = True
-    args.arch.lstm_output_dim = int(arch_vars.lstm_dim[4:])
-    args.arch.pred_neurons = [256] # The other is inside the LSTM.
-  
-  elif exp_ver == 'v0blind':
-    # LSTM only on the goal location.
-    args.arch.combine_type = 'goalonly'
-    args.arch.goal_embed_neurons = [64, 256]
-    args.arch.img_embed_neurons = [2] # I dont know what it will do otherwise.
-    args.arch.lstm_output = True
-    args.arch.lstm_output_dim = 256
-    args.arch.pred_neurons = [256] # The other is inside the LSTM.
-  
-  else:
-    logging.fatal('exp_ver: %s undefined', exp_ver)
-    assert(False)
-
-  # Log the arguments
-  logging.error('%s', args)
-  return args
-
-def get_args_for_config(config_name):
-  args = utils.Foo()
-
-  args.summary, args.control = get_default_args()
-
-  exp_name, mode_str = config_name.split('+')
-  arch_str, solver_str, navtask_str = exp_name.split('.')
-  logging.error('config_name: %s', config_name)
-  logging.error('arch_str: %s', arch_str)
-  logging.error('navtask_str: %s', navtask_str)
-  logging.error('solver_str: %s', solver_str)
-  logging.error('mode_str: %s', mode_str)
-
-  args.solver = cc.process_solver_str(solver_str)
-  args.navtask = cc.process_navtask_str(navtask_str)
-
-  args = process_arch_str(args, arch_str)
-  args.arch.isd_k = args.solver.isd_k
-
-  # Train, test, etc.
-  mode, imset = mode_str.split('_')
-  args = cc.adjust_args_for_mode(args, mode)
-  args.navtask.building_names = args.navtask.dataset.get_split(imset)
-  args.control.test_name = '{:s}_on_{:s}'.format(mode, imset)
-
-  # Log the arguments
-  logging.error('%s', args)
-  return args
--- a/research/cognitive_mapping_and_planning/data/.gitignore
+++ b/research/cognitive_mapping_and_planning/data/.gitignore
-stanford_building_parser_dataset_raw
-stanford_building_parser_dataset
-init_models
--- a/research/cognitive_mapping_and_planning/data/README.md
+++ b/research/cognitive_mapping_and_planning/data/README.md
-This directory contains the data needed for training and benchmarking various
-navigation models.
-
-1.  Download the data from the [dataset website]
-    (http://buildingparser.stanford.edu/dataset.html).
-    1.  [Raw meshes](https://goo.gl/forms/2YSPaO2UKmn5Td5m2). We need the meshes
-        which are in the noXYZ folder. Download the tar files and place them in
-        the `stanford_building_parser_dataset_raw` folder. You need to download
-        `area_1_noXYZ.tar`, `area_3_noXYZ.tar`, `area_5a_noXYZ.tar`,
-        `area_5b_noXYZ.tar`, `area_6_noXYZ.tar` for training and
-        `area_4_noXYZ.tar` for evaluation.
-    2.  [Annotations](https://goo.gl/forms/4SoGp4KtH1jfRqEj2) for setting up
-        tasks. We will need the file called `Stanford3dDataset_v1.2.zip`. Place
-        the file in the directory `stanford_building_parser_dataset_raw`.
-
-2.  Preprocess the data.
-    1.  Extract meshes using `scripts/script_preprocess_meshes_S3DIS.sh`. After
-        this `ls data/stanford_building_parser_dataset/mesh` should have 6
-        folders `area1`, `area3`, `area4`, `area5a`, `area5b`, `area6`, with
-        textures and obj files within each directory.
-    2.  Extract out room information and semantics from zip file using
-        `scripts/script_preprocess_annoations_S3DIS.sh`. After this there should
-        be `room-dimension` and `class-maps` folder in
-        `data/stanford_building_parser_dataset`. (If you find this script to
-        crash because of an exception in np.loadtxt while processing
-        `Area_5/office_19/Annotations/ceiling_1.txt`, there is a special
-        character on line 323474, that should be removed manually.)
-
-3.  Download ImageNet Pre-trained models. We used ResNet-v2-50 for representing
-    images. For RGB images this is pre-trained on ImageNet. For Depth images we
-    [distill](https://arxiv.org/abs/1507.00448) the RGB model to depth images
-    using paired RGB-D images. Both there models are available through
-    `scripts/script_download_init_models.sh`
--- a/research/cognitive_mapping_and_planning/datasets/__init__.py
+++ b/research/cognitive_mapping_and_planning/datasets/__init__.py
--- a/research/cognitive_mapping_and_planning/datasets/factory.py
+++ b/research/cognitive_mapping_and_planning/datasets/factory.py
-# Copyright 2016 The TensorFlow Authors All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-
-r"""Wrapper for selecting the navigation environment that we want to train and
-test on.
-"""
-import numpy as np
-import os, glob
-import platform
-
-import logging
-from tensorflow.python.platform import app
-from tensorflow.python.platform import flags
-
-import render.swiftshader_renderer as renderer 
-import src.file_utils as fu
-import src.utils as utils
-
-def get_dataset(dataset_name):
-  if dataset_name == 'sbpd':
-    dataset = StanfordBuildingParserDataset(dataset_name)
-  else:
-    logging.fatal('Not one of sbpd')
-  return dataset
-
-class Loader():
-  def get_data_dir():
-    pass
-
-  def get_meta_data(self, file_name, data_dir=None):
-    if data_dir is None:
-      data_dir = self.get_data_dir()
-    full_file_name = os.path.join(data_dir, 'meta', file_name)
-    assert(fu.exists(full_file_name)), \
-      '{:s} does not exist'.format(full_file_name)
-    ext = os.path.splitext(full_file_name)[1]
-    if ext == '.txt':
-      ls = []
-      with fu.fopen(full_file_name, 'r') as f:
-        for l in f:
-          ls.append(l.rstrip())
-    elif ext == '.pkl':
-      ls = utils.load_variables(full_file_name)
-    return ls
-
-  def load_building(self, name, data_dir=None):
-    if data_dir is None:
-      data_dir = self.get_data_dir()
-    out = {}
-    out['name'] = name
-    out['data_dir'] = data_dir
-    out['room_dimension_file'] = os.path.join(data_dir, 'room-dimension',
-                                              name+'.pkl')
-    out['class_map_folder'] = os.path.join(data_dir, 'class-maps')
-    return out
-
-  def load_building_meshes(self, building):
-    dir_name = os.path.join(building['data_dir'], 'mesh', building['name'])
-    mesh_file_name = glob.glob1(dir_name, '*.obj')[0]
-    mesh_file_name_full = os.path.join(dir_name, mesh_file_name)
-    logging.error('Loading building from obj file: %s', mesh_file_name_full)
-    shape = renderer.Shape(mesh_file_name_full, load_materials=True, 
-                           name_prefix=building['name']+'_')
-    return [shape]
-
-class StanfordBuildingParserDataset(Loader):
-  def __init__(self, ver):
-    self.ver = ver
-    self.data_dir = None
-  
-  def get_data_dir(self):
-    if self.data_dir is None:
-      self.data_dir = 'data/stanford_building_parser_dataset/'
-    return self.data_dir
-
-  def get_benchmark_sets(self):
-    return self._get_benchmark_sets()
-
-  def get_split(self, split_name):
-    if self.ver == 'sbpd':
-      return self._get_split(split_name)
-    else:
-      logging.fatal('Unknown version.')
-
-  def _get_benchmark_sets(self):
-    sets = ['train1', 'val', 'test']
-    return sets
-
-  def _get_split(self, split_name):
-    train = ['area1', 'area5a', 'area5b', 'area6']
-    train1 = ['area1']
-    val = ['area3']
-    test = ['area4']
-
-    sets = {}
-    sets['train'] = train
-    sets['train1'] = train1
-    sets['val'] = val
-    sets['test'] = test
-    sets['all'] = sorted(list(set(train + val + test)))
-    return sets[split_name]
--- a/research/cognitive_mapping_and_planning/datasets/nav_env.py
+++ b/research/cognitive_mapping_and_planning/datasets/nav_env.py
-# Copyright 2016 The TensorFlow Authors All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ==============================================================================
-
-r"""Navidation Environment. Includes the following classes along with some
-helper functions.
-  Building: Loads buildings, computes traversibility, exposes functionality for
-    rendering images.
-  
-  GridWorld: Base class which implements functionality for moving an agent on a
-    grid world.
-  
-  NavigationEnv: Base class which generates navigation problems on a grid world.
-  
-  VisualNavigationEnv: Builds upon NavigationEnv and Building to provide
-    interface that is used externally to train the agent. 
-  
-  MeshMapper: Class used for distilling the model, testing the mapper.
-  
-  BuildingMultiplexer: Wrapper class that instantiates a VisualNavigationEnv for
-    each building and multiplexes between them as needed.
-"""
-
-import numpy as np
-import os
-import re
-import matplotlib.pyplot as plt
-
-import graph_tool as gt
-import graph_tool.topology
-
-from tensorflow.python.platform import gfile
-import logging
-import src.file_utils as fu
-import src.utils as utils
-import src.graph_utils as gu
-import src.map_utils as mu
-import src.depth_utils as du
-import render.swiftshader_renderer as sru
-from render.swiftshader_renderer import SwiftshaderRenderer
-import cv2
-
-label_nodes_with_class           = gu.label_nodes_with_class
-label_nodes_with_class_geodesic  = gu.label_nodes_with_class_geodesic
-get_distance_node_list           = gu.get_distance_node_list
-convert_to_graph_tool            = gu.convert_to_graph_tool
-generate_graph                   = gu.generate_graph
-get_hardness_distribution        = gu.get_hardness_distribution
-rng_next_goal_rejection_sampling = gu.rng_next_goal_rejection_sampling
-rng_next_goal                    = gu.rng_next_goal
-rng_room_to_room                 = gu.rng_room_to_room
-rng_target_dist_field            = gu.rng_target_dist_field
-
-compute_traversibility           = mu.compute_traversibility
-make_map                         = mu.make_map
-resize_maps                      = mu.resize_maps
-pick_largest_cc                  = mu.pick_largest_cc
-get_graph_origin_loc             = mu.get_graph_origin_loc
-generate_egocentric_maps         = mu.generate_egocentric_maps
-generate_goal_images             = mu.generate_goal_images
-get_map_to_predict               = mu.get_map_to_predict
-
-bin_points                       = du.bin_points
-make_geocentric                  = du.make_geocentric
-get_point_cloud_from_z           = du.get_point_cloud_from_z
-get_camera_matrix                = du.get_camera_matrix
-
-def _get_semantic_maps(folder_name, building_name, map, flip):
-  # Load file from the cache.
-  file_name = '{:s}_{:d}_{:d}_{:d}_{:d}_{:d}_{:d}.pkl'
-  file_name = file_name.format(building_name, map.size[0], map.size[1],
-                               map.origin[0], map.origin[1], map.resolution,
-                               flip)
-  file_name = os.path.join(folder_name, file_name)
-  logging.info('Loading semantic maps from %s.', file_name)
-
-  if fu.exists(file_name):
-    a = utils.load_variables(file_name)
-    maps = a['maps'] #HxWx#C
-    cats = a['cats']
-  else:
-    logging.error('file_name: %s not found.', file_name)
-    maps = None
-    cats = None
-  return maps, cats
-
-def _select_classes(all_maps, all_cats, cats_to_use):
-  inds = []
-  for c in cats_to_use:
-    ind = all_cats.index(c)
-    inds.append(ind)
-  out_maps = all_maps[:,:,inds]
-  return out_maps
-
-def _get_room_dimensions(file_name, resolution, origin, flip=False):
-  if fu.exists(file_name):
-    a = utils.load_variables(file_name)['room_dimension']
-    names = a.keys()
-    dims = np.concatenate(a.values(), axis=0).reshape((-1,6))
-    ind = np.argsort(names)
-    dims = dims[ind,:]
-    names = [names[x] for x in ind]
-    if flip:
-      dims_new = dims*1
-      dims_new[:,1] = -dims[:,4]
-      dims_new[:,4] = -dims[:,1]
-      dims = dims_new*1
-
-    dims = dims*100.
-    dims[:,0] = dims[:,0] - origin[0]
-    dims[:,1] = dims[:,1] - origin[1]
-    dims[:,3] = dims[:,3] - origin[0]
-    dims[:,4] = dims[:,4] - origin[1]
-    dims = dims / resolution
-    out = {'names': names, 'dims': dims}
-  else:
-    out = None
-  return out
-
-def _filter_rooms(room_dims, room_regex):
-  pattern = re.compile(room_regex)
-  ind = []
-  for i, name in enumerate(room_dims['names']):
-    if pattern.match(name):
-      ind.append(i)
-  new_room_dims = {}
-  new_room_dims['names'] = [room_dims['names'][i] for i in ind]
-  new_room_dims['dims'] = room_dims['dims'][ind,:]*1
-  return new_room_dims
-
-def _label_nodes_with_room_id(xyt, room_dims):
-  # Label the room with the ID into things.
-  node_room_id = -1*np.ones((xyt.shape[0], 1))
-  dims = room_dims['dims']
-  for x, name in enumerate(room_dims['names']):
-    all_ = np.concatenate((xyt[:,[0]] >= dims[x,0],
-                           xyt[:,[0]] <= dims[x,3],
-                           xyt[:,[1]] >= dims[x,1],
-                           xyt[:,[1]] <= dims[x,4]), axis=1)
-    node_room_id[np.all(all_, axis=1), 0] = x
-  return node_room_id
-
-def get_path_ids(start_node_id, end_node_id, pred_map):
-  id = start_node_id
-  path = [id]
-  while id != end_node_id:
-    id = pred_map[id]
-    path.append(id)
-  return path
-
-def image_pre(images, modalities):
-  # Assumes images are ...xHxWxC.
-  # We always assume images are RGB followed by Depth.
-  if 'depth' in modalities:
-    d = images[...,-1][...,np.newaxis]*1.
-    d[d < 0.01] = np.NaN; isnan = np.isnan(d);
-    d = 100./d; d[isnan] = 0.;
-    images = np.concatenate((images[...,:-1], d, isnan), axis=images.ndim-1)
-  if 'rgb' in modalities:
-    images[...,:3] = images[...,:3]*1. - 128
-  return images
-
-def _get_relative_goal_loc(goal_loc, loc, theta):
-  r = np.sqrt(np.sum(np.square(goal_loc - loc), axis=1))
-  t = np.arctan2(goal_loc[:,1] - loc[:,1], goal_loc[:,0] - loc[:,0])
-  t = t-theta[:,0] + np.pi/2
-  return np.expand_dims(r,axis=1), np.expand_dims(t, axis=1)
-
-def _gen_perturbs(rng, batch_size, num_steps, lr_flip, delta_angle, delta_xy,
-                  structured):
-  perturbs = []
-  for i in range(batch_size):
-    # Doing things one by one for each episode in this batch. This way this
-    # remains replicatable even when we change the batch size.
-    p = np.zeros((num_steps+1, 4))
-    if lr_flip:
-      # Flip the whole trajectory.
-      p[:,3] = rng.rand(1)-0.5
-    if delta_angle > 0:
-      if structured:
-        p[:,2] = (rng.rand(1)-0.5)* delta_angle
-      else:
-        p[:,2] = (rng.rand(p.shape[0])-0.5)* delta_angle
-    if delta_xy > 0:
-      if structured:
-        p[:,:2] = (rng.rand(1, 2)-0.5)*delta_xy
-      else:
-        p[:,:2] = (rng.rand(p.shape[0], 2)-0.5)*delta_xy
-    perturbs.append(p)
-  return perturbs
-
-def get_multiplexer_class(args, task_number):
-  assert(args.task_params.base_class == 'Building')
-  logging.info('Returning BuildingMultiplexer')
-  R = BuildingMultiplexer(args, task_number)
-  return R
-
-class GridWorld():
-  def __init__(self):
-    """Class members that will be assigned by any class that actually uses this
-    class."""
-    self.restrict_to_largest_cc = None
-    self.robot = None
-    self.env = None
-    self.category_list = None
-    self.traversible = None
-
-  def get_loc_axis(self, node, delta_theta, perturb=None):
-    """Based on the node orientation returns X, and Y axis. Used to sample the
-    map in egocentric coordinate frame.
-    """
-    if type(node) == tuple:
-      node = np.array([node])
-    if perturb is None:
-      perturb = np.zeros((node.shape[0], 4))
-    xyt = self.to_actual_xyt_vec(node)
-    x = xyt[:,[0]] + perturb[:,[0]]
-    y = xyt[:,[1]] + perturb[:,[1]]
-    t = xyt[:,[2]] + perturb[:,[2]]
-    theta = t*delta_theta
-    loc = np.concatenate((x,y), axis=1)
-    x_axis = np.concatenate((np.cos(theta), np.sin(theta)), axis=1)
-    y_axis = np.concatenate((np.cos(theta+np.pi/2.), np.sin(theta+np.pi/2.)),
-                            axis=1)
-    # Flip the sampled map where need be.
-    y_axis[np.where(perturb[:,3] > 0)[0], :] *= -1.
-    return loc, x_axis, y_axis, theta
-
-  def to_actual_xyt(self, pqr):
-    """Converts from node to location on the map."""
-    (p, q, r) = pqr
-    if self.task.n_ori == 6:
-      out = (p - q * 0.5 + self.task.origin_loc[0],
-             q * np.sqrt(3.) / 2. + self.task.origin_loc[1], r)
-    elif self.task.n_ori == 4:
-      out = (p + self.task.origin_loc[0],
-             q + self.task.origin_loc[1], r)
-    return out
-
-  def to_actual_xyt_vec(self, pqr):
-    """Converts from node array to location array on the map."""
-    p = pqr[:,0][:, np.newaxis]
-    q = pqr[:,1][:, np.newaxis]
-    r = pqr[:,2][:, np.newaxis]
-    if self.task.n_ori == 6:
-      out = np.concatenate((p - q * 0.5 + self.task.origin_loc[0],
-                            q * np.sqrt(3.) / 2. + self.task.origin_loc[1],
-                            r), axis=1)
-    elif self.task.n_ori == 4:
-      out = np.concatenate((p + self.task.origin_loc[0],
-                            q + self.task.origin_loc[1],
-                            r), axis=1)
-    return out
-
-  def raw_valid_fn_vec(self, xyt):
-    """Returns if the given set of nodes is valid or not."""
-    height = self.traversible.shape[0]
-    width = self.traversible.shape[1]
-    x = np.round(xyt[:,[0]]).astype(np.int32)
-    y = np.round(xyt[:,[1]]).astype(np.int32)
-    is_inside = np.all(np.concatenate((x >= 0, y >= 0,
-                                       x < width, y < height), axis=1), axis=1)
-    x = np.minimum(np.maximum(x, 0), width-1)
-    y = np.minimum(np.maximum(y, 0), height-1)
-    ind = np.ravel_multi_index((y,x), self.traversible.shape)
-    is_traversible = self.traversible.ravel()[ind]
-
-    is_valid = np.all(np.concatenate((is_inside[:,np.newaxis], is_traversible),
-                                     axis=1), axis=1)
-    return is_valid
-
-
-  def valid_fn_vec(self, pqr):
-    """Returns if the given set of nodes is valid or not."""
-    xyt = self.to_actual_xyt_vec(np.array(pqr))
-    height = self.traversible.shape[0]
-    width = self.traversible.shape[1]
-    x = np.round(xyt[:,[0]]).astype(np.int32)
-    y = np.round(xyt[:,[1]]).astype(np.int32)
-    is_inside = np.all(np.concatenate((x >= 0, y >= 0,
-                                       x < width, y < height), axis=1), axis=1)
-    x = np.minimum(np.maximum(x, 0), width-1)
-    y = np.minimum(np.maximum(y, 0), height-1)
-    ind = np.ravel_multi_index((y,x), self.traversible.shape)
-    is_traversible = self.traversible.ravel()[ind]
-
-    is_valid = np.all(np.concatenate((is_inside[:,np.newaxis], is_traversible),
-                                     axis=1), axis=1)
-    return is_valid
-
-  def get_feasible_actions(self, node_ids):
-    """Returns the feasible set of actions from the current node."""
-    a = np.zeros((len(node_ids), self.task_params.num_actions), dtype=np.int32)
-    gtG = self.task.gtG
-    next_node = []
-    for i, c in enumerate(node_ids):
-      neigh = gtG.vertex(c).out_neighbours()
-      neigh_edge = gtG.vertex(c).out_edges()
-      nn = {}
-      for n, e in zip(neigh, neigh_edge):
-        _ = gtG.ep['action'][e]
-        a[i,_] = 1
-        nn[_] = int(n)
-      next_node.append(nn)
-    return a, next_node
-
-  def take_action(self, current_node_ids, action):
-    """Returns the new node after taking the action action. Stays at the current
-    node if the action is invalid."""
-    actions, next_node_ids = self.get_feasible_actions(current_node_ids)
-    new_node_ids = []
-    for i, (c,a) in enumerate(zip(current_node_ids, action)):
-      if actions[i,a] == 1:
-        new_node_ids.append(next_node_ids[i][a])
-      else:
-        new_node_ids.append(c)
-    return new_node_ids
-
-  def set_r_obj(self, r_obj):
-    """Sets the SwiftshaderRenderer object used for rendering."""
-    self.r_obj = r_obj
-
-class Building(GridWorld):
-  def __init__(self, building_name, robot, env,
-               category_list=None, small=False, flip=False, logdir=None,
-               building_loader=None):
-
-    self.restrict_to_largest_cc = True
-    self.robot = robot
-    self.env = env
-    self.logdir = logdir
-
-    # Load the building meta data.
-    building = building_loader.load_building(building_name)
-    if small:
-      building['mesh_names'] = building['mesh_names'][:5]
-
-    # New code.
-    shapess = building_loader.load_building_meshes(building)
-    if flip:
-      for shapes in shapess:
-        shapes.flip_shape()
-
-    vs = []
-    for shapes in shapess:
-      vs.append(shapes.get_vertices()[0])
-    vs = np.concatenate(vs, axis=0)
-    map = make_map(env.padding, env.resolution, vertex=vs, sc=100.)
-    map = compute_traversibility(
-        map, robot.base, robot.height, robot.radius, env.valid_min,
-        env.valid_max, env.num_point_threshold, shapess=shapess, sc=100.,
-        n_samples_per_face=env.n_samples_per_face)
-
-    room_dims = _get_room_dimensions(building['room_dimension_file'],
-                                     env.resolution, map.origin, flip=flip)
-    class_maps, class_map_names = _get_semantic_maps(
-        building['class_map_folder'], building_name, map, flip)
-
-    self.class_maps      = class_maps
-    self.class_map_names = class_map_names
-    self.building        = building
-    self.shapess         = shapess
-    self.map             = map
-    self.traversible     = map.traversible*1
-    self.building_name   = building_name
-    self.room_dims       = room_dims
-    self.flipped         = flip
-    self.renderer_entitiy_ids = []
-
-    if self.restrict_to_largest_cc:
-      self.traversible = pick_largest_cc(self.traversible)
-
-  def load_building_into_scene(self):
-    # Loads the scene.
-    self.renderer_entitiy_ids += self.r_obj.load_shapes(self.shapess)
-    # Free up memory, we dont need the mesh or the materials anymore.
-    self.shapess = None
-
-  def add_entity_at_nodes(self, nodes, height, shape):
-    xyt = self.to_actual_xyt_vec(nodes)
-    nxy = xyt[:,:2]*1.
-    nxy = nxy * self.map.resolution
-    nxy = nxy + self.map.origin
-    Ts = np.concatenate((nxy, nxy[:,:1]), axis=1)
-    Ts[:,2] = height; Ts = Ts / 100.;
-
-    # Merge all the shapes into a single shape and add that shape.
-    shape.replicate_shape(Ts)
-    entity_ids = self.r_obj.load_shapes([shape])
-    self.renderer_entitiy_ids += entity_ids
-    return entity_ids
-
-  def add_shapes(self, shapes):
-    scene = self.r_obj.viz.scene()
-    for shape in shapes:
-      scene.AddShape(shape)
-
-  def add_materials(self, materials):
-    scene = self.r_obj.viz.scene()
-    for material in materials:
-      scene.AddOrUpdateMaterial(material)
-
-  def set_building_visibility(self, visibility):
-    self.r_obj.set_entity_visible(self.renderer_entitiy_ids, visibility)
-
-  def render_nodes(self, nodes, perturb=None, aux_delta_theta=0.):
-    self.set_building_visibility(True)
-    if perturb is None:
-      perturb = np.zeros((len(nodes), 4))
-
-    imgs = []
-    r = 2
-    elevation_z = r * np.tan(np.deg2rad(self.robot.camera_elevation_degree))
-
-    for i in range(len(nodes)):
-      xyt = self.to_actual_xyt(nodes[i])
-      lookat_theta = 3.0 * np.pi / 2.0 - (xyt[2]+perturb[i,2]+aux_delta_theta) * (self.task.delta_theta)
-      nxy = np.array([xyt[0]+perturb[i,0], xyt[1]+perturb[i,1]]).reshape(1, -1)
-      nxy = nxy * self.map.resolution
-      nxy = nxy + self.map.origin
-      camera_xyz = np.zeros((1, 3))
-      camera_xyz[...] = [nxy[0, 0], nxy[0, 1], self.robot.sensor_height]
-      camera_xyz = camera_xyz / 100.
-      lookat_xyz = np.array([-r * np.sin(lookat_theta),
-                             -r * np.cos(lookat_theta), elevation_z])
-      lookat_xyz = lookat_xyz + camera_xyz[0, :]
-      self.r_obj.position_camera(camera_xyz[0, :].tolist(),
-                                 lookat_xyz.tolist(), [0.0, 0.0, 1.0])
-      img = self.r_obj.render(take_screenshot=True, output_type=0)
-      img = [x for x in img if x is not None]
-      img = np.concatenate(img, axis=2).astype(np.float32)
-      if perturb[i,3]>0:
-        img = img[:,::-1,:]
-      imgs.append(img)
-
-    self.set_building_visibility(False)
-    return imgs
-
-
-class MeshMapper(Building):
-  def __init__(self, robot, env, task_params, building_name, category_list,
-               flip, logdir=None, building_loader=None):
-    Building.__init__(self, building_name, robot, env, category_list,
-                      small=task_params.toy_problem, flip=flip, logdir=logdir,
-                      building_loader=building_loader)
-    self.task_params = task_params
-    self.task = None
-    self._preprocess_for_task(self.task_params.building_seed)
-
-  def _preprocess_for_task(self, seed):
-    if self.task is None or self.task.seed != seed:
-      rng = np.random.RandomState(seed)
-      origin_loc = get_graph_origin_loc(rng, self.traversible)
-      self.task = utils.Foo(seed=seed, origin_loc=origin_loc,
-                            n_ori=self.task_params.n_ori)
-      G = generate_graph(self.valid_fn_vec,
-                                  self.task_params.step_size, self.task.n_ori,
-                                  (0, 0, 0))
-      gtG, nodes, nodes_to_id = convert_to_graph_tool(G)
-      self.task.gtG = gtG
-      self.task.nodes = nodes
-      self.task.delta_theta = 2.0*np.pi/(self.task.n_ori*1.)
-      self.task.nodes_to_id = nodes_to_id
-      logging.info('Building %s, #V=%d, #E=%d', self.building_name,
-                   self.task.nodes.shape[0], self.task.gtG.num_edges())
-
-      if self.logdir is not None:
-        write_traversible = cv2.applyColorMap(self.traversible.astype(np.uint8)*255, cv2.COLORMAP_JET)
-        img_path = os.path.join(self.logdir,
-                                '{:s}_{:d}_graph.png'.format(self.building_name,
-                                                             seed))
-        node_xyt = self.to_actual_xyt_vec(self.task.nodes)
-        plt.set_cmap('jet');
-        fig, ax = utils.subplot(plt, (1,1), (12,12))
-        ax.plot(node_xyt[:,0], node_xyt[:,1], 'm.')
-        ax.imshow(self.traversible, origin='lower');
-        ax.set_axis_off(); ax.axis('equal');
-        ax.set_title('{:s}, {:d}, {:d}'.format(self.building_name,
-                                               self.task.nodes.shape[0],
-                                               self.task.gtG.num_edges()))
-        if self.room_dims is not None:
-          for i, r in enumerate(self.room_dims['dims']*1):
-            min_ = r[:3]*1
-            max_ = r[3:]*1
-            xmin, ymin, zmin = min_
-            xmax, ymax, zmax = max_
-
-            ax.plot([xmin, xmax, xmax, xmin, xmin],
-                    [ymin, ymin, ymax, ymax, ymin], 'g')
-        with fu.fopen(img_path, 'w') as f:
-          fig.savefig(f, bbox_inches='tight', transparent=True, pad_inches=0)
-        plt.close(fig)
-
-
-  def _gen_rng(self, rng):
-    # instances is a list of list of node_ids.
-    if self.task_params.move_type == 'circle':
-      _, _, _, _, paths = rng_target_dist_field(self.task_params.batch_size,
-                                                self.task.gtG, rng, 0, 1,
-                                                compute_path=True)
-      instances_ = paths
-
-      instances = []
-      for instance_ in instances_:
-        instance = instance_
-        for i in range(self.task_params.num_steps):
-          instance.append(self.take_action([instance[-1]], [1])[0])
-        instances.append(instance)
-
-    elif self.task_params.move_type == 'shortest_path':
-      _, _, _, _, paths = rng_target_dist_field(self.task_params.batch_size,
-                                                self.task.gtG, rng,
-                                                self.task_params.num_steps,
-                                                self.task_params.num_steps+1,
-                                                compute_path=True)
-      instances = paths
-
-    elif self.task_params.move_type == 'circle+forward':
-      _, _, _, _, paths = rng_target_dist_field(self.task_params.batch_size,
-                                                self.task.gtG, rng, 0, 1,
-                                                compute_path=True)
-      instances_ = paths
-      instances = []
-      for instance_ in instances_:
-        instance = instance_
-        for i in range(self.task_params.n_ori-1):
-          instance.append(self.take_action([instance[-1]], [1])[0])
-        while len(instance) <= self.task_params.num_steps:
-          while self.take_action([instance[-1]], [3])[0] == instance[-1] and len(instance) <= self.task_params.num_steps:
-            instance.append(self.take_action([instance[-1]], [2])[0])
-          if len(instance) <= self.task_params.num_steps:
-            instance.append(self.take_action([instance[-1]], [3])[0])
-        instances.append(instance)
-
-    # Do random perturbation if needed.
-    perturbs = _gen_perturbs(rng, self.task_params.batch_size,
-                             self.task_params.num_steps,
-                             self.task_params.data_augment.lr_flip,
-                             self.task_params.data_augment.delta_angle,
-                             self.task_params.data_augment.delta_xy,
-                             self.task_params.data_augment.structured)
-    return instances, perturbs
-
-  def worker(self, instances, perturbs):
-    # Output the images and the free space.
-
-    # Make the instances be all the same length.
-    for i in range(len(instances)):
-      for j in range(self.task_params.num_steps - len(instances[i]) + 1):
-        instances[i].append(instances[i][-1])
-      if perturbs[i].shape[0] < self.task_params.num_steps+1:
-        p = np.zeros((self.task_params.num_steps+1, 4))
-        p[:perturbs[i].shape[0], :] = perturbs[i]
-        p[perturbs[i].shape[0]:, :] = perturbs[i][-1,:]
-        perturbs[i] = p
-
-    instances_ = []
-    for instance in instances:
-      instances_ = instances_ + instance
-    perturbs_ = np.concatenate(perturbs, axis=0)
-
-    instances_nodes = self.task.nodes[instances_,:]
-    instances_nodes = [tuple(x) for x in instances_nodes]
-
-    imgs_ = self.render_nodes(instances_nodes, perturbs_)
-    imgs = []; next = 0;
-    for instance in instances:
-      img_i = []
-      for _ in instance:
-        img_i.append(imgs_[next])
-        next = next+1
-      imgs.append(img_i)
-    imgs = np.array(imgs)
-
-    # Render out the maps in the egocentric view for all nodes and not just the
-    # last node.
-    all_nodes = []
-    for x in instances:
-      all_nodes = all_nodes + x
-    all_perturbs = np.concatenate(perturbs, axis=0)
-    loc, x_axis, y_axis, theta = self.get_loc_axis(
-        self.task.nodes[all_nodes, :]*1, delta_theta=self.task.delta_theta,
-        perturb=all_perturbs)
-    fss = None
-    valids = None
-    loc_on_map = None
-    theta_on_map = None
-    cum_fs = None
-    cum_valid = None
-    incremental_locs = None
-    incremental_thetas = None
-
-    if self.task_params.output_free_space:
-      fss, valids = get_map_to_predict(loc, x_axis, y_axis,
-                                       map=self.traversible*1.,
-                                       map_size=self.task_params.map_size)
-      fss = np.array(fss) > 0.5
-      fss = np.reshape(fss, [self.task_params.batch_size,
-                             self.task_params.num_steps+1,
-                             self.task_params.map_size,
-                             self.task_params.map_size])
-      valids = np.reshape(np.array(valids), fss.shape)
-
-    if self.task_params.output_transform_to_global_map:
-      # Output the transform to the global map.
-      loc_on_map = np.reshape(loc*1, [self.task_params.batch_size,
-                                      self.task_params.num_steps+1, -1])
-      # Converting to location wrt to first location so that warping happens
-      # properly.
-      theta_on_map = np.reshape(theta*1, [self.task_params.batch_size,
-                                            self.task_params.num_steps+1, -1])
-
-    if self.task_params.output_incremental_transform:
-      # Output the transform to the global map.
-      incremental_locs_ = np.reshape(loc*1, [self.task_params.batch_size,
-                                             self.task_params.num_steps+1, -1])
-      incremental_locs_[:,1:,:] -= incremental_locs_[:,:-1,:]
-      t0 = -np.pi/2+np.reshape(theta*1, [self.task_params.batch_size,
-                                        self.task_params.num_steps+1, -1])
-      t = t0*1
-      incremental_locs = incremental_locs_*1
-      incremental_locs[:,:,0] = np.sum(incremental_locs_ * np.concatenate((np.cos(t), np.sin(t)), axis=-1), axis=-1)
-      incremental_locs[:,:,1] = np.sum(incremental_locs_ * np.concatenate((np.cos(t+np.pi/2), np.sin(t+np.pi/2)), axis=-1), axis=-1)
-      incremental_locs[:,0,:] = incremental_locs_[:,0,:]
-      # print incremental_locs_[0,:,:], incremental_locs[0,:,:], t0[0,:,:]
-
-      incremental_thetas = np.reshape(theta*1, [self.task_params.batch_size,
-                                                self.task_params.num_steps+1,
-                                                -1])
-      incremental_thetas[:,1:,:] += -incremental_thetas[:,:-1,:]
-
-    if self.task_params.output_canonical_map:
-      loc_ = loc[0::(self.task_params.num_steps+1), :]
-      x_axis = np.zeros_like(loc_); x_axis[:,1] = 1
-      y_axis = np.zeros_like(loc_); y_axis[:,0] = -1
-      cum_fs, cum_valid = get_map_to_predict(loc_, x_axis, y_axis,
-                                             map=self.traversible*1.,
-                                             map_size=self.task_params.map_size)
-      cum_fs = np.array(cum_fs) > 0.5
-      cum_fs = np.reshape(cum_fs, [self.task_params.batch_size, 1,
-                                   self.task_params.map_size,
-                                   self.task_params.map_size])
-      cum_valid = np.reshape(np.array(cum_valid), cum_fs.shape)
-
-
-    inputs = {'fs_maps': fss,
-              'valid_maps': valids,
-              'imgs': imgs,
-              'loc_on_map': loc_on_map,
-              'theta_on_map': theta_on_map,
-              'cum_fs_maps': cum_fs,
-              'cum_valid_maps': cum_valid,
-              'incremental_thetas': incremental_thetas,
-              'incremental_locs': incremental_locs}
-    return inputs
-
-  def pre(self, inputs):
-    inputs['imgs'] = image_pre(inputs['imgs'], self.task_params.modalities)
-    if inputs['loc_on_map'] is not None:
-      inputs['loc_on_map'] = inputs['loc_on_map'] - inputs['loc_on_map'][:,[0],:]
-    if inputs['theta_on_map'] is not None:
-      inputs['theta_on_map'] = np.pi/2. - inputs['theta_on_map']
-    return inputs
-
-def _nav_env_reset_helper(type, rng, nodes, batch_size, gtG, max_dist,
-                          num_steps, num_goals, data_augment, **kwargs):
-  """Generates and returns a new episode."""
-  max_compute = max_dist + 4*num_steps
-  if type == 'general':
-    start_node_ids, end_node_ids, dist, pred_map, paths = \
-        rng_target_dist_field(batch_size, gtG, rng, max_dist, max_compute,
-                              nodes=nodes, compute_path=False)
-    target_class = None
-
-  elif type == 'room_to_room_many':
-    goal_node_ids = []; dists = [];
-    node_room_ids = kwargs['node_room_ids']
-    # Sample the first one
-    start_node_ids_, end_node_ids_, dist_, _, _ = rng_room_to_room(
-        batch_size, gtG, rng, max_dist, max_compute,
-        node_room_ids=node_room_ids, nodes=nodes)
-    start_node_ids = start_node_ids_
-    goal_node_ids.append(end_node_ids_)
-    dists.append(dist_)
-    for n in range(num_goals-1):
-      start_node_ids_, end_node_ids_, dist_, _, _ = rng_next_goal(
-          goal_node_ids[n], batch_size, gtG, rng, max_dist,
-          max_compute, node_room_ids=node_room_ids, nodes=nodes,
-          dists_from_start_node=dists[n])
-      goal_node_ids.append(end_node_ids_)
-      dists.append(dist_)
-    target_class = None
-
-  elif type == 'rng_rejection_sampling_many':
-    num_goals = num_goals
-    goal_node_ids = []; dists = [];
-
-    n_ori = kwargs['n_ori']
-    step_size = kwargs['step_size']
-    min_dist = kwargs['min_dist']
-    sampling_distribution = kwargs['sampling_distribution']
-    target_distribution = kwargs['target_distribution']
-    rejection_sampling_M = kwargs['rejection_sampling_M']
-    distribution_bins = kwargs['distribution_bins']
-
-    for n in range(num_goals):
-      if n == 0: input_nodes = None
-      else: input_nodes = goal_node_ids[n-1]
-      start_node_ids_, end_node_ids_, dist_, _, _, _, _ = rng_next_goal_rejection_sampling(
-              input_nodes, batch_size, gtG, rng, max_dist, min_dist,
-              max_compute, sampling_distribution, target_distribution, nodes,
-              n_ori, step_size, distribution_bins, rejection_sampling_M)
-      if n == 0: start_node_ids = start_node_ids_
-      goal_node_ids.append(end_node_ids_)
-      dists.append(dist_)
-    target_class = None
-
-  elif type == 'room_to_room_back':
-    num_goals = num_goals
-    assert(num_goals == 2), 'num_goals must be 2.'
-    goal_node_ids = []; dists = [];
-    node_room_ids = kwargs['node_room_ids']
-    # Sample the first one.
-    start_node_ids_, end_node_ids_, dist_, _, _ = rng_room_to_room(
-        batch_size, gtG, rng, max_dist, max_compute,
-        node_room_ids=node_room_ids, nodes=nodes)
-    start_node_ids = start_node_ids_
-    goal_node_ids.append(end_node_ids_)
-    dists.append(dist_)
-
-    # Set second goal to be starting position, and compute distance to the start node.
-    goal_node_ids.append(start_node_ids)
-    dist = []
-    for i in range(batch_size):
-      dist_ = gt.topology.shortest_distance(
-          gt.GraphView(gtG, reversed=True),
-          source=gtG.vertex(start_node_ids[i]), target=None)
-      dist_ = np.array(dist_.get_array())
-      dist.append(dist_)
-    dists.append(dist)
-    target_class = None
-
-  elif type[:14] == 'to_nearest_obj':
-    # Generate an episode by sampling one of the target classes (with
-    # probability proportional to the number of nodes in the world).
-    # With the sampled class sample a node that is within some distance from
-    # the sampled class.
-    class_nodes   = kwargs['class_nodes']
-    sampling      = kwargs['sampling']
-    dist_to_class = kwargs['dist_to_class']
-
-    assert(num_goals == 1), 'Only supports a single goal.'
-    ind = rng.choice(class_nodes.shape[0], size=batch_size)
-    target_class = class_nodes[ind,1]
-    start_node_ids = []; dists = []; goal_node_ids = [];
-
-    for t in target_class:
-      if sampling == 'uniform':
-        max_dist = max_dist
-        cnts = np.bincount(dist_to_class[t], minlength=max_dist+1)*1.
-        cnts[max_dist+1:] = 0
-        p_each = 1./ cnts / (max_dist+1.)
-        p_each[cnts == 0] = 0
-        p = p_each[dist_to_class[t]]*1.; p = p/np.sum(p)
-        start_node_id = rng.choice(p.shape[0], size=1, p=p)[0]
-      else:
-        logging.fatal('Sampling not one of uniform.')
-      start_node_ids.append(start_node_id)
-      dists.append(dist_to_class[t])
-      # Dummy goal node, same as the start node, so that vis is better.
-      goal_node_ids.append(start_node_id)
-    dists = [dists]
-    goal_node_ids = [goal_node_ids]
-
-  return start_node_ids, goal_node_ids, dists, target_class
-
-
-class NavigationEnv(GridWorld, Building):
-  """Wrapper around GridWorld which sets up navigation tasks.
-  """
-  def _debug_save_hardness(self, seed):
-    out_path = os.path.join(self.logdir, '{:s}_{:d}_hardness.png'.format(self.building_name, seed))
-    batch_size = 4000
-    rng = np.random.RandomState(0)
-    start_node_ids, end_node_ids, dists, pred_maps, paths, hardnesss, gt_dists = \
-      rng_next_goal_rejection_sampling(
-          None, batch_size, self.task.gtG, rng, self.task_params.max_dist,
-          self.task_params.min_dist, self.task_params.max_dist,
-          self.task.sampling_distribution, self.task.target_distribution,
-          self.task.nodes, self.task_params.n_ori, self.task_params.step_size,
-          self.task.distribution_bins, self.task.rejection_sampling_M)
-    bins = self.task.distribution_bins 
-    n_bins = self.task.n_bins
-    with plt.style.context('ggplot'):
-      fig, axes = utils.subplot(plt, (1,2), (10,10))
-      ax = axes[0]
-      _ = ax.hist(hardnesss, bins=bins, weights=np.ones_like(hardnesss)/len(hardnesss))
-      ax.plot(bins[:-1]+0.5/n_bins, self.task.target_distribution, 'g')
-      ax.plot(bins[:-1]+0.5/n_bins, self.task.sampling_distribution, 'b')
-      ax.grid('on')
-      
-      ax = axes[1]
-      _ = ax.hist(gt_dists, bins=np.arange(self.task_params.max_dist+1))
-      ax.grid('on')
-      ax.set_title('Mean: {:0.2f}, Median: {:0.2f}'.format(np.mean(gt_dists),
-                                                           np.median(gt_dists)))
-      with fu.fopen(out_path, 'w') as f:
-        fig.savefig(f, bbox_inches='tight', transparent=True, pad_inches=0)
-
-  def _debug_save_map_nodes(self, seed):
-    """Saves traversible space along with nodes generated on the graph. Takes
-    the seed as input."""
-    img_path = os.path.join(self.logdir, '{:s}_{:d}_graph.png'.format(self.building_name, seed))
-    node_xyt = self.to_actual_xyt_vec(self.task.nodes)
-    plt.set_cmap('jet');
-    fig, ax = utils.subplot(plt, (1,1), (12,12))
-    ax.plot(node_xyt[:,0], node_xyt[:,1], 'm.')
-    ax.set_axis_off(); ax.axis('equal');
-    
-    if self.room_dims is not None:
-      for i, r in enumerate(self.room_dims['dims']*1):
-        min_ = r[:3]*1
-        max_ = r[3:]*1
-        xmin, ymin, zmin = min_
-        xmax, ymax, zmax = max_
-
-        ax.plot([xmin, xmax, xmax, xmin, xmin],
-                [ymin, ymin, ymax, ymax, ymin], 'g')
-    ax.imshow(self.traversible, origin='lower');
-    with fu.fopen(img_path, 'w') as f:
-      fig.savefig(f, bbox_inches='tight', transparent=True, pad_inches=0)
-
-  def _debug_semantic_maps(self, seed):
-    """Saves traversible space along with nodes generated on the graph. Takes
-    the seed as input."""
-    for i, cls in enumerate(self.task_params.semantic_task.class_map_names):
-      img_path = os.path.join(self.logdir, '{:s}_flip{:d}_{:s}_graph.png'.format(self.building_name, seed, cls))
-      maps = self.traversible*1.
-      maps += 0.5*(self.task.class_maps_dilated[:,:,i])
-      write_traversible = (maps*1.+1.)/3.0
-      write_traversible = (write_traversible*255.).astype(np.uint8)[:,:,np.newaxis]
-      write_traversible = write_traversible + np.zeros((1,1,3), dtype=np.uint8)
-      fu.write_image(img_path, write_traversible[::-1,:,:])
-
-  def _preprocess_for_task(self, seed):
-    """Sets up the task field for doing navigation on the grid world."""
-    if self.task is None or self.task.seed != seed:
-      rng = np.random.RandomState(seed)
-      origin_loc = get_graph_origin_loc(rng, self.traversible)
-      self.task = utils.Foo(seed=seed, origin_loc=origin_loc,
-                            n_ori=self.task_params.n_ori)
-      G = generate_graph(self.valid_fn_vec, self.task_params.step_size,
-                         self.task.n_ori, (0, 0, 0))
-      gtG, nodes, nodes_to_id = convert_to_graph_tool(G)
-      self.task.gtG = gtG
-      self.task.nodes = nodes
-      self.task.delta_theta = 2.0*np.pi/(self.task.n_ori*1.)
-      self.task.nodes_to_id = nodes_to_id
-
-      logging.info('Building %s, #V=%d, #E=%d', self.building_name,
-                   self.task.nodes.shape[0], self.task.gtG.num_edges())
-      type = self.task_params.type
-      if type == 'general':
-        # Do nothing
-        _ = None
-
-      elif type == 'room_to_room_many' or type == 'room_to_room_back':
-        if type == 'room_to_room_back':
-          assert(self.task_params.num_goals == 2), 'num_goals must be 2.'
-
-        self.room_dims = _filter_rooms(self.room_dims, self.task_params.room_regex)
-        xyt = self.to_actual_xyt_vec(self.task.nodes)
-        self.task.node_room_ids = _label_nodes_with_room_id(xyt, self.room_dims)
-        self.task.reset_kwargs = {'node_room_ids': self.task.node_room_ids}
-
-      elif type == 'rng_rejection_sampling_many':
-        n_bins = 20
-        rejection_sampling_M = self.task_params.rejection_sampling_M
-        min_dist = self.task_params.min_dist
-        bins = np.arange(n_bins+1)/(n_bins*1.)
-        target_d = np.zeros(n_bins); target_d[...] = 1./n_bins;
-
-        sampling_d = get_hardness_distribution(
-            self.task.gtG, self.task_params.max_dist, self.task_params.min_dist,
-            np.random.RandomState(0), 4000, bins, self.task.nodes,
-            self.task_params.n_ori, self.task_params.step_size)
-
-        self.task.reset_kwargs = {'distribution_bins': bins,
-                                  'target_distribution': target_d,
-                                  'sampling_distribution': sampling_d,
-                                  'rejection_sampling_M': rejection_sampling_M,
-                                  'n_bins': n_bins, 
-                                  'n_ori': self.task_params.n_ori,
-                                  'step_size': self.task_params.step_size,
-                                  'min_dist': self.task_params.min_dist}
-        self.task.n_bins = n_bins
-        self.task.distribution_bins = bins
-        self.task.target_distribution = target_d
-        self.task.sampling_distribution = sampling_d
-        self.task.rejection_sampling_M = rejection_sampling_M
-
-        if self.logdir is not None:
-          self._debug_save_hardness(seed)
-
-      elif type[:14] == 'to_nearest_obj':
-        self.room_dims = _filter_rooms(self.room_dims, self.task_params.room_regex)
-        xyt = self.to_actual_xyt_vec(self.task.nodes)
-
-        self.class_maps = _select_classes(self.class_maps,
-                                          self.class_map_names,
-                                          self.task_params.semantic_task.class_map_names)*1
-        self.class_map_names = self.task_params.semantic_task.class_map_names
-        nodes_xyt = self.to_actual_xyt_vec(np.array(self.task.nodes))
-
-        tt = utils.Timer(); tt.tic();
-        if self.task_params.type == 'to_nearest_obj_acc':
-          self.task.class_maps_dilated, self.task.node_class_label = label_nodes_with_class_geodesic(
-            nodes_xyt, self.class_maps,
-            self.task_params.semantic_task.pix_distance+8, self.map.traversible,
-            ff_cost=1., fo_cost=1., oo_cost=4., connectivity=8.)
-
-        dists = []
-        for i in range(len(self.class_map_names)):
-          class_nodes_ = np.where(self.task.node_class_label[:,i])[0]
-          dists.append(get_distance_node_list(gtG, source_nodes=class_nodes_, direction='to'))
-        self.task.dist_to_class = dists
-        a_, b_ = np.where(self.task.node_class_label)
-        self.task.class_nodes = np.concatenate((a_[:,np.newaxis], b_[:,np.newaxis]), axis=1)
-        
-        if self.logdir is not None:
-          self._debug_semantic_maps(seed)
-        
-        self.task.reset_kwargs = {'sampling': self.task_params.semantic_task.sampling,
-                                  'class_nodes': self.task.class_nodes,
-                                  'dist_to_class': self.task.dist_to_class}
-
-      if self.logdir is not None:
-        self._debug_save_map_nodes(seed)
-
-  def reset(self, rngs):
-    rng = rngs[0]; rng_perturb = rngs[1];
-    nodes = self.task.nodes
-    tp = self.task_params
-
-    start_node_ids, goal_node_ids, dists, target_class = \
-        _nav_env_reset_helper(tp.type, rng, self.task.nodes, tp.batch_size,
-                              self.task.gtG, tp.max_dist, tp.num_steps,
-                              tp.num_goals, tp.data_augment,
-                              **(self.task.reset_kwargs))
-
-    start_nodes = [tuple(nodes[_,:]) for _ in start_node_ids]
-    goal_nodes = [[tuple(nodes[_,:]) for _ in __] for __ in goal_node_ids]
-    data_augment = tp.data_augment
-    perturbs = _gen_perturbs(rng_perturb, tp.batch_size,
-                             (tp.num_steps+1)*tp.num_goals,
-                             data_augment.lr_flip, data_augment.delta_angle,
-                             data_augment.delta_xy, data_augment.structured)
-    perturbs = np.array(perturbs) # batch x steps x 4
-    end_perturbs = perturbs[:,-(tp.num_goals):,:]*1 # fixed perturb for the goal.
-    perturbs = perturbs[:,:-(tp.num_goals),:]*1
-
-    history = -np.ones((tp.batch_size, tp.num_steps*tp.num_goals), dtype=np.int32)
-    self.episode = utils.Foo(
-        start_nodes=start_nodes, start_node_ids=start_node_ids,
-        goal_nodes=goal_nodes, goal_node_ids=goal_node_ids, dist_to_goal=dists,
-        perturbs=perturbs, goal_perturbs=end_perturbs, history=history,
-        target_class=target_class, history_frames=[])
-    return start_node_ids
-
-  def take_action(self, current_node_ids, action, step_number):
-    """In addition to returning the action, also returns the reward that the
-    agent receives."""
-    goal_number = step_number / self.task_params.num_steps
-    new_node_ids = GridWorld.take_action(self, current_node_ids, action)
-    rewards = []
-    for i, n in enumerate(new_node_ids):
-      reward = 0
-      if n == self.episode.goal_node_ids[goal_number][i]:
-        reward = self.task_params.reward_at_goal
-      reward = reward - self.task_params.reward_time_penalty
-      rewards.append(reward)
-    return new_node_ids, rewards
-
-
-  def get_optimal_action(self, current_node_ids, step_number):
-    """Returns the optimal action from the current node."""
-    goal_number = step_number / self.task_params.num_steps
-    gtG = self.task.gtG
-    a = np.zeros((len(current_node_ids), self.task_params.num_actions), dtype=np.int32)
-    d_dict = self.episode.dist_to_goal[goal_number]
-    for i, c in enumerate(current_node_ids):
-      neigh = gtG.vertex(c).out_neighbours()
-      neigh_edge = gtG.vertex(c).out_edges()
-      ds = np.array([d_dict[i][int(x)] for x in neigh])
-      ds_min = np.min(ds)
-      for i_, e in enumerate(neigh_edge):
-        if ds[i_] == ds_min:
-          _ = gtG.ep['action'][e]
-          a[i, _] = 1
-    return a
-
-  def get_targets(self, current_node_ids, step_number):
-    """Returns the target actions from the current node."""
-    action = self.get_optimal_action(current_node_ids, step_number)
-    action = np.expand_dims(action, axis=1)
-    return vars(utils.Foo(action=action))
-
-  def get_targets_name(self):
-    """Returns the list of names of the targets."""
-    return ['action']
-
-  def cleanup(self):
-    self.episode = None
-
-class VisualNavigationEnv(NavigationEnv):
-  """Class for doing visual navigation in environments. Functions for computing
-  features on states, etc.
-  """
-  def __init__(self, robot, env, task_params, category_list=None,
-               building_name=None, flip=False, logdir=None,
-               building_loader=None, r_obj=None):
-    tt = utils.Timer()
-    tt.tic()
-    Building.__init__(self, building_name, robot, env, category_list,
-                      small=task_params.toy_problem, flip=flip, logdir=logdir,
-                      building_loader=building_loader)
-
-    self.set_r_obj(r_obj)
-    self.task_params = task_params
-    self.task = None
-    self.episode = None
-    self._preprocess_for_task(self.task_params.building_seed)
-    if hasattr(self.task_params, 'map_scales'):
-      self.task.scaled_maps = resize_maps(
-          self.traversible.astype(np.float32)*1, self.task_params.map_scales,
-          self.task_params.map_resize_method)
-    else:
-      logging.fatal('VisualNavigationEnv does not support scale_f anymore.')
-    self.task.readout_maps_scaled = resize_maps(
-      self.traversible.astype(np.float32)*1,
-      self.task_params.readout_maps_scales,
-      self.task_params.map_resize_method)
-    tt.toc(log_at=1, log_str='VisualNavigationEnv __init__: ')
-
-  def get_weight(self):
-    return self.task.nodes.shape[0]
-
-  def get_common_data(self):
-    goal_nodes = self.episode.goal_nodes
-    start_nodes = self.episode.start_nodes
-    perturbs = self.episode.perturbs
-    goal_perturbs = self.episode.goal_perturbs
-    target_class = self.episode.target_class
-
-    goal_locs = []; rel_goal_locs = [];
-    for i in range(len(goal_nodes)):
-      end_nodes = goal_nodes[i]
-      goal_loc, _, _, goal_theta = self.get_loc_axis(
-          np.array(end_nodes), delta_theta=self.task.delta_theta,
-          perturb=goal_perturbs[:,i,:])
-
-      # Compute the relative location to all goals from the starting location.
-      loc, _, _, theta = self.get_loc_axis(np.array(start_nodes),
-                                           delta_theta=self.task.delta_theta,
-                                           perturb=perturbs[:,0,:])
-      r_goal, t_goal = _get_relative_goal_loc(goal_loc*1., loc, theta)
-      rel_goal_loc = np.concatenate((r_goal*np.cos(t_goal), r_goal*np.sin(t_goal),
-                                     np.cos(goal_theta-theta),
-                                     np.sin(goal_theta-theta)), axis=1)
-      rel_goal_locs.append(np.expand_dims(rel_goal_loc, axis=1))
-      goal_locs.append(np.expand_dims(goal_loc, axis=1))
-
-    map = self.traversible*1.
-    maps = np.repeat(np.expand_dims(np.expand_dims(map, axis=0), axis=0),
-                     self.task_params.batch_size, axis=0)*1
-    if self.task_params.type[:14] == 'to_nearest_obj':
-      for i in range(self.task_params.batch_size):
-        maps[i,0,:,:] += 0.5*(self.task.class_maps_dilated[:,:,target_class[i]])
-
-    rel_goal_locs = np.concatenate(rel_goal_locs, axis=1)
-    goal_locs = np.concatenate(goal_locs, axis=1)
-    maps = np.expand_dims(maps, axis=-1)
-
-    if self.task_params.type[:14] == 'to_nearest_obj':
-      rel_goal_locs = np.zeros((self.task_params.batch_size, 1,
-                                len(self.task_params.semantic_task.class_map_names)),
-                               dtype=np.float32)
-      goal_locs = np.zeros((self.task_params.batch_size, 1, 2),
-                           dtype=np.float32)
-      for i in range(self.task_params.batch_size):
-          t = target_class[i]
-          rel_goal_locs[i,0,t] = 1.
-          goal_locs[i,0,0] = t
-          goal_locs[i,0,1] = np.NaN
-
-    return vars(utils.Foo(orig_maps=maps, goal_loc=goal_locs,
-                          rel_goal_loc_at_start=rel_goal_locs))
-
-  def pre_common_data(self, inputs):
-    return inputs
-
-
-  def get_features(self, current_node_ids, step_number):
-    task_params = self.task_params
-    goal_number = step_number / self.task_params.num_steps
-    end_nodes = self.task.nodes[self.episode.goal_node_ids[goal_number],:]*1
-    current_nodes = self.task.nodes[current_node_ids,:]*1
-    end_perturbs = self.episode.goal_perturbs[:,goal_number,:][:,np.newaxis,:]
-    perturbs = self.episode.perturbs
-    target_class = self.episode.target_class
-
-    # Append to history.
-    self.episode.history[:,step_number] = np.array(current_node_ids)
-
-    # Render out the images from current node.
-    outs = {}
-
-    if self.task_params.outputs.images:
-      imgs_all = []
-      imgs = self.render_nodes([tuple(x) for x in current_nodes],
-                               perturb=perturbs[:,step_number,:])
-      imgs_all.append(imgs)
-      aux_delta_thetas = self.task_params.aux_delta_thetas
-      for i in range(len(aux_delta_thetas)):
-        imgs = self.render_nodes([tuple(x) for x in current_nodes],
-                                 perturb=perturbs[:,step_number,:],
-                                 aux_delta_theta=aux_delta_thetas[i])
-        imgs_all.append(imgs)
-      imgs_all = np.array(imgs_all) # A x B x H x W x C
-      imgs_all = np.transpose(imgs_all, axes=[1,0,2,3,4])
-      imgs_all = np.expand_dims(imgs_all, axis=1) # B x N x A x H x W x C
-      if task_params.num_history_frames > 0:
-        if step_number == 0:
-          # Append the same frame 4 times
-          for i in range(task_params.num_history_frames+1):
-            self.episode.history_frames.insert(0, imgs_all*1.)
-        self.episode.history_frames.insert(0, imgs_all)
-        self.episode.history_frames.pop()
-        imgs_all_with_history = np.concatenate(self.episode.history_frames, axis=2)
-      else:
-        imgs_all_with_history = imgs_all
-      outs['imgs'] = imgs_all_with_history # B x N x A x H x W x C
-
-    if self.task_params.outputs.node_ids:
-      outs['node_ids'] = np.array(current_node_ids).reshape((-1,1,1))
-      outs['perturbs'] = np.expand_dims(perturbs[:,step_number, :]*1., axis=1)
-
-    if self.task_params.outputs.analytical_counts:
-      assert(self.task_params.modalities == ['depth'])
-      d = image_pre(outs['imgs']*1., self.task_params.modalities)
-      cm = get_camera_matrix(self.task_params.img_width,
-                             self.task_params.img_height,
-                             self.task_params.img_fov)
-      XYZ = get_point_cloud_from_z(100./d[...,0], cm)
-      XYZ = make_geocentric(XYZ*100., self.robot.sensor_height,
-                                      self.robot.camera_elevation_degree)
-      for i in range(len(self.task_params.analytical_counts.map_sizes)):
-        non_linearity = self.task_params.analytical_counts.non_linearity[i]
-        count, isvalid = bin_points(XYZ*1.,
-                                    map_size=self.task_params.analytical_counts.map_sizes[i],
-                                    xy_resolution=self.task_params.analytical_counts.xy_resolution[i],
-                                    z_bins=self.task_params.analytical_counts.z_bins[i])
-        assert(count.shape[2] == 1), 'only works for n_views equal to 1.'
-        count = count[:,:,0,:,:,:]
-        isvalid = isvalid[:,:,0,:,:,:]
-        if non_linearity == 'none':
-          None
-        elif non_linearity == 'min10':
-          count = np.minimum(count, 10.)
-        elif non_linearity == 'sqrt':
-          count = np.sqrt(count)
-        else:
-          logging.fatal('Undefined non_linearity.')
-        outs['analytical_counts_{:d}'.format(i)] = count
-
-    # Compute the goal location in the cordinate frame of the robot.
-    if self.task_params.outputs.rel_goal_loc:
-      if self.task_params.type[:14] != 'to_nearest_obj':
-        loc, _, _, theta = self.get_loc_axis(current_nodes,
-                                             delta_theta=self.task.delta_theta,
-                                             perturb=perturbs[:,step_number,:])
-        goal_loc, _, _, goal_theta = self.get_loc_axis(end_nodes,
-                                                       delta_theta=self.task.delta_theta,
-                                                       perturb=end_perturbs[:,0,:])
-        r_goal, t_goal = _get_relative_goal_loc(goal_loc, loc, theta)
-
-        rel_goal_loc = np.concatenate((r_goal*np.cos(t_goal), r_goal*np.sin(t_goal),
-                                       np.cos(goal_theta-theta),
-                                       np.sin(goal_theta-theta)), axis=1)
-        outs['rel_goal_loc'] = np.expand_dims(rel_goal_loc, axis=1)
-      elif self.task_params.type[:14] == 'to_nearest_obj':
-        rel_goal_loc = np.zeros((self.task_params.batch_size, 1,
-                                 len(self.task_params.semantic_task.class_map_names)),
-                                dtype=np.float32)
-        for i in range(self.task_params.batch_size):
-          t = target_class[i]
-          rel_goal_loc[i,0,t] = 1.
-        outs['rel_goal_loc'] = rel_goal_loc
-
-    # Location on map to plot the trajectory during validation.
-    if self.task_params.outputs.loc_on_map:
-      loc, x_axis, y_axis, theta = self.get_loc_axis(current_nodes,
-                                                     delta_theta=self.task.delta_theta,
-                                                     perturb=perturbs[:,step_number,:])
-      outs['loc_on_map'] = np.expand_dims(loc, axis=1)
-
-    # Compute gt_dist to goal
-    if self.task_params.outputs.gt_dist_to_goal:
-      gt_dist_to_goal = np.zeros((len(current_node_ids), 1), dtype=np.float32)
-      for i, n in enumerate(current_node_ids):
-        gt_dist_to_goal[i,0] = self.episode.dist_to_goal[goal_number][i][n]
-      outs['gt_dist_to_goal'] = np.expand_dims(gt_dist_to_goal, axis=1)
-
-    # Free space in front of you, map and goal as images.
-    if self.task_params.outputs.ego_maps:
-      loc, x_axis, y_axis, theta = self.get_loc_axis(current_nodes,
-                                                     delta_theta=self.task.delta_theta,
-                                                     perturb=perturbs[:,step_number,:])
-      maps = generate_egocentric_maps(self.task.scaled_maps,
-                                      self.task_params.map_scales,
-                                      self.task_params.map_crop_sizes, loc,
-                                      x_axis, y_axis, theta)
-
-      for i in range(len(self.task_params.map_scales)):
-        outs['ego_maps_{:d}'.format(i)] = \
-            np.expand_dims(np.expand_dims(maps[i], axis=1), axis=-1)
-
-    if self.task_params.outputs.readout_maps:
-      loc, x_axis, y_axis, theta = self.get_loc_axis(current_nodes,
-                                                     delta_theta=self.task.delta_theta,
-                                                     perturb=perturbs[:,step_number,:])
-      maps = generate_egocentric_maps(self.task.readout_maps_scaled,
-                                      self.task_params.readout_maps_scales,
-                                      self.task_params.readout_maps_crop_sizes,
-                                      loc, x_axis, y_axis, theta)
-      for i in range(len(self.task_params.readout_maps_scales)):
-        outs['readout_maps_{:d}'.format(i)] = \
-            np.expand_dims(np.expand_dims(maps[i], axis=1), axis=-1)
-
-    # Images for the goal.
-    if self.task_params.outputs.ego_goal_imgs:
-      if self.task_params.type[:14] != 'to_nearest_obj': 
-        loc, x_axis, y_axis, theta = self.get_loc_axis(current_nodes,
-                                                       delta_theta=self.task.delta_theta,
-                                                       perturb=perturbs[:,step_number,:])
-        goal_loc, _, _, _ = self.get_loc_axis(end_nodes,
-                                              delta_theta=self.task.delta_theta,
-                                              perturb=end_perturbs[:,0,:])
-        rel_goal_orientation = np.mod(
-            np.int32(current_nodes[:,2:] - end_nodes[:,2:]), self.task_params.n_ori)
-        goal_dist, goal_theta = _get_relative_goal_loc(goal_loc, loc, theta)
-        goals = generate_goal_images(self.task_params.map_scales,
-                                     self.task_params.map_crop_sizes,
-                                     self.task_params.n_ori, goal_dist,
-                                     goal_theta, rel_goal_orientation)
-        for i in range(len(self.task_params.map_scales)):
-          outs['ego_goal_imgs_{:d}'.format(i)] = np.expand_dims(goals[i], axis=1)
-
-      elif self.task_params.type[:14] == 'to_nearest_obj':
-        for i in range(len(self.task_params.map_scales)):
-          num_classes = len(self.task_params.semantic_task.class_map_names)
-          outs['ego_goal_imgs_{:d}'.format(i)] = np.zeros((self.task_params.batch_size, 1,
-                                                           self.task_params.map_crop_sizes[i],
-                                                           self.task_params.map_crop_sizes[i],
-                                                           self.task_params.goal_channels))
-        for i in range(self.task_params.batch_size):
-          t = target_class[i]
-          for j in range(len(self.task_params.map_scales)):
-            outs['ego_goal_imgs_{:d}'.format(j)][i,:,:,:,t] = 1.
-
-    # Incremental locs and theta (for map warping), always in the original scale
-    # of the map, the subequent steps in the tf code scale appropriately.
-    # Scaling is done by just multiplying incremental_locs appropriately.
-    if self.task_params.outputs.egomotion:
-      if step_number == 0:
-        # Zero Ego Motion
-        incremental_locs = np.zeros((self.task_params.batch_size, 1, 2), dtype=np.float32)
-        incremental_thetas = np.zeros((self.task_params.batch_size, 1, 1), dtype=np.float32)
-      else:
-        previous_nodes = self.task.nodes[self.episode.history[:,step_number-1], :]*1
-        loc, _, _, theta = self.get_loc_axis(current_nodes,
-                                             delta_theta=self.task.delta_theta,
-                                             perturb=perturbs[:,step_number,:])
-        previous_loc, _, _, previous_theta = self.get_loc_axis(
-            previous_nodes, delta_theta=self.task.delta_theta,
-            perturb=perturbs[:,step_number-1,:])
-
-        incremental_locs_ = np.reshape(loc-previous_loc, [self.task_params.batch_size, 1, -1])
-
-        t = -np.pi/2+np.reshape(theta*1, [self.task_params.batch_size, 1, -1])
-        incremental_locs = incremental_locs_*1
-        incremental_locs[:,:,0] = np.sum(incremental_locs_ *
-                                         np.concatenate((np.cos(t), np.sin(t)),
-                                                        axis=-1), axis=-1)
-        incremental_locs[:,:,1] = np.sum(incremental_locs_ *
-                                         np.concatenate((np.cos(t+np.pi/2),
-                                                         np.sin(t+np.pi/2)),
-                                                        axis=-1), axis=-1)
-        incremental_thetas = np.reshape(theta-previous_theta,
-                                        [self.task_params.batch_size, 1, -1])
-      outs['incremental_locs'] = incremental_locs
-      outs['incremental_thetas'] = incremental_thetas
-
-    if self.task_params.outputs.visit_count:
-      # Output the visit count for this state, how many times has the current
-      # state been visited, and how far in the history was the last visit
-      # (except this one)
-      visit_count = np.zeros((self.task_params.batch_size, 1), dtype=np.int32)
-      last_visit = -np.ones((self.task_params.batch_size, 1), dtype=np.int32)
-      if step_number >= 1:
-        h = self.episode.history[:,:(step_number)]
-        visit_count[:,0] = np.sum(h == np.array(current_node_ids).reshape([-1,1]),
-                                  axis=1)
-        last_visit[:,0] = np.argmax(h[:,::-1] == np.array(current_node_ids).reshape([-1,1]),
-                                    axis=1) + 1
-        last_visit[visit_count == 0] = -1 # -1 if not visited.
-      outs['visit_count'] = np.expand_dims(visit_count, axis=1)
-      outs['last_visit'] = np.expand_dims(last_visit, axis=1)
-    return outs
-
-  def get_features_name(self):
-    f = []
-    if self.task_params.outputs.images:
-      f.append('imgs')
-    if self.task_params.outputs.rel_goal_loc:
-      f.append('rel_goal_loc')
-    if self.task_params.outputs.loc_on_map:
-      f.append('loc_on_map')
-    if self.task_params.outputs.gt_dist_to_goal:
-      f.append('gt_dist_to_goal')
-    if self.task_params.outputs.ego_maps:
-      for i in range(len(self.task_params.map_scales)):
-        f.append('ego_maps_{:d}'.format(i))
-    if self.task_params.outputs.readout_maps:
-      for i in range(len(self.task_params.readout_maps_scales)):
-        f.append('readout_maps_{:d}'.format(i))
-    if self.task_params.outputs.ego_goal_imgs:
-      for i in range(len(self.task_params.map_scales)):
-        f.append('ego_goal_imgs_{:d}'.format(i))
-    if self.task_params.outputs.egomotion:
-      f.append('incremental_locs')
-      f.append('incremental_thetas')
-    if self.task_params.outputs.visit_count:
-      f.append('visit_count')
-      f.append('last_visit')
-    if self.task_params.outputs.analytical_counts:
-      for i in range(len(self.task_params.analytical_counts.map_sizes)):
-        f.append('analytical_counts_{:d}'.format(i))
-    if self.task_params.outputs.node_ids:
-      f.append('node_ids')
-      f.append('perturbs')
-    return f
-
-  def pre_features(self, inputs):
-    if self.task_params.outputs.images:
-      inputs['imgs'] = image_pre(inputs['imgs'], self.task_params.modalities)
-    return inputs
-
-class BuildingMultiplexer():
-  def __init__(self, args, task_number):
-    params = vars(args)
-    for k in params.keys():
-      setattr(self, k, params[k])
-    self.task_number = task_number
-    self._pick_data(task_number)
-    logging.info('Env Class: %s.', self.env_class)
-    if self.task_params.task == 'planning':
-      self._setup_planner()
-    elif self.task_params.task == 'mapping':
-      self._setup_mapper()
-    elif self.task_params.task == 'map+plan':
-      self._setup_mapper()
-    else:
-      logging.error('Undefined task: %s'.format(self.task_params.task))
-
-  def _pick_data(self, task_number):
-    logging.error('Input Building Names: %s', self.building_names)
-    self.flip = [np.mod(task_number / len(self.building_names), 2) == 1]
-    id = np.mod(task_number, len(self.building_names))
-    self.building_names = [self.building_names[id]]
-    self.task_params.building_seed = task_number
-    logging.error('BuildingMultiplexer: Picked Building Name: %s', self.building_names)
-    self.building_names = self.building_names[0].split('+')
-    self.flip = [self.flip[0] for _ in self.building_names]
-    logging.error('BuildingMultiplexer: Picked Building Name: %s', self.building_names)
-    logging.error('BuildingMultiplexer: Flipping Buildings: %s', self.flip)
-    logging.error('BuildingMultiplexer: Set building_seed: %d', self.task_params.building_seed)
-    self.num_buildings = len(self.building_names)
-    logging.error('BuildingMultiplexer: Num buildings: %d', self.num_buildings)
-
-  def _setup_planner(self):
-    # Load building env class.
-    self.buildings = []
-    for i, building_name in enumerate(self.building_names):
-      b = self.env_class(robot=self.robot, env=self.env,
-                         task_params=self.task_params,
-                         building_name=building_name, flip=self.flip[i],
-                         logdir=self.logdir, building_loader=self.dataset)
-      self.buildings.append(b)
-
-  def _setup_mapper(self):
-    # Set up the renderer.
-    cp = self.camera_param
-    rgb_shader, d_shader = sru.get_shaders(cp.modalities)
-    r_obj = SwiftshaderRenderer()
-    r_obj.init_display(width=cp.width, height=cp.height, fov=cp.fov,
-                       z_near=cp.z_near, z_far=cp.z_far, rgb_shader=rgb_shader,
-                       d_shader=d_shader)
-    self.r_obj = r_obj
-    r_obj.clear_scene()
-
-    # Load building env class.
-    self.buildings = []
-    wt = []
-    for i, building_name in enumerate(self.building_names):
-      b = self.env_class(robot=self.robot, env=self.env,
-                         task_params=self.task_params,
-                         building_name=building_name, flip=self.flip[i],
-                         logdir=self.logdir, building_loader=self.dataset,
-                         r_obj=r_obj)
-      wt.append(b.get_weight())
-      b.load_building_into_scene()
-      b.set_building_visibility(False)
-      self.buildings.append(b)
-    wt = np.array(wt).astype(np.float32)
-    wt = wt / np.sum(wt+0.0001)
-    self.building_sampling_weights = wt
-
-  def sample_building(self, rng):
-    if self.num_buildings == 1:
-      building_id = rng.choice(range(len(self.building_names)))
-    else:
-      building_id = rng.choice(self.num_buildings,
-                               p=self.building_sampling_weights)
-    b = self.buildings[building_id]
-    instances = b._gen_rng(rng)
-    self._building_id = building_id
-    return self.buildings[building_id], instances
-
-  def sample_env(self, rngs):
-    rng = rngs[0];
-    if self.num_buildings == 1:
-      building_id = rng.choice(range(len(self.building_names)))
-    else:
-      building_id = rng.choice(self.num_buildings,
-                               p=self.building_sampling_weights)
-    return self.buildings[building_id]
-
-  def pre(self, inputs):
-    return self.buildings[self._building_id].pre(inputs)
-  
-  def __del__(self):
-    self.r_obj.clear_scene()
-    logging.error('Clearing scene.')