google-deepmind
diff --git a/‎box_arrangement/README.md
Lines changed: 106 additions & 0 deletions b/‎box_arrangement/README.md
Lines changed: 106 additions & 0 deletions
diff --git a/‎box_arrangement/__init__.py
Lines changed: 13 additions & 0 deletions b/‎box_arrangement/__init__.py
Lines changed: 13 additions & 0 deletions
diff --git a/‎box_arrangement/dmlab_assets.py
Lines changed: 82 additions & 0 deletions b/‎box_arrangement/dmlab_assets.py
Lines changed: 82 additions & 0 deletions
diff --git a/‎box_arrangement/explore.py
Lines changed: 41 additions & 0 deletions b/‎box_arrangement/explore.py
Lines changed: 41 additions & 0 deletions
@@ -0,0 +1,106 @@
+# Predicate tasks.
+
+This package contains tasks associated with "Behavior Priors for Efficient
+Reinforcement Learning" (https://arxiv.org/abs/2010.14274), "Exploiting Hierarchy
+for Learning and Transfer in KL-Regularized RL" (https://arxiv.org/abs/1903.07438)
+and "Information asymmetry in KL-regularized RL"
+(https://arxiv.org/abs/1905.01240).
+This is research code, and has dependencies on more stable code that is
+available as part of [`dm_control`], in particular upon components in
+[`dm_control.locomotion`] and [`dm_control.manipulation`].
+
+To get access to preconfigured python environments for the tasks, see the
+`task_examples.py` file. To use the MuJoCo interactive viewer (from dm_control)
+to load the environments, see `explore.py`.
+
+<p float="left">
+  <img src="tasks.png" height="200">
+</p>
+
+## Installation instructions
+
+1.  Download [MuJoCo Pro](https://mujoco.org/) and extract the zip archive as
+    `~/.mujoco/mujoco200_$PLATFORM` where `$PLATFORM` is one of `linux`,
+    `macos`, or `win64`.
+
+2.  Ensure that a valid MuJoCo license key file is located at
+    `~/.mujoco/mjkey.txt`.
+
+3.  Clone the `deepmind-research` repository:
+
+    ```shell
+       git clone https://github.com/deepmind/deepmind-research.git
+       cd deepmind-research
+    ```
+
+4.  Create and activate a Python virtual environment:
+
+    ```shell
+       python3 -m virtualenv box_arrangement
+       source box_arrangement/bin/activate
+    ```
+
+5.  Install the package:
+
+    ```shell
+       pip install ./box_arrangement
+    ```
+
+## Quickstart
+
+To instantiate and step through the "go to one of K targets" task:
+
+```python
+from box_arrangement import task_examples
+import numpy as np
+
+# Build an example environment.
+env = task_examples.go_to_k_targets()
+
+# Get the `action_spec` describing the control inputs.
+action_spec = env.action_spec()
+
+# Step through the environment for one episode with random actions.
+time_step = env.reset()
+while not time_step.last():
+  action = np.random.uniform(action_spec.minimum, action_spec.maximum,
+                             size=action_spec.shape)
+  time_step = env.step(action)
+  print("reward = {}, discount = {}, observations = {}.".format(
+      time_step.reward, time_step.discount, time_step.observation))
+```
+
+The above code snippet can also be used for other tasks by replacing
+`go_to_k_targets` with one of (`move_box`, `move_box_or_gtt` and
+`move_box_and_gtt`).
+
+## Visualization
+
+[`dm_control.viewer`] can be used to visualize and interact with the
+environment. We provide the `explore.py` script specifically for this. If you
+followed our installation instructions above, this can be launched for the
+"go to one of K targets" task via:
+
+```shell
+python3 -m box_arrangement.explore --task='go_to_target'
+```
+
+## Citation
+
+If you use the code or data in this package, please cite:
+
+```
+@misc{tirumala2020behavior,
+      title={Behavior Priors for Efficient Reinforcement Learning},
+      author={Dhruva Tirumala and Alexandre Galashov and Hyeonwoo Noh and Leonard Hasenclever and Razvan Pascanu and Jonathan Schwarz and Guillaume Desjardins and Wojciech Marian Czarnecki and Arun Ahuja and Yee Whye Teh and Nicolas Heess},
+      year={2020},
+      eprint={2010.14274},
+      archivePrefix={arXiv},
+      primaryClass={cs.AI}
+}
+```
+
+[`dm_control`]: https://github.com/deepmind/dm_control
+[`dm_control.locomotion`]: https://github.com/deepmind/dm_control/tree/master/dm_control/locomotion
+[`dm_control.manipulation`]: https://github.com/deepmind/dm_control/tree/master/dm_control/manipulation
+[`dm_control.viewer`]: https://github.com/deepmind/dm_control/tree/master/dm_control/viewer
@@ -0,0 +1,13 @@
+# Copyright 2021 DeepMind Technologies Limited
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
@@ -0,0 +1,82 @@
+# Copyright 2018 Deepmind Technologies Limited.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""DeepMind Lab textures."""
+
+from dm_control import composer
+from dm_control import mjcf
+from labmaze import assets as labmaze_assets
+
+
+class SkyBox(composer.Entity):
+  """Represents a texture asset for the sky box."""
+
+  def _build(self, style):
+    labmaze_textures = labmaze_assets.get_sky_texture_paths(style)
+    self._mjcf_root = mjcf.RootElement(model='dmlab_' + style)
+    self._texture = self._mjcf_root.asset.add(
+        'texture', type='skybox', name='texture',
+        fileleft=labmaze_textures.left, fileright=labmaze_textures.right,
+        fileup=labmaze_textures.up, filedown=labmaze_textures.down,
+        filefront=labmaze_textures.front, fileback=labmaze_textures.back)
+
+  @property
+  def mjcf_model(self):
+    return self._mjcf_root
+
+  @property
+  def texture(self):
+    return self._texture
+
+
+class WallTextures(composer.Entity):
+  """Represents wall texture assets."""
+
+  def _build(self, style):
+    labmaze_textures = labmaze_assets.get_wall_texture_paths(style)
+    self._mjcf_root = mjcf.RootElement(model='dmlab_' + style)
+    self._textures = []
+    for texture_name, texture_path in labmaze_textures.items():
+      self._textures.append(self._mjcf_root.asset.add(
+          'texture', type='2d', name=texture_name,
+          file=texture_path.format(texture_name)))
+
+  @property
+  def mjcf_model(self):
+    return self._mjcf_root
+
+  @property
+  def textures(self):
+    return self._textures
+
+
+class FloorTextures(composer.Entity):
+  """Represents floor texture assets."""
+
+  def _build(self, style):
+    labmaze_textures = labmaze_assets.get_floor_texture_paths(style)
+    self._mjcf_root = mjcf.RootElement(model='dmlab_' + style)
+    self._textures = []
+    for texture_name, texture_path in labmaze_textures.items():
+      self._textures.append(self._mjcf_root.asset.add(
+          'texture', type='2d', name=texture_name,
+          file=texture_path.format(texture_name)))
+
+  @property
+  def mjcf_model(self):
+    return self._mjcf_root
+
+  @property
+  def textures(self):
+    return self._textures
@@ -0,0 +1,41 @@
+# Copyright 2020 Deepmind Technologies Limited.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Simple script to launch viewer with an example environment."""
+
+from absl import app
+from absl import flags
+from dm_control import viewer
+from box_arrangement import task_examples
+
+FLAGS = flags.FLAGS
+flags.DEFINE_enum('task', 'go_to_target', [
+    'go_to_target', 'move_box', 'move_box_or_go_to_target',
+    'move_box_and_go_to_target'
+], 'The task to visualize.')
+
+
+TASKS = {
+    'go_to_target': task_examples.go_to_k_targets,
+    'move_box': task_examples.move_box,
+    'move_box_or_go_to_target': task_examples.move_box_or_gtt,
+    'move_box_and_go_to_target': task_examples.move_box_and_gtt,
+}
+
+
+def main(unused_argv):
+  viewer.launch(environment_loader=TASKS[FLAGS.task])
+
+if __name__ == '__main__':
+  app.run(main)