From 76dc2f9a43d2f88ef46d964d9c01c1ee80f4b086 Mon Sep 17 00:00:00 2001 From: younik <42100908+younik@users.noreply.github.com> Date: Mon, 5 Feb 2024 01:02:11 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Farama-F?= =?UTF-8?q?oundation/Minari@7d85164c8aa03970c2a4221a6f1a712f1cc4d304=20?= =?UTF-8?q?=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- main/.buildinfo | 2 +- .../tutorials_python.zip | Bin 57239 -> 57239 bytes .../tutorials_jupyter.zip | Bin 77441 -> 77441 bytes .../minari/dataset/minari_dataset/index.html | 2 +- .../minari/storage/hosting/index.html | 17 ++--- main/_modules/minari/storage/local/index.html | 8 ++- main/_modules/minari/utils/index.html | 61 ++++++++++-------- .../datasets/antmaze/large-diverse/index.html | 8 +-- main/datasets/antmaze/large-play/index.html | 8 +-- .../antmaze/medium-diverse/index.html | 8 +-- main/datasets/antmaze/medium-play/index.html | 8 +-- .../datasets/antmaze/umaze-diverse/index.html | 8 +-- main/datasets/antmaze/umaze/index.html | 8 +-- main/datasets/door/cloned/index.html | 8 +-- main/datasets/door/expert/index.html | 8 +-- main/datasets/door/human/index.html | 8 +-- main/datasets/hammer/cloned/index.html | 8 +-- main/datasets/hammer/expert/index.html | 8 +-- main/datasets/hammer/human/index.html | 8 +-- main/datasets/kitchen/complete/index.html | 8 +-- main/datasets/kitchen/mixed/index.html | 8 +-- main/datasets/kitchen/partial/index.html | 8 +-- .../minigrid/fourrooms-random/index.html | 10 +-- main/datasets/minigrid/fourrooms/index.html | 10 +-- main/datasets/pen/cloned/index.html | 8 +-- main/datasets/pen/expert/index.html | 8 +-- main/datasets/pen/human/index.html | 8 +-- .../datasets/pointmaze/large-dense/index.html | 8 +-- main/datasets/pointmaze/large/index.html | 8 +-- .../pointmaze/medium-dense/index.html | 8 +-- main/datasets/pointmaze/medium/index.html | 8 +-- main/datasets/pointmaze/open-dense/index.html | 8 +-- main/datasets/pointmaze/open/index.html | 8 +-- .../datasets/pointmaze/umaze-dense/index.html | 8 +-- main/datasets/pointmaze/umaze/index.html | 8 +-- main/datasets/relocate/cloned/index.html | 8 +-- main/datasets/relocate/expert/index.html | 8 +-- main/datasets/relocate/human/index.html | 8 +-- main/searchindex.js | 2 +- 39 files changed, 84 insertions(+), 260 deletions(-) diff --git a/main/.buildinfo b/main/.buildinfo index eda4c395..c797ebf9 100644 --- a/main/.buildinfo +++ b/main/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: b9d761ee5ebfc4251fffc3fe599f90db +config: 537f759ee94890a29d327e4405df44e6 tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/main/_downloads/315c4c52fb68082a731b192d944e2ede/tutorials_python.zip b/main/_downloads/315c4c52fb68082a731b192d944e2ede/tutorials_python.zip index 47636b5f4914641808891a45b3b4f7aaadb608b4..e48471e1b067e3088a81173cf3e7fd6cea216b13 100644 GIT binary patch delta 99 zcmbQfpLzOzX5IjAW)=|!5MbhP-N@_b%?zYB$9c~e1u-@y9_I%OoGMr-31;MVl?HMS|&R_oBe`=X?HO+Vy@A0L=*}0RR91 diff --git a/main/_downloads/a5659940aa3f8f568547d47752a43172/tutorials_jupyter.zip b/main/_downloads/a5659940aa3f8f568547d47752a43172/tutorials_jupyter.zip index 47bd9d86205c5fcfed0ebd566cf1df1c00358629..32da457dff795517e3f96d4e57e77dd5e15f054d 100644 GIT binary patch delta 105 zcmZp?%hGt4g*U*PnMH&F1Z+86H}ZyrFazn$DIpPxV8;H^)#6}AZZEGovjb47c8g;L kNM!m!9Y(O?=@Pn(F<_B$UB*~2TK9X-ZS0J)_bUH||9 delta 105 zcmZp?%hGt4g*U*PnMH&F1Xe6|+{hae!VIK0r-Vc(f*JcuSBrxgxxKvV%qxLXwObr3 lKqAu*>M(*8PnXbTi~)<3>oUfI8P|0ggFuR>>*z6t0sxy+C2jx! diff --git a/main/_modules/minari/dataset/minari_dataset/index.html b/main/_modules/minari/dataset/minari_dataset/index.html index eaf75c72..f8e02a83 100644 --- a/main/_modules/minari/dataset/minari_dataset/index.html +++ b/main/_modules/minari/dataset/minari_dataset/index.html @@ -450,7 +450,7 @@

Source code for minari.dataset.minari_dataset

if isinstance(data, MinariStorage): self._data = data elif isinstance(data, (str, os.PathLike)): - self._data = MinariStorage(data) + self._data = MinariStorage.read(data) else: raise ValueError(f"Unrecognized type {type(data)} for data") diff --git a/main/_modules/minari/storage/hosting/index.html b/main/_modules/minari/storage/hosting/index.html index 4a6fe052..c53b5ccb 100644 --- a/main/_modules/minari/storage/hosting/index.html +++ b/main/_modules/minari/storage/hosting/index.html @@ -362,17 +362,18 @@

Source code for minari.storage.hosting

 
 import glob
 import importlib.metadata
+import json
 import os
 import warnings
 from typing import Dict, List
 
-import h5py
-from google.cloud import storage  # pyright: ignore [reportGeneralTypeIssues]
+from google.cloud import storage
 from gymnasium import logger
 from packaging.specifiers import SpecifierSet
-from tqdm.auto import tqdm  # pyright: ignore [reportMissingModuleSource]
+from tqdm.auto import tqdm
 
 from minari.dataset.minari_dataset import parse_dataset_id
+from minari.dataset.minari_storage import METADATA_FILE_NAME
 from minari.storage.datasets_root_dir import get_dataset_path
 from minari.storage.local import load_dataset
 
@@ -401,12 +402,6 @@ 

Source code for minari.storage.hosting

             else:
                 remote_path = os.path.join(gcs_path, local_file[1 + len(local_path) :])
                 blob = bucket.blob(remote_path)
-                # add metadata to main data file of dataset
-                if blob.name.endswith("main_data.hdf5"):
-                    with h5py.File(
-                        local_file, "r"
-                    ) as file:  # TODO: remove h5py when migrating to JSON metadata
-                        blob.metadata = file.attrs
                 blob.upload_from_filename(local_file)
 
     file_path = get_dataset_path(dataset_id)
@@ -596,8 +591,8 @@ 

Source code for minari.storage.hosting

     remote_datasets = {}
     for blob in blobs:
         try:
-            if blob.name.endswith("main_data.hdf5"):
-                metadata = blob.metadata
+            if blob.name.endswith(METADATA_FILE_NAME):
+                metadata = json.loads(blob.download_as_string(client=None))
                 if compatible_minari_version and __version__ not in SpecifierSet(
                     metadata["minari_version"]
                 ):
diff --git a/main/_modules/minari/storage/local/index.html b/main/_modules/minari/storage/local/index.html
index c86ba35f..76c9c81c 100644
--- a/main/_modules/minari/storage/local/index.html
+++ b/main/_modules/minari/storage/local/index.html
@@ -361,6 +361,7 @@ 

Source code for minari.storage.local

 import importlib.metadata
 import os
 import shutil
+import warnings
 from typing import Dict, Union
 
 from packaging.specifiers import SpecifierSet
@@ -433,7 +434,12 @@ 

Source code for minari.storage.local

             continue
 
         data_path = os.path.join(datasets_path, dst_id, "data")
-        metadata = MinariStorage(data_path).metadata
+        try:
+            metadata = MinariStorage.read(data_path).metadata
+        except Exception as e:
+            warnings.warn(f"Misconfigured dataset named {dst_id}: {e}")
+            continue
+
         if ("minari_version" not in metadata) or (
             compatible_minari_version
             and __version__ not in SpecifierSet(metadata["minari_version"])
diff --git a/main/_modules/minari/utils/index.html b/main/_modules/minari/utils/index.html
index 8aa75324..7032a6c8 100644
--- a/main/_modules/minari/utils/index.html
+++ b/main/_modules/minari/utils/index.html
@@ -372,6 +372,7 @@ 

Source code for minari.utils

 import portion as P
 from gymnasium.core import ActType, ObsType
 from gymnasium.envs.registration import EnvSpec
+from gymnasium.error import NameNotFound
 from gymnasium.wrappers.record_episode_statistics import RecordEpisodeStatistics
 from packaging.specifiers import InvalidSpecifier, SpecifierSet
 from packaging.version import Version
@@ -971,18 +972,23 @@ 

Source code for minari.utils

 
 def get_env_spec_dict(env_spec: EnvSpec) -> Dict[str, str]:
     """Create dict of the environment specs, including observation and action space."""
-    env = gym.make(env_spec.id)
-
-    action_space_table = env.action_space.__repr__().replace("\n", "")
-    observation_space_table = env.observation_space.__repr__().replace("\n", "")
-
-    md_dict = {
-        "ID": env_spec.id,
-        "Observation Space": f"`{re.sub(' +', ' ', observation_space_table)}`",
-        "Action Space": f"`{re.sub(' +', ' ', action_space_table)}`",
+    try:
+        env = gym.make(env_spec.id)
+        action_space_table = env.action_space.__repr__().replace("\n", "")
+        observation_space_table = env.observation_space.__repr__().replace("\n", "")
+    except NameNotFound:
+        action_space_table, observation_space_table = None, None
+
+    md_dict = {"ID": env_spec.id}
+    if observation_space_table is not None:
+        md_dict["Observation Space"] = f"`{re.sub(' +', ' ', observation_space_table)}`"
+    if action_space_table is not None:
+        md_dict["Action Space"] = f"`{re.sub(' +', ' ', action_space_table)}`"
+
+    md_dict.update({
         "entry_point": f"`{env_spec.entry_point}`",
-        "max_episode_steps": env_spec.max_episode_steps,
-        "reward_threshold": env_spec.reward_threshold,
+        "max_episode_steps": str(env_spec.max_episode_steps),
+        "reward_threshold": str(env_spec.reward_threshold),
         "nondeterministic": f"`{env_spec.nondeterministic}`",
         "order_enforce": f"`{env_spec.order_enforce}`",
         "autoreset": f"`{env_spec.autoreset}`",
@@ -990,7 +996,7 @@ 

Source code for minari.utils

         "kwargs": f"`{env_spec.kwargs}`",
         "additional_wrappers": f"`{env_spec.additional_wrappers}`",
         "vector_entry_point": f"`{env_spec.vector_entry_point}`",
-    }
+    })
 
     return {k: str(v) for k, v in md_dict.items()}
 
@@ -1001,29 +1007,32 @@ 

Source code for minari.utils

 ) -> Dict[str, str]:
     """Create dict of the dataset specs, including observation and action space."""
     code_link = dataset_spec["code_permalink"]
-    action_space = dataset_spec["action_space"]
-    obs_space = dataset_spec["observation_space"]
+    action_space = dataset_spec.get("action_space")
+    obs_space = dataset_spec.get("observation_space")
+    version = dataset_spec['minari_version']
 
-    dataset_action_space = action_space.__repr__().replace("\n", "")
-    dataset_observation_space = obs_space.__repr__().replace("\n", "")
+    md_dict = {
+        "Total Steps": str(dataset_spec["total_steps"]),
+        "Total Episodes": str(dataset_spec["total_episodes"]),
+    }
 
-    version = str(dataset_spec['minari_version'])
+    if obs_space is not None:
+        dataset_observation_space = obs_space.__repr__().replace("\n", "")
+        md_dict["Dataset Observation Space"] = f"`{dataset_observation_space}`"
 
-    if print_version:
-        version += f" ({__version__} installed)"
+    if action_space is not None:
+        dataset_action_space = action_space.__repr__().replace("\n", "")
+        md_dict["Dataset Action Space"] = f"`{dataset_action_space}`"
 
-    md_dict = {
-        "Total steps": dataset_spec["total_steps"],
-        "Total Episodes": dataset_spec["total_episodes"],
-        "Dataset Observation Space": f"`{dataset_observation_space}`",
-        "Dataset Action Space": f"`{dataset_action_space}`",
+    add_version = f" ({__version__} installed)"
+    md_dict.update({
         "Algorithm": dataset_spec["algorithm_name"],
         "Author": dataset_spec["author"],
         "Email": dataset_spec["author_email"],
         "Code Permalink": f"[{code_link}]({code_link})",
-        "Minari Version": version,
+        "Minari Version": f"{version} {add_version if print_version else ''}",
         "Download": f"`minari.download_dataset(\"{dataset_spec['dataset_id']}\")`"
-    }
+    })
 
     return md_dict
 
diff --git a/main/datasets/antmaze/large-diverse/index.html b/main/datasets/antmaze/large-diverse/index.html index 63d0a196..1b87502a 100644 --- a/main/datasets/antmaze/large-diverse/index.html +++ b/main/datasets/antmaze/large-diverse/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

1000

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [27], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [8], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

QIteration+SAC

diff --git a/main/datasets/antmaze/large-play/index.html b/main/datasets/antmaze/large-play/index.html index e506a5da..95fac9e5 100644 --- a/main/datasets/antmaze/large-play/index.html +++ b/main/datasets/antmaze/large-play/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

1000

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [27], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [8], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

QIteration+SAC

diff --git a/main/datasets/antmaze/medium-diverse/index.html b/main/datasets/antmaze/medium-diverse/index.html index 7c0e4f9d..8b7f196c 100644 --- a/main/datasets/antmaze/medium-diverse/index.html +++ b/main/datasets/antmaze/medium-diverse/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

1000

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [27], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [8], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

QIteration+SAC

diff --git a/main/datasets/antmaze/medium-play/index.html b/main/datasets/antmaze/medium-play/index.html index 0009f619..add6b629 100644 --- a/main/datasets/antmaze/medium-play/index.html +++ b/main/datasets/antmaze/medium-play/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

1000

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [27], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [8], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

QIteration+SAC

diff --git a/main/datasets/antmaze/umaze-diverse/index.html b/main/datasets/antmaze/umaze-diverse/index.html index ba30c8cd..eb9d291f 100644 --- a/main/datasets/antmaze/umaze-diverse/index.html +++ b/main/datasets/antmaze/umaze-diverse/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

1433

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [27], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [8], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

QIteration+SAC

diff --git a/main/datasets/antmaze/umaze/index.html b/main/datasets/antmaze/umaze/index.html index 54cb6d73..fac0d372 100644 --- a/main/datasets/antmaze/umaze/index.html +++ b/main/datasets/antmaze/umaze/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

1433

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [27], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [8], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

QIteration+SAC

diff --git a/main/datasets/door/cloned/index.html b/main/datasets/door/cloned/index.html index 5c8354cf..2c72d08d 100644 --- a/main/datasets/door/cloned/index.html +++ b/main/datasets/door/cloned/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

4358

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [39], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [28], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/door/expert/index.html b/main/datasets/door/expert/index.html index 6bb98147..2f37f8f5 100644 --- a/main/datasets/door/expert/index.html +++ b/main/datasets/door/expert/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

5000

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [39], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [28], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/door/human/index.html b/main/datasets/door/human/index.html index 21bc17fc..d65a95c6 100644 --- a/main/datasets/door/human/index.html +++ b/main/datasets/door/human/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

6729

Total Episodes

25

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [39], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [28], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/hammer/cloned/index.html b/main/datasets/hammer/cloned/index.html index e2c2ccd4..85cfd0e7 100644 --- a/main/datasets/hammer/cloned/index.html +++ b/main/datasets/hammer/cloned/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

3606

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [46], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [26], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/hammer/expert/index.html b/main/datasets/hammer/expert/index.html index df60408f..9eb9958f 100644 --- a/main/datasets/hammer/expert/index.html +++ b/main/datasets/hammer/expert/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

5000

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [46], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [26], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/hammer/human/index.html b/main/datasets/hammer/human/index.html index 1ca61ee3..7ff772b0 100644 --- a/main/datasets/hammer/human/index.html +++ b/main/datasets/hammer/human/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

11310

Total Episodes

25

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [46], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [26], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/kitchen/complete/index.html b/main/datasets/kitchen/complete/index.html index fe985c97..ef716c1f 100644 --- a/main/datasets/kitchen/complete/index.html +++ b/main/datasets/kitchen/complete/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

4209

Total Episodes

19

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Dict", "subspaces": {"kettle": {"type": "Box", "dtype": "float64", "shape": [7], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}, "light switch": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "microwave": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}, "slide cabinet": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}}}, "desired_goal": {"type": "Dict", "subspaces": {"kettle": {"type": "Box", "dtype": "float64", "shape": [7], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}, "light switch": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "microwave": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}, "slide cabinet": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}}}, "observation": {"type": "Box", "dtype": "float64", "shape": [59], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float64", "shape": [9], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/kitchen/mixed/index.html b/main/datasets/kitchen/mixed/index.html index 656395e9..2cc1f92d 100644 --- a/main/datasets/kitchen/mixed/index.html +++ b/main/datasets/kitchen/mixed/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

156560

Total Episodes

621

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Dict", "subspaces": {"bottom burner": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "kettle": {"type": "Box", "dtype": "float64", "shape": [7], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}, "light switch": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "microwave": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}}}, "desired_goal": {"type": "Dict", "subspaces": {"bottom burner": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "kettle": {"type": "Box", "dtype": "float64", "shape": [7], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}, "light switch": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "microwave": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}}}, "observation": {"type": "Box", "dtype": "float64", "shape": [59], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float64", "shape": [9], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/kitchen/partial/index.html b/main/datasets/kitchen/partial/index.html index 7219cbb3..b3c03e71 100644 --- a/main/datasets/kitchen/partial/index.html +++ b/main/datasets/kitchen/partial/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

156560

Total Episodes

621

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Dict", "subspaces": {"kettle": {"type": "Box", "dtype": "float64", "shape": [7], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}, "light switch": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "microwave": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}, "slide cabinet": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}}}, "desired_goal": {"type": "Dict", "subspaces": {"kettle": {"type": "Box", "dtype": "float64", "shape": [7], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}, "light switch": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "microwave": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}, "slide cabinet": {"type": "Box", "dtype": "float64", "shape": [1], "low": [-Infinity], "high": [Infinity]}}}, "observation": {"type": "Box", "dtype": "float64", "shape": [59], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float64", "shape": [9], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/minigrid/fourrooms-random/index.html b/main/datasets/minigrid/fourrooms-random/index.html index 9c0d3c5c..25218223 100644 --- a/main/datasets/minigrid/fourrooms-random/index.html +++ b/main/datasets/minigrid/fourrooms-random/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000033

Total Episodes

10181

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"direction": {"type": "Discrete", "dtype": "int64", "start": 0, "n": 4}, "image": {"type": "Box", "dtype": "uint8", "shape": [7, 7, 3], "low": [[[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]]], "high": [[[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]]]}, "mission": {"type": "Text", "max_length": 14, "min_length": 1, "charset": "                                                              \'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'(),,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdeeeffghijklmnnoopqrrssttuvwxyzz{}"}}}'

- -

Dataset Action Space

-

'{"type": "Discrete", "dtype": "int64", "start": 0, "n": 7}'

-

Algorithm

RandomPolicy

@@ -435,7 +429,7 @@

Environment Specs

Observation Space

-

Dict('direction': Discrete(4), 'image': Box(0, 255, (7, 7, 3), uint8), 'mission': MissionSpace(<function FourRoomsEnv._gen_mission at 0x7f836964c4c0>, None))

+

Dict('direction': Discrete(4), 'image': Box(0, 255, (7, 7, 3), uint8), 'mission': MissionSpace(<function FourRoomsEnv._gen_mission at 0x7f8c7a4e7f70>, None))

Action Space

Discrete(7)

diff --git a/main/datasets/minigrid/fourrooms/index.html b/main/datasets/minigrid/fourrooms/index.html index 8f714838..cf5025b8 100644 --- a/main/datasets/minigrid/fourrooms/index.html +++ b/main/datasets/minigrid/fourrooms/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

10010

Total Episodes

590

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"direction": {"type": "Discrete", "dtype": "int64", "start": 0, "n": 4}, "image": {"type": "Box", "dtype": "uint8", "shape": [7, 7, 3], "low": [[[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0], [0, 0, 0]]], "high": [[[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]], [[255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255], [255, 255, 255]]]}, "mission": {"type": "Text", "max_length": 14, "min_length": 1, "charset": "                                                              \'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'\'(),,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdeeeffghijklmnnoopqrrssttuvwxyzz{}"}}}'

- -

Dataset Action Space

-

'{"type": "Discrete", "dtype": "int64", "start": 0, "n": 7}'

-

Algorithm

ExpertPolicy

@@ -435,7 +429,7 @@

Environment Specs

Observation Space

-

Dict('direction': Discrete(4), 'image': Box(0, 255, (7, 7, 3), uint8), 'mission': MissionSpace(<function FourRoomsEnv._gen_mission at 0x7f836964c4c0>, None))

+

Dict('direction': Discrete(4), 'image': Box(0, 255, (7, 7, 3), uint8), 'mission': MissionSpace(<function FourRoomsEnv._gen_mission at 0x7f8c7a4e7f70>, None))

Action Space

Discrete(7)

diff --git a/main/datasets/pen/cloned/index.html b/main/datasets/pen/cloned/index.html index 2f863b2a..372e32ed 100644 --- a/main/datasets/pen/cloned/index.html +++ b/main/datasets/pen/cloned/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

500000

Total Episodes

3736

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [45], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [24], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/pen/expert/index.html b/main/datasets/pen/expert/index.html index 0cd15b32..08fd71f2 100644 --- a/main/datasets/pen/expert/index.html +++ b/main/datasets/pen/expert/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

499206

Total Episodes

4958

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [45], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [24], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/pen/human/index.html b/main/datasets/pen/human/index.html index 3386a84f..4f63c250 100644 --- a/main/datasets/pen/human/index.html +++ b/main/datasets/pen/human/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

5000

Total Episodes

25

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [45], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [24], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/pointmaze/large-dense/index.html b/main/datasets/pointmaze/large-dense/index.html index d0bcf39c..abc8768b 100644 --- a/main/datasets/pointmaze/large-dense/index.html +++ b/main/datasets/pointmaze/large-dense/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

3322

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [4], "low": [-Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [2], "low": [-1.0, -1.0], "high": [1.0, 1.0]}'

-

Algorithm

QIteration

diff --git a/main/datasets/pointmaze/large/index.html b/main/datasets/pointmaze/large/index.html index 84f519f1..c811fe71 100644 --- a/main/datasets/pointmaze/large/index.html +++ b/main/datasets/pointmaze/large/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

3325

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [4], "low": [-Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [2], "low": [-1.0, -1.0], "high": [1.0, 1.0]}'

-

Algorithm

QIteration

diff --git a/main/datasets/pointmaze/medium-dense/index.html b/main/datasets/pointmaze/medium-dense/index.html index dfd76492..af13f7de 100644 --- a/main/datasets/pointmaze/medium-dense/index.html +++ b/main/datasets/pointmaze/medium-dense/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

4765

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [4], "low": [-Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [2], "low": [-1.0, -1.0], "high": [1.0, 1.0]}'

-

Algorithm

QIteration

diff --git a/main/datasets/pointmaze/medium/index.html b/main/datasets/pointmaze/medium/index.html index f424ad69..bfb50ce1 100644 --- a/main/datasets/pointmaze/medium/index.html +++ b/main/datasets/pointmaze/medium/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

4778

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [4], "low": [-Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [2], "low": [-1.0, -1.0], "high": [1.0, 1.0]}'

-

Algorithm

QIteration

diff --git a/main/datasets/pointmaze/open-dense/index.html b/main/datasets/pointmaze/open-dense/index.html index b82e4c3d..8977922d 100644 --- a/main/datasets/pointmaze/open-dense/index.html +++ b/main/datasets/pointmaze/open-dense/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

9637

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [4], "low": [-Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [2], "low": [-1.0, -1.0], "high": [1.0, 1.0]}'

-

Algorithm

QIteration

diff --git a/main/datasets/pointmaze/open/index.html b/main/datasets/pointmaze/open/index.html index 0e4ed211..c860fad2 100644 --- a/main/datasets/pointmaze/open/index.html +++ b/main/datasets/pointmaze/open/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

9609

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [4], "low": [-Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [2], "low": [-1.0, -1.0], "high": [1.0, 1.0]}'

-

Algorithm

QIteration

diff --git a/main/datasets/pointmaze/umaze-dense/index.html b/main/datasets/pointmaze/umaze-dense/index.html index ff2aa72a..21583a17 100644 --- a/main/datasets/pointmaze/umaze-dense/index.html +++ b/main/datasets/pointmaze/umaze-dense/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

13289

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [4], "low": [-Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [2], "low": [-1.0, -1.0], "high": [1.0, 1.0]}'

-

Algorithm

QIteration

diff --git a/main/datasets/pointmaze/umaze/index.html b/main/datasets/pointmaze/umaze/index.html index 6c611893..ff2d2a71 100644 --- a/main/datasets/pointmaze/umaze/index.html +++ b/main/datasets/pointmaze/umaze/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

13289

-

Dataset Observation Space

-

'{"type": "Dict", "subspaces": {"achieved_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "desired_goal": {"type": "Box", "dtype": "float64", "shape": [2], "low": [-Infinity, -Infinity], "high": [Infinity, Infinity]}, "observation": {"type": "Box", "dtype": "float64", "shape": [4], "low": [-Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity]}}}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [2], "low": [-1.0, -1.0], "high": [1.0, 1.0]}'

-

Algorithm

QIteration

diff --git a/main/datasets/relocate/cloned/index.html b/main/datasets/relocate/cloned/index.html index 2133b9e0..e47cec89 100644 --- a/main/datasets/relocate/cloned/index.html +++ b/main/datasets/relocate/cloned/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

3758

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [39], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [30], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/relocate/expert/index.html b/main/datasets/relocate/expert/index.html index 156bd177..18aab73a 100644 --- a/main/datasets/relocate/expert/index.html +++ b/main/datasets/relocate/expert/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

1000000

Total Episodes

5000

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [39], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [30], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/datasets/relocate/human/index.html b/main/datasets/relocate/human/index.html index e08d10e5..2655e491 100644 --- a/main/datasets/relocate/human/index.html +++ b/main/datasets/relocate/human/index.html @@ -375,18 +375,12 @@

Dataset Specs

Total steps

+

Total Steps

9942

Total Episodes

25

-

Dataset Observation Space

-

'{"type": "Box", "dtype": "float64", "shape": [39], "low": [-Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity, -Infinity], "high": [Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity, Infinity]}'

- -

Dataset Action Space

-

'{"type": "Box", "dtype": "float32", "shape": [30], "low": [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0], "high": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0]}'

-

Algorithm

None

diff --git a/main/searchindex.js b/main/searchindex.js index 540b66d5..61fa7b6e 100644 --- a/main/searchindex.js +++ b/main/searchindex.js @@ -1 +1 @@ -Search.setIndex({"docnames": ["404", "README", "api/data_collector", "api/data_collector_callbacks/episode_metadata_callback", "api/data_collector_callbacks/step_data_callback", "api/minari_dataset/episode_data", "api/minari_dataset/minari_dataset", "api/minari_functions", "content/basic_usage", "content/dataset_standards", "content/minari_cli", "datasets/antmaze", "datasets/antmaze/large-diverse", "datasets/antmaze/large-play", "datasets/antmaze/medium-diverse", "datasets/antmaze/medium-play", "datasets/antmaze/umaze", "datasets/antmaze/umaze-diverse", "datasets/door", "datasets/door/cloned", "datasets/door/expert", "datasets/door/human", "datasets/hammer", "datasets/hammer/cloned", "datasets/hammer/expert", "datasets/hammer/human", "datasets/kitchen", "datasets/kitchen/complete", "datasets/kitchen/mixed", "datasets/kitchen/partial", "datasets/minigrid", "datasets/minigrid/fourrooms", "datasets/minigrid/fourrooms-random", "datasets/pen", "datasets/pen/cloned", "datasets/pen/expert", "datasets/pen/human", "datasets/pointmaze", "datasets/pointmaze/large", "datasets/pointmaze/large-dense", "datasets/pointmaze/medium", "datasets/pointmaze/medium-dense", "datasets/pointmaze/open", "datasets/pointmaze/open-dense", "datasets/pointmaze/umaze", "datasets/pointmaze/umaze-dense", "datasets/relocate", "datasets/relocate/cloned", "datasets/relocate/expert", "datasets/relocate/human", "index", "release_notes/index", "tutorials/dataset_creation/README", "tutorials/dataset_creation/custom_space_serialization", "tutorials/dataset_creation/index", "tutorials/dataset_creation/observation_space_subseting", "tutorials/dataset_creation/point_maze_dataset", "tutorials/index", "tutorials/using_datasets/IQL_torchrl", "tutorials/using_datasets/README", "tutorials/using_datasets/behavioral_cloning", "tutorials/using_datasets/index"], "filenames": ["404.md", "README.md", "api/data_collector.md", "api/data_collector_callbacks/episode_metadata_callback.md", "api/data_collector_callbacks/step_data_callback.md", "api/minari_dataset/episode_data.md", "api/minari_dataset/minari_dataset.md", "api/minari_functions.md", "content/basic_usage.md", "content/dataset_standards.md", "content/minari_cli.md", "datasets/antmaze.md", "datasets/antmaze/large-diverse.md", "datasets/antmaze/large-play.md", "datasets/antmaze/medium-diverse.md", "datasets/antmaze/medium-play.md", "datasets/antmaze/umaze.md", "datasets/antmaze/umaze-diverse.md", "datasets/door.md", "datasets/door/cloned.md", "datasets/door/expert.md", "datasets/door/human.md", "datasets/hammer.md", "datasets/hammer/cloned.md", "datasets/hammer/expert.md", "datasets/hammer/human.md", "datasets/kitchen.md", "datasets/kitchen/complete.md", "datasets/kitchen/mixed.md", "datasets/kitchen/partial.md", "datasets/minigrid.md", "datasets/minigrid/fourrooms.md", "datasets/minigrid/fourrooms-random.md", "datasets/pen.md", "datasets/pen/cloned.md", "datasets/pen/expert.md", "datasets/pen/human.md", "datasets/pointmaze.md", "datasets/pointmaze/large.md", "datasets/pointmaze/large-dense.md", "datasets/pointmaze/medium.md", "datasets/pointmaze/medium-dense.md", "datasets/pointmaze/open.md", "datasets/pointmaze/open-dense.md", "datasets/pointmaze/umaze.md", "datasets/pointmaze/umaze-dense.md", "datasets/relocate.md", "datasets/relocate/cloned.md", "datasets/relocate/expert.md", "datasets/relocate/human.md", "index.md", "release_notes/index.md", "tutorials/dataset_creation/README.rst", "tutorials/dataset_creation/custom_space_serialization.rst", "tutorials/dataset_creation/index.rst", "tutorials/dataset_creation/observation_space_subseting.rst", "tutorials/dataset_creation/point_maze_dataset.rst", "tutorials/index.rst", "tutorials/using_datasets/IQL_torchrl.rst", "tutorials/using_datasets/README.rst", "tutorials/using_datasets/behavioral_cloning.rst", "tutorials/using_datasets/index.rst"], "titles": ["404 - Page Not Found", "Minari documentation", "DataCollector", "EpisodeMetadataCallback", "StepDataCallback", "EpisodeData", "MinariDataset", "Minari", "Basic Usage", "Dataset Standards", "Minari CLI", "Ant Maze", "Large-Diverse", "Large-Play", "Medium-Diverse", "Medium-Play", "Umaze", "Umaze-Diverse", "Door", "Cloned", "Expert", "Human", "Hammer", "Cloned", "Expert", "Human", "Kitchen", "Complete", "Mixed", "Partial", "MiniGrid", "Fourrooms", "Fourrooms-Random", "Pen", "Cloned", "Expert", "Human", "Point Maze", "Large", "Large-Dense", "Medium", "Medium-Dense", "Open", "Open-Dense", "Umaze", "Umaze-Dense", "Relocate", "Cloned", "Expert", "Human", "<no title>", "Release Notes", "Dataset Creation", "Serializing a custom space", "Dataset Creation", "Collecting a subset of a dictionary space with StepDataCallback", "PointMaze D4RL dataset", "Tutorials", "Implicit Q-Learning with TorchRL", "Using Datasets", "Behavioral cloning with PyTorch", "Using Datasets"], "terms": {"thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "folder": [1, 60], "contain": [1, 2, 3, 4, 5, 7, 9, 11, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 37, 42, 43, 44, 45, 47, 48, 49, 51], "For": [1, 7, 8, 9, 51, 53, 56, 60], "more": [1, 3, 8, 9, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 56, 58], "inform": [1, 2, 4, 6, 51, 56], "about": [1, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53], "how": [1, 2, 9, 51, 53, 55, 56, 58, 60], "contribut": [1, 8, 51, 56], "go": [1, 56], "our": [1, 8, 9, 10, 51, 55, 56, 58, 60], "md": [1, 51], "instal": [1, 2, 7, 10, 50, 51, 53, 58, 60], "requir": [1, 9, 10, 51, 53, 55, 56, 58, 60], "packag": [1, 10, 51, 60], "git": [1, 8], "clone": [1, 8, 10, 18, 22, 33, 46, 50, 51, 57, 58, 61], "http": [1, 8, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 53, 56, 60], "github": [1, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56], "com": [1, 8, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56], "farama": [1, 7, 8, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 56, 58, 60], "foundat": [1, 8, 51, 53, 56], "cd": [1, 8], "pip": [1, 8, 10, 50, 53, 58, 60], "e": [1, 6, 7, 8, 51, 58], "r": [1, 12, 13, 14, 15, 16, 17, 56, 58], "doc": [1, 51, 53, 56], "txt": 1, "To": [1, 2, 8, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 58, 60], "onc": [1, 8, 56, 58, 60], "make": [1, 2, 6, 8, 9, 51, 53, 55, 56, 58, 60], "dirhtml": 1, "rebuild": 1, "automat": [1, 2, 51], "everi": [1, 7, 8, 9, 16, 56, 58], "time": [1, 2, 7, 8, 56], "chang": [1, 50, 51, 56], "i": [1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 30, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 58, 60], "made": [1, 51], "sphinx": 1, "autobuild": 1, "b": [1, 10, 50], "_build": 1, "class": [2, 3, 4, 5, 6, 9, 51, 55, 56, 58, 60], "env": [2, 4, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58, 60], "step_data_callback": [2, 55, 56], "type": [2, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 53, 58, 60], "stepdatacallback": [2, 9, 51, 54, 57], "episode_metadata_callback": [2, 3], "episodemetadatacallback": [2, 9, 51], "record_info": [2, 8, 9, 56], "bool": [2, 4, 6, 7, 9, 51, 58], "fals": [2, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 53, 55, 56, 58, 60], "max_buffer_step": [2, 8], "int": [2, 5, 6, 7, 51, 56], "none": [2, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56], "observation_spac": [2, 7, 9, 51, 53, 55, 60], "action_spac": [2, 7, 8, 9, 51, 53, 55, 56, 60], "sourc": [2, 3, 4, 5, 6, 7, 8, 51, 53, 55, 56, 57, 58, 60], "gymnasium": [2, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "environ": [2, 4, 5, 6, 7, 9, 10, 11, 18, 22, 26, 30, 33, 37, 46, 50, 51, 53, 55, 56, 60], "wrapper": [2, 3, 8, 9, 51, 53, 56, 58, 60], "collect": [2, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 54, 57, 58], "step": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "data": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 26, 30, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 53, 58, 60], "meant": [2, 51], "work": [2, 8, 51, 58], "temporari": [2, 8, 51, 56], "buffer": [2, 6, 7, 8, 51], "befor": [2, 8, 53, 56, 58], "creat": [2, 4, 6, 9, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 51, 53, 55, 58, 60], "dataset": [2, 3, 4, 5, 6, 50, 51, 53, 55, 58], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 56, 60], "creation": [2, 51], "convert": [2, 56, 58], "agnost": [2, 58], "user": [2, 8, 9, 51], "import": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58], "gym": [2, 4, 6, 7, 8, 51, 53, 55, 56, 58, 60], "envid": 2, "reset": [2, 5, 8, 9, 12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 55, 56, 58, 60], "_": [2, 8, 53, 55, 56, 58, 60], "rang": [2, 7, 8, 51, 53, 55, 56, 58, 60], "num_step": [2, 9], "action": [2, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58, 60], "sampl": [2, 6, 9, 50, 51, 53, 55, 58], "ob": [2, 4, 8, 9, 51, 56, 60], "rew": [2, 4, 8, 9, 51, 56, 60], "termin": [2, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 37, 51, 53, 55, 56, 58, 60], "truncat": [2, 4, 5, 6, 7, 8, 9, 37, 51, 53, 55, 56, 58, 60], "info": [2, 4, 5, 8, 9, 51, 56, 60], "create_dataset": [2, 8, 51, 53, 55, 56, 60], "dataset_id": [2, 7, 8, 9, 51, 53, 55, 56, 58, 60], "env_nam": [2, 7, 9], "dataset_nam": [2, 7, 8, 9, 56], "v": [2, 7, 9, 10, 26, 58], "version": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55, 56], "kwarg": [2, 4, 6, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55], "some": [2, 8, 9, 10, 51, 53, 56, 58], "characterist": [2, 56], "store": [2, 7, 8, 9, 51, 55, 58], "per": [2, 51], "episod": [2, 3, 5, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "dictionari": [2, 4, 6, 7, 8, 9, 51, 54, 56, 57, 58], "ar": [2, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 46, 47, 48, 49, 50, 51, 53, 56, 58], "memori": [2, 8, 51], "global": [2, 9, 56], "list": [2, 6, 8, 9, 50, 51, 58, 60], "item": [2, 6, 7, 56, 58, 60], "valu": [2, 4, 5, 6, 7, 8, 9, 38, 40, 42, 44, 51, 56, 58], "main": [2, 6, 51, 53, 56, 58], "observ": [2, 4, 5, 6, 7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "kei": [2, 4, 7, 8, 9, 10, 55, 56, 58], "can": [2, 3, 4, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "anoth": [2, 4, 8, 9, 18, 22, 33, 46, 56, 58], "nest": [2, 4, 6, 7, 9, 51], "extra": [2, 3, 4, 8, 9, 51, 56], "separ": [2, 8, 51], "ad": [2, 4, 6, 7, 8, 9, 38, 39, 40, 41, 42, 43, 44, 45, 51, 55], "pass": [2, 3, 6, 7, 8, 55, 58], "custom": [2, 3, 8, 9, 51, 54, 56, 57], "when": [2, 6, 8, 9, 12, 13, 14, 15, 16, 17, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 55, 56, 58], "hdf5": [2, 3, 10, 50, 51, 55, 56], "file": [2, 3, 8, 10, 50, 51, 55], "gener": [2, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 56], "new": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 56, 58, 60], "group": [2, 3, 7, 8, 9, 10, 51, 56], "A": [2, 9, 26, 50, 56, 58], "call": [2, 4, 8, 9, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49], "return": [2, 4, 5, 6, 7, 8, 9, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 40, 42, 44, 47, 48, 49, 51, 53, 55, 56, 58, 60], "If": [2, 6, 7, 8, 9, 10, 51, 53, 56, 58], "previou": [2, 8, 51], "wa": [2, 6, 7, 9, 11, 18, 22, 30, 31, 32, 33, 46, 51, 53], "perform": [2, 7, 8, 10, 26, 28, 29, 56, 58, 60], "cach": [2, 8, 51, 58], "set": [2, 6, 8, 9, 11, 12, 13, 14, 15, 16, 17, 56, 58, 60], "max_buffer_episod": 2, "save": [2, 3, 9, 51, 53, 55, 56, 58, 60], "disk": [2, 8, 9, 51, 53, 55, 60], "non": [2, 8, 9, 11, 37], "move": [2, 8, 26, 37, 46, 51, 56], "from": [2, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "perman": [2, 8], "locat": [2, 8, 11, 12, 13, 14, 15, 16, 17, 37, 38, 39, 40, 41, 42, 43, 44, 45, 56, 58], "onli": [2, 7, 8, 9, 37, 38, 40, 42, 43, 44, 55, 58], "all": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 26, 27, 51, 53, 57, 58, 60], "us": [2, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58, 60], "save_to_disk": 2, "path_to_permanent_loc": 2, "initi": [2, 5, 6, 7, 8, 9, 51, 53, 55, 56, 58, 60], "collector": [2, 56], "attribut": [2, 3, 7, 8, 9, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 51], "directori": [2, 8, 9, 58], "paramet": [2, 3, 4, 6, 7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 58, 60], "option": [2, 4, 6, 7, 8, 9, 10, 51], "callback": [2, 3, 4, 51, 55, 56], "edit": [2, 4], "updat": [2, 8, 51, 56, 58], "databefor": 2, "default": [2, 3, 4, 6, 7, 8, 58], "add": [2, 3, 4, 6, 9, 10, 38, 39, 40, 41, 42, 43, 44, 45, 51, 56, 58], "metadata": [2, 3, 6, 7, 8, 10, 51, 55], "true": [2, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56, 58, 60], "record": [2, 8, 9, 51, 55, 56], "each": [2, 3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55, 56, 58, 60], "number": [2, 5, 6, 7, 8, 9, 10, 51], "dump": [2, 53], "rais": [2, 7], "valueerror": 2, "t": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 51, 53, 55, 56, 58], "same": [2, 6, 7, 8, 9, 16, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 51, 56, 58], "self": [2, 3, 4, 6, 9, 55, 56, 60], "acttyp": [2, 7], "tupl": [2, 9, 51, 56, 58], "obstyp": [2, 7], "supportsfloat": 2, "dict": [2, 3, 4, 5, 6, 7, 9, 12, 13, 14, 15, 16, 17, 27, 28, 29, 31, 32, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 55], "str": [2, 4, 6, 7, 9, 53], "ani": [2, 4, 5, 6, 7, 8, 9, 55, 56], "seed": [2, 5, 6, 7, 8, 9, 51, 53, 55, 56, 58, 60], "one": [2, 5, 6, 8, 18, 22, 33, 37, 46, 51, 58], "reproduc": [2, 8, 30, 58, 60], "unless": 2, "minari_autose": 2, "": [2, 3, 4, 6, 7, 8, 9, 10, 12, 13, 14, 15, 17, 26, 51, 53, 55, 56, 58, 60], "prng": 2, "specifi": [2, 6, 7, 8, 9, 51, 58], "addit": [2, 4, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "disabl": 2, "state": [2, 9, 26, 37, 56, 58], "auxiliari": 2, "complement": 2, "eval_env": [2, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "envspec": [2, 7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "algorithm_nam": [2, 7, 8, 9, 53, 55, 56, 60], "author": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 56, 60], "author_email": [2, 7, 8, 9, 51, 53, 56, 60], "code_permalink": [2, 7, 8, 9, 53, 56, 60], "ref_min_scor": [2, 7], "float": [2, 7, 55, 58], "ref_max_scor": [2, 7], "expert_polici": [2, 7], "callabl": [2, 6, 7, 8, 51, 53], "num_episodes_average_scor": [2, 7], "100": [2, 7, 8, 10, 34, 35, 36, 50, 51, 58], "minari_vers": [2, 7, 9, 51], "wrap": [2, 8, 51, 56, 58], "correspond": [2, 7, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 56, 60], "name": [2, 7, 8, 9, 10, 50, 51, 53, 60], "syntax": [2, 7, 9], "follow": [2, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 56, 58], "where": [2, 7, 9, 26, 29, 51, 56, 58], "identifi": [2, 7, 9], "load": [2, 8, 9, 51, 53, 58, 60], "load_dataset": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 60], "id": [2, 5, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 56, 60], "union": [2, 6, 7, 53], "spec": [2, 6, 7, 9, 51, 53, 58], "evalu": [2, 6, 7, 8, 51, 58, 60], "after": [2, 3, 5, 7, 9, 10, 51, 56, 60], "recov": [2, 6, 7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 58], "minaridataset": [2, 5, 7, 8, 9, 51, 60], "recover_environ": [2, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 60], "should": [2, 6, 7, 53, 55], "algorithm": [2, 7, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 58], "email": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51], "link": [2, 7, 8, 9], "relev": [2, 7, 8, 9], "code": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 57, 58, 60], "minimum": [2, 7, 8, 9, 51], "refer": [2, 7, 51], "score": [2, 58], "averag": [2, 7, 58], "random": [2, 6, 7, 8, 9, 13, 15, 17, 30, 37, 38, 39, 40, 41, 42, 43, 44, 45, 53, 55, 56, 58, 60], "polici": [2, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 26, 30, 31, 32, 33, 34, 35, 37, 46, 47, 48, 56, 58], "later": [2, 7, 51, 58], "normal": [2, 58], "get_normalized_scor": [2, 7, 51], "estim": [2, 7, 58], "maximum": [2, 7, 9, 56, 58, 60], "hypothet": [2, 7], "expert": [2, 7, 8, 9, 10, 11, 18, 19, 22, 23, 30, 31, 33, 34, 46, 47, 50, 51, 58, 60], "comput": [2, 7, 8, 9, 58], "over": [2, 6, 7, 8, 56, 58], "equal": [2, 7, 8, 9], "compat": [2, 7, 8, 9, 10, 51, 60], "close": [2, 26, 56, 58, 60], "clear": [2, 8], "full": [3, 9, 30, 31, 51, 58], "overridden": [3, 4, 7, 51], "statist": [3, 9], "datacollector": [3, 8, 9, 51, 53, 55, 56, 60], "argument": [3, 4, 7, 8, 9, 51], "todo": 3, "__call__": [3, 4, 9, 55, 56], "overrid": [3, 4, 9, 10, 56], "an": [3, 6, 7, 8, 9, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 43, 46, 47, 48, 49, 51, 53, 56, 58], "reward": [4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 22, 33, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 51, 58, 60], "stepdata": [4, 9], "input": [4, 6, 8, 9, 58, 60], "belong": 4, "transit": [4, 51, 56, 58], "customstepdatacallback": 4, "def": [4, 9, 53, 55, 56, 58, 60], "step_data": [4, 9, 55, 56], "super": [4, 9, 55, 56, 60], "environment_st": 4, "pose": [4, 56], "posit": [4, 9, 26, 30, 46, 56, 58], "orient": [4, 33, 55], "veloc": [4, 37, 56], "current": [4, 7, 10, 50, 51, 56, 58], "must": [4, 6, 7, 8, 9, 51, 58], "step_data_kei": 4, "total_step": [5, 6, 9, 51, 56, 60], "ndarrai": [5, 6, 7, 9, 51], "singl": [5, 7, 8, 9, 10, 58], "object": [5, 6, 8, 9, 18, 22, 26, 30, 33, 46, 51, 53, 58, 60], "sample_episod": [5, 6, 8, 9, 51, 55], "api": [5, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 56, 60], "final": [5, 6, 7, 8, 11, 51, 53, 55, 56, 58], "includ": [5, 6, 7, 9, 26, 27, 29, 37, 51, 58], "mean": [5, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 56, 58], "increas": 5, "compar": [5, 55], "taken": [5, 38, 39, 40, 41, 42, 43, 44, 45, 55], "minaristorag": [6, 51], "pathlik": 6, "episode_indic": [6, 8], "get": [6, 7, 8, 10, 51, 53, 55, 56, 58, 60], "properti": [6, 58], "np": [6, 7, 9, 51, 55, 56, 58, 60], "slice": 6, "indic": [6, 8, 51], "point": [6, 51, 55, 58], "n_episod": [6, 8], "iter": [6, 8, 9, 11, 37, 56, 58], "episodedata": [6, 8, 51], "n": [6, 8, 9, 10, 31, 32, 56, 60], "iterate_episod": [6, 8, 51], "filter_episod": [6, 8, 9, 51], "condit": [6, 8, 9, 51, 58], "filter": [6, 9, 50, 51], "which": [6, 7, 8, 9, 11, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 55, 56, 58, 60], "take": [6, 9, 53, 56], "instanc": [6, 51], "retutrn": 6, "met": 6, "otherwis": [6, 8, 38, 40, 42, 44, 51], "lambda": [6, 8, 51, 53, 56], "x": [6, 37, 56, 60], "1": [6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 55, 58, 60], "function": [6, 7, 8, 9, 10, 31, 32, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 56, 58, 60], "certain": [6, 8, 33], "set_se": [6, 8, 58], "intend": 6, "other": [6, 7, 9, 10, 26, 29, 51, 55, 56, 58], "you": [6, 8, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58, 60], "want": [6, 8, 10, 56], "update_dataset_from_buff": 6, "have": [6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 53, 55, 56, 58, 60], "shape": [6, 7, 9, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55, 56, 58, 60], "total_episode_step": [6, 7], "observation_shap": [6, 7], "action_shap": [6, 7], "long": [6, 7, 26, 56], "total": [6, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 56, 58], "total_episod": [6, 8, 9, 51, 60], "avail": [6, 7, 8, 9, 10, 50, 51, 53, 58], "within": [6, 9, 51, 58], "create_dataset_from_buff": [7, 8, 51], "space": [7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 54, 56, 57, 58, 60], "latter": [7, 58], "also": [7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 50, 51, 53, 55, 56, 58], "note": [7, 9, 12, 13, 14, 15, 16, 17, 55, 56, 58], "assign": [7, 9], "valid": [7, 55, 56, 58], "than": [7, 8, 12, 13, 14, 15, 16, 17, 51, 58], "retriev": [7, 8, 51], "local": [7, 8, 9, 50, 51, 53, 55, 58, 60], "databas": [7, 10], "found": [7, 9], "split_dataset": [7, 8, 51], "size": [7, 8, 51, 56, 58], "multipl": [7, 8, 9, 10, 51, 58], "result": [7, 9, 51, 53, 56], "download_dataset": [7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "force_download": [7, 51], "remot": [7, 9, 10, 50, 51], "server": [7, 8, 10, 50, 58], "error": [7, 51, 53, 56, 58], "skip": [7, 58], "continu": [7, 8, 9, 37, 38, 39, 40, 41, 42, 43, 44, 45, 56], "match": 7, "boolean": 7, "flag": [7, 51, 58], "forc": [7, 10, 37, 56], "list_local_dataset": [7, 8, 51, 55], "latest_vers": 7, "compatible_minari_vers": 7, "latest": [7, 10, 51, 56], "door": [7, 8, 9, 10, 19, 20, 21, 26, 50, 51], "human": [7, 8, 9, 10, 18, 19, 22, 23, 33, 34, 46, 47, 50, 51, 58, 60], "v0": [7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 30, 31, 32, 50, 53, 56], "v1": [7, 8, 9, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 58, 60], "list_remote_dataset": [7, 8, 51], "delete_dataset": [7, 53, 55], "combine_dataset": [7, 8, 51], "datasets_to_combin": [7, 51], "new_dataset_id": [7, 51], "its": [7, 51, 53, 56, 58], "own": [7, 8, 10, 51, 56], "combined_dataset": 7, "were": [7, 8, 9, 10, 18, 22, 26, 33, 37, 46, 51], "form": [7, 56], "newli": [7, 8, 58], "undiscount": [7, 9], "origin": [7, 8, 18, 22, 26, 33, 37, 46, 51, 53, 58], "provid": [7, 8, 9, 11, 12, 14, 18, 19, 20, 21, 22, 23, 24, 25, 33, 34, 35, 36, 46, 47, 48, 49, 50, 51, 58], "d4rl": [7, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 54, 57], "repositori": [7, 9, 18, 20, 21, 22, 24, 25, 26, 33, 36, 46, 48, 49], "facilit": [7, 8, 51], "comparison": 7, "across": [7, 9], "differ": [7, 8, 9, 37, 51, 53, 56, 58], "task": [7, 8, 11, 18, 22, 26, 29, 33, 38, 39, 40, 41, 42, 43, 44, 45, 46, 56, 58, 60], "between": [7, 9, 39, 41, 43, 45, 56], "0": [7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 53, 55, 56, 58, 60], "calcul": [7, 58], "These": [7, 9, 10, 18, 22, 26, 33, 37, 46, 51, 56], "two": [7, 8, 9, 10, 18, 22, 33, 37, 46, 51, 58, 60], "respect": [7, 9, 56, 58], "formula": [7, 56], "_score": 7, "frac": 7, "ref": 7, "_min": 7, "_max": 7, "util": [7, 8, 50, 58, 60], "under": [7, 9, 37, 50, 51, 58], "test": [7, 8, 9, 11, 51, 55], "now": [7, 9, 51, 53, 55, 56, 60], "arrai": [7, 9, 56], "normalized_scor": 7, "standard": [8, 51, 58], "host": [8, 10, 18, 22, 26, 33, 46, 50], "interfac": [8, 9], "offlin": [8, 9, 10, 50, 51, 56, 58, 60], "reinforc": [8, 10, 11, 18, 22, 26, 30, 33, 37, 46, 50, 56], "learn": [8, 10, 11, 18, 22, 26, 30, 33, 37, 46, 50, 51, 53, 55, 56, 57, 60, 61], "applic": 8, "most": [8, 10], "rl": [8, 18, 20, 22, 24, 33, 35, 46, 48, 51, 58, 60], "handl": [8, 50], "capabl": 8, "recent": [8, 58], "librari": [8, 50, 51, 53, 60], "run": [8, 18, 19, 22, 23, 33, 34, 46, 47, 51, 58], "command": [8, 10, 51, 60], "d": [8, 58], "like": [8, 10, 53, 58, 60], "start": [8, 9, 31, 32, 53, 55, 56, 58, 60], "pleas": [8, 10, 51, 55], "project": [8, 9, 51], "we": [8, 9, 10, 30, 51, 53, 55, 56, 58, 60], "support": [8, 51, 53, 56, 58], "python": [8, 9, 50, 51, 53, 55, 56, 57, 58, 60], "3": [8, 9, 10, 11, 27, 28, 29, 31, 32, 53, 58], "8": [8, 11, 12, 13, 14, 15, 16, 17, 37, 51, 56], "linux": 8, "maco": 8, "abstract": 8, "process": [8, 51, 56, 58], "achiev": [8, 9, 56, 60], "intern": [8, 51], "schedul": [8, 51], "amount": [8, 56], "while": [8, 9, 51, 53, 55, 56, 58, 60], "veri": 8, "simpl": [8, 9, 51, 56, 58, 60], "cartpol": [8, 51, 60], "100000": 8, "In": [8, 9, 51, 53, 55, 56, 58, 60], "exampl": [8, 9, 10, 51, 53, 56, 57, 58], "give": [8, 9, 10, 56, 58], "them": [8, 9, 51, 60], "There": [8, 18, 22, 26, 33, 46, 58], "detail": [8, 58], "descript": [8, 9, 11, 18, 22, 26, 30, 33, 37, 46, 51], "read": [8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 58], "document": [8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "first": [8, 9, 51, 53, 55, 56, 58], "need": [8, 9, 51, 53, 55, 56, 58, 60], "given": [8, 9, 10], "allow": [8, 9, 51, 56, 60], "compris": [8, 9], "just": [8, 53, 58], "loop": [8, 58, 60], "through": [8, 9, 10, 50, 51, 56, 58], "gymansium": 8, "mdp": [8, 51], "done": [8, 56, 58, 60], "root": 8, "path": [8, 9, 10, 38, 39, 40, 41, 42, 43, 44, 45, 50, 51, 56, 60], "structur": [8, 51], "extend": [8, 55], "123": [8, 51, 56], "break": [8, 51, 56, 60], "contact": [8, 10, 53, 60], "org": [8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 56, 60], "well": [8, 9, 10, 50, 51, 56, 58], "snippet": [8, 9], "ha": [8, 9, 16, 37, 51, 56, 58], "been": [8, 9, 37, 51], "check": [8, 10, 51, 56], "appear": 8, "2059": 8, "6": [8, 51], "mb": 8, "wai": [8, 9, 56, 58], "left": [8, 56, 58], "instead": [8, 9, 51, 56, 58], "respons": 8, "specif": [8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 55, 56, 58], "won": [8, 56], "until": [8, 9, 38, 39, 40, 41, 42, 43, 44, 45], "larg": [8, 11, 37, 51], "avoid": [8, 58], "lose": 8, "append": [8, 51, 58], "update_dataset_from_collector_env": [8, 51], "method": [8, 9, 11, 37, 51, 53, 56, 58], "10": [8, 9, 51, 53, 55, 56, 58], "episode_id": [8, 9, 51], "alreadi": [8, 10, 51, 55, 56, 58], "els": [8, 51, 56, 58], "add_to_dataset": 8, "abl": [8, 37], "your": [8, 10, 51, 60], "order": [8, 26, 27, 51, 55], "featur": [8, 9, 50, 51, 60], "print": [8, 51, 53, 55, 58, 60], "storag": 8, "googl": [8, 9, 58], "cloud": [8, 9], "platform": [8, 9], "gcp": [8, 9, 10, 50], "bucket": [8, 9, 10, 50], "access": [8, 9, 10, 51, 56], "antmaz": [8, 11, 12, 13, 14, 15, 16, 17], "divers": [8, 11], "1000": [8, 12, 13, 14, 15, 51, 58], "1000000": [8, 10, 12, 13, 14, 15, 16, 17, 19, 20, 23, 24, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 50], "700": [8, 16, 17], "5": [8, 9, 51, 56, 58], "alex": [8, 12, 13, 14, 15, 16, 17], "davei": [8, 12, 13, 14, 15, 16, 17], "amd1g13": [8, 12, 13, 14, 15, 16, 17], "soton": [8, 12, 13, 14, 15, 16, 17], "ac": [8, 12, 13, 14, 15, 16, 17, 60], "uk": [8, 12, 13, 14, 15, 16, 17], "plai": [8, 11], "medium": [8, 11, 37, 51, 56], "25": [8, 10, 18, 21, 22, 25, 33, 36, 46, 49, 50, 51, 58], "6729": [8, 10, 21, 50], "7": [8, 27, 28, 29, 31, 32, 51, 53, 58], "rodrigo": [8, 10, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 56], "de": [8, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 47, 48, 49], "lazcano": [8, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 47, 48, 49], "rperezvicent": [8, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 56], "shard": 8, "randomli": [8, 9, 37, 53, 56], "map": [8, 12, 14, 56, 58], "ep": 8, "f": [8, 9, 10, 51, 53, 55, 58, 60], "show": [8, 10, 50, 51, 53, 55, 58], "13": [8, 51], "22": [8, 11, 51], "15": 8, "23": 8, "18": [8, 51], "2": [8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 22, 26, 27, 28, 29, 33, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 53, 55, 58], "12": [8, 51, 58], "19": [8, 27, 51], "9": [8, 27, 28, 29], "4": [8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 53, 55, 56], "17": [8, 51], "21": 8, "notic": 8, "doesn": [8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 56], "serv": 8, "purpos": [8, 37, 56, 58], "replai": [8, 51], "out": [8, 51, 53, 56, 58], "leav": 8, "dataload": [8, 51, 60], "mai": [8, 9, 56, 58], "abil": 8, "determinist": [8, 56], "episodes_gener": 8, "itself": 8, "howev": [8, 9, 37, 51, 53, 56, 58, 60], "case": [8, 9, 51, 56], "h5py": [8, 9, 51], "format": [8, 51, 53], "keep": [8, 51], "greater": [8, 51], "filter_dataset": [8, 51], "remov": [8, 51], "divid": [8, 9, 56], "20": [8, 51, 58], "second": [8, 51], "lunarland": 8, "v2": [8, 51], "eval_env_spec": [8, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49], "lastli": 8, "adroithanddoor": [8, 9, 18, 19, 20, 21, 51], "5025": 8, "1006729": 8, "1103": 8, "5000": [8, 10, 20, 24, 36, 48, 50, 58], "1096": 8, "common": 9, "modifi": [9, 51, 55], "variabl": [9, 51, 56], "minari_datasets_path": 9, "kept": 9, "public": [9, 51, 56], "level": 9, "tree": 9, "string": [9, 53], "describ": [9, 51], "come": [9, 10, 50], "ennv_nam": 9, "content": [9, 10], "integ": 9, "repres": [9, 53, 58], "end": [9, 51], "yet": 9, "_doc": 9, "wip": 9, "homogen": 9, "main_data": [9, 10, 50, 51], "asid": 9, "raw": 9, "extern": 9, "additional_data_x": 9, "checkpoint": [9, 51], "update_dataset": 9, "three": [9, 18, 22, 26, 33, 46, 56, 58], "other_dataset_id": 9, "minari_root": 9, "additional_data_0": 9, "additional_data_1": 9, "leverag": 9, "hierarch": 9, "element": 9, "clearli": 9, "whole": 9, "individu": 9, "organ": 9, "insid": [9, 53], "plu": 9, "sub": [9, 10, 51], "both": [9, 53, 55], "up": [9, 12, 13, 14, 15, 16, 17, 51, 53, 55, 56, 58, 60], "look": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53], "episode_0": [9, 51], "infos_dataset": [9, 51], "infos_subgroup": [9, 51], "more_dataset": [9, 51], "additional_group": [9, 51], "additional_dataset": [9, 51], "episode_1": [9, 51], "episode_2": [9, 51], "rel": [9, 51], "complex": [9, 11, 18, 22, 33, 46, 51], "definit": [9, 51], "component_1": [9, 51], "box": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 60], "low": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55, 56, 58], "high": [9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 55, 56, 58], "dtype": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55, 56, 58], "float32": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 56, 60], "component_2": [9, 51], "subcomponent_1": [9, 51], "subcomponent_2": [9, 51], "similarli": [9, 51, 58], "consid": [9, 51, 56, 58], "_index_0": [9, 51], "_index_1": [9, 51], "_index_": 9, "index": 9, "involv": [9, 37, 56], "depend": [9, 51], "top": [9, 10, 27, 28, 29], "action_space_component_shap": 9, "entri": [9, 56], "discret": [9, 31, 32, 51, 53, 56, 60], "vari": [9, 53, 58, 60], "particular": [9, 53, 58], "compon": [9, 56], "observation_space_component_shap": 9, "becaus": [9, 11, 12, 13, 14, 15, 16, 17, 37, 58], "last": [9, 51], "finish": 9, "due": [9, 51, 56], "numpi": [9, 55, 56, 58, 60], "particip": 9, "adroit": 9, "hand": [9, 12, 14, 18, 22, 33, 46, 56, 58], "robot": [9, 11, 18, 22, 33, 46, 51, 55, 56, 58], "mujoco": [9, 56], "simul": 9, "sinc": [9, 53, 56, 60], "present": [9, 11, 60], "stepdatacallbak": 9, "qpo": [9, 56], "qvel": [9, 56], "bodi": 9, "adroitstepdatacallback": 9, "get_env_st": 9, "object_body_po": 9, "attach": 9, "int64": [9, 31, 32, 51], "env_spec": 9, "json": [9, 10, 51, 53], "metric": 9, "max": [9, 56, 58], "float64": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 55, 58], "min": [9, 58], "std": 9, "deviat": [9, 56], "sum": [9, 58], "possibl": [9, 51], "shift": [9, 58], "dimension": [9, 18, 22, 33, 46], "upper": 9, "lower": 9, "defin": [9, 53, 55, 60], "bound": [9, 56, 58], "text": [9, 31, 32, 51, 56], "charset": [9, 31, 32], "moment": 9, "don": [9, 51, 53, 55, 56], "guarante": 9, "surrog": 9, "pair": [9, 58], "aim": [9, 56, 58], "machin": [9, 11], "readabl": 9, "compli": [9, 51], "encapsul": 9, "even": 9, "arbitrari": [9, 51], "via": [9, 26, 58], "download": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 57, 58, 60], "sampled_episod": 9, "consist": [9, 37, 58], "field": [9, 51, 58], "As": [9, 51, 56, 60], "mention": [9, 51, 56, 60], "section": [9, 51, 58], "mani": 9, "so": [9, 56, 58], "being": [9, 26, 27, 28, 29, 37, 39, 41, 43, 45], "compliant": [9, 51], "thei": [9, 51, 58], "pattern": 9, "test_data_collector_step_data_callback_info_correct": 9, "test_step_data_callback": 9, "py": [9, 51, 53, 55, 56, 58, 60], "tool": [10, 22, 51], "build": [10, 51], "off": 10, "typer": 10, "line": [10, 55], "exist": [10, 51, 55, 56], "help": [10, 51, 56], "font": [10, 50], "color": [10, 50], "f4bf75": 10, "usag": [10, 51], "arg": [10, 51, 56, 58], "base": [10, 51, 56, 58], "gymnaisum": 10, "a5a5a1": 10, "a1efe4": [10, 50], "03ac13": [10, 50], "messag": 10, "exit": 10, "tabl": [10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "devic": [10, 58], "incompat": 10, "pen": [10, 34, 35, 36, 51], "3736": [10, 34], "500000": [10, 34], "ff00ff": [10, 50], "rperezv": 10, "4958": [10, 35], "499206": [10, 35], "4356": [10, 50], "With": 10, "prompt": 10, "abort": 10, "warn": [10, 51, 58], "instanti": 10, "confirm": [10, 58], "proce": [10, 60], "sure": [10, 51], "y": [10, 37, 56, 58], "would": [10, 55, 56], "touch": [10, 55], "team": 10, "share": [10, 58], "encrypt": 10, "permiss": 10, "Then": [10, 53, 56, 58], "path_str": 10, "key_fil": 10, "progress": 10, "bar": 10, "shown": [10, 58], "below": [10, 56, 58], "implement": [10, 11, 56, 58], "merg": 10, "togeth": [10, 26, 28, 58], "new_dataset_nam": 10, "successfulli": [10, 55], "navig": [11, 30, 37], "domain": [11, 18, 22, 33, 37, 46], "replac": [11, 56], "2d": 11, "ball": [11, 37, 46, 56], "pointmaz": [11, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 54, 55, 57], "dof": [11, 18, 22, 33, 46, 58], "quadrup": 11, "introduc": [11, 18, 22, 33, 46, 58], "stitch": 11, "challeng": [11, 58], "morpholog": 11, "could": [11, 58], "mimic": 11, "real": 11, "world": 11, "addition": [11, 51], "spars": [11, 12, 13, 14, 15, 16, 17, 18, 22, 33, 37, 38, 40, 42, 44, 46], "activ": [11, 58], "upon": 11, "reach": [11, 12, 13, 14, 15, 16, 17, 26, 30, 33, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 56], "goal": [11, 12, 13, 14, 15, 16, 17, 26, 30, 31, 37, 38, 39, 40, 41, 42, 43, 44, 45, 53, 55, 56, 58], "previous": [11, 51, 56, 60], "train": [11, 12, 13, 14, 15, 16, 17, 18, 19, 22, 23, 33, 34, 46, 47, 55], "sac": [11, 12, 13, 14, 15, 16, 17], "stabl": 11, "baselin": 11, "agent": [11, 12, 13, 14, 15, 17, 30, 37, 38, 39, 40, 41, 42, 43, 44, 45, 55, 56, 58, 60], "waypoint": [11, 12, 13, 14, 15, 16, 17, 37, 38, 39, 40, 41, 42, 43, 44, 45], "planner": [11, 37], "qiter": [11, 12, 13, 14, 15, 16, 17, 37, 38, 39, 40, 41, 42, 43, 44, 45, 56], "control": [11, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 58, 60], "memor": [11, 37], "markovian": [11, 37], "fu": [11, 18, 22, 26, 30, 33, 37, 46, 56], "justin": [11, 18, 22, 26, 30, 33, 37, 46, 56], "et": [11, 18, 22, 26, 30, 33, 37, 46, 56, 58], "al": [11, 18, 22, 26, 30, 33, 37, 46, 56, 58], "deep": [11, 18, 22, 26, 30, 33, 37, 46, 56], "driven": [11, 18, 22, 26, 30, 33, 37, 46, 56], "corr": [11, 18, 22, 26, 30, 33, 37, 46, 56], "vol": [11, 18, 22, 26, 30, 33, 37, 46, 56], "ab": [11, 18, 22, 26, 30, 33, 37, 46, 56], "2004": [11, 18, 22, 26, 30, 33, 37, 46, 56], "07219": [11, 18, 22, 26, 30, 33, 37, 46, 56], "2020": [11, 18, 22, 26, 30, 33, 37, 46, 56], "arxiv": [11, 18, 22, 26, 30, 33, 37, 46, 56], "antonin": 11, "raffin": 11, "ashlei": 11, "hill": 11, "adam": [11, 58, 60], "gleav": 11, "anssi": 11, "kanervisto": 11, "maximilian": 11, "ernestu": 11, "noah": 11, "dormann": 11, "2021": [11, 58], "baselines3": [11, 60], "reliabl": 11, "journal": 11, "research": 11, "268": 11, "lambert": [11, 37, 56], "nathan": [11, 37, 56], "fundament": [11, 37, 56], "learnin": [11, 37, 56], "apr": [11, 37, 56], "towardsdatasci": [11, 37, 56], "df8ff078652a": [11, 37, 56], "antmaze_large_diverse_gr": [11, 12], "v4": [11, 12, 13, 14, 15, 16, 17], "antmaze_larg": [11, 13], "antmaze_medium_diverse_gr": [11, 14], "antmaze_medium": [11, 15], "umaz": [11, 37, 51, 56], "antmaze_umaz": [11, 16, 17], "u": [11, 16, 17, 37, 44, 45, 51, 58, 60], "At": [12, 13, 14, 15, 17], "begin": [12, 13, 14, 15, 17, 60], "select": [12, 13, 14, 15, 17, 18, 22, 33, 37, 46, 51, 56], "pick": [12, 14], "cell": [12, 14, 56], "success": [12, 13, 14, 15, 16, 17, 56, 60], "rate": [12, 13, 14, 15, 16, 17, 56], "trajectori": [12, 13, 14, 15, 16, 17, 18, 20, 22, 24, 33, 35, 37, 46, 48, 50, 51, 56], "80": [12, 13, 14, 15, 51], "fail": [12, 13, 14, 15, 16, 17, 51], "occur": [12, 13, 14, 15, 16, 17], "ant": [12, 13, 14, 15, 16, 17], "flip": [12, 13, 14, 15, 16, 17, 26], "stand": [12, 13, 14, 15, 16, 17], "again": [12, 13, 14, 15, 16, 17], "target": [12, 13, 14, 15, 16, 17, 26, 27, 28, 29, 37, 46, 56, 58], "lead": [12, 13, 14, 15, 16, 17, 56], "accumul": [12, 13, 14, 15, 16, 17, 56, 60], "subspac": [12, 13, 14, 15, 16, 17, 27, 28, 29, 31, 32, 38, 39, 40, 41, 42, 43, 44, 45], "achieved_go": [12, 13, 14, 15, 16, 17, 27, 28, 29, 38, 39, 40, 41, 42, 43, 44, 45, 55, 56], "infin": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "desired_go": [12, 13, 14, 15, 16, 17, 27, 28, 29, 38, 39, 40, 41, 42, 43, 44, 45, 55, 56], "27": [12, 13, 14, 15, 16, 17, 51], "permalink": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "rodrigodelazcano": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "minari": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 58, 60], "row": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "what": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56], "registri": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "registr": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "inf": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 55], "entry_point": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "gymnasium_robot": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "maze": [12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 51, 55, 56], "ant_maze_v4": [12, 13, 14, 15, 16, 17], "antmazeenv": [12, 13, 14, 15, 16, 17], "max_episode_step": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 56, 58], "reward_threshold": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "nondeterminist": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "order_enforc": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "autoreset": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "disable_env_check": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "maze_map": [12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 56], "c": [12, 14, 26, 51], "reward_typ": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "continuing_task": [12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 56], "reset_target": [12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45], "additional_wrapp": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "vector_entry_point": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "g": [12, 13, 14, 15, 16, 17, 31, 32, 38, 39, 40, 41, 42, 43, 44, 45, 58], "fix": [16, 37, 51, 58], "90": [16, 17, 51], "1433": [16, 17], "hand_dapg": [18, 22, 33, 46], "open": [18, 26, 37, 51, 58], "24": [18, 22, 33, 34, 35, 36, 46, 58], "measur": [18, 22, 33, 46, 56], "effect": [18, 22, 33, 46], "narrow": [18, 22, 33, 46], "distribut": [18, 22, 33, 46, 58], "demonstr": [18, 19, 21, 22, 23, 25, 26, 27, 33, 34, 36, 46, 47, 49, 58], "manipul": [18, 22, 33, 46, 58], "paper": [18, 22, 33, 46], "rajeswaran": [18, 22, 33, 46], "aravind": [18, 22, 33, 46], "dexter": [18, 22, 33, 46], "1709": [18, 22, 33, 46], "10087": [18, 22, 33, 46], "2017": [18, 22, 33, 46], "obtain": [18, 19, 22, 23, 33, 34, 46, 47, 56], "imit": [18, 19, 22, 23, 26, 33, 34, 46, 47], "mix": [18, 19, 22, 23, 26, 33, 34, 46, 47, 51], "50": [18, 19, 22, 23, 33, 34, 46, 47, 56, 58], "ratio": [18, 19, 22, 23, 33, 34, 46, 47], "fine": [18, 20, 22, 24, 33, 35, 46, 48], "tune": [18, 20, 22, 24, 33, 35, 46, 48, 56, 58], "dapg": [18, 20, 21, 22, 24, 25, 33, 35, 36, 46, 48, 49], "4358": 19, "39": [19, 20, 21, 47, 48, 49], "28": [19, 20, 21, 51], "adroit_hand": [19, 20, 21, 23, 24, 25, 34, 35, 36, 47, 48, 49], "adroit_door": [19, 20, 21], "adroithanddoorenv": [19, 20, 21], "200": [19, 20, 21, 23, 24, 25, 47, 48, 49], "dens": [19, 20, 21, 23, 24, 25, 34, 35, 36, 37, 47, 48, 49, 51, 58], "assert": [19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 53, 60], "adroithandhamm": [22, 23, 24, 25, 51], "nail": 22, "board": 22, "3606": 23, "46": [23, 24, 25], "26": [23, 24, 25, 51], "hammer": [23, 24, 25, 51], "adroit_hamm": [23, 24, 25], "adroithandhammerenv": [23, 24, 25], "11310": 25, "frankakitchen": [26, 27, 28, 29, 51], "relai": 26, "interact": 26, "variou": [26, 28, 53], "desir": [26, 56], "configur": [26, 58], "kettl": [26, 27, 28, 29], "light": [26, 27, 28, 29], "switch": [26, 27, 28, 29], "microwav": [26, 27, 28, 29], "cabinet": [26, 27, 28, 29], "slide": [26, 27, 28, 29], "complet": [26, 28, 29, 51, 58], "subtask": [26, 27, 28, 29], "gupta": 26, "kumar": 26, "lynch": 26, "levin": 26, "hausman": 26, "k": 26, "2019": 26, "solv": [26, 56], "horizon": 26, "preprint": 26, "1910": 26, "11956": 26, "never": [26, 28, 56, 58], "sequenc": [26, 28, 29, 37], "partial": [26, 51], "subtrajectori": [26, 29], "4209": 27, "59": [27, 28, 29], "kitchen": [27, 28, 29, 51], "bottom": [27, 28, 29], "burner": [27, 28, 29], "hing": [27, 28, 29], "franka_kitchen": [27, 28, 29], "kitchenenv": [27, 28, 29], "280": 27, "remove_task_when_complet": [27, 28, 29], "terminate_on_tasks_complet": [27, 28, 29], "tasks_to_complet": [27, 28, 29], "156560": [28, 29], "621": [28, 29], "450": [28, 29], "fourroom": 30, "gridworld": 30, "regener": 30, "straight": [30, 31], "goe": [30, 31], "10010": 31, "590": 31, "direct": [31, 32, 53, 58], "imag": [31, 32, 53, 58], "uint8": [31, 32, 53, 58], "255": [31, 32, 53], "mission": [31, 32, 53], "max_length": [31, 32], "14": [31, 32, 51], "min_length": [31, 32], "0123456789abcdefghijklmnopqrstuvwxyzabcdeeeffghijklmnnoopqrrssttuvwxyzz": [31, 32], "expertpolici": [31, 60], "omar": [31, 32], "youni": [31, 32], "younis98": [31, 32], "gmail": [31, 32], "minigrid": [31, 32, 51, 53], "missionspac": [31, 32, 53], "fourroomsenv": [31, 32], "_gen_miss": [31, 32, 53], "0x7f836964c4c0": [31, 32], "1000033": 32, "10181": 32, "randompolici": 32, "adroithandpen": [33, 34, 35, 36, 51, 58], "repfixositori": [33, 35], "45": [34, 35, 36, 58], "adroit_pen": [34, 35, 36], "adroithandpenenv": [34, 35, 36], "actuat": 37, "along": [37, 50], "axi": [37, 56, 58], "thu": [37, 56], "split": [37, 51], "smaller": [37, 51, 56], "pd": [37, 38, 39, 40, 41, 42, 43, 44, 45, 56], "maze2d": [37, 56], "pointmaze_largedens": [37, 39], "v3": [37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 55, 56], "pointmaze_larg": [37, 38], "pointmaze_mediumdens": [37, 41], "pointmaze_medium": [37, 40, 56], "pointmaze_opendens": [37, 43], "arena": [37, 42, 43], "perimet": [37, 42, 43], "wall": [37, 42, 43, 56], "pointmaze_open": [37, 42], "pointmaze_umazedens": [37, 45], "pointmaze_umaz": [37, 44, 55], "without": [38, 39, 40, 41, 42, 43, 44, 45, 51], "varianc": [38, 39, 40, 41, 42, 43, 44, 45, 56], "nois": [38, 39, 40, 41, 42, 43, 44, 45, 51, 56], "3325": 38, "perez": [38, 39, 40, 41, 42, 43, 44, 45, 56], "vicent": [38, 39, 40, 41, 42, 43, 44, 45, 56], "point_maz": [38, 39, 40, 41, 42, 43, 44, 45], "pointmazeenv": [38, 39, 40, 41, 42, 43, 44, 45], "800": [38, 39], "neg": [39, 41, 43, 45], "euclidean": [39, 41, 43, 45], "distanc": [39, 41, 43, 45], "3322": 39, "4778": 40, "600": [40, 41], "4765": 41, "9609": 42, "300": [42, 43, 44, 45], "9637": 43, "13289": [44, 45], "adroithandreloc": [46, 47, 48, 49, 51], "3758": 47, "30": [47, 48, 49, 58], "reloc": [47, 48, 49, 51], "adroit_reloc": [47, 48, 49], "adroithandrelocateenv": [47, 48, 49], "9942": 49, "popular": 50, "publicli": 50, "cli": [50, 51], "beta": [50, 51, 58], "develop": [50, 51], "minor": [50, 51], "major": [50, 51], "expect": [50, 55], "futur": [50, 51, 56], "\u898b\u7fd2\u3044": 50, "2024": 51, "01": 51, "pypi": 51, "small": [51, 58], "bug": 51, "lost": 51, "im": 51, "kitsch": 51, "144": 51, "refactor": [51, 56], "datacollectorv0": 51, "isol": 51, "younik": 51, "133": 51, "serial": [51, 54, 57], "tutori": [51, 53, 55, 56, 58, 60], "enerrio": 51, "151": 51, "basic": [51, 58], "ci": 51, "pytest": 51, "markdown": 51, "elliottow": 51, "153": 51, "155": 51, "recover_env": 51, "161": 51, "combin": [51, 56], "162": 51, "act": 51, "163": 51, "dir": 51, "alexdavei": 51, "160": 51, "mandatori": 51, "164": 51, "165": 51, "pre": 51, "commit": 51, "thing": [51, 53], "pettingzoo": 51, "doe": 51, "157": 51, "avjmachin": 51, "137": 51, "dataset_s": 51, "shreyansjainn": 51, "158": 51, "improv": [51, 58], "readm": 51, "167": 51, "deprec": 51, "create_dataset_from_collector_env": 51, "169": 51, "170": 51, "gt": 51, "171": 51, "172": 51, "balisujohn": 51, "132": 51, "contributor": 51, "changelog": 51, "2023": [51, 58], "09": 51, "rugged": 51, "grahamannett": 51, "126": 51, "128": [51, 58, 60], "130": 51, "speed": [51, 56], "124": 51, "coverag": 51, "129": 51, "issu": [51, 58], "templat": 51, "139": 51, "loos": 51, "typing_extens": 51, "148": 51, "07": 51, "bugfix": 51, "121": 51, "pr": 51, "awai": 51, "flatten": 51, "explicitli": 51, "fulli": 51, "explicit": [51, 58], "subset": [51, 54, 57], "behavior": [51, 56, 57, 58, 61], "rl_zoo3": [51, 60], "pytorch": [51, 57, 58, 61], "unflatten": 51, "exerpt": 51, "last_episode_id": 51, "total_timestep": 51, "timestep": 51, "77": 51, "minari_dataset": [51, 60], "directli": [51, 56, 58, 60], "clear_episode_buff": 51, "minari_storag": 51, "101": 51, "eol": 51, "107": 51, "11": 51, "73": 51, "reorgan": 51, "thorough": 51, "75": 51, "copi": [51, 58], "howuhh": 51, "82": 51, "86": 51, "dataclass": 51, "88": 51, "99": [51, 56, 58], "110": 51, "incorrect": 51, "83": 51, "96": 51, "ignor": [51, 58], "hidden": 51, "104": 51, "111": 51, "oibserv": 51, "tohsin": 51, "84": 51, "instruct": 51, "105": 51, "bamboofungu": 51, "108": 51, "109": 51, "background": 51, "pid": [51, 56], "95": 51, "116": 51, "pytorchdataload": 51, "102": 51, "misc": 51, "citat": 51, "cff": 51, "typo": 51, "annot": 51, "slightli": 51, "redtachyon": 51, "52": 51, "froze": 51, "pyright": 51, "305": 51, "correct": [51, 56, 58], "87": 51, "right": [51, 56, 58], "92": 51, "93": 51, "style": [51, 58], "black": 51, "badg": 51, "112": 51, "subsequ": 51, "represent": 51, "It": [51, 56, 58], "next": [51, 56, 58, 60], "05": 51, "attr": 51, "60": 51, "workflow": 51, "yml": 51, "miss": 51, "_script": 51, "gen_dataset_md": 51, "sphinx_github_changelog_token": 51, "71": 51, "readi": 51, "experienc": 51, "consider": 51, "past": 51, "cython": 51, "favor": 51, "pure": 51, "reduc": [51, 56], "effici": 51, "explor": 51, "apart": 51, "excit": 51, "offici": 51, "re": [51, 56], "page": 51, "constantli": 51, "hesit": 51, "idea": 51, "highli": 51, "appreci": 51, "thank": 51, "basi": 51, "page_facing_up": 51, "file_fold": 51, "floppy_disk": 51, "subgroup": [51, 56], "next_episode_id": 51, "deleg": 51, "34": 51, "54": 51, "charg": 51, "55": 51, "convers": [51, 53], "safe": 51, "recoveri": 51, "31": 51, "log": [51, 58, 60], "suggest": 51, "57": 51, "collector_env": [51, 56], "gynasium": 51, "n_step": [51, 56], "curat": 51, "dataset_cr": [51, 53, 56], "point_maze_dataset": [51, 56], "sphx": 51, "glr": 51, "larger": [51, 56, 58], "except": [51, 53, 58], "largest": 51, "among": 51, "dataset_v1": 51, "dataset_v2": 51, "dataset_v3": 51, "upload": 51, "bellow": 51, "04": 51, "renam": 51, "willdudlei": 51, "convent": 51, "nonetyp": 51, "codelink": 51, "stack": 51, "import_bugfix": 51, "mgoulao": 51, "2022": 51, "init": 51, "residu": 51, "pz": 51, "precommit": 51, "wd": 51, "kabuki": 51, "ll": [53, 55], "empti": [53, 56], "uniqu": 53, "appli": 53, "let": [53, 55, 56, 60], "modul": [53, 55, 56, 58, 60], "core": 53, "deserialize_spac": 53, "serialize_spac": 53, "16x16": 53, "see": [53, 58], "output": [53, 55, 56, 58, 60], "abov": [53, 55, 58], "emptyenv": 53, "0x12253a940": 53, "try": [53, 58], "encount": 53, "notimplementederror": 53, "No": 53, "But": [53, 58], "missonspac": 53, "simpli": [53, 56], "around": [53, 58], "green": [53, 58], "squar": 53, "worri": 53, "properli": [53, 58], "deseri": 53, "care": 53, "enabl": 53, "regist": 53, "back": [53, 56], "serialize_custom_spac": 53, "to_str": 53, "mission_func": 53, "deserialize_custom_spac": 53, "space_dict": 53, "noqa": 53, "e731": 53, "num_episod": [53, 55], "42": [53, 55, 58, 60], "choos": [53, 55], "random_polici": [53, 55], "blob": [53, 56], "custom_space_seri": 53, "del": [53, 55], "earlier": 53, "0x11f2608b0": 53, "clean": 53, "delet": [53, 55], "jupyt": [53, 55, 56, 57, 58, 60], "notebook": [53, 55, 56, 57, 58, 60], "ipynb": [53, 55, 56, 58, 60], "omit": 55, "plan": 55, "minim": 55, "outlin": 55, "procedur": 55, "data_collector": 55, "find": 55, "fit": [55, 58], "mirana": 55, "observation_space_subset": 55, "customsubsetstepdatacallback": 55, "local_dataset": 55, "action_space_subset": 55, "dict_kei": 55, "bind": 56, "down": 56, "q": [56, 57, 61], "grid": 56, "factor": 56, "account": 56, "advantag": [56, 58], "solver": 56, "solut": 56, "variat": 56, "dynam": 56, "program": 56, "chosen": 56, "optim": [56, 60], "do": [56, 58], "seri": 56, "bellman": 56, "leftarrow": [56, 58], "sum_": 56, "gamma": [56, 58], "max_": [56, 58], "matrix": 56, "probabl": 56, "know": 56, "alwai": 56, "On": [56, 58], "pi": [56, 58], "generate_path": 56, "current_cel": 56, "goal_cel": 56, "wapoint": 56, "exploration_act": 56, "inspir": 56, "master": 56, "q_iter": 56, "__init__": [56, 60], "num_stat": 56, "map_length": 56, "map_width": 56, "num_act": 56, "len": [56, 58], "rew_matrix": 56, "zero": 56, "compute_transition_matrix": 56, "compute_reward_matrix": 56, "q_valu": 56, "get_q_valu": 56, "current_st": 56, "cell_to_st": 56, "action_id": 56, "argmax": [56, 60], "next_stat": 56, "get_next_st": 56, "state_to_cel": 56, "reward_funct": 56, "desired_cel": 56, "j": 56, "num_itr": 56, "discount": 56, "q_fn": 56, "v_fn": 56, "transition_matrix": 56, "dot": [56, 58], "next_cel": 56, "construct": 56, "da": 56, "action_idx": 56, "_check_valid_cel": 56, "elif": 56, "collis": 56, "often": 56, "classic": [56, 60], "theori": 56, "proporti": 56, "adjust": 56, "setpoint": 56, "higher": 56, "stronger": 56, "alon": 56, "overshoot": 56, "instabl": 56, "tau": [56, 58], "k_": 56, "predict": [56, 60], "By": [56, 58], "dampen": 56, "system": 56, "stabil": 56, "respond": 56, "quickli": 56, "dt": 56, "equat": 56, "explain": 56, "bit": [56, 58], "cumul": [56, 58], "address": 56, "steadi": 56, "bias": 56, "elimin": 56, "actual": 56, "_0": 56, "int_": 56, "k_p": 56, "k_i": 56, "k_d": 56, "gain": 56, "determin": 56, "influenc": [56, 58], "typic": 56, "theme": 56, "seen": 56, "equlival": 56, "v_": [56, 58], "think": 56, "approach": 56, "toward": 56, "slowli": [56, 58], "less": 56, "aggress": 56, "p_": 56, "coordin": 56, "waypointcontrol": 56, "waypoint_control": 56, "waypoint_threshold": 56, "global_target_xi": 56, "maze_solv": 56, "waypoint_target": 56, "compute_act": 56, "linalg": 56, "norm": 56, "1e": 56, "xy": 56, "achieved_goal_cel": 56, "cell_xy_to_rowcol": 56, "global_target_id": 56, "current_control_target_id": 56, "current_control_target_xi": 56, "cell_rowcol_to_xi": 56, "dist": 56, "uniform": 56, "clip": 56, "reason": 56, "ourselv": 56, "pointmazestepdatacallback": 56, "succ": 56, "ve": 56, "000": [56, 58], "dure": [56, 58], "limit": [56, 58], "10_000": [56, 58], "evad": 56, "overridng": 56, "randn": 56, "implicit": [57, 61], "torchrl": [57, 61], "tutorials_python": 57, "zip": 57, "tutorials_jupyt": 57, "conjunct": 58, "cover": 58, "iql": 58, "here": [58, 60], "part": 58, "script": [58, 60], "nightli": 58, "matplotlib": 58, "conflict": 58, "rememb": 58, "upgrad": 58, "torch": [58, 60], "everyth": 58, "pyplot": 58, "plt": 58, "manual_se": [58, 60], "simplefilt": 58, "colab": 58, "virtual": 58, "displai": [58, 60], "prerequisit": 58, "sudo": 58, "apt": 58, "python3": 58, "opengl": 58, "ffmpeg": 58, "xvfb": 58, "pyvirtualdisplai": 58, "restart": 58, "kernel": 58, "virtual_displai": 58, "visibl": 58, "1400": 58, "900": 58, "lib": 58, "gymenv": 58, "doubletofloat": 58, "transformedenv": 58, "design": 58, "framework": 58, "env_id": 58, "example_env": 58, "from_pixel": 58, "pixels_onli": 58, "usual": 58, "tensordict": 58, "essenti": 58, "tensor": [58, 60], "whose": 58, "batch": [58, 60], "dimens": [58, 60], "cpu": 58, "is_shar": 58, "pixel": 58, "480": 58, "batch_siz": [58, 60], "rollout": 58, "max_step": 58, "auto_cast_to_devic": 58, "2f": 58, "884": 58, "initialis": 58, "popul": 58, "frame": 58, "imshow": 58, "blue": 58, "quantifi": 58, "randomis": 58, "transform": 58, "doubl": 58, "cuda": 58, "is_avail": 58, "base_env": 58, "minariexperiencereplai": 58, "minari_data": 58, "replay_buff": 58, "samplerwithoutreplac": 58, "256": [58, 60], "split_traj": 58, "sampler": 58, "quick": 58, "overview": 58, "tri": 58, "tackl": 58, "those": 58, "who": 58, "familiar": 58, "interest": 58, "practic": 58, "approxim": 58, "outsid": 58, "extrapol": 58, "poorli": 58, "precis": 58, "mathcal": 58, "s_t": 58, "a_t": 58, "r_t": 58, "s_": 58, "minimis": 58, "tempor": 58, "l_": 58, "rm": 58, "td": 58, "theta": 58, "mathbb": 58, "sim": 58, "q_": 58, "hat": 58, "expectil": 58, "m_": 58, "approx": 58, "kostrikov": 58, "network": [58, 60], "lag": 58, "equiv": 58, "max_a": 58, "overestim": 58, "overconfid": 58, "therefor": 58, "attempt": 58, "queri": 58, "psi": 58, "l_v": 58, "l_2": 58, "choic": 58, "figur": 58, "l_q": 58, "maximis": 58, "implicitli": 58, "extract": 58, "weight": 58, "behaviour": 58, "phi": 58, "pi_": 58, "hyperparamet": 58, "behav": 58, "summari": 58, "best": 58, "ell": 58, "gradient": 58, "descent": 58, "rather": 58, "benchmark": 58, "accur": 58, "corl": 58, "nn": [58, 60], "tensordictmodul": 58, "normalparamextractor": 58, "explorationtyp": 58, "set_exploration_typ": 58, "mlp": 58, "probabilisticactor": 58, "tanhnorm": 58, "valueoper": 58, "iqlloss": 58, "softupd": 58, "trainer": 58, "helper": 58, "conveni": 58, "layer": 58, "multi": 58, "perceptron": 58, "plug": 58, "rest": 58, "concaten": 58, "written": 58, "state_valu": 58, "hidden_s": 58, "activation_fn": 58, "relu": [58, 60], "value_net": 58, "num_cel": 58, "out_featur": 58, "activation_class": 58, "write": 58, "in_kei": 58, "out_kei": 58, "q_net": 58, "qvalu": 58, "state_action_valu": 58, "actor": 58, "tanh": 58, "parameteris": 58, "scale": 58, "strictli": 58, "action_spec": 58, "ensur": 58, "actor_mlp": 58, "actor_extractor": 58, "scale_lb": 58, "actor_net": 58, "sequenti": 58, "actor_modul": 58, "loc": 58, "distribution_class": 58, "distribution_kwarg": 58, "tanh_loc": 58, "default_interaction_typ": 58, "mode": 58, "gather": 58, "modulelist": 58, "hood": 58, "lazylinear": 58, "infer": 58, "forward": [58, 60], "lazi": 58, "no_grad": 58, "net": 58, "captur": 58, "loss_modul": 58, "value_network": 58, "loss_funct": 58, "l2": 58, "temperatur": 58, "make_value_estim": 58, "soft": 58, "polyak": 58, "target_net_updat": 58, "005": 58, "lr": 58, "0003": 58, "unlik": 58, "onlin": 58, "evaluate_polici": 58, "num_eval_episod": 58, "episode_reward": 58, "eval_td": 58, "backpropag": 58, "tqdm": [58, 60], "auto": [58, 60], "50_000": 58, "eval_interv": 58, "1_000": [58, 60], "loss_log": 58, "eval_reward_log": 58, "pbar": 58, "l": 58, "l_pi": 58, "loss_dict": 58, "loss_valu": 58, "loss_qvalu": 58, "loss_actor": 58, "zero_grad": [58, 60], "backward": [58, 60], "set_descript": 58, "1f": 58, "avg": 58, "plot": 58, "fig": 58, "ax": 58, "subplot": 58, "nrow": 58, "ncol": 58, "figsiz": 58, "set_titl": 58, "set_xlabel": 58, "arang": 58, "tight_layout": 58, "ipython": 58, "html": 58, "save_video": 58, "base64": 58, "b64encod": 58, "final_scor": 58, "1872": 58, "69": 58, "visualis": 58, "roll": 58, "render": 58, "video": 58, "viewer_env": 58, "video_fold": 58, "results_video": 58, "fp": 58, "embed": 58, "necessari": 58, "etc": 58, "mp4": 58, "rb": 58, "data_url": 58, "decod": 58, "margin": 58, "block": 58, "src": 58, "quit": 58, "overal": 58, "decent": 58, "invers": 58, "iql_torchrl": 58, "problem": 60, "balanc": 60, "pole": 60, "cart": 60, "receiv": 60, "zoo": 60, "o": 60, "sy": 60, "stable_baselines3": 60, "ppo": 60, "argv": 60, "algo": 60, "abspath": 60, "v1_1": 60, "best_model": 60, "behavioral_clon": 60, "execut": 60, "policynetwork": 60, "input_dim": 60, "output_dim": 60, "fc1": 60, "linear": 60, "fc2": 60, "fc3": 60, "scenario": 60, "four": 60, "length": 60, "pad": 60, "collate_fn": 60, "rnn": 60, "pad_sequ": 60, "as_tensor": 60, "batch_first": 60, "neural": 60, "loss": 60, "shuffl": 60, "isinst": 60, "policy_net": 60, "prod": 60, "loss_fn": 60, "crossentropyloss": 60, "cross": 60, "entropi": 60, "classif": 60, "num_epoch": 60, "32": 60, "epoch": 60, "a_pr": 60, "a_hat": 60, "one_hot": 60, "And": 60, "render_mod": 60, "accumulated_rew": 60, "ter": 60, "tru": 60, "visual": 60, "500": 60}, "objects": {"minari": [[2, 0, 1, "", "DataCollector"], [5, 0, 1, "", "EpisodeData"], [3, 0, 1, "", "EpisodeMetadataCallback"], [6, 0, 1, "", "MinariDataset"], [4, 0, 1, "", "StepDataCallback"], [7, 1, 1, "", "combine_datasets"], [7, 1, 1, "", "create_dataset_from_buffers"], [7, 1, 1, "", "delete_dataset"], [7, 1, 1, "", "download_dataset"], [7, 1, 1, "", "get_normalized_score"], [7, 1, 1, "", "list_local_datasets"], [7, 1, 1, "", "list_remote_datasets"], [7, 1, 1, "", "load_dataset"], [7, 1, 1, "", "split_dataset"]], "minari.DataCollector": [[2, 1, 1, "", "close"], [2, 1, 1, "", "create_dataset"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "step"]], "minari.EpisodeData": [[5, 2, 1, "", "actions"], [5, 2, 1, "", "id"], [5, 2, 1, "", "observations"], [5, 2, 1, "", "seed"], [5, 2, 1, "", "terminations"], [5, 2, 1, "", "total_steps"], [5, 2, 1, "", "truncations"]], "minari.EpisodeMetadataCallback": [[3, 1, 1, "", "__call__"]], "minari.MinariDataset": [[6, 2, 1, "", "episode_indices"], [6, 1, 1, "", "filter_episodes"], [6, 1, 1, "", "iterate_episodes"], [6, 1, 1, "", "recover_environment"], [6, 1, 1, "", "sample_episodes"], [6, 1, 1, "", "set_seed"], [6, 2, 1, "", "spec"], [6, 2, 1, "", "total_episodes"], [6, 2, 1, "", "total_steps"], [6, 1, 1, "", "update_dataset_from_buffer"]], "minari.StepDataCallback": [[4, 1, 1, "", "__call__"]]}, "objtypes": {"0": "py:class", "1": "py:function", "2": "py:attribute"}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "function", "Python function"], "2": ["py", "attribute", "Python attribute"]}, "titleterms": {"404": 0, "page": 0, "Not": 0, "found": 0, "The": [0, 58], "request": 0, "could": 0, "minari": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 56], "document": 1, "build": [1, 58], "datacollector": 2, "method": [2, 3, 4, 6], "episodemetadatacallback": 3, "stepdatacallback": [4, 55, 56], "episodedata": [5, 9], "attribut": [5, 6], "minaridataset": 6, "creat": [7, 8, 56], "dataset": [7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 52, 54, 56, 57, 59, 60, 61], "load": 7, "split": [7, 8], "download": [7, 8, 10], "list": [7, 10], "delet": [7, 10], "combin": [7, 8, 10], "normal": 7, "score": 7, "basic": 8, "usag": 8, "instal": 8, "collect": [8, 55, 56], "data": [8, 9, 56], "save": 8, "checkpoint": 8, "us": [8, 57, 59, 61], "remot": 8, "sampl": 8, "episod": 8, "filter": 8, "recov": 8, "environ": [8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 58], "standard": 9, "storag": 9, "root": 9, "file": 9, "format": 9, "hdf5": 9, "structur": 9, "default": 9, "metadata": 9, "observ": 9, "action": 9, "space": [9, 53, 55], "support": 9, "serial": [9, 53], "addit": 9, "inform": 9, "cli": 10, "local": 10, "upload": 10, "ant": 11, "maze": [11, 37], "refer": [11, 18, 22, 26, 30, 33, 37, 46, 56], "avail": [11, 18, 22, 26, 30, 33, 37, 46], "larg": [12, 13, 38, 39], "divers": [12, 14, 17], "descript": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "spec": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "evalu": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "plai": [13, 15], "medium": [14, 15, 40, 41], "umaz": [16, 17, 44, 45], "door": 18, "clone": [19, 23, 34, 47, 60], "expert": [20, 24, 35, 48], "human": [21, 25, 36, 49], "hammer": 22, "kitchen": 26, "complet": 27, "mix": 28, "partial": 29, "minigrid": 30, "fourroom": [31, 32], "random": 32, "pen": [33, 58], "point": 37, "dens": [39, 41, 43, 45], "open": [42, 43], "reloc": 46, "releas": 51, "note": 51, "v0": 51, "4": 51, "3": [51, 56], "2": [51, 56], "1": [51, 56], "0": 51, "creation": [52, 54, 57], "custom": 53, "subset": 55, "dictionari": 55, "pointmaz": 56, "d4rl": 56, "waypoint": 56, "planner": 56, "control": 56, "proport": 56, "term": 56, "p": 56, "deriv": 56, "d": 56, "integr": 56, "i": 56, "modifi": 56, "tutori": 57, "implicit": 58, "q": 58, "learn": 58, "torchrl": 58, "pre": 58, "requisit": 58, "For": 58, "headless": 58, "adroit": 58, "replai": 58, "buffer": 58, "defin": 58, "model": 58, "loss": 58, "optim": 58, "train": [58, 60], "result": 58, "behavior": 60, "pytorch": 60, "import": 60, "polici": 60, "gener": 60}, "envversion": {"sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1, "sphinx": 60}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Minari documentation": [[1, "minari-documentation"]], "Build the Documentation": [[1, "build-the-documentation"]], "DataCollector": [[2, "datacollector"]], "minari.DataCollector": [[2, "minari-datacollector"]], "Methods": [[2, "methods"], [3, "methods"], [4, "methods"], [6, "methods"]], "EpisodeMetadataCallback": [[3, "episodemetadatacallback"]], "minari.EpisodeMetadataCallback": [[3, "minari-episodemetadatacallback"]], "StepDataCallback": [[4, "stepdatacallback"]], "minari.StepDataCallback": [[4, "minari-stepdatacallback"]], "EpisodeData": [[5, "episodedata"]], "minari.EpisodeData": [[5, "minari-episodedata"]], "Attributes": [[5, "attributes"], [6, "attributes"]], "MinariDataset": [[6, "minaridataset"]], "minari.MinariDataset": [[6, "minari-minaridataset"]], "Minari": [[7, "minari"]], "Create Minari Dataset": [[7, "create-minari-dataset"], [8, "create-minari-dataset"]], "Load Minari Dataset": [[7, "load-minari-dataset"]], "Split Minari Dataset": [[7, "split-minari-dataset"]], "Download Minari Dataset": [[7, "download-minari-dataset"]], "List Minari Datasets": [[7, "list-minari-datasets"]], "Delete Minari Datasets": [[7, "delete-minari-datasets"]], "Combine Minari Datasets": [[7, "combine-minari-datasets"], [8, "combine-minari-datasets"]], "Normalize Score": [[7, "normalize-score"]], "Basic Usage": [[8, "basic-usage"]], "Installation": [[8, "installation"]], "Collecting Data": [[8, "collecting-data"]], "Save Dataset": [[8, "save-dataset"]], "Checkpoint Minari Dataset": [[8, "checkpoint-minari-dataset"]], "Using Minari Datasets": [[8, "using-minari-datasets"]], "Download Remote Datasets": [[8, "download-remote-datasets"]], "Sampling Episodes": [[8, "sampling-episodes"]], "Filter Episodes": [[8, "filter-episodes"]], "Split Dataset": [[8, "split-dataset"]], "Recover Environment": [[8, "recover-environment"]], "Dataset Standards": [[9, "dataset-standards"]], "Minari Storage": [[9, "minari-storage"]], "Minari root": [[9, "minari-root"]], "Data files": [[9, "data-files"]], "Dataset File Format": [[9, "dataset-file-format"]], "HDF5 file structure": [[9, "hdf5-file-structure"]], "Default dataset metadata": [[9, "default-dataset-metadata"]], "Observation and Action Spaces": [[9, "observation-and-action-spaces"]], "Supported Spaces": [[9, "supported-spaces"]], "Space Serialization": [[9, "space-serialization"]], "Minari Data Structures": [[9, "minari-data-structures"]], "EpisodeData Structure": [[9, "episodedata-structure"]], "Additional Information Formatting": [[9, "additional-information-formatting"]], "Minari CLI": [[10, "minari-cli"]], "List datasets": [[10, "list-datasets"]], "Download datasets": [[10, "download-datasets"]], "Delete local datasets": [[10, "delete-local-datasets"]], "Upload datasets": [[10, "upload-datasets"]], "Combine datasets": [[10, "combine-datasets"]], "Ant Maze": [[11, "ant-maze"]], "References": [[11, "references"], [18, "references"], [22, "references"], [26, "references"], [30, "references"], [33, "references"], [37, "references"], [46, "references"], [56, "references"]], "Available Datasets": [[11, "available-datasets"], [18, "available-datasets"], [22, "available-datasets"], [26, "available-datasets"], [30, "available-datasets"], [33, "available-datasets"], [37, "available-datasets"], [46, "available-datasets"]], "Large-Diverse": [[12, "large-diverse"]], "Description": [[12, "description"], [13, "description"], [14, "description"], [15, "description"], [16, "description"], [17, "description"], [19, "description"], [20, "description"], [21, "description"], [23, "description"], [24, "description"], [25, "description"], [27, "description"], [28, "description"], [29, "description"], [31, "description"], [32, "description"], [34, "description"], [35, "description"], [36, "description"], [38, "description"], [39, "description"], [40, "description"], [41, "description"], [42, "description"], [43, "description"], [44, "description"], [45, "description"], [47, "description"], [48, "description"], [49, "description"]], "Dataset Specs": [[12, "dataset-specs"], [13, "dataset-specs"], [14, "dataset-specs"], [15, "dataset-specs"], [16, "dataset-specs"], [17, "dataset-specs"], [19, "dataset-specs"], [20, "dataset-specs"], [21, "dataset-specs"], [23, "dataset-specs"], [24, "dataset-specs"], [25, "dataset-specs"], [27, "dataset-specs"], [28, "dataset-specs"], [29, "dataset-specs"], [31, "dataset-specs"], [32, "dataset-specs"], [34, "dataset-specs"], [35, "dataset-specs"], [36, "dataset-specs"], [38, "dataset-specs"], [39, "dataset-specs"], [40, "dataset-specs"], [41, "dataset-specs"], [42, "dataset-specs"], [43, "dataset-specs"], [44, "dataset-specs"], [45, "dataset-specs"], [47, "dataset-specs"], [48, "dataset-specs"], [49, "dataset-specs"]], "Environment Specs": [[12, "environment-specs"], [13, "environment-specs"], [14, "environment-specs"], [15, "environment-specs"], [16, "environment-specs"], [17, "environment-specs"], [19, "environment-specs"], [20, "environment-specs"], [21, "environment-specs"], [23, "environment-specs"], [24, "environment-specs"], [25, "environment-specs"], [27, "environment-specs"], [28, "environment-specs"], [29, "environment-specs"], [31, "environment-specs"], [32, "environment-specs"], [34, "environment-specs"], [35, "environment-specs"], [36, "environment-specs"], [38, "environment-specs"], [39, "environment-specs"], [40, "environment-specs"], [41, "environment-specs"], [42, "environment-specs"], [43, "environment-specs"], [44, "environment-specs"], [45, "environment-specs"], [47, "environment-specs"], [48, "environment-specs"], [49, "environment-specs"]], "Evaluation Environment Specs": [[12, "evaluation-environment-specs"], [13, "evaluation-environment-specs"], [14, "evaluation-environment-specs"], [15, "evaluation-environment-specs"], [16, "evaluation-environment-specs"], [17, "evaluation-environment-specs"], [19, "evaluation-environment-specs"], [20, "evaluation-environment-specs"], [21, "evaluation-environment-specs"], [23, "evaluation-environment-specs"], [24, "evaluation-environment-specs"], [25, "evaluation-environment-specs"], [27, "evaluation-environment-specs"], [28, "evaluation-environment-specs"], [29, "evaluation-environment-specs"], [31, "evaluation-environment-specs"], [32, "evaluation-environment-specs"], [34, "evaluation-environment-specs"], [35, "evaluation-environment-specs"], [36, "evaluation-environment-specs"], [38, "evaluation-environment-specs"], [39, "evaluation-environment-specs"], [40, "evaluation-environment-specs"], [41, "evaluation-environment-specs"], [42, "evaluation-environment-specs"], [43, "evaluation-environment-specs"], [44, "evaluation-environment-specs"], [45, "evaluation-environment-specs"], [47, "evaluation-environment-specs"], [48, "evaluation-environment-specs"], [49, "evaluation-environment-specs"]], "Large-Play": [[13, "large-play"]], "Medium-Diverse": [[14, "medium-diverse"]], "Medium-Play": [[15, "medium-play"]], "Umaze": [[16, "umaze"], [44, "umaze"]], "Umaze-Diverse": [[17, "umaze-diverse"]], "Door": [[18, "door"]], "Cloned": [[19, "cloned"], [23, "cloned"], [34, "cloned"], [47, "cloned"]], "Expert": [[20, "expert"], [24, "expert"], [35, "expert"], [48, "expert"]], "Human": [[21, "human"], [25, "human"], [36, "human"], [49, "human"]], "Hammer": [[22, "hammer"]], "Kitchen": [[26, "kitchen"]], "Complete": [[27, "complete"]], "Mixed": [[28, "mixed"]], "Partial": [[29, "partial"]], "MiniGrid": [[30, "minigrid"]], "Fourrooms": [[31, "fourrooms"]], "Fourrooms-Random": [[32, "fourrooms-random"]], "Pen": [[33, "pen"]], "Point Maze": [[37, "point-maze"]], "Large": [[38, "large"]], "Large-Dense": [[39, "large-dense"]], "Medium": [[40, "medium"]], "Medium-Dense": [[41, "medium-dense"]], "Open": [[42, "open"]], "Open-Dense": [[43, "open-dense"]], "Umaze-Dense": [[45, "umaze-dense"]], "Relocate": [[46, "relocate"]], "Release Notes": [[51, "release-notes"]], "v0.4.3": [[51, "release-v0-4-3"]], "v0.4.2": [[51, "release-v0-4-2"]], "v0.4.1": [[51, "release-v0-4-1"]], "v0.4.0": [[51, "release-v0-4-0"]], "v0.3.1": [[51, "release-v0-3-1"]], "v0.3.0": [[51, "release-v0-3-0"]], "0.2.2": [[51, "release-0-2-2"]], "0.1.0": [[51, "release-0-1-0"]], "Dataset Creation": [[52, "dataset-creation"], [54, "dataset-creation"], [57, "dataset-creation"]], "Serializing a custom space": [[53, "serializing-a-custom-space"]], "Collecting a subset of a dictionary space with StepDataCallback": [[55, "collecting-a-subset-of-a-dictionary-space-with-stepdatacallback"]], "PointMaze D4RL dataset": [[56, "pointmaze-d4rl-dataset"]], "WayPoint Planner": [[56, "waypoint-planner"]], "Waypoint Controller": [[56, "waypoint-controller"]], "1. Proportional Term (P)": [[56, "proportional-term-p"]], "2. Derivative Term (D)": [[56, "derivative-term-d"]], "3. Integral Term (I)": [[56, "integral-term-i"]], "Modified StepDataCallback": [[56, "modified-stepdatacallback"]], "Collect Data and Create Minari Dataset": [[56, "collect-data-and-create-minari-dataset"]], "Tutorials": [[57, "tutorials"]], "Using Datasets": [[57, "using-datasets"], [59, "using-datasets"], [61, "using-datasets"]], "Implicit Q-Learning with TorchRL": [[58, "implicit-q-learning-with-torchrl"]], "Pre-requisites": [[58, "pre-requisites"]], "For headless environments": [[58, "for-headless-environments"]], "The Adroit Pen environment": [[58, "the-adroit-pen-environment"]], "Building a replay buffer": [[58, "building-a-replay-buffer"]], "Implicit Q-Learning": [[58, "implicit-q-learning"]], "Defining the model": [[58, "defining-the-model"]], "Loss and optimizer": [[58, "loss-and-optimizer"]], "Training": [[58, "training"]], "Results": [[58, "results"]], "Behavioral cloning with PyTorch": [[60, "behavioral-cloning-with-pytorch"], [60, "id1"]], "Imports": [[60, "imports"]], "Policy training": [[60, "policy-training"]], "Dataset generation": [[60, "dataset-generation"]]}, "indexentries": {"datacollector (class in minari)": [[2, "minari.DataCollector"]], "close() (in module minari.datacollector)": [[2, "minari.DataCollector.close"]], "create_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.create_dataset"]], "reset() (in module minari.datacollector)": [[2, "minari.DataCollector.reset"]], "step() (in module minari.datacollector)": [[2, "minari.DataCollector.step"]], "episodemetadatacallback (class in minari)": [[3, "minari.EpisodeMetadataCallback"]], "__call__() (in module minari.episodemetadatacallback)": [[3, "minari.EpisodeMetadataCallback.__call__"]], "stepdatacallback (class in minari)": [[4, "minari.StepDataCallback"]], "__call__() (in module minari.stepdatacallback)": [[4, "minari.StepDataCallback.__call__"]], "episodedata (class in minari)": [[5, "minari.EpisodeData"]], "actions (minari.episodedata attribute)": [[5, "minari.EpisodeData.actions"]], "id (minari.episodedata attribute)": [[5, "minari.EpisodeData.id"]], "observations (minari.episodedata attribute)": [[5, "minari.EpisodeData.observations"]], "seed (minari.episodedata attribute)": [[5, "minari.EpisodeData.seed"]], "terminations (minari.episodedata attribute)": [[5, "minari.EpisodeData.terminations"]], "total_steps (minari.episodedata attribute)": [[5, "minari.EpisodeData.total_steps"]], "truncations (minari.episodedata attribute)": [[5, "minari.EpisodeData.truncations"]], "minaridataset (class in minari)": [[6, "minari.MinariDataset"]], "episode_indices (minari.minaridataset attribute)": [[6, "minari.MinariDataset.episode_indices"]], "filter_episodes() (in module minari.minaridataset)": [[6, "minari.MinariDataset.filter_episodes"]], "iterate_episodes() (in module minari.minaridataset)": [[6, "minari.MinariDataset.iterate_episodes"]], "recover_environment() (in module minari.minaridataset)": [[6, "minari.MinariDataset.recover_environment"]], "sample_episodes() (in module minari.minaridataset)": [[6, "minari.MinariDataset.sample_episodes"]], "set_seed() (in module minari.minaridataset)": [[6, "minari.MinariDataset.set_seed"]], "spec (minari.minaridataset attribute)": [[6, "minari.MinariDataset.spec"]], "total_episodes (minari.minaridataset attribute)": [[6, "minari.MinariDataset.total_episodes"]], "total_steps (minari.minaridataset attribute)": [[6, "minari.MinariDataset.total_steps"]], "update_dataset_from_buffer() (in module minari.minaridataset)": [[6, "minari.MinariDataset.update_dataset_from_buffer"]], "combine_datasets() (in module minari)": [[7, "minari.combine_datasets"]], "create_dataset_from_buffers() (in module minari)": [[7, "minari.create_dataset_from_buffers"]], "delete_dataset() (in module minari)": [[7, "minari.delete_dataset"]], "download_dataset() (in module minari)": [[7, "minari.download_dataset"]], "get_normalized_score() (in module minari)": [[7, "minari.get_normalized_score"]], "list_local_datasets() (in module minari)": [[7, "minari.list_local_datasets"]], "list_remote_datasets() (in module minari)": [[7, "minari.list_remote_datasets"]], "load_dataset() (in module minari)": [[7, "minari.load_dataset"]], "split_dataset() (in module minari)": [[7, "minari.split_dataset"]]}}) \ No newline at end of file +Search.setIndex({"docnames": ["404", "README", "api/data_collector", "api/data_collector_callbacks/episode_metadata_callback", "api/data_collector_callbacks/step_data_callback", "api/minari_dataset/episode_data", "api/minari_dataset/minari_dataset", "api/minari_functions", "content/basic_usage", "content/dataset_standards", "content/minari_cli", "datasets/antmaze", "datasets/antmaze/large-diverse", "datasets/antmaze/large-play", "datasets/antmaze/medium-diverse", "datasets/antmaze/medium-play", "datasets/antmaze/umaze", "datasets/antmaze/umaze-diverse", "datasets/door", "datasets/door/cloned", "datasets/door/expert", "datasets/door/human", "datasets/hammer", "datasets/hammer/cloned", "datasets/hammer/expert", "datasets/hammer/human", "datasets/kitchen", "datasets/kitchen/complete", "datasets/kitchen/mixed", "datasets/kitchen/partial", "datasets/minigrid", "datasets/minigrid/fourrooms", "datasets/minigrid/fourrooms-random", "datasets/pen", "datasets/pen/cloned", "datasets/pen/expert", "datasets/pen/human", "datasets/pointmaze", "datasets/pointmaze/large", "datasets/pointmaze/large-dense", "datasets/pointmaze/medium", "datasets/pointmaze/medium-dense", "datasets/pointmaze/open", "datasets/pointmaze/open-dense", "datasets/pointmaze/umaze", "datasets/pointmaze/umaze-dense", "datasets/relocate", "datasets/relocate/cloned", "datasets/relocate/expert", "datasets/relocate/human", "index", "release_notes/index", "tutorials/dataset_creation/README", "tutorials/dataset_creation/custom_space_serialization", "tutorials/dataset_creation/index", "tutorials/dataset_creation/observation_space_subseting", "tutorials/dataset_creation/point_maze_dataset", "tutorials/index", "tutorials/using_datasets/IQL_torchrl", "tutorials/using_datasets/README", "tutorials/using_datasets/behavioral_cloning", "tutorials/using_datasets/index"], "filenames": ["404.md", "README.md", "api/data_collector.md", "api/data_collector_callbacks/episode_metadata_callback.md", "api/data_collector_callbacks/step_data_callback.md", "api/minari_dataset/episode_data.md", "api/minari_dataset/minari_dataset.md", "api/minari_functions.md", "content/basic_usage.md", "content/dataset_standards.md", "content/minari_cli.md", "datasets/antmaze.md", "datasets/antmaze/large-diverse.md", "datasets/antmaze/large-play.md", "datasets/antmaze/medium-diverse.md", "datasets/antmaze/medium-play.md", "datasets/antmaze/umaze.md", "datasets/antmaze/umaze-diverse.md", "datasets/door.md", "datasets/door/cloned.md", "datasets/door/expert.md", "datasets/door/human.md", "datasets/hammer.md", "datasets/hammer/cloned.md", "datasets/hammer/expert.md", "datasets/hammer/human.md", "datasets/kitchen.md", "datasets/kitchen/complete.md", "datasets/kitchen/mixed.md", "datasets/kitchen/partial.md", "datasets/minigrid.md", "datasets/minigrid/fourrooms.md", "datasets/minigrid/fourrooms-random.md", "datasets/pen.md", "datasets/pen/cloned.md", "datasets/pen/expert.md", "datasets/pen/human.md", "datasets/pointmaze.md", "datasets/pointmaze/large.md", "datasets/pointmaze/large-dense.md", "datasets/pointmaze/medium.md", "datasets/pointmaze/medium-dense.md", "datasets/pointmaze/open.md", "datasets/pointmaze/open-dense.md", "datasets/pointmaze/umaze.md", "datasets/pointmaze/umaze-dense.md", "datasets/relocate.md", "datasets/relocate/cloned.md", "datasets/relocate/expert.md", "datasets/relocate/human.md", "index.md", "release_notes/index.md", "tutorials/dataset_creation/README.rst", "tutorials/dataset_creation/custom_space_serialization.rst", "tutorials/dataset_creation/index.rst", "tutorials/dataset_creation/observation_space_subseting.rst", "tutorials/dataset_creation/point_maze_dataset.rst", "tutorials/index.rst", "tutorials/using_datasets/IQL_torchrl.rst", "tutorials/using_datasets/README.rst", "tutorials/using_datasets/behavioral_cloning.rst", "tutorials/using_datasets/index.rst"], "titles": ["404 - Page Not Found", "Minari documentation", "DataCollector", "EpisodeMetadataCallback", "StepDataCallback", "EpisodeData", "MinariDataset", "Minari", "Basic Usage", "Dataset Standards", "Minari CLI", "Ant Maze", "Large-Diverse", "Large-Play", "Medium-Diverse", "Medium-Play", "Umaze", "Umaze-Diverse", "Door", "Cloned", "Expert", "Human", "Hammer", "Cloned", "Expert", "Human", "Kitchen", "Complete", "Mixed", "Partial", "MiniGrid", "Fourrooms", "Fourrooms-Random", "Pen", "Cloned", "Expert", "Human", "Point Maze", "Large", "Large-Dense", "Medium", "Medium-Dense", "Open", "Open-Dense", "Umaze", "Umaze-Dense", "Relocate", "Cloned", "Expert", "Human", "<no title>", "Release Notes", "Dataset Creation", "Serializing a custom space", "Dataset Creation", "Collecting a subset of a dictionary space with StepDataCallback", "PointMaze D4RL dataset", "Tutorials", "Implicit Q-Learning with TorchRL", "Using Datasets", "Behavioral cloning with PyTorch", "Using Datasets"], "terms": {"thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "folder": [1, 60], "contain": [1, 2, 3, 4, 5, 7, 9, 11, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 37, 42, 43, 44, 45, 47, 48, 49, 51], "For": [1, 7, 8, 9, 51, 53, 56, 60], "more": [1, 3, 8, 9, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 56, 58], "inform": [1, 2, 4, 6, 51, 56], "about": [1, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53], "how": [1, 2, 9, 51, 53, 55, 56, 58, 60], "contribut": [1, 8, 51, 56], "go": [1, 56], "our": [1, 8, 9, 10, 51, 55, 56, 58, 60], "md": [1, 51], "instal": [1, 2, 7, 10, 50, 51, 53, 58, 60], "requir": [1, 9, 10, 51, 53, 55, 56, 58, 60], "packag": [1, 10, 51, 60], "git": [1, 8], "clone": [1, 8, 10, 18, 22, 33, 46, 50, 51, 57, 58, 61], "http": [1, 8, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 53, 56, 60], "github": [1, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56], "com": [1, 8, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56], "farama": [1, 7, 8, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 56, 58, 60], "foundat": [1, 8, 51, 53, 56], "cd": [1, 8], "pip": [1, 8, 10, 50, 53, 58, 60], "e": [1, 6, 7, 8, 51, 58], "r": [1, 12, 13, 14, 15, 16, 17, 56, 58], "doc": [1, 51, 53, 56], "txt": 1, "To": [1, 2, 8, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 58, 60], "onc": [1, 8, 56, 58, 60], "make": [1, 2, 6, 8, 9, 51, 53, 55, 56, 58, 60], "dirhtml": 1, "rebuild": 1, "automat": [1, 2, 51], "everi": [1, 7, 8, 9, 16, 56, 58], "time": [1, 2, 7, 8, 56], "chang": [1, 50, 51, 56], "i": [1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 30, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 58, 60], "made": [1, 51], "sphinx": 1, "autobuild": 1, "b": [1, 10, 50], "_build": 1, "class": [2, 3, 4, 5, 6, 9, 51, 55, 56, 58, 60], "env": [2, 4, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58, 60], "step_data_callback": [2, 55, 56], "type": [2, 9, 18, 22, 26, 33, 46, 51, 53, 58, 60], "stepdatacallback": [2, 9, 51, 54, 57], "episode_metadata_callback": [2, 3], "episodemetadatacallback": [2, 9, 51], "record_info": [2, 8, 9, 56], "bool": [2, 4, 6, 7, 9, 51, 58], "fals": [2, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 53, 55, 56, 58, 60], "max_buffer_step": [2, 8], "int": [2, 5, 6, 7, 51, 56], "none": [2, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56], "observation_spac": [2, 7, 9, 51, 53, 55, 60], "action_spac": [2, 7, 8, 9, 51, 53, 55, 56, 60], "sourc": [2, 3, 4, 5, 6, 7, 8, 51, 53, 55, 56, 57, 58, 60], "gymnasium": [2, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "environ": [2, 4, 5, 6, 7, 9, 10, 11, 18, 22, 26, 30, 33, 37, 46, 50, 51, 53, 55, 56, 60], "wrapper": [2, 3, 8, 9, 51, 53, 56, 58, 60], "collect": [2, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 54, 57, 58], "step": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "data": [2, 3, 4, 5, 6, 7, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 26, 30, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50, 51, 53, 58, 60], "meant": [2, 51], "work": [2, 8, 51, 58], "temporari": [2, 8, 51, 56], "buffer": [2, 6, 7, 8, 51], "befor": [2, 8, 53, 56, 58], "creat": [2, 4, 6, 9, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 51, 53, 55, 58, 60], "dataset": [2, 3, 4, 5, 6, 50, 51, 53, 55, 58], "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 56, 60], "creation": [2, 51], "convert": [2, 56, 58], "agnost": [2, 58], "user": [2, 8, 9, 51], "import": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58], "gym": [2, 4, 6, 7, 8, 51, 53, 55, 56, 58, 60], "envid": 2, "reset": [2, 5, 8, 9, 12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 55, 56, 58, 60], "_": [2, 8, 53, 55, 56, 58, 60], "rang": [2, 7, 8, 51, 53, 55, 56, 58, 60], "num_step": [2, 9], "action": [2, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58, 60], "sampl": [2, 6, 9, 50, 51, 53, 55, 58], "ob": [2, 4, 8, 9, 51, 56, 60], "rew": [2, 4, 8, 9, 51, 56, 60], "termin": [2, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 37, 51, 53, 55, 56, 58, 60], "truncat": [2, 4, 5, 6, 7, 8, 9, 37, 51, 53, 55, 56, 58, 60], "info": [2, 4, 5, 8, 9, 51, 56, 60], "create_dataset": [2, 8, 51, 53, 55, 56, 60], "dataset_id": [2, 7, 8, 9, 51, 53, 55, 56, 58, 60], "env_nam": [2, 7, 9], "dataset_nam": [2, 7, 8, 9, 56], "v": [2, 7, 9, 10, 26, 58], "version": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55, 56], "kwarg": [2, 4, 6, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55], "some": [2, 8, 9, 10, 51, 53, 56, 58], "characterist": [2, 56], "store": [2, 7, 8, 9, 51, 55, 58], "per": [2, 51], "episod": [2, 3, 5, 6, 7, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "dictionari": [2, 4, 6, 7, 8, 9, 51, 54, 56, 57, 58], "ar": [2, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 46, 47, 48, 49, 50, 51, 53, 56, 58], "memori": [2, 8, 51], "global": [2, 9, 56], "list": [2, 6, 8, 9, 50, 51, 58, 60], "item": [2, 6, 7, 56, 58, 60], "valu": [2, 4, 5, 6, 7, 8, 9, 38, 40, 42, 44, 51, 56, 58], "main": [2, 6, 51, 53, 56, 58], "observ": [2, 4, 5, 6, 7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "kei": [2, 4, 7, 8, 9, 10, 55, 56, 58], "can": [2, 3, 4, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "anoth": [2, 4, 8, 9, 18, 22, 33, 46, 56, 58], "nest": [2, 4, 6, 7, 9, 51], "extra": [2, 3, 4, 8, 9, 51, 56], "separ": [2, 8, 51], "ad": [2, 4, 6, 7, 8, 9, 38, 39, 40, 41, 42, 43, 44, 45, 51, 55], "pass": [2, 3, 6, 7, 8, 55, 58], "custom": [2, 3, 8, 9, 51, 54, 56, 57], "when": [2, 6, 8, 9, 12, 13, 14, 15, 16, 17, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 55, 56, 58], "hdf5": [2, 3, 10, 50, 51, 55, 56], "file": [2, 3, 8, 10, 50, 51, 55], "gener": [2, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 56], "new": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 56, 58, 60], "group": [2, 3, 7, 8, 9, 10, 51, 56], "A": [2, 9, 26, 50, 56, 58], "call": [2, 4, 8, 9, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49], "return": [2, 4, 5, 6, 7, 8, 9, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 40, 42, 44, 47, 48, 49, 51, 53, 55, 56, 58, 60], "If": [2, 6, 7, 8, 9, 10, 51, 53, 56, 58], "previou": [2, 8, 51], "wa": [2, 6, 7, 9, 11, 18, 22, 30, 31, 32, 33, 46, 51, 53], "perform": [2, 7, 8, 10, 26, 28, 29, 56, 58, 60], "cach": [2, 8, 51, 58], "set": [2, 6, 8, 9, 11, 12, 13, 14, 15, 16, 17, 56, 58, 60], "max_buffer_episod": 2, "save": [2, 3, 9, 51, 53, 55, 56, 58, 60], "disk": [2, 8, 9, 51, 53, 55, 60], "non": [2, 8, 9, 11, 37], "move": [2, 8, 26, 37, 46, 51, 56], "from": [2, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 55, 56, 58, 60], "perman": [2, 8], "locat": [2, 8, 11, 12, 13, 14, 15, 16, 17, 37, 38, 39, 40, 41, 42, 43, 44, 45, 56, 58], "onli": [2, 7, 8, 9, 37, 38, 40, 42, 43, 44, 55, 58], "all": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 26, 27, 51, 53, 57, 58, 60], "us": [2, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58, 60], "save_to_disk": 2, "path_to_permanent_loc": 2, "initi": [2, 5, 6, 7, 8, 9, 51, 53, 55, 56, 58, 60], "collector": [2, 56], "attribut": [2, 3, 7, 8, 9, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 51], "directori": [2, 8, 9, 58], "paramet": [2, 3, 4, 6, 7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 58, 60], "option": [2, 4, 6, 7, 8, 9, 10, 51], "callback": [2, 3, 4, 51, 55, 56], "edit": [2, 4], "updat": [2, 8, 51, 56, 58], "databefor": 2, "default": [2, 3, 4, 6, 7, 8, 58], "add": [2, 3, 4, 6, 9, 10, 38, 39, 40, 41, 42, 43, 44, 45, 51, 56, 58], "metadata": [2, 3, 6, 7, 8, 10, 51, 55], "true": [2, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56, 58, 60], "record": [2, 8, 9, 51, 55, 56], "each": [2, 3, 4, 5, 6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 55, 56, 58, 60], "number": [2, 5, 6, 7, 8, 9, 10, 51], "dump": [2, 53], "rais": [2, 7], "valueerror": 2, "t": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 51, 53, 55, 56, 58], "same": [2, 6, 7, 8, 9, 16, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 51, 56, 58], "self": [2, 3, 4, 6, 9, 55, 56, 60], "acttyp": [2, 7], "tupl": [2, 9, 51, 56, 58], "obstyp": [2, 7], "supportsfloat": 2, "dict": [2, 3, 4, 5, 6, 7, 9, 12, 13, 14, 15, 16, 17, 27, 28, 29, 31, 32, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 55], "str": [2, 4, 6, 7, 9, 53], "ani": [2, 4, 5, 6, 7, 8, 9, 55, 56], "seed": [2, 5, 6, 7, 8, 9, 51, 53, 55, 56, 58, 60], "one": [2, 5, 6, 8, 18, 22, 33, 37, 46, 51, 58], "reproduc": [2, 8, 30, 58, 60], "unless": 2, "minari_autose": 2, "": [2, 3, 4, 6, 7, 8, 9, 10, 12, 13, 14, 15, 17, 26, 51, 53, 55, 56, 58, 60], "prng": 2, "specifi": [2, 6, 7, 8, 9, 51, 58], "addit": [2, 4, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "disabl": 2, "state": [2, 9, 26, 37, 56, 58], "auxiliari": 2, "complement": 2, "eval_env": [2, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "envspec": [2, 7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "algorithm_nam": [2, 7, 8, 9, 53, 55, 56, 60], "author": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 56, 60], "author_email": [2, 7, 8, 9, 51, 53, 56, 60], "code_permalink": [2, 7, 8, 9, 53, 56, 60], "ref_min_scor": [2, 7], "float": [2, 7, 55, 58], "ref_max_scor": [2, 7], "expert_polici": [2, 7], "callabl": [2, 6, 7, 8, 51, 53], "num_episodes_average_scor": [2, 7], "100": [2, 7, 8, 10, 34, 35, 36, 50, 51, 58], "minari_vers": [2, 7, 9, 51], "wrap": [2, 8, 51, 56, 58], "correspond": [2, 7, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 56, 60], "name": [2, 7, 8, 9, 10, 50, 51, 53, 60], "syntax": [2, 7, 9], "follow": [2, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 56, 58], "where": [2, 7, 9, 26, 29, 51, 56, 58], "identifi": [2, 7, 9], "load": [2, 8, 9, 51, 53, 58, 60], "load_dataset": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 60], "id": [2, 5, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 56, 60], "union": [2, 6, 7, 53], "spec": [2, 6, 7, 9, 51, 53, 58], "evalu": [2, 6, 7, 8, 51, 58, 60], "after": [2, 3, 5, 7, 9, 10, 51, 56, 60], "recov": [2, 6, 7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 58], "minaridataset": [2, 5, 7, 8, 9, 51, 60], "recover_environ": [2, 6, 7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 60], "should": [2, 6, 7, 53, 55], "algorithm": [2, 7, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 58], "email": [2, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51], "link": [2, 7, 8, 9], "relev": [2, 7, 8, 9], "code": [2, 7, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 57, 58, 60], "minimum": [2, 7, 8, 9, 51], "refer": [2, 7, 51], "score": [2, 58], "averag": [2, 7, 58], "random": [2, 6, 7, 8, 9, 13, 15, 17, 30, 37, 38, 39, 40, 41, 42, 43, 44, 45, 53, 55, 56, 58, 60], "polici": [2, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 26, 30, 31, 32, 33, 34, 35, 37, 46, 47, 48, 56, 58], "later": [2, 7, 51, 58], "normal": [2, 58], "get_normalized_scor": [2, 7, 51], "estim": [2, 7, 58], "maximum": [2, 7, 9, 56, 58, 60], "hypothet": [2, 7], "expert": [2, 7, 8, 9, 10, 11, 18, 19, 22, 23, 30, 31, 33, 34, 46, 47, 50, 51, 58, 60], "comput": [2, 7, 8, 9, 58], "over": [2, 6, 7, 8, 56, 58], "equal": [2, 7, 8, 9], "compat": [2, 7, 8, 9, 10, 51, 60], "close": [2, 26, 56, 58, 60], "clear": [2, 8], "full": [3, 9, 30, 31, 51, 58], "overridden": [3, 4, 7, 51], "statist": [3, 9], "datacollector": [3, 8, 9, 51, 53, 55, 56, 60], "argument": [3, 4, 7, 8, 9, 51], "todo": 3, "__call__": [3, 4, 9, 55, 56], "overrid": [3, 4, 9, 10, 56], "an": [3, 6, 7, 8, 9, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 42, 43, 46, 47, 48, 49, 51, 53, 56, 58], "reward": [4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 22, 33, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 51, 58, 60], "stepdata": [4, 9], "input": [4, 6, 8, 9, 58, 60], "belong": 4, "transit": [4, 51, 56, 58], "customstepdatacallback": 4, "def": [4, 9, 53, 55, 56, 58, 60], "step_data": [4, 9, 55, 56], "super": [4, 9, 55, 56, 60], "environment_st": 4, "pose": [4, 56], "posit": [4, 9, 26, 30, 46, 56, 58], "orient": [4, 33, 55], "veloc": [4, 37, 56], "current": [4, 7, 10, 50, 51, 56, 58], "must": [4, 6, 7, 8, 9, 51, 58], "step_data_kei": 4, "total_step": [5, 6, 9, 51, 56, 60], "ndarrai": [5, 6, 7, 9, 51], "singl": [5, 7, 8, 9, 10, 58], "object": [5, 6, 8, 9, 18, 22, 26, 30, 33, 46, 51, 53, 58, 60], "sample_episod": [5, 6, 8, 9, 51, 55], "api": [5, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 56, 60], "final": [5, 6, 7, 8, 11, 51, 53, 55, 56, 58], "includ": [5, 6, 7, 9, 26, 27, 29, 37, 51, 58], "mean": [5, 8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 56, 58], "increas": 5, "compar": [5, 55], "taken": [5, 38, 39, 40, 41, 42, 43, 44, 45, 55], "minaristorag": [6, 51], "pathlik": 6, "episode_indic": [6, 8], "get": [6, 7, 8, 10, 51, 53, 55, 56, 58, 60], "properti": [6, 58], "np": [6, 7, 9, 51, 55, 56, 58, 60], "slice": 6, "indic": [6, 8, 51], "point": [6, 51, 55, 58], "n_episod": [6, 8], "iter": [6, 8, 9, 11, 37, 56, 58], "episodedata": [6, 8, 51], "n": [6, 8, 9, 10, 56, 60], "iterate_episod": [6, 8, 51], "filter_episod": [6, 8, 9, 51], "condit": [6, 8, 9, 51, 58], "filter": [6, 9, 50, 51], "which": [6, 7, 8, 9, 11, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 55, 56, 58, 60], "take": [6, 9, 53, 56], "instanc": [6, 51], "retutrn": 6, "met": 6, "otherwis": [6, 8, 38, 40, 42, 44, 51], "lambda": [6, 8, 51, 53, 56], "x": [6, 37, 56, 60], "1": [6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 55, 58, 60], "function": [6, 7, 8, 9, 10, 31, 32, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 53, 56, 58, 60], "certain": [6, 8, 33], "set_se": [6, 8, 58], "intend": 6, "other": [6, 7, 9, 10, 26, 29, 51, 55, 56, 58], "you": [6, 8, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 56, 58, 60], "want": [6, 8, 10, 56], "update_dataset_from_buff": 6, "have": [6, 7, 8, 9, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 28, 29, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 53, 55, 56, 58, 60], "shape": [6, 7, 9, 11, 16, 17, 37, 44, 45, 51, 55, 56, 58, 60], "total_episode_step": [6, 7], "observation_shap": [6, 7], "action_shap": [6, 7], "long": [6, 7, 26, 56], "total": [6, 8, 9, 10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 56, 58], "total_episod": [6, 8, 9, 51, 60], "avail": [6, 7, 8, 9, 10, 50, 51, 53, 58], "within": [6, 9, 51, 58], "create_dataset_from_buff": [7, 8, 51], "space": [7, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 54, 56, 57, 58, 60], "latter": [7, 58], "also": [7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 50, 51, 53, 55, 56, 58], "note": [7, 9, 12, 13, 14, 15, 16, 17, 55, 56, 58], "assign": [7, 9], "valid": [7, 55, 56, 58], "than": [7, 8, 12, 13, 14, 15, 16, 17, 51, 58], "retriev": [7, 8, 51], "local": [7, 8, 9, 50, 51, 53, 55, 58, 60], "databas": [7, 10], "found": [7, 9], "split_dataset": [7, 8, 51], "size": [7, 8, 51, 56, 58], "multipl": [7, 8, 9, 10, 51, 58], "result": [7, 9, 51, 53, 56], "download_dataset": [7, 8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "force_download": [7, 51], "remot": [7, 9, 10, 50, 51], "server": [7, 8, 10, 50, 58], "error": [7, 51, 53, 56, 58], "skip": [7, 58], "continu": [7, 8, 9, 37, 38, 39, 40, 41, 42, 43, 44, 45, 56], "match": 7, "boolean": 7, "flag": [7, 51, 58], "forc": [7, 10, 37, 56], "list_local_dataset": [7, 8, 51, 55], "latest_vers": 7, "compatible_minari_vers": 7, "latest": [7, 10, 51, 56], "door": [7, 8, 9, 10, 19, 20, 21, 26, 50, 51], "human": [7, 8, 9, 10, 18, 19, 22, 23, 33, 34, 46, 47, 50, 51, 58, 60], "v0": [7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 30, 31, 32, 50, 53, 56], "v1": [7, 8, 9, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 58, 60], "list_remote_dataset": [7, 8, 51], "delete_dataset": [7, 53, 55], "combine_dataset": [7, 8, 51], "datasets_to_combin": [7, 51], "new_dataset_id": [7, 51], "its": [7, 51, 53, 56, 58], "own": [7, 8, 10, 51, 56], "combined_dataset": 7, "were": [7, 8, 9, 10, 18, 22, 26, 33, 37, 46, 51], "form": [7, 56], "newli": [7, 8, 58], "undiscount": [7, 9], "origin": [7, 8, 18, 22, 26, 33, 37, 46, 51, 53, 58], "provid": [7, 8, 9, 11, 12, 14, 18, 19, 20, 21, 22, 23, 24, 25, 33, 34, 35, 36, 46, 47, 48, 49, 50, 51, 58], "d4rl": [7, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 54, 57], "repositori": [7, 9, 18, 20, 21, 22, 24, 25, 26, 33, 36, 46, 48, 49], "facilit": [7, 8, 51], "comparison": 7, "across": [7, 9], "differ": [7, 8, 9, 37, 51, 53, 56, 58], "task": [7, 8, 11, 18, 22, 26, 29, 33, 38, 39, 40, 41, 42, 43, 44, 45, 46, 56, 58, 60], "between": [7, 9, 39, 41, 43, 45, 56], "0": [7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 53, 55, 56, 58, 60], "calcul": [7, 58], "These": [7, 9, 10, 18, 22, 26, 33, 37, 46, 51, 56], "two": [7, 8, 9, 10, 18, 22, 33, 37, 46, 51, 58, 60], "respect": [7, 9, 56, 58], "formula": [7, 56], "_score": 7, "frac": 7, "ref": 7, "_min": 7, "_max": 7, "util": [7, 8, 50, 58, 60], "under": [7, 9, 37, 50, 51, 58], "test": [7, 8, 9, 11, 51, 55], "now": [7, 9, 51, 53, 55, 56, 60], "arrai": [7, 9, 56], "normalized_scor": 7, "standard": [8, 51, 58], "host": [8, 10, 18, 22, 26, 33, 46, 50], "interfac": [8, 9], "offlin": [8, 9, 10, 50, 51, 56, 58, 60], "reinforc": [8, 10, 11, 18, 22, 26, 30, 33, 37, 46, 50, 56], "learn": [8, 10, 11, 18, 22, 26, 30, 33, 37, 46, 50, 51, 53, 55, 56, 57, 60, 61], "applic": 8, "most": [8, 10], "rl": [8, 18, 20, 22, 24, 33, 35, 46, 48, 51, 58, 60], "handl": [8, 50], "capabl": 8, "recent": [8, 58], "librari": [8, 50, 51, 53, 60], "run": [8, 18, 19, 22, 23, 33, 34, 46, 47, 51, 58], "command": [8, 10, 51, 60], "d": [8, 58], "like": [8, 10, 53, 58, 60], "start": [8, 9, 53, 55, 56, 58, 60], "pleas": [8, 10, 51, 55], "project": [8, 9, 51], "we": [8, 9, 10, 30, 51, 53, 55, 56, 58, 60], "support": [8, 51, 53, 56, 58], "python": [8, 9, 50, 51, 53, 55, 56, 57, 58, 60], "3": [8, 9, 10, 11, 27, 28, 29, 31, 32, 53, 58], "8": [8, 11, 12, 13, 14, 15, 16, 17, 37, 51, 56], "linux": 8, "maco": 8, "abstract": 8, "process": [8, 51, 56, 58], "achiev": [8, 9, 56, 60], "intern": [8, 51], "schedul": [8, 51], "amount": [8, 56], "while": [8, 9, 51, 53, 55, 56, 58, 60], "veri": 8, "simpl": [8, 9, 51, 56, 58, 60], "cartpol": [8, 51, 60], "100000": 8, "In": [8, 9, 51, 53, 55, 56, 58, 60], "exampl": [8, 9, 10, 51, 53, 56, 57, 58], "give": [8, 9, 10, 56, 58], "them": [8, 9, 51, 60], "There": [8, 18, 22, 26, 33, 46, 58], "detail": [8, 58], "descript": [8, 9, 11, 18, 22, 26, 30, 33, 37, 46, 51], "read": [8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 58], "document": [8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "first": [8, 9, 51, 53, 55, 56, 58], "need": [8, 9, 51, 53, 55, 56, 58, 60], "given": [8, 9, 10], "allow": [8, 9, 51, 56, 60], "compris": [8, 9], "just": [8, 53, 58], "loop": [8, 58, 60], "through": [8, 9, 10, 50, 51, 56, 58], "gymansium": 8, "mdp": [8, 51], "done": [8, 56, 58, 60], "root": 8, "path": [8, 9, 10, 38, 39, 40, 41, 42, 43, 44, 45, 50, 51, 56, 60], "structur": [8, 51], "extend": [8, 55], "123": [8, 51, 56], "break": [8, 51, 56, 60], "contact": [8, 10, 53, 60], "org": [8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 56, 60], "well": [8, 9, 10, 50, 51, 56, 58], "snippet": [8, 9], "ha": [8, 9, 16, 37, 51, 56, 58], "been": [8, 9, 37, 51], "check": [8, 10, 51, 56], "appear": 8, "2059": 8, "6": [8, 51], "mb": 8, "wai": [8, 9, 56, 58], "left": [8, 56, 58], "instead": [8, 9, 51, 56, 58], "respons": 8, "specif": [8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 51, 55, 56, 58], "won": [8, 56], "until": [8, 9, 38, 39, 40, 41, 42, 43, 44, 45], "larg": [8, 11, 37, 51], "avoid": [8, 58], "lose": 8, "append": [8, 51, 58], "update_dataset_from_collector_env": [8, 51], "method": [8, 9, 11, 37, 51, 53, 56, 58], "10": [8, 9, 51, 53, 55, 56, 58], "episode_id": [8, 9, 51], "alreadi": [8, 10, 51, 55, 56, 58], "els": [8, 51, 56, 58], "add_to_dataset": 8, "abl": [8, 37], "your": [8, 10, 51, 60], "order": [8, 26, 27, 51, 55], "featur": [8, 9, 50, 51, 60], "print": [8, 51, 53, 55, 58, 60], "storag": 8, "googl": [8, 9, 58], "cloud": [8, 9], "platform": [8, 9], "gcp": [8, 9, 10, 50], "bucket": [8, 9, 10, 50], "access": [8, 9, 10, 51, 56], "antmaz": [8, 11, 12, 13, 14, 15, 16, 17], "divers": [8, 11], "1000": [8, 12, 13, 14, 15, 51, 58], "1000000": [8, 10, 12, 13, 14, 15, 16, 17, 19, 20, 23, 24, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 50], "700": [8, 16, 17], "5": [8, 9, 51, 56, 58], "alex": [8, 12, 13, 14, 15, 16, 17], "davei": [8, 12, 13, 14, 15, 16, 17], "amd1g13": [8, 12, 13, 14, 15, 16, 17], "soton": [8, 12, 13, 14, 15, 16, 17], "ac": [8, 12, 13, 14, 15, 16, 17, 60], "uk": [8, 12, 13, 14, 15, 16, 17], "plai": [8, 11], "medium": [8, 11, 37, 51, 56], "25": [8, 10, 18, 21, 22, 25, 33, 36, 46, 49, 50, 51, 58], "6729": [8, 10, 21, 50], "7": [8, 27, 28, 29, 31, 32, 51, 53, 58], "rodrigo": [8, 10, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 56], "de": [8, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 47, 48, 49], "lazcano": [8, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 47, 48, 49], "rperezvicent": [8, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 56], "shard": 8, "randomli": [8, 9, 37, 53, 56], "map": [8, 12, 14, 56, 58], "ep": 8, "f": [8, 9, 10, 51, 53, 55, 58, 60], "show": [8, 10, 50, 51, 53, 55, 58], "13": [8, 51], "22": [8, 11, 51], "15": 8, "23": 8, "18": [8, 51], "2": [8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 22, 26, 27, 28, 29, 33, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 53, 55, 58], "12": [8, 51, 58], "19": [8, 27, 51], "9": [8, 27, 28, 29], "4": [8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 53, 55, 56], "17": [8, 51], "21": 8, "notic": 8, "doesn": [8, 9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 56], "serv": 8, "purpos": [8, 37, 56, 58], "replai": [8, 51], "out": [8, 51, 53, 56, 58], "leav": 8, "dataload": [8, 51, 60], "mai": [8, 9, 56, 58], "abil": 8, "determinist": [8, 56], "episodes_gener": 8, "itself": 8, "howev": [8, 9, 37, 51, 53, 56, 58, 60], "case": [8, 9, 51, 56], "h5py": [8, 9, 51], "format": [8, 51, 53], "keep": [8, 51], "greater": [8, 51], "filter_dataset": [8, 51], "remov": [8, 51], "divid": [8, 9, 56], "20": [8, 51, 58], "second": [8, 51], "lunarland": 8, "v2": [8, 51], "eval_env_spec": [8, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49], "lastli": 8, "adroithanddoor": [8, 9, 18, 19, 20, 21, 51], "5025": 8, "1006729": 8, "1103": 8, "5000": [8, 10, 20, 24, 36, 48, 50, 58], "1096": 8, "common": 9, "modifi": [9, 51, 55], "variabl": [9, 51, 56], "minari_datasets_path": 9, "kept": 9, "public": [9, 51, 56], "level": 9, "tree": 9, "string": [9, 53], "describ": [9, 51], "come": [9, 10, 50], "ennv_nam": 9, "content": [9, 10], "integ": 9, "repres": [9, 53, 58], "end": [9, 51], "yet": 9, "_doc": 9, "wip": 9, "homogen": 9, "main_data": [9, 10, 50, 51], "asid": 9, "raw": 9, "extern": 9, "additional_data_x": 9, "checkpoint": [9, 51], "update_dataset": 9, "three": [9, 18, 22, 26, 33, 46, 56, 58], "other_dataset_id": 9, "minari_root": 9, "additional_data_0": 9, "additional_data_1": 9, "leverag": 9, "hierarch": 9, "element": 9, "clearli": 9, "whole": 9, "individu": 9, "organ": 9, "insid": [9, 53], "plu": 9, "sub": [9, 10, 51], "both": [9, 53, 55], "up": [9, 12, 13, 14, 15, 16, 17, 51, 53, 55, 56, 58, 60], "look": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53], "episode_0": [9, 51], "infos_dataset": [9, 51], "infos_subgroup": [9, 51], "more_dataset": [9, 51], "additional_group": [9, 51], "additional_dataset": [9, 51], "episode_1": [9, 51], "episode_2": [9, 51], "rel": [9, 51], "complex": [9, 11, 18, 22, 33, 46, 51], "definit": [9, 51], "component_1": [9, 51], "box": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 55, 60], "low": [9, 51, 55, 56, 58], "high": [9, 18, 22, 33, 46, 51, 55, 56, 58], "dtype": [9, 51, 55, 56, 58], "float32": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 56, 60], "component_2": [9, 51], "subcomponent_1": [9, 51], "subcomponent_2": [9, 51], "similarli": [9, 51, 58], "consid": [9, 51, 56, 58], "_index_0": [9, 51], "_index_1": [9, 51], "_index_": 9, "index": 9, "involv": [9, 37, 56], "depend": [9, 51], "top": [9, 10, 27, 28, 29], "action_space_component_shap": 9, "entri": [9, 56], "discret": [9, 31, 32, 51, 53, 56, 60], "vari": [9, 53, 58, 60], "particular": [9, 53, 58], "compon": [9, 56], "observation_space_component_shap": 9, "becaus": [9, 11, 12, 13, 14, 15, 16, 17, 37, 58], "last": [9, 51], "finish": 9, "due": [9, 51, 56], "numpi": [9, 55, 56, 58, 60], "particip": 9, "adroit": 9, "hand": [9, 12, 14, 18, 22, 33, 46, 56, 58], "robot": [9, 11, 18, 22, 33, 46, 51, 55, 56, 58], "mujoco": [9, 56], "simul": 9, "sinc": [9, 53, 56, 60], "present": [9, 11, 60], "stepdatacallbak": 9, "qpo": [9, 56], "qvel": [9, 56], "bodi": 9, "adroitstepdatacallback": 9, "get_env_st": 9, "object_body_po": 9, "attach": 9, "int64": [9, 51], "env_spec": 9, "json": [9, 10, 51, 53], "metric": 9, "max": [9, 56, 58], "float64": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 55, 58], "min": [9, 58], "std": 9, "deviat": [9, 56], "sum": [9, 58], "possibl": [9, 51], "shift": [9, 58], "dimension": [9, 18, 22, 33, 46], "upper": 9, "lower": 9, "defin": [9, 53, 55, 60], "bound": [9, 56, 58], "text": [9, 51, 56], "charset": 9, "moment": 9, "don": [9, 51, 53, 55, 56], "guarante": 9, "surrog": 9, "pair": [9, 58], "aim": [9, 56, 58], "machin": [9, 11], "readabl": 9, "compli": [9, 51], "encapsul": 9, "even": 9, "arbitrari": [9, 51], "via": [9, 26, 58], "download": [9, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 56, 57, 58, 60], "sampled_episod": 9, "consist": [9, 37, 58], "field": [9, 51, 58], "As": [9, 51, 56, 60], "mention": [9, 51, 56, 60], "section": [9, 51, 58], "mani": 9, "so": [9, 56, 58], "being": [9, 26, 27, 28, 29, 37, 39, 41, 43, 45], "compliant": [9, 51], "thei": [9, 51, 58], "pattern": 9, "test_data_collector_step_data_callback_info_correct": 9, "test_step_data_callback": 9, "py": [9, 51, 53, 55, 56, 58, 60], "tool": [10, 22, 51], "build": [10, 51], "off": 10, "typer": 10, "line": [10, 55], "exist": [10, 51, 55, 56], "help": [10, 51, 56], "font": [10, 50], "color": [10, 50], "f4bf75": 10, "usag": [10, 51], "arg": [10, 51, 56, 58], "base": [10, 51, 56, 58], "gymnaisum": 10, "a5a5a1": 10, "a1efe4": [10, 50], "03ac13": [10, 50], "messag": 10, "exit": 10, "tabl": [10, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "devic": [10, 58], "incompat": 10, "pen": [10, 34, 35, 36, 51], "3736": [10, 34], "500000": [10, 34], "ff00ff": [10, 50], "rperezv": 10, "4958": [10, 35], "499206": [10, 35], "4356": [10, 50], "With": 10, "prompt": 10, "abort": 10, "warn": [10, 51, 58], "instanti": 10, "confirm": [10, 58], "proce": [10, 60], "sure": [10, 51], "y": [10, 37, 56, 58], "would": [10, 55, 56], "touch": [10, 55], "team": 10, "share": [10, 58], "encrypt": 10, "permiss": 10, "Then": [10, 53, 56, 58], "path_str": 10, "key_fil": 10, "progress": 10, "bar": 10, "shown": [10, 58], "below": [10, 56, 58], "implement": [10, 11, 56, 58], "merg": 10, "togeth": [10, 26, 28, 58], "new_dataset_nam": 10, "successfulli": [10, 55], "navig": [11, 30, 37], "domain": [11, 18, 22, 33, 37, 46], "replac": [11, 56], "2d": 11, "ball": [11, 37, 46, 56], "pointmaz": [11, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 54, 55, 57], "dof": [11, 18, 22, 33, 46, 58], "quadrup": 11, "introduc": [11, 18, 22, 33, 46, 58], "stitch": 11, "challeng": [11, 58], "morpholog": 11, "could": [11, 58], "mimic": 11, "real": 11, "world": 11, "addition": [11, 51], "spars": [11, 12, 13, 14, 15, 16, 17, 18, 22, 33, 37, 38, 40, 42, 44, 46], "activ": [11, 58], "upon": 11, "reach": [11, 12, 13, 14, 15, 16, 17, 26, 30, 33, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 56], "goal": [11, 12, 13, 14, 15, 16, 17, 26, 30, 31, 37, 38, 39, 40, 41, 42, 43, 44, 45, 53, 55, 56, 58], "previous": [11, 51, 56, 60], "train": [11, 12, 13, 14, 15, 16, 17, 18, 19, 22, 23, 33, 34, 46, 47, 55], "sac": [11, 12, 13, 14, 15, 16, 17], "stabl": 11, "baselin": 11, "agent": [11, 12, 13, 14, 15, 17, 30, 37, 38, 39, 40, 41, 42, 43, 44, 45, 55, 56, 58, 60], "waypoint": [11, 12, 13, 14, 15, 16, 17, 37, 38, 39, 40, 41, 42, 43, 44, 45], "planner": [11, 37], "qiter": [11, 12, 13, 14, 15, 16, 17, 37, 38, 39, 40, 41, 42, 43, 44, 45, 56], "control": [11, 37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 58, 60], "memor": [11, 37], "markovian": [11, 37], "fu": [11, 18, 22, 26, 30, 33, 37, 46, 56], "justin": [11, 18, 22, 26, 30, 33, 37, 46, 56], "et": [11, 18, 22, 26, 30, 33, 37, 46, 56, 58], "al": [11, 18, 22, 26, 30, 33, 37, 46, 56, 58], "deep": [11, 18, 22, 26, 30, 33, 37, 46, 56], "driven": [11, 18, 22, 26, 30, 33, 37, 46, 56], "corr": [11, 18, 22, 26, 30, 33, 37, 46, 56], "vol": [11, 18, 22, 26, 30, 33, 37, 46, 56], "ab": [11, 18, 22, 26, 30, 33, 37, 46, 56], "2004": [11, 18, 22, 26, 30, 33, 37, 46, 56], "07219": [11, 18, 22, 26, 30, 33, 37, 46, 56], "2020": [11, 18, 22, 26, 30, 33, 37, 46, 56], "arxiv": [11, 18, 22, 26, 30, 33, 37, 46, 56], "antonin": 11, "raffin": 11, "ashlei": 11, "hill": 11, "adam": [11, 58, 60], "gleav": 11, "anssi": 11, "kanervisto": 11, "maximilian": 11, "ernestu": 11, "noah": 11, "dormann": 11, "2021": [11, 58], "baselines3": [11, 60], "reliabl": 11, "journal": 11, "research": 11, "268": 11, "lambert": [11, 37, 56], "nathan": [11, 37, 56], "fundament": [11, 37, 56], "learnin": [11, 37, 56], "apr": [11, 37, 56], "towardsdatasci": [11, 37, 56], "df8ff078652a": [11, 37, 56], "antmaze_large_diverse_gr": [11, 12], "v4": [11, 12, 13, 14, 15, 16, 17], "antmaze_larg": [11, 13], "antmaze_medium_diverse_gr": [11, 14], "antmaze_medium": [11, 15], "umaz": [11, 37, 51, 56], "antmaze_umaz": [11, 16, 17], "u": [11, 16, 17, 37, 44, 45, 51, 58, 60], "At": [12, 13, 14, 15, 17], "begin": [12, 13, 14, 15, 17, 60], "select": [12, 13, 14, 15, 17, 18, 22, 33, 37, 46, 51, 56], "pick": [12, 14], "cell": [12, 14, 56], "success": [12, 13, 14, 15, 16, 17, 56, 60], "rate": [12, 13, 14, 15, 16, 17, 56], "trajectori": [12, 13, 14, 15, 16, 17, 18, 20, 22, 24, 33, 35, 37, 46, 48, 50, 51, 56], "80": [12, 13, 14, 15, 51], "fail": [12, 13, 14, 15, 16, 17, 51], "occur": [12, 13, 14, 15, 16, 17], "ant": [12, 13, 14, 15, 16, 17], "flip": [12, 13, 14, 15, 16, 17, 26], "stand": [12, 13, 14, 15, 16, 17], "again": [12, 13, 14, 15, 16, 17], "target": [12, 13, 14, 15, 16, 17, 26, 27, 28, 29, 37, 46, 56, 58], "lead": [12, 13, 14, 15, 16, 17, 56], "accumul": [12, 13, 14, 15, 16, 17, 56, 60], "permalink": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "rodrigodelazcano": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "minari": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 50, 51, 53, 55, 58, 60], "row": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "what": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 53, 56], "registri": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "registr": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "achieved_go": [12, 13, 14, 15, 16, 17, 27, 28, 29, 38, 39, 40, 41, 42, 43, 44, 45, 55, 56], "inf": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 55], "desired_go": [12, 13, 14, 15, 16, 17, 27, 28, 29, 38, 39, 40, 41, 42, 43, 44, 45, 55, 56], "27": [12, 13, 14, 15, 16, 17, 51], "entry_point": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51], "gymnasium_robot": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "maze": [12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 51, 55, 56], "ant_maze_v4": [12, 13, 14, 15, 16, 17], "antmazeenv": [12, 13, 14, 15, 16, 17], "max_episode_step": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 51, 56, 58], "reward_threshold": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "nondeterminist": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "order_enforc": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "autoreset": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "disable_env_check": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "maze_map": [12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 56], "c": [12, 14, 26, 51], "reward_typ": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "continuing_task": [12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45, 56], "reset_target": [12, 13, 14, 15, 16, 17, 38, 39, 40, 41, 42, 43, 44, 45], "additional_wrapp": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "vector_entry_point": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "g": [12, 13, 14, 15, 16, 17, 31, 32, 38, 39, 40, 41, 42, 43, 44, 45, 58], "fix": [16, 37, 51, 58], "90": [16, 17, 51], "1433": [16, 17], "hand_dapg": [18, 22, 33, 46], "open": [18, 26, 37, 51, 58], "24": [18, 22, 33, 34, 35, 36, 46, 58], "measur": [18, 22, 33, 46, 56], "effect": [18, 22, 33, 46], "narrow": [18, 22, 33, 46], "distribut": [18, 22, 33, 46, 58], "demonstr": [18, 19, 21, 22, 23, 25, 26, 27, 33, 34, 36, 46, 47, 49, 58], "manipul": [18, 22, 33, 46, 58], "paper": [18, 22, 33, 46], "rajeswaran": [18, 22, 33, 46], "aravind": [18, 22, 33, 46], "dexter": [18, 22, 33, 46], "1709": [18, 22, 33, 46], "10087": [18, 22, 33, 46], "2017": [18, 22, 33, 46], "obtain": [18, 19, 22, 23, 33, 34, 46, 47, 56], "imit": [18, 19, 22, 23, 26, 33, 34, 46, 47], "mix": [18, 19, 22, 23, 26, 33, 34, 46, 47, 51], "50": [18, 19, 22, 23, 33, 34, 46, 47, 56, 58], "ratio": [18, 19, 22, 23, 33, 34, 46, 47], "fine": [18, 20, 22, 24, 33, 35, 46, 48], "tune": [18, 20, 22, 24, 33, 35, 46, 48, 56, 58], "dapg": [18, 20, 21, 22, 24, 25, 33, 35, 36, 46, 48, 49], "4358": 19, "39": [19, 20, 21, 47, 48, 49], "28": [19, 20, 21, 51], "adroit_hand": [19, 20, 21, 23, 24, 25, 34, 35, 36, 47, 48, 49], "adroit_door": [19, 20, 21], "adroithanddoorenv": [19, 20, 21], "200": [19, 20, 21, 23, 24, 25, 47, 48, 49], "dens": [19, 20, 21, 23, 24, 25, 34, 35, 36, 37, 47, 48, 49, 51, 58], "assert": [19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 47, 48, 49, 53, 60], "adroithandhamm": [22, 23, 24, 25, 51], "nail": 22, "board": 22, "3606": 23, "hammer": [23, 24, 25, 51], "46": [23, 24, 25], "26": [23, 24, 25, 51], "adroit_hamm": [23, 24, 25], "adroithandhammerenv": [23, 24, 25], "11310": 25, "frankakitchen": [26, 27, 28, 29, 51], "relai": 26, "interact": 26, "variou": [26, 28, 53], "desir": [26, 56], "configur": [26, 58], "kettl": [26, 27, 28, 29], "light": [26, 27, 28, 29], "switch": [26, 27, 28, 29], "microwav": [26, 27, 28, 29], "cabinet": [26, 27, 28, 29], "slide": [26, 27, 28, 29], "complet": [26, 28, 29, 51, 58], "subtask": [26, 27, 28, 29], "gupta": 26, "kumar": 26, "lynch": 26, "levin": 26, "hausman": 26, "k": 26, "2019": 26, "solv": [26, 56], "horizon": 26, "preprint": 26, "1910": 26, "11956": 26, "never": [26, 28, 56, 58], "sequenc": [26, 28, 29, 37], "partial": [26, 51], "subtrajectori": [26, 29], "4209": 27, "kitchen": [27, 28, 29, 51], "bottom": [27, 28, 29], "burner": [27, 28, 29], "hing": [27, 28, 29], "59": [27, 28, 29], "franka_kitchen": [27, 28, 29], "kitchenenv": [27, 28, 29], "280": 27, "remove_task_when_complet": [27, 28, 29], "terminate_on_tasks_complet": [27, 28, 29], "tasks_to_complet": [27, 28, 29], "156560": [28, 29], "621": [28, 29], "450": [28, 29], "fourroom": 30, "gridworld": 30, "regener": 30, "straight": [30, 31], "goe": [30, 31], "10010": 31, "590": 31, "expertpolici": [31, 60], "omar": [31, 32], "youni": [31, 32], "younis98": [31, 32], "gmail": [31, 32], "minigrid": [31, 32, 51, 53], "direct": [31, 32, 53, 58], "imag": [31, 32, 53, 58], "255": [31, 32, 53], "uint8": [31, 32, 53, 58], "mission": [31, 32, 53], "missionspac": [31, 32, 53], "fourroomsenv": [31, 32], "_gen_miss": [31, 32, 53], "0x7f8c7a4e7f70": [31, 32], "1000033": 32, "10181": 32, "randompolici": 32, "adroithandpen": [33, 34, 35, 36, 51, 58], "repfixositori": [33, 35], "45": [34, 35, 36, 58], "adroit_pen": [34, 35, 36], "adroithandpenenv": [34, 35, 36], "actuat": 37, "along": [37, 50], "axi": [37, 56, 58], "thu": [37, 56], "split": [37, 51], "smaller": [37, 51, 56], "pd": [37, 38, 39, 40, 41, 42, 43, 44, 45, 56], "maze2d": [37, 56], "pointmaze_largedens": [37, 39], "v3": [37, 38, 39, 40, 41, 42, 43, 44, 45, 51, 55, 56], "pointmaze_larg": [37, 38], "pointmaze_mediumdens": [37, 41], "pointmaze_medium": [37, 40, 56], "pointmaze_opendens": [37, 43], "arena": [37, 42, 43], "perimet": [37, 42, 43], "wall": [37, 42, 43, 56], "pointmaze_open": [37, 42], "pointmaze_umazedens": [37, 45], "pointmaze_umaz": [37, 44, 55], "without": [38, 39, 40, 41, 42, 43, 44, 45, 51], "varianc": [38, 39, 40, 41, 42, 43, 44, 45, 56], "nois": [38, 39, 40, 41, 42, 43, 44, 45, 51, 56], "3325": 38, "perez": [38, 39, 40, 41, 42, 43, 44, 45, 56], "vicent": [38, 39, 40, 41, 42, 43, 44, 45, 56], "point_maz": [38, 39, 40, 41, 42, 43, 44, 45], "pointmazeenv": [38, 39, 40, 41, 42, 43, 44, 45], "800": [38, 39], "neg": [39, 41, 43, 45], "euclidean": [39, 41, 43, 45], "distanc": [39, 41, 43, 45], "3322": 39, "4778": 40, "600": [40, 41], "4765": 41, "9609": 42, "300": [42, 43, 44, 45], "9637": 43, "13289": [44, 45], "adroithandreloc": [46, 47, 48, 49, 51], "3758": 47, "reloc": [47, 48, 49, 51], "30": [47, 48, 49, 58], "adroit_reloc": [47, 48, 49], "adroithandrelocateenv": [47, 48, 49], "9942": 49, "popular": 50, "publicli": 50, "cli": [50, 51], "beta": [50, 51, 58], "develop": [50, 51], "minor": [50, 51], "major": [50, 51], "expect": [50, 55], "futur": [50, 51, 56], "\u898b\u7fd2\u3044": 50, "2024": 51, "01": 51, "pypi": 51, "small": [51, 58], "bug": 51, "lost": 51, "im": 51, "kitsch": 51, "144": 51, "refactor": [51, 56], "datacollectorv0": 51, "isol": 51, "younik": 51, "133": 51, "serial": [51, 54, 57], "tutori": [51, 53, 55, 56, 58, 60], "enerrio": 51, "151": 51, "basic": [51, 58], "ci": 51, "pytest": 51, "markdown": 51, "elliottow": 51, "153": 51, "155": 51, "recover_env": 51, "161": 51, "combin": [51, 56], "162": 51, "act": 51, "163": 51, "dir": 51, "alexdavei": 51, "160": 51, "mandatori": 51, "164": 51, "165": 51, "pre": 51, "commit": 51, "thing": [51, 53], "pettingzoo": 51, "doe": 51, "157": 51, "avjmachin": 51, "137": 51, "dataset_s": 51, "shreyansjainn": 51, "158": 51, "improv": [51, 58], "readm": 51, "167": 51, "deprec": 51, "create_dataset_from_collector_env": 51, "169": 51, "170": 51, "gt": 51, "171": 51, "172": 51, "balisujohn": 51, "132": 51, "contributor": 51, "changelog": 51, "2023": [51, 58], "09": 51, "rugged": 51, "grahamannett": 51, "126": 51, "128": [51, 58, 60], "130": 51, "speed": [51, 56], "124": 51, "coverag": 51, "129": 51, "issu": [51, 58], "templat": 51, "139": 51, "loos": 51, "typing_extens": 51, "148": 51, "07": 51, "bugfix": 51, "121": 51, "pr": 51, "awai": 51, "flatten": 51, "explicitli": 51, "fulli": 51, "explicit": [51, 58], "subset": [51, 54, 57], "behavior": [51, 56, 57, 58, 61], "rl_zoo3": [51, 60], "pytorch": [51, 57, 58, 61], "unflatten": 51, "exerpt": 51, "last_episode_id": 51, "total_timestep": 51, "timestep": 51, "77": 51, "minari_dataset": [51, 60], "directli": [51, 56, 58, 60], "clear_episode_buff": 51, "minari_storag": 51, "101": 51, "eol": 51, "107": 51, "11": 51, "73": 51, "reorgan": 51, "thorough": 51, "75": 51, "copi": [51, 58], "howuhh": 51, "82": 51, "86": 51, "dataclass": 51, "88": 51, "99": [51, 56, 58], "110": 51, "incorrect": 51, "83": 51, "96": 51, "ignor": [51, 58], "hidden": 51, "104": 51, "111": 51, "oibserv": 51, "tohsin": 51, "84": 51, "instruct": 51, "105": 51, "bamboofungu": 51, "108": 51, "109": 51, "background": 51, "pid": [51, 56], "95": 51, "116": 51, "pytorchdataload": 51, "102": 51, "misc": 51, "citat": 51, "cff": 51, "typo": 51, "annot": 51, "slightli": 51, "redtachyon": 51, "52": 51, "froze": 51, "pyright": 51, "305": 51, "correct": [51, 56, 58], "87": 51, "right": [51, 56, 58], "92": 51, "93": 51, "style": [51, 58], "black": 51, "badg": 51, "112": 51, "subsequ": 51, "represent": 51, "It": [51, 56, 58], "next": [51, 56, 58, 60], "05": 51, "attr": 51, "60": 51, "workflow": 51, "yml": 51, "miss": 51, "_script": 51, "gen_dataset_md": 51, "sphinx_github_changelog_token": 51, "71": 51, "readi": 51, "experienc": 51, "consider": 51, "past": 51, "cython": 51, "favor": 51, "pure": 51, "reduc": [51, 56], "effici": 51, "explor": 51, "apart": 51, "excit": 51, "offici": 51, "re": [51, 56], "page": 51, "constantli": 51, "hesit": 51, "idea": 51, "highli": 51, "appreci": 51, "thank": 51, "basi": 51, "page_facing_up": 51, "file_fold": 51, "floppy_disk": 51, "subgroup": [51, 56], "next_episode_id": 51, "deleg": 51, "34": 51, "54": 51, "charg": 51, "55": 51, "convers": [51, 53], "safe": 51, "recoveri": 51, "31": 51, "log": [51, 58, 60], "suggest": 51, "57": 51, "collector_env": [51, 56], "gynasium": 51, "n_step": [51, 56], "curat": 51, "dataset_cr": [51, 53, 56], "point_maze_dataset": [51, 56], "sphx": 51, "glr": 51, "larger": [51, 56, 58], "except": [51, 53, 58], "largest": 51, "among": 51, "dataset_v1": 51, "dataset_v2": 51, "dataset_v3": 51, "upload": 51, "bellow": 51, "04": 51, "renam": 51, "willdudlei": 51, "convent": 51, "nonetyp": 51, "codelink": 51, "stack": 51, "14": 51, "import_bugfix": 51, "mgoulao": 51, "2022": 51, "init": 51, "residu": 51, "pz": 51, "precommit": 51, "wd": 51, "kabuki": 51, "ll": [53, 55], "empti": [53, 56], "uniqu": 53, "appli": 53, "let": [53, 55, 56, 60], "modul": [53, 55, 56, 58, 60], "core": 53, "deserialize_spac": 53, "serialize_spac": 53, "16x16": 53, "see": [53, 58], "output": [53, 55, 56, 58, 60], "abov": [53, 55, 58], "emptyenv": 53, "0x12253a940": 53, "try": [53, 58], "encount": 53, "notimplementederror": 53, "No": 53, "But": [53, 58], "missonspac": 53, "simpli": [53, 56], "around": [53, 58], "green": [53, 58], "squar": 53, "worri": 53, "properli": [53, 58], "deseri": 53, "care": 53, "enabl": 53, "regist": 53, "back": [53, 56], "serialize_custom_spac": 53, "to_str": 53, "mission_func": 53, "deserialize_custom_spac": 53, "space_dict": 53, "noqa": 53, "e731": 53, "num_episod": [53, 55], "42": [53, 55, 58, 60], "choos": [53, 55], "random_polici": [53, 55], "blob": [53, 56], "custom_space_seri": 53, "del": [53, 55], "earlier": 53, "0x11f2608b0": 53, "clean": 53, "delet": [53, 55], "jupyt": [53, 55, 56, 57, 58, 60], "notebook": [53, 55, 56, 57, 58, 60], "ipynb": [53, 55, 56, 58, 60], "omit": 55, "plan": 55, "minim": 55, "outlin": 55, "procedur": 55, "data_collector": 55, "find": 55, "fit": [55, 58], "mirana": 55, "observation_space_subset": 55, "customsubsetstepdatacallback": 55, "local_dataset": 55, "action_space_subset": 55, "dict_kei": 55, "bind": 56, "down": 56, "q": [56, 57, 61], "grid": 56, "factor": 56, "account": 56, "advantag": [56, 58], "solver": 56, "solut": 56, "variat": 56, "dynam": 56, "program": 56, "chosen": 56, "optim": [56, 60], "do": [56, 58], "seri": 56, "bellman": 56, "leftarrow": [56, 58], "sum_": 56, "gamma": [56, 58], "max_": [56, 58], "matrix": 56, "probabl": 56, "know": 56, "alwai": 56, "On": [56, 58], "pi": [56, 58], "generate_path": 56, "current_cel": 56, "goal_cel": 56, "wapoint": 56, "exploration_act": 56, "inspir": 56, "master": 56, "q_iter": 56, "__init__": [56, 60], "num_stat": 56, "map_length": 56, "map_width": 56, "num_act": 56, "len": [56, 58], "rew_matrix": 56, "zero": 56, "compute_transition_matrix": 56, "compute_reward_matrix": 56, "q_valu": 56, "get_q_valu": 56, "current_st": 56, "cell_to_st": 56, "action_id": 56, "argmax": [56, 60], "next_stat": 56, "get_next_st": 56, "state_to_cel": 56, "reward_funct": 56, "desired_cel": 56, "j": 56, "num_itr": 56, "discount": 56, "q_fn": 56, "v_fn": 56, "transition_matrix": 56, "dot": [56, 58], "next_cel": 56, "construct": 56, "da": 56, "action_idx": 56, "_check_valid_cel": 56, "elif": 56, "collis": 56, "often": 56, "classic": [56, 60], "theori": 56, "proporti": 56, "adjust": 56, "setpoint": 56, "higher": 56, "stronger": 56, "alon": 56, "overshoot": 56, "instabl": 56, "tau": [56, 58], "k_": 56, "predict": [56, 60], "By": [56, 58], "dampen": 56, "system": 56, "stabil": 56, "respond": 56, "quickli": 56, "dt": 56, "equat": 56, "explain": 56, "bit": [56, 58], "cumul": [56, 58], "address": 56, "steadi": 56, "bias": 56, "elimin": 56, "actual": 56, "_0": 56, "int_": 56, "k_p": 56, "k_i": 56, "k_d": 56, "gain": 56, "determin": 56, "influenc": [56, 58], "typic": 56, "theme": 56, "seen": 56, "equlival": 56, "v_": [56, 58], "think": 56, "approach": 56, "toward": 56, "slowli": [56, 58], "less": 56, "aggress": 56, "p_": 56, "coordin": 56, "waypointcontrol": 56, "waypoint_control": 56, "waypoint_threshold": 56, "global_target_xi": 56, "maze_solv": 56, "waypoint_target": 56, "compute_act": 56, "linalg": 56, "norm": 56, "1e": 56, "xy": 56, "achieved_goal_cel": 56, "cell_xy_to_rowcol": 56, "global_target_id": 56, "current_control_target_id": 56, "current_control_target_xi": 56, "cell_rowcol_to_xi": 56, "dist": 56, "uniform": 56, "clip": 56, "reason": 56, "ourselv": 56, "pointmazestepdatacallback": 56, "succ": 56, "ve": 56, "000": [56, 58], "dure": [56, 58], "limit": [56, 58], "10_000": [56, 58], "evad": 56, "overridng": 56, "randn": 56, "implicit": [57, 61], "torchrl": [57, 61], "tutorials_python": 57, "zip": 57, "tutorials_jupyt": 57, "conjunct": 58, "cover": 58, "iql": 58, "here": [58, 60], "part": 58, "script": [58, 60], "nightli": 58, "matplotlib": 58, "conflict": 58, "rememb": 58, "upgrad": 58, "torch": [58, 60], "everyth": 58, "pyplot": 58, "plt": 58, "manual_se": [58, 60], "simplefilt": 58, "colab": 58, "virtual": 58, "displai": [58, 60], "prerequisit": 58, "sudo": 58, "apt": 58, "python3": 58, "opengl": 58, "ffmpeg": 58, "xvfb": 58, "pyvirtualdisplai": 58, "restart": 58, "kernel": 58, "virtual_displai": 58, "visibl": 58, "1400": 58, "900": 58, "lib": 58, "gymenv": 58, "doubletofloat": 58, "transformedenv": 58, "design": 58, "framework": 58, "env_id": 58, "example_env": 58, "from_pixel": 58, "pixels_onli": 58, "usual": 58, "tensordict": 58, "essenti": 58, "tensor": [58, 60], "whose": 58, "batch": [58, 60], "dimens": [58, 60], "cpu": 58, "is_shar": 58, "pixel": 58, "480": 58, "batch_siz": [58, 60], "rollout": 58, "max_step": 58, "auto_cast_to_devic": 58, "2f": 58, "884": 58, "initialis": 58, "popul": 58, "frame": 58, "imshow": 58, "blue": 58, "quantifi": 58, "randomis": 58, "transform": 58, "doubl": 58, "cuda": 58, "is_avail": 58, "base_env": 58, "minariexperiencereplai": 58, "minari_data": 58, "replay_buff": 58, "samplerwithoutreplac": 58, "256": [58, 60], "split_traj": 58, "sampler": 58, "quick": 58, "overview": 58, "tri": 58, "tackl": 58, "those": 58, "who": 58, "familiar": 58, "interest": 58, "practic": 58, "approxim": 58, "outsid": 58, "extrapol": 58, "poorli": 58, "precis": 58, "mathcal": 58, "s_t": 58, "a_t": 58, "r_t": 58, "s_": 58, "minimis": 58, "tempor": 58, "l_": 58, "rm": 58, "td": 58, "theta": 58, "mathbb": 58, "sim": 58, "q_": 58, "hat": 58, "expectil": 58, "m_": 58, "approx": 58, "kostrikov": 58, "network": [58, 60], "lag": 58, "equiv": 58, "max_a": 58, "overestim": 58, "overconfid": 58, "therefor": 58, "attempt": 58, "queri": 58, "psi": 58, "l_v": 58, "l_2": 58, "choic": 58, "figur": 58, "l_q": 58, "maximis": 58, "implicitli": 58, "extract": 58, "weight": 58, "behaviour": 58, "phi": 58, "pi_": 58, "hyperparamet": 58, "behav": 58, "summari": 58, "best": 58, "ell": 58, "gradient": 58, "descent": 58, "rather": 58, "benchmark": 58, "accur": 58, "corl": 58, "nn": [58, 60], "tensordictmodul": 58, "normalparamextractor": 58, "explorationtyp": 58, "set_exploration_typ": 58, "mlp": 58, "probabilisticactor": 58, "tanhnorm": 58, "valueoper": 58, "iqlloss": 58, "softupd": 58, "trainer": 58, "helper": 58, "conveni": 58, "layer": 58, "multi": 58, "perceptron": 58, "plug": 58, "rest": 58, "concaten": 58, "written": 58, "state_valu": 58, "hidden_s": 58, "activation_fn": 58, "relu": [58, 60], "value_net": 58, "num_cel": 58, "out_featur": 58, "activation_class": 58, "write": 58, "in_kei": 58, "out_kei": 58, "q_net": 58, "qvalu": 58, "state_action_valu": 58, "actor": 58, "tanh": 58, "parameteris": 58, "scale": 58, "strictli": 58, "action_spec": 58, "ensur": 58, "actor_mlp": 58, "actor_extractor": 58, "scale_lb": 58, "actor_net": 58, "sequenti": 58, "actor_modul": 58, "loc": 58, "distribution_class": 58, "distribution_kwarg": 58, "tanh_loc": 58, "default_interaction_typ": 58, "mode": 58, "gather": 58, "modulelist": 58, "hood": 58, "lazylinear": 58, "infer": 58, "forward": [58, 60], "lazi": 58, "no_grad": 58, "net": 58, "captur": 58, "loss_modul": 58, "value_network": 58, "loss_funct": 58, "l2": 58, "temperatur": 58, "make_value_estim": 58, "soft": 58, "polyak": 58, "target_net_updat": 58, "005": 58, "lr": 58, "0003": 58, "unlik": 58, "onlin": 58, "evaluate_polici": 58, "num_eval_episod": 58, "episode_reward": 58, "eval_td": 58, "backpropag": 58, "tqdm": [58, 60], "auto": [58, 60], "50_000": 58, "eval_interv": 58, "1_000": [58, 60], "loss_log": 58, "eval_reward_log": 58, "pbar": 58, "l": 58, "l_pi": 58, "loss_dict": 58, "loss_valu": 58, "loss_qvalu": 58, "loss_actor": 58, "zero_grad": [58, 60], "backward": [58, 60], "set_descript": 58, "1f": 58, "avg": 58, "plot": 58, "fig": 58, "ax": 58, "subplot": 58, "nrow": 58, "ncol": 58, "figsiz": 58, "set_titl": 58, "set_xlabel": 58, "arang": 58, "tight_layout": 58, "ipython": 58, "html": 58, "save_video": 58, "base64": 58, "b64encod": 58, "final_scor": 58, "1872": 58, "69": 58, "visualis": 58, "roll": 58, "render": 58, "video": 58, "viewer_env": 58, "video_fold": 58, "results_video": 58, "fp": 58, "embed": 58, "necessari": 58, "etc": 58, "mp4": 58, "rb": 58, "data_url": 58, "decod": 58, "margin": 58, "block": 58, "src": 58, "quit": 58, "overal": 58, "decent": 58, "invers": 58, "iql_torchrl": 58, "problem": 60, "balanc": 60, "pole": 60, "cart": 60, "receiv": 60, "zoo": 60, "o": 60, "sy": 60, "stable_baselines3": 60, "ppo": 60, "argv": 60, "algo": 60, "abspath": 60, "v1_1": 60, "best_model": 60, "behavioral_clon": 60, "execut": 60, "policynetwork": 60, "input_dim": 60, "output_dim": 60, "fc1": 60, "linear": 60, "fc2": 60, "fc3": 60, "scenario": 60, "four": 60, "length": 60, "pad": 60, "collate_fn": 60, "rnn": 60, "pad_sequ": 60, "as_tensor": 60, "batch_first": 60, "neural": 60, "loss": 60, "shuffl": 60, "isinst": 60, "policy_net": 60, "prod": 60, "loss_fn": 60, "crossentropyloss": 60, "cross": 60, "entropi": 60, "classif": 60, "num_epoch": 60, "32": 60, "epoch": 60, "a_pr": 60, "a_hat": 60, "one_hot": 60, "And": 60, "render_mod": 60, "accumulated_rew": 60, "ter": 60, "tru": 60, "visual": 60, "500": 60}, "objects": {"minari": [[2, 0, 1, "", "DataCollector"], [5, 0, 1, "", "EpisodeData"], [3, 0, 1, "", "EpisodeMetadataCallback"], [6, 0, 1, "", "MinariDataset"], [4, 0, 1, "", "StepDataCallback"], [7, 1, 1, "", "combine_datasets"], [7, 1, 1, "", "create_dataset_from_buffers"], [7, 1, 1, "", "delete_dataset"], [7, 1, 1, "", "download_dataset"], [7, 1, 1, "", "get_normalized_score"], [7, 1, 1, "", "list_local_datasets"], [7, 1, 1, "", "list_remote_datasets"], [7, 1, 1, "", "load_dataset"], [7, 1, 1, "", "split_dataset"]], "minari.DataCollector": [[2, 1, 1, "", "close"], [2, 1, 1, "", "create_dataset"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "step"]], "minari.EpisodeData": [[5, 2, 1, "", "actions"], [5, 2, 1, "", "id"], [5, 2, 1, "", "observations"], [5, 2, 1, "", "seed"], [5, 2, 1, "", "terminations"], [5, 2, 1, "", "total_steps"], [5, 2, 1, "", "truncations"]], "minari.EpisodeMetadataCallback": [[3, 1, 1, "", "__call__"]], "minari.MinariDataset": [[6, 2, 1, "", "episode_indices"], [6, 1, 1, "", "filter_episodes"], [6, 1, 1, "", "iterate_episodes"], [6, 1, 1, "", "recover_environment"], [6, 1, 1, "", "sample_episodes"], [6, 1, 1, "", "set_seed"], [6, 2, 1, "", "spec"], [6, 2, 1, "", "total_episodes"], [6, 2, 1, "", "total_steps"], [6, 1, 1, "", "update_dataset_from_buffer"]], "minari.StepDataCallback": [[4, 1, 1, "", "__call__"]]}, "objtypes": {"0": "py:class", "1": "py:function", "2": "py:attribute"}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "function", "Python function"], "2": ["py", "attribute", "Python attribute"]}, "titleterms": {"404": 0, "page": 0, "Not": 0, "found": 0, "The": [0, 58], "request": 0, "could": 0, "minari": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 56], "document": 1, "build": [1, 58], "datacollector": 2, "method": [2, 3, 4, 6], "episodemetadatacallback": 3, "stepdatacallback": [4, 55, 56], "episodedata": [5, 9], "attribut": [5, 6], "minaridataset": 6, "creat": [7, 8, 56], "dataset": [7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 52, 54, 56, 57, 59, 60, 61], "load": 7, "split": [7, 8], "download": [7, 8, 10], "list": [7, 10], "delet": [7, 10], "combin": [7, 8, 10], "normal": 7, "score": 7, "basic": 8, "usag": 8, "instal": 8, "collect": [8, 55, 56], "data": [8, 9, 56], "save": 8, "checkpoint": 8, "us": [8, 57, 59, 61], "remot": 8, "sampl": 8, "episod": 8, "filter": 8, "recov": 8, "environ": [8, 12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49, 58], "standard": 9, "storag": 9, "root": 9, "file": 9, "format": 9, "hdf5": 9, "structur": 9, "default": 9, "metadata": 9, "observ": 9, "action": 9, "space": [9, 53, 55], "support": 9, "serial": [9, 53], "addit": 9, "inform": 9, "cli": 10, "local": 10, "upload": 10, "ant": 11, "maze": [11, 37], "refer": [11, 18, 22, 26, 30, 33, 37, 46, 56], "avail": [11, 18, 22, 26, 30, 33, 37, 46], "larg": [12, 13, 38, 39], "divers": [12, 14, 17], "descript": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "spec": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "evalu": [12, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 31, 32, 34, 35, 36, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48, 49], "plai": [13, 15], "medium": [14, 15, 40, 41], "umaz": [16, 17, 44, 45], "door": 18, "clone": [19, 23, 34, 47, 60], "expert": [20, 24, 35, 48], "human": [21, 25, 36, 49], "hammer": 22, "kitchen": 26, "complet": 27, "mix": 28, "partial": 29, "minigrid": 30, "fourroom": [31, 32], "random": 32, "pen": [33, 58], "point": 37, "dens": [39, 41, 43, 45], "open": [42, 43], "reloc": 46, "releas": 51, "note": 51, "v0": 51, "4": 51, "3": [51, 56], "2": [51, 56], "1": [51, 56], "0": 51, "creation": [52, 54, 57], "custom": 53, "subset": 55, "dictionari": 55, "pointmaz": 56, "d4rl": 56, "waypoint": 56, "planner": 56, "control": 56, "proport": 56, "term": 56, "p": 56, "deriv": 56, "d": 56, "integr": 56, "i": 56, "modifi": 56, "tutori": 57, "implicit": 58, "q": 58, "learn": 58, "torchrl": 58, "pre": 58, "requisit": 58, "For": 58, "headless": 58, "adroit": 58, "replai": 58, "buffer": 58, "defin": 58, "model": 58, "loss": 58, "optim": 58, "train": [58, 60], "result": 58, "behavior": 60, "pytorch": 60, "import": 60, "polici": 60, "gener": 60}, "envversion": {"sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1, "sphinx": 60}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Minari documentation": [[1, "minari-documentation"]], "Build the Documentation": [[1, "build-the-documentation"]], "DataCollector": [[2, "datacollector"]], "minari.DataCollector": [[2, "minari-datacollector"]], "Methods": [[2, "methods"], [3, "methods"], [4, "methods"], [6, "methods"]], "EpisodeMetadataCallback": [[3, "episodemetadatacallback"]], "minari.EpisodeMetadataCallback": [[3, "minari-episodemetadatacallback"]], "StepDataCallback": [[4, "stepdatacallback"]], "minari.StepDataCallback": [[4, "minari-stepdatacallback"]], "EpisodeData": [[5, "episodedata"]], "minari.EpisodeData": [[5, "minari-episodedata"]], "Attributes": [[5, "attributes"], [6, "attributes"]], "MinariDataset": [[6, "minaridataset"]], "minari.MinariDataset": [[6, "minari-minaridataset"]], "Minari": [[7, "minari"]], "Create Minari Dataset": [[7, "create-minari-dataset"], [8, "create-minari-dataset"]], "Load Minari Dataset": [[7, "load-minari-dataset"]], "Split Minari Dataset": [[7, "split-minari-dataset"]], "Download Minari Dataset": [[7, "download-minari-dataset"]], "List Minari Datasets": [[7, "list-minari-datasets"]], "Delete Minari Datasets": [[7, "delete-minari-datasets"]], "Combine Minari Datasets": [[7, "combine-minari-datasets"], [8, "combine-minari-datasets"]], "Normalize Score": [[7, "normalize-score"]], "Basic Usage": [[8, "basic-usage"]], "Installation": [[8, "installation"]], "Collecting Data": [[8, "collecting-data"]], "Save Dataset": [[8, "save-dataset"]], "Checkpoint Minari Dataset": [[8, "checkpoint-minari-dataset"]], "Using Minari Datasets": [[8, "using-minari-datasets"]], "Download Remote Datasets": [[8, "download-remote-datasets"]], "Sampling Episodes": [[8, "sampling-episodes"]], "Filter Episodes": [[8, "filter-episodes"]], "Split Dataset": [[8, "split-dataset"]], "Recover Environment": [[8, "recover-environment"]], "Dataset Standards": [[9, "dataset-standards"]], "Minari Storage": [[9, "minari-storage"]], "Minari root": [[9, "minari-root"]], "Data files": [[9, "data-files"]], "Dataset File Format": [[9, "dataset-file-format"]], "HDF5 file structure": [[9, "hdf5-file-structure"]], "Default dataset metadata": [[9, "default-dataset-metadata"]], "Observation and Action Spaces": [[9, "observation-and-action-spaces"]], "Supported Spaces": [[9, "supported-spaces"]], "Space Serialization": [[9, "space-serialization"]], "Minari Data Structures": [[9, "minari-data-structures"]], "EpisodeData Structure": [[9, "episodedata-structure"]], "Additional Information Formatting": [[9, "additional-information-formatting"]], "Minari CLI": [[10, "minari-cli"]], "List datasets": [[10, "list-datasets"]], "Download datasets": [[10, "download-datasets"]], "Delete local datasets": [[10, "delete-local-datasets"]], "Upload datasets": [[10, "upload-datasets"]], "Combine datasets": [[10, "combine-datasets"]], "Ant Maze": [[11, "ant-maze"]], "References": [[11, "references"], [18, "references"], [22, "references"], [26, "references"], [30, "references"], [33, "references"], [37, "references"], [46, "references"], [56, "references"]], "Available Datasets": [[11, "available-datasets"], [18, "available-datasets"], [22, "available-datasets"], [26, "available-datasets"], [30, "available-datasets"], [33, "available-datasets"], [37, "available-datasets"], [46, "available-datasets"]], "Large-Diverse": [[12, "large-diverse"]], "Description": [[12, "description"], [13, "description"], [14, "description"], [15, "description"], [16, "description"], [17, "description"], [19, "description"], [20, "description"], [21, "description"], [23, "description"], [24, "description"], [25, "description"], [27, "description"], [28, "description"], [29, "description"], [31, "description"], [32, "description"], [34, "description"], [35, "description"], [36, "description"], [38, "description"], [39, "description"], [40, "description"], [41, "description"], [42, "description"], [43, "description"], [44, "description"], [45, "description"], [47, "description"], [48, "description"], [49, "description"]], "Dataset Specs": [[12, "dataset-specs"], [13, "dataset-specs"], [14, "dataset-specs"], [15, "dataset-specs"], [16, "dataset-specs"], [17, "dataset-specs"], [19, "dataset-specs"], [20, "dataset-specs"], [21, "dataset-specs"], [23, "dataset-specs"], [24, "dataset-specs"], [25, "dataset-specs"], [27, "dataset-specs"], [28, "dataset-specs"], [29, "dataset-specs"], [31, "dataset-specs"], [32, "dataset-specs"], [34, "dataset-specs"], [35, "dataset-specs"], [36, "dataset-specs"], [38, "dataset-specs"], [39, "dataset-specs"], [40, "dataset-specs"], [41, "dataset-specs"], [42, "dataset-specs"], [43, "dataset-specs"], [44, "dataset-specs"], [45, "dataset-specs"], [47, "dataset-specs"], [48, "dataset-specs"], [49, "dataset-specs"]], "Environment Specs": [[12, "environment-specs"], [13, "environment-specs"], [14, "environment-specs"], [15, "environment-specs"], [16, "environment-specs"], [17, "environment-specs"], [19, "environment-specs"], [20, "environment-specs"], [21, "environment-specs"], [23, "environment-specs"], [24, "environment-specs"], [25, "environment-specs"], [27, "environment-specs"], [28, "environment-specs"], [29, "environment-specs"], [31, "environment-specs"], [32, "environment-specs"], [34, "environment-specs"], [35, "environment-specs"], [36, "environment-specs"], [38, "environment-specs"], [39, "environment-specs"], [40, "environment-specs"], [41, "environment-specs"], [42, "environment-specs"], [43, "environment-specs"], [44, "environment-specs"], [45, "environment-specs"], [47, "environment-specs"], [48, "environment-specs"], [49, "environment-specs"]], "Evaluation Environment Specs": [[12, "evaluation-environment-specs"], [13, "evaluation-environment-specs"], [14, "evaluation-environment-specs"], [15, "evaluation-environment-specs"], [16, "evaluation-environment-specs"], [17, "evaluation-environment-specs"], [19, "evaluation-environment-specs"], [20, "evaluation-environment-specs"], [21, "evaluation-environment-specs"], [23, "evaluation-environment-specs"], [24, "evaluation-environment-specs"], [25, "evaluation-environment-specs"], [27, "evaluation-environment-specs"], [28, "evaluation-environment-specs"], [29, "evaluation-environment-specs"], [31, "evaluation-environment-specs"], [32, "evaluation-environment-specs"], [34, "evaluation-environment-specs"], [35, "evaluation-environment-specs"], [36, "evaluation-environment-specs"], [38, "evaluation-environment-specs"], [39, "evaluation-environment-specs"], [40, "evaluation-environment-specs"], [41, "evaluation-environment-specs"], [42, "evaluation-environment-specs"], [43, "evaluation-environment-specs"], [44, "evaluation-environment-specs"], [45, "evaluation-environment-specs"], [47, "evaluation-environment-specs"], [48, "evaluation-environment-specs"], [49, "evaluation-environment-specs"]], "Large-Play": [[13, "large-play"]], "Medium-Diverse": [[14, "medium-diverse"]], "Medium-Play": [[15, "medium-play"]], "Umaze": [[16, "umaze"], [44, "umaze"]], "Umaze-Diverse": [[17, "umaze-diverse"]], "Door": [[18, "door"]], "Cloned": [[19, "cloned"], [23, "cloned"], [34, "cloned"], [47, "cloned"]], "Expert": [[20, "expert"], [24, "expert"], [35, "expert"], [48, "expert"]], "Human": [[21, "human"], [25, "human"], [36, "human"], [49, "human"]], "Hammer": [[22, "hammer"]], "Kitchen": [[26, "kitchen"]], "Complete": [[27, "complete"]], "Mixed": [[28, "mixed"]], "Partial": [[29, "partial"]], "MiniGrid": [[30, "minigrid"]], "Fourrooms": [[31, "fourrooms"]], "Fourrooms-Random": [[32, "fourrooms-random"]], "Pen": [[33, "pen"]], "Point Maze": [[37, "point-maze"]], "Large": [[38, "large"]], "Large-Dense": [[39, "large-dense"]], "Medium": [[40, "medium"]], "Medium-Dense": [[41, "medium-dense"]], "Open": [[42, "open"]], "Open-Dense": [[43, "open-dense"]], "Umaze-Dense": [[45, "umaze-dense"]], "Relocate": [[46, "relocate"]], "Release Notes": [[51, "release-notes"]], "v0.4.3": [[51, "release-v0-4-3"]], "v0.4.2": [[51, "release-v0-4-2"]], "v0.4.1": [[51, "release-v0-4-1"]], "v0.4.0": [[51, "release-v0-4-0"]], "v0.3.1": [[51, "release-v0-3-1"]], "v0.3.0": [[51, "release-v0-3-0"]], "0.2.2": [[51, "release-0-2-2"]], "0.1.0": [[51, "release-0-1-0"]], "Dataset Creation": [[52, "dataset-creation"], [54, "dataset-creation"], [57, "dataset-creation"]], "Serializing a custom space": [[53, "serializing-a-custom-space"]], "Collecting a subset of a dictionary space with StepDataCallback": [[55, "collecting-a-subset-of-a-dictionary-space-with-stepdatacallback"]], "PointMaze D4RL dataset": [[56, "pointmaze-d4rl-dataset"]], "WayPoint Planner": [[56, "waypoint-planner"]], "Waypoint Controller": [[56, "waypoint-controller"]], "1. Proportional Term (P)": [[56, "proportional-term-p"]], "2. Derivative Term (D)": [[56, "derivative-term-d"]], "3. Integral Term (I)": [[56, "integral-term-i"]], "Modified StepDataCallback": [[56, "modified-stepdatacallback"]], "Collect Data and Create Minari Dataset": [[56, "collect-data-and-create-minari-dataset"]], "Tutorials": [[57, "tutorials"]], "Using Datasets": [[57, "using-datasets"], [59, "using-datasets"], [61, "using-datasets"]], "Implicit Q-Learning with TorchRL": [[58, "implicit-q-learning-with-torchrl"]], "Pre-requisites": [[58, "pre-requisites"]], "For headless environments": [[58, "for-headless-environments"]], "The Adroit Pen environment": [[58, "the-adroit-pen-environment"]], "Building a replay buffer": [[58, "building-a-replay-buffer"]], "Implicit Q-Learning": [[58, "implicit-q-learning"]], "Defining the model": [[58, "defining-the-model"]], "Loss and optimizer": [[58, "loss-and-optimizer"]], "Training": [[58, "training"]], "Results": [[58, "results"]], "Behavioral cloning with PyTorch": [[60, "behavioral-cloning-with-pytorch"], [60, "id1"]], "Imports": [[60, "imports"]], "Policy training": [[60, "policy-training"]], "Dataset generation": [[60, "dataset-generation"]]}, "indexentries": {"datacollector (class in minari)": [[2, "minari.DataCollector"]], "close() (in module minari.datacollector)": [[2, "minari.DataCollector.close"]], "create_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.create_dataset"]], "reset() (in module minari.datacollector)": [[2, "minari.DataCollector.reset"]], "step() (in module minari.datacollector)": [[2, "minari.DataCollector.step"]], "episodemetadatacallback (class in minari)": [[3, "minari.EpisodeMetadataCallback"]], "__call__() (in module minari.episodemetadatacallback)": [[3, "minari.EpisodeMetadataCallback.__call__"]], "stepdatacallback (class in minari)": [[4, "minari.StepDataCallback"]], "__call__() (in module minari.stepdatacallback)": [[4, "minari.StepDataCallback.__call__"]], "episodedata (class in minari)": [[5, "minari.EpisodeData"]], "actions (minari.episodedata attribute)": [[5, "minari.EpisodeData.actions"]], "id (minari.episodedata attribute)": [[5, "minari.EpisodeData.id"]], "observations (minari.episodedata attribute)": [[5, "minari.EpisodeData.observations"]], "seed (minari.episodedata attribute)": [[5, "minari.EpisodeData.seed"]], "terminations (minari.episodedata attribute)": [[5, "minari.EpisodeData.terminations"]], "total_steps (minari.episodedata attribute)": [[5, "minari.EpisodeData.total_steps"]], "truncations (minari.episodedata attribute)": [[5, "minari.EpisodeData.truncations"]], "minaridataset (class in minari)": [[6, "minari.MinariDataset"]], "episode_indices (minari.minaridataset attribute)": [[6, "minari.MinariDataset.episode_indices"]], "filter_episodes() (in module minari.minaridataset)": [[6, "minari.MinariDataset.filter_episodes"]], "iterate_episodes() (in module minari.minaridataset)": [[6, "minari.MinariDataset.iterate_episodes"]], "recover_environment() (in module minari.minaridataset)": [[6, "minari.MinariDataset.recover_environment"]], "sample_episodes() (in module minari.minaridataset)": [[6, "minari.MinariDataset.sample_episodes"]], "set_seed() (in module minari.minaridataset)": [[6, "minari.MinariDataset.set_seed"]], "spec (minari.minaridataset attribute)": [[6, "minari.MinariDataset.spec"]], "total_episodes (minari.minaridataset attribute)": [[6, "minari.MinariDataset.total_episodes"]], "total_steps (minari.minaridataset attribute)": [[6, "minari.MinariDataset.total_steps"]], "update_dataset_from_buffer() (in module minari.minaridataset)": [[6, "minari.MinariDataset.update_dataset_from_buffer"]], "combine_datasets() (in module minari)": [[7, "minari.combine_datasets"]], "create_dataset_from_buffers() (in module minari)": [[7, "minari.create_dataset_from_buffers"]], "delete_dataset() (in module minari)": [[7, "minari.delete_dataset"]], "download_dataset() (in module minari)": [[7, "minari.download_dataset"]], "get_normalized_score() (in module minari)": [[7, "minari.get_normalized_score"]], "list_local_datasets() (in module minari)": [[7, "minari.list_local_datasets"]], "list_remote_datasets() (in module minari)": [[7, "minari.list_remote_datasets"]], "load_dataset() (in module minari)": [[7, "minari.load_dataset"]], "split_dataset() (in module minari)": [[7, "minari.split_dataset"]]}}) \ No newline at end of file