diff --git a/main/datasets/mujoco/ant/index.html b/main/datasets/mujoco/ant/index.html
index cb8ae8a3..56fafdc5 100644
--- a/main/datasets/mujoco/ant/index.html
+++ b/main/datasets/mujoco/ant/index.html
@@ -8,7 +8,7 @@
-
+
@@ -255,7 +255,7 @@
Datasets
-
+
Development
diff --git a/main/datasets/mujoco/index.html b/main/datasets/mujoco/index.html
index 700ff3e3..b9878533 100644
--- a/main/datasets/mujoco/index.html
+++ b/main/datasets/mujoco/index.html
@@ -8,7 +8,7 @@
-
+
@@ -255,7 +255,7 @@
Datasets
-
Development
diff --git a/main/index.html b/main/index.html
index 6a85cc7d..42a4a6e6 100644
--- a/main/index.html
+++ b/main/index.html
@@ -314,6 +314,13 @@
+- MuJoCo
+
Development
diff --git a/main/release_notes/index.html b/main/release_notes/index.html
index d9811084..de93bb5e 100644
--- a/main/release_notes/index.html
+++ b/main/release_notes/index.html
@@ -8,7 +8,7 @@
-
+
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/search/index.html b/main/search/index.html
index 205f808d..ae9b35af 100644
--- a/main/search/index.html
+++ b/main/search/index.html
@@ -311,6 +311,13 @@
+
MuJoCo
+
Development
diff --git a/main/searchindex.js b/main/searchindex.js
index 7cc3c783..47d6fdc2 100644
--- a/main/searchindex.js
+++ b/main/searchindex.js
@@ -1 +1 @@
-Search.setIndex({"alltitles": {"0.1.0": [[59, "release-0-1-0"]], "0.2.2": [[59, "release-0-2-2"]], "1. Proportional Term (P)": [[64, "proportional-term-p"]], "2. Derivative Term (D)": [[64, "derivative-term-d"]], "3. Integral Term (I)": [[64, "integral-term-i"]], "404 - Page Not Found": [[0, null]], "Ant Maze": [[15, null]], "Attributes": [[3, "attributes"], [6, "attributes"], [7, "attributes"], [8, "attributes"], [9, "attributes"]], "Basic Usage": [[12, null]], "Behavioral cloning with PyTorch": [[68, null], [68, "id1"]], "Build the Documentation": [[1, "build-the-documentation"]], "Building a replay buffer": [[66, "building-a-replay-buffer"]], "Checkpoint Minari Dataset": [[12, "checkpoint-minari-dataset"]], "Cloned": [[22, null], [26, null], [38, null], [51, null]], "Collect Data and Create Minari Dataset": [[64, "collect-data-and-create-minari-dataset"]], "Collecting Data": [[12, "collecting-data"]], "Collecting a subset of a dictionary space with StepDataCallback": [[63, null]], "Combine Minari Datasets": [[10, "combine-minari-datasets"], [12, "combine-minari-datasets"]], "Combine datasets": [[14, "combine-datasets"]], "Complete": [[31, null]], "Content": [[15, "content"], [25, "content"], [29, "content"], [30, "content"], [32, "content"], [37, "content"], [41, "content"], [42, "content"], [54, "content"], [56, "content"], [57, "content"]], "Create Minari Dataset": [[10, "create-minari-dataset"], [12, "create-minari-dataset"]], "Create Namespace": [[11, "create-namespace"]], "D4RL": [[30, null]], "DataCollector": [[2, null]], "Dataset Creation": [[60, null], [62, null], [65, "dataset-creation"]], "Dataset Metadata": [[13, "dataset-metadata"]], "Dataset Specs": [[16, "dataset-specs"], [17, "dataset-specs"], [18, "dataset-specs"], [19, "dataset-specs"], [20, "dataset-specs"], [21, "dataset-specs"], [22, "dataset-specs"], [23, "dataset-specs"], [24, "dataset-specs"], [26, "dataset-specs"], [27, "dataset-specs"], [28, "dataset-specs"], [31, "dataset-specs"], [33, "dataset-specs"], [34, "dataset-specs"], [35, "dataset-specs"], [36, "dataset-specs"], [38, "dataset-specs"], [39, "dataset-specs"], [40, "dataset-specs"], [43, "dataset-specs"], [44, "dataset-specs"], [45, "dataset-specs"], [46, "dataset-specs"], [47, "dataset-specs"], [48, "dataset-specs"], [49, "dataset-specs"], [50, "dataset-specs"], [51, "dataset-specs"], [52, "dataset-specs"], [53, "dataset-specs"], [55, "dataset-specs"]], "Dataset Standards": [[13, null]], "Dataset generation": [[68, "dataset-generation"]], "Defining the model": [[66, "defining-the-model"]], "Delete Minari Datasets": [[10, "delete-minari-datasets"]], "Delete Namespace": [[11, "delete-namespace"]], "Delete local datasets": [[14, "delete-local-datasets"]], "Description": [[16, "description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [21, "description"], [22, "description"], [23, "description"], [24, "description"], [26, "description"], [27, "description"], [28, "description"], [31, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [38, "description"], [39, "description"], [40, "description"], [43, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [55, "description"]], "Door": [[25, null]], "Download Datasets": [[12, "download-datasets"]], "Download Minari Dataset": [[10, "download-minari-dataset"]], "Download Namespace Metadata": [[11, "download-namespace-metadata"]], "Download datasets": [[14, "download-datasets"]], "Environment Specs": [[16, "environment-specs"], [17, "environment-specs"], [18, "environment-specs"], [19, "environment-specs"], [20, "environment-specs"], [21, "environment-specs"], [22, "environment-specs"], [23, "environment-specs"], [24, "environment-specs"], [26, "environment-specs"], [27, "environment-specs"], [28, "environment-specs"], [31, "environment-specs"], [33, "environment-specs"], [34, "environment-specs"], [35, "environment-specs"], [36, "environment-specs"], [38, "environment-specs"], [39, "environment-specs"], [40, "environment-specs"], [43, "environment-specs"], [44, "environment-specs"], [45, "environment-specs"], [46, "environment-specs"], [47, "environment-specs"], [48, "environment-specs"], [49, "environment-specs"], [50, "environment-specs"], [51, "environment-specs"], [52, "environment-specs"], [53, "environment-specs"], [55, "environment-specs"]], "EpisodeBuffer": [[3, null]], "EpisodeData": [[6, null]], "EpisodeData Structure": [[13, "episodedata-structure"]], "EpisodeMetadataCallback": [[4, null]], "Evaluation Environment Specs": [[16, "evaluation-environment-specs"], [17, "evaluation-environment-specs"], [18, "evaluation-environment-specs"], [19, "evaluation-environment-specs"], [20, "evaluation-environment-specs"], [21, "evaluation-environment-specs"], [22, "evaluation-environment-specs"], [23, "evaluation-environment-specs"], [24, "evaluation-environment-specs"], [26, "evaluation-environment-specs"], [27, "evaluation-environment-specs"], [28, "evaluation-environment-specs"], [31, "evaluation-environment-specs"], [33, "evaluation-environment-specs"], [34, "evaluation-environment-specs"], [35, "evaluation-environment-specs"], [36, "evaluation-environment-specs"], [38, "evaluation-environment-specs"], [39, "evaluation-environment-specs"], [40, "evaluation-environment-specs"], [43, "evaluation-environment-specs"], [44, "evaluation-environment-specs"], [45, "evaluation-environment-specs"], [46, "evaluation-environment-specs"], [47, "evaluation-environment-specs"], [48, "evaluation-environment-specs"], [49, "evaluation-environment-specs"], [50, "evaluation-environment-specs"], [51, "evaluation-environment-specs"], [52, "evaluation-environment-specs"], [53, "evaluation-environment-specs"], [55, "evaluation-environment-specs"]], "Expert": [[23, null], [27, null], [39, null], [52, null], [55, null]], "Filter Episodes": [[12, "filter-episodes"]], "For headless environments": [[66, "for-headless-environments"]], "Fourrooms": [[36, null]], "Fourrooms-Random": [[35, null]], "Get Local Namespace Metadata": [[11, "get-local-namespace-metadata"]], "Hammer": [[29, null]], "Human": [[24, null], [28, null], [40, null], [53, null]], "Implicit Q-Learning": [[66, "implicit-q-learning"]], "Implicit Q-Learning with TorchRL": [[66, null]], "Imports": [[68, "imports"]], "Installation": [[12, "installation"]], "Kitchen": [[32, null]], "Large": [[44, null]], "Large-Dense": [[43, null]], "Large-Diverse": [[16, null]], "Large-Play": [[17, null]], "List Minari Datasets": [[10, "list-minari-datasets"]], "List Namespaces": [[11, "list-namespaces"]], "List datasets": [[14, "list-datasets"]], "Load Local Datasets": [[12, "load-local-datasets"]], "Load Minari Dataset": [[10, "load-minari-dataset"]], "Loss and optimizer": [[66, "loss-and-optimizer"]], "Medium": [[46, null]], "Medium-Dense": [[45, null]], "Medium-Diverse": [[18, null]], "Medium-Play": [[19, null]], "Methods": [[2, "methods"], [3, "methods"], [4, "methods"], [5, "methods"], [7, "methods"], [8, "methods"]], "Minari": [[10, null]], "Minari CLI": [[14, null]], "Minari Dataset Directory": [[13, "minari-dataset-directory"]], "Minari documentation": [[1, null]], "MinariDataset": [[7, null]], "MinariStorage": [[8, null]], "MiniGrid": [[37, null]], "Mixed": [[33, null]], "Modified StepDataCallback": [[64, "modified-stepdatacallback"]], "MuJoCo": [[57, null]], "Mujoco/ant": [[56, null]], "Namespace": [[11, null]], "Namespace metadata": [[13, "namespace-metadata"]], "Normalize Score": [[10, "normalize-score"]], "Observation and Action Spaces": [[13, "observation-and-action-spaces"]], "Open": [[48, null]], "Open-Dense": [[47, null]], "Partial": [[34, null]], "Pen": [[41, null]], "Point Maze": [[42, null]], "PointMaze D4RL dataset": [[64, null]], "Policy training": [[68, "policy-training"]], "Pre-requisites": [[66, "pre-requisites"]], "Recover Environment": [[12, "recover-environment"]], "References": [[15, "references"], [25, "references"], [29, "references"], [30, "references"], [32, "references"], [37, "references"], [41, "references"], [42, "references"], [54, "references"], [64, "references"]], "Release Notes": [[59, null]], "Relocate": [[54, null]], "Results": [[66, "results"]], "Sampling Episodes": [[12, "sampling-episodes"]], "Save Dataset": [[12, "save-dataset"]], "Serializing a custom space": [[61, null]], "Show datasets details": [[14, "show-datasets-details"]], "Split Dataset": [[12, "split-dataset"]], "Split Minari Dataset": [[10, "split-minari-dataset"]], "StepData": [[9, null]], "StepDataCallback": [[5, null]], "Supported Spaces": [[13, "supported-spaces"]], "The Adroit Pen environment": [[66, "the-adroit-pen-environment"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Training": [[66, "training"]], "Tutorials": [[65, null]], "Umaze": [[21, null], [50, null]], "Umaze-Dense": [[49, null]], "Umaze-Diverse": [[20, null]], "Update Namespace": [[11, "update-namespace"]], "Upload Namespace": [[11, "upload-namespace"]], "Upload datasets": [[14, "upload-datasets"]], "Using Datasets": [[65, "using-datasets"], [67, null], [69, null]], "Using Minari Datasets": [[12, "using-minari-datasets"]], "Using Namespaces": [[12, "using-namespaces"]], "WayPoint Planner": [[64, "waypoint-planner"]], "Waypoint Controller": [[64, "waypoint-controller"]], "minari.DataCollector": [[2, "minari-datacollector"]], "minari.EpisodeData": [[6, "minari-episodedata"]], "minari.EpisodeMetadataCallback": [[4, "minari-episodemetadatacallback"]], "minari.MinariDataset": [[7, "minari-minaridataset"]], "minari.StepData": [[9, "minari-stepdata"]], "minari.StepDataCallback": [[5, "minari-stepdatacallback"]], "minari.data_collector.EpisodeBuffer": [[3, "minari-data-collector-episodebuffer"]], "minari.dataset.minari_storage.MinariStorage": [[8, "minari-dataset-minari-storage-minaristorage"]], "v0.3.0": [[59, "release-v0-3-0"]], "v0.3.1": [[59, "release-v0-3-1"]], "v0.4.0": [[59, "release-v0-4-0"]], "v0.4.1": [[59, "release-v0-4-1"]], "v0.4.2": [[59, "release-v0-4-2"]], "v0.4.3": [[59, "release-v0-4-3"]], "v0.5.0": [[59, "release-v0-5-0"]], "v0.5.1": [[59, "release-v0-5-1"]]}, "docnames": ["404", "README", "api/data_collector", "api/data_collector/episode_buffer", "api/data_collector/episode_metadata_callback", "api/data_collector/step_data_callback", "api/minari_dataset/episode_data", "api/minari_dataset/minari_dataset", "api/minari_dataset/minari_storage", "api/minari_dataset/step_data", "api/minari_functions", "api/namespace/namespace", "content/basic_usage", "content/dataset_standards", "content/minari_cli", "datasets/D4RL/antmaze/index", "datasets/D4RL/antmaze/large-diverse-v1", "datasets/D4RL/antmaze/large-play-v1", "datasets/D4RL/antmaze/medium-diverse-v1", "datasets/D4RL/antmaze/medium-play-v1", "datasets/D4RL/antmaze/umaze-diverse-v1", "datasets/D4RL/antmaze/umaze-v1", "datasets/D4RL/door/cloned-v2", "datasets/D4RL/door/expert-v2", "datasets/D4RL/door/human-v2", "datasets/D4RL/door/index", "datasets/D4RL/hammer/cloned-v2", "datasets/D4RL/hammer/expert-v2", "datasets/D4RL/hammer/human-v2", "datasets/D4RL/hammer/index", "datasets/D4RL/index", "datasets/D4RL/kitchen/complete-v2", "datasets/D4RL/kitchen/index", "datasets/D4RL/kitchen/mixed-v2", "datasets/D4RL/kitchen/partial-v2", "datasets/D4RL/minigrid/fourrooms-random-v0", "datasets/D4RL/minigrid/fourrooms-v0", "datasets/D4RL/minigrid/index", "datasets/D4RL/pen/cloned-v2", "datasets/D4RL/pen/expert-v2", "datasets/D4RL/pen/human-v2", "datasets/D4RL/pen/index", "datasets/D4RL/pointmaze/index", "datasets/D4RL/pointmaze/large-dense-v2", "datasets/D4RL/pointmaze/large-v2", "datasets/D4RL/pointmaze/medium-dense-v2", "datasets/D4RL/pointmaze/medium-v2", "datasets/D4RL/pointmaze/open-dense-v2", "datasets/D4RL/pointmaze/open-v2", "datasets/D4RL/pointmaze/umaze-dense-v2", "datasets/D4RL/pointmaze/umaze-v2", "datasets/D4RL/relocate/cloned-v2", "datasets/D4RL/relocate/expert-v2", "datasets/D4RL/relocate/human-v2", "datasets/D4RL/relocate/index", "datasets/mujoco/ant/expert-v0", "datasets/mujoco/ant/index", "datasets/mujoco/index", "index", "release_notes/index", "tutorials/dataset_creation/README", "tutorials/dataset_creation/custom_space_serialization", "tutorials/dataset_creation/index", "tutorials/dataset_creation/observation_space_subseting", "tutorials/dataset_creation/point_maze_dataset", "tutorials/index", "tutorials/using_datasets/IQL_torchrl", "tutorials/using_datasets/README", "tutorials/using_datasets/behavioral_cloning", "tutorials/using_datasets/index"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/data_collector.md", "api/data_collector/episode_buffer.md", "api/data_collector/episode_metadata_callback.md", "api/data_collector/step_data_callback.md", "api/minari_dataset/episode_data.md", "api/minari_dataset/minari_dataset.md", "api/minari_dataset/minari_storage.md", "api/minari_dataset/step_data.md", "api/minari_functions.md", "api/namespace/namespace.md", "content/basic_usage.md", "content/dataset_standards.md", "content/minari_cli.md", "datasets/D4RL/antmaze/index.md", "datasets/D4RL/antmaze/large-diverse-v1.md", "datasets/D4RL/antmaze/large-play-v1.md", "datasets/D4RL/antmaze/medium-diverse-v1.md", "datasets/D4RL/antmaze/medium-play-v1.md", "datasets/D4RL/antmaze/umaze-diverse-v1.md", "datasets/D4RL/antmaze/umaze-v1.md", "datasets/D4RL/door/cloned-v2.md", "datasets/D4RL/door/expert-v2.md", "datasets/D4RL/door/human-v2.md", "datasets/D4RL/door/index.md", "datasets/D4RL/hammer/cloned-v2.md", "datasets/D4RL/hammer/expert-v2.md", "datasets/D4RL/hammer/human-v2.md", "datasets/D4RL/hammer/index.md", "datasets/D4RL/index.md", "datasets/D4RL/kitchen/complete-v2.md", "datasets/D4RL/kitchen/index.md", "datasets/D4RL/kitchen/mixed-v2.md", "datasets/D4RL/kitchen/partial-v2.md", "datasets/D4RL/minigrid/fourrooms-random-v0.md", "datasets/D4RL/minigrid/fourrooms-v0.md", "datasets/D4RL/minigrid/index.md", "datasets/D4RL/pen/cloned-v2.md", "datasets/D4RL/pen/expert-v2.md", "datasets/D4RL/pen/human-v2.md", "datasets/D4RL/pen/index.md", "datasets/D4RL/pointmaze/index.md", "datasets/D4RL/pointmaze/large-dense-v2.md", "datasets/D4RL/pointmaze/large-v2.md", "datasets/D4RL/pointmaze/medium-dense-v2.md", "datasets/D4RL/pointmaze/medium-v2.md", "datasets/D4RL/pointmaze/open-dense-v2.md", "datasets/D4RL/pointmaze/open-v2.md", "datasets/D4RL/pointmaze/umaze-dense-v2.md", "datasets/D4RL/pointmaze/umaze-v2.md", "datasets/D4RL/relocate/cloned-v2.md", "datasets/D4RL/relocate/expert-v2.md", "datasets/D4RL/relocate/human-v2.md", "datasets/D4RL/relocate/index.md", "datasets/mujoco/ant/expert-v0.md", "datasets/mujoco/ant/index.md", "datasets/mujoco/index.md", "index.md", "release_notes/index.md", "tutorials/dataset_creation/README.rst", "tutorials/dataset_creation/custom_space_serialization.rst", "tutorials/dataset_creation/index.rst", "tutorials/dataset_creation/observation_space_subseting.rst", "tutorials/dataset_creation/point_maze_dataset.rst", "tutorials/index.rst", "tutorials/using_datasets/IQL_torchrl.rst", "tutorials/using_datasets/README.rst", "tutorials/using_datasets/behavioral_cloning.rst", "tutorials/using_datasets/index.rst"], "indexentries": {"__call__() (in module minari.episodemetadatacallback)": [[4, "minari.EpisodeMetadataCallback.__call__", false]], "__call__() (in module minari.stepdatacallback)": [[5, "minari.StepDataCallback.__call__", false]], "__len__() (in module minari.data_collector.episodebuffer)": [[3, "minari.data_collector.EpisodeBuffer.__len__", false]], "action (minari.stepdata attribute)": [[9, "minari.StepData.action", false]], "action_space (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.action_space", false]], "actions (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.actions", false]], "actions (minari.episodedata attribute)": [[6, "minari.EpisodeData.actions", false]], "add_step_data() (in module minari.data_collector.episodebuffer)": [[3, "minari.data_collector.EpisodeBuffer.add_step_data", false]], "add_to_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.add_to_dataset", false]], "apply() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.apply", false]], "close() (in module minari.datacollector)": [[2, "minari.DataCollector.close", false]], "combine_datasets() (in module minari)": [[10, "minari.combine_datasets", false]], "create_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.create_dataset", false]], "create_dataset_from_buffers() (in module minari)": [[10, "minari.create_dataset_from_buffers", false]], "create_namespace() (in module minari.namespace)": [[11, "minari.namespace.create_namespace", false]], "data_path (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.data_path", false]], "datacollector (class in minari)": [[2, "minari.DataCollector", false]], "delete_dataset() (in module minari)": [[10, "minari.delete_dataset", false]], "delete_namespace() (in module minari.namespace)": [[11, "minari.namespace.delete_namespace", false]], "download_dataset() (in module minari)": [[10, "minari.download_dataset", false]], "download_namespace_metadata() (in module minari.namespace)": [[11, "minari.namespace.download_namespace_metadata", false]], "episode_indices (minari.minaridataset attribute)": [[7, "minari.MinariDataset.episode_indices", false]], "episodebuffer (class in minari.data_collector)": [[3, "minari.data_collector.EpisodeBuffer", false]], "episodedata (class in minari)": [[6, "minari.EpisodeData", false]], "episodemetadatacallback (class in minari)": [[4, "minari.EpisodeMetadataCallback", false]], "filter_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.filter_episodes", false]], "get_episode_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_episode_metadata", false]], "get_episodes() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_episodes", false]], "get_namespace_metadata() (in module minari.namespace)": [[11, "minari.namespace.get_namespace_metadata", false]], "get_normalized_score() (in module minari)": [[10, "minari.get_normalized_score", false]], "get_size() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_size", false]], "id (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.id", false]], "id (minari.episodedata attribute)": [[6, "minari.EpisodeData.id", false]], "info (minari.stepdata attribute)": [[9, "minari.StepData.info", false]], "infos (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.infos", false]], "infos (minari.episodedata attribute)": [[6, "minari.EpisodeData.infos", false]], "iterate_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.iterate_episodes", false]], "list_local_datasets() (in module minari)": [[10, "minari.list_local_datasets", false]], "list_local_namespaces() (in module minari.namespace)": [[11, "minari.namespace.list_local_namespaces", false]], "list_remote_datasets() (in module minari)": [[10, "minari.list_remote_datasets", false]], "list_remote_namespaces() (in module minari.namespace)": [[11, "minari.namespace.list_remote_namespaces", false]], "load_dataset() (in module minari)": [[10, "minari.load_dataset", false]], "metadata (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.metadata", false]], "minaridataset (class in minari)": [[7, "minari.MinariDataset", false]], "minaristorage (class in minari.dataset.minari_storage)": [[8, "minari.dataset.minari_storage.MinariStorage", false]], "new() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.new", false]], "observation (minari.stepdata attribute)": [[9, "minari.StepData.observation", false]], "observation_space (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.observation_space", false]], "observations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.observations", false]], "observations (minari.episodedata attribute)": [[6, "minari.EpisodeData.observations", false]], "read() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.read", false]], "recover_environment() (in module minari.minaridataset)": [[7, "minari.MinariDataset.recover_environment", false]], "reset() (in module minari.datacollector)": [[2, "minari.DataCollector.reset", false]], "rewards (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.rewards", false]], "sample_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.sample_episodes", false]], "seed (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.seed", false]], "set_seed() (in module minari.minaridataset)": [[7, "minari.MinariDataset.set_seed", false]], "spec (minari.minaridataset attribute)": [[7, "minari.MinariDataset.spec", false]], "split_dataset() (in module minari)": [[10, "minari.split_dataset", false]], "step() (in module minari.datacollector)": [[2, "minari.DataCollector.step", false]], "stepdata (class in minari)": [[9, "minari.StepData", false]], "stepdatacallback (class in minari)": [[5, "minari.StepDataCallback", false]], "termination (minari.stepdata attribute)": [[9, "minari.StepData.termination", false]], "terminations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.terminations", false]], "terminations (minari.episodedata attribute)": [[6, "minari.EpisodeData.terminations", false]], "total_episodes (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.total_episodes", false]], "total_episodes (minari.minaridataset attribute)": [[7, "minari.MinariDataset.total_episodes", false]], "total_steps (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.total_steps", false]], "total_steps (minari.minaridataset attribute)": [[7, "minari.MinariDataset.total_steps", false]], "truncation (minari.stepdata attribute)": [[9, "minari.StepData.truncation", false]], "truncations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.truncations", false]], "truncations (minari.episodedata attribute)": [[6, "minari.EpisodeData.truncations", false]], "update_dataset_from_buffer() (in module minari.minaridataset)": [[7, "minari.MinariDataset.update_dataset_from_buffer", false]], "update_episode_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_episode_metadata", false]], "update_episodes() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_episodes", false]], "update_from_storage() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_from_storage", false]], "update_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_metadata", false]], "upload_namespace() (in module minari.namespace)": [[11, "minari.namespace.upload_namespace", false]]}, "objects": {"minari": [[2, 0, 1, "", "DataCollector"], [6, 0, 1, "", "EpisodeData"], [4, 0, 1, "", "EpisodeMetadataCallback"], [7, 0, 1, "", "MinariDataset"], [9, 0, 1, "", "StepData"], [5, 0, 1, "", "StepDataCallback"], [10, 1, 1, "", "combine_datasets"], [10, 1, 1, "", "create_dataset_from_buffers"], [10, 1, 1, "", "delete_dataset"], [10, 1, 1, "", "download_dataset"], [10, 1, 1, "", "get_normalized_score"], [10, 1, 1, "", "list_local_datasets"], [10, 1, 1, "", "list_remote_datasets"], [10, 1, 1, "", "load_dataset"], [10, 1, 1, "", "split_dataset"]], "minari.DataCollector": [[2, 1, 1, "", "add_to_dataset"], [2, 1, 1, "", "close"], [2, 1, 1, "", "create_dataset"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "step"]], "minari.EpisodeData": [[6, 2, 1, "", "actions"], [6, 2, 1, "", "id"], [6, 2, 1, "", "infos"], [6, 2, 1, "", "observations"], [6, 2, 1, "", "terminations"], [6, 2, 1, "", "truncations"]], "minari.EpisodeMetadataCallback": [[4, 1, 1, "", "__call__"]], "minari.MinariDataset": [[7, 2, 1, "", "episode_indices"], [7, 1, 1, "", "filter_episodes"], [7, 1, 1, "", "iterate_episodes"], [7, 1, 1, "", "recover_environment"], [7, 1, 1, "", "sample_episodes"], [7, 1, 1, "", "set_seed"], [7, 2, 1, "", "spec"], [7, 2, 1, "", "total_episodes"], [7, 2, 1, "", "total_steps"], [7, 1, 1, "", "update_dataset_from_buffer"]], "minari.StepData": [[9, 2, 1, "", "action"], [9, 2, 1, "", "info"], [9, 2, 1, "", "observation"], [9, 2, 1, "", "termination"], [9, 2, 1, "", "truncation"]], "minari.StepDataCallback": [[5, 1, 1, "", "__call__"]], "minari.data_collector": [[3, 0, 1, "", "EpisodeBuffer"]], "minari.data_collector.EpisodeBuffer": [[3, 1, 1, "", "__len__"], [3, 2, 1, "", "actions"], [3, 1, 1, "", "add_step_data"], [3, 2, 1, "", "id"], [3, 2, 1, "", "infos"], [3, 2, 1, "", "observations"], [3, 2, 1, "", "rewards"], [3, 2, 1, "", "seed"], [3, 2, 1, "", "terminations"], [3, 2, 1, "", "truncations"]], "minari.dataset.minari_storage": [[8, 0, 1, "", "MinariStorage"]], "minari.dataset.minari_storage.MinariStorage": [[8, 2, 1, "", "action_space"], [8, 1, 1, "", "apply"], [8, 2, 1, "", "data_path"], [8, 1, 1, "", "get_episode_metadata"], [8, 1, 1, "", "get_episodes"], [8, 1, 1, "", "get_size"], [8, 2, 1, "", "metadata"], [8, 1, 1, "", "new"], [8, 2, 1, "", "observation_space"], [8, 1, 1, "", "read"], [8, 2, 1, "", "total_episodes"], [8, 2, 1, "", "total_steps"], [8, 1, 1, "", "update_episode_metadata"], [8, 1, 1, "", "update_episodes"], [8, 1, 1, "", "update_from_storage"], [8, 1, 1, "", "update_metadata"]], "minari.namespace": [[11, 1, 1, "", "create_namespace"], [11, 1, 1, "", "delete_namespace"], [11, 1, 1, "", "download_namespace_metadata"], [11, 1, 1, "", "get_namespace_metadata"], [11, 1, 1, "", "list_local_namespaces"], [11, 1, 1, "", "list_remote_namespaces"], [11, 1, 1, "", "upload_namespace"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "function", "Python function"], "2": ["py", "attribute", "Python attribute"]}, "objtypes": {"0": "py:class", "1": "py:function", "2": "py:attribute"}, "terms": {"": [2, 4, 5, 10, 12, 13, 14, 16, 17, 18, 19, 20, 32, 59, 61, 63, 64, 66, 68], "0": [2, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 61, 63, 64, 66, 68], "000": [64, 66], "0003": 66, "005": 66, "01": 59, "0123456789abcdefghijklmnopqrstuvwxyzabcdeeeffghijklmnnoopqrrssttuvwxyzz": [35, 36], "03ac13": [14, 58], "04": 59, "05": 59, "07": 59, "07219": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "08": 59, "09": 59, "0x11f2608b0": 61, "0x12253a940": 61, "0x7f22a28c0670": 35, "0x7fa1e1d39ee0": 36, "1": [2, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 66, 68], "10": [12, 13, 59, 61, 63, 64, 66], "100": [2, 10, 12, 14, 38, 39, 40, 58, 59, 66], "1000": [12, 16, 17, 18, 19, 55, 59, 66], "1000000": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 26, 27, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 58], "1000070": 35, "10010": 36, "1006729": 12, "10087": [25, 29, 41, 54], "101": 59, "10174": 35, "102": 59, "104": 59, "105": [55, 59], "107": 59, "1077": [14, 58], "108": 59, "109": 59, "1096": [12, 14, 58], "10_000": [64, 66], "11": 59, "110": 59, "1103": 12, "111": 59, "112": 59, "11310": 28, "116": 59, "11956": 32, "12": [12, 59], "121": 59, "123": [12, 59, 64], "124": 59, "126": 59, "128": [59, 66, 68], "129": 59, "13": [12, 59], "130": 59, "132": 59, "13210": [49, 50], "133": 59, "137": 59, "139": 59, "14": [35, 36, 59], "1400": 66, "1430": [20, 21], "144": 59, "148": 59, "15": 12, "151": 59, "153": 59, "155": 59, "156560": [33, 34], "157": 59, "158": 59, "160": 59, "161": 59, "162": 59, "163": 59, "164": 59, "165": 59, "167": 59, "169": 59, "16x16": 61, "17": [12, 59], "170": 59, "1709": [25, 29, 41, 54], "171": 59, "172": 59, "177": 59, "18": [12, 59], "183": 59, "1872": 66, "19": [12, 31, 59], "1910": 32, "196": 59, "1_000": [66, 68], "1e": 64, "1f": 66, "2": [2, 10, 12, 15, 16, 17, 18, 19, 20, 21, 25, 29, 30, 31, 32, 33, 34, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 61, 63, 66], "20": [12, 59, 66], "200": [22, 23, 24, 26, 27, 28, 51, 52, 53], "2000000": 55, "2004": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "2017": [25, 29, 41, 54], "2019": 32, "2020": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "2021": [15, 66], "2022": 59, "2023": 59, "2024": 59, "2026": 55, "2059": 12, "21": 12, "211": 59, "218": 59, "22": [12, 15, 59], "224": 59, "23": 12, "239": 59, "24": [14, 25, 29, 38, 39, 40, 41, 54, 66], "240": 59, "241": 59, "244": 59, "245": 59, "25": [12, 14, 24, 25, 28, 29, 40, 41, 53, 54, 58, 59, 66], "255": [35, 36, 61], "256": [66, 68], "26": [26, 27, 28, 59], "268": 15, "27": [16, 17, 18, 19, 20, 21, 59], "28": [12, 22, 23, 24, 59], "280": 31, "29": 59, "2d": [15, 30], "2f": 66, "3": [2, 10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 61, 66], "30": [51, 52, 53, 66], "305": 59, "31": 59, "32": 68, "3360": [43, 44], "34": 59, "3606": 26, "3736": [14, 38], "3758": 51, "39": [12, 22, 23, 24, 51, 52, 53], "4": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 61, 63, 64], "42": [61, 63, 66, 68], "4209": 31, "4356": [14, 58], "4358": 22, "45": [14, 38, 39, 40, 66], "450": [33, 34], "46": [26, 27, 28], "4752": [45, 46], "480": 66, "4958": [14, 39], "499206": [14, 39], "5": [12, 14, 55, 64, 66], "50": [22, 25, 26, 29, 38, 41, 51, 54, 64, 66], "500": 68, "5000": [12, 14, 23, 27, 40, 52, 58, 66], "500000": [14, 38], "5025": 12, "50_000": 66, "52": 59, "54": 59, "55": 59, "57": 59, "59": [31, 33, 34], "590": 36, "6": [12, 59], "60": 59, "6000": 55, "604": 14, "605": 12, "621": [33, 34], "638": 14, "6729": [12, 14, 24, 58], "69": 66, "7": [12, 14, 31, 33, 34, 35, 36, 58, 59, 61, 66], "700": [20, 21], "71": 59, "73": 59, "75": 59, "77": 59, "8": [12, 15, 16, 17, 18, 19, 20, 21, 30, 42, 55, 59, 64], "80": [16, 17, 18, 19, 59], "82": 59, "83": 59, "84": 59, "86": 59, "87": 59, "88": 59, "884": 66, "9": [12, 31, 33, 34], "90": [20, 21, 59], "900": 66, "92": 59, "93": 59, "95": 59, "9525": [47, 48], "96": 59, "99": [59, 64, 66], "9942": 53, "A": [2, 8, 13, 32, 58, 64, 66], "And": 68, "As": [6, 13, 59, 64, 68], "At": [16, 17, 18, 19, 20], "But": [61, 66], "By": [64, 66], "For": [1, 2, 10, 11, 12, 13, 30, 59, 61, 64, 68], "If": [2, 7, 8, 10, 11, 12, 13, 14, 59, 61, 64, 66], "In": [12, 13, 59, 61, 63, 64, 66, 68], "It": [59, 64, 66], "No": 61, "Not": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 51, 52, 53], "On": [13, 64, 66], "The": [2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 59, 61, 63, 64, 68], "Then": [61, 64, 66], "There": [12, 25, 29, 41, 54, 66], "These": [10, 14, 25, 29, 30, 32, 41, 42, 54, 59, 64], "To": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 66, 68], "With": 14, "_": [2, 12, 61, 63, 64, 66, 68], "_0": 64, "__call__": [4, 5, 63, 64], "__init__": [64, 68], "__len__": 3, "_build": 1, "_check_valid_cel": 64, "_gen_miss": [35, 36, 61], "_index_0": 59, "_index_1": 59, "_max": 10, "_min": 10, "_score": 10, "_script": 59, "a1efe4": [14, 58], "a256f8": 14, "a5a5a1": 14, "a_hat": 68, "a_pr": 68, "a_t": 66, "ab": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "abil": 12, "abl": [12, 42], "abort": 14, "about": [1, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61], "abov": [12, 59, 61, 63, 66], "abspath": 68, "abstract": 12, "ac": 68, "access": [8, 12, 14, 59, 64], "account": 64, "accumul": [16, 17, 18, 19, 20, 21, 64, 68], "accumulated_rew": 68, "accur": 66, "achiev": [12, 64, 68], "achieved_go": [16, 17, 18, 19, 20, 21, 31, 33, 34, 43, 44, 45, 46, 47, 48, 49, 50, 63, 64], "achieved_goal_cel": 64, "acrobot": 12, "across": [10, 13, 59], "act": 59, "action": [2, 3, 5, 6, 8, 9, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66, 68], "action_id": 64, "action_idx": 64, "action_spac": [2, 8, 10, 12, 13, 59, 61, 63, 64, 68], "action_space_subset": 63, "action_spec": 66, "activ": [15, 66], "activation_class": 66, "activation_fn": 66, "actor": 66, "actor_extractor": 66, "actor_mlp": 66, "actor_modul": 66, "actor_net": 66, "acttyp": [2, 10], "actual": 64, "actuat": [30, 42], "ad": [5, 7, 8, 10, 12, 13, 43, 44, 45, 46, 47, 48, 49, 50, 59, 63], "adam": [15, 66, 68], "add": [2, 3, 4, 5, 7, 8, 14, 43, 44, 45, 46, 47, 48, 49, 50, 59, 64, 66], "add_step_data": 3, "add_to_dataset": [2, 12], "addit": [2, 5, 7, 11, 12, 13, 59], "addition": [15, 59], "additional_dataset": 59, "additional_group": 59, "additional_wrapp": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "address": 64, "adher": 59, "adjust": 64, "adroit_door": [22, 23, 24], "adroit_h": 14, "adroit_hamm": [26, 27, 28], "adroit_hand": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 51, 52, 53], "adroit_pen": [14, 38, 39, 40], "adroit_reloc": [51, 52, 53], "adroithanddoor": [12, 13, 22, 23, 24, 25, 30, 59], "adroithanddoorenv": [22, 23, 24], "adroithandhamm": [26, 27, 28, 29, 30, 59], "adroithandhammerenv": [26, 27, 28], "adroithandpen": [14, 30, 38, 39, 40, 41, 59, 66], "adroithandpenenv": [38, 39, 40], "adroithandreloc": [30, 51, 52, 53, 54, 59], "adroithandrelocateenv": [51, 52, 53], "advantag": [64, 66], "after": [2, 4, 6, 9, 10, 13, 14, 59, 64, 68], "again": [16, 17, 18, 19, 20, 21], "agent": [9, 15, 16, 17, 18, 19, 20, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 63, 64, 66, 68], "aggress": 64, "agnost": [2, 66], "aim": [13, 64, 66], "al": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64, 66], "alex": [12, 16, 17, 18, 19, 20, 21], "alexdavei": 59, "alexdavey0": [16, 17, 18, 19, 20, 21], "algo": 68, "algorithm": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 66], "algorithm_nam": [2, 10, 12, 13, 61, 63, 64, 68], "all": [8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 30, 31, 32, 58, 59, 61, 65, 66, 68], "allow": [12, 13, 59, 64, 68], "alon": 64, "along": [30, 42], "alreadi": [8, 12, 14, 59, 63, 64, 66], "also": [10, 12, 14, 16, 17, 18, 19, 20, 21, 58, 59, 61, 63, 64, 66], "alwai": 64, "among": 59, "amount": [12, 64], "amp": 59, "an": [4, 7, 10, 11, 12, 13, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 47, 48, 51, 52, 53, 54, 55, 59, 61, 64, 66], "andrea": [55, 56], "ani": [2, 5, 6, 7, 8, 9, 10, 11, 12, 59, 63, 64], "annot": 59, "anoth": [2, 5, 8, 12, 13, 25, 29, 41, 54, 64, 66], "anssi": 15, "ant": [16, 17, 18, 19, 20, 21, 30, 55, 57], "ant_maze_v4": [16, 17, 18, 19, 20, 21], "ant_v5": 55, "antenv": 55, "antmaz": [12, 16, 17, 18, 19, 20, 21], "antmaze_larg": [15, 17], "antmaze_large_diverse_gr": [15, 16], "antmaze_medium": [15, 19], "antmaze_medium_diverse_gr": [15, 18], "antmaze_umaz": [15, 20, 21], "antmazeenv": [16, 17, 18, 19, 20, 21], "antonin": 15, "apart": 59, "api": [11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 64, 68], "appear": [12, 59], "append": [3, 8, 12, 59, 66], "appli": [8, 61], "applic": [12, 59], "appreci": 59, "approach": 64, "appropri": 13, "approx": 66, "approxim": 66, "apr": [15, 42, 64], "apt": 66, "ar": [2, 6, 8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 51, 52, 53, 54, 55, 58, 59, 61, 64, 66], "arang": 66, "aravind": [25, 29, 41, 54], "aravindr93": 14, "arbitrari": [13, 59], "arbitrarili": 13, "arena": [42, 47, 48], "arg": [14, 59, 64, 66], "argmax": [64, 68], "argument": [4, 5, 10, 12, 13, 59], "argv": 68, "around": [61, 66], "arrai": [10, 13, 64], "arrow": [13, 59], "arxiv": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "as_tensor": 68, "ashlei": 15, "assert": [22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 61, 68], "assign": 10, "associ": 13, "attach": 13, "attempt": 66, "attr": 59, "attribut": [2, 4, 10, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59], "author": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 64, 68], "author_email": [2, 10, 12, 13, 59, 61, 64, 68], "auto": [66, 68], "auto_cast_to_devic": 66, "autobuild": 1, "automat": [1, 2, 13, 59], "autoreset": 14, "auxiliari": 2, "avail": [7, 10, 12, 14, 58, 59, 61, 66], "averag": [2, 10, 66], "avg": 66, "avjmachin": 59, "avoid": [59, 66], "awai": 59, "ax": 66, "axi": [30, 42, 64, 66], "b": [1, 14, 58], "b64encod": 66, "back": [61, 64], "background": 59, "backpropag": 66, "backward": [66, 68], "badg": 59, "balanc": 68, "balisujohn": 59, "ball": [15, 30, 42, 54, 64], "bamboofungu": 59, "bar": 14, "base": [12, 14, 59, 64, 66], "base64": 66, "base_env": 66, "baselin": 15, "baselines3": [15, 68], "basi": 59, "basic": [59, 66], "batch": [66, 68], "batch_first": 68, "batch_siz": [66, 68], "becaus": [15, 16, 17, 18, 19, 20, 21, 42, 66], "been": [12, 42, 59], "befor": [2, 12, 61, 64, 66], "begin": [16, 17, 18, 19, 20, 68], "behav": 66, "behavior": [59, 64, 65, 66, 69], "behavioral_clon": 68, "behaviour": 66, "being": [2, 10, 13, 31, 32, 33, 34, 42, 43, 45, 47, 49], "bellman": 64, "bellow": 59, "belong": 5, "below": [14, 64, 66], "benchmark": [30, 66], "best": 66, "best_model": 68, "beta": [59, 66], "between": [10, 43, 45, 47, 49, 64], "bias": 64, "binari": 13, "bind": 64, "bit": [64, 66], "black": 59, "blob": [61, 64], "block": 66, "blue": 66, "board": 29, "bool": [2, 5, 7, 9, 10, 11, 59, 66], "boolean": 10, "both": [8, 13, 14, 61, 63], "bottom": 33, "bound": [13, 64, 66], "box": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 68], "break": [12, 59, 64, 68], "bucket": [12, 13, 58, 59], "buffer": [2, 3, 7, 8, 10, 12, 59], "bug": 59, "bugfix": 59, "build": [14, 59], "burner": 33, "c": [12, 16, 18, 32, 59], "cabinet": [31, 32, 34], "cach": [2, 12, 59, 66], "calcul": [10, 66], "call": [2, 5, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59], "callabl": [2, 7, 8, 10, 12, 59, 61], "callback": [2, 4, 5, 59, 63, 64], "can": [2, 4, 5, 7, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 66, 68], "capabl": 12, "captur": 66, "care": 61, "cart": 68, "cartesian": 13, "cartpol": [11, 12, 59, 68], "case": [12, 59, 64], "cd": [1, 12], "cell": [16, 18, 64], "cell_rowcol_to_xi": 64, "cell_to_st": 64, "cell_xy_to_rowcol": 64, "center": 14, "certain": [7, 12, 41], "cff": 59, "challeng": [15, 66], "chang": [1, 11, 59, 64], "changelog": 59, "characterist": [2, 64], "charg": 59, "charset": [13, 35, 36], "check": [12, 14, 59, 64], "checkpoint": 59, "choic": 66, "choos": [13, 61, 63], "chosen": 64, "ci": 59, "citat": 59, "class": [2, 3, 4, 5, 6, 7, 8, 9, 13, 59, 63, 64, 66, 68], "classic": [12, 64, 68], "classic_control": 12, "classif": 68, "clean": 61, "clear": 2, "clear_episode_buff": 59, "cli": [58, 59], "clip": 64, "clone": [1, 12, 14, 25, 29, 41, 54, 58, 59, 65, 66, 69], "close": [2, 32, 64, 66, 68], "cloud": [12, 13, 59], "cmmcirvin": 59, "code": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 65, 66, 68], "code_permalink": [2, 10, 12, 13, 61, 64, 68], "codelink": 59, "colab": 66, "collate_fn": 68, "collect": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 59, 61, 62, 65, 66], "collector": [2, 64], "collector_env": [59, 64], "collis": 64, "color": [14, 58], "com": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 59, 61, 64], "combin": [59, 64], "combine_dataset": [10, 12, 59], "combined_dataset": 10, "come": [13, 14], "command": [12, 14, 59, 68], "commit": 59, "common": [12, 13], "compar": [6, 63], "comparison": 10, "compat": [10, 12, 14, 59, 68], "compatible_minari_vers": 10, "complement": 2, "complet": [32, 33, 34, 59, 66], "complex": [15, 25, 29, 30, 41, 54, 59], "compli": 59, "compliant": [13, 59], "compon": 64, "component_1": 59, "component_2": 59, "compris": 12, "comput": [2, 10, 12, 13, 66], "compute_act": 64, "compute_reward_matrix": 64, "compute_transition_matrix": 64, "concaten": 66, "condit": [7, 12, 59, 66], "configur": [32, 59, 66], "confirm": [14, 66], "conflict": 66, "conjunct": 66, "consid": [8, 59, 64, 66], "consider": 59, "consist": [13, 42, 66], "constantli": 59, "construct": 64, "contact": [11, 12, 61, 68], "contain": [1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 47, 48, 49, 50, 51, 52, 53, 55, 59], "content": [13, 14], "continu": [10, 12, 13, 42, 43, 44, 45, 46, 47, 48, 49, 50, 64], "continuing_task": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 64], "contribut": [1, 12, 59, 64], "contributor": 59, "control": [12, 15, 42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 66, 68], "conveni": 66, "convent": 59, "convers": [59, 61], "convert": [2, 64, 66], "coordin": 64, "copi": [59, 66], "core": 61, "corl": 66, "corr": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "correct": [59, 64, 66], "correspond": [2, 10, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 64, 68], "could": [15, 66], "cover": 66, "coverag": 59, "cpu": 66, "creat": [2, 5, 7, 8, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59, 61, 63, 66, 68], "create_dataset": [2, 12, 59, 61, 63, 64, 68], "create_dataset_from_buff": [10, 12, 13, 59], "create_dataset_from_collector_env": 59, "create_namespac": 11, "creation": [2, 12, 13, 59], "credenti": 11, "cross": 68, "crossentropyloss": 68, "cuda": 66, "cumul": [64, 66], "curat": 59, "current": [5, 10, 12, 13, 14, 59, 64, 66], "current_cel": 64, "current_control_target_id": 64, "current_control_target_xi": 64, "current_st": 64, "custom": [2, 4, 12, 59, 62, 64, 65], "custom_space_seri": 61, "customstepdatacallback": 5, "customsubsetstepdatacallback": 63, "cython": 59, "d": [12, 66], "d4rl": [10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 62, 65, 66], "da": 64, "dampen": 64, "dapg": [14, 23, 24, 25, 27, 28, 29, 39, 40, 41, 52, 53, 54], "data": [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 29, 30, 32, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 58, 59, 61, 66, 68], "data_collector": 63, "data_format": [2, 8, 10, 59], "data_path": 8, "data_url": 66, "databas": [10, 11, 14], "databefor": 2, "dataclass": [8, 59], "datacollector": [4, 12, 13, 59, 61, 63, 64, 68], "datacollectorv0": 59, "dataload": [12, 59, 68], "datas": 8, "dataset": [2, 4, 5, 6, 7, 11, 15, 25, 29, 30, 32, 37, 41, 42, 54, 58, 59, 61, 63, 66], "dataset_cr": [59, 61, 64], "dataset_id": [2, 10, 11, 12, 13, 59, 61, 63, 64, 66, 68], "dataset_nam": [2, 10, 13, 14, 64], "dataset_s": 59, "dataset_v1": 59, "dataset_v2": 59, "dataset_v3": 59, "datasets_to_combin": [10, 59], "davei": [12, 16, 17, 18, 19, 20, 21], "de": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 51, 52, 53], "decent": 66, "decod": 66, "deep": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "def": [5, 61, 63, 64, 66, 68], "default": [2, 5, 7, 8, 10, 11, 12, 13, 66], "default_interaction_typ": 66, "defin": [13, 61, 63, 68], "definit": 59, "del": [61, 63], "deleg": 59, "delet": [61, 63], "delete_dataset": [10, 61, 63], "delete_namespac": 11, "demonstr": [22, 24, 25, 26, 28, 29, 31, 32, 38, 40, 41, 51, 53, 54, 66], "dens": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 42, 51, 52, 53, 59, 66], "depend": [12, 13, 59], "deprec": 59, "descent": 66, "describ": [11, 13, 59], "descript": [2, 10, 11, 13, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 56, 57, 59], "deseri": 61, "deserialize_custom_spac": 61, "deserialize_spac": 61, "design": 66, "desir": [32, 64], "desired_cel": 64, "desired_go": [16, 17, 18, 19, 20, 21, 31, 33, 34, 43, 44, 45, 46, 47, 48, 49, 50, 63, 64], "detail": 66, "detect": 59, "determin": 64, "determinist": [12, 64, 66], "develop": 59, "deviat": [13, 64], "devic": [14, 66], "dexter": [25, 29, 41, 54], "df8ff078652a": [15, 42, 64], "dict": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 16, 17, 18, 19, 20, 21, 31, 33, 34, 35, 36, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 63], "dict_kei": 63, "dictionari": [2, 3, 5, 7, 8, 9, 10, 12, 13, 59, 62, 64, 65, 66], "differ": [10, 12, 13, 42, 59, 61, 64, 66], "dimens": [66, 68], "dimension": [13, 25, 29, 41, 54], "dir": 59, "direct": [35, 36, 61, 66], "directli": [12, 59, 64, 66, 68], "directori": [2, 8, 11, 12, 66], "dirhtml": 1, "disabl": 2, "disable_env_check": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "discount": 64, "discret": [13, 35, 36, 59, 61, 64, 68], "disk": [8, 12, 13, 59, 61, 63, 68], "displai": [66, 68], "dist": 64, "distanc": [43, 45, 47, 49], "distribut": [25, 29, 41, 54, 66], "distribution_class": 66, "distribution_kwarg": 66, "divers": [12, 15], "divid": [12, 64], "do": [64, 66], "doc": [1, 59, 61, 64], "document": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "doe": 59, "doesn": [8, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59, 64], "dof": [15, 25, 29, 30, 41, 54, 66], "domain": [15, 25, 29, 30, 41, 42, 54], "don": [13, 59, 61, 63, 64], "done": [12, 64, 66, 68], "door": [10, 12, 13, 14, 22, 23, 24, 30, 32, 58, 59], "dormann": 15, "dot": [64, 66], "doubl": 66, "doubletofloat": 66, "down": 64, "download": [13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 65, 66, 68], "download_dataset": 10, "download_namespace_metadata": 11, "driven": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "dt": 64, "dtype": [59, 63, 64, 66], "due": [59, 64], "dump": 61, "dure": [12, 13, 59, 64, 66], "dynam": 64, "e": [1, 7, 10, 12, 59, 66], "e731": 61, "each": [2, 4, 5, 6, 8, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 63, 64, 66, 68], "earlier": 61, "edit": [2, 5], "effect": [25, 29, 41, 54], "effici": 59, "element": [6, 13], "elif": 64, "elimin": 64, "ell": 66, "elliottow": 59, "els": [12, 59, 64, 66], "email": [2, 10, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "embed": 66, "empti": [11, 61, 64], "emptyenv": 61, "enabl": 61, "encapsul": 13, "encount": 61, "encourag": [13, 59], "end": [13, 59], "enerrio": 59, "enhanc": 59, "ensur": 66, "entri": 64, "entropi": 68, "entry_point": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "env": [2, 5, 7, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 59, 61, 63, 64, 66, 68], "env_id": 66, "env_nam": [2, 10, 13], "env_spec": [8, 13], "envid": 2, "environ": [2, 5, 6, 7, 8, 9, 10, 13, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 58, 59, 61, 63, 64, 68], "environment_st": 5, "envspec": [2, 8, 10, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "eol": 59, "ep": 12, "episod": [2, 3, 4, 6, 7, 8, 10, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 66, 68], "episode_0": 59, "episode_1": 59, "episode_2": 59, "episode_id": [12, 59], "episode_indic": [7, 8, 12], "episode_metadata_callback": [2, 4], "episode_reward": 66, "episodebuff": [7, 8, 10], "episodedata": [7, 12, 59], "episodemetadatacallback": [2, 13, 59], "episodes_gener": 12, "epoch": 68, "epsiodedata": 8, "equal": [2, 10, 13], "equat": 64, "equiv": 66, "equlival": 64, "ernestu": 15, "error": [10, 59, 61, 64, 66], "essenti": 66, "estim": [2, 10, 66], "et": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64, 66], "etc": 66, "euclidean": [43, 45, 47, 49], "evad": 64, "eval_env": [2, 7, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "eval_env_spec": [12, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55], "eval_interv": 66, "eval_reward_log": 66, "eval_td": 66, "evalu": [2, 7, 10, 12, 59, 66, 68], "evaluate_polici": 66, "everi": [1, 10, 12, 13, 21, 64, 66], "everyth": 66, "exampl": [2, 10, 11, 12, 13, 14, 59, 61, 64, 65, 66], "example_env": 66, "except": [8, 59, 61, 66], "excit": 59, "execut": 68, "exerpt": 59, "exist": [8, 11, 14, 59, 63, 64], "exit": 14, "expect": 63, "expectil": 66, "experienc": 59, "experiment": 11, "expert": [2, 10, 12, 13, 14, 15, 22, 25, 26, 29, 36, 37, 38, 41, 51, 54, 56, 58, 59, 66, 68], "expert_dataset": 55, "expert_polici": [2, 10], "expertpolici": [36, 68], "explain": [59, 64], "explicit": [59, 66], "explicitli": 59, "explor": 59, "exploration_act": 64, "explorationtyp": 66, "exponenti": [43, 45, 47, 49], "export": [12, 59], "extend": [12, 63], "extra": [2, 4, 5, 59, 64], "extract": 66, "extrapol": 66, "f": [12, 14, 59, 61, 63, 66, 68], "f01e2c": 14, "f4bf75": 14, "facilit": [10, 12, 59], "factor": 64, "factori": 3, "fail": [16, 17, 18, 19, 20, 21, 59], "fals": [2, 7, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 61, 63, 64, 66, 68], "familiar": 66, "farama": [1, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 64, 66, 68], "favor": 59, "fc1": 68, "fc2": 68, "fc3": 68, "featur": [11, 12, 58, 59, 68], "fed000": 14, "few": 59, "ff00ff": [14, 58], "ffmpeg": 66, "field": [13, 59, 66], "fig": 66, "figsiz": 66, "figur": 66, "file": [2, 4, 11, 12, 13, 14, 58, 59, 63], "file_fold": 59, "filter": [7, 58, 59], "filter_dataset": [12, 59], "filter_episod": [7, 12, 59], "final": [6, 12, 15, 59, 61, 63, 64, 66], "final_scor": 66, "find": 63, "fine": [14, 23, 25, 27, 29, 39, 41, 52, 54, 55, 56], "first": [11, 12, 59, 61, 63, 64, 66], "fit": [63, 66], "fix": [21, 30, 42, 59, 66], "flag": [10, 59, 66], "flatten": 59, "flexibl": 12, "flip": [16, 17, 18, 19, 20, 21, 32], "float": [2, 8, 10, 13, 63, 66], "float32": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 64, 68], "float64": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 63, 66], "floppy_disk": 59, "folder": [1, 68], "follow": [2, 5, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 64, 66], "font": [14, 58], "forc": [10, 14, 30, 42, 64], "force_download": [10, 59], "form": [10, 13, 64], "format": [2, 8, 10, 12, 13, 59, 61], "formula": [10, 64], "forward": [11, 13, 66, 68], "found": [10, 13], "foundat": [1, 12, 14, 30, 55, 59, 61, 64], "four": 68, "fourroom": [30, 37], "fourroomsenv": [35, 36], "fp": 66, "frac": 10, "frame": 66, "framework": 66, "franka_kitchen": [31, 33, 34], "frankakitchen": [30, 31, 32, 33, 34, 59], "from": [2, 5, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 59, 61, 63, 64, 66, 68], "from_pixel": 66, "froze": 59, "fu": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "full": [4, 8, 12, 36, 37, 59, 66], "fulli": 59, "function": [7, 8, 10, 12, 13, 14, 35, 36, 42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 64, 66, 68], "fundament": [15, 42, 64], "futur": [11, 12, 59, 64], "g": [12, 21, 35, 36, 66], "gain": 64, "gamma": [64, 66], "gather": 66, "gcp": [12, 13, 58, 59], "gen_dataset_md": 59, "gener": [2, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 59, 61, 63, 64], "generate_path": 64, "get": [7, 8, 10, 12, 59, 61, 63, 64, 66, 68], "get_episod": 8, "get_episode_metadata": [8, 13], "get_namespace_metadata": 11, "get_next_st": 64, "get_normalized_scor": [2, 10, 59], "get_q_valu": 64, "get_siz": 8, "git": [1, 12], "github": [1, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 59, 61, 64], "give": [12, 13, 14, 64, 66], "given": [12, 13, 14], "gleav": 15, "global": [2, 13, 64], "global_target_id": 64, "global_target_xi": 64, "glr": 59, "gmail": [16, 17, 18, 19, 20, 21, 35, 36], "go": [1, 64], "goal": [15, 16, 17, 18, 19, 20, 21, 32, 36, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61, 63, 64, 66], "goal_cel": 64, "goe": [36, 37], "googl": [13, 59, 66], "gradient": 66, "grahamannett": 59, "greater": [12, 59], "green": [61, 66], "grid": 64, "gridworld": 37, "group": [2, 4, 10, 12, 13, 14, 30, 59, 64], "gt": 59, "guarante": 13, "gupta": 32, "gym": [2, 5, 7, 10, 12, 59, 61, 63, 64, 66, 68], "gymansium": 12, "gymenv": 66, "gymnaisum": 14, "gymnasium": [2, 5, 7, 8, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 59, 61, 63, 64, 66, 68], "gymnasium_robot": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "gynasium": 59, "h5py": 59, "ha": [12, 21, 42, 59, 64, 66], "hammer": [26, 27, 28, 30, 59], "hand": [13, 16, 18, 25, 29, 41, 54, 64, 66], "hand_dapg": [14, 25, 29, 30, 41, 54], "handl": [8, 12, 58], "hat": 66, "hausman": 32, "have": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 59, 61, 63, 64, 66, 68], "hdf5": [2, 4, 8, 13, 14, 58, 59, 63, 64], "help": [14, 59, 64], "helper": 66, "here": [66, 68], "hesit": 59, "hidden": 59, "hidden_s": 66, "hierarch": 12, "high": [25, 29, 41, 54, 59, 63, 64, 66], "higher": 64, "highli": 59, "hill": 15, "hood": 66, "horizon": 32, "host": [12, 14, 25, 29, 30, 32, 41, 54, 58], "how": [1, 2, 59, 61, 63, 64, 66, 68], "howev": [13, 42, 59, 61, 64, 66, 68], "howuhh": 59, "href": 14, "html": 66, "http": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 59, 61, 64, 68], "hub": 59, "human": [10, 12, 13, 14, 22, 25, 26, 29, 38, 41, 51, 54, 58, 59, 66, 68], "hyperparamet": 66, "hypothet": [2, 10], "i": [1, 2, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 32, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 61, 63, 66, 68], "id": [2, 3, 6, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 64, 68], "idea": 59, "identifi": [2, 10, 11, 13], "ignor": [59, 66], "im": 59, "imag": [35, 36, 61, 66], "imit": [22, 25, 26, 29, 32, 38, 41, 51, 54], "implement": [14, 15, 64, 66], "implicit": [65, 69], "implicitli": 66, "import": [2, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66], "import_bugfix": 59, "improv": [59, 66], "imshow": 66, "in_kei": 66, "includ": [6, 13, 31, 32, 34, 42, 59, 66], "incompat": 14, "incorrect": [8, 59], "increas": 6, "indic": [2, 7, 8, 10, 12, 59], "inf": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 63], "infer": 66, "influenc": [64, 66], "info": [2, 3, 5, 6, 9, 12, 13, 59, 64, 68], "inform": [1, 2, 5, 7, 13, 59, 64], "infos_dataset": 59, "infos_subgroup": 59, "init": 59, "initi": [2, 6, 7, 12, 13, 59, 61, 63, 64, 66, 68], "initialis": 66, "input": [5, 7, 12, 13, 66, 68], "input_dim": 68, "insid": 61, "inspir": 64, "instabl": 64, "instal": [1, 10, 14, 58, 59, 61, 66, 68], "instanc": [7, 59], "instanti": 14, "instead": [12, 13, 59, 64, 66], "instruct": 59, "int": [2, 3, 6, 7, 8, 10, 13, 59, 64], "int64": [59, 68], "int_": [7, 64], "integ": 13, "intend": 7, "interact": 32, "interest": 66, "interfac": 12, "intern": [12, 59], "introduc": [15, 25, 29, 41, 54, 59, 66], "invers": 66, "involv": [30, 42, 64], "ipynb": [61, 63, 64, 66, 68], "ipython": 66, "iql": 66, "iql_torchrl": 66, "iqlloss": 66, "is_avail": 66, "is_shar": 66, "isinst": 68, "isol": 59, "issu": [59, 66], "item": [2, 64, 66, 68], "iter": [7, 8, 12, 13, 15, 42, 64, 66], "iterate_episod": [7, 12, 59], "its": [10, 59, 61, 64, 66], "itself": 12, "j": 64, "jamartinh": 59, "josephcarrino": 59, "journal": 15, "json": [13, 14, 59, 61], "jupyt": [61, 63, 64, 65, 66, 68], "just": [12, 61, 66], "justin": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "k": 32, "k_": 64, "k_d": 64, "k_i": 64, "k_p": 64, "kabuki": 59, "kaixin96": 59, "kallinteri": [55, 56], "kanervisto": 15, "keep": [12, 59], "kei": [2, 5, 8, 10, 12, 14, 59, 63, 64, 66], "kept": 13, "kernel": 66, "kettl": [31, 32, 33, 34], "key_fil": 14, "key_path": 11, "kitchen": [30, 31, 33, 34, 59], "kitchenenv": [31, 33, 34], "kitsch": 59, "know": 64, "kostrikov": 66, "kumar": 32, "kwarg": [2, 5, 7, 11, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 63], "l": 66, "l2": 66, "l_": 66, "l_2": 66, "l_pi": 66, "l_q": 66, "l_v": 66, "lag": 66, "lambda": [7, 12, 59, 61, 64], "lambert": [15, 42, 64], "larg": [12, 15, 42, 59], "larger": [59, 64, 66], "largest": 59, "last": 59, "last_episode_id": 59, "later": [2, 10, 59, 66], "latest": [10, 14, 59, 64], "latest_vers": 10, "latter": [10, 13, 66], "layer": 66, "lazcano": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 51, 52, 53], "lazi": 66, "lazylinear": 66, "lead": [13, 16, 17, 18, 19, 20, 21, 64], "learn": [12, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 58, 59, 61, 63, 64, 65, 68, 69], "learnin": [15, 42, 64], "leav": 12, "left": [12, 64, 66], "leftarrow": [64, 66], "len": [64, 66], "length": [3, 68], "less": 64, "let": [61, 63, 64, 68], "level": 13, "levin": 32, "lib": 66, "librari": [12, 59, 61, 68], "light": [31, 32, 33, 34], "like": [11, 12, 14, 61, 66, 68], "limit": [64, 66], "linalg": 64, "line": [14, 63], "linear": 68, "link": [2, 10, 12, 13], "linux": 12, "list": [2, 3, 7, 8, 12, 13, 58, 59, 66, 68], "list_local_dataset": [10, 12, 59, 63], "list_local_namespac": 11, "list_remote_dataset": [10, 59], "list_remote_namespac": 11, "ll": [61, 63], "load": [2, 11, 13, 59, 61, 66, 68], "load_dataset": [2, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 68], "loc": 66, "local": [10, 13, 59, 61, 63, 66, 68], "local_dataset": 63, "locat": [12, 15, 16, 17, 18, 19, 20, 21, 30, 42, 43, 44, 45, 46, 47, 48, 49, 50, 64, 66], "log": [59, 66, 68], "long": [32, 64], "longer": 59, "look": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61], "loop": [12, 66, 68], "loos": 59, "lose": 12, "loss": 68, "loss_actor": 66, "loss_dict": 66, "loss_fn": 68, "loss_funct": 66, "loss_log": 66, "loss_modul": 66, "loss_qvalu": 66, "loss_valu": 66, "lost": 59, "low": [59, 63, 64, 66], "lower": 13, "lr": 66, "lynch": 32, "m_": 66, "machin": [13, 15], "maco": 12, "made": [1, 59], "mai": [11, 12, 64, 66], "main": [2, 7, 55, 59, 61, 64, 66], "main_data": [14, 58, 59], "major": 59, "make": [1, 2, 7, 12, 59, 61, 63, 64, 66, 68], "make_value_estim": 66, "manag": 59, "mandatori": [13, 59], "mani": 13, "manipul": [25, 29, 41, 54, 66], "manual_se": [66, 68], "map": [12, 16, 18, 64, 66], "map_length": 64, "map_width": 64, "margin": 66, "markdown": 59, "markovian": [15, 42], "master": 64, "match": 10, "mathbb": 66, "mathcal": 66, "matplotlib": 66, "matrix": 64, "max": [64, 66], "max_": [64, 66], "max_a": 66, "max_episode_step": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 64, 66], "max_step": 66, "maximilian": 15, "maximis": 66, "maximum": [2, 10, 13, 64, 66, 68], "maze": [16, 17, 18, 19, 20, 21, 30, 43, 44, 45, 46, 47, 48, 49, 50, 59, 64], "maze2d": [42, 64], "maze_map": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 64], "maze_solv": 64, "mb": [8, 12, 14, 58], "md": [1, 59], "mdp": [12, 59], "mean": [6, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 64, 66], "meant": [2, 59], "measur": [25, 29, 41, 54, 64], "medium": [12, 15, 42, 59], "memor": [15, 42], "memori": [2, 12, 59], "mention": [13, 59, 64, 68], "merg": 14, "messag": 14, "met": 7, "metadata": [2, 4, 7, 8, 10, 12, 14, 59, 63], "method": [12, 15, 42, 59, 61, 64, 66], "metric": 13, "mgoulao": 59, "microwav": [31, 32, 33, 34], "mimic": 15, "min": 66, "minari": [11, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 66, 68], "minari_autose": 2, "minari_data": 66, "minari_dataset": [59, 68], "minari_datasets_path": 13, "minari_remot": [12, 59], "minari_storag": 59, "minari_vers": [13, 59], "minaridataset": [2, 10, 12, 13, 59, 68], "minariexperiencereplai": 66, "minaristorag": [2, 7, 10, 13, 59], "minigrid": [30, 35, 36, 59, 61], "minim": 63, "minimis": 66, "minimum": [2, 10, 12, 13, 59], "minor": 59, "mirana": 63, "misc": 59, "miss": 59, "mission": [35, 36, 61], "mission_func": 61, "missionspac": [35, 36, 61], "missonspac": 61, "mix": [22, 25, 26, 29, 32, 38, 41, 51, 54, 59], "mlp": 66, "model": [55, 56], "modifi": [8, 12, 13, 59, 63], "modul": [61, 63, 64, 66, 68], "modulelist": 66, "moment": 13, "more": [1, 6, 12, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 64, 66], "more_dataset": 59, "moreov": [8, 13], "morpholog": 15, "most": [12, 14], "move": [12, 30, 32, 42, 54, 59, 64], "mp4": 66, "mujoco": [2, 10, 55, 64], "mujuco": [55, 56], "multi": 66, "multibinari": 13, "multidiscret": 13, "multipl": [10, 11, 12, 14, 59, 66], "must": [5, 7, 8, 10, 12, 13, 59, 66], "my": 12, "n": [7, 12, 13, 14, 64, 68], "n_episod": [7, 12], "n_step": [59, 64], "nail": 29, "name": [2, 10, 11, 12, 13, 14, 58, 59, 61, 68], "namespac": [2, 10, 59], "namespace_metadata": 13, "narrow": [25, 29, 41, 54], "nathan": [15, 42, 64], "navig": [15, 30, 37, 42], "ncol": 66, "ndarrai": [6, 7, 10, 13, 59], "necessari": 66, "need": [8, 12, 59, 61, 63, 64, 66, 68], "neg": [43, 45, 47, 49], "nest": [2, 5, 11, 13, 59], "net": 66, "network": [66, 68], "neural": 68, "never": [32, 33, 64, 66], "new": [2, 8, 10, 12, 16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 64, 66, 68], "new_dataset_id": [10, 59], "new_dataset_nam": 14, "newli": [10, 12, 66], "next": [9, 59, 64, 66, 68], "next_cel": 64, "next_episode_id": 59, "next_stat": 64, "nightli": 66, "nn": [66, 68], "no_grad": 66, "noah": 15, "nois": [43, 44, 45, 46, 47, 48, 49, 50, 59, 64], "non": [12, 13, 15, 42], "nondeterminist": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "none": [2, 3, 5, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 64], "nonetyp": 59, "noqa": 61, "norm": 64, "normal": [2, 66], "normalized_scor": 10, "normalparamextractor": 66, "note": [10, 11, 13, 16, 17, 18, 19, 20, 21, 63, 64, 66], "notebook": [61, 63, 64, 65, 66, 68], "notic": 12, "notimplementederror": 61, "now": [10, 12, 59, 61, 63, 64, 68], "np": [7, 10, 13, 59, 63, 64, 66, 68], "npt": 7, "nrow": 66, "num_act": 64, "num_cel": 66, "num_episod": [61, 63], "num_episodes_average_scor": [2, 10], "num_epoch": 68, "num_eval_episod": 66, "num_itr": 64, "num_stat": 64, "num_step": 2, "number": [2, 6, 7, 10, 12, 13, 14, 59], "numpi": [63, 64, 66, 68], "o": 68, "ob": [2, 5, 12, 59, 64, 68], "object": [7, 8, 9, 12, 25, 29, 32, 37, 41, 54, 59, 61, 66, 68], "observ": [2, 3, 5, 6, 8, 9, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 66, 68], "observation_spac": [2, 8, 10, 12, 13, 59, 61, 63, 68], "observation_space_subset": 63, "obstyp": [2, 10], "obtain": [22, 25, 26, 29, 38, 41, 51, 54, 64], "occur": [16, 17, 18, 19, 20, 21], "off": 14, "offici": 59, "offlin": [12, 13, 14, 58, 59, 64, 66, 68], "often": 64, "oibserv": 59, "omar": [35, 36], "omit": 63, "onc": [1, 12, 64, 66, 68], "one": [2, 6, 7, 8, 12, 25, 29, 41, 42, 54, 59, 66], "one_hot": 68, "onli": [10, 11, 12, 13, 42, 44, 46, 47, 48, 50, 59, 63, 66], "onlin": 66, "onto": 11, "open": [25, 32, 42, 59, 66], "opengl": 66, "optim": [64, 68], "option": [2, 3, 5, 7, 8, 10, 12, 13, 14, 59], "order": [12, 31, 32, 59, 63], "order_enforc": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "org": [11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 59, 61, 64, 68], "organ": 59, "orient": [5, 41, 63], "origin": [10, 12, 25, 29, 30, 32, 41, 42, 54, 59, 61, 66], "other": [7, 8, 10, 11, 12, 13, 14, 32, 34, 59, 63, 64, 66], "otherwis": [7, 12, 44, 46, 48, 50, 59], "our": [1, 12, 13, 59, 63, 64, 66, 68], "ourselv": 64, "out": [8, 12, 59, 61, 64, 66], "out_featur": 66, "out_kei": 66, "outlin": 63, "output": [8, 61, 63, 64, 66, 68], "output_dim": 68, "outsid": 66, "over": [2, 7, 10, 12, 64, 66], "overal": 66, "overconfid": 66, "overestim": 66, "overrid": [4, 5, 13, 14, 64], "overridden": [4, 5, 10, 59], "overridng": 64, "overshoot": 64, "overview": 66, "overwrit": 11, "own": [10, 12, 59, 64], "p_": 64, "packag": [1, 2, 10, 14, 59, 68], "pad": 68, "pad_sequ": 68, "page": 59, "page_facing_up": 59, "pair": [13, 66], "paper": [25, 29, 41, 54], "paramet": [2, 3, 4, 5, 7, 8, 10, 11, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 66, 68], "parameteris": 66, "part": 66, "partial": [32, 59], "particular": [61, 66], "pass": [2, 4, 7, 10, 12, 63, 66], "past": 59, "path": [8, 11, 12, 13, 14, 43, 44, 45, 46, 47, 48, 49, 50, 59, 64, 68], "path_str": 14, "pathlik": [7, 8], "pbar": 66, "pd": [42, 43, 44, 45, 46, 47, 48, 49, 50, 64], "pen": [14, 30, 38, 39, 40, 59], "per": [2, 59], "perceptron": 66, "perez": [43, 44, 45, 46, 47, 48, 49, 50, 64], "perform": [9, 10, 12, 14, 32, 33, 34, 64, 66, 68], "perimet": [42, 47, 48], "permalink": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "perman": 12, "pettingzoo": 59, "phi": 66, "pi": [64, 66], "pi_": 66, "pick": [16, 18], "pid": [59, 64], "pip": [1, 2, 10, 12, 13, 14, 58, 61, 66, 68], "pixel": 66, "pixels_onli": 66, "plai": [12, 15], "plan": [12, 59, 63], "planner": [15, 42], "platform": 13, "pleas": [11, 12, 59, 63], "plot": 66, "plt": 66, "plug": 66, "point": [7, 30, 59, 66], "point_maz": [43, 44, 45, 46, 47, 48, 49, 50], "point_maze_dataset": [59, 64], "pointmaz": [15, 30, 43, 44, 45, 46, 47, 48, 49, 50, 59, 62, 63, 65], "pointmaze_larg": [42, 44], "pointmaze_largedens": [42, 43], "pointmaze_medium": [42, 46, 64], "pointmaze_mediumdens": [42, 45], "pointmaze_open": [42, 48], "pointmaze_opendens": [42, 47], "pointmaze_umaz": [42, 50, 63], "pointmaze_umazedens": [42, 49], "pointmazeenv": [43, 44, 45, 46, 47, 48, 49, 50], "pointmazestepdatacallback": 64, "pole": 68, "polici": [2, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 29, 30, 32, 36, 37, 38, 39, 41, 42, 51, 52, 54, 55, 56, 64, 66], "policy_net": 68, "policynetwork": 68, "polyak": 66, "poorli": 66, "popul": 66, "popular": 58, "pose": [5, 64], "posit": [5, 32, 37, 54, 64, 66], "possibl": [13, 59], "ppo": 68, "pr": 59, "practic": 66, "pre": 59, "precis": 66, "precommit": 59, "predict": [64, 68], "prepend": 11, "preprint": 32, "prerequisit": 66, "present": [10, 15, 30, 68], "prevent": 12, "previou": [2, 12, 59], "previous": [15, 59, 64, 68], "principl": 30, "print": [12, 59, 61, 63, 66, 68], "prng": 2, "probabilisticactor": 66, "probabl": 64, "problem": 68, "proce": [14, 68], "procedur": 63, "process": [12, 59, 64, 66], "prod": 68, "produc": 59, "product": 13, "program": 64, "progress": 14, "project": [12, 59], "prompt": [12, 14], "properli": [61, 66], "properti": [7, 66], "proporti": 64, "protonmail": 55, "provid": [10, 12, 13, 14, 15, 16, 18, 22, 23, 24, 25, 26, 27, 28, 29, 30, 38, 39, 40, 41, 51, 52, 53, 54, 58, 59, 66], "pseudo": 59, "psi": 66, "public": [13, 59, 64], "publicli": 58, "pure": 59, "purpos": [12, 30, 42, 64, 66], "py": [55, 59, 61, 63, 64, 66, 68], "pyarrow": 59, "pypi": 59, "pyplot": 66, "pyright": 59, "pytest": 59, "python": [12, 58, 59, 61, 63, 64, 65, 66, 68], "python3": 66, "pytorch": [59, 65, 66, 69], "pytorchdataload": 59, "pyvirtualdisplai": 66, "pz": 59, "q": [64, 65, 69], "q_": 66, "q_fn": 64, "q_iter": 64, "q_net": 66, "q_valu": 64, "qiter": [15, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50, 64], "qpo": 64, "quadrup": [15, 30], "quantifi": 66, "queri": 66, "quick": 66, "quickli": 64, "quit": 66, "qvalu": 66, "qvel": 64, "r": [1, 21, 64, 66], "r_t": 66, "raffin": 15, "rais": [8, 10], "rajeswaran": [25, 29, 41, 54], "randn": 64, "random": [2, 7, 10, 12, 17, 19, 20, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61, 63, 64, 66, 68], "random_polici": [61, 63], "randomis": 66, "randomli": [12, 13, 42, 61, 64], "randompolici": 35, "rang": [2, 10, 12, 59, 61, 63, 64, 66, 68], "rate": [16, 17, 18, 19, 20, 21, 64], "rather": 66, "ratio": [22, 25, 26, 29, 38, 41, 51, 54], "rb": 66, "re": [59, 64], "reach": [15, 16, 17, 18, 19, 20, 21, 32, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 64], "read": [8, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 66], "readabl": 13, "readi": 59, "readm": 59, "real": 15, "reason": 64, "rebuild": 1, "receiv": 68, "recent": [12, 66], "recommend": 12, "record": [2, 12, 59, 63, 64], "record_info": [2, 12, 13, 64], "recov": [2, 7, 10, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 66], "recover_env": 59, "recover_environ": [2, 7, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 68], "recoveri": 59, "redtachyon": 59, "reduc": [59, 64], "ref": 10, "ref_max_scor": [2, 10], "ref_min_scor": [2, 10], "refactor": [59, 64], "refer": [2, 10, 59], "referenc": 59, "regener": 37, "regist": 61, "registr": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "registri": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "reinforc": [12, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 58, 64], "rel": 59, "relai": [30, 32], "releas": 11, "relev": [2, 10, 12], "reliabl": 15, "reloc": [30, 51, 52, 53, 59], "relu": [66, 68], "rememb": 66, "remot": [10, 11, 12, 13, 14, 58, 59], "remov": [12, 59], "remove_task_when_complet": [31, 33, 34], "renam": 59, "render": 66, "render_mod": 68, "reorgan": 59, "replac": [15, 30, 64], "replai": [12, 59], "replay_buff": 66, "repositori": [10, 13, 14, 23, 24, 25, 27, 28, 29, 30, 32, 39, 40, 41, 52, 53, 54], "repres": [13, 61, 66], "represent": 59, "reproduc": [2, 10, 12, 30, 37, 66, 68], "reproduct": [30, 59], "requir": [1, 2, 10, 12, 13, 14, 59, 61, 63, 64, 66, 68], "research": 15, "reset": [2, 12, 13, 16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 63, 64, 66, 68], "reset_target": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50], "resid": 11, "residu": 59, "respect": [10, 64, 66], "respond": 64, "respons": 12, "rest": 66, "restart": 66, "result": [10, 59, 61, 64], "results_video": 66, "retriev": [10, 12, 59], "return": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 44, 46, 48, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66, 68], "rew": [2, 5, 12, 59, 64, 68], "rew_matrix": 64, "reward": [3, 5, 6, 12, 13, 15, 16, 17, 18, 19, 20, 21, 25, 29, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 59, 66, 68], "reward_funct": 64, "reward_threshold": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "reward_typ": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "rewards_max": 13, "rewards_mean": 13, "rewards_min": 13, "rewards_std": 13, "rewards_sum": 13, "right": [59, 64, 66], "rl": [12, 14, 23, 25, 27, 29, 39, 41, 52, 54, 59, 66, 68], "rl_zoo3": [59, 68], "rm": 66, "rnd": 59, "rnn": 68, "robot": [14, 15, 25, 29, 30, 41, 54, 59, 63, 64, 66], "rodrigo": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 64], "rodrigodelazcano": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 59], "roll": 66, "rollout": 66, "root": [12, 13], "row": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "rperezvicent": [14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 64], "rugged": 59, "run": [12, 22, 25, 26, 29, 38, 41, 51, 54, 59, 66], "s_": 66, "s_t": 66, "sac": [15, 16, 17, 18, 19, 20, 21, 55], "safe": 59, "same": [2, 7, 10, 12, 13, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59, 64, 66], "sampl": [2, 7, 13, 35, 37, 58, 59, 61, 63, 66], "sample_episod": [7, 12, 13, 59], "sampled_episod": 13, "sampler": 66, "samplerwithoutreplac": 66, "save": [4, 13, 59, 61, 63, 64, 66, 68], "save_video": 66, "sb3": 55, "scale": 66, "scale_lb": 66, "scenario": 68, "schedul": [12, 59], "score": [2, 66], "script": [14, 30, 55, 66, 68], "second": [12, 59], "section": [13, 59, 66], "see": [13, 61, 66], "seed": [2, 3, 7, 10, 12, 13, 59, 61, 63, 64, 66, 68], "seen": 64, "select": [16, 17, 18, 19, 20, 25, 29, 41, 42, 54, 59, 64], "self": [2, 3, 4, 5, 7, 8, 63, 64, 68], "separ": 59, "sequenc": [32, 33, 34, 42], "sequenti": 66, "seri": [12, 64], "serial": [13, 59, 62, 65], "serializ": 13, "serialize_custom_spac": 61, "serialize_spac": 61, "serv": 12, "server": [10, 11, 12, 14, 58, 66], "servic": 59, "set": [2, 7, 10, 12, 13, 15, 16, 17, 18, 19, 20, 21, 59, 64, 66, 68], "set_descript": 66, "set_exploration_typ": 66, "set_se": [7, 12, 66], "set_titl": 66, "set_xlabel": 66, "setpoint": 64, "sever": 13, "shape": [15, 20, 21, 42, 49, 50, 59, 63, 64, 66, 68], "shard": 12, "share": [59, 66], "shift": [13, 66], "should": [2, 61, 63], "show": [12, 58, 59, 61, 63, 66], "shown": [14, 66], "shreyansjainn": 59, "shuffl": 68, "sim": 66, "similarli": [59, 66], "simpl": [12, 59, 64, 66, 68], "simplefilt": 66, "simpli": [61, 64], "sinc": [61, 64, 68], "singl": [3, 6, 9, 10, 12, 14, 59, 66], "size": [8, 10, 12, 14, 58, 59, 64, 66], "skip": [10, 66], "slash": [11, 13], "slice": [7, 8], "slide": [31, 32, 34], "slightli": 59, "slowli": [64, 66], "small": [59, 66], "smaller": [42, 59, 64], "snippet": 12, "so": [12, 13, 64, 66], "soft": 66, "softupd": 66, "solut": 64, "solv": [32, 64], "solver": 64, "some": [2, 8, 12, 14, 59, 61, 64, 66], "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 59, 61, 63, 64, 65, 66, 68], "space": [2, 8, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 62, 64, 65, 66, 68], "space_dict": 61, "spars": [15, 16, 17, 18, 19, 20, 21, 25, 29, 41, 42, 44, 46, 48, 50, 54], "spec": [2, 7, 10, 13, 14, 59, 61, 66], "specif": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 59, 63, 64, 66], "specifi": [2, 7, 8, 12, 13, 59, 66], "speed": [59, 64], "sphinx": 1, "sphinx_github_changelog_token": 59, "sphx": 59, "split": [42, 59], "split_dataset": [10, 12, 59], "split_traj": 66, "squar": 61, "src": 66, "stabil": 64, "stabl": 15, "stable_baselines3": 68, "stack": [6, 13, 59], "stand": [16, 17, 18, 19, 20, 21], "standard": [12, 59, 66], "start": [12, 13, 61, 63, 64, 66, 68], "state": [2, 32, 42, 64, 66], "state_action_valu": 66, "state_to_cel": 64, "state_valu": 66, "statist": 4, "steadi": 64, "step": [2, 3, 5, 6, 7, 8, 9, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 66, 68], "step_data": [3, 5, 63, 64], "step_data_callback": [2, 63, 64], "step_data_kei": 5, "stepdata": [3, 5], "stepdatacallback": [2, 13, 59, 62, 65], "stitch": 15, "storag": [8, 12, 13, 59], "store": [2, 8, 10, 12, 13, 59, 63, 66], "str": [2, 5, 8, 9, 10, 11, 13, 61], "straight": [36, 37], "strictli": 66, "string": [11, 13, 61], "stronger": 64, "structur": [11, 12, 59], "style": [2, 10, 13, 59, 66], "sub": [14, 59], "subcomponent_1": 59, "subcomponent_2": 59, "subdirectori": 13, "subgroup": [59, 64], "subplot": 66, "subsequ": 59, "subset": [59, 62, 65], "subtask": [31, 32, 33, 34], "subtrajectori": [32, 34], "succ": 64, "success": [16, 17, 18, 19, 20, 21, 64, 68], "successfulli": [14, 63], "sudo": 66, "suggest": 59, "sum": 66, "sum_": 64, "summari": 66, "super": [5, 63, 64, 68], "support": [2, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 64, 66], "supportsfloat": 2, "suppos": 12, "sure": [14, 59], "surrog": 13, "switch": [31, 32, 33, 34], "sy": 68, "syntax": [2, 10, 13], "system": 64, "t": [2, 8, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59, 61, 63, 64, 66], "tabl": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "tackl": 66, "take": [7, 13, 61, 64], "taken": [6, 8, 43, 44, 45, 46, 47, 48, 49, 50, 63], "tanh": 66, "tanh_loc": 66, "tanhnorm": 66, "target": [16, 17, 18, 19, 20, 21, 30, 31, 32, 33, 34, 42, 54, 64, 66], "target_net_updat": 66, "task": [10, 12, 15, 25, 29, 32, 34, 41, 43, 44, 45, 46, 47, 48, 49, 50, 54, 64, 66, 68], "tasks_to_complet": [31, 33, 34], "tau": [64, 66], "td": 66, "team": 11, "temperatur": 66, "templat": 59, "tempor": 66, "temporari": [2, 12, 59, 64], "tensor": [66, 68], "tensordict": 66, "tensordictmodul": 66, "termin": [2, 3, 5, 6, 7, 9, 12, 13, 16, 17, 18, 19, 20, 21, 42, 59, 61, 63, 64, 66, 68], "terminate_on_tasks_complet": [31, 33, 34], "test": [10, 11, 12, 15, 59, 63], "text": [13, 35, 36, 59, 64], "than": [10, 12, 16, 17, 18, 19, 20, 21, 59, 66], "thank": 59, "thei": [8, 13, 30, 59, 66], "them": [12, 13, 59, 68], "theme": 64, "theori": 64, "therefor": 66, "theta": 66, "thi": [1, 2, 4, 5, 6, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 59, 61, 63, 64, 66, 68], "thing": [59, 61], "think": 64, "thorough": 59, "those": 66, "thought": 59, "three": [25, 29, 41, 54, 64, 66], "through": [12, 13, 14, 58, 59, 64, 66], "thu": [42, 64], "tight_layout": 66, "time": [1, 2, 10, 64], "timestep": 59, "to_str": 61, "togeth": [10, 12, 14, 32, 33, 66], "tohsin": 59, "tomekst": 59, "tool": [14, 29, 59], "top": [13, 14], "torch": [66, 68], "torchrl": [65, 69], "total": [7, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 64, 66], "total_episod": [7, 8, 12, 13, 59, 68], "total_step": [7, 8, 12, 13, 59, 64], "total_timestep": 59, "touch": [11, 63], "toward": 64, "towardsdatasci": [15, 42, 64], "tqdm": [66, 68], "train": [15, 16, 17, 18, 19, 20, 21, 22, 25, 26, 29, 38, 41, 51, 54, 55, 56, 63], "trainer": 66, "trajectori": [14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 29, 39, 41, 42, 52, 54, 58, 59, 64], "transform": 66, "transformedenv": 66, "transit": [5, 59, 64, 66], "transition_matrix": 64, "tree": 55, "tri": 66, "true": [2, 7, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 64, 66, 68], "truncat": [2, 3, 5, 6, 9, 12, 13, 42, 59, 61, 63, 64, 66, 68], "try": [61, 66], "tune": [14, 23, 25, 27, 29, 39, 41, 52, 54, 55, 56, 64, 66], "tupl": [2, 3, 13, 59, 64, 66], "tutori": [59, 61, 63, 64, 66, 68], "tutorials_jupyt": 65, "tutorials_python": 65, "two": [10, 12, 13, 14, 25, 29, 41, 42, 54, 59, 66, 68], "txt": 1, "type": [2, 12, 13, 25, 29, 41, 54, 59, 61, 66, 68], "typer": 14, "typic": 64, "typing_extens": 59, "typo": 59, "u": [14, 15, 20, 21, 42, 49, 50, 59, 66, 68], "uint8": [35, 36, 61, 66], "umaz": [15, 42, 59, 64], "under": [10, 13, 42, 59, 66], "undiscount": [10, 13], "unflatten": 59, "unifi": 59, "uniform": 64, "union": [7, 61], "uniqu": 61, "unknown": 59, "unless": 2, "unlik": 66, "until": [12, 43, 44, 45, 46, 47, 48, 49, 50], "up": [12, 16, 17, 18, 19, 20, 21, 59, 61, 63, 64, 66, 68], "updat": [2, 8, 12, 59, 64, 66], "update_dataset_from_buff": 7, "update_dataset_from_collector_env": 59, "update_episod": 8, "update_episode_metadata": 8, "update_from_storag": 8, "update_metadata": 8, "upgrad": 66, "upload": 59, "upload_namespac": 11, "upon": 15, "upper": 13, "us": [2, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66, 68], "usag": [14, 59], "user": [2, 12, 13, 59], "usual": 66, "util": [10, 12, 58, 66, 68], "v": [2, 10, 13, 14, 32, 66], "v0": [10, 11, 12, 13, 35, 36, 37, 55, 56, 61, 63, 64, 68], "v1": [10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 39, 40, 41, 51, 52, 53, 54, 59, 66, 68], "v1_1": 68, "v2": [12, 13, 14, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 66], "v3": [42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 63, 64], "v4": [15, 16, 17, 18, 19, 20, 21], "v5": [55, 56], "v_": [64, 66], "v_fn": 64, "valid": [10, 55, 56, 63, 64, 66], "valu": [2, 5, 6, 8, 9, 10, 12, 13, 44, 46, 48, 50, 59, 64, 66], "value_net": 66, "value_network": 66, "valueerror": 8, "valueoper": 66, "vari": [61, 66, 68], "variabl": [12, 13, 59, 64], "varianc": [43, 44, 45, 46, 47, 48, 49, 50, 64], "variat": 64, "varieti": 12, "variou": [32, 33, 61], "ve": 64, "vector_entry_point": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "veloc": [5, 42, 64], "veri": 12, "version": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 63, 64], "via": [32, 66], "vicent": [43, 44, 45, 46, 47, 48, 49, 50, 64], "video": 66, "video_fold": 66, "viewer_env": 66, "virtual": 66, "virtual_displai": 66, "visibl": 66, "visual": 68, "visualis": 66, "vol": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "wa": [2, 7, 10, 13, 15, 25, 29, 35, 36, 37, 41, 54, 59, 61], "wai": [12, 64, 66], "wall": [42, 47, 48, 64], "want": [7, 12, 14, 64], "wapoint": 64, "warn": [14, 59, 66], "waypoint": [15, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50], "waypoint_control": 64, "waypoint_target": 64, "waypoint_threshold": 64, "waypointcontrol": 64, "wd": 59, "we": [12, 13, 30, 37, 59, 61, 63, 64, 66, 68], "weight": 66, "well": [12, 13, 14, 58, 59, 64, 66], "were": [10, 12, 14, 25, 29, 30, 32, 41, 42, 54, 59], "what": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 64], "when": [7, 12, 13, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 63, 64, 66], "where": [2, 8, 10, 13, 32, 34, 59, 64, 66], "whether": 11, "which": [2, 7, 8, 10, 12, 13, 15, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 63, 64, 66, 68], "while": [12, 59, 61, 63, 64, 66, 68], "who": 66, "whose": 66, "willdudlei": 59, "window": 59, "within": [7, 59, 66], "without": [43, 44, 45, 46, 47, 48, 49, 50, 59], "won": [12, 64], "work": [2, 12, 14, 59, 66], "workflow": 59, "world": 15, "worri": 61, "would": [11, 13, 14, 63, 64], "wrap": [2, 12, 59, 64, 66], "wrapper": [2, 4, 12, 13, 59, 61, 64, 66, 68], "write": [8, 66], "written": 66, "x": [7, 30, 42, 64, 68], "xvfb": 66, "xy": 64, "y": [14, 30, 42, 64, 66], "yml": 59, "you": [7, 8, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66, 68], "youni": [35, 36], "younik": 59, "younis98": 36, "your": [12, 14, 59, 68], "zero": 64, "zero_grad": [66, 68], "zip": 65, "zoo": 68, "\u898b\u7fd2\u3044": 58}, "titles": ["404 - Page Not Found", "Minari documentation", "DataCollector", "EpisodeBuffer", "EpisodeMetadataCallback", "StepDataCallback", "EpisodeData", "MinariDataset", "MinariStorage", "StepData", "Minari", "Namespace", "Basic Usage", "Dataset Standards", "Minari CLI", "Ant Maze", "Large-Diverse", "Large-Play", "Medium-Diverse", "Medium-Play", "Umaze-Diverse", "Umaze", "Cloned", "Expert", "Human", "Door", "Cloned", "Expert", "Human", "Hammer", "D4RL", "Complete", "Kitchen", "Mixed", "Partial", "Fourrooms-Random", "Fourrooms", "MiniGrid", "Cloned", "Expert", "Human", "Pen", "Point Maze", "Large-Dense", "Large", "Medium-Dense", "Medium", "Open-Dense", "Open", "Umaze-Dense", "Umaze", "Cloned", "Expert", "Human", "Relocate", "Expert", "Mujoco/ant", "MuJoCo", "<no title>", "Release Notes", "Dataset Creation", "Serializing a custom space", "Dataset Creation", "Collecting a subset of a dictionary space with StepDataCallback", "PointMaze D4RL dataset", "Tutorials", "Implicit Q-Learning with TorchRL", "Using Datasets", "Behavioral cloning with PyTorch", "Using Datasets"], "titleterms": {"0": 59, "1": [59, 64], "2": [59, 64], "3": [59, 64], "4": 59, "404": 0, "5": 59, "For": 66, "Not": 0, "The": [0, 66], "action": 13, "adroit": 66, "ant": [15, 56], "attribut": [3, 6, 7, 8, 9], "basic": 12, "behavior": 68, "buffer": 66, "build": [1, 66], "checkpoint": 12, "cli": 14, "clone": [22, 26, 38, 51, 68], "collect": [12, 63, 64], "combin": [10, 12, 14], "complet": 31, "content": [15, 25, 29, 30, 32, 37, 41, 42, 54, 56, 57], "control": 64, "could": 0, "creat": [10, 11, 12, 64], "creation": [60, 62, 65], "custom": 61, "d": 64, "d4rl": [30, 64], "data": [12, 64], "data_collector": 3, "datacollector": 2, "dataset": [8, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 60, 62, 64, 65, 67, 68, 69], "defin": 66, "delet": [10, 11, 14], "dens": [43, 45, 47, 49], "deriv": 64, "descript": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "detail": 14, "dictionari": 63, "directori": 13, "divers": [16, 18, 20], "document": 1, "door": 25, "download": [10, 11, 12, 14], "environ": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 66], "episod": 12, "episodebuff": 3, "episodedata": [6, 13], "episodemetadatacallback": 4, "evalu": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "expert": [23, 27, 39, 52, 55], "filter": 12, "found": 0, "fourroom": [35, 36], "gener": 68, "get": 11, "hammer": 29, "headless": 66, "human": [24, 28, 40, 53], "i": 64, "implicit": 66, "import": 68, "instal": 12, "integr": 64, "kitchen": 32, "larg": [16, 17, 43, 44], "learn": 66, "list": [10, 11, 14], "load": [10, 12], "local": [11, 12, 14], "loss": 66, "maze": [15, 42], "medium": [18, 19, 45, 46], "metadata": [11, 13], "method": [2, 3, 4, 5, 7, 8], "minari": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 64], "minari_storag": 8, "minaridataset": 7, "minaristorag": 8, "minigrid": 37, "mix": 33, "model": 66, "modifi": 64, "mujoco": [56, 57], "namespac": [11, 12, 13], "normal": 10, "note": 59, "observ": 13, "open": [47, 48], "optim": 66, "p": 64, "page": 0, "partial": 34, "pen": [41, 66], "plai": [17, 19], "planner": 64, "point": 42, "pointmaz": 64, "polici": 68, "pre": 66, "proport": 64, "pytorch": 68, "q": 66, "random": 35, "recov": 12, "refer": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "releas": 59, "reloc": 54, "replai": 66, "request": 0, "requisit": 66, "result": 66, "sampl": 12, "save": 12, "score": 10, "serial": 61, "show": 14, "space": [13, 61, 63], "spec": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "split": [10, 12], "standard": 13, "stepdata": 9, "stepdatacallback": [5, 63, 64], "structur": 13, "subset": 63, "support": 13, "term": 64, "torchrl": 66, "train": [66, 68], "tutori": 65, "umaz": [20, 21, 49, 50], "updat": 11, "upload": [11, 14], "us": [12, 65, 67, 69], "usag": 12, "v0": 59, "waypoint": 64}})
\ No newline at end of file
+Search.setIndex({"alltitles": {"0.1.0": [[59, "release-0-1-0"]], "0.2.2": [[59, "release-0-2-2"]], "1. Proportional Term (P)": [[64, "proportional-term-p"]], "2. Derivative Term (D)": [[64, "derivative-term-d"]], "3. Integral Term (I)": [[64, "integral-term-i"]], "404 - Page Not Found": [[0, null]], "Ant Maze": [[15, null]], "Attributes": [[3, "attributes"], [6, "attributes"], [7, "attributes"], [8, "attributes"], [9, "attributes"]], "Basic Usage": [[12, null]], "Behavioral cloning with PyTorch": [[68, null], [68, "id1"]], "Build the Documentation": [[1, "build-the-documentation"]], "Building a replay buffer": [[66, "building-a-replay-buffer"]], "Checkpoint Minari Dataset": [[12, "checkpoint-minari-dataset"]], "Cloned": [[22, null], [26, null], [38, null], [51, null]], "Collect Data and Create Minari Dataset": [[64, "collect-data-and-create-minari-dataset"]], "Collecting Data": [[12, "collecting-data"]], "Collecting a subset of a dictionary space with StepDataCallback": [[63, null]], "Combine Minari Datasets": [[10, "combine-minari-datasets"], [12, "combine-minari-datasets"]], "Combine datasets": [[14, "combine-datasets"]], "Complete": [[31, null]], "Content": [[15, "content"], [25, "content"], [29, "content"], [30, "content"], [32, "content"], [37, "content"], [41, "content"], [42, "content"], [54, "content"], [56, "content"], [57, "content"]], "Create Minari Dataset": [[10, "create-minari-dataset"], [12, "create-minari-dataset"]], "Create Namespace": [[11, "create-namespace"]], "D4RL": [[30, null]], "DataCollector": [[2, null]], "Dataset Creation": [[60, null], [62, null], [65, "dataset-creation"]], "Dataset Metadata": [[13, "dataset-metadata"]], "Dataset Specs": [[16, "dataset-specs"], [17, "dataset-specs"], [18, "dataset-specs"], [19, "dataset-specs"], [20, "dataset-specs"], [21, "dataset-specs"], [22, "dataset-specs"], [23, "dataset-specs"], [24, "dataset-specs"], [26, "dataset-specs"], [27, "dataset-specs"], [28, "dataset-specs"], [31, "dataset-specs"], [33, "dataset-specs"], [34, "dataset-specs"], [35, "dataset-specs"], [36, "dataset-specs"], [38, "dataset-specs"], [39, "dataset-specs"], [40, "dataset-specs"], [43, "dataset-specs"], [44, "dataset-specs"], [45, "dataset-specs"], [46, "dataset-specs"], [47, "dataset-specs"], [48, "dataset-specs"], [49, "dataset-specs"], [50, "dataset-specs"], [51, "dataset-specs"], [52, "dataset-specs"], [53, "dataset-specs"], [55, "dataset-specs"]], "Dataset Standards": [[13, null]], "Dataset generation": [[68, "dataset-generation"]], "Defining the model": [[66, "defining-the-model"]], "Delete Minari Datasets": [[10, "delete-minari-datasets"]], "Delete Namespace": [[11, "delete-namespace"]], "Delete local datasets": [[14, "delete-local-datasets"]], "Description": [[16, "description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [21, "description"], [22, "description"], [23, "description"], [24, "description"], [26, "description"], [27, "description"], [28, "description"], [31, "description"], [33, "description"], [34, "description"], [35, "description"], [36, "description"], [38, "description"], [39, "description"], [40, "description"], [43, "description"], [44, "description"], [45, "description"], [46, "description"], [47, "description"], [48, "description"], [49, "description"], [50, "description"], [51, "description"], [52, "description"], [53, "description"], [55, "description"]], "Door": [[25, null]], "Download Datasets": [[12, "download-datasets"]], "Download Minari Dataset": [[10, "download-minari-dataset"]], "Download Namespace Metadata": [[11, "download-namespace-metadata"]], "Download datasets": [[14, "download-datasets"]], "Environment Specs": [[16, "environment-specs"], [17, "environment-specs"], [18, "environment-specs"], [19, "environment-specs"], [20, "environment-specs"], [21, "environment-specs"], [22, "environment-specs"], [23, "environment-specs"], [24, "environment-specs"], [26, "environment-specs"], [27, "environment-specs"], [28, "environment-specs"], [31, "environment-specs"], [33, "environment-specs"], [34, "environment-specs"], [35, "environment-specs"], [36, "environment-specs"], [38, "environment-specs"], [39, "environment-specs"], [40, "environment-specs"], [43, "environment-specs"], [44, "environment-specs"], [45, "environment-specs"], [46, "environment-specs"], [47, "environment-specs"], [48, "environment-specs"], [49, "environment-specs"], [50, "environment-specs"], [51, "environment-specs"], [52, "environment-specs"], [53, "environment-specs"], [55, "environment-specs"]], "EpisodeBuffer": [[3, null]], "EpisodeData": [[6, null]], "EpisodeData Structure": [[13, "episodedata-structure"]], "EpisodeMetadataCallback": [[4, null]], "Evaluation Environment Specs": [[16, "evaluation-environment-specs"], [17, "evaluation-environment-specs"], [18, "evaluation-environment-specs"], [19, "evaluation-environment-specs"], [20, "evaluation-environment-specs"], [21, "evaluation-environment-specs"], [22, "evaluation-environment-specs"], [23, "evaluation-environment-specs"], [24, "evaluation-environment-specs"], [26, "evaluation-environment-specs"], [27, "evaluation-environment-specs"], [28, "evaluation-environment-specs"], [31, "evaluation-environment-specs"], [33, "evaluation-environment-specs"], [34, "evaluation-environment-specs"], [35, "evaluation-environment-specs"], [36, "evaluation-environment-specs"], [38, "evaluation-environment-specs"], [39, "evaluation-environment-specs"], [40, "evaluation-environment-specs"], [43, "evaluation-environment-specs"], [44, "evaluation-environment-specs"], [45, "evaluation-environment-specs"], [46, "evaluation-environment-specs"], [47, "evaluation-environment-specs"], [48, "evaluation-environment-specs"], [49, "evaluation-environment-specs"], [50, "evaluation-environment-specs"], [51, "evaluation-environment-specs"], [52, "evaluation-environment-specs"], [53, "evaluation-environment-specs"], [55, "evaluation-environment-specs"]], "Expert": [[23, null], [27, null], [39, null], [52, null], [55, null]], "Filter Episodes": [[12, "filter-episodes"]], "For headless environments": [[66, "for-headless-environments"]], "Fourrooms": [[36, null]], "Fourrooms-Random": [[35, null]], "Get Local Namespace Metadata": [[11, "get-local-namespace-metadata"]], "Hammer": [[29, null]], "Human": [[24, null], [28, null], [40, null], [53, null]], "Implicit Q-Learning": [[66, "implicit-q-learning"]], "Implicit Q-Learning with TorchRL": [[66, null]], "Imports": [[68, "imports"]], "Installation": [[12, "installation"]], "Kitchen": [[32, null]], "Large": [[44, null]], "Large-Dense": [[43, null]], "Large-Diverse": [[16, null]], "Large-Play": [[17, null]], "List Minari Datasets": [[10, "list-minari-datasets"]], "List Namespaces": [[11, "list-namespaces"]], "List datasets": [[14, "list-datasets"]], "Load Local Datasets": [[12, "load-local-datasets"]], "Load Minari Dataset": [[10, "load-minari-dataset"]], "Loss and optimizer": [[66, "loss-and-optimizer"]], "Medium": [[46, null]], "Medium-Dense": [[45, null]], "Medium-Diverse": [[18, null]], "Medium-Play": [[19, null]], "Methods": [[2, "methods"], [3, "methods"], [4, "methods"], [5, "methods"], [7, "methods"], [8, "methods"]], "Minari": [[10, null]], "Minari CLI": [[14, null]], "Minari Dataset Directory": [[13, "minari-dataset-directory"]], "Minari documentation": [[1, null]], "MinariDataset": [[7, null]], "MinariStorage": [[8, null]], "MiniGrid": [[37, null]], "Mixed": [[33, null]], "Modified StepDataCallback": [[64, "modified-stepdatacallback"]], "MuJoCo": [[57, null]], "Mujoco/ant": [[56, null]], "Namespace": [[11, null]], "Namespace metadata": [[13, "namespace-metadata"]], "Normalize Score": [[10, "normalize-score"]], "Observation and Action Spaces": [[13, "observation-and-action-spaces"]], "Open": [[48, null]], "Open-Dense": [[47, null]], "Partial": [[34, null]], "Pen": [[41, null]], "Point Maze": [[42, null]], "PointMaze D4RL dataset": [[64, null]], "Policy training": [[68, "policy-training"]], "Pre-requisites": [[66, "pre-requisites"]], "Recover Environment": [[12, "recover-environment"]], "References": [[15, "references"], [25, "references"], [29, "references"], [30, "references"], [32, "references"], [37, "references"], [41, "references"], [42, "references"], [54, "references"], [64, "references"]], "Release Notes": [[59, null]], "Relocate": [[54, null]], "Results": [[66, "results"]], "Sampling Episodes": [[12, "sampling-episodes"]], "Save Dataset": [[12, "save-dataset"]], "Serializing a custom space": [[61, null]], "Show datasets details": [[14, "show-datasets-details"]], "Split Dataset": [[12, "split-dataset"]], "Split Minari Dataset": [[10, "split-minari-dataset"]], "StepData": [[9, null]], "StepDataCallback": [[5, null]], "Supported Spaces": [[13, "supported-spaces"]], "The Adroit Pen environment": [[66, "the-adroit-pen-environment"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Training": [[66, "training"]], "Tutorials": [[65, null]], "Umaze": [[21, null], [50, null]], "Umaze-Dense": [[49, null]], "Umaze-Diverse": [[20, null]], "Update Namespace": [[11, "update-namespace"]], "Upload Namespace": [[11, "upload-namespace"]], "Upload datasets": [[14, "upload-datasets"]], "Using Datasets": [[65, "using-datasets"], [67, null], [69, null]], "Using Minari Datasets": [[12, "using-minari-datasets"]], "Using Namespaces": [[12, "using-namespaces"]], "WayPoint Planner": [[64, "waypoint-planner"]], "Waypoint Controller": [[64, "waypoint-controller"]], "minari.DataCollector": [[2, "minari-datacollector"]], "minari.EpisodeData": [[6, "minari-episodedata"]], "minari.EpisodeMetadataCallback": [[4, "minari-episodemetadatacallback"]], "minari.MinariDataset": [[7, "minari-minaridataset"]], "minari.StepData": [[9, "minari-stepdata"]], "minari.StepDataCallback": [[5, "minari-stepdatacallback"]], "minari.data_collector.EpisodeBuffer": [[3, "minari-data-collector-episodebuffer"]], "minari.dataset.minari_storage.MinariStorage": [[8, "minari-dataset-minari-storage-minaristorage"]], "v0.3.0": [[59, "release-v0-3-0"]], "v0.3.1": [[59, "release-v0-3-1"]], "v0.4.0": [[59, "release-v0-4-0"]], "v0.4.1": [[59, "release-v0-4-1"]], "v0.4.2": [[59, "release-v0-4-2"]], "v0.4.3": [[59, "release-v0-4-3"]], "v0.5.0": [[59, "release-v0-5-0"]], "v0.5.1": [[59, "release-v0-5-1"]]}, "docnames": ["404", "README", "api/data_collector", "api/data_collector/episode_buffer", "api/data_collector/episode_metadata_callback", "api/data_collector/step_data_callback", "api/minari_dataset/episode_data", "api/minari_dataset/minari_dataset", "api/minari_dataset/minari_storage", "api/minari_dataset/step_data", "api/minari_functions", "api/namespace/namespace", "content/basic_usage", "content/dataset_standards", "content/minari_cli", "datasets/D4RL/antmaze/index", "datasets/D4RL/antmaze/large-diverse-v1", "datasets/D4RL/antmaze/large-play-v1", "datasets/D4RL/antmaze/medium-diverse-v1", "datasets/D4RL/antmaze/medium-play-v1", "datasets/D4RL/antmaze/umaze-diverse-v1", "datasets/D4RL/antmaze/umaze-v1", "datasets/D4RL/door/cloned-v2", "datasets/D4RL/door/expert-v2", "datasets/D4RL/door/human-v2", "datasets/D4RL/door/index", "datasets/D4RL/hammer/cloned-v2", "datasets/D4RL/hammer/expert-v2", "datasets/D4RL/hammer/human-v2", "datasets/D4RL/hammer/index", "datasets/D4RL/index", "datasets/D4RL/kitchen/complete-v2", "datasets/D4RL/kitchen/index", "datasets/D4RL/kitchen/mixed-v2", "datasets/D4RL/kitchen/partial-v2", "datasets/D4RL/minigrid/fourrooms-random-v0", "datasets/D4RL/minigrid/fourrooms-v0", "datasets/D4RL/minigrid/index", "datasets/D4RL/pen/cloned-v2", "datasets/D4RL/pen/expert-v2", "datasets/D4RL/pen/human-v2", "datasets/D4RL/pen/index", "datasets/D4RL/pointmaze/index", "datasets/D4RL/pointmaze/large-dense-v2", "datasets/D4RL/pointmaze/large-v2", "datasets/D4RL/pointmaze/medium-dense-v2", "datasets/D4RL/pointmaze/medium-v2", "datasets/D4RL/pointmaze/open-dense-v2", "datasets/D4RL/pointmaze/open-v2", "datasets/D4RL/pointmaze/umaze-dense-v2", "datasets/D4RL/pointmaze/umaze-v2", "datasets/D4RL/relocate/cloned-v2", "datasets/D4RL/relocate/expert-v2", "datasets/D4RL/relocate/human-v2", "datasets/D4RL/relocate/index", "datasets/mujoco/ant/expert-v0", "datasets/mujoco/ant/index", "datasets/mujoco/index", "index", "release_notes/index", "tutorials/dataset_creation/README", "tutorials/dataset_creation/custom_space_serialization", "tutorials/dataset_creation/index", "tutorials/dataset_creation/observation_space_subseting", "tutorials/dataset_creation/point_maze_dataset", "tutorials/index", "tutorials/using_datasets/IQL_torchrl", "tutorials/using_datasets/README", "tutorials/using_datasets/behavioral_cloning", "tutorials/using_datasets/index"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/data_collector.md", "api/data_collector/episode_buffer.md", "api/data_collector/episode_metadata_callback.md", "api/data_collector/step_data_callback.md", "api/minari_dataset/episode_data.md", "api/minari_dataset/minari_dataset.md", "api/minari_dataset/minari_storage.md", "api/minari_dataset/step_data.md", "api/minari_functions.md", "api/namespace/namespace.md", "content/basic_usage.md", "content/dataset_standards.md", "content/minari_cli.md", "datasets/D4RL/antmaze/index.md", "datasets/D4RL/antmaze/large-diverse-v1.md", "datasets/D4RL/antmaze/large-play-v1.md", "datasets/D4RL/antmaze/medium-diverse-v1.md", "datasets/D4RL/antmaze/medium-play-v1.md", "datasets/D4RL/antmaze/umaze-diverse-v1.md", "datasets/D4RL/antmaze/umaze-v1.md", "datasets/D4RL/door/cloned-v2.md", "datasets/D4RL/door/expert-v2.md", "datasets/D4RL/door/human-v2.md", "datasets/D4RL/door/index.md", "datasets/D4RL/hammer/cloned-v2.md", "datasets/D4RL/hammer/expert-v2.md", "datasets/D4RL/hammer/human-v2.md", "datasets/D4RL/hammer/index.md", "datasets/D4RL/index.md", "datasets/D4RL/kitchen/complete-v2.md", "datasets/D4RL/kitchen/index.md", "datasets/D4RL/kitchen/mixed-v2.md", "datasets/D4RL/kitchen/partial-v2.md", "datasets/D4RL/minigrid/fourrooms-random-v0.md", "datasets/D4RL/minigrid/fourrooms-v0.md", "datasets/D4RL/minigrid/index.md", "datasets/D4RL/pen/cloned-v2.md", "datasets/D4RL/pen/expert-v2.md", "datasets/D4RL/pen/human-v2.md", "datasets/D4RL/pen/index.md", "datasets/D4RL/pointmaze/index.md", "datasets/D4RL/pointmaze/large-dense-v2.md", "datasets/D4RL/pointmaze/large-v2.md", "datasets/D4RL/pointmaze/medium-dense-v2.md", "datasets/D4RL/pointmaze/medium-v2.md", "datasets/D4RL/pointmaze/open-dense-v2.md", "datasets/D4RL/pointmaze/open-v2.md", "datasets/D4RL/pointmaze/umaze-dense-v2.md", "datasets/D4RL/pointmaze/umaze-v2.md", "datasets/D4RL/relocate/cloned-v2.md", "datasets/D4RL/relocate/expert-v2.md", "datasets/D4RL/relocate/human-v2.md", "datasets/D4RL/relocate/index.md", "datasets/mujoco/ant/expert-v0.md", "datasets/mujoco/ant/index.md", "datasets/mujoco/index.md", "index.md", "release_notes/index.md", "tutorials/dataset_creation/README.rst", "tutorials/dataset_creation/custom_space_serialization.rst", "tutorials/dataset_creation/index.rst", "tutorials/dataset_creation/observation_space_subseting.rst", "tutorials/dataset_creation/point_maze_dataset.rst", "tutorials/index.rst", "tutorials/using_datasets/IQL_torchrl.rst", "tutorials/using_datasets/README.rst", "tutorials/using_datasets/behavioral_cloning.rst", "tutorials/using_datasets/index.rst"], "indexentries": {"__call__() (in module minari.episodemetadatacallback)": [[4, "minari.EpisodeMetadataCallback.__call__", false]], "__call__() (in module minari.stepdatacallback)": [[5, "minari.StepDataCallback.__call__", false]], "__len__() (in module minari.data_collector.episodebuffer)": [[3, "minari.data_collector.EpisodeBuffer.__len__", false]], "action (minari.stepdata attribute)": [[9, "minari.StepData.action", false]], "action_space (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.action_space", false]], "actions (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.actions", false]], "actions (minari.episodedata attribute)": [[6, "minari.EpisodeData.actions", false]], "add_step_data() (in module minari.data_collector.episodebuffer)": [[3, "minari.data_collector.EpisodeBuffer.add_step_data", false]], "add_to_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.add_to_dataset", false]], "apply() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.apply", false]], "close() (in module minari.datacollector)": [[2, "minari.DataCollector.close", false]], "combine_datasets() (in module minari)": [[10, "minari.combine_datasets", false]], "create_dataset() (in module minari.datacollector)": [[2, "minari.DataCollector.create_dataset", false]], "create_dataset_from_buffers() (in module minari)": [[10, "minari.create_dataset_from_buffers", false]], "create_namespace() (in module minari.namespace)": [[11, "minari.namespace.create_namespace", false]], "data_path (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.data_path", false]], "datacollector (class in minari)": [[2, "minari.DataCollector", false]], "delete_dataset() (in module minari)": [[10, "minari.delete_dataset", false]], "delete_namespace() (in module minari.namespace)": [[11, "minari.namespace.delete_namespace", false]], "download_dataset() (in module minari)": [[10, "minari.download_dataset", false]], "download_namespace_metadata() (in module minari.namespace)": [[11, "minari.namespace.download_namespace_metadata", false]], "episode_indices (minari.minaridataset attribute)": [[7, "minari.MinariDataset.episode_indices", false]], "episodebuffer (class in minari.data_collector)": [[3, "minari.data_collector.EpisodeBuffer", false]], "episodedata (class in minari)": [[6, "minari.EpisodeData", false]], "episodemetadatacallback (class in minari)": [[4, "minari.EpisodeMetadataCallback", false]], "filter_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.filter_episodes", false]], "get_episode_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_episode_metadata", false]], "get_episodes() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_episodes", false]], "get_namespace_metadata() (in module minari.namespace)": [[11, "minari.namespace.get_namespace_metadata", false]], "get_normalized_score() (in module minari)": [[10, "minari.get_normalized_score", false]], "get_size() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.get_size", false]], "id (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.id", false]], "id (minari.episodedata attribute)": [[6, "minari.EpisodeData.id", false]], "info (minari.stepdata attribute)": [[9, "minari.StepData.info", false]], "infos (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.infos", false]], "infos (minari.episodedata attribute)": [[6, "minari.EpisodeData.infos", false]], "iterate_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.iterate_episodes", false]], "list_local_datasets() (in module minari)": [[10, "minari.list_local_datasets", false]], "list_local_namespaces() (in module minari.namespace)": [[11, "minari.namespace.list_local_namespaces", false]], "list_remote_datasets() (in module minari)": [[10, "minari.list_remote_datasets", false]], "list_remote_namespaces() (in module minari.namespace)": [[11, "minari.namespace.list_remote_namespaces", false]], "load_dataset() (in module minari)": [[10, "minari.load_dataset", false]], "metadata (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.metadata", false]], "minaridataset (class in minari)": [[7, "minari.MinariDataset", false]], "minaristorage (class in minari.dataset.minari_storage)": [[8, "minari.dataset.minari_storage.MinariStorage", false]], "new() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.new", false]], "observation (minari.stepdata attribute)": [[9, "minari.StepData.observation", false]], "observation_space (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.observation_space", false]], "observations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.observations", false]], "observations (minari.episodedata attribute)": [[6, "minari.EpisodeData.observations", false]], "read() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.read", false]], "recover_environment() (in module minari.minaridataset)": [[7, "minari.MinariDataset.recover_environment", false]], "reset() (in module minari.datacollector)": [[2, "minari.DataCollector.reset", false]], "rewards (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.rewards", false]], "sample_episodes() (in module minari.minaridataset)": [[7, "minari.MinariDataset.sample_episodes", false]], "seed (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.seed", false]], "set_seed() (in module minari.minaridataset)": [[7, "minari.MinariDataset.set_seed", false]], "spec (minari.minaridataset attribute)": [[7, "minari.MinariDataset.spec", false]], "split_dataset() (in module minari)": [[10, "minari.split_dataset", false]], "step() (in module minari.datacollector)": [[2, "minari.DataCollector.step", false]], "stepdata (class in minari)": [[9, "minari.StepData", false]], "stepdatacallback (class in minari)": [[5, "minari.StepDataCallback", false]], "termination (minari.stepdata attribute)": [[9, "minari.StepData.termination", false]], "terminations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.terminations", false]], "terminations (minari.episodedata attribute)": [[6, "minari.EpisodeData.terminations", false]], "total_episodes (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.total_episodes", false]], "total_episodes (minari.minaridataset attribute)": [[7, "minari.MinariDataset.total_episodes", false]], "total_steps (minari.dataset.minari_storage.minaristorage attribute)": [[8, "minari.dataset.minari_storage.MinariStorage.total_steps", false]], "total_steps (minari.minaridataset attribute)": [[7, "minari.MinariDataset.total_steps", false]], "truncation (minari.stepdata attribute)": [[9, "minari.StepData.truncation", false]], "truncations (minari.data_collector.episodebuffer attribute)": [[3, "minari.data_collector.EpisodeBuffer.truncations", false]], "truncations (minari.episodedata attribute)": [[6, "minari.EpisodeData.truncations", false]], "update_dataset_from_buffer() (in module minari.minaridataset)": [[7, "minari.MinariDataset.update_dataset_from_buffer", false]], "update_episode_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_episode_metadata", false]], "update_episodes() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_episodes", false]], "update_from_storage() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_from_storage", false]], "update_metadata() (in module minari.dataset.minari_storage.minaristorage)": [[8, "minari.dataset.minari_storage.MinariStorage.update_metadata", false]], "upload_namespace() (in module minari.namespace)": [[11, "minari.namespace.upload_namespace", false]]}, "objects": {"minari": [[2, 0, 1, "", "DataCollector"], [6, 0, 1, "", "EpisodeData"], [4, 0, 1, "", "EpisodeMetadataCallback"], [7, 0, 1, "", "MinariDataset"], [9, 0, 1, "", "StepData"], [5, 0, 1, "", "StepDataCallback"], [10, 1, 1, "", "combine_datasets"], [10, 1, 1, "", "create_dataset_from_buffers"], [10, 1, 1, "", "delete_dataset"], [10, 1, 1, "", "download_dataset"], [10, 1, 1, "", "get_normalized_score"], [10, 1, 1, "", "list_local_datasets"], [10, 1, 1, "", "list_remote_datasets"], [10, 1, 1, "", "load_dataset"], [10, 1, 1, "", "split_dataset"]], "minari.DataCollector": [[2, 1, 1, "", "add_to_dataset"], [2, 1, 1, "", "close"], [2, 1, 1, "", "create_dataset"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "step"]], "minari.EpisodeData": [[6, 2, 1, "", "actions"], [6, 2, 1, "", "id"], [6, 2, 1, "", "infos"], [6, 2, 1, "", "observations"], [6, 2, 1, "", "terminations"], [6, 2, 1, "", "truncations"]], "minari.EpisodeMetadataCallback": [[4, 1, 1, "", "__call__"]], "minari.MinariDataset": [[7, 2, 1, "", "episode_indices"], [7, 1, 1, "", "filter_episodes"], [7, 1, 1, "", "iterate_episodes"], [7, 1, 1, "", "recover_environment"], [7, 1, 1, "", "sample_episodes"], [7, 1, 1, "", "set_seed"], [7, 2, 1, "", "spec"], [7, 2, 1, "", "total_episodes"], [7, 2, 1, "", "total_steps"], [7, 1, 1, "", "update_dataset_from_buffer"]], "minari.StepData": [[9, 2, 1, "", "action"], [9, 2, 1, "", "info"], [9, 2, 1, "", "observation"], [9, 2, 1, "", "termination"], [9, 2, 1, "", "truncation"]], "minari.StepDataCallback": [[5, 1, 1, "", "__call__"]], "minari.data_collector": [[3, 0, 1, "", "EpisodeBuffer"]], "minari.data_collector.EpisodeBuffer": [[3, 1, 1, "", "__len__"], [3, 2, 1, "", "actions"], [3, 1, 1, "", "add_step_data"], [3, 2, 1, "", "id"], [3, 2, 1, "", "infos"], [3, 2, 1, "", "observations"], [3, 2, 1, "", "rewards"], [3, 2, 1, "", "seed"], [3, 2, 1, "", "terminations"], [3, 2, 1, "", "truncations"]], "minari.dataset.minari_storage": [[8, 0, 1, "", "MinariStorage"]], "minari.dataset.minari_storage.MinariStorage": [[8, 2, 1, "", "action_space"], [8, 1, 1, "", "apply"], [8, 2, 1, "", "data_path"], [8, 1, 1, "", "get_episode_metadata"], [8, 1, 1, "", "get_episodes"], [8, 1, 1, "", "get_size"], [8, 2, 1, "", "metadata"], [8, 1, 1, "", "new"], [8, 2, 1, "", "observation_space"], [8, 1, 1, "", "read"], [8, 2, 1, "", "total_episodes"], [8, 2, 1, "", "total_steps"], [8, 1, 1, "", "update_episode_metadata"], [8, 1, 1, "", "update_episodes"], [8, 1, 1, "", "update_from_storage"], [8, 1, 1, "", "update_metadata"]], "minari.namespace": [[11, 1, 1, "", "create_namespace"], [11, 1, 1, "", "delete_namespace"], [11, 1, 1, "", "download_namespace_metadata"], [11, 1, 1, "", "get_namespace_metadata"], [11, 1, 1, "", "list_local_namespaces"], [11, 1, 1, "", "list_remote_namespaces"], [11, 1, 1, "", "upload_namespace"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "function", "Python function"], "2": ["py", "attribute", "Python attribute"]}, "objtypes": {"0": "py:class", "1": "py:function", "2": "py:attribute"}, "terms": {"": [2, 4, 5, 10, 12, 13, 14, 16, 17, 18, 19, 20, 32, 59, 61, 63, 64, 66, 68], "0": [2, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 61, 63, 64, 66, 68], "000": [64, 66], "0003": 66, "005": 66, "01": 59, "0123456789abcdefghijklmnopqrstuvwxyzabcdeeeffghijklmnnoopqrrssttuvwxyzz": [35, 36], "03ac13": [14, 58], "04": 59, "05": 59, "07": 59, "07219": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "08": 59, "09": 59, "0x11f2608b0": 61, "0x12253a940": 61, "0x7f30e49c0670": 35, "0x7f542ae77ee0": 36, "1": [2, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 66, 68], "10": [12, 13, 59, 61, 63, 64, 66], "100": [2, 10, 12, 14, 38, 39, 40, 58, 59, 66], "1000": [12, 16, 17, 18, 19, 55, 59, 66], "1000000": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 26, 27, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 58], "1000070": 35, "10010": 36, "1006729": 12, "10087": [25, 29, 41, 54], "101": 59, "10174": 35, "102": 59, "104": 59, "105": [55, 59], "107": 59, "1077": [14, 58], "108": 59, "109": 59, "1096": [12, 14, 58], "10_000": [64, 66], "11": 59, "110": 59, "1103": 12, "111": 59, "112": 59, "11310": 28, "116": 59, "11956": 32, "12": [12, 59], "121": 59, "123": [12, 59, 64], "124": 59, "126": 59, "128": [59, 66, 68], "129": 59, "13": [12, 59], "130": 59, "132": 59, "13210": [49, 50], "133": 59, "137": 59, "139": 59, "14": [35, 36, 59], "1400": 66, "1430": [20, 21], "144": 59, "148": 59, "15": 12, "151": 59, "153": 59, "155": 59, "156560": [33, 34], "157": 59, "158": 59, "160": 59, "161": 59, "162": 59, "163": 59, "164": 59, "165": 59, "167": 59, "169": 59, "16x16": 61, "17": [12, 59], "170": 59, "1709": [25, 29, 41, 54], "171": 59, "172": 59, "177": 59, "18": [12, 59], "183": 59, "1872": 66, "19": [12, 31, 59], "1910": 32, "196": 59, "1_000": [66, 68], "1e": 64, "1f": 66, "2": [2, 10, 12, 15, 16, 17, 18, 19, 20, 21, 25, 29, 30, 31, 32, 33, 34, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 61, 63, 66], "20": [12, 59, 66], "200": [22, 23, 24, 26, 27, 28, 51, 52, 53], "2000000": 55, "2004": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "2017": [25, 29, 41, 54], "2019": 32, "2020": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "2021": [15, 66], "2022": 59, "2023": 59, "2024": 59, "2026": 55, "2059": 12, "21": 12, "211": 59, "218": 59, "22": [12, 15, 59], "224": 59, "23": 12, "239": 59, "24": [14, 25, 29, 38, 39, 40, 41, 54, 66], "240": 59, "241": 59, "244": 59, "245": 59, "25": [12, 14, 24, 25, 28, 29, 40, 41, 53, 54, 58, 59, 66], "255": [35, 36, 61], "256": [66, 68], "26": [26, 27, 28, 59], "268": 15, "27": [16, 17, 18, 19, 20, 21, 59], "28": [12, 22, 23, 24, 59], "280": 31, "29": 59, "2d": [15, 30], "2f": 66, "3": [2, 10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 61, 66], "30": [51, 52, 53, 66], "305": 59, "31": 59, "32": 68, "3360": [43, 44], "34": 59, "3606": 26, "3736": [14, 38], "3758": 51, "39": [12, 22, 23, 24, 51, 52, 53], "4": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 61, 63, 64], "42": [61, 63, 66, 68], "4209": 31, "4356": [14, 58], "4358": 22, "45": [14, 38, 39, 40, 66], "450": [33, 34], "46": [26, 27, 28], "4752": [45, 46], "480": 66, "4958": [14, 39], "499206": [14, 39], "5": [12, 14, 55, 64, 66], "50": [22, 25, 26, 29, 38, 41, 51, 54, 64, 66], "500": 68, "5000": [12, 14, 23, 27, 40, 52, 58, 66], "500000": [14, 38], "5025": 12, "50_000": 66, "52": 59, "54": 59, "55": 59, "57": 59, "59": [31, 33, 34], "590": 36, "6": [12, 59], "60": 59, "6000": 55, "604": 14, "605": 12, "621": [33, 34], "638": 14, "6729": [12, 14, 24, 58], "69": 66, "7": [12, 14, 31, 33, 34, 35, 36, 58, 59, 61, 66], "700": [20, 21], "71": 59, "73": 59, "75": 59, "77": 59, "8": [12, 15, 16, 17, 18, 19, 20, 21, 30, 42, 55, 59, 64], "80": [16, 17, 18, 19, 59], "82": 59, "83": 59, "84": 59, "86": 59, "87": 59, "88": 59, "884": 66, "9": [12, 31, 33, 34], "90": [20, 21, 59], "900": 66, "92": 59, "93": 59, "95": 59, "9525": [47, 48], "96": 59, "99": [59, 64, 66], "9942": 53, "A": [2, 8, 13, 32, 58, 64, 66], "And": 68, "As": [6, 13, 59, 64, 68], "At": [16, 17, 18, 19, 20], "But": [61, 66], "By": [64, 66], "For": [1, 2, 10, 11, 12, 13, 30, 59, 61, 64, 68], "If": [2, 7, 8, 10, 11, 12, 13, 14, 59, 61, 64, 66], "In": [12, 13, 59, 61, 63, 64, 66, 68], "It": [59, 64, 66], "No": 61, "Not": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 51, 52, 53], "On": [13, 64, 66], "The": [2, 4, 5, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 59, 61, 63, 64, 68], "Then": [61, 64, 66], "There": [12, 25, 29, 41, 54, 66], "These": [10, 14, 25, 29, 30, 32, 41, 42, 54, 59, 64], "To": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 66, 68], "With": 14, "_": [2, 12, 61, 63, 64, 66, 68], "_0": 64, "__call__": [4, 5, 63, 64], "__init__": [64, 68], "__len__": 3, "_build": 1, "_check_valid_cel": 64, "_gen_miss": [35, 36, 61], "_index_0": 59, "_index_1": 59, "_max": 10, "_min": 10, "_score": 10, "_script": 59, "a1efe4": [14, 58], "a256f8": 14, "a5a5a1": 14, "a_hat": 68, "a_pr": 68, "a_t": 66, "ab": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "abil": 12, "abl": [12, 42], "abort": 14, "about": [1, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61], "abov": [12, 59, 61, 63, 66], "abspath": 68, "abstract": 12, "ac": 68, "access": [8, 12, 14, 59, 64], "account": 64, "accumul": [16, 17, 18, 19, 20, 21, 64, 68], "accumulated_rew": 68, "accur": 66, "achiev": [12, 64, 68], "achieved_go": [16, 17, 18, 19, 20, 21, 31, 33, 34, 43, 44, 45, 46, 47, 48, 49, 50, 63, 64], "achieved_goal_cel": 64, "acrobot": 12, "across": [10, 13, 59], "act": 59, "action": [2, 3, 5, 6, 8, 9, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66, 68], "action_id": 64, "action_idx": 64, "action_spac": [2, 8, 10, 12, 13, 59, 61, 63, 64, 68], "action_space_subset": 63, "action_spec": 66, "activ": [15, 66], "activation_class": 66, "activation_fn": 66, "actor": 66, "actor_extractor": 66, "actor_mlp": 66, "actor_modul": 66, "actor_net": 66, "acttyp": [2, 10], "actual": 64, "actuat": [30, 42], "ad": [5, 7, 8, 10, 12, 13, 43, 44, 45, 46, 47, 48, 49, 50, 59, 63], "adam": [15, 66, 68], "add": [2, 3, 4, 5, 7, 8, 14, 43, 44, 45, 46, 47, 48, 49, 50, 59, 64, 66], "add_step_data": 3, "add_to_dataset": [2, 12], "addit": [2, 5, 7, 11, 12, 13, 59], "addition": [15, 59], "additional_dataset": 59, "additional_group": 59, "additional_wrapp": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "address": 64, "adher": 59, "adjust": 64, "adroit_door": [22, 23, 24], "adroit_h": 14, "adroit_hamm": [26, 27, 28], "adroit_hand": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 51, 52, 53], "adroit_pen": [14, 38, 39, 40], "adroit_reloc": [51, 52, 53], "adroithanddoor": [12, 13, 22, 23, 24, 25, 30, 59], "adroithanddoorenv": [22, 23, 24], "adroithandhamm": [26, 27, 28, 29, 30, 59], "adroithandhammerenv": [26, 27, 28], "adroithandpen": [14, 30, 38, 39, 40, 41, 59, 66], "adroithandpenenv": [38, 39, 40], "adroithandreloc": [30, 51, 52, 53, 54, 59], "adroithandrelocateenv": [51, 52, 53], "advantag": [64, 66], "after": [2, 4, 6, 9, 10, 13, 14, 59, 64, 68], "again": [16, 17, 18, 19, 20, 21], "agent": [9, 15, 16, 17, 18, 19, 20, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 63, 64, 66, 68], "aggress": 64, "agnost": [2, 66], "aim": [13, 64, 66], "al": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64, 66], "alex": [12, 16, 17, 18, 19, 20, 21], "alexdavei": 59, "alexdavey0": [16, 17, 18, 19, 20, 21], "algo": 68, "algorithm": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 66], "algorithm_nam": [2, 10, 12, 13, 61, 63, 64, 68], "all": [8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 30, 31, 32, 58, 59, 61, 65, 66, 68], "allow": [12, 13, 59, 64, 68], "alon": 64, "along": [30, 42], "alreadi": [8, 12, 14, 59, 63, 64, 66], "also": [10, 12, 14, 16, 17, 18, 19, 20, 21, 58, 59, 61, 63, 64, 66], "alwai": 64, "among": 59, "amount": [12, 64], "amp": 59, "an": [4, 7, 10, 11, 12, 13, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 47, 48, 51, 52, 53, 54, 55, 59, 61, 64, 66], "andrea": [55, 56], "ani": [2, 5, 6, 7, 8, 9, 10, 11, 12, 59, 63, 64], "annot": 59, "anoth": [2, 5, 8, 12, 13, 25, 29, 41, 54, 64, 66], "anssi": 15, "ant": [16, 17, 18, 19, 20, 21, 30, 55, 57], "ant_maze_v4": [16, 17, 18, 19, 20, 21], "ant_v5": 55, "antenv": 55, "antmaz": [12, 16, 17, 18, 19, 20, 21], "antmaze_larg": [15, 17], "antmaze_large_diverse_gr": [15, 16], "antmaze_medium": [15, 19], "antmaze_medium_diverse_gr": [15, 18], "antmaze_umaz": [15, 20, 21], "antmazeenv": [16, 17, 18, 19, 20, 21], "antonin": 15, "apart": 59, "api": [11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 64, 68], "appear": [12, 59], "append": [3, 8, 12, 59, 66], "appli": [8, 61], "applic": [12, 59], "appreci": 59, "approach": 64, "appropri": 13, "approx": 66, "approxim": 66, "apr": [15, 42, 64], "apt": 66, "ar": [2, 6, 8, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 41, 42, 51, 52, 53, 54, 55, 58, 59, 61, 64, 66], "arang": 66, "aravind": [25, 29, 41, 54], "aravindr93": 14, "arbitrari": [13, 59], "arbitrarili": 13, "arena": [42, 47, 48], "arg": [14, 59, 64, 66], "argmax": [64, 68], "argument": [4, 5, 10, 12, 13, 59], "argv": 68, "around": [61, 66], "arrai": [10, 13, 64], "arrow": [13, 59], "arxiv": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "as_tensor": 68, "ashlei": 15, "assert": [22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 61, 68], "assign": 10, "associ": 13, "attach": 13, "attempt": 66, "attr": 59, "attribut": [2, 4, 10, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59], "author": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 64, 68], "author_email": [2, 10, 12, 13, 59, 61, 64, 68], "auto": [66, 68], "auto_cast_to_devic": 66, "autobuild": 1, "automat": [1, 2, 13, 59], "autoreset": 14, "auxiliari": 2, "avail": [7, 10, 12, 14, 58, 59, 61, 66], "averag": [2, 10, 66], "avg": 66, "avjmachin": 59, "avoid": [59, 66], "awai": 59, "ax": 66, "axi": [30, 42, 64, 66], "b": [1, 14, 58], "b64encod": 66, "back": [61, 64], "background": 59, "backpropag": 66, "backward": [66, 68], "badg": 59, "balanc": 68, "balisujohn": 59, "ball": [15, 30, 42, 54, 64], "bamboofungu": 59, "bar": 14, "base": [12, 14, 59, 64, 66], "base64": 66, "base_env": 66, "baselin": 15, "baselines3": [15, 68], "basi": 59, "basic": [59, 66], "batch": [66, 68], "batch_first": 68, "batch_siz": [66, 68], "becaus": [15, 16, 17, 18, 19, 20, 21, 42, 66], "been": [12, 42, 59], "befor": [2, 12, 61, 64, 66], "begin": [16, 17, 18, 19, 20, 68], "behav": 66, "behavior": [59, 64, 65, 66, 69], "behavioral_clon": 68, "behaviour": 66, "being": [2, 10, 13, 31, 32, 33, 34, 42, 43, 45, 47, 49], "bellman": 64, "bellow": 59, "belong": 5, "below": [14, 64, 66], "benchmark": [30, 66], "best": 66, "best_model": 68, "beta": [59, 66], "between": [10, 43, 45, 47, 49, 64], "bias": 64, "binari": 13, "bind": 64, "bit": [64, 66], "black": 59, "blob": [61, 64], "block": 66, "blue": 66, "board": 29, "bool": [2, 5, 7, 9, 10, 11, 59, 66], "boolean": 10, "both": [8, 13, 14, 61, 63], "bottom": 33, "bound": [13, 64, 66], "box": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 68], "break": [12, 59, 64, 68], "bucket": [12, 13, 58, 59], "buffer": [2, 3, 7, 8, 10, 12, 59], "bug": 59, "bugfix": 59, "build": [14, 59], "burner": 33, "c": [12, 16, 18, 32, 59], "cabinet": [31, 32, 34], "cach": [2, 12, 59, 66], "calcul": [10, 66], "call": [2, 5, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59], "callabl": [2, 7, 8, 10, 12, 59, 61], "callback": [2, 4, 5, 59, 63, 64], "can": [2, 4, 5, 7, 10, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 66, 68], "capabl": 12, "captur": 66, "care": 61, "cart": 68, "cartesian": 13, "cartpol": [11, 12, 59, 68], "case": [12, 59, 64], "cd": [1, 12], "cell": [16, 18, 64], "cell_rowcol_to_xi": 64, "cell_to_st": 64, "cell_xy_to_rowcol": 64, "center": 14, "certain": [7, 12, 41], "cff": 59, "challeng": [15, 66], "chang": [1, 11, 59, 64], "changelog": 59, "characterist": [2, 64], "charg": 59, "charset": [13, 35, 36], "check": [12, 14, 59, 64], "checkpoint": 59, "choic": 66, "choos": [13, 61, 63], "chosen": 64, "ci": 59, "citat": 59, "class": [2, 3, 4, 5, 6, 7, 8, 9, 13, 59, 63, 64, 66, 68], "classic": [12, 64, 68], "classic_control": 12, "classif": 68, "clean": 61, "clear": 2, "clear_episode_buff": 59, "cli": [58, 59], "clip": 64, "clone": [1, 12, 14, 25, 29, 41, 54, 58, 59, 65, 66, 69], "close": [2, 32, 64, 66, 68], "cloud": [12, 13, 59], "cmmcirvin": 59, "code": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 65, 66, 68], "code_permalink": [2, 10, 12, 13, 61, 64, 68], "codelink": 59, "colab": 66, "collate_fn": 68, "collect": [2, 10, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 58, 59, 61, 62, 65, 66], "collector": [2, 64], "collector_env": [59, 64], "collis": 64, "color": [14, 58], "com": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 59, 61, 64], "combin": [59, 64], "combine_dataset": [10, 12, 59], "combined_dataset": 10, "come": [13, 14], "command": [12, 14, 59, 68], "commit": 59, "common": [12, 13], "compar": [6, 63], "comparison": 10, "compat": [10, 12, 14, 59, 68], "compatible_minari_vers": 10, "complement": 2, "complet": [32, 33, 34, 59, 66], "complex": [15, 25, 29, 30, 41, 54, 59], "compli": 59, "compliant": [13, 59], "compon": 64, "component_1": 59, "component_2": 59, "compris": 12, "comput": [2, 10, 12, 13, 66], "compute_act": 64, "compute_reward_matrix": 64, "compute_transition_matrix": 64, "concaten": 66, "condit": [7, 12, 59, 66], "configur": [32, 59, 66], "confirm": [14, 66], "conflict": 66, "conjunct": 66, "consid": [8, 59, 64, 66], "consider": 59, "consist": [13, 42, 66], "constantli": 59, "construct": 64, "contact": [11, 12, 61, 68], "contain": [1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 15, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 47, 48, 49, 50, 51, 52, 53, 55, 59], "content": [13, 14], "continu": [10, 12, 13, 42, 43, 44, 45, 46, 47, 48, 49, 50, 64], "continuing_task": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 64], "contribut": [1, 12, 59, 64], "contributor": 59, "control": [12, 15, 42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 66, 68], "conveni": 66, "convent": 59, "convers": [59, 61], "convert": [2, 64, 66], "coordin": 64, "copi": [59, 66], "core": 61, "corl": 66, "corr": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "correct": [59, 64, 66], "correspond": [2, 10, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 64, 68], "could": [15, 66], "cover": 66, "coverag": 59, "cpu": 66, "creat": [2, 5, 7, 8, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59, 61, 63, 66, 68], "create_dataset": [2, 12, 59, 61, 63, 64, 68], "create_dataset_from_buff": [10, 12, 13, 59], "create_dataset_from_collector_env": 59, "create_namespac": 11, "creation": [2, 12, 13, 59], "credenti": 11, "cross": 68, "crossentropyloss": 68, "cuda": 66, "cumul": [64, 66], "curat": 59, "current": [5, 10, 12, 13, 14, 59, 64, 66], "current_cel": 64, "current_control_target_id": 64, "current_control_target_xi": 64, "current_st": 64, "custom": [2, 4, 12, 59, 62, 64, 65], "custom_space_seri": 61, "customstepdatacallback": 5, "customsubsetstepdatacallback": 63, "cython": 59, "d": [12, 66], "d4rl": [10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 62, 65, 66], "da": 64, "dampen": 64, "dapg": [14, 23, 24, 25, 27, 28, 29, 39, 40, 41, 52, 53, 54], "data": [2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 29, 30, 32, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 58, 59, 61, 66, 68], "data_collector": 63, "data_format": [2, 8, 10, 59], "data_path": 8, "data_url": 66, "databas": [10, 11, 14], "databefor": 2, "dataclass": [8, 59], "datacollector": [4, 12, 13, 59, 61, 63, 64, 68], "datacollectorv0": 59, "dataload": [12, 59, 68], "datas": 8, "dataset": [2, 4, 5, 6, 7, 11, 15, 25, 29, 30, 32, 37, 41, 42, 54, 58, 59, 61, 63, 66], "dataset_cr": [59, 61, 64], "dataset_id": [2, 10, 11, 12, 13, 59, 61, 63, 64, 66, 68], "dataset_nam": [2, 10, 13, 14, 64], "dataset_s": 59, "dataset_v1": 59, "dataset_v2": 59, "dataset_v3": 59, "datasets_to_combin": [10, 59], "davei": [12, 16, 17, 18, 19, 20, 21], "de": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 51, 52, 53], "decent": 66, "decod": 66, "deep": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "def": [5, 61, 63, 64, 66, 68], "default": [2, 5, 7, 8, 10, 11, 12, 13, 66], "default_interaction_typ": 66, "defin": [13, 61, 63, 68], "definit": 59, "del": [61, 63], "deleg": 59, "delet": [61, 63], "delete_dataset": [10, 61, 63], "delete_namespac": 11, "demonstr": [22, 24, 25, 26, 28, 29, 31, 32, 38, 40, 41, 51, 53, 54, 66], "dens": [14, 22, 23, 24, 26, 27, 28, 38, 39, 40, 42, 51, 52, 53, 59, 66], "depend": [12, 13, 59], "deprec": 59, "descent": 66, "describ": [11, 13, 59], "descript": [2, 10, 11, 13, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 56, 57, 59], "deseri": 61, "deserialize_custom_spac": 61, "deserialize_spac": 61, "design": 66, "desir": [32, 64], "desired_cel": 64, "desired_go": [16, 17, 18, 19, 20, 21, 31, 33, 34, 43, 44, 45, 46, 47, 48, 49, 50, 63, 64], "detail": 66, "detect": 59, "determin": 64, "determinist": [12, 64, 66], "develop": 59, "deviat": [13, 64], "devic": [14, 66], "dexter": [25, 29, 41, 54], "df8ff078652a": [15, 42, 64], "dict": [2, 3, 4, 5, 6, 8, 9, 10, 11, 13, 16, 17, 18, 19, 20, 21, 31, 33, 34, 35, 36, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 63], "dict_kei": 63, "dictionari": [2, 3, 5, 7, 8, 9, 10, 12, 13, 59, 62, 64, 65, 66], "differ": [10, 12, 13, 42, 59, 61, 64, 66], "dimens": [66, 68], "dimension": [13, 25, 29, 41, 54], "dir": 59, "direct": [35, 36, 61, 66], "directli": [12, 59, 64, 66, 68], "directori": [2, 8, 11, 12, 66], "dirhtml": 1, "disabl": 2, "disable_env_check": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "discount": 64, "discret": [13, 35, 36, 59, 61, 64, 68], "disk": [8, 12, 13, 59, 61, 63, 68], "displai": [66, 68], "dist": 64, "distanc": [43, 45, 47, 49], "distribut": [25, 29, 41, 54, 66], "distribution_class": 66, "distribution_kwarg": 66, "divers": [12, 15], "divid": [12, 64], "do": [64, 66], "doc": [1, 59, 61, 64], "document": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "doe": 59, "doesn": [8, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59, 64], "dof": [15, 25, 29, 30, 41, 54, 66], "domain": [15, 25, 29, 30, 41, 42, 54], "don": [13, 59, 61, 63, 64], "done": [12, 64, 66, 68], "door": [10, 12, 13, 14, 22, 23, 24, 30, 32, 58, 59], "dormann": 15, "dot": [64, 66], "doubl": 66, "doubletofloat": 66, "down": 64, "download": [13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 65, 66, 68], "download_dataset": 10, "download_namespace_metadata": 11, "driven": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "dt": 64, "dtype": [59, 63, 64, 66], "due": [59, 64], "dump": 61, "dure": [12, 13, 59, 64, 66], "dynam": 64, "e": [1, 7, 10, 12, 59, 66], "e731": 61, "each": [2, 4, 5, 6, 8, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 63, 64, 66, 68], "earlier": 61, "edit": [2, 5], "effect": [25, 29, 41, 54], "effici": 59, "element": [6, 13], "elif": 64, "elimin": 64, "ell": 66, "elliottow": 59, "els": [12, 59, 64, 66], "email": [2, 10, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "embed": 66, "empti": [11, 61, 64], "emptyenv": 61, "enabl": 61, "encapsul": 13, "encount": 61, "encourag": [13, 59], "end": [13, 59], "enerrio": 59, "enhanc": 59, "ensur": 66, "entri": 64, "entropi": 68, "entry_point": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "env": [2, 5, 7, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 59, 61, 63, 64, 66, 68], "env_id": 66, "env_nam": [2, 10, 13], "env_spec": [8, 13], "envid": 2, "environ": [2, 5, 6, 7, 8, 9, 10, 13, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 58, 59, 61, 63, 64, 68], "environment_st": 5, "envspec": [2, 8, 10, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "eol": 59, "ep": 12, "episod": [2, 3, 4, 6, 7, 8, 10, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 66, 68], "episode_0": 59, "episode_1": 59, "episode_2": 59, "episode_id": [12, 59], "episode_indic": [7, 8, 12], "episode_metadata_callback": [2, 4], "episode_reward": 66, "episodebuff": [7, 8, 10], "episodedata": [7, 12, 59], "episodemetadatacallback": [2, 13, 59], "episodes_gener": 12, "epoch": 68, "epsiodedata": 8, "equal": [2, 10, 13], "equat": 64, "equiv": 66, "equlival": 64, "ernestu": 15, "error": [10, 59, 61, 64, 66], "essenti": 66, "estim": [2, 10, 66], "et": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64, 66], "etc": 66, "euclidean": [43, 45, 47, 49], "evad": 64, "eval_env": [2, 7, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "eval_env_spec": [12, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55], "eval_interv": 66, "eval_reward_log": 66, "eval_td": 66, "evalu": [2, 7, 10, 12, 59, 66, 68], "evaluate_polici": 66, "everi": [1, 10, 12, 13, 21, 64, 66], "everyth": 66, "exampl": [2, 10, 11, 12, 13, 14, 59, 61, 64, 65, 66], "example_env": 66, "except": [8, 59, 61, 66], "excit": 59, "execut": 68, "exerpt": 59, "exist": [8, 11, 14, 59, 63, 64], "exit": 14, "expect": 63, "expectil": 66, "experienc": 59, "experiment": 11, "expert": [2, 10, 12, 13, 14, 15, 22, 25, 26, 29, 36, 37, 38, 41, 51, 54, 56, 58, 59, 66, 68], "expert_dataset": 55, "expert_polici": [2, 10], "expertpolici": [36, 68], "explain": [59, 64], "explicit": [59, 66], "explicitli": 59, "explor": 59, "exploration_act": 64, "explorationtyp": 66, "exponenti": [43, 45, 47, 49], "export": [12, 59], "extend": [12, 63], "extra": [2, 4, 5, 59, 64], "extract": 66, "extrapol": 66, "f": [12, 14, 59, 61, 63, 66, 68], "f01e2c": 14, "f4bf75": 14, "facilit": [10, 12, 59], "factor": 64, "factori": 3, "fail": [16, 17, 18, 19, 20, 21, 59], "fals": [2, 7, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 61, 63, 64, 66, 68], "familiar": 66, "farama": [1, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 64, 66, 68], "favor": 59, "fc1": 68, "fc2": 68, "fc3": 68, "featur": [11, 12, 58, 59, 68], "fed000": 14, "few": 59, "ff00ff": [14, 58], "ffmpeg": 66, "field": [13, 59, 66], "fig": 66, "figsiz": 66, "figur": 66, "file": [2, 4, 11, 12, 13, 14, 58, 59, 63], "file_fold": 59, "filter": [7, 58, 59], "filter_dataset": [12, 59], "filter_episod": [7, 12, 59], "final": [6, 12, 15, 59, 61, 63, 64, 66], "final_scor": 66, "find": 63, "fine": [14, 23, 25, 27, 29, 39, 41, 52, 54, 55, 56], "first": [11, 12, 59, 61, 63, 64, 66], "fit": [63, 66], "fix": [21, 30, 42, 59, 66], "flag": [10, 59, 66], "flatten": 59, "flexibl": 12, "flip": [16, 17, 18, 19, 20, 21, 32], "float": [2, 8, 10, 13, 63, 66], "float32": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 64, 68], "float64": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 63, 66], "floppy_disk": 59, "folder": [1, 68], "follow": [2, 5, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 64, 66], "font": [14, 58], "forc": [10, 14, 30, 42, 64], "force_download": [10, 59], "form": [10, 13, 64], "format": [2, 8, 10, 12, 13, 59, 61], "formula": [10, 64], "forward": [11, 13, 66, 68], "found": [10, 13], "foundat": [1, 12, 14, 30, 55, 59, 61, 64], "four": 68, "fourroom": [30, 37], "fourroomsenv": [35, 36], "fp": 66, "frac": 10, "frame": 66, "framework": 66, "franka_kitchen": [31, 33, 34], "frankakitchen": [30, 31, 32, 33, 34, 59], "from": [2, 5, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 59, 61, 63, 64, 66, 68], "from_pixel": 66, "froze": 59, "fu": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "full": [4, 8, 12, 36, 37, 59, 66], "fulli": 59, "function": [7, 8, 10, 12, 13, 14, 35, 36, 42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 64, 66, 68], "fundament": [15, 42, 64], "futur": [11, 12, 59, 64], "g": [12, 21, 35, 36, 66], "gain": 64, "gamma": [64, 66], "gather": 66, "gcp": [12, 13, 58, 59], "gen_dataset_md": 59, "gener": [2, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 58, 59, 61, 63, 64], "generate_path": 64, "get": [7, 8, 10, 12, 59, 61, 63, 64, 66, 68], "get_episod": 8, "get_episode_metadata": [8, 13], "get_namespace_metadata": 11, "get_next_st": 64, "get_normalized_scor": [2, 10, 59], "get_q_valu": 64, "get_siz": 8, "git": [1, 12], "github": [1, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 59, 61, 64], "give": [12, 13, 14, 64, 66], "given": [12, 13, 14], "gleav": 15, "global": [2, 13, 64], "global_target_id": 64, "global_target_xi": 64, "glr": 59, "gmail": [16, 17, 18, 19, 20, 21, 35, 36], "go": [1, 64], "goal": [15, 16, 17, 18, 19, 20, 21, 32, 36, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61, 63, 64, 66], "goal_cel": 64, "goe": [36, 37], "googl": [13, 59, 66], "gradient": 66, "grahamannett": 59, "greater": [12, 59], "green": [61, 66], "grid": 64, "gridworld": 37, "group": [2, 4, 10, 12, 13, 14, 30, 59, 64], "gt": 59, "guarante": 13, "gupta": 32, "gym": [2, 5, 7, 10, 12, 59, 61, 63, 64, 66, 68], "gymansium": 12, "gymenv": 66, "gymnaisum": 14, "gymnasium": [2, 5, 7, 8, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 56, 58, 59, 61, 63, 64, 66, 68], "gymnasium_robot": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "gynasium": 59, "h5py": 59, "ha": [12, 21, 42, 59, 64, 66], "hammer": [26, 27, 28, 30, 59], "hand": [13, 16, 18, 25, 29, 41, 54, 64, 66], "hand_dapg": [14, 25, 29, 30, 41, 54], "handl": [8, 12, 58], "hat": 66, "hausman": 32, "have": [12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 59, 61, 63, 64, 66, 68], "hdf5": [2, 4, 8, 13, 14, 58, 59, 63, 64], "help": [14, 59, 64], "helper": 66, "here": [66, 68], "hesit": 59, "hidden": 59, "hidden_s": 66, "hierarch": 12, "high": [25, 29, 41, 54, 59, 63, 64, 66], "higher": 64, "highli": 59, "hill": 15, "hood": 66, "horizon": 32, "host": [12, 14, 25, 29, 30, 32, 41, 54, 58], "how": [1, 2, 59, 61, 63, 64, 66, 68], "howev": [13, 42, 59, 61, 64, 66, 68], "howuhh": 59, "href": 14, "html": 66, "http": [1, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 59, 61, 64, 68], "hub": 59, "human": [10, 12, 13, 14, 22, 25, 26, 29, 38, 41, 51, 54, 58, 59, 66, 68], "hyperparamet": 66, "hypothet": [2, 10], "i": [1, 2, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 32, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 61, 63, 66, 68], "id": [2, 3, 6, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 59, 64, 68], "idea": 59, "identifi": [2, 10, 11, 13], "ignor": [59, 66], "im": 59, "imag": [35, 36, 61, 66], "imit": [22, 25, 26, 29, 32, 38, 41, 51, 54], "implement": [14, 15, 64, 66], "implicit": [65, 69], "implicitli": 66, "import": [2, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66], "import_bugfix": 59, "improv": [59, 66], "imshow": 66, "in_kei": 66, "includ": [6, 13, 31, 32, 34, 42, 59, 66], "incompat": 14, "incorrect": [8, 59], "increas": 6, "indic": [2, 7, 8, 10, 12, 59], "inf": [12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 63], "infer": 66, "influenc": [64, 66], "info": [2, 3, 5, 6, 9, 12, 13, 59, 64, 68], "inform": [1, 2, 5, 7, 13, 59, 64], "infos_dataset": 59, "infos_subgroup": 59, "init": 59, "initi": [2, 6, 7, 12, 13, 59, 61, 63, 64, 66, 68], "initialis": 66, "input": [5, 7, 12, 13, 66, 68], "input_dim": 68, "insid": 61, "inspir": 64, "instabl": 64, "instal": [1, 10, 14, 58, 59, 61, 66, 68], "instanc": [7, 59], "instanti": 14, "instead": [12, 13, 59, 64, 66], "instruct": 59, "int": [2, 3, 6, 7, 8, 10, 13, 59, 64], "int64": [59, 68], "int_": [7, 64], "integ": 13, "intend": 7, "interact": 32, "interest": 66, "interfac": 12, "intern": [12, 59], "introduc": [15, 25, 29, 41, 54, 59, 66], "invers": 66, "involv": [30, 42, 64], "ipynb": [61, 63, 64, 66, 68], "ipython": 66, "iql": 66, "iql_torchrl": 66, "iqlloss": 66, "is_avail": 66, "is_shar": 66, "isinst": 68, "isol": 59, "issu": [59, 66], "item": [2, 64, 66, 68], "iter": [7, 8, 12, 13, 15, 42, 64, 66], "iterate_episod": [7, 12, 59], "its": [10, 59, 61, 64, 66], "itself": 12, "j": 64, "jamartinh": 59, "josephcarrino": 59, "journal": 15, "json": [13, 14, 59, 61], "jupyt": [61, 63, 64, 65, 66, 68], "just": [12, 61, 66], "justin": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "k": 32, "k_": 64, "k_d": 64, "k_i": 64, "k_p": 64, "kabuki": 59, "kaixin96": 59, "kallinteri": [55, 56], "kanervisto": 15, "keep": [12, 59], "kei": [2, 5, 8, 10, 12, 14, 59, 63, 64, 66], "kept": 13, "kernel": 66, "kettl": [31, 32, 33, 34], "key_fil": 14, "key_path": 11, "kitchen": [30, 31, 33, 34, 59], "kitchenenv": [31, 33, 34], "kitsch": 59, "know": 64, "kostrikov": 66, "kumar": 32, "kwarg": [2, 5, 7, 11, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 63], "l": 66, "l2": 66, "l_": 66, "l_2": 66, "l_pi": 66, "l_q": 66, "l_v": 66, "lag": 66, "lambda": [7, 12, 59, 61, 64], "lambert": [15, 42, 64], "larg": [12, 15, 42, 59], "larger": [59, 64, 66], "largest": 59, "last": 59, "last_episode_id": 59, "later": [2, 10, 59, 66], "latest": [10, 14, 59, 64], "latest_vers": 10, "latter": [10, 13, 66], "layer": 66, "lazcano": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 51, 52, 53], "lazi": 66, "lazylinear": 66, "lead": [13, 16, 17, 18, 19, 20, 21, 64], "learn": [12, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 58, 59, 61, 63, 64, 65, 68, 69], "learnin": [15, 42, 64], "leav": 12, "left": [12, 64, 66], "leftarrow": [64, 66], "len": [64, 66], "length": [3, 68], "less": 64, "let": [61, 63, 64, 68], "level": 13, "levin": 32, "lib": 66, "librari": [12, 59, 61, 68], "light": [31, 32, 33, 34], "like": [11, 12, 14, 61, 66, 68], "limit": [64, 66], "linalg": 64, "line": [14, 63], "linear": 68, "link": [2, 10, 12, 13], "linux": 12, "list": [2, 3, 7, 8, 12, 13, 58, 59, 66, 68], "list_local_dataset": [10, 12, 59, 63], "list_local_namespac": 11, "list_remote_dataset": [10, 59], "list_remote_namespac": 11, "ll": [61, 63], "load": [2, 11, 13, 59, 61, 66, 68], "load_dataset": [2, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 68], "loc": 66, "local": [10, 13, 59, 61, 63, 66, 68], "local_dataset": 63, "locat": [12, 15, 16, 17, 18, 19, 20, 21, 30, 42, 43, 44, 45, 46, 47, 48, 49, 50, 64, 66], "log": [59, 66, 68], "long": [32, 64], "longer": 59, "look": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61], "loop": [12, 66, 68], "loos": 59, "lose": 12, "loss": 68, "loss_actor": 66, "loss_dict": 66, "loss_fn": 68, "loss_funct": 66, "loss_log": 66, "loss_modul": 66, "loss_qvalu": 66, "loss_valu": 66, "lost": 59, "low": [59, 63, 64, 66], "lower": 13, "lr": 66, "lynch": 32, "m_": 66, "machin": [13, 15], "maco": 12, "made": [1, 59], "mai": [11, 12, 64, 66], "main": [2, 7, 55, 59, 61, 64, 66], "main_data": [14, 58, 59], "major": 59, "make": [1, 2, 7, 12, 59, 61, 63, 64, 66, 68], "make_value_estim": 66, "manag": 59, "mandatori": [13, 59], "mani": 13, "manipul": [25, 29, 41, 54, 66], "manual_se": [66, 68], "map": [12, 16, 18, 64, 66], "map_length": 64, "map_width": 64, "margin": 66, "markdown": 59, "markovian": [15, 42], "master": 64, "match": 10, "mathbb": 66, "mathcal": 66, "matplotlib": 66, "matrix": 64, "max": [64, 66], "max_": [64, 66], "max_a": 66, "max_episode_step": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 64, 66], "max_step": 66, "maximilian": 15, "maximis": 66, "maximum": [2, 10, 13, 64, 66, 68], "maze": [16, 17, 18, 19, 20, 21, 30, 43, 44, 45, 46, 47, 48, 49, 50, 59, 64], "maze2d": [42, 64], "maze_map": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 64], "maze_solv": 64, "mb": [8, 12, 14, 58], "md": [1, 59], "mdp": [12, 59], "mean": [6, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 64, 66], "meant": [2, 59], "measur": [25, 29, 41, 54, 64], "medium": [12, 15, 42, 59], "memor": [15, 42], "memori": [2, 12, 59], "mention": [13, 59, 64, 68], "merg": 14, "messag": 14, "met": 7, "metadata": [2, 4, 7, 8, 10, 12, 14, 59, 63], "method": [12, 15, 42, 59, 61, 64, 66], "metric": 13, "mgoulao": 59, "microwav": [31, 32, 33, 34], "mimic": 15, "min": 66, "minari": [11, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 66, 68], "minari_autose": 2, "minari_data": 66, "minari_dataset": [59, 68], "minari_datasets_path": 13, "minari_remot": [12, 59], "minari_storag": 59, "minari_vers": [13, 59], "minaridataset": [2, 10, 12, 13, 59, 68], "minariexperiencereplai": 66, "minaristorag": [2, 7, 10, 13, 59], "minigrid": [30, 35, 36, 59, 61], "minim": 63, "minimis": 66, "minimum": [2, 10, 12, 13, 59], "minor": 59, "mirana": 63, "misc": 59, "miss": 59, "mission": [35, 36, 61], "mission_func": 61, "missionspac": [35, 36, 61], "missonspac": 61, "mix": [22, 25, 26, 29, 32, 38, 41, 51, 54, 59], "mlp": 66, "model": [55, 56], "modifi": [8, 12, 13, 59, 63], "modul": [61, 63, 64, 66, 68], "modulelist": 66, "moment": 13, "more": [1, 6, 12, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 64, 66], "more_dataset": 59, "moreov": [8, 13], "morpholog": 15, "most": [12, 14], "move": [12, 30, 32, 42, 54, 59, 64], "mp4": 66, "mujoco": [2, 10, 55, 64], "mujuco": [55, 56], "multi": 66, "multibinari": 13, "multidiscret": 13, "multipl": [10, 11, 12, 14, 59, 66], "must": [5, 7, 8, 10, 12, 13, 59, 66], "my": 12, "n": [7, 12, 13, 14, 64, 68], "n_episod": [7, 12], "n_step": [59, 64], "nail": 29, "name": [2, 10, 11, 12, 13, 14, 58, 59, 61, 68], "namespac": [2, 10, 59], "namespace_metadata": 13, "narrow": [25, 29, 41, 54], "nathan": [15, 42, 64], "navig": [15, 30, 37, 42], "ncol": 66, "ndarrai": [6, 7, 10, 13, 59], "necessari": 66, "need": [8, 12, 59, 61, 63, 64, 66, 68], "neg": [43, 45, 47, 49], "nest": [2, 5, 11, 13, 59], "net": 66, "network": [66, 68], "neural": 68, "never": [32, 33, 64, 66], "new": [2, 8, 10, 12, 16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 64, 66, 68], "new_dataset_id": [10, 59], "new_dataset_nam": 14, "newli": [10, 12, 66], "next": [9, 59, 64, 66, 68], "next_cel": 64, "next_episode_id": 59, "next_stat": 64, "nightli": 66, "nn": [66, 68], "no_grad": 66, "noah": 15, "nois": [43, 44, 45, 46, 47, 48, 49, 50, 59, 64], "non": [12, 13, 15, 42], "nondeterminist": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "none": [2, 3, 5, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 64], "nonetyp": 59, "noqa": 61, "norm": 64, "normal": [2, 66], "normalized_scor": 10, "normalparamextractor": 66, "note": [10, 11, 13, 16, 17, 18, 19, 20, 21, 63, 64, 66], "notebook": [61, 63, 64, 65, 66, 68], "notic": 12, "notimplementederror": 61, "now": [10, 12, 59, 61, 63, 64, 68], "np": [7, 10, 13, 59, 63, 64, 66, 68], "npt": 7, "nrow": 66, "num_act": 64, "num_cel": 66, "num_episod": [61, 63], "num_episodes_average_scor": [2, 10], "num_epoch": 68, "num_eval_episod": 66, "num_itr": 64, "num_stat": 64, "num_step": 2, "number": [2, 6, 7, 10, 12, 13, 14, 59], "numpi": [63, 64, 66, 68], "o": 68, "ob": [2, 5, 12, 59, 64, 68], "object": [7, 8, 9, 12, 25, 29, 32, 37, 41, 54, 59, 61, 66, 68], "observ": [2, 3, 5, 6, 8, 9, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 66, 68], "observation_spac": [2, 8, 10, 12, 13, 59, 61, 63, 68], "observation_space_subset": 63, "obstyp": [2, 10], "obtain": [22, 25, 26, 29, 38, 41, 51, 54, 64], "occur": [16, 17, 18, 19, 20, 21], "off": 14, "offici": 59, "offlin": [12, 13, 14, 58, 59, 64, 66, 68], "often": 64, "oibserv": 59, "omar": [35, 36], "omit": 63, "onc": [1, 12, 64, 66, 68], "one": [2, 6, 7, 8, 12, 25, 29, 41, 42, 54, 59, 66], "one_hot": 68, "onli": [10, 11, 12, 13, 42, 44, 46, 47, 48, 50, 59, 63, 66], "onlin": 66, "onto": 11, "open": [25, 32, 42, 59, 66], "opengl": 66, "optim": [64, 68], "option": [2, 3, 5, 7, 8, 10, 12, 13, 14, 59], "order": [12, 31, 32, 59, 63], "order_enforc": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "org": [11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 59, 61, 64, 68], "organ": 59, "orient": [5, 41, 63], "origin": [10, 12, 25, 29, 30, 32, 41, 42, 54, 59, 61, 66], "other": [7, 8, 10, 11, 12, 13, 14, 32, 34, 59, 63, 64, 66], "otherwis": [7, 12, 44, 46, 48, 50, 59], "our": [1, 12, 13, 59, 63, 64, 66, 68], "ourselv": 64, "out": [8, 12, 59, 61, 64, 66], "out_featur": 66, "out_kei": 66, "outlin": 63, "output": [8, 61, 63, 64, 66, 68], "output_dim": 68, "outsid": 66, "over": [2, 7, 10, 12, 64, 66], "overal": 66, "overconfid": 66, "overestim": 66, "overrid": [4, 5, 13, 14, 64], "overridden": [4, 5, 10, 59], "overridng": 64, "overshoot": 64, "overview": 66, "overwrit": 11, "own": [10, 12, 59, 64], "p_": 64, "packag": [1, 2, 10, 14, 59, 68], "pad": 68, "pad_sequ": 68, "page": 59, "page_facing_up": 59, "pair": [13, 66], "paper": [25, 29, 41, 54], "paramet": [2, 3, 4, 5, 7, 8, 10, 11, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 66, 68], "parameteris": 66, "part": 66, "partial": [32, 59], "particular": [61, 66], "pass": [2, 4, 7, 10, 12, 63, 66], "past": 59, "path": [8, 11, 12, 13, 14, 43, 44, 45, 46, 47, 48, 49, 50, 59, 64, 68], "path_str": 14, "pathlik": [7, 8], "pbar": 66, "pd": [42, 43, 44, 45, 46, 47, 48, 49, 50, 64], "pen": [14, 30, 38, 39, 40, 59], "per": [2, 59], "perceptron": 66, "perez": [43, 44, 45, 46, 47, 48, 49, 50, 64], "perform": [9, 10, 12, 14, 32, 33, 34, 64, 66, 68], "perimet": [42, 47, 48], "permalink": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "perman": 12, "pettingzoo": 59, "phi": 66, "pi": [64, 66], "pi_": 66, "pick": [16, 18], "pid": [59, 64], "pip": [1, 2, 10, 12, 13, 14, 58, 61, 66, 68], "pixel": 66, "pixels_onli": 66, "plai": [12, 15], "plan": [12, 59, 63], "planner": [15, 42], "platform": 13, "pleas": [11, 12, 59, 63], "plot": 66, "plt": 66, "plug": 66, "point": [7, 30, 59, 66], "point_maz": [43, 44, 45, 46, 47, 48, 49, 50], "point_maze_dataset": [59, 64], "pointmaz": [15, 30, 43, 44, 45, 46, 47, 48, 49, 50, 59, 62, 63, 65], "pointmaze_larg": [42, 44], "pointmaze_largedens": [42, 43], "pointmaze_medium": [42, 46, 64], "pointmaze_mediumdens": [42, 45], "pointmaze_open": [42, 48], "pointmaze_opendens": [42, 47], "pointmaze_umaz": [42, 50, 63], "pointmaze_umazedens": [42, 49], "pointmazeenv": [43, 44, 45, 46, 47, 48, 49, 50], "pointmazestepdatacallback": 64, "pole": 68, "polici": [2, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 25, 26, 27, 29, 30, 32, 36, 37, 38, 39, 41, 42, 51, 52, 54, 55, 56, 64, 66], "policy_net": 68, "policynetwork": 68, "polyak": 66, "poorli": 66, "popul": 66, "popular": 58, "pose": [5, 64], "posit": [5, 32, 37, 54, 64, 66], "possibl": [13, 59], "ppo": 68, "pr": 59, "practic": 66, "pre": 59, "precis": 66, "precommit": 59, "predict": [64, 68], "prepend": 11, "preprint": 32, "prerequisit": 66, "present": [10, 15, 30, 68], "prevent": 12, "previou": [2, 12, 59], "previous": [15, 59, 64, 68], "principl": 30, "print": [12, 59, 61, 63, 66, 68], "prng": 2, "probabilisticactor": 66, "probabl": 64, "problem": 68, "proce": [14, 68], "procedur": 63, "process": [12, 59, 64, 66], "prod": 68, "produc": 59, "product": 13, "program": 64, "progress": 14, "project": [12, 59], "prompt": [12, 14], "properli": [61, 66], "properti": [7, 66], "proporti": 64, "protonmail": 55, "provid": [10, 12, 13, 14, 15, 16, 18, 22, 23, 24, 25, 26, 27, 28, 29, 30, 38, 39, 40, 41, 51, 52, 53, 54, 58, 59, 66], "pseudo": 59, "psi": 66, "public": [13, 59, 64], "publicli": 58, "pure": 59, "purpos": [12, 30, 42, 64, 66], "py": [55, 59, 61, 63, 64, 66, 68], "pyarrow": 59, "pypi": 59, "pyplot": 66, "pyright": 59, "pytest": 59, "python": [12, 58, 59, 61, 63, 64, 65, 66, 68], "python3": 66, "pytorch": [59, 65, 66, 69], "pytorchdataload": 59, "pyvirtualdisplai": 66, "pz": 59, "q": [64, 65, 69], "q_": 66, "q_fn": 64, "q_iter": 64, "q_net": 66, "q_valu": 64, "qiter": [15, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50, 64], "qpo": 64, "quadrup": [15, 30], "quantifi": 66, "queri": 66, "quick": 66, "quickli": 64, "quit": 66, "qvalu": 66, "qvel": 64, "r": [1, 21, 64, 66], "r_t": 66, "raffin": 15, "rais": [8, 10], "rajeswaran": [25, 29, 41, 54], "randn": 64, "random": [2, 7, 10, 12, 17, 19, 20, 37, 42, 43, 44, 45, 46, 47, 48, 49, 50, 61, 63, 64, 66, 68], "random_polici": [61, 63], "randomis": 66, "randomli": [12, 13, 42, 61, 64], "randompolici": 35, "rang": [2, 10, 12, 59, 61, 63, 64, 66, 68], "rate": [16, 17, 18, 19, 20, 21, 64], "rather": 66, "ratio": [22, 25, 26, 29, 38, 41, 51, 54], "rb": 66, "re": [59, 64], "reach": [15, 16, 17, 18, 19, 20, 21, 32, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 64], "read": [8, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 66], "readabl": 13, "readi": 59, "readm": 59, "real": 15, "reason": 64, "rebuild": 1, "receiv": 68, "recent": [12, 66], "recommend": 12, "record": [2, 12, 59, 63, 64], "record_info": [2, 12, 13, 64], "recov": [2, 7, 10, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 66], "recover_env": 59, "recover_environ": [2, 7, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 68], "recoveri": 59, "redtachyon": 59, "reduc": [59, 64], "ref": 10, "ref_max_scor": [2, 10], "ref_min_scor": [2, 10], "refactor": [59, 64], "refer": [2, 10, 59], "referenc": 59, "regener": 37, "regist": 61, "registr": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "registri": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "reinforc": [12, 14, 15, 25, 29, 30, 32, 37, 41, 42, 54, 58, 64], "rel": 59, "relai": [30, 32], "releas": 11, "relev": [2, 10, 12], "reliabl": 15, "reloc": [30, 51, 52, 53, 59], "relu": [66, 68], "rememb": 66, "remot": [10, 11, 12, 13, 14, 58, 59], "remov": [12, 59], "remove_task_when_complet": [31, 33, 34], "renam": 59, "render": 66, "render_mod": 68, "reorgan": 59, "replac": [15, 30, 64], "replai": [12, 59], "replay_buff": 66, "repositori": [10, 13, 14, 23, 24, 25, 27, 28, 29, 30, 32, 39, 40, 41, 52, 53, 54], "repres": [13, 61, 66], "represent": 59, "reproduc": [2, 10, 12, 30, 37, 66, 68], "reproduct": [30, 59], "requir": [1, 2, 10, 12, 13, 14, 59, 61, 63, 64, 66, 68], "research": 15, "reset": [2, 12, 13, 16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 63, 64, 66, 68], "reset_target": [16, 17, 18, 19, 20, 21, 43, 44, 45, 46, 47, 48, 49, 50], "resid": 11, "residu": 59, "respect": [10, 64, 66], "respond": 64, "respons": 12, "rest": 66, "restart": 66, "result": [10, 59, 61, 64], "results_video": 66, "retriev": [10, 12, 59], "return": [2, 3, 4, 5, 7, 8, 9, 10, 11, 12, 13, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 44, 46, 48, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66, 68], "rew": [2, 5, 12, 59, 64, 68], "rew_matrix": 64, "reward": [3, 5, 6, 12, 13, 15, 16, 17, 18, 19, 20, 21, 25, 29, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54, 59, 66, 68], "reward_funct": 64, "reward_threshold": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "reward_typ": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53], "rewards_max": 13, "rewards_mean": 13, "rewards_min": 13, "rewards_std": 13, "rewards_sum": 13, "right": [59, 64, 66], "rl": [12, 14, 23, 25, 27, 29, 39, 41, 52, 54, 59, 66, 68], "rl_zoo3": [59, 68], "rm": 66, "rnd": 59, "rnn": 68, "robot": [14, 15, 25, 29, 30, 41, 54, 59, 63, 64, 66], "rodrigo": [12, 14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 64], "rodrigodelazcano": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 59], "roll": 66, "rollout": 66, "root": [12, 13], "row": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "rperezvicent": [14, 22, 23, 24, 26, 27, 28, 31, 33, 34, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 64], "rugged": 59, "run": [12, 22, 25, 26, 29, 38, 41, 51, 54, 59, 66], "s_": 66, "s_t": 66, "sac": [15, 16, 17, 18, 19, 20, 21, 55], "safe": 59, "same": [2, 7, 10, 12, 13, 21, 22, 23, 24, 26, 27, 28, 30, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59, 64, 66], "sampl": [2, 7, 13, 35, 37, 58, 59, 61, 63, 66], "sample_episod": [7, 12, 13, 59], "sampled_episod": 13, "sampler": 66, "samplerwithoutreplac": 66, "save": [4, 13, 59, 61, 63, 64, 66, 68], "save_video": 66, "sb3": 55, "scale": 66, "scale_lb": 66, "scenario": 68, "schedul": [12, 59], "score": [2, 66], "script": [14, 30, 55, 66, 68], "second": [12, 59], "section": [13, 59, 66], "see": [13, 61, 66], "seed": [2, 3, 7, 10, 12, 13, 59, 61, 63, 64, 66, 68], "seen": 64, "select": [16, 17, 18, 19, 20, 25, 29, 41, 42, 54, 59, 64], "self": [2, 3, 4, 5, 7, 8, 63, 64, 68], "separ": 59, "sequenc": [32, 33, 34, 42], "sequenti": 66, "seri": [12, 64], "serial": [13, 59, 62, 65], "serializ": 13, "serialize_custom_spac": 61, "serialize_spac": 61, "serv": 12, "server": [10, 11, 12, 14, 58, 66], "servic": 59, "set": [2, 7, 10, 12, 13, 15, 16, 17, 18, 19, 20, 21, 59, 64, 66, 68], "set_descript": 66, "set_exploration_typ": 66, "set_se": [7, 12, 66], "set_titl": 66, "set_xlabel": 66, "setpoint": 64, "sever": 13, "shape": [15, 20, 21, 42, 49, 50, 59, 63, 64, 66, 68], "shard": 12, "share": [59, 66], "shift": [13, 66], "should": [2, 61, 63], "show": [12, 58, 59, 61, 63, 66], "shown": [14, 66], "shreyansjainn": 59, "shuffl": 68, "sim": 66, "similarli": [59, 66], "simpl": [12, 59, 64, 66, 68], "simplefilt": 66, "simpli": [61, 64], "sinc": [61, 64, 68], "singl": [3, 6, 9, 10, 12, 14, 59, 66], "size": [8, 10, 12, 14, 58, 59, 64, 66], "skip": [10, 66], "slash": [11, 13], "slice": [7, 8], "slide": [31, 32, 34], "slightli": 59, "slowli": [64, 66], "small": [59, 66], "smaller": [42, 59, 64], "snippet": 12, "so": [12, 13, 64, 66], "soft": 66, "softupd": 66, "solut": 64, "solv": [32, 64], "solver": 64, "some": [2, 8, 12, 14, 59, 61, 64, 66], "sourc": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 59, 61, 63, 64, 65, 66, 68], "space": [2, 8, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 37, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 62, 64, 65, 66, 68], "space_dict": 61, "spars": [15, 16, 17, 18, 19, 20, 21, 25, 29, 41, 42, 44, 46, 48, 50, 54], "spec": [2, 7, 10, 13, 14, 59, 61, 66], "specif": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 59, 63, 64, 66], "specifi": [2, 7, 8, 12, 13, 59, 66], "speed": [59, 64], "sphinx": 1, "sphinx_github_changelog_token": 59, "sphx": 59, "split": [42, 59], "split_dataset": [10, 12, 59], "split_traj": 66, "squar": 61, "src": 66, "stabil": 64, "stabl": 15, "stable_baselines3": 68, "stack": [6, 13, 59], "stand": [16, 17, 18, 19, 20, 21], "standard": [12, 59, 66], "start": [12, 13, 61, 63, 64, 66, 68], "state": [2, 32, 42, 64, 66], "state_action_valu": 66, "state_to_cel": 64, "state_valu": 66, "statist": 4, "steadi": 64, "step": [2, 3, 5, 6, 7, 8, 9, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 61, 63, 64, 66, 68], "step_data": [3, 5, 63, 64], "step_data_callback": [2, 63, 64], "step_data_kei": 5, "stepdata": [3, 5], "stepdatacallback": [2, 13, 59, 62, 65], "stitch": 15, "storag": [8, 12, 13, 59], "store": [2, 8, 10, 12, 13, 59, 63, 66], "str": [2, 5, 8, 9, 10, 11, 13, 61], "straight": [36, 37], "strictli": 66, "string": [11, 13, 61], "stronger": 64, "structur": [11, 12, 59], "style": [2, 10, 13, 59, 66], "sub": [14, 59], "subcomponent_1": 59, "subcomponent_2": 59, "subdirectori": 13, "subgroup": [59, 64], "subplot": 66, "subsequ": 59, "subset": [59, 62, 65], "subtask": [31, 32, 33, 34], "subtrajectori": [32, 34], "succ": 64, "success": [16, 17, 18, 19, 20, 21, 64, 68], "successfulli": [14, 63], "sudo": 66, "suggest": 59, "sum": 66, "sum_": 64, "summari": 66, "super": [5, 63, 64, 68], "support": [2, 10, 12, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 64, 66], "supportsfloat": 2, "suppos": 12, "sure": [14, 59], "surrog": 13, "switch": [31, 32, 33, 34], "sy": 68, "syntax": [2, 10, 13], "system": 64, "t": [2, 8, 10, 12, 13, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 51, 52, 53, 55, 59, 61, 63, 64, 66], "tabl": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59], "tackl": 66, "take": [7, 13, 61, 64], "taken": [6, 8, 43, 44, 45, 46, 47, 48, 49, 50, 63], "tanh": 66, "tanh_loc": 66, "tanhnorm": 66, "target": [16, 17, 18, 19, 20, 21, 30, 31, 32, 33, 34, 42, 54, 64, 66], "target_net_updat": 66, "task": [10, 12, 15, 25, 29, 32, 34, 41, 43, 44, 45, 46, 47, 48, 49, 50, 54, 64, 66, 68], "tasks_to_complet": [31, 33, 34], "tau": [64, 66], "td": 66, "team": 11, "temperatur": 66, "templat": 59, "tempor": 66, "temporari": [2, 12, 59, 64], "tensor": [66, 68], "tensordict": 66, "tensordictmodul": 66, "termin": [2, 3, 5, 6, 7, 9, 12, 13, 16, 17, 18, 19, 20, 21, 42, 59, 61, 63, 64, 66, 68], "terminate_on_tasks_complet": [31, 33, 34], "test": [10, 11, 12, 15, 59, 63], "text": [13, 35, 36, 59, 64], "than": [10, 12, 16, 17, 18, 19, 20, 21, 59, 66], "thank": 59, "thei": [8, 13, 30, 59, 66], "them": [12, 13, 59, 68], "theme": 64, "theori": 64, "therefor": 66, "theta": 66, "thi": [1, 2, 4, 5, 6, 7, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 59, 61, 63, 64, 66, 68], "thing": [59, 61], "think": 64, "thorough": 59, "those": 66, "thought": 59, "three": [25, 29, 41, 54, 64, 66], "through": [12, 13, 14, 58, 59, 64, 66], "thu": [42, 64], "tight_layout": 66, "time": [1, 2, 10, 64], "timestep": 59, "to_str": 61, "togeth": [10, 12, 14, 32, 33, 66], "tohsin": 59, "tomekst": 59, "tool": [14, 29, 59], "top": [13, 14], "torch": [66, 68], "torchrl": [65, 69], "total": [7, 8, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 64, 66], "total_episod": [7, 8, 12, 13, 59, 68], "total_step": [7, 8, 12, 13, 59, 64], "total_timestep": 59, "touch": [11, 63], "toward": 64, "towardsdatasci": [15, 42, 64], "tqdm": [66, 68], "train": [15, 16, 17, 18, 19, 20, 21, 22, 25, 26, 29, 38, 41, 51, 54, 55, 56, 63], "trainer": 66, "trajectori": [14, 16, 17, 18, 19, 20, 21, 23, 25, 27, 29, 39, 41, 42, 52, 54, 58, 59, 64], "transform": 66, "transformedenv": 66, "transit": [5, 59, 64, 66], "transition_matrix": 64, "tree": 55, "tri": 66, "true": [2, 7, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 64, 66, 68], "truncat": [2, 3, 5, 6, 9, 12, 13, 42, 59, 61, 63, 64, 66, 68], "try": [61, 66], "tune": [14, 23, 25, 27, 29, 39, 41, 52, 54, 55, 56, 64, 66], "tupl": [2, 3, 13, 59, 64, 66], "tutori": [59, 61, 63, 64, 66, 68], "tutorials_jupyt": 65, "tutorials_python": 65, "two": [10, 12, 13, 14, 25, 29, 41, 42, 54, 59, 66, 68], "txt": 1, "type": [2, 12, 13, 25, 29, 41, 54, 59, 61, 66, 68], "typer": 14, "typic": 64, "typing_extens": 59, "typo": 59, "u": [14, 15, 20, 21, 42, 49, 50, 59, 66, 68], "uint8": [35, 36, 61, 66], "umaz": [15, 42, 59, 64], "under": [10, 13, 42, 59, 66], "undiscount": [10, 13], "unflatten": 59, "unifi": 59, "uniform": 64, "union": [7, 61], "uniqu": 61, "unknown": 59, "unless": 2, "unlik": 66, "until": [12, 43, 44, 45, 46, 47, 48, 49, 50], "up": [12, 16, 17, 18, 19, 20, 21, 59, 61, 63, 64, 66, 68], "updat": [2, 8, 12, 59, 64, 66], "update_dataset_from_buff": 7, "update_dataset_from_collector_env": 59, "update_episod": 8, "update_episode_metadata": 8, "update_from_storag": 8, "update_metadata": 8, "upgrad": 66, "upload": 59, "upload_namespac": 11, "upon": 15, "upper": 13, "us": [2, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66, 68], "usag": [14, 59], "user": [2, 12, 13, 59], "usual": 66, "util": [10, 12, 58, 66, 68], "v": [2, 10, 13, 14, 32, 66], "v0": [10, 11, 12, 13, 35, 36, 37, 55, 56, 61, 63, 64, 68], "v1": [10, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 38, 39, 40, 41, 51, 52, 53, 54, 59, 66, 68], "v1_1": 68, "v2": [12, 13, 14, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 58, 59, 66], "v3": [42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 63, 64], "v4": [15, 16, 17, 18, 19, 20, 21], "v5": [55, 56], "v_": [64, 66], "v_fn": 64, "valid": [10, 55, 56, 63, 64, 66], "valu": [2, 5, 6, 8, 9, 10, 12, 13, 44, 46, 48, 50, 59, 64, 66], "value_net": 66, "value_network": 66, "valueerror": 8, "valueoper": 66, "vari": [61, 66, 68], "variabl": [12, 13, 59, 64], "varianc": [43, 44, 45, 46, 47, 48, 49, 50, 64], "variat": 64, "varieti": 12, "variou": [32, 33, 61], "ve": 64, "vector_entry_point": [14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "veloc": [5, 42, 64], "veri": 12, "version": [2, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 63, 64], "via": [32, 66], "vicent": [43, 44, 45, 46, 47, 48, 49, 50, 64], "video": 66, "video_fold": 66, "viewer_env": 66, "virtual": 66, "virtual_displai": 66, "visibl": 66, "visual": 68, "visualis": 66, "vol": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "wa": [2, 7, 10, 13, 15, 25, 29, 35, 36, 37, 41, 54, 59, 61], "wai": [12, 64, 66], "wall": [42, 47, 48, 64], "want": [7, 12, 14, 64], "wapoint": 64, "warn": [14, 59, 66], "waypoint": [15, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50], "waypoint_control": 64, "waypoint_target": 64, "waypoint_threshold": 64, "waypointcontrol": 64, "wd": 59, "we": [12, 13, 30, 37, 59, 61, 63, 64, 66, 68], "weight": 66, "well": [12, 13, 14, 58, 59, 64, 66], "were": [10, 12, 14, 25, 29, 30, 32, 41, 42, 54, 59], "what": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 64], "when": [7, 12, 13, 16, 17, 18, 19, 20, 21, 42, 43, 44, 45, 46, 47, 48, 49, 50, 59, 61, 63, 64, 66], "where": [2, 8, 10, 13, 32, 34, 59, 64, 66], "whether": 11, "which": [2, 7, 8, 10, 12, 13, 15, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 58, 59, 63, 64, 66, 68], "while": [12, 59, 61, 63, 64, 66, 68], "who": 66, "whose": 66, "willdudlei": 59, "window": 59, "within": [7, 59, 66], "without": [43, 44, 45, 46, 47, 48, 49, 50, 59], "won": [12, 64], "work": [2, 12, 14, 59, 66], "workflow": 59, "world": 15, "worri": 61, "would": [11, 13, 14, 63, 64], "wrap": [2, 12, 59, 64, 66], "wrapper": [2, 4, 12, 13, 59, 61, 64, 66, 68], "write": [8, 66], "written": 66, "x": [7, 30, 42, 64, 68], "xvfb": 66, "xy": 64, "y": [14, 30, 42, 64, 66], "yml": 59, "you": [7, 8, 11, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 32, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 59, 61, 63, 64, 66, 68], "youni": [35, 36], "younik": 59, "younis98": 36, "your": [12, 14, 59, 68], "zero": 64, "zero_grad": [66, 68], "zip": 65, "zoo": 68, "\u898b\u7fd2\u3044": 58}, "titles": ["404 - Page Not Found", "Minari documentation", "DataCollector", "EpisodeBuffer", "EpisodeMetadataCallback", "StepDataCallback", "EpisodeData", "MinariDataset", "MinariStorage", "StepData", "Minari", "Namespace", "Basic Usage", "Dataset Standards", "Minari CLI", "Ant Maze", "Large-Diverse", "Large-Play", "Medium-Diverse", "Medium-Play", "Umaze-Diverse", "Umaze", "Cloned", "Expert", "Human", "Door", "Cloned", "Expert", "Human", "Hammer", "D4RL", "Complete", "Kitchen", "Mixed", "Partial", "Fourrooms-Random", "Fourrooms", "MiniGrid", "Cloned", "Expert", "Human", "Pen", "Point Maze", "Large-Dense", "Large", "Medium-Dense", "Medium", "Open-Dense", "Open", "Umaze-Dense", "Umaze", "Cloned", "Expert", "Human", "Relocate", "Expert", "Mujoco/ant", "MuJoCo", "<no title>", "Release Notes", "Dataset Creation", "Serializing a custom space", "Dataset Creation", "Collecting a subset of a dictionary space with StepDataCallback", "PointMaze D4RL dataset", "Tutorials", "Implicit Q-Learning with TorchRL", "Using Datasets", "Behavioral cloning with PyTorch", "Using Datasets"], "titleterms": {"0": 59, "1": [59, 64], "2": [59, 64], "3": [59, 64], "4": 59, "404": 0, "5": 59, "For": 66, "Not": 0, "The": [0, 66], "action": 13, "adroit": 66, "ant": [15, 56], "attribut": [3, 6, 7, 8, 9], "basic": 12, "behavior": 68, "buffer": 66, "build": [1, 66], "checkpoint": 12, "cli": 14, "clone": [22, 26, 38, 51, 68], "collect": [12, 63, 64], "combin": [10, 12, 14], "complet": 31, "content": [15, 25, 29, 30, 32, 37, 41, 42, 54, 56, 57], "control": 64, "could": 0, "creat": [10, 11, 12, 64], "creation": [60, 62, 65], "custom": 61, "d": 64, "d4rl": [30, 64], "data": [12, 64], "data_collector": 3, "datacollector": 2, "dataset": [8, 10, 12, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 60, 62, 64, 65, 67, 68, 69], "defin": 66, "delet": [10, 11, 14], "dens": [43, 45, 47, 49], "deriv": 64, "descript": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "detail": 14, "dictionari": 63, "directori": 13, "divers": [16, 18, 20], "document": 1, "door": 25, "download": [10, 11, 12, 14], "environ": [12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55, 66], "episod": 12, "episodebuff": 3, "episodedata": [6, 13], "episodemetadatacallback": 4, "evalu": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "expert": [23, 27, 39, 52, 55], "filter": 12, "found": 0, "fourroom": [35, 36], "gener": 68, "get": 11, "hammer": 29, "headless": 66, "human": [24, 28, 40, 53], "i": 64, "implicit": 66, "import": 68, "instal": 12, "integr": 64, "kitchen": 32, "larg": [16, 17, 43, 44], "learn": 66, "list": [10, 11, 14], "load": [10, 12], "local": [11, 12, 14], "loss": 66, "maze": [15, 42], "medium": [18, 19, 45, 46], "metadata": [11, 13], "method": [2, 3, 4, 5, 7, 8], "minari": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 64], "minari_storag": 8, "minaridataset": 7, "minaristorag": 8, "minigrid": 37, "mix": 33, "model": 66, "modifi": 64, "mujoco": [56, 57], "namespac": [11, 12, 13], "normal": 10, "note": 59, "observ": 13, "open": [47, 48], "optim": 66, "p": 64, "page": 0, "partial": 34, "pen": [41, 66], "plai": [17, 19], "planner": 64, "point": 42, "pointmaz": 64, "polici": 68, "pre": 66, "proport": 64, "pytorch": 68, "q": 66, "random": 35, "recov": 12, "refer": [15, 25, 29, 30, 32, 37, 41, 42, 54, 64], "releas": 59, "reloc": 54, "replai": 66, "request": 0, "requisit": 66, "result": 66, "sampl": 12, "save": 12, "score": 10, "serial": 61, "show": 14, "space": [13, 61, 63], "spec": [16, 17, 18, 19, 20, 21, 22, 23, 24, 26, 27, 28, 31, 33, 34, 35, 36, 38, 39, 40, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 55], "split": [10, 12], "standard": 13, "stepdata": 9, "stepdatacallback": [5, 63, 64], "structur": 13, "subset": 63, "support": 13, "term": 64, "torchrl": 66, "train": [66, 68], "tutori": 65, "umaz": [20, 21, 49, 50], "updat": 11, "upload": [11, 14], "us": [12, 65, 67, 69], "usag": 12, "v0": 59, "waypoint": 64}})
\ No newline at end of file
diff --git a/main/tutorials/dataset_creation/README/index.html b/main/tutorials/dataset_creation/README/index.html
index 1ddff75c..97c0f83d 100644
--- a/main/tutorials/dataset_creation/README/index.html
+++ b/main/tutorials/dataset_creation/README/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/dataset_creation/custom_space_serialization/index.html b/main/tutorials/dataset_creation/custom_space_serialization/index.html
index 280fb946..a88e0282 100644
--- a/main/tutorials/dataset_creation/custom_space_serialization/index.html
+++ b/main/tutorials/dataset_creation/custom_space_serialization/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/dataset_creation/index.html b/main/tutorials/dataset_creation/index.html
index baada1e9..abddde99 100644
--- a/main/tutorials/dataset_creation/index.html
+++ b/main/tutorials/dataset_creation/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/dataset_creation/observation_space_subseting/index.html b/main/tutorials/dataset_creation/observation_space_subseting/index.html
index 08d94d2c..9eeb9a75 100644
--- a/main/tutorials/dataset_creation/observation_space_subseting/index.html
+++ b/main/tutorials/dataset_creation/observation_space_subseting/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/dataset_creation/point_maze_dataset/index.html b/main/tutorials/dataset_creation/point_maze_dataset/index.html
index e31c5578..d2da75d5 100644
--- a/main/tutorials/dataset_creation/point_maze_dataset/index.html
+++ b/main/tutorials/dataset_creation/point_maze_dataset/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/index.html b/main/tutorials/index.html
index aae53bbb..00d03519 100644
--- a/main/tutorials/index.html
+++ b/main/tutorials/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/using_datasets/IQL_torchrl/index.html b/main/tutorials/using_datasets/IQL_torchrl/index.html
index 948d6798..f517079d 100644
--- a/main/tutorials/using_datasets/IQL_torchrl/index.html
+++ b/main/tutorials/using_datasets/IQL_torchrl/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/using_datasets/README/index.html b/main/tutorials/using_datasets/README/index.html
index b6b48d20..1edb5456 100644
--- a/main/tutorials/using_datasets/README/index.html
+++ b/main/tutorials/using_datasets/README/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/using_datasets/behavioral_cloning/index.html b/main/tutorials/using_datasets/behavioral_cloning/index.html
index c90032a8..7d581090 100644
--- a/main/tutorials/using_datasets/behavioral_cloning/index.html
+++ b/main/tutorials/using_datasets/behavioral_cloning/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development
diff --git a/main/tutorials/using_datasets/index.html b/main/tutorials/using_datasets/index.html
index abf85880..26ac21f9 100644
--- a/main/tutorials/using_datasets/index.html
+++ b/main/tutorials/using_datasets/index.html
@@ -314,6 +314,13 @@
+
MuJoCo
+
Development